summaryrefslogtreecommitdiff
path: root/runs/depth_scaling_hinge/cifar100_20260101-112306/results.json
diff options
context:
space:
mode:
authorYurenHao0426 <blackhao0426@gmail.com>2026-01-13 23:49:05 -0600
committerYurenHao0426 <blackhao0426@gmail.com>2026-01-13 23:49:05 -0600
commitcd99d6b874d9d09b3bb87b8485cc787885af71f1 (patch)
tree59a233959932ca0e4f12f196275e07fcf443b33f /runs/depth_scaling_hinge/cifar100_20260101-112306/results.json
init commit
Diffstat (limited to 'runs/depth_scaling_hinge/cifar100_20260101-112306/results.json')
-rw-r--r--runs/depth_scaling_hinge/cifar100_20260101-112306/results.json16822
1 files changed, 16822 insertions, 0 deletions
diff --git a/runs/depth_scaling_hinge/cifar100_20260101-112306/results.json b/runs/depth_scaling_hinge/cifar100_20260101-112306/results.json
new file mode 100644
index 0000000..97d572e
--- /dev/null
+++ b/runs/depth_scaling_hinge/cifar100_20260101-112306/results.json
@@ -0,0 +1,16822 @@
+{
+ "vanilla": {
+ "4": [
+ {
+ "epoch": 1,
+ "train_loss": 4.341291038284302,
+ "train_acc": 0.09568,
+ "test_loss": 3.5902228660583497,
+ "test_acc": 0.1719,
+ "lyapunov": null,
+ "grad_norm": 6.233568552079335,
+ "grad_max_sv": 4.7545679092407225,
+ "grad_min_sv": 1.1250918028338219e-07,
+ "grad_condition": 47144055.51418194,
+ "lr": 0.0009998903417374227,
+ "time_sec": 17.830737352371216
+ },
+ {
+ "epoch": 2,
+ "train_loss": 3.4833403620910643,
+ "train_acc": 0.1875,
+ "test_loss": 3.2125896770477294,
+ "test_acc": 0.2413,
+ "lyapunov": null,
+ "grad_norm": 4.2883357141420815,
+ "grad_max_sv": 3.0223524630069734,
+ "grad_min_sv": 7.805360168200437e-08,
+ "grad_condition": 68434745.79111826,
+ "lr": 0.0009995614150494292,
+ "time_sec": 15.740124702453613
+ },
+ {
+ "epoch": 3,
+ "train_loss": 3.014097664794922,
+ "train_acc": 0.26054,
+ "test_loss": 2.8822019165039063,
+ "test_acc": 0.2889,
+ "lyapunov": null,
+ "grad_norm": 3.3688150071564396,
+ "grad_max_sv": 2.1886239469051363,
+ "grad_min_sv": 6.223103937719188e-08,
+ "grad_condition": 42282037.7115659,
+ "lr": 0.0009990133642141358,
+ "time_sec": 15.473703145980835
+ },
+ {
+ "epoch": 4,
+ "train_loss": 2.7143693132019044,
+ "train_acc": 0.31262,
+ "test_loss": 2.702446311187744,
+ "test_acc": 0.3208,
+ "lyapunov": null,
+ "grad_norm": 2.8785406038007317,
+ "grad_max_sv": 1.7646001279354095,
+ "grad_min_sv": 5.3701336399925025e-08,
+ "grad_condition": 43554152.39164617,
+ "lr": 0.0009982464296247522,
+ "time_sec": 15.499403238296509
+ },
+ {
+ "epoch": 5,
+ "train_loss": 2.5030348071289064,
+ "train_acc": 0.3554,
+ "test_loss": 2.763942724990845,
+ "test_acc": 0.329,
+ "lyapunov": null,
+ "grad_norm": 2.5897409787447465,
+ "grad_max_sv": 1.5612378805875777,
+ "grad_min_sv": 4.8854244893981046e-08,
+ "grad_condition": 41333195.00893615,
+ "lr": 0.0009972609476841367,
+ "time_sec": 15.488951683044434
+ },
+ {
+ "epoch": 6,
+ "train_loss": 2.3269909496307375,
+ "train_acc": 0.3938,
+ "test_loss": 2.4710379989624025,
+ "test_acc": 0.3761,
+ "lyapunov": null,
+ "grad_norm": 2.37414912310322,
+ "grad_max_sv": 1.3197038874030114,
+ "grad_min_sv": 4.5427973693196176e-08,
+ "grad_condition": 185703885.27271265,
+ "lr": 0.000996057350657239,
+ "time_sec": 15.497607707977295
+ },
+ {
+ "epoch": 7,
+ "train_loss": 2.1854072467041017,
+ "train_acc": 0.4216,
+ "test_loss": 2.951163561248779,
+ "test_acc": 0.323,
+ "lyapunov": null,
+ "grad_norm": 2.2068200870493837,
+ "grad_max_sv": 1.2339675694704055,
+ "grad_min_sv": 4.277283941478416e-08,
+ "grad_condition": 52095598.918328084,
+ "lr": 0.000994636166481494,
+ "time_sec": 15.472023725509644
+ },
+ {
+ "epoch": 8,
+ "train_loss": 2.0716393295288085,
+ "train_acc": 0.44928,
+ "test_loss": 2.2887711679458618,
+ "test_acc": 0.4114,
+ "lyapunov": null,
+ "grad_norm": 2.076990480510157,
+ "grad_max_sv": 1.131314830482006,
+ "grad_min_sv": 3.9886170205560846e-08,
+ "grad_condition": 41939669.82744624,
+ "lr": 0.0009929980185352525,
+ "time_sec": 15.464510440826416
+ },
+ {
+ "epoch": 9,
+ "train_loss": 1.974085814552307,
+ "train_acc": 0.47136,
+ "test_loss": 2.672110557174683,
+ "test_acc": 0.3601,
+ "lyapunov": null,
+ "grad_norm": 1.9761816566655848,
+ "grad_max_sv": 1.0417343363165856,
+ "grad_min_sv": 3.825020498116061e-08,
+ "grad_condition": 39964162.48622004,
+ "lr": 0.0009911436253643444,
+ "time_sec": 15.494410037994385
+ },
+ {
+ "epoch": 10,
+ "train_loss": 1.8730941659545899,
+ "train_acc": 0.49054,
+ "test_loss": 2.5056158615112305,
+ "test_acc": 0.3813,
+ "lyapunov": null,
+ "grad_norm": 1.8634099386367884,
+ "grad_max_sv": 0.9600013196468353,
+ "grad_min_sv": 3.579910488604732e-08,
+ "grad_condition": 34060738.21798731,
+ "lr": 0.0009890738003669028,
+ "time_sec": 15.488292455673218
+ },
+ {
+ "epoch": 11,
+ "train_loss": 1.7812603790664674,
+ "train_acc": 0.51462,
+ "test_loss": 2.477180172729492,
+ "test_acc": 0.3997,
+ "lyapunov": null,
+ "grad_norm": 1.7790099981650356,
+ "grad_max_sv": 0.9072641983628273,
+ "grad_min_sv": 3.4340940041621694e-08,
+ "grad_condition": 36834828.42576877,
+ "lr": 0.00098678945143658,
+ "time_sec": 15.484249591827393
+ },
+ {
+ "epoch": 12,
+ "train_loss": 1.714907325401306,
+ "train_acc": 0.52888,
+ "test_loss": 2.226099481582642,
+ "test_acc": 0.4353,
+ "lyapunov": null,
+ "grad_norm": 1.701538564781707,
+ "grad_max_sv": 0.8431645318865776,
+ "grad_min_sv": 3.240299342038844e-08,
+ "grad_condition": 64109426.95331051,
+ "lr": 0.0009842915805643154,
+ "time_sec": 15.483522891998291
+ },
+ {
+ "epoch": 13,
+ "train_loss": 1.648736492576599,
+ "train_acc": 0.5449,
+ "test_loss": 2.1634216318130495,
+ "test_acc": 0.4573,
+ "lyapunov": null,
+ "grad_norm": 1.6315158856421696,
+ "grad_max_sv": 0.7919500142335891,
+ "grad_min_sv": 3.0836463893457736e-08,
+ "grad_condition": 50314317.689856075,
+ "lr": 0.000981581283398829,
+ "time_sec": 15.491243362426758
+ },
+ {
+ "epoch": 14,
+ "train_loss": 1.5916738232421874,
+ "train_acc": 0.5591,
+ "test_loss": 2.5368153831481934,
+ "test_acc": 0.398,
+ "lyapunov": null,
+ "grad_norm": 1.579987574958028,
+ "grad_max_sv": 0.7741283252835274,
+ "grad_min_sv": 3.031987156898453e-08,
+ "grad_condition": 33629215.75141786,
+ "lr": 0.0009786597487660333,
+ "time_sec": 15.476540565490723
+ },
+ {
+ "epoch": 15,
+ "train_loss": 1.5378693001937866,
+ "train_acc": 0.57156,
+ "test_loss": 1.9343770442962647,
+ "test_acc": 0.4989,
+ "lyapunov": null,
+ "grad_norm": 1.5231234313765212,
+ "grad_max_sv": 0.7179134920239448,
+ "grad_min_sv": 2.8637837475031792e-08,
+ "grad_condition": 49527050.380315706,
+ "lr": 0.0009755282581475766,
+ "time_sec": 15.486248970031738
+ },
+ {
+ "epoch": 16,
+ "train_loss": 1.478127024307251,
+ "train_acc": 0.58584,
+ "test_loss": 1.9563913166046143,
+ "test_acc": 0.4922,
+ "lyapunov": null,
+ "grad_norm": 1.46325785921816,
+ "grad_max_sv": 0.6841573119163513,
+ "grad_min_sv": 2.716867457952521e-08,
+ "grad_condition": 56699539.529558375,
+ "lr": 0.0009721881851187403,
+ "time_sec": 15.49137544631958
+ },
+ {
+ "epoch": 17,
+ "train_loss": 1.429626383972168,
+ "train_acc": 0.59714,
+ "test_loss": 2.326792067337036,
+ "test_acc": 0.4336,
+ "lyapunov": null,
+ "grad_norm": 1.4242655219863833,
+ "grad_max_sv": 0.6712241530418396,
+ "grad_min_sv": 2.6996844360027695e-08,
+ "grad_condition": 40189659.16617282,
+ "lr": 0.0009686409947459456,
+ "time_sec": 15.493090391159058
+ },
+ {
+ "epoch": 18,
+ "train_loss": 1.395352936630249,
+ "train_acc": 0.6053,
+ "test_loss": 1.8314157381057738,
+ "test_acc": 0.5182,
+ "lyapunov": null,
+ "grad_norm": 1.3761305598419875,
+ "grad_max_sv": 0.6385130822658539,
+ "grad_min_sv": 2.6239096877211932e-08,
+ "grad_condition": 63284929.054803826,
+ "lr": 0.0009648882429441254,
+ "time_sec": 15.477057695388794
+ },
+ {
+ "epoch": 19,
+ "train_loss": 1.340607022781372,
+ "train_acc": 0.61952,
+ "test_loss": 1.9038033363342286,
+ "test_acc": 0.5042,
+ "lyapunov": null,
+ "grad_norm": 1.3323384681348491,
+ "grad_max_sv": 0.613679239153862,
+ "grad_min_sv": 2.4952525421112828e-08,
+ "grad_condition": 1048659082.6601179,
+ "lr": 0.00096093157579425,
+ "time_sec": 15.483818292617798
+ },
+ {
+ "epoch": 20,
+ "train_loss": 1.2925908715438843,
+ "train_acc": 0.62856,
+ "test_loss": 2.031341696929932,
+ "test_acc": 0.4835,
+ "lyapunov": null,
+ "grad_norm": 1.3034876314465462,
+ "grad_max_sv": 0.5816340684890747,
+ "grad_min_sv": 2.434145293522816e-08,
+ "grad_condition": 45204778.74017582,
+ "lr": 0.0009567727288213001,
+ "time_sec": 15.512004375457764
+ },
+ {
+ "epoch": 21,
+ "train_loss": 1.278655789756775,
+ "train_acc": 0.63278,
+ "test_loss": 1.8846191581726075,
+ "test_acc": 0.5135,
+ "lyapunov": null,
+ "grad_norm": 1.2776040716135673,
+ "grad_max_sv": 0.5780372425913811,
+ "grad_min_sv": 2.405527027016241e-08,
+ "grad_condition": 42159114.019685745,
+ "lr": 0.0009524135262330095,
+ "time_sec": 15.499945878982544
+ },
+ {
+ "epoch": 22,
+ "train_loss": 1.2383485181427003,
+ "train_acc": 0.64622,
+ "test_loss": 1.8699242074966431,
+ "test_acc": 0.518,
+ "lyapunov": null,
+ "grad_norm": 1.2460313700260512,
+ "grad_max_sv": 0.5693550139665604,
+ "grad_min_sv": 2.3625755932697724e-08,
+ "grad_condition": 247459954.48036852,
+ "lr": 0.0009478558801197061,
+ "time_sec": 15.489409923553467
+ },
+ {
+ "epoch": 23,
+ "train_loss": 1.208611516494751,
+ "train_acc": 0.6519,
+ "test_loss": 1.8377874282836915,
+ "test_acc": 0.526,
+ "lyapunov": null,
+ "grad_norm": 1.2268147245238885,
+ "grad_max_sv": 0.5506495118141175,
+ "grad_min_sv": 2.2982289769879482e-08,
+ "grad_condition": 91532045.29729453,
+ "lr": 0.000943101789615607,
+ "time_sec": 15.503745555877686
+ },
+ {
+ "epoch": 24,
+ "train_loss": 1.1756799732208252,
+ "train_acc": 0.66142,
+ "test_loss": 1.8445790365219117,
+ "test_acc": 0.5321,
+ "lyapunov": null,
+ "grad_norm": 1.1995646648047669,
+ "grad_max_sv": 0.5362823188304902,
+ "grad_min_sv": 2.227390833997589e-08,
+ "grad_condition": 39000923.8470154,
+ "lr": 0.0009381533400219313,
+ "time_sec": 15.488165855407715
+ },
+ {
+ "epoch": 25,
+ "train_loss": 1.1402707249450683,
+ "train_acc": 0.67004,
+ "test_loss": 2.1079253253936767,
+ "test_acc": 0.4853,
+ "lyapunov": null,
+ "grad_norm": 1.1685820076008453,
+ "grad_max_sv": 0.500711290538311,
+ "grad_min_sv": 2.1209413056388903e-08,
+ "grad_condition": 37717541.68981,
+ "lr": 0.0009330127018922189,
+ "time_sec": 15.519190073013306
+ },
+ {
+ "epoch": 26,
+ "train_loss": 1.115832226486206,
+ "train_acc": 0.67608,
+ "test_loss": 1.7950333555221558,
+ "test_acc": 0.5345,
+ "lyapunov": null,
+ "grad_norm": 1.1487591162708706,
+ "grad_max_sv": 0.5033038355410099,
+ "grad_min_sv": 2.1531226807036675e-08,
+ "grad_condition": 34912719.99916558,
+ "lr": 0.000927682130080253,
+ "time_sec": 15.500119924545288
+ },
+ {
+ "epoch": 27,
+ "train_loss": 1.0897642765426636,
+ "train_acc": 0.68058,
+ "test_loss": 1.9983017498016358,
+ "test_acc": 0.5014,
+ "lyapunov": null,
+ "grad_norm": 1.1397755659416107,
+ "grad_max_sv": 0.5070834219455719,
+ "grad_min_sv": 2.094801768229293e-08,
+ "grad_condition": 112680773.02319674,
+ "lr": 0.0009221639627510072,
+ "time_sec": 15.487388610839844
+ },
+ {
+ "epoch": 28,
+ "train_loss": 1.0600782299995422,
+ "train_acc": 0.6873,
+ "test_loss": 1.7331308700561523,
+ "test_acc": 0.552,
+ "lyapunov": null,
+ "grad_norm": 1.1194293581413437,
+ "grad_max_sv": 0.49243925511837006,
+ "grad_min_sv": 2.061250336264555e-08,
+ "grad_condition": 2391098394.247443,
+ "lr": 0.0009164606203550494,
+ "time_sec": 15.49947738647461
+ },
+ {
+ "epoch": 29,
+ "train_loss": 1.0288162441635131,
+ "train_acc": 0.6958,
+ "test_loss": 1.7574676347732543,
+ "test_acc": 0.5469,
+ "lyapunov": null,
+ "grad_norm": 1.0981602434296158,
+ "grad_max_sv": 0.4940373159945011,
+ "grad_min_sv": 2.0519680072120238e-08,
+ "grad_condition": 152798003.85014075,
+ "lr": 0.0009105746045668516,
+ "time_sec": 15.519279956817627
+ },
+ {
+ "epoch": 30,
+ "train_loss": 1.0005281573104858,
+ "train_acc": 0.70474,
+ "test_loss": 1.7724915187835693,
+ "test_acc": 0.5535,
+ "lyapunov": null,
+ "grad_norm": 1.0821209053569316,
+ "grad_max_sv": 0.4882327690720558,
+ "grad_min_sv": 2.040895886699923e-08,
+ "grad_condition": 106754784.91270833,
+ "lr": 0.0009045084971874733,
+ "time_sec": 15.495746612548828
+ },
+ {
+ "epoch": 31,
+ "train_loss": 0.9887743633651733,
+ "train_acc": 0.70736,
+ "test_loss": 1.803389212989807,
+ "test_acc": 0.5421,
+ "lyapunov": null,
+ "grad_norm": 1.0717360299018484,
+ "grad_max_sv": 0.4644377827644348,
+ "grad_min_sv": 1.9709001528034342e-08,
+ "grad_condition": 35783294.580241755,
+ "lr": 0.0008982649590120977,
+ "time_sec": 15.506318807601929
+ },
+ {
+ "epoch": 32,
+ "train_loss": 0.9635560890579223,
+ "train_acc": 0.71462,
+ "test_loss": 1.7782361072540283,
+ "test_acc": 0.5515,
+ "lyapunov": null,
+ "grad_norm": 1.0547768746381694,
+ "grad_max_sv": 0.47287538424134257,
+ "grad_min_sv": 1.9473239257217223e-08,
+ "grad_condition": 36442794.53940544,
+ "lr": 0.0008918467286629196,
+ "time_sec": 15.525408744812012
+ },
+ {
+ "epoch": 33,
+ "train_loss": 0.9454534896087646,
+ "train_acc": 0.71586,
+ "test_loss": 1.8413972650527954,
+ "test_acc": 0.5387,
+ "lyapunov": null,
+ "grad_norm": 1.0457002240106366,
+ "grad_max_sv": 0.4636484496295452,
+ "grad_min_sv": 1.9625483711760426e-08,
+ "grad_condition": 124503449.94674742,
+ "lr": 0.0008852566213878943,
+ "time_sec": 15.658098459243774
+ },
+ {
+ "epoch": 34,
+ "train_loss": 0.926147558670044,
+ "train_acc": 0.72194,
+ "test_loss": 1.8227524955749512,
+ "test_acc": 0.5492,
+ "lyapunov": null,
+ "grad_norm": 1.030398616328217,
+ "grad_max_sv": 0.44984652400016784,
+ "grad_min_sv": 1.8758673522856208e-08,
+ "grad_condition": 63054578.90943961,
+ "lr": 0.000878497527825878,
+ "time_sec": 15.51594591140747
+ },
+ {
+ "epoch": 35,
+ "train_loss": 0.8910220455551148,
+ "train_acc": 0.7339,
+ "test_loss": 1.7336375022888184,
+ "test_acc": 0.5649,
+ "lyapunov": null,
+ "grad_norm": 1.0076609346644876,
+ "grad_max_sv": 0.44372819289565085,
+ "grad_min_sv": 1.8551427522633945e-08,
+ "grad_condition": 50611185.75714277,
+ "lr": 0.000871572412738697,
+ "time_sec": 15.497729539871216
+ },
+ {
+ "epoch": 36,
+ "train_loss": 0.8785494363021851,
+ "train_acc": 0.73456,
+ "test_loss": 1.7843629848480225,
+ "test_acc": 0.5581,
+ "lyapunov": null,
+ "grad_norm": 0.9989169914835021,
+ "grad_max_sv": 0.4366959437727928,
+ "grad_min_sv": 1.8408271952943812e-08,
+ "grad_condition": 85310005.79090494,
+ "lr": 0.0008644843137107055,
+ "time_sec": 15.490435123443604
+ },
+ {
+ "epoch": 37,
+ "train_loss": 0.856938405303955,
+ "train_acc": 0.74212,
+ "test_loss": 1.78583115940094,
+ "test_acc": 0.5595,
+ "lyapunov": null,
+ "grad_norm": 0.9837943590828618,
+ "grad_max_sv": 0.42913608700037004,
+ "grad_min_sv": 1.799877897834534e-08,
+ "grad_condition": 44955472.82427679,
+ "lr": 0.0008572363398164014,
+ "time_sec": 15.537626266479492
+ },
+ {
+ "epoch": 38,
+ "train_loss": 0.8304045977973938,
+ "train_acc": 0.74954,
+ "test_loss": 1.9540308137893676,
+ "test_acc": 0.5338,
+ "lyapunov": null,
+ "grad_norm": 0.9705660429353747,
+ "grad_max_sv": 0.41689482182264326,
+ "grad_min_sv": 1.7790258101044177e-08,
+ "grad_condition": 85624723.50661872,
+ "lr": 0.0008498316702566826,
+ "time_sec": 15.500178813934326
+ },
+ {
+ "epoch": 39,
+ "train_loss": 0.820258391494751,
+ "train_acc": 0.74884,
+ "test_loss": 1.8685070798873902,
+ "test_acc": 0.5491,
+ "lyapunov": null,
+ "grad_norm": 0.9650066613971798,
+ "grad_max_sv": 0.42203645706176757,
+ "grad_min_sv": 1.7701675934789218e-08,
+ "grad_condition": 38471919.31748825,
+ "lr": 0.0008422735529643442,
+ "time_sec": 15.50774359703064
+ },
+ {
+ "epoch": 40,
+ "train_loss": 0.8059215658950806,
+ "train_acc": 0.75368,
+ "test_loss": 1.7993948059082032,
+ "test_acc": 0.5644,
+ "lyapunov": null,
+ "grad_norm": 0.9599648842149144,
+ "grad_max_sv": 0.42296523600816727,
+ "grad_min_sv": 1.7450433907606477e-08,
+ "grad_condition": 48602019.20439266,
+ "lr": 0.0008345653031794289,
+ "time_sec": 15.5121328830719
+ },
+ {
+ "epoch": 41,
+ "train_loss": 0.7813009564971923,
+ "train_acc": 0.76052,
+ "test_loss": 1.8404800394058227,
+ "test_acc": 0.5604,
+ "lyapunov": null,
+ "grad_norm": 0.9418789892686961,
+ "grad_max_sv": 0.40448441356420517,
+ "grad_min_sv": 1.731778200703138e-08,
+ "grad_condition": 98318164.88521431,
+ "lr": 0.0008267103019950526,
+ "time_sec": 15.492136240005493
+ },
+ {
+ "epoch": 42,
+ "train_loss": 0.7671393407821655,
+ "train_acc": 0.76604,
+ "test_loss": 1.793884058380127,
+ "test_acc": 0.5618,
+ "lyapunov": null,
+ "grad_norm": 0.9315468648605028,
+ "grad_max_sv": 0.38932052329182626,
+ "grad_min_sv": 1.6337376871483622e-08,
+ "grad_condition": 62943904.80942075,
+ "lr": 0.0008187119948743447,
+ "time_sec": 15.521047592163086
+ },
+ {
+ "epoch": 43,
+ "train_loss": 0.7535210326766968,
+ "train_acc": 0.76782,
+ "test_loss": 1.7884279314041138,
+ "test_acc": 0.5658,
+ "lyapunov": null,
+ "grad_norm": 0.9214199202766519,
+ "grad_max_sv": 0.39339111372828484,
+ "grad_min_sv": 1.6136958740434192e-08,
+ "grad_condition": 115362103.47666125,
+ "lr": 0.000810573890139155,
+ "time_sec": 15.505242109298706
+ },
+ {
+ "epoch": 44,
+ "train_loss": 0.7410284707832336,
+ "train_acc": 0.77312,
+ "test_loss": 1.7518087032318115,
+ "test_acc": 0.575,
+ "lyapunov": null,
+ "grad_norm": 0.9135862495102605,
+ "grad_max_sv": 0.4029770277440548,
+ "grad_min_sv": 1.6805088312935034e-08,
+ "grad_condition": 94769472.27955042,
+ "lr": 0.0008022995574311873,
+ "time_sec": 15.517944812774658
+ },
+ {
+ "epoch": 45,
+ "train_loss": 0.7176916319656372,
+ "train_acc": 0.77704,
+ "test_loss": 2.0678364603042603,
+ "test_acc": 0.5371,
+ "lyapunov": null,
+ "grad_norm": 0.9046856584920682,
+ "grad_max_sv": 0.3983215056359768,
+ "grad_min_sv": 1.613215366361165e-08,
+ "grad_condition": 71122656.74298272,
+ "lr": 0.0007938926261462363,
+ "time_sec": 15.508166313171387
+ },
+ {
+ "epoch": 46,
+ "train_loss": 0.7069017255210877,
+ "train_acc": 0.7811,
+ "test_loss": 1.7433353471755981,
+ "test_acc": 0.5852,
+ "lyapunov": null,
+ "grad_norm": 0.8978206260313095,
+ "grad_max_sv": 0.3794424146413803,
+ "grad_min_sv": 1.602237248293781e-08,
+ "grad_condition": 54736720.76954285,
+ "lr": 0.0007853567838422158,
+ "time_sec": 15.502079725265503
+ },
+ {
+ "epoch": 47,
+ "train_loss": 0.6877984882736206,
+ "train_acc": 0.7887,
+ "test_loss": 1.818675978088379,
+ "test_acc": 0.571,
+ "lyapunov": null,
+ "grad_norm": 0.8819975234594025,
+ "grad_max_sv": 0.3825521655380726,
+ "grad_min_sv": 1.5721361913863253e-08,
+ "grad_condition": 205362522.60160935,
+ "lr": 0.0007766957746216719,
+ "time_sec": 15.509292840957642
+ },
+ {
+ "epoch": 48,
+ "train_loss": 0.6792054767608643,
+ "train_acc": 0.78942,
+ "test_loss": 1.8216966215133668,
+ "test_acc": 0.5718,
+ "lyapunov": null,
+ "grad_norm": 0.8744607628160516,
+ "grad_max_sv": 0.3726635776460171,
+ "grad_min_sv": 1.5723771835604582e-08,
+ "grad_condition": 93081917.25808936,
+ "lr": 0.0007679133974894982,
+ "time_sec": 15.525796890258789
+ },
+ {
+ "epoch": 49,
+ "train_loss": 0.6626561027145386,
+ "train_acc": 0.79284,
+ "test_loss": 1.772965872001648,
+ "test_acc": 0.5863,
+ "lyapunov": null,
+ "grad_norm": 0.8660062343667397,
+ "grad_max_sv": 0.3925539918243885,
+ "grad_min_sv": 1.5532864388332138e-08,
+ "grad_condition": 566473525.6824175,
+ "lr": 0.000759013504686565,
+ "time_sec": 15.50195598602295
+ },
+ {
+ "epoch": 50,
+ "train_loss": 0.6532552631759644,
+ "train_acc": 0.79666,
+ "test_loss": 1.8317417165756225,
+ "test_acc": 0.5724,
+ "lyapunov": null,
+ "grad_norm": 0.860130500782199,
+ "grad_max_sv": 0.3667507700622082,
+ "grad_min_sv": 1.5443047825941526e-08,
+ "grad_condition": 91486044.66793105,
+ "lr": 0.0007499999999999998,
+ "time_sec": 15.508357286453247
+ },
+ {
+ "epoch": 51,
+ "train_loss": 0.6380054843711853,
+ "train_acc": 0.80084,
+ "test_loss": 1.8737646755218507,
+ "test_acc": 0.5686,
+ "lyapunov": null,
+ "grad_norm": 0.8524936007576276,
+ "grad_max_sv": 0.3761135272681713,
+ "grad_min_sv": 1.5451151683110177e-08,
+ "grad_condition": 34353598.33829906,
+ "lr": 0.0007408768370508575,
+ "time_sec": 15.523806810379028
+ },
+ {
+ "epoch": 52,
+ "train_loss": 0.6237339858055114,
+ "train_acc": 0.80636,
+ "test_loss": 1.761890636062622,
+ "test_acc": 0.5872,
+ "lyapunov": null,
+ "grad_norm": 0.8410504283608066,
+ "grad_max_sv": 0.358472990244627,
+ "grad_min_sv": 1.503268568618654e-08,
+ "grad_condition": 136795884.7400892,
+ "lr": 0.0007316480175599307,
+ "time_sec": 15.495483636856079
+ },
+ {
+ "epoch": 53,
+ "train_loss": 0.6058457711982727,
+ "train_acc": 0.80932,
+ "test_loss": 1.9825311820983886,
+ "test_acc": 0.5638,
+ "lyapunov": null,
+ "grad_norm": 0.8335328667900934,
+ "grad_max_sv": 0.36334397196769713,
+ "grad_min_sv": 1.5307615661760283e-08,
+ "grad_condition": 250366089.5715099,
+ "lr": 0.0007223175895924635,
+ "time_sec": 15.514543771743774
+ },
+ {
+ "epoch": 54,
+ "train_loss": 0.6004596606063842,
+ "train_acc": 0.81078,
+ "test_loss": 1.8254186273574828,
+ "test_acc": 0.5794,
+ "lyapunov": null,
+ "grad_norm": 0.8274523113635032,
+ "grad_max_sv": 0.36342041566967964,
+ "grad_min_sv": 1.4868843903077106e-08,
+ "grad_condition": 300576728.02848065,
+ "lr": 0.0007128896457825361,
+ "time_sec": 15.540250062942505
+ },
+ {
+ "epoch": 55,
+ "train_loss": 0.5861557857704163,
+ "train_acc": 0.8164,
+ "test_loss": 1.824499238014221,
+ "test_acc": 0.583,
+ "lyapunov": null,
+ "grad_norm": 0.8198101267614993,
+ "grad_max_sv": 0.357354723662138,
+ "grad_min_sv": 1.4506401982417039e-08,
+ "grad_condition": 35029629.47074116,
+ "lr": 0.0007033683215378998,
+ "time_sec": 15.531729459762573
+ },
+ {
+ "epoch": 56,
+ "train_loss": 0.5844129343986512,
+ "train_acc": 0.81744,
+ "test_loss": 1.9169658557891847,
+ "test_acc": 0.5711,
+ "lyapunov": null,
+ "grad_norm": 0.8204173814530821,
+ "grad_max_sv": 0.35366991981863977,
+ "grad_min_sv": 1.4835723899028764e-08,
+ "grad_condition": 72623356.9140754,
+ "lr": 0.0006937577932260512,
+ "time_sec": 15.517155647277832
+ },
+ {
+ "epoch": 57,
+ "train_loss": 0.567106929988861,
+ "train_acc": 0.82118,
+ "test_loss": 1.872194965362549,
+ "test_acc": 0.5783,
+ "lyapunov": null,
+ "grad_norm": 0.8144173645411016,
+ "grad_max_sv": 0.3568101763725281,
+ "grad_min_sv": 1.459230552047601e-08,
+ "grad_condition": 479856948.8028302,
+ "lr": 0.0006840622763423388,
+ "time_sec": 15.499967098236084
+ },
+ {
+ "epoch": 58,
+ "train_loss": 0.5492036812782287,
+ "train_acc": 0.82718,
+ "test_loss": 1.9435380107879638,
+ "test_acc": 0.5717,
+ "lyapunov": null,
+ "grad_norm": 0.8017437900627353,
+ "grad_max_sv": 0.35105792358517646,
+ "grad_min_sv": 1.4126277701753675e-08,
+ "grad_condition": 43594921.05141826,
+ "lr": 0.0006742860236609073,
+ "time_sec": 15.517162084579468
+ },
+ {
+ "epoch": 59,
+ "train_loss": 0.5499647881126404,
+ "train_acc": 0.82578,
+ "test_loss": 1.9104221244812012,
+ "test_acc": 0.5719,
+ "lyapunov": null,
+ "grad_norm": 0.8008754176084809,
+ "grad_max_sv": 0.35147457346320155,
+ "grad_min_sv": 1.4486321607987823e-08,
+ "grad_condition": 183104197.19597444,
+ "lr": 0.0006644333233692913,
+ "time_sec": 15.51251220703125
+ },
+ {
+ "epoch": 60,
+ "train_loss": 0.534982263879776,
+ "train_acc": 0.83032,
+ "test_loss": 1.8654183416366577,
+ "test_acc": 0.5849,
+ "lyapunov": null,
+ "grad_norm": 0.7872093874708191,
+ "grad_max_sv": 0.3456037163734436,
+ "grad_min_sv": 1.4336570289236833e-08,
+ "grad_condition": 4249914917.2238555,
+ "lr": 0.0006545084971874734,
+ "time_sec": 15.505401134490967
+ },
+ {
+ "epoch": 61,
+ "train_loss": 0.5249415069770813,
+ "train_acc": 0.83296,
+ "test_loss": 1.8301967880249024,
+ "test_acc": 0.5899,
+ "lyapunov": null,
+ "grad_norm": 0.7823659308548245,
+ "grad_max_sv": 0.3372106350958347,
+ "grad_min_sv": 1.3865955505228816e-08,
+ "grad_condition": 252598095.01328754,
+ "lr": 0.0006445158984722354,
+ "time_sec": 15.503329277038574
+ },
+ {
+ "epoch": 62,
+ "train_loss": 0.510102439250946,
+ "train_acc": 0.8393,
+ "test_loss": 1.866330424118042,
+ "test_acc": 0.5875,
+ "lyapunov": null,
+ "grad_norm": 0.7690765731453699,
+ "grad_max_sv": 0.3254604462534189,
+ "grad_min_sv": 1.3302552516816778e-08,
+ "grad_condition": 201820413.1939206,
+ "lr": 0.0006344599103076324,
+ "time_sec": 15.51197862625122
+ },
+ {
+ "epoch": 63,
+ "train_loss": 0.5105279865837097,
+ "train_acc": 0.83724,
+ "test_loss": 1.901947551727295,
+ "test_acc": 0.5827,
+ "lyapunov": null,
+ "grad_norm": 0.7774036231362129,
+ "grad_max_sv": 0.3391082786023617,
+ "grad_min_sv": 1.3618166180666413e-08,
+ "grad_condition": 142624827.53962922,
+ "lr": 0.0006243449435824269,
+ "time_sec": 15.512575387954712
+ },
+ {
+ "epoch": 64,
+ "train_loss": 0.4943154125213623,
+ "train_acc": 0.84368,
+ "test_loss": 1.8720532272338868,
+ "test_acc": 0.5871,
+ "lyapunov": null,
+ "grad_norm": 0.7622106739600653,
+ "grad_max_sv": 0.3370689533650875,
+ "grad_min_sv": 1.3509893057039868e-08,
+ "grad_condition": 110330065.15549783,
+ "lr": 0.0006141754350553275,
+ "time_sec": 15.502142667770386
+ },
+ {
+ "epoch": 65,
+ "train_loss": 0.47654122495651247,
+ "train_acc": 0.84812,
+ "test_loss": 1.905906325340271,
+ "test_acc": 0.5836,
+ "lyapunov": null,
+ "grad_norm": 0.7485726591566199,
+ "grad_max_sv": 0.3178395930677652,
+ "grad_min_sv": 1.3372613298992531e-08,
+ "grad_condition": 61795906.83332411,
+ "lr": 0.0006039558454088793,
+ "time_sec": 15.515769243240356
+ },
+ {
+ "epoch": 66,
+ "train_loss": 0.4698985565757752,
+ "train_acc": 0.85062,
+ "test_loss": 1.9764730356216431,
+ "test_acc": 0.5772,
+ "lyapunov": null,
+ "grad_norm": 0.742030695327052,
+ "grad_max_sv": 0.32952211387455466,
+ "grad_min_sv": 1.321727686021503e-08,
+ "grad_condition": 4546159923.454214,
+ "lr": 0.000593690657292862,
+ "time_sec": 15.48769211769104
+ },
+ {
+ "epoch": 67,
+ "train_loss": 0.4604379980945587,
+ "train_acc": 0.8524,
+ "test_loss": 1.796267902946472,
+ "test_acc": 0.6041,
+ "lyapunov": null,
+ "grad_norm": 0.740514981620189,
+ "grad_max_sv": 0.33283664137125013,
+ "grad_min_sv": 1.3323875688170395e-08,
+ "grad_condition": 50110355.592218384,
+ "lr": 0.0005833843733580507,
+ "time_sec": 15.512935638427734
+ },
+ {
+ "epoch": 68,
+ "train_loss": 0.44513163749694823,
+ "train_acc": 0.85782,
+ "test_loss": 1.882637822341919,
+ "test_acc": 0.5923,
+ "lyapunov": null,
+ "grad_norm": 0.728632370248676,
+ "grad_max_sv": 0.3257355663925409,
+ "grad_min_sv": 1.2869882924648746e-08,
+ "grad_condition": 63884816.41740811,
+ "lr": 0.0005730415142812054,
+ "time_sec": 15.52915072441101
+ },
+ {
+ "epoch": 69,
+ "train_loss": 0.4467424920272827,
+ "train_acc": 0.85622,
+ "test_loss": 1.8523083587646485,
+ "test_acc": 0.5958,
+ "lyapunov": null,
+ "grad_norm": 0.7288387711248852,
+ "grad_max_sv": 0.322311682254076,
+ "grad_min_sv": 1.291249293496055e-08,
+ "grad_condition": 179204657.50522354,
+ "lr": 0.0005626666167821517,
+ "time_sec": 15.511183738708496
+ },
+ {
+ "epoch": 70,
+ "train_loss": 0.4350817290687561,
+ "train_acc": 0.86062,
+ "test_loss": 1.9277977352142335,
+ "test_acc": 0.5905,
+ "lyapunov": null,
+ "grad_norm": 0.7211268163108158,
+ "grad_max_sv": 0.3169262710958719,
+ "grad_min_sv": 1.2573862395379165e-08,
+ "grad_condition": 248234270.03092772,
+ "lr": 0.0005522642316338265,
+ "time_sec": 15.514695167541504
+ },
+ {
+ "epoch": 71,
+ "train_loss": 0.43583440225601194,
+ "train_acc": 0.86066,
+ "test_loss": 1.940795637512207,
+ "test_acc": 0.59,
+ "lyapunov": null,
+ "grad_norm": 0.7218256453060395,
+ "grad_max_sv": 0.3179506029933691,
+ "grad_min_sv": 1.2854640636141001e-08,
+ "grad_condition": 159315542.25023228,
+ "lr": 0.0005418389216661573,
+ "time_sec": 15.515326499938965
+ },
+ {
+ "epoch": 72,
+ "train_loss": 0.414209595451355,
+ "train_acc": 0.86682,
+ "test_loss": 1.9192114906311035,
+ "test_acc": 0.5871,
+ "lyapunov": null,
+ "grad_norm": 0.7026800304062572,
+ "grad_max_sv": 0.3194992933422327,
+ "grad_min_sv": 1.2563614283167892e-08,
+ "grad_condition": 438466879.2604634,
+ "lr": 0.0005313952597646563,
+ "time_sec": 15.508101224899292
+ },
+ {
+ "epoch": 73,
+ "train_loss": 0.41810142745018003,
+ "train_acc": 0.86568,
+ "test_loss": 1.9427220703125,
+ "test_acc": 0.5871,
+ "lyapunov": null,
+ "grad_norm": 0.7107104457797438,
+ "grad_max_sv": 0.3116331197321415,
+ "grad_min_sv": 1.2560458482156755e-08,
+ "grad_condition": 218040038.56003165,
+ "lr": 0.0005209378268645994,
+ "time_sec": 15.528023719787598
+ },
+ {
+ "epoch": 74,
+ "train_loss": 0.4033842642211914,
+ "train_acc": 0.87,
+ "test_loss": 1.9472733200073242,
+ "test_acc": 0.5874,
+ "lyapunov": null,
+ "grad_norm": 0.6981925142164059,
+ "grad_max_sv": 0.3173716105520725,
+ "grad_min_sv": 1.260878115683789e-08,
+ "grad_condition": 120156618.97368078,
+ "lr": 0.0005104712099416781,
+ "time_sec": 15.506508111953735
+ },
+ {
+ "epoch": 75,
+ "train_loss": 0.39077227040290835,
+ "train_acc": 0.87468,
+ "test_loss": 1.857486226272583,
+ "test_acc": 0.598,
+ "lyapunov": null,
+ "grad_norm": 0.6856338799556791,
+ "grad_max_sv": 0.30381867848336697,
+ "grad_min_sv": 1.2063926282295315e-08,
+ "grad_condition": 414020461.3005485,
+ "lr": 0.0004999999999999996,
+ "time_sec": 15.522391557693481
+ },
+ {
+ "epoch": 76,
+ "train_loss": 0.3836136112689972,
+ "train_acc": 0.8757,
+ "test_loss": 1.9512550479888917,
+ "test_acc": 0.587,
+ "lyapunov": null,
+ "grad_norm": 0.6870816068446682,
+ "grad_max_sv": 0.3084618851542473,
+ "grad_min_sv": 1.2161173516388873e-08,
+ "grad_condition": 299698503.7116597,
+ "lr": 0.0004895287900583212,
+ "time_sec": 15.51857614517212
+ },
+ {
+ "epoch": 77,
+ "train_loss": 0.38193485226631163,
+ "train_acc": 0.87626,
+ "test_loss": 1.8681373037338256,
+ "test_acc": 0.5993,
+ "lyapunov": null,
+ "grad_norm": 0.6828844071671899,
+ "grad_max_sv": 0.30646760389208794,
+ "grad_min_sv": 1.2204253475693593e-08,
+ "grad_condition": 272459180.1924466,
+ "lr": 0.0004790621731353997,
+ "time_sec": 15.519853591918945
+ },
+ {
+ "epoch": 78,
+ "train_loss": 0.37069116824150083,
+ "train_acc": 0.88084,
+ "test_loss": 1.875751858139038,
+ "test_acc": 0.6043,
+ "lyapunov": null,
+ "grad_norm": 0.6706724909872018,
+ "grad_max_sv": 0.30184795036911966,
+ "grad_min_sv": 1.1925269455606569e-08,
+ "grad_condition": 303963866.0557478,
+ "lr": 0.000468604740235343,
+ "time_sec": 15.520630836486816
+ },
+ {
+ "epoch": 79,
+ "train_loss": 0.3643507383155823,
+ "train_acc": 0.88364,
+ "test_loss": 1.9180334386825562,
+ "test_acc": 0.5942,
+ "lyapunov": null,
+ "grad_norm": 0.6691117052818351,
+ "grad_max_sv": 0.2972587738186121,
+ "grad_min_sv": 1.1847118905870552e-08,
+ "grad_condition": 4229198196.1638947,
+ "lr": 0.00045816107833384175,
+ "time_sec": 15.53023386001587
+ },
+ {
+ "epoch": 80,
+ "train_loss": 0.3633389077377319,
+ "train_acc": 0.88294,
+ "test_loss": 1.8658218830108642,
+ "test_acc": 0.6003,
+ "lyapunov": null,
+ "grad_norm": 0.6700579474761854,
+ "grad_max_sv": 0.2936097148805857,
+ "grad_min_sv": 1.1731030144946502e-08,
+ "grad_condition": 196324429.7051069,
+ "lr": 0.0004477357683661729,
+ "time_sec": 15.50595474243164
+ },
+ {
+ "epoch": 81,
+ "train_loss": 0.35195467962265015,
+ "train_acc": 0.88632,
+ "test_loss": 1.9072984680175782,
+ "test_acc": 0.5985,
+ "lyapunov": null,
+ "grad_norm": 0.6558349942319918,
+ "grad_max_sv": 0.2942222774028778,
+ "grad_min_sv": 1.1174211227583247e-08,
+ "grad_condition": 686453916.7723808,
+ "lr": 0.00043733338321784746,
+ "time_sec": 15.547033786773682
+ },
+ {
+ "epoch": 82,
+ "train_loss": 0.34602870296001437,
+ "train_acc": 0.88766,
+ "test_loss": 1.9684966739654541,
+ "test_acc": 0.5914,
+ "lyapunov": null,
+ "grad_norm": 0.6555903608944951,
+ "grad_max_sv": 0.29228324331343175,
+ "grad_min_sv": 1.1487677028338903e-08,
+ "grad_condition": 383534563.2338952,
+ "lr": 0.0004269584857187939,
+ "time_sec": 15.51542615890503
+ },
+ {
+ "epoch": 83,
+ "train_loss": 0.3428422933292389,
+ "train_acc": 0.89108,
+ "test_loss": 1.9337468532562256,
+ "test_acc": 0.5993,
+ "lyapunov": null,
+ "grad_norm": 0.6492331544938933,
+ "grad_max_sv": 0.28135959543287753,
+ "grad_min_sv": 1.1496448484339673e-08,
+ "grad_condition": 414922787.7095521,
+ "lr": 0.0004166156266419484,
+ "time_sec": 15.53177547454834
+ },
+ {
+ "epoch": 84,
+ "train_loss": 0.328343852148056,
+ "train_acc": 0.89454,
+ "test_loss": 1.9273885646820068,
+ "test_acc": 0.6009,
+ "lyapunov": null,
+ "grad_norm": 0.6390681347680143,
+ "grad_max_sv": 0.28590504080057144,
+ "grad_min_sv": 1.1241013130221244e-08,
+ "grad_condition": 433920435.0763866,
+ "lr": 0.0004063093427071373,
+ "time_sec": 15.530908346176147
+ },
+ {
+ "epoch": 85,
+ "train_loss": 0.3230694122695923,
+ "train_acc": 0.89496,
+ "test_loss": 1.9058713027954102,
+ "test_acc": 0.5998,
+ "lyapunov": null,
+ "grad_norm": 0.6383613950635205,
+ "grad_max_sv": 0.2902642168104649,
+ "grad_min_sv": 1.141585580797036e-08,
+ "grad_condition": 604353313.9340062,
+ "lr": 0.0003960441545911199,
+ "time_sec": 15.515930414199829
+ },
+ {
+ "epoch": 86,
+ "train_loss": 0.31695827428817747,
+ "train_acc": 0.8967,
+ "test_loss": 1.9341052951812745,
+ "test_acc": 0.5998,
+ "lyapunov": null,
+ "grad_norm": 0.6323196704290217,
+ "grad_max_sv": 0.30049107149243354,
+ "grad_min_sv": 1.1364172216449253e-08,
+ "grad_condition": 253780845.1911161,
+ "lr": 0.0003858245649446718,
+ "time_sec": 15.52891731262207
+ },
+ {
+ "epoch": 87,
+ "train_loss": 0.310550309715271,
+ "train_acc": 0.8979,
+ "test_loss": 1.9645798837661743,
+ "test_acc": 0.5972,
+ "lyapunov": null,
+ "grad_norm": 0.6290293549615046,
+ "grad_max_sv": 0.28168079666793344,
+ "grad_min_sv": 1.1139878612566237e-08,
+ "grad_condition": 3174828807.3372684,
+ "lr": 0.00037565505641757235,
+ "time_sec": 15.527303218841553
+ },
+ {
+ "epoch": 88,
+ "train_loss": 0.30801844054222105,
+ "train_acc": 0.89982,
+ "test_loss": 1.9113462907791137,
+ "test_acc": 0.6061,
+ "lyapunov": null,
+ "grad_norm": 0.6261342549488306,
+ "grad_max_sv": 0.2938710656017065,
+ "grad_min_sv": 1.1276199778260943e-08,
+ "grad_condition": 166623199.75638226,
+ "lr": 0.00036554008969236695,
+ "time_sec": 15.515942573547363
+ },
+ {
+ "epoch": 89,
+ "train_loss": 0.3031072138786316,
+ "train_acc": 0.90226,
+ "test_loss": 1.932079137611389,
+ "test_acc": 0.6084,
+ "lyapunov": null,
+ "grad_norm": 0.6209363139222046,
+ "grad_max_sv": 0.2818705204874277,
+ "grad_min_sv": 1.0986600190287382e-08,
+ "grad_condition": 235648712.41506353,
+ "lr": 0.0003554841015277638,
+ "time_sec": 15.523046731948853
+ },
+ {
+ "epoch": 90,
+ "train_loss": 0.295468587474823,
+ "train_acc": 0.90442,
+ "test_loss": 1.9561836023330688,
+ "test_acc": 0.6029,
+ "lyapunov": null,
+ "grad_norm": 0.6134434549386554,
+ "grad_max_sv": 0.28373970463871956,
+ "grad_min_sv": 1.1000367631294056e-08,
+ "grad_condition": 371761681.0452756,
+ "lr": 0.000345491502812526,
+ "time_sec": 15.52297592163086
+ },
+ {
+ "epoch": 91,
+ "train_loss": 0.29119554637908934,
+ "train_acc": 0.90446,
+ "test_loss": 1.993441968536377,
+ "test_acc": 0.6049,
+ "lyapunov": null,
+ "grad_norm": 0.6105333020567495,
+ "grad_max_sv": 0.27541381642222407,
+ "grad_min_sv": 1.0823096196089371e-08,
+ "grad_condition": 473734139.3827542,
+ "lr": 0.0003355666766307081,
+ "time_sec": 15.514235258102417
+ },
+ {
+ "epoch": 92,
+ "train_loss": 0.28460477176189425,
+ "train_acc": 0.90876,
+ "test_loss": 1.9682166564941406,
+ "test_acc": 0.6057,
+ "lyapunov": null,
+ "grad_norm": 0.5988483508766865,
+ "grad_max_sv": 0.27126791067421435,
+ "grad_min_sv": 1.0722518893266364e-08,
+ "grad_condition": 97668951.32032181,
+ "lr": 0.00032571397633909225,
+ "time_sec": 15.52116084098816
+ },
+ {
+ "epoch": 93,
+ "train_loss": 0.2825835990524292,
+ "train_acc": 0.90854,
+ "test_loss": 1.9348359714508057,
+ "test_acc": 0.6041,
+ "lyapunov": null,
+ "grad_norm": 0.6011972747002627,
+ "grad_max_sv": 0.2796713523566723,
+ "grad_min_sv": 1.0827668426964532e-08,
+ "grad_condition": 881127416.7703698,
+ "lr": 0.00031593772365766094,
+ "time_sec": 15.528529644012451
+ },
+ {
+ "epoch": 94,
+ "train_loss": 0.2801620689296722,
+ "train_acc": 0.9097,
+ "test_loss": 1.980628232383728,
+ "test_acc": 0.6055,
+ "lyapunov": null,
+ "grad_norm": 0.5993074321032092,
+ "grad_max_sv": 0.2800555154681206,
+ "grad_min_sv": 1.0468388221378244e-08,
+ "grad_condition": 140732695.72303194,
+ "lr": 0.0003062422067739483,
+ "time_sec": 15.532250165939331
+ },
+ {
+ "epoch": 95,
+ "train_loss": 0.26648273178100584,
+ "train_acc": 0.9142,
+ "test_loss": 2.0015383081436156,
+ "test_acc": 0.6016,
+ "lyapunov": null,
+ "grad_norm": 0.5881453904576209,
+ "grad_max_sv": 0.27579851634800434,
+ "grad_min_sv": 1.0274321395227492e-08,
+ "grad_condition": 201871276.47904783,
+ "lr": 0.00029663167846209965,
+ "time_sec": 15.681024551391602
+ },
+ {
+ "epoch": 96,
+ "train_loss": 0.26776352972984313,
+ "train_acc": 0.91448,
+ "test_loss": 2.0207461967468263,
+ "test_acc": 0.6012,
+ "lyapunov": null,
+ "grad_norm": 0.5860462649686203,
+ "grad_max_sv": 0.2698933105915785,
+ "grad_min_sv": 1.0329826621857664e-08,
+ "grad_condition": 76135409.2144176,
+ "lr": 0.00028711035421746345,
+ "time_sec": 15.536462545394897
+ },
+ {
+ "epoch": 97,
+ "train_loss": 0.25857464953899384,
+ "train_acc": 0.91696,
+ "test_loss": 1.9442026258468628,
+ "test_acc": 0.6066,
+ "lyapunov": null,
+ "grad_norm": 0.579918050497587,
+ "grad_max_sv": 0.28092321269214154,
+ "grad_min_sv": 1.0451780512853865e-08,
+ "grad_condition": 432604154.8635365,
+ "lr": 0.00027768241040753615,
+ "time_sec": 15.520632982254028
+ },
+ {
+ "epoch": 98,
+ "train_loss": 0.2567158591556549,
+ "train_acc": 0.91576,
+ "test_loss": 1.952080411529541,
+ "test_acc": 0.6097,
+ "lyapunov": null,
+ "grad_norm": 0.5815827800021661,
+ "grad_max_sv": 0.26784452944993975,
+ "grad_min_sv": 9.97831211164979e-09,
+ "grad_condition": 91061008.30272922,
+ "lr": 0.00026835198244006903,
+ "time_sec": 15.535520553588867
+ },
+ {
+ "epoch": 99,
+ "train_loss": 0.24892670249938964,
+ "train_acc": 0.9202,
+ "test_loss": 2.033794689941406,
+ "test_acc": 0.6019,
+ "lyapunov": null,
+ "grad_norm": 0.5696851893969495,
+ "grad_max_sv": 0.2726339440792799,
+ "grad_min_sv": 9.946045926049683e-09,
+ "grad_condition": 1696689541.1727843,
+ "lr": 0.0002591231629491421,
+ "time_sec": 15.538635969161987
+ },
+ {
+ "epoch": 100,
+ "train_loss": 0.24926711993694306,
+ "train_acc": 0.91978,
+ "test_loss": 1.9742811960220337,
+ "test_acc": 0.6068,
+ "lyapunov": null,
+ "grad_norm": 0.5702583833389835,
+ "grad_max_sv": 0.26799715869128704,
+ "grad_min_sv": 9.895174417351438e-09,
+ "grad_condition": 297572156.6297859,
+ "lr": 0.0002499999999999997,
+ "time_sec": 15.536820650100708
+ },
+ {
+ "epoch": 101,
+ "train_loss": 0.2401547999382019,
+ "train_acc": 0.92344,
+ "test_loss": 1.99689197101593,
+ "test_acc": 0.6077,
+ "lyapunov": null,
+ "grad_norm": 0.5610283078331603,
+ "grad_max_sv": 0.2691540464758873,
+ "grad_min_sv": 9.99432525588921e-09,
+ "grad_condition": 545457041.2762839,
+ "lr": 0.00024098649531343477,
+ "time_sec": 15.541125774383545
+ },
+ {
+ "epoch": 102,
+ "train_loss": 0.2366540629529953,
+ "train_acc": 0.92332,
+ "test_loss": 1.9686679859161378,
+ "test_acc": 0.6043,
+ "lyapunov": null,
+ "grad_norm": 0.5596319863447712,
+ "grad_max_sv": 0.2598999205976725,
+ "grad_min_sv": 9.748093400801378e-09,
+ "grad_condition": 280631646.0385326,
+ "lr": 0.0002320866025105016,
+ "time_sec": 15.642221689224243
+ },
+ {
+ "epoch": 103,
+ "train_loss": 0.23095350846290588,
+ "train_acc": 0.92478,
+ "test_loss": 1.9796740842819214,
+ "test_acc": 0.6086,
+ "lyapunov": null,
+ "grad_norm": 0.5527105531261713,
+ "grad_max_sv": 0.2648670017719269,
+ "grad_min_sv": 1.0250657645751934e-08,
+ "grad_condition": 501602567.1069907,
+ "lr": 0.0002233042253783278,
+ "time_sec": 15.533202886581421
+ },
+ {
+ "epoch": 104,
+ "train_loss": 0.23427851341247558,
+ "train_acc": 0.92466,
+ "test_loss": 1.9721594404220582,
+ "test_acc": 0.6107,
+ "lyapunov": null,
+ "grad_norm": 0.5589041472139786,
+ "grad_max_sv": 0.25932734124362466,
+ "grad_min_sv": 9.605904077877003e-09,
+ "grad_condition": 1031803946.0677515,
+ "lr": 0.000214643216157784,
+ "time_sec": 15.51241683959961
+ },
+ {
+ "epoch": 105,
+ "train_loss": 0.219517624874115,
+ "train_acc": 0.9293,
+ "test_loss": 2.0007881326675414,
+ "test_acc": 0.6035,
+ "lyapunov": null,
+ "grad_norm": 0.5422594048752922,
+ "grad_max_sv": 0.2685978960245848,
+ "grad_min_sv": 9.883629456617499e-09,
+ "grad_condition": 224740616.11832863,
+ "lr": 0.00020610737385376332,
+ "time_sec": 15.537052392959595
+ },
+ {
+ "epoch": 106,
+ "train_loss": 0.2232757794523239,
+ "train_acc": 0.92674,
+ "test_loss": 2.0058324546813964,
+ "test_acc": 0.6093,
+ "lyapunov": null,
+ "grad_norm": 0.5472900635805251,
+ "grad_max_sv": 0.2613681871443987,
+ "grad_min_sv": 9.819886173656478e-09,
+ "grad_condition": 176319742.57465333,
+ "lr": 0.00019770044256881242,
+ "time_sec": 15.542799949645996
+ },
+ {
+ "epoch": 107,
+ "train_loss": 0.21997562067031862,
+ "train_acc": 0.92926,
+ "test_loss": 1.989624990081787,
+ "test_acc": 0.6099,
+ "lyapunov": null,
+ "grad_norm": 0.5414473725256549,
+ "grad_max_sv": 0.2557095166295767,
+ "grad_min_sv": 9.448845216301038e-09,
+ "grad_condition": 1407753979.8512912,
+ "lr": 0.0001894261098608447,
+ "time_sec": 15.52652359008789
+ },
+ {
+ "epoch": 108,
+ "train_loss": 0.2132127531719208,
+ "train_acc": 0.93122,
+ "test_loss": 2.043244864463806,
+ "test_acc": 0.6013,
+ "lyapunov": null,
+ "grad_norm": 0.5380471333664735,
+ "grad_max_sv": 0.255327982082963,
+ "grad_min_sv": 9.992253989770521e-09,
+ "grad_condition": 429655462.4469593,
+ "lr": 0.000181288005125655,
+ "time_sec": 15.52126145362854
+ },
+ {
+ "epoch": 109,
+ "train_loss": 0.21187591857910157,
+ "train_acc": 0.93122,
+ "test_loss": 1.9954864723205565,
+ "test_acc": 0.6098,
+ "lyapunov": null,
+ "grad_norm": 0.5380204381544875,
+ "grad_max_sv": 0.26441522017121316,
+ "grad_min_sv": 9.557367238854226e-09,
+ "grad_condition": 237566723.1979712,
+ "lr": 0.0001732896980049473,
+ "time_sec": 15.548521995544434
+ },
+ {
+ "epoch": 110,
+ "train_loss": 0.20928363649368287,
+ "train_acc": 0.9326,
+ "test_loss": 1.9480315828323365,
+ "test_acc": 0.6146,
+ "lyapunov": null,
+ "grad_norm": 0.5298971206452113,
+ "grad_max_sv": 0.26398450396955014,
+ "grad_min_sv": 9.874217052428108e-09,
+ "grad_condition": 197519783.8891028,
+ "lr": 0.00016543469682057076,
+ "time_sec": 15.51990032196045
+ },
+ {
+ "epoch": 111,
+ "train_loss": 0.20472501375198365,
+ "train_acc": 0.93442,
+ "test_loss": 1.9880135498046876,
+ "test_acc": 0.6114,
+ "lyapunov": null,
+ "grad_norm": 0.5226715722616327,
+ "grad_max_sv": 0.25575212091207505,
+ "grad_min_sv": 9.559482279462156e-09,
+ "grad_condition": 213563040.67873913,
+ "lr": 0.00015772644703565552,
+ "time_sec": 15.518001079559326
+ },
+ {
+ "epoch": 112,
+ "train_loss": 0.20579987778663636,
+ "train_acc": 0.93296,
+ "test_loss": 2.016691120529175,
+ "test_acc": 0.6117,
+ "lyapunov": null,
+ "grad_norm": 0.5297683532569843,
+ "grad_max_sv": 0.25805489346385,
+ "grad_min_sv": 9.560597037899625e-09,
+ "grad_condition": 1064723629.28162,
+ "lr": 0.00015016832974331713,
+ "time_sec": 15.522767305374146
+ },
+ {
+ "epoch": 113,
+ "train_loss": 0.20068273310422896,
+ "train_acc": 0.93668,
+ "test_loss": 2.0594107456207276,
+ "test_acc": 0.6086,
+ "lyapunov": null,
+ "grad_norm": 0.5184460551642818,
+ "grad_max_sv": 0.24561816416680812,
+ "grad_min_sv": 9.581332657826458e-09,
+ "grad_condition": 364510178.3461688,
+ "lr": 0.00014276366018359834,
+ "time_sec": 15.533010005950928
+ },
+ {
+ "epoch": 114,
+ "train_loss": 0.19722092057228088,
+ "train_acc": 0.93788,
+ "test_loss": 2.008504161453247,
+ "test_acc": 0.6083,
+ "lyapunov": null,
+ "grad_norm": 0.5143544627139274,
+ "grad_max_sv": 0.26034388653934004,
+ "grad_min_sv": 9.650303647423114e-09,
+ "grad_condition": 3361687889.542286,
+ "lr": 0.00013551568628929425,
+ "time_sec": 15.531035661697388
+ },
+ {
+ "epoch": 115,
+ "train_loss": 0.19389657697677612,
+ "train_acc": 0.93868,
+ "test_loss": 2.0233098300933836,
+ "test_acc": 0.6117,
+ "lyapunov": null,
+ "grad_norm": 0.5104261903820102,
+ "grad_max_sv": 0.24447884745895862,
+ "grad_min_sv": 9.077133606870055e-09,
+ "grad_condition": 461064774.41410434,
+ "lr": 0.00012842758726130276,
+ "time_sec": 15.524327993392944
+ },
+ {
+ "epoch": 116,
+ "train_loss": 0.19362226080417633,
+ "train_acc": 0.93796,
+ "test_loss": 2.053111413192749,
+ "test_acc": 0.6054,
+ "lyapunov": null,
+ "grad_norm": 0.5131743880915615,
+ "grad_max_sv": 0.2492377854883671,
+ "grad_min_sv": 9.515753446841246e-09,
+ "grad_condition": 206396866.4016946,
+ "lr": 0.0001215024721741218,
+ "time_sec": 15.513204574584961
+ },
+ {
+ "epoch": 117,
+ "train_loss": 0.18898310523986817,
+ "train_acc": 0.93976,
+ "test_loss": 2.015893176269531,
+ "test_acc": 0.6127,
+ "lyapunov": null,
+ "grad_norm": 0.5048514988009624,
+ "grad_max_sv": 0.23975766226649284,
+ "grad_min_sv": 9.193109389200611e-09,
+ "grad_condition": 1880002960.4112122,
+ "lr": 0.00011474337861210538,
+ "time_sec": 15.531865119934082
+ },
+ {
+ "epoch": 118,
+ "train_loss": 0.18859933629989625,
+ "train_acc": 0.93992,
+ "test_loss": 2.0275477882385253,
+ "test_acc": 0.613,
+ "lyapunov": null,
+ "grad_norm": 0.5070579132326548,
+ "grad_max_sv": 0.2569826778024435,
+ "grad_min_sv": 9.573198521970264e-09,
+ "grad_condition": 946919734.9405922,
+ "lr": 0.00010815327133708009,
+ "time_sec": 15.528860330581665
+ },
+ {
+ "epoch": 119,
+ "train_loss": 0.18436414319992064,
+ "train_acc": 0.9409,
+ "test_loss": 2.035816400527954,
+ "test_acc": 0.6094,
+ "lyapunov": null,
+ "grad_norm": 0.49869022882133546,
+ "grad_max_sv": 0.24773051403462887,
+ "grad_min_sv": 9.154285843075704e-09,
+ "grad_condition": 330957531.4847302,
+ "lr": 0.00010173504098790182,
+ "time_sec": 15.546629190444946
+ },
+ {
+ "epoch": 120,
+ "train_loss": 0.18639450643777847,
+ "train_acc": 0.94082,
+ "test_loss": 2.0497810037612916,
+ "test_acc": 0.6101,
+ "lyapunov": null,
+ "grad_norm": 0.5054264593475204,
+ "grad_max_sv": 0.24650247804820538,
+ "grad_min_sv": 9.350194245597021e-09,
+ "grad_condition": 546741093.3651453,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 15.52673053741455
+ },
+ {
+ "epoch": 121,
+ "train_loss": 0.18135397327423095,
+ "train_acc": 0.94364,
+ "test_loss": 2.0228085262298583,
+ "test_acc": 0.6112,
+ "lyapunov": null,
+ "grad_norm": 0.49196950746055856,
+ "grad_max_sv": 0.25292878448963163,
+ "grad_min_sv": 9.245442955446368e-09,
+ "grad_condition": 345415022.7201654,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 15.530716180801392
+ },
+ {
+ "epoch": 122,
+ "train_loss": 0.17821871382713317,
+ "train_acc": 0.94288,
+ "test_loss": 2.015850890350342,
+ "test_acc": 0.6127,
+ "lyapunov": null,
+ "grad_norm": 0.4943397097989714,
+ "grad_max_sv": 0.2537323322147131,
+ "grad_min_sv": 9.237968556525395e-09,
+ "grad_condition": 263035591.43015513,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 15.536164045333862
+ },
+ {
+ "epoch": 123,
+ "train_loss": 0.17632093348026276,
+ "train_acc": 0.9444,
+ "test_loss": 2.029286048698425,
+ "test_acc": 0.6089,
+ "lyapunov": null,
+ "grad_norm": 0.48806288568095135,
+ "grad_max_sv": 0.2458991575986147,
+ "grad_min_sv": 9.06146269260763e-09,
+ "grad_condition": 386283353.8532323,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 15.518115997314453
+ },
+ {
+ "epoch": 124,
+ "train_loss": 0.1732941804933548,
+ "train_acc": 0.94456,
+ "test_loss": 2.099158185958862,
+ "test_acc": 0.6025,
+ "lyapunov": null,
+ "grad_norm": 0.4868912892942884,
+ "grad_max_sv": 0.24448585212230683,
+ "grad_min_sv": 8.980524343182167e-09,
+ "grad_condition": 336891094.31355625,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 15.542467832565308
+ },
+ {
+ "epoch": 125,
+ "train_loss": 0.17837541491031647,
+ "train_acc": 0.94274,
+ "test_loss": 2.0764820568084716,
+ "test_acc": 0.61,
+ "lyapunov": null,
+ "grad_norm": 0.4948203710715524,
+ "grad_max_sv": 0.24412455931305885,
+ "grad_min_sv": 9.184420232503931e-09,
+ "grad_condition": 716346437.4859622,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 15.55189299583435
+ },
+ {
+ "epoch": 126,
+ "train_loss": 0.1735024337530136,
+ "train_acc": 0.94474,
+ "test_loss": 2.0553098888397217,
+ "test_acc": 0.6111,
+ "lyapunov": null,
+ "grad_norm": 0.4854349633437902,
+ "grad_max_sv": 0.2419682189822197,
+ "grad_min_sv": 8.905077519393705e-09,
+ "grad_condition": 839365296.5454277,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 15.54058313369751
+ },
+ {
+ "epoch": 127,
+ "train_loss": 0.1715146116065979,
+ "train_acc": 0.94478,
+ "test_loss": 2.0106375900268554,
+ "test_acc": 0.6128,
+ "lyapunov": null,
+ "grad_norm": 0.4816957588601112,
+ "grad_max_sv": 0.23674072176218033,
+ "grad_min_sv": 8.675588131831085e-09,
+ "grad_condition": 478973714.0473558,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 15.529821157455444
+ },
+ {
+ "epoch": 128,
+ "train_loss": 0.1660640141773224,
+ "train_acc": 0.9478,
+ "test_loss": 2.0750678112030028,
+ "test_acc": 0.6111,
+ "lyapunov": null,
+ "grad_norm": 0.4757528664416431,
+ "grad_max_sv": 0.244390731677413,
+ "grad_min_sv": 8.79119548703039e-09,
+ "grad_condition": 457083152.2974655,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 15.54984712600708
+ },
+ {
+ "epoch": 129,
+ "train_loss": 0.1666716690993309,
+ "train_acc": 0.94686,
+ "test_loss": 2.0469725986480714,
+ "test_acc": 0.6123,
+ "lyapunov": null,
+ "grad_norm": 0.478310500713372,
+ "grad_max_sv": 0.23569908998906614,
+ "grad_min_sv": 8.542899999821468e-09,
+ "grad_condition": 598853903.3316209,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 15.545772552490234
+ },
+ {
+ "epoch": 130,
+ "train_loss": 0.16598962943553924,
+ "train_acc": 0.94712,
+ "test_loss": 1.9995166748046875,
+ "test_acc": 0.6146,
+ "lyapunov": null,
+ "grad_norm": 0.4758526221040286,
+ "grad_max_sv": 0.23986518271267415,
+ "grad_min_sv": 8.749124542689266e-09,
+ "grad_condition": 608746268.1362782,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 15.54599404335022
+ },
+ {
+ "epoch": 131,
+ "train_loss": 0.16668007793426515,
+ "train_acc": 0.9479,
+ "test_loss": 2.0491572677612306,
+ "test_acc": 0.6109,
+ "lyapunov": null,
+ "grad_norm": 0.4755344205180913,
+ "grad_max_sv": 0.23323244228959084,
+ "grad_min_sv": 8.472622621633757e-09,
+ "grad_condition": 233979199.2625857,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 15.524599552154541
+ },
+ {
+ "epoch": 132,
+ "train_loss": 0.16224975943565367,
+ "train_acc": 0.94862,
+ "test_loss": 2.0500082311630248,
+ "test_acc": 0.6134,
+ "lyapunov": null,
+ "grad_norm": 0.46871867660355254,
+ "grad_max_sv": 0.2372895274311304,
+ "grad_min_sv": 8.64411044331978e-09,
+ "grad_condition": 287263322.167899,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 15.527011156082153
+ },
+ {
+ "epoch": 133,
+ "train_loss": 0.16492341012477874,
+ "train_acc": 0.94736,
+ "test_loss": 2.0346584928512574,
+ "test_acc": 0.6142,
+ "lyapunov": null,
+ "grad_norm": 0.47534738241769,
+ "grad_max_sv": 0.24461643844842912,
+ "grad_min_sv": 9.178972258834517e-09,
+ "grad_condition": 500309812.0406585,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 15.547746658325195
+ },
+ {
+ "epoch": 134,
+ "train_loss": 0.16421831488609315,
+ "train_acc": 0.94756,
+ "test_loss": 2.0132702159881593,
+ "test_acc": 0.6162,
+ "lyapunov": null,
+ "grad_norm": 0.4772419829809968,
+ "grad_max_sv": 0.23413821049034594,
+ "grad_min_sv": 9.002530253383878e-09,
+ "grad_condition": 363205059.0549506,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 15.531517505645752
+ },
+ {
+ "epoch": 135,
+ "train_loss": 0.16381137976646423,
+ "train_acc": 0.94842,
+ "test_loss": 2.0648642013549803,
+ "test_acc": 0.6083,
+ "lyapunov": null,
+ "grad_norm": 0.4736658227067323,
+ "grad_max_sv": 0.23049395270645617,
+ "grad_min_sv": 8.56864400186879e-09,
+ "grad_condition": 1442465508.733611,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 15.541293859481812
+ },
+ {
+ "epoch": 136,
+ "train_loss": 0.16108462400436402,
+ "train_acc": 0.94976,
+ "test_loss": 2.0012967403411865,
+ "test_acc": 0.6119,
+ "lyapunov": null,
+ "grad_norm": 0.465643715209168,
+ "grad_max_sv": 0.23518772274255753,
+ "grad_min_sv": 8.637825488558292e-09,
+ "grad_condition": 243388926.8874995,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 15.512713193893433
+ },
+ {
+ "epoch": 137,
+ "train_loss": 0.1584918847179413,
+ "train_acc": 0.94912,
+ "test_loss": 2.050839980697632,
+ "test_acc": 0.6104,
+ "lyapunov": null,
+ "grad_norm": 0.46730923038258504,
+ "grad_max_sv": 0.23510748259723185,
+ "grad_min_sv": 8.813612497248977e-09,
+ "grad_condition": 1210234116.5017686,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 15.537960052490234
+ },
+ {
+ "epoch": 138,
+ "train_loss": 0.15678886548519136,
+ "train_acc": 0.9508,
+ "test_loss": 2.0579080810546877,
+ "test_acc": 0.6137,
+ "lyapunov": null,
+ "grad_norm": 0.46202513180941285,
+ "grad_max_sv": 0.22975999489426613,
+ "grad_min_sv": 8.437959897781514e-09,
+ "grad_condition": 1365594635.574403,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 15.53256607055664
+ },
+ {
+ "epoch": 139,
+ "train_loss": 0.15868934306621552,
+ "train_acc": 0.95058,
+ "test_loss": 2.0891008211135866,
+ "test_acc": 0.607,
+ "lyapunov": null,
+ "grad_norm": 0.46370376954923076,
+ "grad_max_sv": 0.239790453761816,
+ "grad_min_sv": 8.653809858939418e-09,
+ "grad_condition": 751331866.6462338,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 15.542593002319336
+ },
+ {
+ "epoch": 140,
+ "train_loss": 0.16018940447807312,
+ "train_acc": 0.94944,
+ "test_loss": 2.0365436012268066,
+ "test_acc": 0.6134,
+ "lyapunov": null,
+ "grad_norm": 0.46850944550951273,
+ "grad_max_sv": 0.24336591213941575,
+ "grad_min_sv": 8.69392097297767e-09,
+ "grad_condition": 6372417042.7504635,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 15.530508279800415
+ },
+ {
+ "epoch": 141,
+ "train_loss": 0.1577048332262039,
+ "train_acc": 0.95192,
+ "test_loss": 2.048553763961792,
+ "test_acc": 0.6177,
+ "lyapunov": null,
+ "grad_norm": 0.46173934960898333,
+ "grad_max_sv": 0.2323433578014374,
+ "grad_min_sv": 8.582540832018093e-09,
+ "grad_condition": 374128300.47680604,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 15.53349781036377
+ },
+ {
+ "epoch": 142,
+ "train_loss": 0.15599479459762572,
+ "train_acc": 0.95136,
+ "test_loss": 2.0303194038391115,
+ "test_acc": 0.6141,
+ "lyapunov": null,
+ "grad_norm": 0.46112847461678763,
+ "grad_max_sv": 0.23407747074961663,
+ "grad_min_sv": 8.815537186779992e-09,
+ "grad_condition": 888764932.2294099,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 15.521865129470825
+ },
+ {
+ "epoch": 143,
+ "train_loss": 0.1572772634601593,
+ "train_acc": 0.95076,
+ "test_loss": 2.015152719116211,
+ "test_acc": 0.6117,
+ "lyapunov": null,
+ "grad_norm": 0.46482832090967446,
+ "grad_max_sv": 0.23328317552804947,
+ "grad_min_sv": 8.496040210356943e-09,
+ "grad_condition": 794958780.6842709,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 15.530633926391602
+ },
+ {
+ "epoch": 144,
+ "train_loss": 0.1607058820438385,
+ "train_acc": 0.94982,
+ "test_loss": 2.028663912010193,
+ "test_acc": 0.6144,
+ "lyapunov": null,
+ "grad_norm": 0.46757658167064325,
+ "grad_max_sv": 0.23105027191340924,
+ "grad_min_sv": 8.55830176145836e-09,
+ "grad_condition": 1653881177.8200665,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 15.53608751296997
+ },
+ {
+ "epoch": 145,
+ "train_loss": 0.1565204811191559,
+ "train_acc": 0.95166,
+ "test_loss": 2.0279767280578613,
+ "test_acc": 0.6155,
+ "lyapunov": null,
+ "grad_norm": 0.4638655873772094,
+ "grad_max_sv": 0.23327881954610347,
+ "grad_min_sv": 8.597103550930796e-09,
+ "grad_condition": 316875488.0827421,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 15.526829719543457
+ },
+ {
+ "epoch": 146,
+ "train_loss": 0.15728166580677033,
+ "train_acc": 0.95086,
+ "test_loss": 1.9891761138916015,
+ "test_acc": 0.6145,
+ "lyapunov": null,
+ "grad_norm": 0.46488895344189896,
+ "grad_max_sv": 0.24002570435404777,
+ "grad_min_sv": 8.740120454957777e-09,
+ "grad_condition": 455470499.4939662,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 15.529450178146362
+ },
+ {
+ "epoch": 147,
+ "train_loss": 0.15490476808547973,
+ "train_acc": 0.95148,
+ "test_loss": 2.058331818771362,
+ "test_acc": 0.61,
+ "lyapunov": null,
+ "grad_norm": 0.46221701830974254,
+ "grad_max_sv": 0.2296001013368368,
+ "grad_min_sv": 8.541372666505225e-09,
+ "grad_condition": 659563768.7689784,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 15.537895441055298
+ },
+ {
+ "epoch": 148,
+ "train_loss": 0.15796600056648255,
+ "train_acc": 0.94986,
+ "test_loss": 2.0414266393661498,
+ "test_acc": 0.6093,
+ "lyapunov": null,
+ "grad_norm": 0.46494816666423244,
+ "grad_max_sv": 0.2453433360904455,
+ "grad_min_sv": 8.874223652883401e-09,
+ "grad_condition": 791324939.5663835,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 15.552018165588379
+ },
+ {
+ "epoch": 149,
+ "train_loss": 0.1572165874862671,
+ "train_acc": 0.9503,
+ "test_loss": 2.0304482383728026,
+ "test_acc": 0.6163,
+ "lyapunov": null,
+ "grad_norm": 0.46454324009038384,
+ "grad_max_sv": 0.23642796650528908,
+ "grad_min_sv": 8.51550397435591e-09,
+ "grad_condition": 463955776.24121666,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 15.526931762695312
+ },
+ {
+ "epoch": 150,
+ "train_loss": 0.15873465202331544,
+ "train_acc": 0.94998,
+ "test_loss": 2.0263592735290525,
+ "test_acc": 0.6123,
+ "lyapunov": null,
+ "grad_norm": 0.46823921364683874,
+ "grad_max_sv": 0.24224489107728003,
+ "grad_min_sv": 8.409305788867338e-09,
+ "grad_condition": 491457160.41681844,
+ "lr": 0.0,
+ "time_sec": 15.518765687942505
+ }
+ ],
+ "8": [
+ {
+ "epoch": 1,
+ "train_loss": 4.593809753570556,
+ "train_acc": 0.06056,
+ "test_loss": 4.250240661239624,
+ "test_acc": 0.0724,
+ "lyapunov": null,
+ "grad_norm": 6.28680857536701,
+ "grad_max_sv": 5.32494820356369,
+ "grad_min_sv": 1.0926536573307998e-07,
+ "grad_condition": 75430538.96608621,
+ "lr": 0.0009998903417374227,
+ "time_sec": 32.64524722099304
+ },
+ {
+ "epoch": 2,
+ "train_loss": 3.8781360272216796,
+ "train_acc": 0.12202,
+ "test_loss": 3.828091265106201,
+ "test_acc": 0.1187,
+ "lyapunov": null,
+ "grad_norm": 4.685766976401904,
+ "grad_max_sv": 3.971551901102066,
+ "grad_min_sv": 8.512232171353773e-08,
+ "grad_condition": 73925683.02884856,
+ "lr": 0.0009995614150494292,
+ "time_sec": 32.55369710922241
+ },
+ {
+ "epoch": 3,
+ "train_loss": 3.5183256304931643,
+ "train_acc": 0.16986,
+ "test_loss": 3.603372495651245,
+ "test_acc": 0.1458,
+ "lyapunov": null,
+ "grad_norm": 3.857816495796443,
+ "grad_max_sv": 3.131850999593735,
+ "grad_min_sv": 7.069926738628718e-08,
+ "grad_condition": 597358447.7631978,
+ "lr": 0.0009990133642141358,
+ "time_sec": 32.61470580101013
+ },
+ {
+ "epoch": 4,
+ "train_loss": 3.2580047064208983,
+ "train_acc": 0.21016,
+ "test_loss": 3.3982357917785646,
+ "test_acc": 0.1898,
+ "lyapunov": null,
+ "grad_norm": 3.25322967284326,
+ "grad_max_sv": 2.4588119089603424,
+ "grad_min_sv": 6.045808895738247e-08,
+ "grad_condition": 47197928.09495263,
+ "lr": 0.0009982464296247522,
+ "time_sec": 32.569292306900024
+ },
+ {
+ "epoch": 5,
+ "train_loss": 3.0406500122070312,
+ "train_acc": 0.24896,
+ "test_loss": 3.1738818031311036,
+ "test_acc": 0.2326,
+ "lyapunov": null,
+ "grad_norm": 2.772030407825626,
+ "grad_max_sv": 1.9638817846775054,
+ "grad_min_sv": 5.119714804324715e-08,
+ "grad_condition": 73515114.69409783,
+ "lr": 0.0009972609476841367,
+ "time_sec": 32.59326457977295
+ },
+ {
+ "epoch": 6,
+ "train_loss": 2.8603873377227784,
+ "train_acc": 0.28122,
+ "test_loss": 3.040658945083618,
+ "test_acc": 0.2441,
+ "lyapunov": null,
+ "grad_norm": 2.406511937670546,
+ "grad_max_sv": 1.6028138607740403,
+ "grad_min_sv": 4.437380299870952e-08,
+ "grad_condition": 42435152.16608156,
+ "lr": 0.000996057350657239,
+ "time_sec": 32.59000778198242
+ },
+ {
+ "epoch": 7,
+ "train_loss": 2.696464497909546,
+ "train_acc": 0.3124,
+ "test_loss": 2.7883455558776857,
+ "test_acc": 0.3055,
+ "lyapunov": null,
+ "grad_norm": 2.1276389781637293,
+ "grad_max_sv": 1.321936309337616,
+ "grad_min_sv": 3.9740869406390546e-08,
+ "grad_condition": 38077617.12004892,
+ "lr": 0.000994636166481494,
+ "time_sec": 32.58612537384033
+ },
+ {
+ "epoch": 8,
+ "train_loss": 2.5476934342956543,
+ "train_acc": 0.34226,
+ "test_loss": 2.7284567352294924,
+ "test_acc": 0.3201,
+ "lyapunov": null,
+ "grad_norm": 1.9443800586445228,
+ "grad_max_sv": 1.1562949120998383,
+ "grad_min_sv": 3.6514397544484825e-08,
+ "grad_condition": 50793777.88100208,
+ "lr": 0.0009929980185352525,
+ "time_sec": 32.609519958496094
+ },
+ {
+ "epoch": 9,
+ "train_loss": 2.420484928741455,
+ "train_acc": 0.37,
+ "test_loss": 2.5651690574645998,
+ "test_acc": 0.3474,
+ "lyapunov": null,
+ "grad_norm": 1.7908327823271384,
+ "grad_max_sv": 0.9936118766665458,
+ "grad_min_sv": 3.386289501583484e-08,
+ "grad_condition": 38337683.052389994,
+ "lr": 0.0009911436253643444,
+ "time_sec": 32.608171224594116
+ },
+ {
+ "epoch": 10,
+ "train_loss": 2.3262426779937746,
+ "train_acc": 0.38734,
+ "test_loss": 2.4693000373840333,
+ "test_acc": 0.3722,
+ "lyapunov": null,
+ "grad_norm": 1.6585340858173223,
+ "grad_max_sv": 0.8407874166965484,
+ "grad_min_sv": 3.068910873760267e-08,
+ "grad_condition": 34328942.84679211,
+ "lr": 0.0009890738003669028,
+ "time_sec": 32.64034914970398
+ },
+ {
+ "epoch": 11,
+ "train_loss": 2.2108732919311525,
+ "train_acc": 0.41382,
+ "test_loss": 2.465538624572754,
+ "test_acc": 0.3705,
+ "lyapunov": null,
+ "grad_norm": 1.5729603360376456,
+ "grad_max_sv": 0.778350618481636,
+ "grad_min_sv": 2.959336372621024e-08,
+ "grad_condition": 73499461.7080038,
+ "lr": 0.00098678945143658,
+ "time_sec": 32.57490301132202
+ },
+ {
+ "epoch": 12,
+ "train_loss": 2.1315050006103515,
+ "train_acc": 0.4307,
+ "test_loss": 2.3204302642822268,
+ "test_acc": 0.3954,
+ "lyapunov": null,
+ "grad_norm": 1.5011321305083667,
+ "grad_max_sv": 0.699262747168541,
+ "grad_min_sv": 2.8460571517563427e-08,
+ "grad_condition": 48774252.99057761,
+ "lr": 0.0009842915805643154,
+ "time_sec": 32.6048150062561
+ },
+ {
+ "epoch": 13,
+ "train_loss": 2.0442165532684324,
+ "train_acc": 0.44988,
+ "test_loss": 2.376241368865967,
+ "test_acc": 0.3938,
+ "lyapunov": null,
+ "grad_norm": 1.4288710226212364,
+ "grad_max_sv": 0.651852785050869,
+ "grad_min_sv": 2.6736829209427978e-08,
+ "grad_condition": 911183246.0701777,
+ "lr": 0.000981581283398829,
+ "time_sec": 32.5588493347168
+ },
+ {
+ "epoch": 14,
+ "train_loss": 1.9779467534637452,
+ "train_acc": 0.46564,
+ "test_loss": 2.3095103010177613,
+ "test_acc": 0.3997,
+ "lyapunov": null,
+ "grad_norm": 1.3745196502469326,
+ "grad_max_sv": 0.6157992795109749,
+ "grad_min_sv": 2.619163226788568e-08,
+ "grad_condition": 133496832.32967322,
+ "lr": 0.0009786597487660333,
+ "time_sec": 32.544082164764404
+ },
+ {
+ "epoch": 15,
+ "train_loss": 1.9085535586547853,
+ "train_acc": 0.48116,
+ "test_loss": 2.277028215789795,
+ "test_acc": 0.4192,
+ "lyapunov": null,
+ "grad_norm": 1.3371637415095632,
+ "grad_max_sv": 0.6050588846206665,
+ "grad_min_sv": 2.4948501375562925e-08,
+ "grad_condition": 111100134.80615222,
+ "lr": 0.0009755282581475766,
+ "time_sec": 32.55138826370239
+ },
+ {
+ "epoch": 16,
+ "train_loss": 1.8528347210693359,
+ "train_acc": 0.49492,
+ "test_loss": 2.1695428279876707,
+ "test_acc": 0.4331,
+ "lyapunov": null,
+ "grad_norm": 1.2814778531944382,
+ "grad_max_sv": 0.5591228373348713,
+ "grad_min_sv": 2.4496722306199815e-08,
+ "grad_condition": 25867184.37629143,
+ "lr": 0.0009721881851187403,
+ "time_sec": 32.59131908416748
+ },
+ {
+ "epoch": 17,
+ "train_loss": 1.7864885725402833,
+ "train_acc": 0.5083,
+ "test_loss": 2.2167986530303954,
+ "test_acc": 0.428,
+ "lyapunov": null,
+ "grad_norm": 1.2365928586283268,
+ "grad_max_sv": 0.5188852399587631,
+ "grad_min_sv": 2.3400686853525254e-08,
+ "grad_condition": 39202676.90349869,
+ "lr": 0.0009686409947459456,
+ "time_sec": 32.55093550682068
+ },
+ {
+ "epoch": 18,
+ "train_loss": 1.7305231869888307,
+ "train_acc": 0.52088,
+ "test_loss": 2.1779684148788454,
+ "test_acc": 0.4405,
+ "lyapunov": null,
+ "grad_norm": 1.2047689336699439,
+ "grad_max_sv": 0.5065509222447873,
+ "grad_min_sv": 2.279239488256479e-08,
+ "grad_condition": 28341315.825680755,
+ "lr": 0.0009648882429441254,
+ "time_sec": 32.556524991989136
+ },
+ {
+ "epoch": 19,
+ "train_loss": 1.6774425074768067,
+ "train_acc": 0.53444,
+ "test_loss": 2.22588055267334,
+ "test_acc": 0.4357,
+ "lyapunov": null,
+ "grad_norm": 1.1702937955790653,
+ "grad_max_sv": 0.4866269282996655,
+ "grad_min_sv": 2.1823409551702255e-08,
+ "grad_condition": 34695081.35711311,
+ "lr": 0.00096093157579425,
+ "time_sec": 32.57441163063049
+ },
+ {
+ "epoch": 20,
+ "train_loss": 1.6186258012771606,
+ "train_acc": 0.54752,
+ "test_loss": 2.1861088802337645,
+ "test_acc": 0.4422,
+ "lyapunov": null,
+ "grad_norm": 1.1434442793867807,
+ "grad_max_sv": 0.4658520080149174,
+ "grad_min_sv": 2.124641216849632e-08,
+ "grad_condition": 35023634.55777504,
+ "lr": 0.0009567727288213001,
+ "time_sec": 32.563255071640015
+ },
+ {
+ "epoch": 21,
+ "train_loss": 1.5804412273406983,
+ "train_acc": 0.5552,
+ "test_loss": 2.116827065849304,
+ "test_acc": 0.4608,
+ "lyapunov": null,
+ "grad_norm": 1.1174809929853884,
+ "grad_max_sv": 0.4587864212691784,
+ "grad_min_sv": 2.115127252788618e-08,
+ "grad_condition": 25409623.926622026,
+ "lr": 0.0009524135262330095,
+ "time_sec": 32.548664808273315
+ },
+ {
+ "epoch": 22,
+ "train_loss": 1.5373576833343505,
+ "train_acc": 0.56826,
+ "test_loss": 2.188752991104126,
+ "test_acc": 0.4488,
+ "lyapunov": null,
+ "grad_norm": 1.0855473101193578,
+ "grad_max_sv": 0.43056059926748275,
+ "grad_min_sv": 2.025934667526652e-08,
+ "grad_condition": 28615900.007624805,
+ "lr": 0.0009478558801197061,
+ "time_sec": 32.611814737319946
+ },
+ {
+ "epoch": 23,
+ "train_loss": 1.506667826461792,
+ "train_acc": 0.57494,
+ "test_loss": 2.174818174743652,
+ "test_acc": 0.4577,
+ "lyapunov": null,
+ "grad_norm": 1.0696030802642686,
+ "grad_max_sv": 0.43318344950675963,
+ "grad_min_sv": 2.0166759195916484e-08,
+ "grad_condition": 43974441.149682686,
+ "lr": 0.000943101789615607,
+ "time_sec": 32.57555532455444
+ },
+ {
+ "epoch": 24,
+ "train_loss": 1.47097098236084,
+ "train_acc": 0.5857,
+ "test_loss": 2.0404002576828004,
+ "test_acc": 0.4847,
+ "lyapunov": null,
+ "grad_norm": 1.0479522200281932,
+ "grad_max_sv": 0.4198159731924534,
+ "grad_min_sv": 1.9698220292407863e-08,
+ "grad_condition": 45870756.831042506,
+ "lr": 0.0009381533400219313,
+ "time_sec": 32.5772430896759
+ },
+ {
+ "epoch": 25,
+ "train_loss": 1.4312325327301025,
+ "train_acc": 0.59378,
+ "test_loss": 2.106845015716553,
+ "test_acc": 0.4767,
+ "lyapunov": null,
+ "grad_norm": 1.0240308878342053,
+ "grad_max_sv": 0.41350489780306815,
+ "grad_min_sv": 1.9328133177981543e-08,
+ "grad_condition": 69115062.26987141,
+ "lr": 0.0009330127018922189,
+ "time_sec": 32.557268142700195
+ },
+ {
+ "epoch": 26,
+ "train_loss": 1.3932979926300049,
+ "train_acc": 0.60466,
+ "test_loss": 2.0442503452301026,
+ "test_acc": 0.4874,
+ "lyapunov": null,
+ "grad_norm": 1.0080444681764495,
+ "grad_max_sv": 0.39995783641934396,
+ "grad_min_sv": 1.8682676014569743e-08,
+ "grad_condition": 33480939.457173,
+ "lr": 0.000927682130080253,
+ "time_sec": 32.54329538345337
+ },
+ {
+ "epoch": 27,
+ "train_loss": 1.3626447483444213,
+ "train_acc": 0.61088,
+ "test_loss": 2.1529213762283326,
+ "test_acc": 0.4772,
+ "lyapunov": null,
+ "grad_norm": 0.9916083960305544,
+ "grad_max_sv": 0.38913136497139933,
+ "grad_min_sv": 1.803411719611403e-08,
+ "grad_condition": 125553964.7328368,
+ "lr": 0.0009221639627510072,
+ "time_sec": 32.55648422241211
+ },
+ {
+ "epoch": 28,
+ "train_loss": 1.332198992652893,
+ "train_acc": 0.6166,
+ "test_loss": 2.2807082765579225,
+ "test_acc": 0.4558,
+ "lyapunov": null,
+ "grad_norm": 0.9771496174881384,
+ "grad_max_sv": 0.39622113704681394,
+ "grad_min_sv": 1.8371455795529455e-08,
+ "grad_condition": 25402444.150790665,
+ "lr": 0.0009164606203550494,
+ "time_sec": 32.56743788719177
+ },
+ {
+ "epoch": 29,
+ "train_loss": 1.3056928281402589,
+ "train_acc": 0.62548,
+ "test_loss": 2.3650270275115965,
+ "test_acc": 0.4494,
+ "lyapunov": null,
+ "grad_norm": 0.9678089971160496,
+ "grad_max_sv": 0.3883704259991646,
+ "grad_min_sv": 1.808786349449809e-08,
+ "grad_condition": 34866235.35928585,
+ "lr": 0.0009105746045668516,
+ "time_sec": 32.53697896003723
+ },
+ {
+ "epoch": 30,
+ "train_loss": 1.2669909148025513,
+ "train_acc": 0.63598,
+ "test_loss": 2.194760869216919,
+ "test_acc": 0.4794,
+ "lyapunov": null,
+ "grad_norm": 0.9467141888064133,
+ "grad_max_sv": 0.3744235411286354,
+ "grad_min_sv": 1.7651215561236e-08,
+ "grad_condition": 139376880.96042347,
+ "lr": 0.0009045084971874733,
+ "time_sec": 32.55838894844055
+ },
+ {
+ "epoch": 31,
+ "train_loss": 1.2365936059951783,
+ "train_acc": 0.64152,
+ "test_loss": 2.251469213104248,
+ "test_acc": 0.4728,
+ "lyapunov": null,
+ "grad_norm": 0.9363746920375892,
+ "grad_max_sv": 0.3752880610525608,
+ "grad_min_sv": 1.7496447651810243e-08,
+ "grad_condition": 33435292.843927078,
+ "lr": 0.0008982649590120977,
+ "time_sec": 32.56987476348877
+ },
+ {
+ "epoch": 32,
+ "train_loss": 1.2132414292144775,
+ "train_acc": 0.6457,
+ "test_loss": 2.155212931251526,
+ "test_acc": 0.4953,
+ "lyapunov": null,
+ "grad_norm": 0.9198517753600641,
+ "grad_max_sv": 0.3622582726180553,
+ "grad_min_sv": 1.7169938390428767e-08,
+ "grad_condition": 301357597.1554047,
+ "lr": 0.0008918467286629196,
+ "time_sec": 32.644938468933105
+ },
+ {
+ "epoch": 33,
+ "train_loss": 1.184193948135376,
+ "train_acc": 0.654,
+ "test_loss": 2.2338722274780274,
+ "test_acc": 0.4833,
+ "lyapunov": null,
+ "grad_norm": 0.9078833042188178,
+ "grad_max_sv": 0.3615180656313896,
+ "grad_min_sv": 1.6779444181325154e-08,
+ "grad_condition": 31157779.01941774,
+ "lr": 0.0008852566213878943,
+ "time_sec": 32.592013359069824
+ },
+ {
+ "epoch": 34,
+ "train_loss": 1.1604648839569092,
+ "train_acc": 0.6605,
+ "test_loss": 2.144485057640076,
+ "test_acc": 0.4963,
+ "lyapunov": null,
+ "grad_norm": 0.8972811549201535,
+ "grad_max_sv": 0.34557069540023805,
+ "grad_min_sv": 1.606287251786076e-08,
+ "grad_condition": 75723670.78622702,
+ "lr": 0.000878497527825878,
+ "time_sec": 32.58034062385559
+ },
+ {
+ "epoch": 35,
+ "train_loss": 1.1375362993240357,
+ "train_acc": 0.66418,
+ "test_loss": 2.181222864341736,
+ "test_acc": 0.4898,
+ "lyapunov": null,
+ "grad_norm": 0.8889790406396809,
+ "grad_max_sv": 0.35035020038485526,
+ "grad_min_sv": 1.6642615324746756e-08,
+ "grad_condition": 30786547.22695731,
+ "lr": 0.000871572412738697,
+ "time_sec": 32.54904317855835
+ },
+ {
+ "epoch": 36,
+ "train_loss": 1.1133264205932618,
+ "train_acc": 0.67238,
+ "test_loss": 2.1131927043914795,
+ "test_acc": 0.5058,
+ "lyapunov": null,
+ "grad_norm": 0.8832491549304202,
+ "grad_max_sv": 0.34634757712483405,
+ "grad_min_sv": 1.6018088946911922e-08,
+ "grad_condition": 49284260.37621014,
+ "lr": 0.0008644843137107055,
+ "time_sec": 32.58738970756531
+ },
+ {
+ "epoch": 37,
+ "train_loss": 1.0785640783309935,
+ "train_acc": 0.67878,
+ "test_loss": 2.2109802129745484,
+ "test_acc": 0.4946,
+ "lyapunov": null,
+ "grad_norm": 0.8741999013148335,
+ "grad_max_sv": 0.3421505123376846,
+ "grad_min_sv": 1.5883508850886296e-08,
+ "grad_condition": 147125609.85023776,
+ "lr": 0.0008572363398164014,
+ "time_sec": 32.6028311252594
+ },
+ {
+ "epoch": 38,
+ "train_loss": 1.0444296839141847,
+ "train_acc": 0.68996,
+ "test_loss": 2.2259356287002565,
+ "test_acc": 0.4923,
+ "lyapunov": null,
+ "grad_norm": 0.8523318198837474,
+ "grad_max_sv": 0.33938159644603727,
+ "grad_min_sv": 1.5807346684382218e-08,
+ "grad_condition": 34226370.63225422,
+ "lr": 0.0008498316702566826,
+ "time_sec": 32.560999393463135
+ },
+ {
+ "epoch": 39,
+ "train_loss": 1.023456362953186,
+ "train_acc": 0.69698,
+ "test_loss": 2.1364882369995115,
+ "test_acc": 0.5049,
+ "lyapunov": null,
+ "grad_norm": 0.8498222777562341,
+ "grad_max_sv": 0.3415807694196701,
+ "grad_min_sv": 1.5869645431099144e-08,
+ "grad_condition": 27853151.39901676,
+ "lr": 0.0008422735529643442,
+ "time_sec": 32.56105279922485
+ },
+ {
+ "epoch": 40,
+ "train_loss": 1.0050300610351564,
+ "train_acc": 0.7014,
+ "test_loss": 2.150569340324402,
+ "test_acc": 0.5071,
+ "lyapunov": null,
+ "grad_norm": 0.8356269441634138,
+ "grad_max_sv": 0.3239683095365763,
+ "grad_min_sv": 1.5381535548204818e-08,
+ "grad_condition": 155224453.46718103,
+ "lr": 0.0008345653031794289,
+ "time_sec": 32.59518837928772
+ },
+ {
+ "epoch": 41,
+ "train_loss": 0.9930689501571656,
+ "train_acc": 0.7026,
+ "test_loss": 2.154064438056946,
+ "test_acc": 0.5136,
+ "lyapunov": null,
+ "grad_norm": 0.8262418740899825,
+ "grad_max_sv": 0.3324408046901226,
+ "grad_min_sv": 1.5276669600161607e-08,
+ "grad_condition": 51863928.79048334,
+ "lr": 0.0008267103019950526,
+ "time_sec": 32.57974171638489
+ },
+ {
+ "epoch": 42,
+ "train_loss": 0.957993507232666,
+ "train_acc": 0.7135,
+ "test_loss": 2.1310552421569824,
+ "test_acc": 0.5193,
+ "lyapunov": null,
+ "grad_norm": 0.8217377307572092,
+ "grad_max_sv": 0.31569988913834096,
+ "grad_min_sv": 1.4821617464605419e-08,
+ "grad_condition": 57225046.557756186,
+ "lr": 0.0008187119948743447,
+ "time_sec": 32.74825191497803
+ },
+ {
+ "epoch": 43,
+ "train_loss": 0.9496447095489502,
+ "train_acc": 0.71474,
+ "test_loss": 2.1654404600143433,
+ "test_acc": 0.5088,
+ "lyapunov": null,
+ "grad_norm": 0.8130839223264894,
+ "grad_max_sv": 0.32253594174981115,
+ "grad_min_sv": 1.506773582987675e-08,
+ "grad_condition": 93723846.88549985,
+ "lr": 0.000810573890139155,
+ "time_sec": 32.602092027664185
+ },
+ {
+ "epoch": 44,
+ "train_loss": 0.9342586210250855,
+ "train_acc": 0.71974,
+ "test_loss": 2.290501368904114,
+ "test_acc": 0.5013,
+ "lyapunov": null,
+ "grad_norm": 0.8096736459411619,
+ "grad_max_sv": 0.32218324691057204,
+ "grad_min_sv": 1.5053544679538565e-08,
+ "grad_condition": 44430049.08800385,
+ "lr": 0.0008022995574311873,
+ "time_sec": 32.594489097595215
+ },
+ {
+ "epoch": 45,
+ "train_loss": 0.9010325805664062,
+ "train_acc": 0.72686,
+ "test_loss": 2.4134263542175294,
+ "test_acc": 0.4913,
+ "lyapunov": null,
+ "grad_norm": 0.799116269115145,
+ "grad_max_sv": 0.31640069633722306,
+ "grad_min_sv": 1.5047001319934415e-08,
+ "grad_condition": 50608547.42886399,
+ "lr": 0.0007938926261462363,
+ "time_sec": 32.557663917541504
+ },
+ {
+ "epoch": 46,
+ "train_loss": 0.8911659923553467,
+ "train_acc": 0.73008,
+ "test_loss": 2.2884033529281615,
+ "test_acc": 0.5057,
+ "lyapunov": null,
+ "grad_norm": 0.7934582132141624,
+ "grad_max_sv": 0.31383398175239563,
+ "grad_min_sv": 1.4469329700584135e-08,
+ "grad_condition": 467744144.1725038,
+ "lr": 0.0007853567838422158,
+ "time_sec": 32.56327676773071
+ },
+ {
+ "epoch": 47,
+ "train_loss": 0.8638532521438599,
+ "train_acc": 0.73696,
+ "test_loss": 2.2446172203063965,
+ "test_acc": 0.5076,
+ "lyapunov": null,
+ "grad_norm": 0.7837979602809746,
+ "grad_max_sv": 0.31239640712738037,
+ "grad_min_sv": 1.4274264739655428e-08,
+ "grad_condition": 50193793.36053495,
+ "lr": 0.0007766957746216719,
+ "time_sec": 32.57334923744202
+ },
+ {
+ "epoch": 48,
+ "train_loss": 0.8375042049598694,
+ "train_acc": 0.74282,
+ "test_loss": 2.227299571418762,
+ "test_acc": 0.5202,
+ "lyapunov": null,
+ "grad_norm": 0.77427016194081,
+ "grad_max_sv": 0.31100503690540793,
+ "grad_min_sv": 1.4236399661915477e-08,
+ "grad_condition": 50469567.486968085,
+ "lr": 0.0007679133974894982,
+ "time_sec": 32.569188356399536
+ },
+ {
+ "epoch": 49,
+ "train_loss": 0.8221629112625122,
+ "train_acc": 0.74886,
+ "test_loss": 2.3033808235168456,
+ "test_acc": 0.5082,
+ "lyapunov": null,
+ "grad_norm": 0.7673158740604195,
+ "grad_max_sv": 0.2993927221745253,
+ "grad_min_sv": 1.3854600900906066e-08,
+ "grad_condition": 304920112.4622501,
+ "lr": 0.000759013504686565,
+ "time_sec": 32.584622621536255
+ },
+ {
+ "epoch": 50,
+ "train_loss": 0.8111858353424072,
+ "train_acc": 0.75248,
+ "test_loss": 2.386407151031494,
+ "test_acc": 0.5007,
+ "lyapunov": null,
+ "grad_norm": 0.7677657118676934,
+ "grad_max_sv": 0.3098601832985878,
+ "grad_min_sv": 1.3993020677935397e-08,
+ "grad_condition": 150857500.73279318,
+ "lr": 0.0007499999999999998,
+ "time_sec": 32.59726119041443
+ },
+ {
+ "epoch": 51,
+ "train_loss": 0.8006631660461426,
+ "train_acc": 0.7542,
+ "test_loss": 2.322489023399353,
+ "test_acc": 0.5061,
+ "lyapunov": null,
+ "grad_norm": 0.7571398534411352,
+ "grad_max_sv": 0.3029158480465412,
+ "grad_min_sv": 1.366701978661438e-08,
+ "grad_condition": 1198508278.0301957,
+ "lr": 0.0007408768370508575,
+ "time_sec": 32.566423654556274
+ },
+ {
+ "epoch": 52,
+ "train_loss": 0.7743014498138427,
+ "train_acc": 0.7611,
+ "test_loss": 2.446239744186401,
+ "test_acc": 0.5001,
+ "lyapunov": null,
+ "grad_norm": 0.7494625172701129,
+ "grad_max_sv": 0.30184583105146884,
+ "grad_min_sv": 1.3538439711142935e-08,
+ "grad_condition": 454382825.5364168,
+ "lr": 0.0007316480175599307,
+ "time_sec": 32.606823205947876
+ },
+ {
+ "epoch": 53,
+ "train_loss": 0.7602159348106384,
+ "train_acc": 0.76546,
+ "test_loss": 2.3079547737121584,
+ "test_acc": 0.5179,
+ "lyapunov": null,
+ "grad_norm": 0.743347450494438,
+ "grad_max_sv": 0.3061353128403425,
+ "grad_min_sv": 1.348931551216348e-08,
+ "grad_condition": 80924083.81225905,
+ "lr": 0.0007223175895924635,
+ "time_sec": 32.580427408218384
+ },
+ {
+ "epoch": 54,
+ "train_loss": 0.7339858147239685,
+ "train_acc": 0.77348,
+ "test_loss": 2.388110917472839,
+ "test_acc": 0.5122,
+ "lyapunov": null,
+ "grad_norm": 0.7398005246039192,
+ "grad_max_sv": 0.2995276223868132,
+ "grad_min_sv": 1.3313009213089532e-08,
+ "grad_condition": 46213404.23441851,
+ "lr": 0.0007128896457825361,
+ "time_sec": 32.57850360870361
+ },
+ {
+ "epoch": 55,
+ "train_loss": 0.7361176003837585,
+ "train_acc": 0.77096,
+ "test_loss": 2.3849290475845337,
+ "test_acc": 0.5096,
+ "lyapunov": null,
+ "grad_norm": 0.7355302680365016,
+ "grad_max_sv": 0.2989551298320293,
+ "grad_min_sv": 1.3770161400267037e-08,
+ "grad_condition": 1196071659.3025665,
+ "lr": 0.0007033683215378998,
+ "time_sec": 32.57127046585083
+ },
+ {
+ "epoch": 56,
+ "train_loss": 0.7056646187782287,
+ "train_acc": 0.78266,
+ "test_loss": 2.5353955261230467,
+ "test_acc": 0.5094,
+ "lyapunov": null,
+ "grad_norm": 0.7263545559812212,
+ "grad_max_sv": 0.29214551076292994,
+ "grad_min_sv": 1.2961420287754821e-08,
+ "grad_condition": 55296196.635770574,
+ "lr": 0.0006937577932260512,
+ "time_sec": 32.6073100566864
+ },
+ {
+ "epoch": 57,
+ "train_loss": 0.6901627484321594,
+ "train_acc": 0.78498,
+ "test_loss": 2.424652412033081,
+ "test_acc": 0.515,
+ "lyapunov": null,
+ "grad_norm": 0.7255525918000217,
+ "grad_max_sv": 0.2947526901960373,
+ "grad_min_sv": 1.3273521161719094e-08,
+ "grad_condition": 81805484.33683524,
+ "lr": 0.0006840622763423388,
+ "time_sec": 32.587172746658325
+ },
+ {
+ "epoch": 58,
+ "train_loss": 0.6748793490219116,
+ "train_acc": 0.79032,
+ "test_loss": 2.4186749195098876,
+ "test_acc": 0.5152,
+ "lyapunov": null,
+ "grad_norm": 0.7152761560999475,
+ "grad_max_sv": 0.2920954205095768,
+ "grad_min_sv": 1.3006854693124736e-08,
+ "grad_condition": 92386117.68065517,
+ "lr": 0.0006742860236609073,
+ "time_sec": 32.59625577926636
+ },
+ {
+ "epoch": 59,
+ "train_loss": 0.6585909474945069,
+ "train_acc": 0.79492,
+ "test_loss": 2.423396731376648,
+ "test_acc": 0.5147,
+ "lyapunov": null,
+ "grad_norm": 0.7000734196662035,
+ "grad_max_sv": 0.27961262725293634,
+ "grad_min_sv": 1.2433090768732002e-08,
+ "grad_condition": 44055598.930747576,
+ "lr": 0.0006644333233692913,
+ "time_sec": 32.56940460205078
+ },
+ {
+ "epoch": 60,
+ "train_loss": 0.6509319092178345,
+ "train_acc": 0.7971,
+ "test_loss": 2.4439749031066893,
+ "test_acc": 0.5172,
+ "lyapunov": null,
+ "grad_norm": 0.7014808778975755,
+ "grad_max_sv": 0.279667991027236,
+ "grad_min_sv": 1.213204634045728e-08,
+ "grad_condition": 71422713.53211066,
+ "lr": 0.0006545084971874734,
+ "time_sec": 32.592474699020386
+ },
+ {
+ "epoch": 61,
+ "train_loss": 0.6274669117927552,
+ "train_acc": 0.80326,
+ "test_loss": 2.6459867664337158,
+ "test_acc": 0.4988,
+ "lyapunov": null,
+ "grad_norm": 0.6875040317915668,
+ "grad_max_sv": 0.2785758938640356,
+ "grad_min_sv": 1.2619559043233753e-08,
+ "grad_condition": 171857029.8323717,
+ "lr": 0.0006445158984722354,
+ "time_sec": 32.630576610565186
+ },
+ {
+ "epoch": 62,
+ "train_loss": 0.6170748471164703,
+ "train_acc": 0.80476,
+ "test_loss": 2.5383020797729494,
+ "test_acc": 0.507,
+ "lyapunov": null,
+ "grad_norm": 0.6898214493116677,
+ "grad_max_sv": 0.27117876932024954,
+ "grad_min_sv": 1.216634772142032e-08,
+ "grad_condition": 368391230.9870256,
+ "lr": 0.0006344599103076324,
+ "time_sec": 32.61634922027588
+ },
+ {
+ "epoch": 63,
+ "train_loss": 0.6143111569595336,
+ "train_acc": 0.80454,
+ "test_loss": 2.4434647581100464,
+ "test_acc": 0.5183,
+ "lyapunov": null,
+ "grad_norm": 0.6875312632959335,
+ "grad_max_sv": 0.28126552477478983,
+ "grad_min_sv": 1.246990521854962e-08,
+ "grad_condition": 798988222.1191355,
+ "lr": 0.0006243449435824269,
+ "time_sec": 32.61603879928589
+ },
+ {
+ "epoch": 64,
+ "train_loss": 0.593730930519104,
+ "train_acc": 0.81294,
+ "test_loss": 2.4702172830581666,
+ "test_acc": 0.5204,
+ "lyapunov": null,
+ "grad_norm": 0.6805278132405531,
+ "grad_max_sv": 0.27184186428785323,
+ "grad_min_sv": 1.2160773926804362e-08,
+ "grad_condition": 897317916.9202541,
+ "lr": 0.0006141754350553275,
+ "time_sec": 32.62076783180237
+ },
+ {
+ "epoch": 65,
+ "train_loss": 0.5915982696533203,
+ "train_acc": 0.81346,
+ "test_loss": 2.5983056301116942,
+ "test_acc": 0.5091,
+ "lyapunov": null,
+ "grad_norm": 0.6786733542651691,
+ "grad_max_sv": 0.2730319045484066,
+ "grad_min_sv": 1.195807074368116e-08,
+ "grad_condition": 100225768.74912949,
+ "lr": 0.0006039558454088793,
+ "time_sec": 32.57223296165466
+ },
+ {
+ "epoch": 66,
+ "train_loss": 0.5778841704368591,
+ "train_acc": 0.8164,
+ "test_loss": 2.5375493215560914,
+ "test_acc": 0.5166,
+ "lyapunov": null,
+ "grad_norm": 0.6661254148265577,
+ "grad_max_sv": 0.27218331433832643,
+ "grad_min_sv": 1.21305288360192e-08,
+ "grad_condition": 409516154.47474587,
+ "lr": 0.000593690657292862,
+ "time_sec": 32.60103678703308
+ },
+ {
+ "epoch": 67,
+ "train_loss": 0.5534152274894715,
+ "train_acc": 0.82388,
+ "test_loss": 2.525739343261719,
+ "test_acc": 0.5172,
+ "lyapunov": null,
+ "grad_norm": 0.66286867140097,
+ "grad_max_sv": 0.27192877791821957,
+ "grad_min_sv": 1.1918128833138253e-08,
+ "grad_condition": 43219144.55143875,
+ "lr": 0.0005833843733580507,
+ "time_sec": 32.570470571517944
+ },
+ {
+ "epoch": 68,
+ "train_loss": 0.5373673023986817,
+ "train_acc": 0.82976,
+ "test_loss": 2.5977006465911865,
+ "test_acc": 0.517,
+ "lyapunov": null,
+ "grad_norm": 0.6509079409235867,
+ "grad_max_sv": 0.26122898012399676,
+ "grad_min_sv": 1.1391138144897784e-08,
+ "grad_condition": 68515123.47894785,
+ "lr": 0.0005730415142812054,
+ "time_sec": 32.60091519355774
+ },
+ {
+ "epoch": 69,
+ "train_loss": 0.5234087624740601,
+ "train_acc": 0.83328,
+ "test_loss": 2.5398946479797364,
+ "test_acc": 0.5195,
+ "lyapunov": null,
+ "grad_norm": 0.6514320709102108,
+ "grad_max_sv": 0.2681581676006317,
+ "grad_min_sv": 1.1655683266427116e-08,
+ "grad_condition": 706218189.6988381,
+ "lr": 0.0005626666167821517,
+ "time_sec": 32.60088515281677
+ },
+ {
+ "epoch": 70,
+ "train_loss": 0.5105544789123535,
+ "train_acc": 0.83858,
+ "test_loss": 2.6386670696258543,
+ "test_acc": 0.5124,
+ "lyapunov": null,
+ "grad_norm": 0.6433463540817135,
+ "grad_max_sv": 0.2647452913224697,
+ "grad_min_sv": 1.1366260942169416e-08,
+ "grad_condition": 65156065.92607037,
+ "lr": 0.0005522642316338265,
+ "time_sec": 32.64759874343872
+ },
+ {
+ "epoch": 71,
+ "train_loss": 0.5010787317276001,
+ "train_acc": 0.83912,
+ "test_loss": 2.6461667497634886,
+ "test_acc": 0.5113,
+ "lyapunov": null,
+ "grad_norm": 0.6437656983932116,
+ "grad_max_sv": 0.27069182582199575,
+ "grad_min_sv": 1.1655098845937683e-08,
+ "grad_condition": 152350561.59014112,
+ "lr": 0.0005418389216661573,
+ "time_sec": 32.59350061416626
+ },
+ {
+ "epoch": 72,
+ "train_loss": 0.48393970026969907,
+ "train_acc": 0.84504,
+ "test_loss": 2.714662640762329,
+ "test_acc": 0.5138,
+ "lyapunov": null,
+ "grad_norm": 0.6380630437719501,
+ "grad_max_sv": 0.2641098305583,
+ "grad_min_sv": 1.1268197760809507e-08,
+ "grad_condition": 120257137.75772035,
+ "lr": 0.0005313952597646563,
+ "time_sec": 32.596872329711914
+ },
+ {
+ "epoch": 73,
+ "train_loss": 0.48754292858123777,
+ "train_acc": 0.84344,
+ "test_loss": 2.7237933948516844,
+ "test_acc": 0.5121,
+ "lyapunov": null,
+ "grad_norm": 0.6383299877925953,
+ "grad_max_sv": 0.26338610500097276,
+ "grad_min_sv": 1.1300838716199468e-08,
+ "grad_condition": 111884472.4678097,
+ "lr": 0.0005209378268645994,
+ "time_sec": 32.5793662071228
+ },
+ {
+ "epoch": 74,
+ "train_loss": 0.47278374366760256,
+ "train_acc": 0.84774,
+ "test_loss": 2.6715963176727295,
+ "test_acc": 0.5175,
+ "lyapunov": null,
+ "grad_norm": 0.6274777670934027,
+ "grad_max_sv": 0.2674501951783895,
+ "grad_min_sv": 1.1504576969084777e-08,
+ "grad_condition": 1355085877.4304867,
+ "lr": 0.0005104712099416781,
+ "time_sec": 32.57535362243652
+ },
+ {
+ "epoch": 75,
+ "train_loss": 0.46160235664367677,
+ "train_acc": 0.8514,
+ "test_loss": 2.648087367248535,
+ "test_acc": 0.5256,
+ "lyapunov": null,
+ "grad_norm": 0.6267372816019459,
+ "grad_max_sv": 0.2574677299708128,
+ "grad_min_sv": 1.0966666171572172e-08,
+ "grad_condition": 334727656.01781523,
+ "lr": 0.0004999999999999996,
+ "time_sec": 32.610466957092285
+ },
+ {
+ "epoch": 76,
+ "train_loss": 0.4535921633911133,
+ "train_acc": 0.85614,
+ "test_loss": 2.6602814262390138,
+ "test_acc": 0.523,
+ "lyapunov": null,
+ "grad_norm": 0.6107123792245788,
+ "grad_max_sv": 0.2529071237891912,
+ "grad_min_sv": 1.1059093659587793e-08,
+ "grad_condition": 120836694.63569286,
+ "lr": 0.0004895287900583212,
+ "time_sec": 32.60012149810791
+ },
+ {
+ "epoch": 77,
+ "train_loss": 0.4353150751876831,
+ "train_acc": 0.85868,
+ "test_loss": 2.704223956680298,
+ "test_acc": 0.515,
+ "lyapunov": null,
+ "grad_norm": 0.6089035015325723,
+ "grad_max_sv": 0.26519037671387197,
+ "grad_min_sv": 1.1131827913862629e-08,
+ "grad_condition": 731888345.2288473,
+ "lr": 0.0004790621731353997,
+ "time_sec": 32.5684015750885
+ },
+ {
+ "epoch": 78,
+ "train_loss": 0.4266960339736938,
+ "train_acc": 0.86162,
+ "test_loss": 2.621325074005127,
+ "test_acc": 0.5293,
+ "lyapunov": null,
+ "grad_norm": 0.6005077005692222,
+ "grad_max_sv": 0.24986533373594283,
+ "grad_min_sv": 1.066437155744851e-08,
+ "grad_condition": 323621690.1204275,
+ "lr": 0.000468604740235343,
+ "time_sec": 32.593501567840576
+ },
+ {
+ "epoch": 79,
+ "train_loss": 0.40983675064086916,
+ "train_acc": 0.86828,
+ "test_loss": 2.654561376953125,
+ "test_acc": 0.5278,
+ "lyapunov": null,
+ "grad_norm": 0.5926958478419567,
+ "grad_max_sv": 0.253178546205163,
+ "grad_min_sv": 1.0804884827174745e-08,
+ "grad_condition": 432601908.1535362,
+ "lr": 0.00045816107833384175,
+ "time_sec": 32.603999376297
+ },
+ {
+ "epoch": 80,
+ "train_loss": 0.4048340177345276,
+ "train_acc": 0.86952,
+ "test_loss": 2.7457454587936403,
+ "test_acc": 0.5169,
+ "lyapunov": null,
+ "grad_norm": 0.5908548576457587,
+ "grad_max_sv": 0.25038131698966026,
+ "grad_min_sv": 1.0512154793168581e-08,
+ "grad_condition": 130905588.43349023,
+ "lr": 0.0004477357683661729,
+ "time_sec": 32.603445053100586
+ },
+ {
+ "epoch": 81,
+ "train_loss": 0.3956010137653351,
+ "train_acc": 0.87362,
+ "test_loss": 2.6873944789886473,
+ "test_acc": 0.5209,
+ "lyapunov": null,
+ "grad_norm": 0.584388729391549,
+ "grad_max_sv": 0.24884492233395578,
+ "grad_min_sv": 1.0513768951801727e-08,
+ "grad_condition": 247213360.42633313,
+ "lr": 0.00043733338321784746,
+ "time_sec": 32.59891176223755
+ },
+ {
+ "epoch": 82,
+ "train_loss": 0.39998871772766115,
+ "train_acc": 0.87126,
+ "test_loss": 2.7860556625366213,
+ "test_acc": 0.5159,
+ "lyapunov": null,
+ "grad_norm": 0.5914248649657466,
+ "grad_max_sv": 0.2658348709344864,
+ "grad_min_sv": 1.082797196690511e-08,
+ "grad_condition": 1133342480.7967758,
+ "lr": 0.0004269584857187939,
+ "time_sec": 32.59586429595947
+ },
+ {
+ "epoch": 83,
+ "train_loss": 0.3816492418861389,
+ "train_acc": 0.877,
+ "test_loss": 2.7754603567123413,
+ "test_acc": 0.5172,
+ "lyapunov": null,
+ "grad_norm": 0.5821106701045357,
+ "grad_max_sv": 0.2504717506468296,
+ "grad_min_sv": 1.0313228220211468e-08,
+ "grad_condition": 79983143.9616401,
+ "lr": 0.0004166156266419484,
+ "time_sec": 32.61333727836609
+ },
+ {
+ "epoch": 84,
+ "train_loss": 0.3718857811355591,
+ "train_acc": 0.88052,
+ "test_loss": 2.711159196472168,
+ "test_acc": 0.5308,
+ "lyapunov": null,
+ "grad_norm": 0.5753178111464781,
+ "grad_max_sv": 0.24524039030075073,
+ "grad_min_sv": 1.0231703595139919e-08,
+ "grad_condition": 185067792.66451305,
+ "lr": 0.0004063093427071373,
+ "time_sec": 32.58551812171936
+ },
+ {
+ "epoch": 85,
+ "train_loss": 0.3627623717498779,
+ "train_acc": 0.8827,
+ "test_loss": 2.7379925659179687,
+ "test_acc": 0.5259,
+ "lyapunov": null,
+ "grad_norm": 0.5629491927418928,
+ "grad_max_sv": 0.24136969707906247,
+ "grad_min_sv": 9.91763398714568e-09,
+ "grad_condition": 152636209.94255581,
+ "lr": 0.0003960441545911199,
+ "time_sec": 32.603590965270996
+ },
+ {
+ "epoch": 86,
+ "train_loss": 0.346252275390625,
+ "train_acc": 0.88882,
+ "test_loss": 2.766578482246399,
+ "test_acc": 0.5312,
+ "lyapunov": null,
+ "grad_norm": 0.5515259268132012,
+ "grad_max_sv": 0.24355790987610818,
+ "grad_min_sv": 1.0009752546454032e-08,
+ "grad_condition": 97406517.6245994,
+ "lr": 0.0003858245649446718,
+ "time_sec": 32.584232807159424
+ },
+ {
+ "epoch": 87,
+ "train_loss": 0.34051946352005,
+ "train_acc": 0.89098,
+ "test_loss": 2.779722568702698,
+ "test_acc": 0.528,
+ "lyapunov": null,
+ "grad_norm": 0.5519101007375313,
+ "grad_max_sv": 0.24400133974850177,
+ "grad_min_sv": 9.877336406855648e-09,
+ "grad_condition": 712710697.5623571,
+ "lr": 0.00037565505641757235,
+ "time_sec": 32.6142373085022
+ },
+ {
+ "epoch": 88,
+ "train_loss": 0.33136254326820375,
+ "train_acc": 0.89032,
+ "test_loss": 2.719365368270874,
+ "test_acc": 0.535,
+ "lyapunov": null,
+ "grad_norm": 0.5511773242388698,
+ "grad_max_sv": 0.23767127953469752,
+ "grad_min_sv": 9.902577505389865e-09,
+ "grad_condition": 127351733.7757211,
+ "lr": 0.00036554008969236695,
+ "time_sec": 32.62907528877258
+ },
+ {
+ "epoch": 89,
+ "train_loss": 0.32775797492980957,
+ "train_acc": 0.89324,
+ "test_loss": 2.790045444488525,
+ "test_acc": 0.5299,
+ "lyapunov": null,
+ "grad_norm": 0.5479128041042186,
+ "grad_max_sv": 0.2417389802634716,
+ "grad_min_sv": 9.801050153543031e-09,
+ "grad_condition": 342834303.4129317,
+ "lr": 0.0003554841015277638,
+ "time_sec": 32.58039617538452
+ },
+ {
+ "epoch": 90,
+ "train_loss": 0.32945220873832703,
+ "train_acc": 0.8918,
+ "test_loss": 2.922000147628784,
+ "test_acc": 0.5182,
+ "lyapunov": null,
+ "grad_norm": 0.5550461625192047,
+ "grad_max_sv": 0.24011647067964076,
+ "grad_min_sv": 9.800379771726567e-09,
+ "grad_condition": 1256581334.5865822,
+ "lr": 0.000345491502812526,
+ "time_sec": 32.59003448486328
+ },
+ {
+ "epoch": 91,
+ "train_loss": 0.3192555838537216,
+ "train_acc": 0.89716,
+ "test_loss": 2.8951302070617677,
+ "test_acc": 0.5263,
+ "lyapunov": null,
+ "grad_norm": 0.5399705873184968,
+ "grad_max_sv": 0.2398311447352171,
+ "grad_min_sv": 9.757036307719846e-09,
+ "grad_condition": 127427759.95651396,
+ "lr": 0.0003355666766307081,
+ "time_sec": 32.6045126914978
+ },
+ {
+ "epoch": 92,
+ "train_loss": 0.3078860513591766,
+ "train_acc": 0.90134,
+ "test_loss": 2.8668867027282716,
+ "test_acc": 0.5242,
+ "lyapunov": null,
+ "grad_norm": 0.529771320174461,
+ "grad_max_sv": 0.24304427802562714,
+ "grad_min_sv": 9.90028982024438e-09,
+ "grad_condition": 134692222.21263316,
+ "lr": 0.00032571397633909225,
+ "time_sec": 32.59454321861267
+ },
+ {
+ "epoch": 93,
+ "train_loss": 0.2954711162376404,
+ "train_acc": 0.90374,
+ "test_loss": 2.8291058578491213,
+ "test_acc": 0.5338,
+ "lyapunov": null,
+ "grad_norm": 0.5270179348539408,
+ "grad_max_sv": 0.23493569679558277,
+ "grad_min_sv": 9.681322873239529e-09,
+ "grad_condition": 154310830.71851045,
+ "lr": 0.00031593772365766094,
+ "time_sec": 32.637152433395386
+ },
+ {
+ "epoch": 94,
+ "train_loss": 0.29190866079330446,
+ "train_acc": 0.90516,
+ "test_loss": 2.8675409421920777,
+ "test_acc": 0.5267,
+ "lyapunov": null,
+ "grad_norm": 0.5236741934845208,
+ "grad_max_sv": 0.23337335288524627,
+ "grad_min_sv": 9.406507730548574e-09,
+ "grad_condition": 172022555.775852,
+ "lr": 0.0003062422067739483,
+ "time_sec": 32.615885496139526
+ },
+ {
+ "epoch": 95,
+ "train_loss": 0.2843532346916199,
+ "train_acc": 0.90826,
+ "test_loss": 2.9124584104537963,
+ "test_acc": 0.5294,
+ "lyapunov": null,
+ "grad_norm": 0.5141183140073359,
+ "grad_max_sv": 0.22986465878784657,
+ "grad_min_sv": 9.210905181113172e-09,
+ "grad_condition": 336375534.72882974,
+ "lr": 0.00029663167846209965,
+ "time_sec": 32.62099742889404
+ },
+ {
+ "epoch": 96,
+ "train_loss": 0.28095845563411714,
+ "train_acc": 0.90888,
+ "test_loss": 2.9585642152786256,
+ "test_acc": 0.5188,
+ "lyapunov": null,
+ "grad_norm": 0.5209337851609864,
+ "grad_max_sv": 0.24165461957454681,
+ "grad_min_sv": 9.822391551029056e-09,
+ "grad_condition": 3734850942.353486,
+ "lr": 0.00028711035421746345,
+ "time_sec": 32.606362104415894
+ },
+ {
+ "epoch": 97,
+ "train_loss": 0.270245605134964,
+ "train_acc": 0.91376,
+ "test_loss": 2.8790921213150025,
+ "test_acc": 0.535,
+ "lyapunov": null,
+ "grad_norm": 0.5018050404070028,
+ "grad_max_sv": 0.2287111472338438,
+ "grad_min_sv": 9.100506417479732e-09,
+ "grad_condition": 1286046088.0897596,
+ "lr": 0.00027768241040753615,
+ "time_sec": 32.605376958847046
+ },
+ {
+ "epoch": 98,
+ "train_loss": 0.26737561470508575,
+ "train_acc": 0.91348,
+ "test_loss": 2.9673530891418456,
+ "test_acc": 0.52,
+ "lyapunov": null,
+ "grad_norm": 0.5026625596288345,
+ "grad_max_sv": 0.22773091793060302,
+ "grad_min_sv": 9.130605362089221e-09,
+ "grad_condition": 2561536325.8505445,
+ "lr": 0.00026835198244006903,
+ "time_sec": 32.61582803726196
+ },
+ {
+ "epoch": 99,
+ "train_loss": 0.25649453671455386,
+ "train_acc": 0.91706,
+ "test_loss": 2.960128957557678,
+ "test_acc": 0.5285,
+ "lyapunov": null,
+ "grad_norm": 0.4959587348752051,
+ "grad_max_sv": 0.22662512063980103,
+ "grad_min_sv": 9.021708526762983e-09,
+ "grad_condition": 2170055259.576285,
+ "lr": 0.0002591231629491421,
+ "time_sec": 32.59518361091614
+ },
+ {
+ "epoch": 100,
+ "train_loss": 0.25298852029800417,
+ "train_acc": 0.91614,
+ "test_loss": 2.999088920211792,
+ "test_acc": 0.5213,
+ "lyapunov": null,
+ "grad_norm": 0.49694281512357663,
+ "grad_max_sv": 0.2285677995532751,
+ "grad_min_sv": 9.117687981181898e-09,
+ "grad_condition": 153385408.53154242,
+ "lr": 0.0002499999999999997,
+ "time_sec": 32.60006618499756
+ },
+ {
+ "epoch": 101,
+ "train_loss": 0.24837311635971068,
+ "train_acc": 0.92042,
+ "test_loss": 2.9769588521957395,
+ "test_acc": 0.527,
+ "lyapunov": null,
+ "grad_norm": 0.49156384156747235,
+ "grad_max_sv": 0.23404922261834143,
+ "grad_min_sv": 9.245040229915492e-09,
+ "grad_condition": 730777146.0902932,
+ "lr": 0.00024098649531343477,
+ "time_sec": 32.58926057815552
+ },
+ {
+ "epoch": 102,
+ "train_loss": 0.24679850215435029,
+ "train_acc": 0.91974,
+ "test_loss": 2.983294668197632,
+ "test_acc": 0.5239,
+ "lyapunov": null,
+ "grad_norm": 0.4891194067973055,
+ "grad_max_sv": 0.22282884679734707,
+ "grad_min_sv": 8.780173748647313e-09,
+ "grad_condition": 157121553.36478597,
+ "lr": 0.0002320866025105016,
+ "time_sec": 32.61522173881531
+ },
+ {
+ "epoch": 103,
+ "train_loss": 0.235624645652771,
+ "train_acc": 0.9236,
+ "test_loss": 2.97529112701416,
+ "test_acc": 0.5278,
+ "lyapunov": null,
+ "grad_norm": 0.47526538494931814,
+ "grad_max_sv": 0.2206702034920454,
+ "grad_min_sv": 8.61680920262453e-09,
+ "grad_condition": 145823760.67239988,
+ "lr": 0.0002233042253783278,
+ "time_sec": 32.67024850845337
+ },
+ {
+ "epoch": 104,
+ "train_loss": 0.23265846648216248,
+ "train_acc": 0.92502,
+ "test_loss": 2.9763864707946777,
+ "test_acc": 0.5263,
+ "lyapunov": null,
+ "grad_norm": 0.47725567627138915,
+ "grad_max_sv": 0.22133470103144645,
+ "grad_min_sv": 8.68051782312168e-09,
+ "grad_condition": 267574471.67175755,
+ "lr": 0.000214643216157784,
+ "time_sec": 32.611361265182495
+ },
+ {
+ "epoch": 105,
+ "train_loss": 0.22897292974472047,
+ "train_acc": 0.92568,
+ "test_loss": 3.0474896495819093,
+ "test_acc": 0.5212,
+ "lyapunov": null,
+ "grad_norm": 0.4764754544051647,
+ "grad_max_sv": 0.22653804197907448,
+ "grad_min_sv": 8.760947359104918e-09,
+ "grad_condition": 3219418687.447474,
+ "lr": 0.00020610737385376332,
+ "time_sec": 32.5970995426178
+ },
+ {
+ "epoch": 106,
+ "train_loss": 0.22509269979476929,
+ "train_acc": 0.9271,
+ "test_loss": 2.9895481927871703,
+ "test_acc": 0.5276,
+ "lyapunov": null,
+ "grad_norm": 0.47179914735427825,
+ "grad_max_sv": 0.22902226410806178,
+ "grad_min_sv": 8.651995134743851e-09,
+ "grad_condition": 188321170.63109916,
+ "lr": 0.00019770044256881242,
+ "time_sec": 32.61952805519104
+ },
+ {
+ "epoch": 107,
+ "train_loss": 0.22124877912521362,
+ "train_acc": 0.92918,
+ "test_loss": 2.9869052186965943,
+ "test_acc": 0.5261,
+ "lyapunov": null,
+ "grad_norm": 0.4676814721095271,
+ "grad_max_sv": 0.23612426966428757,
+ "grad_min_sv": 8.830977354858538e-09,
+ "grad_condition": 1324097462.1438193,
+ "lr": 0.0001894261098608447,
+ "time_sec": 32.63655757904053
+ },
+ {
+ "epoch": 108,
+ "train_loss": 0.2119530977487564,
+ "train_acc": 0.93214,
+ "test_loss": 2.957085295295715,
+ "test_acc": 0.5283,
+ "lyapunov": null,
+ "grad_norm": 0.4597233192330978,
+ "grad_max_sv": 0.21893165111541749,
+ "grad_min_sv": 8.44588889763187e-09,
+ "grad_condition": 325299909.8181821,
+ "lr": 0.000181288005125655,
+ "time_sec": 32.6324462890625
+ },
+ {
+ "epoch": 109,
+ "train_loss": 0.2096145883345604,
+ "train_acc": 0.93168,
+ "test_loss": 3.0633232662200927,
+ "test_acc": 0.5232,
+ "lyapunov": null,
+ "grad_norm": 0.46012619309211217,
+ "grad_max_sv": 0.21432300768792628,
+ "grad_min_sv": 8.437937682305527e-09,
+ "grad_condition": 912797689.183795,
+ "lr": 0.0001732896980049473,
+ "time_sec": 32.59154772758484
+ },
+ {
+ "epoch": 110,
+ "train_loss": 0.20650233900070192,
+ "train_acc": 0.9334,
+ "test_loss": 3.0124371912002563,
+ "test_acc": 0.5288,
+ "lyapunov": null,
+ "grad_norm": 0.45267852009677,
+ "grad_max_sv": 0.2197608083486557,
+ "grad_min_sv": 8.136439059915762e-09,
+ "grad_condition": 214553728.36221018,
+ "lr": 0.00016543469682057076,
+ "time_sec": 32.58715891838074
+ },
+ {
+ "epoch": 111,
+ "train_loss": 0.202456818523407,
+ "train_acc": 0.93476,
+ "test_loss": 2.953989649581909,
+ "test_acc": 0.5364,
+ "lyapunov": null,
+ "grad_norm": 0.44877046173685803,
+ "grad_max_sv": 0.2101663440465927,
+ "grad_min_sv": 8.111785431298008e-09,
+ "grad_condition": 181357744.46055207,
+ "lr": 0.00015772644703565552,
+ "time_sec": 32.61166739463806
+ },
+ {
+ "epoch": 112,
+ "train_loss": 0.19417572572231293,
+ "train_acc": 0.93836,
+ "test_loss": 3.0636728370666506,
+ "test_acc": 0.5294,
+ "lyapunov": null,
+ "grad_norm": 0.44228389201963325,
+ "grad_max_sv": 0.2184779081493616,
+ "grad_min_sv": 8.052494614532204e-09,
+ "grad_condition": 701685099.8537222,
+ "lr": 0.00015016832974331713,
+ "time_sec": 32.61799240112305
+ },
+ {
+ "epoch": 113,
+ "train_loss": 0.1894145729970932,
+ "train_acc": 0.93984,
+ "test_loss": 2.981136636924744,
+ "test_acc": 0.5323,
+ "lyapunov": null,
+ "grad_norm": 0.4358812319975278,
+ "grad_max_sv": 0.20872662551701068,
+ "grad_min_sv": 7.95152020114211e-09,
+ "grad_condition": 1423865321.2329361,
+ "lr": 0.00014276366018359834,
+ "time_sec": 32.6167311668396
+ },
+ {
+ "epoch": 114,
+ "train_loss": 0.18947952261924744,
+ "train_acc": 0.9398,
+ "test_loss": 3.0828820104598997,
+ "test_acc": 0.5292,
+ "lyapunov": null,
+ "grad_norm": 0.43739466792043646,
+ "grad_max_sv": 0.2058663982897997,
+ "grad_min_sv": 7.741768523156016e-09,
+ "grad_condition": 7243536793.4379,
+ "lr": 0.00013551568628929425,
+ "time_sec": 32.59801626205444
+ },
+ {
+ "epoch": 115,
+ "train_loss": 0.1862397237443924,
+ "train_acc": 0.94078,
+ "test_loss": 2.9763780981063843,
+ "test_acc": 0.538,
+ "lyapunov": null,
+ "grad_norm": 0.43528746000323826,
+ "grad_max_sv": 0.20504732690751554,
+ "grad_min_sv": 8.141562394137907e-09,
+ "grad_condition": 139509610.14712492,
+ "lr": 0.00012842758726130276,
+ "time_sec": 32.612173080444336
+ },
+ {
+ "epoch": 116,
+ "train_loss": 0.17998726233482362,
+ "train_acc": 0.9426,
+ "test_loss": 3.0221671098709106,
+ "test_acc": 0.5357,
+ "lyapunov": null,
+ "grad_norm": 0.4288718122641706,
+ "grad_max_sv": 0.2140086382627487,
+ "grad_min_sv": 7.976556949608644e-09,
+ "grad_condition": 784872577.917934,
+ "lr": 0.0001215024721741218,
+ "time_sec": 32.63769769668579
+ },
+ {
+ "epoch": 117,
+ "train_loss": 0.17653137303352356,
+ "train_acc": 0.94314,
+ "test_loss": 3.0061340055465697,
+ "test_acc": 0.5323,
+ "lyapunov": null,
+ "grad_norm": 0.4236151447378006,
+ "grad_max_sv": 0.20592431761324406,
+ "grad_min_sv": 7.804582891849515e-09,
+ "grad_condition": 232091482.5503703,
+ "lr": 0.00011474337861210538,
+ "time_sec": 32.63769888877869
+ },
+ {
+ "epoch": 118,
+ "train_loss": 0.18115964114189148,
+ "train_acc": 0.94264,
+ "test_loss": 2.9955945150375367,
+ "test_acc": 0.5394,
+ "lyapunov": null,
+ "grad_norm": 0.43031955217275497,
+ "grad_max_sv": 0.21836008243262767,
+ "grad_min_sv": 7.966632081498128e-09,
+ "grad_condition": 338791411.5737727,
+ "lr": 0.00010815327133708009,
+ "time_sec": 32.59054613113403
+ },
+ {
+ "epoch": 119,
+ "train_loss": 0.1751684021663666,
+ "train_acc": 0.94342,
+ "test_loss": 3.0028031162261963,
+ "test_acc": 0.5344,
+ "lyapunov": null,
+ "grad_norm": 0.4234025902326238,
+ "grad_max_sv": 0.2052937986329198,
+ "grad_min_sv": 7.743973756604156e-09,
+ "grad_condition": 205737178.47096592,
+ "lr": 0.00010173504098790182,
+ "time_sec": 32.63575482368469
+ },
+ {
+ "epoch": 120,
+ "train_loss": 0.17288655778884887,
+ "train_acc": 0.9449,
+ "test_loss": 3.026424203681946,
+ "test_acc": 0.5381,
+ "lyapunov": null,
+ "grad_norm": 0.41773026543709724,
+ "grad_max_sv": 0.2095510721206665,
+ "grad_min_sv": 7.937595827254033e-09,
+ "grad_condition": 6330317379.225478,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 32.587223052978516
+ },
+ {
+ "epoch": 121,
+ "train_loss": 0.17101951307296753,
+ "train_acc": 0.94462,
+ "test_loss": 3.165215256309509,
+ "test_acc": 0.5219,
+ "lyapunov": null,
+ "grad_norm": 0.42195608937670603,
+ "grad_max_sv": 0.20825999304652215,
+ "grad_min_sv": 7.99512678009099e-09,
+ "grad_condition": 653203712.6193202,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 32.596564531326294
+ },
+ {
+ "epoch": 122,
+ "train_loss": 0.1693978008031845,
+ "train_acc": 0.94588,
+ "test_loss": 3.0062981233596804,
+ "test_acc": 0.5348,
+ "lyapunov": null,
+ "grad_norm": 0.41591242620468016,
+ "grad_max_sv": 0.2059656113386154,
+ "grad_min_sv": 7.704039686772836e-09,
+ "grad_condition": 1004445609.8434451,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 32.61800956726074
+ },
+ {
+ "epoch": 123,
+ "train_loss": 0.16728713005065918,
+ "train_acc": 0.94756,
+ "test_loss": 3.1665957611083986,
+ "test_acc": 0.5246,
+ "lyapunov": null,
+ "grad_norm": 0.41526238625867323,
+ "grad_max_sv": 0.20129744820296763,
+ "grad_min_sv": 7.569636380905243e-09,
+ "grad_condition": 407190475.77847266,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 32.61078882217407
+ },
+ {
+ "epoch": 124,
+ "train_loss": 0.1635257438659668,
+ "train_acc": 0.94798,
+ "test_loss": 3.1016404109954836,
+ "test_acc": 0.5367,
+ "lyapunov": null,
+ "grad_norm": 0.4079868295136817,
+ "grad_max_sv": 0.20866212155669928,
+ "grad_min_sv": 7.864988894011604e-09,
+ "grad_condition": 294549971.18264663,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 32.627676486968994
+ },
+ {
+ "epoch": 125,
+ "train_loss": 0.1641435864830017,
+ "train_acc": 0.94756,
+ "test_loss": 3.0870759466171265,
+ "test_acc": 0.5259,
+ "lyapunov": null,
+ "grad_norm": 0.4108898930410538,
+ "grad_max_sv": 0.21254582721740006,
+ "grad_min_sv": 7.773244741892532e-09,
+ "grad_condition": 192549384.92611116,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 32.60348701477051
+ },
+ {
+ "epoch": 126,
+ "train_loss": 0.15524960072517396,
+ "train_acc": 0.95126,
+ "test_loss": 3.106667465209961,
+ "test_acc": 0.5253,
+ "lyapunov": null,
+ "grad_norm": 0.39708975035952015,
+ "grad_max_sv": 0.20546648390591143,
+ "grad_min_sv": 7.524984951411303e-09,
+ "grad_condition": 594241717.5398318,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 32.62395262718201
+ },
+ {
+ "epoch": 127,
+ "train_loss": 0.16405641248226166,
+ "train_acc": 0.94786,
+ "test_loss": 3.0382690155029297,
+ "test_acc": 0.5344,
+ "lyapunov": null,
+ "grad_norm": 0.41136197829373494,
+ "grad_max_sv": 0.20878486707806587,
+ "grad_min_sv": 7.634084871223142e-09,
+ "grad_condition": 4480646318.175786,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 32.58641195297241
+ },
+ {
+ "epoch": 128,
+ "train_loss": 0.15556303625106813,
+ "train_acc": 0.95,
+ "test_loss": 3.0696772289276124,
+ "test_acc": 0.5291,
+ "lyapunov": null,
+ "grad_norm": 0.399629179039621,
+ "grad_max_sv": 0.19112058784812688,
+ "grad_min_sv": 7.558967303998576e-09,
+ "grad_condition": 130958494.19530413,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 32.6273717880249
+ },
+ {
+ "epoch": 129,
+ "train_loss": 0.15622675662994384,
+ "train_acc": 0.94962,
+ "test_loss": 3.0737016366958616,
+ "test_acc": 0.53,
+ "lyapunov": null,
+ "grad_norm": 0.4021852855426899,
+ "grad_max_sv": 0.20368068106472492,
+ "grad_min_sv": 7.91968607510862e-09,
+ "grad_condition": 4092034646.124222,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 32.61072516441345
+ },
+ {
+ "epoch": 130,
+ "train_loss": 0.15069342103004454,
+ "train_acc": 0.95206,
+ "test_loss": 3.138083388710022,
+ "test_acc": 0.5303,
+ "lyapunov": null,
+ "grad_norm": 0.3967446109539621,
+ "grad_max_sv": 0.20565238259732724,
+ "grad_min_sv": 7.903937278850096e-09,
+ "grad_condition": 403356372.5201774,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 32.60817766189575
+ },
+ {
+ "epoch": 131,
+ "train_loss": 0.1475225008201599,
+ "train_acc": 0.95388,
+ "test_loss": 3.097823154640198,
+ "test_acc": 0.5262,
+ "lyapunov": null,
+ "grad_norm": 0.3911645556854745,
+ "grad_max_sv": 0.2029418082907796,
+ "grad_min_sv": 7.451206509700297e-09,
+ "grad_condition": 184512637.53159684,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 32.620972633361816
+ },
+ {
+ "epoch": 132,
+ "train_loss": 0.14910545247793197,
+ "train_acc": 0.95376,
+ "test_loss": 3.1958837438583374,
+ "test_acc": 0.5255,
+ "lyapunov": null,
+ "grad_norm": 0.39312251468793336,
+ "grad_max_sv": 0.19356854669749737,
+ "grad_min_sv": 7.3685526407948895e-09,
+ "grad_condition": 474360013.88184536,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 32.62202000617981
+ },
+ {
+ "epoch": 133,
+ "train_loss": 0.14772581936836243,
+ "train_acc": 0.95306,
+ "test_loss": 3.1449778295516966,
+ "test_acc": 0.528,
+ "lyapunov": null,
+ "grad_norm": 0.39083628600782144,
+ "grad_max_sv": 0.18662805538624525,
+ "grad_min_sv": 7.411569982176611e-09,
+ "grad_condition": 590179948.2869803,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 32.62527775764465
+ },
+ {
+ "epoch": 134,
+ "train_loss": 0.1473908689570427,
+ "train_acc": 0.95432,
+ "test_loss": 3.060500933647156,
+ "test_acc": 0.532,
+ "lyapunov": null,
+ "grad_norm": 0.39321527574531456,
+ "grad_max_sv": 0.1960258588194847,
+ "grad_min_sv": 7.530598097665528e-09,
+ "grad_condition": 690149093.5169044,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 32.611403942108154
+ },
+ {
+ "epoch": 135,
+ "train_loss": 0.1489419222688675,
+ "train_acc": 0.95216,
+ "test_loss": 3.0586274435043337,
+ "test_acc": 0.5333,
+ "lyapunov": null,
+ "grad_norm": 0.3951339678077363,
+ "grad_max_sv": 0.19855166971683502,
+ "grad_min_sv": 7.4231230849652885e-09,
+ "grad_condition": 338026036.5432772,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 32.57758116722107
+ },
+ {
+ "epoch": 136,
+ "train_loss": 0.1439458827161789,
+ "train_acc": 0.9552,
+ "test_loss": 3.1572901706695555,
+ "test_acc": 0.5268,
+ "lyapunov": null,
+ "grad_norm": 0.38505775133385556,
+ "grad_max_sv": 0.20576392244547606,
+ "grad_min_sv": 7.578524123253968e-09,
+ "grad_condition": 2346058745.0245013,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 32.60840678215027
+ },
+ {
+ "epoch": 137,
+ "train_loss": 0.14263056889772416,
+ "train_acc": 0.95558,
+ "test_loss": 3.0500190071105955,
+ "test_acc": 0.5343,
+ "lyapunov": null,
+ "grad_norm": 0.38315618240250937,
+ "grad_max_sv": 0.19492608066648245,
+ "grad_min_sv": 7.437362629664907e-09,
+ "grad_condition": 445968074.97881687,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 32.5784227848053
+ },
+ {
+ "epoch": 138,
+ "train_loss": 0.14197950773239135,
+ "train_acc": 0.95516,
+ "test_loss": 3.054612173843384,
+ "test_acc": 0.5379,
+ "lyapunov": null,
+ "grad_norm": 0.3842449580292686,
+ "grad_max_sv": 0.20386305153369905,
+ "grad_min_sv": 7.256548800879062e-09,
+ "grad_condition": 4009126006.180674,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 32.58382248878479
+ },
+ {
+ "epoch": 139,
+ "train_loss": 0.14526520327091216,
+ "train_acc": 0.95412,
+ "test_loss": 3.0950862688064573,
+ "test_acc": 0.5323,
+ "lyapunov": null,
+ "grad_norm": 0.38739146310202444,
+ "grad_max_sv": 0.19300882443785666,
+ "grad_min_sv": 7.3080626628160495e-09,
+ "grad_condition": 1317753085.472504,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 32.599539041519165
+ },
+ {
+ "epoch": 140,
+ "train_loss": 0.14277389855384826,
+ "train_acc": 0.9551,
+ "test_loss": 3.0536239072799685,
+ "test_acc": 0.5334,
+ "lyapunov": null,
+ "grad_norm": 0.3812502385842012,
+ "grad_max_sv": 0.2037056451663375,
+ "grad_min_sv": 7.302020117101499e-09,
+ "grad_condition": 4685216825.833342,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 32.60143446922302
+ },
+ {
+ "epoch": 141,
+ "train_loss": 0.14106001211643218,
+ "train_acc": 0.95592,
+ "test_loss": 3.0723882249832153,
+ "test_acc": 0.5322,
+ "lyapunov": null,
+ "grad_norm": 0.38539484766071236,
+ "grad_max_sv": 0.19134777113795282,
+ "grad_min_sv": 7.162904132459666e-09,
+ "grad_condition": 370718600.83184236,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 32.604408740997314
+ },
+ {
+ "epoch": 142,
+ "train_loss": 0.1438280531835556,
+ "train_acc": 0.95406,
+ "test_loss": 3.1630526540756225,
+ "test_acc": 0.526,
+ "lyapunov": null,
+ "grad_norm": 0.3885005879930968,
+ "grad_max_sv": 0.19621171467006207,
+ "grad_min_sv": 7.508452308209804e-09,
+ "grad_condition": 440340049.22603464,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 32.600708961486816
+ },
+ {
+ "epoch": 143,
+ "train_loss": 0.1418447697210312,
+ "train_acc": 0.95556,
+ "test_loss": 3.0879846578598023,
+ "test_acc": 0.5291,
+ "lyapunov": null,
+ "grad_norm": 0.3836324164118778,
+ "grad_max_sv": 0.188724672421813,
+ "grad_min_sv": 7.507878820815078e-09,
+ "grad_condition": 1051208641.6769501,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 32.61192798614502
+ },
+ {
+ "epoch": 144,
+ "train_loss": 0.14410037503242493,
+ "train_acc": 0.95534,
+ "test_loss": 3.1234459602355957,
+ "test_acc": 0.5318,
+ "lyapunov": null,
+ "grad_norm": 0.38512540576239257,
+ "grad_max_sv": 0.20008118823170662,
+ "grad_min_sv": 7.477710552595152e-09,
+ "grad_condition": 1216378712.8275027,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 32.67555069923401
+ },
+ {
+ "epoch": 145,
+ "train_loss": 0.14076073776245118,
+ "train_acc": 0.95618,
+ "test_loss": 3.0669401094436646,
+ "test_acc": 0.5376,
+ "lyapunov": null,
+ "grad_norm": 0.38185175053609804,
+ "grad_max_sv": 0.19599322322756052,
+ "grad_min_sv": 7.380410241113189e-09,
+ "grad_condition": 248121028.65324074,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 32.595621824264526
+ },
+ {
+ "epoch": 146,
+ "train_loss": 0.14235492443561554,
+ "train_acc": 0.95542,
+ "test_loss": 3.1099600078582763,
+ "test_acc": 0.5303,
+ "lyapunov": null,
+ "grad_norm": 0.3833756904141184,
+ "grad_max_sv": 0.19929019846022128,
+ "grad_min_sv": 7.511771148854818e-09,
+ "grad_condition": 234726041.20136175,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 32.61228895187378
+ },
+ {
+ "epoch": 147,
+ "train_loss": 0.1437687619996071,
+ "train_acc": 0.95498,
+ "test_loss": 3.1555084846496584,
+ "test_acc": 0.5253,
+ "lyapunov": null,
+ "grad_norm": 0.38692842594278615,
+ "grad_max_sv": 0.19934902153909206,
+ "grad_min_sv": 7.2967766568429565e-09,
+ "grad_condition": 2247202882.6063395,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 32.581571102142334
+ },
+ {
+ "epoch": 148,
+ "train_loss": 0.13997777037143708,
+ "train_acc": 0.95636,
+ "test_loss": 3.126287574195862,
+ "test_acc": 0.5349,
+ "lyapunov": null,
+ "grad_norm": 0.37982964494822274,
+ "grad_max_sv": 0.19688362777233123,
+ "grad_min_sv": 7.199474146620671e-09,
+ "grad_condition": 410986683.7547163,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 32.614789724349976
+ },
+ {
+ "epoch": 149,
+ "train_loss": 0.13758307416915894,
+ "train_acc": 0.9559,
+ "test_loss": 3.0673478214263916,
+ "test_acc": 0.5359,
+ "lyapunov": null,
+ "grad_norm": 0.37705013515223074,
+ "grad_max_sv": 0.20387833528220653,
+ "grad_min_sv": 7.47520324575064e-09,
+ "grad_condition": 2818005270.75425,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 32.597362995147705
+ },
+ {
+ "epoch": 150,
+ "train_loss": 0.13772287871360778,
+ "train_acc": 0.95614,
+ "test_loss": 3.273663801765442,
+ "test_acc": 0.5186,
+ "lyapunov": null,
+ "grad_norm": 0.3790080333138129,
+ "grad_max_sv": 0.2025493886321783,
+ "grad_min_sv": 7.3542313326689475e-09,
+ "grad_condition": 1465090879.8372142,
+ "lr": 0.0,
+ "time_sec": 32.61164855957031
+ }
+ ],
+ "12": [
+ {
+ "epoch": 1,
+ "train_loss": 4.866019581298828,
+ "train_acc": 0.03074,
+ "test_loss": 4.872710034179687,
+ "test_acc": 0.0143,
+ "lyapunov": null,
+ "grad_norm": 5.904015758743758,
+ "grad_max_sv": 5.3000179648399355,
+ "grad_min_sv": 9.986983708909492e-08,
+ "grad_condition": 75746426.03647776,
+ "lr": 0.0009998903417374227,
+ "time_sec": 49.65879511833191
+ },
+ {
+ "epoch": 2,
+ "train_loss": 4.336319505615235,
+ "train_acc": 0.05884,
+ "test_loss": 5.078699280548095,
+ "test_acc": 0.0179,
+ "lyapunov": null,
+ "grad_norm": 4.512132309010241,
+ "grad_max_sv": 3.9969229817390444,
+ "grad_min_sv": 7.723465306475052e-08,
+ "grad_condition": 99844248.01218227,
+ "lr": 0.0009995614150494292,
+ "time_sec": 49.67804217338562
+ },
+ {
+ "epoch": 3,
+ "train_loss": 4.054194154663086,
+ "train_acc": 0.08442,
+ "test_loss": 4.735939234924317,
+ "test_acc": 0.0289,
+ "lyapunov": null,
+ "grad_norm": 3.6216238346079055,
+ "grad_max_sv": 3.0721623718738558,
+ "grad_min_sv": 6.332745707271492e-08,
+ "grad_condition": 68533376.3072471,
+ "lr": 0.0009990133642141358,
+ "time_sec": 49.650996685028076
+ },
+ {
+ "epoch": 4,
+ "train_loss": 3.8553889916229247,
+ "train_acc": 0.11068,
+ "test_loss": 4.7776531311035155,
+ "test_acc": 0.04,
+ "lyapunov": null,
+ "grad_norm": 3.0027283473808,
+ "grad_max_sv": 2.4722895294427873,
+ "grad_min_sv": 5.260577265187028e-08,
+ "grad_condition": 133218192.19257763,
+ "lr": 0.0009982464296247522,
+ "time_sec": 49.62583518028259
+ },
+ {
+ "epoch": 5,
+ "train_loss": 3.6851790403747557,
+ "train_acc": 0.13608,
+ "test_loss": 4.847144582366943,
+ "test_acc": 0.0436,
+ "lyapunov": null,
+ "grad_norm": 2.4406262601219466,
+ "grad_max_sv": 1.8893477827310563,
+ "grad_min_sv": 4.253873583381917e-08,
+ "grad_condition": 53203728.717256345,
+ "lr": 0.0009972609476841367,
+ "time_sec": 49.64903235435486
+ },
+ {
+ "epoch": 6,
+ "train_loss": 3.557223811721802,
+ "train_acc": 0.1541,
+ "test_loss": 4.846635614776611,
+ "test_acc": 0.0504,
+ "lyapunov": null,
+ "grad_norm": 1.9869329520709325,
+ "grad_max_sv": 1.4254269927740097,
+ "grad_min_sv": 3.4773817814137684e-08,
+ "grad_condition": 109287419.58926606,
+ "lr": 0.000996057350657239,
+ "time_sec": 49.632389545440674
+ },
+ {
+ "epoch": 7,
+ "train_loss": 3.448442996292114,
+ "train_acc": 0.17344,
+ "test_loss": 5.146338744354248,
+ "test_acc": 0.0432,
+ "lyapunov": null,
+ "grad_norm": 1.6934869679578504,
+ "grad_max_sv": 1.111972664296627,
+ "grad_min_sv": 3.0129338379758507e-08,
+ "grad_condition": 49145502.73266151,
+ "lr": 0.000994636166481494,
+ "time_sec": 49.63013672828674
+ },
+ {
+ "epoch": 8,
+ "train_loss": 3.3602959382629396,
+ "train_acc": 0.18858,
+ "test_loss": 4.997173266601562,
+ "test_acc": 0.0549,
+ "lyapunov": null,
+ "grad_norm": 1.4715658174689026,
+ "grad_max_sv": 0.8646033376455307,
+ "grad_min_sv": 2.5999903535689484e-08,
+ "grad_condition": 38484605.38778691,
+ "lr": 0.0009929980185352525,
+ "time_sec": 49.63576054573059
+ },
+ {
+ "epoch": 9,
+ "train_loss": 3.2854549378204347,
+ "train_acc": 0.20336,
+ "test_loss": 5.892930588531494,
+ "test_acc": 0.0446,
+ "lyapunov": null,
+ "grad_norm": 1.3451340821865851,
+ "grad_max_sv": 0.7257503181695938,
+ "grad_min_sv": 2.3997866654967837e-08,
+ "grad_condition": 36951868.39671626,
+ "lr": 0.0009911436253643444,
+ "time_sec": 49.629499197006226
+ },
+ {
+ "epoch": 10,
+ "train_loss": 3.2246680919647215,
+ "train_acc": 0.21242,
+ "test_loss": 5.3121603576660155,
+ "test_acc": 0.0492,
+ "lyapunov": null,
+ "grad_norm": 1.2440111786697226,
+ "grad_max_sv": 0.6271802522242069,
+ "grad_min_sv": 2.25186588764803e-08,
+ "grad_condition": 32332715.425953984,
+ "lr": 0.0009890738003669028,
+ "time_sec": 49.677348613739014
+ },
+ {
+ "epoch": 11,
+ "train_loss": 3.1626394175720214,
+ "train_acc": 0.22606,
+ "test_loss": 6.13012219543457,
+ "test_acc": 0.0509,
+ "lyapunov": null,
+ "grad_norm": 1.1630276076372463,
+ "grad_max_sv": 0.5456254407763481,
+ "grad_min_sv": 2.0650329043969684e-08,
+ "grad_condition": 43285920.578072175,
+ "lr": 0.00098678945143658,
+ "time_sec": 49.63444662094116
+ },
+ {
+ "epoch": 12,
+ "train_loss": 3.105594987640381,
+ "train_acc": 0.2381,
+ "test_loss": 6.692684747314453,
+ "test_acc": 0.0337,
+ "lyapunov": null,
+ "grad_norm": 1.0991523249692334,
+ "grad_max_sv": 0.5055619306862355,
+ "grad_min_sv": 2.044758472541375e-08,
+ "grad_condition": 38174879.70426883,
+ "lr": 0.0009842915805643154,
+ "time_sec": 49.667534828186035
+ },
+ {
+ "epoch": 13,
+ "train_loss": 3.071034761581421,
+ "train_acc": 0.24202,
+ "test_loss": 6.808190565490722,
+ "test_acc": 0.0313,
+ "lyapunov": null,
+ "grad_norm": 1.0461733390262893,
+ "grad_max_sv": 0.45393969416618346,
+ "grad_min_sv": 1.9080661878279058e-08,
+ "grad_condition": 26144165.717305023,
+ "lr": 0.000981581283398829,
+ "time_sec": 49.651849031448364
+ },
+ {
+ "epoch": 14,
+ "train_loss": 3.031006901779175,
+ "train_acc": 0.25136,
+ "test_loss": 6.8066056442260745,
+ "test_acc": 0.0421,
+ "lyapunov": null,
+ "grad_norm": 1.0001345448432042,
+ "grad_max_sv": 0.4178654387593269,
+ "grad_min_sv": 1.817219532629366e-08,
+ "grad_condition": 26243292.8670463,
+ "lr": 0.0009786597487660333,
+ "time_sec": 49.67574381828308
+ },
+ {
+ "epoch": 15,
+ "train_loss": 2.992844039916992,
+ "train_acc": 0.25788,
+ "test_loss": 6.2335087615966795,
+ "test_acc": 0.0415,
+ "lyapunov": null,
+ "grad_norm": 0.9709343078677097,
+ "grad_max_sv": 0.40159890055656433,
+ "grad_min_sv": 1.7637466787068233e-08,
+ "grad_condition": 31130355.004485857,
+ "lr": 0.0009755282581475766,
+ "time_sec": 49.648940324783325
+ },
+ {
+ "epoch": 16,
+ "train_loss": 2.9533546379089355,
+ "train_acc": 0.2654,
+ "test_loss": 6.982061653900146,
+ "test_acc": 0.0331,
+ "lyapunov": null,
+ "grad_norm": 0.9294555695312433,
+ "grad_max_sv": 0.38935905918478964,
+ "grad_min_sv": 1.7345642956689833e-08,
+ "grad_condition": 34633361.17032104,
+ "lr": 0.0009721881851187403,
+ "time_sec": 49.62569880485535
+ },
+ {
+ "epoch": 17,
+ "train_loss": 2.9248884143066407,
+ "train_acc": 0.27134,
+ "test_loss": 5.847897528839112,
+ "test_acc": 0.0375,
+ "lyapunov": null,
+ "grad_norm": 0.8931744987288306,
+ "grad_max_sv": 0.3547165349125862,
+ "grad_min_sv": 1.6551659471827906e-08,
+ "grad_condition": 78906912.01626787,
+ "lr": 0.0009686409947459456,
+ "time_sec": 49.628357887268066
+ },
+ {
+ "epoch": 18,
+ "train_loss": 2.896197442779541,
+ "train_acc": 0.27548,
+ "test_loss": 6.654647819519043,
+ "test_acc": 0.0387,
+ "lyapunov": null,
+ "grad_norm": 0.8750290297759321,
+ "grad_max_sv": 0.3526077255606651,
+ "grad_min_sv": 1.6023472331015005e-08,
+ "grad_condition": 266939500.3731903,
+ "lr": 0.0009648882429441254,
+ "time_sec": 49.64867830276489
+ },
+ {
+ "epoch": 19,
+ "train_loss": 2.8669221867370607,
+ "train_acc": 0.28036,
+ "test_loss": 5.810343419647217,
+ "test_acc": 0.0502,
+ "lyapunov": null,
+ "grad_norm": 0.8587949296642396,
+ "grad_max_sv": 0.34078171029686927,
+ "grad_min_sv": 1.6171859118507826e-08,
+ "grad_condition": 22947806.160383917,
+ "lr": 0.00096093157579425,
+ "time_sec": 49.63094878196716
+ },
+ {
+ "epoch": 20,
+ "train_loss": 2.82938760848999,
+ "train_acc": 0.289,
+ "test_loss": 5.896671797180176,
+ "test_acc": 0.0461,
+ "lyapunov": null,
+ "grad_norm": 0.839027246743402,
+ "grad_max_sv": 0.3308767855167389,
+ "grad_min_sv": 1.570504673531481e-08,
+ "grad_condition": 24206043.26616613,
+ "lr": 0.0009567727288213001,
+ "time_sec": 49.6539568901062
+ },
+ {
+ "epoch": 21,
+ "train_loss": 2.8006727541351317,
+ "train_acc": 0.2938,
+ "test_loss": 6.180831294250488,
+ "test_acc": 0.0398,
+ "lyapunov": null,
+ "grad_norm": 0.8110141308366953,
+ "grad_max_sv": 0.3095390945672989,
+ "grad_min_sv": 1.4921404802026306e-08,
+ "grad_condition": 34079256.769043334,
+ "lr": 0.0009524135262330095,
+ "time_sec": 49.64039897918701
+ },
+ {
+ "epoch": 22,
+ "train_loss": 2.7774745903778078,
+ "train_acc": 0.29804,
+ "test_loss": 6.308743616485596,
+ "test_acc": 0.045,
+ "lyapunov": null,
+ "grad_norm": 0.8004103125902539,
+ "grad_max_sv": 0.31844869926571845,
+ "grad_min_sv": 1.5020042806734857e-08,
+ "grad_condition": 27917630.374082875,
+ "lr": 0.0009478558801197061,
+ "time_sec": 49.63332271575928
+ },
+ {
+ "epoch": 23,
+ "train_loss": 2.7524796044921875,
+ "train_acc": 0.30316,
+ "test_loss": 5.521375189208984,
+ "test_acc": 0.0535,
+ "lyapunov": null,
+ "grad_norm": 0.7869460876794067,
+ "grad_max_sv": 0.292531880363822,
+ "grad_min_sv": 1.448369401080285e-08,
+ "grad_condition": 35029756.554903194,
+ "lr": 0.000943101789615607,
+ "time_sec": 49.63528370857239
+ },
+ {
+ "epoch": 24,
+ "train_loss": 2.7253317372131347,
+ "train_acc": 0.3104,
+ "test_loss": 6.1194743759155275,
+ "test_acc": 0.0494,
+ "lyapunov": null,
+ "grad_norm": 0.7678368002286986,
+ "grad_max_sv": 0.29576918072998526,
+ "grad_min_sv": 1.4323617783529307e-08,
+ "grad_condition": 28702466.777186085,
+ "lr": 0.0009381533400219313,
+ "time_sec": 49.64074897766113
+ },
+ {
+ "epoch": 25,
+ "train_loss": 2.7074700713348387,
+ "train_acc": 0.31266,
+ "test_loss": 6.289851884460449,
+ "test_acc": 0.0462,
+ "lyapunov": null,
+ "grad_norm": 0.7683642905855677,
+ "grad_max_sv": 0.2851465784013271,
+ "grad_min_sv": 1.4292519384673242e-08,
+ "grad_condition": 22761462.806346737,
+ "lr": 0.0009330127018922189,
+ "time_sec": 49.631171464920044
+ },
+ {
+ "epoch": 26,
+ "train_loss": 2.686272830505371,
+ "train_acc": 0.3169,
+ "test_loss": 6.941660729980469,
+ "test_acc": 0.0479,
+ "lyapunov": null,
+ "grad_norm": 0.755488240958268,
+ "grad_max_sv": 0.28228237964212893,
+ "grad_min_sv": 1.4025971441233854e-08,
+ "grad_condition": 35803882.89457456,
+ "lr": 0.000927682130080253,
+ "time_sec": 49.64768934249878
+ },
+ {
+ "epoch": 27,
+ "train_loss": 2.6507435781860353,
+ "train_acc": 0.32476,
+ "test_loss": 5.651136081695556,
+ "test_acc": 0.0552,
+ "lyapunov": null,
+ "grad_norm": 0.7510174800021984,
+ "grad_max_sv": 0.2705878522247076,
+ "grad_min_sv": 1.3801869563900837e-08,
+ "grad_condition": 24650339.234644465,
+ "lr": 0.0009221639627510072,
+ "time_sec": 49.63985729217529
+ },
+ {
+ "epoch": 28,
+ "train_loss": 2.6402551649475097,
+ "train_acc": 0.32708,
+ "test_loss": 6.290144860839844,
+ "test_acc": 0.042,
+ "lyapunov": null,
+ "grad_norm": 0.7327305496870947,
+ "grad_max_sv": 0.26595143899321555,
+ "grad_min_sv": 1.3485531080714708e-08,
+ "grad_condition": 24838092.070290618,
+ "lr": 0.0009164606203550494,
+ "time_sec": 49.668391704559326
+ },
+ {
+ "epoch": 29,
+ "train_loss": 2.6250381271362304,
+ "train_acc": 0.32904,
+ "test_loss": 5.969137829589844,
+ "test_acc": 0.0584,
+ "lyapunov": null,
+ "grad_norm": 0.7326068006390382,
+ "grad_max_sv": 0.27750224173069,
+ "grad_min_sv": 1.3820259439634164e-08,
+ "grad_condition": 23369103.19183632,
+ "lr": 0.0009105746045668516,
+ "time_sec": 49.66312098503113
+ },
+ {
+ "epoch": 30,
+ "train_loss": 2.5943477003479005,
+ "train_acc": 0.3349,
+ "test_loss": 5.8657053939819335,
+ "test_acc": 0.0662,
+ "lyapunov": null,
+ "grad_norm": 0.7282576381570287,
+ "grad_max_sv": 0.267722587287426,
+ "grad_min_sv": 1.3611432567173232e-08,
+ "grad_condition": 33832306.890324585,
+ "lr": 0.0009045084971874733,
+ "time_sec": 49.635533809661865
+ },
+ {
+ "epoch": 31,
+ "train_loss": 2.5734296069335936,
+ "train_acc": 0.3377,
+ "test_loss": 5.947202941894531,
+ "test_acc": 0.0536,
+ "lyapunov": null,
+ "grad_norm": 0.72371197105418,
+ "grad_max_sv": 0.2766475807875395,
+ "grad_min_sv": 1.3626912859915353e-08,
+ "grad_condition": 57961221.39827029,
+ "lr": 0.0008982649590120977,
+ "time_sec": 49.64917349815369
+ },
+ {
+ "epoch": 32,
+ "train_loss": 2.564406160736084,
+ "train_acc": 0.34312,
+ "test_loss": 5.720430706787109,
+ "test_acc": 0.0515,
+ "lyapunov": null,
+ "grad_norm": 0.7163915374705971,
+ "grad_max_sv": 0.25801267102360725,
+ "grad_min_sv": 1.3336803814101295e-08,
+ "grad_condition": 26182544.879379902,
+ "lr": 0.0008918467286629196,
+ "time_sec": 49.67513680458069
+ },
+ {
+ "epoch": 33,
+ "train_loss": 2.5487507371520994,
+ "train_acc": 0.3468,
+ "test_loss": 6.23959475479126,
+ "test_acc": 0.0534,
+ "lyapunov": null,
+ "grad_norm": 0.7054942364907418,
+ "grad_max_sv": 0.24919774606823922,
+ "grad_min_sv": 1.306408175666407e-08,
+ "grad_condition": 26801620.75531055,
+ "lr": 0.0008852566213878943,
+ "time_sec": 49.64692521095276
+ },
+ {
+ "epoch": 34,
+ "train_loss": 2.5242181804656982,
+ "train_acc": 0.34942,
+ "test_loss": 6.2963892974853515,
+ "test_acc": 0.0553,
+ "lyapunov": null,
+ "grad_norm": 0.7016169815154498,
+ "grad_max_sv": 0.25484145022928717,
+ "grad_min_sv": 1.3042181151723397e-08,
+ "grad_condition": 22430709.73115928,
+ "lr": 0.000878497527825878,
+ "time_sec": 49.654839754104614
+ },
+ {
+ "epoch": 35,
+ "train_loss": 2.5094819609832766,
+ "train_acc": 0.35066,
+ "test_loss": 6.719456141662597,
+ "test_acc": 0.0546,
+ "lyapunov": null,
+ "grad_norm": 0.6984323559876441,
+ "grad_max_sv": 0.25291088260710237,
+ "grad_min_sv": 1.3091225495309722e-08,
+ "grad_condition": 24055952.13732664,
+ "lr": 0.000871572412738697,
+ "time_sec": 49.63660550117493
+ },
+ {
+ "epoch": 36,
+ "train_loss": 2.482266076126099,
+ "train_acc": 0.35974,
+ "test_loss": 6.552088442993164,
+ "test_acc": 0.0652,
+ "lyapunov": null,
+ "grad_norm": 0.6961085506168149,
+ "grad_max_sv": 0.25587535500526426,
+ "grad_min_sv": 1.3084706912414034e-08,
+ "grad_condition": 29953242.59302296,
+ "lr": 0.0008644843137107055,
+ "time_sec": 49.636728286743164
+ },
+ {
+ "epoch": 37,
+ "train_loss": 2.4597298861694337,
+ "train_acc": 0.36194,
+ "test_loss": 7.314365348815918,
+ "test_acc": 0.0495,
+ "lyapunov": null,
+ "grad_norm": 0.6914952761349973,
+ "grad_max_sv": 0.24747973680496216,
+ "grad_min_sv": 1.3026676748406629e-08,
+ "grad_condition": 27342755.995011915,
+ "lr": 0.0008572363398164014,
+ "time_sec": 49.638224363327026
+ },
+ {
+ "epoch": 38,
+ "train_loss": 2.4654034370422364,
+ "train_acc": 0.36094,
+ "test_loss": 6.702982992553711,
+ "test_acc": 0.0509,
+ "lyapunov": null,
+ "grad_norm": 0.6892432022946228,
+ "grad_max_sv": 0.2394346885383129,
+ "grad_min_sv": 1.273180681438113e-08,
+ "grad_condition": 22022203.054304175,
+ "lr": 0.0008498316702566826,
+ "time_sec": 49.639644145965576
+ },
+ {
+ "epoch": 39,
+ "train_loss": 2.42667671333313,
+ "train_acc": 0.36782,
+ "test_loss": 6.179627616882324,
+ "test_acc": 0.0407,
+ "lyapunov": null,
+ "grad_norm": 0.6855295822993354,
+ "grad_max_sv": 0.24026529379189016,
+ "grad_min_sv": 1.2694210569513809e-08,
+ "grad_condition": 40057775.67721417,
+ "lr": 0.0008422735529643442,
+ "time_sec": 49.63581466674805
+ },
+ {
+ "epoch": 40,
+ "train_loss": 2.4109215718841552,
+ "train_acc": 0.37052,
+ "test_loss": 6.805292085266113,
+ "test_acc": 0.0527,
+ "lyapunov": null,
+ "grad_norm": 0.6807278981220505,
+ "grad_max_sv": 0.23731110394001007,
+ "grad_min_sv": 1.2639894338140056e-08,
+ "grad_condition": 27610612.2175704,
+ "lr": 0.0008345653031794289,
+ "time_sec": 49.64470100402832
+ },
+ {
+ "epoch": 41,
+ "train_loss": 2.394052338409424,
+ "train_acc": 0.37456,
+ "test_loss": 6.000495677947998,
+ "test_acc": 0.0498,
+ "lyapunov": null,
+ "grad_norm": 0.684187370269629,
+ "grad_max_sv": 0.24500937685370444,
+ "grad_min_sv": 1.290876201071045e-08,
+ "grad_condition": 57507496.68239377,
+ "lr": 0.0008267103019950526,
+ "time_sec": 49.64144778251648
+ },
+ {
+ "epoch": 42,
+ "train_loss": 2.369488366241455,
+ "train_acc": 0.37932,
+ "test_loss": 5.813188542175293,
+ "test_acc": 0.0442,
+ "lyapunov": null,
+ "grad_norm": 0.6660607900191566,
+ "grad_max_sv": 0.23581123538315296,
+ "grad_min_sv": 1.243826876218268e-08,
+ "grad_condition": 43225809.82445784,
+ "lr": 0.0008187119948743447,
+ "time_sec": 49.65106153488159
+ },
+ {
+ "epoch": 43,
+ "train_loss": 2.349871713409424,
+ "train_acc": 0.38354,
+ "test_loss": 6.650400701904297,
+ "test_acc": 0.054,
+ "lyapunov": null,
+ "grad_norm": 0.6728559080292662,
+ "grad_max_sv": 0.23216901496052741,
+ "grad_min_sv": 1.2423243067605228e-08,
+ "grad_condition": 97229672.46407479,
+ "lr": 0.000810573890139155,
+ "time_sec": 49.6483952999115
+ },
+ {
+ "epoch": 44,
+ "train_loss": 2.3327147588348387,
+ "train_acc": 0.38762,
+ "test_loss": 7.37770638885498,
+ "test_acc": 0.0556,
+ "lyapunov": null,
+ "grad_norm": 0.6708437479650249,
+ "grad_max_sv": 0.2353798534721136,
+ "grad_min_sv": 1.2329054610571433e-08,
+ "grad_condition": 24315327.09270349,
+ "lr": 0.0008022995574311873,
+ "time_sec": 49.649359464645386
+ },
+ {
+ "epoch": 45,
+ "train_loss": 2.3379388195037842,
+ "train_acc": 0.38554,
+ "test_loss": 7.32100400390625,
+ "test_acc": 0.0447,
+ "lyapunov": null,
+ "grad_norm": 0.6690933212170967,
+ "grad_max_sv": 0.23992121778428555,
+ "grad_min_sv": 1.2581548722301328e-08,
+ "grad_condition": 23582198.377444454,
+ "lr": 0.0007938926261462363,
+ "time_sec": 49.65408158302307
+ },
+ {
+ "epoch": 46,
+ "train_loss": 2.3259339227294924,
+ "train_acc": 0.3881,
+ "test_loss": 5.903630683898926,
+ "test_acc": 0.0532,
+ "lyapunov": null,
+ "grad_norm": 0.6696674111669629,
+ "grad_max_sv": 0.24237493835389615,
+ "grad_min_sv": 1.264802341723395e-08,
+ "grad_condition": 189995164.68487653,
+ "lr": 0.0007853567838422158,
+ "time_sec": 49.62894296646118
+ },
+ {
+ "epoch": 47,
+ "train_loss": 2.3060372606658937,
+ "train_acc": 0.39222,
+ "test_loss": 6.722331466674805,
+ "test_acc": 0.052,
+ "lyapunov": null,
+ "grad_norm": 0.6608950831630619,
+ "grad_max_sv": 0.2247944913804531,
+ "grad_min_sv": 1.2062996512373236e-08,
+ "grad_condition": 1083025267.50655,
+ "lr": 0.0007766957746216719,
+ "time_sec": 49.62338829040527
+ },
+ {
+ "epoch": 48,
+ "train_loss": 2.283214527587891,
+ "train_acc": 0.39554,
+ "test_loss": 6.30029787979126,
+ "test_acc": 0.058,
+ "lyapunov": null,
+ "grad_norm": 0.6607285996206229,
+ "grad_max_sv": 0.23341836147010325,
+ "grad_min_sv": 1.2354938326575304e-08,
+ "grad_condition": 30471435.85248127,
+ "lr": 0.0007679133974894982,
+ "time_sec": 49.62940454483032
+ },
+ {
+ "epoch": 49,
+ "train_loss": 2.2607837000274658,
+ "train_acc": 0.39988,
+ "test_loss": 5.6582544311523435,
+ "test_acc": 0.0597,
+ "lyapunov": null,
+ "grad_norm": 0.6558663174998175,
+ "grad_max_sv": 0.22986114919185638,
+ "grad_min_sv": 1.2380245191512263e-08,
+ "grad_condition": 37434404.18782197,
+ "lr": 0.000759013504686565,
+ "time_sec": 49.63751459121704
+ },
+ {
+ "epoch": 50,
+ "train_loss": 2.245105714797974,
+ "train_acc": 0.40408,
+ "test_loss": 6.382824391937256,
+ "test_acc": 0.0387,
+ "lyapunov": null,
+ "grad_norm": 0.6549241097715082,
+ "grad_max_sv": 0.2248407918959856,
+ "grad_min_sv": 1.2180415326357163e-08,
+ "grad_condition": 21126842.856077008,
+ "lr": 0.0007499999999999998,
+ "time_sec": 49.62160301208496
+ },
+ {
+ "epoch": 51,
+ "train_loss": 2.235931240615845,
+ "train_acc": 0.40734,
+ "test_loss": 5.594304537963867,
+ "test_acc": 0.0703,
+ "lyapunov": null,
+ "grad_norm": 0.6606674978525966,
+ "grad_max_sv": 0.23265439458191395,
+ "grad_min_sv": 1.2417693201483005e-08,
+ "grad_condition": 38123270.60577395,
+ "lr": 0.0007408768370508575,
+ "time_sec": 49.63914489746094
+ },
+ {
+ "epoch": 52,
+ "train_loss": 2.220252141571045,
+ "train_acc": 0.40908,
+ "test_loss": 5.49668860168457,
+ "test_acc": 0.0417,
+ "lyapunov": null,
+ "grad_norm": 0.6502905279074903,
+ "grad_max_sv": 0.23435013145208358,
+ "grad_min_sv": 1.2266832496304891e-08,
+ "grad_condition": 38310230.157323316,
+ "lr": 0.0007316480175599307,
+ "time_sec": 49.623440980911255
+ },
+ {
+ "epoch": 53,
+ "train_loss": 2.20186401260376,
+ "train_acc": 0.41488,
+ "test_loss": 6.196598785400391,
+ "test_acc": 0.052,
+ "lyapunov": null,
+ "grad_norm": 0.6529977877477179,
+ "grad_max_sv": 0.23160336054861547,
+ "grad_min_sv": 1.213869888216923e-08,
+ "grad_condition": 32786030.078148127,
+ "lr": 0.0007223175895924635,
+ "time_sec": 49.645137548446655
+ },
+ {
+ "epoch": 54,
+ "train_loss": 2.192180712852478,
+ "train_acc": 0.41462,
+ "test_loss": 6.966438492584229,
+ "test_acc": 0.0515,
+ "lyapunov": null,
+ "grad_norm": 0.6546718868496101,
+ "grad_max_sv": 0.23001223765313625,
+ "grad_min_sv": 1.2304833968412864e-08,
+ "grad_condition": 26553928.3741663,
+ "lr": 0.0007128896457825361,
+ "time_sec": 49.642454862594604
+ },
+ {
+ "epoch": 55,
+ "train_loss": 2.1692851805114746,
+ "train_acc": 0.42174,
+ "test_loss": 6.76854267578125,
+ "test_acc": 0.0514,
+ "lyapunov": null,
+ "grad_norm": 0.6573722021244011,
+ "grad_max_sv": 0.22808259911835194,
+ "grad_min_sv": 1.2273855956590473e-08,
+ "grad_condition": 23253160.925169718,
+ "lr": 0.0007033683215378998,
+ "time_sec": 49.62129521369934
+ },
+ {
+ "epoch": 56,
+ "train_loss": 2.1607114459228516,
+ "train_acc": 0.42392,
+ "test_loss": 6.366939366912842,
+ "test_acc": 0.0595,
+ "lyapunov": null,
+ "grad_norm": 0.6541197760013122,
+ "grad_max_sv": 0.2261738982051611,
+ "grad_min_sv": 1.2211666097772245e-08,
+ "grad_condition": 40339824.5426622,
+ "lr": 0.0006937577932260512,
+ "time_sec": 49.614548444747925
+ },
+ {
+ "epoch": 57,
+ "train_loss": 2.1550695499420165,
+ "train_acc": 0.42292,
+ "test_loss": 6.088698851013183,
+ "test_acc": 0.0407,
+ "lyapunov": null,
+ "grad_norm": 0.6495499294349419,
+ "grad_max_sv": 0.22787895202636718,
+ "grad_min_sv": 1.2191535223027294e-08,
+ "grad_condition": 46151755.99995027,
+ "lr": 0.0006840622763423388,
+ "time_sec": 49.86520218849182
+ },
+ {
+ "epoch": 58,
+ "train_loss": 2.1309228759002687,
+ "train_acc": 0.4298,
+ "test_loss": 6.714969717407227,
+ "test_acc": 0.0476,
+ "lyapunov": null,
+ "grad_norm": 0.6501923826294874,
+ "grad_max_sv": 0.2294207103550434,
+ "grad_min_sv": 1.2324306024324993e-08,
+ "grad_condition": 27012371.00660652,
+ "lr": 0.0006742860236609073,
+ "time_sec": 49.61659789085388
+ },
+ {
+ "epoch": 59,
+ "train_loss": 2.1276511294555664,
+ "train_acc": 0.43052,
+ "test_loss": 7.850105988311768,
+ "test_acc": 0.0531,
+ "lyapunov": null,
+ "grad_norm": 0.6522053097296127,
+ "grad_max_sv": 0.23177195861935615,
+ "grad_min_sv": 1.2570549945412068e-08,
+ "grad_condition": 21066069.902124517,
+ "lr": 0.0006644333233692913,
+ "time_sec": 49.61627125740051
+ },
+ {
+ "epoch": 60,
+ "train_loss": 2.108223154907227,
+ "train_acc": 0.43206,
+ "test_loss": 6.194909986877441,
+ "test_acc": 0.0601,
+ "lyapunov": null,
+ "grad_norm": 0.6509457366232547,
+ "grad_max_sv": 0.2232413150370121,
+ "grad_min_sv": 1.2092985912648402e-08,
+ "grad_condition": 20482533.369790833,
+ "lr": 0.0006545084971874734,
+ "time_sec": 49.638840198516846
+ },
+ {
+ "epoch": 61,
+ "train_loss": 2.0873364936828613,
+ "train_acc": 0.43732,
+ "test_loss": 7.149879702758789,
+ "test_acc": 0.0579,
+ "lyapunov": null,
+ "grad_norm": 0.6448496636259025,
+ "grad_max_sv": 0.2204914376139641,
+ "grad_min_sv": 1.2118930678428619e-08,
+ "grad_condition": 22158498.545212857,
+ "lr": 0.0006445158984722354,
+ "time_sec": 49.64352631568909
+ },
+ {
+ "epoch": 62,
+ "train_loss": 2.0711798847961425,
+ "train_acc": 0.4403,
+ "test_loss": 6.873784851074219,
+ "test_acc": 0.0519,
+ "lyapunov": null,
+ "grad_norm": 0.650740813617645,
+ "grad_max_sv": 0.23042820766568184,
+ "grad_min_sv": 1.2226469767173676e-08,
+ "grad_condition": 22253714.267564178,
+ "lr": 0.0006344599103076324,
+ "time_sec": 49.61197328567505
+ },
+ {
+ "epoch": 63,
+ "train_loss": 2.0670838510131837,
+ "train_acc": 0.44428,
+ "test_loss": 8.138898289489745,
+ "test_acc": 0.0465,
+ "lyapunov": null,
+ "grad_norm": 0.6500300321497959,
+ "grad_max_sv": 0.22807052806019784,
+ "grad_min_sv": 1.2282747885450362e-08,
+ "grad_condition": 25613801.10650332,
+ "lr": 0.0006243449435824269,
+ "time_sec": 49.64067339897156
+ },
+ {
+ "epoch": 64,
+ "train_loss": 2.0602053503417967,
+ "train_acc": 0.44336,
+ "test_loss": 6.739065780639648,
+ "test_acc": 0.0435,
+ "lyapunov": null,
+ "grad_norm": 0.6438167751087027,
+ "grad_max_sv": 0.21950027868151664,
+ "grad_min_sv": 1.1978744509505424e-08,
+ "grad_condition": 69086045.79764383,
+ "lr": 0.0006141754350553275,
+ "time_sec": 49.63843250274658
+ },
+ {
+ "epoch": 65,
+ "train_loss": 2.0289339319610598,
+ "train_acc": 0.4504,
+ "test_loss": 5.612693282318115,
+ "test_acc": 0.0624,
+ "lyapunov": null,
+ "grad_norm": 0.643091891417901,
+ "grad_max_sv": 0.2296879008412361,
+ "grad_min_sv": 1.2095985612095573e-08,
+ "grad_condition": 207267738.03108597,
+ "lr": 0.0006039558454088793,
+ "time_sec": 49.621809244155884
+ },
+ {
+ "epoch": 66,
+ "train_loss": 2.017880793533325,
+ "train_acc": 0.45524,
+ "test_loss": 5.917317507934571,
+ "test_acc": 0.0569,
+ "lyapunov": null,
+ "grad_norm": 0.6458313703477052,
+ "grad_max_sv": 0.2203237745910883,
+ "grad_min_sv": 1.2053612886975263e-08,
+ "grad_condition": 30573308.01952803,
+ "lr": 0.000593690657292862,
+ "time_sec": 49.62665867805481
+ },
+ {
+ "epoch": 67,
+ "train_loss": 2.00664087310791,
+ "train_acc": 0.45516,
+ "test_loss": 5.649988233947754,
+ "test_acc": 0.0551,
+ "lyapunov": null,
+ "grad_norm": 0.6469506065081965,
+ "grad_max_sv": 0.22469568885862828,
+ "grad_min_sv": 1.2245062176730048e-08,
+ "grad_condition": 29605005.92733214,
+ "lr": 0.0005833843733580507,
+ "time_sec": 49.66580653190613
+ },
+ {
+ "epoch": 68,
+ "train_loss": 1.9934558868789674,
+ "train_acc": 0.45752,
+ "test_loss": 6.518855290222168,
+ "test_acc": 0.0474,
+ "lyapunov": null,
+ "grad_norm": 0.6449120600766396,
+ "grad_max_sv": 0.22343773469328881,
+ "grad_min_sv": 1.2075202887595893e-08,
+ "grad_condition": 20470063.13805929,
+ "lr": 0.0005730415142812054,
+ "time_sec": 49.649908781051636
+ },
+ {
+ "epoch": 69,
+ "train_loss": 1.9819465933609008,
+ "train_acc": 0.4615,
+ "test_loss": 5.741820652770996,
+ "test_acc": 0.0576,
+ "lyapunov": null,
+ "grad_norm": 0.6444073081455958,
+ "grad_max_sv": 0.2133765324950218,
+ "grad_min_sv": 1.1591837454538903e-08,
+ "grad_condition": 7400690970.849569,
+ "lr": 0.0005626666167821517,
+ "time_sec": 49.64708852767944
+ },
+ {
+ "epoch": 70,
+ "train_loss": 1.9717326400756836,
+ "train_acc": 0.4635,
+ "test_loss": 6.180095139312744,
+ "test_acc": 0.0538,
+ "lyapunov": null,
+ "grad_norm": 0.646339670655307,
+ "grad_max_sv": 0.22971010841429235,
+ "grad_min_sv": 1.1938921282844683e-08,
+ "grad_condition": 42308986.45036293,
+ "lr": 0.0005522642316338265,
+ "time_sec": 49.65745282173157
+ },
+ {
+ "epoch": 71,
+ "train_loss": 1.947042868385315,
+ "train_acc": 0.46858,
+ "test_loss": 5.758691899871827,
+ "test_acc": 0.0481,
+ "lyapunov": null,
+ "grad_norm": 0.6454285691467331,
+ "grad_max_sv": 0.21988087929785252,
+ "grad_min_sv": 1.2038080984128063e-08,
+ "grad_condition": 54275907.24262571,
+ "lr": 0.0005418389216661573,
+ "time_sec": 49.655876874923706
+ },
+ {
+ "epoch": 72,
+ "train_loss": 1.9380216747283936,
+ "train_acc": 0.47278,
+ "test_loss": 5.360606885528564,
+ "test_acc": 0.0499,
+ "lyapunov": null,
+ "grad_norm": 0.6445951712238421,
+ "grad_max_sv": 0.22141558788716792,
+ "grad_min_sv": 1.2052524836839163e-08,
+ "grad_condition": 52658770.62947424,
+ "lr": 0.0005313952597646563,
+ "time_sec": 49.643407106399536
+ },
+ {
+ "epoch": 73,
+ "train_loss": 1.9315852340698243,
+ "train_acc": 0.47042,
+ "test_loss": 5.562986553955078,
+ "test_acc": 0.0528,
+ "lyapunov": null,
+ "grad_norm": 0.6455449182300289,
+ "grad_max_sv": 0.22759805843234063,
+ "grad_min_sv": 1.2166670372570909e-08,
+ "grad_condition": 25263034.87545003,
+ "lr": 0.0005209378268645994,
+ "time_sec": 49.65730333328247
+ },
+ {
+ "epoch": 74,
+ "train_loss": 1.9174984769439698,
+ "train_acc": 0.47274,
+ "test_loss": 5.779887171173096,
+ "test_acc": 0.0526,
+ "lyapunov": null,
+ "grad_norm": 0.6408982744466406,
+ "grad_max_sv": 0.223176771402359,
+ "grad_min_sv": 1.1881650463507754e-08,
+ "grad_condition": 21609418.938555025,
+ "lr": 0.0005104712099416781,
+ "time_sec": 49.63982319831848
+ },
+ {
+ "epoch": 75,
+ "train_loss": 1.9022090718841553,
+ "train_acc": 0.47956,
+ "test_loss": 6.74227056427002,
+ "test_acc": 0.0396,
+ "lyapunov": null,
+ "grad_norm": 0.6439391169821848,
+ "grad_max_sv": 0.22340110316872597,
+ "grad_min_sv": 1.1930816612437667e-08,
+ "grad_condition": 22835938.88370643,
+ "lr": 0.0004999999999999996,
+ "time_sec": 49.6373016834259
+ },
+ {
+ "epoch": 76,
+ "train_loss": 1.8833642294311523,
+ "train_acc": 0.48212,
+ "test_loss": 6.253941902160644,
+ "test_acc": 0.0401,
+ "lyapunov": null,
+ "grad_norm": 0.6458465784916259,
+ "grad_max_sv": 0.2219920836389065,
+ "grad_min_sv": 1.1862058124645358e-08,
+ "grad_condition": 24923864.351812743,
+ "lr": 0.0004895287900583212,
+ "time_sec": 49.63244032859802
+ },
+ {
+ "epoch": 77,
+ "train_loss": 1.872097596054077,
+ "train_acc": 0.4862,
+ "test_loss": 7.115831829833985,
+ "test_acc": 0.0455,
+ "lyapunov": null,
+ "grad_norm": 0.6389496343286681,
+ "grad_max_sv": 0.2166093897074461,
+ "grad_min_sv": 1.1753041695428124e-08,
+ "grad_condition": 123847363.5090142,
+ "lr": 0.0004790621731353997,
+ "time_sec": 49.65565347671509
+ },
+ {
+ "epoch": 78,
+ "train_loss": 1.8647768477630615,
+ "train_acc": 0.48824,
+ "test_loss": 6.585789360046387,
+ "test_acc": 0.0461,
+ "lyapunov": null,
+ "grad_norm": 0.6430712356182874,
+ "grad_max_sv": 0.2195899412035942,
+ "grad_min_sv": 1.2243656302224696e-08,
+ "grad_condition": 424951771.80469763,
+ "lr": 0.000468604740235343,
+ "time_sec": 49.62981295585632
+ },
+ {
+ "epoch": 79,
+ "train_loss": 1.8419312603759765,
+ "train_acc": 0.49144,
+ "test_loss": 6.8796092208862305,
+ "test_acc": 0.0534,
+ "lyapunov": null,
+ "grad_norm": 0.6438732522551095,
+ "grad_max_sv": 0.223552468046546,
+ "grad_min_sv": 1.2100811991712716e-08,
+ "grad_condition": 310767823.54431427,
+ "lr": 0.00045816107833384175,
+ "time_sec": 49.63279318809509
+ },
+ {
+ "epoch": 80,
+ "train_loss": 1.8222150116348266,
+ "train_acc": 0.49938,
+ "test_loss": 6.9083010223388674,
+ "test_acc": 0.0574,
+ "lyapunov": null,
+ "grad_norm": 0.646876723364354,
+ "grad_max_sv": 0.22485989183187485,
+ "grad_min_sv": 1.2241183645900212e-08,
+ "grad_condition": 28086849.755860113,
+ "lr": 0.0004477357683661729,
+ "time_sec": 49.6425895690918
+ },
+ {
+ "epoch": 81,
+ "train_loss": 1.813687347946167,
+ "train_acc": 0.49976,
+ "test_loss": 6.90407081451416,
+ "test_acc": 0.04,
+ "lyapunov": null,
+ "grad_norm": 0.642733217341124,
+ "grad_max_sv": 0.22463089227676392,
+ "grad_min_sv": 1.2082413675118531e-08,
+ "grad_condition": 22301589.48218178,
+ "lr": 0.00043733338321784746,
+ "time_sec": 49.629480838775635
+ },
+ {
+ "epoch": 82,
+ "train_loss": 1.7951585668945313,
+ "train_acc": 0.5034,
+ "test_loss": 7.836273937988281,
+ "test_acc": 0.0512,
+ "lyapunov": null,
+ "grad_norm": 0.6454340294520209,
+ "grad_max_sv": 0.22539752162992954,
+ "grad_min_sv": 1.1886250314216417e-08,
+ "grad_condition": 59544024.862964645,
+ "lr": 0.0004269584857187939,
+ "time_sec": 49.61994457244873
+ },
+ {
+ "epoch": 83,
+ "train_loss": 1.7966358541488647,
+ "train_acc": 0.50272,
+ "test_loss": 7.222357276916504,
+ "test_acc": 0.0579,
+ "lyapunov": null,
+ "grad_norm": 0.6453223951998842,
+ "grad_max_sv": 0.22831037007272242,
+ "grad_min_sv": 1.203974950118869e-08,
+ "grad_condition": 82894748.52704917,
+ "lr": 0.0004166156266419484,
+ "time_sec": 49.673835039138794
+ },
+ {
+ "epoch": 84,
+ "train_loss": 1.7854290616226196,
+ "train_acc": 0.50408,
+ "test_loss": 6.414771678161621,
+ "test_acc": 0.0601,
+ "lyapunov": null,
+ "grad_norm": 0.6427673490554981,
+ "grad_max_sv": 0.2182640478014946,
+ "grad_min_sv": 1.202259434229802e-08,
+ "grad_condition": 21861556.418338913,
+ "lr": 0.0004063093427071373,
+ "time_sec": 49.64637732505798
+ },
+ {
+ "epoch": 85,
+ "train_loss": 1.7772653774261475,
+ "train_acc": 0.5111,
+ "test_loss": 7.505108009338379,
+ "test_acc": 0.0616,
+ "lyapunov": null,
+ "grad_norm": 0.6410246970315546,
+ "grad_max_sv": 0.2277263168245554,
+ "grad_min_sv": 1.1847804396586393e-08,
+ "grad_condition": 36055137.59124441,
+ "lr": 0.0003960441545911199,
+ "time_sec": 49.642088174819946
+ },
+ {
+ "epoch": 86,
+ "train_loss": 1.7477331000518799,
+ "train_acc": 0.5147,
+ "test_loss": 7.709722770690918,
+ "test_acc": 0.0449,
+ "lyapunov": null,
+ "grad_norm": 0.6439998427728569,
+ "grad_max_sv": 0.22573819942772388,
+ "grad_min_sv": 1.2154757376287017e-08,
+ "grad_condition": 47618357.203088775,
+ "lr": 0.0003858245649446718,
+ "time_sec": 49.63089942932129
+ },
+ {
+ "epoch": 87,
+ "train_loss": 1.7338512952423095,
+ "train_acc": 0.51864,
+ "test_loss": 7.293183726501465,
+ "test_acc": 0.0531,
+ "lyapunov": null,
+ "grad_norm": 0.6450352139357391,
+ "grad_max_sv": 0.2251686044037342,
+ "grad_min_sv": 1.2090907994255495e-08,
+ "grad_condition": 23129638.107943743,
+ "lr": 0.00037565505641757235,
+ "time_sec": 49.62959694862366
+ },
+ {
+ "epoch": 88,
+ "train_loss": 1.7305470868301391,
+ "train_acc": 0.51752,
+ "test_loss": 6.886636978912353,
+ "test_acc": 0.0621,
+ "lyapunov": null,
+ "grad_norm": 0.6466229739487265,
+ "grad_max_sv": 0.2285929098725319,
+ "grad_min_sv": 1.2207108990238031e-08,
+ "grad_condition": 639961294.3776948,
+ "lr": 0.00036554008969236695,
+ "time_sec": 49.64359998703003
+ },
+ {
+ "epoch": 89,
+ "train_loss": 1.7247330599212647,
+ "train_acc": 0.52118,
+ "test_loss": 7.737054846954345,
+ "test_acc": 0.0492,
+ "lyapunov": null,
+ "grad_norm": 0.6431070021674609,
+ "grad_max_sv": 0.21853713542222977,
+ "grad_min_sv": 1.1871128499651996e-08,
+ "grad_condition": 34316573.10990389,
+ "lr": 0.0003554841015277638,
+ "time_sec": 49.6319477558136
+ },
+ {
+ "epoch": 90,
+ "train_loss": 1.704887728881836,
+ "train_acc": 0.52374,
+ "test_loss": 6.713198412322998,
+ "test_acc": 0.0556,
+ "lyapunov": null,
+ "grad_norm": 0.6451375385492529,
+ "grad_max_sv": 0.22224950045347214,
+ "grad_min_sv": 1.2021271361684072e-08,
+ "grad_condition": 25574543.625141606,
+ "lr": 0.000345491502812526,
+ "time_sec": 49.63963174819946
+ },
+ {
+ "epoch": 91,
+ "train_loss": 1.701412860145569,
+ "train_acc": 0.52644,
+ "test_loss": 7.295478704833984,
+ "test_acc": 0.0429,
+ "lyapunov": null,
+ "grad_norm": 0.6447266155116032,
+ "grad_max_sv": 0.23335366621613501,
+ "grad_min_sv": 1.257304017843186e-08,
+ "grad_condition": 24036732.36328527,
+ "lr": 0.0003355666766307081,
+ "time_sec": 49.665791511535645
+ },
+ {
+ "epoch": 92,
+ "train_loss": 1.6871472067642213,
+ "train_acc": 0.53048,
+ "test_loss": 7.389536867523193,
+ "test_acc": 0.0375,
+ "lyapunov": null,
+ "grad_norm": 0.6468836541708367,
+ "grad_max_sv": 0.2225259728729725,
+ "grad_min_sv": 1.1890293904331939e-08,
+ "grad_condition": 29650216.370129876,
+ "lr": 0.00032571397633909225,
+ "time_sec": 49.64622926712036
+ },
+ {
+ "epoch": 93,
+ "train_loss": 1.6749127053833008,
+ "train_acc": 0.53202,
+ "test_loss": 8.144829412078858,
+ "test_acc": 0.0401,
+ "lyapunov": null,
+ "grad_norm": 0.6416574148081634,
+ "grad_max_sv": 0.22841569185256957,
+ "grad_min_sv": 1.2051048693673128e-08,
+ "grad_condition": 29017060.070413183,
+ "lr": 0.00031593772365766094,
+ "time_sec": 49.649181604385376
+ },
+ {
+ "epoch": 94,
+ "train_loss": 1.6659465893936156,
+ "train_acc": 0.53198,
+ "test_loss": 7.906325871276856,
+ "test_acc": 0.0523,
+ "lyapunov": null,
+ "grad_norm": 0.6442484947336338,
+ "grad_max_sv": 0.22283854335546494,
+ "grad_min_sv": 1.1940718097624981e-08,
+ "grad_condition": 23900914.940908086,
+ "lr": 0.0003062422067739483,
+ "time_sec": 49.64401292800903
+ },
+ {
+ "epoch": 95,
+ "train_loss": 1.6399671975326537,
+ "train_acc": 0.53952,
+ "test_loss": 7.157633497619629,
+ "test_acc": 0.0527,
+ "lyapunov": null,
+ "grad_norm": 0.6406645370679923,
+ "grad_max_sv": 0.22293368987739087,
+ "grad_min_sv": 1.2085724485771942e-08,
+ "grad_condition": 56163384.20133088,
+ "lr": 0.00029663167846209965,
+ "time_sec": 49.6225950717926
+ },
+ {
+ "epoch": 96,
+ "train_loss": 1.6436440280532838,
+ "train_acc": 0.5397,
+ "test_loss": 8.535991598510742,
+ "test_acc": 0.0515,
+ "lyapunov": null,
+ "grad_norm": 0.6492588500387332,
+ "grad_max_sv": 0.22496760375797747,
+ "grad_min_sv": 1.180983480297132e-08,
+ "grad_condition": 106906297.43684229,
+ "lr": 0.00028711035421746345,
+ "time_sec": 49.64288353919983
+ },
+ {
+ "epoch": 97,
+ "train_loss": 1.6246039770889282,
+ "train_acc": 0.54446,
+ "test_loss": 8.059152350616456,
+ "test_acc": 0.0505,
+ "lyapunov": null,
+ "grad_norm": 0.6473823340688163,
+ "grad_max_sv": 0.23146028257906437,
+ "grad_min_sv": 1.2134549565862019e-08,
+ "grad_condition": 35822540.74264745,
+ "lr": 0.00027768241040753615,
+ "time_sec": 49.6298463344574
+ },
+ {
+ "epoch": 98,
+ "train_loss": 1.61877662109375,
+ "train_acc": 0.54736,
+ "test_loss": 8.167729595947266,
+ "test_acc": 0.038,
+ "lyapunov": null,
+ "grad_norm": 0.6455041816035443,
+ "grad_max_sv": 0.22865931317210197,
+ "grad_min_sv": 1.1919900413936979e-08,
+ "grad_condition": 28498587.531759303,
+ "lr": 0.00026835198244006903,
+ "time_sec": 49.63332438468933
+ },
+ {
+ "epoch": 99,
+ "train_loss": 3.068192625274658,
+ "train_acc": 0.31474,
+ "test_loss": 5.048260988616943,
+ "test_acc": 0.1146,
+ "lyapunov": null,
+ "grad_norm": 0.8608040247164788,
+ "grad_max_sv": 0.3330514427274466,
+ "grad_min_sv": 1.6094786775555646e-08,
+ "grad_condition": 28526093.82209841,
+ "lr": 0.0002591231629491421,
+ "time_sec": 49.662447690963745
+ },
+ {
+ "epoch": 100,
+ "train_loss": 2.316078476104736,
+ "train_acc": 0.39026,
+ "test_loss": 5.392445658874512,
+ "test_acc": 0.0879,
+ "lyapunov": null,
+ "grad_norm": 0.658192665007455,
+ "grad_max_sv": 0.22761380225419997,
+ "grad_min_sv": 1.2582580913994557e-08,
+ "grad_condition": 55399675.47104869,
+ "lr": 0.0002499999999999997,
+ "time_sec": 49.64076352119446
+ },
+ {
+ "epoch": 101,
+ "train_loss": 2.1483063832855223,
+ "train_acc": 0.42276,
+ "test_loss": 5.986578815460205,
+ "test_acc": 0.0707,
+ "lyapunov": null,
+ "grad_norm": 0.6484922643705857,
+ "grad_max_sv": 0.22837907671928406,
+ "grad_min_sv": 1.2391293061075892e-08,
+ "grad_condition": 23094080.352399424,
+ "lr": 0.00024098649531343477,
+ "time_sec": 49.6578733921051
+ },
+ {
+ "epoch": 102,
+ "train_loss": 2.05953384185791,
+ "train_acc": 0.4427,
+ "test_loss": 6.080546961212158,
+ "test_acc": 0.0573,
+ "lyapunov": null,
+ "grad_norm": 0.6484188898656511,
+ "grad_max_sv": 0.22914629317820073,
+ "grad_min_sv": 1.2451091090104338e-08,
+ "grad_condition": 62209882.03375574,
+ "lr": 0.0002320866025105016,
+ "time_sec": 49.63767695426941
+ },
+ {
+ "epoch": 103,
+ "train_loss": 2.004299710121155,
+ "train_acc": 0.45614,
+ "test_loss": 5.895175799560547,
+ "test_acc": 0.0578,
+ "lyapunov": null,
+ "grad_norm": 0.6399422615270736,
+ "grad_max_sv": 0.23107412382960318,
+ "grad_min_sv": 1.2409910121746748e-08,
+ "grad_condition": 22284137.40025208,
+ "lr": 0.0002233042253783278,
+ "time_sec": 49.65248942375183
+ },
+ {
+ "epoch": 104,
+ "train_loss": 1.9571235482788085,
+ "train_acc": 0.46526,
+ "test_loss": 5.738465850830078,
+ "test_acc": 0.0523,
+ "lyapunov": null,
+ "grad_norm": 0.6391319009023594,
+ "grad_max_sv": 0.2172716658562422,
+ "grad_min_sv": 1.1984206682580378e-08,
+ "grad_condition": 20112915.921763636,
+ "lr": 0.000214643216157784,
+ "time_sec": 49.633373975753784
+ },
+ {
+ "epoch": 105,
+ "train_loss": 1.9224023293304444,
+ "train_acc": 0.47322,
+ "test_loss": 6.117083155059815,
+ "test_acc": 0.05,
+ "lyapunov": null,
+ "grad_norm": 0.6402482339469217,
+ "grad_max_sv": 0.21523526906967164,
+ "grad_min_sv": 1.1972073542948491e-08,
+ "grad_condition": 36228791.07592559,
+ "lr": 0.00020610737385376332,
+ "time_sec": 49.63998031616211
+ },
+ {
+ "epoch": 106,
+ "train_loss": 1.8866684201812745,
+ "train_acc": 0.4833,
+ "test_loss": 5.936769345855713,
+ "test_acc": 0.0439,
+ "lyapunov": null,
+ "grad_norm": 0.6419042012012792,
+ "grad_max_sv": 0.22602429389953613,
+ "grad_min_sv": 1.2054361504115762e-08,
+ "grad_condition": 48343281.63861313,
+ "lr": 0.00019770044256881242,
+ "time_sec": 49.65153455734253
+ },
+ {
+ "epoch": 107,
+ "train_loss": 1.8594331677246094,
+ "train_acc": 0.48626,
+ "test_loss": 6.035185343170166,
+ "test_acc": 0.046,
+ "lyapunov": null,
+ "grad_norm": 0.6436629646723144,
+ "grad_max_sv": 0.21455634236335755,
+ "grad_min_sv": 1.1783472720489074e-08,
+ "grad_condition": 38784276.09698713,
+ "lr": 0.0001894261098608447,
+ "time_sec": 49.66721272468567
+ },
+ {
+ "epoch": 108,
+ "train_loss": 1.8262966638946534,
+ "train_acc": 0.49558,
+ "test_loss": 6.42567989654541,
+ "test_acc": 0.0425,
+ "lyapunov": null,
+ "grad_norm": 0.6468304513936767,
+ "grad_max_sv": 0.22701141163706778,
+ "grad_min_sv": 1.216740327554533e-08,
+ "grad_condition": 72116525.85188936,
+ "lr": 0.000181288005125655,
+ "time_sec": 49.65104866027832
+ },
+ {
+ "epoch": 109,
+ "train_loss": 1.8205863860321045,
+ "train_acc": 0.49754,
+ "test_loss": 5.783528507995605,
+ "test_acc": 0.0367,
+ "lyapunov": null,
+ "grad_norm": 0.643976690980956,
+ "grad_max_sv": 0.21868419870734215,
+ "grad_min_sv": 1.2079363115313768e-08,
+ "grad_condition": 20195547.998739578,
+ "lr": 0.0001732896980049473,
+ "time_sec": 49.66611671447754
+ },
+ {
+ "epoch": 110,
+ "train_loss": 1.793330860900879,
+ "train_acc": 0.5022,
+ "test_loss": 6.1977317413330075,
+ "test_acc": 0.0425,
+ "lyapunov": null,
+ "grad_norm": 0.6468160086891667,
+ "grad_max_sv": 0.2236340381205082,
+ "grad_min_sv": 1.1926133475226308e-08,
+ "grad_condition": 32237535.591110267,
+ "lr": 0.00016543469682057076,
+ "time_sec": 49.63362669944763
+ },
+ {
+ "epoch": 111,
+ "train_loss": 1.7825101839828492,
+ "train_acc": 0.5064,
+ "test_loss": 6.178716979980469,
+ "test_acc": 0.0443,
+ "lyapunov": null,
+ "grad_norm": 0.6424263059147781,
+ "grad_max_sv": 0.22070568352937697,
+ "grad_min_sv": 1.1919835535972866e-08,
+ "grad_condition": 37842182.06602182,
+ "lr": 0.00015772644703565552,
+ "time_sec": 49.65402150154114
+ },
+ {
+ "epoch": 112,
+ "train_loss": 1.7541921194458008,
+ "train_acc": 0.5103,
+ "test_loss": 6.0973250106811525,
+ "test_acc": 0.0475,
+ "lyapunov": null,
+ "grad_norm": 0.6481497742539534,
+ "grad_max_sv": 0.22489695958793163,
+ "grad_min_sv": 1.2136619546854188e-08,
+ "grad_condition": 29561688.482165914,
+ "lr": 0.00015016832974331713,
+ "time_sec": 49.65926122665405
+ },
+ {
+ "epoch": 113,
+ "train_loss": 1.7488899993515015,
+ "train_acc": 0.51458,
+ "test_loss": 5.979724680328369,
+ "test_acc": 0.0424,
+ "lyapunov": null,
+ "grad_norm": 0.6406667137370472,
+ "grad_max_sv": 0.22864535339176656,
+ "grad_min_sv": 1.191089982824356e-08,
+ "grad_condition": 56508420.06490357,
+ "lr": 0.00014276366018359834,
+ "time_sec": 49.62884473800659
+ },
+ {
+ "epoch": 114,
+ "train_loss": 1.7389903827667237,
+ "train_acc": 0.51522,
+ "test_loss": 5.958202845001221,
+ "test_acc": 0.0517,
+ "lyapunov": null,
+ "grad_norm": 0.6426356824149351,
+ "grad_max_sv": 0.22491934411227704,
+ "grad_min_sv": 1.2247705622608906e-08,
+ "grad_condition": 58131203.41244085,
+ "lr": 0.00013551568628929425,
+ "time_sec": 49.62388038635254
+ },
+ {
+ "epoch": 115,
+ "train_loss": 1.7231919304656982,
+ "train_acc": 0.52138,
+ "test_loss": 6.056362869262696,
+ "test_acc": 0.0478,
+ "lyapunov": null,
+ "grad_norm": 0.6495040089755264,
+ "grad_max_sv": 0.22354965060949325,
+ "grad_min_sv": 1.2017865864966116e-08,
+ "grad_condition": 28069335.9052594,
+ "lr": 0.00012842758726130276,
+ "time_sec": 49.6635365486145
+ },
+ {
+ "epoch": 116,
+ "train_loss": 1.6999663226699828,
+ "train_acc": 0.52556,
+ "test_loss": 6.322325106811523,
+ "test_acc": 0.0459,
+ "lyapunov": null,
+ "grad_norm": 0.6439980745634726,
+ "grad_max_sv": 0.22484406568109988,
+ "grad_min_sv": 1.2245539982025377e-08,
+ "grad_condition": 27693634.55346756,
+ "lr": 0.0001215024721741218,
+ "time_sec": 49.667264223098755
+ },
+ {
+ "epoch": 117,
+ "train_loss": 1.6914007580566406,
+ "train_acc": 0.52596,
+ "test_loss": 6.2398702270507815,
+ "test_acc": 0.0358,
+ "lyapunov": null,
+ "grad_norm": 0.6406992341206976,
+ "grad_max_sv": 0.22702743746340276,
+ "grad_min_sv": 1.2027920018309323e-08,
+ "grad_condition": 25480937.943885125,
+ "lr": 0.00011474337861210538,
+ "time_sec": 49.75715970993042
+ },
+ {
+ "epoch": 118,
+ "train_loss": 1.682532057723999,
+ "train_acc": 0.5269,
+ "test_loss": 6.022721984863281,
+ "test_acc": 0.0502,
+ "lyapunov": null,
+ "grad_norm": 0.6475614121887046,
+ "grad_max_sv": 0.22498515360057353,
+ "grad_min_sv": 1.2050166899382763e-08,
+ "grad_condition": 76251711.1097268,
+ "lr": 0.00010815327133708009,
+ "time_sec": 49.63880777359009
+ },
+ {
+ "epoch": 119,
+ "train_loss": 1.6772437452697755,
+ "train_acc": 0.53014,
+ "test_loss": 5.847724533081054,
+ "test_acc": 0.0456,
+ "lyapunov": null,
+ "grad_norm": 0.645505943920055,
+ "grad_max_sv": 0.22384067326784135,
+ "grad_min_sv": 1.1783700598622104e-08,
+ "grad_condition": 22583004.98493171,
+ "lr": 0.00010173504098790182,
+ "time_sec": 49.63686180114746
+ },
+ {
+ "epoch": 120,
+ "train_loss": 1.6719491082763671,
+ "train_acc": 0.53248,
+ "test_loss": 5.856200427246094,
+ "test_acc": 0.0427,
+ "lyapunov": null,
+ "grad_norm": 0.6466969899308954,
+ "grad_max_sv": 0.2293648473918438,
+ "grad_min_sv": 1.2215246461555474e-08,
+ "grad_condition": 26750165.211627714,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 49.633697748184204
+ },
+ {
+ "epoch": 121,
+ "train_loss": 1.6578344228744506,
+ "train_acc": 0.53442,
+ "test_loss": 5.862105746459961,
+ "test_acc": 0.0534,
+ "lyapunov": null,
+ "grad_norm": 0.6460809469464214,
+ "grad_max_sv": 0.2225838266313076,
+ "grad_min_sv": 1.212055693311509e-08,
+ "grad_condition": 24676272.501794428,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 49.647422790527344
+ },
+ {
+ "epoch": 122,
+ "train_loss": 1.6389700134658813,
+ "train_acc": 0.54052,
+ "test_loss": 5.913293504333496,
+ "test_acc": 0.0439,
+ "lyapunov": null,
+ "grad_norm": 0.6468970710870378,
+ "grad_max_sv": 0.22489394322037698,
+ "grad_min_sv": 1.1876642090624667e-08,
+ "grad_condition": 27879869.134462822,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 49.6471688747406
+ },
+ {
+ "epoch": 123,
+ "train_loss": 1.6408760947418213,
+ "train_acc": 0.539,
+ "test_loss": 5.881608892822266,
+ "test_acc": 0.0455,
+ "lyapunov": null,
+ "grad_norm": 0.6409502867501498,
+ "grad_max_sv": 0.2229029569774866,
+ "grad_min_sv": 1.1994366785894606e-08,
+ "grad_condition": 23946080.329339217,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 49.645761013031006
+ },
+ {
+ "epoch": 124,
+ "train_loss": 1.6327575244140624,
+ "train_acc": 0.54088,
+ "test_loss": 6.092592315673828,
+ "test_acc": 0.0442,
+ "lyapunov": null,
+ "grad_norm": 0.6388358623443664,
+ "grad_max_sv": 0.22407596856355666,
+ "grad_min_sv": 1.1999070549661983e-08,
+ "grad_condition": 29088864.422511287,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 49.63370180130005
+ },
+ {
+ "epoch": 125,
+ "train_loss": 1.626538638381958,
+ "train_acc": 0.54214,
+ "test_loss": 6.060646697998047,
+ "test_acc": 0.0498,
+ "lyapunov": null,
+ "grad_norm": 0.649112571277706,
+ "grad_max_sv": 0.22536444179713727,
+ "grad_min_sv": 1.2212023835916908e-08,
+ "grad_condition": 35126636.74446645,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 49.61126947402954
+ },
+ {
+ "epoch": 126,
+ "train_loss": 1.6151732135009766,
+ "train_acc": 0.54378,
+ "test_loss": 6.19133405456543,
+ "test_acc": 0.0452,
+ "lyapunov": null,
+ "grad_norm": 0.645551187410472,
+ "grad_max_sv": 0.227165062725544,
+ "grad_min_sv": 1.194181808161776e-08,
+ "grad_condition": 24734104.665951073,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 49.74283456802368
+ },
+ {
+ "epoch": 127,
+ "train_loss": 1.6116835289764404,
+ "train_acc": 0.54702,
+ "test_loss": 6.264876268768311,
+ "test_acc": 0.0576,
+ "lyapunov": null,
+ "grad_norm": 0.6449882086043084,
+ "grad_max_sv": 0.2281236581504345,
+ "grad_min_sv": 1.2174795581409992e-08,
+ "grad_condition": 33327591.078247894,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 49.66547632217407
+ },
+ {
+ "epoch": 128,
+ "train_loss": 1.6025007713317871,
+ "train_acc": 0.55014,
+ "test_loss": 6.29011365814209,
+ "test_acc": 0.0469,
+ "lyapunov": null,
+ "grad_norm": 0.6498584112316286,
+ "grad_max_sv": 0.22942896112799643,
+ "grad_min_sv": 1.2217025608090431e-08,
+ "grad_condition": 181633490.37894756,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 49.644524574279785
+ },
+ {
+ "epoch": 129,
+ "train_loss": 1.6006367045974732,
+ "train_acc": 0.55154,
+ "test_loss": 5.960230406188965,
+ "test_acc": 0.0484,
+ "lyapunov": null,
+ "grad_norm": 0.6474761633146622,
+ "grad_max_sv": 0.22425766214728354,
+ "grad_min_sv": 1.2069871824227363e-08,
+ "grad_condition": 25614798.36847374,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 49.63229012489319
+ },
+ {
+ "epoch": 130,
+ "train_loss": 1.5994749016952514,
+ "train_acc": 0.54798,
+ "test_loss": 6.082809280395508,
+ "test_acc": 0.0462,
+ "lyapunov": null,
+ "grad_norm": 0.6436297587317452,
+ "grad_max_sv": 0.2260743647813797,
+ "grad_min_sv": 1.197359623186789e-08,
+ "grad_condition": 47224918.84575805,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 49.653711795806885
+ },
+ {
+ "epoch": 131,
+ "train_loss": 1.5907676587677002,
+ "train_acc": 0.55338,
+ "test_loss": 6.253540195465088,
+ "test_acc": 0.0493,
+ "lyapunov": null,
+ "grad_norm": 0.6404122118978958,
+ "grad_max_sv": 0.2243455123156309,
+ "grad_min_sv": 1.1890854798024541e-08,
+ "grad_condition": 28094398.171041556,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 49.65587568283081
+ },
+ {
+ "epoch": 132,
+ "train_loss": 1.591219468383789,
+ "train_acc": 0.55168,
+ "test_loss": 6.408939161682129,
+ "test_acc": 0.0426,
+ "lyapunov": null,
+ "grad_norm": 0.6506622903315123,
+ "grad_max_sv": 0.23343092501163482,
+ "grad_min_sv": 1.2356089287846039e-08,
+ "grad_condition": 31524710.75405284,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 49.64363932609558
+ },
+ {
+ "epoch": 133,
+ "train_loss": 1.5818653707885741,
+ "train_acc": 0.55544,
+ "test_loss": 6.288112886047363,
+ "test_acc": 0.0416,
+ "lyapunov": null,
+ "grad_norm": 0.641538436455134,
+ "grad_max_sv": 0.22353356778621675,
+ "grad_min_sv": 1.1930217144046074e-08,
+ "grad_condition": 35984070.824167676,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 49.6272132396698
+ },
+ {
+ "epoch": 134,
+ "train_loss": 1.5757408687973022,
+ "train_acc": 0.5551,
+ "test_loss": 6.169788475036621,
+ "test_acc": 0.0436,
+ "lyapunov": null,
+ "grad_norm": 0.6422263506494424,
+ "grad_max_sv": 0.22716106660664082,
+ "grad_min_sv": 1.1833126612598166e-08,
+ "grad_condition": 52859395.957509615,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 49.634817600250244
+ },
+ {
+ "epoch": 135,
+ "train_loss": 1.573296899986267,
+ "train_acc": 0.5586,
+ "test_loss": 6.409516627502441,
+ "test_acc": 0.0398,
+ "lyapunov": null,
+ "grad_norm": 0.6422323193959601,
+ "grad_max_sv": 0.21986942775547505,
+ "grad_min_sv": 1.1918038018803035e-08,
+ "grad_condition": 135103466.34543505,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 49.644601583480835
+ },
+ {
+ "epoch": 136,
+ "train_loss": 1.5735322719573974,
+ "train_acc": 0.55498,
+ "test_loss": 6.962667681884765,
+ "test_acc": 0.0438,
+ "lyapunov": null,
+ "grad_norm": 0.6425705125331251,
+ "grad_max_sv": 0.22957376427948475,
+ "grad_min_sv": 1.2022417819265719e-08,
+ "grad_condition": 84953424.74808493,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 49.65340971946716
+ },
+ {
+ "epoch": 137,
+ "train_loss": 1.5703629438018798,
+ "train_acc": 0.55592,
+ "test_loss": 6.347426979064942,
+ "test_acc": 0.0416,
+ "lyapunov": null,
+ "grad_norm": 0.6470089432203813,
+ "grad_max_sv": 0.22675703540444375,
+ "grad_min_sv": 1.1964806787001515e-08,
+ "grad_condition": 42242032.09383811,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 49.65664100646973
+ },
+ {
+ "epoch": 138,
+ "train_loss": 1.5664401405334472,
+ "train_acc": 0.55756,
+ "test_loss": 6.496471109771728,
+ "test_acc": 0.0445,
+ "lyapunov": null,
+ "grad_norm": 0.6430396727274027,
+ "grad_max_sv": 0.22493685856461526,
+ "grad_min_sv": 1.2061497275950295e-08,
+ "grad_condition": 23954534.1998593,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 49.642067432403564
+ },
+ {
+ "epoch": 139,
+ "train_loss": 1.5627032785415649,
+ "train_acc": 0.5605,
+ "test_loss": 6.283855271148681,
+ "test_acc": 0.0447,
+ "lyapunov": null,
+ "grad_norm": 0.6409841113210015,
+ "grad_max_sv": 0.2232666589319706,
+ "grad_min_sv": 1.1962911396386222e-08,
+ "grad_condition": 259592659.58503166,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 49.632962465286255
+ },
+ {
+ "epoch": 140,
+ "train_loss": 1.5663015616226197,
+ "train_acc": 0.55768,
+ "test_loss": 6.220936709594727,
+ "test_acc": 0.0479,
+ "lyapunov": null,
+ "grad_norm": 0.6429008373506699,
+ "grad_max_sv": 0.22778371684253215,
+ "grad_min_sv": 1.2041603553170077e-08,
+ "grad_condition": 67987905.64758533,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 49.615734338760376
+ },
+ {
+ "epoch": 141,
+ "train_loss": 1.5625858126068115,
+ "train_acc": 0.56096,
+ "test_loss": 6.526646176147461,
+ "test_acc": 0.0493,
+ "lyapunov": null,
+ "grad_norm": 0.6377897998533895,
+ "grad_max_sv": 0.2237264908850193,
+ "grad_min_sv": 1.2073943828072586e-08,
+ "grad_condition": 21432345.22954327,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 49.64499115943909
+ },
+ {
+ "epoch": 142,
+ "train_loss": 1.551087869529724,
+ "train_acc": 0.56178,
+ "test_loss": 6.401860023498535,
+ "test_acc": 0.0441,
+ "lyapunov": null,
+ "grad_norm": 0.6415643857015031,
+ "grad_max_sv": 0.2261370625346899,
+ "grad_min_sv": 1.2029182526809845e-08,
+ "grad_condition": 66314375.58164777,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 49.65327548980713
+ },
+ {
+ "epoch": 143,
+ "train_loss": 1.5571945658111572,
+ "train_acc": 0.55928,
+ "test_loss": 6.133491006469726,
+ "test_acc": 0.0486,
+ "lyapunov": null,
+ "grad_norm": 0.6447257277887289,
+ "grad_max_sv": 0.22846047319471835,
+ "grad_min_sv": 1.2135202965418701e-08,
+ "grad_condition": 37586048.51019514,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 49.65649223327637
+ },
+ {
+ "epoch": 144,
+ "train_loss": 1.5559558386611938,
+ "train_acc": 0.5614,
+ "test_loss": 6.064924475097656,
+ "test_acc": 0.052,
+ "lyapunov": null,
+ "grad_norm": 0.6401487690577669,
+ "grad_max_sv": 0.2242697723209858,
+ "grad_min_sv": 1.1992281666317605e-08,
+ "grad_condition": 25437338.27988875,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 49.635279178619385
+ },
+ {
+ "epoch": 145,
+ "train_loss": 1.553707954940796,
+ "train_acc": 0.56286,
+ "test_loss": 6.5988156112670895,
+ "test_acc": 0.0458,
+ "lyapunov": null,
+ "grad_norm": 0.6407793832198755,
+ "grad_max_sv": 0.23003120347857475,
+ "grad_min_sv": 1.1913595625301366e-08,
+ "grad_condition": 32004871.034651928,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 49.659799575805664
+ },
+ {
+ "epoch": 146,
+ "train_loss": 1.556730777015686,
+ "train_acc": 0.56224,
+ "test_loss": 6.555442190551758,
+ "test_acc": 0.0442,
+ "lyapunov": null,
+ "grad_norm": 0.6414928448640214,
+ "grad_max_sv": 0.22317990958690642,
+ "grad_min_sv": 1.2069366867430501e-08,
+ "grad_condition": 382827154.51718956,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 49.64200186729431
+ },
+ {
+ "epoch": 147,
+ "train_loss": 1.5659333599090577,
+ "train_acc": 0.55716,
+ "test_loss": 6.271022132873535,
+ "test_acc": 0.0492,
+ "lyapunov": null,
+ "grad_norm": 0.6449744450875666,
+ "grad_max_sv": 0.22341229021549225,
+ "grad_min_sv": 1.2069372681833279e-08,
+ "grad_condition": 29803939.928126138,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 49.677895069122314
+ },
+ {
+ "epoch": 148,
+ "train_loss": 1.55233530418396,
+ "train_acc": 0.5624,
+ "test_loss": 6.24937745513916,
+ "test_acc": 0.0474,
+ "lyapunov": null,
+ "grad_norm": 0.643448067037432,
+ "grad_max_sv": 0.22757547162473202,
+ "grad_min_sv": 1.2111119601643239e-08,
+ "grad_condition": 33967427.03926191,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 49.623542070388794
+ },
+ {
+ "epoch": 149,
+ "train_loss": 1.5480224239730835,
+ "train_acc": 0.5639,
+ "test_loss": 6.394064616394043,
+ "test_acc": 0.0438,
+ "lyapunov": null,
+ "grad_norm": 0.642149980505916,
+ "grad_max_sv": 0.21981638856232166,
+ "grad_min_sv": 1.1695069362070709e-08,
+ "grad_condition": 254731993.0398627,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 49.63520789146423
+ },
+ {
+ "epoch": 150,
+ "train_loss": 1.5609092629623413,
+ "train_acc": 0.55828,
+ "test_loss": 6.494824208068848,
+ "test_acc": 0.042,
+ "lyapunov": null,
+ "grad_norm": 0.645124236315014,
+ "grad_max_sv": 0.2247354317456484,
+ "grad_min_sv": 1.2051133440466044e-08,
+ "grad_condition": 35388252.370039664,
+ "lr": 0.0,
+ "time_sec": 49.63965940475464
+ }
+ ],
+ "16": [
+ {
+ "epoch": 1,
+ "train_loss": 5.089254416656495,
+ "train_acc": 0.01344,
+ "test_loss": 4.870831555175781,
+ "test_acc": 0.01,
+ "lyapunov": null,
+ "grad_norm": 5.582063459208639,
+ "grad_max_sv": 5.0306542873382565,
+ "grad_min_sv": 8.441757832766683e-08,
+ "grad_condition": 74707534.78681344,
+ "lr": 0.0009998903417374227,
+ "time_sec": 66.78056359291077
+ },
+ {
+ "epoch": 2,
+ "train_loss": 4.736304296569824,
+ "train_acc": 0.02172,
+ "test_loss": 4.92340059890747,
+ "test_acc": 0.01,
+ "lyapunov": null,
+ "grad_norm": 4.087296772772229,
+ "grad_max_sv": 3.672157108783722,
+ "grad_min_sv": 6.109624839933935e-08,
+ "grad_condition": 230714811.36310124,
+ "lr": 0.0009995614150494292,
+ "time_sec": 66.77934241294861
+ },
+ {
+ "epoch": 3,
+ "train_loss": 4.52685978515625,
+ "train_acc": 0.03204,
+ "test_loss": 5.045831031799317,
+ "test_acc": 0.0094,
+ "lyapunov": null,
+ "grad_norm": 3.1470044543912175,
+ "grad_max_sv": 2.6447540044784548,
+ "grad_min_sv": 4.639755384339139e-08,
+ "grad_condition": 65625701.84585605,
+ "lr": 0.0009990133642141358,
+ "time_sec": 66.76001167297363
+ },
+ {
+ "epoch": 4,
+ "train_loss": 4.371717319641113,
+ "train_acc": 0.04112,
+ "test_loss": 4.993129699707032,
+ "test_acc": 0.0115,
+ "lyapunov": null,
+ "grad_norm": 2.5123688948843395,
+ "grad_max_sv": 2.1027904629707335,
+ "grad_min_sv": 3.615837387664633e-08,
+ "grad_condition": 418817692.03399765,
+ "lr": 0.0009982464296247522,
+ "time_sec": 66.79424738883972
+ },
+ {
+ "epoch": 5,
+ "train_loss": 4.27407361251831,
+ "train_acc": 0.0488,
+ "test_loss": 5.161634465789795,
+ "test_acc": 0.0119,
+ "lyapunov": null,
+ "grad_norm": 1.9573801826064445,
+ "grad_max_sv": 1.613087645173073,
+ "grad_min_sv": 2.8529539808364034e-08,
+ "grad_condition": 62747668.20627429,
+ "lr": 0.0009972609476841367,
+ "time_sec": 66.81961727142334
+ },
+ {
+ "epoch": 6,
+ "train_loss": 4.183251854553222,
+ "train_acc": 0.05812,
+ "test_loss": 5.447854755401611,
+ "test_acc": 0.0093,
+ "lyapunov": null,
+ "grad_norm": 1.436449079599314,
+ "grad_max_sv": 1.0459295481443405,
+ "grad_min_sv": 2.0654144772258576e-08,
+ "grad_condition": 94732574.16372415,
+ "lr": 0.000996057350657239,
+ "time_sec": 66.73661756515503
+ },
+ {
+ "epoch": 7,
+ "train_loss": 4.103355536193848,
+ "train_acc": 0.06872,
+ "test_loss": 5.544150679016114,
+ "test_acc": 0.0124,
+ "lyapunov": null,
+ "grad_norm": 1.082624040556548,
+ "grad_max_sv": 0.678101472556591,
+ "grad_min_sv": 1.6660088839048904e-08,
+ "grad_condition": 49338508.46283151,
+ "lr": 0.000994636166481494,
+ "time_sec": 66.81501913070679
+ },
+ {
+ "epoch": 8,
+ "train_loss": 4.040529095458984,
+ "train_acc": 0.07876,
+ "test_loss": 5.577163777160645,
+ "test_acc": 0.0172,
+ "lyapunov": null,
+ "grad_norm": 0.963869121683512,
+ "grad_max_sv": 0.5578698106110096,
+ "grad_min_sv": 1.4817374840991882e-08,
+ "grad_condition": 46172185.25999212,
+ "lr": 0.0009929980185352525,
+ "time_sec": 66.78599071502686
+ },
+ {
+ "epoch": 9,
+ "train_loss": 3.999490645446777,
+ "train_acc": 0.0856,
+ "test_loss": 5.472281336975097,
+ "test_acc": 0.0116,
+ "lyapunov": null,
+ "grad_norm": 0.9198022107734598,
+ "grad_max_sv": 0.5003849364817142,
+ "grad_min_sv": 1.3862486752946878e-08,
+ "grad_condition": 137028895.09887612,
+ "lr": 0.0009911436253643444,
+ "time_sec": 66.77566862106323
+ },
+ {
+ "epoch": 10,
+ "train_loss": 3.9641557629394533,
+ "train_acc": 0.09124,
+ "test_loss": 5.43024553604126,
+ "test_acc": 0.0112,
+ "lyapunov": null,
+ "grad_norm": 0.8539816540258655,
+ "grad_max_sv": 0.4397390566766262,
+ "grad_min_sv": 1.3177782898221579e-08,
+ "grad_condition": 50953468.3517745,
+ "lr": 0.0009890738003669028,
+ "time_sec": 66.84108996391296
+ },
+ {
+ "epoch": 11,
+ "train_loss": 3.9142907052612306,
+ "train_acc": 0.09788,
+ "test_loss": 5.24972756652832,
+ "test_acc": 0.0174,
+ "lyapunov": null,
+ "grad_norm": 0.8303589651826888,
+ "grad_max_sv": 0.4246540553867817,
+ "grad_min_sv": 1.288730961390705e-08,
+ "grad_condition": 88294678.08247125,
+ "lr": 0.00098678945143658,
+ "time_sec": 66.87874603271484
+ },
+ {
+ "epoch": 12,
+ "train_loss": 3.881778168411255,
+ "train_acc": 0.1037,
+ "test_loss": 5.765969756317139,
+ "test_acc": 0.0186,
+ "lyapunov": null,
+ "grad_norm": 0.7855031029198277,
+ "grad_max_sv": 0.3756070680916309,
+ "grad_min_sv": 1.2611303298881715e-08,
+ "grad_condition": 36786532.210794725,
+ "lr": 0.0009842915805643154,
+ "time_sec": 66.82181406021118
+ },
+ {
+ "epoch": 13,
+ "train_loss": 3.8490214154815674,
+ "train_acc": 0.1068,
+ "test_loss": 5.832162282562256,
+ "test_acc": 0.0138,
+ "lyapunov": null,
+ "grad_norm": 0.7681061932199776,
+ "grad_max_sv": 0.3604050487279892,
+ "grad_min_sv": 1.2243067453593382e-08,
+ "grad_condition": 131143000.26933214,
+ "lr": 0.000981581283398829,
+ "time_sec": 66.72735929489136
+ },
+ {
+ "epoch": 14,
+ "train_loss": 3.828877674636841,
+ "train_acc": 0.11234,
+ "test_loss": 6.293205305480957,
+ "test_acc": 0.0134,
+ "lyapunov": null,
+ "grad_norm": 0.7460407539013362,
+ "grad_max_sv": 0.34510768875479697,
+ "grad_min_sv": 1.1813573212726692e-08,
+ "grad_condition": 49629148.15911349,
+ "lr": 0.0009786597487660333,
+ "time_sec": 66.80630326271057
+ },
+ {
+ "epoch": 15,
+ "train_loss": 3.803487832107544,
+ "train_acc": 0.1159,
+ "test_loss": 6.4087516273498535,
+ "test_acc": 0.013,
+ "lyapunov": null,
+ "grad_norm": 0.716379034773642,
+ "grad_max_sv": 0.3261814657598734,
+ "grad_min_sv": 1.1572917107960378e-08,
+ "grad_condition": 31644703.4401185,
+ "lr": 0.0009755282581475766,
+ "time_sec": 66.77157950401306
+ },
+ {
+ "epoch": 16,
+ "train_loss": 3.7804446031188963,
+ "train_acc": 0.11974,
+ "test_loss": 6.637075031280518,
+ "test_acc": 0.0121,
+ "lyapunov": null,
+ "grad_norm": 0.696010315133547,
+ "grad_max_sv": 0.3137427795678377,
+ "grad_min_sv": 1.127850834219124e-08,
+ "grad_condition": 69462833.27053933,
+ "lr": 0.0009721881851187403,
+ "time_sec": 66.79616379737854
+ },
+ {
+ "epoch": 17,
+ "train_loss": 3.752294116973877,
+ "train_acc": 0.12396,
+ "test_loss": 6.783492227935791,
+ "test_acc": 0.0146,
+ "lyapunov": null,
+ "grad_norm": 0.6728326480937213,
+ "grad_max_sv": 0.29628029987216,
+ "grad_min_sv": 1.0862121784666057e-08,
+ "grad_condition": 67951530.61721244,
+ "lr": 0.0009686409947459456,
+ "time_sec": 66.90411448478699
+ },
+ {
+ "epoch": 18,
+ "train_loss": 3.7320939672851563,
+ "train_acc": 0.12876,
+ "test_loss": 6.78950693283081,
+ "test_acc": 0.0166,
+ "lyapunov": null,
+ "grad_norm": 0.6616867936990236,
+ "grad_max_sv": 0.2953863974660635,
+ "grad_min_sv": 1.095610695379251e-08,
+ "grad_condition": 136390664.3535565,
+ "lr": 0.0009648882429441254,
+ "time_sec": 66.75479531288147
+ },
+ {
+ "epoch": 19,
+ "train_loss": 3.7112531086730955,
+ "train_acc": 0.13056,
+ "test_loss": 6.585515812683106,
+ "test_acc": 0.0163,
+ "lyapunov": null,
+ "grad_norm": 0.6494124624609345,
+ "grad_max_sv": 0.2933062981814146,
+ "grad_min_sv": 1.0763416760650734e-08,
+ "grad_condition": 31017442.193528943,
+ "lr": 0.00096093157579425,
+ "time_sec": 66.74547505378723
+ },
+ {
+ "epoch": 20,
+ "train_loss": 3.6964602882385256,
+ "train_acc": 0.13444,
+ "test_loss": 6.817514788818359,
+ "test_acc": 0.0125,
+ "lyapunov": null,
+ "grad_norm": 0.6419428954986147,
+ "grad_max_sv": 0.28524503484368324,
+ "grad_min_sv": 1.07556832606992e-08,
+ "grad_condition": 29053863.493932776,
+ "lr": 0.0009567727288213001,
+ "time_sec": 66.75940012931824
+ },
+ {
+ "epoch": 21,
+ "train_loss": 3.6749328507995607,
+ "train_acc": 0.13862,
+ "test_loss": 6.693168528747559,
+ "test_acc": 0.0132,
+ "lyapunov": null,
+ "grad_norm": 0.6273897945446711,
+ "grad_max_sv": 0.27434321865439415,
+ "grad_min_sv": 1.0629087081326371e-08,
+ "grad_condition": 34272866.07000697,
+ "lr": 0.0009524135262330095,
+ "time_sec": 66.76537322998047
+ },
+ {
+ "epoch": 22,
+ "train_loss": 3.6651853931427003,
+ "train_acc": 0.13714,
+ "test_loss": 7.5128926712036135,
+ "test_acc": 0.0145,
+ "lyapunov": null,
+ "grad_norm": 0.6127571430728127,
+ "grad_max_sv": 0.2585024815052748,
+ "grad_min_sv": 9.990007998617045e-09,
+ "grad_condition": 29464610.145040773,
+ "lr": 0.0009478558801197061,
+ "time_sec": 66.88315868377686
+ },
+ {
+ "epoch": 23,
+ "train_loss": 3.6479580931091307,
+ "train_acc": 0.14048,
+ "test_loss": 7.259157413482666,
+ "test_acc": 0.013,
+ "lyapunov": null,
+ "grad_norm": 0.6101108448302026,
+ "grad_max_sv": 0.26707915738224985,
+ "grad_min_sv": 1.0416663243084657e-08,
+ "grad_condition": 44782214.320293196,
+ "lr": 0.000943101789615607,
+ "time_sec": 66.73595952987671
+ },
+ {
+ "epoch": 24,
+ "train_loss": 3.630135404510498,
+ "train_acc": 0.14444,
+ "test_loss": 6.769294599151611,
+ "test_acc": 0.0187,
+ "lyapunov": null,
+ "grad_norm": 0.5973985296812159,
+ "grad_max_sv": 0.25335801765322685,
+ "grad_min_sv": 9.992184554080685e-09,
+ "grad_condition": 42939810.102056004,
+ "lr": 0.0009381533400219313,
+ "time_sec": 66.83198976516724
+ },
+ {
+ "epoch": 25,
+ "train_loss": 3.6139439612579345,
+ "train_acc": 0.14892,
+ "test_loss": 6.755159613037109,
+ "test_acc": 0.0168,
+ "lyapunov": null,
+ "grad_norm": 0.5830251618606708,
+ "grad_max_sv": 0.2401360861957073,
+ "grad_min_sv": 9.682792681542374e-09,
+ "grad_condition": 104126991.37138663,
+ "lr": 0.0009330127018922189,
+ "time_sec": 66.7968385219574
+ },
+ {
+ "epoch": 26,
+ "train_loss": 3.5970758290100098,
+ "train_acc": 0.14988,
+ "test_loss": 6.900474179840088,
+ "test_acc": 0.0154,
+ "lyapunov": null,
+ "grad_norm": 0.5787074408614666,
+ "grad_max_sv": 0.23566974550485612,
+ "grad_min_sv": 9.719574232958105e-09,
+ "grad_condition": 38538660.37346102,
+ "lr": 0.000927682130080253,
+ "time_sec": 66.79184246063232
+ },
+ {
+ "epoch": 27,
+ "train_loss": 3.5895483708190916,
+ "train_acc": 0.1518,
+ "test_loss": 6.669962855529785,
+ "test_acc": 0.0167,
+ "lyapunov": null,
+ "grad_norm": 0.5803094423675084,
+ "grad_max_sv": 0.2358210153877735,
+ "grad_min_sv": 9.626696496206621e-09,
+ "grad_condition": 193890246.2613204,
+ "lr": 0.0009221639627510072,
+ "time_sec": 66.7768383026123
+ },
+ {
+ "epoch": 28,
+ "train_loss": 3.5726418092346193,
+ "train_acc": 0.15258,
+ "test_loss": 7.085537405395508,
+ "test_acc": 0.0168,
+ "lyapunov": null,
+ "grad_norm": 0.570193330921248,
+ "grad_max_sv": 0.23036426715552807,
+ "grad_min_sv": 9.589828041736691e-09,
+ "grad_condition": 89352936.15952519,
+ "lr": 0.0009164606203550494,
+ "time_sec": 66.79721999168396
+ },
+ {
+ "epoch": 29,
+ "train_loss": 3.5572311797332765,
+ "train_acc": 0.15608,
+ "test_loss": 6.67531994934082,
+ "test_acc": 0.0189,
+ "lyapunov": null,
+ "grad_norm": 0.5675152442756493,
+ "grad_max_sv": 0.22562474496662616,
+ "grad_min_sv": 9.685276963766754e-09,
+ "grad_condition": 25178417.23491483,
+ "lr": 0.0009105746045668516,
+ "time_sec": 66.85751271247864
+ },
+ {
+ "epoch": 30,
+ "train_loss": 3.548038801879883,
+ "train_acc": 0.15748,
+ "test_loss": 6.45415048828125,
+ "test_acc": 0.0219,
+ "lyapunov": null,
+ "grad_norm": 0.5621117218085827,
+ "grad_max_sv": 0.222617195174098,
+ "grad_min_sv": 9.435066891660959e-09,
+ "grad_condition": 26340041.97866543,
+ "lr": 0.0009045084971874733,
+ "time_sec": 66.79050874710083
+ },
+ {
+ "epoch": 31,
+ "train_loss": 3.5402868547058106,
+ "train_acc": 0.16092,
+ "test_loss": 6.451704531860352,
+ "test_acc": 0.0227,
+ "lyapunov": null,
+ "grad_norm": 0.5521957030096883,
+ "grad_max_sv": 0.22002805732190608,
+ "grad_min_sv": 9.47574586573907e-09,
+ "grad_condition": 26149277.514949474,
+ "lr": 0.0008982649590120977,
+ "time_sec": 66.78902292251587
+ },
+ {
+ "epoch": 32,
+ "train_loss": 3.5309471380615234,
+ "train_acc": 0.16198,
+ "test_loss": 6.8702184638977055,
+ "test_acc": 0.022,
+ "lyapunov": null,
+ "grad_norm": 0.5464579230817538,
+ "grad_max_sv": 0.21435559950768948,
+ "grad_min_sv": 9.215979125329344e-09,
+ "grad_condition": 59638036.88956574,
+ "lr": 0.0008918467286629196,
+ "time_sec": 66.78767824172974
+ },
+ {
+ "epoch": 33,
+ "train_loss": 3.5130342961120604,
+ "train_acc": 0.16284,
+ "test_loss": 7.181190188598633,
+ "test_acc": 0.0173,
+ "lyapunov": null,
+ "grad_norm": 0.5437244358450883,
+ "grad_max_sv": 0.22251709625124932,
+ "grad_min_sv": 9.34404511543363e-09,
+ "grad_condition": 28699663.06993841,
+ "lr": 0.0008852566213878943,
+ "time_sec": 66.71953392028809
+ },
+ {
+ "epoch": 34,
+ "train_loss": 3.51255979675293,
+ "train_acc": 0.16636,
+ "test_loss": 7.333110241699218,
+ "test_acc": 0.0181,
+ "lyapunov": null,
+ "grad_norm": 0.5393640775064226,
+ "grad_max_sv": 0.20921555384993554,
+ "grad_min_sv": 9.167450806812916e-09,
+ "grad_condition": 25706901.28825941,
+ "lr": 0.000878497527825878,
+ "time_sec": 66.7765941619873
+ },
+ {
+ "epoch": 35,
+ "train_loss": 3.4977930699157715,
+ "train_acc": 0.16716,
+ "test_loss": 7.278058241271973,
+ "test_acc": 0.0212,
+ "lyapunov": null,
+ "grad_norm": 0.5438001473750539,
+ "grad_max_sv": 0.20897603183984756,
+ "grad_min_sv": 9.184564683795137e-09,
+ "grad_condition": 34997969.65153339,
+ "lr": 0.000871572412738697,
+ "time_sec": 66.78994917869568
+ },
+ {
+ "epoch": 36,
+ "train_loss": 3.4839546405029296,
+ "train_acc": 0.17056,
+ "test_loss": 6.461000657653808,
+ "test_acc": 0.0224,
+ "lyapunov": null,
+ "grad_norm": 0.5343462863238121,
+ "grad_max_sv": 0.20449809469282626,
+ "grad_min_sv": 9.16483587076744e-09,
+ "grad_condition": 24381579.447592642,
+ "lr": 0.0008644843137107055,
+ "time_sec": 66.78629851341248
+ },
+ {
+ "epoch": 37,
+ "train_loss": 3.473933819503784,
+ "train_acc": 0.16984,
+ "test_loss": 6.470654428100586,
+ "test_acc": 0.0179,
+ "lyapunov": null,
+ "grad_norm": 0.5324136173248342,
+ "grad_max_sv": 0.20008243359625338,
+ "grad_min_sv": 9.049705299718491e-09,
+ "grad_condition": 34636922.167240486,
+ "lr": 0.0008572363398164014,
+ "time_sec": 66.79992747306824
+ },
+ {
+ "epoch": 38,
+ "train_loss": 3.4661802910614012,
+ "train_acc": 0.17092,
+ "test_loss": 6.690065528869629,
+ "test_acc": 0.0169,
+ "lyapunov": null,
+ "grad_norm": 0.5281123151657661,
+ "grad_max_sv": 0.20084053687751294,
+ "grad_min_sv": 8.970145487507963e-09,
+ "grad_condition": 26480283.34014668,
+ "lr": 0.0008498316702566826,
+ "time_sec": 66.92348313331604
+ },
+ {
+ "epoch": 39,
+ "train_loss": 3.4540661865997313,
+ "train_acc": 0.17118,
+ "test_loss": 6.078438919830322,
+ "test_acc": 0.0211,
+ "lyapunov": null,
+ "grad_norm": 0.5227451103728683,
+ "grad_max_sv": 0.1980721667408943,
+ "grad_min_sv": 8.970438091903537e-09,
+ "grad_condition": 149441951.98208869,
+ "lr": 0.0008422735529643442,
+ "time_sec": 66.80566644668579
+ },
+ {
+ "epoch": 40,
+ "train_loss": 3.439123515701294,
+ "train_acc": 0.17768,
+ "test_loss": 6.255719974517822,
+ "test_acc": 0.0246,
+ "lyapunov": null,
+ "grad_norm": 0.5238902894663456,
+ "grad_max_sv": 0.2012732930481434,
+ "grad_min_sv": 8.989019251171015e-09,
+ "grad_condition": 26996532.399999082,
+ "lr": 0.0008345653031794289,
+ "time_sec": 66.78863906860352
+ },
+ {
+ "epoch": 41,
+ "train_loss": 3.4350976667022706,
+ "train_acc": 0.17682,
+ "test_loss": 5.942692041015625,
+ "test_acc": 0.0275,
+ "lyapunov": null,
+ "grad_norm": 0.5230791130306572,
+ "grad_max_sv": 0.19939371161162853,
+ "grad_min_sv": 9.040618726557925e-09,
+ "grad_condition": 35747119.67190552,
+ "lr": 0.0008267103019950526,
+ "time_sec": 66.78709435462952
+ },
+ {
+ "epoch": 42,
+ "train_loss": 3.4243579791259764,
+ "train_acc": 0.17844,
+ "test_loss": 6.007703511047363,
+ "test_acc": 0.0262,
+ "lyapunov": null,
+ "grad_norm": 0.517545208070228,
+ "grad_max_sv": 0.1922302544116974,
+ "grad_min_sv": 8.860449580982976e-09,
+ "grad_condition": 30602577.279376544,
+ "lr": 0.0008187119948743447,
+ "time_sec": 66.81675243377686
+ },
+ {
+ "epoch": 43,
+ "train_loss": 3.41020792137146,
+ "train_acc": 0.1805,
+ "test_loss": 6.532727696228028,
+ "test_acc": 0.0201,
+ "lyapunov": null,
+ "grad_norm": 0.5184771014750174,
+ "grad_max_sv": 0.1960398443043232,
+ "grad_min_sv": 9.042896009781032e-09,
+ "grad_condition": 109678067.45442054,
+ "lr": 0.000810573890139155,
+ "time_sec": 66.88858389854431
+ },
+ {
+ "epoch": 44,
+ "train_loss": 3.407023912811279,
+ "train_acc": 0.18096,
+ "test_loss": 6.134778085327149,
+ "test_acc": 0.0212,
+ "lyapunov": null,
+ "grad_norm": 0.5141850532973719,
+ "grad_max_sv": 0.18923728726804256,
+ "grad_min_sv": 9.02819977631475e-09,
+ "grad_condition": 100774753.52111238,
+ "lr": 0.0008022995574311873,
+ "time_sec": 66.80017518997192
+ },
+ {
+ "epoch": 45,
+ "train_loss": 3.395647827911377,
+ "train_acc": 0.1839,
+ "test_loss": 6.376823687744141,
+ "test_acc": 0.0222,
+ "lyapunov": null,
+ "grad_norm": 0.5126811791455754,
+ "grad_max_sv": 0.18771996162831783,
+ "grad_min_sv": 9.025198291837122e-09,
+ "grad_condition": 44468339.93349115,
+ "lr": 0.0007938926261462363,
+ "time_sec": 66.7608630657196
+ },
+ {
+ "epoch": 46,
+ "train_loss": 3.3928714478302,
+ "train_acc": 0.18238,
+ "test_loss": 6.053843517303466,
+ "test_acc": 0.0242,
+ "lyapunov": null,
+ "grad_norm": 0.5084041434605487,
+ "grad_max_sv": 0.1855287253856659,
+ "grad_min_sv": 8.774856632975947e-09,
+ "grad_condition": 31787391.609472472,
+ "lr": 0.0007853567838422158,
+ "time_sec": 66.74166297912598
+ },
+ {
+ "epoch": 47,
+ "train_loss": 3.379834383621216,
+ "train_acc": 0.18724,
+ "test_loss": 6.8861193962097165,
+ "test_acc": 0.0191,
+ "lyapunov": null,
+ "grad_norm": 0.5060633641106507,
+ "grad_max_sv": 0.1826419185847044,
+ "grad_min_sv": 8.790497434824073e-09,
+ "grad_condition": 34120677.482305124,
+ "lr": 0.0007766957746216719,
+ "time_sec": 66.7685010433197
+ },
+ {
+ "epoch": 48,
+ "train_loss": 3.374839401092529,
+ "train_acc": 0.1861,
+ "test_loss": 5.864614242553711,
+ "test_acc": 0.0184,
+ "lyapunov": null,
+ "grad_norm": 0.5042105096702133,
+ "grad_max_sv": 0.18606598749756814,
+ "grad_min_sv": 8.831608784565237e-09,
+ "grad_condition": 28878813.551795878,
+ "lr": 0.0007679133974894982,
+ "time_sec": 66.80099678039551
+ },
+ {
+ "epoch": 49,
+ "train_loss": 3.3662559477996825,
+ "train_acc": 0.1887,
+ "test_loss": 6.230384608459473,
+ "test_acc": 0.0213,
+ "lyapunov": null,
+ "grad_norm": 0.5036215455963197,
+ "grad_max_sv": 0.19020347222685813,
+ "grad_min_sv": 8.961205007554373e-09,
+ "grad_condition": 47201312.24723457,
+ "lr": 0.000759013504686565,
+ "time_sec": 66.75482654571533
+ },
+ {
+ "epoch": 50,
+ "train_loss": 3.360496557159424,
+ "train_acc": 0.18832,
+ "test_loss": 6.6197496559143065,
+ "test_acc": 0.0224,
+ "lyapunov": null,
+ "grad_norm": 0.5042398036515723,
+ "grad_max_sv": 0.1836124774068594,
+ "grad_min_sv": 8.934804758553572e-09,
+ "grad_condition": 69600275.62778898,
+ "lr": 0.0007499999999999998,
+ "time_sec": 66.77506113052368
+ },
+ {
+ "epoch": 51,
+ "train_loss": 3.350079543914795,
+ "train_acc": 0.1919,
+ "test_loss": 6.343868575286865,
+ "test_acc": 0.0242,
+ "lyapunov": null,
+ "grad_norm": 0.5043278001350275,
+ "grad_max_sv": 0.1825037430971861,
+ "grad_min_sv": 8.887193922446634e-09,
+ "grad_condition": 30024861.754817694,
+ "lr": 0.0007408768370508575,
+ "time_sec": 66.72825312614441
+ },
+ {
+ "epoch": 52,
+ "train_loss": 3.3426339905548095,
+ "train_acc": 0.1928,
+ "test_loss": 7.225718658447265,
+ "test_acc": 0.0199,
+ "lyapunov": null,
+ "grad_norm": 0.50252992009141,
+ "grad_max_sv": 0.17567641101777554,
+ "grad_min_sv": 8.804220427770064e-09,
+ "grad_condition": 740966766.3274126,
+ "lr": 0.0007316480175599307,
+ "time_sec": 66.72319173812866
+ },
+ {
+ "epoch": 53,
+ "train_loss": 3.3341299864959715,
+ "train_acc": 0.1933,
+ "test_loss": 6.803897232055664,
+ "test_acc": 0.0206,
+ "lyapunov": null,
+ "grad_norm": 0.5011496244728447,
+ "grad_max_sv": 0.17870272882282734,
+ "grad_min_sv": 8.831609968340536e-09,
+ "grad_condition": 22412356.279497318,
+ "lr": 0.0007223175895924635,
+ "time_sec": 66.7704975605011
+ },
+ {
+ "epoch": 54,
+ "train_loss": 3.3261182179260254,
+ "train_acc": 0.19572,
+ "test_loss": 6.764497369384766,
+ "test_acc": 0.028,
+ "lyapunov": null,
+ "grad_norm": 0.4979381618436104,
+ "grad_max_sv": 0.1770651936531067,
+ "grad_min_sv": 8.860568483093357e-09,
+ "grad_condition": 25306461.91969143,
+ "lr": 0.0007128896457825361,
+ "time_sec": 66.77421927452087
+ },
+ {
+ "epoch": 55,
+ "train_loss": 3.316899408569336,
+ "train_acc": 0.196,
+ "test_loss": 6.540015605163574,
+ "test_acc": 0.024,
+ "lyapunov": null,
+ "grad_norm": 0.4977367964912547,
+ "grad_max_sv": 0.17745399177074433,
+ "grad_min_sv": 8.913811780364434e-09,
+ "grad_condition": 22903051.94229058,
+ "lr": 0.0007033683215378998,
+ "time_sec": 66.79190754890442
+ },
+ {
+ "epoch": 56,
+ "train_loss": 3.310275382003784,
+ "train_acc": 0.19632,
+ "test_loss": 6.745750244140625,
+ "test_acc": 0.0197,
+ "lyapunov": null,
+ "grad_norm": 0.4988650354422387,
+ "grad_max_sv": 0.17153157331049443,
+ "grad_min_sv": 8.749649851869101e-09,
+ "grad_condition": 22030625.492303018,
+ "lr": 0.0006937577932260512,
+ "time_sec": 66.7638955116272
+ },
+ {
+ "epoch": 57,
+ "train_loss": 3.290559967803955,
+ "train_acc": 0.20002,
+ "test_loss": 6.366741171264648,
+ "test_acc": 0.0242,
+ "lyapunov": null,
+ "grad_norm": 0.4982910029946987,
+ "grad_max_sv": 0.17201930955052375,
+ "grad_min_sv": 8.79568313487053e-09,
+ "grad_condition": 151885613.93341595,
+ "lr": 0.0006840622763423388,
+ "time_sec": 66.78560328483582
+ },
+ {
+ "epoch": 58,
+ "train_loss": 3.2923309088134767,
+ "train_acc": 0.20166,
+ "test_loss": 6.417476829528809,
+ "test_acc": 0.0246,
+ "lyapunov": null,
+ "grad_norm": 0.49889716140548146,
+ "grad_max_sv": 0.17567893117666245,
+ "grad_min_sv": 8.913143439981397e-09,
+ "grad_condition": 24256220.95115678,
+ "lr": 0.0006742860236609073,
+ "time_sec": 66.843590259552
+ },
+ {
+ "epoch": 59,
+ "train_loss": 3.2908721295928953,
+ "train_acc": 0.19948,
+ "test_loss": 6.640488920593262,
+ "test_acc": 0.0279,
+ "lyapunov": null,
+ "grad_norm": 0.49266049285108265,
+ "grad_max_sv": 0.17507032714784146,
+ "grad_min_sv": 8.739878155916703e-09,
+ "grad_condition": 26595294.449066617,
+ "lr": 0.0006644333233692913,
+ "time_sec": 66.74992251396179
+ },
+ {
+ "epoch": 60,
+ "train_loss": 3.284796617889404,
+ "train_acc": 0.2013,
+ "test_loss": 6.291868576049804,
+ "test_acc": 0.0273,
+ "lyapunov": null,
+ "grad_norm": 0.49223922966029576,
+ "grad_max_sv": 0.17198019847273827,
+ "grad_min_sv": 8.672205609183693e-09,
+ "grad_condition": 22947196.39326378,
+ "lr": 0.0006545084971874734,
+ "time_sec": 66.7844717502594
+ },
+ {
+ "epoch": 61,
+ "train_loss": 3.2731484245300293,
+ "train_acc": 0.20498,
+ "test_loss": 6.035749476623535,
+ "test_acc": 0.0304,
+ "lyapunov": null,
+ "grad_norm": 0.49100354548098263,
+ "grad_max_sv": 0.1670747336000204,
+ "grad_min_sv": 8.751909007925774e-09,
+ "grad_condition": 38402617.820078045,
+ "lr": 0.0006445158984722354,
+ "time_sec": 66.78787755966187
+ },
+ {
+ "epoch": 62,
+ "train_loss": 3.2566023439025877,
+ "train_acc": 0.20938,
+ "test_loss": 6.511487716674805,
+ "test_acc": 0.0285,
+ "lyapunov": null,
+ "grad_norm": 0.4914300539125354,
+ "grad_max_sv": 0.16597167886793612,
+ "grad_min_sv": 8.786484798073424e-09,
+ "grad_condition": 21670471.110839043,
+ "lr": 0.0006344599103076324,
+ "time_sec": 66.70972204208374
+ },
+ {
+ "epoch": 63,
+ "train_loss": 3.2568167697143555,
+ "train_acc": 0.20498,
+ "test_loss": 6.652309313964844,
+ "test_acc": 0.0253,
+ "lyapunov": null,
+ "grad_norm": 0.4918024874902063,
+ "grad_max_sv": 0.16560027711093425,
+ "grad_min_sv": 8.785258739235635e-09,
+ "grad_condition": 71694500.46039832,
+ "lr": 0.0006243449435824269,
+ "time_sec": 66.82298398017883
+ },
+ {
+ "epoch": 64,
+ "train_loss": 3.2456203374481203,
+ "train_acc": 0.20808,
+ "test_loss": 6.344074755859375,
+ "test_acc": 0.0255,
+ "lyapunov": null,
+ "grad_norm": 0.49095369226258845,
+ "grad_max_sv": 0.1667012270539999,
+ "grad_min_sv": 8.78574491491868e-09,
+ "grad_condition": 23075446.134346228,
+ "lr": 0.0006141754350553275,
+ "time_sec": 66.78016519546509
+ },
+ {
+ "epoch": 65,
+ "train_loss": 3.236674240646362,
+ "train_acc": 0.21152,
+ "test_loss": 6.2899073806762695,
+ "test_acc": 0.0224,
+ "lyapunov": null,
+ "grad_norm": 0.4921779891011333,
+ "grad_max_sv": 0.1677238956093788,
+ "grad_min_sv": 8.828472619626382e-09,
+ "grad_condition": 22441240.736154817,
+ "lr": 0.0006039558454088793,
+ "time_sec": 66.85806608200073
+ },
+ {
+ "epoch": 66,
+ "train_loss": 3.22965085647583,
+ "train_acc": 0.2126,
+ "test_loss": 6.429703979492188,
+ "test_acc": 0.0282,
+ "lyapunov": null,
+ "grad_norm": 0.4881811720746172,
+ "grad_max_sv": 0.164219119399786,
+ "grad_min_sv": 8.673666965219873e-09,
+ "grad_condition": 21892913.98496552,
+ "lr": 0.000593690657292862,
+ "time_sec": 66.78576803207397
+ },
+ {
+ "epoch": 67,
+ "train_loss": 3.224384484176636,
+ "train_acc": 0.21134,
+ "test_loss": 6.922704602050781,
+ "test_acc": 0.0234,
+ "lyapunov": null,
+ "grad_norm": 0.48741557028554877,
+ "grad_max_sv": 0.16480680033564568,
+ "grad_min_sv": 8.729063946666394e-09,
+ "grad_condition": 23200356.121009313,
+ "lr": 0.0005833843733580507,
+ "time_sec": 66.77217102050781
+ },
+ {
+ "epoch": 68,
+ "train_loss": 3.2157058325195313,
+ "train_acc": 0.21262,
+ "test_loss": 6.7681282539367675,
+ "test_acc": 0.0231,
+ "lyapunov": null,
+ "grad_norm": 0.493681050551615,
+ "grad_max_sv": 0.16986403651535512,
+ "grad_min_sv": 8.815265072070754e-09,
+ "grad_condition": 29441294.083651233,
+ "lr": 0.0005730415142812054,
+ "time_sec": 66.77236366271973
+ },
+ {
+ "epoch": 69,
+ "train_loss": 3.210006919326782,
+ "train_acc": 0.21728,
+ "test_loss": 6.470967771148682,
+ "test_acc": 0.0254,
+ "lyapunov": null,
+ "grad_norm": 0.4878926422472019,
+ "grad_max_sv": 0.1638301569968462,
+ "grad_min_sv": 8.75584678441954e-09,
+ "grad_condition": 52016652.85495178,
+ "lr": 0.0005626666167821517,
+ "time_sec": 66.80931973457336
+ },
+ {
+ "epoch": 70,
+ "train_loss": 3.196190078125,
+ "train_acc": 0.21792,
+ "test_loss": 5.951667370605469,
+ "test_acc": 0.0242,
+ "lyapunov": null,
+ "grad_norm": 0.48950735034118803,
+ "grad_max_sv": 0.16142398156225682,
+ "grad_min_sv": 8.815271614059927e-09,
+ "grad_condition": 24483281.259911567,
+ "lr": 0.0005522642316338265,
+ "time_sec": 66.77829360961914
+ },
+ {
+ "epoch": 71,
+ "train_loss": 3.2064027897644043,
+ "train_acc": 0.21506,
+ "test_loss": 6.750360327148438,
+ "test_acc": 0.0227,
+ "lyapunov": null,
+ "grad_norm": 0.4871695073962276,
+ "grad_max_sv": 0.16285001635551452,
+ "grad_min_sv": 8.758729140578848e-09,
+ "grad_condition": 23565681.777415752,
+ "lr": 0.0005418389216661573,
+ "time_sec": 66.78215885162354
+ },
+ {
+ "epoch": 72,
+ "train_loss": 3.1924329637908935,
+ "train_acc": 0.21822,
+ "test_loss": 6.714482778167724,
+ "test_acc": 0.025,
+ "lyapunov": null,
+ "grad_norm": 0.48778155896125935,
+ "grad_max_sv": 0.1631274577230215,
+ "grad_min_sv": 8.720527765009033e-09,
+ "grad_condition": 63496326.10433636,
+ "lr": 0.0005313952597646563,
+ "time_sec": 66.8333637714386
+ },
+ {
+ "epoch": 73,
+ "train_loss": 3.188364574279785,
+ "train_acc": 0.2196,
+ "test_loss": 7.193912121582032,
+ "test_acc": 0.0213,
+ "lyapunov": null,
+ "grad_norm": 0.4880279755205525,
+ "grad_max_sv": 0.1620686575770378,
+ "grad_min_sv": 8.740592850886574e-09,
+ "grad_condition": 27935085.988161374,
+ "lr": 0.0005209378268645994,
+ "time_sec": 66.71236157417297
+ },
+ {
+ "epoch": 74,
+ "train_loss": 3.1774999662780763,
+ "train_acc": 0.22036,
+ "test_loss": 6.498540209960938,
+ "test_acc": 0.0266,
+ "lyapunov": null,
+ "grad_norm": 0.48663554748850196,
+ "grad_max_sv": 0.16149300280958415,
+ "grad_min_sv": 8.688670802628472e-09,
+ "grad_condition": 102102915.61516626,
+ "lr": 0.0005104712099416781,
+ "time_sec": 66.7784776687622
+ },
+ {
+ "epoch": 75,
+ "train_loss": 3.1686367027282714,
+ "train_acc": 0.22206,
+ "test_loss": 7.174583370971679,
+ "test_acc": 0.0209,
+ "lyapunov": null,
+ "grad_norm": 0.48682394841302745,
+ "grad_max_sv": 0.16311258710920812,
+ "grad_min_sv": 8.786071105382209e-09,
+ "grad_condition": 24724999.404770423,
+ "lr": 0.0004999999999999996,
+ "time_sec": 66.76251482963562
+ },
+ {
+ "epoch": 76,
+ "train_loss": 3.1639041161346437,
+ "train_acc": 0.225,
+ "test_loss": 7.478772677612305,
+ "test_acc": 0.0197,
+ "lyapunov": null,
+ "grad_norm": 0.49049069180345295,
+ "grad_max_sv": 0.16360066644847393,
+ "grad_min_sv": 8.74060119004927e-09,
+ "grad_condition": 24496844.849027783,
+ "lr": 0.0004895287900583212,
+ "time_sec": 66.72801065444946
+ },
+ {
+ "epoch": 77,
+ "train_loss": 3.154632388381958,
+ "train_acc": 0.22396,
+ "test_loss": 6.57794190826416,
+ "test_acc": 0.0277,
+ "lyapunov": null,
+ "grad_norm": 0.4868448729214284,
+ "grad_max_sv": 0.1649958923459053,
+ "grad_min_sv": 8.840505302809554e-09,
+ "grad_condition": 21095789.830121905,
+ "lr": 0.0004790621731353997,
+ "time_sec": 66.73516988754272
+ },
+ {
+ "epoch": 78,
+ "train_loss": 3.1528517010498045,
+ "train_acc": 0.22312,
+ "test_loss": 7.1080197311401365,
+ "test_acc": 0.0217,
+ "lyapunov": null,
+ "grad_norm": 0.4887319331046421,
+ "grad_max_sv": 0.1634005270898342,
+ "grad_min_sv": 8.874131324221323e-09,
+ "grad_condition": 20245229.779506456,
+ "lr": 0.000468604740235343,
+ "time_sec": 66.71177268028259
+ },
+ {
+ "epoch": 79,
+ "train_loss": 3.1432092308807373,
+ "train_acc": 0.229,
+ "test_loss": 7.214095246887207,
+ "test_acc": 0.0247,
+ "lyapunov": null,
+ "grad_norm": 0.48838038818221724,
+ "grad_max_sv": 0.16252909004688262,
+ "grad_min_sv": 8.819199073806239e-09,
+ "grad_condition": 26520623.470668785,
+ "lr": 0.00045816107833384175,
+ "time_sec": 66.7255470752716
+ },
+ {
+ "epoch": 80,
+ "train_loss": 3.1343304455566408,
+ "train_acc": 0.22744,
+ "test_loss": 6.940009968566894,
+ "test_acc": 0.0255,
+ "lyapunov": null,
+ "grad_norm": 0.48846815734372934,
+ "grad_max_sv": 0.1635790452361107,
+ "grad_min_sv": 8.798821884981045e-09,
+ "grad_condition": 21131375.648625843,
+ "lr": 0.0004477357683661729,
+ "time_sec": 66.72595143318176
+ },
+ {
+ "epoch": 81,
+ "train_loss": 3.1298222771453856,
+ "train_acc": 0.22642,
+ "test_loss": 7.29024638671875,
+ "test_acc": 0.0259,
+ "lyapunov": null,
+ "grad_norm": 0.49086957943567056,
+ "grad_max_sv": 0.15947132408618928,
+ "grad_min_sv": 8.788132586923236e-09,
+ "grad_condition": 28060653.55060955,
+ "lr": 0.00043733338321784746,
+ "time_sec": 66.77222657203674
+ },
+ {
+ "epoch": 82,
+ "train_loss": 3.117735626373291,
+ "train_acc": 0.23038,
+ "test_loss": 6.9144718528747555,
+ "test_acc": 0.0275,
+ "lyapunov": null,
+ "grad_norm": 0.49138593312101014,
+ "grad_max_sv": 0.159454994648695,
+ "grad_min_sv": 8.759537291390742e-09,
+ "grad_condition": 308046195.23178655,
+ "lr": 0.0004269584857187939,
+ "time_sec": 66.75987410545349
+ },
+ {
+ "epoch": 83,
+ "train_loss": 3.1175857275390624,
+ "train_acc": 0.23194,
+ "test_loss": 6.706077085876465,
+ "test_acc": 0.0275,
+ "lyapunov": null,
+ "grad_norm": 0.4924089866784705,
+ "grad_max_sv": 0.16311928667128087,
+ "grad_min_sv": 8.90124301697326e-09,
+ "grad_condition": 32153498.186816484,
+ "lr": 0.0004166156266419484,
+ "time_sec": 66.74847078323364
+ },
+ {
+ "epoch": 84,
+ "train_loss": 3.1045476649475097,
+ "train_acc": 0.23228,
+ "test_loss": 6.154573769378662,
+ "test_acc": 0.0282,
+ "lyapunov": null,
+ "grad_norm": 0.49118329484452294,
+ "grad_max_sv": 0.16205354779958725,
+ "grad_min_sv": 8.760578144861864e-09,
+ "grad_condition": 52646848.44888155,
+ "lr": 0.0004063093427071373,
+ "time_sec": 66.74011945724487
+ },
+ {
+ "epoch": 85,
+ "train_loss": 3.1078517518615723,
+ "train_acc": 0.2344,
+ "test_loss": 6.530753035736084,
+ "test_acc": 0.0282,
+ "lyapunov": null,
+ "grad_norm": 0.4904367995984335,
+ "grad_max_sv": 0.161368178576231,
+ "grad_min_sv": 8.888137861817746e-09,
+ "grad_condition": 21303276.13293609,
+ "lr": 0.0003960441545911199,
+ "time_sec": 66.72609543800354
+ },
+ {
+ "epoch": 86,
+ "train_loss": 3.0952324195861816,
+ "train_acc": 0.23368,
+ "test_loss": 6.240639804077149,
+ "test_acc": 0.0308,
+ "lyapunov": null,
+ "grad_norm": 0.49428635963779644,
+ "grad_max_sv": 0.15839767456054688,
+ "grad_min_sv": 8.964046511322766e-09,
+ "grad_condition": 28785588.134401,
+ "lr": 0.0003858245649446718,
+ "time_sec": 66.74975419044495
+ },
+ {
+ "epoch": 87,
+ "train_loss": 3.0952587001037597,
+ "train_acc": 0.23356,
+ "test_loss": 6.628809076690674,
+ "test_acc": 0.0322,
+ "lyapunov": null,
+ "grad_norm": 0.49144116518393927,
+ "grad_max_sv": 0.16221071667969228,
+ "grad_min_sv": 8.962699898917847e-09,
+ "grad_condition": 20571826.020635325,
+ "lr": 0.00037565505641757235,
+ "time_sec": 66.7199854850769
+ },
+ {
+ "epoch": 88,
+ "train_loss": 3.0922299211120605,
+ "train_acc": 0.2344,
+ "test_loss": 6.5014627777099605,
+ "test_acc": 0.0295,
+ "lyapunov": null,
+ "grad_norm": 0.49360674992051745,
+ "grad_max_sv": 0.1644837912172079,
+ "grad_min_sv": 8.975622673573769e-09,
+ "grad_condition": 28771115.174499214,
+ "lr": 0.00036554008969236695,
+ "time_sec": 66.74195861816406
+ },
+ {
+ "epoch": 89,
+ "train_loss": 3.0761431072235106,
+ "train_acc": 0.23966,
+ "test_loss": 7.287914637756348,
+ "test_acc": 0.0263,
+ "lyapunov": null,
+ "grad_norm": 0.4909525286245839,
+ "grad_max_sv": 0.16159643046557903,
+ "grad_min_sv": 8.858207814488317e-09,
+ "grad_condition": 22425426.033500116,
+ "lr": 0.0003554841015277638,
+ "time_sec": 66.68954610824585
+ },
+ {
+ "epoch": 90,
+ "train_loss": 3.0747881409454347,
+ "train_acc": 0.2377,
+ "test_loss": 7.193168222808838,
+ "test_acc": 0.0262,
+ "lyapunov": null,
+ "grad_norm": 0.4911854264861308,
+ "grad_max_sv": 0.1574687145650387,
+ "grad_min_sv": 8.917724771215912e-09,
+ "grad_condition": 118300212.93482408,
+ "lr": 0.000345491502812526,
+ "time_sec": 66.77580857276917
+ },
+ {
+ "epoch": 91,
+ "train_loss": 3.070805363311768,
+ "train_acc": 0.23994,
+ "test_loss": 6.052177616882324,
+ "test_acc": 0.0304,
+ "lyapunov": null,
+ "grad_norm": 0.49339922868661756,
+ "grad_max_sv": 0.1602653257548809,
+ "grad_min_sv": 8.95202442799392e-09,
+ "grad_condition": 44017380.37680817,
+ "lr": 0.0003355666766307081,
+ "time_sec": 66.69368362426758
+ },
+ {
+ "epoch": 92,
+ "train_loss": 3.0647792414855957,
+ "train_acc": 0.23982,
+ "test_loss": 6.179595366668702,
+ "test_acc": 0.0301,
+ "lyapunov": null,
+ "grad_norm": 0.4931917462731246,
+ "grad_max_sv": 0.1606559857726097,
+ "grad_min_sv": 9.0662935353647e-09,
+ "grad_condition": 19908430.164367903,
+ "lr": 0.00032571397633909225,
+ "time_sec": 66.70123243331909
+ },
+ {
+ "epoch": 93,
+ "train_loss": 3.0550636367034913,
+ "train_acc": 0.2422,
+ "test_loss": 6.34838355255127,
+ "test_acc": 0.0271,
+ "lyapunov": null,
+ "grad_norm": 0.49186583360988956,
+ "grad_max_sv": 0.1579043295234442,
+ "grad_min_sv": 8.987567995388801e-09,
+ "grad_condition": 22006714.29709431,
+ "lr": 0.00031593772365766094,
+ "time_sec": 66.71771335601807
+ },
+ {
+ "epoch": 94,
+ "train_loss": 3.043202466583252,
+ "train_acc": 0.24232,
+ "test_loss": 6.682511094665528,
+ "test_acc": 0.0279,
+ "lyapunov": null,
+ "grad_norm": 0.4962595942491337,
+ "grad_max_sv": 0.1622728668153286,
+ "grad_min_sv": 9.030461697867587e-09,
+ "grad_condition": 30360701.35233465,
+ "lr": 0.0003062422067739483,
+ "time_sec": 66.82941317558289
+ },
+ {
+ "epoch": 95,
+ "train_loss": 3.0412676640319822,
+ "train_acc": 0.2447,
+ "test_loss": 6.22475659866333,
+ "test_acc": 0.0318,
+ "lyapunov": null,
+ "grad_norm": 0.4915093368948821,
+ "grad_max_sv": 0.15892955474555492,
+ "grad_min_sv": 8.946618996336086e-09,
+ "grad_condition": 69026491.3661272,
+ "lr": 0.00029663167846209965,
+ "time_sec": 66.73191213607788
+ },
+ {
+ "epoch": 96,
+ "train_loss": 3.0352964888000487,
+ "train_acc": 0.2471,
+ "test_loss": 6.5577602828979495,
+ "test_acc": 0.0293,
+ "lyapunov": null,
+ "grad_norm": 0.49248702226826524,
+ "grad_max_sv": 0.1611651573330164,
+ "grad_min_sv": 8.952907482040472e-09,
+ "grad_condition": 31830348.776786767,
+ "lr": 0.00028711035421746345,
+ "time_sec": 66.75891017913818
+ },
+ {
+ "epoch": 97,
+ "train_loss": 3.029721915130615,
+ "train_acc": 0.24842,
+ "test_loss": 6.651570160675049,
+ "test_acc": 0.0289,
+ "lyapunov": null,
+ "grad_norm": 0.4943874310747337,
+ "grad_max_sv": 0.1606567233800888,
+ "grad_min_sv": 9.076670715035818e-09,
+ "grad_condition": 36874515.58106691,
+ "lr": 0.00027768241040753615,
+ "time_sec": 66.74775719642639
+ },
+ {
+ "epoch": 98,
+ "train_loss": 3.0293620677948,
+ "train_acc": 0.24548,
+ "test_loss": 6.7938948928833005,
+ "test_acc": 0.0291,
+ "lyapunov": null,
+ "grad_norm": 0.4970218817533374,
+ "grad_max_sv": 0.15979058742523194,
+ "grad_min_sv": 9.025258917993995e-09,
+ "grad_condition": 21461503.719760668,
+ "lr": 0.00026835198244006903,
+ "time_sec": 66.71226525306702
+ },
+ {
+ "epoch": 99,
+ "train_loss": 3.0232276085662844,
+ "train_acc": 0.24992,
+ "test_loss": 6.842255628967285,
+ "test_acc": 0.0287,
+ "lyapunov": null,
+ "grad_norm": 0.4964386837271484,
+ "grad_max_sv": 0.16297372654080391,
+ "grad_min_sv": 9.074463314107107e-09,
+ "grad_condition": 38263953.83433555,
+ "lr": 0.0002591231629491421,
+ "time_sec": 66.73949241638184
+ },
+ {
+ "epoch": 100,
+ "train_loss": 3.0220013402557373,
+ "train_acc": 0.24942,
+ "test_loss": 7.044534214782715,
+ "test_acc": 0.0264,
+ "lyapunov": null,
+ "grad_norm": 0.4963097153496672,
+ "grad_max_sv": 0.1608368031680584,
+ "grad_min_sv": 8.999894975450506e-09,
+ "grad_condition": 41372527.951466024,
+ "lr": 0.0002499999999999997,
+ "time_sec": 66.77927494049072
+ },
+ {
+ "epoch": 101,
+ "train_loss": 3.0203451880645753,
+ "train_acc": 0.2487,
+ "test_loss": 6.837228249359131,
+ "test_acc": 0.0287,
+ "lyapunov": null,
+ "grad_norm": 0.49771273059241083,
+ "grad_max_sv": 0.16355772241950034,
+ "grad_min_sv": 9.09030489493201e-09,
+ "grad_condition": 21122520.470805176,
+ "lr": 0.00024098649531343477,
+ "time_sec": 66.73630166053772
+ },
+ {
+ "epoch": 102,
+ "train_loss": 3.0023662061309815,
+ "train_acc": 0.2517,
+ "test_loss": 7.122745419311523,
+ "test_acc": 0.0275,
+ "lyapunov": null,
+ "grad_norm": 0.4990559135673985,
+ "grad_max_sv": 0.16072520166635512,
+ "grad_min_sv": 9.129048311740107e-09,
+ "grad_condition": 20645009.356589716,
+ "lr": 0.0002320866025105016,
+ "time_sec": 66.75698280334473
+ },
+ {
+ "epoch": 103,
+ "train_loss": 2.998011736526489,
+ "train_acc": 0.25374,
+ "test_loss": 7.035623414611816,
+ "test_acc": 0.0277,
+ "lyapunov": null,
+ "grad_norm": 0.49574085619625,
+ "grad_max_sv": 0.15668718423694372,
+ "grad_min_sv": 9.148743505132951e-09,
+ "grad_condition": 33626359.10658366,
+ "lr": 0.0002233042253783278,
+ "time_sec": 66.75562310218811
+ },
+ {
+ "epoch": 104,
+ "train_loss": 2.997530387496948,
+ "train_acc": 0.25132,
+ "test_loss": 6.999302207946777,
+ "test_acc": 0.0292,
+ "lyapunov": null,
+ "grad_norm": 0.5002716771455139,
+ "grad_max_sv": 0.16238998733460902,
+ "grad_min_sv": 9.078950441443468e-09,
+ "grad_condition": 20349177.478017032,
+ "lr": 0.000214643216157784,
+ "time_sec": 66.79467344284058
+ },
+ {
+ "epoch": 105,
+ "train_loss": 2.9906964135742187,
+ "train_acc": 0.25506,
+ "test_loss": 7.1786759597778325,
+ "test_acc": 0.0273,
+ "lyapunov": null,
+ "grad_norm": 0.4946350333441307,
+ "grad_max_sv": 0.1600412342697382,
+ "grad_min_sv": 9.088851333008408e-09,
+ "grad_condition": 57224884.57519225,
+ "lr": 0.00020610737385376332,
+ "time_sec": 66.74862432479858
+ },
+ {
+ "epoch": 106,
+ "train_loss": 2.984202498321533,
+ "train_acc": 0.25656,
+ "test_loss": 7.172381106567383,
+ "test_acc": 0.0269,
+ "lyapunov": null,
+ "grad_norm": 0.4982362018645274,
+ "grad_max_sv": 0.1571014266461134,
+ "grad_min_sv": 9.054493026183775e-09,
+ "grad_condition": 22960817.2493112,
+ "lr": 0.00019770044256881242,
+ "time_sec": 66.77469301223755
+ },
+ {
+ "epoch": 107,
+ "train_loss": 2.975272487335205,
+ "train_acc": 0.25552,
+ "test_loss": 7.0334813690185545,
+ "test_acc": 0.0316,
+ "lyapunov": null,
+ "grad_norm": 0.49588396234922755,
+ "grad_max_sv": 0.16075790040194987,
+ "grad_min_sv": 9.117187717289087e-09,
+ "grad_condition": 22400105.746660806,
+ "lr": 0.0001894261098608447,
+ "time_sec": 66.76792025566101
+ },
+ {
+ "epoch": 108,
+ "train_loss": 2.9756462240600587,
+ "train_acc": 0.25536,
+ "test_loss": 7.59121438293457,
+ "test_acc": 0.0288,
+ "lyapunov": null,
+ "grad_norm": 0.4971626921836716,
+ "grad_max_sv": 0.15787492766976358,
+ "grad_min_sv": 9.170698456424448e-09,
+ "grad_condition": 2842260093.4746685,
+ "lr": 0.000181288005125655,
+ "time_sec": 66.72157907485962
+ },
+ {
+ "epoch": 109,
+ "train_loss": 2.9735143406677245,
+ "train_acc": 0.25872,
+ "test_loss": 6.839995979309082,
+ "test_acc": 0.0305,
+ "lyapunov": null,
+ "grad_norm": 0.49760629850795685,
+ "grad_max_sv": 0.16163251921534538,
+ "grad_min_sv": 9.179918801505149e-09,
+ "grad_condition": 26931510.48697853,
+ "lr": 0.0001732896980049473,
+ "time_sec": 66.76784825325012
+ },
+ {
+ "epoch": 110,
+ "train_loss": 2.971026375198364,
+ "train_acc": 0.25932,
+ "test_loss": 6.99457964477539,
+ "test_acc": 0.0301,
+ "lyapunov": null,
+ "grad_norm": 0.4972222462184193,
+ "grad_max_sv": 0.1576628390699625,
+ "grad_min_sv": 9.118256634466082e-09,
+ "grad_condition": 25805428.695002638,
+ "lr": 0.00016543469682057076,
+ "time_sec": 66.7546181678772
+ },
+ {
+ "epoch": 111,
+ "train_loss": 2.961785153198242,
+ "train_acc": 0.25938,
+ "test_loss": 7.5968095703125,
+ "test_acc": 0.0278,
+ "lyapunov": null,
+ "grad_norm": 0.499682712724269,
+ "grad_max_sv": 0.16410896554589272,
+ "grad_min_sv": 9.131004422013866e-09,
+ "grad_condition": 21672900.170981936,
+ "lr": 0.00015772644703565552,
+ "time_sec": 66.74458265304565
+ },
+ {
+ "epoch": 112,
+ "train_loss": 2.9625577368927,
+ "train_acc": 0.25878,
+ "test_loss": 7.764190951538086,
+ "test_acc": 0.026,
+ "lyapunov": null,
+ "grad_norm": 0.498213643225678,
+ "grad_max_sv": 0.15600935891270637,
+ "grad_min_sv": 9.151295493614598e-09,
+ "grad_condition": 20410187.211308915,
+ "lr": 0.00015016832974331713,
+ "time_sec": 66.75516033172607
+ },
+ {
+ "epoch": 113,
+ "train_loss": 2.95476414642334,
+ "train_acc": 0.25912,
+ "test_loss": 7.14678690032959,
+ "test_acc": 0.0306,
+ "lyapunov": null,
+ "grad_norm": 0.4989192084378189,
+ "grad_max_sv": 0.16326018050312996,
+ "grad_min_sv": 9.208972755539447e-09,
+ "grad_condition": 51946084.62151481,
+ "lr": 0.00014276366018359834,
+ "time_sec": 66.8117504119873
+ },
+ {
+ "epoch": 114,
+ "train_loss": 2.959580585861206,
+ "train_acc": 0.26152,
+ "test_loss": 7.228822399902343,
+ "test_acc": 0.0306,
+ "lyapunov": null,
+ "grad_norm": 0.4993052937105196,
+ "grad_max_sv": 0.1597112886607647,
+ "grad_min_sv": 9.184225070735242e-09,
+ "grad_condition": 24287456.61544974,
+ "lr": 0.00013551568628929425,
+ "time_sec": 66.71526288986206
+ },
+ {
+ "epoch": 115,
+ "train_loss": 2.951429924316406,
+ "train_acc": 0.2597,
+ "test_loss": 6.857805014038086,
+ "test_acc": 0.0311,
+ "lyapunov": null,
+ "grad_norm": 0.5001172379881009,
+ "grad_max_sv": 0.16317447423934936,
+ "grad_min_sv": 9.167603101656319e-09,
+ "grad_condition": 19878785.72490542,
+ "lr": 0.00012842758726130276,
+ "time_sec": 66.7846131324768
+ },
+ {
+ "epoch": 116,
+ "train_loss": 2.9463225456237794,
+ "train_acc": 0.26044,
+ "test_loss": 7.2446568466186525,
+ "test_acc": 0.0281,
+ "lyapunov": null,
+ "grad_norm": 0.4998364506796334,
+ "grad_max_sv": 0.16249994188547134,
+ "grad_min_sv": 9.130782213651045e-09,
+ "grad_condition": 19998723.305069156,
+ "lr": 0.0001215024721741218,
+ "time_sec": 66.7700080871582
+ },
+ {
+ "epoch": 117,
+ "train_loss": 2.937184557876587,
+ "train_acc": 0.26268,
+ "test_loss": 7.438090939331055,
+ "test_acc": 0.0265,
+ "lyapunov": null,
+ "grad_norm": 0.5024891978806302,
+ "grad_max_sv": 0.16552512347698212,
+ "grad_min_sv": 9.170617681214522e-09,
+ "grad_condition": 40015057.54321941,
+ "lr": 0.00011474337861210538,
+ "time_sec": 66.80615854263306
+ },
+ {
+ "epoch": 118,
+ "train_loss": 2.942110910797119,
+ "train_acc": 0.2621,
+ "test_loss": 7.324624530029297,
+ "test_acc": 0.0273,
+ "lyapunov": null,
+ "grad_norm": 0.5000364684279365,
+ "grad_max_sv": 0.16344034522771836,
+ "grad_min_sv": 9.328158331878279e-09,
+ "grad_condition": 21122225.248831175,
+ "lr": 0.00010815327133708009,
+ "time_sec": 66.78372955322266
+ },
+ {
+ "epoch": 119,
+ "train_loss": 2.93369575592041,
+ "train_acc": 0.26596,
+ "test_loss": 8.056785229492187,
+ "test_acc": 0.0234,
+ "lyapunov": null,
+ "grad_norm": 0.5006441450285836,
+ "grad_max_sv": 0.1595278237015009,
+ "grad_min_sv": 9.219788181871746e-09,
+ "grad_condition": 69721984.41132018,
+ "lr": 0.00010173504098790182,
+ "time_sec": 66.76624512672424
+ },
+ {
+ "epoch": 120,
+ "train_loss": 2.932797766189575,
+ "train_acc": 0.26344,
+ "test_loss": 7.282906192016601,
+ "test_acc": 0.0275,
+ "lyapunov": null,
+ "grad_norm": 0.5037900163559795,
+ "grad_max_sv": 0.16313258111476897,
+ "grad_min_sv": 9.198472578075822e-09,
+ "grad_condition": 21164339.052237906,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 66.71441149711609
+ },
+ {
+ "epoch": 121,
+ "train_loss": 2.9284527645874023,
+ "train_acc": 0.26852,
+ "test_loss": 7.262115740966797,
+ "test_acc": 0.0293,
+ "lyapunov": null,
+ "grad_norm": 0.5036251360683918,
+ "grad_max_sv": 0.1591605730354786,
+ "grad_min_sv": 9.272000557614124e-09,
+ "grad_condition": 40898149.281216756,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 66.74046039581299
+ },
+ {
+ "epoch": 122,
+ "train_loss": 2.936891605682373,
+ "train_acc": 0.2668,
+ "test_loss": 7.490768426513672,
+ "test_acc": 0.0269,
+ "lyapunov": null,
+ "grad_norm": 0.5021434540478252,
+ "grad_max_sv": 0.16143947280943394,
+ "grad_min_sv": 9.394398098327983e-09,
+ "grad_condition": 19799976.943244066,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 66.81744265556335
+ },
+ {
+ "epoch": 123,
+ "train_loss": 2.9236154601287843,
+ "train_acc": 0.26716,
+ "test_loss": 7.120488947296143,
+ "test_acc": 0.0285,
+ "lyapunov": null,
+ "grad_norm": 0.5028382354847799,
+ "grad_max_sv": 0.15968299470841885,
+ "grad_min_sv": 9.204075489266384e-09,
+ "grad_condition": 47939633.576168984,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 66.76852679252625
+ },
+ {
+ "epoch": 124,
+ "train_loss": 2.92061264755249,
+ "train_acc": 0.2666,
+ "test_loss": 7.461192834472656,
+ "test_acc": 0.0278,
+ "lyapunov": null,
+ "grad_norm": 0.5005688158224261,
+ "grad_max_sv": 0.1629866801202297,
+ "grad_min_sv": 9.212228484906105e-09,
+ "grad_condition": 33814966.96761195,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 66.7814073562622
+ },
+ {
+ "epoch": 125,
+ "train_loss": 2.9229219720458985,
+ "train_acc": 0.26648,
+ "test_loss": 7.498983331298828,
+ "test_acc": 0.0285,
+ "lyapunov": null,
+ "grad_norm": 0.5030160580327866,
+ "grad_max_sv": 0.16155149266123772,
+ "grad_min_sv": 9.212426940741203e-09,
+ "grad_condition": 19527956.667884845,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 66.79239439964294
+ },
+ {
+ "epoch": 126,
+ "train_loss": 2.9202857413482666,
+ "train_acc": 0.26618,
+ "test_loss": 7.286036429595947,
+ "test_acc": 0.0279,
+ "lyapunov": null,
+ "grad_norm": 0.5046458563501821,
+ "grad_max_sv": 0.16270169503986837,
+ "grad_min_sv": 9.235521156170102e-09,
+ "grad_condition": 21514883.897712767,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 66.79009366035461
+ },
+ {
+ "epoch": 127,
+ "train_loss": 2.9112009690093994,
+ "train_acc": 0.27148,
+ "test_loss": 6.8060284591674804,
+ "test_acc": 0.0299,
+ "lyapunov": null,
+ "grad_norm": 0.5048043752309758,
+ "grad_max_sv": 0.1627126146107912,
+ "grad_min_sv": 9.337147274801615e-09,
+ "grad_condition": 20067936.42847693,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 66.7122654914856
+ },
+ {
+ "epoch": 128,
+ "train_loss": 2.915534998703003,
+ "train_acc": 0.26936,
+ "test_loss": 7.528692306518555,
+ "test_acc": 0.027,
+ "lyapunov": null,
+ "grad_norm": 0.505141680481134,
+ "grad_max_sv": 0.15927630066871643,
+ "grad_min_sv": 9.138972020816815e-09,
+ "grad_condition": 283653990.6139595,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 66.76755571365356
+ },
+ {
+ "epoch": 129,
+ "train_loss": 2.911044763031006,
+ "train_acc": 0.26856,
+ "test_loss": 7.442652993774414,
+ "test_acc": 0.0313,
+ "lyapunov": null,
+ "grad_norm": 0.5029480129383956,
+ "grad_max_sv": 0.16405761763453483,
+ "grad_min_sv": 9.220356501568604e-09,
+ "grad_condition": 46047919.55891801,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 66.69603776931763
+ },
+ {
+ "epoch": 130,
+ "train_loss": 2.907666951751709,
+ "train_acc": 0.26828,
+ "test_loss": 7.026823535919189,
+ "test_acc": 0.0288,
+ "lyapunov": null,
+ "grad_norm": 0.5025376312973467,
+ "grad_max_sv": 0.15946717746555805,
+ "grad_min_sv": 9.221378457352492e-09,
+ "grad_condition": 33199750.366487652,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 66.69535183906555
+ },
+ {
+ "epoch": 131,
+ "train_loss": 2.902869781417847,
+ "train_acc": 0.26958,
+ "test_loss": 7.536094513702393,
+ "test_acc": 0.0292,
+ "lyapunov": null,
+ "grad_norm": 0.5050312390729839,
+ "grad_max_sv": 0.16128032505512238,
+ "grad_min_sv": 9.28452798905008e-09,
+ "grad_condition": 135705763.13078815,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 66.77000784873962
+ },
+ {
+ "epoch": 132,
+ "train_loss": 2.9037561528778078,
+ "train_acc": 0.27136,
+ "test_loss": 7.281431489562988,
+ "test_acc": 0.0271,
+ "lyapunov": null,
+ "grad_norm": 0.5052870516198174,
+ "grad_max_sv": 0.1615588180720806,
+ "grad_min_sv": 9.289024057758388e-09,
+ "grad_condition": 128507811.16031823,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 66.75163435935974
+ },
+ {
+ "epoch": 133,
+ "train_loss": 2.8991165522766114,
+ "train_acc": 0.27156,
+ "test_loss": 7.282987453460693,
+ "test_acc": 0.0274,
+ "lyapunov": null,
+ "grad_norm": 0.5034061589294716,
+ "grad_max_sv": 0.1581054452806711,
+ "grad_min_sv": 9.274782794554958e-09,
+ "grad_condition": 19574470.928057812,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 66.75138425827026
+ },
+ {
+ "epoch": 134,
+ "train_loss": 2.9077910748291016,
+ "train_acc": 0.2711,
+ "test_loss": 7.448024377441406,
+ "test_acc": 0.0294,
+ "lyapunov": null,
+ "grad_norm": 0.5046423793403062,
+ "grad_max_sv": 0.1635249551385641,
+ "grad_min_sv": 9.433638015199363e-09,
+ "grad_condition": 28668380.335333012,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 66.7329490184784
+ },
+ {
+ "epoch": 135,
+ "train_loss": 2.896955527267456,
+ "train_acc": 0.27268,
+ "test_loss": 7.478409793090821,
+ "test_acc": 0.028,
+ "lyapunov": null,
+ "grad_norm": 0.5037173672388571,
+ "grad_max_sv": 0.1622908242046833,
+ "grad_min_sv": 9.298784615918709e-09,
+ "grad_condition": 61773843.27193861,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 66.7459568977356
+ },
+ {
+ "epoch": 136,
+ "train_loss": 2.8964898432922364,
+ "train_acc": 0.27182,
+ "test_loss": 7.354159661865235,
+ "test_acc": 0.028,
+ "lyapunov": null,
+ "grad_norm": 0.5028619652958791,
+ "grad_max_sv": 0.1600797414779663,
+ "grad_min_sv": 9.074624002236575e-09,
+ "grad_condition": 22249764.299153708,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 66.75164866447449
+ },
+ {
+ "epoch": 137,
+ "train_loss": 2.895348368530273,
+ "train_acc": 0.27172,
+ "test_loss": 7.632054917144775,
+ "test_acc": 0.0281,
+ "lyapunov": null,
+ "grad_norm": 0.5031853951467254,
+ "grad_max_sv": 0.16463851928710938,
+ "grad_min_sv": 9.441171729823727e-09,
+ "grad_condition": 30855600.541313868,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 66.75186562538147
+ },
+ {
+ "epoch": 138,
+ "train_loss": 2.900583278427124,
+ "train_acc": 0.2717,
+ "test_loss": 7.199238876342774,
+ "test_acc": 0.0295,
+ "lyapunov": null,
+ "grad_norm": 0.5034869997386973,
+ "grad_max_sv": 0.16063327342271805,
+ "grad_min_sv": 9.296063535613186e-09,
+ "grad_condition": 25145907.489137426,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 66.75230479240417
+ },
+ {
+ "epoch": 139,
+ "train_loss": 2.8933637355804445,
+ "train_acc": 0.27194,
+ "test_loss": 7.248442086029053,
+ "test_acc": 0.03,
+ "lyapunov": null,
+ "grad_norm": 0.504304603082473,
+ "grad_max_sv": 0.162884946167469,
+ "grad_min_sv": 9.367608214128075e-09,
+ "grad_condition": 19993036.722377926,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 66.7671320438385
+ },
+ {
+ "epoch": 140,
+ "train_loss": 2.894832459564209,
+ "train_acc": 0.27222,
+ "test_loss": 7.71000400390625,
+ "test_acc": 0.0294,
+ "lyapunov": null,
+ "grad_norm": 0.5047832470696201,
+ "grad_max_sv": 0.16155096814036368,
+ "grad_min_sv": 9.160464450874706e-09,
+ "grad_condition": 20567241.25641649,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 66.73179697990417
+ },
+ {
+ "epoch": 141,
+ "train_loss": 2.897352989578247,
+ "train_acc": 0.27064,
+ "test_loss": 7.4464299194335934,
+ "test_acc": 0.0313,
+ "lyapunov": null,
+ "grad_norm": 0.5061737427703262,
+ "grad_max_sv": 0.16413113810122013,
+ "grad_min_sv": 9.289870605763695e-09,
+ "grad_condition": 51343563.84333199,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 66.75452041625977
+ },
+ {
+ "epoch": 142,
+ "train_loss": 2.8876253887939454,
+ "train_acc": 0.2751,
+ "test_loss": 7.67550869064331,
+ "test_acc": 0.0285,
+ "lyapunov": null,
+ "grad_norm": 0.50486204633145,
+ "grad_max_sv": 0.16515321880578995,
+ "grad_min_sv": 9.218709545733006e-09,
+ "grad_condition": 25662988.761511788,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 66.76586389541626
+ },
+ {
+ "epoch": 143,
+ "train_loss": 2.8951072731781005,
+ "train_acc": 0.2711,
+ "test_loss": 7.276433151245117,
+ "test_acc": 0.0265,
+ "lyapunov": null,
+ "grad_norm": 0.5066003424324655,
+ "grad_max_sv": 0.16512982696294784,
+ "grad_min_sv": 9.368238332307932e-09,
+ "grad_condition": 20872282.150921334,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 66.77883982658386
+ },
+ {
+ "epoch": 144,
+ "train_loss": 2.896107662887573,
+ "train_acc": 0.27174,
+ "test_loss": 7.442941972351075,
+ "test_acc": 0.0282,
+ "lyapunov": null,
+ "grad_norm": 0.5058752626030726,
+ "grad_max_sv": 0.1646978858858347,
+ "grad_min_sv": 9.187450514258621e-09,
+ "grad_condition": 21323054.46289139,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 66.74654960632324
+ },
+ {
+ "epoch": 145,
+ "train_loss": 2.8981069023132324,
+ "train_acc": 0.27052,
+ "test_loss": 7.511137809753418,
+ "test_acc": 0.0286,
+ "lyapunov": null,
+ "grad_norm": 0.5043941197302124,
+ "grad_max_sv": 0.16361674722284078,
+ "grad_min_sv": 9.248454605793876e-09,
+ "grad_condition": 124843071.51810357,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 66.71942782402039
+ },
+ {
+ "epoch": 146,
+ "train_loss": 2.897443035583496,
+ "train_acc": 0.27094,
+ "test_loss": 7.219273558044433,
+ "test_acc": 0.0301,
+ "lyapunov": null,
+ "grad_norm": 0.5044889597609223,
+ "grad_max_sv": 0.1617003157734871,
+ "grad_min_sv": 9.33726697904813e-09,
+ "grad_condition": 20578970.810026187,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 66.74967193603516
+ },
+ {
+ "epoch": 147,
+ "train_loss": 2.8972148944854736,
+ "train_acc": 0.27036,
+ "test_loss": 7.628332612609864,
+ "test_acc": 0.0279,
+ "lyapunov": null,
+ "grad_norm": 0.5052009377242357,
+ "grad_max_sv": 0.15890285596251488,
+ "grad_min_sv": 9.382556353555727e-09,
+ "grad_condition": 91821063.92388035,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 66.73621463775635
+ },
+ {
+ "epoch": 148,
+ "train_loss": 2.8898702787017823,
+ "train_acc": 0.27194,
+ "test_loss": 7.505082284545899,
+ "test_acc": 0.0258,
+ "lyapunov": null,
+ "grad_norm": 0.5047197831030149,
+ "grad_max_sv": 0.16516413502395152,
+ "grad_min_sv": 9.324620061507139e-09,
+ "grad_condition": 43789169.5949554,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 66.76141929626465
+ },
+ {
+ "epoch": 149,
+ "train_loss": 2.9011361352539065,
+ "train_acc": 0.26824,
+ "test_loss": 7.6542517242431645,
+ "test_acc": 0.0271,
+ "lyapunov": null,
+ "grad_norm": 0.5054339021083573,
+ "grad_max_sv": 0.16298294067382812,
+ "grad_min_sv": 9.178197371562114e-09,
+ "grad_condition": 21653740.393576562,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 66.75421690940857
+ },
+ {
+ "epoch": 150,
+ "train_loss": 2.9011223357391356,
+ "train_acc": 0.27114,
+ "test_loss": 7.460437265014648,
+ "test_acc": 0.029,
+ "lyapunov": null,
+ "grad_norm": 0.5059469716903541,
+ "grad_max_sv": 0.16557817347347736,
+ "grad_min_sv": 9.153120701372967e-09,
+ "grad_condition": 361494763.7112081,
+ "lr": 0.0,
+ "time_sec": 66.78962397575378
+ }
+ ]
+ },
+ "lyapunov": {
+ "4": [
+ {
+ "epoch": 1,
+ "train_loss": 4.580237577819824,
+ "train_acc": 0.07172,
+ "test_loss": 4.204835011291504,
+ "test_acc": 0.0865,
+ "lyapunov": 2.1020694111314273,
+ "grad_norm": 5.891421444416132,
+ "grad_max_sv": 4.6086235523223875,
+ "grad_min_sv": 1.0778671248878879e-07,
+ "grad_condition": 54871165.85509853,
+ "lr": 0.0009998903417374227,
+ "time_sec": 41.860575914382935
+ },
+ {
+ "epoch": 2,
+ "train_loss": 4.172055626296997,
+ "train_acc": 0.0921,
+ "test_loss": 4.402019414520264,
+ "test_acc": 0.0558,
+ "lyapunov": 1.6787975471647805,
+ "grad_norm": 3.9258769364442525,
+ "grad_max_sv": 2.9158192813396453,
+ "grad_min_sv": 7.291154454081017e-08,
+ "grad_condition": 84308361.49485277,
+ "lr": 0.0009995614150494292,
+ "time_sec": 41.754839181900024
+ },
+ {
+ "epoch": 3,
+ "train_loss": 4.050799645080566,
+ "train_acc": 0.10584,
+ "test_loss": 5.545398815917968,
+ "test_acc": 0.041,
+ "lyapunov": 1.5661922080437545,
+ "grad_norm": 3.128537052862856,
+ "grad_max_sv": 2.1766103327274324,
+ "grad_min_sv": 5.8618463349979774e-08,
+ "grad_condition": 41372858.502355784,
+ "lr": 0.0009990133642141358,
+ "time_sec": 41.694422006607056
+ },
+ {
+ "epoch": 4,
+ "train_loss": 3.9627039431762694,
+ "train_acc": 0.11682,
+ "test_loss": 6.328290705871582,
+ "test_acc": 0.0228,
+ "lyapunov": 1.5445425864070883,
+ "grad_norm": 2.5082278391489035,
+ "grad_max_sv": 1.6217471033334732,
+ "grad_min_sv": 4.5938650922172644e-08,
+ "grad_condition": 63153156.340209946,
+ "lr": 0.0009982464296247522,
+ "time_sec": 41.7418487071991
+ },
+ {
+ "epoch": 5,
+ "train_loss": 3.9077672985839844,
+ "train_acc": 0.1305,
+ "test_loss": 6.821084007263184,
+ "test_acc": 0.0156,
+ "lyapunov": 1.530182860086641,
+ "grad_norm": 2.041783975921356,
+ "grad_max_sv": 1.2541583150625228,
+ "grad_min_sv": 3.773506419557649e-08,
+ "grad_condition": 36438804.96965951,
+ "lr": 0.0009972609476841367,
+ "time_sec": 41.74874401092529
+ },
+ {
+ "epoch": 6,
+ "train_loss": 3.978193638305664,
+ "train_acc": 0.1273,
+ "test_loss": 10.715914828491211,
+ "test_acc": 0.015,
+ "lyapunov": 1.5294916736500344,
+ "grad_norm": 1.884529182522603,
+ "grad_max_sv": 1.174074074625969,
+ "grad_min_sv": 3.492432684992774e-08,
+ "grad_condition": 56687028.60603394,
+ "lr": 0.000996057350657239,
+ "time_sec": 41.79358172416687
+ },
+ {
+ "epoch": 7,
+ "train_loss": 4.028493068466187,
+ "train_acc": 0.12364,
+ "test_loss": 8.849580982971192,
+ "test_acc": 0.0108,
+ "lyapunov": 1.5220741317095354,
+ "grad_norm": 1.6311583818363289,
+ "grad_max_sv": 0.9764176219701767,
+ "grad_min_sv": 2.9745892293764343e-08,
+ "grad_condition": 38380014.867613696,
+ "lr": 0.000994636166481494,
+ "time_sec": 41.74577260017395
+ },
+ {
+ "epoch": 8,
+ "train_loss": 4.104167304382324,
+ "train_acc": 0.11452,
+ "test_loss": 9.404642602539063,
+ "test_acc": 0.0179,
+ "lyapunov": 1.5335235891439725,
+ "grad_norm": 1.4435862607793115,
+ "grad_max_sv": 0.8796723946928978,
+ "grad_min_sv": 2.6115679115784607e-08,
+ "grad_condition": 100856221.49209695,
+ "lr": 0.0009929980185352525,
+ "time_sec": 41.813751220703125
+ },
+ {
+ "epoch": 9,
+ "train_loss": 4.36510063079834,
+ "train_acc": 0.08636,
+ "test_loss": 7.074767668151855,
+ "test_acc": 0.0144,
+ "lyapunov": 1.5799841203957872,
+ "grad_norm": 1.3148798714645298,
+ "grad_max_sv": 0.7969768509268761,
+ "grad_min_sv": 2.3226430623246585e-08,
+ "grad_condition": 42533078.34572536,
+ "lr": 0.0009911436253643444,
+ "time_sec": 41.729400634765625
+ },
+ {
+ "epoch": 10,
+ "train_loss": 4.559664976348877,
+ "train_acc": 0.06118,
+ "test_loss": 6.018364582824707,
+ "test_acc": 0.01,
+ "lyapunov": 1.5615371959593596,
+ "grad_norm": 1.0712815395536825,
+ "grad_max_sv": 0.5929864205420017,
+ "grad_min_sv": 1.803380545450928e-08,
+ "grad_condition": 45789422.46232475,
+ "lr": 0.0009890738003669028,
+ "time_sec": 41.75548052787781
+ },
+ {
+ "epoch": 11,
+ "train_loss": 4.644180833282471,
+ "train_acc": 0.05202,
+ "test_loss": 6.277861665344238,
+ "test_acc": 0.01,
+ "lyapunov": 1.5085474514900266,
+ "grad_norm": 0.9280338123504958,
+ "grad_max_sv": 0.5784458503127098,
+ "grad_min_sv": 1.5023789502743857e-08,
+ "grad_condition": 63657686.089994095,
+ "lr": 0.00098678945143658,
+ "time_sec": 41.724050760269165
+ },
+ {
+ "epoch": 12,
+ "train_loss": 4.769687054901123,
+ "train_acc": 0.03436,
+ "test_loss": 7.280889709472656,
+ "test_acc": 0.01,
+ "lyapunov": 1.4389935622129904,
+ "grad_norm": 0.7003645750231552,
+ "grad_max_sv": 0.4854817561805248,
+ "grad_min_sv": 1.030722744932433e-08,
+ "grad_condition": 53249509.08795764,
+ "lr": 0.0009842915805643154,
+ "time_sec": 41.72962784767151
+ },
+ {
+ "epoch": 13,
+ "train_loss": 4.684542055053711,
+ "train_acc": 0.047,
+ "test_loss": 6.991418453979493,
+ "test_acc": 0.0112,
+ "lyapunov": 1.4236155184333588,
+ "grad_norm": 0.5991208192017541,
+ "grad_max_sv": 0.38398267030715943,
+ "grad_min_sv": 9.323978394926158e-09,
+ "grad_condition": 49967645.39513852,
+ "lr": 0.000981581283398829,
+ "time_sec": 41.743834018707275
+ },
+ {
+ "epoch": 14,
+ "train_loss": 4.875620534667969,
+ "train_acc": 0.02944,
+ "test_loss": 7.128801351165771,
+ "test_acc": 0.01,
+ "lyapunov": 1.427685697060412,
+ "grad_norm": 0.5025111739329319,
+ "grad_max_sv": 0.35512366965413095,
+ "grad_min_sv": 6.843199759284935e-09,
+ "grad_condition": 179836296.82542375,
+ "lr": 0.0009786597487660333,
+ "time_sec": 41.73904871940613
+ },
+ {
+ "epoch": 15,
+ "train_loss": 4.896511934967041,
+ "train_acc": 0.0335,
+ "test_loss": 17.298480625915527,
+ "test_acc": 0.01,
+ "lyapunov": 1.4632702230492516,
+ "grad_norm": 0.6331107294627782,
+ "grad_max_sv": 0.40708996057510377,
+ "grad_min_sv": 8.00606376749613e-09,
+ "grad_condition": 61874764.454221845,
+ "lr": 0.0009755282581475766,
+ "time_sec": 41.74419069290161
+ },
+ {
+ "epoch": 16,
+ "train_loss": 4.912100847015381,
+ "train_acc": 0.03632,
+ "test_loss": 8.131814362335206,
+ "test_acc": 0.0173,
+ "lyapunov": 1.4873096464235154,
+ "grad_norm": 0.826404597993897,
+ "grad_max_sv": 0.5076741345226765,
+ "grad_min_sv": 9.837833857273547e-09,
+ "grad_condition": 88718975.42972028,
+ "lr": 0.0009721881851187403,
+ "time_sec": 41.72049045562744
+ },
+ {
+ "epoch": 17,
+ "train_loss": 5.142030757446289,
+ "train_acc": 0.01672,
+ "test_loss": 6.458518544006347,
+ "test_acc": 0.01,
+ "lyapunov": 1.4868055615583649,
+ "grad_norm": 0.685951759542417,
+ "grad_max_sv": 0.5134769573807716,
+ "grad_min_sv": 7.799288968823869e-09,
+ "grad_condition": 85468742.13553956,
+ "lr": 0.0009686409947459456,
+ "time_sec": 41.73842525482178
+ },
+ {
+ "epoch": 18,
+ "train_loss": 5.188919100646973,
+ "train_acc": 0.00968,
+ "test_loss": 10.075014764404298,
+ "test_acc": 0.01,
+ "lyapunov": 1.4449111775059225,
+ "grad_norm": 0.4332247860431087,
+ "grad_max_sv": 0.3550705298781395,
+ "grad_min_sv": 4.337704034504397e-09,
+ "grad_condition": 117230068.9379596,
+ "lr": 0.0009648882429441254,
+ "time_sec": 41.763601779937744
+ },
+ {
+ "epoch": 19,
+ "train_loss": 5.226645467529297,
+ "train_acc": 0.01012,
+ "test_loss": 10.154055513000488,
+ "test_acc": 0.01,
+ "lyapunov": 1.4546792269362818,
+ "grad_norm": 0.3237987289049562,
+ "grad_max_sv": 0.2639503736048937,
+ "grad_min_sv": 2.060994466181133e-09,
+ "grad_condition": 14048870017.770252,
+ "lr": 0.00096093157579425,
+ "time_sec": 41.76903176307678
+ },
+ {
+ "epoch": 20,
+ "train_loss": 5.22861256149292,
+ "train_acc": 0.00962,
+ "test_loss": 9.159314030456542,
+ "test_acc": 0.01,
+ "lyapunov": 1.4311617704303674,
+ "grad_norm": 0.2580272391441697,
+ "grad_max_sv": 0.2014818772673607,
+ "grad_min_sv": 4.775887305801581e-11,
+ "grad_condition": 131599872645.97823,
+ "lr": 0.0009567727288213001,
+ "time_sec": 41.77689838409424
+ },
+ {
+ "epoch": 21,
+ "train_loss": 5.2369175091552735,
+ "train_acc": 0.0091,
+ "test_loss": 9.329907885742188,
+ "test_acc": 0.01,
+ "lyapunov": 1.4427513545736328,
+ "grad_norm": 0.20829668219493744,
+ "grad_max_sv": 0.15635721795260907,
+ "grad_min_sv": 7.96448125755094e-11,
+ "grad_condition": 123768275801.26958,
+ "lr": 0.0009524135262330095,
+ "time_sec": 41.749500036239624
+ },
+ {
+ "epoch": 22,
+ "train_loss": 5.232069122619629,
+ "train_acc": 0.00928,
+ "test_loss": 8.256287899780274,
+ "test_acc": 0.01,
+ "lyapunov": 1.43826272115683,
+ "grad_norm": 0.18574459317073533,
+ "grad_max_sv": 0.13343477975577117,
+ "grad_min_sv": 3.891468616243542e-11,
+ "grad_condition": 128132122536.13669,
+ "lr": 0.0009478558801197061,
+ "time_sec": 41.73808455467224
+ },
+ {
+ "epoch": 23,
+ "train_loss": 5.223144430541992,
+ "train_acc": 0.00912,
+ "test_loss": 8.333074249267579,
+ "test_acc": 0.01,
+ "lyapunov": 1.431471188659863,
+ "grad_norm": 0.15147554959008916,
+ "grad_max_sv": 0.10204733423888683,
+ "grad_min_sv": 2.03341283080962e-15,
+ "grad_condition": 101827814032.01648,
+ "lr": 0.000943101789615607,
+ "time_sec": 41.746745347976685
+ },
+ {
+ "epoch": 24,
+ "train_loss": 5.233420145263672,
+ "train_acc": 0.00942,
+ "test_loss": 7.730482585906983,
+ "test_acc": 0.01,
+ "lyapunov": 1.443052962917806,
+ "grad_norm": 0.1288834602441298,
+ "grad_max_sv": 0.07254640674218535,
+ "grad_min_sv": 1.1788800604957402e-13,
+ "grad_condition": 69609233199.00801,
+ "lr": 0.0009381533400219313,
+ "time_sec": 41.73458123207092
+ },
+ {
+ "epoch": 25,
+ "train_loss": 5.248794226074219,
+ "train_acc": 0.01224,
+ "test_loss": 6.550568232727051,
+ "test_acc": 0.01,
+ "lyapunov": 1.4743182287191796,
+ "grad_norm": 0.19543413013737237,
+ "grad_max_sv": 0.08613794101402164,
+ "grad_min_sv": 6.309014754681635e-11,
+ "grad_condition": 60792110328.20559,
+ "lr": 0.0009330127018922189,
+ "time_sec": 41.73256278038025
+ },
+ {
+ "epoch": 26,
+ "train_loss": 5.226683191070556,
+ "train_acc": 0.00892,
+ "test_loss": 5.647989534759522,
+ "test_acc": 0.01,
+ "lyapunov": 1.434842828289627,
+ "grad_norm": 0.14721341402984697,
+ "grad_max_sv": 0.09509434262290598,
+ "grad_min_sv": 1.0618768151186443e-15,
+ "grad_condition": 94978842737.15823,
+ "lr": 0.000927682130080253,
+ "time_sec": 41.72614550590515
+ },
+ {
+ "epoch": 27,
+ "train_loss": 5.229176857604981,
+ "train_acc": 0.00972,
+ "test_loss": 5.612284447479248,
+ "test_acc": 0.01,
+ "lyapunov": 1.4389631537830128,
+ "grad_norm": 0.1286875557895635,
+ "grad_max_sv": 0.07554986858740449,
+ "grad_min_sv": 1.9029346441684858e-16,
+ "grad_condition": 75528406184.49973,
+ "lr": 0.0009221639627510072,
+ "time_sec": 41.73252606391907
+ },
+ {
+ "epoch": 28,
+ "train_loss": 5.226171473999023,
+ "train_acc": 0.00934,
+ "test_loss": 5.924600332641601,
+ "test_acc": 0.01,
+ "lyapunov": 1.4371787568797236,
+ "grad_norm": 0.10743150341998972,
+ "grad_max_sv": 0.048194893449544904,
+ "grad_min_sv": 0.0,
+ "grad_condition": 48194893449.54491,
+ "lr": 0.0009164606203550494,
+ "time_sec": 41.72467064857483
+ },
+ {
+ "epoch": 29,
+ "train_loss": 5.230549348297119,
+ "train_acc": 0.00932,
+ "test_loss": 5.312363116455078,
+ "test_acc": 0.01,
+ "lyapunov": 1.4417800442946842,
+ "grad_norm": 0.10913623720356962,
+ "grad_max_sv": 0.050634372420608996,
+ "grad_min_sv": 0.0,
+ "grad_condition": 50634372420.60899,
+ "lr": 0.0009105746045668516,
+ "time_sec": 41.754605531692505
+ },
+ {
+ "epoch": 30,
+ "train_loss": 5.229708560028076,
+ "train_acc": 0.0092,
+ "test_loss": 5.395946918487549,
+ "test_acc": 0.01,
+ "lyapunov": 1.441019511588699,
+ "grad_norm": 0.10497591874908667,
+ "grad_max_sv": 0.04387410613708198,
+ "grad_min_sv": 0.0,
+ "grad_condition": 43874106137.081985,
+ "lr": 0.0009045084971874733,
+ "time_sec": 41.71743130683899
+ },
+ {
+ "epoch": 31,
+ "train_loss": 5.2316739025878904,
+ "train_acc": 0.00982,
+ "test_loss": 6.248269965362549,
+ "test_acc": 0.01,
+ "lyapunov": 1.443965878023211,
+ "grad_norm": 0.10154022323683165,
+ "grad_max_sv": 0.03353279777802527,
+ "grad_min_sv": 0.0,
+ "grad_condition": 33532797778.02527,
+ "lr": 0.0008982649590120977,
+ "time_sec": 41.701202392578125
+ },
+ {
+ "epoch": 32,
+ "train_loss": 5.23400792678833,
+ "train_acc": 0.00938,
+ "test_loss": 5.782683653259277,
+ "test_acc": 0.01,
+ "lyapunov": 1.446322088046452,
+ "grad_norm": 0.10537953489915908,
+ "grad_max_sv": 0.04410789059475064,
+ "grad_min_sv": 0.0,
+ "grad_condition": 44107890594.75064,
+ "lr": 0.0008918467286629196,
+ "time_sec": 41.70464754104614
+ },
+ {
+ "epoch": 33,
+ "train_loss": 5.232683167877197,
+ "train_acc": 0.00858,
+ "test_loss": 5.318116857910156,
+ "test_acc": 0.01,
+ "lyapunov": 1.4452067232497818,
+ "grad_norm": 0.1008655295742077,
+ "grad_max_sv": 0.03291638647206128,
+ "grad_min_sv": 0.0,
+ "grad_condition": 32916386472.06128,
+ "lr": 0.0008852566213878943,
+ "time_sec": 41.68885540962219
+ },
+ {
+ "epoch": 34,
+ "train_loss": 5.237297785339355,
+ "train_acc": 0.00966,
+ "test_loss": 5.309081327819825,
+ "test_acc": 0.01,
+ "lyapunov": 1.450283215783746,
+ "grad_norm": 0.10345313863412257,
+ "grad_max_sv": 0.04121980397030711,
+ "grad_min_sv": 0.0,
+ "grad_condition": 41219803970.30711,
+ "lr": 0.000878497527825878,
+ "time_sec": 41.72196674346924
+ },
+ {
+ "epoch": 35,
+ "train_loss": 5.240170780029297,
+ "train_acc": 0.00886,
+ "test_loss": 5.1140812942504885,
+ "test_acc": 0.01,
+ "lyapunov": 1.4520895359156383,
+ "grad_norm": 0.10252991679320593,
+ "grad_max_sv": 0.038473002053797244,
+ "grad_min_sv": 0.0,
+ "grad_condition": 38473002053.79725,
+ "lr": 0.000871572412738697,
+ "time_sec": 41.704707622528076
+ },
+ {
+ "epoch": 36,
+ "train_loss": 5.237992069244385,
+ "train_acc": 0.0091,
+ "test_loss": 5.254914206695557,
+ "test_acc": 0.01,
+ "lyapunov": 1.4511004372326004,
+ "grad_norm": 0.1034357825731679,
+ "grad_max_sv": 0.03689436963759363,
+ "grad_min_sv": 0.0,
+ "grad_condition": 36894369637.59363,
+ "lr": 0.0008644843137107055,
+ "time_sec": 41.68847870826721
+ },
+ {
+ "epoch": 37,
+ "train_loss": 5.24728928100586,
+ "train_acc": 0.00948,
+ "test_loss": 5.015587938690185,
+ "test_acc": 0.01,
+ "lyapunov": 1.4593792114111468,
+ "grad_norm": 0.10030700112378006,
+ "grad_max_sv": 0.027813022676855325,
+ "grad_min_sv": 0.0,
+ "grad_condition": 27813022676.855324,
+ "lr": 0.0008572363398164014,
+ "time_sec": 41.67623424530029
+ },
+ {
+ "epoch": 38,
+ "train_loss": 5.240536932220459,
+ "train_acc": 0.0092,
+ "test_loss": 4.961225141906739,
+ "test_acc": 0.01,
+ "lyapunov": 1.454334620319669,
+ "grad_norm": 0.09505358413147648,
+ "grad_max_sv": 0.022648979304358365,
+ "grad_min_sv": 0.0,
+ "grad_condition": 22648979304.35836,
+ "lr": 0.0008498316702566826,
+ "time_sec": 41.65856647491455
+ },
+ {
+ "epoch": 39,
+ "train_loss": 5.24094622467041,
+ "train_acc": 0.00906,
+ "test_loss": 4.902838454437256,
+ "test_acc": 0.01,
+ "lyapunov": 1.4547367199607517,
+ "grad_norm": 0.09365021131775912,
+ "grad_max_sv": 0.02316552624106407,
+ "grad_min_sv": 0.0,
+ "grad_condition": 23165526241.06407,
+ "lr": 0.0008422735529643442,
+ "time_sec": 41.66074347496033
+ },
+ {
+ "epoch": 40,
+ "train_loss": 5.245578489685059,
+ "train_acc": 0.00954,
+ "test_loss": 4.859429032897949,
+ "test_acc": 0.01,
+ "lyapunov": 1.4598181689791667,
+ "grad_norm": 0.10147367716516044,
+ "grad_max_sv": 0.023039095243439077,
+ "grad_min_sv": 0.0,
+ "grad_condition": 23039095243.43908,
+ "lr": 0.0008345653031794289,
+ "time_sec": 41.646554708480835
+ },
+ {
+ "epoch": 41,
+ "train_loss": 5.245340968780518,
+ "train_acc": 0.00972,
+ "test_loss": 5.133834055328369,
+ "test_acc": 0.01,
+ "lyapunov": 1.4597191298404313,
+ "grad_norm": 0.09983575491941106,
+ "grad_max_sv": 0.023509565647691487,
+ "grad_min_sv": 0.0,
+ "grad_condition": 23509565647.69149,
+ "lr": 0.0008267103019950526,
+ "time_sec": 41.67466497421265
+ },
+ {
+ "epoch": 42,
+ "train_loss": 5.243727160949707,
+ "train_acc": 0.0094,
+ "test_loss": 5.177202513122559,
+ "test_acc": 0.01,
+ "lyapunov": 1.457551447936641,
+ "grad_norm": 0.10012844556744109,
+ "grad_max_sv": 0.04022635291330516,
+ "grad_min_sv": 0.0,
+ "grad_condition": 40226352913.30516,
+ "lr": 0.0008187119948743447,
+ "time_sec": 41.69778633117676
+ },
+ {
+ "epoch": 43,
+ "train_loss": 5.245192972717285,
+ "train_acc": 0.00916,
+ "test_loss": 4.837023108673096,
+ "test_acc": 0.01,
+ "lyapunov": 1.4592695629505246,
+ "grad_norm": 0.0977089071025598,
+ "grad_max_sv": 0.02978864456526935,
+ "grad_min_sv": 0.0,
+ "grad_condition": 29788644565.269356,
+ "lr": 0.000810573890139155,
+ "time_sec": 41.68951177597046
+ },
+ {
+ "epoch": 44,
+ "train_loss": 5.2786666191101075,
+ "train_acc": 0.01064,
+ "test_loss": 5.4122274887084965,
+ "test_acc": 0.01,
+ "lyapunov": 1.5007501855835585,
+ "grad_norm": 0.12265113875538343,
+ "grad_max_sv": 0.033590356819331646,
+ "grad_min_sv": 5.169785690831125e-14,
+ "grad_condition": 31777859057.197426,
+ "lr": 0.0008022995574311873,
+ "time_sec": 41.67222714424133
+ },
+ {
+ "epoch": 45,
+ "train_loss": 5.251278916320801,
+ "train_acc": 0.00912,
+ "test_loss": 5.717527485656738,
+ "test_acc": 0.01,
+ "lyapunov": 1.4666499061047877,
+ "grad_norm": 0.09464479083441923,
+ "grad_max_sv": 0.015212097018957139,
+ "grad_min_sv": 0.0,
+ "grad_condition": 15212097018.957138,
+ "lr": 0.0007938926261462363,
+ "time_sec": 41.66761112213135
+ },
+ {
+ "epoch": 46,
+ "train_loss": 5.248660043487549,
+ "train_acc": 0.00922,
+ "test_loss": 5.687412886047364,
+ "test_acc": 0.01,
+ "lyapunov": 1.4640466523597309,
+ "grad_norm": 0.09250900682814509,
+ "grad_max_sv": 0.00974161345511675,
+ "grad_min_sv": 0.0,
+ "grad_condition": 9741613455.116749,
+ "lr": 0.0007853567838422158,
+ "time_sec": 41.62896704673767
+ },
+ {
+ "epoch": 47,
+ "train_loss": 5.249529778289795,
+ "train_acc": 0.00976,
+ "test_loss": 5.35712462310791,
+ "test_acc": 0.01,
+ "lyapunov": 1.4639555450595554,
+ "grad_norm": 0.09683136939926335,
+ "grad_max_sv": 0.02266658809967339,
+ "grad_min_sv": 0.0,
+ "grad_condition": 22666588099.67339,
+ "lr": 0.0007766957746216719,
+ "time_sec": 41.632965326309204
+ },
+ {
+ "epoch": 48,
+ "train_loss": 5.2507288345336915,
+ "train_acc": 0.00952,
+ "test_loss": 5.053029971313476,
+ "test_acc": 0.01,
+ "lyapunov": 1.46576005692982,
+ "grad_norm": 0.09407593048273037,
+ "grad_max_sv": 0.027120837941765785,
+ "grad_min_sv": 0.0,
+ "grad_condition": 27120837941.765785,
+ "lr": 0.0007679133974894982,
+ "time_sec": 41.65870714187622
+ },
+ {
+ "epoch": 49,
+ "train_loss": 5.249875890960693,
+ "train_acc": 0.00884,
+ "test_loss": 5.38174955444336,
+ "test_acc": 0.01,
+ "lyapunov": 1.465318091690083,
+ "grad_norm": 0.09064589183935413,
+ "grad_max_sv": 0.008867102395743131,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8867102395.743132,
+ "lr": 0.000759013504686565,
+ "time_sec": 41.735912561416626
+ },
+ {
+ "epoch": 50,
+ "train_loss": 5.250207867889404,
+ "train_acc": 0.00898,
+ "test_loss": 5.739707115173339,
+ "test_acc": 0.01,
+ "lyapunov": 1.4655792646091004,
+ "grad_norm": 0.09717189190349201,
+ "grad_max_sv": 0.021169214555993677,
+ "grad_min_sv": 0.0,
+ "grad_condition": 21169214555.993675,
+ "lr": 0.0007499999999999998,
+ "time_sec": 41.72933316230774
+ },
+ {
+ "epoch": 51,
+ "train_loss": 5.250648717803955,
+ "train_acc": 0.00912,
+ "test_loss": 6.128197521972656,
+ "test_acc": 0.01,
+ "lyapunov": 1.4661765546749925,
+ "grad_norm": 0.09095698035941559,
+ "grad_max_sv": 0.01055141636170447,
+ "grad_min_sv": 0.0,
+ "grad_condition": 10551416361.704468,
+ "lr": 0.0007408768370508575,
+ "time_sec": 41.69919180870056
+ },
+ {
+ "epoch": 52,
+ "train_loss": 5.251839170684814,
+ "train_acc": 0.00908,
+ "test_loss": 6.067484506225586,
+ "test_acc": 0.01,
+ "lyapunov": 1.4675627587091586,
+ "grad_norm": 0.09067609636620885,
+ "grad_max_sv": 0.004669012082740664,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4669012082.7406645,
+ "lr": 0.0007316480175599307,
+ "time_sec": 41.654059171676636
+ },
+ {
+ "epoch": 53,
+ "train_loss": 5.253518835144043,
+ "train_acc": 0.00896,
+ "test_loss": 5.7827218193054195,
+ "test_acc": 0.01,
+ "lyapunov": 1.4693938874832504,
+ "grad_norm": 0.09137616955031719,
+ "grad_max_sv": 0.010091183660551905,
+ "grad_min_sv": 0.0,
+ "grad_condition": 10091183660.551905,
+ "lr": 0.0007223175895924635,
+ "time_sec": 41.642850160598755
+ },
+ {
+ "epoch": 54,
+ "train_loss": 5.254051934051514,
+ "train_acc": 0.00872,
+ "test_loss": 5.591477861022949,
+ "test_acc": 0.01,
+ "lyapunov": 1.4702323230026324,
+ "grad_norm": 0.08996816491022355,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007128896457825361,
+ "time_sec": 41.657779932022095
+ },
+ {
+ "epoch": 55,
+ "train_loss": 5.255190885314941,
+ "train_acc": 0.00916,
+ "test_loss": 5.435504406738281,
+ "test_acc": 0.01,
+ "lyapunov": 1.4712699441348804,
+ "grad_norm": 0.09391959822012276,
+ "grad_max_sv": 0.005470911040902138,
+ "grad_min_sv": 0.0,
+ "grad_condition": 5470911040.902138,
+ "lr": 0.0007033683215378998,
+ "time_sec": 41.70645236968994
+ },
+ {
+ "epoch": 56,
+ "train_loss": 5.254567480010986,
+ "train_acc": 0.0092,
+ "test_loss": 5.745911796569824,
+ "test_acc": 0.01,
+ "lyapunov": 1.470891768670143,
+ "grad_norm": 0.08856701808364516,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006937577932260512,
+ "time_sec": 41.71012330055237
+ },
+ {
+ "epoch": 57,
+ "train_loss": 5.255953155822754,
+ "train_acc": 0.00902,
+ "test_loss": 5.410791555023193,
+ "test_acc": 0.01,
+ "lyapunov": 1.4723095774955457,
+ "grad_norm": 0.0914524874609732,
+ "grad_max_sv": 0.005876953201368451,
+ "grad_min_sv": 0.0,
+ "grad_condition": 5876953201.368451,
+ "lr": 0.0006840622763423388,
+ "time_sec": 41.65397572517395
+ },
+ {
+ "epoch": 58,
+ "train_loss": 5.255620794372558,
+ "train_acc": 0.00814,
+ "test_loss": 5.248719776153565,
+ "test_acc": 0.01,
+ "lyapunov": 1.4720726202211112,
+ "grad_norm": 0.08957407910190007,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006742860236609073,
+ "time_sec": 41.596808195114136
+ },
+ {
+ "epoch": 59,
+ "train_loss": 5.256758173370361,
+ "train_acc": 0.00904,
+ "test_loss": 5.839924575805664,
+ "test_acc": 0.01,
+ "lyapunov": 1.4729903738212098,
+ "grad_norm": 0.09261814392317223,
+ "grad_max_sv": 0.016021678689867258,
+ "grad_min_sv": 0.0,
+ "grad_condition": 16021678689.867258,
+ "lr": 0.0006644333233692913,
+ "time_sec": 41.65124177932739
+ },
+ {
+ "epoch": 60,
+ "train_loss": 5.256810084991455,
+ "train_acc": 0.00942,
+ "test_loss": 5.447851982879639,
+ "test_acc": 0.01,
+ "lyapunov": 1.4729429684636537,
+ "grad_norm": 0.09328751710854948,
+ "grad_max_sv": 0.018184319231659175,
+ "grad_min_sv": 0.0,
+ "grad_condition": 18184319231.659172,
+ "lr": 0.0006545084971874734,
+ "time_sec": 41.677849769592285
+ },
+ {
+ "epoch": 61,
+ "train_loss": 5.257736980895996,
+ "train_acc": 0.00956,
+ "test_loss": 5.214775198364258,
+ "test_acc": 0.01,
+ "lyapunov": 1.4742664586552574,
+ "grad_norm": 0.09141104511491621,
+ "grad_max_sv": 0.014100066805258393,
+ "grad_min_sv": 0.0,
+ "grad_condition": 14100066805.258392,
+ "lr": 0.0006445158984722354,
+ "time_sec": 41.65701365470886
+ },
+ {
+ "epoch": 62,
+ "train_loss": 5.257541732788086,
+ "train_acc": 0.00888,
+ "test_loss": 5.395826309204102,
+ "test_acc": 0.01,
+ "lyapunov": 1.4742513254780294,
+ "grad_norm": 0.08871521712913655,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006344599103076324,
+ "time_sec": 41.64438438415527
+ },
+ {
+ "epoch": 63,
+ "train_loss": 5.258026624908447,
+ "train_acc": 0.00826,
+ "test_loss": 5.438673513793946,
+ "test_acc": 0.01,
+ "lyapunov": 1.474777021066612,
+ "grad_norm": 0.08974006980177573,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006243449435824269,
+ "time_sec": 41.659621477127075
+ },
+ {
+ "epoch": 64,
+ "train_loss": 5.256656706237793,
+ "train_acc": 0.00858,
+ "test_loss": 5.30103558959961,
+ "test_acc": 0.01,
+ "lyapunov": 1.4732483726023409,
+ "grad_norm": 0.08966165557801938,
+ "grad_max_sv": 0.002812969218939543,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2812969218.939543,
+ "lr": 0.0006141754350553275,
+ "time_sec": 41.680859327316284
+ },
+ {
+ "epoch": 65,
+ "train_loss": 5.25918576675415,
+ "train_acc": 0.00894,
+ "test_loss": 5.125008965301514,
+ "test_acc": 0.01,
+ "lyapunov": 1.4760865912108165,
+ "grad_norm": 0.0887662183827418,
+ "grad_max_sv": 0.0005635306239128113,
+ "grad_min_sv": 0.0,
+ "grad_condition": 563530623.9128113,
+ "lr": 0.0006039558454088793,
+ "time_sec": 41.60912251472473
+ },
+ {
+ "epoch": 66,
+ "train_loss": 5.260574841461182,
+ "train_acc": 0.00874,
+ "test_loss": 5.454896185302735,
+ "test_acc": 0.01,
+ "lyapunov": 1.4776358738579713,
+ "grad_norm": 0.11531617666338094,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000593690657292862,
+ "time_sec": 41.6300413608551
+ },
+ {
+ "epoch": 67,
+ "train_loss": 5.259261641082763,
+ "train_acc": 0.00928,
+ "test_loss": 5.808028590393066,
+ "test_acc": 0.01,
+ "lyapunov": 1.4762413047463692,
+ "grad_norm": 0.08815522678931535,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005833843733580507,
+ "time_sec": 41.62497115135193
+ },
+ {
+ "epoch": 68,
+ "train_loss": 5.2594527183532715,
+ "train_acc": 0.00938,
+ "test_loss": 5.654487629699707,
+ "test_acc": 0.01,
+ "lyapunov": 1.4761893337644885,
+ "grad_norm": 0.09333979255701338,
+ "grad_max_sv": 0.014018809190019965,
+ "grad_min_sv": 0.0,
+ "grad_condition": 14018809190.019964,
+ "lr": 0.0005730415142812054,
+ "time_sec": 41.621119260787964
+ },
+ {
+ "epoch": 69,
+ "train_loss": 5.26328825378418,
+ "train_acc": 0.00966,
+ "test_loss": 5.534258514404297,
+ "test_acc": 0.01,
+ "lyapunov": 1.4803016765038375,
+ "grad_norm": 0.10303270455881028,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005626666167821517,
+ "time_sec": 41.61156606674194
+ },
+ {
+ "epoch": 70,
+ "train_loss": 5.261220071105957,
+ "train_acc": 0.00968,
+ "test_loss": 5.542517721557617,
+ "test_acc": 0.01,
+ "lyapunov": 1.4784168117796368,
+ "grad_norm": 0.08844874021214537,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005522642316338265,
+ "time_sec": 41.62671518325806
+ },
+ {
+ "epoch": 71,
+ "train_loss": 5.260938765716553,
+ "train_acc": 0.00862,
+ "test_loss": 5.420013078308106,
+ "test_acc": 0.01,
+ "lyapunov": 1.4779477622502906,
+ "grad_norm": 0.0889283460956175,
+ "grad_max_sv": 0.0034733008593320846,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3473300859.3320847,
+ "lr": 0.0005418389216661573,
+ "time_sec": 41.62442445755005
+ },
+ {
+ "epoch": 72,
+ "train_loss": 5.260601893157959,
+ "train_acc": 0.00902,
+ "test_loss": 5.176327791595459,
+ "test_acc": 0.01,
+ "lyapunov": 1.4776618431901078,
+ "grad_norm": 0.0902718541800826,
+ "grad_max_sv": 0.012300812685862184,
+ "grad_min_sv": 0.0,
+ "grad_condition": 12300812685.862183,
+ "lr": 0.0005313952597646563,
+ "time_sec": 41.66868996620178
+ },
+ {
+ "epoch": 73,
+ "train_loss": 5.264250277404785,
+ "train_acc": 0.00884,
+ "test_loss": 5.100635796356201,
+ "test_acc": 0.01,
+ "lyapunov": 1.4813997955883251,
+ "grad_norm": 0.0903405536598621,
+ "grad_max_sv": 0.007483795657753945,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7483795657.7539425,
+ "lr": 0.0005209378268645994,
+ "time_sec": 41.626320600509644
+ },
+ {
+ "epoch": 74,
+ "train_loss": 5.26120802658081,
+ "train_acc": 0.0087,
+ "test_loss": 5.235371070861817,
+ "test_acc": 0.01,
+ "lyapunov": 1.4784196508510032,
+ "grad_norm": 0.0879091159548037,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005104712099416781,
+ "time_sec": 41.62154483795166
+ },
+ {
+ "epoch": 75,
+ "train_loss": 5.267138383178711,
+ "train_acc": 0.00858,
+ "test_loss": 4.973852683258056,
+ "test_acc": 0.01,
+ "lyapunov": 1.4819577859185846,
+ "grad_norm": 0.08881358787274304,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004999999999999996,
+ "time_sec": 41.638519048690796
+ },
+ {
+ "epoch": 76,
+ "train_loss": 5.2642199221801755,
+ "train_acc": 0.00822,
+ "test_loss": 5.071284794616699,
+ "test_acc": 0.01,
+ "lyapunov": 1.4816657048661996,
+ "grad_norm": 0.08882388372557563,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004895287900583212,
+ "time_sec": 41.619221925735474
+ },
+ {
+ "epoch": 77,
+ "train_loss": 5.273737740020752,
+ "train_acc": 0.00884,
+ "test_loss": 4.974697065734864,
+ "test_acc": 0.01,
+ "lyapunov": 1.490840724667015,
+ "grad_norm": 0.08942192638502924,
+ "grad_max_sv": 0.0068177991081029175,
+ "grad_min_sv": 0.0,
+ "grad_condition": 6817799108.102918,
+ "lr": 0.0004790621731353997,
+ "time_sec": 41.63776922225952
+ },
+ {
+ "epoch": 78,
+ "train_loss": 5.261278802490234,
+ "train_acc": 0.00874,
+ "test_loss": 4.976500602722168,
+ "test_acc": 0.01,
+ "lyapunov": 1.4785530381190501,
+ "grad_norm": 0.0880515343100226,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000468604740235343,
+ "time_sec": 41.607832193374634
+ },
+ {
+ "epoch": 79,
+ "train_loss": 5.263828933258057,
+ "train_acc": 0.00816,
+ "test_loss": 4.9257099716186525,
+ "test_acc": 0.01,
+ "lyapunov": 1.4813517496713897,
+ "grad_norm": 0.08863134124223197,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00045816107833384175,
+ "time_sec": 41.631874561309814
+ },
+ {
+ "epoch": 80,
+ "train_loss": 5.268178493652344,
+ "train_acc": 0.00912,
+ "test_loss": 4.912583598327637,
+ "test_acc": 0.01,
+ "lyapunov": 1.4849315034154127,
+ "grad_norm": 0.08860861584524822,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004477357683661729,
+ "time_sec": 41.710554122924805
+ },
+ {
+ "epoch": 81,
+ "train_loss": 5.26138502532959,
+ "train_acc": 0.00922,
+ "test_loss": 4.878695037841797,
+ "test_acc": 0.01,
+ "lyapunov": 1.478672110820975,
+ "grad_norm": 0.09157782940494599,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00043733338321784746,
+ "time_sec": 41.64098763465881
+ },
+ {
+ "epoch": 82,
+ "train_loss": 5.268409018859863,
+ "train_acc": 0.00922,
+ "test_loss": 4.908391270446777,
+ "test_acc": 0.01,
+ "lyapunov": 1.4861254643296342,
+ "grad_norm": 0.11020465642062108,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004269584857187939,
+ "time_sec": 41.60934782028198
+ },
+ {
+ "epoch": 83,
+ "train_loss": 5.265614703063965,
+ "train_acc": 0.00942,
+ "test_loss": 4.864893129730224,
+ "test_acc": 0.01,
+ "lyapunov": 1.4825067782341061,
+ "grad_norm": 0.09011764156233357,
+ "grad_max_sv": 0.002433748124167323,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2433748124.167323,
+ "lr": 0.0004166156266419484,
+ "time_sec": 41.60301470756531
+ },
+ {
+ "epoch": 84,
+ "train_loss": 5.262646561889649,
+ "train_acc": 0.0091,
+ "test_loss": 4.719803262329101,
+ "test_acc": 0.01,
+ "lyapunov": 1.4800378392114664,
+ "grad_norm": 0.08987030714157009,
+ "grad_max_sv": 0.005705382255837321,
+ "grad_min_sv": 0.0,
+ "grad_condition": 5705382255.837321,
+ "lr": 0.0004063093427071373,
+ "time_sec": 41.6301634311676
+ },
+ {
+ "epoch": 85,
+ "train_loss": 5.263007119445801,
+ "train_acc": 0.00892,
+ "test_loss": 4.765390521240234,
+ "test_acc": 0.01,
+ "lyapunov": 1.4803728941456435,
+ "grad_norm": 0.08908420576392925,
+ "grad_max_sv": 0.005673544481396675,
+ "grad_min_sv": 0.0,
+ "grad_condition": 5673544481.396675,
+ "lr": 0.0003960441545911199,
+ "time_sec": 41.6158664226532
+ },
+ {
+ "epoch": 86,
+ "train_loss": 5.261938611297607,
+ "train_acc": 0.00896,
+ "test_loss": 4.7486605583190915,
+ "test_acc": 0.01,
+ "lyapunov": 1.479363068900145,
+ "grad_norm": 0.08783615573103698,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003858245649446718,
+ "time_sec": 41.63826298713684
+ },
+ {
+ "epoch": 87,
+ "train_loss": 5.263675572814941,
+ "train_acc": 0.00854,
+ "test_loss": 4.729234335327148,
+ "test_acc": 0.01,
+ "lyapunov": 1.481331856354423,
+ "grad_norm": 0.08839938213840319,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00037565505641757235,
+ "time_sec": 41.63784456253052
+ },
+ {
+ "epoch": 88,
+ "train_loss": 5.262854153900147,
+ "train_acc": 0.00876,
+ "test_loss": 4.702548780822754,
+ "test_acc": 0.01,
+ "lyapunov": 1.4803594689235053,
+ "grad_norm": 0.08793981551347788,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00036554008969236695,
+ "time_sec": 41.71681451797485
+ },
+ {
+ "epoch": 89,
+ "train_loss": 5.2630352787780765,
+ "train_acc": 0.00878,
+ "test_loss": 4.71384239654541,
+ "test_acc": 0.01,
+ "lyapunov": 1.4806065233162298,
+ "grad_norm": 0.08814160681144886,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003554841015277638,
+ "time_sec": 41.7017023563385
+ },
+ {
+ "epoch": 90,
+ "train_loss": 5.262895381469726,
+ "train_acc": 0.00916,
+ "test_loss": 4.708866213226318,
+ "test_acc": 0.01,
+ "lyapunov": 1.4804326811105089,
+ "grad_norm": 0.08915485528106772,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000345491502812526,
+ "time_sec": 41.66344165802002
+ },
+ {
+ "epoch": 91,
+ "train_loss": 5.2640660131835935,
+ "train_acc": 0.00894,
+ "test_loss": 4.7449420501708985,
+ "test_acc": 0.01,
+ "lyapunov": 1.481703461588496,
+ "grad_norm": 0.09104557989631236,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003355666766307081,
+ "time_sec": 41.65228295326233
+ },
+ {
+ "epoch": 92,
+ "train_loss": 5.2634638612365725,
+ "train_acc": 0.00882,
+ "test_loss": 4.755833000946045,
+ "test_acc": 0.01,
+ "lyapunov": 1.4810923280008614,
+ "grad_norm": 0.08888836178350999,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00032571397633909225,
+ "time_sec": 41.6901330947876
+ },
+ {
+ "epoch": 93,
+ "train_loss": 5.264835737762451,
+ "train_acc": 0.00874,
+ "test_loss": 4.721351288604736,
+ "test_acc": 0.01,
+ "lyapunov": 1.4826934395543754,
+ "grad_norm": 0.08947356736587055,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00031593772365766094,
+ "time_sec": 41.6052131652832
+ },
+ {
+ "epoch": 94,
+ "train_loss": 5.263670272369385,
+ "train_acc": 0.00868,
+ "test_loss": 4.785962379455566,
+ "test_acc": 0.01,
+ "lyapunov": 1.4813081669380597,
+ "grad_norm": 0.08849247443481073,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003062422067739483,
+ "time_sec": 41.60963582992554
+ },
+ {
+ "epoch": 95,
+ "train_loss": 5.2619873828125,
+ "train_acc": 0.00798,
+ "test_loss": 4.723102865600586,
+ "test_acc": 0.01,
+ "lyapunov": 1.479443594927678,
+ "grad_norm": 0.08787170616898271,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00029663167846209965,
+ "time_sec": 41.6090726852417
+ },
+ {
+ "epoch": 96,
+ "train_loss": 5.264093981323242,
+ "train_acc": 0.00886,
+ "test_loss": 4.719023175048828,
+ "test_acc": 0.01,
+ "lyapunov": 1.4818146923923736,
+ "grad_norm": 0.08820019238952795,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00028711035421746345,
+ "time_sec": 41.62479615211487
+ },
+ {
+ "epoch": 97,
+ "train_loss": 5.2660337771606445,
+ "train_acc": 0.00826,
+ "test_loss": 4.683718409729004,
+ "test_acc": 0.01,
+ "lyapunov": 1.4838567975232058,
+ "grad_norm": 0.08832542758192675,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00027768241040753615,
+ "time_sec": 41.61792826652527
+ },
+ {
+ "epoch": 98,
+ "train_loss": 5.264854827270508,
+ "train_acc": 0.00872,
+ "test_loss": 4.66099263305664,
+ "test_acc": 0.01,
+ "lyapunov": 1.4826005797861788,
+ "grad_norm": 0.08770768444548716,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00026835198244006903,
+ "time_sec": 41.65434980392456
+ },
+ {
+ "epoch": 99,
+ "train_loss": 5.26445282623291,
+ "train_acc": 0.00872,
+ "test_loss": 4.680420280456543,
+ "test_acc": 0.01,
+ "lyapunov": 1.482219386588582,
+ "grad_norm": 0.08789455257207789,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002591231629491421,
+ "time_sec": 41.626431465148926
+ },
+ {
+ "epoch": 100,
+ "train_loss": 5.267974179992676,
+ "train_acc": 0.00926,
+ "test_loss": 4.719721762084961,
+ "test_acc": 0.01,
+ "lyapunov": 1.4858673469489798,
+ "grad_norm": 0.08804026825834858,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002499999999999997,
+ "time_sec": 41.61785125732422
+ },
+ {
+ "epoch": 101,
+ "train_loss": 5.265785012969971,
+ "train_acc": 0.00908,
+ "test_loss": 4.677582652282715,
+ "test_acc": 0.01,
+ "lyapunov": 1.4835739272939579,
+ "grad_norm": 0.08811206484625347,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00024098649531343477,
+ "time_sec": 41.61317491531372
+ },
+ {
+ "epoch": 102,
+ "train_loss": 5.262550980682373,
+ "train_acc": 0.00804,
+ "test_loss": 4.721813179779053,
+ "test_acc": 0.01,
+ "lyapunov": 1.4801046043405752,
+ "grad_norm": 0.08851673086495025,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002320866025105016,
+ "time_sec": 41.67564344406128
+ },
+ {
+ "epoch": 103,
+ "train_loss": 5.2642667413330075,
+ "train_acc": 0.00882,
+ "test_loss": 4.740510238647461,
+ "test_acc": 0.01,
+ "lyapunov": 1.4820212802618666,
+ "grad_norm": 0.08821117687751044,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002233042253783278,
+ "time_sec": 41.63251256942749
+ },
+ {
+ "epoch": 104,
+ "train_loss": 5.263534827728272,
+ "train_acc": 0.0081,
+ "test_loss": 4.700486143493652,
+ "test_acc": 0.01,
+ "lyapunov": 1.4811951995200818,
+ "grad_norm": 0.08907217589685106,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000214643216157784,
+ "time_sec": 41.62003540992737
+ },
+ {
+ "epoch": 105,
+ "train_loss": 5.263595247192383,
+ "train_acc": 0.00866,
+ "test_loss": 4.685244355773926,
+ "test_acc": 0.01,
+ "lyapunov": 1.4812764624500518,
+ "grad_norm": 0.087999698905291,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00020610737385376332,
+ "time_sec": 41.59307098388672
+ },
+ {
+ "epoch": 106,
+ "train_loss": 5.2640459841918945,
+ "train_acc": 0.00788,
+ "test_loss": 4.679230912780762,
+ "test_acc": 0.01,
+ "lyapunov": 1.481674498914148,
+ "grad_norm": 0.08791576128060906,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00019770044256881242,
+ "time_sec": 41.62804102897644
+ },
+ {
+ "epoch": 107,
+ "train_loss": 5.264458420715332,
+ "train_acc": 0.00878,
+ "test_loss": 4.693680247497559,
+ "test_acc": 0.01,
+ "lyapunov": 1.4822333346852257,
+ "grad_norm": 0.0877864562223225,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001894261098608447,
+ "time_sec": 41.72821760177612
+ },
+ {
+ "epoch": 108,
+ "train_loss": 5.263148934020996,
+ "train_acc": 0.0092,
+ "test_loss": 4.703213790130615,
+ "test_acc": 0.01,
+ "lyapunov": 1.480785415300628,
+ "grad_norm": 0.08786524330498742,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000181288005125655,
+ "time_sec": 41.68737983703613
+ },
+ {
+ "epoch": 109,
+ "train_loss": 5.264703175201416,
+ "train_acc": 0.0078,
+ "test_loss": 4.703215410614014,
+ "test_acc": 0.01,
+ "lyapunov": 1.482531173454831,
+ "grad_norm": 0.0887187166875537,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001732896980049473,
+ "time_sec": 41.6301372051239
+ },
+ {
+ "epoch": 110,
+ "train_loss": 5.262354034423828,
+ "train_acc": 0.00878,
+ "test_loss": 4.673253472900391,
+ "test_acc": 0.01,
+ "lyapunov": 1.4798865848794922,
+ "grad_norm": 0.08823123281084728,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00016543469682057076,
+ "time_sec": 41.61501979827881
+ },
+ {
+ "epoch": 111,
+ "train_loss": 5.261907596282959,
+ "train_acc": 0.00774,
+ "test_loss": 4.6810761657714846,
+ "test_acc": 0.01,
+ "lyapunov": 1.4794099962010103,
+ "grad_norm": 0.08847327230851044,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00015772644703565552,
+ "time_sec": 41.66792058944702
+ },
+ {
+ "epoch": 112,
+ "train_loss": 5.263451714782715,
+ "train_acc": 0.00876,
+ "test_loss": 4.675498142242431,
+ "test_acc": 0.01,
+ "lyapunov": 1.4811130951127738,
+ "grad_norm": 0.08821763372055312,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00015016832974331713,
+ "time_sec": 41.6463463306427
+ },
+ {
+ "epoch": 113,
+ "train_loss": 5.271167716522217,
+ "train_acc": 0.00842,
+ "test_loss": 4.685236253356933,
+ "test_acc": 0.01,
+ "lyapunov": 1.489286311447163,
+ "grad_norm": 0.08951867713473023,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00014276366018359834,
+ "time_sec": 41.74271559715271
+ },
+ {
+ "epoch": 114,
+ "train_loss": 5.271448510589599,
+ "train_acc": 0.00896,
+ "test_loss": 4.690647507476807,
+ "test_acc": 0.01,
+ "lyapunov": 1.4897843382852463,
+ "grad_norm": 0.08820177476113898,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00013551568628929425,
+ "time_sec": 41.668110609054565
+ },
+ {
+ "epoch": 115,
+ "train_loss": 5.2816896908569335,
+ "train_acc": 0.00868,
+ "test_loss": 4.690107788085937,
+ "test_acc": 0.01,
+ "lyapunov": 1.49836193996927,
+ "grad_norm": 0.0881224924879974,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00012842758726130276,
+ "time_sec": 41.65963578224182
+ },
+ {
+ "epoch": 116,
+ "train_loss": 5.265034445343018,
+ "train_acc": 0.00848,
+ "test_loss": 4.69013021774292,
+ "test_acc": 0.01,
+ "lyapunov": 1.4828510912483002,
+ "grad_norm": 0.0884889002186026,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001215024721741218,
+ "time_sec": 41.68511462211609
+ },
+ {
+ "epoch": 117,
+ "train_loss": 5.26604537612915,
+ "train_acc": 0.00834,
+ "test_loss": 4.690117681884765,
+ "test_acc": 0.01,
+ "lyapunov": 1.4837996590777736,
+ "grad_norm": 0.087812082346243,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00011474337861210538,
+ "time_sec": 41.62825393676758
+ },
+ {
+ "epoch": 118,
+ "train_loss": 5.271575555877686,
+ "train_acc": 0.00838,
+ "test_loss": 4.688699510192871,
+ "test_acc": 0.01,
+ "lyapunov": 1.4897897758752183,
+ "grad_norm": 0.08852661249085975,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010815327133708009,
+ "time_sec": 41.813793897628784
+ },
+ {
+ "epoch": 119,
+ "train_loss": 5.270083126525879,
+ "train_acc": 0.00882,
+ "test_loss": 4.678613103485107,
+ "test_acc": 0.01,
+ "lyapunov": 1.4881404150477455,
+ "grad_norm": 0.08809098199633093,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010173504098790182,
+ "time_sec": 41.60239052772522
+ },
+ {
+ "epoch": 120,
+ "train_loss": 5.2668604069519045,
+ "train_acc": 0.00916,
+ "test_loss": 4.668810566711426,
+ "test_acc": 0.01,
+ "lyapunov": 1.484404284630895,
+ "grad_norm": 0.08801465824181619,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 41.67430233955383
+ },
+ {
+ "epoch": 121,
+ "train_loss": 5.270687980041504,
+ "train_acc": 0.00844,
+ "test_loss": 4.678598808288574,
+ "test_acc": 0.01,
+ "lyapunov": 1.4865265313316793,
+ "grad_norm": 0.08823636157170499,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 41.651268005371094
+ },
+ {
+ "epoch": 122,
+ "train_loss": 5.262444466705322,
+ "train_acc": 0.00858,
+ "test_loss": 4.678612301635742,
+ "test_acc": 0.01,
+ "lyapunov": 1.48004513079553,
+ "grad_norm": 0.09003261469940216,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 41.676185607910156
+ },
+ {
+ "epoch": 123,
+ "train_loss": 5.263941179351806,
+ "train_acc": 0.0086,
+ "test_loss": 4.671801266479492,
+ "test_acc": 0.01,
+ "lyapunov": 1.4817558716020316,
+ "grad_norm": 0.09047110449687606,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 41.740845918655396
+ },
+ {
+ "epoch": 124,
+ "train_loss": 5.269082255859375,
+ "train_acc": 0.00892,
+ "test_loss": 4.671809730529785,
+ "test_acc": 0.01,
+ "lyapunov": 1.4871390643327131,
+ "grad_norm": 0.08793369061349017,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 41.75574517250061
+ },
+ {
+ "epoch": 125,
+ "train_loss": 5.262843768310547,
+ "train_acc": 0.00886,
+ "test_loss": 4.662115892028808,
+ "test_acc": 0.01,
+ "lyapunov": 1.4804938851719927,
+ "grad_norm": 0.08792553586108803,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 41.601502656936646
+ },
+ {
+ "epoch": 126,
+ "train_loss": 5.262783556365966,
+ "train_acc": 0.0087,
+ "test_loss": 4.671795330810546,
+ "test_acc": 0.01,
+ "lyapunov": 1.4804595739335356,
+ "grad_norm": 0.08818916489651518,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 41.719630002975464
+ },
+ {
+ "epoch": 127,
+ "train_loss": 5.287085924682617,
+ "train_acc": 0.00884,
+ "test_loss": 4.670085035705567,
+ "test_acc": 0.01,
+ "lyapunov": 1.5052251651159028,
+ "grad_norm": 0.09375403073023182,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 41.655165672302246
+ },
+ {
+ "epoch": 128,
+ "train_loss": 5.3060646118164065,
+ "train_acc": 0.00794,
+ "test_loss": 4.6709625457763675,
+ "test_acc": 0.01,
+ "lyapunov": 1.5216917436750954,
+ "grad_norm": 0.08857015682665342,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 41.698471546173096
+ },
+ {
+ "epoch": 129,
+ "train_loss": 5.263810299682617,
+ "train_acc": 0.00862,
+ "test_loss": 4.679794757080078,
+ "test_acc": 0.01,
+ "lyapunov": 1.4815860233648355,
+ "grad_norm": 0.08793008720913074,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 41.65286087989807
+ },
+ {
+ "epoch": 130,
+ "train_loss": 5.2642881167602535,
+ "train_acc": 0.00886,
+ "test_loss": 4.679787918853759,
+ "test_acc": 0.01,
+ "lyapunov": 1.4821607542159918,
+ "grad_norm": 0.08826309404088324,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 41.60878133773804
+ },
+ {
+ "epoch": 131,
+ "train_loss": 5.264142718353272,
+ "train_acc": 0.00912,
+ "test_loss": 4.679794540405274,
+ "test_acc": 0.01,
+ "lyapunov": 1.4819643613322617,
+ "grad_norm": 0.0879145106714535,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 41.631954193115234
+ },
+ {
+ "epoch": 132,
+ "train_loss": 5.264426311187744,
+ "train_acc": 0.00912,
+ "test_loss": 4.686964068603515,
+ "test_acc": 0.01,
+ "lyapunov": 1.4822249098507034,
+ "grad_norm": 0.08772387144138033,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 41.61648106575012
+ },
+ {
+ "epoch": 133,
+ "train_loss": 5.263279991149902,
+ "train_acc": 0.00928,
+ "test_loss": 4.673583326721191,
+ "test_acc": 0.01,
+ "lyapunov": 1.481004032332574,
+ "grad_norm": 0.08756701265820996,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 41.61954092979431
+ },
+ {
+ "epoch": 134,
+ "train_loss": 5.264391135559082,
+ "train_acc": 0.00916,
+ "test_loss": 4.673584260559082,
+ "test_acc": 0.01,
+ "lyapunov": 1.482238910387239,
+ "grad_norm": 0.08773099630417767,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 41.636422872543335
+ },
+ {
+ "epoch": 135,
+ "train_loss": 5.264316839904785,
+ "train_acc": 0.00918,
+ "test_loss": 4.673586289215088,
+ "test_acc": 0.01,
+ "lyapunov": 1.4821837125226969,
+ "grad_norm": 0.0883951408561693,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 41.637362241744995
+ },
+ {
+ "epoch": 136,
+ "train_loss": 5.263837189178467,
+ "train_acc": 0.00856,
+ "test_loss": 4.673583441162109,
+ "test_acc": 0.01,
+ "lyapunov": 1.4816227761071052,
+ "grad_norm": 0.08805256597520511,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 41.648523807525635
+ },
+ {
+ "epoch": 137,
+ "train_loss": 5.263810054168701,
+ "train_acc": 0.00914,
+ "test_loss": 4.673584091186523,
+ "test_acc": 0.01,
+ "lyapunov": 1.4815898499525417,
+ "grad_norm": 0.08812282585660734,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 41.73938012123108
+ },
+ {
+ "epoch": 138,
+ "train_loss": 5.2631301567077635,
+ "train_acc": 0.00882,
+ "test_loss": 4.673581381225586,
+ "test_acc": 0.01,
+ "lyapunov": 1.4808570945354373,
+ "grad_norm": 0.0884075853889321,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 41.70086741447449
+ },
+ {
+ "epoch": 139,
+ "train_loss": 5.264147056427002,
+ "train_acc": 0.00966,
+ "test_loss": 4.673584265136719,
+ "test_acc": 0.01,
+ "lyapunov": 1.4819788155348406,
+ "grad_norm": 0.08781225710160669,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 41.63281536102295
+ },
+ {
+ "epoch": 140,
+ "train_loss": 5.264177637023926,
+ "train_acc": 0.00946,
+ "test_loss": 4.673582272338868,
+ "test_acc": 0.01,
+ "lyapunov": 1.4820371799151917,
+ "grad_norm": 0.08778605437009919,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 41.605711221694946
+ },
+ {
+ "epoch": 141,
+ "train_loss": 5.264175823974609,
+ "train_acc": 0.01,
+ "test_loss": 4.673583470153808,
+ "test_acc": 0.01,
+ "lyapunov": 1.482038261030641,
+ "grad_norm": 0.08820186315365212,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 41.616660594940186
+ },
+ {
+ "epoch": 142,
+ "train_loss": 5.263000276947022,
+ "train_acc": 0.01,
+ "test_loss": 4.67358302154541,
+ "test_acc": 0.01,
+ "lyapunov": 1.4806900521373505,
+ "grad_norm": 0.08785028349994792,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 41.626938819885254
+ },
+ {
+ "epoch": 143,
+ "train_loss": 5.264303789367676,
+ "train_acc": 0.0093,
+ "test_loss": 4.673582839202881,
+ "test_acc": 0.01,
+ "lyapunov": 1.4821641326255506,
+ "grad_norm": 0.08832630889985595,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 41.62687826156616
+ },
+ {
+ "epoch": 144,
+ "train_loss": 5.266550144958496,
+ "train_acc": 0.01,
+ "test_loss": 4.673582318115234,
+ "test_acc": 0.01,
+ "lyapunov": 1.4840948478035305,
+ "grad_norm": 0.08863982897252927,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 41.63750672340393
+ },
+ {
+ "epoch": 145,
+ "train_loss": 5.2637120777893065,
+ "train_acc": 0.01,
+ "test_loss": 4.673582674407959,
+ "test_acc": 0.01,
+ "lyapunov": 1.4815035524880489,
+ "grad_norm": 0.08799138407501185,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 41.61049675941467
+ },
+ {
+ "epoch": 146,
+ "train_loss": 5.263380687713623,
+ "train_acc": 0.01,
+ "test_loss": 4.6735828002929685,
+ "test_acc": 0.01,
+ "lyapunov": 1.48112582825029,
+ "grad_norm": 0.08789323778024616,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 41.664053201675415
+ },
+ {
+ "epoch": 147,
+ "train_loss": 5.262870178375244,
+ "train_acc": 0.01,
+ "test_loss": 4.67358247756958,
+ "test_acc": 0.01,
+ "lyapunov": 1.4805500345766698,
+ "grad_norm": 0.08785274592155841,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 41.73871088027954
+ },
+ {
+ "epoch": 148,
+ "train_loss": 5.263046730651856,
+ "train_acc": 0.01,
+ "test_loss": 4.673582760620117,
+ "test_acc": 0.01,
+ "lyapunov": 1.480766166811404,
+ "grad_norm": 0.08817919214333009,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 41.71699619293213
+ },
+ {
+ "epoch": 149,
+ "train_loss": 5.264003658447265,
+ "train_acc": 0.01,
+ "test_loss": 4.673582760620117,
+ "test_acc": 0.01,
+ "lyapunov": 1.4818289621406808,
+ "grad_norm": 0.08840976368023683,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 41.63391995429993
+ },
+ {
+ "epoch": 150,
+ "train_loss": 5.264799559326172,
+ "train_acc": 0.01,
+ "test_loss": 4.673582650756836,
+ "test_acc": 0.01,
+ "lyapunov": 1.4827044315045448,
+ "grad_norm": 0.08814260335342491,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0,
+ "time_sec": 41.604254484176636
+ }
+ ],
+ "8": [
+ {
+ "epoch": 1,
+ "train_loss": 5.146115896911621,
+ "train_acc": 0.02178,
+ "test_loss": 4.658292015838623,
+ "test_acc": 0.0179,
+ "lyapunov": 2.2941700692676825,
+ "grad_norm": 5.7514440172256105,
+ "grad_max_sv": 4.608755576610565,
+ "grad_min_sv": 9.931108821970013e-08,
+ "grad_condition": 54298677.31321855,
+ "lr": 0.0009998903417374227,
+ "time_sec": 86.91112756729126
+ },
+ {
+ "epoch": 2,
+ "train_loss": 4.702691088256836,
+ "train_acc": 0.02976,
+ "test_loss": 4.6687107803344725,
+ "test_acc": 0.0173,
+ "lyapunov": 1.8152018111685049,
+ "grad_norm": 3.1269645106600352,
+ "grad_max_sv": 2.3287330240011217,
+ "grad_min_sv": 5.3721432058395636e-08,
+ "grad_condition": 52432891.31661774,
+ "lr": 0.0009995614150494292,
+ "time_sec": 86.96670389175415
+ },
+ {
+ "epoch": 3,
+ "train_loss": 4.563177616271973,
+ "train_acc": 0.03108,
+ "test_loss": 4.458634540557862,
+ "test_acc": 0.0275,
+ "lyapunov": 1.659614868481141,
+ "grad_norm": 1.6241391637016038,
+ "grad_max_sv": 1.0878711834549903,
+ "grad_min_sv": 2.6067565292442475e-08,
+ "grad_condition": 83662403.24623688,
+ "lr": 0.0009990133642141358,
+ "time_sec": 86.90370392799377
+ },
+ {
+ "epoch": 4,
+ "train_loss": 4.516682284240723,
+ "train_acc": 0.03726,
+ "test_loss": 4.491609892272949,
+ "test_acc": 0.0226,
+ "lyapunov": 1.5915839062322437,
+ "grad_norm": 1.140832409431892,
+ "grad_max_sv": 0.6813461020588875,
+ "grad_min_sv": 1.4620473591086398e-08,
+ "grad_condition": 563097834.1159084,
+ "lr": 0.0009982464296247522,
+ "time_sec": 86.99007058143616
+ },
+ {
+ "epoch": 5,
+ "train_loss": 4.5070478215026855,
+ "train_acc": 0.04338,
+ "test_loss": 4.482846225738525,
+ "test_acc": 0.0231,
+ "lyapunov": 1.5719971531797248,
+ "grad_norm": 0.9891134281920906,
+ "grad_max_sv": 0.576826149970293,
+ "grad_min_sv": 1.4178649894447393e-08,
+ "grad_condition": 58885947.278740086,
+ "lr": 0.0009972609476841367,
+ "time_sec": 86.98556971549988
+ },
+ {
+ "epoch": 6,
+ "train_loss": 4.547509643402099,
+ "train_acc": 0.0439,
+ "test_loss": 4.9390108833312985,
+ "test_acc": 0.0116,
+ "lyapunov": 1.566867695744995,
+ "grad_norm": 0.8577969738236341,
+ "grad_max_sv": 0.45468067899346354,
+ "grad_min_sv": 1.1785924136642478e-08,
+ "grad_condition": 51467445.538705364,
+ "lr": 0.000996057350657239,
+ "time_sec": 86.93410611152649
+ },
+ {
+ "epoch": 7,
+ "train_loss": 4.532205999908447,
+ "train_acc": 0.04932,
+ "test_loss": 4.854185777282715,
+ "test_acc": 0.0105,
+ "lyapunov": 1.5658333350325484,
+ "grad_norm": 0.7813900002362055,
+ "grad_max_sv": 0.42395056039094925,
+ "grad_min_sv": 1.0807322919567653e-08,
+ "grad_condition": 102461132.44291899,
+ "lr": 0.000994636166481494,
+ "time_sec": 86.96581149101257
+ },
+ {
+ "epoch": 8,
+ "train_loss": 4.556547904968261,
+ "train_acc": 0.0504,
+ "test_loss": 5.202551012420654,
+ "test_acc": 0.0104,
+ "lyapunov": 1.5580533120943152,
+ "grad_norm": 0.7496749300980402,
+ "grad_max_sv": 0.3704929508268833,
+ "grad_min_sv": 9.9690008810438e-09,
+ "grad_condition": 130808798.44108884,
+ "lr": 0.0009929980185352525,
+ "time_sec": 86.94089555740356
+ },
+ {
+ "epoch": 9,
+ "train_loss": 4.701766607666015,
+ "train_acc": 0.03756,
+ "test_loss": 5.755129487609863,
+ "test_acc": 0.01,
+ "lyapunov": 1.5552253073743543,
+ "grad_norm": 0.6765304040507019,
+ "grad_max_sv": 0.36201889589428904,
+ "grad_min_sv": 8.426840739095276e-09,
+ "grad_condition": 62920470.9578716,
+ "lr": 0.0009911436253643444,
+ "time_sec": 86.93878936767578
+ },
+ {
+ "epoch": 10,
+ "train_loss": 4.765756509094238,
+ "train_acc": 0.03202,
+ "test_loss": 5.775740480041504,
+ "test_acc": 0.01,
+ "lyapunov": 1.5391303578301159,
+ "grad_norm": 0.7537997383732445,
+ "grad_max_sv": 0.34123560786247253,
+ "grad_min_sv": 8.077983985887994e-09,
+ "grad_condition": 51423310.42648181,
+ "lr": 0.0009890738003669028,
+ "time_sec": 86.94973969459534
+ },
+ {
+ "epoch": 11,
+ "train_loss": 4.81721549484253,
+ "train_acc": 0.0287,
+ "test_loss": 5.310749195861816,
+ "test_acc": 0.01,
+ "lyapunov": 1.5252552425769894,
+ "grad_norm": 0.6724423278308185,
+ "grad_max_sv": 0.2991580605506897,
+ "grad_min_sv": 5.889135633492526e-09,
+ "grad_condition": 125659233.84784427,
+ "lr": 0.00098678945143658,
+ "time_sec": 86.92238068580627
+ },
+ {
+ "epoch": 12,
+ "train_loss": 4.815476130065918,
+ "train_acc": 0.03228,
+ "test_loss": 4.919392412567139,
+ "test_acc": 0.01,
+ "lyapunov": 1.5252421408358132,
+ "grad_norm": 0.6745068286502589,
+ "grad_max_sv": 0.2930708375293761,
+ "grad_min_sv": 6.114008772872826e-09,
+ "grad_condition": 71899366.71277946,
+ "lr": 0.0009842915805643154,
+ "time_sec": 86.96433067321777
+ },
+ {
+ "epoch": 13,
+ "train_loss": 4.802655950775146,
+ "train_acc": 0.03752,
+ "test_loss": 4.738039018249512,
+ "test_acc": 0.01,
+ "lyapunov": 1.5223182784321974,
+ "grad_norm": 0.6997812002840638,
+ "grad_max_sv": 0.34992206916213037,
+ "grad_min_sv": 8.056309852566556e-09,
+ "grad_condition": 47743142.04490039,
+ "lr": 0.000981581283398829,
+ "time_sec": 86.93432188034058
+ },
+ {
+ "epoch": 14,
+ "train_loss": 4.879040807647705,
+ "train_acc": 0.03196,
+ "test_loss": 4.635845722961426,
+ "test_acc": 0.01,
+ "lyapunov": 1.5264948713200173,
+ "grad_norm": 0.7132128709453732,
+ "grad_max_sv": 0.37259799614548683,
+ "grad_min_sv": 7.726031005933498e-09,
+ "grad_condition": 77087531.09708562,
+ "lr": 0.0009786597487660333,
+ "time_sec": 86.92895364761353
+ },
+ {
+ "epoch": 15,
+ "train_loss": 4.93996203048706,
+ "train_acc": 0.0286,
+ "test_loss": 4.715687692260742,
+ "test_acc": 0.01,
+ "lyapunov": 1.5275609859115327,
+ "grad_norm": 0.7145493932975088,
+ "grad_max_sv": 0.3383642140775919,
+ "grad_min_sv": 6.660084050924553e-09,
+ "grad_condition": 63568945.70900831,
+ "lr": 0.0009755282581475766,
+ "time_sec": 86.93708157539368
+ },
+ {
+ "epoch": 16,
+ "train_loss": 4.951732353668213,
+ "train_acc": 0.03108,
+ "test_loss": 4.694218672180176,
+ "test_acc": 0.01,
+ "lyapunov": 1.5221876610270546,
+ "grad_norm": 0.6526072701529334,
+ "grad_max_sv": 0.29856473468244077,
+ "grad_min_sv": 5.5810975953029866e-09,
+ "grad_condition": 3669494078.4381485,
+ "lr": 0.0009721881851187403,
+ "time_sec": 86.95431900024414
+ },
+ {
+ "epoch": 17,
+ "train_loss": 5.028552846374511,
+ "train_acc": 0.02936,
+ "test_loss": 4.582682956695557,
+ "test_acc": 0.0148,
+ "lyapunov": 1.5572718967257253,
+ "grad_norm": 0.8395071465637489,
+ "grad_max_sv": 0.2635829897597432,
+ "grad_min_sv": 4.546329786998837e-09,
+ "grad_condition": 9308629659.195911,
+ "lr": 0.0009686409947459456,
+ "time_sec": 86.94067001342773
+ },
+ {
+ "epoch": 18,
+ "train_loss": 5.080957429504394,
+ "train_acc": 0.02958,
+ "test_loss": 4.743882189178467,
+ "test_acc": 0.01,
+ "lyapunov": 1.573465526256415,
+ "grad_norm": 0.7060094795148925,
+ "grad_max_sv": 0.26090904884040356,
+ "grad_min_sv": 4.9669986091141484e-09,
+ "grad_condition": 158829567.68689433,
+ "lr": 0.0009648882429441254,
+ "time_sec": 86.93801307678223
+ },
+ {
+ "epoch": 19,
+ "train_loss": 5.163744027404785,
+ "train_acc": 0.0251,
+ "test_loss": 5.350689000701904,
+ "test_acc": 0.01,
+ "lyapunov": 1.5783103155662945,
+ "grad_norm": 0.7236371812810315,
+ "grad_max_sv": 0.32311243638396264,
+ "grad_min_sv": 4.661415661322624e-09,
+ "grad_condition": 362163554.1712912,
+ "lr": 0.00096093157579425,
+ "time_sec": 86.95386362075806
+ },
+ {
+ "epoch": 20,
+ "train_loss": 5.177699388122559,
+ "train_acc": 0.02336,
+ "test_loss": 4.728291717529297,
+ "test_acc": 0.01,
+ "lyapunov": 1.5543774262718533,
+ "grad_norm": 0.6278235228394613,
+ "grad_max_sv": 0.2316085107624531,
+ "grad_min_sv": 2.9537814670154304e-09,
+ "grad_condition": 3474032967.5441117,
+ "lr": 0.0009567727288213001,
+ "time_sec": 86.9823546409607
+ },
+ {
+ "epoch": 21,
+ "train_loss": 5.2000909381103515,
+ "train_acc": 0.02436,
+ "test_loss": 4.806672692871094,
+ "test_acc": 0.01,
+ "lyapunov": 1.5755902729985658,
+ "grad_norm": 0.766013265906278,
+ "grad_max_sv": 0.21709984578192235,
+ "grad_min_sv": 2.2318304187728858e-09,
+ "grad_condition": 8696284488.710842,
+ "lr": 0.0009524135262330095,
+ "time_sec": 86.9815993309021
+ },
+ {
+ "epoch": 22,
+ "train_loss": 5.172516224975586,
+ "train_acc": 0.02578,
+ "test_loss": 5.050736184692383,
+ "test_acc": 0.01,
+ "lyapunov": 1.5738651392709873,
+ "grad_norm": 0.8548378900544575,
+ "grad_max_sv": 0.21818067859858276,
+ "grad_min_sv": 2.4550293141510983e-09,
+ "grad_condition": 1446353295.730711,
+ "lr": 0.0009478558801197061,
+ "time_sec": 86.96929454803467
+ },
+ {
+ "epoch": 23,
+ "train_loss": 5.301382947845459,
+ "train_acc": 0.01554,
+ "test_loss": 5.921122685241699,
+ "test_acc": 0.01,
+ "lyapunov": 1.5795374422731912,
+ "grad_norm": 1.072625133417376,
+ "grad_max_sv": 0.29671905748546124,
+ "grad_min_sv": 3.4811909517637897e-09,
+ "grad_condition": 2268879972.814607,
+ "lr": 0.000943101789615607,
+ "time_sec": 87.05305171012878
+ },
+ {
+ "epoch": 24,
+ "train_loss": 5.308596148986816,
+ "train_acc": 0.01028,
+ "test_loss": 5.915314376831055,
+ "test_acc": 0.01,
+ "lyapunov": 1.5046202849853985,
+ "grad_norm": 0.4300250072511413,
+ "grad_max_sv": 0.29422527775168417,
+ "grad_min_sv": 2.563464584050615e-09,
+ "grad_condition": 1801474829.549522,
+ "lr": 0.0009381533400219313,
+ "time_sec": 86.9294683933258
+ },
+ {
+ "epoch": 25,
+ "train_loss": 5.30389043762207,
+ "train_acc": 0.01028,
+ "test_loss": 5.442194981384278,
+ "test_acc": 0.01,
+ "lyapunov": 1.5036146476140717,
+ "grad_norm": 0.369004063413563,
+ "grad_max_sv": 0.27016645595431327,
+ "grad_min_sv": 1.563399900968634e-09,
+ "grad_condition": 26105306242.6268,
+ "lr": 0.0009330127018922189,
+ "time_sec": 86.93831205368042
+ },
+ {
+ "epoch": 26,
+ "train_loss": 5.310046338348388,
+ "train_acc": 0.00962,
+ "test_loss": 6.1388027900695805,
+ "test_acc": 0.01,
+ "lyapunov": 1.5094104654648726,
+ "grad_norm": 0.3921330241846595,
+ "grad_max_sv": 0.27323133423924445,
+ "grad_min_sv": 2.6655278586792953e-09,
+ "grad_condition": 217735166.8546676,
+ "lr": 0.000927682130080253,
+ "time_sec": 87.04652237892151
+ },
+ {
+ "epoch": 27,
+ "train_loss": 5.301853795013428,
+ "train_acc": 0.01042,
+ "test_loss": 5.515717539215088,
+ "test_acc": 0.01,
+ "lyapunov": 1.508369487569765,
+ "grad_norm": 0.30565280482621787,
+ "grad_max_sv": 0.22872439920902252,
+ "grad_min_sv": 7.688681849029263e-10,
+ "grad_condition": 46178443525.53847,
+ "lr": 0.0009221639627510072,
+ "time_sec": 87.04486989974976
+ },
+ {
+ "epoch": 28,
+ "train_loss": 5.29817862487793,
+ "train_acc": 0.00972,
+ "test_loss": 5.770360753631592,
+ "test_acc": 0.01,
+ "lyapunov": 1.5080109913940625,
+ "grad_norm": 0.277614712245464,
+ "grad_max_sv": 0.196561511605978,
+ "grad_min_sv": 1.2118332304701748e-12,
+ "grad_condition": 124861391701.8731,
+ "lr": 0.0009164606203550494,
+ "time_sec": 86.97034883499146
+ },
+ {
+ "epoch": 29,
+ "train_loss": 5.299116547241211,
+ "train_acc": 0.00974,
+ "test_loss": 6.629917897796631,
+ "test_acc": 0.01,
+ "lyapunov": 1.5079803863144896,
+ "grad_norm": 0.26773989693385675,
+ "grad_max_sv": 0.19062257409095765,
+ "grad_min_sv": 1.316391307854978e-12,
+ "grad_condition": 118514569073.00333,
+ "lr": 0.0009105746045668516,
+ "time_sec": 86.9515905380249
+ },
+ {
+ "epoch": 30,
+ "train_loss": 5.301858203277588,
+ "train_acc": 0.00952,
+ "test_loss": 7.616147738647461,
+ "test_acc": 0.01,
+ "lyapunov": 1.5108254772927754,
+ "grad_norm": 0.2739642757327739,
+ "grad_max_sv": 0.2010789501480758,
+ "grad_min_sv": 3.194205121044685e-10,
+ "grad_condition": 84817443385.97237,
+ "lr": 0.0009045084971874733,
+ "time_sec": 86.96926951408386
+ },
+ {
+ "epoch": 31,
+ "train_loss": 5.299806740875244,
+ "train_acc": 0.01004,
+ "test_loss": 7.885091897583008,
+ "test_acc": 0.01,
+ "lyapunov": 1.5118325930422225,
+ "grad_norm": 0.23726371187902562,
+ "grad_max_sv": 0.1534210465848446,
+ "grad_min_sv": 3.777587378576868e-12,
+ "grad_condition": 117298463694.8497,
+ "lr": 0.0008982649590120977,
+ "time_sec": 86.93767380714417
+ },
+ {
+ "epoch": 32,
+ "train_loss": 5.294980096740723,
+ "train_acc": 0.01054,
+ "test_loss": 7.175394052124023,
+ "test_acc": 0.01,
+ "lyapunov": 1.5122702329055122,
+ "grad_norm": 0.18490861832393377,
+ "grad_max_sv": 0.09243289618752897,
+ "grad_min_sv": 7.151144434390166e-15,
+ "grad_condition": 91554722602.0434,
+ "lr": 0.0008918467286629196,
+ "time_sec": 86.92625045776367
+ },
+ {
+ "epoch": 33,
+ "train_loss": 5.302116135559082,
+ "train_acc": 0.00916,
+ "test_loss": 6.950838031005859,
+ "test_acc": 0.01,
+ "lyapunov": 1.514583631854533,
+ "grad_norm": 0.22539071559889906,
+ "grad_max_sv": 0.14949913807213305,
+ "grad_min_sv": 3.03463898255766e-13,
+ "grad_condition": 123295125931.77371,
+ "lr": 0.0008852566213878943,
+ "time_sec": 86.96885013580322
+ },
+ {
+ "epoch": 34,
+ "train_loss": 5.298243276367187,
+ "train_acc": 0.00926,
+ "test_loss": 7.482379321289063,
+ "test_acc": 0.01,
+ "lyapunov": 1.514684440839626,
+ "grad_norm": 0.18381668144055355,
+ "grad_max_sv": 0.10984101705253124,
+ "grad_min_sv": 7.163631845931476e-15,
+ "grad_condition": 109054948912.02344,
+ "lr": 0.000878497527825878,
+ "time_sec": 87.12512397766113
+ },
+ {
+ "epoch": 35,
+ "train_loss": 5.308689108428955,
+ "train_acc": 0.00958,
+ "test_loss": 7.612553489685059,
+ "test_acc": 0.01,
+ "lyapunov": 1.5216995715485204,
+ "grad_norm": 0.22567054848299975,
+ "grad_max_sv": 0.1234450839459896,
+ "grad_min_sv": 5.377204609898583e-14,
+ "grad_condition": 117334156157.8593,
+ "lr": 0.000871572412738697,
+ "time_sec": 86.95104956626892
+ },
+ {
+ "epoch": 36,
+ "train_loss": 5.303922519226075,
+ "train_acc": 0.00964,
+ "test_loss": 8.831939950561523,
+ "test_acc": 0.01,
+ "lyapunov": 1.5175864534914647,
+ "grad_norm": 0.2187679660724696,
+ "grad_max_sv": 0.13990986812859774,
+ "grad_min_sv": 1.80366368447702e-13,
+ "grad_condition": 123448577181.446,
+ "lr": 0.0008644843137107055,
+ "time_sec": 86.92687749862671
+ },
+ {
+ "epoch": 37,
+ "train_loss": 5.303381102600098,
+ "train_acc": 0.00916,
+ "test_loss": 6.551040885925293,
+ "test_acc": 0.01,
+ "lyapunov": 1.5200756013850727,
+ "grad_norm": 0.1798120608859804,
+ "grad_max_sv": 0.10729131288826466,
+ "grad_min_sv": 1.364290789538136e-14,
+ "grad_condition": 105529300010.77225,
+ "lr": 0.0008572363398164014,
+ "time_sec": 86.95336151123047
+ },
+ {
+ "epoch": 38,
+ "train_loss": 5.30714798034668,
+ "train_acc": 0.0094,
+ "test_loss": 6.027979496765137,
+ "test_acc": 0.01,
+ "lyapunov": 1.5257836866866596,
+ "grad_norm": 0.1909663013844348,
+ "grad_max_sv": 0.07728723548352719,
+ "grad_min_sv": 4.265317043954499e-24,
+ "grad_condition": 77287235483.15219,
+ "lr": 0.0008498316702566826,
+ "time_sec": 86.9212384223938
+ },
+ {
+ "epoch": 39,
+ "train_loss": 5.306197135772705,
+ "train_acc": 0.00974,
+ "test_loss": 6.997566845703125,
+ "test_acc": 0.01,
+ "lyapunov": 1.5238893687572626,
+ "grad_norm": 0.18383519139729404,
+ "grad_max_sv": 0.1007891584187746,
+ "grad_min_sv": 5.3239199179750705e-15,
+ "grad_condition": 100154494637.09956,
+ "lr": 0.0008422735529643442,
+ "time_sec": 86.89629626274109
+ },
+ {
+ "epoch": 40,
+ "train_loss": 5.307650102386474,
+ "train_acc": 0.00992,
+ "test_loss": 6.040484946441651,
+ "test_acc": 0.01,
+ "lyapunov": 1.5250033597507135,
+ "grad_norm": 0.18467843309484097,
+ "grad_max_sv": 0.1127883294597268,
+ "grad_min_sv": 7.1038360456260524e-15,
+ "grad_condition": 111935273841.19809,
+ "lr": 0.0008345653031794289,
+ "time_sec": 87.02732610702515
+ },
+ {
+ "epoch": 41,
+ "train_loss": 5.307996878356934,
+ "train_acc": 0.00992,
+ "test_loss": 5.920440175628662,
+ "test_acc": 0.01,
+ "lyapunov": 1.5282226456400683,
+ "grad_norm": 0.16629297131246892,
+ "grad_max_sv": 0.07292309552431106,
+ "grad_min_sv": 1.583549415956451e-17,
+ "grad_condition": 72921914356.18047,
+ "lr": 0.0008267103019950526,
+ "time_sec": 86.94355273246765
+ },
+ {
+ "epoch": 42,
+ "train_loss": 5.311696410522461,
+ "train_acc": 0.00968,
+ "test_loss": 6.38518196105957,
+ "test_acc": 0.01,
+ "lyapunov": 1.5307711250032001,
+ "grad_norm": 0.1871179922092424,
+ "grad_max_sv": 0.08245804710313678,
+ "grad_min_sv": 6.943719241443141e-16,
+ "grad_condition": 82389599949.82372,
+ "lr": 0.0008187119948743447,
+ "time_sec": 86.93303918838501
+ },
+ {
+ "epoch": 43,
+ "train_loss": 5.307222317810059,
+ "train_acc": 0.00956,
+ "test_loss": 6.652195385742187,
+ "test_acc": 0.01,
+ "lyapunov": 1.5260984678097698,
+ "grad_norm": 0.16067559125539438,
+ "grad_max_sv": 0.09466201290488244,
+ "grad_min_sv": 4.4300769825600874e-16,
+ "grad_condition": 94621173553.03905,
+ "lr": 0.000810573890139155,
+ "time_sec": 86.90417695045471
+ },
+ {
+ "epoch": 44,
+ "train_loss": 5.308213620300293,
+ "train_acc": 0.00882,
+ "test_loss": 6.962696185302734,
+ "test_acc": 0.01,
+ "lyapunov": 1.527706109044497,
+ "grad_norm": 0.1609729738345643,
+ "grad_max_sv": 0.07951483679935337,
+ "grad_min_sv": 1.2691498572245332e-19,
+ "grad_condition": 79514825996.07883,
+ "lr": 0.0008022995574311873,
+ "time_sec": 86.90469932556152
+ },
+ {
+ "epoch": 45,
+ "train_loss": 5.313642641601563,
+ "train_acc": 0.01004,
+ "test_loss": 6.176641661071777,
+ "test_acc": 0.01,
+ "lyapunov": 1.5278308333643258,
+ "grad_norm": 0.20554701681584006,
+ "grad_max_sv": 0.1498540248721838,
+ "grad_min_sv": 2.7361367599211426e-14,
+ "grad_condition": 145983867269.5576,
+ "lr": 0.0007938926261462363,
+ "time_sec": 86.93738555908203
+ },
+ {
+ "epoch": 46,
+ "train_loss": 5.3097161289978025,
+ "train_acc": 0.00952,
+ "test_loss": 6.005211575317383,
+ "test_acc": 0.01,
+ "lyapunov": 1.5284498929977417,
+ "grad_norm": 0.17319376275900747,
+ "grad_max_sv": 0.10527544040232897,
+ "grad_min_sv": 1.6379736406305529e-15,
+ "grad_condition": 105101166914.13033,
+ "lr": 0.0007853567838422158,
+ "time_sec": 86.95744371414185
+ },
+ {
+ "epoch": 47,
+ "train_loss": 5.311491881408691,
+ "train_acc": 0.00956,
+ "test_loss": 5.9810846961975095,
+ "test_acc": 0.01,
+ "lyapunov": 1.530076160760182,
+ "grad_norm": 0.1622416677557275,
+ "grad_max_sv": 0.09897023066878319,
+ "grad_min_sv": 1.1070734961814082e-15,
+ "grad_condition": 98861145932.69461,
+ "lr": 0.0007766957746216719,
+ "time_sec": 86.9021110534668
+ },
+ {
+ "epoch": 48,
+ "train_loss": 5.310971976165772,
+ "train_acc": 0.00894,
+ "test_loss": 5.884356218719482,
+ "test_acc": 0.01,
+ "lyapunov": 1.5301186023160929,
+ "grad_norm": 0.15478972851501702,
+ "grad_max_sv": 0.09055562000721692,
+ "grad_min_sv": 6.095582881917491e-16,
+ "grad_condition": 90492925874.14865,
+ "lr": 0.0007679133974894982,
+ "time_sec": 86.923269033432
+ },
+ {
+ "epoch": 49,
+ "train_loss": 5.313096929931641,
+ "train_acc": 0.00936,
+ "test_loss": 5.441997985839844,
+ "test_acc": 0.01,
+ "lyapunov": 1.5325667373359662,
+ "grad_norm": 0.15811997882687892,
+ "grad_max_sv": 0.09403467867523432,
+ "grad_min_sv": 2.5362328677092476e-16,
+ "grad_condition": 94010861805.62488,
+ "lr": 0.000759013504686565,
+ "time_sec": 86.9168426990509
+ },
+ {
+ "epoch": 50,
+ "train_loss": 5.311940245513916,
+ "train_acc": 0.00958,
+ "test_loss": 5.371611124420166,
+ "test_acc": 0.01,
+ "lyapunov": 1.5327015231027628,
+ "grad_norm": 0.14176864627007332,
+ "grad_max_sv": 0.07908807899802923,
+ "grad_min_sv": 2.050192692484369e-32,
+ "grad_condition": 79088078998.02924,
+ "lr": 0.0007499999999999998,
+ "time_sec": 86.92089605331421
+ },
+ {
+ "epoch": 51,
+ "train_loss": 5.310895777282715,
+ "train_acc": 0.00916,
+ "test_loss": 5.434047091674804,
+ "test_acc": 0.01,
+ "lyapunov": 1.53158952573986,
+ "grad_norm": 0.1361778166532044,
+ "grad_max_sv": 0.06832279236987233,
+ "grad_min_sv": 6.675573383462495e-16,
+ "grad_condition": 68265680127.16847,
+ "lr": 0.0007408768370508575,
+ "time_sec": 86.94595527648926
+ },
+ {
+ "epoch": 52,
+ "train_loss": 5.3132603437805175,
+ "train_acc": 0.01008,
+ "test_loss": 6.7278813507080075,
+ "test_acc": 0.01,
+ "lyapunov": 1.535024075252016,
+ "grad_norm": 0.17384705948913357,
+ "grad_max_sv": 0.04316680300980806,
+ "grad_min_sv": 0.0,
+ "grad_condition": 43166803009.80806,
+ "lr": 0.0007316480175599307,
+ "time_sec": 86.91442537307739
+ },
+ {
+ "epoch": 53,
+ "train_loss": 5.3123740222167966,
+ "train_acc": 0.00936,
+ "test_loss": 6.131865232849121,
+ "test_acc": 0.01,
+ "lyapunov": 1.5338834356468962,
+ "grad_norm": 0.1343518088533916,
+ "grad_max_sv": 0.04088693740777671,
+ "grad_min_sv": 0.0,
+ "grad_condition": 40886937407.77672,
+ "lr": 0.0007223175895924635,
+ "time_sec": 86.89388537406921
+ },
+ {
+ "epoch": 54,
+ "train_loss": 5.311756536712647,
+ "train_acc": 0.00874,
+ "test_loss": 6.26136455078125,
+ "test_acc": 0.01,
+ "lyapunov": 1.534105893900937,
+ "grad_norm": 0.12044776828887008,
+ "grad_max_sv": 0.018818416306748985,
+ "grad_min_sv": 0.0,
+ "grad_condition": 18818416306.748985,
+ "lr": 0.0007128896457825361,
+ "time_sec": 86.86209654808044
+ },
+ {
+ "epoch": 55,
+ "train_loss": 5.314126918182373,
+ "train_acc": 0.00948,
+ "test_loss": 6.455938655853272,
+ "test_acc": 0.01,
+ "lyapunov": 1.5355246698155123,
+ "grad_norm": 0.16535062387735305,
+ "grad_max_sv": 0.048017819551751016,
+ "grad_min_sv": 0.0,
+ "grad_condition": 48017819551.75102,
+ "lr": 0.0007033683215378998,
+ "time_sec": 86.91218829154968
+ },
+ {
+ "epoch": 56,
+ "train_loss": 5.3133398397827145,
+ "train_acc": 0.00934,
+ "test_loss": 6.355834351348877,
+ "test_acc": 0.01,
+ "lyapunov": 1.535221906574181,
+ "grad_norm": 0.14103865757116907,
+ "grad_max_sv": 0.040325032686814664,
+ "grad_min_sv": 0.0,
+ "grad_condition": 40325032686.814674,
+ "lr": 0.0006937577932260512,
+ "time_sec": 87.01914978027344
+ },
+ {
+ "epoch": 57,
+ "train_loss": 5.315177789154053,
+ "train_acc": 0.00906,
+ "test_loss": 5.778967167663574,
+ "test_acc": 0.01,
+ "lyapunov": 1.5374448241480172,
+ "grad_norm": 0.12626262616875458,
+ "grad_max_sv": 0.04227766813710332,
+ "grad_min_sv": 0.0,
+ "grad_condition": 42277668137.10332,
+ "lr": 0.0006840622763423388,
+ "time_sec": 86.90552043914795
+ },
+ {
+ "epoch": 58,
+ "train_loss": 5.314984718017578,
+ "train_acc": 0.0096,
+ "test_loss": 5.680106079101562,
+ "test_acc": 0.01,
+ "lyapunov": 1.536767850141696,
+ "grad_norm": 0.13366926148127872,
+ "grad_max_sv": 0.05202861637808383,
+ "grad_min_sv": 0.0,
+ "grad_condition": 52028616378.083824,
+ "lr": 0.0006742860236609073,
+ "time_sec": 86.97483849525452
+ },
+ {
+ "epoch": 59,
+ "train_loss": 5.314250464019775,
+ "train_acc": 0.00922,
+ "test_loss": 5.60796079864502,
+ "test_acc": 0.01,
+ "lyapunov": 1.535877099732304,
+ "grad_norm": 0.13264295460080205,
+ "grad_max_sv": 0.053861632384359835,
+ "grad_min_sv": 0.0,
+ "grad_condition": 53861632384.35984,
+ "lr": 0.0006644333233692913,
+ "time_sec": 86.90899348258972
+ },
+ {
+ "epoch": 60,
+ "train_loss": 5.315608520202637,
+ "train_acc": 0.00862,
+ "test_loss": 5.75697197265625,
+ "test_acc": 0.01,
+ "lyapunov": 1.5373123942128837,
+ "grad_norm": 0.13451447891861437,
+ "grad_max_sv": 0.05724321529269218,
+ "grad_min_sv": 0.0,
+ "grad_condition": 57243215292.692184,
+ "lr": 0.0006545084971874734,
+ "time_sec": 86.93145775794983
+ },
+ {
+ "epoch": 61,
+ "train_loss": 5.315526120605469,
+ "train_acc": 0.00966,
+ "test_loss": 5.641050135803223,
+ "test_acc": 0.01,
+ "lyapunov": 1.537875465419896,
+ "grad_norm": 0.134018980558527,
+ "grad_max_sv": 0.04659216776490212,
+ "grad_min_sv": 0.0,
+ "grad_condition": 46592167764.902115,
+ "lr": 0.0006445158984722354,
+ "time_sec": 86.9526846408844
+ },
+ {
+ "epoch": 62,
+ "train_loss": 5.3171287049865725,
+ "train_acc": 0.0095,
+ "test_loss": 5.52830389251709,
+ "test_acc": 0.01,
+ "lyapunov": 1.5390207541873082,
+ "grad_norm": 0.13900770761864464,
+ "grad_max_sv": 0.05631723469123244,
+ "grad_min_sv": 0.0,
+ "grad_condition": 56317234691.232445,
+ "lr": 0.0006344599103076324,
+ "time_sec": 86.95262598991394
+ },
+ {
+ "epoch": 63,
+ "train_loss": 5.321492596435547,
+ "train_acc": 0.00884,
+ "test_loss": 5.732630862426758,
+ "test_acc": 0.01,
+ "lyapunov": 1.5413236017422298,
+ "grad_norm": 0.1533270491872105,
+ "grad_max_sv": 0.04487980231642723,
+ "grad_min_sv": 0.0,
+ "grad_condition": 44879802316.42723,
+ "lr": 0.0006243449435824269,
+ "time_sec": 86.93239831924438
+ },
+ {
+ "epoch": 64,
+ "train_loss": 5.315124908752441,
+ "train_acc": 0.0099,
+ "test_loss": 5.382702461242676,
+ "test_acc": 0.01,
+ "lyapunov": 1.5375381320943613,
+ "grad_norm": 0.12218366701103515,
+ "grad_max_sv": 0.032946509402245285,
+ "grad_min_sv": 0.0,
+ "grad_condition": 32946509402.24528,
+ "lr": 0.0006141754350553275,
+ "time_sec": 86.91653037071228
+ },
+ {
+ "epoch": 65,
+ "train_loss": 5.317460901031494,
+ "train_acc": 0.00952,
+ "test_loss": 5.498714874267578,
+ "test_acc": 0.01,
+ "lyapunov": 1.5401654679452061,
+ "grad_norm": 0.11182228456659622,
+ "grad_max_sv": 0.020332988910377027,
+ "grad_min_sv": 0.0,
+ "grad_condition": 20332988910.377026,
+ "lr": 0.0006039558454088793,
+ "time_sec": 86.86022281646729
+ },
+ {
+ "epoch": 66,
+ "train_loss": 5.315697211608887,
+ "train_acc": 0.00964,
+ "test_loss": 5.722520481872559,
+ "test_acc": 0.01,
+ "lyapunov": 1.5384024250537842,
+ "grad_norm": 0.11947856234602877,
+ "grad_max_sv": 0.012709397682920098,
+ "grad_min_sv": 0.0,
+ "grad_condition": 12709397682.9201,
+ "lr": 0.000593690657292862,
+ "time_sec": 86.83588552474976
+ },
+ {
+ "epoch": 67,
+ "train_loss": 5.315312230377197,
+ "train_acc": 0.00948,
+ "test_loss": 5.6552305557250975,
+ "test_acc": 0.01,
+ "lyapunov": 1.5376315924822521,
+ "grad_norm": 0.12716375762874924,
+ "grad_max_sv": 0.026200923277065157,
+ "grad_min_sv": 0.0,
+ "grad_condition": 26200923277.06516,
+ "lr": 0.0005833843733580507,
+ "time_sec": 86.93734240531921
+ },
+ {
+ "epoch": 68,
+ "train_loss": 5.316413257446289,
+ "train_acc": 0.00892,
+ "test_loss": 5.644158979797363,
+ "test_acc": 0.01,
+ "lyapunov": 1.5389487700694053,
+ "grad_norm": 0.11329541475422919,
+ "grad_max_sv": 0.025692512933164834,
+ "grad_min_sv": 0.0,
+ "grad_condition": 25692512933.164837,
+ "lr": 0.0005730415142812054,
+ "time_sec": 86.92358016967773
+ },
+ {
+ "epoch": 69,
+ "train_loss": 5.317326981048584,
+ "train_acc": 0.00962,
+ "test_loss": 5.646556529998779,
+ "test_acc": 0.01,
+ "lyapunov": 1.5400864053565217,
+ "grad_norm": 0.1245567601020978,
+ "grad_max_sv": 0.024738446017727254,
+ "grad_min_sv": 0.0,
+ "grad_condition": 24738446017.727257,
+ "lr": 0.0005626666167821517,
+ "time_sec": 86.86787414550781
+ },
+ {
+ "epoch": 70,
+ "train_loss": 5.317049356994629,
+ "train_acc": 0.00982,
+ "test_loss": 5.6787915084838865,
+ "test_acc": 0.01,
+ "lyapunov": 1.5397665028072074,
+ "grad_norm": 0.118076358762286,
+ "grad_max_sv": 0.03472304726019502,
+ "grad_min_sv": 0.0,
+ "grad_condition": 34723047260.195015,
+ "lr": 0.0005522642316338265,
+ "time_sec": 86.88831448554993
+ },
+ {
+ "epoch": 71,
+ "train_loss": 5.315880928039551,
+ "train_acc": 0.00964,
+ "test_loss": 5.735556723022461,
+ "test_acc": 0.01,
+ "lyapunov": 1.5387067657602413,
+ "grad_norm": 0.11912248112688287,
+ "grad_max_sv": 0.025617524981498718,
+ "grad_min_sv": 0.0,
+ "grad_condition": 25617524981.49872,
+ "lr": 0.0005418389216661573,
+ "time_sec": 86.86845374107361
+ },
+ {
+ "epoch": 72,
+ "train_loss": 5.320206904296875,
+ "train_acc": 0.00958,
+ "test_loss": 5.694711586761475,
+ "test_acc": 0.01,
+ "lyapunov": 1.5424333557753307,
+ "grad_norm": 0.12792597639508846,
+ "grad_max_sv": 0.03625847464427352,
+ "grad_min_sv": 0.0,
+ "grad_condition": 36258474644.27352,
+ "lr": 0.0005313952597646563,
+ "time_sec": 86.87807965278625
+ },
+ {
+ "epoch": 73,
+ "train_loss": 5.318149011688233,
+ "train_acc": 0.0099,
+ "test_loss": 5.715859918212891,
+ "test_acc": 0.01,
+ "lyapunov": 1.5407461092600128,
+ "grad_norm": 0.12131920132322771,
+ "grad_max_sv": 0.04332554340362549,
+ "grad_min_sv": 0.0,
+ "grad_condition": 43325543403.62549,
+ "lr": 0.0005209378268645994,
+ "time_sec": 86.93414950370789
+ },
+ {
+ "epoch": 74,
+ "train_loss": 5.316737642364502,
+ "train_acc": 0.0094,
+ "test_loss": 5.432159627532959,
+ "test_acc": 0.01,
+ "lyapunov": 1.5394032800289066,
+ "grad_norm": 0.11202086425017638,
+ "grad_max_sv": 0.02820308110676706,
+ "grad_min_sv": 0.0,
+ "grad_condition": 28203081106.76706,
+ "lr": 0.0005104712099416781,
+ "time_sec": 86.86637806892395
+ },
+ {
+ "epoch": 75,
+ "train_loss": 5.317990305633545,
+ "train_acc": 0.00994,
+ "test_loss": 5.894020344543457,
+ "test_acc": 0.01,
+ "lyapunov": 1.5408979687849274,
+ "grad_norm": 0.15447706508859999,
+ "grad_max_sv": 0.01931341988965869,
+ "grad_min_sv": 0.0,
+ "grad_condition": 19313419889.65869,
+ "lr": 0.0004999999999999996,
+ "time_sec": 86.85794830322266
+ },
+ {
+ "epoch": 76,
+ "train_loss": 5.329913055419921,
+ "train_acc": 0.00922,
+ "test_loss": 5.356306673431397,
+ "test_acc": 0.01,
+ "lyapunov": 1.5469030404029904,
+ "grad_norm": 0.1130858808468486,
+ "grad_max_sv": 0.020954679837450384,
+ "grad_min_sv": 0.0,
+ "grad_condition": 20954679837.450386,
+ "lr": 0.0004895287900583212,
+ "time_sec": 86.8532190322876
+ },
+ {
+ "epoch": 77,
+ "train_loss": 5.317062496490479,
+ "train_acc": 0.01014,
+ "test_loss": 5.6768914947509765,
+ "test_acc": 0.01,
+ "lyapunov": 1.539591530399859,
+ "grad_norm": 0.11763219922287847,
+ "grad_max_sv": 0.03681175904348492,
+ "grad_min_sv": 0.0,
+ "grad_condition": 36811759043.484924,
+ "lr": 0.0004790621731353997,
+ "time_sec": 86.89854335784912
+ },
+ {
+ "epoch": 78,
+ "train_loss": 5.321235802612304,
+ "train_acc": 0.00956,
+ "test_loss": 5.498642253875732,
+ "test_acc": 0.01,
+ "lyapunov": 1.5433477379781815,
+ "grad_norm": 0.12257877066992058,
+ "grad_max_sv": 0.002356324018910527,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2356324018.910527,
+ "lr": 0.000468604740235343,
+ "time_sec": 86.82986307144165
+ },
+ {
+ "epoch": 79,
+ "train_loss": 5.3170875860595705,
+ "train_acc": 0.00874,
+ "test_loss": 5.678500232696533,
+ "test_acc": 0.01,
+ "lyapunov": 1.5401862192031976,
+ "grad_norm": 0.11850283030771655,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00045816107833384175,
+ "time_sec": 86.84353518486023
+ },
+ {
+ "epoch": 80,
+ "train_loss": 5.319253426513672,
+ "train_acc": 0.00918,
+ "test_loss": 5.127548231506347,
+ "test_acc": 0.01,
+ "lyapunov": 1.5418513970606773,
+ "grad_norm": 0.11699107355632338,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004477357683661729,
+ "time_sec": 86.8760769367218
+ },
+ {
+ "epoch": 81,
+ "train_loss": 5.317456825408936,
+ "train_acc": 0.00894,
+ "test_loss": 5.307968811035156,
+ "test_acc": 0.01,
+ "lyapunov": 1.5405245113860615,
+ "grad_norm": 0.1284549935774549,
+ "grad_max_sv": 0.0083365049213171,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8336504921.317101,
+ "lr": 0.00043733338321784746,
+ "time_sec": 86.87371492385864
+ },
+ {
+ "epoch": 82,
+ "train_loss": 5.317734858398437,
+ "train_acc": 0.00954,
+ "test_loss": 5.0544998031616215,
+ "test_acc": 0.01,
+ "lyapunov": 1.5406023172466345,
+ "grad_norm": 0.120735257297947,
+ "grad_max_sv": 0.02263884055428207,
+ "grad_min_sv": 0.0,
+ "grad_condition": 22638840554.282066,
+ "lr": 0.0004269584857187939,
+ "time_sec": 86.92492771148682
+ },
+ {
+ "epoch": 83,
+ "train_loss": 5.32118753692627,
+ "train_acc": 0.00954,
+ "test_loss": 5.125200929260254,
+ "test_acc": 0.01,
+ "lyapunov": 1.5442977073552357,
+ "grad_norm": 0.11585054245697951,
+ "grad_max_sv": 0.004569409461691975,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4569409461.691976,
+ "lr": 0.0004166156266419484,
+ "time_sec": 86.81740093231201
+ },
+ {
+ "epoch": 84,
+ "train_loss": 5.317668086853027,
+ "train_acc": 0.00892,
+ "test_loss": 5.523793495178222,
+ "test_acc": 0.01,
+ "lyapunov": 1.5407223094759694,
+ "grad_norm": 0.10949975143698651,
+ "grad_max_sv": 0.01457698536105454,
+ "grad_min_sv": 0.0,
+ "grad_condition": 14576985361.05454,
+ "lr": 0.0004063093427071373,
+ "time_sec": 86.87661004066467
+ },
+ {
+ "epoch": 85,
+ "train_loss": 5.327004724578857,
+ "train_acc": 0.00984,
+ "test_loss": 5.3676797477722165,
+ "test_acc": 0.01,
+ "lyapunov": 1.54690202819112,
+ "grad_norm": 0.11567866960588237,
+ "grad_max_sv": 0.00381420748308301,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3814207483.0830092,
+ "lr": 0.0003960441545911199,
+ "time_sec": 86.82225131988525
+ },
+ {
+ "epoch": 86,
+ "train_loss": 5.3172469395446775,
+ "train_acc": 0.00898,
+ "test_loss": 4.901917692565918,
+ "test_acc": 0.01,
+ "lyapunov": 1.5404299381748794,
+ "grad_norm": 0.11387390679382547,
+ "grad_max_sv": 0.001853126659989357,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1853126659.989357,
+ "lr": 0.0003858245649446718,
+ "time_sec": 86.82927370071411
+ },
+ {
+ "epoch": 87,
+ "train_loss": 5.318947126464844,
+ "train_acc": 0.00926,
+ "test_loss": 5.208927967834473,
+ "test_acc": 0.01,
+ "lyapunov": 1.5421383124788095,
+ "grad_norm": 0.10919909006363937,
+ "grad_max_sv": 0.0032654264010488986,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3265426401.048898,
+ "lr": 0.00037565505641757235,
+ "time_sec": 86.81736421585083
+ },
+ {
+ "epoch": 88,
+ "train_loss": 5.318348231048584,
+ "train_acc": 0.00918,
+ "test_loss": 4.997183460998535,
+ "test_acc": 0.01,
+ "lyapunov": 1.5415247068990527,
+ "grad_norm": 0.11341200364232766,
+ "grad_max_sv": 0.006511487392708659,
+ "grad_min_sv": 0.0,
+ "grad_condition": 6511487392.708659,
+ "lr": 0.00036554008969236695,
+ "time_sec": 86.82162237167358
+ },
+ {
+ "epoch": 89,
+ "train_loss": 5.318816225433349,
+ "train_acc": 0.00892,
+ "test_loss": 5.18877671661377,
+ "test_acc": 0.01,
+ "lyapunov": 1.5420374519684736,
+ "grad_norm": 0.12034783892609052,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003554841015277638,
+ "time_sec": 86.97105526924133
+ },
+ {
+ "epoch": 90,
+ "train_loss": 5.318523200531006,
+ "train_acc": 0.00938,
+ "test_loss": 5.115398947143555,
+ "test_acc": 0.01,
+ "lyapunov": 1.5415691600736146,
+ "grad_norm": 0.14346849260322833,
+ "grad_max_sv": 0.02495567239820957,
+ "grad_min_sv": 0.0,
+ "grad_condition": 24955672398.20957,
+ "lr": 0.000345491502812526,
+ "time_sec": 86.88058757781982
+ },
+ {
+ "epoch": 91,
+ "train_loss": 5.318174597930908,
+ "train_acc": 0.00928,
+ "test_loss": 5.025017410278321,
+ "test_acc": 0.01,
+ "lyapunov": 1.5413767959150817,
+ "grad_norm": 0.12564666917462933,
+ "grad_max_sv": 0.0075723147485405205,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7572314748.540522,
+ "lr": 0.0003355666766307081,
+ "time_sec": 86.85795545578003
+ },
+ {
+ "epoch": 92,
+ "train_loss": 5.318962445831299,
+ "train_acc": 0.00776,
+ "test_loss": 4.925245237731934,
+ "test_acc": 0.01,
+ "lyapunov": 1.5422863734652623,
+ "grad_norm": 0.12308146620405915,
+ "grad_max_sv": 0.0013421432580798865,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1342143258.0798864,
+ "lr": 0.00032571397633909225,
+ "time_sec": 86.79794430732727
+ },
+ {
+ "epoch": 93,
+ "train_loss": 5.327239834136963,
+ "train_acc": 0.00902,
+ "test_loss": 5.076303866577148,
+ "test_acc": 0.01,
+ "lyapunov": 1.5474630085098775,
+ "grad_norm": 0.1277051442186759,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00031593772365766094,
+ "time_sec": 86.82232332229614
+ },
+ {
+ "epoch": 94,
+ "train_loss": 5.318930770874023,
+ "train_acc": 0.00872,
+ "test_loss": 4.880594007110596,
+ "test_acc": 0.01,
+ "lyapunov": 1.5422684445100672,
+ "grad_norm": 0.13600368147480044,
+ "grad_max_sv": 0.002521184924989939,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2521184924.9899387,
+ "lr": 0.0003062422067739483,
+ "time_sec": 86.81427669525146
+ },
+ {
+ "epoch": 95,
+ "train_loss": 5.319566112213135,
+ "train_acc": 0.00978,
+ "test_loss": 4.991552732849121,
+ "test_acc": 0.01,
+ "lyapunov": 1.5428647238885045,
+ "grad_norm": 0.12437123327866709,
+ "grad_max_sv": 0.012525724712759256,
+ "grad_min_sv": 0.0,
+ "grad_condition": 12525724712.759256,
+ "lr": 0.00029663167846209965,
+ "time_sec": 86.81576943397522
+ },
+ {
+ "epoch": 96,
+ "train_loss": 5.321689688720703,
+ "train_acc": 0.00864,
+ "test_loss": 4.8253173141479495,
+ "test_acc": 0.01,
+ "lyapunov": 1.5444780929619089,
+ "grad_norm": 0.12565886868121948,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00028711035421746345,
+ "time_sec": 86.88868856430054
+ },
+ {
+ "epoch": 97,
+ "train_loss": 5.31878070602417,
+ "train_acc": 0.00896,
+ "test_loss": 4.881497433471679,
+ "test_acc": 0.01,
+ "lyapunov": 1.5421305144839275,
+ "grad_norm": 0.11716334018301236,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00027768241040753615,
+ "time_sec": 86.82862520217896
+ },
+ {
+ "epoch": 98,
+ "train_loss": 5.322988173828125,
+ "train_acc": 0.00888,
+ "test_loss": 4.762122218322754,
+ "test_acc": 0.01,
+ "lyapunov": 1.545472724663327,
+ "grad_norm": 0.14401618175686975,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00026835198244006903,
+ "time_sec": 86.81479406356812
+ },
+ {
+ "epoch": 99,
+ "train_loss": 5.318863394622802,
+ "train_acc": 0.00886,
+ "test_loss": 4.714427976989746,
+ "test_acc": 0.01,
+ "lyapunov": 1.5421699697099378,
+ "grad_norm": 0.13101580238155278,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002591231629491421,
+ "time_sec": 86.82360768318176
+ },
+ {
+ "epoch": 100,
+ "train_loss": 5.32177279083252,
+ "train_acc": 0.00908,
+ "test_loss": 4.741457105255127,
+ "test_acc": 0.01,
+ "lyapunov": 1.5448724360722106,
+ "grad_norm": 0.12685940692823117,
+ "grad_max_sv": 0.0014819118659943342,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1481911865.9943342,
+ "lr": 0.0002499999999999997,
+ "time_sec": 86.83973097801208
+ },
+ {
+ "epoch": 101,
+ "train_loss": 5.321585564422607,
+ "train_acc": 0.0095,
+ "test_loss": 4.660526361846924,
+ "test_acc": 0.01,
+ "lyapunov": 1.5446103762482744,
+ "grad_norm": 0.15017654739054603,
+ "grad_max_sv": 0.013982362765818834,
+ "grad_min_sv": 0.0,
+ "grad_condition": 13982362765.818836,
+ "lr": 0.00024098649531343477,
+ "time_sec": 86.89186692237854
+ },
+ {
+ "epoch": 102,
+ "train_loss": 5.318927859802246,
+ "train_acc": 0.00892,
+ "test_loss": 4.667855642700196,
+ "test_acc": 0.01,
+ "lyapunov": 1.542065743900016,
+ "grad_norm": 0.14354448313759138,
+ "grad_max_sv": 0.007601975044235587,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7601975044.235586,
+ "lr": 0.0002320866025105016,
+ "time_sec": 86.85510921478271
+ },
+ {
+ "epoch": 103,
+ "train_loss": 5.319302808380127,
+ "train_acc": 0.00854,
+ "test_loss": 4.7306030563354495,
+ "test_acc": 0.01,
+ "lyapunov": 1.5426954067576573,
+ "grad_norm": 0.1222745390564005,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002233042253783278,
+ "time_sec": 86.83695554733276
+ },
+ {
+ "epoch": 104,
+ "train_loss": 5.3208301354980465,
+ "train_acc": 0.00928,
+ "test_loss": 4.6642813407897945,
+ "test_acc": 0.01,
+ "lyapunov": 1.5443277465717873,
+ "grad_norm": 0.12082325206764133,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000214643216157784,
+ "time_sec": 86.83465480804443
+ },
+ {
+ "epoch": 105,
+ "train_loss": 5.325607220458984,
+ "train_acc": 0.00868,
+ "test_loss": 4.797847722625733,
+ "test_acc": 0.01,
+ "lyapunov": 1.547427470421852,
+ "grad_norm": 0.1467365865583852,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00020610737385376332,
+ "time_sec": 86.92287278175354
+ },
+ {
+ "epoch": 106,
+ "train_loss": 5.327985736999512,
+ "train_acc": 0.00948,
+ "test_loss": 4.780700933837891,
+ "test_acc": 0.01,
+ "lyapunov": 1.5493294055504567,
+ "grad_norm": 0.13200210447777874,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00019770044256881242,
+ "time_sec": 86.93008136749268
+ },
+ {
+ "epoch": 107,
+ "train_loss": 5.319034835205078,
+ "train_acc": 0.00946,
+ "test_loss": 4.834465756225586,
+ "test_acc": 0.01,
+ "lyapunov": 1.5422752080366129,
+ "grad_norm": 0.12777999612030252,
+ "grad_max_sv": 0.02157975882291794,
+ "grad_min_sv": 0.0,
+ "grad_condition": 21579758822.91794,
+ "lr": 0.0001894261098608447,
+ "time_sec": 86.82852697372437
+ },
+ {
+ "epoch": 108,
+ "train_loss": 5.321411961364746,
+ "train_acc": 0.00916,
+ "test_loss": 4.814922105407715,
+ "test_acc": 0.01,
+ "lyapunov": 1.544609341475055,
+ "grad_norm": 0.13197562787736147,
+ "grad_max_sv": 0.015251889312639832,
+ "grad_min_sv": 0.0,
+ "grad_condition": 15251889312.639832,
+ "lr": 0.000181288005125655,
+ "time_sec": 86.85191607475281
+ },
+ {
+ "epoch": 109,
+ "train_loss": 5.322899269256592,
+ "train_acc": 0.00876,
+ "test_loss": 4.713241914367676,
+ "test_acc": 0.01,
+ "lyapunov": 1.54528974267223,
+ "grad_norm": 0.12828276594838653,
+ "grad_max_sv": 0.0006727563217282295,
+ "grad_min_sv": 0.0,
+ "grad_condition": 672756321.7282295,
+ "lr": 0.0001732896980049473,
+ "time_sec": 86.82081818580627
+ },
+ {
+ "epoch": 110,
+ "train_loss": 5.318816036987305,
+ "train_acc": 0.0094,
+ "test_loss": 4.679484854125977,
+ "test_acc": 0.01,
+ "lyapunov": 1.5422053230388084,
+ "grad_norm": 0.12847280658733387,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00016543469682057076,
+ "time_sec": 86.9124755859375
+ },
+ {
+ "epoch": 111,
+ "train_loss": 5.318745676116944,
+ "train_acc": 0.00848,
+ "test_loss": 4.795034047698975,
+ "test_acc": 0.01,
+ "lyapunov": 1.5421484263656695,
+ "grad_norm": 0.1278982868324375,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00015772644703565552,
+ "time_sec": 86.83268451690674
+ },
+ {
+ "epoch": 112,
+ "train_loss": 5.318630710906983,
+ "train_acc": 0.00898,
+ "test_loss": 4.784210496520996,
+ "test_acc": 0.01,
+ "lyapunov": 1.5420354778504433,
+ "grad_norm": 0.13247976598300262,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00015016832974331713,
+ "time_sec": 86.79545545578003
+ },
+ {
+ "epoch": 113,
+ "train_loss": 5.318998959655762,
+ "train_acc": 0.00884,
+ "test_loss": 4.768862895202637,
+ "test_acc": 0.01,
+ "lyapunov": 1.542412842021269,
+ "grad_norm": 0.13154644614275643,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00014276366018359834,
+ "time_sec": 86.8436176776886
+ },
+ {
+ "epoch": 114,
+ "train_loss": 5.3237989538574215,
+ "train_acc": 0.00958,
+ "test_loss": 4.739323009490967,
+ "test_acc": 0.01,
+ "lyapunov": 1.5463786896537333,
+ "grad_norm": 0.14268776917647705,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00013551568628929425,
+ "time_sec": 86.84370040893555
+ },
+ {
+ "epoch": 115,
+ "train_loss": 5.321883607025146,
+ "train_acc": 0.00924,
+ "test_loss": 4.724630879211426,
+ "test_acc": 0.01,
+ "lyapunov": 1.544751648707768,
+ "grad_norm": 0.13724738045143065,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00012842758726130276,
+ "time_sec": 86.83514404296875
+ },
+ {
+ "epoch": 116,
+ "train_loss": 5.317745707855225,
+ "train_acc": 0.00926,
+ "test_loss": 4.771264694213867,
+ "test_acc": 0.01,
+ "lyapunov": 1.5411124830050846,
+ "grad_norm": 0.13439912972628948,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001215024721741218,
+ "time_sec": 86.83839774131775
+ },
+ {
+ "epoch": 117,
+ "train_loss": 5.318638670196533,
+ "train_acc": 0.00944,
+ "test_loss": 4.926259418487549,
+ "test_acc": 0.01,
+ "lyapunov": 1.5420454350273933,
+ "grad_norm": 0.1301899172356262,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00011474337861210538,
+ "time_sec": 86.81545162200928
+ },
+ {
+ "epoch": 118,
+ "train_loss": 5.317975592346191,
+ "train_acc": 0.0091,
+ "test_loss": 4.7584453956604005,
+ "test_acc": 0.01,
+ "lyapunov": 1.5413338939856995,
+ "grad_norm": 0.1306510838756953,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010815327133708009,
+ "time_sec": 86.84224820137024
+ },
+ {
+ "epoch": 119,
+ "train_loss": 5.317512142944336,
+ "train_acc": 0.00918,
+ "test_loss": 4.75227194366455,
+ "test_acc": 0.01,
+ "lyapunov": 1.5408342912069062,
+ "grad_norm": 0.13531431192184493,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010173504098790182,
+ "time_sec": 86.84121561050415
+ },
+ {
+ "epoch": 120,
+ "train_loss": 5.32096346862793,
+ "train_acc": 0.00916,
+ "test_loss": 4.783403231811524,
+ "test_acc": 0.01,
+ "lyapunov": 1.5443097962747754,
+ "grad_norm": 0.1366841922730417,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 86.8264012336731
+ },
+ {
+ "epoch": 121,
+ "train_loss": 5.31987023651123,
+ "train_acc": 0.009,
+ "test_loss": 4.769460425567627,
+ "test_acc": 0.01,
+ "lyapunov": 1.5431054827502317,
+ "grad_norm": 0.13796061159903233,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 86.83200931549072
+ },
+ {
+ "epoch": 122,
+ "train_loss": 5.317669274597168,
+ "train_acc": 0.009,
+ "test_loss": 4.726600196838379,
+ "test_acc": 0.01,
+ "lyapunov": 1.5410202537351252,
+ "grad_norm": 0.13807476351768067,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 86.85096383094788
+ },
+ {
+ "epoch": 123,
+ "train_loss": 5.31959240447998,
+ "train_acc": 0.00982,
+ "test_loss": 4.731892253112793,
+ "test_acc": 0.01,
+ "lyapunov": 1.5430450296158071,
+ "grad_norm": 0.14330032241201268,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 86.8001983165741
+ },
+ {
+ "epoch": 124,
+ "train_loss": 5.317501362304688,
+ "train_acc": 0.00938,
+ "test_loss": 4.782514060974121,
+ "test_acc": 0.01,
+ "lyapunov": 1.540854393673675,
+ "grad_norm": 0.14059038369574442,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 86.87392091751099
+ },
+ {
+ "epoch": 125,
+ "train_loss": 5.318027396545411,
+ "train_acc": 0.0095,
+ "test_loss": 4.765302996826172,
+ "test_acc": 0.01,
+ "lyapunov": 1.5414052317514444,
+ "grad_norm": 0.1418679045184447,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 86.82495832443237
+ },
+ {
+ "epoch": 126,
+ "train_loss": 5.318346632080078,
+ "train_acc": 0.0092,
+ "test_loss": 4.7442352600097655,
+ "test_acc": 0.01,
+ "lyapunov": 1.5417146911401578,
+ "grad_norm": 0.142826590523136,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 86.79729580879211
+ },
+ {
+ "epoch": 127,
+ "train_loss": 5.318922318725586,
+ "train_acc": 0.00974,
+ "test_loss": 4.76433516998291,
+ "test_acc": 0.01,
+ "lyapunov": 1.542423507136762,
+ "grad_norm": 0.14495446560643363,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 86.93182754516602
+ },
+ {
+ "epoch": 128,
+ "train_loss": 5.318007217102051,
+ "train_acc": 0.00962,
+ "test_loss": 4.764061611938477,
+ "test_acc": 0.01,
+ "lyapunov": 1.541390145831096,
+ "grad_norm": 0.14153652471754832,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 86.8191487789154
+ },
+ {
+ "epoch": 129,
+ "train_loss": 5.318092449340821,
+ "train_acc": 0.00968,
+ "test_loss": 4.765155668640137,
+ "test_acc": 0.01,
+ "lyapunov": 1.5414884422746156,
+ "grad_norm": 0.14863798950920318,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 86.92294239997864
+ },
+ {
+ "epoch": 130,
+ "train_loss": 5.318419138793946,
+ "train_acc": 0.00922,
+ "test_loss": 4.764954615783691,
+ "test_acc": 0.01,
+ "lyapunov": 1.541847081745372,
+ "grad_norm": 0.14422350481698742,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 86.83364939689636
+ },
+ {
+ "epoch": 131,
+ "train_loss": 5.319330998535157,
+ "train_acc": 0.00984,
+ "test_loss": 4.749797338867188,
+ "test_acc": 0.01,
+ "lyapunov": 1.5428275848593553,
+ "grad_norm": 0.1575339118534098,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 86.83805966377258
+ },
+ {
+ "epoch": 132,
+ "train_loss": 5.3225936277771,
+ "train_acc": 0.00944,
+ "test_loss": 4.753033805847168,
+ "test_acc": 0.01,
+ "lyapunov": 1.5456237704552653,
+ "grad_norm": 0.1459542484301229,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 86.83223581314087
+ },
+ {
+ "epoch": 133,
+ "train_loss": 5.319478280029297,
+ "train_acc": 0.00904,
+ "test_loss": 4.726372310638427,
+ "test_acc": 0.01,
+ "lyapunov": 1.5427262319628234,
+ "grad_norm": 0.15430065761057823,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 86.81233429908752
+ },
+ {
+ "epoch": 134,
+ "train_loss": 5.320157431182861,
+ "train_acc": 0.00978,
+ "test_loss": 4.729707991790772,
+ "test_acc": 0.01,
+ "lyapunov": 1.5434529592314035,
+ "grad_norm": 0.14953623206124225,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 86.81813621520996
+ },
+ {
+ "epoch": 135,
+ "train_loss": 5.344091755371093,
+ "train_acc": 0.00992,
+ "test_loss": 4.742976405334472,
+ "test_acc": 0.01,
+ "lyapunov": 1.5575274945524953,
+ "grad_norm": 0.17021644451164028,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 86.84416842460632
+ },
+ {
+ "epoch": 136,
+ "train_loss": 5.3179564929199215,
+ "train_acc": 0.01,
+ "test_loss": 4.757002459716797,
+ "test_acc": 0.01,
+ "lyapunov": 1.541358881289392,
+ "grad_norm": 0.1455320955701897,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 86.83202290534973
+ },
+ {
+ "epoch": 137,
+ "train_loss": 5.319369739990234,
+ "train_acc": 0.00978,
+ "test_loss": 4.748977610015869,
+ "test_acc": 0.01,
+ "lyapunov": 1.5428897822299577,
+ "grad_norm": 0.15104084037444107,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 86.81699085235596
+ },
+ {
+ "epoch": 138,
+ "train_loss": 5.318675216522217,
+ "train_acc": 0.01,
+ "test_loss": 4.713645321655274,
+ "test_acc": 0.01,
+ "lyapunov": 1.5421365197662198,
+ "grad_norm": 0.14694031631290994,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 86.8898720741272
+ },
+ {
+ "epoch": 139,
+ "train_loss": 5.318637705383301,
+ "train_acc": 0.01,
+ "test_loss": 4.743732140350342,
+ "test_acc": 0.01,
+ "lyapunov": 1.5420801776754276,
+ "grad_norm": 0.15086340410308036,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 86.82428193092346
+ },
+ {
+ "epoch": 140,
+ "train_loss": 5.318365608825683,
+ "train_acc": 0.01,
+ "test_loss": 4.738941632843018,
+ "test_acc": 0.01,
+ "lyapunov": 1.5417572262951784,
+ "grad_norm": 0.1451696630670528,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 86.8176257610321
+ },
+ {
+ "epoch": 141,
+ "train_loss": 5.319074583282471,
+ "train_acc": 0.01,
+ "test_loss": 4.743734898376465,
+ "test_acc": 0.01,
+ "lyapunov": 1.5425543062522282,
+ "grad_norm": 0.14883420989990226,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 86.81977844238281
+ },
+ {
+ "epoch": 142,
+ "train_loss": 5.321842821502686,
+ "train_acc": 0.01,
+ "test_loss": 4.742512757873535,
+ "test_acc": 0.01,
+ "lyapunov": 1.5452124737107846,
+ "grad_norm": 0.14940314161589946,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 86.9058632850647
+ },
+ {
+ "epoch": 143,
+ "train_loss": 5.323013974456787,
+ "train_acc": 0.01,
+ "test_loss": 4.7366528335571285,
+ "test_acc": 0.01,
+ "lyapunov": 1.5466468251879564,
+ "grad_norm": 0.48352294330900464,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 86.8274781703949
+ },
+ {
+ "epoch": 144,
+ "train_loss": 5.322230252380371,
+ "train_acc": 0.01,
+ "test_loss": 4.734474227905274,
+ "test_acc": 0.01,
+ "lyapunov": 1.5454154453619058,
+ "grad_norm": 0.15060559526776118,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 86.83571076393127
+ },
+ {
+ "epoch": 145,
+ "train_loss": 5.318391214904785,
+ "train_acc": 0.01,
+ "test_loss": 4.740697119140625,
+ "test_acc": 0.01,
+ "lyapunov": 1.5418205120984245,
+ "grad_norm": 0.14599666991367263,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 86.83404302597046
+ },
+ {
+ "epoch": 146,
+ "train_loss": 5.3190992230224605,
+ "train_acc": 0.01,
+ "test_loss": 4.740016835021972,
+ "test_acc": 0.01,
+ "lyapunov": 1.542624485462218,
+ "grad_norm": 0.15263702906229243,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 86.86582016944885
+ },
+ {
+ "epoch": 147,
+ "train_loss": 5.318638049316406,
+ "train_acc": 0.01,
+ "test_loss": 4.740016804504394,
+ "test_acc": 0.01,
+ "lyapunov": 1.542047378352231,
+ "grad_norm": 0.1501107976108878,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 86.7875075340271
+ },
+ {
+ "epoch": 148,
+ "train_loss": 5.318966191101074,
+ "train_acc": 0.01,
+ "test_loss": 4.740017098999023,
+ "test_acc": 0.01,
+ "lyapunov": 1.5423082866327231,
+ "grad_norm": 0.1506843352752174,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 86.85878276824951
+ },
+ {
+ "epoch": 149,
+ "train_loss": 5.318281329040527,
+ "train_acc": 0.01,
+ "test_loss": 4.740017213439941,
+ "test_acc": 0.01,
+ "lyapunov": 1.5417110215672447,
+ "grad_norm": 0.14832275166563608,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 87.06339812278748
+ },
+ {
+ "epoch": 150,
+ "train_loss": 5.318742103729248,
+ "train_acc": 0.01,
+ "test_loss": 4.740017121887207,
+ "test_acc": 0.01,
+ "lyapunov": 1.5422426760958894,
+ "grad_norm": 0.1485832497803494,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0,
+ "time_sec": 86.82008957862854
+ }
+ ],
+ "12": [
+ {
+ "epoch": 1,
+ "train_loss": 5.142427458190918,
+ "train_acc": 0.01732,
+ "test_loss": 4.915040765380859,
+ "test_acc": 0.0102,
+ "lyapunov": 2.4272339856228253,
+ "grad_norm": 5.192250161678427,
+ "grad_max_sv": 4.473296946287155,
+ "grad_min_sv": 8.955331335380733e-08,
+ "grad_condition": 71327028.89068338,
+ "lr": 0.0009998903417374227,
+ "time_sec": 132.13672518730164
+ },
+ {
+ "epoch": 2,
+ "train_loss": 4.874939300842285,
+ "train_acc": 0.01776,
+ "test_loss": 4.858658763122558,
+ "test_acc": 0.0123,
+ "lyapunov": 1.9352691591243305,
+ "grad_norm": 3.5048458101816564,
+ "grad_max_sv": 2.842214399576187,
+ "grad_min_sv": 5.994522662700064e-08,
+ "grad_condition": 56014607.037285045,
+ "lr": 0.0009995614150494292,
+ "time_sec": 132.1895821094513
+ },
+ {
+ "epoch": 3,
+ "train_loss": 4.780418332366944,
+ "train_acc": 0.01696,
+ "test_loss": 5.036572162628174,
+ "test_acc": 0.013,
+ "lyapunov": 1.6941773053020468,
+ "grad_norm": 2.3576536383434044,
+ "grad_max_sv": 1.8239452183246612,
+ "grad_min_sv": 3.909134313473395e-08,
+ "grad_condition": 54665529.32274648,
+ "lr": 0.0009990133642141358,
+ "time_sec": 132.14293670654297
+ },
+ {
+ "epoch": 4,
+ "train_loss": 4.74106760559082,
+ "train_acc": 0.0156,
+ "test_loss": 4.614977532958984,
+ "test_acc": 0.01,
+ "lyapunov": 1.667667641359217,
+ "grad_norm": 1.2834888351442275,
+ "grad_max_sv": 0.7230008448474109,
+ "grad_min_sv": 1.1444949870584092e-08,
+ "grad_condition": 21641297318.53074,
+ "lr": 0.0009982464296247522,
+ "time_sec": 132.18336057662964
+ },
+ {
+ "epoch": 5,
+ "train_loss": 4.765737413482666,
+ "train_acc": 0.01652,
+ "test_loss": 5.099783699798584,
+ "test_acc": 0.01,
+ "lyapunov": 1.6692155538617497,
+ "grad_norm": 0.6681729594071041,
+ "grad_max_sv": 0.4321929462254047,
+ "grad_min_sv": 8.256420696048775e-10,
+ "grad_condition": 130856413066.44238,
+ "lr": 0.0009972609476841367,
+ "time_sec": 132.0963535308838
+ },
+ {
+ "epoch": 6,
+ "train_loss": 4.802682023925781,
+ "train_acc": 0.01584,
+ "test_loss": 4.645143016052246,
+ "test_acc": 0.01,
+ "lyapunov": 1.6541148235121041,
+ "grad_norm": 0.5601084813828376,
+ "grad_max_sv": 0.3682811915874481,
+ "grad_min_sv": 4.4830527621445066e-12,
+ "grad_condition": 122810946704.98007,
+ "lr": 0.000996057350657239,
+ "time_sec": 132.08646774291992
+ },
+ {
+ "epoch": 7,
+ "train_loss": 4.861019936065674,
+ "train_acc": 0.0145,
+ "test_loss": 5.0593204246521,
+ "test_acc": 0.012,
+ "lyapunov": 1.6806474119196158,
+ "grad_norm": 0.4786920265962189,
+ "grad_max_sv": 0.36215363070368767,
+ "grad_min_sv": 5.403665967264682e-10,
+ "grad_condition": 157595569273.04913,
+ "lr": 0.000994636166481494,
+ "time_sec": 132.12457752227783
+ },
+ {
+ "epoch": 8,
+ "train_loss": 4.906115528869629,
+ "train_acc": 0.01422,
+ "test_loss": 4.609849331665039,
+ "test_acc": 0.01,
+ "lyapunov": 1.6933349569130431,
+ "grad_norm": 0.5105557123165358,
+ "grad_max_sv": 0.2962237525731325,
+ "grad_min_sv": 1.5893412122574907e-12,
+ "grad_condition": 162936272535.53033,
+ "lr": 0.0009929980185352525,
+ "time_sec": 132.0816192626953
+ },
+ {
+ "epoch": 9,
+ "train_loss": 4.948906524505615,
+ "train_acc": 0.01298,
+ "test_loss": 4.606528971099854,
+ "test_acc": 0.01,
+ "lyapunov": 1.684294082624528,
+ "grad_norm": 0.4680820303299784,
+ "grad_max_sv": 0.2727967657148838,
+ "grad_min_sv": 6.175172652279376e-13,
+ "grad_condition": 191797793138.9354,
+ "lr": 0.0009911436253643444,
+ "time_sec": 132.09475946426392
+ },
+ {
+ "epoch": 10,
+ "train_loss": 5.001812951354981,
+ "train_acc": 0.01048,
+ "test_loss": 4.605593468475342,
+ "test_acc": 0.01,
+ "lyapunov": 1.6371012395605102,
+ "grad_norm": 0.4454332910853826,
+ "grad_max_sv": 0.06080346256494522,
+ "grad_min_sv": 1.1174912073463375e-13,
+ "grad_condition": 43714632849.557816,
+ "lr": 0.0009890738003669028,
+ "time_sec": 132.12074422836304
+ },
+ {
+ "epoch": 11,
+ "train_loss": 5.020210814056396,
+ "train_acc": 0.0096,
+ "test_loss": 6.067085327148438,
+ "test_acc": 0.01,
+ "lyapunov": 1.55058368331636,
+ "grad_norm": 0.43082604131055474,
+ "grad_max_sv": 0.221556506305933,
+ "grad_min_sv": 2.881964604461995e-09,
+ "grad_condition": 154673733.23759162,
+ "lr": 0.00098678945143658,
+ "time_sec": 132.08557748794556
+ },
+ {
+ "epoch": 12,
+ "train_loss": 5.050462992553711,
+ "train_acc": 0.0094,
+ "test_loss": 4.605482531738281,
+ "test_acc": 0.01,
+ "lyapunov": 1.5398570713789568,
+ "grad_norm": 0.381893916008903,
+ "grad_max_sv": 0.2668355040252209,
+ "grad_min_sv": 3.789388436370445e-09,
+ "grad_condition": 42311880.80663426,
+ "lr": 0.0009842915805643154,
+ "time_sec": 132.05907773971558
+ },
+ {
+ "epoch": 13,
+ "train_loss": 5.067867939758301,
+ "train_acc": 0.00924,
+ "test_loss": 4.605311224365234,
+ "test_acc": 0.01,
+ "lyapunov": 1.539125974830764,
+ "grad_norm": 0.1537321432498029,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000981581283398829,
+ "time_sec": 132.1301724910736
+ },
+ {
+ "epoch": 14,
+ "train_loss": 5.122542482299805,
+ "train_acc": 0.01028,
+ "test_loss": 6.089662152862549,
+ "test_acc": 0.01,
+ "lyapunov": 1.5396406424929723,
+ "grad_norm": 0.3505932006709459,
+ "grad_max_sv": 0.24503438249230386,
+ "grad_min_sv": 3.2204854292020023e-09,
+ "grad_condition": 175828681.99119335,
+ "lr": 0.0009786597487660333,
+ "time_sec": 132.11422061920166
+ },
+ {
+ "epoch": 15,
+ "train_loss": 5.167975009613037,
+ "train_acc": 0.00938,
+ "test_loss": 6.145216786956787,
+ "test_acc": 0.01,
+ "lyapunov": 1.5421736868446136,
+ "grad_norm": 0.460038063194906,
+ "grad_max_sv": 0.37677369341254235,
+ "grad_min_sv": 5.061586208499058e-09,
+ "grad_condition": 83937837.74305013,
+ "lr": 0.0009755282581475766,
+ "time_sec": 132.15303254127502
+ },
+ {
+ "epoch": 16,
+ "train_loss": 5.185187667541504,
+ "train_acc": 0.00964,
+ "test_loss": 4.605292627716064,
+ "test_acc": 0.01,
+ "lyapunov": 1.5415043111347482,
+ "grad_norm": 0.2749549655041811,
+ "grad_max_sv": 0.13375916928052903,
+ "grad_min_sv": 1.7694276155388877e-09,
+ "grad_condition": 28413171.440939356,
+ "lr": 0.0009721881851187403,
+ "time_sec": 132.0988028049469
+ },
+ {
+ "epoch": 17,
+ "train_loss": 5.213513888549805,
+ "train_acc": 0.00944,
+ "test_loss": 4.605225193786621,
+ "test_acc": 0.01,
+ "lyapunov": 1.5439205886153005,
+ "grad_norm": 0.15107835674594625,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0009686409947459456,
+ "time_sec": 132.06156492233276
+ },
+ {
+ "epoch": 18,
+ "train_loss": 5.259810456237793,
+ "train_acc": 0.00946,
+ "test_loss": 6.243620587158203,
+ "test_acc": 0.01,
+ "lyapunov": 1.5492180427321998,
+ "grad_norm": 0.17993668118393238,
+ "grad_max_sv": 0.02630040645599365,
+ "grad_min_sv": 2.2052708131825583e-10,
+ "grad_condition": 25149159.75180607,
+ "lr": 0.0009648882429441254,
+ "time_sec": 132.04172444343567
+ },
+ {
+ "epoch": 19,
+ "train_loss": 5.30400526260376,
+ "train_acc": 0.01008,
+ "test_loss": 6.052386779022217,
+ "test_acc": 0.01,
+ "lyapunov": 1.544384488974081,
+ "grad_norm": 0.348063373631547,
+ "grad_max_sv": 0.2475440863519907,
+ "grad_min_sv": 2.704030184225853e-09,
+ "grad_condition": 448939719.83669394,
+ "lr": 0.00096093157579425,
+ "time_sec": 132.16821956634521
+ },
+ {
+ "epoch": 20,
+ "train_loss": 5.344405227050781,
+ "train_acc": 0.0094,
+ "test_loss": 6.0689891357421875,
+ "test_acc": 0.01,
+ "lyapunov": 1.549183475087061,
+ "grad_norm": 0.3941364600912924,
+ "grad_max_sv": 0.28380888141691685,
+ "grad_min_sv": 2.9937321677220295e-09,
+ "grad_condition": 919686281.1330671,
+ "lr": 0.0009567727288213001,
+ "time_sec": 132.13486909866333
+ },
+ {
+ "epoch": 21,
+ "train_loss": 5.342385781860352,
+ "train_acc": 0.00934,
+ "test_loss": 5.634283610534668,
+ "test_acc": 0.01,
+ "lyapunov": 1.5489524468741454,
+ "grad_norm": 0.35198337312808664,
+ "grad_max_sv": 0.2675567839294672,
+ "grad_min_sv": 2.7506563800988593e-09,
+ "grad_condition": 137616088.9764635,
+ "lr": 0.0009524135262330095,
+ "time_sec": 132.15001010894775
+ },
+ {
+ "epoch": 22,
+ "train_loss": 5.340258148040771,
+ "train_acc": 0.01038,
+ "test_loss": 6.047631702423096,
+ "test_acc": 0.01,
+ "lyapunov": 1.5503142017232792,
+ "grad_norm": 0.32912217146899386,
+ "grad_max_sv": 0.23988064490258693,
+ "grad_min_sv": 2.0088645359163383e-09,
+ "grad_condition": 325233106.42990357,
+ "lr": 0.0009478558801197061,
+ "time_sec": 132.1328146457672
+ },
+ {
+ "epoch": 23,
+ "train_loss": 5.33926953994751,
+ "train_acc": 0.00924,
+ "test_loss": 6.389647571563721,
+ "test_acc": 0.01,
+ "lyapunov": 1.5511968355349568,
+ "grad_norm": 0.3034442087369207,
+ "grad_max_sv": 0.21002153679728508,
+ "grad_min_sv": 7.416720458496191e-10,
+ "grad_condition": 49849833895.91653,
+ "lr": 0.000943101789615607,
+ "time_sec": 132.11377239227295
+ },
+ {
+ "epoch": 24,
+ "train_loss": 5.342641763763428,
+ "train_acc": 0.01046,
+ "test_loss": 6.151307273101807,
+ "test_acc": 0.01,
+ "lyapunov": 1.5519740599805436,
+ "grad_norm": 0.32351011233615656,
+ "grad_max_sv": 0.24164889194071293,
+ "grad_min_sv": 1.9842920796070418e-09,
+ "grad_condition": 216397157.20139033,
+ "lr": 0.0009381533400219313,
+ "time_sec": 132.07816553115845
+ },
+ {
+ "epoch": 25,
+ "train_loss": 5.336951184997559,
+ "train_acc": 0.00994,
+ "test_loss": 5.9992121322631835,
+ "test_acc": 0.01,
+ "lyapunov": 1.5503220811219471,
+ "grad_norm": 0.2784195734173852,
+ "grad_max_sv": 0.19388381093740464,
+ "grad_min_sv": 2.1356596568026515e-10,
+ "grad_condition": 108561949775.06238,
+ "lr": 0.0009330127018922189,
+ "time_sec": 132.10879969596863
+ },
+ {
+ "epoch": 26,
+ "train_loss": 5.336466632537841,
+ "train_acc": 0.01006,
+ "test_loss": 5.7221336074829106,
+ "test_acc": 0.01,
+ "lyapunov": 1.5520486011529517,
+ "grad_norm": 0.24825146645127755,
+ "grad_max_sv": 0.17286810129880906,
+ "grad_min_sv": 1.0904332706662028e-12,
+ "grad_condition": 103853917717.00699,
+ "lr": 0.000927682130080253,
+ "time_sec": 132.1171510219574
+ },
+ {
+ "epoch": 27,
+ "train_loss": 5.336693968505859,
+ "train_acc": 0.00944,
+ "test_loss": 5.829081159210205,
+ "test_acc": 0.01,
+ "lyapunov": 1.5536211549168657,
+ "grad_norm": 0.23362614927382305,
+ "grad_max_sv": 0.15823216680437327,
+ "grad_min_sv": 7.62931019239883e-13,
+ "grad_condition": 111090272986.05489,
+ "lr": 0.0009221639627510072,
+ "time_sec": 132.13189697265625
+ },
+ {
+ "epoch": 28,
+ "train_loss": 5.336333346252442,
+ "train_acc": 0.01034,
+ "test_loss": 6.183766918945312,
+ "test_acc": 0.01,
+ "lyapunov": 1.5548379052325587,
+ "grad_norm": 0.2252526539391841,
+ "grad_max_sv": 0.1425440175458789,
+ "grad_min_sv": 5.001494019507075e-14,
+ "grad_condition": 136232139639.80547,
+ "lr": 0.0009164606203550494,
+ "time_sec": 132.0898892879486
+ },
+ {
+ "epoch": 29,
+ "train_loss": 5.3385375555419925,
+ "train_acc": 0.01006,
+ "test_loss": 18.741441845703125,
+ "test_acc": 0.01,
+ "lyapunov": 1.559137857478598,
+ "grad_norm": 0.24309729358940327,
+ "grad_max_sv": 0.1129613446071744,
+ "grad_min_sv": 7.652494146034002e-15,
+ "grad_condition": 112054629681.63525,
+ "lr": 0.0009105746045668516,
+ "time_sec": 132.19855189323425
+ },
+ {
+ "epoch": 30,
+ "train_loss": 5.337543925323486,
+ "train_acc": 0.00958,
+ "test_loss": 17.780749963378906,
+ "test_acc": 0.01,
+ "lyapunov": 1.5578542255684542,
+ "grad_norm": 0.22390701226492316,
+ "grad_max_sv": 0.10281856972724199,
+ "grad_min_sv": 3.3459312089163837e-15,
+ "grad_condition": 102453292464.96785,
+ "lr": 0.0009045084971874733,
+ "time_sec": 132.09549117088318
+ },
+ {
+ "epoch": 31,
+ "train_loss": 5.33479830078125,
+ "train_acc": 0.00896,
+ "test_loss": 18.024621951293945,
+ "test_acc": 0.01,
+ "lyapunov": 1.5561083588758697,
+ "grad_norm": 0.2617176836095928,
+ "grad_max_sv": 0.0911625299602747,
+ "grad_min_sv": 1.0217219065908696e-15,
+ "grad_condition": 91065349161.70517,
+ "lr": 0.0008982649590120977,
+ "time_sec": 132.07474184036255
+ },
+ {
+ "epoch": 32,
+ "train_loss": 5.336539338684082,
+ "train_acc": 0.0096,
+ "test_loss": 18.656125256347657,
+ "test_acc": 0.01,
+ "lyapunov": 1.558475110536951,
+ "grad_norm": 0.2736415217941262,
+ "grad_max_sv": 0.08601008746773005,
+ "grad_min_sv": 8.793854624629887e-16,
+ "grad_condition": 85922955415.14108,
+ "lr": 0.0008918467286629196,
+ "time_sec": 132.10801935195923
+ },
+ {
+ "epoch": 33,
+ "train_loss": 5.346367032775879,
+ "train_acc": 0.00982,
+ "test_loss": 16.179306204223632,
+ "test_acc": 0.01,
+ "lyapunov": 1.5642947364036384,
+ "grad_norm": 0.26593824832856844,
+ "grad_max_sv": 0.11054420564323664,
+ "grad_min_sv": 1.4557409070313929e-10,
+ "grad_condition": 86957832407.85573,
+ "lr": 0.0008852566213878943,
+ "time_sec": 132.09707188606262
+ },
+ {
+ "epoch": 34,
+ "train_loss": 5.366751658630371,
+ "train_acc": 0.0095,
+ "test_loss": 14.5320333984375,
+ "test_acc": 0.01,
+ "lyapunov": 1.5604360716422196,
+ "grad_norm": 0.39203529519334207,
+ "grad_max_sv": 0.3150600105524063,
+ "grad_min_sv": 3.335271438415291e-09,
+ "grad_condition": 437335317.70210946,
+ "lr": 0.000878497527825878,
+ "time_sec": 132.12472343444824
+ },
+ {
+ "epoch": 35,
+ "train_loss": 5.3540499374389645,
+ "train_acc": 0.00914,
+ "test_loss": 14.636802185058594,
+ "test_acc": 0.01,
+ "lyapunov": 1.5606954972762281,
+ "grad_norm": 0.3377550426065231,
+ "grad_max_sv": 0.2708315536379814,
+ "grad_min_sv": 2.616331799126792e-09,
+ "grad_condition": 145659046.06806198,
+ "lr": 0.000871572412738697,
+ "time_sec": 132.10315084457397
+ },
+ {
+ "epoch": 36,
+ "train_loss": 5.350296534576416,
+ "train_acc": 0.00996,
+ "test_loss": 15.48446300354004,
+ "test_acc": 0.01,
+ "lyapunov": 1.5607713335920173,
+ "grad_norm": 0.29951473550525415,
+ "grad_max_sv": 0.24341562166810035,
+ "grad_min_sv": 1.5972995535181583e-09,
+ "grad_condition": 1815700162.0467975,
+ "lr": 0.0008644843137107055,
+ "time_sec": 132.10273575782776
+ },
+ {
+ "epoch": 37,
+ "train_loss": 5.3520866116333,
+ "train_acc": 0.00968,
+ "test_loss": 14.972803247070312,
+ "test_acc": 0.01,
+ "lyapunov": 1.5632766884611087,
+ "grad_norm": 0.33571017690288324,
+ "grad_max_sv": 0.2274009022861719,
+ "grad_min_sv": 6.642170352888692e-10,
+ "grad_condition": 43022286203.22009,
+ "lr": 0.0008572363398164014,
+ "time_sec": 132.0913314819336
+ },
+ {
+ "epoch": 38,
+ "train_loss": 5.347811700897217,
+ "train_acc": 0.00978,
+ "test_loss": 15.4173666015625,
+ "test_acc": 0.01,
+ "lyapunov": 1.5653380673864614,
+ "grad_norm": 0.23644614014625348,
+ "grad_max_sv": 0.15670949593186378,
+ "grad_min_sv": 3.485120328424339e-13,
+ "grad_condition": 126042108666.44785,
+ "lr": 0.0008498316702566826,
+ "time_sec": 132.12694144248962
+ },
+ {
+ "epoch": 39,
+ "train_loss": 5.350918925933838,
+ "train_acc": 0.01,
+ "test_loss": 7.349865231323242,
+ "test_acc": 0.01,
+ "lyapunov": 1.5639865206330634,
+ "grad_norm": 0.25831036099968246,
+ "grad_max_sv": 0.18908596560359,
+ "grad_min_sv": 3.4109730636612205e-10,
+ "grad_condition": 109021837331.04056,
+ "lr": 0.0008422735529643442,
+ "time_sec": 132.15545773506165
+ },
+ {
+ "epoch": 40,
+ "train_loss": 5.350084358825684,
+ "train_acc": 0.00968,
+ "test_loss": 6.699221839904785,
+ "test_acc": 0.01,
+ "lyapunov": 1.5618754555197323,
+ "grad_norm": 0.33240423060946156,
+ "grad_max_sv": 0.16681117806583642,
+ "grad_min_sv": 8.354353915913262e-10,
+ "grad_condition": 29639133022.15968,
+ "lr": 0.0008345653031794289,
+ "time_sec": 132.0622968673706
+ },
+ {
+ "epoch": 41,
+ "train_loss": 5.348379842224121,
+ "train_acc": 0.01014,
+ "test_loss": 12.351808143615722,
+ "test_acc": 0.01,
+ "lyapunov": 1.5626876762760875,
+ "grad_norm": 0.31832555128145307,
+ "grad_max_sv": 0.20640474413521587,
+ "grad_min_sv": 8.66528908347317e-13,
+ "grad_condition": 129815385507.61075,
+ "lr": 0.0008267103019950526,
+ "time_sec": 132.2454056739807
+ },
+ {
+ "epoch": 42,
+ "train_loss": 5.34665752532959,
+ "train_acc": 0.00974,
+ "test_loss": 14.07037748260498,
+ "test_acc": 0.01,
+ "lyapunov": 1.5655529825278864,
+ "grad_norm": 0.2561124376145529,
+ "grad_max_sv": 0.10575219443999231,
+ "grad_min_sv": 1.9916840597483354e-10,
+ "grad_condition": 82384130296.00456,
+ "lr": 0.0008187119948743447,
+ "time_sec": 132.08385848999023
+ },
+ {
+ "epoch": 43,
+ "train_loss": 5.343207415618896,
+ "train_acc": 0.0099,
+ "test_loss": 13.306277600097657,
+ "test_acc": 0.01,
+ "lyapunov": 1.5653508831472958,
+ "grad_norm": 0.19924932372474,
+ "grad_max_sv": 0.096745721437037,
+ "grad_min_sv": 1.0061398517570142e-15,
+ "grad_condition": 96651724250.54889,
+ "lr": 0.000810573890139155,
+ "time_sec": 132.13167572021484
+ },
+ {
+ "epoch": 44,
+ "train_loss": 5.345402418518066,
+ "train_acc": 0.00992,
+ "test_loss": 7.869494395446777,
+ "test_acc": 0.01,
+ "lyapunov": 1.5646309980650996,
+ "grad_norm": 0.21769658517748566,
+ "grad_max_sv": 0.13879811409860848,
+ "grad_min_sv": 1.6053037275992228e-14,
+ "grad_condition": 135561498479.67575,
+ "lr": 0.0008022995574311873,
+ "time_sec": 132.21540069580078
+ },
+ {
+ "epoch": 45,
+ "train_loss": 5.346674517059326,
+ "train_acc": 0.00986,
+ "test_loss": 11.400154348754883,
+ "test_acc": 0.01,
+ "lyapunov": 1.5669585390164114,
+ "grad_norm": 0.21055278107954878,
+ "grad_max_sv": 0.12050471100956202,
+ "grad_min_sv": 1.448653245665297e-14,
+ "grad_condition": 117784195175.33076,
+ "lr": 0.0007938926261462363,
+ "time_sec": 132.13598537445068
+ },
+ {
+ "epoch": 46,
+ "train_loss": 5.350086312103271,
+ "train_acc": 0.00912,
+ "test_loss": 11.996928524780273,
+ "test_acc": 0.01,
+ "lyapunov": 1.5701792279777624,
+ "grad_norm": 0.21008620048452556,
+ "grad_max_sv": 0.08796360064297915,
+ "grad_min_sv": 3.893309181110675e-16,
+ "grad_condition": 87925759209.02908,
+ "lr": 0.0007853567838422158,
+ "time_sec": 132.10033679008484
+ },
+ {
+ "epoch": 47,
+ "train_loss": 5.342350235290527,
+ "train_acc": 0.0087,
+ "test_loss": 10.970650772094727,
+ "test_acc": 0.01,
+ "lyapunov": 1.564373235263483,
+ "grad_norm": 0.1731163774631187,
+ "grad_max_sv": 0.08237459398806095,
+ "grad_min_sv": 2.1940905206855015e-16,
+ "grad_condition": 82355183433.8488,
+ "lr": 0.0007766957746216719,
+ "time_sec": 132.1089198589325
+ },
+ {
+ "epoch": 48,
+ "train_loss": 5.34227012512207,
+ "train_acc": 0.00988,
+ "test_loss": 11.343988357543946,
+ "test_acc": 0.01,
+ "lyapunov": 1.5652936489685723,
+ "grad_norm": 0.16074333900064897,
+ "grad_max_sv": 0.07524463571608067,
+ "grad_min_sv": 4.129742513509048e-34,
+ "grad_condition": 75244635716.08066,
+ "lr": 0.0007679133974894982,
+ "time_sec": 132.16328692436218
+ },
+ {
+ "epoch": 49,
+ "train_loss": 5.344108670349121,
+ "train_acc": 0.00988,
+ "test_loss": 11.356095449829102,
+ "test_acc": 0.01,
+ "lyapunov": 1.5667558609677092,
+ "grad_norm": 0.15860129770355044,
+ "grad_max_sv": 0.07414976768195629,
+ "grad_min_sv": 2.920054218147879e-21,
+ "grad_condition": 74149767435.12958,
+ "lr": 0.000759013504686565,
+ "time_sec": 132.1159553527832
+ },
+ {
+ "epoch": 50,
+ "train_loss": 5.3415603378295895,
+ "train_acc": 0.00976,
+ "test_loss": 11.700657446289062,
+ "test_acc": 0.01,
+ "lyapunov": 1.5651936311551067,
+ "grad_norm": 0.14626453498485173,
+ "grad_max_sv": 0.05773629667237401,
+ "grad_min_sv": 7.389830128226318e-40,
+ "grad_condition": 57736296672.37401,
+ "lr": 0.0007499999999999998,
+ "time_sec": 132.10842418670654
+ },
+ {
+ "epoch": 51,
+ "train_loss": 5.345499488220215,
+ "train_acc": 0.0091,
+ "test_loss": 7.841943490600586,
+ "test_acc": 0.01,
+ "lyapunov": 1.5647823362399245,
+ "grad_norm": 0.19931882783012003,
+ "grad_max_sv": 0.13148421347141265,
+ "grad_min_sv": 1.1399481724407015e-14,
+ "grad_condition": 129966725437.33623,
+ "lr": 0.0007408768370508575,
+ "time_sec": 132.13836026191711
+ },
+ {
+ "epoch": 52,
+ "train_loss": 5.346541320800781,
+ "train_acc": 0.01036,
+ "test_loss": 8.251887129211426,
+ "test_acc": 0.01,
+ "lyapunov": 1.565840955280587,
+ "grad_norm": 0.21227656722607438,
+ "grad_max_sv": 0.14938069488853217,
+ "grad_min_sv": 2.1186636603898966e-14,
+ "grad_condition": 146306194841.0702,
+ "lr": 0.0007316480175599307,
+ "time_sec": 132.21652913093567
+ },
+ {
+ "epoch": 53,
+ "train_loss": 5.346332246856689,
+ "train_acc": 0.00998,
+ "test_loss": 8.80145364074707,
+ "test_acc": 0.01,
+ "lyapunov": 1.5666624332023094,
+ "grad_norm": 0.2018507800384921,
+ "grad_max_sv": 0.12567667234688998,
+ "grad_min_sv": 4.6990583254762225e-15,
+ "grad_condition": 125036911617.91772,
+ "lr": 0.0007223175895924635,
+ "time_sec": 132.1492202281952
+ },
+ {
+ "epoch": 54,
+ "train_loss": 5.344240028381348,
+ "train_acc": 0.0096,
+ "test_loss": 8.331844716644287,
+ "test_acc": 0.01,
+ "lyapunov": 1.5653653464963675,
+ "grad_norm": 0.1977193203709713,
+ "grad_max_sv": 0.12096917647868395,
+ "grad_min_sv": 2.717621440740357e-15,
+ "grad_condition": 120646434306.70581,
+ "lr": 0.0007128896457825361,
+ "time_sec": 132.13583779335022
+ },
+ {
+ "epoch": 55,
+ "train_loss": 5.34588626373291,
+ "train_acc": 0.00938,
+ "test_loss": 8.483297344970703,
+ "test_acc": 0.01,
+ "lyapunov": 1.5671809872093103,
+ "grad_norm": 0.17917342896025326,
+ "grad_max_sv": 0.10660264752805233,
+ "grad_min_sv": 2.903017749905976e-15,
+ "grad_condition": 106288369212.58371,
+ "lr": 0.0007033683215378998,
+ "time_sec": 132.12570214271545
+ },
+ {
+ "epoch": 56,
+ "train_loss": 5.347936657714844,
+ "train_acc": 0.00928,
+ "test_loss": 12.471004583740234,
+ "test_acc": 0.01,
+ "lyapunov": 1.5704145821768913,
+ "grad_norm": 0.1585992442529963,
+ "grad_max_sv": 0.05894996239803731,
+ "grad_min_sv": 4.065829085829974e-17,
+ "grad_condition": 58945476044.698166,
+ "lr": 0.0006937577932260512,
+ "time_sec": 132.08077478408813
+ },
+ {
+ "epoch": 57,
+ "train_loss": 5.350657684173584,
+ "train_acc": 0.00942,
+ "test_loss": 11.975766296386718,
+ "test_acc": 0.01,
+ "lyapunov": 1.572284730803936,
+ "grad_norm": 0.16329462100720574,
+ "grad_max_sv": 0.018565936107188465,
+ "grad_min_sv": 0.0,
+ "grad_condition": 18565936107.188465,
+ "lr": 0.0006840622763423388,
+ "time_sec": 132.12146091461182
+ },
+ {
+ "epoch": 58,
+ "train_loss": 5.342193555297851,
+ "train_acc": 0.00952,
+ "test_loss": 12.00783012084961,
+ "test_acc": 0.01,
+ "lyapunov": 1.5669191542183956,
+ "grad_norm": 0.13144150243285688,
+ "grad_max_sv": 0.014100767159834503,
+ "grad_min_sv": 0.0,
+ "grad_condition": 14100767159.834503,
+ "lr": 0.0006742860236609073,
+ "time_sec": 132.0214581489563
+ },
+ {
+ "epoch": 59,
+ "train_loss": 5.349671448669434,
+ "train_acc": 0.0097,
+ "test_loss": 12.08228343963623,
+ "test_acc": 0.01,
+ "lyapunov": 1.5733529234786168,
+ "grad_norm": 0.15236031303960995,
+ "grad_max_sv": 0.002432991983368993,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2432991983.368993,
+ "lr": 0.0006644333233692913,
+ "time_sec": 131.98429799079895
+ },
+ {
+ "epoch": 60,
+ "train_loss": 5.343136109619141,
+ "train_acc": 0.00986,
+ "test_loss": 10.815134619140625,
+ "test_acc": 0.01,
+ "lyapunov": 1.567219941207515,
+ "grad_norm": 0.13665097355727693,
+ "grad_max_sv": 0.03331217863596976,
+ "grad_min_sv": 4.039363544528912e-19,
+ "grad_condition": 33312131775.42389,
+ "lr": 0.0006545084971874734,
+ "time_sec": 132.03068280220032
+ },
+ {
+ "epoch": 61,
+ "train_loss": 5.344384336853027,
+ "train_acc": 0.01022,
+ "test_loss": 11.902839001464844,
+ "test_acc": 0.01,
+ "lyapunov": 1.5653783214061767,
+ "grad_norm": 0.18581223375617745,
+ "grad_max_sv": 0.11722703091800213,
+ "grad_min_sv": 1.8473140836599877e-15,
+ "grad_condition": 117024266905.12569,
+ "lr": 0.0006445158984722354,
+ "time_sec": 132.11943864822388
+ },
+ {
+ "epoch": 62,
+ "train_loss": 5.346207113494873,
+ "train_acc": 0.00964,
+ "test_loss": 10.298070428466797,
+ "test_acc": 0.01,
+ "lyapunov": 1.5678635116123483,
+ "grad_norm": 0.17212702314261866,
+ "grad_max_sv": 0.11003287564963102,
+ "grad_min_sv": 1.1830899390639064e-16,
+ "grad_condition": 110021246721.88094,
+ "lr": 0.0006344599103076324,
+ "time_sec": 132.09185695648193
+ },
+ {
+ "epoch": 63,
+ "train_loss": 5.345449805297852,
+ "train_acc": 0.00958,
+ "test_loss": 9.716324475097656,
+ "test_acc": 0.01,
+ "lyapunov": 1.5676089863643012,
+ "grad_norm": 0.15858824070117938,
+ "grad_max_sv": 0.09742239024490118,
+ "grad_min_sv": 2.2791221237746455e-16,
+ "grad_condition": 97400387801.48373,
+ "lr": 0.0006243449435824269,
+ "time_sec": 132.09884762763977
+ },
+ {
+ "epoch": 64,
+ "train_loss": 5.347441923828125,
+ "train_acc": 0.01,
+ "test_loss": 9.248421519470215,
+ "test_acc": 0.01,
+ "lyapunov": 1.5703948257524338,
+ "grad_norm": 0.14831464239510592,
+ "grad_max_sv": 0.07895854022353888,
+ "grad_min_sv": 1.0966957298749494e-34,
+ "grad_condition": 78958540223.53888,
+ "lr": 0.0006141754350553275,
+ "time_sec": 132.1075723171234
+ },
+ {
+ "epoch": 65,
+ "train_loss": 5.3479963973999025,
+ "train_acc": 0.00918,
+ "test_loss": 11.96562194519043,
+ "test_acc": 0.01,
+ "lyapunov": 1.5711398328966497,
+ "grad_norm": 0.13907361248234446,
+ "grad_max_sv": 0.06278349282220005,
+ "grad_min_sv": 0.0,
+ "grad_condition": 62783492822.20006,
+ "lr": 0.0006039558454088793,
+ "time_sec": 132.1277093887329
+ },
+ {
+ "epoch": 66,
+ "train_loss": 5.343847501678467,
+ "train_acc": 0.00942,
+ "test_loss": 10.723486402893066,
+ "test_acc": 0.01,
+ "lyapunov": 1.5666573139102868,
+ "grad_norm": 0.1348401569471477,
+ "grad_max_sv": 0.07675737962126732,
+ "grad_min_sv": 0.0,
+ "grad_condition": 76757379621.2673,
+ "lr": 0.000593690657292862,
+ "time_sec": 132.15379786491394
+ },
+ {
+ "epoch": 67,
+ "train_loss": 5.348686145477295,
+ "train_acc": 0.00928,
+ "test_loss": 9.169928652954102,
+ "test_acc": 0.01,
+ "lyapunov": 1.5714481184854532,
+ "grad_norm": 0.16082287392865435,
+ "grad_max_sv": 0.09281166503205895,
+ "grad_min_sv": 4.119931040700715e-29,
+ "grad_condition": 92811665032.05894,
+ "lr": 0.0005833843733580507,
+ "time_sec": 132.15499711036682
+ },
+ {
+ "epoch": 68,
+ "train_loss": 5.346614480133057,
+ "train_acc": 0.01036,
+ "test_loss": 9.111311894226073,
+ "test_acc": 0.01,
+ "lyapunov": 1.5694071944717252,
+ "grad_norm": 0.15530027367743043,
+ "grad_max_sv": 0.09021252328529954,
+ "grad_min_sv": 9.645277459794148e-41,
+ "grad_condition": 90212523285.29953,
+ "lr": 0.0005730415142812054,
+ "time_sec": 132.0900914669037
+ },
+ {
+ "epoch": 69,
+ "train_loss": 5.345042231140137,
+ "train_acc": 0.0094,
+ "test_loss": 8.921395944213867,
+ "test_acc": 0.01,
+ "lyapunov": 1.5690713626954256,
+ "grad_norm": 0.12882941842915957,
+ "grad_max_sv": 0.05447775078937411,
+ "grad_min_sv": 0.0,
+ "grad_condition": 54477750789.374115,
+ "lr": 0.0005626666167821517,
+ "time_sec": 132.08048009872437
+ },
+ {
+ "epoch": 70,
+ "train_loss": 5.35093121887207,
+ "train_acc": 0.00998,
+ "test_loss": 9.45476280517578,
+ "test_acc": 0.01,
+ "lyapunov": 1.5726936317770683,
+ "grad_norm": 0.15278112356314727,
+ "grad_max_sv": 0.05165710533037782,
+ "grad_min_sv": 0.0,
+ "grad_condition": 51657105330.377815,
+ "lr": 0.0005522642316338265,
+ "time_sec": 132.26694178581238
+ },
+ {
+ "epoch": 71,
+ "train_loss": 5.349324496612549,
+ "train_acc": 0.0099,
+ "test_loss": 8.863416375732422,
+ "test_acc": 0.01,
+ "lyapunov": 1.572835110642416,
+ "grad_norm": 0.13044312395716468,
+ "grad_max_sv": 0.040168187906965615,
+ "grad_min_sv": 0.0,
+ "grad_condition": 40168187906.965614,
+ "lr": 0.0005418389216661573,
+ "time_sec": 132.09336495399475
+ },
+ {
+ "epoch": 72,
+ "train_loss": 5.344522937774658,
+ "train_acc": 0.0098,
+ "test_loss": 8.490674835205079,
+ "test_acc": 0.01,
+ "lyapunov": 1.5687179925191739,
+ "grad_norm": 0.12245301057298638,
+ "grad_max_sv": 0.05633250158280134,
+ "grad_min_sv": 0.0,
+ "grad_condition": 56332501582.801346,
+ "lr": 0.0005313952597646563,
+ "time_sec": 132.10885214805603
+ },
+ {
+ "epoch": 73,
+ "train_loss": 5.344547733154297,
+ "train_acc": 0.0097,
+ "test_loss": 8.686578596496583,
+ "test_acc": 0.01,
+ "lyapunov": 1.5687794383529508,
+ "grad_norm": 0.11446001541385904,
+ "grad_max_sv": 0.049419266358017924,
+ "grad_min_sv": 0.0,
+ "grad_condition": 49419266358.01792,
+ "lr": 0.0005209378268645994,
+ "time_sec": 132.04956126213074
+ },
+ {
+ "epoch": 74,
+ "train_loss": 5.3437795330810545,
+ "train_acc": 0.0094,
+ "test_loss": 8.874914520263673,
+ "test_acc": 0.01,
+ "lyapunov": 1.5682151988339241,
+ "grad_norm": 0.1237497118091755,
+ "grad_max_sv": 0.03953348807990551,
+ "grad_min_sv": 0.0,
+ "grad_condition": 39533488079.9055,
+ "lr": 0.0005104712099416781,
+ "time_sec": 132.10020518302917
+ },
+ {
+ "epoch": 75,
+ "train_loss": 5.343674107208252,
+ "train_acc": 0.0092,
+ "test_loss": 8.772430587768556,
+ "test_acc": 0.01,
+ "lyapunov": 1.5683565054403241,
+ "grad_norm": 0.11349041239477198,
+ "grad_max_sv": 0.026115051889792084,
+ "grad_min_sv": 0.0,
+ "grad_condition": 26115051889.792084,
+ "lr": 0.0004999999999999996,
+ "time_sec": 132.01686429977417
+ },
+ {
+ "epoch": 76,
+ "train_loss": 5.342641368255615,
+ "train_acc": 0.00932,
+ "test_loss": 8.705339865112304,
+ "test_acc": 0.01,
+ "lyapunov": 1.5662559923308585,
+ "grad_norm": 0.12277695191025612,
+ "grad_max_sv": 0.0629763058386743,
+ "grad_min_sv": 0.0,
+ "grad_condition": 62976305838.67432,
+ "lr": 0.0004895287900583212,
+ "time_sec": 132.05883979797363
+ },
+ {
+ "epoch": 77,
+ "train_loss": 5.341884041595459,
+ "train_acc": 0.00968,
+ "test_loss": 9.93609327545166,
+ "test_acc": 0.01,
+ "lyapunov": 1.566317234502729,
+ "grad_norm": 0.11484157346336721,
+ "grad_max_sv": 0.047401683824136856,
+ "grad_min_sv": 0.0,
+ "grad_condition": 47401683824.136856,
+ "lr": 0.0004790621731353997,
+ "time_sec": 132.05576992034912
+ },
+ {
+ "epoch": 78,
+ "train_loss": 5.343069399871826,
+ "train_acc": 0.0102,
+ "test_loss": 8.943976522827148,
+ "test_acc": 0.01,
+ "lyapunov": 1.5676431427221469,
+ "grad_norm": 0.10629466820483455,
+ "grad_max_sv": 0.034334157966077326,
+ "grad_min_sv": 0.0,
+ "grad_condition": 34334157966.077324,
+ "lr": 0.000468604740235343,
+ "time_sec": 132.03219604492188
+ },
+ {
+ "epoch": 79,
+ "train_loss": 5.342923241119385,
+ "train_acc": 0.00894,
+ "test_loss": 10.30071854095459,
+ "test_acc": 0.01,
+ "lyapunov": 1.5677035571364186,
+ "grad_norm": 0.11729853273385192,
+ "grad_max_sv": 0.018184055807068944,
+ "grad_min_sv": 0.0,
+ "grad_condition": 18184055807.068947,
+ "lr": 0.00045816107833384175,
+ "time_sec": 132.0335590839386
+ },
+ {
+ "epoch": 80,
+ "train_loss": 5.342889130249024,
+ "train_acc": 0.00868,
+ "test_loss": 9.292682635498046,
+ "test_acc": 0.01,
+ "lyapunov": 1.5676629153054085,
+ "grad_norm": 0.10602422228730526,
+ "grad_max_sv": 0.022180042415857314,
+ "grad_min_sv": 0.0,
+ "grad_condition": 22180042415.857315,
+ "lr": 0.0004477357683661729,
+ "time_sec": 132.04535913467407
+ },
+ {
+ "epoch": 81,
+ "train_loss": 5.3435448347473145,
+ "train_acc": 0.01026,
+ "test_loss": 10.646222018432617,
+ "test_acc": 0.01,
+ "lyapunov": 1.5682694253409306,
+ "grad_norm": 0.10584507536046345,
+ "grad_max_sv": 0.036097540194168685,
+ "grad_min_sv": 0.0,
+ "grad_condition": 36097540194.168686,
+ "lr": 0.00043733338321784746,
+ "time_sec": 132.0792417526245
+ },
+ {
+ "epoch": 82,
+ "train_loss": 5.346409954376221,
+ "train_acc": 0.00938,
+ "test_loss": 8.388480964660644,
+ "test_acc": 0.01,
+ "lyapunov": 1.5704751517766578,
+ "grad_norm": 0.1594968968610417,
+ "grad_max_sv": 0.05689305039122701,
+ "grad_min_sv": 0.0,
+ "grad_condition": 56893050391.227005,
+ "lr": 0.0004269584857187939,
+ "time_sec": 132.10688591003418
+ },
+ {
+ "epoch": 83,
+ "train_loss": 5.351143104705811,
+ "train_acc": 0.00934,
+ "test_loss": 10.536403848266602,
+ "test_acc": 0.01,
+ "lyapunov": 1.57418333660916,
+ "grad_norm": 0.14631187426937112,
+ "grad_max_sv": 0.043841119017452,
+ "grad_min_sv": 0.0,
+ "grad_condition": 43841119017.451996,
+ "lr": 0.0004166156266419484,
+ "time_sec": 132.08924984931946
+ },
+ {
+ "epoch": 84,
+ "train_loss": 5.345183093261719,
+ "train_acc": 0.00942,
+ "test_loss": 11.133738461303711,
+ "test_acc": 0.01,
+ "lyapunov": 1.5697272662311563,
+ "grad_norm": 0.11663908627078753,
+ "grad_max_sv": 0.04061344410292804,
+ "grad_min_sv": 0.0,
+ "grad_condition": 40613444102.92804,
+ "lr": 0.0004063093427071373,
+ "time_sec": 132.13465809822083
+ },
+ {
+ "epoch": 85,
+ "train_loss": 5.346176763000488,
+ "train_acc": 0.01038,
+ "test_loss": 11.12772626953125,
+ "test_acc": 0.01,
+ "lyapunov": 1.5703431422753102,
+ "grad_norm": 0.1377494846746287,
+ "grad_max_sv": 0.026653958344832064,
+ "grad_min_sv": 0.0,
+ "grad_condition": 26653958344.83206,
+ "lr": 0.0003960441545911199,
+ "time_sec": 132.03662395477295
+ },
+ {
+ "epoch": 86,
+ "train_loss": 5.343412326202393,
+ "train_acc": 0.00966,
+ "test_loss": 10.485674588012696,
+ "test_acc": 0.01,
+ "lyapunov": 1.568256547383945,
+ "grad_norm": 0.11507124566756707,
+ "grad_max_sv": 0.015460054902359844,
+ "grad_min_sv": 0.0,
+ "grad_condition": 15460054902.359842,
+ "lr": 0.0003858245649446718,
+ "time_sec": 132.30029678344727
+ },
+ {
+ "epoch": 87,
+ "train_loss": 5.343340453948975,
+ "train_acc": 0.0093,
+ "test_loss": 10.443886459350585,
+ "test_acc": 0.01,
+ "lyapunov": 1.5683554758501175,
+ "grad_norm": 0.11491345749975401,
+ "grad_max_sv": 0.01923052747733891,
+ "grad_min_sv": 0.0,
+ "grad_condition": 19230527477.33891,
+ "lr": 0.00037565505641757235,
+ "time_sec": 132.09554266929626
+ },
+ {
+ "epoch": 88,
+ "train_loss": 5.343219871826172,
+ "train_acc": 0.00982,
+ "test_loss": 9.331489477539062,
+ "test_acc": 0.01,
+ "lyapunov": 1.5680722632371555,
+ "grad_norm": 0.10357957499765331,
+ "grad_max_sv": 0.03583596190437675,
+ "grad_min_sv": 0.0,
+ "grad_condition": 35835961904.37675,
+ "lr": 0.00036554008969236695,
+ "time_sec": 132.38618564605713
+ },
+ {
+ "epoch": 89,
+ "train_loss": 5.345059629974365,
+ "train_acc": 0.00942,
+ "test_loss": 9.705012353515626,
+ "test_acc": 0.01,
+ "lyapunov": 1.5701254081848028,
+ "grad_norm": 0.13335748884903612,
+ "grad_max_sv": 0.01991720902733505,
+ "grad_min_sv": 0.0,
+ "grad_condition": 19917209027.335045,
+ "lr": 0.0003554841015277638,
+ "time_sec": 132.10200333595276
+ },
+ {
+ "epoch": 90,
+ "train_loss": 5.346582987670899,
+ "train_acc": 0.00936,
+ "test_loss": 9.92761245727539,
+ "test_acc": 0.01,
+ "lyapunov": 1.570894326395391,
+ "grad_norm": 0.12917945353905133,
+ "grad_max_sv": 0.005056336428970099,
+ "grad_min_sv": 0.0,
+ "grad_condition": 5056336428.9700985,
+ "lr": 0.000345491502812526,
+ "time_sec": 132.01398086547852
+ },
+ {
+ "epoch": 91,
+ "train_loss": 5.343077623138428,
+ "train_acc": 0.00948,
+ "test_loss": 9.892114511108398,
+ "test_acc": 0.01,
+ "lyapunov": 1.5679589848384223,
+ "grad_norm": 0.10089565070900397,
+ "grad_max_sv": 0.024783097906038165,
+ "grad_min_sv": 0.0,
+ "grad_condition": 24783097906.038166,
+ "lr": 0.0003355666766307081,
+ "time_sec": 132.0552315711975
+ },
+ {
+ "epoch": 92,
+ "train_loss": 5.344612928619385,
+ "train_acc": 0.00984,
+ "test_loss": 9.036325561523437,
+ "test_acc": 0.01,
+ "lyapunov": 1.5697500227052537,
+ "grad_norm": 0.13133583896592352,
+ "grad_max_sv": 0.017823219764977694,
+ "grad_min_sv": 0.0,
+ "grad_condition": 17823219764.977695,
+ "lr": 0.00032571397633909225,
+ "time_sec": 132.07679438591003
+ },
+ {
+ "epoch": 93,
+ "train_loss": 5.346883224182129,
+ "train_acc": 0.0096,
+ "test_loss": 8.63075946044922,
+ "test_acc": 0.01,
+ "lyapunov": 1.5719260608448702,
+ "grad_norm": 0.09641577817960369,
+ "grad_max_sv": 0.003358140075579286,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3358140075.5792856,
+ "lr": 0.00031593772365766094,
+ "time_sec": 132.0291886329651
+ },
+ {
+ "epoch": 94,
+ "train_loss": 5.343683553771973,
+ "train_acc": 0.00968,
+ "test_loss": 8.73685708618164,
+ "test_acc": 0.01,
+ "lyapunov": 1.5686328389760478,
+ "grad_norm": 0.09724660681276874,
+ "grad_max_sv": 0.018295074068009853,
+ "grad_min_sv": 0.0,
+ "grad_condition": 18295074068.00985,
+ "lr": 0.0003062422067739483,
+ "time_sec": 132.12304759025574
+ },
+ {
+ "epoch": 95,
+ "train_loss": 5.343045575866699,
+ "train_acc": 0.0086,
+ "test_loss": 8.563214770507813,
+ "test_acc": 0.01,
+ "lyapunov": 1.5680832335406252,
+ "grad_norm": 0.09663765425859253,
+ "grad_max_sv": 0.0011947159189730882,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1194715918.9730883,
+ "lr": 0.00029663167846209965,
+ "time_sec": 132.08247256278992
+ },
+ {
+ "epoch": 96,
+ "train_loss": 5.342066871490479,
+ "train_acc": 0.00906,
+ "test_loss": 8.190421600341796,
+ "test_acc": 0.01,
+ "lyapunov": 1.5670246782205295,
+ "grad_norm": 0.10563473423950201,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00028711035421746345,
+ "time_sec": 132.00989890098572
+ },
+ {
+ "epoch": 97,
+ "train_loss": 5.344517989196778,
+ "train_acc": 0.00956,
+ "test_loss": 7.861407074737548,
+ "test_acc": 0.01,
+ "lyapunov": 1.5693480187974622,
+ "grad_norm": 0.11742062064295959,
+ "grad_max_sv": 0.0026324169710278513,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2632416971.027851,
+ "lr": 0.00027768241040753615,
+ "time_sec": 132.0594036579132
+ },
+ {
+ "epoch": 98,
+ "train_loss": 5.347235653991699,
+ "train_acc": 0.0093,
+ "test_loss": 7.575284122467041,
+ "test_acc": 0.01,
+ "lyapunov": 1.571171855682607,
+ "grad_norm": 0.09980977977399007,
+ "grad_max_sv": 0.02286601336672902,
+ "grad_min_sv": 0.0,
+ "grad_condition": 22866013366.729023,
+ "lr": 0.00026835198244006903,
+ "time_sec": 132.04233193397522
+ },
+ {
+ "epoch": 99,
+ "train_loss": 5.343029342498779,
+ "train_acc": 0.00906,
+ "test_loss": 7.45513014831543,
+ "test_acc": 0.01,
+ "lyapunov": 1.5681262549841801,
+ "grad_norm": 0.09342461116650493,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002591231629491421,
+ "time_sec": 131.9914095401764
+ },
+ {
+ "epoch": 100,
+ "train_loss": 5.3494312777709965,
+ "train_acc": 0.00946,
+ "test_loss": 7.298580384063721,
+ "test_acc": 0.01,
+ "lyapunov": 1.573579462897747,
+ "grad_norm": 0.11907283705246616,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002499999999999997,
+ "time_sec": 131.99966597557068
+ },
+ {
+ "epoch": 101,
+ "train_loss": 5.342477266693115,
+ "train_acc": 0.00948,
+ "test_loss": 7.23597857055664,
+ "test_acc": 0.01,
+ "lyapunov": 1.5675478393159559,
+ "grad_norm": 0.09720728561760718,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00024098649531343477,
+ "time_sec": 131.99136352539062
+ },
+ {
+ "epoch": 102,
+ "train_loss": 5.341832947845459,
+ "train_acc": 0.00952,
+ "test_loss": 6.885648638916016,
+ "test_acc": 0.01,
+ "lyapunov": 1.5668759388691933,
+ "grad_norm": 0.09041804951245885,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002320866025105016,
+ "time_sec": 131.99253511428833
+ },
+ {
+ "epoch": 103,
+ "train_loss": 5.342141702270508,
+ "train_acc": 0.00956,
+ "test_loss": 7.227639694976807,
+ "test_acc": 0.01,
+ "lyapunov": 1.5670329186007799,
+ "grad_norm": 0.09504910369326992,
+ "grad_max_sv": 0.02663951087743044,
+ "grad_min_sv": 0.0,
+ "grad_condition": 26639510877.43044,
+ "lr": 0.0002233042253783278,
+ "time_sec": 132.1089026927948
+ },
+ {
+ "epoch": 104,
+ "train_loss": 5.342686755828858,
+ "train_acc": 0.00952,
+ "test_loss": 7.590157605743408,
+ "test_acc": 0.01,
+ "lyapunov": 1.5676686721079796,
+ "grad_norm": 0.09647661834231228,
+ "grad_max_sv": 0.024380091251805423,
+ "grad_min_sv": 0.0,
+ "grad_condition": 24380091251.805428,
+ "lr": 0.000214643216157784,
+ "time_sec": 132.06964230537415
+ },
+ {
+ "epoch": 105,
+ "train_loss": 5.344026827392578,
+ "train_acc": 0.0095,
+ "test_loss": 7.26397318649292,
+ "test_acc": 0.01,
+ "lyapunov": 1.569079797895973,
+ "grad_norm": 0.09462212649965553,
+ "grad_max_sv": 0.025716999545693398,
+ "grad_min_sv": 0.0,
+ "grad_condition": 25716999545.693398,
+ "lr": 0.00020610737385376332,
+ "time_sec": 132.05113744735718
+ },
+ {
+ "epoch": 106,
+ "train_loss": 5.343383273925781,
+ "train_acc": 0.00984,
+ "test_loss": 7.472719841003418,
+ "test_acc": 0.01,
+ "lyapunov": 1.5685262430049574,
+ "grad_norm": 0.09652945369879859,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00019770044256881242,
+ "time_sec": 132.04551148414612
+ },
+ {
+ "epoch": 107,
+ "train_loss": 5.343959386138916,
+ "train_acc": 0.00958,
+ "test_loss": 7.445523268127442,
+ "test_acc": 0.01,
+ "lyapunov": 1.5691688893091342,
+ "grad_norm": 0.11388204494439719,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001894261098608447,
+ "time_sec": 132.02328181266785
+ },
+ {
+ "epoch": 108,
+ "train_loss": 5.342418379516602,
+ "train_acc": 0.00956,
+ "test_loss": 7.7173920944213865,
+ "test_acc": 0.01,
+ "lyapunov": 1.5675345683646629,
+ "grad_norm": 0.09095832390063928,
+ "grad_max_sv": 0.0006004700437188149,
+ "grad_min_sv": 0.0,
+ "grad_condition": 600470043.7188148,
+ "lr": 0.000181288005125655,
+ "time_sec": 132.05611062049866
+ },
+ {
+ "epoch": 109,
+ "train_loss": 5.343011405029297,
+ "train_acc": 0.00944,
+ "test_loss": 7.669947085571289,
+ "test_acc": 0.01,
+ "lyapunov": 1.5680827374958322,
+ "grad_norm": 0.09262475373763442,
+ "grad_max_sv": 0.005615572584792972,
+ "grad_min_sv": 0.0,
+ "grad_condition": 5615572584.792972,
+ "lr": 0.0001732896980049473,
+ "time_sec": 132.0278182029724
+ },
+ {
+ "epoch": 110,
+ "train_loss": 5.343270805511475,
+ "train_acc": 0.00902,
+ "test_loss": 7.524606921386718,
+ "test_acc": 0.01,
+ "lyapunov": 1.5684265477578048,
+ "grad_norm": 0.0929528487372896,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00016543469682057076,
+ "time_sec": 132.01432704925537
+ },
+ {
+ "epoch": 111,
+ "train_loss": 5.3430648620605465,
+ "train_acc": 0.00908,
+ "test_loss": 7.709186791992187,
+ "test_acc": 0.01,
+ "lyapunov": 1.568246929236995,
+ "grad_norm": 0.08919578457075998,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00015772644703565552,
+ "time_sec": 131.99741911888123
+ },
+ {
+ "epoch": 112,
+ "train_loss": 5.343547642822266,
+ "train_acc": 0.00982,
+ "test_loss": 7.633082518005371,
+ "test_acc": 0.01,
+ "lyapunov": 1.56872364535661,
+ "grad_norm": 0.09053282340492008,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00015016832974331713,
+ "time_sec": 131.9864740371704
+ },
+ {
+ "epoch": 113,
+ "train_loss": 5.349385154571533,
+ "train_acc": 0.00926,
+ "test_loss": 7.402510799407959,
+ "test_acc": 0.01,
+ "lyapunov": 1.573695613295221,
+ "grad_norm": 0.1331401826658418,
+ "grad_max_sv": 0.007452957844361663,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7452957844.361662,
+ "lr": 0.00014276366018359834,
+ "time_sec": 131.9871220588684
+ },
+ {
+ "epoch": 114,
+ "train_loss": 5.3475169880676265,
+ "train_acc": 0.00952,
+ "test_loss": 7.718253441619873,
+ "test_acc": 0.01,
+ "lyapunov": 1.5723201231578428,
+ "grad_norm": 0.12289444805074258,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00013551568628929425,
+ "time_sec": 131.98372554779053
+ },
+ {
+ "epoch": 115,
+ "train_loss": 5.344510088806152,
+ "train_acc": 0.0094,
+ "test_loss": 7.667512203216552,
+ "test_acc": 0.01,
+ "lyapunov": 1.569762335713867,
+ "grad_norm": 0.09241242910799227,
+ "grad_max_sv": 0.008661840902641415,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8661840902.641415,
+ "lr": 0.00012842758726130276,
+ "time_sec": 132.05068254470825
+ },
+ {
+ "epoch": 116,
+ "train_loss": 5.343971741943359,
+ "train_acc": 0.00908,
+ "test_loss": 7.700549072265625,
+ "test_acc": 0.01,
+ "lyapunov": 1.5691710436130728,
+ "grad_norm": 0.10830143197848235,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001215024721741218,
+ "time_sec": 132.05018138885498
+ },
+ {
+ "epoch": 117,
+ "train_loss": 5.34632839920044,
+ "train_acc": 0.00976,
+ "test_loss": 7.761262622070313,
+ "test_acc": 0.01,
+ "lyapunov": 1.5713817326309125,
+ "grad_norm": 0.11435501476976112,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00011474337861210538,
+ "time_sec": 131.99043989181519
+ },
+ {
+ "epoch": 118,
+ "train_loss": 5.343400028686523,
+ "train_acc": 0.0092,
+ "test_loss": 7.794083961486816,
+ "test_acc": 0.01,
+ "lyapunov": 1.5685766228019733,
+ "grad_norm": 0.08899614535065951,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010815327133708009,
+ "time_sec": 131.99262475967407
+ },
+ {
+ "epoch": 119,
+ "train_loss": 5.343056818084717,
+ "train_acc": 0.00994,
+ "test_loss": 7.639262364196777,
+ "test_acc": 0.01,
+ "lyapunov": 1.5682302356680946,
+ "grad_norm": 0.08977728685492378,
+ "grad_max_sv": 0.0006828804966062307,
+ "grad_min_sv": 0.0,
+ "grad_condition": 682880496.6062307,
+ "lr": 0.00010173504098790182,
+ "time_sec": 132.01868438720703
+ },
+ {
+ "epoch": 120,
+ "train_loss": 5.343217134552002,
+ "train_acc": 0.00976,
+ "test_loss": 7.660574660491943,
+ "test_acc": 0.01,
+ "lyapunov": 1.5684062449828438,
+ "grad_norm": 0.09249377742678497,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 132.00144267082214
+ },
+ {
+ "epoch": 121,
+ "train_loss": 5.344638092651367,
+ "train_acc": 0.00922,
+ "test_loss": 7.663163458251953,
+ "test_acc": 0.01,
+ "lyapunov": 1.5699151044001665,
+ "grad_norm": 0.1218726255205378,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 132.01804733276367
+ },
+ {
+ "epoch": 122,
+ "train_loss": 5.348134873046875,
+ "train_acc": 0.00886,
+ "test_loss": 7.884050512695312,
+ "test_acc": 0.01,
+ "lyapunov": 1.5724969224246872,
+ "grad_norm": 0.09050076665656355,
+ "grad_max_sv": 0.006364198122173548,
+ "grad_min_sv": 0.0,
+ "grad_condition": 6364198122.173548,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 132.0272445678711
+ },
+ {
+ "epoch": 123,
+ "train_loss": 5.345365750579834,
+ "train_acc": 0.00954,
+ "test_loss": 7.118724527740478,
+ "test_acc": 0.01,
+ "lyapunov": 1.5703083133453604,
+ "grad_norm": 0.09069370794057488,
+ "grad_max_sv": 0.011258925357833505,
+ "grad_min_sv": 0.0,
+ "grad_condition": 11258925357.833506,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 132.11900568008423
+ },
+ {
+ "epoch": 124,
+ "train_loss": 5.3431124142456055,
+ "train_acc": 0.01036,
+ "test_loss": 7.23227484741211,
+ "test_acc": 0.01,
+ "lyapunov": 1.568215018952899,
+ "grad_norm": 0.09217613058420869,
+ "grad_max_sv": 0.022803956363350152,
+ "grad_min_sv": 0.0,
+ "grad_condition": 22803956363.35015,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 132.04238414764404
+ },
+ {
+ "epoch": 125,
+ "train_loss": 5.343697594146729,
+ "train_acc": 0.00968,
+ "test_loss": 7.098866456604004,
+ "test_acc": 0.01,
+ "lyapunov": 1.5689014327495605,
+ "grad_norm": 0.09081931856189392,
+ "grad_max_sv": 0.0006075550802052021,
+ "grad_min_sv": 0.0,
+ "grad_condition": 607555080.2052021,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 132.0574872493744
+ },
+ {
+ "epoch": 126,
+ "train_loss": 5.34278548538208,
+ "train_acc": 0.00934,
+ "test_loss": 7.256412179565429,
+ "test_acc": 0.01,
+ "lyapunov": 1.5679547353778653,
+ "grad_norm": 0.09038480638705418,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 132.04981470108032
+ },
+ {
+ "epoch": 127,
+ "train_loss": 5.342774636230469,
+ "train_acc": 0.0091,
+ "test_loss": 7.211266984558105,
+ "test_acc": 0.01,
+ "lyapunov": 1.567944114470421,
+ "grad_norm": 0.089217745438497,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 132.0332305431366
+ },
+ {
+ "epoch": 128,
+ "train_loss": 5.343552632446289,
+ "train_acc": 0.00974,
+ "test_loss": 7.4164355209350585,
+ "test_acc": 0.01,
+ "lyapunov": 1.5687480887488636,
+ "grad_norm": 0.11327584151012998,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 132.0342137813568
+ },
+ {
+ "epoch": 129,
+ "train_loss": 5.343920302124023,
+ "train_acc": 0.00956,
+ "test_loss": 7.272874592590332,
+ "test_acc": 0.01,
+ "lyapunov": 1.5691817562903285,
+ "grad_norm": 0.09015948976899717,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 132.10112881660461
+ },
+ {
+ "epoch": 130,
+ "train_loss": 5.3440144625854495,
+ "train_acc": 0.01,
+ "test_loss": 7.378188175964356,
+ "test_acc": 0.01,
+ "lyapunov": 1.5693023784081344,
+ "grad_norm": 0.08928317026508968,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 132.07870721817017
+ },
+ {
+ "epoch": 131,
+ "train_loss": 5.343164742889404,
+ "train_acc": 0.01,
+ "test_loss": 7.42498392944336,
+ "test_acc": 0.01,
+ "lyapunov": 1.5683802131496731,
+ "grad_norm": 0.08938231829702648,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 132.035484790802
+ },
+ {
+ "epoch": 132,
+ "train_loss": 5.343568996734619,
+ "train_acc": 0.01,
+ "test_loss": 7.3698252609252926,
+ "test_acc": 0.01,
+ "lyapunov": 1.5688252653307317,
+ "grad_norm": 0.08905121975076379,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 132.03120112419128
+ },
+ {
+ "epoch": 133,
+ "train_loss": 5.343650721282959,
+ "train_acc": 0.01,
+ "test_loss": 7.399177293395996,
+ "test_acc": 0.01,
+ "lyapunov": 1.568874374070131,
+ "grad_norm": 0.08945297165320838,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 132.04973649978638
+ },
+ {
+ "epoch": 134,
+ "train_loss": 5.344010626678466,
+ "train_acc": 0.01,
+ "test_loss": 7.451564918518066,
+ "test_acc": 0.01,
+ "lyapunov": 1.569275133750018,
+ "grad_norm": 0.08901909798719944,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 132.0272672176361
+ },
+ {
+ "epoch": 135,
+ "train_loss": 5.3513097511291505,
+ "train_acc": 0.01,
+ "test_loss": 7.494620336914062,
+ "test_acc": 0.01,
+ "lyapunov": 1.5749251406515956,
+ "grad_norm": 0.11347426013089548,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 132.07217669487
+ },
+ {
+ "epoch": 136,
+ "train_loss": 5.344121324768066,
+ "train_acc": 0.01,
+ "test_loss": 7.466115431976318,
+ "test_acc": 0.01,
+ "lyapunov": 1.5693210134725741,
+ "grad_norm": 0.13961703652050822,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 132.09098315238953
+ },
+ {
+ "epoch": 137,
+ "train_loss": 5.3435055235290525,
+ "train_acc": 0.01,
+ "test_loss": 7.356763949584961,
+ "test_acc": 0.01,
+ "lyapunov": 1.5687689787286627,
+ "grad_norm": 0.08881051948095202,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 132.01117372512817
+ },
+ {
+ "epoch": 138,
+ "train_loss": 5.343292431945801,
+ "train_acc": 0.01,
+ "test_loss": 7.423162863159179,
+ "test_acc": 0.01,
+ "lyapunov": 1.5685121305763263,
+ "grad_norm": 0.08882639322875942,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 132.0426745414734
+ },
+ {
+ "epoch": 139,
+ "train_loss": 5.345961066894532,
+ "train_acc": 0.01,
+ "test_loss": 7.442799024963379,
+ "test_acc": 0.01,
+ "lyapunov": 1.5709345974885593,
+ "grad_norm": 0.11315656196544904,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 132.11658310890198
+ },
+ {
+ "epoch": 140,
+ "train_loss": 5.343492304992676,
+ "train_acc": 0.01,
+ "test_loss": 7.444627010345459,
+ "test_acc": 0.01,
+ "lyapunov": 1.5687398992840895,
+ "grad_norm": 0.08884505400987935,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 132.04373836517334
+ },
+ {
+ "epoch": 141,
+ "train_loss": 5.344924531860352,
+ "train_acc": 0.01,
+ "test_loss": 7.465608943176269,
+ "test_acc": 0.01,
+ "lyapunov": 1.570182631387735,
+ "grad_norm": 0.0880861679030681,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 132.03311824798584
+ },
+ {
+ "epoch": 142,
+ "train_loss": 5.343007263793945,
+ "train_acc": 0.01,
+ "test_loss": 7.4812581214904785,
+ "test_acc": 0.01,
+ "lyapunov": 1.5682257471791923,
+ "grad_norm": 0.08813951319538865,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 132.02575135231018
+ },
+ {
+ "epoch": 143,
+ "train_loss": 5.343106704711914,
+ "train_acc": 0.01,
+ "test_loss": 7.437115397644043,
+ "test_acc": 0.01,
+ "lyapunov": 1.5683247204631796,
+ "grad_norm": 0.10158596989760496,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 132.05020785331726
+ },
+ {
+ "epoch": 144,
+ "train_loss": 5.34294032119751,
+ "train_acc": 0.01,
+ "test_loss": 7.48037815246582,
+ "test_acc": 0.01,
+ "lyapunov": 1.5681621552733205,
+ "grad_norm": 0.08833317407426634,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 132.06616115570068
+ },
+ {
+ "epoch": 145,
+ "train_loss": 5.3438012377929685,
+ "train_acc": 0.01,
+ "test_loss": 7.496150346374511,
+ "test_acc": 0.01,
+ "lyapunov": 1.5690925231065287,
+ "grad_norm": 0.08791012889132134,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 132.04411220550537
+ },
+ {
+ "epoch": 146,
+ "train_loss": 5.342738318328857,
+ "train_acc": 0.01,
+ "test_loss": 7.490428826141358,
+ "test_acc": 0.01,
+ "lyapunov": 1.5679414330236137,
+ "grad_norm": 0.08841039102397012,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 132.08523440361023
+ },
+ {
+ "epoch": 147,
+ "train_loss": 5.3446823258972165,
+ "train_acc": 0.01,
+ "test_loss": 7.497726692199707,
+ "test_acc": 0.01,
+ "lyapunov": 1.5699935627105597,
+ "grad_norm": 0.08776043049557726,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 132.03058862686157
+ },
+ {
+ "epoch": 148,
+ "train_loss": 5.343377943572998,
+ "train_acc": 0.01,
+ "test_loss": 7.49042504272461,
+ "test_acc": 0.01,
+ "lyapunov": 1.5686415504006779,
+ "grad_norm": 0.08845953592324265,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 132.1206715106964
+ },
+ {
+ "epoch": 149,
+ "train_loss": 5.342948052978516,
+ "train_acc": 0.01,
+ "test_loss": 7.490426095581054,
+ "test_acc": 0.01,
+ "lyapunov": 1.5681962311420294,
+ "grad_norm": 0.08842267718527619,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 132.15464973449707
+ },
+ {
+ "epoch": 150,
+ "train_loss": 5.341931441345215,
+ "train_acc": 0.01,
+ "test_loss": 7.487130715942383,
+ "test_acc": 0.01,
+ "lyapunov": 1.567085372822364,
+ "grad_norm": 0.0882430826444348,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0,
+ "time_sec": 132.04750204086304
+ }
+ ],
+ "16": [
+ {
+ "epoch": 1,
+ "train_loss": 5.159331872253418,
+ "train_acc": 0.01526,
+ "test_loss": 4.873309817504883,
+ "test_acc": 0.0093,
+ "lyapunov": 2.4743038653717626,
+ "grad_norm": 5.258705722697472,
+ "grad_max_sv": 4.479718285799026,
+ "grad_min_sv": 8.709666913797598e-08,
+ "grad_condition": 86685976.9902235,
+ "lr": 0.0009998903417374227,
+ "time_sec": 177.3543930053711
+ },
+ {
+ "epoch": 2,
+ "train_loss": 4.886084578857422,
+ "train_acc": 0.01782,
+ "test_loss": 4.853029528808594,
+ "test_acc": 0.01,
+ "lyapunov": 1.9916716545744015,
+ "grad_norm": 3.460383424161388,
+ "grad_max_sv": 2.7798140585422515,
+ "grad_min_sv": 5.706028290974885e-08,
+ "grad_condition": 56364730.82112197,
+ "lr": 0.0009995614150494292,
+ "time_sec": 177.3599088191986
+ },
+ {
+ "epoch": 3,
+ "train_loss": 4.784042566375732,
+ "train_acc": 0.01776,
+ "test_loss": 4.790321257781982,
+ "test_acc": 0.0116,
+ "lyapunov": 1.7964752174704277,
+ "grad_norm": 2.38204770499042,
+ "grad_max_sv": 1.8151098906993866,
+ "grad_min_sv": 3.787766869461917e-08,
+ "grad_condition": 87913704.86086728,
+ "lr": 0.0009990133642141358,
+ "time_sec": 177.30120587348938
+ },
+ {
+ "epoch": 4,
+ "train_loss": 4.7238768682861325,
+ "train_acc": 0.017,
+ "test_loss": 4.624422996520996,
+ "test_acc": 0.01,
+ "lyapunov": 1.708475301332791,
+ "grad_norm": 1.1762359291788405,
+ "grad_max_sv": 0.7854173953674035,
+ "grad_min_sv": 9.800736290438679e-09,
+ "grad_condition": 32224269144.49076,
+ "lr": 0.0009982464296247522,
+ "time_sec": 177.37837982177734
+ },
+ {
+ "epoch": 5,
+ "train_loss": 4.755855419616699,
+ "train_acc": 0.01562,
+ "test_loss": 4.610174011230469,
+ "test_acc": 0.01,
+ "lyapunov": 1.675043061871053,
+ "grad_norm": 0.7259009952417778,
+ "grad_max_sv": 0.5301507465541363,
+ "grad_min_sv": 5.1440461827152224e-11,
+ "grad_condition": 105915112802.73376,
+ "lr": 0.0009972609476841367,
+ "time_sec": 177.381986618042
+ },
+ {
+ "epoch": 6,
+ "train_loss": 4.81643141998291,
+ "train_acc": 0.01288,
+ "test_loss": 4.60545783996582,
+ "test_acc": 0.01,
+ "lyapunov": 1.6532284676876214,
+ "grad_norm": 0.4607532772533372,
+ "grad_max_sv": 0.3609377399086952,
+ "grad_min_sv": 5.305074951633812e-13,
+ "grad_condition": 279971546429.15295,
+ "lr": 0.000996057350657239,
+ "time_sec": 177.434068441391
+ },
+ {
+ "epoch": 7,
+ "train_loss": 4.86136633392334,
+ "train_acc": 0.01224,
+ "test_loss": 5.360651237487793,
+ "test_acc": 0.01,
+ "lyapunov": 1.6404305040988776,
+ "grad_norm": 0.3680696909769052,
+ "grad_max_sv": 0.316419655829668,
+ "grad_min_sv": 4.076535490995613e-14,
+ "grad_condition": 307643620830.443,
+ "lr": 0.000994636166481494,
+ "time_sec": 177.2750985622406
+ },
+ {
+ "epoch": 8,
+ "train_loss": 4.912417060089111,
+ "train_acc": 0.01054,
+ "test_loss": 9.9219926071167,
+ "test_acc": 0.01,
+ "lyapunov": 1.6378350980446468,
+ "grad_norm": 0.4461762738170382,
+ "grad_max_sv": 0.26778712812811134,
+ "grad_min_sv": 1.894336000793759e-10,
+ "grad_condition": 230695726821.5417,
+ "lr": 0.0009929980185352525,
+ "time_sec": 177.29276037216187
+ },
+ {
+ "epoch": 9,
+ "train_loss": 4.968367258911133,
+ "train_acc": 0.00954,
+ "test_loss": 7.827674491882324,
+ "test_acc": 0.01,
+ "lyapunov": 1.624799670465767,
+ "grad_norm": 0.5375330781925154,
+ "grad_max_sv": 0.19412051439285277,
+ "grad_min_sv": 1.2617160814236554e-09,
+ "grad_condition": 49059473464.09962,
+ "lr": 0.0009911436253643444,
+ "time_sec": 177.24522376060486
+ },
+ {
+ "epoch": 10,
+ "train_loss": 5.062082354125977,
+ "train_acc": 0.01038,
+ "test_loss": 5.569893667602539,
+ "test_acc": 0.01,
+ "lyapunov": 1.6864765662976238,
+ "grad_norm": 0.753548419446606,
+ "grad_max_sv": 0.4160853669047356,
+ "grad_min_sv": 5.35826894499278e-09,
+ "grad_condition": 10262508595.882322,
+ "lr": 0.0009890738003669028,
+ "time_sec": 177.3631317615509
+ },
+ {
+ "epoch": 11,
+ "train_loss": 5.058011302032471,
+ "train_acc": 0.00952,
+ "test_loss": 5.087331884002686,
+ "test_acc": 0.01,
+ "lyapunov": 1.6062763267770752,
+ "grad_norm": 0.6603912459051273,
+ "grad_max_sv": 0.3468701772391796,
+ "grad_min_sv": 4.421987463785291e-09,
+ "grad_condition": 31727265214.824364,
+ "lr": 0.00098678945143658,
+ "time_sec": 177.38562989234924
+ },
+ {
+ "epoch": 12,
+ "train_loss": 5.058439118957519,
+ "train_acc": 0.00978,
+ "test_loss": 5.082496954345703,
+ "test_acc": 0.01,
+ "lyapunov": 1.5697322474111377,
+ "grad_norm": 0.3523516525308902,
+ "grad_max_sv": 0.15937897935509682,
+ "grad_min_sv": 1.873834291129129e-09,
+ "grad_condition": 2759306059.465498,
+ "lr": 0.0009842915805643154,
+ "time_sec": 177.36675763130188
+ },
+ {
+ "epoch": 13,
+ "train_loss": 5.109822076416016,
+ "train_acc": 0.00966,
+ "test_loss": 5.692898876953125,
+ "test_acc": 0.01,
+ "lyapunov": 1.5695562542551924,
+ "grad_norm": 0.4593422563560374,
+ "grad_max_sv": 0.35409238263964654,
+ "grad_min_sv": 4.71099455383317e-09,
+ "grad_condition": 127958722.61296721,
+ "lr": 0.000981581283398829,
+ "time_sec": 177.44806337356567
+ },
+ {
+ "epoch": 14,
+ "train_loss": 5.165816433410645,
+ "train_acc": 0.01014,
+ "test_loss": 7.84957985534668,
+ "test_acc": 0.01,
+ "lyapunov": 1.5709327590435058,
+ "grad_norm": 0.5694077536605798,
+ "grad_max_sv": 0.4453627858310938,
+ "grad_min_sv": 5.610913853565864e-09,
+ "grad_condition": 15313856896.7998,
+ "lr": 0.0009786597487660333,
+ "time_sec": 177.33772945404053
+ },
+ {
+ "epoch": 15,
+ "train_loss": 5.173155229797363,
+ "train_acc": 0.00972,
+ "test_loss": 5.157973370361328,
+ "test_acc": 0.01,
+ "lyapunov": 1.5706551062786365,
+ "grad_norm": 0.43055135839909847,
+ "grad_max_sv": 0.21150126457214355,
+ "grad_min_sv": 1.4762666979190565e-09,
+ "grad_condition": 47799778820.01504,
+ "lr": 0.0009755282581475766,
+ "time_sec": 177.33515882492065
+ },
+ {
+ "epoch": 16,
+ "train_loss": 5.207788455657959,
+ "train_acc": 0.00962,
+ "test_loss": 7.759160287475586,
+ "test_acc": 0.01,
+ "lyapunov": 1.5720331275554569,
+ "grad_norm": 0.3894440758556563,
+ "grad_max_sv": 0.1499915760010481,
+ "grad_min_sv": 1.4193079274022143e-09,
+ "grad_condition": 19769526881.522236,
+ "lr": 0.0009721881851187403,
+ "time_sec": 177.28159952163696
+ },
+ {
+ "epoch": 17,
+ "train_loss": 5.25385222076416,
+ "train_acc": 0.00914,
+ "test_loss": 4.720599290466309,
+ "test_acc": 0.01,
+ "lyapunov": 1.579244610293747,
+ "grad_norm": 0.3647403085884025,
+ "grad_max_sv": 0.17017204388976098,
+ "grad_min_sv": 1.3479770702114132e-09,
+ "grad_condition": 29838909132.92096,
+ "lr": 0.0009686409947459456,
+ "time_sec": 177.3482620716095
+ },
+ {
+ "epoch": 18,
+ "train_loss": 5.290630603790283,
+ "train_acc": 0.00966,
+ "test_loss": 4.818104879760742,
+ "test_acc": 0.01,
+ "lyapunov": 1.572280853300753,
+ "grad_norm": 0.42846936793954693,
+ "grad_max_sv": 0.2142110202461481,
+ "grad_min_sv": 2.2586123961791682e-09,
+ "grad_condition": 6069325065.621381,
+ "lr": 0.0009648882429441254,
+ "time_sec": 177.32465243339539
+ },
+ {
+ "epoch": 19,
+ "train_loss": 5.347908495483399,
+ "train_acc": 0.00976,
+ "test_loss": 4.680776121520996,
+ "test_acc": 0.01,
+ "lyapunov": 1.575872380715197,
+ "grad_norm": 0.575049551174443,
+ "grad_max_sv": 0.43422624468803406,
+ "grad_min_sv": 4.46815191792408e-09,
+ "grad_condition": 771924430.9754374,
+ "lr": 0.00096093157579425,
+ "time_sec": 177.39169430732727
+ },
+ {
+ "epoch": 20,
+ "train_loss": 5.372361971588135,
+ "train_acc": 0.0092,
+ "test_loss": 4.661239500427246,
+ "test_acc": 0.01,
+ "lyapunov": 1.5752952742149762,
+ "grad_norm": 0.48504969680471643,
+ "grad_max_sv": 0.3245972327888012,
+ "grad_min_sv": 3.24804563384129e-09,
+ "grad_condition": 111189476.23947105,
+ "lr": 0.0009567727288213001,
+ "time_sec": 177.45550775527954
+ },
+ {
+ "epoch": 21,
+ "train_loss": 5.37029109954834,
+ "train_acc": 0.00994,
+ "test_loss": 4.667470470428467,
+ "test_acc": 0.01,
+ "lyapunov": 1.5776933690775996,
+ "grad_norm": 0.5453589213556644,
+ "grad_max_sv": 0.3167274951934814,
+ "grad_min_sv": 1.839770059066596e-09,
+ "grad_condition": 35181903296.3187,
+ "lr": 0.0009524135262330095,
+ "time_sec": 177.39379477500916
+ },
+ {
+ "epoch": 22,
+ "train_loss": 5.364489818725586,
+ "train_acc": 0.01004,
+ "test_loss": 4.650138076782227,
+ "test_acc": 0.01,
+ "lyapunov": 1.5788932602728725,
+ "grad_norm": 0.41535739480122674,
+ "grad_max_sv": 0.2576656248420477,
+ "grad_min_sv": 1.5858205317854233e-12,
+ "grad_condition": 141035021433.30975,
+ "lr": 0.0009478558801197061,
+ "time_sec": 177.35208559036255
+ },
+ {
+ "epoch": 23,
+ "train_loss": 5.354643789978027,
+ "train_acc": 0.0095,
+ "test_loss": 4.695660099029541,
+ "test_acc": 0.01,
+ "lyapunov": 1.5758325334095284,
+ "grad_norm": 0.30581042910039435,
+ "grad_max_sv": 0.09805708080530166,
+ "grad_min_sv": 6.027597976882962e-11,
+ "grad_condition": 58654490617.71743,
+ "lr": 0.000943101789615607,
+ "time_sec": 177.3221151828766
+ },
+ {
+ "epoch": 24,
+ "train_loss": 5.353882457122802,
+ "train_acc": 0.00926,
+ "test_loss": 4.697132012939453,
+ "test_acc": 0.01,
+ "lyapunov": 1.578979221756196,
+ "grad_norm": 0.24237849220724425,
+ "grad_max_sv": 0.008070914912968874,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8070914912.968875,
+ "lr": 0.0009381533400219313,
+ "time_sec": 177.2640483379364
+ },
+ {
+ "epoch": 25,
+ "train_loss": 5.351721515655518,
+ "train_acc": 0.00882,
+ "test_loss": 4.700634111022949,
+ "test_acc": 0.01,
+ "lyapunov": 1.5769606035993533,
+ "grad_norm": 0.299683664855393,
+ "grad_max_sv": 0.0009750408120453357,
+ "grad_min_sv": 0.0,
+ "grad_condition": 975040812.0453358,
+ "lr": 0.0009330127018922189,
+ "time_sec": 177.26898193359375
+ },
+ {
+ "epoch": 26,
+ "train_loss": 5.350724313659668,
+ "train_acc": 0.00882,
+ "test_loss": 4.976845028686523,
+ "test_acc": 0.01,
+ "lyapunov": 1.5759871856635794,
+ "grad_norm": 0.25282322824422004,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000927682130080253,
+ "time_sec": 177.23982048034668
+ },
+ {
+ "epoch": 27,
+ "train_loss": 5.3572762519836425,
+ "train_acc": 0.00916,
+ "test_loss": 4.699456916046143,
+ "test_acc": 0.01,
+ "lyapunov": 1.5826555691716615,
+ "grad_norm": 0.3870563147260469,
+ "grad_max_sv": 0.0008042730391025543,
+ "grad_min_sv": 0.0,
+ "grad_condition": 804273039.1025543,
+ "lr": 0.0009221639627510072,
+ "time_sec": 177.22700691223145
+ },
+ {
+ "epoch": 28,
+ "train_loss": 5.352617038269043,
+ "train_acc": 0.0083,
+ "test_loss": 4.97811413192749,
+ "test_acc": 0.01,
+ "lyapunov": 1.5779867312487434,
+ "grad_norm": 0.23788834158418645,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0009164606203550494,
+ "time_sec": 177.21826004981995
+ },
+ {
+ "epoch": 29,
+ "train_loss": 5.361850127716065,
+ "train_acc": 0.00882,
+ "test_loss": 4.701448201751709,
+ "test_acc": 0.01,
+ "lyapunov": 1.5833598887524032,
+ "grad_norm": 0.42995748870040046,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0009105746045668516,
+ "time_sec": 177.21908974647522
+ },
+ {
+ "epoch": 30,
+ "train_loss": 5.358213574829102,
+ "train_acc": 0.00904,
+ "test_loss": 5.412950395202636,
+ "test_acc": 0.01,
+ "lyapunov": 1.5822858404930291,
+ "grad_norm": 0.331672095140798,
+ "grad_max_sv": 0.0007659861817955971,
+ "grad_min_sv": 0.0,
+ "grad_condition": 765986181.7955971,
+ "lr": 0.0009045084971874733,
+ "time_sec": 177.25155925750732
+ },
+ {
+ "epoch": 31,
+ "train_loss": 5.359104016113282,
+ "train_acc": 0.00934,
+ "test_loss": 4.669879191589356,
+ "test_acc": 0.01,
+ "lyapunov": 1.5799903305595184,
+ "grad_norm": 0.2952731697889261,
+ "grad_max_sv": 0.07996195461601019,
+ "grad_min_sv": 1.8027052930896337e-13,
+ "grad_condition": 65774856592.69602,
+ "lr": 0.0008982649590120977,
+ "time_sec": 177.35512685775757
+ },
+ {
+ "epoch": 32,
+ "train_loss": 5.376470304718017,
+ "train_acc": 0.0094,
+ "test_loss": 5.556229885864258,
+ "test_acc": 0.01,
+ "lyapunov": 1.5852845087075782,
+ "grad_norm": 0.34062130802734397,
+ "grad_max_sv": 0.1435967419296503,
+ "grad_min_sv": 4.671640446328522e-10,
+ "grad_condition": 42736336798.66166,
+ "lr": 0.0008918467286629196,
+ "time_sec": 177.3573558330536
+ },
+ {
+ "epoch": 33,
+ "train_loss": 5.354219467468262,
+ "train_acc": 0.00872,
+ "test_loss": 5.552221805572509,
+ "test_acc": 0.01,
+ "lyapunov": 1.5796612647488295,
+ "grad_norm": 0.24724638679639113,
+ "grad_max_sv": 0.012037708284333348,
+ "grad_min_sv": 0.0,
+ "grad_condition": 12037708284.333347,
+ "lr": 0.0008852566213878943,
+ "time_sec": 177.34085536003113
+ },
+ {
+ "epoch": 34,
+ "train_loss": 5.358693110198975,
+ "train_acc": 0.00966,
+ "test_loss": 5.034206434631348,
+ "test_acc": 0.01,
+ "lyapunov": 1.5802869622969566,
+ "grad_norm": 0.26366751089242085,
+ "grad_max_sv": 0.08639110988005996,
+ "grad_min_sv": 4.474218043386011e-15,
+ "grad_condition": 85802279590.28976,
+ "lr": 0.000878497527825878,
+ "time_sec": 177.4128155708313
+ },
+ {
+ "epoch": 35,
+ "train_loss": 5.366087015075683,
+ "train_acc": 0.00934,
+ "test_loss": 4.936266462707519,
+ "test_acc": 0.01,
+ "lyapunov": 1.584944297285641,
+ "grad_norm": 0.3376396372917839,
+ "grad_max_sv": 0.1203163092955947,
+ "grad_min_sv": 2.7491684533434274e-14,
+ "grad_condition": 116380291473.68535,
+ "lr": 0.000871572412738697,
+ "time_sec": 177.40404987335205
+ },
+ {
+ "epoch": 36,
+ "train_loss": 5.361581598358154,
+ "train_acc": 0.01024,
+ "test_loss": 4.950734414672851,
+ "test_acc": 0.01,
+ "lyapunov": 1.5822551268750749,
+ "grad_norm": 0.35809443213096964,
+ "grad_max_sv": 0.13039383399300278,
+ "grad_min_sv": 9.003150469885764e-15,
+ "grad_condition": 129198667968.56705,
+ "lr": 0.0008644843137107055,
+ "time_sec": 177.38117098808289
+ },
+ {
+ "epoch": 37,
+ "train_loss": 5.367499517974854,
+ "train_acc": 0.00976,
+ "test_loss": 5.498499377441406,
+ "test_acc": 0.01,
+ "lyapunov": 1.58695989923404,
+ "grad_norm": 0.3008050326299743,
+ "grad_max_sv": 0.1228790944442153,
+ "grad_min_sv": 5.822944316845422e-15,
+ "grad_condition": 122173960457.34317,
+ "lr": 0.0008572363398164014,
+ "time_sec": 177.40381455421448
+ },
+ {
+ "epoch": 38,
+ "train_loss": 5.360039620361328,
+ "train_acc": 0.0097,
+ "test_loss": 5.010895380401611,
+ "test_acc": 0.01,
+ "lyapunov": 1.5823902507572223,
+ "grad_norm": 0.28800004102415633,
+ "grad_max_sv": 0.10303753465414048,
+ "grad_min_sv": 1.7600771723101566e-15,
+ "grad_condition": 102819314675.69463,
+ "lr": 0.0008498316702566826,
+ "time_sec": 177.36353826522827
+ },
+ {
+ "epoch": 39,
+ "train_loss": 5.361895691375732,
+ "train_acc": 0.00962,
+ "test_loss": 5.47797232055664,
+ "test_acc": 0.01,
+ "lyapunov": 1.5826790979146348,
+ "grad_norm": 0.3607282899922051,
+ "grad_max_sv": 0.1270065199583769,
+ "grad_min_sv": 5.8177677532204334e-15,
+ "grad_condition": 126306540301.11067,
+ "lr": 0.0008422735529643442,
+ "time_sec": 177.36847496032715
+ },
+ {
+ "epoch": 40,
+ "train_loss": 5.360779151458741,
+ "train_acc": 0.00974,
+ "test_loss": 4.913441442871094,
+ "test_acc": 0.01,
+ "lyapunov": 1.5841997578320905,
+ "grad_norm": 0.30144541489536497,
+ "grad_max_sv": 0.08766317497938872,
+ "grad_min_sv": 3.1235879522614164e-15,
+ "grad_condition": 87300355595.9631,
+ "lr": 0.0008345653031794289,
+ "time_sec": 177.39417672157288
+ },
+ {
+ "epoch": 41,
+ "train_loss": 5.361253643188476,
+ "train_acc": 0.00952,
+ "test_loss": 5.392577352905273,
+ "test_acc": 0.01,
+ "lyapunov": 1.584902299334631,
+ "grad_norm": 0.33710076786895654,
+ "grad_max_sv": 0.07017813064157963,
+ "grad_min_sv": 1.8795491026783212e-20,
+ "grad_condition": 70178128751.4103,
+ "lr": 0.0008267103019950526,
+ "time_sec": 177.4070680141449
+ },
+ {
+ "epoch": 42,
+ "train_loss": 5.359663697814941,
+ "train_acc": 0.00966,
+ "test_loss": 5.435651000976563,
+ "test_acc": 0.01,
+ "lyapunov": 1.583795747793544,
+ "grad_norm": 0.44265142669444985,
+ "grad_max_sv": 0.06058515841141343,
+ "grad_min_sv": 8.532913146218004e-39,
+ "grad_condition": 60585158411.41343,
+ "lr": 0.0008187119948743447,
+ "time_sec": 177.301589012146
+ },
+ {
+ "epoch": 43,
+ "train_loss": 5.361796244659423,
+ "train_acc": 0.0104,
+ "test_loss": 5.4946890060424805,
+ "test_acc": 0.01,
+ "lyapunov": 1.5847100778613858,
+ "grad_norm": 0.6384686198807327,
+ "grad_max_sv": 0.08455213336274028,
+ "grad_min_sv": 1.854097809152722e-15,
+ "grad_condition": 84328075575.36731,
+ "lr": 0.000810573890139155,
+ "time_sec": 177.35142517089844
+ },
+ {
+ "epoch": 44,
+ "train_loss": 5.364447811279297,
+ "train_acc": 0.01014,
+ "test_loss": 5.332209419250488,
+ "test_acc": 0.01,
+ "lyapunov": 1.5854847031786008,
+ "grad_norm": 0.675284019586962,
+ "grad_max_sv": 0.11337836356833578,
+ "grad_min_sv": 1.7049374807524963e-14,
+ "grad_condition": 111308573138.52168,
+ "lr": 0.0008022995574311873,
+ "time_sec": 177.3521008491516
+ },
+ {
+ "epoch": 45,
+ "train_loss": 5.360489757080078,
+ "train_acc": 0.00976,
+ "test_loss": 5.304935124206543,
+ "test_acc": 0.01,
+ "lyapunov": 1.5837746992745363,
+ "grad_norm": 0.5718003616383085,
+ "grad_max_sv": 0.08602348966524005,
+ "grad_min_sv": 3.0378301121606614e-16,
+ "grad_condition": 85997891115.73683,
+ "lr": 0.0007938926261462363,
+ "time_sec": 177.33692407608032
+ },
+ {
+ "epoch": 46,
+ "train_loss": 5.361809297485352,
+ "train_acc": 0.01014,
+ "test_loss": 4.89552943725586,
+ "test_acc": 0.01,
+ "lyapunov": 1.585215172194459,
+ "grad_norm": 0.44412809114793517,
+ "grad_max_sv": 0.0825215914286673,
+ "grad_min_sv": 1.1713936618830865e-15,
+ "grad_condition": 82407893767.02434,
+ "lr": 0.0007853567838422158,
+ "time_sec": 177.35017251968384
+ },
+ {
+ "epoch": 47,
+ "train_loss": 5.361848121795655,
+ "train_acc": 0.00954,
+ "test_loss": 4.982022219848633,
+ "test_acc": 0.01,
+ "lyapunov": 1.5858572995876108,
+ "grad_norm": 0.4284143094057381,
+ "grad_max_sv": 0.06426824014633895,
+ "grad_min_sv": 5.420102114032563e-18,
+ "grad_condition": 64267673459.65764,
+ "lr": 0.0007766957746216719,
+ "time_sec": 177.3225803375244
+ },
+ {
+ "epoch": 48,
+ "train_loss": 5.360097906646729,
+ "train_acc": 0.0101,
+ "test_loss": 5.039643939208984,
+ "test_acc": 0.01,
+ "lyapunov": 1.5852815909763736,
+ "grad_norm": 0.21919166507419222,
+ "grad_max_sv": 0.02766723851673305,
+ "grad_min_sv": 0.0,
+ "grad_condition": 27667238516.73305,
+ "lr": 0.0007679133974894982,
+ "time_sec": 177.3571081161499
+ },
+ {
+ "epoch": 49,
+ "train_loss": 5.361355583496094,
+ "train_acc": 0.00912,
+ "test_loss": 4.70521968460083,
+ "test_acc": 0.01,
+ "lyapunov": 1.587215112603229,
+ "grad_norm": 0.31401296813167406,
+ "grad_max_sv": 0.0012400273233652114,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1240027323.3652115,
+ "lr": 0.000759013504686565,
+ "time_sec": 177.23792433738708
+ },
+ {
+ "epoch": 50,
+ "train_loss": 5.374890024871826,
+ "train_acc": 0.00998,
+ "test_loss": 5.3741009857177735,
+ "test_acc": 0.01,
+ "lyapunov": 1.5953726881300396,
+ "grad_norm": 0.3238754552354357,
+ "grad_max_sv": 0.04934265548363328,
+ "grad_min_sv": 2.6824701739898724e-33,
+ "grad_condition": 49342655483.63328,
+ "lr": 0.0007499999999999998,
+ "time_sec": 177.3176691532135
+ },
+ {
+ "epoch": 51,
+ "train_loss": 5.359442653961182,
+ "train_acc": 0.0091,
+ "test_loss": 5.708284506988526,
+ "test_acc": 0.01,
+ "lyapunov": 1.5848879155600468,
+ "grad_norm": 0.19742833159549178,
+ "grad_max_sv": 0.019448843877762557,
+ "grad_min_sv": 4.3389140032583084e-41,
+ "grad_condition": 19448843877.762554,
+ "lr": 0.0007408768370508575,
+ "time_sec": 177.30614399909973
+ },
+ {
+ "epoch": 52,
+ "train_loss": 5.357807418670654,
+ "train_acc": 0.00892,
+ "test_loss": 5.598787411499023,
+ "test_acc": 0.01,
+ "lyapunov": 1.5835388462866664,
+ "grad_norm": 0.22895282871195646,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007316480175599307,
+ "time_sec": 177.23059678077698
+ },
+ {
+ "epoch": 53,
+ "train_loss": 5.364920553588867,
+ "train_acc": 0.00838,
+ "test_loss": 5.555523378753662,
+ "test_acc": 0.01,
+ "lyapunov": 1.5897833791840108,
+ "grad_norm": 0.27349172628604307,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007223175895924635,
+ "time_sec": 177.23636078834534
+ },
+ {
+ "epoch": 54,
+ "train_loss": 5.360137451934815,
+ "train_acc": 0.00904,
+ "test_loss": 5.4607298324584965,
+ "test_acc": 0.01,
+ "lyapunov": 1.585875649586358,
+ "grad_norm": 0.3494380261105508,
+ "grad_max_sv": 0.009265018161386251,
+ "grad_min_sv": 0.0,
+ "grad_condition": 9265018161.386251,
+ "lr": 0.0007128896457825361,
+ "time_sec": 177.3195767402649
+ },
+ {
+ "epoch": 55,
+ "train_loss": 5.361894327392578,
+ "train_acc": 0.01076,
+ "test_loss": 5.3967264434814455,
+ "test_acc": 0.01,
+ "lyapunov": 1.5858059591039673,
+ "grad_norm": 0.32616838064335635,
+ "grad_max_sv": 0.06554236207157374,
+ "grad_min_sv": 3.9627266810538444e-22,
+ "grad_condition": 65542362038.60982,
+ "lr": 0.0007033683215378998,
+ "time_sec": 177.4070463180542
+ },
+ {
+ "epoch": 56,
+ "train_loss": 5.361103507232666,
+ "train_acc": 0.00966,
+ "test_loss": 5.396138972473144,
+ "test_acc": 0.01,
+ "lyapunov": 1.585260014399848,
+ "grad_norm": 0.24476233592152788,
+ "grad_max_sv": 0.053304498083889484,
+ "grad_min_sv": 8.107207506846484e-17,
+ "grad_condition": 53297506440.79659,
+ "lr": 0.0006937577932260512,
+ "time_sec": 177.3034119606018
+ },
+ {
+ "epoch": 57,
+ "train_loss": 5.3623845806884765,
+ "train_acc": 0.00962,
+ "test_loss": 5.060037421417237,
+ "test_acc": 0.01,
+ "lyapunov": 1.5866734694946758,
+ "grad_norm": 0.28857632314696974,
+ "grad_max_sv": 0.06447782786563039,
+ "grad_min_sv": 1.9607974133287156e-16,
+ "grad_condition": 64457267604.59035,
+ "lr": 0.0006840622763423388,
+ "time_sec": 177.35450506210327
+ },
+ {
+ "epoch": 58,
+ "train_loss": 5.361771304779053,
+ "train_acc": 0.01002,
+ "test_loss": 5.0901702087402345,
+ "test_acc": 0.01,
+ "lyapunov": 1.586991887873091,
+ "grad_norm": 0.23271259978105882,
+ "grad_max_sv": 0.04189403969794512,
+ "grad_min_sv": 2.1019476964872255e-46,
+ "grad_condition": 41894039697.945114,
+ "lr": 0.0006742860236609073,
+ "time_sec": 177.32643222808838
+ },
+ {
+ "epoch": 59,
+ "train_loss": 5.360649804382324,
+ "train_acc": 0.00986,
+ "test_loss": 5.02971961517334,
+ "test_acc": 0.01,
+ "lyapunov": 1.5858081442010983,
+ "grad_norm": 0.25490660325152764,
+ "grad_max_sv": 0.04079276975244284,
+ "grad_min_sv": 0.0,
+ "grad_condition": 40792769752.44284,
+ "lr": 0.0006644333233692913,
+ "time_sec": 177.3179268836975
+ },
+ {
+ "epoch": 60,
+ "train_loss": 5.364020364685058,
+ "train_acc": 0.00904,
+ "test_loss": 4.7199004196167,
+ "test_acc": 0.01,
+ "lyapunov": 1.5886733891713956,
+ "grad_norm": 0.22342122942097759,
+ "grad_max_sv": 0.027459373604506253,
+ "grad_min_sv": 0.0,
+ "grad_condition": 27459373604.506256,
+ "lr": 0.0006545084971874734,
+ "time_sec": 177.30202984809875
+ },
+ {
+ "epoch": 61,
+ "train_loss": 5.363523327484131,
+ "train_acc": 0.00934,
+ "test_loss": 4.7266477081298826,
+ "test_acc": 0.01,
+ "lyapunov": 1.5883313112551598,
+ "grad_norm": 0.20389335925530302,
+ "grad_max_sv": 0.045495460741221905,
+ "grad_min_sv": 1.4012984643248171e-46,
+ "grad_condition": 45495460741.2219,
+ "lr": 0.0006445158984722354,
+ "time_sec": 177.32515287399292
+ },
+ {
+ "epoch": 62,
+ "train_loss": 5.367948243408203,
+ "train_acc": 0.0091,
+ "test_loss": 4.75396729888916,
+ "test_acc": 0.01,
+ "lyapunov": 1.5914591578266504,
+ "grad_norm": 0.255614489528913,
+ "grad_max_sv": 0.03248326424509287,
+ "grad_min_sv": 1.3219893653396629e-33,
+ "grad_condition": 32483264245.092873,
+ "lr": 0.0006344599103076324,
+ "time_sec": 177.34726858139038
+ },
+ {
+ "epoch": 63,
+ "train_loss": 5.360079801940918,
+ "train_acc": 0.0094,
+ "test_loss": 5.19269112701416,
+ "test_acc": 0.01,
+ "lyapunov": 1.5859909679578699,
+ "grad_norm": 0.247568680367887,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006243449435824269,
+ "time_sec": 177.2823510169983
+ },
+ {
+ "epoch": 64,
+ "train_loss": 5.359493107910156,
+ "train_acc": 0.00876,
+ "test_loss": 5.2250466796875,
+ "test_acc": 0.01,
+ "lyapunov": 1.585366655188753,
+ "grad_norm": 0.2769224967661722,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006141754350553275,
+ "time_sec": 177.23246479034424
+ },
+ {
+ "epoch": 65,
+ "train_loss": 5.361286865844726,
+ "train_acc": 0.00938,
+ "test_loss": 5.298229453277588,
+ "test_acc": 0.01,
+ "lyapunov": 1.5870976630988938,
+ "grad_norm": 0.24716357558635968,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006039558454088793,
+ "time_sec": 177.274742603302
+ },
+ {
+ "epoch": 66,
+ "train_loss": 5.360220510559082,
+ "train_acc": 0.00942,
+ "test_loss": 5.1931522216796875,
+ "test_acc": 0.01,
+ "lyapunov": 1.5856442792946115,
+ "grad_norm": 0.21643181506904438,
+ "grad_max_sv": 0.028073416696861385,
+ "grad_min_sv": 0.0,
+ "grad_condition": 28073416696.86139,
+ "lr": 0.000593690657292862,
+ "time_sec": 177.3214614391327
+ },
+ {
+ "epoch": 67,
+ "train_loss": 5.3634411520385745,
+ "train_acc": 0.01004,
+ "test_loss": 4.726324760437012,
+ "test_acc": 0.01,
+ "lyapunov": 1.5876712076499333,
+ "grad_norm": 0.19917891606110388,
+ "grad_max_sv": 0.06480920519679785,
+ "grad_min_sv": 5.826939700269216e-27,
+ "grad_condition": 64809205196.797485,
+ "lr": 0.0005833843733580507,
+ "time_sec": 177.30631113052368
+ },
+ {
+ "epoch": 68,
+ "train_loss": 5.3627893775939945,
+ "train_acc": 0.0096,
+ "test_loss": 4.78324942779541,
+ "test_acc": 0.01,
+ "lyapunov": 1.5872700497927263,
+ "grad_norm": 0.17814025282763096,
+ "grad_max_sv": 0.05710890954360366,
+ "grad_min_sv": 1.642725198984103e-39,
+ "grad_condition": 57108909543.60366,
+ "lr": 0.0005730415142812054,
+ "time_sec": 177.28468227386475
+ },
+ {
+ "epoch": 69,
+ "train_loss": 5.36284663772583,
+ "train_acc": 0.01016,
+ "test_loss": 4.65924833908081,
+ "test_acc": 0.01,
+ "lyapunov": 1.5882405993883566,
+ "grad_norm": 0.18974647851723686,
+ "grad_max_sv": 0.03764563817530871,
+ "grad_min_sv": 0.0,
+ "grad_condition": 37645638175.3087,
+ "lr": 0.0005626666167821517,
+ "time_sec": 177.30268549919128
+ },
+ {
+ "epoch": 70,
+ "train_loss": 5.365585427398682,
+ "train_acc": 0.00962,
+ "test_loss": 4.667314112854004,
+ "test_acc": 0.01,
+ "lyapunov": 1.58941994451196,
+ "grad_norm": 0.17127250466631513,
+ "grad_max_sv": 0.043766821082681415,
+ "grad_min_sv": 0.0,
+ "grad_condition": 43766821082.68142,
+ "lr": 0.0005522642316338265,
+ "time_sec": 177.31375312805176
+ },
+ {
+ "epoch": 71,
+ "train_loss": 5.360834673461914,
+ "train_acc": 0.0103,
+ "test_loss": 4.691217092895508,
+ "test_acc": 0.01,
+ "lyapunov": 1.5854695108540529,
+ "grad_norm": 0.15750040762462056,
+ "grad_max_sv": 0.05662639001384377,
+ "grad_min_sv": 0.0,
+ "grad_condition": 56626390013.84377,
+ "lr": 0.0005418389216661573,
+ "time_sec": 177.3107042312622
+ },
+ {
+ "epoch": 72,
+ "train_loss": 5.360965846557617,
+ "train_acc": 0.01014,
+ "test_loss": 4.686003870391846,
+ "test_acc": 0.01,
+ "lyapunov": 1.586221619945048,
+ "grad_norm": 0.1761841219237378,
+ "grad_max_sv": 0.051002619601786134,
+ "grad_min_sv": 0.0,
+ "grad_condition": 51002619601.78613,
+ "lr": 0.0005313952597646563,
+ "time_sec": 177.28891253471375
+ },
+ {
+ "epoch": 73,
+ "train_loss": 5.365758000946045,
+ "train_acc": 0.00988,
+ "test_loss": 4.678875315856933,
+ "test_acc": 0.01,
+ "lyapunov": 1.5900602660825491,
+ "grad_norm": 0.21832467373191636,
+ "grad_max_sv": 0.06282770875841379,
+ "grad_min_sv": 0.0,
+ "grad_condition": 62827708758.413795,
+ "lr": 0.0005209378268645994,
+ "time_sec": 177.3162078857422
+ },
+ {
+ "epoch": 74,
+ "train_loss": 5.365496074371338,
+ "train_acc": 0.0093,
+ "test_loss": 4.655053031921387,
+ "test_acc": 0.01,
+ "lyapunov": 1.589696585979608,
+ "grad_norm": 0.23086253967925782,
+ "grad_max_sv": 0.060001683793962,
+ "grad_min_sv": 0.0,
+ "grad_condition": 60001683793.962,
+ "lr": 0.0005104712099416781,
+ "time_sec": 177.30215072631836
+ },
+ {
+ "epoch": 75,
+ "train_loss": 5.364179220275879,
+ "train_acc": 0.0099,
+ "test_loss": 4.638170684051514,
+ "test_acc": 0.01,
+ "lyapunov": 1.5883820352651883,
+ "grad_norm": 0.3049112090346521,
+ "grad_max_sv": 0.05380613347515464,
+ "grad_min_sv": 0.0,
+ "grad_condition": 53806133475.15464,
+ "lr": 0.0004999999999999996,
+ "time_sec": 177.36862349510193
+ },
+ {
+ "epoch": 76,
+ "train_loss": 5.359675194854736,
+ "train_acc": 0.01046,
+ "test_loss": 4.649093914794922,
+ "test_acc": 0.01,
+ "lyapunov": 1.5854026216375248,
+ "grad_norm": 0.2119481091202284,
+ "grad_max_sv": 0.03726704930886626,
+ "grad_min_sv": 0.0,
+ "grad_condition": 37267049308.86626,
+ "lr": 0.0004895287900583212,
+ "time_sec": 177.32284903526306
+ },
+ {
+ "epoch": 77,
+ "train_loss": 5.360474863128662,
+ "train_acc": 0.00958,
+ "test_loss": 4.605349244689942,
+ "test_acc": 0.01,
+ "lyapunov": 1.5860518323795876,
+ "grad_norm": 0.20492250658984978,
+ "grad_max_sv": 0.010520621668547392,
+ "grad_min_sv": 0.0,
+ "grad_condition": 10520621668.54739,
+ "lr": 0.0004790621731353997,
+ "time_sec": 177.27856492996216
+ },
+ {
+ "epoch": 78,
+ "train_loss": 5.3626285870361325,
+ "train_acc": 0.0096,
+ "test_loss": 4.636105052185059,
+ "test_acc": 0.01,
+ "lyapunov": 1.5883512807928997,
+ "grad_norm": 0.16200768770528595,
+ "grad_max_sv": 0.01769152507185936,
+ "grad_min_sv": 0.0,
+ "grad_condition": 17691525071.85936,
+ "lr": 0.000468604740235343,
+ "time_sec": 177.26149678230286
+ },
+ {
+ "epoch": 79,
+ "train_loss": 5.361725220947266,
+ "train_acc": 0.00962,
+ "test_loss": 4.642175579071045,
+ "test_acc": 0.01,
+ "lyapunov": 1.5874589931629504,
+ "grad_norm": 0.1671711869857159,
+ "grad_max_sv": 0.027231273613870143,
+ "grad_min_sv": 0.0,
+ "grad_condition": 27231273613.870144,
+ "lr": 0.00045816107833384175,
+ "time_sec": 177.28059816360474
+ },
+ {
+ "epoch": 80,
+ "train_loss": 5.359847649841309,
+ "train_acc": 0.00934,
+ "test_loss": 4.646283575439453,
+ "test_acc": 0.01,
+ "lyapunov": 1.5854374237377624,
+ "grad_norm": 0.15090527056955186,
+ "grad_max_sv": 0.02150285104289651,
+ "grad_min_sv": 0.0,
+ "grad_condition": 21502851042.896507,
+ "lr": 0.0004477357683661729,
+ "time_sec": 177.27379083633423
+ },
+ {
+ "epoch": 81,
+ "train_loss": 5.3600718869018555,
+ "train_acc": 0.01048,
+ "test_loss": 4.752709213256836,
+ "test_acc": 0.01,
+ "lyapunov": 1.585394742238857,
+ "grad_norm": 0.17187344605967436,
+ "grad_max_sv": 0.043320519663393495,
+ "grad_min_sv": 0.0,
+ "grad_condition": 43320519663.39349,
+ "lr": 0.00043733338321784746,
+ "time_sec": 177.62933731079102
+ },
+ {
+ "epoch": 82,
+ "train_loss": 5.362194033813476,
+ "train_acc": 0.00908,
+ "test_loss": 4.769781411743164,
+ "test_acc": 0.01,
+ "lyapunov": 1.5872593858967656,
+ "grad_norm": 0.17685474969644083,
+ "grad_max_sv": 0.043185068760067225,
+ "grad_min_sv": 0.0,
+ "grad_condition": 43185068760.06722,
+ "lr": 0.0004269584857187939,
+ "time_sec": 177.36878728866577
+ },
+ {
+ "epoch": 83,
+ "train_loss": 5.360512623901367,
+ "train_acc": 0.00896,
+ "test_loss": 4.634495629882813,
+ "test_acc": 0.01,
+ "lyapunov": 1.585809985999866,
+ "grad_norm": 0.17569851085947658,
+ "grad_max_sv": 0.048822146560996774,
+ "grad_min_sv": 0.0,
+ "grad_condition": 48822146560.99677,
+ "lr": 0.0004166156266419484,
+ "time_sec": 177.35730743408203
+ },
+ {
+ "epoch": 84,
+ "train_loss": 5.360660369110107,
+ "train_acc": 0.01062,
+ "test_loss": 4.635055514526367,
+ "test_acc": 0.01,
+ "lyapunov": 1.5863755276745848,
+ "grad_norm": 0.1734959766637803,
+ "grad_max_sv": 0.03708101906813681,
+ "grad_min_sv": 0.0,
+ "grad_condition": 37081019068.13681,
+ "lr": 0.0004063093427071373,
+ "time_sec": 177.31386804580688
+ },
+ {
+ "epoch": 85,
+ "train_loss": 5.359581319885254,
+ "train_acc": 0.00962,
+ "test_loss": 4.680524919128418,
+ "test_acc": 0.01,
+ "lyapunov": 1.585432373349319,
+ "grad_norm": 0.19633262712151112,
+ "grad_max_sv": 0.016985992342233656,
+ "grad_min_sv": 0.0,
+ "grad_condition": 16985992342.233658,
+ "lr": 0.0003960441545911199,
+ "time_sec": 177.29162740707397
+ },
+ {
+ "epoch": 86,
+ "train_loss": 5.364330820922851,
+ "train_acc": 0.00994,
+ "test_loss": 4.640988105010987,
+ "test_acc": 0.01,
+ "lyapunov": 1.5893402819133475,
+ "grad_norm": 0.17010660799200755,
+ "grad_max_sv": 0.005552049493417144,
+ "grad_min_sv": 0.0,
+ "grad_condition": 5552049493.417144,
+ "lr": 0.0003858245649446718,
+ "time_sec": 177.2697069644928
+ },
+ {
+ "epoch": 87,
+ "train_loss": 5.36001446975708,
+ "train_acc": 0.0091,
+ "test_loss": 4.6622309997558595,
+ "test_acc": 0.01,
+ "lyapunov": 1.5858566068932223,
+ "grad_norm": 0.18253684720194474,
+ "grad_max_sv": 0.009605350159108638,
+ "grad_min_sv": 0.0,
+ "grad_condition": 9605350159.108639,
+ "lr": 0.00037565505641757235,
+ "time_sec": 177.2729914188385
+ },
+ {
+ "epoch": 88,
+ "train_loss": 5.363334915313721,
+ "train_acc": 0.00928,
+ "test_loss": 4.651910215759277,
+ "test_acc": 0.01,
+ "lyapunov": 1.5891908779168678,
+ "grad_norm": 0.25285970261724394,
+ "grad_max_sv": 0.014622378209605814,
+ "grad_min_sv": 0.0,
+ "grad_condition": 14622378209.605814,
+ "lr": 0.00036554008969236695,
+ "time_sec": 177.25673460960388
+ },
+ {
+ "epoch": 89,
+ "train_loss": 5.366140861053466,
+ "train_acc": 0.0098,
+ "test_loss": 4.632004132843018,
+ "test_acc": 0.01,
+ "lyapunov": 1.5918613025904311,
+ "grad_norm": 0.3793803057886311,
+ "grad_max_sv": 0.0227991352789104,
+ "grad_min_sv": 0.0,
+ "grad_condition": 22799135278.9104,
+ "lr": 0.0003554841015277638,
+ "time_sec": 177.28270602226257
+ },
+ {
+ "epoch": 90,
+ "train_loss": 5.358956403503418,
+ "train_acc": 0.00908,
+ "test_loss": 4.634336037445069,
+ "test_acc": 0.01,
+ "lyapunov": 1.5845078528689607,
+ "grad_norm": 0.16129836844937653,
+ "grad_max_sv": 0.030955695733428,
+ "grad_min_sv": 0.0,
+ "grad_condition": 30955695733.428,
+ "lr": 0.000345491502812526,
+ "time_sec": 177.34664869308472
+ },
+ {
+ "epoch": 91,
+ "train_loss": 5.370377727966309,
+ "train_acc": 0.01008,
+ "test_loss": 4.641486628723144,
+ "test_acc": 0.01,
+ "lyapunov": 1.5915974838959286,
+ "grad_norm": 0.23056801493799003,
+ "grad_max_sv": 0.021973734814673664,
+ "grad_min_sv": 0.0,
+ "grad_condition": 21973734814.673664,
+ "lr": 0.0003355666766307081,
+ "time_sec": 177.30071926116943
+ },
+ {
+ "epoch": 92,
+ "train_loss": 5.35953079574585,
+ "train_acc": 0.0104,
+ "test_loss": 4.654357167816162,
+ "test_acc": 0.01,
+ "lyapunov": 1.5854123461886744,
+ "grad_norm": 0.2133357061554603,
+ "grad_max_sv": 0.01584432367235422,
+ "grad_min_sv": 0.0,
+ "grad_condition": 15844323672.354221,
+ "lr": 0.00032571397633909225,
+ "time_sec": 177.30744338035583
+ },
+ {
+ "epoch": 93,
+ "train_loss": 5.359757648162842,
+ "train_acc": 0.01004,
+ "test_loss": 4.635669487762451,
+ "test_acc": 0.01,
+ "lyapunov": 1.5857275602457774,
+ "grad_norm": 0.21123088900545153,
+ "grad_max_sv": 0.022326651168987154,
+ "grad_min_sv": 0.0,
+ "grad_condition": 22326651168.98716,
+ "lr": 0.00031593772365766094,
+ "time_sec": 177.30698537826538
+ },
+ {
+ "epoch": 94,
+ "train_loss": 5.358649451293945,
+ "train_acc": 0.00924,
+ "test_loss": 4.650500559997559,
+ "test_acc": 0.01,
+ "lyapunov": 1.584580004367682,
+ "grad_norm": 0.22156955822269123,
+ "grad_max_sv": 0.0036812785547226667,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3681278554.7226667,
+ "lr": 0.0003062422067739483,
+ "time_sec": 177.29391837120056
+ },
+ {
+ "epoch": 95,
+ "train_loss": 5.368402194519043,
+ "train_acc": 0.0096,
+ "test_loss": 4.631659384155274,
+ "test_acc": 0.01,
+ "lyapunov": 1.5918427952720076,
+ "grad_norm": 0.19012319147558024,
+ "grad_max_sv": 0.01328945653513074,
+ "grad_min_sv": 0.0,
+ "grad_condition": 13289456535.130741,
+ "lr": 0.00029663167846209965,
+ "time_sec": 177.28295135498047
+ },
+ {
+ "epoch": 96,
+ "train_loss": 5.360648808441162,
+ "train_acc": 0.00988,
+ "test_loss": 4.642071528625488,
+ "test_acc": 0.01,
+ "lyapunov": 1.586560007251437,
+ "grad_norm": 0.16157307254883244,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00028711035421746345,
+ "time_sec": 177.2989547252655
+ },
+ {
+ "epoch": 97,
+ "train_loss": 5.358733374786377,
+ "train_acc": 0.00914,
+ "test_loss": 4.639485282897949,
+ "test_acc": 0.01,
+ "lyapunov": 1.5846895253871713,
+ "grad_norm": 0.14480973228900776,
+ "grad_max_sv": 0.00837345547042787,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8373455470.427872,
+ "lr": 0.00027768241040753615,
+ "time_sec": 177.27525234222412
+ },
+ {
+ "epoch": 98,
+ "train_loss": 5.360293337707519,
+ "train_acc": 0.0099,
+ "test_loss": 4.644459535980225,
+ "test_acc": 0.01,
+ "lyapunov": 1.5861705498927086,
+ "grad_norm": 0.18867802153244584,
+ "grad_max_sv": 0.026158737391233443,
+ "grad_min_sv": 0.0,
+ "grad_condition": 26158737391.23344,
+ "lr": 0.00026835198244006903,
+ "time_sec": 177.2919957637787
+ },
+ {
+ "epoch": 99,
+ "train_loss": 5.360852672576904,
+ "train_acc": 0.00976,
+ "test_loss": 4.641770568847656,
+ "test_acc": 0.01,
+ "lyapunov": 1.5866629604793265,
+ "grad_norm": 0.2490166385107765,
+ "grad_max_sv": 0.025310791656374933,
+ "grad_min_sv": 0.0,
+ "grad_condition": 25310791656.37493,
+ "lr": 0.0002591231629491421,
+ "time_sec": 177.28516483306885
+ },
+ {
+ "epoch": 100,
+ "train_loss": 5.359503317260742,
+ "train_acc": 0.0096,
+ "test_loss": 4.633657774353027,
+ "test_acc": 0.01,
+ "lyapunov": 1.5852865261190079,
+ "grad_norm": 0.31764569596084014,
+ "grad_max_sv": 0.03201284250244498,
+ "grad_min_sv": 0.0,
+ "grad_condition": 32012842502.444984,
+ "lr": 0.0002499999999999997,
+ "time_sec": 177.3286590576172
+ },
+ {
+ "epoch": 101,
+ "train_loss": 5.3610862644958495,
+ "train_acc": 0.01004,
+ "test_loss": 4.627243125915528,
+ "test_acc": 0.01,
+ "lyapunov": 1.586990461934863,
+ "grad_norm": 0.3077979208978545,
+ "grad_max_sv": 0.022488519130274654,
+ "grad_min_sv": 0.0,
+ "grad_condition": 22488519130.274654,
+ "lr": 0.00024098649531343477,
+ "time_sec": 177.27038407325745
+ },
+ {
+ "epoch": 102,
+ "train_loss": 5.359221751708985,
+ "train_acc": 0.0099,
+ "test_loss": 4.6350917106628415,
+ "test_acc": 0.01,
+ "lyapunov": 1.5852433824173324,
+ "grad_norm": 0.17125449319078032,
+ "grad_max_sv": 0.0006372035015374423,
+ "grad_min_sv": 0.0,
+ "grad_condition": 637203501.5374422,
+ "lr": 0.0002320866025105016,
+ "time_sec": 177.26434516906738
+ },
+ {
+ "epoch": 103,
+ "train_loss": 5.359845841064453,
+ "train_acc": 0.00998,
+ "test_loss": 4.644444650268555,
+ "test_acc": 0.01,
+ "lyapunov": 1.5859144453502372,
+ "grad_norm": 0.15906823668777442,
+ "grad_max_sv": 0.0012175182346254587,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1217518234.6254587,
+ "lr": 0.0002233042253783278,
+ "time_sec": 177.29427409172058
+ },
+ {
+ "epoch": 104,
+ "train_loss": 5.359393982086182,
+ "train_acc": 0.00964,
+ "test_loss": 4.629140382385254,
+ "test_acc": 0.01,
+ "lyapunov": 1.5853588230469648,
+ "grad_norm": 0.18868988717884208,
+ "grad_max_sv": 0.007832410791888834,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7832410791.888834,
+ "lr": 0.000214643216157784,
+ "time_sec": 177.3122420310974
+ },
+ {
+ "epoch": 105,
+ "train_loss": 5.376110725402832,
+ "train_acc": 0.00958,
+ "test_loss": 4.641193688201905,
+ "test_acc": 0.01,
+ "lyapunov": 1.594091626079491,
+ "grad_norm": 0.21866401239429448,
+ "grad_max_sv": 0.01763616520911455,
+ "grad_min_sv": 0.0,
+ "grad_condition": 17636165209.11455,
+ "lr": 0.00020610737385376332,
+ "time_sec": 177.33545303344727
+ },
+ {
+ "epoch": 106,
+ "train_loss": 5.360543824005127,
+ "train_acc": 0.00952,
+ "test_loss": 4.63230926361084,
+ "test_acc": 0.01,
+ "lyapunov": 1.586505341407893,
+ "grad_norm": 0.19148423296709022,
+ "grad_max_sv": 0.007322627399116754,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7322627399.116755,
+ "lr": 0.00019770044256881242,
+ "time_sec": 177.29128861427307
+ },
+ {
+ "epoch": 107,
+ "train_loss": 5.359816354370118,
+ "train_acc": 0.00964,
+ "test_loss": 4.628876644897461,
+ "test_acc": 0.01,
+ "lyapunov": 1.5858964429182165,
+ "grad_norm": 0.16953893016049196,
+ "grad_max_sv": 0.005570205627009273,
+ "grad_min_sv": 0.0,
+ "grad_condition": 5570205627.009273,
+ "lr": 0.0001894261098608447,
+ "time_sec": 177.26312851905823
+ },
+ {
+ "epoch": 108,
+ "train_loss": 5.360526904602051,
+ "train_acc": 0.009,
+ "test_loss": 4.630769221496582,
+ "test_acc": 0.01,
+ "lyapunov": 1.5865018233618773,
+ "grad_norm": 0.18006495124030458,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000181288005125655,
+ "time_sec": 177.246666431427
+ },
+ {
+ "epoch": 109,
+ "train_loss": 5.361382939453125,
+ "train_acc": 0.0098,
+ "test_loss": 4.626291159820557,
+ "test_acc": 0.01,
+ "lyapunov": 1.586926028856536,
+ "grad_norm": 0.2328474503629796,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001732896980049473,
+ "time_sec": 177.25811576843262
+ },
+ {
+ "epoch": 110,
+ "train_loss": 5.358514823455811,
+ "train_acc": 0.00986,
+ "test_loss": 4.6495152236938475,
+ "test_acc": 0.01,
+ "lyapunov": 1.5844445182844196,
+ "grad_norm": 0.31612028134160525,
+ "grad_max_sv": 0.010267550591379404,
+ "grad_min_sv": 0.0,
+ "grad_condition": 10267550591.379404,
+ "lr": 0.00016543469682057076,
+ "time_sec": 177.28474497795105
+ },
+ {
+ "epoch": 111,
+ "train_loss": 5.366782173309327,
+ "train_acc": 0.00906,
+ "test_loss": 4.620611762237549,
+ "test_acc": 0.01,
+ "lyapunov": 1.5906709133816497,
+ "grad_norm": 0.40151776348821855,
+ "grad_max_sv": 0.010553297400474549,
+ "grad_min_sv": 0.0,
+ "grad_condition": 10553297400.474548,
+ "lr": 0.00015772644703565552,
+ "time_sec": 177.3135175704956
+ },
+ {
+ "epoch": 112,
+ "train_loss": 5.359567135009765,
+ "train_acc": 0.00886,
+ "test_loss": 4.628111135101318,
+ "test_acc": 0.01,
+ "lyapunov": 1.5856597996733683,
+ "grad_norm": 0.3009012541884835,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00015016832974331713,
+ "time_sec": 177.25540447235107
+ },
+ {
+ "epoch": 113,
+ "train_loss": 5.358919576873779,
+ "train_acc": 0.00968,
+ "test_loss": 4.627276501464844,
+ "test_acc": 0.01,
+ "lyapunov": 1.5849643582883088,
+ "grad_norm": 0.3242366139837751,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00014276366018359834,
+ "time_sec": 177.27025246620178
+ },
+ {
+ "epoch": 114,
+ "train_loss": 5.3586665776062015,
+ "train_acc": 0.00944,
+ "test_loss": 4.620662684631347,
+ "test_acc": 0.01,
+ "lyapunov": 1.5846976368018733,
+ "grad_norm": 0.2903374978600601,
+ "grad_max_sv": 0.004233767790719867,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4233767790.7198668,
+ "lr": 0.00013551568628929425,
+ "time_sec": 177.26198053359985
+ },
+ {
+ "epoch": 115,
+ "train_loss": 5.3605953396606445,
+ "train_acc": 0.00902,
+ "test_loss": 4.621528549194336,
+ "test_acc": 0.01,
+ "lyapunov": 1.586485847792662,
+ "grad_norm": 0.331820693233947,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00012842758726130276,
+ "time_sec": 177.23981928825378
+ },
+ {
+ "epoch": 116,
+ "train_loss": 5.359012928771973,
+ "train_acc": 0.00958,
+ "test_loss": 4.619492964172363,
+ "test_acc": 0.01,
+ "lyapunov": 1.585117801376011,
+ "grad_norm": 0.2797157160809922,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001215024721741218,
+ "time_sec": 177.225914478302
+ },
+ {
+ "epoch": 117,
+ "train_loss": 5.359644413146973,
+ "train_acc": 0.00924,
+ "test_loss": 4.621938159942627,
+ "test_acc": 0.01,
+ "lyapunov": 1.5857579552608987,
+ "grad_norm": 0.2795622109437437,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00011474337861210538,
+ "time_sec": 177.22438168525696
+ },
+ {
+ "epoch": 118,
+ "train_loss": 5.359761270446778,
+ "train_acc": 0.00924,
+ "test_loss": 4.6217840301513675,
+ "test_acc": 0.01,
+ "lyapunov": 1.5858274750087573,
+ "grad_norm": 0.24852001797471837,
+ "grad_max_sv": 0.0012709970586001873,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1270997058.6001873,
+ "lr": 0.00010815327133708009,
+ "time_sec": 177.2276487350464
+ },
+ {
+ "epoch": 119,
+ "train_loss": 5.357662630462647,
+ "train_acc": 0.0091,
+ "test_loss": 4.622296886444092,
+ "test_acc": 0.01,
+ "lyapunov": 1.5836935113458073,
+ "grad_norm": 0.24372977816065178,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010173504098790182,
+ "time_sec": 177.25115942955017
+ },
+ {
+ "epoch": 120,
+ "train_loss": 5.361358259277344,
+ "train_acc": 0.00944,
+ "test_loss": 4.622046688079834,
+ "test_acc": 0.01,
+ "lyapunov": 1.587042825301285,
+ "grad_norm": 0.22330891574384296,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 177.27366518974304
+ },
+ {
+ "epoch": 121,
+ "train_loss": 5.35905032409668,
+ "train_acc": 0.00908,
+ "test_loss": 4.622121089935303,
+ "test_acc": 0.01,
+ "lyapunov": 1.5851479878510966,
+ "grad_norm": 0.20960225247372524,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 177.23317313194275
+ },
+ {
+ "epoch": 122,
+ "train_loss": 5.361670205078125,
+ "train_acc": 0.0093,
+ "test_loss": 4.622285698699951,
+ "test_acc": 0.01,
+ "lyapunov": 1.5875935237425978,
+ "grad_norm": 0.21843560272800885,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 177.2194859981537
+ },
+ {
+ "epoch": 123,
+ "train_loss": 5.360625909729004,
+ "train_acc": 0.01,
+ "test_loss": 4.6224393463134765,
+ "test_acc": 0.01,
+ "lyapunov": 1.5867376934232005,
+ "grad_norm": 0.2137074208505857,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 177.2682557106018
+ },
+ {
+ "epoch": 124,
+ "train_loss": 5.358632594451905,
+ "train_acc": 0.0093,
+ "test_loss": 4.680952319335938,
+ "test_acc": 0.01,
+ "lyapunov": 1.5847194472237316,
+ "grad_norm": 0.1870926810471898,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 177.23400807380676
+ },
+ {
+ "epoch": 125,
+ "train_loss": 5.360412776184082,
+ "train_acc": 0.0089,
+ "test_loss": 4.73941685333252,
+ "test_acc": 0.01,
+ "lyapunov": 1.5865021639162926,
+ "grad_norm": 0.21273250180362335,
+ "grad_max_sv": 0.0014166037552058696,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1416603755.2058697,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 177.24382710456848
+ },
+ {
+ "epoch": 126,
+ "train_loss": 5.358947314758301,
+ "train_acc": 0.0097,
+ "test_loss": 4.672125242614746,
+ "test_acc": 0.01,
+ "lyapunov": 1.584972734646419,
+ "grad_norm": 0.23341550723215748,
+ "grad_max_sv": 0.001309919636696577,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1309919636.696577,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 177.26921725273132
+ },
+ {
+ "epoch": 127,
+ "train_loss": 5.359260606536865,
+ "train_acc": 0.00982,
+ "test_loss": 4.664470828247071,
+ "test_acc": 0.01,
+ "lyapunov": 1.585314722012376,
+ "grad_norm": 0.265210981123156,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 177.23559665679932
+ },
+ {
+ "epoch": 128,
+ "train_loss": 5.361228064270019,
+ "train_acc": 0.0096,
+ "test_loss": 4.79210078125,
+ "test_acc": 0.01,
+ "lyapunov": 1.5868884224416044,
+ "grad_norm": 0.284706461729636,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 177.23232126235962
+ },
+ {
+ "epoch": 129,
+ "train_loss": 5.358762674407959,
+ "train_acc": 0.00948,
+ "test_loss": 4.767799957275391,
+ "test_acc": 0.01,
+ "lyapunov": 1.5848681917580802,
+ "grad_norm": 0.27692568211643537,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 177.2341754436493
+ },
+ {
+ "epoch": 130,
+ "train_loss": 5.360010164489746,
+ "train_acc": 0.00926,
+ "test_loss": 4.671016343688965,
+ "test_acc": 0.01,
+ "lyapunov": 1.5858237874477417,
+ "grad_norm": 0.2706962686573412,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 177.24218034744263
+ },
+ {
+ "epoch": 131,
+ "train_loss": 5.3587316012573245,
+ "train_acc": 0.00928,
+ "test_loss": 4.748648097229004,
+ "test_acc": 0.01,
+ "lyapunov": 1.5848381055895324,
+ "grad_norm": 0.23937263927645328,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 177.2330150604248
+ },
+ {
+ "epoch": 132,
+ "train_loss": 5.35890893157959,
+ "train_acc": 0.00964,
+ "test_loss": 4.8125279388427735,
+ "test_acc": 0.01,
+ "lyapunov": 1.5850241647656922,
+ "grad_norm": 0.2489556767273508,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 177.22991752624512
+ },
+ {
+ "epoch": 133,
+ "train_loss": 5.361185835876465,
+ "train_acc": 0.00952,
+ "test_loss": 4.643449569702148,
+ "test_acc": 0.01,
+ "lyapunov": 1.5871033570955477,
+ "grad_norm": 0.31193315187891146,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 177.2139208316803
+ },
+ {
+ "epoch": 134,
+ "train_loss": 5.358732033691406,
+ "train_acc": 0.00876,
+ "test_loss": 4.706984965515137,
+ "test_acc": 0.01,
+ "lyapunov": 1.5848448145420044,
+ "grad_norm": 0.25839982964286506,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 177.22592782974243
+ },
+ {
+ "epoch": 135,
+ "train_loss": 5.359151672363281,
+ "train_acc": 0.00906,
+ "test_loss": 4.7044763816833495,
+ "test_acc": 0.01,
+ "lyapunov": 1.5852836605228122,
+ "grad_norm": 0.2598696228178214,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 177.2558205127716
+ },
+ {
+ "epoch": 136,
+ "train_loss": 5.359703632965088,
+ "train_acc": 0.01,
+ "test_loss": 4.721178560638427,
+ "test_acc": 0.01,
+ "lyapunov": 1.5858281173974351,
+ "grad_norm": 0.26109222250019687,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 177.24931955337524
+ },
+ {
+ "epoch": 137,
+ "train_loss": 5.359647062225342,
+ "train_acc": 0.00956,
+ "test_loss": 4.705288150024414,
+ "test_acc": 0.01,
+ "lyapunov": 1.585799050453069,
+ "grad_norm": 0.2430419176031886,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 177.20098423957825
+ },
+ {
+ "epoch": 138,
+ "train_loss": 5.370798114471436,
+ "train_acc": 0.01,
+ "test_loss": 4.711322469329834,
+ "test_acc": 0.01,
+ "lyapunov": 1.592538814105646,
+ "grad_norm": 0.23717985848250528,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 177.27925276756287
+ },
+ {
+ "epoch": 139,
+ "train_loss": 5.358164114685058,
+ "train_acc": 0.0097,
+ "test_loss": 4.713753561401367,
+ "test_acc": 0.01,
+ "lyapunov": 1.5842537294568309,
+ "grad_norm": 0.21577381809039398,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 177.2640838623047
+ },
+ {
+ "epoch": 140,
+ "train_loss": 5.359127445678711,
+ "train_acc": 0.00982,
+ "test_loss": 4.702644599914551,
+ "test_acc": 0.01,
+ "lyapunov": 1.5852683206348468,
+ "grad_norm": 0.22693874606806255,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 177.26845002174377
+ },
+ {
+ "epoch": 141,
+ "train_loss": 5.358451212463379,
+ "train_acc": 0.01,
+ "test_loss": 4.709589306640625,
+ "test_acc": 0.01,
+ "lyapunov": 1.5845830724062517,
+ "grad_norm": 0.21686215956311627,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 177.26886224746704
+ },
+ {
+ "epoch": 142,
+ "train_loss": 5.359413949279785,
+ "train_acc": 0.01,
+ "test_loss": 4.713582644653321,
+ "test_acc": 0.01,
+ "lyapunov": 1.5855683030374825,
+ "grad_norm": 0.2386062253915984,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 177.24717164039612
+ },
+ {
+ "epoch": 143,
+ "train_loss": 5.380280564575195,
+ "train_acc": 0.01,
+ "test_loss": 4.7039310775756835,
+ "test_acc": 0.01,
+ "lyapunov": 1.59827317331758,
+ "grad_norm": 0.281062533044562,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 177.23896765708923
+ },
+ {
+ "epoch": 144,
+ "train_loss": 5.359466158905029,
+ "train_acc": 0.01,
+ "test_loss": 4.690676583862305,
+ "test_acc": 0.01,
+ "lyapunov": 1.5856200407837968,
+ "grad_norm": 0.18794718433603225,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 177.22590732574463
+ },
+ {
+ "epoch": 145,
+ "train_loss": 5.358838105926513,
+ "train_acc": 0.01,
+ "test_loss": 4.686097943115234,
+ "test_acc": 0.01,
+ "lyapunov": 1.5849668324146124,
+ "grad_norm": 0.18762604455384463,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 177.2236692905426
+ },
+ {
+ "epoch": 146,
+ "train_loss": 5.358961830444336,
+ "train_acc": 0.01,
+ "test_loss": 4.6859198120117185,
+ "test_acc": 0.01,
+ "lyapunov": 1.5850938287232539,
+ "grad_norm": 0.20367093372209882,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 177.23711729049683
+ },
+ {
+ "epoch": 147,
+ "train_loss": 5.359495299530029,
+ "train_acc": 0.01,
+ "test_loss": 4.686381504821777,
+ "test_acc": 0.01,
+ "lyapunov": 1.585582929194126,
+ "grad_norm": 0.1846519425292254,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 177.23132824897766
+ },
+ {
+ "epoch": 148,
+ "train_loss": 5.358631723632812,
+ "train_acc": 0.01,
+ "test_loss": 4.686381640625,
+ "test_acc": 0.01,
+ "lyapunov": 1.5847509065857324,
+ "grad_norm": 0.21479574972052035,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 177.25513577461243
+ },
+ {
+ "epoch": 149,
+ "train_loss": 5.359418527679443,
+ "train_acc": 0.01,
+ "test_loss": 4.6863815933227535,
+ "test_acc": 0.01,
+ "lyapunov": 1.585573171105836,
+ "grad_norm": 0.18053721718052793,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 177.26594400405884
+ },
+ {
+ "epoch": 150,
+ "train_loss": 5.358559367828369,
+ "train_acc": 0.01,
+ "test_loss": 4.686381562042237,
+ "test_acc": 0.01,
+ "lyapunov": 1.584673622075249,
+ "grad_norm": 0.17806465386525372,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0,
+ "time_sec": 177.21632599830627
+ }
+ ]
+ }
+} \ No newline at end of file