summaryrefslogtreecommitdiff
path: root/runs/depth_scaling_asymm/cifar100_20260101-112330
diff options
context:
space:
mode:
Diffstat (limited to 'runs/depth_scaling_asymm/cifar100_20260101-112330')
-rw-r--r--runs/depth_scaling_asymm/cifar100_20260101-112330/config.json22
-rw-r--r--runs/depth_scaling_asymm/cifar100_20260101-112330/results.json16822
2 files changed, 16844 insertions, 0 deletions
diff --git a/runs/depth_scaling_asymm/cifar100_20260101-112330/config.json b/runs/depth_scaling_asymm/cifar100_20260101-112330/config.json
new file mode 100644
index 0000000..eaf917f
--- /dev/null
+++ b/runs/depth_scaling_asymm/cifar100_20260101-112330/config.json
@@ -0,0 +1,22 @@
+{
+ "dataset": "cifar100",
+ "depths": [
+ 4,
+ 8,
+ 12,
+ 16
+ ],
+ "T": 4,
+ "epochs": 150,
+ "batch_size": 128,
+ "lr": 0.001,
+ "lambda_reg": 0.3,
+ "lambda_target": -0.1,
+ "data_dir": "./data",
+ "out_dir": "runs/depth_scaling_asymm",
+ "device": "cuda",
+ "seed": 42,
+ "no_progress": false,
+ "reg_type": "asymmetric",
+ "warmup_epochs": 20
+} \ No newline at end of file
diff --git a/runs/depth_scaling_asymm/cifar100_20260101-112330/results.json b/runs/depth_scaling_asymm/cifar100_20260101-112330/results.json
new file mode 100644
index 0000000..6c6da3b
--- /dev/null
+++ b/runs/depth_scaling_asymm/cifar100_20260101-112330/results.json
@@ -0,0 +1,16822 @@
+{
+ "vanilla": {
+ "4": [
+ {
+ "epoch": 1,
+ "train_loss": 4.348092296829224,
+ "train_acc": 0.09724,
+ "test_loss": 3.5478567863464354,
+ "test_acc": 0.1787,
+ "lyapunov": null,
+ "grad_norm": 6.316536759043694,
+ "grad_max_sv": 4.902881336212158,
+ "grad_min_sv": 1.1448865706586986e-07,
+ "grad_condition": 88191421.7926497,
+ "lr": 0.0009998903417374227,
+ "time_sec": 17.679682731628418
+ },
+ {
+ "epoch": 2,
+ "train_loss": 3.49050922706604,
+ "train_acc": 0.1874,
+ "test_loss": 3.2633129741668703,
+ "test_acc": 0.2305,
+ "lyapunov": null,
+ "grad_norm": 4.4801349556346395,
+ "grad_max_sv": 3.2215479910373688,
+ "grad_min_sv": 8.299195606298326e-08,
+ "grad_condition": 121110274.52327952,
+ "lr": 0.0009995614150494292,
+ "time_sec": 15.735185623168945
+ },
+ {
+ "epoch": 3,
+ "train_loss": 3.0170057023620607,
+ "train_acc": 0.25916,
+ "test_loss": 2.9698277725219726,
+ "test_acc": 0.277,
+ "lyapunov": null,
+ "grad_norm": 3.5133664087504743,
+ "grad_max_sv": 2.335329008102417,
+ "grad_min_sv": 6.557634772974552e-08,
+ "grad_condition": 39177377.20397766,
+ "lr": 0.0009990133642141358,
+ "time_sec": 15.478843212127686
+ },
+ {
+ "epoch": 4,
+ "train_loss": 2.72460933883667,
+ "train_acc": 0.31376,
+ "test_loss": 2.5551274646759032,
+ "test_acc": 0.3459,
+ "lyapunov": null,
+ "grad_norm": 2.9634417699116904,
+ "grad_max_sv": 1.8090383648872375,
+ "grad_min_sv": 5.484415814827059e-08,
+ "grad_condition": 38079849.47138412,
+ "lr": 0.0009982464296247522,
+ "time_sec": 15.453156232833862
+ },
+ {
+ "epoch": 5,
+ "train_loss": 2.490703504867554,
+ "train_acc": 0.35894,
+ "test_loss": 2.7182868785858156,
+ "test_acc": 0.3267,
+ "lyapunov": null,
+ "grad_norm": 2.6429461818460145,
+ "grad_max_sv": 1.5860196590423583,
+ "grad_min_sv": 4.9649662298145714e-08,
+ "grad_condition": 58850970.75600495,
+ "lr": 0.0009972609476841367,
+ "time_sec": 15.466280460357666
+ },
+ {
+ "epoch": 6,
+ "train_loss": 2.3172771724700927,
+ "train_acc": 0.39578,
+ "test_loss": 2.39353342666626,
+ "test_acc": 0.3858,
+ "lyapunov": null,
+ "grad_norm": 2.425728150736765,
+ "grad_max_sv": 1.3820528209209442,
+ "grad_min_sv": 4.6181405355394387e-08,
+ "grad_condition": 48644681.68891229,
+ "lr": 0.000996057350657239,
+ "time_sec": 15.472876071929932
+ },
+ {
+ "epoch": 7,
+ "train_loss": 2.1795343031311036,
+ "train_acc": 0.42514,
+ "test_loss": 2.5081939483642577,
+ "test_acc": 0.3733,
+ "lyapunov": null,
+ "grad_norm": 2.261531612589412,
+ "grad_max_sv": 1.2684625327587127,
+ "grad_min_sv": 4.360769899069972e-08,
+ "grad_condition": 42250330.837381184,
+ "lr": 0.000994636166481494,
+ "time_sec": 15.466506242752075
+ },
+ {
+ "epoch": 8,
+ "train_loss": 2.0688308012390135,
+ "train_acc": 0.44974,
+ "test_loss": 2.4493139656066893,
+ "test_acc": 0.3851,
+ "lyapunov": null,
+ "grad_norm": 2.118981579627668,
+ "grad_max_sv": 1.159741823375225,
+ "grad_min_sv": 4.073619567137449e-08,
+ "grad_condition": 437927531.63442343,
+ "lr": 0.0009929980185352525,
+ "time_sec": 15.472336769104004
+ },
+ {
+ "epoch": 9,
+ "train_loss": 1.9493904537963866,
+ "train_acc": 0.47454,
+ "test_loss": 2.441312085723877,
+ "test_acc": 0.389,
+ "lyapunov": null,
+ "grad_norm": 1.9875075491821204,
+ "grad_max_sv": 1.0529514640569686,
+ "grad_min_sv": 3.8403542657050595e-08,
+ "grad_condition": 87931604.40353736,
+ "lr": 0.0009911436253643444,
+ "time_sec": 15.4936044216156
+ },
+ {
+ "epoch": 10,
+ "train_loss": 1.858957971572876,
+ "train_acc": 0.4983,
+ "test_loss": 2.183478004837036,
+ "test_acc": 0.4383,
+ "lyapunov": null,
+ "grad_norm": 1.8688341406216382,
+ "grad_max_sv": 0.9524922624230385,
+ "grad_min_sv": 3.567054506770084e-08,
+ "grad_condition": 37551442.84495841,
+ "lr": 0.0009890738003669028,
+ "time_sec": 15.46358847618103
+ },
+ {
+ "epoch": 11,
+ "train_loss": 1.7630364864730834,
+ "train_acc": 0.51782,
+ "test_loss": 3.0158682430267336,
+ "test_acc": 0.3359,
+ "lyapunov": null,
+ "grad_norm": 1.7816105917819214,
+ "grad_max_sv": 0.9029998555779457,
+ "grad_min_sv": 3.4386650932249904e-08,
+ "grad_condition": 96253986.02645789,
+ "lr": 0.00098678945143658,
+ "time_sec": 15.461369752883911
+ },
+ {
+ "epoch": 12,
+ "train_loss": 1.7038999611282348,
+ "train_acc": 0.52966,
+ "test_loss": 2.345099726104736,
+ "test_acc": 0.4116,
+ "lyapunov": null,
+ "grad_norm": 1.703439920745613,
+ "grad_max_sv": 0.8390393868088722,
+ "grad_min_sv": 3.2384037166287294e-08,
+ "grad_condition": 263062888.07930222,
+ "lr": 0.0009842915805643154,
+ "time_sec": 15.47589898109436
+ },
+ {
+ "epoch": 13,
+ "train_loss": 1.6350115670394898,
+ "train_acc": 0.54934,
+ "test_loss": 2.3178677167892454,
+ "test_acc": 0.4258,
+ "lyapunov": null,
+ "grad_norm": 1.627197475633154,
+ "grad_max_sv": 0.7804030522704124,
+ "grad_min_sv": 3.0640796072622935e-08,
+ "grad_condition": 47339680.420034245,
+ "lr": 0.000981581283398829,
+ "time_sec": 15.482157230377197
+ },
+ {
+ "epoch": 14,
+ "train_loss": 1.5789134158706666,
+ "train_acc": 0.56262,
+ "test_loss": 3.108631703567505,
+ "test_acc": 0.3341,
+ "lyapunov": null,
+ "grad_norm": 1.5815496416496932,
+ "grad_max_sv": 0.7780330538749695,
+ "grad_min_sv": 3.0241727028840204e-08,
+ "grad_condition": 121072879.52128251,
+ "lr": 0.0009786597487660333,
+ "time_sec": 15.469743490219116
+ },
+ {
+ "epoch": 15,
+ "train_loss": 1.5213708932495118,
+ "train_acc": 0.57622,
+ "test_loss": 2.1178235721588137,
+ "test_acc": 0.4665,
+ "lyapunov": null,
+ "grad_norm": 1.5137971406754955,
+ "grad_max_sv": 0.7158914238214493,
+ "grad_min_sv": 2.8684351333074785e-08,
+ "grad_condition": 31997486.936446648,
+ "lr": 0.0009755282581475766,
+ "time_sec": 15.4898362159729
+ },
+ {
+ "epoch": 16,
+ "train_loss": 1.466670620689392,
+ "train_acc": 0.58748,
+ "test_loss": 1.9707215017318727,
+ "test_acc": 0.4909,
+ "lyapunov": null,
+ "grad_norm": 1.4598686481318373,
+ "grad_max_sv": 0.6799994811415673,
+ "grad_min_sv": 2.748090726922836e-08,
+ "grad_condition": 67712877.74998799,
+ "lr": 0.0009721881851187403,
+ "time_sec": 15.463284254074097
+ },
+ {
+ "epoch": 17,
+ "train_loss": 1.4266776397705079,
+ "train_acc": 0.60022,
+ "test_loss": 1.9578287740707399,
+ "test_acc": 0.496,
+ "lyapunov": null,
+ "grad_norm": 1.4163199382153222,
+ "grad_max_sv": 0.6607045501470565,
+ "grad_min_sv": 2.6701706835885463e-08,
+ "grad_condition": 69925020.646238,
+ "lr": 0.0009686409947459456,
+ "time_sec": 15.465324878692627
+ },
+ {
+ "epoch": 18,
+ "train_loss": 1.3868621417999267,
+ "train_acc": 0.61008,
+ "test_loss": 1.8873281810760498,
+ "test_acc": 0.5122,
+ "lyapunov": null,
+ "grad_norm": 1.3780415134056272,
+ "grad_max_sv": 0.6475953251123429,
+ "grad_min_sv": 2.629753427935144e-08,
+ "grad_condition": 71849203.49105962,
+ "lr": 0.0009648882429441254,
+ "time_sec": 15.476778745651245
+ },
+ {
+ "epoch": 19,
+ "train_loss": 1.3300997947692872,
+ "train_acc": 0.6208,
+ "test_loss": 1.8625336185455321,
+ "test_acc": 0.5163,
+ "lyapunov": null,
+ "grad_norm": 1.3376016965348547,
+ "grad_max_sv": 0.6296016126871109,
+ "grad_min_sv": 2.534474096427264e-08,
+ "grad_condition": 40912774.4949669,
+ "lr": 0.00096093157579425,
+ "time_sec": 15.47281002998352
+ },
+ {
+ "epoch": 20,
+ "train_loss": 1.2915953662490844,
+ "train_acc": 0.6313,
+ "test_loss": 1.88144536113739,
+ "test_acc": 0.5061,
+ "lyapunov": null,
+ "grad_norm": 1.3064427354934414,
+ "grad_max_sv": 0.5868082754313946,
+ "grad_min_sv": 2.44614505123808e-08,
+ "grad_condition": 40190101.53190343,
+ "lr": 0.0009567727288213001,
+ "time_sec": 15.473944902420044
+ },
+ {
+ "epoch": 21,
+ "train_loss": 1.2615811933898926,
+ "train_acc": 0.63936,
+ "test_loss": 2.138494786453247,
+ "test_acc": 0.4639,
+ "lyapunov": null,
+ "grad_norm": 1.2742362971746195,
+ "grad_max_sv": 0.577499034255743,
+ "grad_min_sv": 2.428454916880707e-08,
+ "grad_condition": 34685614.15402056,
+ "lr": 0.0009524135262330095,
+ "time_sec": 15.476754188537598
+ },
+ {
+ "epoch": 22,
+ "train_loss": 1.2293620531463623,
+ "train_acc": 0.6453,
+ "test_loss": 1.8758944011688232,
+ "test_acc": 0.5147,
+ "lyapunov": null,
+ "grad_norm": 1.252289309007294,
+ "grad_max_sv": 0.570976011455059,
+ "grad_min_sv": 2.3561374129510426e-08,
+ "grad_condition": 48751943.11700691,
+ "lr": 0.0009478558801197061,
+ "time_sec": 15.473217487335205
+ },
+ {
+ "epoch": 23,
+ "train_loss": 1.1897959590911866,
+ "train_acc": 0.65626,
+ "test_loss": 1.8954246566772461,
+ "test_acc": 0.5211,
+ "lyapunov": null,
+ "grad_norm": 1.2259155434497018,
+ "grad_max_sv": 0.5599369831383229,
+ "grad_min_sv": 2.2801355227530795e-08,
+ "grad_condition": 52092903.5694242,
+ "lr": 0.000943101789615607,
+ "time_sec": 15.473440170288086
+ },
+ {
+ "epoch": 24,
+ "train_loss": 1.1551566465377807,
+ "train_acc": 0.665,
+ "test_loss": 1.896939277267456,
+ "test_acc": 0.5226,
+ "lyapunov": null,
+ "grad_norm": 1.2022612803404449,
+ "grad_max_sv": 0.5331769093871117,
+ "grad_min_sv": 2.2077526620062348e-08,
+ "grad_condition": 154376470.85049906,
+ "lr": 0.0009381533400219313,
+ "time_sec": 15.473422765731812
+ },
+ {
+ "epoch": 25,
+ "train_loss": 1.13716111492157,
+ "train_acc": 0.66968,
+ "test_loss": 1.9673876178741454,
+ "test_acc": 0.5073,
+ "lyapunov": null,
+ "grad_norm": 1.1814644477570717,
+ "grad_max_sv": 0.5192016668617725,
+ "grad_min_sv": 2.207178118607267e-08,
+ "grad_condition": 32052263.833083443,
+ "lr": 0.0009330127018922189,
+ "time_sec": 15.463173151016235
+ },
+ {
+ "epoch": 26,
+ "train_loss": 1.0986487645339966,
+ "train_acc": 0.6787,
+ "test_loss": 1.7822764610290527,
+ "test_acc": 0.5433,
+ "lyapunov": null,
+ "grad_norm": 1.1543031476624748,
+ "grad_max_sv": 0.5173374325037002,
+ "grad_min_sv": 2.149504294557403e-08,
+ "grad_condition": 47084637.545989394,
+ "lr": 0.000927682130080253,
+ "time_sec": 15.460694313049316
+ },
+ {
+ "epoch": 27,
+ "train_loss": 1.0663320102691651,
+ "train_acc": 0.6865,
+ "test_loss": 1.8293514751434325,
+ "test_acc": 0.533,
+ "lyapunov": null,
+ "grad_norm": 1.1345054831803263,
+ "grad_max_sv": 0.4966191992163658,
+ "grad_min_sv": 2.08524984349201e-08,
+ "grad_condition": 45914156.60470325,
+ "lr": 0.0009221639627510072,
+ "time_sec": 15.467730045318604
+ },
+ {
+ "epoch": 28,
+ "train_loss": 1.0501069176864624,
+ "train_acc": 0.68934,
+ "test_loss": 2.0238259536743164,
+ "test_acc": 0.5084,
+ "lyapunov": null,
+ "grad_norm": 1.1176238593171397,
+ "grad_max_sv": 0.489936176687479,
+ "grad_min_sv": 2.0258219826652103e-08,
+ "grad_condition": 52549899.42960344,
+ "lr": 0.0009164606203550494,
+ "time_sec": 15.526809692382812
+ },
+ {
+ "epoch": 29,
+ "train_loss": 1.0180758087921142,
+ "train_acc": 0.69862,
+ "test_loss": 1.8129717712402345,
+ "test_acc": 0.5511,
+ "lyapunov": null,
+ "grad_norm": 1.0978329669563418,
+ "grad_max_sv": 0.49835110902786256,
+ "grad_min_sv": 2.0405637433853347e-08,
+ "grad_condition": 716037506.8371468,
+ "lr": 0.0009105746045668516,
+ "time_sec": 15.492526054382324
+ },
+ {
+ "epoch": 30,
+ "train_loss": 0.9951805596923828,
+ "train_acc": 0.7055,
+ "test_loss": 1.746192921257019,
+ "test_acc": 0.5623,
+ "lyapunov": null,
+ "grad_norm": 1.0796441895567979,
+ "grad_max_sv": 0.47773563787341117,
+ "grad_min_sv": 1.9923237732071692e-08,
+ "grad_condition": 316108467.8828658,
+ "lr": 0.0009045084971874733,
+ "time_sec": 15.470518827438354
+ },
+ {
+ "epoch": 31,
+ "train_loss": 0.9780883857536316,
+ "train_acc": 0.70904,
+ "test_loss": 1.7732117160797118,
+ "test_acc": 0.558,
+ "lyapunov": null,
+ "grad_norm": 1.0645091607080823,
+ "grad_max_sv": 0.46556121930480004,
+ "grad_min_sv": 1.9688543108527246e-08,
+ "grad_condition": 174238515.18129045,
+ "lr": 0.0008982649590120977,
+ "time_sec": 15.477237224578857
+ },
+ {
+ "epoch": 32,
+ "train_loss": 0.9519822745513916,
+ "train_acc": 0.71686,
+ "test_loss": 1.7432144353866577,
+ "test_acc": 0.5575,
+ "lyapunov": null,
+ "grad_norm": 1.0432923508174365,
+ "grad_max_sv": 0.46001894399523735,
+ "grad_min_sv": 1.928787157004508e-08,
+ "grad_condition": 84996179.20525053,
+ "lr": 0.0008918467286629196,
+ "time_sec": 15.482601881027222
+ },
+ {
+ "epoch": 33,
+ "train_loss": 0.9250898433685303,
+ "train_acc": 0.7218,
+ "test_loss": 1.7904945095062257,
+ "test_acc": 0.556,
+ "lyapunov": null,
+ "grad_norm": 1.0314496073989632,
+ "grad_max_sv": 0.45169909074902537,
+ "grad_min_sv": 1.9128463927403638e-08,
+ "grad_condition": 68691111.76926772,
+ "lr": 0.0008852566213878943,
+ "time_sec": 15.519761800765991
+ },
+ {
+ "epoch": 34,
+ "train_loss": 0.9152010176086426,
+ "train_acc": 0.72778,
+ "test_loss": 1.835019757270813,
+ "test_acc": 0.5553,
+ "lyapunov": null,
+ "grad_norm": 1.0226948793120243,
+ "grad_max_sv": 0.44521483927965166,
+ "grad_min_sv": 1.8672882064196816e-08,
+ "grad_condition": 72631593.89558022,
+ "lr": 0.000878497527825878,
+ "time_sec": 15.492830753326416
+ },
+ {
+ "epoch": 35,
+ "train_loss": 0.8909054629325867,
+ "train_acc": 0.72998,
+ "test_loss": 1.8686577810287475,
+ "test_acc": 0.5431,
+ "lyapunov": null,
+ "grad_norm": 1.0060209353905554,
+ "grad_max_sv": 0.428337212651968,
+ "grad_min_sv": 1.8221278065555514e-08,
+ "grad_condition": 54925799.50217812,
+ "lr": 0.000871572412738697,
+ "time_sec": 15.495248556137085
+ },
+ {
+ "epoch": 36,
+ "train_loss": 0.8669569097518921,
+ "train_acc": 0.7396,
+ "test_loss": 1.8778275032043457,
+ "test_acc": 0.5506,
+ "lyapunov": null,
+ "grad_norm": 0.9935254761598353,
+ "grad_max_sv": 0.42610192447900774,
+ "grad_min_sv": 1.789830566673034e-08,
+ "grad_condition": 65521171.05971684,
+ "lr": 0.0008644843137107055,
+ "time_sec": 15.501812219619751
+ },
+ {
+ "epoch": 37,
+ "train_loss": 0.8407849538421631,
+ "train_acc": 0.74404,
+ "test_loss": 1.884768021965027,
+ "test_acc": 0.5558,
+ "lyapunov": null,
+ "grad_norm": 0.983358047025113,
+ "grad_max_sv": 0.429234990477562,
+ "grad_min_sv": 1.8252723432699015e-08,
+ "grad_condition": 312919609.17862236,
+ "lr": 0.0008572363398164014,
+ "time_sec": 15.485287427902222
+ },
+ {
+ "epoch": 38,
+ "train_loss": 0.8223714313125611,
+ "train_acc": 0.74734,
+ "test_loss": 1.8372897932052612,
+ "test_acc": 0.5581,
+ "lyapunov": null,
+ "grad_norm": 0.9730686293969507,
+ "grad_max_sv": 0.43215164765715597,
+ "grad_min_sv": 1.805779136082597e-08,
+ "grad_condition": 111631952.08398516,
+ "lr": 0.0008498316702566826,
+ "time_sec": 15.495893239974976
+ },
+ {
+ "epoch": 39,
+ "train_loss": 0.8224841629219055,
+ "train_acc": 0.7495,
+ "test_loss": 1.8123548791885375,
+ "test_acc": 0.5623,
+ "lyapunov": null,
+ "grad_norm": 0.9689754376402935,
+ "grad_max_sv": 0.41914472356438637,
+ "grad_min_sv": 1.7533556316562392e-08,
+ "grad_condition": 50149472.40203967,
+ "lr": 0.0008422735529643442,
+ "time_sec": 15.51100492477417
+ },
+ {
+ "epoch": 40,
+ "train_loss": 0.8005770356750488,
+ "train_acc": 0.75588,
+ "test_loss": 1.9014682191848755,
+ "test_acc": 0.5541,
+ "lyapunov": null,
+ "grad_norm": 0.9508080469971997,
+ "grad_max_sv": 0.42388487085700033,
+ "grad_min_sv": 1.762832624032859e-08,
+ "grad_condition": 346358468.0799734,
+ "lr": 0.0008345653031794289,
+ "time_sec": 15.498661279678345
+ },
+ {
+ "epoch": 41,
+ "train_loss": 0.7747948072814942,
+ "train_acc": 0.76342,
+ "test_loss": 1.8567888566970825,
+ "test_acc": 0.5642,
+ "lyapunov": null,
+ "grad_norm": 0.9372391115065106,
+ "grad_max_sv": 0.4081222198903561,
+ "grad_min_sv": 1.7018125511580885e-08,
+ "grad_condition": 61876276.47604829,
+ "lr": 0.0008267103019950526,
+ "time_sec": 15.5028657913208
+ },
+ {
+ "epoch": 42,
+ "train_loss": 0.7694620947647095,
+ "train_acc": 0.76502,
+ "test_loss": 1.8408411359786987,
+ "test_acc": 0.5591,
+ "lyapunov": null,
+ "grad_norm": 0.9326717735984488,
+ "grad_max_sv": 0.41085106804966925,
+ "grad_min_sv": 1.7216302598821454e-08,
+ "grad_condition": 43901470.16833824,
+ "lr": 0.0008187119948743447,
+ "time_sec": 15.496897459030151
+ },
+ {
+ "epoch": 43,
+ "train_loss": 0.7424543988418579,
+ "train_acc": 0.77306,
+ "test_loss": 1.809230382347107,
+ "test_acc": 0.571,
+ "lyapunov": null,
+ "grad_norm": 0.9131307159835452,
+ "grad_max_sv": 0.40560107976198195,
+ "grad_min_sv": 1.6559755318563962e-08,
+ "grad_condition": 374063353.4207941,
+ "lr": 0.000810573890139155,
+ "time_sec": 15.487475872039795
+ },
+ {
+ "epoch": 44,
+ "train_loss": 0.7239759206962585,
+ "train_acc": 0.77538,
+ "test_loss": 1.7808053987503052,
+ "test_acc": 0.5793,
+ "lyapunov": null,
+ "grad_norm": 0.9060005234187932,
+ "grad_max_sv": 0.39045327603816987,
+ "grad_min_sv": 1.6347653778933656e-08,
+ "grad_condition": 175023718.92676198,
+ "lr": 0.0008022995574311873,
+ "time_sec": 15.478513240814209
+ },
+ {
+ "epoch": 45,
+ "train_loss": 0.709962793712616,
+ "train_acc": 0.77894,
+ "test_loss": 1.9501771980285645,
+ "test_acc": 0.5602,
+ "lyapunov": null,
+ "grad_norm": 0.8987907360568149,
+ "grad_max_sv": 0.39080821722745895,
+ "grad_min_sv": 1.634847552334229e-08,
+ "grad_condition": 38169444.05614711,
+ "lr": 0.0007938926261462363,
+ "time_sec": 15.49375057220459
+ },
+ {
+ "epoch": 46,
+ "train_loss": 0.7000335352516174,
+ "train_acc": 0.78202,
+ "test_loss": 1.9276861065864563,
+ "test_acc": 0.563,
+ "lyapunov": null,
+ "grad_norm": 0.8939654390908522,
+ "grad_max_sv": 0.3900447376072407,
+ "grad_min_sv": 1.6118415283213062e-08,
+ "grad_condition": 201079781.287968,
+ "lr": 0.0007853567838422158,
+ "time_sec": 15.506261825561523
+ },
+ {
+ "epoch": 47,
+ "train_loss": 0.6843666355323792,
+ "train_acc": 0.78712,
+ "test_loss": 1.8863512687683106,
+ "test_acc": 0.5648,
+ "lyapunov": null,
+ "grad_norm": 0.8860846821543104,
+ "grad_max_sv": 0.38012751266360284,
+ "grad_min_sv": 1.5984218158706515e-08,
+ "grad_condition": 363331609.5318787,
+ "lr": 0.0007766957746216719,
+ "time_sec": 15.481945991516113
+ },
+ {
+ "epoch": 48,
+ "train_loss": 0.6651840719032288,
+ "train_acc": 0.79232,
+ "test_loss": 1.826128447341919,
+ "test_acc": 0.5815,
+ "lyapunov": null,
+ "grad_norm": 0.8702032066364243,
+ "grad_max_sv": 0.37026465982198714,
+ "grad_min_sv": 1.544788876539638e-08,
+ "grad_condition": 1805163796.8757565,
+ "lr": 0.0007679133974894982,
+ "time_sec": 15.52286958694458
+ },
+ {
+ "epoch": 49,
+ "train_loss": 0.6528418668937683,
+ "train_acc": 0.79534,
+ "test_loss": 1.8805492639541626,
+ "test_acc": 0.5748,
+ "lyapunov": null,
+ "grad_norm": 0.8668040159369109,
+ "grad_max_sv": 0.3801993615925312,
+ "grad_min_sv": 1.5647269831914333e-08,
+ "grad_condition": 52007972.99755625,
+ "lr": 0.000759013504686565,
+ "time_sec": 15.518036127090454
+ },
+ {
+ "epoch": 50,
+ "train_loss": 0.6436834973526001,
+ "train_acc": 0.7997,
+ "test_loss": 1.793442686843872,
+ "test_acc": 0.5833,
+ "lyapunov": null,
+ "grad_norm": 0.8597198609492746,
+ "grad_max_sv": 0.37670152857899664,
+ "grad_min_sv": 1.5507358382387677e-08,
+ "grad_condition": 427721692.1185082,
+ "lr": 0.0007499999999999998,
+ "time_sec": 15.534092426300049
+ },
+ {
+ "epoch": 51,
+ "train_loss": 0.6239418637657166,
+ "train_acc": 0.80486,
+ "test_loss": 1.9321050287246704,
+ "test_acc": 0.5702,
+ "lyapunov": null,
+ "grad_norm": 0.8414343547264628,
+ "grad_max_sv": 0.3712430141866207,
+ "grad_min_sv": 1.5363422166663614e-08,
+ "grad_condition": 365943262.8213007,
+ "lr": 0.0007408768370508575,
+ "time_sec": 15.527155876159668
+ },
+ {
+ "epoch": 52,
+ "train_loss": 0.6170344979095459,
+ "train_acc": 0.80566,
+ "test_loss": 1.7804856214523315,
+ "test_acc": 0.588,
+ "lyapunov": null,
+ "grad_norm": 0.8457147724415158,
+ "grad_max_sv": 0.36000491231679915,
+ "grad_min_sv": 1.510340268962018e-08,
+ "grad_condition": 55532260.257321715,
+ "lr": 0.0007316480175599307,
+ "time_sec": 15.508218765258789
+ },
+ {
+ "epoch": 53,
+ "train_loss": 0.6110373974990845,
+ "train_acc": 0.8104,
+ "test_loss": 2.008984780883789,
+ "test_acc": 0.5633,
+ "lyapunov": null,
+ "grad_norm": 0.8288727311238714,
+ "grad_max_sv": 0.3595147252082825,
+ "grad_min_sv": 1.5030111735758744e-08,
+ "grad_condition": 51249181.30750112,
+ "lr": 0.0007223175895924635,
+ "time_sec": 15.506837129592896
+ },
+ {
+ "epoch": 54,
+ "train_loss": 0.5891339810752869,
+ "train_acc": 0.81566,
+ "test_loss": 1.8466287677764892,
+ "test_acc": 0.578,
+ "lyapunov": null,
+ "grad_norm": 0.8213597411734475,
+ "grad_max_sv": 0.3565825395286083,
+ "grad_min_sv": 1.4749719501978495e-08,
+ "grad_condition": 570713779.6923382,
+ "lr": 0.0007128896457825361,
+ "time_sec": 15.501415491104126
+ },
+ {
+ "epoch": 55,
+ "train_loss": 0.5801966732025147,
+ "train_acc": 0.81848,
+ "test_loss": 1.8548430694580078,
+ "test_acc": 0.5809,
+ "lyapunov": null,
+ "grad_norm": 0.815116092241223,
+ "grad_max_sv": 0.36071729883551595,
+ "grad_min_sv": 1.4880934259310642e-08,
+ "grad_condition": 334242266.9087108,
+ "lr": 0.0007033683215378998,
+ "time_sec": 15.510899066925049
+ },
+ {
+ "epoch": 56,
+ "train_loss": 0.569889211063385,
+ "train_acc": 0.82134,
+ "test_loss": 1.8169442867279053,
+ "test_acc": 0.5857,
+ "lyapunov": null,
+ "grad_norm": 0.8134294920256526,
+ "grad_max_sv": 0.3643924631178379,
+ "grad_min_sv": 1.5098616617734152e-08,
+ "grad_condition": 592439727.9387308,
+ "lr": 0.0006937577932260512,
+ "time_sec": 15.496611595153809
+ },
+ {
+ "epoch": 57,
+ "train_loss": 0.5602374402427673,
+ "train_acc": 0.82158,
+ "test_loss": 1.915207731628418,
+ "test_acc": 0.5802,
+ "lyapunov": null,
+ "grad_norm": 0.8103201963167868,
+ "grad_max_sv": 0.3596944443881512,
+ "grad_min_sv": 1.4392631711435122e-08,
+ "grad_condition": 84052786.33799395,
+ "lr": 0.0006840622763423388,
+ "time_sec": 15.500912427902222
+ },
+ {
+ "epoch": 58,
+ "train_loss": 0.5363558686447144,
+ "train_acc": 0.83006,
+ "test_loss": 1.9087711734771728,
+ "test_acc": 0.579,
+ "lyapunov": null,
+ "grad_norm": 0.7940934690943876,
+ "grad_max_sv": 0.3485556967556477,
+ "grad_min_sv": 1.4054249935363528e-08,
+ "grad_condition": 99578456.52402398,
+ "lr": 0.0006742860236609073,
+ "time_sec": 15.499320268630981
+ },
+ {
+ "epoch": 59,
+ "train_loss": 0.5240596619415283,
+ "train_acc": 0.83386,
+ "test_loss": 1.8847876579284668,
+ "test_acc": 0.5849,
+ "lyapunov": null,
+ "grad_norm": 0.7848942902344976,
+ "grad_max_sv": 0.3444338757544756,
+ "grad_min_sv": 1.4203639615807326e-08,
+ "grad_condition": 1006017198.7685986,
+ "lr": 0.0006644333233692913,
+ "time_sec": 15.51360535621643
+ },
+ {
+ "epoch": 60,
+ "train_loss": 0.5250089431381225,
+ "train_acc": 0.83314,
+ "test_loss": 1.8497852947235107,
+ "test_acc": 0.5934,
+ "lyapunov": null,
+ "grad_norm": 0.78894564972248,
+ "grad_max_sv": 0.35073093622922896,
+ "grad_min_sv": 1.3935465524236857e-08,
+ "grad_condition": 88013656.03250492,
+ "lr": 0.0006545084971874734,
+ "time_sec": 15.508491516113281
+ },
+ {
+ "epoch": 61,
+ "train_loss": 0.5165614600944519,
+ "train_acc": 0.83506,
+ "test_loss": 1.8630810359954835,
+ "test_acc": 0.5874,
+ "lyapunov": null,
+ "grad_norm": 0.7829768565092297,
+ "grad_max_sv": 0.3336628802120686,
+ "grad_min_sv": 1.3946549117481444e-08,
+ "grad_condition": 180242934.78653836,
+ "lr": 0.0006445158984722354,
+ "time_sec": 15.503038167953491
+ },
+ {
+ "epoch": 62,
+ "train_loss": 0.500950801115036,
+ "train_acc": 0.83966,
+ "test_loss": 1.8171254947662354,
+ "test_acc": 0.5999,
+ "lyapunov": null,
+ "grad_norm": 0.7677509624143988,
+ "grad_max_sv": 0.3256234541535378,
+ "grad_min_sv": 1.3750762319075793e-08,
+ "grad_condition": 64445933.52390041,
+ "lr": 0.0006344599103076324,
+ "time_sec": 15.505617618560791
+ },
+ {
+ "epoch": 63,
+ "train_loss": 0.48925278188705446,
+ "train_acc": 0.84414,
+ "test_loss": 1.9641206827163695,
+ "test_acc": 0.5824,
+ "lyapunov": null,
+ "grad_norm": 0.7625502199233959,
+ "grad_max_sv": 0.3294233627617359,
+ "grad_min_sv": 1.32725306221243e-08,
+ "grad_condition": 1228963257.7671177,
+ "lr": 0.0006243449435824269,
+ "time_sec": 15.529828071594238
+ },
+ {
+ "epoch": 64,
+ "train_loss": 0.48350829057693484,
+ "train_acc": 0.84334,
+ "test_loss": 1.9596610692977905,
+ "test_acc": 0.5774,
+ "lyapunov": null,
+ "grad_norm": 0.7632750006619222,
+ "grad_max_sv": 0.3282707162201405,
+ "grad_min_sv": 1.3222439235009708e-08,
+ "grad_condition": 124220191.9706742,
+ "lr": 0.0006141754350553275,
+ "time_sec": 15.521306037902832
+ },
+ {
+ "epoch": 65,
+ "train_loss": 0.4709274704360962,
+ "train_acc": 0.84992,
+ "test_loss": 1.8849371217727662,
+ "test_acc": 0.5929,
+ "lyapunov": null,
+ "grad_norm": 0.7514320426924211,
+ "grad_max_sv": 0.3312883138656616,
+ "grad_min_sv": 1.352077347374636e-08,
+ "grad_condition": 135157839.23060852,
+ "lr": 0.0006039558454088793,
+ "time_sec": 15.500089168548584
+ },
+ {
+ "epoch": 66,
+ "train_loss": 0.4579773247909546,
+ "train_acc": 0.85246,
+ "test_loss": 1.9383041584968568,
+ "test_acc": 0.5795,
+ "lyapunov": null,
+ "grad_norm": 0.7398296341112965,
+ "grad_max_sv": 0.32728378027677535,
+ "grad_min_sv": 1.3280565344621006e-08,
+ "grad_condition": 870917269.6899513,
+ "lr": 0.000593690657292862,
+ "time_sec": 15.498245477676392
+ },
+ {
+ "epoch": 67,
+ "train_loss": 0.4509772509765625,
+ "train_acc": 0.85632,
+ "test_loss": 1.9290270626068116,
+ "test_acc": 0.5832,
+ "lyapunov": null,
+ "grad_norm": 0.733532607565585,
+ "grad_max_sv": 0.3176191322505474,
+ "grad_min_sv": 1.2820620155827924e-08,
+ "grad_condition": 563528143.6689861,
+ "lr": 0.0005833843733580507,
+ "time_sec": 15.513327360153198
+ },
+ {
+ "epoch": 68,
+ "train_loss": 0.44296426357269286,
+ "train_acc": 0.85874,
+ "test_loss": 1.9557575977325439,
+ "test_acc": 0.5895,
+ "lyapunov": null,
+ "grad_norm": 0.7313567414469692,
+ "grad_max_sv": 0.3311334565281868,
+ "grad_min_sv": 1.299003317134506e-08,
+ "grad_condition": 57636313.192167915,
+ "lr": 0.0005730415142812054,
+ "time_sec": 15.521730422973633
+ },
+ {
+ "epoch": 69,
+ "train_loss": 0.43896515016555787,
+ "train_acc": 0.85892,
+ "test_loss": 1.960878660583496,
+ "test_acc": 0.5868,
+ "lyapunov": null,
+ "grad_norm": 0.7340093422433535,
+ "grad_max_sv": 0.3193955574184656,
+ "grad_min_sv": 1.2791151784291576e-08,
+ "grad_condition": 100597916.68063782,
+ "lr": 0.0005626666167821517,
+ "time_sec": 15.51311707496643
+ },
+ {
+ "epoch": 70,
+ "train_loss": 0.4285468480491638,
+ "train_acc": 0.86298,
+ "test_loss": 1.9584955738067626,
+ "test_acc": 0.591,
+ "lyapunov": null,
+ "grad_norm": 0.7244061253185728,
+ "grad_max_sv": 0.31838734485208986,
+ "grad_min_sv": 1.2623370689458097e-08,
+ "grad_condition": 256671325.86986813,
+ "lr": 0.0005522642316338265,
+ "time_sec": 15.545679569244385
+ },
+ {
+ "epoch": 71,
+ "train_loss": 0.4232082028102875,
+ "train_acc": 0.863,
+ "test_loss": 1.9168709438323974,
+ "test_acc": 0.5946,
+ "lyapunov": null,
+ "grad_norm": 0.7235116987420683,
+ "grad_max_sv": 0.3361910209059715,
+ "grad_min_sv": 1.3065330882943912e-08,
+ "grad_condition": 539616293.1861387,
+ "lr": 0.0005418389216661573,
+ "time_sec": 15.529778480529785
+ },
+ {
+ "epoch": 72,
+ "train_loss": 0.40893464082717895,
+ "train_acc": 0.8671,
+ "test_loss": 1.9778603734970093,
+ "test_acc": 0.5917,
+ "lyapunov": null,
+ "grad_norm": 0.7120788606908913,
+ "grad_max_sv": 0.3133332245051861,
+ "grad_min_sv": 1.2864244934573943e-08,
+ "grad_condition": 599875620.9980721,
+ "lr": 0.0005313952597646563,
+ "time_sec": 15.501370429992676
+ },
+ {
+ "epoch": 73,
+ "train_loss": 0.4073019913864136,
+ "train_acc": 0.86922,
+ "test_loss": 1.8993178993225097,
+ "test_acc": 0.6036,
+ "lyapunov": null,
+ "grad_norm": 0.7054800561985982,
+ "grad_max_sv": 0.32210378982126714,
+ "grad_min_sv": 1.2598049555162874e-08,
+ "grad_condition": 609078116.1228421,
+ "lr": 0.0005209378268645994,
+ "time_sec": 15.514087915420532
+ },
+ {
+ "epoch": 74,
+ "train_loss": 0.38610194705963136,
+ "train_acc": 0.87514,
+ "test_loss": 1.9717372917175293,
+ "test_acc": 0.5877,
+ "lyapunov": null,
+ "grad_norm": 0.6876754791376803,
+ "grad_max_sv": 0.30587312653660775,
+ "grad_min_sv": 1.228859272620758e-08,
+ "grad_condition": 287047740.76686746,
+ "lr": 0.0005104712099416781,
+ "time_sec": 15.521286249160767
+ },
+ {
+ "epoch": 75,
+ "train_loss": 0.38415311262130736,
+ "train_acc": 0.87532,
+ "test_loss": 1.9978297256469726,
+ "test_acc": 0.5873,
+ "lyapunov": null,
+ "grad_norm": 0.6901352414114731,
+ "grad_max_sv": 0.30640832521021366,
+ "grad_min_sv": 1.2382189768650464e-08,
+ "grad_condition": 89574244.76284985,
+ "lr": 0.0004999999999999996,
+ "time_sec": 15.522554159164429
+ },
+ {
+ "epoch": 76,
+ "train_loss": 0.38036803808212283,
+ "train_acc": 0.87676,
+ "test_loss": 1.9114773050308227,
+ "test_acc": 0.5941,
+ "lyapunov": null,
+ "grad_norm": 0.6862042555811976,
+ "grad_max_sv": 0.30668022595345973,
+ "grad_min_sv": 1.2098685775799311e-08,
+ "grad_condition": 79753720.75813168,
+ "lr": 0.0004895287900583212,
+ "time_sec": 15.500049591064453
+ },
+ {
+ "epoch": 77,
+ "train_loss": 0.37699529049873354,
+ "train_acc": 0.8755,
+ "test_loss": 1.9144949556350708,
+ "test_acc": 0.6035,
+ "lyapunov": null,
+ "grad_norm": 0.6869175270134545,
+ "grad_max_sv": 0.30233032815158367,
+ "grad_min_sv": 1.210133520196388e-08,
+ "grad_condition": 86138637.5204114,
+ "lr": 0.0004790621731353997,
+ "time_sec": 15.553943395614624
+ },
+ {
+ "epoch": 78,
+ "train_loss": 0.3636139490318298,
+ "train_acc": 0.88226,
+ "test_loss": 1.9924920860290527,
+ "test_acc": 0.5927,
+ "lyapunov": null,
+ "grad_norm": 0.6711688569608495,
+ "grad_max_sv": 0.29902654588222505,
+ "grad_min_sv": 1.1863716191731766e-08,
+ "grad_condition": 88817475.8392382,
+ "lr": 0.000468604740235343,
+ "time_sec": 15.530450820922852
+ },
+ {
+ "epoch": 79,
+ "train_loss": 0.362152115983963,
+ "train_acc": 0.88426,
+ "test_loss": 1.924188154411316,
+ "test_acc": 0.598,
+ "lyapunov": null,
+ "grad_norm": 0.6714773282743005,
+ "grad_max_sv": 0.29965595006942747,
+ "grad_min_sv": 1.1964831648906583e-08,
+ "grad_condition": 902616195.7149051,
+ "lr": 0.00045816107833384175,
+ "time_sec": 15.498046636581421
+ },
+ {
+ "epoch": 80,
+ "train_loss": 0.35668459805488584,
+ "train_acc": 0.88318,
+ "test_loss": 1.9200622287750244,
+ "test_acc": 0.5961,
+ "lyapunov": null,
+ "grad_norm": 0.6691406173146984,
+ "grad_max_sv": 0.30350013412535193,
+ "grad_min_sv": 1.2079031691623194e-08,
+ "grad_condition": 208431932.92374653,
+ "lr": 0.0004477357683661729,
+ "time_sec": 15.500086307525635
+ },
+ {
+ "epoch": 81,
+ "train_loss": 0.3465567926597595,
+ "train_acc": 0.88642,
+ "test_loss": 1.9750726140975952,
+ "test_acc": 0.5909,
+ "lyapunov": null,
+ "grad_norm": 0.6600906573823067,
+ "grad_max_sv": 0.3025949317961931,
+ "grad_min_sv": 1.1841972132921319e-08,
+ "grad_condition": 833170767.4888487,
+ "lr": 0.00043733338321784746,
+ "time_sec": 15.528315544128418
+ },
+ {
+ "epoch": 82,
+ "train_loss": 0.3412511627674103,
+ "train_acc": 0.88932,
+ "test_loss": 1.9702592422485352,
+ "test_acc": 0.5983,
+ "lyapunov": null,
+ "grad_norm": 0.6534470838362898,
+ "grad_max_sv": 0.281625871360302,
+ "grad_min_sv": 1.1298424867564605e-08,
+ "grad_condition": 245256269.73618746,
+ "lr": 0.0004269584857187939,
+ "time_sec": 15.54018759727478
+ },
+ {
+ "epoch": 83,
+ "train_loss": 0.32986866790771485,
+ "train_acc": 0.89278,
+ "test_loss": 1.9833718214035034,
+ "test_acc": 0.5983,
+ "lyapunov": null,
+ "grad_norm": 0.6472964118800569,
+ "grad_max_sv": 0.2898814812302589,
+ "grad_min_sv": 1.1219894397937468e-08,
+ "grad_condition": 67348047.22944725,
+ "lr": 0.0004166156266419484,
+ "time_sec": 15.523268938064575
+ },
+ {
+ "epoch": 84,
+ "train_loss": 0.32046857831954956,
+ "train_acc": 0.89464,
+ "test_loss": 1.9931445137023927,
+ "test_acc": 0.5976,
+ "lyapunov": null,
+ "grad_norm": 0.6387491891164032,
+ "grad_max_sv": 0.2859178498387337,
+ "grad_min_sv": 1.1112689026274158e-08,
+ "grad_condition": 532191414.5407898,
+ "lr": 0.0004063093427071373,
+ "time_sec": 15.5046226978302
+ },
+ {
+ "epoch": 85,
+ "train_loss": 0.31971281969070436,
+ "train_acc": 0.89616,
+ "test_loss": 1.919898393058777,
+ "test_acc": 0.6034,
+ "lyapunov": null,
+ "grad_norm": 0.6349502290101287,
+ "grad_max_sv": 0.2895286176353693,
+ "grad_min_sv": 1.114760893840749e-08,
+ "grad_condition": 1708507357.4309907,
+ "lr": 0.0003960441545911199,
+ "time_sec": 15.50874662399292
+ },
+ {
+ "epoch": 86,
+ "train_loss": 0.314735742893219,
+ "train_acc": 0.89802,
+ "test_loss": 1.9826490537643433,
+ "test_acc": 0.6039,
+ "lyapunov": null,
+ "grad_norm": 0.6374095409599659,
+ "grad_max_sv": 0.29547037966549394,
+ "grad_min_sv": 1.1427597929134642e-08,
+ "grad_condition": 249196257.17434186,
+ "lr": 0.0003858245649446718,
+ "time_sec": 15.518042802810669
+ },
+ {
+ "epoch": 87,
+ "train_loss": 0.3056777443599701,
+ "train_acc": 0.90104,
+ "test_loss": 2.015980870628357,
+ "test_acc": 0.5982,
+ "lyapunov": null,
+ "grad_norm": 0.6267239770409858,
+ "grad_max_sv": 0.29190454818308353,
+ "grad_min_sv": 1.1234584110458944e-08,
+ "grad_condition": 1983104332.2605565,
+ "lr": 0.00037565505641757235,
+ "time_sec": 15.49971318244934
+ },
+ {
+ "epoch": 88,
+ "train_loss": 0.3044772444725037,
+ "train_acc": 0.90106,
+ "test_loss": 2.005346726799011,
+ "test_acc": 0.6026,
+ "lyapunov": null,
+ "grad_norm": 0.6293105806437898,
+ "grad_max_sv": 0.2927882194519043,
+ "grad_min_sv": 1.12210154674941e-08,
+ "grad_condition": 178904778.3418693,
+ "lr": 0.00036554008969236695,
+ "time_sec": 15.495405673980713
+ },
+ {
+ "epoch": 89,
+ "train_loss": 0.30109511434555053,
+ "train_acc": 0.90188,
+ "test_loss": 1.998448072052002,
+ "test_acc": 0.6034,
+ "lyapunov": null,
+ "grad_norm": 0.6266125109308321,
+ "grad_max_sv": 0.29103793352842333,
+ "grad_min_sv": 1.1148633635108679e-08,
+ "grad_condition": 893976917.5132227,
+ "lr": 0.0003554841015277638,
+ "time_sec": 15.50434947013855
+ },
+ {
+ "epoch": 90,
+ "train_loss": 0.28917674076080324,
+ "train_acc": 0.90682,
+ "test_loss": 1.9980867877960204,
+ "test_acc": 0.6012,
+ "lyapunov": null,
+ "grad_norm": 0.6127659289231001,
+ "grad_max_sv": 0.29112574011087416,
+ "grad_min_sv": 1.1166155032202307e-08,
+ "grad_condition": 348701496.86000526,
+ "lr": 0.000345491502812526,
+ "time_sec": 15.520820617675781
+ },
+ {
+ "epoch": 91,
+ "train_loss": 0.2823534561729431,
+ "train_acc": 0.90822,
+ "test_loss": 1.9809785503387451,
+ "test_acc": 0.6052,
+ "lyapunov": null,
+ "grad_norm": 0.606268342013339,
+ "grad_max_sv": 0.27696173191070556,
+ "grad_min_sv": 1.0846671113454859e-08,
+ "grad_condition": 248996494.78191227,
+ "lr": 0.0003355666766307081,
+ "time_sec": 15.745567321777344
+ },
+ {
+ "epoch": 92,
+ "train_loss": 0.28228991139411924,
+ "train_acc": 0.91008,
+ "test_loss": 2.0131442947387694,
+ "test_acc": 0.6001,
+ "lyapunov": null,
+ "grad_norm": 0.6064057382091922,
+ "grad_max_sv": 0.277644307166338,
+ "grad_min_sv": 1.0798128024722132e-08,
+ "grad_condition": 406311701.1258798,
+ "lr": 0.00032571397633909225,
+ "time_sec": 15.527170181274414
+ },
+ {
+ "epoch": 93,
+ "train_loss": 0.2772208102607727,
+ "train_acc": 0.91184,
+ "test_loss": 2.0510717596054078,
+ "test_acc": 0.5952,
+ "lyapunov": null,
+ "grad_norm": 0.603398829043512,
+ "grad_max_sv": 0.2785311110317707,
+ "grad_min_sv": 1.0620686785936529e-08,
+ "grad_condition": 159246942.28978306,
+ "lr": 0.00031593772365766094,
+ "time_sec": 15.521395206451416
+ },
+ {
+ "epoch": 94,
+ "train_loss": 0.2721544520187378,
+ "train_acc": 0.91266,
+ "test_loss": 2.044207299041748,
+ "test_acc": 0.5963,
+ "lyapunov": null,
+ "grad_norm": 0.597776334868791,
+ "grad_max_sv": 0.2813128184527159,
+ "grad_min_sv": 1.032634765595758e-08,
+ "grad_condition": 320344963.9972409,
+ "lr": 0.0003062422067739483,
+ "time_sec": 15.535969257354736
+ },
+ {
+ "epoch": 95,
+ "train_loss": 0.2562399788665771,
+ "train_acc": 0.91636,
+ "test_loss": 2.1072509820938112,
+ "test_acc": 0.5953,
+ "lyapunov": null,
+ "grad_norm": 0.5775561165196347,
+ "grad_max_sv": 0.27824114337563516,
+ "grad_min_sv": 1.0481623234420353e-08,
+ "grad_condition": 474004359.26671135,
+ "lr": 0.00029663167846209965,
+ "time_sec": 15.517311334609985
+ },
+ {
+ "epoch": 96,
+ "train_loss": 0.2625131010723114,
+ "train_acc": 0.9142,
+ "test_loss": 2.035417915725708,
+ "test_acc": 0.604,
+ "lyapunov": null,
+ "grad_norm": 0.5877203581399221,
+ "grad_max_sv": 0.28129979483783246,
+ "grad_min_sv": 1.0502568877773787e-08,
+ "grad_condition": 177356414.63757357,
+ "lr": 0.00028711035421746345,
+ "time_sec": 15.521276950836182
+ },
+ {
+ "epoch": 97,
+ "train_loss": 0.2552481310462952,
+ "train_acc": 0.9173,
+ "test_loss": 1.9491484304428102,
+ "test_acc": 0.6093,
+ "lyapunov": null,
+ "grad_norm": 0.5816116237706002,
+ "grad_max_sv": 0.27597419619560243,
+ "grad_min_sv": 1.0369440153409904e-08,
+ "grad_condition": 153072053.30610082,
+ "lr": 0.00027768241040753615,
+ "time_sec": 15.518199920654297
+ },
+ {
+ "epoch": 98,
+ "train_loss": 0.2514290081501007,
+ "train_acc": 0.91774,
+ "test_loss": 1.9556513019561768,
+ "test_acc": 0.6144,
+ "lyapunov": null,
+ "grad_norm": 0.5786453355425705,
+ "grad_max_sv": 0.25863444767892363,
+ "grad_min_sv": 9.982682687079137e-09,
+ "grad_condition": 323898207.1043015,
+ "lr": 0.00026835198244006903,
+ "time_sec": 15.518558025360107
+ },
+ {
+ "epoch": 99,
+ "train_loss": 0.24542429465293883,
+ "train_acc": 0.92078,
+ "test_loss": 2.0414382596969602,
+ "test_acc": 0.6093,
+ "lyapunov": null,
+ "grad_norm": 0.5720561260068352,
+ "grad_max_sv": 0.2730622936040163,
+ "grad_min_sv": 1.0236981595745931e-08,
+ "grad_condition": 73009111.50173582,
+ "lr": 0.0002591231629491421,
+ "time_sec": 15.516184568405151
+ },
+ {
+ "epoch": 100,
+ "train_loss": 0.2419339677333832,
+ "train_acc": 0.92168,
+ "test_loss": 2.0001620481491087,
+ "test_acc": 0.615,
+ "lyapunov": null,
+ "grad_norm": 0.5656963959074934,
+ "grad_max_sv": 0.2690838035196066,
+ "grad_min_sv": 1.0369351413283546e-08,
+ "grad_condition": 325100290.9819474,
+ "lr": 0.0002499999999999997,
+ "time_sec": 15.516221761703491
+ },
+ {
+ "epoch": 101,
+ "train_loss": 0.23517837069511413,
+ "train_acc": 0.92362,
+ "test_loss": 2.0624069427490235,
+ "test_acc": 0.6006,
+ "lyapunov": null,
+ "grad_norm": 0.5588551885657764,
+ "grad_max_sv": 0.26636214926838875,
+ "grad_min_sv": 9.985110372735806e-09,
+ "grad_condition": 152593330.29256034,
+ "lr": 0.00024098649531343477,
+ "time_sec": 15.525659799575806
+ },
+ {
+ "epoch": 102,
+ "train_loss": 0.23243571233749388,
+ "train_acc": 0.92494,
+ "test_loss": 2.050922277832031,
+ "test_acc": 0.6071,
+ "lyapunov": null,
+ "grad_norm": 0.555094837720988,
+ "grad_max_sv": 0.2671301085501909,
+ "grad_min_sv": 9.489460735148495e-09,
+ "grad_condition": 975172257.3566437,
+ "lr": 0.0002320866025105016,
+ "time_sec": 15.512139797210693
+ },
+ {
+ "epoch": 103,
+ "train_loss": 0.22915385756969453,
+ "train_acc": 0.92618,
+ "test_loss": 2.0090701560974122,
+ "test_acc": 0.6102,
+ "lyapunov": null,
+ "grad_norm": 0.551643622576711,
+ "grad_max_sv": 0.26358814239501954,
+ "grad_min_sv": 9.903819275135706e-09,
+ "grad_condition": 8450881945.308035,
+ "lr": 0.0002233042253783278,
+ "time_sec": 15.51590085029602
+ },
+ {
+ "epoch": 104,
+ "train_loss": 0.22301624965667724,
+ "train_acc": 0.929,
+ "test_loss": 2.0414324163436888,
+ "test_acc": 0.6097,
+ "lyapunov": null,
+ "grad_norm": 0.547361757777093,
+ "grad_max_sv": 0.2635317210108042,
+ "grad_min_sv": 9.868235632663237e-09,
+ "grad_condition": 918464158.4766433,
+ "lr": 0.000214643216157784,
+ "time_sec": 15.517698764801025
+ },
+ {
+ "epoch": 105,
+ "train_loss": 0.21800282436847687,
+ "train_acc": 0.92888,
+ "test_loss": 2.006334408760071,
+ "test_acc": 0.6108,
+ "lyapunov": null,
+ "grad_norm": 0.5441245707971135,
+ "grad_max_sv": 0.2652390133589506,
+ "grad_min_sv": 9.775255871067018e-09,
+ "grad_condition": 1728037982.0008423,
+ "lr": 0.00020610737385376332,
+ "time_sec": 15.521651268005371
+ },
+ {
+ "epoch": 106,
+ "train_loss": 0.22170533905029297,
+ "train_acc": 0.92766,
+ "test_loss": 2.0015246070861816,
+ "test_acc": 0.6151,
+ "lyapunov": null,
+ "grad_norm": 0.5504732473005655,
+ "grad_max_sv": 0.2658932194113731,
+ "grad_min_sv": 9.836566865553675e-09,
+ "grad_condition": 187622343.96039546,
+ "lr": 0.00019770044256881242,
+ "time_sec": 15.52303409576416
+ },
+ {
+ "epoch": 107,
+ "train_loss": 0.21625425663948059,
+ "train_acc": 0.92998,
+ "test_loss": 2.0188750885009767,
+ "test_acc": 0.6132,
+ "lyapunov": null,
+ "grad_norm": 0.5416895117176501,
+ "grad_max_sv": 0.25219607427716256,
+ "grad_min_sv": 9.366761803773077e-09,
+ "grad_condition": 260260509.50687146,
+ "lr": 0.0001894261098608447,
+ "time_sec": 15.538499593734741
+ },
+ {
+ "epoch": 108,
+ "train_loss": 0.20747127439498902,
+ "train_acc": 0.93344,
+ "test_loss": 1.992410384941101,
+ "test_acc": 0.6181,
+ "lyapunov": null,
+ "grad_norm": 0.5312872760984289,
+ "grad_max_sv": 0.26626099497079847,
+ "grad_min_sv": 9.742697032379816e-09,
+ "grad_condition": 241868081.8815055,
+ "lr": 0.000181288005125655,
+ "time_sec": 15.520596027374268
+ },
+ {
+ "epoch": 109,
+ "train_loss": 0.21061437376976014,
+ "train_acc": 0.93212,
+ "test_loss": 2.0430712549209593,
+ "test_acc": 0.6121,
+ "lyapunov": null,
+ "grad_norm": 0.53793437376293,
+ "grad_max_sv": 0.26196735054254533,
+ "grad_min_sv": 9.911649283440849e-09,
+ "grad_condition": 196778424.3729182,
+ "lr": 0.0001732896980049473,
+ "time_sec": 15.514817953109741
+ },
+ {
+ "epoch": 110,
+ "train_loss": 0.20801750651359557,
+ "train_acc": 0.93272,
+ "test_loss": 2.0129987867355346,
+ "test_acc": 0.6136,
+ "lyapunov": null,
+ "grad_norm": 0.5345111757966097,
+ "grad_max_sv": 0.2620788164436817,
+ "grad_min_sv": 9.685049608479378e-09,
+ "grad_condition": 442982408.6181739,
+ "lr": 0.00016543469682057076,
+ "time_sec": 15.524093389511108
+ },
+ {
+ "epoch": 111,
+ "train_loss": 0.20387941056251527,
+ "train_acc": 0.93432,
+ "test_loss": 2.017576940536499,
+ "test_acc": 0.6171,
+ "lyapunov": null,
+ "grad_norm": 0.5265383831682404,
+ "grad_max_sv": 0.2475517351180315,
+ "grad_min_sv": 9.334722057222771e-09,
+ "grad_condition": 520706944.53767884,
+ "lr": 0.00015772644703565552,
+ "time_sec": 15.520273685455322
+ },
+ {
+ "epoch": 112,
+ "train_loss": 0.20065601328372956,
+ "train_acc": 0.93514,
+ "test_loss": 2.0878772733688353,
+ "test_acc": 0.6091,
+ "lyapunov": null,
+ "grad_norm": 0.5235410807678327,
+ "grad_max_sv": 0.2556714225560427,
+ "grad_min_sv": 9.592023909182901e-09,
+ "grad_condition": 295083197.1946956,
+ "lr": 0.00015016832974331713,
+ "time_sec": 15.510764837265015
+ },
+ {
+ "epoch": 113,
+ "train_loss": 0.1982079153442383,
+ "train_acc": 0.93612,
+ "test_loss": 2.047266570854187,
+ "test_acc": 0.6181,
+ "lyapunov": null,
+ "grad_norm": 0.5197176578777744,
+ "grad_max_sv": 0.25255175642669203,
+ "grad_min_sv": 9.308845385150311e-09,
+ "grad_condition": 520055211.6428779,
+ "lr": 0.00014276366018359834,
+ "time_sec": 15.705829381942749
+ },
+ {
+ "epoch": 114,
+ "train_loss": 0.19655517510414122,
+ "train_acc": 0.93708,
+ "test_loss": 2.0292094760894774,
+ "test_acc": 0.6144,
+ "lyapunov": null,
+ "grad_norm": 0.5181527372855724,
+ "grad_max_sv": 0.25922506861388683,
+ "grad_min_sv": 9.507550523431274e-09,
+ "grad_condition": 332806274.6985155,
+ "lr": 0.00013551568628929425,
+ "time_sec": 15.525954723358154
+ },
+ {
+ "epoch": 115,
+ "train_loss": 0.18803977591514587,
+ "train_acc": 0.93928,
+ "test_loss": 2.0187850973129273,
+ "test_acc": 0.6152,
+ "lyapunov": null,
+ "grad_norm": 0.5114058292617459,
+ "grad_max_sv": 0.2462628223001957,
+ "grad_min_sv": 9.353905294090265e-09,
+ "grad_condition": 1483441837.69936,
+ "lr": 0.00012842758726130276,
+ "time_sec": 15.518154859542847
+ },
+ {
+ "epoch": 116,
+ "train_loss": 0.18797869988918303,
+ "train_acc": 0.93912,
+ "test_loss": 2.084369885826111,
+ "test_acc": 0.6095,
+ "lyapunov": null,
+ "grad_norm": 0.5077819115434521,
+ "grad_max_sv": 0.25109760873019693,
+ "grad_min_sv": 8.964496494212256e-09,
+ "grad_condition": 298276978.79912215,
+ "lr": 0.0001215024721741218,
+ "time_sec": 15.520355939865112
+ },
+ {
+ "epoch": 117,
+ "train_loss": 0.18214592965126036,
+ "train_acc": 0.94196,
+ "test_loss": 2.034072047996521,
+ "test_acc": 0.6169,
+ "lyapunov": null,
+ "grad_norm": 0.49960618612788865,
+ "grad_max_sv": 0.25671581737697124,
+ "grad_min_sv": 9.445877218535077e-09,
+ "grad_condition": 1803107586.0713096,
+ "lr": 0.00011474337861210538,
+ "time_sec": 15.5315523147583
+ },
+ {
+ "epoch": 118,
+ "train_loss": 0.18415243848800658,
+ "train_acc": 0.93992,
+ "test_loss": 2.082629474067688,
+ "test_acc": 0.6147,
+ "lyapunov": null,
+ "grad_norm": 0.5036047735021936,
+ "grad_max_sv": 0.24121248573064805,
+ "grad_min_sv": 8.989532489320911e-09,
+ "grad_condition": 1883514828.3661075,
+ "lr": 0.00010815327133708009,
+ "time_sec": 15.565385580062866
+ },
+ {
+ "epoch": 119,
+ "train_loss": 0.18069743538856506,
+ "train_acc": 0.94234,
+ "test_loss": 2.0749569414138795,
+ "test_acc": 0.6104,
+ "lyapunov": null,
+ "grad_norm": 0.4967845602516186,
+ "grad_max_sv": 0.24950436390936376,
+ "grad_min_sv": 9.221202780431564e-09,
+ "grad_condition": 275651167.2776666,
+ "lr": 0.00010173504098790182,
+ "time_sec": 15.531636476516724
+ },
+ {
+ "epoch": 120,
+ "train_loss": 0.1800184269142151,
+ "train_acc": 0.9418,
+ "test_loss": 2.063923722267151,
+ "test_acc": 0.6149,
+ "lyapunov": null,
+ "grad_norm": 0.5000634640274525,
+ "grad_max_sv": 0.2467968337237835,
+ "grad_min_sv": 9.10186292138633e-09,
+ "grad_condition": 420120780.22859687,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 15.545646905899048
+ },
+ {
+ "epoch": 121,
+ "train_loss": 0.1746319353055954,
+ "train_acc": 0.94524,
+ "test_loss": 2.031014646720886,
+ "test_acc": 0.6202,
+ "lyapunov": null,
+ "grad_norm": 0.4894634649372604,
+ "grad_max_sv": 0.24847413785755634,
+ "grad_min_sv": 9.111916768203901e-09,
+ "grad_condition": 529933823.1357336,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 15.525688648223877
+ },
+ {
+ "epoch": 122,
+ "train_loss": 0.1720413486146927,
+ "train_acc": 0.94558,
+ "test_loss": 2.0709302186965943,
+ "test_acc": 0.6107,
+ "lyapunov": null,
+ "grad_norm": 0.4872422158802626,
+ "grad_max_sv": 0.25410806462168695,
+ "grad_min_sv": 9.372779969513134e-09,
+ "grad_condition": 129683199.58735898,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 15.53614616394043
+ },
+ {
+ "epoch": 123,
+ "train_loss": 0.167387109708786,
+ "train_acc": 0.94716,
+ "test_loss": 2.04781618976593,
+ "test_acc": 0.621,
+ "lyapunov": null,
+ "grad_norm": 0.47867845277837057,
+ "grad_max_sv": 0.24308387711644172,
+ "grad_min_sv": 8.83432009590561e-09,
+ "grad_condition": 446940201.78913987,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 15.534965991973877
+ },
+ {
+ "epoch": 124,
+ "train_loss": 0.17369194811820984,
+ "train_acc": 0.9434,
+ "test_loss": 2.080777750968933,
+ "test_acc": 0.6137,
+ "lyapunov": null,
+ "grad_norm": 0.4915299120514337,
+ "grad_max_sv": 0.24491641744971276,
+ "grad_min_sv": 8.973002642667129e-09,
+ "grad_condition": 968560910.7177868,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 15.534366130828857
+ },
+ {
+ "epoch": 125,
+ "train_loss": 0.17029917016983032,
+ "train_acc": 0.94574,
+ "test_loss": 2.0687435190200807,
+ "test_acc": 0.6157,
+ "lyapunov": null,
+ "grad_norm": 0.4850020461380622,
+ "grad_max_sv": 0.24593175910413265,
+ "grad_min_sv": 8.810581337420631e-09,
+ "grad_condition": 165938611.54228717,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 15.55061674118042
+ },
+ {
+ "epoch": 126,
+ "train_loss": 0.1665445522928238,
+ "train_acc": 0.94674,
+ "test_loss": 2.0515053030014037,
+ "test_acc": 0.6187,
+ "lyapunov": null,
+ "grad_norm": 0.48056912270271285,
+ "grad_max_sv": 0.23969021812081337,
+ "grad_min_sv": 8.827286746693327e-09,
+ "grad_condition": 1743247825.2921212,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 15.531169652938843
+ },
+ {
+ "epoch": 127,
+ "train_loss": 0.16487963933944702,
+ "train_acc": 0.94836,
+ "test_loss": 2.033387902641296,
+ "test_acc": 0.6198,
+ "lyapunov": null,
+ "grad_norm": 0.47729941792361885,
+ "grad_max_sv": 0.2343486487865448,
+ "grad_min_sv": 8.995271932876748e-09,
+ "grad_condition": 606828641.3185183,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 15.539721250534058
+ },
+ {
+ "epoch": 128,
+ "train_loss": 0.16376567732810973,
+ "train_acc": 0.94834,
+ "test_loss": 2.0975912773132324,
+ "test_acc": 0.6112,
+ "lyapunov": null,
+ "grad_norm": 0.47555669561822944,
+ "grad_max_sv": 0.2403645869344473,
+ "grad_min_sv": 8.86344721578395e-09,
+ "grad_condition": 1871409158.001809,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 15.523812055587769
+ },
+ {
+ "epoch": 129,
+ "train_loss": 0.16381013206005096,
+ "train_acc": 0.94882,
+ "test_loss": 2.0344886224746705,
+ "test_acc": 0.6205,
+ "lyapunov": null,
+ "grad_norm": 0.47811068127125184,
+ "grad_max_sv": 0.2321129973977804,
+ "grad_min_sv": 8.809577021736195e-09,
+ "grad_condition": 674841641.2549579,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 15.542162656784058
+ },
+ {
+ "epoch": 130,
+ "train_loss": 0.1587965604352951,
+ "train_acc": 0.95018,
+ "test_loss": 2.039856211090088,
+ "test_acc": 0.6198,
+ "lyapunov": null,
+ "grad_norm": 0.46996704308372744,
+ "grad_max_sv": 0.24367436692118644,
+ "grad_min_sv": 8.878338260412334e-09,
+ "grad_condition": 3107522776.3953853,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 15.518379926681519
+ },
+ {
+ "epoch": 131,
+ "train_loss": 0.16415684640884398,
+ "train_acc": 0.94804,
+ "test_loss": 2.0716621114730835,
+ "test_acc": 0.6177,
+ "lyapunov": null,
+ "grad_norm": 0.477860267933493,
+ "grad_max_sv": 0.23813350014388562,
+ "grad_min_sv": 8.676938825780134e-09,
+ "grad_condition": 186204488.74284863,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 15.52889084815979
+ },
+ {
+ "epoch": 132,
+ "train_loss": 0.1586827588367462,
+ "train_acc": 0.94982,
+ "test_loss": 2.053567728805542,
+ "test_acc": 0.6199,
+ "lyapunov": null,
+ "grad_norm": 0.4697672382287586,
+ "grad_max_sv": 0.2426899142563343,
+ "grad_min_sv": 8.828440787385545e-09,
+ "grad_condition": 1012659868.4686158,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 15.524049282073975
+ },
+ {
+ "epoch": 133,
+ "train_loss": 0.15553737973690032,
+ "train_acc": 0.95082,
+ "test_loss": 2.043516174507141,
+ "test_acc": 0.6191,
+ "lyapunov": null,
+ "grad_norm": 0.4649067986135626,
+ "grad_max_sv": 0.24401309713721275,
+ "grad_min_sv": 8.961552855574292e-09,
+ "grad_condition": 1162757970.0586789,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 15.536059856414795
+ },
+ {
+ "epoch": 134,
+ "train_loss": 0.15784678574085237,
+ "train_acc": 0.9499,
+ "test_loss": 2.03684903011322,
+ "test_acc": 0.6189,
+ "lyapunov": null,
+ "grad_norm": 0.4686730421924603,
+ "grad_max_sv": 0.23595759123563767,
+ "grad_min_sv": 8.586731024010303e-09,
+ "grad_condition": 4315274102.848023,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 15.534076690673828
+ },
+ {
+ "epoch": 135,
+ "train_loss": 0.15442110489368438,
+ "train_acc": 0.95192,
+ "test_loss": 2.0882527042388914,
+ "test_acc": 0.6147,
+ "lyapunov": null,
+ "grad_norm": 0.4615131055534514,
+ "grad_max_sv": 0.2321950040757656,
+ "grad_min_sv": 8.617836743177176e-09,
+ "grad_condition": 99470014.62201284,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 15.554243803024292
+ },
+ {
+ "epoch": 136,
+ "train_loss": 0.15938658513069154,
+ "train_acc": 0.95014,
+ "test_loss": 2.0193495433807374,
+ "test_acc": 0.619,
+ "lyapunov": null,
+ "grad_norm": 0.46997706784197274,
+ "grad_max_sv": 0.24588101021945477,
+ "grad_min_sv": 8.594699345537e-09,
+ "grad_condition": 299854790.23102367,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 15.515581130981445
+ },
+ {
+ "epoch": 137,
+ "train_loss": 0.15305941107273102,
+ "train_acc": 0.95102,
+ "test_loss": 2.085107785606384,
+ "test_acc": 0.6178,
+ "lyapunov": null,
+ "grad_norm": 0.4651082031381239,
+ "grad_max_sv": 0.23546294569969178,
+ "grad_min_sv": 8.641280193082048e-09,
+ "grad_condition": 1355468630.1220336,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 15.523824691772461
+ },
+ {
+ "epoch": 138,
+ "train_loss": 0.15521952202796935,
+ "train_acc": 0.95138,
+ "test_loss": 2.05961570148468,
+ "test_acc": 0.621,
+ "lyapunov": null,
+ "grad_norm": 0.4655707979434113,
+ "grad_max_sv": 0.22249948792159557,
+ "grad_min_sv": 8.559314398871517e-09,
+ "grad_condition": 523110775.45855033,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 15.527312755584717
+ },
+ {
+ "epoch": 139,
+ "train_loss": 0.15613153836250304,
+ "train_acc": 0.94964,
+ "test_loss": 2.0917256591796876,
+ "test_acc": 0.6145,
+ "lyapunov": null,
+ "grad_norm": 0.4685524417915432,
+ "grad_max_sv": 0.23622551932930946,
+ "grad_min_sv": 8.448936071386512e-09,
+ "grad_condition": 381309760.86173236,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 15.53156852722168
+ },
+ {
+ "epoch": 140,
+ "train_loss": 0.15750930822372436,
+ "train_acc": 0.95076,
+ "test_loss": 2.0336023241043093,
+ "test_acc": 0.6231,
+ "lyapunov": null,
+ "grad_norm": 0.46956356170298885,
+ "grad_max_sv": 0.24571651183068752,
+ "grad_min_sv": 8.880518665268025e-09,
+ "grad_condition": 446576930.15414965,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 15.513741731643677
+ },
+ {
+ "epoch": 141,
+ "train_loss": 0.15634389350891112,
+ "train_acc": 0.95178,
+ "test_loss": 2.0461313623428343,
+ "test_acc": 0.6206,
+ "lyapunov": null,
+ "grad_norm": 0.4667179789960613,
+ "grad_max_sv": 0.2333354063332081,
+ "grad_min_sv": 8.735082636959725e-09,
+ "grad_condition": 2773787337.949284,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 15.527939558029175
+ },
+ {
+ "epoch": 142,
+ "train_loss": 0.1522996149158478,
+ "train_acc": 0.95188,
+ "test_loss": 2.036745939064026,
+ "test_acc": 0.6191,
+ "lyapunov": null,
+ "grad_norm": 0.45971196350477606,
+ "grad_max_sv": 0.23409303948283194,
+ "grad_min_sv": 8.654798093845651e-09,
+ "grad_condition": 899766914.5561358,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 15.528279781341553
+ },
+ {
+ "epoch": 143,
+ "train_loss": 0.15602009796380997,
+ "train_acc": 0.95086,
+ "test_loss": 2.030546005439758,
+ "test_acc": 0.6179,
+ "lyapunov": null,
+ "grad_norm": 0.46698211747670393,
+ "grad_max_sv": 0.2427021000534296,
+ "grad_min_sv": 8.880018779116672e-09,
+ "grad_condition": 2005668849.0321355,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 15.519719362258911
+ },
+ {
+ "epoch": 144,
+ "train_loss": 0.15405357198238373,
+ "train_acc": 0.95214,
+ "test_loss": 2.0480900999069216,
+ "test_acc": 0.6225,
+ "lyapunov": null,
+ "grad_norm": 0.4619783068969592,
+ "grad_max_sv": 0.24754497669637204,
+ "grad_min_sv": 9.022524723482569e-09,
+ "grad_condition": 472769507.4774891,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 15.538635015487671
+ },
+ {
+ "epoch": 145,
+ "train_loss": 0.15324831766605376,
+ "train_acc": 0.95236,
+ "test_loss": 2.0383225648880003,
+ "test_acc": 0.6217,
+ "lyapunov": null,
+ "grad_norm": 0.46106192343039926,
+ "grad_max_sv": 0.23626826107501983,
+ "grad_min_sv": 8.604992432687843e-09,
+ "grad_condition": 1211825093.7054877,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 15.542897939682007
+ },
+ {
+ "epoch": 146,
+ "train_loss": 0.15349729721069336,
+ "train_acc": 0.9521,
+ "test_loss": 2.0096838916778563,
+ "test_acc": 0.6241,
+ "lyapunov": null,
+ "grad_norm": 0.4615822267692517,
+ "grad_max_sv": 0.23966375291347503,
+ "grad_min_sv": 8.838330253866516e-09,
+ "grad_condition": 685922400.3184944,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 15.519303321838379
+ },
+ {
+ "epoch": 147,
+ "train_loss": 0.15039199693679808,
+ "train_acc": 0.95362,
+ "test_loss": 2.0573708726882933,
+ "test_acc": 0.6207,
+ "lyapunov": null,
+ "grad_norm": 0.4572591547952713,
+ "grad_max_sv": 0.2330123759806156,
+ "grad_min_sv": 8.66143673887215e-09,
+ "grad_condition": 1329748658.9084074,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 15.523812532424927
+ },
+ {
+ "epoch": 148,
+ "train_loss": 0.15033800620317458,
+ "train_acc": 0.95234,
+ "test_loss": 2.0463861759185793,
+ "test_acc": 0.6186,
+ "lyapunov": null,
+ "grad_norm": 0.45711357740306113,
+ "grad_max_sv": 0.2265869051218033,
+ "grad_min_sv": 8.489472146479878e-09,
+ "grad_condition": 764759274.1337291,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 15.51754641532898
+ },
+ {
+ "epoch": 149,
+ "train_loss": 0.15091258768081664,
+ "train_acc": 0.95256,
+ "test_loss": 2.0271072778701784,
+ "test_acc": 0.6188,
+ "lyapunov": null,
+ "grad_norm": 0.4574063447607332,
+ "grad_max_sv": 0.23711176067590714,
+ "grad_min_sv": 8.619700593825432e-09,
+ "grad_condition": 2609529945.0149875,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 15.518434286117554
+ },
+ {
+ "epoch": 150,
+ "train_loss": 0.153145382938385,
+ "train_acc": 0.95224,
+ "test_loss": 2.03473729095459,
+ "test_acc": 0.6182,
+ "lyapunov": null,
+ "grad_norm": 0.46046361312569684,
+ "grad_max_sv": 0.22179042883217334,
+ "grad_min_sv": 8.465783018335969e-09,
+ "grad_condition": 1154619433.2746358,
+ "lr": 0.0,
+ "time_sec": 15.527158737182617
+ }
+ ],
+ "8": [
+ {
+ "epoch": 1,
+ "train_loss": 4.604280056762695,
+ "train_acc": 0.06204,
+ "test_loss": 4.320657266998291,
+ "test_acc": 0.0698,
+ "lyapunov": null,
+ "grad_norm": 6.299548945029663,
+ "grad_max_sv": 5.383423590660096,
+ "grad_min_sv": 1.0969439819819016e-07,
+ "grad_condition": 135387683.66756994,
+ "lr": 0.0009998903417374227,
+ "time_sec": 32.66659903526306
+ },
+ {
+ "epoch": 2,
+ "train_loss": 3.8911869562530517,
+ "train_acc": 0.12252,
+ "test_loss": 3.901215605163574,
+ "test_acc": 0.1102,
+ "lyapunov": null,
+ "grad_norm": 4.7289084274834625,
+ "grad_max_sv": 4.045294773578644,
+ "grad_min_sv": 8.59628614957586e-08,
+ "grad_condition": 54316925.08787592,
+ "lr": 0.0009995614150494292,
+ "time_sec": 32.55902910232544
+ },
+ {
+ "epoch": 3,
+ "train_loss": 3.5447918058776855,
+ "train_acc": 0.16864,
+ "test_loss": 3.5751065971374514,
+ "test_acc": 0.1632,
+ "lyapunov": null,
+ "grad_norm": 3.9235192359291027,
+ "grad_max_sv": 3.218869465589523,
+ "grad_min_sv": 7.25899491738069e-08,
+ "grad_condition": 59713400.674747445,
+ "lr": 0.0009990133642141358,
+ "time_sec": 32.56558012962341
+ },
+ {
+ "epoch": 4,
+ "train_loss": 3.285915934448242,
+ "train_acc": 0.20564,
+ "test_loss": 3.4154525535583495,
+ "test_acc": 0.1808,
+ "lyapunov": null,
+ "grad_norm": 3.2931939429390655,
+ "grad_max_sv": 2.48674353659153,
+ "grad_min_sv": 6.094367343001394e-08,
+ "grad_condition": 49578785.90593137,
+ "lr": 0.0009982464296247522,
+ "time_sec": 32.57981467247009
+ },
+ {
+ "epoch": 5,
+ "train_loss": 3.049801904296875,
+ "train_acc": 0.2475,
+ "test_loss": 3.380838261413574,
+ "test_acc": 0.2067,
+ "lyapunov": null,
+ "grad_norm": 2.7585548587495836,
+ "grad_max_sv": 1.9313260614871979,
+ "grad_min_sv": 5.103909220399716e-08,
+ "grad_condition": 117086071.43576927,
+ "lr": 0.0009972609476841367,
+ "time_sec": 32.564860582351685
+ },
+ {
+ "epoch": 6,
+ "train_loss": 2.861402225112915,
+ "train_acc": 0.28052,
+ "test_loss": 3.1182963836669924,
+ "test_acc": 0.2393,
+ "lyapunov": null,
+ "grad_norm": 2.365169286939716,
+ "grad_max_sv": 1.514634570479393,
+ "grad_min_sv": 4.377452151871353e-08,
+ "grad_condition": 42685906.70361744,
+ "lr": 0.000996057350657239,
+ "time_sec": 32.57882595062256
+ },
+ {
+ "epoch": 7,
+ "train_loss": 2.683069683303833,
+ "train_acc": 0.31566,
+ "test_loss": 2.857948400115967,
+ "test_acc": 0.2899,
+ "lyapunov": null,
+ "grad_norm": 2.0678830204526424,
+ "grad_max_sv": 1.2104690104722977,
+ "grad_min_sv": 3.849874057187952e-08,
+ "grad_condition": 83742051.18670955,
+ "lr": 0.000994636166481494,
+ "time_sec": 32.585235834121704
+ },
+ {
+ "epoch": 8,
+ "train_loss": 2.5299233337402343,
+ "train_acc": 0.34444,
+ "test_loss": 3.000171680831909,
+ "test_acc": 0.2752,
+ "lyapunov": null,
+ "grad_norm": 1.874555701802065,
+ "grad_max_sv": 1.0279113829135895,
+ "grad_min_sv": 3.509024343872902e-08,
+ "grad_condition": 55390142.1353655,
+ "lr": 0.0009929980185352525,
+ "time_sec": 32.69047737121582
+ },
+ {
+ "epoch": 9,
+ "train_loss": 2.4147268306732177,
+ "train_acc": 0.3694,
+ "test_loss": 2.543715224456787,
+ "test_acc": 0.3455,
+ "lyapunov": null,
+ "grad_norm": 1.7485138229937156,
+ "grad_max_sv": 0.9131708398461342,
+ "grad_min_sv": 3.287046465294541e-08,
+ "grad_condition": 39656658.27812234,
+ "lr": 0.0009911436253643444,
+ "time_sec": 32.57169961929321
+ },
+ {
+ "epoch": 10,
+ "train_loss": 2.2967233794403077,
+ "train_acc": 0.39298,
+ "test_loss": 2.6548849906921386,
+ "test_acc": 0.3353,
+ "lyapunov": null,
+ "grad_norm": 1.6282804367899422,
+ "grad_max_sv": 0.782713083922863,
+ "grad_min_sv": 3.019940961190848e-08,
+ "grad_condition": 36873848.007240444,
+ "lr": 0.0009890738003669028,
+ "time_sec": 32.577866077423096
+ },
+ {
+ "epoch": 11,
+ "train_loss": 2.192351549682617,
+ "train_acc": 0.41852,
+ "test_loss": 2.3893451919555666,
+ "test_acc": 0.3824,
+ "lyapunov": null,
+ "grad_norm": 1.5518898048516216,
+ "grad_max_sv": 0.7297310382127762,
+ "grad_min_sv": 2.9274875311402494e-08,
+ "grad_condition": 81724146.83842216,
+ "lr": 0.00098678945143658,
+ "time_sec": 32.599745750427246
+ },
+ {
+ "epoch": 12,
+ "train_loss": 2.117909373779297,
+ "train_acc": 0.4337,
+ "test_loss": 2.522136171722412,
+ "test_acc": 0.3587,
+ "lyapunov": null,
+ "grad_norm": 1.4842631514558458,
+ "grad_max_sv": 0.66500775963068,
+ "grad_min_sv": 2.8010595395921988e-08,
+ "grad_condition": 35670339.18143847,
+ "lr": 0.0009842915805643154,
+ "time_sec": 32.62933874130249
+ },
+ {
+ "epoch": 13,
+ "train_loss": 2.035253409576416,
+ "train_acc": 0.45344,
+ "test_loss": 2.391997838592529,
+ "test_acc": 0.3805,
+ "lyapunov": null,
+ "grad_norm": 1.4422903854957079,
+ "grad_max_sv": 0.6408356204628944,
+ "grad_min_sv": 2.7295970482510425e-08,
+ "grad_condition": 43720876.000019774,
+ "lr": 0.000981581283398829,
+ "time_sec": 32.557313442230225
+ },
+ {
+ "epoch": 14,
+ "train_loss": 1.9614996997451781,
+ "train_acc": 0.46826,
+ "test_loss": 2.3329195419311524,
+ "test_acc": 0.4028,
+ "lyapunov": null,
+ "grad_norm": 1.3741944023253918,
+ "grad_max_sv": 0.6013172835111618,
+ "grad_min_sv": 2.5733794781213072e-08,
+ "grad_condition": 36069642.478253104,
+ "lr": 0.0009786597487660333,
+ "time_sec": 32.58955407142639
+ },
+ {
+ "epoch": 15,
+ "train_loss": 1.8944761297988892,
+ "train_acc": 0.48526,
+ "test_loss": 2.2367286880493165,
+ "test_acc": 0.4236,
+ "lyapunov": null,
+ "grad_norm": 1.3219592289498192,
+ "grad_max_sv": 0.5812912411987782,
+ "grad_min_sv": 2.4716666779944773e-08,
+ "grad_condition": 29281331.50836698,
+ "lr": 0.0009755282581475766,
+ "time_sec": 32.56029748916626
+ },
+ {
+ "epoch": 16,
+ "train_loss": 1.8379625350189208,
+ "train_acc": 0.49608,
+ "test_loss": 2.1963637313842774,
+ "test_acc": 0.4284,
+ "lyapunov": null,
+ "grad_norm": 1.2908175006695335,
+ "grad_max_sv": 0.5532825239002704,
+ "grad_min_sv": 2.4336655729539913e-08,
+ "grad_condition": 42358304.72716427,
+ "lr": 0.0009721881851187403,
+ "time_sec": 32.54909014701843
+ },
+ {
+ "epoch": 17,
+ "train_loss": 1.7670473766326904,
+ "train_acc": 0.51538,
+ "test_loss": 2.1328998752593993,
+ "test_acc": 0.4452,
+ "lyapunov": null,
+ "grad_norm": 1.2440997761596901,
+ "grad_max_sv": 0.5198108039796352,
+ "grad_min_sv": 2.3273317767413813e-08,
+ "grad_condition": 35998824.48422967,
+ "lr": 0.0009686409947459456,
+ "time_sec": 32.55762696266174
+ },
+ {
+ "epoch": 18,
+ "train_loss": 1.7253368561553954,
+ "train_acc": 0.52444,
+ "test_loss": 2.245950330352783,
+ "test_acc": 0.4284,
+ "lyapunov": null,
+ "grad_norm": 1.214902512911659,
+ "grad_max_sv": 0.5048692628741265,
+ "grad_min_sv": 2.2689030459988047e-08,
+ "grad_condition": 49317544.599824145,
+ "lr": 0.0009648882429441254,
+ "time_sec": 32.5514817237854
+ },
+ {
+ "epoch": 19,
+ "train_loss": 1.6694325649261474,
+ "train_acc": 0.5342,
+ "test_loss": 2.19226961517334,
+ "test_acc": 0.4387,
+ "lyapunov": null,
+ "grad_norm": 1.1750671216974986,
+ "grad_max_sv": 0.4863507993519306,
+ "grad_min_sv": 2.2075054092324244e-08,
+ "grad_condition": 97502207.70501134,
+ "lr": 0.00096093157579425,
+ "time_sec": 32.55115628242493
+ },
+ {
+ "epoch": 20,
+ "train_loss": 1.617248278427124,
+ "train_acc": 0.5473,
+ "test_loss": 2.143247143173218,
+ "test_acc": 0.453,
+ "lyapunov": null,
+ "grad_norm": 1.1445750522907119,
+ "grad_max_sv": 0.4708236537873745,
+ "grad_min_sv": 2.1383133666508236e-08,
+ "grad_condition": 30242603.347623855,
+ "lr": 0.0009567727288213001,
+ "time_sec": 32.56135654449463
+ },
+ {
+ "epoch": 21,
+ "train_loss": 1.5802922723007202,
+ "train_acc": 0.557,
+ "test_loss": 2.0990093154907226,
+ "test_acc": 0.4651,
+ "lyapunov": null,
+ "grad_norm": 1.1146123139527973,
+ "grad_max_sv": 0.45539517551660535,
+ "grad_min_sv": 2.1216313506045025e-08,
+ "grad_condition": 32120917.787080377,
+ "lr": 0.0009524135262330095,
+ "time_sec": 32.58874869346619
+ },
+ {
+ "epoch": 22,
+ "train_loss": 1.540067174949646,
+ "train_acc": 0.56592,
+ "test_loss": 2.0439955375671386,
+ "test_acc": 0.4707,
+ "lyapunov": null,
+ "grad_norm": 1.0888616623198637,
+ "grad_max_sv": 0.43293082937598226,
+ "grad_min_sv": 2.0197447772596356e-08,
+ "grad_condition": 51667507.409315005,
+ "lr": 0.0009478558801197061,
+ "time_sec": 32.57522892951965
+ },
+ {
+ "epoch": 23,
+ "train_loss": 1.5045368173980713,
+ "train_acc": 0.57686,
+ "test_loss": 2.0701497230529786,
+ "test_acc": 0.4729,
+ "lyapunov": null,
+ "grad_norm": 1.0823066547637195,
+ "grad_max_sv": 0.4348363593220711,
+ "grad_min_sv": 2.0215574525472847e-08,
+ "grad_condition": 38846769.86075296,
+ "lr": 0.000943101789615607,
+ "time_sec": 32.58562135696411
+ },
+ {
+ "epoch": 24,
+ "train_loss": 1.464451589126587,
+ "train_acc": 0.58532,
+ "test_loss": 2.2039865215301515,
+ "test_acc": 0.4486,
+ "lyapunov": null,
+ "grad_norm": 1.0523927832685198,
+ "grad_max_sv": 0.41661558151245115,
+ "grad_min_sv": 1.950878351086871e-08,
+ "grad_condition": 34416119.9412758,
+ "lr": 0.0009381533400219313,
+ "time_sec": 32.563148736953735
+ },
+ {
+ "epoch": 25,
+ "train_loss": 1.4205649266052247,
+ "train_acc": 0.59388,
+ "test_loss": 2.1708908073425293,
+ "test_acc": 0.4631,
+ "lyapunov": null,
+ "grad_norm": 1.0237955167104829,
+ "grad_max_sv": 0.41313874199986456,
+ "grad_min_sv": 1.9160673876000846e-08,
+ "grad_condition": 116069222.65926342,
+ "lr": 0.0009330127018922189,
+ "time_sec": 32.58251953125
+ },
+ {
+ "epoch": 26,
+ "train_loss": 1.3801667861938476,
+ "train_acc": 0.60904,
+ "test_loss": 2.141048712158203,
+ "test_acc": 0.4804,
+ "lyapunov": null,
+ "grad_norm": 1.003894338084706,
+ "grad_max_sv": 0.39152884259819987,
+ "grad_min_sv": 1.85417132805496e-08,
+ "grad_condition": 149070926.97039393,
+ "lr": 0.000927682130080253,
+ "time_sec": 32.58069562911987
+ },
+ {
+ "epoch": 27,
+ "train_loss": 1.3742198986053467,
+ "train_acc": 0.6049,
+ "test_loss": 2.1493278324127196,
+ "test_acc": 0.4766,
+ "lyapunov": null,
+ "grad_norm": 1.0025464883815882,
+ "grad_max_sv": 0.3876075059175491,
+ "grad_min_sv": 1.830616184195222e-08,
+ "grad_condition": 35882215.67392446,
+ "lr": 0.0009221639627510072,
+ "time_sec": 32.56836271286011
+ },
+ {
+ "epoch": 28,
+ "train_loss": 1.320306241645813,
+ "train_acc": 0.6196,
+ "test_loss": 2.1034063312530518,
+ "test_acc": 0.4844,
+ "lyapunov": null,
+ "grad_norm": 0.9735499274270826,
+ "grad_max_sv": 0.3877687506377697,
+ "grad_min_sv": 1.8286890105835564e-08,
+ "grad_condition": 335682383.9298244,
+ "lr": 0.0009164606203550494,
+ "time_sec": 32.57155418395996
+ },
+ {
+ "epoch": 29,
+ "train_loss": 1.2960155849075317,
+ "train_acc": 0.6256,
+ "test_loss": 2.1984372549057007,
+ "test_acc": 0.4692,
+ "lyapunov": null,
+ "grad_norm": 0.9613960934578316,
+ "grad_max_sv": 0.3829047717154026,
+ "grad_min_sv": 1.7720739411974938e-08,
+ "grad_condition": 36256976.72962162,
+ "lr": 0.0009105746045668516,
+ "time_sec": 32.55882430076599
+ },
+ {
+ "epoch": 30,
+ "train_loss": 1.276566519241333,
+ "train_acc": 0.62918,
+ "test_loss": 2.3138665813446044,
+ "test_acc": 0.4615,
+ "lyapunov": null,
+ "grad_norm": 0.9496542327680724,
+ "grad_max_sv": 0.37292894124984743,
+ "grad_min_sv": 1.7765610841463662e-08,
+ "grad_condition": 48990654.53726908,
+ "lr": 0.0009045084971874733,
+ "time_sec": 32.57599472999573
+ },
+ {
+ "epoch": 31,
+ "train_loss": 1.2222671955871582,
+ "train_acc": 0.64256,
+ "test_loss": 2.1691656875610352,
+ "test_acc": 0.4809,
+ "lyapunov": null,
+ "grad_norm": 0.9328591067251968,
+ "grad_max_sv": 0.3668631583452225,
+ "grad_min_sv": 1.731717505781827e-08,
+ "grad_condition": 30411660.235134684,
+ "lr": 0.0008982649590120977,
+ "time_sec": 32.56551241874695
+ },
+ {
+ "epoch": 32,
+ "train_loss": 1.2110996068191529,
+ "train_acc": 0.64794,
+ "test_loss": 2.214646379852295,
+ "test_acc": 0.4829,
+ "lyapunov": null,
+ "grad_norm": 0.930727366359918,
+ "grad_max_sv": 0.3651597030460835,
+ "grad_min_sv": 1.725773807192965e-08,
+ "grad_condition": 25901528.27644656,
+ "lr": 0.0008918467286629196,
+ "time_sec": 32.56990313529968
+ },
+ {
+ "epoch": 33,
+ "train_loss": 1.1722402347946168,
+ "train_acc": 0.6566,
+ "test_loss": 2.2246903633117676,
+ "test_acc": 0.4846,
+ "lyapunov": null,
+ "grad_norm": 0.9124985410949377,
+ "grad_max_sv": 0.35901916325092315,
+ "grad_min_sv": 1.6734816802102536e-08,
+ "grad_condition": 84184024.35994068,
+ "lr": 0.0008852566213878943,
+ "time_sec": 32.58838510513306
+ },
+ {
+ "epoch": 34,
+ "train_loss": 1.1472361179351807,
+ "train_acc": 0.66254,
+ "test_loss": 2.1493885478973387,
+ "test_acc": 0.4941,
+ "lyapunov": null,
+ "grad_norm": 0.8981676912068559,
+ "grad_max_sv": 0.34216810315847396,
+ "grad_min_sv": 1.6077876746622975e-08,
+ "grad_condition": 36468768.92296384,
+ "lr": 0.000878497527825878,
+ "time_sec": 32.57939434051514
+ },
+ {
+ "epoch": 35,
+ "train_loss": 1.1205655740356446,
+ "train_acc": 0.66956,
+ "test_loss": 2.163042925453186,
+ "test_acc": 0.4954,
+ "lyapunov": null,
+ "grad_norm": 0.8860645128225066,
+ "grad_max_sv": 0.3396616868674755,
+ "grad_min_sv": 1.607423450074308e-08,
+ "grad_condition": 144981538.90034992,
+ "lr": 0.000871572412738697,
+ "time_sec": 32.57995939254761
+ },
+ {
+ "epoch": 36,
+ "train_loss": 1.1019499723815918,
+ "train_acc": 0.67338,
+ "test_loss": 2.1101196655273435,
+ "test_acc": 0.508,
+ "lyapunov": null,
+ "grad_norm": 0.8837215741761234,
+ "grad_max_sv": 0.3453404136002064,
+ "grad_min_sv": 1.6300073393815674e-08,
+ "grad_condition": 39609134.3745661,
+ "lr": 0.0008644843137107055,
+ "time_sec": 32.610419511795044
+ },
+ {
+ "epoch": 37,
+ "train_loss": 1.0685892918777466,
+ "train_acc": 0.68264,
+ "test_loss": 2.166209588623047,
+ "test_acc": 0.5007,
+ "lyapunov": null,
+ "grad_norm": 0.8688858809651051,
+ "grad_max_sv": 0.3433241851627827,
+ "grad_min_sv": 1.6007609650054573e-08,
+ "grad_condition": 775786281.5340235,
+ "lr": 0.0008572363398164014,
+ "time_sec": 32.565879583358765
+ },
+ {
+ "epoch": 38,
+ "train_loss": 1.0574775017929077,
+ "train_acc": 0.68396,
+ "test_loss": 2.222346786689758,
+ "test_acc": 0.5,
+ "lyapunov": null,
+ "grad_norm": 0.8639145605396845,
+ "grad_max_sv": 0.3388586565852165,
+ "grad_min_sv": 1.583358475998331e-08,
+ "grad_condition": 34039562.91252621,
+ "lr": 0.0008498316702566826,
+ "time_sec": 32.57612729072571
+ },
+ {
+ "epoch": 39,
+ "train_loss": 1.0226109420394898,
+ "train_acc": 0.69532,
+ "test_loss": 2.190898861312866,
+ "test_acc": 0.502,
+ "lyapunov": null,
+ "grad_norm": 0.8542002974927076,
+ "grad_max_sv": 0.3443542592227459,
+ "grad_min_sv": 1.5959563168244095e-08,
+ "grad_condition": 59986387.77119949,
+ "lr": 0.0008422735529643442,
+ "time_sec": 32.57960486412048
+ },
+ {
+ "epoch": 40,
+ "train_loss": 1.0001259584808349,
+ "train_acc": 0.70102,
+ "test_loss": 2.25260383605957,
+ "test_acc": 0.4998,
+ "lyapunov": null,
+ "grad_norm": 0.8465843258509351,
+ "grad_max_sv": 0.33337946608662605,
+ "grad_min_sv": 1.5467166557259216e-08,
+ "grad_condition": 37113133.49315401,
+ "lr": 0.0008345653031794289,
+ "time_sec": 32.61366534233093
+ },
+ {
+ "epoch": 41,
+ "train_loss": 0.980431226234436,
+ "train_acc": 0.70476,
+ "test_loss": 2.1930856651306154,
+ "test_acc": 0.5111,
+ "lyapunov": null,
+ "grad_norm": 0.8344894111462177,
+ "grad_max_sv": 0.3344740740954876,
+ "grad_min_sv": 1.5184292248560104e-08,
+ "grad_condition": 42849773.682712145,
+ "lr": 0.0008267103019950526,
+ "time_sec": 32.604257106781006
+ },
+ {
+ "epoch": 42,
+ "train_loss": 0.9617984279251098,
+ "train_acc": 0.71146,
+ "test_loss": 2.2299947700500486,
+ "test_acc": 0.506,
+ "lyapunov": null,
+ "grad_norm": 0.8242242603947335,
+ "grad_max_sv": 0.3212660253047943,
+ "grad_min_sv": 1.4864016899610033e-08,
+ "grad_condition": 73401477.5678053,
+ "lr": 0.0008187119948743447,
+ "time_sec": 32.6293363571167
+ },
+ {
+ "epoch": 43,
+ "train_loss": 0.9384816081619263,
+ "train_acc": 0.71576,
+ "test_loss": 2.1490371479034422,
+ "test_acc": 0.5197,
+ "lyapunov": null,
+ "grad_norm": 0.8237477937232076,
+ "grad_max_sv": 0.3244126185774803,
+ "grad_min_sv": 1.494453279390906e-08,
+ "grad_condition": 58033299.26618519,
+ "lr": 0.000810573890139155,
+ "time_sec": 32.59305548667908
+ },
+ {
+ "epoch": 44,
+ "train_loss": 0.9152639833831787,
+ "train_acc": 0.72254,
+ "test_loss": 2.227645333480835,
+ "test_acc": 0.515,
+ "lyapunov": null,
+ "grad_norm": 0.8114307246954692,
+ "grad_max_sv": 0.32891099974513055,
+ "grad_min_sv": 1.470089587857909e-08,
+ "grad_condition": 187882457.4560508,
+ "lr": 0.0008022995574311873,
+ "time_sec": 32.56365776062012
+ },
+ {
+ "epoch": 45,
+ "train_loss": 0.8937730826950073,
+ "train_acc": 0.72926,
+ "test_loss": 2.257075512313843,
+ "test_acc": 0.5171,
+ "lyapunov": null,
+ "grad_norm": 0.7991066773444042,
+ "grad_max_sv": 0.310314255207777,
+ "grad_min_sv": 1.442440034638004e-08,
+ "grad_condition": 67545918.8595486,
+ "lr": 0.0007938926261462363,
+ "time_sec": 32.56998062133789
+ },
+ {
+ "epoch": 46,
+ "train_loss": 0.8821200103569031,
+ "train_acc": 0.73168,
+ "test_loss": 2.312848774147034,
+ "test_acc": 0.5052,
+ "lyapunov": null,
+ "grad_norm": 0.7987404367629951,
+ "grad_max_sv": 0.31381460800766947,
+ "grad_min_sv": 1.427665476706752e-08,
+ "grad_condition": 147171178.65022224,
+ "lr": 0.0007853567838422158,
+ "time_sec": 32.57842302322388
+ },
+ {
+ "epoch": 47,
+ "train_loss": 0.8545298266983032,
+ "train_acc": 0.73686,
+ "test_loss": 2.2923807540893555,
+ "test_acc": 0.5057,
+ "lyapunov": null,
+ "grad_norm": 0.7859231581178334,
+ "grad_max_sv": 0.31694323718547823,
+ "grad_min_sv": 1.4505229091466009e-08,
+ "grad_condition": 93313806.69758794,
+ "lr": 0.0007766957746216719,
+ "time_sec": 32.56472444534302
+ },
+ {
+ "epoch": 48,
+ "train_loss": 0.8375117244720459,
+ "train_acc": 0.74296,
+ "test_loss": 2.350985548019409,
+ "test_acc": 0.5065,
+ "lyapunov": null,
+ "grad_norm": 0.7733144016514287,
+ "grad_max_sv": 0.31536148227751254,
+ "grad_min_sv": 1.3926250694989983e-08,
+ "grad_condition": 138817686.6846688,
+ "lr": 0.0007679133974894982,
+ "time_sec": 32.562721490859985
+ },
+ {
+ "epoch": 49,
+ "train_loss": 0.8223947568511963,
+ "train_acc": 0.74656,
+ "test_loss": 2.268610196495056,
+ "test_acc": 0.509,
+ "lyapunov": null,
+ "grad_norm": 0.7708191932209156,
+ "grad_max_sv": 0.3082855362445116,
+ "grad_min_sv": 1.424878183428624e-08,
+ "grad_condition": 48064293.176824205,
+ "lr": 0.000759013504686565,
+ "time_sec": 32.59068489074707
+ },
+ {
+ "epoch": 50,
+ "train_loss": 0.8102355616569519,
+ "train_acc": 0.75154,
+ "test_loss": 2.303807855987549,
+ "test_acc": 0.5172,
+ "lyapunov": null,
+ "grad_norm": 0.7678857639968419,
+ "grad_max_sv": 0.30606309957802297,
+ "grad_min_sv": 1.401376939977328e-08,
+ "grad_condition": 66554378.026006415,
+ "lr": 0.0007499999999999998,
+ "time_sec": 32.61594772338867
+ },
+ {
+ "epoch": 51,
+ "train_loss": 0.7894559608268737,
+ "train_acc": 0.75788,
+ "test_loss": 2.3806381210327148,
+ "test_acc": 0.5067,
+ "lyapunov": null,
+ "grad_norm": 0.7578995070890107,
+ "grad_max_sv": 0.2958958923816681,
+ "grad_min_sv": 1.3479759735507413e-08,
+ "grad_condition": 59071539.288179755,
+ "lr": 0.0007408768370508575,
+ "time_sec": 32.58355736732483
+ },
+ {
+ "epoch": 52,
+ "train_loss": 0.7807610025405883,
+ "train_acc": 0.7587,
+ "test_loss": 2.335085013961792,
+ "test_acc": 0.5175,
+ "lyapunov": null,
+ "grad_norm": 0.7536291786486181,
+ "grad_max_sv": 0.3058082439005375,
+ "grad_min_sv": 1.4062500508851828e-08,
+ "grad_condition": 89488373.11429313,
+ "lr": 0.0007316480175599307,
+ "time_sec": 32.58504581451416
+ },
+ {
+ "epoch": 53,
+ "train_loss": 0.7639712882995605,
+ "train_acc": 0.76632,
+ "test_loss": 2.2413758136749267,
+ "test_acc": 0.529,
+ "lyapunov": null,
+ "grad_norm": 0.7437671807956605,
+ "grad_max_sv": 0.2986128095537424,
+ "grad_min_sv": 1.3716437835195604e-08,
+ "grad_condition": 153765004.26652625,
+ "lr": 0.0007223175895924635,
+ "time_sec": 32.599562883377075
+ },
+ {
+ "epoch": 54,
+ "train_loss": 0.7342572978401184,
+ "train_acc": 0.77172,
+ "test_loss": 2.3813604881286623,
+ "test_acc": 0.5211,
+ "lyapunov": null,
+ "grad_norm": 0.7415334115465683,
+ "grad_max_sv": 0.2952877823263407,
+ "grad_min_sv": 1.3237078199702934e-08,
+ "grad_condition": 158912190.85988137,
+ "lr": 0.0007128896457825361,
+ "time_sec": 32.58093762397766
+ },
+ {
+ "epoch": 55,
+ "train_loss": 0.7243311285591125,
+ "train_acc": 0.77394,
+ "test_loss": 2.5364841087341308,
+ "test_acc": 0.4919,
+ "lyapunov": null,
+ "grad_norm": 0.7336077653545635,
+ "grad_max_sv": 0.30250501483678816,
+ "grad_min_sv": 1.3610404020827915e-08,
+ "grad_condition": 80425531.55629282,
+ "lr": 0.0007033683215378998,
+ "time_sec": 32.64418268203735
+ },
+ {
+ "epoch": 56,
+ "train_loss": 0.7082911996078491,
+ "train_acc": 0.77956,
+ "test_loss": 2.494243837738037,
+ "test_acc": 0.5119,
+ "lyapunov": null,
+ "grad_norm": 0.7290174142670145,
+ "grad_max_sv": 0.2945553746074438,
+ "grad_min_sv": 1.3041360513894872e-08,
+ "grad_condition": 131633091.2577754,
+ "lr": 0.0006937577932260512,
+ "time_sec": 32.61989617347717
+ },
+ {
+ "epoch": 57,
+ "train_loss": 0.6861382236289978,
+ "train_acc": 0.7852,
+ "test_loss": 2.4704931076049803,
+ "test_acc": 0.518,
+ "lyapunov": null,
+ "grad_norm": 0.7189100733167055,
+ "grad_max_sv": 0.2928345203399658,
+ "grad_min_sv": 1.3202054537260477e-08,
+ "grad_condition": 122301802.04377504,
+ "lr": 0.0006840622763423388,
+ "time_sec": 32.601600885391235
+ },
+ {
+ "epoch": 58,
+ "train_loss": 0.6700656919956207,
+ "train_acc": 0.79076,
+ "test_loss": 2.505882039642334,
+ "test_acc": 0.5131,
+ "lyapunov": null,
+ "grad_norm": 0.7086978020515203,
+ "grad_max_sv": 0.28342925757169724,
+ "grad_min_sv": 1.2833174680912385e-08,
+ "grad_condition": 67698817.82937825,
+ "lr": 0.0006742860236609073,
+ "time_sec": 32.58192586898804
+ },
+ {
+ "epoch": 59,
+ "train_loss": 0.6577284108161926,
+ "train_acc": 0.79492,
+ "test_loss": 2.491006435775757,
+ "test_acc": 0.5155,
+ "lyapunov": null,
+ "grad_norm": 0.7069652566379913,
+ "grad_max_sv": 0.2849778015166521,
+ "grad_min_sv": 1.2662411319475097e-08,
+ "grad_condition": 54369902.95066987,
+ "lr": 0.0006644333233692913,
+ "time_sec": 32.601956605911255
+ },
+ {
+ "epoch": 60,
+ "train_loss": 0.6429468762397766,
+ "train_acc": 0.7985,
+ "test_loss": 2.4342385992050173,
+ "test_acc": 0.5281,
+ "lyapunov": null,
+ "grad_norm": 0.6950269523418225,
+ "grad_max_sv": 0.2759479142725468,
+ "grad_min_sv": 1.2526198570604087e-08,
+ "grad_condition": 1003668275.7453331,
+ "lr": 0.0006545084971874734,
+ "time_sec": 32.593979835510254
+ },
+ {
+ "epoch": 61,
+ "train_loss": 0.6316694467926025,
+ "train_acc": 0.80204,
+ "test_loss": 2.572236448669434,
+ "test_acc": 0.5228,
+ "lyapunov": null,
+ "grad_norm": 0.6953930381951806,
+ "grad_max_sv": 0.2823780722916126,
+ "grad_min_sv": 1.2607634538338957e-08,
+ "grad_condition": 910241325.2806966,
+ "lr": 0.0006445158984722354,
+ "time_sec": 32.63531136512756
+ },
+ {
+ "epoch": 62,
+ "train_loss": 0.6084016784477234,
+ "train_acc": 0.80756,
+ "test_loss": 2.528528450965881,
+ "test_acc": 0.5249,
+ "lyapunov": null,
+ "grad_norm": 0.6902039343361056,
+ "grad_max_sv": 0.2754691679030657,
+ "grad_min_sv": 1.2385301192095743e-08,
+ "grad_condition": 124171966.43343556,
+ "lr": 0.0006344599103076324,
+ "time_sec": 32.646347761154175
+ },
+ {
+ "epoch": 63,
+ "train_loss": 0.6006980142784119,
+ "train_acc": 0.81018,
+ "test_loss": 2.438706118583679,
+ "test_acc": 0.5266,
+ "lyapunov": null,
+ "grad_norm": 0.6822637884805373,
+ "grad_max_sv": 0.276136140525341,
+ "grad_min_sv": 1.2456568440621928e-08,
+ "grad_condition": 41258405.402897015,
+ "lr": 0.0006243449435824269,
+ "time_sec": 32.60796880722046
+ },
+ {
+ "epoch": 64,
+ "train_loss": 0.585920947380066,
+ "train_acc": 0.81566,
+ "test_loss": 2.505697784423828,
+ "test_acc": 0.5259,
+ "lyapunov": null,
+ "grad_norm": 0.6743129224923755,
+ "grad_max_sv": 0.26691033616662024,
+ "grad_min_sv": 1.2091218234630552e-08,
+ "grad_condition": 57195642.756296314,
+ "lr": 0.0006141754350553275,
+ "time_sec": 32.621875286102295
+ },
+ {
+ "epoch": 65,
+ "train_loss": 0.5716569157028198,
+ "train_acc": 0.81832,
+ "test_loss": 2.488600128173828,
+ "test_acc": 0.5221,
+ "lyapunov": null,
+ "grad_norm": 0.6747582168048405,
+ "grad_max_sv": 0.2778852738440037,
+ "grad_min_sv": 1.2316326589503767e-08,
+ "grad_condition": 66617009.51688242,
+ "lr": 0.0006039558454088793,
+ "time_sec": 32.58805871009827
+ },
+ {
+ "epoch": 66,
+ "train_loss": 0.5558187670326233,
+ "train_acc": 0.82442,
+ "test_loss": 2.455172736740112,
+ "test_acc": 0.5327,
+ "lyapunov": null,
+ "grad_norm": 0.6650651562580321,
+ "grad_max_sv": 0.27054035626351836,
+ "grad_min_sv": 1.1980440989180913e-08,
+ "grad_condition": 263553333.63889045,
+ "lr": 0.000593690657292862,
+ "time_sec": 32.61953616142273
+ },
+ {
+ "epoch": 67,
+ "train_loss": 0.5372648673820496,
+ "train_acc": 0.82802,
+ "test_loss": 2.5111166515350343,
+ "test_acc": 0.5259,
+ "lyapunov": null,
+ "grad_norm": 0.6598459109898526,
+ "grad_max_sv": 0.26995205879211426,
+ "grad_min_sv": 1.1711705713568498e-08,
+ "grad_condition": 40680262.666348636,
+ "lr": 0.0005833843733580507,
+ "time_sec": 32.596007108688354
+ },
+ {
+ "epoch": 68,
+ "train_loss": 0.529928300704956,
+ "train_acc": 0.83184,
+ "test_loss": 2.505376844024658,
+ "test_acc": 0.5324,
+ "lyapunov": null,
+ "grad_norm": 0.6554247710983278,
+ "grad_max_sv": 0.2640453014522791,
+ "grad_min_sv": 1.16465385096437e-08,
+ "grad_condition": 196611022.55457097,
+ "lr": 0.0005730415142812054,
+ "time_sec": 32.589977502822876
+ },
+ {
+ "epoch": 69,
+ "train_loss": 0.5270337955570221,
+ "train_acc": 0.83232,
+ "test_loss": 2.6256065521240233,
+ "test_acc": 0.5197,
+ "lyapunov": null,
+ "grad_norm": 0.6567252289857295,
+ "grad_max_sv": 0.2711860008537769,
+ "grad_min_sv": 1.1960956241034368e-08,
+ "grad_condition": 561898784.4199932,
+ "lr": 0.0005626666167821517,
+ "time_sec": 32.5863139629364
+ },
+ {
+ "epoch": 70,
+ "train_loss": 0.5109112097549439,
+ "train_acc": 0.8354,
+ "test_loss": 2.5708269050598145,
+ "test_acc": 0.5302,
+ "lyapunov": null,
+ "grad_norm": 0.646381173102848,
+ "grad_max_sv": 0.27013656310737133,
+ "grad_min_sv": 1.1766451666391648e-08,
+ "grad_condition": 259686356.85246676,
+ "lr": 0.0005522642316338265,
+ "time_sec": 32.601078033447266
+ },
+ {
+ "epoch": 71,
+ "train_loss": 0.49452698835372927,
+ "train_acc": 0.84226,
+ "test_loss": 2.5480498626708985,
+ "test_acc": 0.5341,
+ "lyapunov": null,
+ "grad_norm": 0.6360062848670928,
+ "grad_max_sv": 0.26699192114174364,
+ "grad_min_sv": 1.1295523278341807e-08,
+ "grad_condition": 5391854944.622183,
+ "lr": 0.0005418389216661573,
+ "time_sec": 32.60187101364136
+ },
+ {
+ "epoch": 72,
+ "train_loss": 0.48291658142089844,
+ "train_acc": 0.84586,
+ "test_loss": 2.659250145339966,
+ "test_acc": 0.5273,
+ "lyapunov": null,
+ "grad_norm": 0.6354901528331942,
+ "grad_max_sv": 0.26031049638986586,
+ "grad_min_sv": 1.1230092526043345e-08,
+ "grad_condition": 88239876.70399968,
+ "lr": 0.0005313952597646563,
+ "time_sec": 32.61269569396973
+ },
+ {
+ "epoch": 73,
+ "train_loss": 0.4778318354034424,
+ "train_acc": 0.8473,
+ "test_loss": 2.5874798002243042,
+ "test_acc": 0.5314,
+ "lyapunov": null,
+ "grad_norm": 0.6300098949086598,
+ "grad_max_sv": 0.26232460178434847,
+ "grad_min_sv": 1.134239846749957e-08,
+ "grad_condition": 105944680.31289935,
+ "lr": 0.0005209378268645994,
+ "time_sec": 32.613691091537476
+ },
+ {
+ "epoch": 74,
+ "train_loss": 0.46288997037887575,
+ "train_acc": 0.85288,
+ "test_loss": 2.5993505474090575,
+ "test_acc": 0.5337,
+ "lyapunov": null,
+ "grad_norm": 0.6215157272690962,
+ "grad_max_sv": 0.26828358359634874,
+ "grad_min_sv": 1.1235708100021391e-08,
+ "grad_condition": 41868662.72964181,
+ "lr": 0.0005104712099416781,
+ "time_sec": 32.61982536315918
+ },
+ {
+ "epoch": 75,
+ "train_loss": 0.45871317274093626,
+ "train_acc": 0.85266,
+ "test_loss": 2.6259676776885987,
+ "test_acc": 0.5345,
+ "lyapunov": null,
+ "grad_norm": 0.6170925610226076,
+ "grad_max_sv": 0.2573466833680868,
+ "grad_min_sv": 1.104757565784445e-08,
+ "grad_condition": 212140699.82071534,
+ "lr": 0.0004999999999999996,
+ "time_sec": 32.598039627075195
+ },
+ {
+ "epoch": 76,
+ "train_loss": 0.45109452469825745,
+ "train_acc": 0.85454,
+ "test_loss": 2.665439921569824,
+ "test_acc": 0.5303,
+ "lyapunov": null,
+ "grad_norm": 0.6161744946755234,
+ "grad_max_sv": 0.25873752422630786,
+ "grad_min_sv": 1.1002691283393782e-08,
+ "grad_condition": 1052469961.0162939,
+ "lr": 0.0004895287900583212,
+ "time_sec": 32.58305859565735
+ },
+ {
+ "epoch": 77,
+ "train_loss": 0.43257994356155394,
+ "train_acc": 0.86046,
+ "test_loss": 2.702251711654663,
+ "test_acc": 0.526,
+ "lyapunov": null,
+ "grad_norm": 0.607726688787837,
+ "grad_max_sv": 0.26136815659701823,
+ "grad_min_sv": 1.0734200759157653e-08,
+ "grad_condition": 189329156.27802238,
+ "lr": 0.0004790621731353997,
+ "time_sec": 32.59784960746765
+ },
+ {
+ "epoch": 78,
+ "train_loss": 0.41896025703430173,
+ "train_acc": 0.86472,
+ "test_loss": 2.671762952804565,
+ "test_acc": 0.5336,
+ "lyapunov": null,
+ "grad_norm": 0.5957655893318665,
+ "grad_max_sv": 0.2534705221652985,
+ "grad_min_sv": 1.0711852985699488e-08,
+ "grad_condition": 191261118.43217826,
+ "lr": 0.000468604740235343,
+ "time_sec": 32.62303113937378
+ },
+ {
+ "epoch": 79,
+ "train_loss": 0.40766072305679324,
+ "train_acc": 0.86786,
+ "test_loss": 2.584160025596619,
+ "test_acc": 0.5417,
+ "lyapunov": null,
+ "grad_norm": 0.5933439762516267,
+ "grad_max_sv": 0.2529820345342159,
+ "grad_min_sv": 1.1027942445340776e-08,
+ "grad_condition": 38680465.32555069,
+ "lr": 0.00045816107833384175,
+ "time_sec": 32.64057159423828
+ },
+ {
+ "epoch": 80,
+ "train_loss": 0.395585339012146,
+ "train_acc": 0.8719,
+ "test_loss": 2.6836016262054443,
+ "test_acc": 0.5338,
+ "lyapunov": null,
+ "grad_norm": 0.5915283577904045,
+ "grad_max_sv": 0.2511633686721325,
+ "grad_min_sv": 1.074133903124913e-08,
+ "grad_condition": 579600714.0219278,
+ "lr": 0.0004477357683661729,
+ "time_sec": 32.63526272773743
+ },
+ {
+ "epoch": 81,
+ "train_loss": 0.39450348417282105,
+ "train_acc": 0.87178,
+ "test_loss": 2.5824236192703247,
+ "test_acc": 0.5448,
+ "lyapunov": null,
+ "grad_norm": 0.5885071131780099,
+ "grad_max_sv": 0.25625271871685984,
+ "grad_min_sv": 1.0501880514518502e-08,
+ "grad_condition": 124784334.66343915,
+ "lr": 0.00043733338321784746,
+ "time_sec": 32.604066610336304
+ },
+ {
+ "epoch": 82,
+ "train_loss": 0.3872408880805969,
+ "train_acc": 0.87422,
+ "test_loss": 2.6602687486648557,
+ "test_acc": 0.5352,
+ "lyapunov": null,
+ "grad_norm": 0.5833408041873426,
+ "grad_max_sv": 0.2544650699943304,
+ "grad_min_sv": 1.0623962720494873e-08,
+ "grad_condition": 134511278.94006854,
+ "lr": 0.0004269584857187939,
+ "time_sec": 32.63341236114502
+ },
+ {
+ "epoch": 83,
+ "train_loss": 0.3692175518798828,
+ "train_acc": 0.8823,
+ "test_loss": 2.6812981620788574,
+ "test_acc": 0.5354,
+ "lyapunov": null,
+ "grad_norm": 0.571242006609448,
+ "grad_max_sv": 0.2509057328104973,
+ "grad_min_sv": 1.0469137029164855e-08,
+ "grad_condition": 133735555.98911181,
+ "lr": 0.0004166156266419484,
+ "time_sec": 32.600364685058594
+ },
+ {
+ "epoch": 84,
+ "train_loss": 0.36960686668396,
+ "train_acc": 0.8806,
+ "test_loss": 2.6419603324890137,
+ "test_acc": 0.5453,
+ "lyapunov": null,
+ "grad_norm": 0.5733982210439359,
+ "grad_max_sv": 0.25141631327569486,
+ "grad_min_sv": 1.0406415923511908e-08,
+ "grad_condition": 126933629.16775417,
+ "lr": 0.0004063093427071373,
+ "time_sec": 32.60528612136841
+ },
+ {
+ "epoch": 85,
+ "train_loss": 0.3596297464942932,
+ "train_acc": 0.88366,
+ "test_loss": 2.716620068740845,
+ "test_acc": 0.5395,
+ "lyapunov": null,
+ "grad_norm": 0.5676461114412606,
+ "grad_max_sv": 0.24900777079164982,
+ "grad_min_sv": 1.0182381811286654e-08,
+ "grad_condition": 508099869.8504903,
+ "lr": 0.0003960441545911199,
+ "time_sec": 32.61734056472778
+ },
+ {
+ "epoch": 86,
+ "train_loss": 0.3471255212688446,
+ "train_acc": 0.88682,
+ "test_loss": 2.6910045627593995,
+ "test_acc": 0.5395,
+ "lyapunov": null,
+ "grad_norm": 0.5548265984779118,
+ "grad_max_sv": 0.23751378245651722,
+ "grad_min_sv": 9.806933828904186e-09,
+ "grad_condition": 127564160.08711353,
+ "lr": 0.0003858245649446718,
+ "time_sec": 32.59777784347534
+ },
+ {
+ "epoch": 87,
+ "train_loss": 0.3406936288833618,
+ "train_acc": 0.8891,
+ "test_loss": 2.744849885940552,
+ "test_acc": 0.5429,
+ "lyapunov": null,
+ "grad_norm": 0.5555218429462011,
+ "grad_max_sv": 0.2389649160206318,
+ "grad_min_sv": 9.80964975061914e-09,
+ "grad_condition": 889623886.9749553,
+ "lr": 0.00037565505641757235,
+ "time_sec": 32.603169679641724
+ },
+ {
+ "epoch": 88,
+ "train_loss": 0.332358439912796,
+ "train_acc": 0.89152,
+ "test_loss": 2.7001221378326417,
+ "test_acc": 0.5481,
+ "lyapunov": null,
+ "grad_norm": 0.550628932039783,
+ "grad_max_sv": 0.24251497723162174,
+ "grad_min_sv": 9.773675100493983e-09,
+ "grad_condition": 85698012.51102474,
+ "lr": 0.00036554008969236695,
+ "time_sec": 32.60269355773926
+ },
+ {
+ "epoch": 89,
+ "train_loss": 0.31770461375236514,
+ "train_acc": 0.89674,
+ "test_loss": 2.826695262527466,
+ "test_acc": 0.5359,
+ "lyapunov": null,
+ "grad_norm": 0.5452633910908743,
+ "grad_max_sv": 0.2457874234765768,
+ "grad_min_sv": 1.0011228396625271e-08,
+ "grad_condition": 115516500.1980664,
+ "lr": 0.0003554841015277638,
+ "time_sec": 32.615172147750854
+ },
+ {
+ "epoch": 90,
+ "train_loss": 0.3198126357555389,
+ "train_acc": 0.89686,
+ "test_loss": 2.761284243011475,
+ "test_acc": 0.5383,
+ "lyapunov": null,
+ "grad_norm": 0.5420260505535877,
+ "grad_max_sv": 0.2379120856523514,
+ "grad_min_sv": 9.806707615064857e-09,
+ "grad_condition": 292496720.3714178,
+ "lr": 0.000345491502812526,
+ "time_sec": 32.60730767250061
+ },
+ {
+ "epoch": 91,
+ "train_loss": 0.31583098639965057,
+ "train_acc": 0.89624,
+ "test_loss": 2.798471709060669,
+ "test_acc": 0.5389,
+ "lyapunov": null,
+ "grad_norm": 0.541688273995152,
+ "grad_max_sv": 0.2411293275654316,
+ "grad_min_sv": 9.842002349441745e-09,
+ "grad_condition": 859517900.635659,
+ "lr": 0.0003355666766307081,
+ "time_sec": 32.59173631668091
+ },
+ {
+ "epoch": 92,
+ "train_loss": 0.30620651626586914,
+ "train_acc": 0.89982,
+ "test_loss": 2.8147284172058105,
+ "test_acc": 0.5372,
+ "lyapunov": null,
+ "grad_norm": 0.534845986324325,
+ "grad_max_sv": 0.2446113031357527,
+ "grad_min_sv": 9.80392773058253e-09,
+ "grad_condition": 318006434.8637026,
+ "lr": 0.00032571397633909225,
+ "time_sec": 32.625818729400635
+ },
+ {
+ "epoch": 93,
+ "train_loss": 0.2942564325428009,
+ "train_acc": 0.9027,
+ "test_loss": 2.7974524646759034,
+ "test_acc": 0.5458,
+ "lyapunov": null,
+ "grad_norm": 0.5258623807030809,
+ "grad_max_sv": 0.23323353454470636,
+ "grad_min_sv": 9.338492477830445e-09,
+ "grad_condition": 179043441.62085792,
+ "lr": 0.00031593772365766094,
+ "time_sec": 32.64636468887329
+ },
+ {
+ "epoch": 94,
+ "train_loss": 0.29325305396080015,
+ "train_acc": 0.90696,
+ "test_loss": 2.7924257678985596,
+ "test_acc": 0.5399,
+ "lyapunov": null,
+ "grad_norm": 0.5223436049599501,
+ "grad_max_sv": 0.23972665779292585,
+ "grad_min_sv": 9.572742014005153e-09,
+ "grad_condition": 829147220.8115915,
+ "lr": 0.0003062422067739483,
+ "time_sec": 32.63534426689148
+ },
+ {
+ "epoch": 95,
+ "train_loss": 0.2819689624214172,
+ "train_acc": 0.90976,
+ "test_loss": 2.925028160858154,
+ "test_acc": 0.5349,
+ "lyapunov": null,
+ "grad_norm": 0.5142202374019095,
+ "grad_max_sv": 0.2272823579609394,
+ "grad_min_sv": 9.26979293529133e-09,
+ "grad_condition": 746493228.5809206,
+ "lr": 0.00029663167846209965,
+ "time_sec": 32.632474184036255
+ },
+ {
+ "epoch": 96,
+ "train_loss": 0.2815214267730713,
+ "train_acc": 0.90818,
+ "test_loss": 2.834438822937012,
+ "test_acc": 0.5361,
+ "lyapunov": null,
+ "grad_norm": 0.5120345521537165,
+ "grad_max_sv": 0.23016531057655812,
+ "grad_min_sv": 9.260385527062182e-09,
+ "grad_condition": 233123428.8839547,
+ "lr": 0.00028711035421746345,
+ "time_sec": 32.61351776123047
+ },
+ {
+ "epoch": 97,
+ "train_loss": 0.2686532742404938,
+ "train_acc": 0.91288,
+ "test_loss": 2.7868608379364015,
+ "test_acc": 0.5454,
+ "lyapunov": null,
+ "grad_norm": 0.50888083523268,
+ "grad_max_sv": 0.23386715427041055,
+ "grad_min_sv": 9.24353042355136e-09,
+ "grad_condition": 480824699.4459009,
+ "lr": 0.00027768241040753615,
+ "time_sec": 32.597689628601074
+ },
+ {
+ "epoch": 98,
+ "train_loss": 0.26857261137008664,
+ "train_acc": 0.9114,
+ "test_loss": 2.8518635543823243,
+ "test_acc": 0.5437,
+ "lyapunov": null,
+ "grad_norm": 0.5090536597227022,
+ "grad_max_sv": 0.22117703258991242,
+ "grad_min_sv": 8.954814682826662e-09,
+ "grad_condition": 523046386.34619534,
+ "lr": 0.00026835198244006903,
+ "time_sec": 32.608073472976685
+ },
+ {
+ "epoch": 99,
+ "train_loss": 0.25366373962402344,
+ "train_acc": 0.91882,
+ "test_loss": 2.8721565658569337,
+ "test_acc": 0.543,
+ "lyapunov": null,
+ "grad_norm": 0.49238261306821557,
+ "grad_max_sv": 0.2156506847590208,
+ "grad_min_sv": 8.781873435826509e-09,
+ "grad_condition": 904102693.0135263,
+ "lr": 0.0002591231629491421,
+ "time_sec": 32.61784863471985
+ },
+ {
+ "epoch": 100,
+ "train_loss": 0.24887621872901916,
+ "train_acc": 0.91974,
+ "test_loss": 2.921920951461792,
+ "test_acc": 0.5361,
+ "lyapunov": null,
+ "grad_norm": 0.4888254012066189,
+ "grad_max_sv": 0.2262551225721836,
+ "grad_min_sv": 9.07711106217608e-09,
+ "grad_condition": 2378158119.157684,
+ "lr": 0.0002499999999999997,
+ "time_sec": 32.63064646720886
+ },
+ {
+ "epoch": 101,
+ "train_loss": 0.2486992248916626,
+ "train_acc": 0.92078,
+ "test_loss": 2.84906298789978,
+ "test_acc": 0.546,
+ "lyapunov": null,
+ "grad_norm": 0.49044990509199843,
+ "grad_max_sv": 0.2249086916446686,
+ "grad_min_sv": 8.942711630455583e-09,
+ "grad_condition": 368518315.458243,
+ "lr": 0.00024098649531343477,
+ "time_sec": 32.61569309234619
+ },
+ {
+ "epoch": 102,
+ "train_loss": 0.24084433520317078,
+ "train_acc": 0.92134,
+ "test_loss": 2.8644924999237062,
+ "test_acc": 0.5466,
+ "lyapunov": null,
+ "grad_norm": 0.4835634789382412,
+ "grad_max_sv": 0.22181024961173534,
+ "grad_min_sv": 8.71543736290746e-09,
+ "grad_condition": 729146084.7030591,
+ "lr": 0.0002320866025105016,
+ "time_sec": 32.61780500411987
+ },
+ {
+ "epoch": 103,
+ "train_loss": 0.23572091526031494,
+ "train_acc": 0.9245,
+ "test_loss": 2.8849633934020997,
+ "test_acc": 0.5462,
+ "lyapunov": null,
+ "grad_norm": 0.47616360717681877,
+ "grad_max_sv": 0.21196404211223124,
+ "grad_min_sv": 8.353945581216632e-09,
+ "grad_condition": 474656759.6437806,
+ "lr": 0.0002233042253783278,
+ "time_sec": 32.613890647888184
+ },
+ {
+ "epoch": 104,
+ "train_loss": 0.2249231512260437,
+ "train_acc": 0.92648,
+ "test_loss": 2.9231421543121336,
+ "test_acc": 0.5417,
+ "lyapunov": null,
+ "grad_norm": 0.47192872655679174,
+ "grad_max_sv": 0.214255590736866,
+ "grad_min_sv": 8.505988313570536e-09,
+ "grad_condition": 289197672.1924402,
+ "lr": 0.000214643216157784,
+ "time_sec": 32.601218938827515
+ },
+ {
+ "epoch": 105,
+ "train_loss": 0.22248219745159148,
+ "train_acc": 0.9281,
+ "test_loss": 2.9562902782440186,
+ "test_acc": 0.5427,
+ "lyapunov": null,
+ "grad_norm": 0.4698308403081668,
+ "grad_max_sv": 0.22572967931628227,
+ "grad_min_sv": 8.526192928743314e-09,
+ "grad_condition": 1450261253.9932175,
+ "lr": 0.00020610737385376332,
+ "time_sec": 32.612290382385254
+ },
+ {
+ "epoch": 106,
+ "train_loss": 0.21623054056167604,
+ "train_acc": 0.92962,
+ "test_loss": 2.908762315750122,
+ "test_acc": 0.5446,
+ "lyapunov": null,
+ "grad_norm": 0.46340711985172833,
+ "grad_max_sv": 0.21638907827436923,
+ "grad_min_sv": 8.416883249314638e-09,
+ "grad_condition": 255468039.70825052,
+ "lr": 0.00019770044256881242,
+ "time_sec": 32.612945318222046
+ },
+ {
+ "epoch": 107,
+ "train_loss": 0.21244655453205108,
+ "train_acc": 0.93246,
+ "test_loss": 2.974463511657715,
+ "test_acc": 0.5384,
+ "lyapunov": null,
+ "grad_norm": 0.4594548274355528,
+ "grad_max_sv": 0.22012278363108634,
+ "grad_min_sv": 8.49774636952922e-09,
+ "grad_condition": 2473361556.8977194,
+ "lr": 0.0001894261098608447,
+ "time_sec": 32.62226438522339
+ },
+ {
+ "epoch": 108,
+ "train_loss": 0.2094324759197235,
+ "train_acc": 0.93186,
+ "test_loss": 2.8919307563781738,
+ "test_acc": 0.5468,
+ "lyapunov": null,
+ "grad_norm": 0.4576154748028718,
+ "grad_max_sv": 0.2116704247891903,
+ "grad_min_sv": 8.391172841922153e-09,
+ "grad_condition": 466352424.25916034,
+ "lr": 0.000181288005125655,
+ "time_sec": 32.6186683177948
+ },
+ {
+ "epoch": 109,
+ "train_loss": 0.20401785006046294,
+ "train_acc": 0.93418,
+ "test_loss": 2.957660815048218,
+ "test_acc": 0.539,
+ "lyapunov": null,
+ "grad_norm": 0.4546298422322962,
+ "grad_max_sv": 0.21849206127226353,
+ "grad_min_sv": 8.682296616380203e-09,
+ "grad_condition": 191940882.5588118,
+ "lr": 0.0001732896980049473,
+ "time_sec": 32.628432273864746
+ },
+ {
+ "epoch": 110,
+ "train_loss": 0.20467783069610596,
+ "train_acc": 0.9347,
+ "test_loss": 2.958277463912964,
+ "test_acc": 0.5437,
+ "lyapunov": null,
+ "grad_norm": 0.4527691780730168,
+ "grad_max_sv": 0.20565569326281546,
+ "grad_min_sv": 8.186116849185146e-09,
+ "grad_condition": 362737702.71097183,
+ "lr": 0.00016543469682057076,
+ "time_sec": 32.61425018310547
+ },
+ {
+ "epoch": 111,
+ "train_loss": 0.1963657117843628,
+ "train_acc": 0.93738,
+ "test_loss": 2.912566703796387,
+ "test_acc": 0.5453,
+ "lyapunov": null,
+ "grad_norm": 0.4442740357567778,
+ "grad_max_sv": 0.20528529062867165,
+ "grad_min_sv": 7.897949131502324e-09,
+ "grad_condition": 332879126.46642524,
+ "lr": 0.00015772644703565552,
+ "time_sec": 32.640437841415405
+ },
+ {
+ "epoch": 112,
+ "train_loss": 0.19529674465417862,
+ "train_acc": 0.93706,
+ "test_loss": 2.9921934005737305,
+ "test_acc": 0.5439,
+ "lyapunov": null,
+ "grad_norm": 0.4472859282028686,
+ "grad_max_sv": 0.21485005132853985,
+ "grad_min_sv": 8.123189853593854e-09,
+ "grad_condition": 1264491045.958951,
+ "lr": 0.00015016832974331713,
+ "time_sec": 32.62719178199768
+ },
+ {
+ "epoch": 113,
+ "train_loss": 0.19033806517124177,
+ "train_acc": 0.93864,
+ "test_loss": 2.982124820327759,
+ "test_acc": 0.5437,
+ "lyapunov": null,
+ "grad_norm": 0.44136667096649934,
+ "grad_max_sv": 0.21058676335960627,
+ "grad_min_sv": 8.165891918036905e-09,
+ "grad_condition": 312331837.29792935,
+ "lr": 0.00014276366018359834,
+ "time_sec": 32.62637948989868
+ },
+ {
+ "epoch": 114,
+ "train_loss": 0.1861744700717926,
+ "train_acc": 0.9415,
+ "test_loss": 2.9888067501068116,
+ "test_acc": 0.5439,
+ "lyapunov": null,
+ "grad_norm": 0.4352864374741274,
+ "grad_max_sv": 0.20403808429837228,
+ "grad_min_sv": 7.826812852777115e-09,
+ "grad_condition": 157749511.7241363,
+ "lr": 0.00013551568628929425,
+ "time_sec": 32.61394190788269
+ },
+ {
+ "epoch": 115,
+ "train_loss": 0.17919604228019714,
+ "train_acc": 0.94228,
+ "test_loss": 2.9267702087402343,
+ "test_acc": 0.5533,
+ "lyapunov": null,
+ "grad_norm": 0.4303078691865104,
+ "grad_max_sv": 0.21317217014729978,
+ "grad_min_sv": 7.932376714335499e-09,
+ "grad_condition": 130563128.16561177,
+ "lr": 0.00012842758726130276,
+ "time_sec": 32.59867215156555
+ },
+ {
+ "epoch": 116,
+ "train_loss": 0.1819922329044342,
+ "train_acc": 0.9421,
+ "test_loss": 2.9711815841674807,
+ "test_acc": 0.5465,
+ "lyapunov": null,
+ "grad_norm": 0.43180962461173705,
+ "grad_max_sv": 0.22204699292778968,
+ "grad_min_sv": 8.152687410540802e-09,
+ "grad_condition": 465179275.152493,
+ "lr": 0.0001215024721741218,
+ "time_sec": 32.63067364692688
+ },
+ {
+ "epoch": 117,
+ "train_loss": 0.1775187094783783,
+ "train_acc": 0.94306,
+ "test_loss": 2.9692884788513183,
+ "test_acc": 0.5485,
+ "lyapunov": null,
+ "grad_norm": 0.42535422696695824,
+ "grad_max_sv": 0.20696271434426308,
+ "grad_min_sv": 7.841850190731802e-09,
+ "grad_condition": 340204799.15066475,
+ "lr": 0.00011474337861210538,
+ "time_sec": 32.682225465774536
+ },
+ {
+ "epoch": 118,
+ "train_loss": 0.1782768397474289,
+ "train_acc": 0.94228,
+ "test_loss": 2.9190274017333984,
+ "test_acc": 0.5529,
+ "lyapunov": null,
+ "grad_norm": 0.4288690474100953,
+ "grad_max_sv": 0.20459303073585033,
+ "grad_min_sv": 7.852907129212925e-09,
+ "grad_condition": 413565999.92345744,
+ "lr": 0.00010815327133708009,
+ "time_sec": 32.6104941368103
+ },
+ {
+ "epoch": 119,
+ "train_loss": 0.17245361244678498,
+ "train_acc": 0.94452,
+ "test_loss": 2.9115855850219727,
+ "test_acc": 0.5518,
+ "lyapunov": null,
+ "grad_norm": 0.42115534183071457,
+ "grad_max_sv": 0.20364198610186576,
+ "grad_min_sv": 7.842290997188895e-09,
+ "grad_condition": 4300198879.021836,
+ "lr": 0.00010173504098790182,
+ "time_sec": 32.599159479141235
+ },
+ {
+ "epoch": 120,
+ "train_loss": 0.16841998175621034,
+ "train_acc": 0.9465,
+ "test_loss": 2.9750044021606445,
+ "test_acc": 0.5509,
+ "lyapunov": null,
+ "grad_norm": 0.4139970919760924,
+ "grad_max_sv": 0.21118448078632354,
+ "grad_min_sv": 7.870022611139622e-09,
+ "grad_condition": 588234398.5889165,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 32.60773468017578
+ },
+ {
+ "epoch": 121,
+ "train_loss": 0.1674146131658554,
+ "train_acc": 0.94722,
+ "test_loss": 3.043567562866211,
+ "test_acc": 0.5401,
+ "lyapunov": null,
+ "grad_norm": 0.4140688259905283,
+ "grad_max_sv": 0.19524961337447166,
+ "grad_min_sv": 7.740067117572789e-09,
+ "grad_condition": 294042234.42343616,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 32.605161905288696
+ },
+ {
+ "epoch": 122,
+ "train_loss": 0.16243593076705934,
+ "train_acc": 0.94846,
+ "test_loss": 2.929161159515381,
+ "test_acc": 0.5544,
+ "lyapunov": null,
+ "grad_norm": 0.4069435316400916,
+ "grad_max_sv": 0.1928358545526862,
+ "grad_min_sv": 7.721300553786966e-09,
+ "grad_condition": 1492464032.2227066,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 32.641791105270386
+ },
+ {
+ "epoch": 123,
+ "train_loss": 0.1584806259393692,
+ "train_acc": 0.94938,
+ "test_loss": 3.1013183868408203,
+ "test_acc": 0.5441,
+ "lyapunov": null,
+ "grad_norm": 0.4074794428211969,
+ "grad_max_sv": 0.19953589588403703,
+ "grad_min_sv": 7.50950879795792e-09,
+ "grad_condition": 963926565.1466379,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 32.63674283027649
+ },
+ {
+ "epoch": 124,
+ "train_loss": 0.15840048369407653,
+ "train_acc": 0.9494,
+ "test_loss": 3.02653837890625,
+ "test_acc": 0.5519,
+ "lyapunov": null,
+ "grad_norm": 0.4076422491058348,
+ "grad_max_sv": 0.2066960282623768,
+ "grad_min_sv": 7.477964763082447e-09,
+ "grad_condition": 442993334.53740203,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 32.61531352996826
+ },
+ {
+ "epoch": 125,
+ "train_loss": 0.15796427134990693,
+ "train_acc": 0.9492,
+ "test_loss": 3.0291555103302,
+ "test_acc": 0.547,
+ "lyapunov": null,
+ "grad_norm": 0.4074327913561712,
+ "grad_max_sv": 0.20506599061191083,
+ "grad_min_sv": 7.742264148888345e-09,
+ "grad_condition": 174320401.78922492,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 32.616377115249634
+ },
+ {
+ "epoch": 126,
+ "train_loss": 0.15587055792808532,
+ "train_acc": 0.94994,
+ "test_loss": 3.0593951934814454,
+ "test_acc": 0.5475,
+ "lyapunov": null,
+ "grad_norm": 0.40499205379602254,
+ "grad_max_sv": 0.20328918769955634,
+ "grad_min_sv": 7.676706426616719e-09,
+ "grad_condition": 1609865519.3051925,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 32.61218738555908
+ },
+ {
+ "epoch": 127,
+ "train_loss": 0.1515829546546936,
+ "train_acc": 0.95164,
+ "test_loss": 2.997521667098999,
+ "test_acc": 0.5527,
+ "lyapunov": null,
+ "grad_norm": 0.3980720784578974,
+ "grad_max_sv": 0.20609603635966778,
+ "grad_min_sv": 7.607568789811877e-09,
+ "grad_condition": 467148050.5049923,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 32.59871435165405
+ },
+ {
+ "epoch": 128,
+ "train_loss": 0.15070208614826203,
+ "train_acc": 0.95202,
+ "test_loss": 2.989130591583252,
+ "test_acc": 0.5478,
+ "lyapunov": null,
+ "grad_norm": 0.4001034661246295,
+ "grad_max_sv": 0.1990298792719841,
+ "grad_min_sv": 7.700730269807106e-09,
+ "grad_condition": 1087373342.1502237,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 32.64661478996277
+ },
+ {
+ "epoch": 129,
+ "train_loss": 0.1532275314569473,
+ "train_acc": 0.95156,
+ "test_loss": 3.076161633300781,
+ "test_acc": 0.5428,
+ "lyapunov": null,
+ "grad_norm": 0.39710317166706477,
+ "grad_max_sv": 0.2050964504480362,
+ "grad_min_sv": 7.753612097250589e-09,
+ "grad_condition": 177848968.01384813,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 32.619911193847656
+ },
+ {
+ "epoch": 130,
+ "train_loss": 0.14840273664474488,
+ "train_acc": 0.95386,
+ "test_loss": 3.0291847702026367,
+ "test_acc": 0.5514,
+ "lyapunov": null,
+ "grad_norm": 0.3943339950090642,
+ "grad_max_sv": 0.20189184583723546,
+ "grad_min_sv": 7.418064280288045e-09,
+ "grad_condition": 225551543.43719563,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 32.61198544502258
+ },
+ {
+ "epoch": 131,
+ "train_loss": 0.1431949885225296,
+ "train_acc": 0.95528,
+ "test_loss": 3.027348929977417,
+ "test_acc": 0.5507,
+ "lyapunov": null,
+ "grad_norm": 0.38711994826678314,
+ "grad_max_sv": 0.19673722572624683,
+ "grad_min_sv": 7.518409088564434e-09,
+ "grad_condition": 1146835061.4670472,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 32.61335587501526
+ },
+ {
+ "epoch": 132,
+ "train_loss": 0.1487313818216324,
+ "train_acc": 0.95322,
+ "test_loss": 3.0886004333496095,
+ "test_acc": 0.5461,
+ "lyapunov": null,
+ "grad_norm": 0.395507713545241,
+ "grad_max_sv": 0.20544077269732952,
+ "grad_min_sv": 7.573043920433565e-09,
+ "grad_condition": 168877391.5952191,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 32.5999391078949
+ },
+ {
+ "epoch": 133,
+ "train_loss": 0.14615771746635436,
+ "train_acc": 0.95264,
+ "test_loss": 3.000204067611694,
+ "test_acc": 0.5534,
+ "lyapunov": null,
+ "grad_norm": 0.3932909447553781,
+ "grad_max_sv": 0.18928411398082973,
+ "grad_min_sv": 7.371471794906034e-09,
+ "grad_condition": 362753839.3369804,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 32.6199426651001
+ },
+ {
+ "epoch": 134,
+ "train_loss": 0.14433889319181442,
+ "train_acc": 0.95458,
+ "test_loss": 3.007744090270996,
+ "test_acc": 0.5535,
+ "lyapunov": null,
+ "grad_norm": 0.38729299837720393,
+ "grad_max_sv": 0.1966633189469576,
+ "grad_min_sv": 7.389140074115508e-09,
+ "grad_condition": 474683811.0722334,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 32.66906452178955
+ },
+ {
+ "epoch": 135,
+ "train_loss": 0.14040502546787262,
+ "train_acc": 0.95526,
+ "test_loss": 2.9782509716033934,
+ "test_acc": 0.5519,
+ "lyapunov": null,
+ "grad_norm": 0.3837181152764762,
+ "grad_max_sv": 0.19970894865691663,
+ "grad_min_sv": 7.428829410741772e-09,
+ "grad_condition": 568455087.6695989,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 32.612287521362305
+ },
+ {
+ "epoch": 136,
+ "train_loss": 0.14493111051797866,
+ "train_acc": 0.95468,
+ "test_loss": 3.0520059284210204,
+ "test_acc": 0.5481,
+ "lyapunov": null,
+ "grad_norm": 0.39055918813288093,
+ "grad_max_sv": 0.20612289309501647,
+ "grad_min_sv": 7.689209627608634e-09,
+ "grad_condition": 670288720.96072,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 32.61230111122131
+ },
+ {
+ "epoch": 137,
+ "train_loss": 0.1412872414493561,
+ "train_acc": 0.95532,
+ "test_loss": 2.9926007400512695,
+ "test_acc": 0.5538,
+ "lyapunov": null,
+ "grad_norm": 0.3847438191608403,
+ "grad_max_sv": 0.1935590598732233,
+ "grad_min_sv": 7.3988825210688506e-09,
+ "grad_condition": 818122774.676174,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 32.63673734664917
+ },
+ {
+ "epoch": 138,
+ "train_loss": 0.1368464488697052,
+ "train_acc": 0.95786,
+ "test_loss": 3.0026862827301026,
+ "test_acc": 0.5541,
+ "lyapunov": null,
+ "grad_norm": 0.3793276651282968,
+ "grad_max_sv": 0.2012945655733347,
+ "grad_min_sv": 7.351351802645234e-09,
+ "grad_condition": 363599415.4796465,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 32.59603404998779
+ },
+ {
+ "epoch": 139,
+ "train_loss": 0.1389853618478775,
+ "train_acc": 0.95644,
+ "test_loss": 3.04127444152832,
+ "test_acc": 0.5497,
+ "lyapunov": null,
+ "grad_norm": 0.38369680042825305,
+ "grad_max_sv": 0.1901318434625864,
+ "grad_min_sv": 7.190909153147098e-09,
+ "grad_condition": 1063192542.6047398,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 32.623175382614136
+ },
+ {
+ "epoch": 140,
+ "train_loss": 0.13792312327384948,
+ "train_acc": 0.95614,
+ "test_loss": 3.004412171936035,
+ "test_acc": 0.5534,
+ "lyapunov": null,
+ "grad_norm": 0.37904522036307264,
+ "grad_max_sv": 0.19201667234301567,
+ "grad_min_sv": 7.376605424202435e-09,
+ "grad_condition": 1234012097.4190845,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 32.630115270614624
+ },
+ {
+ "epoch": 141,
+ "train_loss": 0.1407741106414795,
+ "train_acc": 0.95654,
+ "test_loss": 3.0456832256317137,
+ "test_acc": 0.5511,
+ "lyapunov": null,
+ "grad_norm": 0.38330137862093777,
+ "grad_max_sv": 0.19592518154531718,
+ "grad_min_sv": 7.054394128222507e-09,
+ "grad_condition": 86708521.56413671,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 32.61585021018982
+ },
+ {
+ "epoch": 142,
+ "train_loss": 0.1388852431154251,
+ "train_acc": 0.95632,
+ "test_loss": 3.063602409744263,
+ "test_acc": 0.5478,
+ "lyapunov": null,
+ "grad_norm": 0.3828568546417417,
+ "grad_max_sv": 0.1969303483143449,
+ "grad_min_sv": 7.518555048707278e-09,
+ "grad_condition": 678890293.0423553,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 32.630441427230835
+ },
+ {
+ "epoch": 143,
+ "train_loss": 0.13581469515800476,
+ "train_acc": 0.9579,
+ "test_loss": 3.0148553092956543,
+ "test_acc": 0.5538,
+ "lyapunov": null,
+ "grad_norm": 0.37580622771801075,
+ "grad_max_sv": 0.18920586220920085,
+ "grad_min_sv": 7.312373946242665e-09,
+ "grad_condition": 360908520.84421337,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 32.64005398750305
+ },
+ {
+ "epoch": 144,
+ "train_loss": 0.1397603491592407,
+ "train_acc": 0.9547,
+ "test_loss": 3.017238700866699,
+ "test_acc": 0.5514,
+ "lyapunov": null,
+ "grad_norm": 0.3851319102923484,
+ "grad_max_sv": 0.19529533758759499,
+ "grad_min_sv": 7.18097194788922e-09,
+ "grad_condition": 274499937.83092636,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 32.60517716407776
+ },
+ {
+ "epoch": 145,
+ "train_loss": 0.13670911428451538,
+ "train_acc": 0.95648,
+ "test_loss": 3.0282860946655275,
+ "test_acc": 0.5508,
+ "lyapunov": null,
+ "grad_norm": 0.37783913784420287,
+ "grad_max_sv": 0.19311878457665443,
+ "grad_min_sv": 7.273629627901489e-09,
+ "grad_condition": 2161793817.455667,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 32.614171266555786
+ },
+ {
+ "epoch": 146,
+ "train_loss": 0.1391296845769882,
+ "train_acc": 0.95668,
+ "test_loss": 3.0094220054626466,
+ "test_acc": 0.5501,
+ "lyapunov": null,
+ "grad_norm": 0.37960085678866656,
+ "grad_max_sv": 0.18867351226508616,
+ "grad_min_sv": 7.0429120130072884e-09,
+ "grad_condition": 483257361.70673215,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 32.59815835952759
+ },
+ {
+ "epoch": 147,
+ "train_loss": 0.13715074803590774,
+ "train_acc": 0.95716,
+ "test_loss": 3.018283353805542,
+ "test_acc": 0.5494,
+ "lyapunov": null,
+ "grad_norm": 0.3750663523004214,
+ "grad_max_sv": 0.19733735918998718,
+ "grad_min_sv": 7.336720725349341e-09,
+ "grad_condition": 639022830.9873111,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 32.63532900810242
+ },
+ {
+ "epoch": 148,
+ "train_loss": 0.13438899482250213,
+ "train_acc": 0.95838,
+ "test_loss": 3.0480747367858885,
+ "test_acc": 0.5511,
+ "lyapunov": null,
+ "grad_norm": 0.374029090307932,
+ "grad_max_sv": 0.19485083129256964,
+ "grad_min_sv": 7.2787410602915756e-09,
+ "grad_condition": 1280998842.4402964,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 32.61666941642761
+ },
+ {
+ "epoch": 149,
+ "train_loss": 0.1355752257716656,
+ "train_acc": 0.95742,
+ "test_loss": 3.020583014678955,
+ "test_acc": 0.5479,
+ "lyapunov": null,
+ "grad_norm": 0.3742080999065961,
+ "grad_max_sv": 0.18681482430547475,
+ "grad_min_sv": 7.387960459213656e-09,
+ "grad_condition": 886872133.6824732,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 32.62542963027954
+ },
+ {
+ "epoch": 150,
+ "train_loss": 0.13964056191444396,
+ "train_acc": 0.95646,
+ "test_loss": 3.1249655624389647,
+ "test_acc": 0.5464,
+ "lyapunov": null,
+ "grad_norm": 0.3794352519997707,
+ "grad_max_sv": 0.2051174059510231,
+ "grad_min_sv": 7.552300875884155e-09,
+ "grad_condition": 4688136301.586805,
+ "lr": 0.0,
+ "time_sec": 32.61311602592468
+ }
+ ],
+ "12": [
+ {
+ "epoch": 1,
+ "train_loss": 4.857979267883301,
+ "train_acc": 0.03128,
+ "test_loss": 4.8280028671264645,
+ "test_acc": 0.0162,
+ "lyapunov": null,
+ "grad_norm": 5.914070912211268,
+ "grad_max_sv": 5.325387370586395,
+ "grad_min_sv": 9.769405192663893e-08,
+ "grad_condition": 1337497985.1511102,
+ "lr": 0.0009998903417374227,
+ "time_sec": 49.62461066246033
+ },
+ {
+ "epoch": 2,
+ "train_loss": 4.336386154098511,
+ "train_acc": 0.05714,
+ "test_loss": 4.968493894958496,
+ "test_acc": 0.0197,
+ "lyapunov": null,
+ "grad_norm": 4.4863167388537235,
+ "grad_max_sv": 3.9469796657562255,
+ "grad_min_sv": 7.601632206477583e-08,
+ "grad_condition": 129963899.4749479,
+ "lr": 0.0009995614150494292,
+ "time_sec": 49.636900901794434
+ },
+ {
+ "epoch": 3,
+ "train_loss": 4.062883013763428,
+ "train_acc": 0.08342,
+ "test_loss": 4.448897337341308,
+ "test_acc": 0.037,
+ "lyapunov": null,
+ "grad_norm": 3.6333047310988777,
+ "grad_max_sv": 3.0409141004085543,
+ "grad_min_sv": 6.369543137374478e-08,
+ "grad_condition": 59962043.95176021,
+ "lr": 0.0009990133642141358,
+ "time_sec": 49.63047957420349
+ },
+ {
+ "epoch": 4,
+ "train_loss": 3.8605975818634035,
+ "train_acc": 0.10722,
+ "test_loss": 4.516425963592529,
+ "test_acc": 0.0415,
+ "lyapunov": null,
+ "grad_norm": 3.020259734680317,
+ "grad_max_sv": 2.476314604282379,
+ "grad_min_sv": 5.230481114892882e-08,
+ "grad_condition": 51922675.56557977,
+ "lr": 0.0009982464296247522,
+ "time_sec": 49.61615824699402
+ },
+ {
+ "epoch": 5,
+ "train_loss": 3.6876567860412597,
+ "train_acc": 0.13404,
+ "test_loss": 4.7616854064941405,
+ "test_acc": 0.0373,
+ "lyapunov": null,
+ "grad_norm": 2.454606191256652,
+ "grad_max_sv": 1.8841783970594406,
+ "grad_min_sv": 4.2170166864030635e-08,
+ "grad_condition": 61784571.5567351,
+ "lr": 0.0009972609476841367,
+ "time_sec": 49.621190309524536
+ },
+ {
+ "epoch": 6,
+ "train_loss": 3.5600004296875,
+ "train_acc": 0.15464,
+ "test_loss": 4.541135731506348,
+ "test_acc": 0.0565,
+ "lyapunov": null,
+ "grad_norm": 2.047081522054368,
+ "grad_max_sv": 1.4700775474309922,
+ "grad_min_sv": 3.5812032206372636e-08,
+ "grad_condition": 47166242.58068286,
+ "lr": 0.000996057350657239,
+ "time_sec": 49.63187623023987
+ },
+ {
+ "epoch": 7,
+ "train_loss": 3.453279203033447,
+ "train_acc": 0.17224,
+ "test_loss": 4.9032746643066405,
+ "test_acc": 0.0512,
+ "lyapunov": null,
+ "grad_norm": 1.7128403586652834,
+ "grad_max_sv": 1.1189136162400246,
+ "grad_min_sv": 3.018336235394159e-08,
+ "grad_condition": 41920446.3053714,
+ "lr": 0.000994636166481494,
+ "time_sec": 49.60520005226135
+ },
+ {
+ "epoch": 8,
+ "train_loss": 3.36041114944458,
+ "train_acc": 0.1888,
+ "test_loss": 4.752816521453857,
+ "test_acc": 0.0648,
+ "lyapunov": null,
+ "grad_norm": 1.4850467477612923,
+ "grad_max_sv": 0.8669481813907624,
+ "grad_min_sv": 2.6475041869922223e-08,
+ "grad_condition": 37599938.73602452,
+ "lr": 0.0009929980185352525,
+ "time_sec": 49.618135929107666
+ },
+ {
+ "epoch": 9,
+ "train_loss": 3.286079960784912,
+ "train_acc": 0.20154,
+ "test_loss": 5.178885292053223,
+ "test_acc": 0.0623,
+ "lyapunov": null,
+ "grad_norm": 1.342261473440063,
+ "grad_max_sv": 0.7033843606710434,
+ "grad_min_sv": 2.384479090948577e-08,
+ "grad_condition": 141440858.58776602,
+ "lr": 0.0009911436253643444,
+ "time_sec": 49.62771654129028
+ },
+ {
+ "epoch": 10,
+ "train_loss": 3.2129677861022947,
+ "train_acc": 0.2144,
+ "test_loss": 5.0195522842407225,
+ "test_acc": 0.0622,
+ "lyapunov": null,
+ "grad_norm": 1.2503967032062735,
+ "grad_max_sv": 0.6261777065694332,
+ "grad_min_sv": 2.239258505704056e-08,
+ "grad_condition": 118005336.87045276,
+ "lr": 0.0009890738003669028,
+ "time_sec": 49.60965371131897
+ },
+ {
+ "epoch": 11,
+ "train_loss": 3.162713228683472,
+ "train_acc": 0.22544,
+ "test_loss": 4.962263533020019,
+ "test_acc": 0.0779,
+ "lyapunov": null,
+ "grad_norm": 1.1906728267056432,
+ "grad_max_sv": 0.5766806580126286,
+ "grad_min_sv": 2.144448115332098e-08,
+ "grad_condition": 68570214.69490463,
+ "lr": 0.00098678945143658,
+ "time_sec": 49.638447284698486
+ },
+ {
+ "epoch": 12,
+ "train_loss": 3.107430252532959,
+ "train_acc": 0.23672,
+ "test_loss": 5.273008836364746,
+ "test_acc": 0.0622,
+ "lyapunov": null,
+ "grad_norm": 1.1141405269120466,
+ "grad_max_sv": 0.5137097157537938,
+ "grad_min_sv": 2.047304612853851e-08,
+ "grad_condition": 58656857.58404706,
+ "lr": 0.0009842915805643154,
+ "time_sec": 49.64548635482788
+ },
+ {
+ "epoch": 13,
+ "train_loss": 3.054518303833008,
+ "train_acc": 0.24298,
+ "test_loss": 4.751382202148437,
+ "test_acc": 0.0805,
+ "lyapunov": null,
+ "grad_norm": 1.056334374659988,
+ "grad_max_sv": 0.4537819892168045,
+ "grad_min_sv": 1.9099582219961332e-08,
+ "grad_condition": 40473913.58753422,
+ "lr": 0.000981581283398829,
+ "time_sec": 49.62596035003662
+ },
+ {
+ "epoch": 14,
+ "train_loss": 3.0128901699066164,
+ "train_acc": 0.2535,
+ "test_loss": 5.3179588119506835,
+ "test_acc": 0.0894,
+ "lyapunov": null,
+ "grad_norm": 1.0060720335526403,
+ "grad_max_sv": 0.4221613615751266,
+ "grad_min_sv": 1.8469374840623944e-08,
+ "grad_condition": 27648316.070058893,
+ "lr": 0.0009786597487660333,
+ "time_sec": 49.63119626045227
+ },
+ {
+ "epoch": 15,
+ "train_loss": 2.9737020013427733,
+ "train_acc": 0.26082,
+ "test_loss": 6.165470205688477,
+ "test_acc": 0.0593,
+ "lyapunov": null,
+ "grad_norm": 0.9787012560859192,
+ "grad_max_sv": 0.39918764010071756,
+ "grad_min_sv": 1.789977660815456e-08,
+ "grad_condition": 32066062.312103875,
+ "lr": 0.0009755282581475766,
+ "time_sec": 49.61084794998169
+ },
+ {
+ "epoch": 16,
+ "train_loss": 2.9363278299713134,
+ "train_acc": 0.2678,
+ "test_loss": 7.10851273803711,
+ "test_acc": 0.0421,
+ "lyapunov": null,
+ "grad_norm": 0.9372246408127133,
+ "grad_max_sv": 0.38435717970132827,
+ "grad_min_sv": 1.733210386878348e-08,
+ "grad_condition": 24088715.267205216,
+ "lr": 0.0009721881851187403,
+ "time_sec": 49.61706733703613
+ },
+ {
+ "epoch": 17,
+ "train_loss": 2.911891692504883,
+ "train_acc": 0.27176,
+ "test_loss": 6.38866512298584,
+ "test_acc": 0.0601,
+ "lyapunov": null,
+ "grad_norm": 0.9126706344355823,
+ "grad_max_sv": 0.3579227849841118,
+ "grad_min_sv": 1.667584251102694e-08,
+ "grad_condition": 47679489.14127077,
+ "lr": 0.0009686409947459456,
+ "time_sec": 49.62139368057251
+ },
+ {
+ "epoch": 18,
+ "train_loss": 2.8810440801239015,
+ "train_acc": 0.2804,
+ "test_loss": 6.160967282104492,
+ "test_acc": 0.0718,
+ "lyapunov": null,
+ "grad_norm": 0.8853626149459919,
+ "grad_max_sv": 0.36028596982359884,
+ "grad_min_sv": 1.644115990712125e-08,
+ "grad_condition": 52172419.08719461,
+ "lr": 0.0009648882429441254,
+ "time_sec": 49.61437940597534
+ },
+ {
+ "epoch": 19,
+ "train_loss": 2.845276382827759,
+ "train_acc": 0.28578,
+ "test_loss": 5.377824464416504,
+ "test_acc": 0.0852,
+ "lyapunov": null,
+ "grad_norm": 0.859853543351059,
+ "grad_max_sv": 0.33440142646431925,
+ "grad_min_sv": 1.5989740054234146e-08,
+ "grad_condition": 23981566.09987827,
+ "lr": 0.00096093157579425,
+ "time_sec": 49.60141611099243
+ },
+ {
+ "epoch": 20,
+ "train_loss": 2.8133937200927734,
+ "train_acc": 0.29282,
+ "test_loss": 6.930623114013672,
+ "test_acc": 0.061,
+ "lyapunov": null,
+ "grad_norm": 0.8428428790749917,
+ "grad_max_sv": 0.3265179105103016,
+ "grad_min_sv": 1.569473392637466e-08,
+ "grad_condition": 52730874.60876007,
+ "lr": 0.0009567727288213001,
+ "time_sec": 49.62118935585022
+ },
+ {
+ "epoch": 21,
+ "train_loss": 2.792502545776367,
+ "train_acc": 0.29682,
+ "test_loss": 7.603221396636963,
+ "test_acc": 0.0601,
+ "lyapunov": null,
+ "grad_norm": 0.8301062641843454,
+ "grad_max_sv": 0.3209334272891283,
+ "grad_min_sv": 1.5400497213602372e-08,
+ "grad_condition": 32858821.905855753,
+ "lr": 0.0009524135262330095,
+ "time_sec": 49.61830496788025
+ },
+ {
+ "epoch": 22,
+ "train_loss": 2.763432760696411,
+ "train_acc": 0.30106,
+ "test_loss": 7.683717921447754,
+ "test_acc": 0.0632,
+ "lyapunov": null,
+ "grad_norm": 0.8155075807756811,
+ "grad_max_sv": 0.31464248038828374,
+ "grad_min_sv": 1.523456016894187e-08,
+ "grad_condition": 22807354.246203102,
+ "lr": 0.0009478558801197061,
+ "time_sec": 49.62720441818237
+ },
+ {
+ "epoch": 23,
+ "train_loss": 2.7460695344543455,
+ "train_acc": 0.3031,
+ "test_loss": 5.747795407867431,
+ "test_acc": 0.0819,
+ "lyapunov": null,
+ "grad_norm": 0.7966165231048401,
+ "grad_max_sv": 0.29990778900682924,
+ "grad_min_sv": 1.4812020640575519e-08,
+ "grad_condition": 26907900.924312055,
+ "lr": 0.000943101789615607,
+ "time_sec": 49.620564699172974
+ },
+ {
+ "epoch": 24,
+ "train_loss": 2.713617621231079,
+ "train_acc": 0.31124,
+ "test_loss": 6.716322633361816,
+ "test_acc": 0.08,
+ "lyapunov": null,
+ "grad_norm": 0.7863969132473815,
+ "grad_max_sv": 0.3049128696322441,
+ "grad_min_sv": 1.4714444074304112e-08,
+ "grad_condition": 23621111.366144888,
+ "lr": 0.0009381533400219313,
+ "time_sec": 49.6185462474823
+ },
+ {
+ "epoch": 25,
+ "train_loss": 2.692608075027466,
+ "train_acc": 0.3135,
+ "test_loss": 6.315327671813965,
+ "test_acc": 0.0773,
+ "lyapunov": null,
+ "grad_norm": 0.7780809028085155,
+ "grad_max_sv": 0.28820848651230335,
+ "grad_min_sv": 1.4556970873158548e-08,
+ "grad_condition": 22925885.469558023,
+ "lr": 0.0009330127018922189,
+ "time_sec": 49.63029909133911
+ },
+ {
+ "epoch": 26,
+ "train_loss": 2.6578130314636232,
+ "train_acc": 0.32226,
+ "test_loss": 7.161731970214844,
+ "test_acc": 0.074,
+ "lyapunov": null,
+ "grad_norm": 0.7600241350813963,
+ "grad_max_sv": 0.27918743565678594,
+ "grad_min_sv": 1.41998530961418e-08,
+ "grad_condition": 24836498.868989673,
+ "lr": 0.000927682130080253,
+ "time_sec": 49.61888551712036
+ },
+ {
+ "epoch": 27,
+ "train_loss": 2.6360860138702393,
+ "train_acc": 0.3281,
+ "test_loss": 6.265446292114258,
+ "test_acc": 0.072,
+ "lyapunov": null,
+ "grad_norm": 0.7503860366874832,
+ "grad_max_sv": 0.27820607759058474,
+ "grad_min_sv": 1.403503115116056e-08,
+ "grad_condition": 43704568.438496746,
+ "lr": 0.0009221639627510072,
+ "time_sec": 49.6322455406189
+ },
+ {
+ "epoch": 28,
+ "train_loss": 2.621903458404541,
+ "train_acc": 0.33094,
+ "test_loss": 8.008352018737792,
+ "test_acc": 0.0635,
+ "lyapunov": null,
+ "grad_norm": 0.7411508249278186,
+ "grad_max_sv": 0.276602141186595,
+ "grad_min_sv": 1.3749510615473914e-08,
+ "grad_condition": 48846366.407403715,
+ "lr": 0.0009164606203550494,
+ "time_sec": 49.62464737892151
+ },
+ {
+ "epoch": 29,
+ "train_loss": 2.6009712726593017,
+ "train_acc": 0.33356,
+ "test_loss": 6.3420821472167965,
+ "test_acc": 0.0871,
+ "lyapunov": null,
+ "grad_norm": 0.7392237108014773,
+ "grad_max_sv": 0.2745568320155144,
+ "grad_min_sv": 1.3796570551283249e-08,
+ "grad_condition": 31273171.49927681,
+ "lr": 0.0009105746045668516,
+ "time_sec": 49.654367446899414
+ },
+ {
+ "epoch": 30,
+ "train_loss": 2.5890472722625733,
+ "train_acc": 0.33498,
+ "test_loss": 6.483042420959473,
+ "test_acc": 0.0746,
+ "lyapunov": null,
+ "grad_norm": 0.7254213710143503,
+ "grad_max_sv": 0.2663456965237856,
+ "grad_min_sv": 1.3537345176783955e-08,
+ "grad_condition": 33323808.90351194,
+ "lr": 0.0009045084971874733,
+ "time_sec": 49.62457275390625
+ },
+ {
+ "epoch": 31,
+ "train_loss": 2.5546424687194826,
+ "train_acc": 0.3411,
+ "test_loss": 5.880196138000488,
+ "test_acc": 0.0666,
+ "lyapunov": null,
+ "grad_norm": 0.7170650074645288,
+ "grad_max_sv": 0.2706871546804905,
+ "grad_min_sv": 1.3557976122346993e-08,
+ "grad_condition": 55625831.471463725,
+ "lr": 0.0008982649590120977,
+ "time_sec": 49.625417709350586
+ },
+ {
+ "epoch": 32,
+ "train_loss": 2.5356599130249022,
+ "train_acc": 0.3476,
+ "test_loss": 6.206172892761231,
+ "test_acc": 0.0935,
+ "lyapunov": null,
+ "grad_norm": 0.7148263297514528,
+ "grad_max_sv": 0.2631382804363966,
+ "grad_min_sv": 1.335368298993611e-08,
+ "grad_condition": 27919253.234171998,
+ "lr": 0.0008918467286629196,
+ "time_sec": 49.64267349243164
+ },
+ {
+ "epoch": 33,
+ "train_loss": 2.520495999908447,
+ "train_acc": 0.34764,
+ "test_loss": 6.414087007141113,
+ "test_acc": 0.0819,
+ "lyapunov": null,
+ "grad_norm": 0.7096693517368512,
+ "grad_max_sv": 0.2555254019796848,
+ "grad_min_sv": 1.326168482251866e-08,
+ "grad_condition": 30057889.81326326,
+ "lr": 0.0008852566213878943,
+ "time_sec": 49.633198976516724
+ },
+ {
+ "epoch": 34,
+ "train_loss": 2.4981268305206297,
+ "train_acc": 0.35368,
+ "test_loss": 7.161307034301758,
+ "test_acc": 0.0753,
+ "lyapunov": null,
+ "grad_norm": 0.6981273416861422,
+ "grad_max_sv": 0.25148845836520195,
+ "grad_min_sv": 1.3116743149965693e-08,
+ "grad_condition": 25097258.440184355,
+ "lr": 0.000878497527825878,
+ "time_sec": 49.629374980926514
+ },
+ {
+ "epoch": 35,
+ "train_loss": 2.4812187934875487,
+ "train_acc": 0.35656,
+ "test_loss": 6.375511972045898,
+ "test_acc": 0.0787,
+ "lyapunov": null,
+ "grad_norm": 0.693256631694674,
+ "grad_max_sv": 0.24989120960235595,
+ "grad_min_sv": 1.3051334765701306e-08,
+ "grad_condition": 22699406.58897232,
+ "lr": 0.000871572412738697,
+ "time_sec": 49.620848655700684
+ },
+ {
+ "epoch": 36,
+ "train_loss": 2.4649569733428955,
+ "train_acc": 0.3595,
+ "test_loss": 5.7549407691955565,
+ "test_acc": 0.1002,
+ "lyapunov": null,
+ "grad_norm": 0.6880223056040339,
+ "grad_max_sv": 0.2544675827026367,
+ "grad_min_sv": 1.2971388471672008e-08,
+ "grad_condition": 27090819.46416967,
+ "lr": 0.0008644843137107055,
+ "time_sec": 49.639307498931885
+ },
+ {
+ "epoch": 37,
+ "train_loss": 2.4404139349365233,
+ "train_acc": 0.36276,
+ "test_loss": 6.19379566192627,
+ "test_acc": 0.0843,
+ "lyapunov": null,
+ "grad_norm": 0.6915322266205055,
+ "grad_max_sv": 0.25557893700897694,
+ "grad_min_sv": 1.3099128221005785e-08,
+ "grad_condition": 22396412.415633548,
+ "lr": 0.0008572363398164014,
+ "time_sec": 49.65658497810364
+ },
+ {
+ "epoch": 38,
+ "train_loss": 2.4350104721832277,
+ "train_acc": 0.36944,
+ "test_loss": 6.483997691345214,
+ "test_acc": 0.0947,
+ "lyapunov": null,
+ "grad_norm": 0.6860817508888643,
+ "grad_max_sv": 0.24186794832348824,
+ "grad_min_sv": 1.2734190080188058e-08,
+ "grad_condition": 24245161.640245236,
+ "lr": 0.0008498316702566826,
+ "time_sec": 49.636590003967285
+ },
+ {
+ "epoch": 39,
+ "train_loss": 2.4035986038970947,
+ "train_acc": 0.37506,
+ "test_loss": 7.426128985595703,
+ "test_acc": 0.0633,
+ "lyapunov": null,
+ "grad_norm": 0.6768284631491337,
+ "grad_max_sv": 0.23978918939828872,
+ "grad_min_sv": 1.2544681339196617e-08,
+ "grad_condition": 58875883.49556484,
+ "lr": 0.0008422735529643442,
+ "time_sec": 49.6271595954895
+ },
+ {
+ "epoch": 40,
+ "train_loss": 2.396695173187256,
+ "train_acc": 0.37446,
+ "test_loss": 6.887982989501953,
+ "test_acc": 0.0659,
+ "lyapunov": null,
+ "grad_norm": 0.6758452994499082,
+ "grad_max_sv": 0.23218532651662827,
+ "grad_min_sv": 1.2284334864609559e-08,
+ "grad_condition": 27825244.741001748,
+ "lr": 0.0008345653031794289,
+ "time_sec": 49.6188850402832
+ },
+ {
+ "epoch": 41,
+ "train_loss": 2.3766202754211427,
+ "train_acc": 0.38084,
+ "test_loss": 7.051847720336914,
+ "test_acc": 0.061,
+ "lyapunov": null,
+ "grad_norm": 0.6727252530320494,
+ "grad_max_sv": 0.2428621307015419,
+ "grad_min_sv": 1.2773543862920622e-08,
+ "grad_condition": 27042190.577230137,
+ "lr": 0.0008267103019950526,
+ "time_sec": 49.63360857963562
+ },
+ {
+ "epoch": 42,
+ "train_loss": 2.3670169010925295,
+ "train_acc": 0.38192,
+ "test_loss": 6.82649090423584,
+ "test_acc": 0.0753,
+ "lyapunov": null,
+ "grad_norm": 0.6702600637325808,
+ "grad_max_sv": 0.23488462790846826,
+ "grad_min_sv": 1.2701740556564367e-08,
+ "grad_condition": 22978134.483096853,
+ "lr": 0.0008187119948743447,
+ "time_sec": 49.626428842544556
+ },
+ {
+ "epoch": 43,
+ "train_loss": 2.34640893951416,
+ "train_acc": 0.38418,
+ "test_loss": 7.456131955718994,
+ "test_acc": 0.0764,
+ "lyapunov": null,
+ "grad_norm": 0.6673821071425099,
+ "grad_max_sv": 0.2304955620318651,
+ "grad_min_sv": 1.2439765384453239e-08,
+ "grad_condition": 31820388.99010671,
+ "lr": 0.000810573890139155,
+ "time_sec": 49.62021851539612
+ },
+ {
+ "epoch": 44,
+ "train_loss": 2.3332527070617677,
+ "train_acc": 0.38834,
+ "test_loss": 6.233900453186036,
+ "test_acc": 0.0882,
+ "lyapunov": null,
+ "grad_norm": 0.6619434612787911,
+ "grad_max_sv": 0.23275020457804202,
+ "grad_min_sv": 1.2357255231576491e-08,
+ "grad_condition": 41092001.19472371,
+ "lr": 0.0008022995574311873,
+ "time_sec": 49.632553815841675
+ },
+ {
+ "epoch": 45,
+ "train_loss": 2.319253850402832,
+ "train_acc": 0.3902,
+ "test_loss": 7.539175698852539,
+ "test_acc": 0.0652,
+ "lyapunov": null,
+ "grad_norm": 0.6606380867238602,
+ "grad_max_sv": 0.2288034502416849,
+ "grad_min_sv": 1.234043749409608e-08,
+ "grad_condition": 23995474.740780547,
+ "lr": 0.0007938926261462363,
+ "time_sec": 49.638259410858154
+ },
+ {
+ "epoch": 46,
+ "train_loss": 2.308006600112915,
+ "train_acc": 0.39154,
+ "test_loss": 7.362489430999756,
+ "test_acc": 0.0558,
+ "lyapunov": null,
+ "grad_norm": 0.660045345704197,
+ "grad_max_sv": 0.2337587408721447,
+ "grad_min_sv": 1.2529785493875512e-08,
+ "grad_condition": 24243355.610875387,
+ "lr": 0.0007853567838422158,
+ "time_sec": 49.64337158203125
+ },
+ {
+ "epoch": 47,
+ "train_loss": 2.287512142944336,
+ "train_acc": 0.39698,
+ "test_loss": 7.659019016265869,
+ "test_acc": 0.0729,
+ "lyapunov": null,
+ "grad_norm": 0.6552491008893353,
+ "grad_max_sv": 0.2252129375934601,
+ "grad_min_sv": 1.2101228903660389e-08,
+ "grad_condition": 37944286.39668895,
+ "lr": 0.0007766957746216719,
+ "time_sec": 49.610002756118774
+ },
+ {
+ "epoch": 48,
+ "train_loss": 2.2750962590026855,
+ "train_acc": 0.39712,
+ "test_loss": 6.906008920288086,
+ "test_acc": 0.085,
+ "lyapunov": null,
+ "grad_norm": 0.6572787443040576,
+ "grad_max_sv": 0.23201882764697074,
+ "grad_min_sv": 1.233105519499178e-08,
+ "grad_condition": 27571588.322845332,
+ "lr": 0.0007679133974894982,
+ "time_sec": 49.65186142921448
+ },
+ {
+ "epoch": 49,
+ "train_loss": 2.2525532193756104,
+ "train_acc": 0.40456,
+ "test_loss": 7.617325218963623,
+ "test_acc": 0.074,
+ "lyapunov": null,
+ "grad_norm": 0.6492386918943517,
+ "grad_max_sv": 0.2307146478444338,
+ "grad_min_sv": 1.229703296403914e-08,
+ "grad_condition": 211540506.258676,
+ "lr": 0.000759013504686565,
+ "time_sec": 49.6446647644043
+ },
+ {
+ "epoch": 50,
+ "train_loss": 2.237634787826538,
+ "train_acc": 0.40684,
+ "test_loss": 6.678198162841797,
+ "test_acc": 0.0633,
+ "lyapunov": null,
+ "grad_norm": 0.6565102133805185,
+ "grad_max_sv": 0.2293539997190237,
+ "grad_min_sv": 1.2340318197856526e-08,
+ "grad_condition": 27740724.758145083,
+ "lr": 0.0007499999999999998,
+ "time_sec": 49.653481006622314
+ },
+ {
+ "epoch": 51,
+ "train_loss": 2.209577166748047,
+ "train_acc": 0.40976,
+ "test_loss": 6.840425001525879,
+ "test_acc": 0.0718,
+ "lyapunov": null,
+ "grad_norm": 0.6547461235382159,
+ "grad_max_sv": 0.22949806824326516,
+ "grad_min_sv": 1.2320622985728668e-08,
+ "grad_condition": 23307963.55905198,
+ "lr": 0.0007408768370508575,
+ "time_sec": 49.61805582046509
+ },
+ {
+ "epoch": 52,
+ "train_loss": 2.200788235549927,
+ "train_acc": 0.41432,
+ "test_loss": 7.2077490463256835,
+ "test_acc": 0.0756,
+ "lyapunov": null,
+ "grad_norm": 0.6510213685672233,
+ "grad_max_sv": 0.23402363583445548,
+ "grad_min_sv": 1.2258231881986937e-08,
+ "grad_condition": 75476519.13664213,
+ "lr": 0.0007316480175599307,
+ "time_sec": 49.646629095077515
+ },
+ {
+ "epoch": 53,
+ "train_loss": 2.184033504333496,
+ "train_acc": 0.41906,
+ "test_loss": 6.790815046691894,
+ "test_acc": 0.0761,
+ "lyapunov": null,
+ "grad_norm": 0.6498948423513097,
+ "grad_max_sv": 0.2297774288803339,
+ "grad_min_sv": 1.2289613515736875e-08,
+ "grad_condition": 25175002.986691862,
+ "lr": 0.0007223175895924635,
+ "time_sec": 49.616777181625366
+ },
+ {
+ "epoch": 54,
+ "train_loss": 2.1751246100616455,
+ "train_acc": 0.4209,
+ "test_loss": 7.843894770812988,
+ "test_acc": 0.0728,
+ "lyapunov": null,
+ "grad_norm": 0.6502026955560598,
+ "grad_max_sv": 0.22432956397533416,
+ "grad_min_sv": 1.2058743079079725e-08,
+ "grad_condition": 27210725.454316296,
+ "lr": 0.0007128896457825361,
+ "time_sec": 49.63462972640991
+ },
+ {
+ "epoch": 55,
+ "train_loss": 2.1508761085510253,
+ "train_acc": 0.42416,
+ "test_loss": 7.085880072784424,
+ "test_acc": 0.0952,
+ "lyapunov": null,
+ "grad_norm": 0.6487356152863625,
+ "grad_max_sv": 0.22850245125591756,
+ "grad_min_sv": 1.2312155951710312e-08,
+ "grad_condition": 41183718.923533805,
+ "lr": 0.0007033683215378998,
+ "time_sec": 49.64608693122864
+ },
+ {
+ "epoch": 56,
+ "train_loss": 2.141602848587036,
+ "train_acc": 0.42634,
+ "test_loss": 6.250551121520996,
+ "test_acc": 0.0971,
+ "lyapunov": null,
+ "grad_norm": 0.6410808562446506,
+ "grad_max_sv": 0.2151340998709202,
+ "grad_min_sv": 1.176430176191845e-08,
+ "grad_condition": 30604181.986327033,
+ "lr": 0.0006937577932260512,
+ "time_sec": 49.70740008354187
+ },
+ {
+ "epoch": 57,
+ "train_loss": 2.14431159286499,
+ "train_acc": 0.42548,
+ "test_loss": 6.846168923950195,
+ "test_acc": 0.0958,
+ "lyapunov": null,
+ "grad_norm": 0.6444720385859491,
+ "grad_max_sv": 0.2224727988243103,
+ "grad_min_sv": 1.2025717233132837e-08,
+ "grad_condition": 23924517.448539954,
+ "lr": 0.0006840622763423388,
+ "time_sec": 49.63225722312927
+ },
+ {
+ "epoch": 58,
+ "train_loss": 2.10916792388916,
+ "train_acc": 0.43432,
+ "test_loss": 6.8249847625732425,
+ "test_acc": 0.1066,
+ "lyapunov": null,
+ "grad_norm": 0.6502634467633226,
+ "grad_max_sv": 0.22863934263587,
+ "grad_min_sv": 1.218627998234023e-08,
+ "grad_condition": 28771962.702913057,
+ "lr": 0.0006742860236609073,
+ "time_sec": 49.63661074638367
+ },
+ {
+ "epoch": 59,
+ "train_loss": 2.100633440322876,
+ "train_acc": 0.43724,
+ "test_loss": 7.080769053649902,
+ "test_acc": 0.097,
+ "lyapunov": null,
+ "grad_norm": 0.6514345540301675,
+ "grad_max_sv": 0.23131897561252118,
+ "grad_min_sv": 1.2473222341102818e-08,
+ "grad_condition": 23428156.69088362,
+ "lr": 0.0006644333233692913,
+ "time_sec": 49.631585359573364
+ },
+ {
+ "epoch": 60,
+ "train_loss": 2.0753550579452513,
+ "train_acc": 0.44222,
+ "test_loss": 7.097881182861328,
+ "test_acc": 0.0782,
+ "lyapunov": null,
+ "grad_norm": 0.642048459758103,
+ "grad_max_sv": 0.21754480227828027,
+ "grad_min_sv": 1.2038245155582273e-08,
+ "grad_condition": 35173118.59205349,
+ "lr": 0.0006545084971874734,
+ "time_sec": 49.642804861068726
+ },
+ {
+ "epoch": 61,
+ "train_loss": 2.060260758514404,
+ "train_acc": 0.4465,
+ "test_loss": 6.766320790863037,
+ "test_acc": 0.0839,
+ "lyapunov": null,
+ "grad_norm": 0.6459643627424662,
+ "grad_max_sv": 0.223102143406868,
+ "grad_min_sv": 1.22261165164117e-08,
+ "grad_condition": 22073921.720915027,
+ "lr": 0.0006445158984722354,
+ "time_sec": 49.64657950401306
+ },
+ {
+ "epoch": 62,
+ "train_loss": 2.0472131072998048,
+ "train_acc": 0.4486,
+ "test_loss": 6.881848452758789,
+ "test_acc": 0.0976,
+ "lyapunov": null,
+ "grad_norm": 0.6461433133831308,
+ "grad_max_sv": 0.22962211742997168,
+ "grad_min_sv": 1.2113809159074174e-08,
+ "grad_condition": 324038818.4677658,
+ "lr": 0.0006344599103076324,
+ "time_sec": 49.627341747283936
+ },
+ {
+ "epoch": 63,
+ "train_loss": 2.035955301361084,
+ "train_acc": 0.44882,
+ "test_loss": 7.18960142211914,
+ "test_acc": 0.0878,
+ "lyapunov": null,
+ "grad_norm": 0.6422783690964438,
+ "grad_max_sv": 0.2209172960370779,
+ "grad_min_sv": 1.2127595816480152e-08,
+ "grad_condition": 21910433.389134284,
+ "lr": 0.0006243449435824269,
+ "time_sec": 49.64501976966858
+ },
+ {
+ "epoch": 64,
+ "train_loss": 2.036686828079224,
+ "train_acc": 0.45056,
+ "test_loss": 7.650535336303711,
+ "test_acc": 0.0924,
+ "lyapunov": null,
+ "grad_norm": 0.641718667248247,
+ "grad_max_sv": 0.22157798074185847,
+ "grad_min_sv": 1.1966991517176062e-08,
+ "grad_condition": 25321432.686805125,
+ "lr": 0.0006141754350553275,
+ "time_sec": 49.63518667221069
+ },
+ {
+ "epoch": 65,
+ "train_loss": 2.0039944877624514,
+ "train_acc": 0.45574,
+ "test_loss": 7.262261317443848,
+ "test_acc": 0.114,
+ "lyapunov": null,
+ "grad_norm": 0.6509729656164255,
+ "grad_max_sv": 0.2328164666891098,
+ "grad_min_sv": 1.2227686406116046e-08,
+ "grad_condition": 78588688.09864715,
+ "lr": 0.0006039558454088793,
+ "time_sec": 49.62892246246338
+ },
+ {
+ "epoch": 66,
+ "train_loss": 1.9934623148345947,
+ "train_acc": 0.4604,
+ "test_loss": 6.735845774841309,
+ "test_acc": 0.0988,
+ "lyapunov": null,
+ "grad_norm": 0.6428090636861153,
+ "grad_max_sv": 0.22018610946834088,
+ "grad_min_sv": 1.2050285417425366e-08,
+ "grad_condition": 33987345.003156364,
+ "lr": 0.000593690657292862,
+ "time_sec": 49.634801626205444
+ },
+ {
+ "epoch": 67,
+ "train_loss": 1.968681404800415,
+ "train_acc": 0.46364,
+ "test_loss": 7.602304705810547,
+ "test_acc": 0.0987,
+ "lyapunov": null,
+ "grad_norm": 0.6457740641454927,
+ "grad_max_sv": 0.2279145259410143,
+ "grad_min_sv": 1.2256968678903136e-08,
+ "grad_condition": 23591230.853540566,
+ "lr": 0.0005833843733580507,
+ "time_sec": 49.640379190444946
+ },
+ {
+ "epoch": 68,
+ "train_loss": 1.9723771545791626,
+ "train_acc": 0.46456,
+ "test_loss": 7.501553115844726,
+ "test_acc": 0.0743,
+ "lyapunov": null,
+ "grad_norm": 0.6345718818470338,
+ "grad_max_sv": 0.21636971682310105,
+ "grad_min_sv": 1.1871784413863828e-08,
+ "grad_condition": 21468624.440050583,
+ "lr": 0.0005730415142812054,
+ "time_sec": 49.618358850479126
+ },
+ {
+ "epoch": 69,
+ "train_loss": 1.950169172744751,
+ "train_acc": 0.46892,
+ "test_loss": 7.0990902679443355,
+ "test_acc": 0.0888,
+ "lyapunov": null,
+ "grad_norm": 0.6406229801466465,
+ "grad_max_sv": 0.2206659872084856,
+ "grad_min_sv": 1.1992476682196051e-08,
+ "grad_condition": 56593916.45522114,
+ "lr": 0.0005626666167821517,
+ "time_sec": 49.63790965080261
+ },
+ {
+ "epoch": 70,
+ "train_loss": 1.939907547531128,
+ "train_acc": 0.4716,
+ "test_loss": 7.282066575622559,
+ "test_acc": 0.0983,
+ "lyapunov": null,
+ "grad_norm": 0.6459981596212524,
+ "grad_max_sv": 0.23004377372562884,
+ "grad_min_sv": 1.2037511798457245e-08,
+ "grad_condition": 28235857.849722397,
+ "lr": 0.0005522642316338265,
+ "time_sec": 49.62828755378723
+ },
+ {
+ "epoch": 71,
+ "train_loss": 1.929073366470337,
+ "train_acc": 0.47462,
+ "test_loss": 6.812109463500977,
+ "test_acc": 0.1063,
+ "lyapunov": null,
+ "grad_norm": 0.6476540219610287,
+ "grad_max_sv": 0.22166885659098626,
+ "grad_min_sv": 1.2136537663048897e-08,
+ "grad_condition": 51677369.32839097,
+ "lr": 0.0005418389216661573,
+ "time_sec": 49.61943817138672
+ },
+ {
+ "epoch": 72,
+ "train_loss": 1.919623097305298,
+ "train_acc": 0.47576,
+ "test_loss": 6.68877933883667,
+ "test_acc": 0.0798,
+ "lyapunov": null,
+ "grad_norm": 0.638990192022336,
+ "grad_max_sv": 0.2177750900387764,
+ "grad_min_sv": 1.1837285757154703e-08,
+ "grad_condition": 30448032.105450857,
+ "lr": 0.0005313952597646563,
+ "time_sec": 49.63543653488159
+ },
+ {
+ "epoch": 73,
+ "train_loss": 1.8911805786514282,
+ "train_acc": 0.4813,
+ "test_loss": 7.259025004577636,
+ "test_acc": 0.1017,
+ "lyapunov": null,
+ "grad_norm": 0.6388927531170105,
+ "grad_max_sv": 0.2268439143896103,
+ "grad_min_sv": 1.2116396552741548e-08,
+ "grad_condition": 25828769.58088143,
+ "lr": 0.0005209378268645994,
+ "time_sec": 49.63246250152588
+ },
+ {
+ "epoch": 74,
+ "train_loss": 1.87730663772583,
+ "train_acc": 0.4856,
+ "test_loss": 6.621179290771485,
+ "test_acc": 0.1118,
+ "lyapunov": null,
+ "grad_norm": 0.6382424632105009,
+ "grad_max_sv": 0.22017028257250787,
+ "grad_min_sv": 1.1917627623647676e-08,
+ "grad_condition": 36459230.544282585,
+ "lr": 0.0005104712099416781,
+ "time_sec": 49.63705110549927
+ },
+ {
+ "epoch": 75,
+ "train_loss": 1.8676763352966308,
+ "train_acc": 0.4867,
+ "test_loss": 6.639352639770507,
+ "test_acc": 0.1035,
+ "lyapunov": null,
+ "grad_norm": 0.6471776484855016,
+ "grad_max_sv": 0.22313491702079774,
+ "grad_min_sv": 1.2076539387256834e-08,
+ "grad_condition": 168096640.34612545,
+ "lr": 0.0004999999999999996,
+ "time_sec": 49.62802839279175
+ },
+ {
+ "epoch": 76,
+ "train_loss": 1.8601240715026854,
+ "train_acc": 0.48752,
+ "test_loss": 7.69632975769043,
+ "test_acc": 0.093,
+ "lyapunov": null,
+ "grad_norm": 0.6373532537157988,
+ "grad_max_sv": 0.21818222440779209,
+ "grad_min_sv": 1.1897569247160123e-08,
+ "grad_condition": 49575276.624648556,
+ "lr": 0.0004895287900583212,
+ "time_sec": 49.61473488807678
+ },
+ {
+ "epoch": 77,
+ "train_loss": 1.844694657020569,
+ "train_acc": 0.49,
+ "test_loss": 7.673219400024414,
+ "test_acc": 0.0971,
+ "lyapunov": null,
+ "grad_norm": 0.6357429485708425,
+ "grad_max_sv": 0.21753050275146962,
+ "grad_min_sv": 1.1727277435258366e-08,
+ "grad_condition": 25108982.07055033,
+ "lr": 0.0004790621731353997,
+ "time_sec": 49.61942458152771
+ },
+ {
+ "epoch": 78,
+ "train_loss": 1.8382536688232423,
+ "train_acc": 0.49426,
+ "test_loss": 8.053473236083985,
+ "test_acc": 0.0877,
+ "lyapunov": null,
+ "grad_norm": 0.6413732546621618,
+ "grad_max_sv": 0.22126910798251628,
+ "grad_min_sv": 1.217776433408424e-08,
+ "grad_condition": 50630196.79387429,
+ "lr": 0.000468604740235343,
+ "time_sec": 49.620675802230835
+ },
+ {
+ "epoch": 79,
+ "train_loss": 1.8119768780899048,
+ "train_acc": 0.50004,
+ "test_loss": 7.10159133605957,
+ "test_acc": 0.103,
+ "lyapunov": null,
+ "grad_norm": 0.64075038803741,
+ "grad_max_sv": 0.22004345506429673,
+ "grad_min_sv": 1.179401228554311e-08,
+ "grad_condition": 39644724.18434289,
+ "lr": 0.00045816107833384175,
+ "time_sec": 49.65424633026123
+ },
+ {
+ "epoch": 80,
+ "train_loss": 1.805297444114685,
+ "train_acc": 0.50122,
+ "test_loss": 7.127357855224609,
+ "test_acc": 0.1076,
+ "lyapunov": null,
+ "grad_norm": 0.6452326753546996,
+ "grad_max_sv": 0.2212912131100893,
+ "grad_min_sv": 1.2059882024961777e-08,
+ "grad_condition": 29968320.229064513,
+ "lr": 0.0004477357683661729,
+ "time_sec": 49.62116003036499
+ },
+ {
+ "epoch": 81,
+ "train_loss": 1.792769065246582,
+ "train_acc": 0.50348,
+ "test_loss": 7.439458018493652,
+ "test_acc": 0.0985,
+ "lyapunov": null,
+ "grad_norm": 0.6408257507786687,
+ "grad_max_sv": 0.22126449905335904,
+ "grad_min_sv": 1.1952658901526191e-08,
+ "grad_condition": 23156470.62447612,
+ "lr": 0.00043733338321784746,
+ "time_sec": 49.64424705505371
+ },
+ {
+ "epoch": 82,
+ "train_loss": 1.770621812400818,
+ "train_acc": 0.51052,
+ "test_loss": 7.155345419311524,
+ "test_acc": 0.1127,
+ "lyapunov": null,
+ "grad_norm": 0.6446017522348026,
+ "grad_max_sv": 0.22318419590592384,
+ "grad_min_sv": 1.1969205995082665e-08,
+ "grad_condition": 88594611.75801164,
+ "lr": 0.0004269584857187939,
+ "time_sec": 49.622429847717285
+ },
+ {
+ "epoch": 83,
+ "train_loss": 1.769109418029785,
+ "train_acc": 0.50846,
+ "test_loss": 7.010694668579101,
+ "test_acc": 0.1057,
+ "lyapunov": null,
+ "grad_norm": 0.6502891030839932,
+ "grad_max_sv": 0.2263760395348072,
+ "grad_min_sv": 1.2018579030603772e-08,
+ "grad_condition": 29299643.5314746,
+ "lr": 0.0004166156266419484,
+ "time_sec": 49.614967584609985
+ },
+ {
+ "epoch": 84,
+ "train_loss": 1.7552229693222046,
+ "train_acc": 0.51318,
+ "test_loss": 7.019638833618164,
+ "test_acc": 0.1006,
+ "lyapunov": null,
+ "grad_norm": 0.6441122145546607,
+ "grad_max_sv": 0.21587914675474168,
+ "grad_min_sv": 1.1914460645509606e-08,
+ "grad_condition": 54331112.96990696,
+ "lr": 0.0004063093427071373,
+ "time_sec": 49.63624048233032
+ },
+ {
+ "epoch": 85,
+ "train_loss": 1.7453889175796509,
+ "train_acc": 0.5142,
+ "test_loss": 6.935272999572754,
+ "test_acc": 0.0772,
+ "lyapunov": null,
+ "grad_norm": 0.6354119534548792,
+ "grad_max_sv": 0.22349480539560318,
+ "grad_min_sv": 1.188125494724912e-08,
+ "grad_condition": 54450146.559093714,
+ "lr": 0.0003960441545911199,
+ "time_sec": 49.63727903366089
+ },
+ {
+ "epoch": 86,
+ "train_loss": 1.7361508292388916,
+ "train_acc": 0.51694,
+ "test_loss": 6.903331332397461,
+ "test_acc": 0.0874,
+ "lyapunov": null,
+ "grad_norm": 0.6433396686482765,
+ "grad_max_sv": 0.2229986496269703,
+ "grad_min_sv": 1.2302347957016124e-08,
+ "grad_condition": 20829684.95092944,
+ "lr": 0.0003858245649446718,
+ "time_sec": 49.620397329330444
+ },
+ {
+ "epoch": 87,
+ "train_loss": 1.7140229907989502,
+ "train_acc": 0.52362,
+ "test_loss": 6.144080555725098,
+ "test_acc": 0.0973,
+ "lyapunov": null,
+ "grad_norm": 0.6397281329733326,
+ "grad_max_sv": 0.2236575834453106,
+ "grad_min_sv": 1.2130321444536741e-08,
+ "grad_condition": 24582093.327500105,
+ "lr": 0.00037565505641757235,
+ "time_sec": 49.63749957084656
+ },
+ {
+ "epoch": 88,
+ "train_loss": 1.698942677230835,
+ "train_acc": 0.52702,
+ "test_loss": 6.329557989501953,
+ "test_acc": 0.1043,
+ "lyapunov": null,
+ "grad_norm": 0.6429735672215783,
+ "grad_max_sv": 0.22443199381232262,
+ "grad_min_sv": 1.2242971281217762e-08,
+ "grad_condition": 21997184.984676402,
+ "lr": 0.00036554008969236695,
+ "time_sec": 49.64341187477112
+ },
+ {
+ "epoch": 89,
+ "train_loss": 1.6915926089859008,
+ "train_acc": 0.52672,
+ "test_loss": 6.97091061706543,
+ "test_acc": 0.1064,
+ "lyapunov": null,
+ "grad_norm": 0.6396443107842517,
+ "grad_max_sv": 0.21398231349885463,
+ "grad_min_sv": 1.1860397219898289e-08,
+ "grad_condition": 25819116.390227333,
+ "lr": 0.0003554841015277638,
+ "time_sec": 49.61740279197693
+ },
+ {
+ "epoch": 90,
+ "train_loss": 1.6705048236846924,
+ "train_acc": 0.53226,
+ "test_loss": 6.474410656738281,
+ "test_acc": 0.1104,
+ "lyapunov": null,
+ "grad_norm": 0.6447874278631877,
+ "grad_max_sv": 0.22352466247975827,
+ "grad_min_sv": 1.1839073051078675e-08,
+ "grad_condition": 194632597.18194634,
+ "lr": 0.000345491502812526,
+ "time_sec": 49.63944673538208
+ },
+ {
+ "epoch": 91,
+ "train_loss": 1.6604324224090576,
+ "train_acc": 0.53478,
+ "test_loss": 7.210493100738526,
+ "test_acc": 0.1186,
+ "lyapunov": null,
+ "grad_norm": 0.6483901695782636,
+ "grad_max_sv": 0.23147397823631763,
+ "grad_min_sv": 1.2240159032281435e-08,
+ "grad_condition": 833122995.4080375,
+ "lr": 0.0003355666766307081,
+ "time_sec": 49.65723490715027
+ },
+ {
+ "epoch": 92,
+ "train_loss": 1.655436181564331,
+ "train_acc": 0.53562,
+ "test_loss": 6.41819879989624,
+ "test_acc": 0.1099,
+ "lyapunov": null,
+ "grad_norm": 0.6422800867205569,
+ "grad_max_sv": 0.22188753299415112,
+ "grad_min_sv": 1.1910704758588687e-08,
+ "grad_condition": 31454971.248209517,
+ "lr": 0.00032571397633909225,
+ "time_sec": 49.62359666824341
+ },
+ {
+ "epoch": 93,
+ "train_loss": 1.6418727423477173,
+ "train_acc": 0.53886,
+ "test_loss": 6.5647822364807125,
+ "test_acc": 0.1078,
+ "lyapunov": null,
+ "grad_norm": 0.6425002000385331,
+ "grad_max_sv": 0.22996555864810944,
+ "grad_min_sv": 1.214085261491693e-08,
+ "grad_condition": 23136414.278494585,
+ "lr": 0.00031593772365766094,
+ "time_sec": 49.648432970047
+ },
+ {
+ "epoch": 94,
+ "train_loss": 1.6380917670822144,
+ "train_acc": 0.54016,
+ "test_loss": 6.60304995880127,
+ "test_acc": 0.1013,
+ "lyapunov": null,
+ "grad_norm": 0.6435715746993702,
+ "grad_max_sv": 0.22394425868988038,
+ "grad_min_sv": 1.1969105850884176e-08,
+ "grad_condition": 22813937.74993243,
+ "lr": 0.0003062422067739483,
+ "time_sec": 49.62917709350586
+ },
+ {
+ "epoch": 95,
+ "train_loss": 1.6159375607681274,
+ "train_acc": 0.54468,
+ "test_loss": 7.4295039352417,
+ "test_acc": 0.1043,
+ "lyapunov": null,
+ "grad_norm": 0.6459265748151144,
+ "grad_max_sv": 0.2222417715936899,
+ "grad_min_sv": 1.2084532810541226e-08,
+ "grad_condition": 23228929.65699155,
+ "lr": 0.00029663167846209965,
+ "time_sec": 49.633803606033325
+ },
+ {
+ "epoch": 96,
+ "train_loss": 1.6130770600128175,
+ "train_acc": 0.54918,
+ "test_loss": 7.755695833587646,
+ "test_acc": 0.103,
+ "lyapunov": null,
+ "grad_norm": 0.6373845581356181,
+ "grad_max_sv": 0.2166528631001711,
+ "grad_min_sv": 1.1723080543812881e-08,
+ "grad_condition": 61573060.408652686,
+ "lr": 0.00028711035421746345,
+ "time_sec": 49.63398790359497
+ },
+ {
+ "epoch": 97,
+ "train_loss": 1.5942238623046876,
+ "train_acc": 0.55338,
+ "test_loss": 7.366734781646729,
+ "test_acc": 0.0942,
+ "lyapunov": null,
+ "grad_norm": 0.645954709653033,
+ "grad_max_sv": 0.23344604782760142,
+ "grad_min_sv": 1.211216281021832e-08,
+ "grad_condition": 28920253.40686954,
+ "lr": 0.00027768241040753615,
+ "time_sec": 49.63687562942505
+ },
+ {
+ "epoch": 98,
+ "train_loss": 1.5829193838119506,
+ "train_acc": 0.55468,
+ "test_loss": 7.60546820526123,
+ "test_acc": 0.0996,
+ "lyapunov": null,
+ "grad_norm": 0.6414940955031293,
+ "grad_max_sv": 0.22326541543006898,
+ "grad_min_sv": 1.18154431003048e-08,
+ "grad_condition": 27850671.690087616,
+ "lr": 0.00026835198244006903,
+ "time_sec": 49.60518288612366
+ },
+ {
+ "epoch": 99,
+ "train_loss": 1.5702915887451172,
+ "train_acc": 0.55388,
+ "test_loss": 7.25171710357666,
+ "test_acc": 0.0857,
+ "lyapunov": null,
+ "grad_norm": 0.6448707164382114,
+ "grad_max_sv": 0.22703963220119477,
+ "grad_min_sv": 1.2078747084476315e-08,
+ "grad_condition": 30695848.89590156,
+ "lr": 0.0002591231629491421,
+ "time_sec": 49.6348443031311
+ },
+ {
+ "epoch": 100,
+ "train_loss": 1.563120531387329,
+ "train_acc": 0.5575,
+ "test_loss": 7.321073220062256,
+ "test_acc": 0.0975,
+ "lyapunov": null,
+ "grad_norm": 0.6501432324709732,
+ "grad_max_sv": 0.22466112971305846,
+ "grad_min_sv": 1.1973627836447952e-08,
+ "grad_condition": 23144250.2743996,
+ "lr": 0.0002499999999999997,
+ "time_sec": 49.639625549316406
+ },
+ {
+ "epoch": 101,
+ "train_loss": 1.5544149493026733,
+ "train_acc": 0.562,
+ "test_loss": 8.2606175201416,
+ "test_acc": 0.0986,
+ "lyapunov": null,
+ "grad_norm": 0.6383634384668164,
+ "grad_max_sv": 0.22597188949584962,
+ "grad_min_sv": 1.1897128555232727e-08,
+ "grad_condition": 42860913.99555977,
+ "lr": 0.00024098649531343477,
+ "time_sec": 49.64992117881775
+ },
+ {
+ "epoch": 102,
+ "train_loss": 1.547795528869629,
+ "train_acc": 0.5621,
+ "test_loss": 7.994213732910156,
+ "test_acc": 0.1009,
+ "lyapunov": null,
+ "grad_norm": 0.6440457566084322,
+ "grad_max_sv": 0.22605536915361882,
+ "grad_min_sv": 1.21044593875963e-08,
+ "grad_condition": 23222249.12666279,
+ "lr": 0.0002320866025105016,
+ "time_sec": 49.638099670410156
+ },
+ {
+ "epoch": 103,
+ "train_loss": 1.5383813903045653,
+ "train_acc": 0.56598,
+ "test_loss": 8.507730350494384,
+ "test_acc": 0.0971,
+ "lyapunov": null,
+ "grad_norm": 0.6412277700079685,
+ "grad_max_sv": 0.2286630392074585,
+ "grad_min_sv": 1.1935943896451695e-08,
+ "grad_condition": 61496117.17851217,
+ "lr": 0.0002233042253783278,
+ "time_sec": 49.624167919158936
+ },
+ {
+ "epoch": 104,
+ "train_loss": 1.5296855780792236,
+ "train_acc": 0.56802,
+ "test_loss": 7.766149099731446,
+ "test_acc": 0.1005,
+ "lyapunov": null,
+ "grad_norm": 0.6402323929530521,
+ "grad_max_sv": 0.2234394859522581,
+ "grad_min_sv": 1.1708301472790339e-08,
+ "grad_condition": 51957414.29232074,
+ "lr": 0.000214643216157784,
+ "time_sec": 49.62683367729187
+ },
+ {
+ "epoch": 105,
+ "train_loss": 1.515010786781311,
+ "train_acc": 0.5704,
+ "test_loss": 7.568338539123535,
+ "test_acc": 0.1172,
+ "lyapunov": null,
+ "grad_norm": 0.6478082803296404,
+ "grad_max_sv": 0.23342282325029373,
+ "grad_min_sv": 1.216084826727304e-08,
+ "grad_condition": 26048714.73020513,
+ "lr": 0.00020610737385376332,
+ "time_sec": 49.63592481613159
+ },
+ {
+ "epoch": 106,
+ "train_loss": 1.512930496749878,
+ "train_acc": 0.56978,
+ "test_loss": 7.760108979797363,
+ "test_acc": 0.1047,
+ "lyapunov": null,
+ "grad_norm": 0.6453652740846443,
+ "grad_max_sv": 0.22414597682654858,
+ "grad_min_sv": 1.1973005337173603e-08,
+ "grad_condition": 26272467.73653502,
+ "lr": 0.00019770044256881242,
+ "time_sec": 49.61698055267334
+ },
+ {
+ "epoch": 107,
+ "train_loss": 1.4956118043899536,
+ "train_acc": 0.57444,
+ "test_loss": 8.33652488708496,
+ "test_acc": 0.1011,
+ "lyapunov": null,
+ "grad_norm": 0.6438260578925417,
+ "grad_max_sv": 0.2238406077027321,
+ "grad_min_sv": 1.1764498750177488e-08,
+ "grad_condition": 28981818.37375744,
+ "lr": 0.0001894261098608447,
+ "time_sec": 49.63762021064758
+ },
+ {
+ "epoch": 108,
+ "train_loss": 1.491361379776001,
+ "train_acc": 0.57876,
+ "test_loss": 8.52306475906372,
+ "test_acc": 0.1029,
+ "lyapunov": null,
+ "grad_norm": 0.6413105894442734,
+ "grad_max_sv": 0.22412343323230743,
+ "grad_min_sv": 1.2146300558402157e-08,
+ "grad_condition": 34732320.931619205,
+ "lr": 0.000181288005125655,
+ "time_sec": 49.6246235370636
+ },
+ {
+ "epoch": 109,
+ "train_loss": 1.4785979221343994,
+ "train_acc": 0.5778,
+ "test_loss": 7.686713803100586,
+ "test_acc": 0.0994,
+ "lyapunov": null,
+ "grad_norm": 0.6419467845001164,
+ "grad_max_sv": 0.22575648352503777,
+ "grad_min_sv": 1.1847785963414737e-08,
+ "grad_condition": 32480603.86279717,
+ "lr": 0.0001732896980049473,
+ "time_sec": 49.628063678741455
+ },
+ {
+ "epoch": 110,
+ "train_loss": 1.4723126147842407,
+ "train_acc": 0.57888,
+ "test_loss": 8.482755671691894,
+ "test_acc": 0.1053,
+ "lyapunov": null,
+ "grad_norm": 0.6427405399098718,
+ "grad_max_sv": 0.2258045580238104,
+ "grad_min_sv": 1.177179903347203e-08,
+ "grad_condition": 55737890.93326217,
+ "lr": 0.00016543469682057076,
+ "time_sec": 49.82239508628845
+ },
+ {
+ "epoch": 111,
+ "train_loss": 1.4714193873977661,
+ "train_acc": 0.5821,
+ "test_loss": 8.059153175354004,
+ "test_acc": 0.1095,
+ "lyapunov": null,
+ "grad_norm": 0.643358384906005,
+ "grad_max_sv": 0.2271666146814823,
+ "grad_min_sv": 1.1828724497814358e-08,
+ "grad_condition": 53541240.65537085,
+ "lr": 0.00015772644703565552,
+ "time_sec": 49.64692163467407
+ },
+ {
+ "epoch": 112,
+ "train_loss": 1.4565179361724854,
+ "train_acc": 0.58618,
+ "test_loss": 8.070704318237304,
+ "test_acc": 0.0989,
+ "lyapunov": null,
+ "grad_norm": 0.6414562113271406,
+ "grad_max_sv": 0.22715382017195224,
+ "grad_min_sv": 1.2078682694316445e-08,
+ "grad_condition": 27450211.87146064,
+ "lr": 0.00015016832974331713,
+ "time_sec": 49.634828329086304
+ },
+ {
+ "epoch": 113,
+ "train_loss": 1.445754097442627,
+ "train_acc": 0.58848,
+ "test_loss": 8.390233863830566,
+ "test_acc": 0.1078,
+ "lyapunov": null,
+ "grad_norm": 0.6411801061752302,
+ "grad_max_sv": 0.2343009330332279,
+ "grad_min_sv": 1.2054243894374373e-08,
+ "grad_condition": 73622071.21411385,
+ "lr": 0.00014276366018359834,
+ "time_sec": 49.62168598175049
+ },
+ {
+ "epoch": 114,
+ "train_loss": 1.4396562029647828,
+ "train_acc": 0.59112,
+ "test_loss": 7.990397840881347,
+ "test_acc": 0.1207,
+ "lyapunov": null,
+ "grad_norm": 0.6446675700592518,
+ "grad_max_sv": 0.22858907766640185,
+ "grad_min_sv": 1.2150255043752444e-08,
+ "grad_condition": 23031763.367673956,
+ "lr": 0.00013551568628929425,
+ "time_sec": 49.621737480163574
+ },
+ {
+ "epoch": 115,
+ "train_loss": 1.4295790006256104,
+ "train_acc": 0.5919,
+ "test_loss": 7.907929286956787,
+ "test_acc": 0.1088,
+ "lyapunov": null,
+ "grad_norm": 0.6414787996170513,
+ "grad_max_sv": 0.22259003035724162,
+ "grad_min_sv": 1.1937235663839196e-08,
+ "grad_condition": 26925988.130458646,
+ "lr": 0.00012842758726130276,
+ "time_sec": 49.702799558639526
+ },
+ {
+ "epoch": 116,
+ "train_loss": 1.419941686477661,
+ "train_acc": 0.59402,
+ "test_loss": 7.794718334197998,
+ "test_acc": 0.118,
+ "lyapunov": null,
+ "grad_norm": 0.6403562503796186,
+ "grad_max_sv": 0.23044625744223596,
+ "grad_min_sv": 1.1990111638271461e-08,
+ "grad_condition": 86324103.75912428,
+ "lr": 0.0001215024721741218,
+ "time_sec": 49.6519889831543
+ },
+ {
+ "epoch": 117,
+ "train_loss": 1.4125151259613038,
+ "train_acc": 0.59724,
+ "test_loss": 8.082193556976318,
+ "test_acc": 0.1093,
+ "lyapunov": null,
+ "grad_norm": 0.6390276536629967,
+ "grad_max_sv": 0.22913259454071522,
+ "grad_min_sv": 1.1846856870501021e-08,
+ "grad_condition": 38051050.155520104,
+ "lr": 0.00011474337861210538,
+ "time_sec": 49.67843008041382
+ },
+ {
+ "epoch": 118,
+ "train_loss": 1.4061624579238892,
+ "train_acc": 0.59848,
+ "test_loss": 7.994955434417725,
+ "test_acc": 0.1217,
+ "lyapunov": null,
+ "grad_norm": 0.6431427525608711,
+ "grad_max_sv": 0.22681293152272702,
+ "grad_min_sv": 1.2012494199353796e-08,
+ "grad_condition": 22440692.932778567,
+ "lr": 0.00010815327133708009,
+ "time_sec": 49.65889072418213
+ },
+ {
+ "epoch": 119,
+ "train_loss": 1.4033130680847168,
+ "train_acc": 0.59806,
+ "test_loss": 7.7351758087158204,
+ "test_acc": 0.1159,
+ "lyapunov": null,
+ "grad_norm": 0.6393512801434791,
+ "grad_max_sv": 0.22470695674419403,
+ "grad_min_sv": 1.173807711446484e-08,
+ "grad_condition": 33523113.628067147,
+ "lr": 0.00010173504098790182,
+ "time_sec": 49.65284276008606
+ },
+ {
+ "epoch": 120,
+ "train_loss": 1.3988560864257813,
+ "train_acc": 0.59928,
+ "test_loss": 8.596598931121827,
+ "test_acc": 0.104,
+ "lyapunov": null,
+ "grad_norm": 0.6430512338238313,
+ "grad_max_sv": 0.23124604262411594,
+ "grad_min_sv": 1.2035057309067731e-08,
+ "grad_condition": 27263284.07382477,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 49.64090633392334
+ },
+ {
+ "epoch": 121,
+ "train_loss": 1.3857270031356812,
+ "train_acc": 0.60484,
+ "test_loss": 7.9892033752441405,
+ "test_acc": 0.1183,
+ "lyapunov": null,
+ "grad_norm": 0.6395461283787793,
+ "grad_max_sv": 0.22570451460778712,
+ "grad_min_sv": 1.2030840006518884e-08,
+ "grad_condition": 53181043.26539834,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 49.60771918296814
+ },
+ {
+ "epoch": 122,
+ "train_loss": 1.3880330154037475,
+ "train_acc": 0.60376,
+ "test_loss": 8.22642307357788,
+ "test_acc": 0.115,
+ "lyapunov": null,
+ "grad_norm": 0.6427946655580464,
+ "grad_max_sv": 0.22782764062285424,
+ "grad_min_sv": 1.1785313203116487e-08,
+ "grad_condition": 24787267.408791415,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 49.64048886299133
+ },
+ {
+ "epoch": 123,
+ "train_loss": 1.377012547569275,
+ "train_acc": 0.60464,
+ "test_loss": 7.7657553009033204,
+ "test_acc": 0.114,
+ "lyapunov": null,
+ "grad_norm": 0.6396634441881897,
+ "grad_max_sv": 0.23086622469127177,
+ "grad_min_sv": 1.198922548739656e-08,
+ "grad_condition": 23123320.372294467,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 49.63312888145447
+ },
+ {
+ "epoch": 124,
+ "train_loss": 1.376011091003418,
+ "train_acc": 0.60928,
+ "test_loss": 7.944722248840332,
+ "test_acc": 0.1039,
+ "lyapunov": null,
+ "grad_norm": 0.6321494808563242,
+ "grad_max_sv": 0.22378434427082539,
+ "grad_min_sv": 1.1604401764855887e-08,
+ "grad_condition": 58244211.34800786,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 49.64424800872803
+ },
+ {
+ "epoch": 125,
+ "train_loss": 1.368886891708374,
+ "train_acc": 0.60824,
+ "test_loss": 8.258360435485839,
+ "test_acc": 0.1147,
+ "lyapunov": null,
+ "grad_norm": 0.6400148651728099,
+ "grad_max_sv": 0.22423702478408813,
+ "grad_min_sv": 1.175346897655527e-08,
+ "grad_condition": 47951723.35743973,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 49.635197162628174
+ },
+ {
+ "epoch": 126,
+ "train_loss": 1.368887268447876,
+ "train_acc": 0.60784,
+ "test_loss": 8.00912710647583,
+ "test_acc": 0.1098,
+ "lyapunov": null,
+ "grad_norm": 0.6414620945866057,
+ "grad_max_sv": 0.22984928116202355,
+ "grad_min_sv": 1.1862470802870284e-08,
+ "grad_condition": 27488218.9085432,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 49.63115334510803
+ },
+ {
+ "epoch": 127,
+ "train_loss": 1.3691972059631348,
+ "train_acc": 0.60894,
+ "test_loss": 8.099956825256347,
+ "test_acc": 0.1137,
+ "lyapunov": null,
+ "grad_norm": 0.6379342286587659,
+ "grad_max_sv": 0.22721209563314915,
+ "grad_min_sv": 1.1842124452571268e-08,
+ "grad_condition": 66054597.76675473,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 49.64264273643494
+ },
+ {
+ "epoch": 128,
+ "train_loss": 1.3585320538711547,
+ "train_acc": 0.61176,
+ "test_loss": 8.168904312896728,
+ "test_acc": 0.1178,
+ "lyapunov": null,
+ "grad_norm": 0.6384779111033096,
+ "grad_max_sv": 0.2258748199790716,
+ "grad_min_sv": 1.1702591148909925e-08,
+ "grad_condition": 121211424.44652918,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 49.62958645820618
+ },
+ {
+ "epoch": 129,
+ "train_loss": 1.3585711254501343,
+ "train_acc": 0.6101,
+ "test_loss": 7.90961298828125,
+ "test_acc": 0.1095,
+ "lyapunov": null,
+ "grad_norm": 0.6412738082737135,
+ "grad_max_sv": 0.22799600511789322,
+ "grad_min_sv": 1.2047476663501478e-08,
+ "grad_condition": 44984170.42448841,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 49.62019920349121
+ },
+ {
+ "epoch": 130,
+ "train_loss": 1.3606473222351074,
+ "train_acc": 0.60866,
+ "test_loss": 7.8885728500366215,
+ "test_acc": 0.1165,
+ "lyapunov": null,
+ "grad_norm": 0.6429377341506345,
+ "grad_max_sv": 0.22763566635549068,
+ "grad_min_sv": 1.1949406383826578e-08,
+ "grad_condition": 23238593.216242827,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 49.60610270500183
+ },
+ {
+ "epoch": 131,
+ "train_loss": 1.340769683189392,
+ "train_acc": 0.61422,
+ "test_loss": 7.97282382888794,
+ "test_acc": 0.1176,
+ "lyapunov": null,
+ "grad_norm": 0.6365898965081005,
+ "grad_max_sv": 0.22698684968054295,
+ "grad_min_sv": 1.1841301903944835e-08,
+ "grad_condition": 57050057.91630666,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 49.639729738235474
+ },
+ {
+ "epoch": 132,
+ "train_loss": 1.3506625385284423,
+ "train_acc": 0.61254,
+ "test_loss": 8.237340574645996,
+ "test_acc": 0.1112,
+ "lyapunov": null,
+ "grad_norm": 0.6405822016126281,
+ "grad_max_sv": 0.2313113920390606,
+ "grad_min_sv": 1.1943680751358432e-08,
+ "grad_condition": 32855860.000038534,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 49.62140464782715
+ },
+ {
+ "epoch": 133,
+ "train_loss": 1.3537355774307251,
+ "train_acc": 0.60946,
+ "test_loss": 8.220967332458496,
+ "test_acc": 0.1107,
+ "lyapunov": null,
+ "grad_norm": 0.6424071935223469,
+ "grad_max_sv": 0.2330889504402876,
+ "grad_min_sv": 1.1997084857148787e-08,
+ "grad_condition": 44613447.03937371,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 49.62578868865967
+ },
+ {
+ "epoch": 134,
+ "train_loss": 1.33552843044281,
+ "train_acc": 0.61362,
+ "test_loss": 8.059291929626465,
+ "test_acc": 0.1019,
+ "lyapunov": null,
+ "grad_norm": 0.6408761914883747,
+ "grad_max_sv": 0.2316820841282606,
+ "grad_min_sv": 1.1778968132813982e-08,
+ "grad_condition": 105523171.68805893,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 49.62417006492615
+ },
+ {
+ "epoch": 135,
+ "train_loss": 1.3386833112335206,
+ "train_acc": 0.61374,
+ "test_loss": 7.973577444458008,
+ "test_acc": 0.1097,
+ "lyapunov": null,
+ "grad_norm": 0.6388300432658766,
+ "grad_max_sv": 0.22841673195362092,
+ "grad_min_sv": 1.1936609616361448e-08,
+ "grad_condition": 69324765.09964362,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 49.65416145324707
+ },
+ {
+ "epoch": 136,
+ "train_loss": 1.3311992990112305,
+ "train_acc": 0.618,
+ "test_loss": 8.200102568817139,
+ "test_acc": 0.1214,
+ "lyapunov": null,
+ "grad_norm": 0.638950694855791,
+ "grad_max_sv": 0.2365179505199194,
+ "grad_min_sv": 1.1939427453644402e-08,
+ "grad_condition": 27475716.41514334,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 49.64095640182495
+ },
+ {
+ "epoch": 137,
+ "train_loss": 1.3340746058273316,
+ "train_acc": 0.61812,
+ "test_loss": 7.946666102600098,
+ "test_acc": 0.1106,
+ "lyapunov": null,
+ "grad_norm": 0.6352812169452327,
+ "grad_max_sv": 0.22020692974328995,
+ "grad_min_sv": 1.1623311241271139e-08,
+ "grad_condition": 29930613.060724013,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 49.633143186569214
+ },
+ {
+ "epoch": 138,
+ "train_loss": 1.336420276031494,
+ "train_acc": 0.61512,
+ "test_loss": 8.25653330230713,
+ "test_acc": 0.112,
+ "lyapunov": null,
+ "grad_norm": 0.6397251204580275,
+ "grad_max_sv": 0.23347726799547672,
+ "grad_min_sv": 1.1918404803357152e-08,
+ "grad_condition": 81456104.36957063,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 49.639748334884644
+ },
+ {
+ "epoch": 139,
+ "train_loss": 1.3220760538482665,
+ "train_acc": 0.61838,
+ "test_loss": 8.026485778808594,
+ "test_acc": 0.1138,
+ "lyapunov": null,
+ "grad_norm": 0.6398193491025633,
+ "grad_max_sv": 0.2238193929195404,
+ "grad_min_sv": 1.1681687835801702e-08,
+ "grad_condition": 38144371.645152286,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 49.63212180137634
+ },
+ {
+ "epoch": 140,
+ "train_loss": 1.3198553924942016,
+ "train_acc": 0.61854,
+ "test_loss": 8.029016185760499,
+ "test_acc": 0.1179,
+ "lyapunov": null,
+ "grad_norm": 0.639466602267434,
+ "grad_max_sv": 0.22324420213699342,
+ "grad_min_sv": 1.1702349164699477e-08,
+ "grad_condition": 28474783.149248235,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 49.65198302268982
+ },
+ {
+ "epoch": 141,
+ "train_loss": 1.3253049739837646,
+ "train_acc": 0.62014,
+ "test_loss": 8.258732906341553,
+ "test_acc": 0.1086,
+ "lyapunov": null,
+ "grad_norm": 0.6377969869493302,
+ "grad_max_sv": 0.23066396303474904,
+ "grad_min_sv": 1.1955105984340354e-08,
+ "grad_condition": 28290681.03527581,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 49.712565183639526
+ },
+ {
+ "epoch": 142,
+ "train_loss": 1.3294593518066407,
+ "train_acc": 0.6165,
+ "test_loss": 8.097643237304688,
+ "test_acc": 0.1079,
+ "lyapunov": null,
+ "grad_norm": 0.6416721044495594,
+ "grad_max_sv": 0.22946001626551152,
+ "grad_min_sv": 1.1918349693273988e-08,
+ "grad_condition": 33830275.99348913,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 49.62647032737732
+ },
+ {
+ "epoch": 143,
+ "train_loss": 1.3246013949203492,
+ "train_acc": 0.619,
+ "test_loss": 8.003326276397704,
+ "test_acc": 0.1093,
+ "lyapunov": null,
+ "grad_norm": 0.6406658358506779,
+ "grad_max_sv": 0.22979442439973355,
+ "grad_min_sv": 1.1885957310075503e-08,
+ "grad_condition": 1265929967.3983974,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 49.64323043823242
+ },
+ {
+ "epoch": 144,
+ "train_loss": 1.3237170028686522,
+ "train_acc": 0.61912,
+ "test_loss": 8.245773946380615,
+ "test_acc": 0.1116,
+ "lyapunov": null,
+ "grad_norm": 0.640154182788332,
+ "grad_max_sv": 0.22960694395005704,
+ "grad_min_sv": 1.1789325913159205e-08,
+ "grad_condition": 220785020.05461937,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 49.62677884101868
+ },
+ {
+ "epoch": 145,
+ "train_loss": 1.323034522781372,
+ "train_acc": 0.61748,
+ "test_loss": 8.367132460784912,
+ "test_acc": 0.1101,
+ "lyapunov": null,
+ "grad_norm": 0.6399875505077857,
+ "grad_max_sv": 0.2292648758739233,
+ "grad_min_sv": 1.1756407276852787e-08,
+ "grad_condition": 46749240.33218758,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 49.61358666419983
+ },
+ {
+ "epoch": 146,
+ "train_loss": 1.3221456618118286,
+ "train_acc": 0.61958,
+ "test_loss": 8.256616510772705,
+ "test_acc": 0.1088,
+ "lyapunov": null,
+ "grad_norm": 0.6401843350865242,
+ "grad_max_sv": 0.23075628280639648,
+ "grad_min_sv": 1.1929567545268527e-08,
+ "grad_condition": 56821403.658394314,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 49.62871527671814
+ },
+ {
+ "epoch": 147,
+ "train_loss": 1.32188304227829,
+ "train_acc": 0.62262,
+ "test_loss": 7.983602857208252,
+ "test_acc": 0.115,
+ "lyapunov": null,
+ "grad_norm": 0.6377455957871468,
+ "grad_max_sv": 0.2265624139457941,
+ "grad_min_sv": 1.1661963828825395e-08,
+ "grad_condition": 178436067.44761798,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 49.63710594177246
+ },
+ {
+ "epoch": 148,
+ "train_loss": 1.3234341220855712,
+ "train_acc": 0.61708,
+ "test_loss": 8.329111752319337,
+ "test_acc": 0.1046,
+ "lyapunov": null,
+ "grad_norm": 0.6428801038701755,
+ "grad_max_sv": 0.2313603863120079,
+ "grad_min_sv": 1.1845945344264585e-08,
+ "grad_condition": 144408842.21709472,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 49.63905072212219
+ },
+ {
+ "epoch": 149,
+ "train_loss": 1.3202154207611083,
+ "train_acc": 0.61986,
+ "test_loss": 8.021684009552002,
+ "test_acc": 0.1127,
+ "lyapunov": null,
+ "grad_norm": 0.6406912156142667,
+ "grad_max_sv": 0.2288107428699732,
+ "grad_min_sv": 1.181119294590971e-08,
+ "grad_condition": 65688308.80478315,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 49.61029553413391
+ },
+ {
+ "epoch": 150,
+ "train_loss": 1.3158636585235595,
+ "train_acc": 0.62006,
+ "test_loss": 8.094485763549805,
+ "test_acc": 0.1123,
+ "lyapunov": null,
+ "grad_norm": 0.6406489877650078,
+ "grad_max_sv": 0.23017469234764576,
+ "grad_min_sv": 1.1906818318807578e-08,
+ "grad_condition": 37789807.4961655,
+ "lr": 0.0,
+ "time_sec": 49.65584897994995
+ }
+ ],
+ "16": [
+ {
+ "epoch": 1,
+ "train_loss": 5.089254416656495,
+ "train_acc": 0.01344,
+ "test_loss": 4.870831555175781,
+ "test_acc": 0.01,
+ "lyapunov": null,
+ "grad_norm": 5.582063459208639,
+ "grad_max_sv": 5.0306542873382565,
+ "grad_min_sv": 8.441757832766683e-08,
+ "grad_condition": 74707534.78681344,
+ "lr": 0.0009998903417374227,
+ "time_sec": 66.70097637176514
+ },
+ {
+ "epoch": 2,
+ "train_loss": 4.736304296569824,
+ "train_acc": 0.02172,
+ "test_loss": 4.92340059890747,
+ "test_acc": 0.01,
+ "lyapunov": null,
+ "grad_norm": 4.087296772772229,
+ "grad_max_sv": 3.672157108783722,
+ "grad_min_sv": 6.109624839933935e-08,
+ "grad_condition": 230714811.36310124,
+ "lr": 0.0009995614150494292,
+ "time_sec": 66.83215641975403
+ },
+ {
+ "epoch": 3,
+ "train_loss": 4.52685978515625,
+ "train_acc": 0.03204,
+ "test_loss": 5.045831031799317,
+ "test_acc": 0.0094,
+ "lyapunov": null,
+ "grad_norm": 3.1470044543912175,
+ "grad_max_sv": 2.6447540044784548,
+ "grad_min_sv": 4.639755384339139e-08,
+ "grad_condition": 65625701.84585605,
+ "lr": 0.0009990133642141358,
+ "time_sec": 66.70765495300293
+ },
+ {
+ "epoch": 4,
+ "train_loss": 4.371717319641113,
+ "train_acc": 0.04112,
+ "test_loss": 4.993129699707032,
+ "test_acc": 0.0115,
+ "lyapunov": null,
+ "grad_norm": 2.5123688948843395,
+ "grad_max_sv": 2.1027904629707335,
+ "grad_min_sv": 3.615837387664633e-08,
+ "grad_condition": 418817692.03399765,
+ "lr": 0.0009982464296247522,
+ "time_sec": 66.70319509506226
+ },
+ {
+ "epoch": 5,
+ "train_loss": 4.27407361251831,
+ "train_acc": 0.0488,
+ "test_loss": 5.161634465789795,
+ "test_acc": 0.0119,
+ "lyapunov": null,
+ "grad_norm": 1.9573801826064445,
+ "grad_max_sv": 1.613087645173073,
+ "grad_min_sv": 2.8529539808364034e-08,
+ "grad_condition": 62747668.20627429,
+ "lr": 0.0009972609476841367,
+ "time_sec": 66.74726390838623
+ },
+ {
+ "epoch": 6,
+ "train_loss": 4.183251854553222,
+ "train_acc": 0.05812,
+ "test_loss": 5.447854755401611,
+ "test_acc": 0.0093,
+ "lyapunov": null,
+ "grad_norm": 1.436449079599314,
+ "grad_max_sv": 1.0459295481443405,
+ "grad_min_sv": 2.0654144772258576e-08,
+ "grad_condition": 94732574.16372415,
+ "lr": 0.000996057350657239,
+ "time_sec": 66.68073081970215
+ },
+ {
+ "epoch": 7,
+ "train_loss": 4.103355536193848,
+ "train_acc": 0.06872,
+ "test_loss": 5.544150679016114,
+ "test_acc": 0.0124,
+ "lyapunov": null,
+ "grad_norm": 1.082624040556548,
+ "grad_max_sv": 0.678101472556591,
+ "grad_min_sv": 1.6660088839048904e-08,
+ "grad_condition": 49338508.46283151,
+ "lr": 0.000994636166481494,
+ "time_sec": 66.77410340309143
+ },
+ {
+ "epoch": 8,
+ "train_loss": 4.040529095458984,
+ "train_acc": 0.07876,
+ "test_loss": 5.577163777160645,
+ "test_acc": 0.0172,
+ "lyapunov": null,
+ "grad_norm": 0.963869121683512,
+ "grad_max_sv": 0.5578698106110096,
+ "grad_min_sv": 1.4817374840991882e-08,
+ "grad_condition": 46172185.25999212,
+ "lr": 0.0009929980185352525,
+ "time_sec": 66.7442455291748
+ },
+ {
+ "epoch": 9,
+ "train_loss": 3.999490645446777,
+ "train_acc": 0.0856,
+ "test_loss": 5.472281336975097,
+ "test_acc": 0.0116,
+ "lyapunov": null,
+ "grad_norm": 0.9198022107734598,
+ "grad_max_sv": 0.5003849364817142,
+ "grad_min_sv": 1.3862486752946878e-08,
+ "grad_condition": 137028895.09887612,
+ "lr": 0.0009911436253643444,
+ "time_sec": 66.71199488639832
+ },
+ {
+ "epoch": 10,
+ "train_loss": 3.9641557629394533,
+ "train_acc": 0.09124,
+ "test_loss": 5.43024553604126,
+ "test_acc": 0.0112,
+ "lyapunov": null,
+ "grad_norm": 0.8539816540258655,
+ "grad_max_sv": 0.4397390566766262,
+ "grad_min_sv": 1.3177782898221579e-08,
+ "grad_condition": 50953468.3517745,
+ "lr": 0.0009890738003669028,
+ "time_sec": 66.71694684028625
+ },
+ {
+ "epoch": 11,
+ "train_loss": 3.9142907052612306,
+ "train_acc": 0.09788,
+ "test_loss": 5.24972756652832,
+ "test_acc": 0.0174,
+ "lyapunov": null,
+ "grad_norm": 0.8303589651826888,
+ "grad_max_sv": 0.4246540553867817,
+ "grad_min_sv": 1.288730961390705e-08,
+ "grad_condition": 88294678.08247125,
+ "lr": 0.00098678945143658,
+ "time_sec": 66.70689487457275
+ },
+ {
+ "epoch": 12,
+ "train_loss": 3.881778168411255,
+ "train_acc": 0.1037,
+ "test_loss": 5.765969756317139,
+ "test_acc": 0.0186,
+ "lyapunov": null,
+ "grad_norm": 0.7855031029198277,
+ "grad_max_sv": 0.3756070680916309,
+ "grad_min_sv": 1.2611303298881715e-08,
+ "grad_condition": 36786532.210794725,
+ "lr": 0.0009842915805643154,
+ "time_sec": 66.73540306091309
+ },
+ {
+ "epoch": 13,
+ "train_loss": 3.8490214154815674,
+ "train_acc": 0.1068,
+ "test_loss": 5.832162282562256,
+ "test_acc": 0.0138,
+ "lyapunov": null,
+ "grad_norm": 0.7681061932199776,
+ "grad_max_sv": 0.3604050487279892,
+ "grad_min_sv": 1.2243067453593382e-08,
+ "grad_condition": 131143000.26933214,
+ "lr": 0.000981581283398829,
+ "time_sec": 66.73431468009949
+ },
+ {
+ "epoch": 14,
+ "train_loss": 3.828877674636841,
+ "train_acc": 0.11234,
+ "test_loss": 6.293205305480957,
+ "test_acc": 0.0134,
+ "lyapunov": null,
+ "grad_norm": 0.7460407539013362,
+ "grad_max_sv": 0.34510768875479697,
+ "grad_min_sv": 1.1813573212726692e-08,
+ "grad_condition": 49629148.15911349,
+ "lr": 0.0009786597487660333,
+ "time_sec": 66.77479386329651
+ },
+ {
+ "epoch": 15,
+ "train_loss": 3.803487832107544,
+ "train_acc": 0.1159,
+ "test_loss": 6.4087516273498535,
+ "test_acc": 0.013,
+ "lyapunov": null,
+ "grad_norm": 0.716379034773642,
+ "grad_max_sv": 0.3261814657598734,
+ "grad_min_sv": 1.1572917107960378e-08,
+ "grad_condition": 31644703.4401185,
+ "lr": 0.0009755282581475766,
+ "time_sec": 66.73083448410034
+ },
+ {
+ "epoch": 16,
+ "train_loss": 3.7821172668457033,
+ "train_acc": 0.11904,
+ "test_loss": 6.406122239685058,
+ "test_acc": 0.0123,
+ "lyapunov": null,
+ "grad_norm": 0.697749546532161,
+ "grad_max_sv": 0.31582852490246294,
+ "grad_min_sv": 1.1393312793206434e-08,
+ "grad_condition": 39132519.74005551,
+ "lr": 0.0009721881851187403,
+ "time_sec": 66.74327826499939
+ },
+ {
+ "epoch": 17,
+ "train_loss": 3.7480180199432374,
+ "train_acc": 0.12526,
+ "test_loss": 6.8633532814025875,
+ "test_acc": 0.0132,
+ "lyapunov": null,
+ "grad_norm": 0.6758633251362415,
+ "grad_max_sv": 0.2994280070066452,
+ "grad_min_sv": 1.1069095015581176e-08,
+ "grad_condition": 36563832.03358241,
+ "lr": 0.0009686409947459456,
+ "time_sec": 66.76521873474121
+ },
+ {
+ "epoch": 18,
+ "train_loss": 3.730831000213623,
+ "train_acc": 0.12792,
+ "test_loss": 6.246407075500488,
+ "test_acc": 0.0177,
+ "lyapunov": null,
+ "grad_norm": 0.664831990265232,
+ "grad_max_sv": 0.2994547080248594,
+ "grad_min_sv": 1.0997234457625626e-08,
+ "grad_condition": 122736750.78260681,
+ "lr": 0.0009648882429441254,
+ "time_sec": 66.71729445457458
+ },
+ {
+ "epoch": 19,
+ "train_loss": 3.716553072052002,
+ "train_acc": 0.12942,
+ "test_loss": 5.873876965332031,
+ "test_acc": 0.0149,
+ "lyapunov": null,
+ "grad_norm": 0.6518241757841252,
+ "grad_max_sv": 0.29539270177483556,
+ "grad_min_sv": 1.0741561572852331e-08,
+ "grad_condition": 49669322.25294405,
+ "lr": 0.00096093157579425,
+ "time_sec": 66.81875944137573
+ },
+ {
+ "epoch": 20,
+ "train_loss": 3.6975706172180174,
+ "train_acc": 0.13298,
+ "test_loss": 6.400744886779785,
+ "test_acc": 0.0155,
+ "lyapunov": null,
+ "grad_norm": 0.6347864002121714,
+ "grad_max_sv": 0.28284979946911337,
+ "grad_min_sv": 1.0701284272607303e-08,
+ "grad_condition": 30013146.4819826,
+ "lr": 0.0009567727288213001,
+ "time_sec": 66.8477098941803
+ },
+ {
+ "epoch": 21,
+ "train_loss": 3.673498316040039,
+ "train_acc": 0.13564,
+ "test_loss": 6.160238801574707,
+ "test_acc": 0.0204,
+ "lyapunov": null,
+ "grad_norm": 0.6252581472584972,
+ "grad_max_sv": 0.27260397262871267,
+ "grad_min_sv": 1.0594542484282377e-08,
+ "grad_condition": 46350413.24314589,
+ "lr": 0.0009524135262330095,
+ "time_sec": 66.72814178466797
+ },
+ {
+ "epoch": 22,
+ "train_loss": 3.654527678833008,
+ "train_acc": 0.1393,
+ "test_loss": 6.9474281982421875,
+ "test_acc": 0.0176,
+ "lyapunov": null,
+ "grad_norm": 0.6149063083720292,
+ "grad_max_sv": 0.26224171184003353,
+ "grad_min_sv": 1.035294387718988e-08,
+ "grad_condition": 32282705.350815333,
+ "lr": 0.0009478558801197061,
+ "time_sec": 66.82811260223389
+ },
+ {
+ "epoch": 23,
+ "train_loss": 3.6450364729309084,
+ "train_acc": 0.14028,
+ "test_loss": 7.2393467880249025,
+ "test_acc": 0.0127,
+ "lyapunov": null,
+ "grad_norm": 0.6067467053692205,
+ "grad_max_sv": 0.26614573895931243,
+ "grad_min_sv": 1.0267544686692886e-08,
+ "grad_condition": 28213061.075003404,
+ "lr": 0.000943101789615607,
+ "time_sec": 66.74721336364746
+ },
+ {
+ "epoch": 24,
+ "train_loss": 3.623104200592041,
+ "train_acc": 0.14594,
+ "test_loss": 6.526107063293457,
+ "test_acc": 0.0187,
+ "lyapunov": null,
+ "grad_norm": 0.5980858749774747,
+ "grad_max_sv": 0.25203392654657364,
+ "grad_min_sv": 1.0098680717357534e-08,
+ "grad_condition": 50563247.00258337,
+ "lr": 0.0009381533400219313,
+ "time_sec": 66.77076554298401
+ },
+ {
+ "epoch": 25,
+ "train_loss": 3.6136645338439943,
+ "train_acc": 0.14728,
+ "test_loss": 7.030907647705078,
+ "test_acc": 0.0182,
+ "lyapunov": null,
+ "grad_norm": 0.594016587561951,
+ "grad_max_sv": 0.25378315448760985,
+ "grad_min_sv": 9.976338428627219e-09,
+ "grad_condition": 72065195.62747766,
+ "lr": 0.0009330127018922189,
+ "time_sec": 66.78083634376526
+ },
+ {
+ "epoch": 26,
+ "train_loss": 3.5951533477020265,
+ "train_acc": 0.15,
+ "test_loss": 6.8098891067504885,
+ "test_acc": 0.0193,
+ "lyapunov": null,
+ "grad_norm": 0.5888833643522708,
+ "grad_max_sv": 0.24365438856184482,
+ "grad_min_sv": 9.933017187935267e-09,
+ "grad_condition": 44149369.91233202,
+ "lr": 0.000927682130080253,
+ "time_sec": 66.72774887084961
+ },
+ {
+ "epoch": 27,
+ "train_loss": 3.5870719739532473,
+ "train_acc": 0.15012,
+ "test_loss": 6.188968405151368,
+ "test_acc": 0.0198,
+ "lyapunov": null,
+ "grad_norm": 0.5778870286561091,
+ "grad_max_sv": 0.23904258161783218,
+ "grad_min_sv": 9.864321945385335e-09,
+ "grad_condition": 29413784.94482057,
+ "lr": 0.0009221639627510072,
+ "time_sec": 66.7466390132904
+ },
+ {
+ "epoch": 28,
+ "train_loss": 3.5677108099365236,
+ "train_acc": 0.15438,
+ "test_loss": 7.111977198028565,
+ "test_acc": 0.0186,
+ "lyapunov": null,
+ "grad_norm": 0.565332521044754,
+ "grad_max_sv": 0.22653766870498657,
+ "grad_min_sv": 9.587734812674387e-09,
+ "grad_condition": 61781100.03898337,
+ "lr": 0.0009164606203550494,
+ "time_sec": 66.74424004554749
+ },
+ {
+ "epoch": 29,
+ "train_loss": 3.5525446216583254,
+ "train_acc": 0.1561,
+ "test_loss": 6.844758932495117,
+ "test_acc": 0.0209,
+ "lyapunov": null,
+ "grad_norm": 0.5709459777275144,
+ "grad_max_sv": 0.22716681994497775,
+ "grad_min_sv": 9.63618568827762e-09,
+ "grad_condition": 26044218.51829529,
+ "lr": 0.0009105746045668516,
+ "time_sec": 66.73790216445923
+ },
+ {
+ "epoch": 30,
+ "train_loss": 3.5511199297332765,
+ "train_acc": 0.15632,
+ "test_loss": 6.829617092895508,
+ "test_acc": 0.0179,
+ "lyapunov": null,
+ "grad_norm": 0.5599177583176913,
+ "grad_max_sv": 0.22315906584262848,
+ "grad_min_sv": 9.481845958392298e-09,
+ "grad_condition": 31696446.039096247,
+ "lr": 0.0009045084971874733,
+ "time_sec": 66.74309277534485
+ },
+ {
+ "epoch": 31,
+ "train_loss": 3.5346223778533936,
+ "train_acc": 0.15964,
+ "test_loss": 7.171929656982422,
+ "test_acc": 0.0181,
+ "lyapunov": null,
+ "grad_norm": 0.5560980115082016,
+ "grad_max_sv": 0.22190811820328235,
+ "grad_min_sv": 9.472099816998369e-09,
+ "grad_condition": 65999783.19253375,
+ "lr": 0.0008982649590120977,
+ "time_sec": 66.72736811637878
+ },
+ {
+ "epoch": 32,
+ "train_loss": 3.523619603424072,
+ "train_acc": 0.16298,
+ "test_loss": 7.11264291381836,
+ "test_acc": 0.0196,
+ "lyapunov": null,
+ "grad_norm": 0.5484008571230936,
+ "grad_max_sv": 0.21031202785670758,
+ "grad_min_sv": 9.324677128358382e-09,
+ "grad_condition": 59831756.702754,
+ "lr": 0.0008918467286629196,
+ "time_sec": 66.70681715011597
+ },
+ {
+ "epoch": 33,
+ "train_loss": 3.503953924026489,
+ "train_acc": 0.1662,
+ "test_loss": 6.848249008178711,
+ "test_acc": 0.0242,
+ "lyapunov": null,
+ "grad_norm": 0.5416204323895276,
+ "grad_max_sv": 0.2181798741221428,
+ "grad_min_sv": 9.399793365156769e-09,
+ "grad_condition": 389136802.1825175,
+ "lr": 0.0008852566213878943,
+ "time_sec": 66.73786091804504
+ },
+ {
+ "epoch": 34,
+ "train_loss": 3.505652629928589,
+ "train_acc": 0.16502,
+ "test_loss": 6.877189469909668,
+ "test_acc": 0.02,
+ "lyapunov": null,
+ "grad_norm": 0.5355113980631458,
+ "grad_max_sv": 0.20969012342393398,
+ "grad_min_sv": 9.270577998321538e-09,
+ "grad_condition": 31525454.84069126,
+ "lr": 0.000878497527825878,
+ "time_sec": 66.72686457633972
+ },
+ {
+ "epoch": 35,
+ "train_loss": 3.486978895339966,
+ "train_acc": 0.16714,
+ "test_loss": 7.1552359481811525,
+ "test_acc": 0.0172,
+ "lyapunov": null,
+ "grad_norm": 0.5346080374847578,
+ "grad_max_sv": 0.20298720821738242,
+ "grad_min_sv": 9.306896420202548e-09,
+ "grad_condition": 25441508.50613912,
+ "lr": 0.000871572412738697,
+ "time_sec": 66.75551271438599
+ },
+ {
+ "epoch": 36,
+ "train_loss": 3.479604592208862,
+ "train_acc": 0.16902,
+ "test_loss": 6.844674809265137,
+ "test_acc": 0.0223,
+ "lyapunov": null,
+ "grad_norm": 0.5311517334543933,
+ "grad_max_sv": 0.20205551721155643,
+ "grad_min_sv": 9.200601613218452e-09,
+ "grad_condition": 45450108.39040236,
+ "lr": 0.0008644843137107055,
+ "time_sec": 66.7082417011261
+ },
+ {
+ "epoch": 37,
+ "train_loss": 3.4750630870819093,
+ "train_acc": 0.16898,
+ "test_loss": 7.165343771362305,
+ "test_acc": 0.0171,
+ "lyapunov": null,
+ "grad_norm": 0.5255800840531358,
+ "grad_max_sv": 0.19590781554579734,
+ "grad_min_sv": 9.155419039910683e-09,
+ "grad_condition": 108339245.17679186,
+ "lr": 0.0008572363398164014,
+ "time_sec": 66.71217584609985
+ },
+ {
+ "epoch": 38,
+ "train_loss": 3.461921478424072,
+ "train_acc": 0.17176,
+ "test_loss": 7.6983903167724606,
+ "test_acc": 0.0204,
+ "lyapunov": null,
+ "grad_norm": 0.5291599359124736,
+ "grad_max_sv": 0.19806304536759853,
+ "grad_min_sv": 9.252919158653227e-09,
+ "grad_condition": 26129114.857841287,
+ "lr": 0.0008498316702566826,
+ "time_sec": 66.83607125282288
+ },
+ {
+ "epoch": 39,
+ "train_loss": 3.4502412219238283,
+ "train_acc": 0.1729,
+ "test_loss": 6.8047522277832035,
+ "test_acc": 0.0213,
+ "lyapunov": null,
+ "grad_norm": 0.5281639901017625,
+ "grad_max_sv": 0.20096433460712432,
+ "grad_min_sv": 9.085016680621116e-09,
+ "grad_condition": 33958186.51443162,
+ "lr": 0.0008422735529643442,
+ "time_sec": 66.73851490020752
+ },
+ {
+ "epoch": 40,
+ "train_loss": 3.4376924714660646,
+ "train_acc": 0.17616,
+ "test_loss": 7.263092966461182,
+ "test_acc": 0.0182,
+ "lyapunov": null,
+ "grad_norm": 0.5216932066323713,
+ "grad_max_sv": 0.19504240863025188,
+ "grad_min_sv": 9.154586153026223e-09,
+ "grad_condition": 25458573.387380652,
+ "lr": 0.0008345653031794289,
+ "time_sec": 66.7052755355835
+ },
+ {
+ "epoch": 41,
+ "train_loss": 3.4279933405303957,
+ "train_acc": 0.17836,
+ "test_loss": 6.396369320678711,
+ "test_acc": 0.0195,
+ "lyapunov": null,
+ "grad_norm": 0.5194410647845549,
+ "grad_max_sv": 0.19078941717743875,
+ "grad_min_sv": 9.012956635884306e-09,
+ "grad_condition": 42363604.716461524,
+ "lr": 0.0008267103019950526,
+ "time_sec": 66.72479486465454
+ },
+ {
+ "epoch": 42,
+ "train_loss": 3.4256856929016113,
+ "train_acc": 0.17732,
+ "test_loss": 6.679870991516113,
+ "test_acc": 0.0212,
+ "lyapunov": null,
+ "grad_norm": 0.5198265520764738,
+ "grad_max_sv": 0.19169757179915906,
+ "grad_min_sv": 9.036233127035497e-09,
+ "grad_condition": 51260505.579239644,
+ "lr": 0.0008187119948743447,
+ "time_sec": 66.75225281715393
+ },
+ {
+ "epoch": 43,
+ "train_loss": 3.411117221832275,
+ "train_acc": 0.18158,
+ "test_loss": 7.357481904602051,
+ "test_acc": 0.0185,
+ "lyapunov": null,
+ "grad_norm": 0.5156740849780826,
+ "grad_max_sv": 0.19417562745511532,
+ "grad_min_sv": 9.037307471815303e-09,
+ "grad_condition": 35283510.30299447,
+ "lr": 0.000810573890139155,
+ "time_sec": 66.72709918022156
+ },
+ {
+ "epoch": 44,
+ "train_loss": 3.4085953338623045,
+ "train_acc": 0.18096,
+ "test_loss": 7.635249890899658,
+ "test_acc": 0.0161,
+ "lyapunov": null,
+ "grad_norm": 0.5119612982206426,
+ "grad_max_sv": 0.18738919235765933,
+ "grad_min_sv": 8.878314214366689e-09,
+ "grad_condition": 31365951.59678828,
+ "lr": 0.0008022995574311873,
+ "time_sec": 66.72823333740234
+ },
+ {
+ "epoch": 45,
+ "train_loss": 3.391282188873291,
+ "train_acc": 0.18358,
+ "test_loss": 7.057773623657226,
+ "test_acc": 0.0215,
+ "lyapunov": null,
+ "grad_norm": 0.512636753960722,
+ "grad_max_sv": 0.18591308295726777,
+ "grad_min_sv": 8.905265155845221e-09,
+ "grad_condition": 34037092.10974729,
+ "lr": 0.0007938926261462363,
+ "time_sec": 66.75207853317261
+ },
+ {
+ "epoch": 46,
+ "train_loss": 3.385137359466553,
+ "train_acc": 0.18694,
+ "test_loss": 7.400888244628907,
+ "test_acc": 0.0212,
+ "lyapunov": null,
+ "grad_norm": 0.5082656505289807,
+ "grad_max_sv": 0.18733446709811688,
+ "grad_min_sv": 8.893193696474926e-09,
+ "grad_condition": 125851280.80010274,
+ "lr": 0.0007853567838422158,
+ "time_sec": 66.7163679599762
+ },
+ {
+ "epoch": 47,
+ "train_loss": 3.376342626800537,
+ "train_acc": 0.18838,
+ "test_loss": 7.475112818908691,
+ "test_acc": 0.0175,
+ "lyapunov": null,
+ "grad_norm": 0.5045706953392911,
+ "grad_max_sv": 0.18063193671405314,
+ "grad_min_sv": 8.950101182403359e-09,
+ "grad_condition": 22625503.611506984,
+ "lr": 0.0007766957746216719,
+ "time_sec": 66.7100522518158
+ },
+ {
+ "epoch": 48,
+ "train_loss": 3.3649324946594237,
+ "train_acc": 0.18694,
+ "test_loss": 8.045938752746583,
+ "test_acc": 0.0189,
+ "lyapunov": null,
+ "grad_norm": 0.5007866825544302,
+ "grad_max_sv": 0.1830794021487236,
+ "grad_min_sv": 8.805358707453248e-09,
+ "grad_condition": 27558131.426934887,
+ "lr": 0.0007679133974894982,
+ "time_sec": 66.70468735694885
+ },
+ {
+ "epoch": 49,
+ "train_loss": 3.3610028453063965,
+ "train_acc": 0.1888,
+ "test_loss": 7.112044483947754,
+ "test_acc": 0.0233,
+ "lyapunov": null,
+ "grad_norm": 0.5007184914478864,
+ "grad_max_sv": 0.18336209803819656,
+ "grad_min_sv": 9.024269038288013e-09,
+ "grad_condition": 33518235.006607275,
+ "lr": 0.000759013504686565,
+ "time_sec": 66.7611026763916
+ },
+ {
+ "epoch": 50,
+ "train_loss": 3.3484571326446533,
+ "train_acc": 0.1906,
+ "test_loss": 7.519181715393066,
+ "test_acc": 0.0209,
+ "lyapunov": null,
+ "grad_norm": 0.5018491559425493,
+ "grad_max_sv": 0.18028105311095716,
+ "grad_min_sv": 8.925991949043643e-09,
+ "grad_condition": 33524852.83647134,
+ "lr": 0.0007499999999999998,
+ "time_sec": 66.76505136489868
+ },
+ {
+ "epoch": 51,
+ "train_loss": 3.3410891053009033,
+ "train_acc": 0.1921,
+ "test_loss": 7.056560147094727,
+ "test_acc": 0.0249,
+ "lyapunov": null,
+ "grad_norm": 0.4996656726107064,
+ "grad_max_sv": 0.17895969636738301,
+ "grad_min_sv": 8.92833956489536e-09,
+ "grad_condition": 30339744.194165338,
+ "lr": 0.0007408768370508575,
+ "time_sec": 66.76679730415344
+ },
+ {
+ "epoch": 52,
+ "train_loss": 3.329959710845947,
+ "train_acc": 0.19464,
+ "test_loss": 7.733986283874512,
+ "test_acc": 0.02,
+ "lyapunov": null,
+ "grad_norm": 0.49662871046839857,
+ "grad_max_sv": 0.17035150155425072,
+ "grad_min_sv": 8.920055267341853e-09,
+ "grad_condition": 39560292.40680326,
+ "lr": 0.0007316480175599307,
+ "time_sec": 66.73509478569031
+ },
+ {
+ "epoch": 53,
+ "train_loss": 3.328139169998169,
+ "train_acc": 0.1964,
+ "test_loss": 8.010476211547852,
+ "test_acc": 0.0211,
+ "lyapunov": null,
+ "grad_norm": 0.4958475219811756,
+ "grad_max_sv": 0.17490845173597336,
+ "grad_min_sv": 8.784460091802727e-09,
+ "grad_condition": 71860322.54887062,
+ "lr": 0.0007223175895924635,
+ "time_sec": 66.72841596603394
+ },
+ {
+ "epoch": 54,
+ "train_loss": 3.3162127281188964,
+ "train_acc": 0.19728,
+ "test_loss": 7.010640211486816,
+ "test_acc": 0.0247,
+ "lyapunov": null,
+ "grad_norm": 0.4961833449463003,
+ "grad_max_sv": 0.17223588079214097,
+ "grad_min_sv": 8.753281316442596e-09,
+ "grad_condition": 22715187.33107339,
+ "lr": 0.0007128896457825361,
+ "time_sec": 66.72108912467957
+ },
+ {
+ "epoch": 55,
+ "train_loss": 3.3105887175750732,
+ "train_acc": 0.1977,
+ "test_loss": 8.294336575317383,
+ "test_acc": 0.0177,
+ "lyapunov": null,
+ "grad_norm": 0.4959871213831781,
+ "grad_max_sv": 0.17211879640817643,
+ "grad_min_sv": 8.85512002890554e-09,
+ "grad_condition": 22832904.69554911,
+ "lr": 0.0007033683215378998,
+ "time_sec": 66.77683353424072
+ },
+ {
+ "epoch": 56,
+ "train_loss": 3.3091206261444093,
+ "train_acc": 0.19822,
+ "test_loss": 6.872190827941894,
+ "test_acc": 0.0233,
+ "lyapunov": null,
+ "grad_norm": 0.4968424527269832,
+ "grad_max_sv": 0.16929374635219574,
+ "grad_min_sv": 8.852659438840504e-09,
+ "grad_condition": 21482011.311691545,
+ "lr": 0.0006937577932260512,
+ "time_sec": 66.7394802570343
+ },
+ {
+ "epoch": 57,
+ "train_loss": 3.2911807606506347,
+ "train_acc": 0.20104,
+ "test_loss": 6.781019482421875,
+ "test_acc": 0.0266,
+ "lyapunov": null,
+ "grad_norm": 0.49806961864225907,
+ "grad_max_sv": 0.17269197143614293,
+ "grad_min_sv": 9.028358619045385e-09,
+ "grad_condition": 21860182.81813491,
+ "lr": 0.0006840622763423388,
+ "time_sec": 66.74213409423828
+ },
+ {
+ "epoch": 58,
+ "train_loss": 3.28923882019043,
+ "train_acc": 0.2009,
+ "test_loss": 7.48718016204834,
+ "test_acc": 0.0233,
+ "lyapunov": null,
+ "grad_norm": 0.497037583502488,
+ "grad_max_sv": 0.17720941305160523,
+ "grad_min_sv": 8.923951845540844e-09,
+ "grad_condition": 25638959.340645056,
+ "lr": 0.0006742860236609073,
+ "time_sec": 66.70864987373352
+ },
+ {
+ "epoch": 59,
+ "train_loss": 3.288974278411865,
+ "train_acc": 0.2022,
+ "test_loss": 6.711775099182129,
+ "test_acc": 0.0288,
+ "lyapunov": null,
+ "grad_norm": 0.5006739014854031,
+ "grad_max_sv": 0.1799727737903595,
+ "grad_min_sv": 8.922615390982714e-09,
+ "grad_condition": 22962596.945499133,
+ "lr": 0.0006644333233692913,
+ "time_sec": 66.72898769378662
+ },
+ {
+ "epoch": 60,
+ "train_loss": 3.283515991897583,
+ "train_acc": 0.20374,
+ "test_loss": 7.436810195922852,
+ "test_acc": 0.0217,
+ "lyapunov": null,
+ "grad_norm": 0.4970314759637393,
+ "grad_max_sv": 0.1713873755186796,
+ "grad_min_sv": 8.852956717708694e-09,
+ "grad_condition": 21460924.515540235,
+ "lr": 0.0006545084971874734,
+ "time_sec": 66.77793312072754
+ },
+ {
+ "epoch": 61,
+ "train_loss": 3.2660218312072753,
+ "train_acc": 0.2052,
+ "test_loss": 7.1023060356140135,
+ "test_acc": 0.0237,
+ "lyapunov": null,
+ "grad_norm": 0.49642283106124174,
+ "grad_max_sv": 0.17171172685921193,
+ "grad_min_sv": 9.03237155625014e-09,
+ "grad_condition": 23554914.711565603,
+ "lr": 0.0006445158984722354,
+ "time_sec": 66.71418523788452
+ },
+ {
+ "epoch": 62,
+ "train_loss": 3.254552359466553,
+ "train_acc": 0.2084,
+ "test_loss": 7.483150309753418,
+ "test_acc": 0.0225,
+ "lyapunov": null,
+ "grad_norm": 0.4960786681631791,
+ "grad_max_sv": 0.1668458305299282,
+ "grad_min_sv": 8.818685695577421e-09,
+ "grad_condition": 74094011.9951904,
+ "lr": 0.0006344599103076324,
+ "time_sec": 66.70579290390015
+ },
+ {
+ "epoch": 63,
+ "train_loss": 3.2479764625549317,
+ "train_acc": 0.20702,
+ "test_loss": 7.495381002807617,
+ "test_acc": 0.0243,
+ "lyapunov": null,
+ "grad_norm": 0.4917077399114027,
+ "grad_max_sv": 0.16495948433876037,
+ "grad_min_sv": 8.864074795694732e-09,
+ "grad_condition": 30857102.41845674,
+ "lr": 0.0006243449435824269,
+ "time_sec": 66.72497200965881
+ },
+ {
+ "epoch": 64,
+ "train_loss": 3.245808661117554,
+ "train_acc": 0.20704,
+ "test_loss": 6.5149994140625,
+ "test_acc": 0.0299,
+ "lyapunov": null,
+ "grad_norm": 0.4942308484852371,
+ "grad_max_sv": 0.16808778569102287,
+ "grad_min_sv": 8.905879750331636e-09,
+ "grad_condition": 21297665.020826895,
+ "lr": 0.0006141754350553275,
+ "time_sec": 66.71531987190247
+ },
+ {
+ "epoch": 65,
+ "train_loss": 3.2359812786102293,
+ "train_acc": 0.20964,
+ "test_loss": 6.7083621681213375,
+ "test_acc": 0.0257,
+ "lyapunov": null,
+ "grad_norm": 0.4924300564127143,
+ "grad_max_sv": 0.1668924294412136,
+ "grad_min_sv": 8.814785660855167e-09,
+ "grad_condition": 387068362.7974197,
+ "lr": 0.0006039558454088793,
+ "time_sec": 66.739919424057
+ },
+ {
+ "epoch": 66,
+ "train_loss": 3.2231747630310057,
+ "train_acc": 0.21288,
+ "test_loss": 6.6462861267089846,
+ "test_acc": 0.0258,
+ "lyapunov": null,
+ "grad_norm": 0.49278283649554394,
+ "grad_max_sv": 0.16672560423612595,
+ "grad_min_sv": 8.910612160628607e-09,
+ "grad_condition": 23460863.699399397,
+ "lr": 0.000593690657292862,
+ "time_sec": 66.73168134689331
+ },
+ {
+ "epoch": 67,
+ "train_loss": 3.2156623792266847,
+ "train_acc": 0.21342,
+ "test_loss": 7.029375877380371,
+ "test_acc": 0.0223,
+ "lyapunov": null,
+ "grad_norm": 0.4909443834963243,
+ "grad_max_sv": 0.16597550213336945,
+ "grad_min_sv": 8.912085689566362e-09,
+ "grad_condition": 31291994.15683285,
+ "lr": 0.0005833843733580507,
+ "time_sec": 66.72268962860107
+ },
+ {
+ "epoch": 68,
+ "train_loss": 3.2102099297332765,
+ "train_acc": 0.21536,
+ "test_loss": 6.8582941429138184,
+ "test_acc": 0.0244,
+ "lyapunov": null,
+ "grad_norm": 0.49321037808878027,
+ "grad_max_sv": 0.16992229372262954,
+ "grad_min_sv": 8.80631389199582e-09,
+ "grad_condition": 129842817.14263825,
+ "lr": 0.0005730415142812054,
+ "time_sec": 66.73015308380127
+ },
+ {
+ "epoch": 69,
+ "train_loss": 3.2087192346191404,
+ "train_acc": 0.21692,
+ "test_loss": 6.703964881134033,
+ "test_acc": 0.0266,
+ "lyapunov": null,
+ "grad_norm": 0.4884522648005531,
+ "grad_max_sv": 0.16176489181816578,
+ "grad_min_sv": 8.772693779746099e-09,
+ "grad_condition": 26469955.870484192,
+ "lr": 0.0005626666167821517,
+ "time_sec": 66.71746468544006
+ },
+ {
+ "epoch": 70,
+ "train_loss": 3.195241547088623,
+ "train_acc": 0.21844,
+ "test_loss": 6.542587074279785,
+ "test_acc": 0.0284,
+ "lyapunov": null,
+ "grad_norm": 0.49091657002079947,
+ "grad_max_sv": 0.16242207810282708,
+ "grad_min_sv": 9.02578579792257e-09,
+ "grad_condition": 23591537.371170804,
+ "lr": 0.0005522642316338265,
+ "time_sec": 66.72597932815552
+ },
+ {
+ "epoch": 71,
+ "train_loss": 3.1896180830383303,
+ "train_acc": 0.21886,
+ "test_loss": 6.82057219543457,
+ "test_acc": 0.0261,
+ "lyapunov": null,
+ "grad_norm": 0.4892216781222015,
+ "grad_max_sv": 0.1621775720268488,
+ "grad_min_sv": 8.926039651857565e-09,
+ "grad_condition": 20890687.882442366,
+ "lr": 0.0005418389216661573,
+ "time_sec": 66.7145037651062
+ },
+ {
+ "epoch": 72,
+ "train_loss": 3.18413442276001,
+ "train_acc": 0.21908,
+ "test_loss": 7.1544591903686525,
+ "test_acc": 0.0243,
+ "lyapunov": null,
+ "grad_norm": 0.48870515357132727,
+ "grad_max_sv": 0.16475776992738247,
+ "grad_min_sv": 8.91442188816205e-09,
+ "grad_condition": 35365218.5794013,
+ "lr": 0.0005313952597646563,
+ "time_sec": 66.72212243080139
+ },
+ {
+ "epoch": 73,
+ "train_loss": 3.1829597901153566,
+ "train_acc": 0.21974,
+ "test_loss": 7.2174785011291505,
+ "test_acc": 0.0215,
+ "lyapunov": null,
+ "grad_norm": 0.4892142900976219,
+ "grad_max_sv": 0.16382574513554574,
+ "grad_min_sv": 8.810792702352264e-09,
+ "grad_condition": 2088135479.3673325,
+ "lr": 0.0005209378268645994,
+ "time_sec": 66.73431754112244
+ },
+ {
+ "epoch": 74,
+ "train_loss": 3.172711128463745,
+ "train_acc": 0.22268,
+ "test_loss": 7.406581823730469,
+ "test_acc": 0.0232,
+ "lyapunov": null,
+ "grad_norm": 0.48885933422631656,
+ "grad_max_sv": 0.1622017789632082,
+ "grad_min_sv": 8.900176362569568e-09,
+ "grad_condition": 22065867.848713316,
+ "lr": 0.0005104712099416781,
+ "time_sec": 66.76118803024292
+ },
+ {
+ "epoch": 75,
+ "train_loss": 3.1605979063415526,
+ "train_acc": 0.22268,
+ "test_loss": 7.909864106750488,
+ "test_acc": 0.0215,
+ "lyapunov": null,
+ "grad_norm": 0.4864315646638775,
+ "grad_max_sv": 0.16106058210134505,
+ "grad_min_sv": 8.83298489941231e-09,
+ "grad_condition": 46212562.907684386,
+ "lr": 0.0004999999999999996,
+ "time_sec": 66.70442318916321
+ },
+ {
+ "epoch": 76,
+ "train_loss": 3.1487682283020018,
+ "train_acc": 0.22692,
+ "test_loss": 7.801919015502929,
+ "test_acc": 0.0215,
+ "lyapunov": null,
+ "grad_norm": 0.49432790922941905,
+ "grad_max_sv": 0.1653361301869154,
+ "grad_min_sv": 9.004006756851979e-09,
+ "grad_condition": 21481137.43510855,
+ "lr": 0.0004895287900583212,
+ "time_sec": 66.72583270072937
+ },
+ {
+ "epoch": 77,
+ "train_loss": 3.150441154251099,
+ "train_acc": 0.22298,
+ "test_loss": 7.5658083923339845,
+ "test_acc": 0.0206,
+ "lyapunov": null,
+ "grad_norm": 0.4905609551233629,
+ "grad_max_sv": 0.16559089235961438,
+ "grad_min_sv": 9.02131503666137e-09,
+ "grad_condition": 20767700.255871035,
+ "lr": 0.0004790621731353997,
+ "time_sec": 66.69700527191162
+ },
+ {
+ "epoch": 78,
+ "train_loss": 3.1500933878326416,
+ "train_acc": 0.22786,
+ "test_loss": 7.626110935974121,
+ "test_acc": 0.0244,
+ "lyapunov": null,
+ "grad_norm": 0.4905443897236645,
+ "grad_max_sv": 0.16319101713597775,
+ "grad_min_sv": 8.856467318546501e-09,
+ "grad_condition": 30384641.86177106,
+ "lr": 0.000468604740235343,
+ "time_sec": 66.70938420295715
+ },
+ {
+ "epoch": 79,
+ "train_loss": 3.1403994177246095,
+ "train_acc": 0.22896,
+ "test_loss": 7.712996089172363,
+ "test_acc": 0.0224,
+ "lyapunov": null,
+ "grad_norm": 0.4915245764953966,
+ "grad_max_sv": 0.16383215487003328,
+ "grad_min_sv": 9.000386157198559e-09,
+ "grad_condition": 24292562.845880195,
+ "lr": 0.00045816107833384175,
+ "time_sec": 66.70869493484497
+ },
+ {
+ "epoch": 80,
+ "train_loss": 3.135038282623291,
+ "train_acc": 0.22664,
+ "test_loss": 7.267129122161865,
+ "test_acc": 0.0247,
+ "lyapunov": null,
+ "grad_norm": 0.49111047918715733,
+ "grad_max_sv": 0.1639216773211956,
+ "grad_min_sv": 8.921349751783367e-09,
+ "grad_condition": 420151306.09404176,
+ "lr": 0.0004477357683661729,
+ "time_sec": 66.7166097164154
+ },
+ {
+ "epoch": 81,
+ "train_loss": 3.1244947747802736,
+ "train_acc": 0.22956,
+ "test_loss": 7.662328411865234,
+ "test_acc": 0.0247,
+ "lyapunov": null,
+ "grad_norm": 0.49289166159918185,
+ "grad_max_sv": 0.16057575568556787,
+ "grad_min_sv": 9.007528779803043e-09,
+ "grad_condition": 25322164.642992593,
+ "lr": 0.00043733338321784746,
+ "time_sec": 66.70411825180054
+ },
+ {
+ "epoch": 82,
+ "train_loss": 3.1161900270080567,
+ "train_acc": 0.23102,
+ "test_loss": 6.92779616394043,
+ "test_acc": 0.0285,
+ "lyapunov": null,
+ "grad_norm": 0.49270870414948964,
+ "grad_max_sv": 0.1599017258733511,
+ "grad_min_sv": 9.11951086590701e-09,
+ "grad_condition": 20698906.206454754,
+ "lr": 0.0004269584857187939,
+ "time_sec": 66.70752501487732
+ },
+ {
+ "epoch": 83,
+ "train_loss": 3.117374754104614,
+ "train_acc": 0.23338,
+ "test_loss": 7.148474893188476,
+ "test_acc": 0.0281,
+ "lyapunov": null,
+ "grad_norm": 0.4925974195490984,
+ "grad_max_sv": 0.16150497682392598,
+ "grad_min_sv": 8.971566273219267e-09,
+ "grad_condition": 20007661.368726093,
+ "lr": 0.0004166156266419484,
+ "time_sec": 66.70796918869019
+ },
+ {
+ "epoch": 84,
+ "train_loss": 3.1047154219055177,
+ "train_acc": 0.23342,
+ "test_loss": 7.627574306488037,
+ "test_acc": 0.0234,
+ "lyapunov": null,
+ "grad_norm": 0.4921892080867045,
+ "grad_max_sv": 0.16364577710628508,
+ "grad_min_sv": 8.967278117277822e-09,
+ "grad_condition": 20465428.39487014,
+ "lr": 0.0004063093427071373,
+ "time_sec": 66.70926451683044
+ },
+ {
+ "epoch": 85,
+ "train_loss": 3.0953226109313965,
+ "train_acc": 0.23356,
+ "test_loss": 7.637861351776123,
+ "test_acc": 0.0254,
+ "lyapunov": null,
+ "grad_norm": 0.49401889904765806,
+ "grad_max_sv": 0.16418364495038987,
+ "grad_min_sv": 8.915860015990679e-09,
+ "grad_condition": 203043858.99741915,
+ "lr": 0.0003960441545911199,
+ "time_sec": 66.6929943561554
+ },
+ {
+ "epoch": 86,
+ "train_loss": 3.0932106770324705,
+ "train_acc": 0.23452,
+ "test_loss": 7.435467148590088,
+ "test_acc": 0.0248,
+ "lyapunov": null,
+ "grad_norm": 0.4934388084197917,
+ "grad_max_sv": 0.16211238466203212,
+ "grad_min_sv": 9.0381108895643e-09,
+ "grad_condition": 38210459.14289879,
+ "lr": 0.0003858245649446718,
+ "time_sec": 66.71461033821106
+ },
+ {
+ "epoch": 87,
+ "train_loss": 3.091542336883545,
+ "train_acc": 0.23574,
+ "test_loss": 7.27965379486084,
+ "test_acc": 0.0266,
+ "lyapunov": null,
+ "grad_norm": 0.49327307505927953,
+ "grad_max_sv": 0.1624306257814169,
+ "grad_min_sv": 9.051206378840603e-09,
+ "grad_condition": 19977131.887911893,
+ "lr": 0.00037565505641757235,
+ "time_sec": 66.7017343044281
+ },
+ {
+ "epoch": 88,
+ "train_loss": 3.0846370722961427,
+ "train_acc": 0.2367,
+ "test_loss": 7.714011827087402,
+ "test_acc": 0.0274,
+ "lyapunov": null,
+ "grad_norm": 0.49521950469943726,
+ "grad_max_sv": 0.16350008510053157,
+ "grad_min_sv": 9.132233064201855e-09,
+ "grad_condition": 20496153.697574906,
+ "lr": 0.00036554008969236695,
+ "time_sec": 66.80735445022583
+ },
+ {
+ "epoch": 89,
+ "train_loss": 3.067184111480713,
+ "train_acc": 0.23956,
+ "test_loss": 7.469543979644776,
+ "test_acc": 0.0274,
+ "lyapunov": null,
+ "grad_norm": 0.49450885750587337,
+ "grad_max_sv": 0.16215350292623043,
+ "grad_min_sv": 9.075074243122815e-09,
+ "grad_condition": 63145499.63971396,
+ "lr": 0.0003554841015277638,
+ "time_sec": 66.7019522190094
+ },
+ {
+ "epoch": 90,
+ "train_loss": 3.0696119786071776,
+ "train_acc": 0.23776,
+ "test_loss": 7.227960666656494,
+ "test_acc": 0.0281,
+ "lyapunov": null,
+ "grad_norm": 0.49496033151417024,
+ "grad_max_sv": 0.15985839106142521,
+ "grad_min_sv": 9.114914140302688e-09,
+ "grad_condition": 88232236.67419389,
+ "lr": 0.000345491502812526,
+ "time_sec": 66.71336770057678
+ },
+ {
+ "epoch": 91,
+ "train_loss": 3.0570466086578367,
+ "train_acc": 0.24112,
+ "test_loss": 7.087581924438476,
+ "test_acc": 0.0285,
+ "lyapunov": null,
+ "grad_norm": 0.49532470616490887,
+ "grad_max_sv": 0.16271125935018063,
+ "grad_min_sv": 9.14848334726548e-09,
+ "grad_condition": 28858228.725753903,
+ "lr": 0.0003355666766307081,
+ "time_sec": 66.71155142784119
+ },
+ {
+ "epoch": 92,
+ "train_loss": 3.060674235687256,
+ "train_acc": 0.24284,
+ "test_loss": 7.354493684387207,
+ "test_acc": 0.0281,
+ "lyapunov": null,
+ "grad_norm": 0.49422169257384346,
+ "grad_max_sv": 0.16212479658424855,
+ "grad_min_sv": 9.094859150515777e-09,
+ "grad_condition": 27013716.07646851,
+ "lr": 0.00032571397633909225,
+ "time_sec": 66.73360872268677
+ },
+ {
+ "epoch": 93,
+ "train_loss": 3.045851851577759,
+ "train_acc": 0.24666,
+ "test_loss": 6.961697528839111,
+ "test_acc": 0.0257,
+ "lyapunov": null,
+ "grad_norm": 0.4943781413484412,
+ "grad_max_sv": 0.15829392597079278,
+ "grad_min_sv": 9.1174124181026e-09,
+ "grad_condition": 24719922.26471028,
+ "lr": 0.00031593772365766094,
+ "time_sec": 66.72647047042847
+ },
+ {
+ "epoch": 94,
+ "train_loss": 3.0384512644958495,
+ "train_acc": 0.24492,
+ "test_loss": 7.376283264160156,
+ "test_acc": 0.028,
+ "lyapunov": null,
+ "grad_norm": 0.49582915049730736,
+ "grad_max_sv": 0.1624866124242544,
+ "grad_min_sv": 9.118276048341972e-09,
+ "grad_condition": 727643917.2657491,
+ "lr": 0.0003062422067739483,
+ "time_sec": 66.70089149475098
+ },
+ {
+ "epoch": 95,
+ "train_loss": 3.039133260345459,
+ "train_acc": 0.24476,
+ "test_loss": 7.406265617370606,
+ "test_acc": 0.0298,
+ "lyapunov": null,
+ "grad_norm": 0.4964727526376002,
+ "grad_max_sv": 0.15984426029026508,
+ "grad_min_sv": 9.0936182872009e-09,
+ "grad_condition": 53822276.22529755,
+ "lr": 0.00029663167846209965,
+ "time_sec": 66.71791744232178
+ },
+ {
+ "epoch": 96,
+ "train_loss": 3.0375169485473634,
+ "train_acc": 0.24388,
+ "test_loss": 7.3450915855407715,
+ "test_acc": 0.0244,
+ "lyapunov": null,
+ "grad_norm": 0.4980105941759735,
+ "grad_max_sv": 0.1639113176614046,
+ "grad_min_sv": 9.174823172204694e-09,
+ "grad_condition": 75847501.33547327,
+ "lr": 0.00028711035421746345,
+ "time_sec": 66.74349761009216
+ },
+ {
+ "epoch": 97,
+ "train_loss": 3.036133956604004,
+ "train_acc": 0.2481,
+ "test_loss": 7.577465545654297,
+ "test_acc": 0.0264,
+ "lyapunov": null,
+ "grad_norm": 0.4958252185119339,
+ "grad_max_sv": 0.16029710061848162,
+ "grad_min_sv": 8.978423951533366e-09,
+ "grad_condition": 19961795.980553128,
+ "lr": 0.00027768241040753615,
+ "time_sec": 66.72821807861328
+ },
+ {
+ "epoch": 98,
+ "train_loss": 3.021324711227417,
+ "train_acc": 0.25076,
+ "test_loss": 7.219669580841065,
+ "test_acc": 0.0303,
+ "lyapunov": null,
+ "grad_norm": 0.4970296963841891,
+ "grad_max_sv": 0.16001575216650962,
+ "grad_min_sv": 9.067042531715752e-09,
+ "grad_condition": 41223693.265652105,
+ "lr": 0.00026835198244006903,
+ "time_sec": 66.74218535423279
+ },
+ {
+ "epoch": 99,
+ "train_loss": 3.0151924266815184,
+ "train_acc": 0.25042,
+ "test_loss": 7.808471519470215,
+ "test_acc": 0.0281,
+ "lyapunov": null,
+ "grad_norm": 0.497912540335549,
+ "grad_max_sv": 0.1632791668176651,
+ "grad_min_sv": 9.184349171464934e-09,
+ "grad_condition": 23400737.365473915,
+ "lr": 0.0002591231629491421,
+ "time_sec": 66.70754623413086
+ },
+ {
+ "epoch": 100,
+ "train_loss": 3.0173143773651123,
+ "train_acc": 0.24922,
+ "test_loss": 7.265430112457276,
+ "test_acc": 0.028,
+ "lyapunov": null,
+ "grad_norm": 0.49818870466542803,
+ "grad_max_sv": 0.16289953589439393,
+ "grad_min_sv": 9.281307221387091e-09,
+ "grad_condition": 23108793.760435097,
+ "lr": 0.0002499999999999997,
+ "time_sec": 66.74620199203491
+ },
+ {
+ "epoch": 101,
+ "train_loss": 3.0063516328430175,
+ "train_acc": 0.25068,
+ "test_loss": 7.405182618713379,
+ "test_acc": 0.0321,
+ "lyapunov": null,
+ "grad_norm": 0.4980158759477165,
+ "grad_max_sv": 0.16276963874697686,
+ "grad_min_sv": 9.112035989633505e-09,
+ "grad_condition": 21414811.754604597,
+ "lr": 0.00024098649531343477,
+ "time_sec": 66.74015522003174
+ },
+ {
+ "epoch": 102,
+ "train_loss": 3.004280758743286,
+ "train_acc": 0.25098,
+ "test_loss": 7.399062448120117,
+ "test_acc": 0.03,
+ "lyapunov": null,
+ "grad_norm": 0.500738337792044,
+ "grad_max_sv": 0.1635062240064144,
+ "grad_min_sv": 9.288643754157277e-09,
+ "grad_condition": 21845553.2838238,
+ "lr": 0.0002320866025105016,
+ "time_sec": 66.69196605682373
+ },
+ {
+ "epoch": 103,
+ "train_loss": 2.9984512678527833,
+ "train_acc": 0.2512,
+ "test_loss": 7.320097260284424,
+ "test_acc": 0.0284,
+ "lyapunov": null,
+ "grad_norm": 0.4980454163272628,
+ "grad_max_sv": 0.1580117117613554,
+ "grad_min_sv": 9.07426482149587e-09,
+ "grad_condition": 30985957.899948187,
+ "lr": 0.0002233042253783278,
+ "time_sec": 66.74033546447754
+ },
+ {
+ "epoch": 104,
+ "train_loss": 2.99728506942749,
+ "train_acc": 0.25086,
+ "test_loss": 7.463210521697998,
+ "test_acc": 0.0329,
+ "lyapunov": null,
+ "grad_norm": 0.5009998323620124,
+ "grad_max_sv": 0.16469128727912902,
+ "grad_min_sv": 9.2030743081839e-09,
+ "grad_condition": 22045083.846339237,
+ "lr": 0.000214643216157784,
+ "time_sec": 66.72671890258789
+ },
+ {
+ "epoch": 105,
+ "train_loss": 2.9898451292419432,
+ "train_acc": 0.25504,
+ "test_loss": 7.531641695404053,
+ "test_acc": 0.0281,
+ "lyapunov": null,
+ "grad_norm": 0.5022636847492568,
+ "grad_max_sv": 0.16528656147420406,
+ "grad_min_sv": 9.158518983476415e-09,
+ "grad_condition": 24732730.3300323,
+ "lr": 0.00020610737385376332,
+ "time_sec": 66.72895193099976
+ },
+ {
+ "epoch": 106,
+ "train_loss": 2.984173779754639,
+ "train_acc": 0.25438,
+ "test_loss": 7.581431744384766,
+ "test_acc": 0.0273,
+ "lyapunov": null,
+ "grad_norm": 0.5028431980176926,
+ "grad_max_sv": 0.1630011171102524,
+ "grad_min_sv": 9.238039688774791e-09,
+ "grad_condition": 20675234.791328143,
+ "lr": 0.00019770044256881242,
+ "time_sec": 66.73670959472656
+ },
+ {
+ "epoch": 107,
+ "train_loss": 2.974853392868042,
+ "train_acc": 0.25748,
+ "test_loss": 7.1432702926635745,
+ "test_acc": 0.0313,
+ "lyapunov": null,
+ "grad_norm": 0.49959385619284613,
+ "grad_max_sv": 0.16204869262874128,
+ "grad_min_sv": 9.195193381716926e-09,
+ "grad_condition": 21149671.894155927,
+ "lr": 0.0001894261098608447,
+ "time_sec": 66.74563598632812
+ },
+ {
+ "epoch": 108,
+ "train_loss": 2.9721791679382323,
+ "train_acc": 0.25728,
+ "test_loss": 7.795809649658203,
+ "test_acc": 0.0298,
+ "lyapunov": null,
+ "grad_norm": 0.4995722502777866,
+ "grad_max_sv": 0.15964266508817673,
+ "grad_min_sv": 9.203898770904218e-09,
+ "grad_condition": 20323974.743836712,
+ "lr": 0.000181288005125655,
+ "time_sec": 66.73793625831604
+ },
+ {
+ "epoch": 109,
+ "train_loss": 2.970719254760742,
+ "train_acc": 0.25944,
+ "test_loss": 7.365542489624024,
+ "test_acc": 0.0299,
+ "lyapunov": null,
+ "grad_norm": 0.500757198933526,
+ "grad_max_sv": 0.16609507314860822,
+ "grad_min_sv": 9.356035884922065e-09,
+ "grad_condition": 20439457.080971286,
+ "lr": 0.0001732896980049473,
+ "time_sec": 66.7298583984375
+ },
+ {
+ "epoch": 110,
+ "train_loss": 2.972525007095337,
+ "train_acc": 0.25712,
+ "test_loss": 7.133980830383301,
+ "test_acc": 0.0312,
+ "lyapunov": null,
+ "grad_norm": 0.5042334021436244,
+ "grad_max_sv": 0.15981336012482644,
+ "grad_min_sv": 9.288604266299849e-09,
+ "grad_condition": 21280953.98530178,
+ "lr": 0.00016543469682057076,
+ "time_sec": 66.76267719268799
+ },
+ {
+ "epoch": 111,
+ "train_loss": 2.9631910160827637,
+ "train_acc": 0.25998,
+ "test_loss": 7.417809590148925,
+ "test_acc": 0.0274,
+ "lyapunov": null,
+ "grad_norm": 0.5014056320574171,
+ "grad_max_sv": 0.16821228563785554,
+ "grad_min_sv": 9.333871581716779e-09,
+ "grad_condition": 101661462.28679642,
+ "lr": 0.00015772644703565552,
+ "time_sec": 66.72111940383911
+ },
+ {
+ "epoch": 112,
+ "train_loss": 2.9575250452423094,
+ "train_acc": 0.26008,
+ "test_loss": 7.389129028320313,
+ "test_acc": 0.0277,
+ "lyapunov": null,
+ "grad_norm": 0.5007918938537274,
+ "grad_max_sv": 0.16079586669802665,
+ "grad_min_sv": 9.307818968351534e-09,
+ "grad_condition": 20753238.25422468,
+ "lr": 0.00015016832974331713,
+ "time_sec": 66.72973942756653
+ },
+ {
+ "epoch": 113,
+ "train_loss": 2.952999960632324,
+ "train_acc": 0.26198,
+ "test_loss": 7.37722262878418,
+ "test_acc": 0.0287,
+ "lyapunov": null,
+ "grad_norm": 0.5013173930748581,
+ "grad_max_sv": 0.16444203816354275,
+ "grad_min_sv": 9.318139330971587e-09,
+ "grad_condition": 26788166.113831718,
+ "lr": 0.00014276366018359834,
+ "time_sec": 66.83487486839294
+ },
+ {
+ "epoch": 114,
+ "train_loss": 2.948192635574341,
+ "train_acc": 0.26038,
+ "test_loss": 7.436811110687255,
+ "test_acc": 0.0279,
+ "lyapunov": null,
+ "grad_norm": 0.5032371113955786,
+ "grad_max_sv": 0.1634738527238369,
+ "grad_min_sv": 9.2874662635219e-09,
+ "grad_condition": 319138381.19418097,
+ "lr": 0.00013551568628929425,
+ "time_sec": 66.70622992515564
+ },
+ {
+ "epoch": 115,
+ "train_loss": 2.9517051191711428,
+ "train_acc": 0.26036,
+ "test_loss": 7.19214797668457,
+ "test_acc": 0.03,
+ "lyapunov": null,
+ "grad_norm": 0.5054472421665304,
+ "grad_max_sv": 0.16728437952697278,
+ "grad_min_sv": 9.324679213496e-09,
+ "grad_condition": 26191438.542866766,
+ "lr": 0.00012842758726130276,
+ "time_sec": 66.71952223777771
+ },
+ {
+ "epoch": 116,
+ "train_loss": 2.9479563136291502,
+ "train_acc": 0.25988,
+ "test_loss": 7.865117324829102,
+ "test_acc": 0.0272,
+ "lyapunov": null,
+ "grad_norm": 0.501425656974135,
+ "grad_max_sv": 0.16254092417657376,
+ "grad_min_sv": 9.171186369366646e-09,
+ "grad_condition": 43416689.99828492,
+ "lr": 0.0001215024721741218,
+ "time_sec": 66.74095702171326
+ },
+ {
+ "epoch": 117,
+ "train_loss": 2.9373822256469726,
+ "train_acc": 0.26326,
+ "test_loss": 7.544526052856446,
+ "test_acc": 0.0288,
+ "lyapunov": null,
+ "grad_norm": 0.5031467536307935,
+ "grad_max_sv": 0.16549900099635123,
+ "grad_min_sv": 9.4188400051598e-09,
+ "grad_condition": 19833315.44179687,
+ "lr": 0.00011474337861210538,
+ "time_sec": 66.72034072875977
+ },
+ {
+ "epoch": 118,
+ "train_loss": 2.9374622593688966,
+ "train_acc": 0.26362,
+ "test_loss": 7.940575238037109,
+ "test_acc": 0.0276,
+ "lyapunov": null,
+ "grad_norm": 0.502189701036258,
+ "grad_max_sv": 0.1663150992244482,
+ "grad_min_sv": 9.337868267511595e-09,
+ "grad_condition": 22055002.57718137,
+ "lr": 0.00010815327133708009,
+ "time_sec": 66.71819615364075
+ },
+ {
+ "epoch": 119,
+ "train_loss": 2.9290069982910154,
+ "train_acc": 0.26682,
+ "test_loss": 8.381109976196289,
+ "test_acc": 0.0245,
+ "lyapunov": null,
+ "grad_norm": 0.5022580399945052,
+ "grad_max_sv": 0.16189948543906213,
+ "grad_min_sv": 9.334797540505591e-09,
+ "grad_condition": 53795996.97598307,
+ "lr": 0.00010173504098790182,
+ "time_sec": 66.73639011383057
+ },
+ {
+ "epoch": 120,
+ "train_loss": 2.927497018890381,
+ "train_acc": 0.26494,
+ "test_loss": 8.134235343933106,
+ "test_acc": 0.0268,
+ "lyapunov": null,
+ "grad_norm": 0.5044191934677914,
+ "grad_max_sv": 0.1647841826081276,
+ "grad_min_sv": 9.31749464250231e-09,
+ "grad_condition": 21075801.592136864,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 66.71619915962219
+ },
+ {
+ "epoch": 121,
+ "train_loss": 2.9210917962646485,
+ "train_acc": 0.2676,
+ "test_loss": 7.665898156738281,
+ "test_acc": 0.0284,
+ "lyapunov": null,
+ "grad_norm": 0.505046124945648,
+ "grad_max_sv": 0.16069133542478084,
+ "grad_min_sv": 9.383237816254498e-09,
+ "grad_condition": 53773449.70699586,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 66.7949550151825
+ },
+ {
+ "epoch": 122,
+ "train_loss": 2.9300759950256348,
+ "train_acc": 0.26686,
+ "test_loss": 7.947439320373535,
+ "test_acc": 0.0253,
+ "lyapunov": null,
+ "grad_norm": 0.5039924043792687,
+ "grad_max_sv": 0.16329768523573876,
+ "grad_min_sv": 9.309516596847645e-09,
+ "grad_condition": 105483269.53547074,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 66.70848250389099
+ },
+ {
+ "epoch": 123,
+ "train_loss": 2.91971375289917,
+ "train_acc": 0.26734,
+ "test_loss": 7.80317967376709,
+ "test_acc": 0.0286,
+ "lyapunov": null,
+ "grad_norm": 0.5061715705620777,
+ "grad_max_sv": 0.16143706440925598,
+ "grad_min_sv": 9.3223205665377e-09,
+ "grad_condition": 44714095.26064149,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 66.75235438346863
+ },
+ {
+ "epoch": 124,
+ "train_loss": 2.920988783569336,
+ "train_acc": 0.2672,
+ "test_loss": 7.688530905151367,
+ "test_acc": 0.0267,
+ "lyapunov": null,
+ "grad_norm": 0.5036561383144873,
+ "grad_max_sv": 0.16541591919958593,
+ "grad_min_sv": 9.339689868714807e-09,
+ "grad_condition": 21082674.48603835,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 66.7428572177887
+ },
+ {
+ "epoch": 125,
+ "train_loss": 2.9158429930877685,
+ "train_acc": 0.26972,
+ "test_loss": 7.870475231933594,
+ "test_acc": 0.0266,
+ "lyapunov": null,
+ "grad_norm": 0.5050163715028828,
+ "grad_max_sv": 0.16450283974409102,
+ "grad_min_sv": 9.300618648844239e-09,
+ "grad_condition": 22745467.54728716,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 66.70153951644897
+ },
+ {
+ "epoch": 126,
+ "train_loss": 2.9174345250701905,
+ "train_acc": 0.26804,
+ "test_loss": 7.7597047775268555,
+ "test_acc": 0.0275,
+ "lyapunov": null,
+ "grad_norm": 0.5054786147107485,
+ "grad_max_sv": 0.16298311799764634,
+ "grad_min_sv": 9.272562198105183e-09,
+ "grad_condition": 355815933.8318427,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 66.70234727859497
+ },
+ {
+ "epoch": 127,
+ "train_loss": 2.9025824697875975,
+ "train_acc": 0.26988,
+ "test_loss": 7.446964788818359,
+ "test_acc": 0.0276,
+ "lyapunov": null,
+ "grad_norm": 0.5066198768830174,
+ "grad_max_sv": 0.1645387414842844,
+ "grad_min_sv": 9.428870359484698e-09,
+ "grad_condition": 20208395.537682876,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 66.714515209198
+ },
+ {
+ "epoch": 128,
+ "train_loss": 2.915607092437744,
+ "train_acc": 0.26734,
+ "test_loss": 7.931312725830078,
+ "test_acc": 0.0244,
+ "lyapunov": null,
+ "grad_norm": 0.5071889354627791,
+ "grad_max_sv": 0.16293769851326942,
+ "grad_min_sv": 9.389047653241001e-09,
+ "grad_condition": 19442274.807418514,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 66.77645683288574
+ },
+ {
+ "epoch": 129,
+ "train_loss": 2.9043918053436277,
+ "train_acc": 0.27058,
+ "test_loss": 7.705898820495605,
+ "test_acc": 0.0294,
+ "lyapunov": null,
+ "grad_norm": 0.5061548650342338,
+ "grad_max_sv": 0.1668264877051115,
+ "grad_min_sv": 9.293020419853803e-09,
+ "grad_condition": 22634656.7147369,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 66.68853044509888
+ },
+ {
+ "epoch": 130,
+ "train_loss": 2.9112479612731934,
+ "train_acc": 0.2704,
+ "test_loss": 7.656457232666016,
+ "test_acc": 0.0278,
+ "lyapunov": null,
+ "grad_norm": 0.5055330426804672,
+ "grad_max_sv": 0.162294964119792,
+ "grad_min_sv": 9.291567426572556e-09,
+ "grad_condition": 22558154.425069276,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 66.69644737243652
+ },
+ {
+ "epoch": 131,
+ "train_loss": 2.9026712393951417,
+ "train_acc": 0.26934,
+ "test_loss": 7.7139065521240235,
+ "test_acc": 0.0274,
+ "lyapunov": null,
+ "grad_norm": 0.5078534676699445,
+ "grad_max_sv": 0.16336566992104054,
+ "grad_min_sv": 9.403588141498886e-09,
+ "grad_condition": 20579658.983666856,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 66.69969606399536
+ },
+ {
+ "epoch": 132,
+ "train_loss": 2.8976589154815673,
+ "train_acc": 0.27122,
+ "test_loss": 7.718105026245118,
+ "test_acc": 0.026,
+ "lyapunov": null,
+ "grad_norm": 0.5077215533015317,
+ "grad_max_sv": 0.16301583163440228,
+ "grad_min_sv": 9.312006112038862e-09,
+ "grad_condition": 27087738.24954634,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 66.74734258651733
+ },
+ {
+ "epoch": 133,
+ "train_loss": 2.9053258415222167,
+ "train_acc": 0.26974,
+ "test_loss": 7.773404074859619,
+ "test_acc": 0.029,
+ "lyapunov": null,
+ "grad_norm": 0.5077078460971154,
+ "grad_max_sv": 0.16176522485911846,
+ "grad_min_sv": 9.38179235271397e-09,
+ "grad_condition": 22801102.593637146,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 66.71020007133484
+ },
+ {
+ "epoch": 134,
+ "train_loss": 2.90214939994812,
+ "train_acc": 0.2685,
+ "test_loss": 7.735068745422363,
+ "test_acc": 0.0283,
+ "lyapunov": null,
+ "grad_norm": 0.5056827916750407,
+ "grad_max_sv": 0.16394426934421064,
+ "grad_min_sv": 9.382484492375525e-09,
+ "grad_condition": 273849135.71961355,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 66.72329211235046
+ },
+ {
+ "epoch": 135,
+ "train_loss": 2.8955694792175293,
+ "train_acc": 0.27204,
+ "test_loss": 8.074042736816406,
+ "test_acc": 0.0263,
+ "lyapunov": null,
+ "grad_norm": 0.5072891279476816,
+ "grad_max_sv": 0.1647134818136692,
+ "grad_min_sv": 9.274373982681716e-09,
+ "grad_condition": 20878941.234711803,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 66.69911003112793
+ },
+ {
+ "epoch": 136,
+ "train_loss": 2.901527007369995,
+ "train_acc": 0.272,
+ "test_loss": 7.88837564239502,
+ "test_acc": 0.0256,
+ "lyapunov": null,
+ "grad_norm": 0.5069997382716037,
+ "grad_max_sv": 0.16248776540160179,
+ "grad_min_sv": 9.28558460677742e-09,
+ "grad_condition": 26142069.423716225,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 66.73573279380798
+ },
+ {
+ "epoch": 137,
+ "train_loss": 2.8907382415008547,
+ "train_acc": 0.2728,
+ "test_loss": 8.04134146270752,
+ "test_acc": 0.0266,
+ "lyapunov": null,
+ "grad_norm": 0.506922138474151,
+ "grad_max_sv": 0.16456650160253047,
+ "grad_min_sv": 9.394744830693025e-09,
+ "grad_condition": 22952282.106423754,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 66.72893476486206
+ },
+ {
+ "epoch": 138,
+ "train_loss": 2.8925764886474608,
+ "train_acc": 0.27096,
+ "test_loss": 7.848298292541504,
+ "test_acc": 0.0281,
+ "lyapunov": null,
+ "grad_norm": 0.5070877996969257,
+ "grad_max_sv": 0.16335688717663288,
+ "grad_min_sv": 9.458600758183167e-09,
+ "grad_condition": 21212816.652376812,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 66.69498014450073
+ },
+ {
+ "epoch": 139,
+ "train_loss": 2.8905470305633547,
+ "train_acc": 0.2723,
+ "test_loss": 7.805370147705078,
+ "test_acc": 0.0276,
+ "lyapunov": null,
+ "grad_norm": 0.5091697345599102,
+ "grad_max_sv": 0.16748546734452247,
+ "grad_min_sv": 9.554275959278158e-09,
+ "grad_condition": 21817543.256782603,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 66.69882249832153
+ },
+ {
+ "epoch": 140,
+ "train_loss": 2.8900568451690676,
+ "train_acc": 0.2725,
+ "test_loss": 8.150068646240234,
+ "test_acc": 0.0263,
+ "lyapunov": null,
+ "grad_norm": 0.5094580986389692,
+ "grad_max_sv": 0.16614943966269494,
+ "grad_min_sv": 9.441066034510115e-09,
+ "grad_condition": 25708375.318254933,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 66.72957038879395
+ },
+ {
+ "epoch": 141,
+ "train_loss": 2.8928156049346923,
+ "train_acc": 0.27302,
+ "test_loss": 7.946534848022461,
+ "test_acc": 0.0271,
+ "lyapunov": null,
+ "grad_norm": 0.5089732688724395,
+ "grad_max_sv": 0.1660338044166565,
+ "grad_min_sv": 9.440311787671519e-09,
+ "grad_condition": 79734166.44560626,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 66.7075400352478
+ },
+ {
+ "epoch": 142,
+ "train_loss": 2.88548219871521,
+ "train_acc": 0.27172,
+ "test_loss": 8.169772109985352,
+ "test_acc": 0.0265,
+ "lyapunov": null,
+ "grad_norm": 0.5086553359451463,
+ "grad_max_sv": 0.16840459816157818,
+ "grad_min_sv": 9.377848261826749e-09,
+ "grad_condition": 22023976.535071947,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 66.71758651733398
+ },
+ {
+ "epoch": 143,
+ "train_loss": 2.89183920753479,
+ "train_acc": 0.27372,
+ "test_loss": 7.852110308837891,
+ "test_acc": 0.0275,
+ "lyapunov": null,
+ "grad_norm": 0.5094733139547303,
+ "grad_max_sv": 0.16687579974532127,
+ "grad_min_sv": 9.444928218693693e-09,
+ "grad_condition": 24477411.004352577,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 66.72722506523132
+ },
+ {
+ "epoch": 144,
+ "train_loss": 2.8904072105407717,
+ "train_acc": 0.27378,
+ "test_loss": 8.066141241455078,
+ "test_acc": 0.0255,
+ "lyapunov": null,
+ "grad_norm": 0.5089427679493953,
+ "grad_max_sv": 0.1690099250525236,
+ "grad_min_sv": 9.382681727398978e-09,
+ "grad_condition": 24070995.123834018,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 66.73601293563843
+ },
+ {
+ "epoch": 145,
+ "train_loss": 2.8936181242370607,
+ "train_acc": 0.27214,
+ "test_loss": 8.10545317993164,
+ "test_acc": 0.0258,
+ "lyapunov": null,
+ "grad_norm": 0.507865092838002,
+ "grad_max_sv": 0.1655246399343014,
+ "grad_min_sv": 9.371320355833212e-09,
+ "grad_condition": 20893591.384689607,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 66.70678782463074
+ },
+ {
+ "epoch": 146,
+ "train_loss": 2.894159292755127,
+ "train_acc": 0.27236,
+ "test_loss": 7.739997250366211,
+ "test_acc": 0.0282,
+ "lyapunov": null,
+ "grad_norm": 0.5079666742519956,
+ "grad_max_sv": 0.16401765793561934,
+ "grad_min_sv": 9.365164058139363e-09,
+ "grad_condition": 30379279.137967873,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 66.73851418495178
+ },
+ {
+ "epoch": 147,
+ "train_loss": 2.892810397796631,
+ "train_acc": 0.27236,
+ "test_loss": 8.097870037841798,
+ "test_acc": 0.0261,
+ "lyapunov": null,
+ "grad_norm": 0.5083955380496783,
+ "grad_max_sv": 0.16239417865872383,
+ "grad_min_sv": 9.437153494773476e-09,
+ "grad_condition": 22581567.79918761,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 66.69952964782715
+ },
+ {
+ "epoch": 148,
+ "train_loss": 2.8858398888397216,
+ "train_acc": 0.27292,
+ "test_loss": 7.955520216369629,
+ "test_acc": 0.0253,
+ "lyapunov": null,
+ "grad_norm": 0.5081646285749641,
+ "grad_max_sv": 0.1665601458400488,
+ "grad_min_sv": 9.4039764724082e-09,
+ "grad_condition": 2788122152.665894,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 66.72941470146179
+ },
+ {
+ "epoch": 149,
+ "train_loss": 2.8937516955566407,
+ "train_acc": 0.27344,
+ "test_loss": 8.195967932128907,
+ "test_acc": 0.0259,
+ "lyapunov": null,
+ "grad_norm": 0.5088598826502255,
+ "grad_max_sv": 0.16467942893505097,
+ "grad_min_sv": 9.292379346548252e-09,
+ "grad_condition": 20098211.57433509,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 66.7379686832428
+ },
+ {
+ "epoch": 150,
+ "train_loss": 2.8891425512695315,
+ "train_acc": 0.27354,
+ "test_loss": 8.199688424682618,
+ "test_acc": 0.0264,
+ "lyapunov": null,
+ "grad_norm": 0.5085081625178647,
+ "grad_max_sv": 0.17037647701799868,
+ "grad_min_sv": 9.396511368997551e-09,
+ "grad_condition": 30341616.600583784,
+ "lr": 0.0,
+ "time_sec": 66.7265522480011
+ }
+ ]
+ },
+ "lyapunov": {
+ "4": [
+ {
+ "epoch": 1,
+ "train_loss": 4.600389208526611,
+ "train_acc": 0.07146,
+ "test_loss": 4.086850812530518,
+ "test_acc": 0.089,
+ "lyapunov": 2.088574398813955,
+ "grad_norm": 5.951641147060766,
+ "grad_max_sv": 4.604718941450119,
+ "grad_min_sv": 1.0862287848634189e-07,
+ "grad_condition": 102934308.40827194,
+ "lr": 0.0009998903417374227,
+ "time_sec": 41.90148162841797
+ },
+ {
+ "epoch": 2,
+ "train_loss": 4.154245112686157,
+ "train_acc": 0.09378,
+ "test_loss": 4.727289266204834,
+ "test_acc": 0.049,
+ "lyapunov": 1.675386021509195,
+ "grad_norm": 3.9336812922654714,
+ "grad_max_sv": 2.925524663925171,
+ "grad_min_sv": 7.262743817529338e-08,
+ "grad_condition": 424809238.9666936,
+ "lr": 0.0009995614150494292,
+ "time_sec": 41.78368663787842
+ },
+ {
+ "epoch": 3,
+ "train_loss": 4.027823886566162,
+ "train_acc": 0.1086,
+ "test_loss": 5.036119989776611,
+ "test_acc": 0.0347,
+ "lyapunov": 1.6001547501825006,
+ "grad_norm": 3.0745862198210694,
+ "grad_max_sv": 2.1295204132795336,
+ "grad_min_sv": 5.70765142704488e-08,
+ "grad_condition": 40571486.668118164,
+ "lr": 0.0009990133642141358,
+ "time_sec": 41.703768253326416
+ },
+ {
+ "epoch": 4,
+ "train_loss": 3.9490097280883787,
+ "train_acc": 0.1205,
+ "test_loss": 6.33214266204834,
+ "test_acc": 0.0188,
+ "lyapunov": 1.5750604392317555,
+ "grad_norm": 2.373335141934517,
+ "grad_max_sv": 1.5385636299848557,
+ "grad_min_sv": 4.3810931549259635e-08,
+ "grad_condition": 41690835.43861919,
+ "lr": 0.0009982464296247522,
+ "time_sec": 41.732722997665405
+ },
+ {
+ "epoch": 5,
+ "train_loss": 3.9766585917663573,
+ "train_acc": 0.11954,
+ "test_loss": 8.71332287902832,
+ "test_acc": 0.0188,
+ "lyapunov": 1.565549552593085,
+ "grad_norm": 2.0246690982621796,
+ "grad_max_sv": 1.2804439306259154,
+ "grad_min_sv": 3.6991484700377165e-08,
+ "grad_condition": 85372782.32745245,
+ "lr": 0.0009972609476841367,
+ "time_sec": 41.76529860496521
+ },
+ {
+ "epoch": 6,
+ "train_loss": 4.073858399047851,
+ "train_acc": 0.11056,
+ "test_loss": 9.466819995117188,
+ "test_acc": 0.0223,
+ "lyapunov": 1.5455034062685564,
+ "grad_norm": 1.7934086339665274,
+ "grad_max_sv": 1.104438428580761,
+ "grad_min_sv": 3.247254408700328e-08,
+ "grad_condition": 45291989.58759006,
+ "lr": 0.000996057350657239,
+ "time_sec": 41.74420213699341
+ },
+ {
+ "epoch": 7,
+ "train_loss": 4.1445047888183595,
+ "train_acc": 0.10608,
+ "test_loss": 10.480993731689454,
+ "test_acc": 0.0156,
+ "lyapunov": 1.5415380177900309,
+ "grad_norm": 1.5679408505934445,
+ "grad_max_sv": 0.9464981764554977,
+ "grad_min_sv": 2.8262019316493968e-08,
+ "grad_condition": 54295754.70226411,
+ "lr": 0.000994636166481494,
+ "time_sec": 41.73182463645935
+ },
+ {
+ "epoch": 8,
+ "train_loss": 4.26063258026123,
+ "train_acc": 0.09112,
+ "test_loss": 7.7578563934326175,
+ "test_acc": 0.0186,
+ "lyapunov": 1.5429353631670824,
+ "grad_norm": 1.3464117763442929,
+ "grad_max_sv": 0.7779564633965492,
+ "grad_min_sv": 2.375586672376251e-08,
+ "grad_condition": 62692972.26952485,
+ "lr": 0.0009929980185352525,
+ "time_sec": 41.739473819732666
+ },
+ {
+ "epoch": 9,
+ "train_loss": 4.513377053375244,
+ "train_acc": 0.05922,
+ "test_loss": 7.138281170654297,
+ "test_acc": 0.011,
+ "lyapunov": 1.5319068190996603,
+ "grad_norm": 1.139364674598679,
+ "grad_max_sv": 0.6511225394904614,
+ "grad_min_sv": 1.8816128205534354e-08,
+ "grad_condition": 44484041.03115648,
+ "lr": 0.0009911436253643444,
+ "time_sec": 41.73070311546326
+ },
+ {
+ "epoch": 10,
+ "train_loss": 4.696486204833985,
+ "train_acc": 0.03644,
+ "test_loss": 8.94805923461914,
+ "test_acc": 0.01,
+ "lyapunov": 1.4879300298593234,
+ "grad_norm": 0.9658719057515597,
+ "grad_max_sv": 0.6352818965911865,
+ "grad_min_sv": 1.4476460679876436e-08,
+ "grad_condition": 2057995491.241798,
+ "lr": 0.0009890738003669028,
+ "time_sec": 41.76564049720764
+ },
+ {
+ "epoch": 11,
+ "train_loss": 4.811119628295899,
+ "train_acc": 0.03002,
+ "test_loss": 8.594207092285156,
+ "test_acc": 0.01,
+ "lyapunov": 1.545145396381388,
+ "grad_norm": 0.9564458204494278,
+ "grad_max_sv": 0.6685591802001,
+ "grad_min_sv": 1.3870340914018398e-08,
+ "grad_condition": 146809154.0196677,
+ "lr": 0.00098678945143658,
+ "time_sec": 41.74543738365173
+ },
+ {
+ "epoch": 12,
+ "train_loss": 4.975349290466308,
+ "train_acc": 0.01658,
+ "test_loss": 8.6747091796875,
+ "test_acc": 0.0114,
+ "lyapunov": 1.4708023967645358,
+ "grad_norm": 0.7817948112887597,
+ "grad_max_sv": 0.603185323625803,
+ "grad_min_sv": 9.743947088081129e-09,
+ "grad_condition": 67868723.94202444,
+ "lr": 0.0009842915805643154,
+ "time_sec": 41.7559871673584
+ },
+ {
+ "epoch": 13,
+ "train_loss": 5.0296261746215825,
+ "train_acc": 0.01604,
+ "test_loss": 11.79697481994629,
+ "test_acc": 0.01,
+ "lyapunov": 1.5253148819784375,
+ "grad_norm": 0.5736780904158933,
+ "grad_max_sv": 0.42879281714558604,
+ "grad_min_sv": 6.762437510681764e-09,
+ "grad_condition": 1079134295.4881654,
+ "lr": 0.000981581283398829,
+ "time_sec": 41.76394009590149
+ },
+ {
+ "epoch": 14,
+ "train_loss": 5.057629988555909,
+ "train_acc": 0.00992,
+ "test_loss": 8.410659944152831,
+ "test_acc": 0.01,
+ "lyapunov": 1.4446861634169088,
+ "grad_norm": 0.39926683732439516,
+ "grad_max_sv": 0.33072102442383766,
+ "grad_min_sv": 4.070671115463664e-09,
+ "grad_condition": 171229170.03266063,
+ "lr": 0.0009786597487660333,
+ "time_sec": 41.78986120223999
+ },
+ {
+ "epoch": 15,
+ "train_loss": 5.068990168609619,
+ "train_acc": 0.01004,
+ "test_loss": 8.000550273132324,
+ "test_acc": 0.01,
+ "lyapunov": 1.4198117143357807,
+ "grad_norm": 0.31403539953973636,
+ "grad_max_sv": 0.261398883163929,
+ "grad_min_sv": 2.518455900589597e-09,
+ "grad_condition": 1889483827.2041466,
+ "lr": 0.0009755282581475766,
+ "time_sec": 41.803417682647705
+ },
+ {
+ "epoch": 16,
+ "train_loss": 5.098585692901612,
+ "train_acc": 0.00948,
+ "test_loss": 8.965616151428222,
+ "test_acc": 0.01,
+ "lyapunov": 1.4220252604130894,
+ "grad_norm": 0.2674000226215519,
+ "grad_max_sv": 0.2171985387802124,
+ "grad_min_sv": 6.561514876139448e-10,
+ "grad_condition": 51847368847.70773,
+ "lr": 0.0009721881851187403,
+ "time_sec": 41.763081789016724
+ },
+ {
+ "epoch": 17,
+ "train_loss": 5.128935182189942,
+ "train_acc": 0.0104,
+ "test_loss": 7.713327481842041,
+ "test_acc": 0.01,
+ "lyapunov": 1.4243087640503789,
+ "grad_norm": 0.2268635753508302,
+ "grad_max_sv": 0.17724891044199467,
+ "grad_min_sv": 1.1410712791450972e-12,
+ "grad_condition": 106447262687.9498,
+ "lr": 0.0009686409947459456,
+ "time_sec": 41.777748823165894
+ },
+ {
+ "epoch": 18,
+ "train_loss": 5.169684513702393,
+ "train_acc": 0.00924,
+ "test_loss": 9.309846389770508,
+ "test_acc": 0.01,
+ "lyapunov": 1.4357064035542482,
+ "grad_norm": 0.2142537464973637,
+ "grad_max_sv": 0.1502558846026659,
+ "grad_min_sv": 4.244580750085834e-13,
+ "grad_condition": 128309590371.45757,
+ "lr": 0.0009648882429441254,
+ "time_sec": 41.78967308998108
+ },
+ {
+ "epoch": 19,
+ "train_loss": 5.18758517288208,
+ "train_acc": 0.01042,
+ "test_loss": 9.819900524902344,
+ "test_acc": 0.01,
+ "lyapunov": 1.4233030394824875,
+ "grad_norm": 0.1952009554667118,
+ "grad_max_sv": 0.14073190968483687,
+ "grad_min_sv": 2.6230090465217223e-13,
+ "grad_condition": 123371153139.15,
+ "lr": 0.00096093157579425,
+ "time_sec": 41.77319002151489
+ },
+ {
+ "epoch": 20,
+ "train_loss": 5.217939367370605,
+ "train_acc": 0.00912,
+ "test_loss": 9.18544906463623,
+ "test_acc": 0.01,
+ "lyapunov": 1.4247246755053624,
+ "grad_norm": 0.15876002882735193,
+ "grad_max_sv": 0.10825764928013086,
+ "grad_min_sv": 3.338896381884262e-15,
+ "grad_condition": 107875834900.70416,
+ "lr": 0.0009567727288213001,
+ "time_sec": 41.805402517318726
+ },
+ {
+ "epoch": 21,
+ "train_loss": 5.2237202166748045,
+ "train_acc": 0.00884,
+ "test_loss": 7.853615603637695,
+ "test_acc": 0.01,
+ "lyapunov": 1.4316062283942768,
+ "grad_norm": 0.16150401588518373,
+ "grad_max_sv": 0.09900619480758906,
+ "grad_min_sv": 6.6800742534662695e-15,
+ "grad_condition": 98362933683.42502,
+ "lr": 0.0009524135262330095,
+ "time_sec": 41.81541037559509
+ },
+ {
+ "epoch": 22,
+ "train_loss": 5.223462156219482,
+ "train_acc": 0.00896,
+ "test_loss": 7.39350982055664,
+ "test_acc": 0.01,
+ "lyapunov": 1.4326209281106739,
+ "grad_norm": 0.1473213530853359,
+ "grad_max_sv": 0.07929724231362342,
+ "grad_min_sv": 1.359730040562078e-16,
+ "grad_condition": 79286860137.91084,
+ "lr": 0.0009478558801197061,
+ "time_sec": 41.77298974990845
+ },
+ {
+ "epoch": 23,
+ "train_loss": 5.2433684585571285,
+ "train_acc": 0.0104,
+ "test_loss": 7.137277140808106,
+ "test_acc": 0.01,
+ "lyapunov": 1.4520324453368516,
+ "grad_norm": 0.1808576226701931,
+ "grad_max_sv": 0.0958871865645051,
+ "grad_min_sv": 8.016626722354409e-12,
+ "grad_condition": 91441708516.60077,
+ "lr": 0.000943101789615607,
+ "time_sec": 41.78183579444885
+ },
+ {
+ "epoch": 24,
+ "train_loss": 5.227817250061035,
+ "train_acc": 0.01018,
+ "test_loss": 6.776467510986328,
+ "test_acc": 0.01,
+ "lyapunov": 1.4379125001180508,
+ "grad_norm": 0.12771270098590454,
+ "grad_max_sv": 0.06905819587409497,
+ "grad_min_sv": 2.599435841374051e-17,
+ "grad_condition": 69055853998.34868,
+ "lr": 0.0009381533400219313,
+ "time_sec": 41.771769285202026
+ },
+ {
+ "epoch": 25,
+ "train_loss": 5.245168194122314,
+ "train_acc": 0.0099,
+ "test_loss": 6.430454106140137,
+ "test_acc": 0.01,
+ "lyapunov": 1.4564172242913405,
+ "grad_norm": 0.12472749302013317,
+ "grad_max_sv": 0.05845061130821705,
+ "grad_min_sv": 1.194259418817754e-40,
+ "grad_condition": 58450611308.21704,
+ "lr": 0.0009330127018922189,
+ "time_sec": 41.770474433898926
+ },
+ {
+ "epoch": 26,
+ "train_loss": 5.246722939758301,
+ "train_acc": 0.00928,
+ "test_loss": 6.331733448791504,
+ "test_acc": 0.01,
+ "lyapunov": 1.4580842101055642,
+ "grad_norm": 0.1662077239803915,
+ "grad_max_sv": 0.06711247004568577,
+ "grad_min_sv": 3.516773949087515e-14,
+ "grad_condition": 65770012096.831566,
+ "lr": 0.000927682130080253,
+ "time_sec": 41.73953866958618
+ },
+ {
+ "epoch": 27,
+ "train_loss": 5.241074298706055,
+ "train_acc": 0.00908,
+ "test_loss": 5.877811084747314,
+ "test_acc": 0.01,
+ "lyapunov": 1.4511035900286702,
+ "grad_norm": 0.11653593515355255,
+ "grad_max_sv": 0.057695817202329636,
+ "grad_min_sv": 2.245335846475005e-19,
+ "grad_condition": 57695796508.56338,
+ "lr": 0.0009221639627510072,
+ "time_sec": 41.77058434486389
+ },
+ {
+ "epoch": 28,
+ "train_loss": 5.231804114685058,
+ "train_acc": 0.00918,
+ "test_loss": 5.65352537612915,
+ "test_acc": 0.01,
+ "lyapunov": 1.4424795046486818,
+ "grad_norm": 0.11846210716711081,
+ "grad_max_sv": 0.05332653652876616,
+ "grad_min_sv": 1.997381835377637e-16,
+ "grad_condition": 53305647188.1228,
+ "lr": 0.0009164606203550494,
+ "time_sec": 41.764750957489014
+ },
+ {
+ "epoch": 29,
+ "train_loss": 5.262847916870117,
+ "train_acc": 0.01024,
+ "test_loss": 6.106614427185058,
+ "test_acc": 0.01,
+ "lyapunov": 1.4771753000786236,
+ "grad_norm": 0.12029871369481651,
+ "grad_max_sv": 0.04656773656606674,
+ "grad_min_sv": 3.853570776893247e-46,
+ "grad_condition": 46567736566.06674,
+ "lr": 0.0009105746045668516,
+ "time_sec": 41.72984552383423
+ },
+ {
+ "epoch": 30,
+ "train_loss": 5.23929132598877,
+ "train_acc": 0.00934,
+ "test_loss": 5.9899550048828125,
+ "test_acc": 0.01,
+ "lyapunov": 1.4511136694637405,
+ "grad_norm": 0.11304905556902457,
+ "grad_max_sv": 0.047783416556194426,
+ "grad_min_sv": 9.917357230877788e-21,
+ "grad_condition": 47783415656.63218,
+ "lr": 0.0009045084971874733,
+ "time_sec": 41.7406222820282
+ },
+ {
+ "epoch": 31,
+ "train_loss": 5.248380351104736,
+ "train_acc": 0.01028,
+ "test_loss": 5.734669494628906,
+ "test_acc": 0.01,
+ "lyapunov": 1.461517483986857,
+ "grad_norm": 0.10074340116724037,
+ "grad_max_sv": 0.034037844324484465,
+ "grad_min_sv": 0.0,
+ "grad_condition": 34037844324.484474,
+ "lr": 0.0008982649590120977,
+ "time_sec": 41.74093008041382
+ },
+ {
+ "epoch": 32,
+ "train_loss": 5.236619085388184,
+ "train_acc": 0.00984,
+ "test_loss": 5.793693973541259,
+ "test_acc": 0.01,
+ "lyapunov": 1.4490889871821684,
+ "grad_norm": 0.10695665831734988,
+ "grad_max_sv": 0.04561040163971484,
+ "grad_min_sv": 0.0,
+ "grad_condition": 45610401639.71483,
+ "lr": 0.0008918467286629196,
+ "time_sec": 41.984901666641235
+ },
+ {
+ "epoch": 33,
+ "train_loss": 5.23296120513916,
+ "train_acc": 0.00958,
+ "test_loss": 5.439259308624267,
+ "test_acc": 0.01,
+ "lyapunov": 1.444964089661913,
+ "grad_norm": 0.10554551126822227,
+ "grad_max_sv": 0.042046601651236415,
+ "grad_min_sv": 0.0,
+ "grad_condition": 42046601651.23641,
+ "lr": 0.0008852566213878943,
+ "time_sec": 41.770121335983276
+ },
+ {
+ "epoch": 34,
+ "train_loss": 5.236159170837403,
+ "train_acc": 0.00974,
+ "test_loss": 5.683465595245361,
+ "test_acc": 0.01,
+ "lyapunov": 1.44912754269817,
+ "grad_norm": 0.10158597595404413,
+ "grad_max_sv": 0.0364499366376549,
+ "grad_min_sv": 0.0,
+ "grad_condition": 36449936637.6549,
+ "lr": 0.000878497527825878,
+ "time_sec": 41.73541307449341
+ },
+ {
+ "epoch": 35,
+ "train_loss": 5.244431438751221,
+ "train_acc": 0.00982,
+ "test_loss": 5.822091407775879,
+ "test_acc": 0.01,
+ "lyapunov": 1.4579007311550247,
+ "grad_norm": 0.10227185751901953,
+ "grad_max_sv": 0.04079357534646988,
+ "grad_min_sv": 0.0,
+ "grad_condition": 40793575346.46987,
+ "lr": 0.000871572412738697,
+ "time_sec": 41.72771143913269
+ },
+ {
+ "epoch": 36,
+ "train_loss": 5.242595237579346,
+ "train_acc": 0.00948,
+ "test_loss": 5.712351992797852,
+ "test_acc": 0.01,
+ "lyapunov": 1.4565396217433997,
+ "grad_norm": 0.09594442137602498,
+ "grad_max_sv": 0.023863840941339733,
+ "grad_min_sv": 0.0,
+ "grad_condition": 23863840941.33973,
+ "lr": 0.0008644843137107055,
+ "time_sec": 41.679956674575806
+ },
+ {
+ "epoch": 37,
+ "train_loss": 5.25272214477539,
+ "train_acc": 0.00774,
+ "test_loss": 5.519532617950439,
+ "test_acc": 0.01,
+ "lyapunov": 1.4673221968019101,
+ "grad_norm": 0.09989553017175994,
+ "grad_max_sv": 0.01326487297192216,
+ "grad_min_sv": 0.0,
+ "grad_condition": 13264872971.922161,
+ "lr": 0.0008572363398164014,
+ "time_sec": 41.665099143981934
+ },
+ {
+ "epoch": 38,
+ "train_loss": 5.239593379211426,
+ "train_acc": 0.00894,
+ "test_loss": 5.685215021514892,
+ "test_acc": 0.01,
+ "lyapunov": 1.4529655787646008,
+ "grad_norm": 0.09888602041808069,
+ "grad_max_sv": 0.03386777136474848,
+ "grad_min_sv": 0.0,
+ "grad_condition": 33867771364.748474,
+ "lr": 0.0008498316702566826,
+ "time_sec": 41.71084642410278
+ },
+ {
+ "epoch": 39,
+ "train_loss": 5.24351258758545,
+ "train_acc": 0.00926,
+ "test_loss": 5.718768641662598,
+ "test_acc": 0.01,
+ "lyapunov": 1.4566386227717485,
+ "grad_norm": 0.10344101016289994,
+ "grad_max_sv": 0.04082807558588684,
+ "grad_min_sv": 0.0,
+ "grad_condition": 40828075585.886826,
+ "lr": 0.0008422735529643442,
+ "time_sec": 41.73838138580322
+ },
+ {
+ "epoch": 40,
+ "train_loss": 5.241183159027099,
+ "train_acc": 0.00956,
+ "test_loss": 5.497510899353028,
+ "test_acc": 0.01,
+ "lyapunov": 1.4553583491488795,
+ "grad_norm": 0.09390993405990472,
+ "grad_max_sv": 0.015733347134664656,
+ "grad_min_sv": 0.0,
+ "grad_condition": 15733347134.664654,
+ "lr": 0.0008345653031794289,
+ "time_sec": 41.734697580337524
+ },
+ {
+ "epoch": 41,
+ "train_loss": 5.242352604675293,
+ "train_acc": 0.00974,
+ "test_loss": 5.167651419830322,
+ "test_acc": 0.01,
+ "lyapunov": 1.454840253076285,
+ "grad_norm": 0.11429776991375327,
+ "grad_max_sv": 0.05544604551978409,
+ "grad_min_sv": 2.0339863136307694e-16,
+ "grad_condition": 55425910698.75984,
+ "lr": 0.0008267103019950526,
+ "time_sec": 41.75088906288147
+ },
+ {
+ "epoch": 42,
+ "train_loss": 5.242215647735596,
+ "train_acc": 0.00988,
+ "test_loss": 5.260814582824707,
+ "test_acc": 0.01,
+ "lyapunov": 1.4554345080309816,
+ "grad_norm": 0.10783002802519942,
+ "grad_max_sv": 0.04959035101346672,
+ "grad_min_sv": 4.912822630335892e-20,
+ "grad_condition": 49590347491.3975,
+ "lr": 0.0008187119948743447,
+ "time_sec": 41.73639273643494
+ },
+ {
+ "epoch": 43,
+ "train_loss": 5.244567107543945,
+ "train_acc": 0.01008,
+ "test_loss": 4.993986747741699,
+ "test_acc": 0.01,
+ "lyapunov": 1.4585875352020459,
+ "grad_norm": 0.10047934695930735,
+ "grad_max_sv": 0.03824934270232916,
+ "grad_min_sv": 3.853570776893247e-46,
+ "grad_condition": 38249342702.329155,
+ "lr": 0.000810573890139155,
+ "time_sec": 41.74794268608093
+ },
+ {
+ "epoch": 44,
+ "train_loss": 5.244575652618408,
+ "train_acc": 0.0093,
+ "test_loss": 4.9594275024414065,
+ "test_acc": 0.01,
+ "lyapunov": 1.4588656959021489,
+ "grad_norm": 0.09576972429911833,
+ "grad_max_sv": 0.031089681945741177,
+ "grad_min_sv": 0.0,
+ "grad_condition": 31089681945.741173,
+ "lr": 0.0008022995574311873,
+ "time_sec": 41.72138214111328
+ },
+ {
+ "epoch": 45,
+ "train_loss": 5.2458512478637696,
+ "train_acc": 0.00958,
+ "test_loss": 4.983256524658203,
+ "test_acc": 0.01,
+ "lyapunov": 1.460322377017087,
+ "grad_norm": 0.09632514814173115,
+ "grad_max_sv": 0.02758595086634159,
+ "grad_min_sv": 0.0,
+ "grad_condition": 27585950866.34159,
+ "lr": 0.0007938926261462363,
+ "time_sec": 41.73388934135437
+ },
+ {
+ "epoch": 46,
+ "train_loss": 5.245156242980957,
+ "train_acc": 0.00914,
+ "test_loss": 5.5051834045410155,
+ "test_acc": 0.01,
+ "lyapunov": 1.459906402451303,
+ "grad_norm": 0.09376667391500292,
+ "grad_max_sv": 0.017312733735889197,
+ "grad_min_sv": 0.0,
+ "grad_condition": 17312733735.8892,
+ "lr": 0.0007853567838422158,
+ "time_sec": 41.682612657547
+ },
+ {
+ "epoch": 47,
+ "train_loss": 5.24946335647583,
+ "train_acc": 0.0092,
+ "test_loss": 5.037567407989502,
+ "test_acc": 0.01,
+ "lyapunov": 1.464009671260024,
+ "grad_norm": 0.09467776161020446,
+ "grad_max_sv": 0.01866090311668813,
+ "grad_min_sv": 0.0,
+ "grad_condition": 18660903116.688133,
+ "lr": 0.0007766957746216719,
+ "time_sec": 41.71859622001648
+ },
+ {
+ "epoch": 48,
+ "train_loss": 5.2716734535217284,
+ "train_acc": 0.00954,
+ "test_loss": 4.725313116455078,
+ "test_acc": 0.01,
+ "lyapunov": 1.4846527972794554,
+ "grad_norm": 0.12086822830734321,
+ "grad_max_sv": 0.020449956133961677,
+ "grad_min_sv": 0.0,
+ "grad_condition": 20449956133.961678,
+ "lr": 0.0007679133974894982,
+ "time_sec": 41.662288427352905
+ },
+ {
+ "epoch": 49,
+ "train_loss": 5.264281662597656,
+ "train_acc": 0.0094,
+ "test_loss": 4.704328326416015,
+ "test_acc": 0.01,
+ "lyapunov": 1.4808302587255493,
+ "grad_norm": 0.1006442361474557,
+ "grad_max_sv": 0.003648173250257969,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3648173250.257969,
+ "lr": 0.000759013504686565,
+ "time_sec": 41.659945011138916
+ },
+ {
+ "epoch": 50,
+ "train_loss": 5.260963584136963,
+ "train_acc": 0.00864,
+ "test_loss": 4.687705662536621,
+ "test_acc": 0.01,
+ "lyapunov": 1.4764524859845485,
+ "grad_norm": 0.08983274926440024,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007499999999999998,
+ "time_sec": 41.73585891723633
+ },
+ {
+ "epoch": 51,
+ "train_loss": 5.254029862213135,
+ "train_acc": 0.00892,
+ "test_loss": 4.650592637634277,
+ "test_acc": 0.01,
+ "lyapunov": 1.4702172300699727,
+ "grad_norm": 0.08943196133143812,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007408768370508575,
+ "time_sec": 41.63914966583252
+ },
+ {
+ "epoch": 52,
+ "train_loss": 5.253371743927002,
+ "train_acc": 0.00914,
+ "test_loss": 4.651584497070313,
+ "test_acc": 0.01,
+ "lyapunov": 1.469337931984221,
+ "grad_norm": 0.09050035162045282,
+ "grad_max_sv": 0.00823306110687554,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8233061106.875539,
+ "lr": 0.0007316480175599307,
+ "time_sec": 41.676894187927246
+ },
+ {
+ "epoch": 53,
+ "train_loss": 5.25479355255127,
+ "train_acc": 0.00884,
+ "test_loss": 4.6638921875,
+ "test_acc": 0.01,
+ "lyapunov": 1.4709156809560477,
+ "grad_norm": 0.0923409314747527,
+ "grad_max_sv": 0.01720760380849242,
+ "grad_min_sv": 0.0,
+ "grad_condition": 17207603808.492424,
+ "lr": 0.0007223175895924635,
+ "time_sec": 41.68897199630737
+ },
+ {
+ "epoch": 54,
+ "train_loss": 5.255663233642578,
+ "train_acc": 0.0087,
+ "test_loss": 4.690281636047363,
+ "test_acc": 0.01,
+ "lyapunov": 1.4720432532717809,
+ "grad_norm": 0.09116086408440177,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007128896457825361,
+ "time_sec": 41.65702509880066
+ },
+ {
+ "epoch": 55,
+ "train_loss": 5.255450089111328,
+ "train_acc": 0.0089,
+ "test_loss": 4.664666540527343,
+ "test_acc": 0.01,
+ "lyapunov": 1.4717262035135723,
+ "grad_norm": 0.08960989934748306,
+ "grad_max_sv": 0.0027584049850702284,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2758404985.0702286,
+ "lr": 0.0007033683215378998,
+ "time_sec": 41.68492293357849
+ },
+ {
+ "epoch": 56,
+ "train_loss": 5.25642558013916,
+ "train_acc": 0.00918,
+ "test_loss": 4.672654594421386,
+ "test_acc": 0.01,
+ "lyapunov": 1.4729856798411025,
+ "grad_norm": 0.08842004194228453,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006937577932260512,
+ "time_sec": 41.66422128677368
+ },
+ {
+ "epoch": 57,
+ "train_loss": 5.256343665313721,
+ "train_acc": 0.00928,
+ "test_loss": 4.675612693786621,
+ "test_acc": 0.01,
+ "lyapunov": 1.4728102668776841,
+ "grad_norm": 0.0894492177832343,
+ "grad_max_sv": 0.003824355313554406,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3824355313.554406,
+ "lr": 0.0006840622763423388,
+ "time_sec": 41.66166043281555
+ },
+ {
+ "epoch": 58,
+ "train_loss": 5.256470738372803,
+ "train_acc": 0.00846,
+ "test_loss": 4.673555949401855,
+ "test_acc": 0.01,
+ "lyapunov": 1.473022796918669,
+ "grad_norm": 0.09415093095699927,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006742860236609073,
+ "time_sec": 41.72664546966553
+ },
+ {
+ "epoch": 59,
+ "train_loss": 5.257105118560791,
+ "train_acc": 0.0089,
+ "test_loss": 4.662265467834473,
+ "test_acc": 0.01,
+ "lyapunov": 1.4737855485638085,
+ "grad_norm": 0.08933320536804817,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006644333233692913,
+ "time_sec": 41.683704137802124
+ },
+ {
+ "epoch": 60,
+ "train_loss": 5.2567843800354,
+ "train_acc": 0.00894,
+ "test_loss": 4.67973249130249,
+ "test_acc": 0.01,
+ "lyapunov": 1.4734186650542043,
+ "grad_norm": 0.08845010319296705,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006545084971874734,
+ "time_sec": 41.65764546394348
+ },
+ {
+ "epoch": 61,
+ "train_loss": 5.2586814794921874,
+ "train_acc": 0.00832,
+ "test_loss": 4.66929153137207,
+ "test_acc": 0.01,
+ "lyapunov": 1.4755458350071822,
+ "grad_norm": 0.08796570828809193,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006445158984722354,
+ "time_sec": 41.66641640663147
+ },
+ {
+ "epoch": 62,
+ "train_loss": 5.257138239135743,
+ "train_acc": 0.00822,
+ "test_loss": 4.672049102783203,
+ "test_acc": 0.01,
+ "lyapunov": 1.4738077528946234,
+ "grad_norm": 0.08897000656850247,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006344599103076324,
+ "time_sec": 41.66154670715332
+ },
+ {
+ "epoch": 63,
+ "train_loss": 5.25840109664917,
+ "train_acc": 0.00872,
+ "test_loss": 4.668118723297119,
+ "test_acc": 0.01,
+ "lyapunov": 1.4752026089012165,
+ "grad_norm": 0.08994871774610383,
+ "grad_max_sv": 0.0018751383759081364,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1875138375.9081364,
+ "lr": 0.0006243449435824269,
+ "time_sec": 41.65010213851929
+ },
+ {
+ "epoch": 64,
+ "train_loss": 5.259331801910401,
+ "train_acc": 0.009,
+ "test_loss": 4.6509183990478515,
+ "test_acc": 0.01,
+ "lyapunov": 1.4761373133915465,
+ "grad_norm": 0.09230518416704733,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006141754350553275,
+ "time_sec": 41.68602395057678
+ },
+ {
+ "epoch": 65,
+ "train_loss": 5.259325382080078,
+ "train_acc": 0.00842,
+ "test_loss": 4.649483604431152,
+ "test_acc": 0.01,
+ "lyapunov": 1.4762441697327986,
+ "grad_norm": 0.09181035955304583,
+ "grad_max_sv": 0.002657032757997513,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2657032757.997513,
+ "lr": 0.0006039558454088793,
+ "time_sec": 41.649319648742676
+ },
+ {
+ "epoch": 66,
+ "train_loss": 5.258703485870361,
+ "train_acc": 0.0089,
+ "test_loss": 4.659050286865234,
+ "test_acc": 0.01,
+ "lyapunov": 1.475566557911046,
+ "grad_norm": 0.08911107124283034,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000593690657292862,
+ "time_sec": 41.66279911994934
+ },
+ {
+ "epoch": 67,
+ "train_loss": 5.258656344146728,
+ "train_acc": 0.00868,
+ "test_loss": 4.652145028686523,
+ "test_acc": 0.01,
+ "lyapunov": 1.4755408843155102,
+ "grad_norm": 0.08984660357930904,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005833843733580507,
+ "time_sec": 41.65086126327515
+ },
+ {
+ "epoch": 68,
+ "train_loss": 5.259207654724121,
+ "train_acc": 0.00934,
+ "test_loss": 4.644708920288086,
+ "test_acc": 0.01,
+ "lyapunov": 1.476156848470878,
+ "grad_norm": 0.08930414014303266,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005730415142812054,
+ "time_sec": 41.6753249168396
+ },
+ {
+ "epoch": 69,
+ "train_loss": 5.259739582061767,
+ "train_acc": 0.00962,
+ "test_loss": 4.635655142974853,
+ "test_acc": 0.01,
+ "lyapunov": 1.4767807136716136,
+ "grad_norm": 0.08868883564267036,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005626666167821517,
+ "time_sec": 41.6395525932312
+ },
+ {
+ "epoch": 70,
+ "train_loss": 5.258972863311768,
+ "train_acc": 0.0098,
+ "test_loss": 4.630142547607422,
+ "test_acc": 0.01,
+ "lyapunov": 1.4758698986009564,
+ "grad_norm": 0.08847186803439672,
+ "grad_max_sv": 0.0013374987989664077,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1337498798.9664078,
+ "lr": 0.0005522642316338265,
+ "time_sec": 41.64910697937012
+ },
+ {
+ "epoch": 71,
+ "train_loss": 5.259250410003662,
+ "train_acc": 0.00816,
+ "test_loss": 4.623734491729737,
+ "test_acc": 0.01,
+ "lyapunov": 1.4762009812133086,
+ "grad_norm": 0.0884158256705388,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005418389216661573,
+ "time_sec": 41.65673208236694
+ },
+ {
+ "epoch": 72,
+ "train_loss": 5.260035207519532,
+ "train_acc": 0.00856,
+ "test_loss": 4.622923696899414,
+ "test_acc": 0.01,
+ "lyapunov": 1.4770802146638446,
+ "grad_norm": 0.08974113871672654,
+ "grad_max_sv": 0.00768307838588953,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7683078385.889531,
+ "lr": 0.0005313952597646563,
+ "time_sec": 41.65725779533386
+ },
+ {
+ "epoch": 73,
+ "train_loss": 5.258972092895508,
+ "train_acc": 0.0089,
+ "test_loss": 4.627894605255127,
+ "test_acc": 0.01,
+ "lyapunov": 1.4759459010780316,
+ "grad_norm": 0.08863002112233408,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005209378268645994,
+ "time_sec": 41.67947006225586
+ },
+ {
+ "epoch": 74,
+ "train_loss": 5.260160232849121,
+ "train_acc": 0.00854,
+ "test_loss": 4.623137206268311,
+ "test_acc": 0.01,
+ "lyapunov": 1.4772573081428741,
+ "grad_norm": 0.09051043005437374,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005104712099416781,
+ "time_sec": 41.64360570907593
+ },
+ {
+ "epoch": 75,
+ "train_loss": 5.261452306213379,
+ "train_acc": 0.0086,
+ "test_loss": 4.62108766708374,
+ "test_acc": 0.01,
+ "lyapunov": 1.478764491617832,
+ "grad_norm": 0.08870478754258258,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004999999999999996,
+ "time_sec": 41.64626455307007
+ },
+ {
+ "epoch": 76,
+ "train_loss": 5.2611726042175295,
+ "train_acc": 0.00886,
+ "test_loss": 4.623955220794678,
+ "test_acc": 0.01,
+ "lyapunov": 1.4784429673953434,
+ "grad_norm": 0.08878094000275963,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004895287900583212,
+ "time_sec": 41.656346797943115
+ },
+ {
+ "epoch": 77,
+ "train_loss": 5.261820520782471,
+ "train_acc": 0.00874,
+ "test_loss": 4.61466668548584,
+ "test_acc": 0.01,
+ "lyapunov": 1.479163033273214,
+ "grad_norm": 0.088273880644991,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004790621731353997,
+ "time_sec": 41.629544734954834
+ },
+ {
+ "epoch": 78,
+ "train_loss": 5.262518656311035,
+ "train_acc": 0.00864,
+ "test_loss": 4.618248620605469,
+ "test_acc": 0.01,
+ "lyapunov": 1.4799401089358513,
+ "grad_norm": 0.08861130102060333,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000468604740235343,
+ "time_sec": 41.636940240859985
+ },
+ {
+ "epoch": 79,
+ "train_loss": 5.262553581237793,
+ "train_acc": 0.009,
+ "test_loss": 4.612181239318848,
+ "test_acc": 0.01,
+ "lyapunov": 1.4799358280723358,
+ "grad_norm": 0.0903783960157925,
+ "grad_max_sv": 0.01033918051980436,
+ "grad_min_sv": 0.0,
+ "grad_condition": 10339180519.80436,
+ "lr": 0.00045816107833384175,
+ "time_sec": 41.68020677566528
+ },
+ {
+ "epoch": 80,
+ "train_loss": 5.261878743896484,
+ "train_acc": 0.00886,
+ "test_loss": 4.612385320281982,
+ "test_acc": 0.01,
+ "lyapunov": 1.4792317411173945,
+ "grad_norm": 0.08815903777083657,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004477357683661729,
+ "time_sec": 41.65713667869568
+ },
+ {
+ "epoch": 81,
+ "train_loss": 5.270162540740967,
+ "train_acc": 0.00948,
+ "test_loss": 4.61169965209961,
+ "test_acc": 0.01,
+ "lyapunov": 1.4845762399151503,
+ "grad_norm": 0.08933321451984454,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00043733338321784746,
+ "time_sec": 41.67780160903931
+ },
+ {
+ "epoch": 82,
+ "train_loss": 5.261875872955322,
+ "train_acc": 0.00904,
+ "test_loss": 4.612089576721192,
+ "test_acc": 0.01,
+ "lyapunov": 1.47926344438587,
+ "grad_norm": 0.08839554451712253,
+ "grad_max_sv": 0.0006388438399881124,
+ "grad_min_sv": 0.0,
+ "grad_condition": 638843839.9881124,
+ "lr": 0.0004269584857187939,
+ "time_sec": 41.646398305892944
+ },
+ {
+ "epoch": 83,
+ "train_loss": 5.260851752319336,
+ "train_acc": 0.00926,
+ "test_loss": 4.605935791778564,
+ "test_acc": 0.01,
+ "lyapunov": 1.4780823766727886,
+ "grad_norm": 0.08881372923156301,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004166156266419484,
+ "time_sec": 41.64280557632446
+ },
+ {
+ "epoch": 84,
+ "train_loss": 5.261813834838867,
+ "train_acc": 0.0087,
+ "test_loss": 4.608912050628662,
+ "test_acc": 0.01,
+ "lyapunov": 1.4791915989897746,
+ "grad_norm": 0.08828411260554986,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004063093427071373,
+ "time_sec": 41.650211811065674
+ },
+ {
+ "epoch": 85,
+ "train_loss": 5.26105229888916,
+ "train_acc": 0.00876,
+ "test_loss": 4.607143463134766,
+ "test_acc": 0.01,
+ "lyapunov": 1.4783552308826495,
+ "grad_norm": 0.08801037770330913,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003960441545911199,
+ "time_sec": 41.64579463005066
+ },
+ {
+ "epoch": 86,
+ "train_loss": 5.262948518676758,
+ "train_acc": 0.0089,
+ "test_loss": 4.605761601257324,
+ "test_acc": 0.01,
+ "lyapunov": 1.4804744302769146,
+ "grad_norm": 0.08824824639135734,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003858245649446718,
+ "time_sec": 41.694432497024536
+ },
+ {
+ "epoch": 87,
+ "train_loss": 5.261626904449463,
+ "train_acc": 0.00888,
+ "test_loss": 4.605769618988037,
+ "test_acc": 0.01,
+ "lyapunov": 1.4789858986349667,
+ "grad_norm": 0.08846494510980996,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00037565505641757235,
+ "time_sec": 41.681015491485596
+ },
+ {
+ "epoch": 88,
+ "train_loss": 5.262741643371582,
+ "train_acc": 0.00854,
+ "test_loss": 4.60517066192627,
+ "test_acc": 0.01,
+ "lyapunov": 1.4802151354377533,
+ "grad_norm": 0.08805740561566744,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00036554008969236695,
+ "time_sec": 41.71163582801819
+ },
+ {
+ "epoch": 89,
+ "train_loss": 5.263213445281982,
+ "train_acc": 0.00854,
+ "test_loss": 4.605359262847901,
+ "test_acc": 0.01,
+ "lyapunov": 1.480777892005413,
+ "grad_norm": 0.08816151399502117,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003554841015277638,
+ "time_sec": 41.67105174064636
+ },
+ {
+ "epoch": 90,
+ "train_loss": 5.262189238433838,
+ "train_acc": 0.00928,
+ "test_loss": 4.605318756103515,
+ "test_acc": 0.01,
+ "lyapunov": 1.4796337014269036,
+ "grad_norm": 0.08930367772167215,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000345491502812526,
+ "time_sec": 41.640591859817505
+ },
+ {
+ "epoch": 91,
+ "train_loss": 5.261863013916016,
+ "train_acc": 0.00846,
+ "test_loss": 4.605316780853271,
+ "test_acc": 0.01,
+ "lyapunov": 1.4792772080282421,
+ "grad_norm": 0.08825121039889311,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003355666766307081,
+ "time_sec": 41.705339193344116
+ },
+ {
+ "epoch": 92,
+ "train_loss": 5.263724805908203,
+ "train_acc": 0.0084,
+ "test_loss": 4.605317385101318,
+ "test_acc": 0.01,
+ "lyapunov": 1.4813950381925345,
+ "grad_norm": 0.0876042035379079,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00032571397633909225,
+ "time_sec": 41.64047455787659
+ },
+ {
+ "epoch": 93,
+ "train_loss": 5.263348481750488,
+ "train_acc": 0.00826,
+ "test_loss": 4.605170777893067,
+ "test_acc": 0.01,
+ "lyapunov": 1.480857576250725,
+ "grad_norm": 0.09205208782948476,
+ "grad_max_sv": 0.007683574734255671,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7683574734.2556715,
+ "lr": 0.00031593772365766094,
+ "time_sec": 41.66976022720337
+ },
+ {
+ "epoch": 94,
+ "train_loss": 5.263678814697266,
+ "train_acc": 0.0087,
+ "test_loss": 4.605170695495605,
+ "test_acc": 0.01,
+ "lyapunov": 1.481314537775181,
+ "grad_norm": 0.09018876116473232,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003062422067739483,
+ "time_sec": 41.65629434585571
+ },
+ {
+ "epoch": 95,
+ "train_loss": 5.262105151977539,
+ "train_acc": 0.00832,
+ "test_loss": 4.605170751190186,
+ "test_acc": 0.01,
+ "lyapunov": 1.479619727110314,
+ "grad_norm": 0.08829391493330081,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00029663167846209965,
+ "time_sec": 41.637601375579834
+ },
+ {
+ "epoch": 96,
+ "train_loss": 5.261454503326416,
+ "train_acc": 0.00892,
+ "test_loss": 4.605170954895019,
+ "test_acc": 0.01,
+ "lyapunov": 1.4788271173491807,
+ "grad_norm": 0.08829025030553274,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00028711035421746345,
+ "time_sec": 41.64588212966919
+ },
+ {
+ "epoch": 97,
+ "train_loss": 5.2617424992370605,
+ "train_acc": 0.00796,
+ "test_loss": 4.605170453643799,
+ "test_acc": 0.01,
+ "lyapunov": 1.4791636610275034,
+ "grad_norm": 0.08832466346515266,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00027768241040753615,
+ "time_sec": 41.67742967605591
+ },
+ {
+ "epoch": 98,
+ "train_loss": 5.263716314086914,
+ "train_acc": 0.00858,
+ "test_loss": 4.605170697784424,
+ "test_acc": 0.01,
+ "lyapunov": 1.4813884213147566,
+ "grad_norm": 0.08840081765609732,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00026835198244006903,
+ "time_sec": 41.668766260147095
+ },
+ {
+ "epoch": 99,
+ "train_loss": 5.263833166656494,
+ "train_acc": 0.0087,
+ "test_loss": 4.605170695495605,
+ "test_acc": 0.01,
+ "lyapunov": 1.4815085251313036,
+ "grad_norm": 0.08792820202741711,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002591231629491421,
+ "time_sec": 41.66829442977905
+ },
+ {
+ "epoch": 100,
+ "train_loss": 5.262581251525879,
+ "train_acc": 0.00938,
+ "test_loss": 4.605170309448242,
+ "test_acc": 0.01,
+ "lyapunov": 1.480138891188385,
+ "grad_norm": 0.08832421824906611,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002499999999999997,
+ "time_sec": 41.68127655982971
+ },
+ {
+ "epoch": 101,
+ "train_loss": 5.263155633087158,
+ "train_acc": 0.00926,
+ "test_loss": 4.605170729064941,
+ "test_acc": 0.01,
+ "lyapunov": 1.480774727928669,
+ "grad_norm": 0.08869235909302142,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00024098649531343477,
+ "time_sec": 41.64776301383972
+ },
+ {
+ "epoch": 102,
+ "train_loss": 5.263860197906494,
+ "train_acc": 0.00848,
+ "test_loss": 4.6051703002929685,
+ "test_acc": 0.01,
+ "lyapunov": 1.4815483535342204,
+ "grad_norm": 0.08903961910912474,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002320866025105016,
+ "time_sec": 41.674145460128784
+ },
+ {
+ "epoch": 103,
+ "train_loss": 5.262970734710693,
+ "train_acc": 0.00884,
+ "test_loss": 4.605170517730713,
+ "test_acc": 0.01,
+ "lyapunov": 1.4805596624798787,
+ "grad_norm": 0.08876501131615566,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002233042253783278,
+ "time_sec": 41.65722608566284
+ },
+ {
+ "epoch": 104,
+ "train_loss": 5.26228626159668,
+ "train_acc": 0.00864,
+ "test_loss": 4.6051704086303715,
+ "test_acc": 0.01,
+ "lyapunov": 1.4798069201466981,
+ "grad_norm": 0.08768680006785402,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000214643216157784,
+ "time_sec": 41.67565131187439
+ },
+ {
+ "epoch": 105,
+ "train_loss": 5.262674415435791,
+ "train_acc": 0.00838,
+ "test_loss": 4.6051702949523925,
+ "test_acc": 0.01,
+ "lyapunov": 1.480235590654261,
+ "grad_norm": 0.08782166200414132,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00020610737385376332,
+ "time_sec": 41.69558024406433
+ },
+ {
+ "epoch": 106,
+ "train_loss": 5.261244326171875,
+ "train_acc": 0.00838,
+ "test_loss": 4.605170240020752,
+ "test_acc": 0.01,
+ "lyapunov": 1.4786384803864656,
+ "grad_norm": 0.08788578987148214,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00019770044256881242,
+ "time_sec": 41.650753021240234
+ },
+ {
+ "epoch": 107,
+ "train_loss": 5.261433357849121,
+ "train_acc": 0.00904,
+ "test_loss": 4.605170213317871,
+ "test_acc": 0.01,
+ "lyapunov": 1.47886505273297,
+ "grad_norm": 0.08770929414544659,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001894261098608447,
+ "time_sec": 41.68164348602295
+ },
+ {
+ "epoch": 108,
+ "train_loss": 5.263026925201416,
+ "train_acc": 0.009,
+ "test_loss": 4.60517043762207,
+ "test_acc": 0.01,
+ "lyapunov": 1.480643398621503,
+ "grad_norm": 0.08785423875011682,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000181288005125655,
+ "time_sec": 41.660765647888184
+ },
+ {
+ "epoch": 109,
+ "train_loss": 5.263078652801513,
+ "train_acc": 0.00816,
+ "test_loss": 4.605601066589355,
+ "test_acc": 0.01,
+ "lyapunov": 1.4807295979136397,
+ "grad_norm": 0.08803442353918925,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001732896980049473,
+ "time_sec": 41.66913390159607
+ },
+ {
+ "epoch": 110,
+ "train_loss": 5.263812705535889,
+ "train_acc": 0.00886,
+ "test_loss": 4.605602632141113,
+ "test_acc": 0.01,
+ "lyapunov": 1.4815696554110789,
+ "grad_norm": 0.08891727786082522,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00016543469682057076,
+ "time_sec": 41.659369230270386
+ },
+ {
+ "epoch": 111,
+ "train_loss": 5.262115261535644,
+ "train_acc": 0.0078,
+ "test_loss": 4.605170052337646,
+ "test_acc": 0.01,
+ "lyapunov": 1.479651604771919,
+ "grad_norm": 0.08875181240277763,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00015772644703565552,
+ "time_sec": 41.70141959190369
+ },
+ {
+ "epoch": 112,
+ "train_loss": 5.261109837646484,
+ "train_acc": 0.00874,
+ "test_loss": 4.605170468139648,
+ "test_acc": 0.01,
+ "lyapunov": 1.4785008156086172,
+ "grad_norm": 0.08816074014970703,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00015016832974331713,
+ "time_sec": 41.72004580497742
+ },
+ {
+ "epoch": 113,
+ "train_loss": 5.262560579681397,
+ "train_acc": 0.0086,
+ "test_loss": 4.6051704193115235,
+ "test_acc": 0.01,
+ "lyapunov": 1.4801284751623793,
+ "grad_norm": 0.08840941179148938,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00014276366018359834,
+ "time_sec": 41.699143409729004
+ },
+ {
+ "epoch": 114,
+ "train_loss": 5.263074327697754,
+ "train_acc": 0.00886,
+ "test_loss": 4.605170431518554,
+ "test_acc": 0.01,
+ "lyapunov": 1.4807007001793904,
+ "grad_norm": 0.08821068724217689,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00013551568628929425,
+ "time_sec": 41.67876648902893
+ },
+ {
+ "epoch": 115,
+ "train_loss": 5.262186526947022,
+ "train_acc": 0.0086,
+ "test_loss": 4.60517013092041,
+ "test_acc": 0.01,
+ "lyapunov": 1.4797226050320793,
+ "grad_norm": 0.0883831455880719,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00012842758726130276,
+ "time_sec": 41.696322202682495
+ },
+ {
+ "epoch": 116,
+ "train_loss": 5.263145412445068,
+ "train_acc": 0.00836,
+ "test_loss": 4.605170120239258,
+ "test_acc": 0.01,
+ "lyapunov": 1.480826344026629,
+ "grad_norm": 0.08792566727039719,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001215024721741218,
+ "time_sec": 41.70669603347778
+ },
+ {
+ "epoch": 117,
+ "train_loss": 5.263297129516602,
+ "train_acc": 0.00834,
+ "test_loss": 4.60517033996582,
+ "test_acc": 0.01,
+ "lyapunov": 1.4809697009718326,
+ "grad_norm": 0.0880297462141732,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00011474337861210538,
+ "time_sec": 41.66155934333801
+ },
+ {
+ "epoch": 118,
+ "train_loss": 5.263041806030273,
+ "train_acc": 0.00838,
+ "test_loss": 4.605170127868653,
+ "test_acc": 0.01,
+ "lyapunov": 1.4806942784267922,
+ "grad_norm": 0.0885706870416634,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010815327133708009,
+ "time_sec": 41.6468141078949
+ },
+ {
+ "epoch": 119,
+ "train_loss": 5.2626050819396974,
+ "train_acc": 0.00882,
+ "test_loss": 4.6051702911376955,
+ "test_acc": 0.01,
+ "lyapunov": 1.4802038822027728,
+ "grad_norm": 0.08805401420662645,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010173504098790182,
+ "time_sec": 41.67359256744385
+ },
+ {
+ "epoch": 120,
+ "train_loss": 5.262915015411377,
+ "train_acc": 0.00904,
+ "test_loss": 4.605170024108887,
+ "test_acc": 0.01,
+ "lyapunov": 1.4805879507528241,
+ "grad_norm": 0.08796658508917193,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 41.736050844192505
+ },
+ {
+ "epoch": 121,
+ "train_loss": 5.263114930877686,
+ "train_acc": 0.0083,
+ "test_loss": 4.605170388031006,
+ "test_acc": 0.01,
+ "lyapunov": 1.4807836167952593,
+ "grad_norm": 0.08806195734422055,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 41.839574337005615
+ },
+ {
+ "epoch": 122,
+ "train_loss": 5.262788164825439,
+ "train_acc": 0.00866,
+ "test_loss": 4.605170208740234,
+ "test_acc": 0.01,
+ "lyapunov": 1.4804405013618567,
+ "grad_norm": 0.08816097534558247,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 41.688995599746704
+ },
+ {
+ "epoch": 123,
+ "train_loss": 5.26315210357666,
+ "train_acc": 0.00874,
+ "test_loss": 4.60517013168335,
+ "test_acc": 0.01,
+ "lyapunov": 1.480828346498787,
+ "grad_norm": 0.08865951427268862,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 41.67227745056152
+ },
+ {
+ "epoch": 124,
+ "train_loss": 5.261944111022949,
+ "train_acc": 0.00914,
+ "test_loss": 4.605170402526856,
+ "test_acc": 0.01,
+ "lyapunov": 1.4794809848756132,
+ "grad_norm": 0.08788803702349164,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 41.66115140914917
+ },
+ {
+ "epoch": 125,
+ "train_loss": 5.262568561401367,
+ "train_acc": 0.0084,
+ "test_loss": 4.60517010345459,
+ "test_acc": 0.01,
+ "lyapunov": 1.4801926018331972,
+ "grad_norm": 0.08788675914126909,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 41.66165113449097
+ },
+ {
+ "epoch": 126,
+ "train_loss": 5.262280065460205,
+ "train_acc": 0.00902,
+ "test_loss": 4.605170187377929,
+ "test_acc": 0.01,
+ "lyapunov": 1.479902151295596,
+ "grad_norm": 0.08819775554912056,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 41.69537806510925
+ },
+ {
+ "epoch": 127,
+ "train_loss": 5.263674239196777,
+ "train_acc": 0.00884,
+ "test_loss": 4.605170446777343,
+ "test_acc": 0.01,
+ "lyapunov": 1.48142600425369,
+ "grad_norm": 0.08796249954554257,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 41.79696488380432
+ },
+ {
+ "epoch": 128,
+ "train_loss": 5.270508392181396,
+ "train_acc": 0.00774,
+ "test_loss": 4.6051702003479,
+ "test_acc": 0.01,
+ "lyapunov": 1.4854568767425653,
+ "grad_norm": 0.0903277044807366,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 41.78498363494873
+ },
+ {
+ "epoch": 129,
+ "train_loss": 5.264521000213623,
+ "train_acc": 0.00884,
+ "test_loss": 4.60517049331665,
+ "test_acc": 0.01,
+ "lyapunov": 1.4823556894536518,
+ "grad_norm": 0.08791573530006377,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 41.75825619697571
+ },
+ {
+ "epoch": 130,
+ "train_loss": 5.263497207641602,
+ "train_acc": 0.00856,
+ "test_loss": 4.605170115661621,
+ "test_acc": 0.01,
+ "lyapunov": 1.4812386575562264,
+ "grad_norm": 0.08821103937271832,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 41.753769874572754
+ },
+ {
+ "epoch": 131,
+ "train_loss": 5.262869830932617,
+ "train_acc": 0.00886,
+ "test_loss": 4.605170347595215,
+ "test_acc": 0.01,
+ "lyapunov": 1.4805735938079523,
+ "grad_norm": 0.08785954608269858,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 41.688891649246216
+ },
+ {
+ "epoch": 132,
+ "train_loss": 5.261720856323242,
+ "train_acc": 0.0092,
+ "test_loss": 4.605170230865479,
+ "test_acc": 0.01,
+ "lyapunov": 1.4792467572195145,
+ "grad_norm": 0.087651258765062,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 41.77381873130798
+ },
+ {
+ "epoch": 133,
+ "train_loss": 5.262511810150147,
+ "train_acc": 0.0094,
+ "test_loss": 4.605170274353028,
+ "test_acc": 0.01,
+ "lyapunov": 1.480145969354283,
+ "grad_norm": 0.08750516435565067,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 41.82425284385681
+ },
+ {
+ "epoch": 134,
+ "train_loss": 5.2628221615600586,
+ "train_acc": 0.009,
+ "test_loss": 4.605170260620117,
+ "test_acc": 0.01,
+ "lyapunov": 1.480488061295141,
+ "grad_norm": 0.08767200957157907,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 41.67008709907532
+ },
+ {
+ "epoch": 135,
+ "train_loss": 5.262214541320801,
+ "train_acc": 0.00906,
+ "test_loss": 4.605170357513428,
+ "test_acc": 0.01,
+ "lyapunov": 1.479800993524244,
+ "grad_norm": 0.08833622992837174,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 41.68112754821777
+ },
+ {
+ "epoch": 136,
+ "train_loss": 5.261716612854004,
+ "train_acc": 0.00888,
+ "test_loss": 4.605170449829101,
+ "test_acc": 0.01,
+ "lyapunov": 1.4792663523608156,
+ "grad_norm": 0.0879915508382305,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 41.70846509933472
+ },
+ {
+ "epoch": 137,
+ "train_loss": 5.2621297309875485,
+ "train_acc": 0.00882,
+ "test_loss": 4.6051704208374025,
+ "test_acc": 0.01,
+ "lyapunov": 1.4797221123410003,
+ "grad_norm": 0.08806309329797692,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 41.68800139427185
+ },
+ {
+ "epoch": 138,
+ "train_loss": 5.262034148254394,
+ "train_acc": 0.009,
+ "test_loss": 4.6051704246520995,
+ "test_acc": 0.01,
+ "lyapunov": 1.4796448052691682,
+ "grad_norm": 0.08834842868525353,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 41.69483256340027
+ },
+ {
+ "epoch": 139,
+ "train_loss": 5.262303157958985,
+ "train_acc": 0.00964,
+ "test_loss": 4.605170336914062,
+ "test_acc": 0.01,
+ "lyapunov": 1.479908719696962,
+ "grad_norm": 0.08774925576434625,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 41.66975927352905
+ },
+ {
+ "epoch": 140,
+ "train_loss": 5.262272278747559,
+ "train_acc": 0.0093,
+ "test_loss": 4.60517025756836,
+ "test_acc": 0.01,
+ "lyapunov": 1.4799000518706145,
+ "grad_norm": 0.08772068441716457,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 41.66502594947815
+ },
+ {
+ "epoch": 141,
+ "train_loss": 5.262688246459961,
+ "train_acc": 0.01,
+ "test_loss": 4.605170532226563,
+ "test_acc": 0.01,
+ "lyapunov": 1.4803482586770411,
+ "grad_norm": 0.08814041677323237,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 41.68389272689819
+ },
+ {
+ "epoch": 142,
+ "train_loss": 5.2666687211608885,
+ "train_acc": 0.01,
+ "test_loss": 4.605170266723633,
+ "test_acc": 0.01,
+ "lyapunov": 1.4834284483624236,
+ "grad_norm": 0.08808456177000348,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 41.70149374008179
+ },
+ {
+ "epoch": 143,
+ "train_loss": 5.2625910409545895,
+ "train_acc": 0.00962,
+ "test_loss": 4.605170193481445,
+ "test_acc": 0.01,
+ "lyapunov": 1.4802313485108982,
+ "grad_norm": 0.08826750361435122,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 41.675010204315186
+ },
+ {
+ "epoch": 144,
+ "train_loss": 5.260678899536133,
+ "train_acc": 0.01,
+ "test_loss": 4.60517022857666,
+ "test_acc": 0.01,
+ "lyapunov": 1.4781028556701776,
+ "grad_norm": 0.08826672055694883,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 41.67730474472046
+ },
+ {
+ "epoch": 145,
+ "train_loss": 5.262034167785645,
+ "train_acc": 0.01,
+ "test_loss": 4.605170384216309,
+ "test_acc": 0.01,
+ "lyapunov": 1.47965680668726,
+ "grad_norm": 0.08792698291184464,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 41.711742639541626
+ },
+ {
+ "epoch": 146,
+ "train_loss": 5.262125458984375,
+ "train_acc": 0.01,
+ "test_loss": 4.605170105743408,
+ "test_acc": 0.01,
+ "lyapunov": 1.4797236641959461,
+ "grad_norm": 0.0878274682773103,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 41.72946882247925
+ },
+ {
+ "epoch": 147,
+ "train_loss": 5.263207815246582,
+ "train_acc": 0.01,
+ "test_loss": 4.605170260620117,
+ "test_acc": 0.01,
+ "lyapunov": 1.4809288390152289,
+ "grad_norm": 0.08780070915999844,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 41.724937438964844
+ },
+ {
+ "epoch": 148,
+ "train_loss": 5.262101231384277,
+ "train_acc": 0.01,
+ "test_loss": 4.605170335388183,
+ "test_acc": 0.01,
+ "lyapunov": 1.4797268191261974,
+ "grad_norm": 0.08811462011437057,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 41.86608529090881
+ },
+ {
+ "epoch": 149,
+ "train_loss": 5.26564047592163,
+ "train_acc": 0.01,
+ "test_loss": 4.605170273590088,
+ "test_acc": 0.01,
+ "lyapunov": 1.4827746887646063,
+ "grad_norm": 0.088563737069616,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 41.668235540390015
+ },
+ {
+ "epoch": 150,
+ "train_loss": 5.263033789978027,
+ "train_acc": 0.01,
+ "test_loss": 4.605170249176026,
+ "test_acc": 0.01,
+ "lyapunov": 1.480735678197173,
+ "grad_norm": 0.08808051231477661,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0,
+ "time_sec": 41.65666699409485
+ }
+ ],
+ "8": [
+ {
+ "epoch": 1,
+ "train_loss": 5.146603754577637,
+ "train_acc": 0.02116,
+ "test_loss": 4.799143431091308,
+ "test_acc": 0.0147,
+ "lyapunov": 2.247725067846001,
+ "grad_norm": 5.759558294617595,
+ "grad_max_sv": 4.593458223342895,
+ "grad_min_sv": 9.939812799508729e-08,
+ "grad_condition": 84468621.05560377,
+ "lr": 0.0009998903417374227,
+ "time_sec": 86.99692106246948
+ },
+ {
+ "epoch": 2,
+ "train_loss": 4.751044019317627,
+ "train_acc": 0.0261,
+ "test_loss": 4.781899060058594,
+ "test_acc": 0.0112,
+ "lyapunov": 1.7586963832225946,
+ "grad_norm": 3.669503755077576,
+ "grad_max_sv": 2.629068848490715,
+ "grad_min_sv": 6.128463263532779e-08,
+ "grad_condition": 51408050.19515464,
+ "lr": 0.0009995614150494292,
+ "time_sec": 86.99053359031677
+ },
+ {
+ "epoch": 3,
+ "train_loss": 4.5855533428955075,
+ "train_acc": 0.0302,
+ "test_loss": 4.783446264648438,
+ "test_acc": 0.0204,
+ "lyapunov": 1.650954161458613,
+ "grad_norm": 1.8760355114337364,
+ "grad_max_sv": 1.30306978225708,
+ "grad_min_sv": 3.0873310079282404e-08,
+ "grad_condition": 74135293.70537718,
+ "lr": 0.0009990133642141358,
+ "time_sec": 87.01290392875671
+ },
+ {
+ "epoch": 4,
+ "train_loss": 4.534848844451904,
+ "train_acc": 0.03702,
+ "test_loss": 4.8837289710998535,
+ "test_acc": 0.0149,
+ "lyapunov": 1.5894556011995087,
+ "grad_norm": 1.244556287523884,
+ "grad_max_sv": 0.7792816802859306,
+ "grad_min_sv": 1.8834766013497984e-08,
+ "grad_condition": 45093330.72508425,
+ "lr": 0.0009982464296247522,
+ "time_sec": 87.01876306533813
+ },
+ {
+ "epoch": 5,
+ "train_loss": 4.592422800903321,
+ "train_acc": 0.03296,
+ "test_loss": 4.848946441650391,
+ "test_acc": 0.0145,
+ "lyapunov": 1.5674470586849905,
+ "grad_norm": 0.9784603406000693,
+ "grad_max_sv": 0.5906251654028892,
+ "grad_min_sv": 1.3135394039365212e-08,
+ "grad_condition": 2765173736.408195,
+ "lr": 0.0009972609476841367,
+ "time_sec": 87.06145668029785
+ },
+ {
+ "epoch": 6,
+ "train_loss": 4.617396930847168,
+ "train_acc": 0.03438,
+ "test_loss": 5.069504800415039,
+ "test_acc": 0.0141,
+ "lyapunov": 1.5743840259054434,
+ "grad_norm": 0.8765996249293907,
+ "grad_max_sv": 0.4905373930931091,
+ "grad_min_sv": 1.1570106956413153e-08,
+ "grad_condition": 490506519.64879054,
+ "lr": 0.000996057350657239,
+ "time_sec": 86.98913550376892
+ },
+ {
+ "epoch": 7,
+ "train_loss": 4.673418109436035,
+ "train_acc": 0.03144,
+ "test_loss": 5.083357322692871,
+ "test_acc": 0.01,
+ "lyapunov": 1.5757776337206517,
+ "grad_norm": 0.842980463237632,
+ "grad_max_sv": 0.4635330677032471,
+ "grad_min_sv": 9.801791714218744e-09,
+ "grad_condition": 672093861.9243783,
+ "lr": 0.000994636166481494,
+ "time_sec": 87.02865362167358
+ },
+ {
+ "epoch": 8,
+ "train_loss": 4.715173123626709,
+ "train_acc": 0.02866,
+ "test_loss": 6.969320404052734,
+ "test_acc": 0.01,
+ "lyapunov": 1.572990819621269,
+ "grad_norm": 0.7658102895010526,
+ "grad_max_sv": 0.39840318709611894,
+ "grad_min_sv": 7.909037175684143e-09,
+ "grad_condition": 2689350489.23699,
+ "lr": 0.0009929980185352525,
+ "time_sec": 87.05855631828308
+ },
+ {
+ "epoch": 9,
+ "train_loss": 4.719650735931396,
+ "train_acc": 0.03378,
+ "test_loss": 6.69895283203125,
+ "test_acc": 0.01,
+ "lyapunov": 1.5739632753459998,
+ "grad_norm": 0.6951362665980956,
+ "grad_max_sv": 0.40656831562519075,
+ "grad_min_sv": 9.631129597315046e-09,
+ "grad_condition": 152979631.4939035,
+ "lr": 0.0009911436253643444,
+ "time_sec": 87.04356169700623
+ },
+ {
+ "epoch": 10,
+ "train_loss": 4.785277546691894,
+ "train_acc": 0.03084,
+ "test_loss": 7.56282477722168,
+ "test_acc": 0.01,
+ "lyapunov": 1.5731478392925409,
+ "grad_norm": 0.8027087514422708,
+ "grad_max_sv": 0.4249536793678999,
+ "grad_min_sv": 1.0233699096961427e-08,
+ "grad_condition": 2212458832.3035727,
+ "lr": 0.0009890738003669028,
+ "time_sec": 86.9918863773346
+ },
+ {
+ "epoch": 11,
+ "train_loss": 4.85365997543335,
+ "train_acc": 0.02776,
+ "test_loss": 6.083891798400879,
+ "test_acc": 0.01,
+ "lyapunov": 1.594173707315684,
+ "grad_norm": 0.6228665658651402,
+ "grad_max_sv": 0.3807309426367283,
+ "grad_min_sv": 7.858218521034076e-09,
+ "grad_condition": 142247255.9097917,
+ "lr": 0.00098678945143658,
+ "time_sec": 87.02730226516724
+ },
+ {
+ "epoch": 12,
+ "train_loss": 4.936503148193359,
+ "train_acc": 0.02734,
+ "test_loss": 4.648137149047852,
+ "test_acc": 0.01,
+ "lyapunov": 1.6324983204112333,
+ "grad_norm": 0.8180108242362618,
+ "grad_max_sv": 0.3168713390827179,
+ "grad_min_sv": 6.217847966746067e-09,
+ "grad_condition": 1904828726.2920518,
+ "lr": 0.0009842915805643154,
+ "time_sec": 86.98762059211731
+ },
+ {
+ "epoch": 13,
+ "train_loss": 4.989127286529541,
+ "train_acc": 0.02624,
+ "test_loss": 5.89718906326294,
+ "test_acc": 0.01,
+ "lyapunov": 1.6513543821051908,
+ "grad_norm": 0.8703418944824507,
+ "grad_max_sv": 0.3535689525306225,
+ "grad_min_sv": 6.494354365393917e-09,
+ "grad_condition": 75061975.40179494,
+ "lr": 0.000981581283398829,
+ "time_sec": 86.99741172790527
+ },
+ {
+ "epoch": 14,
+ "train_loss": 5.027360094604492,
+ "train_acc": 0.02734,
+ "test_loss": 5.6859222030639645,
+ "test_acc": 0.01,
+ "lyapunov": 1.66906841667107,
+ "grad_norm": 0.8955015428134906,
+ "grad_max_sv": 0.3326103314757347,
+ "grad_min_sv": 5.961173611852833e-09,
+ "grad_condition": 196184685.20064688,
+ "lr": 0.0009786597487660333,
+ "time_sec": 86.990553855896
+ },
+ {
+ "epoch": 15,
+ "train_loss": 5.103685426635742,
+ "train_acc": 0.0235,
+ "test_loss": 4.620827954101562,
+ "test_acc": 0.01,
+ "lyapunov": 1.6500021161325753,
+ "grad_norm": 0.7165299396921548,
+ "grad_max_sv": 0.29206431321799753,
+ "grad_min_sv": 3.742070758853766e-09,
+ "grad_condition": 11821452317.947672,
+ "lr": 0.0009755282581475766,
+ "time_sec": 86.99919128417969
+ },
+ {
+ "epoch": 16,
+ "train_loss": 5.046826876983642,
+ "train_acc": 0.02808,
+ "test_loss": 4.618471592712402,
+ "test_acc": 0.01,
+ "lyapunov": 1.6286348086183944,
+ "grad_norm": 0.8805208885120411,
+ "grad_max_sv": 0.34881011955440044,
+ "grad_min_sv": 5.4340508724715075e-09,
+ "grad_condition": 607977502.9364278,
+ "lr": 0.0009721881851187403,
+ "time_sec": 87.02350974082947
+ },
+ {
+ "epoch": 17,
+ "train_loss": 5.125038688812256,
+ "train_acc": 0.02188,
+ "test_loss": 5.0374674758911135,
+ "test_acc": 0.01,
+ "lyapunov": 1.6156021630977426,
+ "grad_norm": 0.7664664524159326,
+ "grad_max_sv": 0.31916227340698244,
+ "grad_min_sv": 3.2244314654420098e-09,
+ "grad_condition": 12300439770.56846,
+ "lr": 0.0009686409947459456,
+ "time_sec": 87.0214216709137
+ },
+ {
+ "epoch": 18,
+ "train_loss": 5.1917090243530275,
+ "train_acc": 0.02074,
+ "test_loss": 6.239829849243164,
+ "test_acc": 0.01,
+ "lyapunov": 1.6075686880999513,
+ "grad_norm": 0.8340839537949596,
+ "grad_max_sv": 0.2987551841884851,
+ "grad_min_sv": 1.3384357527406395e-09,
+ "grad_condition": 53090691786.99108,
+ "lr": 0.0009648882429441254,
+ "time_sec": 87.0026741027832
+ },
+ {
+ "epoch": 19,
+ "train_loss": 5.1467557635498045,
+ "train_acc": 0.02224,
+ "test_loss": 4.859098764038086,
+ "test_acc": 0.01,
+ "lyapunov": 1.5547950270840578,
+ "grad_norm": 0.5424186147523934,
+ "grad_max_sv": 0.2584996819496155,
+ "grad_min_sv": 1.7988151973410667e-10,
+ "grad_condition": 42973213975.62498,
+ "lr": 0.00096093157579425,
+ "time_sec": 87.0099880695343
+ },
+ {
+ "epoch": 20,
+ "train_loss": 5.253306176147461,
+ "train_acc": 0.01948,
+ "test_loss": 8.813103515625,
+ "test_acc": 0.01,
+ "lyapunov": 1.5798406722905385,
+ "grad_norm": 0.6790335216715864,
+ "grad_max_sv": 0.2796168942004442,
+ "grad_min_sv": 1.3123472687420754e-09,
+ "grad_condition": 55528903276.005905,
+ "lr": 0.0009567727288213001,
+ "time_sec": 87.00798654556274
+ },
+ {
+ "epoch": 21,
+ "train_loss": 5.3828185322570805,
+ "train_acc": 0.01028,
+ "test_loss": 8.961210163879395,
+ "test_acc": 0.01,
+ "lyapunov": 1.566893112933849,
+ "grad_norm": 0.9785357311156059,
+ "grad_max_sv": 0.4175733871757984,
+ "grad_min_sv": 5.038056967646815e-09,
+ "grad_condition": 2576596333.756474,
+ "lr": 0.0009524135262330095,
+ "time_sec": 87.24499773979187
+ },
+ {
+ "epoch": 22,
+ "train_loss": 5.318783715209961,
+ "train_acc": 0.01022,
+ "test_loss": 9.226270596313476,
+ "test_acc": 0.01,
+ "lyapunov": 1.515167183888233,
+ "grad_norm": 0.5897187117480035,
+ "grad_max_sv": 0.32070303708314896,
+ "grad_min_sv": 3.3304707929004972e-09,
+ "grad_condition": 145373104.26632357,
+ "lr": 0.0009478558801197061,
+ "time_sec": 87.02501797676086
+ },
+ {
+ "epoch": 23,
+ "train_loss": 5.311336210021973,
+ "train_acc": 0.00992,
+ "test_loss": 9.553670106506347,
+ "test_acc": 0.01,
+ "lyapunov": 1.5058710337294947,
+ "grad_norm": 0.42067884050272164,
+ "grad_max_sv": 0.3374065548181534,
+ "grad_min_sv": 3.917849118045824e-09,
+ "grad_condition": 148787617.53453642,
+ "lr": 0.000943101789615607,
+ "time_sec": 87.03109979629517
+ },
+ {
+ "epoch": 24,
+ "train_loss": 5.310154438018799,
+ "train_acc": 0.01036,
+ "test_loss": 7.603771569824219,
+ "test_acc": 0.01,
+ "lyapunov": 1.509728124379502,
+ "grad_norm": 0.3834815238141383,
+ "grad_max_sv": 0.3096462905406952,
+ "grad_min_sv": 2.737797575240686e-09,
+ "grad_condition": 22145829075.872944,
+ "lr": 0.0009381533400219313,
+ "time_sec": 86.98246717453003
+ },
+ {
+ "epoch": 25,
+ "train_loss": 5.301079537353516,
+ "train_acc": 0.00976,
+ "test_loss": 7.519319520568848,
+ "test_acc": 0.01,
+ "lyapunov": 1.5108507871627808,
+ "grad_norm": 0.30755221598797206,
+ "grad_max_sv": 0.2302608024328947,
+ "grad_min_sv": 2.0953720649433853e-11,
+ "grad_condition": 115571274953.14014,
+ "lr": 0.0009330127018922189,
+ "time_sec": 87.00150752067566
+ },
+ {
+ "epoch": 26,
+ "train_loss": 5.2993214897155765,
+ "train_acc": 0.00926,
+ "test_loss": 7.535327529907226,
+ "test_acc": 0.01,
+ "lyapunov": 1.5122191076693328,
+ "grad_norm": 0.2686555081361175,
+ "grad_max_sv": 0.1873680654913187,
+ "grad_min_sv": 1.1968037446042912e-12,
+ "grad_condition": 111356408601.78958,
+ "lr": 0.000927682130080253,
+ "time_sec": 87.06040525436401
+ },
+ {
+ "epoch": 27,
+ "train_loss": 5.301115319061279,
+ "train_acc": 0.01026,
+ "test_loss": 7.4256896377563475,
+ "test_acc": 0.01,
+ "lyapunov": 1.5147829875921655,
+ "grad_norm": 0.2584031825672629,
+ "grad_max_sv": 0.18733071088790892,
+ "grad_min_sv": 1.5532640335746842e-12,
+ "grad_condition": 105854162513.72067,
+ "lr": 0.0009221639627510072,
+ "time_sec": 87.0212287902832
+ },
+ {
+ "epoch": 28,
+ "train_loss": 5.300986379394531,
+ "train_acc": 0.00912,
+ "test_loss": 7.3856002044677735,
+ "test_acc": 0.01,
+ "lyapunov": 1.5147232972752407,
+ "grad_norm": 0.2414535578672304,
+ "grad_max_sv": 0.16182587593793868,
+ "grad_min_sv": 2.716757690251971e-13,
+ "grad_condition": 139096227622.95874,
+ "lr": 0.0009164606203550494,
+ "time_sec": 87.02124691009521
+ },
+ {
+ "epoch": 29,
+ "train_loss": 5.311827180175781,
+ "train_acc": 0.00958,
+ "test_loss": 9.537436566162109,
+ "test_acc": 0.01,
+ "lyapunov": 1.5239817428466913,
+ "grad_norm": 0.2934555140553008,
+ "grad_max_sv": 0.17254459988325835,
+ "grad_min_sv": 7.800315873566188e-13,
+ "grad_condition": 118094677554.4253,
+ "lr": 0.0009105746045668516,
+ "time_sec": 87.02146863937378
+ },
+ {
+ "epoch": 30,
+ "train_loss": 5.306949669952393,
+ "train_acc": 0.00986,
+ "test_loss": 9.629324139404297,
+ "test_acc": 0.01,
+ "lyapunov": 1.5190055486186387,
+ "grad_norm": 0.2568362833037679,
+ "grad_max_sv": 0.1871931992471218,
+ "grad_min_sv": 8.733775765521943e-13,
+ "grad_condition": 124328292229.6437,
+ "lr": 0.0009045084971874733,
+ "time_sec": 87.0063271522522
+ },
+ {
+ "epoch": 31,
+ "train_loss": 5.317695409240723,
+ "train_acc": 0.00946,
+ "test_loss": 9.857299293518066,
+ "test_acc": 0.01,
+ "lyapunov": 1.5297813034423478,
+ "grad_norm": 0.31967679371455754,
+ "grad_max_sv": 0.17166709154844284,
+ "grad_min_sv": 1.3052075569227142e-12,
+ "grad_condition": 105851795247.06416,
+ "lr": 0.0008982649590120977,
+ "time_sec": 87.03139019012451
+ },
+ {
+ "epoch": 32,
+ "train_loss": 5.306474250030518,
+ "train_acc": 0.00946,
+ "test_loss": 6.192124473571777,
+ "test_acc": 0.01,
+ "lyapunov": 1.5204204305663438,
+ "grad_norm": 0.22033885472694253,
+ "grad_max_sv": 0.1525889288634062,
+ "grad_min_sv": 4.756078352149119e-13,
+ "grad_condition": 128078379912.95,
+ "lr": 0.0008918467286629196,
+ "time_sec": 86.99606108665466
+ },
+ {
+ "epoch": 33,
+ "train_loss": 5.307142764892578,
+ "train_acc": 0.00976,
+ "test_loss": 7.497373861694336,
+ "test_acc": 0.01,
+ "lyapunov": 1.522810420721693,
+ "grad_norm": 0.20782539541327114,
+ "grad_max_sv": 0.13517180345952512,
+ "grad_min_sv": 1.1068227830043178e-13,
+ "grad_condition": 123350210961.5916,
+ "lr": 0.0008852566213878943,
+ "time_sec": 87.02485609054565
+ },
+ {
+ "epoch": 34,
+ "train_loss": 5.307786667785645,
+ "train_acc": 0.01036,
+ "test_loss": 6.049268864440918,
+ "test_acc": 0.01,
+ "lyapunov": 1.5257866547235748,
+ "grad_norm": 0.1890978405416262,
+ "grad_max_sv": 0.10800869315862656,
+ "grad_min_sv": 7.129825504179478e-15,
+ "grad_condition": 107252102588.7272,
+ "lr": 0.000878497527825878,
+ "time_sec": 87.10786271095276
+ },
+ {
+ "epoch": 35,
+ "train_loss": 5.3119341674804685,
+ "train_acc": 0.009,
+ "test_loss": 4.805781600952148,
+ "test_acc": 0.01,
+ "lyapunov": 1.5290101019622724,
+ "grad_norm": 0.1944266687511967,
+ "grad_max_sv": 0.11351412069052458,
+ "grad_min_sv": 1.0284869415209545e-14,
+ "grad_condition": 112374076474.89091,
+ "lr": 0.000871572412738697,
+ "time_sec": 87.02945756912231
+ },
+ {
+ "epoch": 36,
+ "train_loss": 5.30866313369751,
+ "train_acc": 0.01008,
+ "test_loss": 5.370443841552734,
+ "test_acc": 0.01,
+ "lyapunov": 1.5276334587570346,
+ "grad_norm": 0.16190926523802132,
+ "grad_max_sv": 0.09535483401268721,
+ "grad_min_sv": 3.195651304626571e-15,
+ "grad_condition": 94990079164.94656,
+ "lr": 0.0008644843137107055,
+ "time_sec": 86.99824213981628
+ },
+ {
+ "epoch": 37,
+ "train_loss": 5.308895555877686,
+ "train_acc": 0.0099,
+ "test_loss": 4.843223188781738,
+ "test_acc": 0.01,
+ "lyapunov": 1.5290613820790635,
+ "grad_norm": 0.15630460219006667,
+ "grad_max_sv": 0.08036092817783355,
+ "grad_min_sv": 1.1315139619811405e-17,
+ "grad_condition": 80360078431.92064,
+ "lr": 0.0008572363398164014,
+ "time_sec": 86.98283195495605
+ },
+ {
+ "epoch": 38,
+ "train_loss": 5.31004166229248,
+ "train_acc": 0.00976,
+ "test_loss": 4.780417753601074,
+ "test_acc": 0.01,
+ "lyapunov": 1.5300937909299455,
+ "grad_norm": 0.16356950260232017,
+ "grad_max_sv": 0.08305604849010706,
+ "grad_min_sv": 8.648904023608753e-17,
+ "grad_condition": 83049364241.033,
+ "lr": 0.0008498316702566826,
+ "time_sec": 87.12476921081543
+ },
+ {
+ "epoch": 39,
+ "train_loss": 5.308765927276611,
+ "train_acc": 0.00922,
+ "test_loss": 4.650610294342041,
+ "test_acc": 0.01,
+ "lyapunov": 1.529145797195337,
+ "grad_norm": 0.13936121996216216,
+ "grad_max_sv": 0.06846637381240725,
+ "grad_min_sv": 6.938789416330728e-18,
+ "grad_condition": 68465862650.46446,
+ "lr": 0.0008422735529643442,
+ "time_sec": 87.00707483291626
+ },
+ {
+ "epoch": 40,
+ "train_loss": 5.312034950561523,
+ "train_acc": 0.00936,
+ "test_loss": 8.73487543487549,
+ "test_acc": 0.01,
+ "lyapunov": 1.532078573465957,
+ "grad_norm": 0.18500833074783374,
+ "grad_max_sv": 0.078881626855582,
+ "grad_min_sv": 1.2209525522074501e-26,
+ "grad_condition": 78881626855.5808,
+ "lr": 0.0008345653031794289,
+ "time_sec": 86.97358655929565
+ },
+ {
+ "epoch": 41,
+ "train_loss": 5.3188898524475094,
+ "train_acc": 0.00938,
+ "test_loss": 6.380272773742676,
+ "test_acc": 0.01,
+ "lyapunov": 1.5366824176305396,
+ "grad_norm": 0.16899341003407245,
+ "grad_max_sv": 0.0827794061973691,
+ "grad_min_sv": 1.2491873132717773e-20,
+ "grad_condition": 82779405140.55663,
+ "lr": 0.0008267103019950526,
+ "time_sec": 86.98160243034363
+ },
+ {
+ "epoch": 42,
+ "train_loss": 5.311096598052979,
+ "train_acc": 0.00918,
+ "test_loss": 6.181304641723633,
+ "test_acc": 0.01,
+ "lyapunov": 1.53186220738589,
+ "grad_norm": 0.14945919124069362,
+ "grad_max_sv": 0.07147165723145008,
+ "grad_min_sv": 1.6261729001718281e-18,
+ "grad_condition": 71471530485.47403,
+ "lr": 0.0008187119948743447,
+ "time_sec": 86.98783445358276
+ },
+ {
+ "epoch": 43,
+ "train_loss": 5.311037984619141,
+ "train_acc": 0.00992,
+ "test_loss": 6.528422421264648,
+ "test_acc": 0.01,
+ "lyapunov": 1.5322752218417195,
+ "grad_norm": 0.13413981069527348,
+ "grad_max_sv": 0.05753951920196414,
+ "grad_min_sv": 5.739214042427294e-41,
+ "grad_condition": 57539519201.964134,
+ "lr": 0.000810573890139155,
+ "time_sec": 87.02233648300171
+ },
+ {
+ "epoch": 44,
+ "train_loss": 5.314179193420411,
+ "train_acc": 0.00976,
+ "test_loss": 6.383645655822754,
+ "test_acc": 0.01,
+ "lyapunov": 1.5352078728053882,
+ "grad_norm": 0.15018671176350665,
+ "grad_max_sv": 0.06426793411374092,
+ "grad_min_sv": 1.0144677449199871e-19,
+ "grad_condition": 64267926931.3136,
+ "lr": 0.0008022995574311873,
+ "time_sec": 86.99135541915894
+ },
+ {
+ "epoch": 45,
+ "train_loss": 5.3138120045471195,
+ "train_acc": 0.00972,
+ "test_loss": 6.1780305633544925,
+ "test_acc": 0.01,
+ "lyapunov": 1.53417928048107,
+ "grad_norm": 0.1546946181453632,
+ "grad_max_sv": 0.07538183946162462,
+ "grad_min_sv": 2.0235549254645516e-17,
+ "grad_condition": 75380064770.74498,
+ "lr": 0.0007938926261462363,
+ "time_sec": 86.9700219631195
+ },
+ {
+ "epoch": 46,
+ "train_loss": 5.31338122253418,
+ "train_acc": 0.01088,
+ "test_loss": 4.875375650024414,
+ "test_acc": 0.01,
+ "lyapunov": 1.5348101799445384,
+ "grad_norm": 0.13799834022044194,
+ "grad_max_sv": 0.05826565367169678,
+ "grad_min_sv": 1.2213807007518915e-19,
+ "grad_condition": 58265644274.60155,
+ "lr": 0.0007853567838422158,
+ "time_sec": 86.9914186000824
+ },
+ {
+ "epoch": 47,
+ "train_loss": 5.316119242401123,
+ "train_acc": 0.01028,
+ "test_loss": 7.579864669799805,
+ "test_acc": 0.01,
+ "lyapunov": 1.5372701596725933,
+ "grad_norm": 0.1318310224117309,
+ "grad_max_sv": 0.059043215587735176,
+ "grad_min_sv": 1.0278524235822533e-42,
+ "grad_condition": 59043215587.73517,
+ "lr": 0.0007766957746216719,
+ "time_sec": 86.99268984794617
+ },
+ {
+ "epoch": 48,
+ "train_loss": 5.3163630574035645,
+ "train_acc": 0.00918,
+ "test_loss": 8.10872494354248,
+ "test_acc": 0.01,
+ "lyapunov": 1.537570302443736,
+ "grad_norm": 0.14919853802284255,
+ "grad_max_sv": 0.059043734613806007,
+ "grad_min_sv": 1.9169802249728662e-27,
+ "grad_condition": 59043734613.80581,
+ "lr": 0.0007679133974894982,
+ "time_sec": 86.96942186355591
+ },
+ {
+ "epoch": 49,
+ "train_loss": 5.315186663513184,
+ "train_acc": 0.00982,
+ "test_loss": 10.137148637390137,
+ "test_acc": 0.01,
+ "lyapunov": 1.5357392169630435,
+ "grad_norm": 0.14339565437399782,
+ "grad_max_sv": 0.07659720163792372,
+ "grad_min_sv": 9.214212859750722e-16,
+ "grad_condition": 76509866898.91414,
+ "lr": 0.000759013504686565,
+ "time_sec": 87.01622128486633
+ },
+ {
+ "epoch": 50,
+ "train_loss": 5.314455534973145,
+ "train_acc": 0.0102,
+ "test_loss": 8.247185594177246,
+ "test_acc": 0.01,
+ "lyapunov": 1.5355263009400624,
+ "grad_norm": 0.13354715221640268,
+ "grad_max_sv": 0.06603035274893046,
+ "grad_min_sv": 4.3361800326764774e-19,
+ "grad_condition": 66030309212.30867,
+ "lr": 0.0007499999999999998,
+ "time_sec": 86.99394655227661
+ },
+ {
+ "epoch": 51,
+ "train_loss": 5.32153740737915,
+ "train_acc": 0.01,
+ "test_loss": 8.37662465057373,
+ "test_acc": 0.01,
+ "lyapunov": 1.5409153455968403,
+ "grad_norm": 0.14502327588857133,
+ "grad_max_sv": 0.06259518237784505,
+ "grad_min_sv": 4.890059136866219e-20,
+ "grad_condition": 62595178420.28666,
+ "lr": 0.0007408768370508575,
+ "time_sec": 86.97510194778442
+ },
+ {
+ "epoch": 52,
+ "train_loss": 5.316599715270996,
+ "train_acc": 0.00936,
+ "test_loss": 8.278748655700683,
+ "test_acc": 0.01,
+ "lyapunov": 1.5381617646692964,
+ "grad_norm": 0.1359300928840212,
+ "grad_max_sv": 0.05868045939132571,
+ "grad_min_sv": 2.1909536115890692e-21,
+ "grad_condition": 58680459216.2619,
+ "lr": 0.0007316480175599307,
+ "time_sec": 86.98001670837402
+ },
+ {
+ "epoch": 53,
+ "train_loss": 5.316536732788086,
+ "train_acc": 0.01016,
+ "test_loss": 5.486338158416748,
+ "test_acc": 0.01,
+ "lyapunov": 1.5382660676146407,
+ "grad_norm": 0.1271741910618785,
+ "grad_max_sv": 0.05760562280192971,
+ "grad_min_sv": 3.503246160812043e-47,
+ "grad_condition": 57605622801.92971,
+ "lr": 0.0007223175895924635,
+ "time_sec": 86.99369311332703
+ },
+ {
+ "epoch": 54,
+ "train_loss": 5.316702398681641,
+ "train_acc": 0.0102,
+ "test_loss": 5.302798899841308,
+ "test_acc": 0.01,
+ "lyapunov": 1.5386110059440594,
+ "grad_norm": 0.15368852800875965,
+ "grad_max_sv": 0.0578720694873482,
+ "grad_min_sv": 1.7830822309301135e-42,
+ "grad_condition": 57872069487.348206,
+ "lr": 0.0007128896457825361,
+ "time_sec": 86.96624207496643
+ },
+ {
+ "epoch": 55,
+ "train_loss": 5.316231355743408,
+ "train_acc": 0.00948,
+ "test_loss": 8.74564740600586,
+ "test_acc": 0.01,
+ "lyapunov": 1.5383109363448588,
+ "grad_norm": 0.13190622008458677,
+ "grad_max_sv": 0.04535484011285007,
+ "grad_min_sv": 0.0,
+ "grad_condition": 45354840112.850075,
+ "lr": 0.0007033683215378998,
+ "time_sec": 86.97799372673035
+ },
+ {
+ "epoch": 56,
+ "train_loss": 5.317534141235352,
+ "train_acc": 0.00946,
+ "test_loss": 8.70028028869629,
+ "test_acc": 0.01,
+ "lyapunov": 1.5393455677934924,
+ "grad_norm": 0.13462977039802712,
+ "grad_max_sv": 0.06513494476675988,
+ "grad_min_sv": 3.503246160812043e-47,
+ "grad_condition": 65134944766.75987,
+ "lr": 0.0006937577932260512,
+ "time_sec": 86.98487591743469
+ },
+ {
+ "epoch": 57,
+ "train_loss": 5.318079041290283,
+ "train_acc": 0.0097,
+ "test_loss": 9.145556756591796,
+ "test_acc": 0.01,
+ "lyapunov": 1.5401513216745517,
+ "grad_norm": 0.13118847481535986,
+ "grad_max_sv": 0.05173748955130577,
+ "grad_min_sv": 0.0,
+ "grad_condition": 51737489551.30577,
+ "lr": 0.0006840622763423388,
+ "time_sec": 87.00480890274048
+ },
+ {
+ "epoch": 58,
+ "train_loss": 5.316858307800293,
+ "train_acc": 0.00892,
+ "test_loss": 8.666381803894042,
+ "test_acc": 0.01,
+ "lyapunov": 1.5383905370522033,
+ "grad_norm": 0.12912610896619198,
+ "grad_max_sv": 0.06017917674034834,
+ "grad_min_sv": 3.503246160812043e-47,
+ "grad_condition": 60179176740.34834,
+ "lr": 0.0006742860236609073,
+ "time_sec": 87.00866675376892
+ },
+ {
+ "epoch": 59,
+ "train_loss": 5.325099550476074,
+ "train_acc": 0.00954,
+ "test_loss": 8.285526527404786,
+ "test_acc": 0.01,
+ "lyapunov": 1.544173507739211,
+ "grad_norm": 0.15876381906710343,
+ "grad_max_sv": 0.06922355592250824,
+ "grad_min_sv": 2.3088949294307303e-16,
+ "grad_condition": 69207800483.04135,
+ "lr": 0.0006644333233692913,
+ "time_sec": 86.97984671592712
+ },
+ {
+ "epoch": 60,
+ "train_loss": 5.3204884049987795,
+ "train_acc": 0.0094,
+ "test_loss": 8.168935748291016,
+ "test_acc": 0.01,
+ "lyapunov": 1.5423277512840603,
+ "grad_norm": 0.12428279151580043,
+ "grad_max_sv": 0.05191116128116846,
+ "grad_min_sv": 0.0,
+ "grad_condition": 51911161281.168465,
+ "lr": 0.0006545084971874734,
+ "time_sec": 86.99251651763916
+ },
+ {
+ "epoch": 61,
+ "train_loss": 5.318557815551758,
+ "train_acc": 0.00974,
+ "test_loss": 11.625576313781739,
+ "test_acc": 0.01,
+ "lyapunov": 1.5408994303944776,
+ "grad_norm": 0.11981934242025526,
+ "grad_max_sv": 0.04157847780734301,
+ "grad_min_sv": 0.0,
+ "grad_condition": 41578477807.343,
+ "lr": 0.0006445158984722354,
+ "time_sec": 86.97000765800476
+ },
+ {
+ "epoch": 62,
+ "train_loss": 5.320785666503906,
+ "train_acc": 0.00938,
+ "test_loss": 12.541597724914551,
+ "test_acc": 0.01,
+ "lyapunov": 1.5433500727729115,
+ "grad_norm": 0.11919617488574552,
+ "grad_max_sv": 0.04310994283296168,
+ "grad_min_sv": 0.0,
+ "grad_condition": 43109942832.96168,
+ "lr": 0.0006344599103076324,
+ "time_sec": 86.96448731422424
+ },
+ {
+ "epoch": 63,
+ "train_loss": 5.32412813293457,
+ "train_acc": 0.0091,
+ "test_loss": 11.793109805297851,
+ "test_acc": 0.01,
+ "lyapunov": 1.5443742366702966,
+ "grad_norm": 0.118004366839836,
+ "grad_max_sv": 0.0428059502504766,
+ "grad_min_sv": 0.0,
+ "grad_condition": 42805950250.4766,
+ "lr": 0.0006243449435824269,
+ "time_sec": 86.93323230743408
+ },
+ {
+ "epoch": 64,
+ "train_loss": 5.318806624603272,
+ "train_acc": 0.00956,
+ "test_loss": 12.444959045410156,
+ "test_acc": 0.01,
+ "lyapunov": 1.5414444375830842,
+ "grad_norm": 0.11645932110555444,
+ "grad_max_sv": 0.030990714300423862,
+ "grad_min_sv": 0.0,
+ "grad_condition": 30990714300.42386,
+ "lr": 0.0006141754350553275,
+ "time_sec": 86.89740920066833
+ },
+ {
+ "epoch": 65,
+ "train_loss": 5.317045929870606,
+ "train_acc": 0.01018,
+ "test_loss": 10.023806936645508,
+ "test_acc": 0.01,
+ "lyapunov": 1.5395582572883353,
+ "grad_norm": 0.11276313707472024,
+ "grad_max_sv": 0.03361189742572605,
+ "grad_min_sv": 0.0,
+ "grad_condition": 33611897425.726055,
+ "lr": 0.0006039558454088793,
+ "time_sec": 86.97432947158813
+ },
+ {
+ "epoch": 66,
+ "train_loss": 5.32016941192627,
+ "train_acc": 0.00944,
+ "test_loss": 10.012617837524415,
+ "test_acc": 0.01,
+ "lyapunov": 1.5425440329115103,
+ "grad_norm": 0.10590387961842582,
+ "grad_max_sv": 0.02548480206169188,
+ "grad_min_sv": 0.0,
+ "grad_condition": 25484802061.691883,
+ "lr": 0.000593690657292862,
+ "time_sec": 86.97213578224182
+ },
+ {
+ "epoch": 67,
+ "train_loss": 5.320958078460693,
+ "train_acc": 0.00912,
+ "test_loss": 8.012544973754883,
+ "test_acc": 0.01,
+ "lyapunov": 1.5432329269321374,
+ "grad_norm": 0.11098177802612447,
+ "grad_max_sv": 0.028018432063981892,
+ "grad_min_sv": 0.0,
+ "grad_condition": 28018432063.98189,
+ "lr": 0.0005833843733580507,
+ "time_sec": 86.92108106613159
+ },
+ {
+ "epoch": 68,
+ "train_loss": 5.319859785614014,
+ "train_acc": 0.0098,
+ "test_loss": 9.247186422729492,
+ "test_acc": 0.01,
+ "lyapunov": 1.542363587852634,
+ "grad_norm": 0.1248664197770911,
+ "grad_max_sv": 0.04367699818685651,
+ "grad_min_sv": 0.0,
+ "grad_condition": 43676998186.85651,
+ "lr": 0.0005730415142812054,
+ "time_sec": 86.95592594146729
+ },
+ {
+ "epoch": 69,
+ "train_loss": 5.318826563873291,
+ "train_acc": 0.01016,
+ "test_loss": 10.35489285736084,
+ "test_acc": 0.01,
+ "lyapunov": 1.5414060040203201,
+ "grad_norm": 0.10987589074835707,
+ "grad_max_sv": 0.03276977320201695,
+ "grad_min_sv": 0.0,
+ "grad_condition": 32769773202.01695,
+ "lr": 0.0005626666167821517,
+ "time_sec": 86.91380739212036
+ },
+ {
+ "epoch": 70,
+ "train_loss": 5.317324656524658,
+ "train_acc": 0.01038,
+ "test_loss": 9.99694027709961,
+ "test_acc": 0.01,
+ "lyapunov": 1.5401056565896933,
+ "grad_norm": 0.10923451968148526,
+ "grad_max_sv": 0.026721618324518203,
+ "grad_min_sv": 0.0,
+ "grad_condition": 26721618324.518204,
+ "lr": 0.0005522642316338265,
+ "time_sec": 86.8878607749939
+ },
+ {
+ "epoch": 71,
+ "train_loss": 5.317690666198731,
+ "train_acc": 0.00962,
+ "test_loss": 8.448246655273438,
+ "test_acc": 0.01,
+ "lyapunov": 1.5407067177545688,
+ "grad_norm": 0.10993057282913465,
+ "grad_max_sv": 0.021391112776473164,
+ "grad_min_sv": 0.0,
+ "grad_condition": 21391112776.473164,
+ "lr": 0.0005418389216661573,
+ "time_sec": 86.89513158798218
+ },
+ {
+ "epoch": 72,
+ "train_loss": 5.317815923156738,
+ "train_acc": 0.01004,
+ "test_loss": 12.15319383392334,
+ "test_acc": 0.01,
+ "lyapunov": 1.5406005382537842,
+ "grad_norm": 0.11546754813601234,
+ "grad_max_sv": 0.04164923094213009,
+ "grad_min_sv": 0.0,
+ "grad_condition": 41649230942.13009,
+ "lr": 0.0005313952597646563,
+ "time_sec": 86.93751883506775
+ },
+ {
+ "epoch": 73,
+ "train_loss": 5.318552890930175,
+ "train_acc": 0.009,
+ "test_loss": 7.365837602996826,
+ "test_acc": 0.01,
+ "lyapunov": 1.5411235444685991,
+ "grad_norm": 0.11378399985617368,
+ "grad_max_sv": 0.03538390537723899,
+ "grad_min_sv": 0.0,
+ "grad_condition": 35383905377.23899,
+ "lr": 0.0005209378268645994,
+ "time_sec": 86.92508888244629
+ },
+ {
+ "epoch": 74,
+ "train_loss": 5.3266375039672855,
+ "train_acc": 0.00916,
+ "test_loss": 5.939176264190674,
+ "test_acc": 0.01,
+ "lyapunov": 1.5473728344568511,
+ "grad_norm": 0.112949937059148,
+ "grad_max_sv": 0.01943044299259782,
+ "grad_min_sv": 0.0,
+ "grad_condition": 19430442992.597816,
+ "lr": 0.0005104712099416781,
+ "time_sec": 86.87594652175903
+ },
+ {
+ "epoch": 75,
+ "train_loss": 5.3182286242675785,
+ "train_acc": 0.00916,
+ "test_loss": 7.4682364219665525,
+ "test_acc": 0.01,
+ "lyapunov": 1.5411189620757042,
+ "grad_norm": 0.11641453125231847,
+ "grad_max_sv": 0.01762835620902479,
+ "grad_min_sv": 0.0,
+ "grad_condition": 17628356209.024788,
+ "lr": 0.0004999999999999996,
+ "time_sec": 86.89264059066772
+ },
+ {
+ "epoch": 76,
+ "train_loss": 5.318416892242432,
+ "train_acc": 0.00958,
+ "test_loss": 6.8439142288208,
+ "test_acc": 0.01,
+ "lyapunov": 1.5413539412686281,
+ "grad_norm": 0.10777855944530633,
+ "grad_max_sv": 0.015298370318487287,
+ "grad_min_sv": 0.0,
+ "grad_condition": 15298370318.487286,
+ "lr": 0.0004895287900583212,
+ "time_sec": 86.88371872901917
+ },
+ {
+ "epoch": 77,
+ "train_loss": 5.3228406227111815,
+ "train_acc": 0.00964,
+ "test_loss": 10.02866414489746,
+ "test_acc": 0.01,
+ "lyapunov": 1.544968852606576,
+ "grad_norm": 0.1305888852844692,
+ "grad_max_sv": 0.01963789644651115,
+ "grad_min_sv": 0.0,
+ "grad_condition": 19637896446.51115,
+ "lr": 0.0004790621731353997,
+ "time_sec": 86.87340235710144
+ },
+ {
+ "epoch": 78,
+ "train_loss": 5.319401046447754,
+ "train_acc": 0.00956,
+ "test_loss": 8.256184762573243,
+ "test_acc": 0.01,
+ "lyapunov": 1.54242708158615,
+ "grad_norm": 0.11168685518140656,
+ "grad_max_sv": 0.02321814843453467,
+ "grad_min_sv": 0.0,
+ "grad_condition": 23218148434.534668,
+ "lr": 0.000468604740235343,
+ "time_sec": 86.87403607368469
+ },
+ {
+ "epoch": 79,
+ "train_loss": 5.319539002532959,
+ "train_acc": 0.00924,
+ "test_loss": 6.6485612655639645,
+ "test_acc": 0.01,
+ "lyapunov": 1.5427932879504036,
+ "grad_norm": 0.1281479832918265,
+ "grad_max_sv": 0.014649314666166901,
+ "grad_min_sv": 0.0,
+ "grad_condition": 14649314666.1669,
+ "lr": 0.00045816107833384175,
+ "time_sec": 86.86377239227295
+ },
+ {
+ "epoch": 80,
+ "train_loss": 5.321709277648925,
+ "train_acc": 0.00858,
+ "test_loss": 7.656314584350586,
+ "test_acc": 0.01,
+ "lyapunov": 1.5438944933664462,
+ "grad_norm": 0.1379118039308171,
+ "grad_max_sv": 0.006280570011585951,
+ "grad_min_sv": 0.0,
+ "grad_condition": 6280570011.585951,
+ "lr": 0.0004477357683661729,
+ "time_sec": 86.91206550598145
+ },
+ {
+ "epoch": 81,
+ "train_loss": 5.319362686614991,
+ "train_acc": 0.00904,
+ "test_loss": 7.019269757080078,
+ "test_acc": 0.01,
+ "lyapunov": 1.542548160723713,
+ "grad_norm": 0.12802539188386938,
+ "grad_max_sv": 0.019554349593818188,
+ "grad_min_sv": 0.0,
+ "grad_condition": 19554349593.818188,
+ "lr": 0.00043733338321784746,
+ "time_sec": 86.88340616226196
+ },
+ {
+ "epoch": 82,
+ "train_loss": 5.319549789886475,
+ "train_acc": 0.00932,
+ "test_loss": 7.563053443908691,
+ "test_acc": 0.01,
+ "lyapunov": 1.5428213295729265,
+ "grad_norm": 0.12962728912126797,
+ "grad_max_sv": 0.011001831339672207,
+ "grad_min_sv": 0.0,
+ "grad_condition": 11001831339.672207,
+ "lr": 0.0004269584857187939,
+ "time_sec": 87.12197208404541
+ },
+ {
+ "epoch": 83,
+ "train_loss": 5.3209361798095705,
+ "train_acc": 0.01004,
+ "test_loss": 8.245951638793946,
+ "test_acc": 0.01,
+ "lyapunov": 1.543517429810351,
+ "grad_norm": 0.12992986434807738,
+ "grad_max_sv": 0.011371771851554514,
+ "grad_min_sv": 0.0,
+ "grad_condition": 11371771851.554514,
+ "lr": 0.0004166156266419484,
+ "time_sec": 86.8549747467041
+ },
+ {
+ "epoch": 84,
+ "train_loss": 5.319158186340332,
+ "train_acc": 0.00988,
+ "test_loss": 11.181426934814453,
+ "test_acc": 0.01,
+ "lyapunov": 1.5418739129820138,
+ "grad_norm": 0.14570895237027714,
+ "grad_max_sv": 0.03400726960971952,
+ "grad_min_sv": 0.0,
+ "grad_condition": 34007269609.719513,
+ "lr": 0.0004063093427071373,
+ "time_sec": 86.95320224761963
+ },
+ {
+ "epoch": 85,
+ "train_loss": 5.319012271881103,
+ "train_acc": 0.0104,
+ "test_loss": 8.699293096923828,
+ "test_acc": 0.01,
+ "lyapunov": 1.5420828835128824,
+ "grad_norm": 0.15422110126668967,
+ "grad_max_sv": 0.0475749587174505,
+ "grad_min_sv": 0.0,
+ "grad_condition": 47574958717.4505,
+ "lr": 0.0003960441545911199,
+ "time_sec": 86.97516655921936
+ },
+ {
+ "epoch": 86,
+ "train_loss": 5.319778329925537,
+ "train_acc": 0.0099,
+ "test_loss": 8.610072163391113,
+ "test_acc": 0.01,
+ "lyapunov": 1.5427404270147729,
+ "grad_norm": 0.16350408468824804,
+ "grad_max_sv": 0.0467130537610501,
+ "grad_min_sv": 0.0,
+ "grad_condition": 46713053761.0501,
+ "lr": 0.0003858245649446718,
+ "time_sec": 86.97473764419556
+ },
+ {
+ "epoch": 87,
+ "train_loss": 5.320261403961181,
+ "train_acc": 0.01,
+ "test_loss": 9.01234596862793,
+ "test_acc": 0.01,
+ "lyapunov": 1.5430970234639199,
+ "grad_norm": 0.1987413764171708,
+ "grad_max_sv": 0.042272613104432824,
+ "grad_min_sv": 0.0,
+ "grad_condition": 42272613104.432816,
+ "lr": 0.00037565505641757235,
+ "time_sec": 86.94777846336365
+ },
+ {
+ "epoch": 88,
+ "train_loss": 5.328781169433594,
+ "train_acc": 0.00958,
+ "test_loss": 7.222933032226562,
+ "test_acc": 0.01,
+ "lyapunov": 1.5479203133326966,
+ "grad_norm": 0.20200984386229512,
+ "grad_max_sv": 0.037374650174751875,
+ "grad_min_sv": 2.888694869312344e-20,
+ "grad_condition": 37374645422.50441,
+ "lr": 0.00036554008969236695,
+ "time_sec": 86.9300582408905
+ },
+ {
+ "epoch": 89,
+ "train_loss": 5.3212895065307615,
+ "train_acc": 0.00972,
+ "test_loss": 7.341721871948242,
+ "test_acc": 0.01,
+ "lyapunov": 1.5442103443243314,
+ "grad_norm": 0.21135067798139123,
+ "grad_max_sv": 0.03894036049023271,
+ "grad_min_sv": 0.0,
+ "grad_condition": 38940360490.232704,
+ "lr": 0.0003554841015277638,
+ "time_sec": 87.02612471580505
+ },
+ {
+ "epoch": 90,
+ "train_loss": 5.319550964050293,
+ "train_acc": 0.0093,
+ "test_loss": 7.149930093383789,
+ "test_acc": 0.01,
+ "lyapunov": 1.5423216917325773,
+ "grad_norm": 0.17437221481494697,
+ "grad_max_sv": 0.04075719062238932,
+ "grad_min_sv": 0.0,
+ "grad_condition": 40757190622.38932,
+ "lr": 0.000345491502812526,
+ "time_sec": 86.95247411727905
+ },
+ {
+ "epoch": 91,
+ "train_loss": 5.319614014892578,
+ "train_acc": 0.00888,
+ "test_loss": 7.18144443359375,
+ "test_acc": 0.01,
+ "lyapunov": 1.5426533264882119,
+ "grad_norm": 0.17520092959369415,
+ "grad_max_sv": 0.022456927318125965,
+ "grad_min_sv": 0.0,
+ "grad_condition": 22456927318.125965,
+ "lr": 0.0003355666766307081,
+ "time_sec": 86.8960337638855
+ },
+ {
+ "epoch": 92,
+ "train_loss": 5.3187762687683104,
+ "train_acc": 0.00888,
+ "test_loss": 7.264889540863037,
+ "test_acc": 0.01,
+ "lyapunov": 1.5419618226683047,
+ "grad_norm": 0.1656377365844615,
+ "grad_max_sv": 0.015189866488799452,
+ "grad_min_sv": 0.0,
+ "grad_condition": 15189866488.799454,
+ "lr": 0.00032571397633909225,
+ "time_sec": 86.88141465187073
+ },
+ {
+ "epoch": 93,
+ "train_loss": 5.321614575958252,
+ "train_acc": 0.00952,
+ "test_loss": 7.152406310272217,
+ "test_acc": 0.01,
+ "lyapunov": 1.5444753560263786,
+ "grad_norm": 0.1783525963324978,
+ "grad_max_sv": 0.024426844296976925,
+ "grad_min_sv": 0.0,
+ "grad_condition": 24426844296.97692,
+ "lr": 0.00031593772365766094,
+ "time_sec": 86.87559199333191
+ },
+ {
+ "epoch": 94,
+ "train_loss": 5.319984560089111,
+ "train_acc": 0.0098,
+ "test_loss": 7.227280062866211,
+ "test_acc": 0.01,
+ "lyapunov": 1.543088520884209,
+ "grad_norm": 0.16043633002422977,
+ "grad_max_sv": 0.0368963482324034,
+ "grad_min_sv": 0.0,
+ "grad_condition": 36896348232.4034,
+ "lr": 0.0003062422067739483,
+ "time_sec": 86.98869109153748
+ },
+ {
+ "epoch": 95,
+ "train_loss": 5.318843619537353,
+ "train_acc": 0.00988,
+ "test_loss": 7.253403067016602,
+ "test_acc": 0.01,
+ "lyapunov": 1.5419552667671457,
+ "grad_norm": 0.15988427664274688,
+ "grad_max_sv": 0.03179542766883969,
+ "grad_min_sv": 0.0,
+ "grad_condition": 31795427668.83969,
+ "lr": 0.00029663167846209965,
+ "time_sec": 86.96610736846924
+ },
+ {
+ "epoch": 96,
+ "train_loss": 5.321573169403076,
+ "train_acc": 0.00976,
+ "test_loss": 6.988779404449463,
+ "test_acc": 0.01,
+ "lyapunov": 1.5446298613267786,
+ "grad_norm": 0.14208572570705744,
+ "grad_max_sv": 0.03598490892909467,
+ "grad_min_sv": 0.0,
+ "grad_condition": 35984908929.09467,
+ "lr": 0.00028711035421746345,
+ "time_sec": 86.90040850639343
+ },
+ {
+ "epoch": 97,
+ "train_loss": 5.325382752685547,
+ "train_acc": 0.00972,
+ "test_loss": 6.935153257751465,
+ "test_acc": 0.01,
+ "lyapunov": 1.5469825359256677,
+ "grad_norm": 0.18543936556050314,
+ "grad_max_sv": 0.024622759968042373,
+ "grad_min_sv": 0.0,
+ "grad_condition": 24622759968.042374,
+ "lr": 0.00027768241040753615,
+ "time_sec": 86.86737728118896
+ },
+ {
+ "epoch": 98,
+ "train_loss": 5.319345963439941,
+ "train_acc": 0.0094,
+ "test_loss": 6.679858758544922,
+ "test_acc": 0.01,
+ "lyapunov": 1.5427014974072157,
+ "grad_norm": 0.1365697052360637,
+ "grad_max_sv": 0.0006230609491467476,
+ "grad_min_sv": 0.0,
+ "grad_condition": 623060949.1467476,
+ "lr": 0.00026835198244006903,
+ "time_sec": 86.8515510559082
+ },
+ {
+ "epoch": 99,
+ "train_loss": 5.31858975479126,
+ "train_acc": 0.00966,
+ "test_loss": 6.5813590454101565,
+ "test_acc": 0.01,
+ "lyapunov": 1.5418859296442602,
+ "grad_norm": 0.13741337242075724,
+ "grad_max_sv": 0.0017974570393562317,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1797457039.3562317,
+ "lr": 0.0002591231629491421,
+ "time_sec": 86.8734724521637
+ },
+ {
+ "epoch": 100,
+ "train_loss": 5.319550311279297,
+ "train_acc": 0.0096,
+ "test_loss": 6.593423309326172,
+ "test_acc": 0.01,
+ "lyapunov": 1.5429147582529756,
+ "grad_norm": 0.1428860474069435,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002499999999999997,
+ "time_sec": 86.91073799133301
+ },
+ {
+ "epoch": 101,
+ "train_loss": 5.319647026672364,
+ "train_acc": 0.00946,
+ "test_loss": 6.644115385437011,
+ "test_acc": 0.01,
+ "lyapunov": 1.5430320498278685,
+ "grad_norm": 0.14070137371271418,
+ "grad_max_sv": 0.0011870765592902899,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1187076559.2902899,
+ "lr": 0.00024098649531343477,
+ "time_sec": 86.85703229904175
+ },
+ {
+ "epoch": 102,
+ "train_loss": 5.320731920471191,
+ "train_acc": 0.01,
+ "test_loss": 6.511743521118164,
+ "test_acc": 0.01,
+ "lyapunov": 1.544078452202975,
+ "grad_norm": 0.16647090297400036,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002320866025105016,
+ "time_sec": 86.84212875366211
+ },
+ {
+ "epoch": 103,
+ "train_loss": 5.320380414123536,
+ "train_acc": 0.0087,
+ "test_loss": 6.558885827636718,
+ "test_acc": 0.01,
+ "lyapunov": 1.5436865057786713,
+ "grad_norm": 0.16211214182978093,
+ "grad_max_sv": 0.0006886070128530264,
+ "grad_min_sv": 0.0,
+ "grad_condition": 688607012.8530264,
+ "lr": 0.0002233042253783278,
+ "time_sec": 86.84861445426941
+ },
+ {
+ "epoch": 104,
+ "train_loss": 5.320676337890625,
+ "train_acc": 0.0096,
+ "test_loss": 6.2893127243041995,
+ "test_acc": 0.01,
+ "lyapunov": 1.5437259469800593,
+ "grad_norm": 0.15756640000371477,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000214643216157784,
+ "time_sec": 86.85342407226562
+ },
+ {
+ "epoch": 105,
+ "train_loss": 5.318497552947998,
+ "train_acc": 0.00968,
+ "test_loss": 6.463031019592285,
+ "test_acc": 0.01,
+ "lyapunov": 1.5418586124239675,
+ "grad_norm": 0.16471254677440242,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00020610737385376332,
+ "time_sec": 86.83621501922607
+ },
+ {
+ "epoch": 106,
+ "train_loss": 5.319013707885742,
+ "train_acc": 0.00958,
+ "test_loss": 8.393161967468261,
+ "test_acc": 0.01,
+ "lyapunov": 1.5424105264341739,
+ "grad_norm": 0.1697085900956353,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00019770044256881242,
+ "time_sec": 86.87845063209534
+ },
+ {
+ "epoch": 107,
+ "train_loss": 5.319404435882569,
+ "train_acc": 0.01006,
+ "test_loss": 6.168719081115722,
+ "test_acc": 0.01,
+ "lyapunov": 1.5427791502164758,
+ "grad_norm": 0.16661392944132697,
+ "grad_max_sv": 0.008691688347607852,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8691688347.607851,
+ "lr": 0.0001894261098608447,
+ "time_sec": 86.86028218269348
+ },
+ {
+ "epoch": 108,
+ "train_loss": 5.320062127532959,
+ "train_acc": 0.00946,
+ "test_loss": 6.123481111145019,
+ "test_acc": 0.01,
+ "lyapunov": 1.543502251510425,
+ "grad_norm": 0.1553396268788007,
+ "grad_max_sv": 0.0017994886264204979,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1799488626.420498,
+ "lr": 0.000181288005125655,
+ "time_sec": 86.88756346702576
+ },
+ {
+ "epoch": 109,
+ "train_loss": 5.32126156539917,
+ "train_acc": 0.0097,
+ "test_loss": 6.113170930480957,
+ "test_acc": 0.01,
+ "lyapunov": 1.5443304225306986,
+ "grad_norm": 0.16827005574777967,
+ "grad_max_sv": 0.008998295897617936,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8998295897.617935,
+ "lr": 0.0001732896980049473,
+ "time_sec": 86.87347865104675
+ },
+ {
+ "epoch": 110,
+ "train_loss": 5.319310050964355,
+ "train_acc": 0.00904,
+ "test_loss": 6.0610163803100585,
+ "test_acc": 0.01,
+ "lyapunov": 1.5427448618442505,
+ "grad_norm": 0.14666590598052404,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00016543469682057076,
+ "time_sec": 86.86950135231018
+ },
+ {
+ "epoch": 111,
+ "train_loss": 5.319597338256836,
+ "train_acc": 0.00972,
+ "test_loss": 6.453852326202393,
+ "test_acc": 0.01,
+ "lyapunov": 1.5429801303712303,
+ "grad_norm": 0.15909427151540545,
+ "grad_max_sv": 0.008126799669116735,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8126799669.116735,
+ "lr": 0.00015772644703565552,
+ "time_sec": 86.88328433036804
+ },
+ {
+ "epoch": 112,
+ "train_loss": 5.3212175,
+ "train_acc": 0.00984,
+ "test_loss": 6.988222769927979,
+ "test_acc": 0.01,
+ "lyapunov": 1.5440433973546528,
+ "grad_norm": 0.15582154742531334,
+ "grad_max_sv": 0.023284211242571472,
+ "grad_min_sv": 0.0,
+ "grad_condition": 23284211242.571472,
+ "lr": 0.00015016832974331713,
+ "time_sec": 86.88312244415283
+ },
+ {
+ "epoch": 113,
+ "train_loss": 5.320971462249756,
+ "train_acc": 0.0098,
+ "test_loss": 6.753297560882569,
+ "test_acc": 0.01,
+ "lyapunov": 1.5437339016848513,
+ "grad_norm": 0.15454565641823212,
+ "grad_max_sv": 0.0231532484292984,
+ "grad_min_sv": 0.0,
+ "grad_condition": 23153248429.2984,
+ "lr": 0.00014276366018359834,
+ "time_sec": 86.87558174133301
+ },
+ {
+ "epoch": 114,
+ "train_loss": 5.318772131958008,
+ "train_acc": 0.00984,
+ "test_loss": 6.465322698974609,
+ "test_acc": 0.01,
+ "lyapunov": 1.5421108507439303,
+ "grad_norm": 0.15163809922079102,
+ "grad_max_sv": 0.017600245866924526,
+ "grad_min_sv": 0.0,
+ "grad_condition": 17600245866.924522,
+ "lr": 0.00013551568628929425,
+ "time_sec": 86.85901880264282
+ },
+ {
+ "epoch": 115,
+ "train_loss": 5.323592142486572,
+ "train_acc": 0.00918,
+ "test_loss": 5.990406560516357,
+ "test_acc": 0.01,
+ "lyapunov": 1.5453894397486811,
+ "grad_norm": 0.15673824664274916,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00012842758726130276,
+ "time_sec": 86.8471782207489
+ },
+ {
+ "epoch": 116,
+ "train_loss": 5.321912714385986,
+ "train_acc": 0.00934,
+ "test_loss": 5.642854423522949,
+ "test_acc": 0.01,
+ "lyapunov": 1.5451806213544763,
+ "grad_norm": 0.14873545301539315,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001215024721741218,
+ "time_sec": 86.82159352302551
+ },
+ {
+ "epoch": 117,
+ "train_loss": 5.319042910766601,
+ "train_acc": 0.00916,
+ "test_loss": 5.394878324890136,
+ "test_acc": 0.01,
+ "lyapunov": 1.5425118525009935,
+ "grad_norm": 0.15364989808867727,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00011474337861210538,
+ "time_sec": 86.8501136302948
+ },
+ {
+ "epoch": 118,
+ "train_loss": 5.3216519416809085,
+ "train_acc": 0.0099,
+ "test_loss": 5.54234706954956,
+ "test_acc": 0.01,
+ "lyapunov": 1.544617168738714,
+ "grad_norm": 0.16204040482857374,
+ "grad_max_sv": 0.014768891455605625,
+ "grad_min_sv": 0.0,
+ "grad_condition": 14768891455.605625,
+ "lr": 0.00010815327133708009,
+ "time_sec": 86.8445405960083
+ },
+ {
+ "epoch": 119,
+ "train_loss": 5.318838922729492,
+ "train_acc": 0.00982,
+ "test_loss": 5.401806521606446,
+ "test_acc": 0.01,
+ "lyapunov": 1.5422493301694045,
+ "grad_norm": 0.16127338804024163,
+ "grad_max_sv": 0.00781935746781528,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7819357467.81528,
+ "lr": 0.00010173504098790182,
+ "time_sec": 86.82885694503784
+ },
+ {
+ "epoch": 120,
+ "train_loss": 5.319433266448975,
+ "train_acc": 0.00962,
+ "test_loss": 5.87718871307373,
+ "test_acc": 0.01,
+ "lyapunov": 1.5428460543722753,
+ "grad_norm": 0.16811186230922795,
+ "grad_max_sv": 0.003142098290845752,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3142098290.845752,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 86.83435249328613
+ },
+ {
+ "epoch": 121,
+ "train_loss": 5.318956566009521,
+ "train_acc": 0.00864,
+ "test_loss": 5.642109811401367,
+ "test_acc": 0.01,
+ "lyapunov": 1.5424094806851634,
+ "grad_norm": 0.16401865280170627,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 86.84270787239075
+ },
+ {
+ "epoch": 122,
+ "train_loss": 5.320396621246338,
+ "train_acc": 0.00946,
+ "test_loss": 5.506566726684571,
+ "test_acc": 0.01,
+ "lyapunov": 1.543682734984571,
+ "grad_norm": 0.16574195620383422,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 86.84029245376587
+ },
+ {
+ "epoch": 123,
+ "train_loss": 5.3207761328125,
+ "train_acc": 0.0098,
+ "test_loss": 5.753901168823242,
+ "test_acc": 0.01,
+ "lyapunov": 1.5442172185234402,
+ "grad_norm": 0.17475767067470402,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 86.83801436424255
+ },
+ {
+ "epoch": 124,
+ "train_loss": 5.318808111877441,
+ "train_acc": 0.00922,
+ "test_loss": 5.811789031982422,
+ "test_acc": 0.01,
+ "lyapunov": 1.5422291850190029,
+ "grad_norm": 0.16090202757718183,
+ "grad_max_sv": 0.003358612256124616,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3358612256.1246157,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 86.8513069152832
+ },
+ {
+ "epoch": 125,
+ "train_loss": 5.319976197967529,
+ "train_acc": 0.00978,
+ "test_loss": 5.7769184440612795,
+ "test_acc": 0.01,
+ "lyapunov": 1.543531141622597,
+ "grad_norm": 0.15700147429987782,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 86.86197853088379
+ },
+ {
+ "epoch": 126,
+ "train_loss": 5.318454194946289,
+ "train_acc": 0.00986,
+ "test_loss": 6.11075336303711,
+ "test_acc": 0.01,
+ "lyapunov": 1.5418975673368216,
+ "grad_norm": 0.15336017967137117,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 86.86198329925537
+ },
+ {
+ "epoch": 127,
+ "train_loss": 5.3203326902771,
+ "train_acc": 0.00934,
+ "test_loss": 6.080118833160401,
+ "test_acc": 0.01,
+ "lyapunov": 1.5438893414519328,
+ "grad_norm": 0.15768179334274351,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 86.84648036956787
+ },
+ {
+ "epoch": 128,
+ "train_loss": 5.318091445770263,
+ "train_acc": 0.0093,
+ "test_loss": 6.249022463989258,
+ "test_acc": 0.01,
+ "lyapunov": 1.5415176842218774,
+ "grad_norm": 0.15317629834457977,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 86.83089065551758
+ },
+ {
+ "epoch": 129,
+ "train_loss": 5.319208795776367,
+ "train_acc": 0.00944,
+ "test_loss": 6.242862550354004,
+ "test_acc": 0.01,
+ "lyapunov": 1.5426923082307782,
+ "grad_norm": 0.1586342865712123,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 86.8825249671936
+ },
+ {
+ "epoch": 130,
+ "train_loss": 5.319570325469971,
+ "train_acc": 0.00932,
+ "test_loss": 6.273485357666016,
+ "test_acc": 0.01,
+ "lyapunov": 1.5430697696593108,
+ "grad_norm": 0.16288378510968,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 86.85678577423096
+ },
+ {
+ "epoch": 131,
+ "train_loss": 5.31834419998169,
+ "train_acc": 0.00966,
+ "test_loss": 6.162585590362549,
+ "test_acc": 0.01,
+ "lyapunov": 1.5417695389989088,
+ "grad_norm": 0.15701283230384563,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 86.83028483390808
+ },
+ {
+ "epoch": 132,
+ "train_loss": 5.319475943603516,
+ "train_acc": 0.0094,
+ "test_loss": 6.003315113067627,
+ "test_acc": 0.01,
+ "lyapunov": 1.5429863951090352,
+ "grad_norm": 0.1615796670941878,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 86.82017540931702
+ },
+ {
+ "epoch": 133,
+ "train_loss": 5.32576198135376,
+ "train_acc": 0.00958,
+ "test_loss": 5.846498718261719,
+ "test_acc": 0.01,
+ "lyapunov": 1.5467814566839078,
+ "grad_norm": 0.1814711768537964,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 86.84380340576172
+ },
+ {
+ "epoch": 134,
+ "train_loss": 5.321647165985107,
+ "train_acc": 0.00952,
+ "test_loss": 5.876250485229492,
+ "test_acc": 0.01,
+ "lyapunov": 1.544941949722407,
+ "grad_norm": 0.18078759337952854,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 86.84492230415344
+ },
+ {
+ "epoch": 135,
+ "train_loss": 5.31924706817627,
+ "train_acc": 0.0096,
+ "test_loss": 5.819815138244629,
+ "test_acc": 0.01,
+ "lyapunov": 1.5427488103851943,
+ "grad_norm": 0.16329066142016732,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 86.83999133110046
+ },
+ {
+ "epoch": 136,
+ "train_loss": 5.319398911132812,
+ "train_acc": 0.00982,
+ "test_loss": 6.490616073608399,
+ "test_acc": 0.01,
+ "lyapunov": 1.5429087801052785,
+ "grad_norm": 0.15926311416791136,
+ "grad_max_sv": 0.0018711634445935487,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1871163444.5935485,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 86.86916947364807
+ },
+ {
+ "epoch": 137,
+ "train_loss": 5.318829065551758,
+ "train_acc": 0.00978,
+ "test_loss": 5.920670237731934,
+ "test_acc": 0.01,
+ "lyapunov": 1.5422979410347122,
+ "grad_norm": 0.16006466704199326,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 86.87598538398743
+ },
+ {
+ "epoch": 138,
+ "train_loss": 5.3190561383056645,
+ "train_acc": 0.00948,
+ "test_loss": 6.480327618408203,
+ "test_acc": 0.01,
+ "lyapunov": 1.5425209660664239,
+ "grad_norm": 0.16458438595098937,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 86.83726739883423
+ },
+ {
+ "epoch": 139,
+ "train_loss": 5.318953646392822,
+ "train_acc": 0.00984,
+ "test_loss": 5.952891006469726,
+ "test_acc": 0.01,
+ "lyapunov": 1.5424313371443688,
+ "grad_norm": 0.16278457254190812,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 86.83793210983276
+ },
+ {
+ "epoch": 140,
+ "train_loss": 5.3213463069152835,
+ "train_acc": 0.00976,
+ "test_loss": 6.456882773590088,
+ "test_acc": 0.01,
+ "lyapunov": 1.5445466053760266,
+ "grad_norm": 0.16371751816212385,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 86.85442423820496
+ },
+ {
+ "epoch": 141,
+ "train_loss": 5.318112189025879,
+ "train_acc": 0.00942,
+ "test_loss": 6.3592885223388675,
+ "test_acc": 0.01,
+ "lyapunov": 1.5415452919957582,
+ "grad_norm": 0.16093776786582448,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 86.8611011505127
+ },
+ {
+ "epoch": 142,
+ "train_loss": 5.319325820617676,
+ "train_acc": 0.00982,
+ "test_loss": 6.396855745697022,
+ "test_acc": 0.01,
+ "lyapunov": 1.5428402808011341,
+ "grad_norm": 0.16262217434072207,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 86.8790693283081
+ },
+ {
+ "epoch": 143,
+ "train_loss": 5.319489360198975,
+ "train_acc": 0.0098,
+ "test_loss": 6.390167568206787,
+ "test_acc": 0.01,
+ "lyapunov": 1.5430222728368266,
+ "grad_norm": 0.1599024522956201,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 86.8610942363739
+ },
+ {
+ "epoch": 144,
+ "train_loss": 5.3194953466796875,
+ "train_acc": 0.00936,
+ "test_loss": 6.3929207939147945,
+ "test_acc": 0.01,
+ "lyapunov": 1.5430299802814298,
+ "grad_norm": 0.15787151048989498,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 86.83452033996582
+ },
+ {
+ "epoch": 145,
+ "train_loss": 5.319091488189697,
+ "train_acc": 0.0099,
+ "test_loss": 6.387041884613037,
+ "test_acc": 0.01,
+ "lyapunov": 1.5425858250664324,
+ "grad_norm": 0.15981682340967285,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 86.84639286994934
+ },
+ {
+ "epoch": 146,
+ "train_loss": 5.319918049621582,
+ "train_acc": 0.01,
+ "test_loss": 6.390152045440674,
+ "test_acc": 0.01,
+ "lyapunov": 1.5434830600343397,
+ "grad_norm": 0.1664732055156118,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 86.84289050102234
+ },
+ {
+ "epoch": 147,
+ "train_loss": 5.319467689819336,
+ "train_acc": 0.01,
+ "test_loss": 6.383955514526368,
+ "test_acc": 0.01,
+ "lyapunov": 1.5429968952827746,
+ "grad_norm": 0.16425908204350428,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 86.85825252532959
+ },
+ {
+ "epoch": 148,
+ "train_loss": 5.319666849975586,
+ "train_acc": 0.01,
+ "test_loss": 6.379462463378906,
+ "test_acc": 0.01,
+ "lyapunov": 1.5432310299495298,
+ "grad_norm": 0.1579801299018272,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 86.90520691871643
+ },
+ {
+ "epoch": 149,
+ "train_loss": 5.318641065368652,
+ "train_acc": 0.01,
+ "test_loss": 6.385379031372071,
+ "test_acc": 0.01,
+ "lyapunov": 1.542139550609052,
+ "grad_norm": 0.1606682447514192,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 86.85262036323547
+ },
+ {
+ "epoch": 150,
+ "train_loss": 5.31824127532959,
+ "train_acc": 0.01,
+ "test_loss": 6.3839585464477535,
+ "test_acc": 0.01,
+ "lyapunov": 1.5416794817161072,
+ "grad_norm": 0.158152508901321,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0,
+ "time_sec": 86.85510659217834
+ }
+ ],
+ "12": [
+ {
+ "epoch": 1,
+ "train_loss": 5.138188102111816,
+ "train_acc": 0.01868,
+ "test_loss": 4.947204817199707,
+ "test_acc": 0.0102,
+ "lyapunov": 2.4137888052274503,
+ "grad_norm": 5.2278560060516135,
+ "grad_max_sv": 4.450121748447418,
+ "grad_min_sv": 8.815894619873532e-08,
+ "grad_condition": 73462066.87031136,
+ "lr": 0.0009998903417374227,
+ "time_sec": 132.20039796829224
+ },
+ {
+ "epoch": 2,
+ "train_loss": 4.910357958526611,
+ "train_acc": 0.01772,
+ "test_loss": 4.974901505279541,
+ "test_acc": 0.0098,
+ "lyapunov": 1.8470725811960753,
+ "grad_norm": 5.334406474785501,
+ "grad_max_sv": 2.416768090268306,
+ "grad_min_sv": 4.845974281257734e-08,
+ "grad_condition": 156669965.4219852,
+ "lr": 0.0009995614150494292,
+ "time_sec": 132.20067143440247
+ },
+ {
+ "epoch": 3,
+ "train_loss": 4.789790082702637,
+ "train_acc": 0.01798,
+ "test_loss": 5.241659837341309,
+ "test_acc": 0.0152,
+ "lyapunov": 1.7693803560398425,
+ "grad_norm": 2.284868849655408,
+ "grad_max_sv": 1.6544225737452507,
+ "grad_min_sv": 3.7601093222372486e-08,
+ "grad_condition": 74204967.95678225,
+ "lr": 0.0009990133642141358,
+ "time_sec": 132.1939766407013
+ },
+ {
+ "epoch": 4,
+ "train_loss": 4.734155084381103,
+ "train_acc": 0.02012,
+ "test_loss": 4.736255917358398,
+ "test_acc": 0.01,
+ "lyapunov": 1.7185492494222148,
+ "grad_norm": 1.2969402037730182,
+ "grad_max_sv": 0.8527256481349468,
+ "grad_min_sv": 1.8718222001719557e-08,
+ "grad_condition": 3595934101.1830444,
+ "lr": 0.0009982464296247522,
+ "time_sec": 132.19083857536316
+ },
+ {
+ "epoch": 5,
+ "train_loss": 4.7501870367431644,
+ "train_acc": 0.01884,
+ "test_loss": 4.7008225593566895,
+ "test_acc": 0.01,
+ "lyapunov": 1.6784742927307363,
+ "grad_norm": 0.7283552366408743,
+ "grad_max_sv": 0.540743650496006,
+ "grad_min_sv": 6.143185659736945e-09,
+ "grad_condition": 20744559298.222054,
+ "lr": 0.0009972609476841367,
+ "time_sec": 132.19878315925598
+ },
+ {
+ "epoch": 6,
+ "train_loss": 4.777885425109863,
+ "train_acc": 0.01988,
+ "test_loss": 4.847038110351562,
+ "test_acc": 0.0163,
+ "lyapunov": 1.6714926692835814,
+ "grad_norm": 0.6978205109559127,
+ "grad_max_sv": 0.4112665578722954,
+ "grad_min_sv": 2.577558256003571e-09,
+ "grad_condition": 19293368058.44477,
+ "lr": 0.000996057350657239,
+ "time_sec": 132.22198057174683
+ },
+ {
+ "epoch": 7,
+ "train_loss": 4.817885786285401,
+ "train_acc": 0.01714,
+ "test_loss": 4.907033979797363,
+ "test_acc": 0.01,
+ "lyapunov": 1.6430019908548925,
+ "grad_norm": 0.538957530048536,
+ "grad_max_sv": 0.3900473590940237,
+ "grad_min_sv": 8.011143267797137e-10,
+ "grad_condition": 53520886424.44034,
+ "lr": 0.000994636166481494,
+ "time_sec": 132.18847823143005
+ },
+ {
+ "epoch": 8,
+ "train_loss": 4.866279851989746,
+ "train_acc": 0.01534,
+ "test_loss": 4.982185540008545,
+ "test_acc": 0.01,
+ "lyapunov": 1.622301935234948,
+ "grad_norm": 0.44743905036756576,
+ "grad_max_sv": 0.2975618153810501,
+ "grad_min_sv": 4.042702856767639e-12,
+ "grad_condition": 98919396245.19788,
+ "lr": 0.0009929980185352525,
+ "time_sec": 132.2019805908203
+ },
+ {
+ "epoch": 9,
+ "train_loss": 4.93485692489624,
+ "train_acc": 0.01296,
+ "test_loss": 5.24868205871582,
+ "test_acc": 0.01,
+ "lyapunov": 1.6329893876829416,
+ "grad_norm": 1.2710312604148948,
+ "grad_max_sv": 0.23227821737527848,
+ "grad_min_sv": 1.210631234207371e-10,
+ "grad_condition": 132050856729.70003,
+ "lr": 0.0009911436253643444,
+ "time_sec": 132.25901436805725
+ },
+ {
+ "epoch": 10,
+ "train_loss": 4.94441338470459,
+ "train_acc": 0.01662,
+ "test_loss": 4.9677005256652835,
+ "test_acc": 0.01,
+ "lyapunov": 1.6191197569717837,
+ "grad_norm": 0.5849346197331,
+ "grad_max_sv": 0.3103320188820362,
+ "grad_min_sv": 2.4441770461207573e-12,
+ "grad_condition": 142331552698.27188,
+ "lr": 0.0009890738003669028,
+ "time_sec": 132.24092388153076
+ },
+ {
+ "epoch": 11,
+ "train_loss": 4.978343018798828,
+ "train_acc": 0.01596,
+ "test_loss": 4.759020803070069,
+ "test_acc": 0.01,
+ "lyapunov": 1.607335550096029,
+ "grad_norm": 0.4668173173890936,
+ "grad_max_sv": 0.3271574813872576,
+ "grad_min_sv": 1.5228846413101469e-12,
+ "grad_condition": 163401069045.22977,
+ "lr": 0.00098678945143658,
+ "time_sec": 132.22342109680176
+ },
+ {
+ "epoch": 12,
+ "train_loss": 5.019883101348877,
+ "train_acc": 0.0154,
+ "test_loss": 4.942817668151855,
+ "test_acc": 0.01,
+ "lyapunov": 1.6049258376631286,
+ "grad_norm": 0.5264008543358515,
+ "grad_max_sv": 0.28871628642082214,
+ "grad_min_sv": 1.5745550588117867e-12,
+ "grad_condition": 141150096351.00974,
+ "lr": 0.0009842915805643154,
+ "time_sec": 132.17593479156494
+ },
+ {
+ "epoch": 13,
+ "train_loss": 5.055773426361084,
+ "train_acc": 0.01454,
+ "test_loss": 5.201871238708496,
+ "test_acc": 0.01,
+ "lyapunov": 1.5926724358287918,
+ "grad_norm": 0.5496018971790103,
+ "grad_max_sv": 0.3235856369137764,
+ "grad_min_sv": 1.5836317227272346e-12,
+ "grad_condition": 172440841867.61472,
+ "lr": 0.000981581283398829,
+ "time_sec": 132.19917631149292
+ },
+ {
+ "epoch": 14,
+ "train_loss": 5.1001338768005375,
+ "train_acc": 0.01374,
+ "test_loss": 6.031500621795654,
+ "test_acc": 0.01,
+ "lyapunov": 1.5873235156164145,
+ "grad_norm": 0.5347429702370289,
+ "grad_max_sv": 0.31967496164143083,
+ "grad_min_sv": 8.416411018220654e-13,
+ "grad_condition": 202636437942.46396,
+ "lr": 0.0009786597487660333,
+ "time_sec": 132.17077159881592
+ },
+ {
+ "epoch": 15,
+ "train_loss": 5.135957703857422,
+ "train_acc": 0.0124,
+ "test_loss": 5.739520129394531,
+ "test_acc": 0.01,
+ "lyapunov": 1.574544443803675,
+ "grad_norm": 0.6201173127889323,
+ "grad_max_sv": 0.32148296795785425,
+ "grad_min_sv": 1.8768859669293263e-11,
+ "grad_condition": 245017227140.7776,
+ "lr": 0.0009755282581475766,
+ "time_sec": 132.19619607925415
+ },
+ {
+ "epoch": 16,
+ "train_loss": 5.19933319366455,
+ "train_acc": 0.01332,
+ "test_loss": 6.819124224090576,
+ "test_acc": 0.01,
+ "lyapunov": 1.588761254649638,
+ "grad_norm": 0.7105947575125269,
+ "grad_max_sv": 0.3380855549126863,
+ "grad_min_sv": 1.0418656496584723e-09,
+ "grad_condition": 212026412736.4578,
+ "lr": 0.0009721881851187403,
+ "time_sec": 132.16591668128967
+ },
+ {
+ "epoch": 17,
+ "train_loss": 5.203327436523438,
+ "train_acc": 0.0158,
+ "test_loss": 7.679113117980957,
+ "test_acc": 0.01,
+ "lyapunov": 1.5917936892765563,
+ "grad_norm": 0.5687429696625533,
+ "grad_max_sv": 0.3429654061794281,
+ "grad_min_sv": 1.0535516342595844e-12,
+ "grad_condition": 208532854744.75134,
+ "lr": 0.0009686409947459456,
+ "time_sec": 132.23086404800415
+ },
+ {
+ "epoch": 18,
+ "train_loss": 5.227132577209472,
+ "train_acc": 0.01704,
+ "test_loss": 5.224352997589111,
+ "test_acc": 0.01,
+ "lyapunov": 1.590573813604272,
+ "grad_norm": 0.6501892893379347,
+ "grad_max_sv": 0.3389496423304081,
+ "grad_min_sv": 1.4743293232017855e-12,
+ "grad_condition": 179354691955.7947,
+ "lr": 0.0009648882429441254,
+ "time_sec": 132.17126607894897
+ },
+ {
+ "epoch": 19,
+ "train_loss": 5.268917711486816,
+ "train_acc": 0.01574,
+ "test_loss": 5.769149468994141,
+ "test_acc": 0.01,
+ "lyapunov": 1.5737659489102376,
+ "grad_norm": 0.7756970175394374,
+ "grad_max_sv": 0.33219469264149665,
+ "grad_min_sv": 1.3963206987681851e-12,
+ "grad_condition": 166340823567.4583,
+ "lr": 0.00096093157579425,
+ "time_sec": 132.3532431125641
+ },
+ {
+ "epoch": 20,
+ "train_loss": 5.388035034332275,
+ "train_acc": 0.01436,
+ "test_loss": 4.855289517211914,
+ "test_acc": 0.01,
+ "lyapunov": 1.6196008579200492,
+ "grad_norm": 3.273774802278225,
+ "grad_max_sv": 0.3476741284544914,
+ "grad_min_sv": 1.7954016832837687e-12,
+ "grad_condition": 163400108512.08075,
+ "lr": 0.0009567727288213001,
+ "time_sec": 132.18322706222534
+ },
+ {
+ "epoch": 21,
+ "train_loss": 5.477730575561523,
+ "train_acc": 0.0119,
+ "test_loss": 5.734935963439941,
+ "test_acc": 0.01,
+ "lyapunov": 1.6737558759386888,
+ "grad_norm": 0.7316822390940195,
+ "grad_max_sv": 0.41190238408744334,
+ "grad_min_sv": 1.4433235299420839e-09,
+ "grad_condition": 115946317202.22786,
+ "lr": 0.0009524135262330095,
+ "time_sec": 132.2254023551941
+ },
+ {
+ "epoch": 22,
+ "train_loss": 5.39889496673584,
+ "train_acc": 0.01078,
+ "test_loss": 4.648544214630127,
+ "test_acc": 0.01,
+ "lyapunov": 1.5598208084130836,
+ "grad_norm": 0.9136530334274789,
+ "grad_max_sv": 0.5729864671826362,
+ "grad_min_sv": 6.476590619830438e-09,
+ "grad_condition": 6966838482.173167,
+ "lr": 0.0009478558801197061,
+ "time_sec": 132.19873070716858
+ },
+ {
+ "epoch": 23,
+ "train_loss": 5.343370434570312,
+ "train_acc": 0.00934,
+ "test_loss": 4.6330633590698245,
+ "test_acc": 0.01,
+ "lyapunov": 1.544742999174406,
+ "grad_norm": 0.5447776712180945,
+ "grad_max_sv": 0.3971055932343006,
+ "grad_min_sv": 3.0723113141940555e-09,
+ "grad_condition": 10360739417.615135,
+ "lr": 0.000943101789615607,
+ "time_sec": 132.19472217559814
+ },
+ {
+ "epoch": 24,
+ "train_loss": 5.354044710998535,
+ "train_acc": 0.0106,
+ "test_loss": 4.758938900756836,
+ "test_acc": 0.01,
+ "lyapunov": 1.5540964880867687,
+ "grad_norm": 0.49799279906750776,
+ "grad_max_sv": 0.32289256788790227,
+ "grad_min_sv": 1.215183540768495e-09,
+ "grad_condition": 84138259698.76875,
+ "lr": 0.0009381533400219313,
+ "time_sec": 132.18565702438354
+ },
+ {
+ "epoch": 25,
+ "train_loss": 5.34166207687378,
+ "train_acc": 0.00954,
+ "test_loss": 4.616498927307129,
+ "test_acc": 0.01,
+ "lyapunov": 1.5548294105798082,
+ "grad_norm": 0.35224887377867997,
+ "grad_max_sv": 0.2050650805234909,
+ "grad_min_sv": 4.310481015545377e-10,
+ "grad_condition": 137027644012.72295,
+ "lr": 0.0009330127018922189,
+ "time_sec": 132.1707353591919
+ },
+ {
+ "epoch": 26,
+ "train_loss": 5.329114703826904,
+ "train_acc": 0.00962,
+ "test_loss": 4.608516737365723,
+ "test_acc": 0.01,
+ "lyapunov": 1.5478018071035595,
+ "grad_norm": 0.41152400199519606,
+ "grad_max_sv": 0.14391734022647143,
+ "grad_min_sv": 6.406558234285353e-11,
+ "grad_condition": 129739564652.99875,
+ "lr": 0.000927682130080253,
+ "time_sec": 132.1968698501587
+ },
+ {
+ "epoch": 27,
+ "train_loss": 5.333489670410156,
+ "train_acc": 0.0092,
+ "test_loss": 4.6180027542114255,
+ "test_acc": 0.01,
+ "lyapunov": 1.553746031068475,
+ "grad_norm": 0.395956424199356,
+ "grad_max_sv": 0.077771030459553,
+ "grad_min_sv": 3.8469886311157825e-16,
+ "grad_condition": 77730702472.31937,
+ "lr": 0.0009221639627510072,
+ "time_sec": 132.21505451202393
+ },
+ {
+ "epoch": 28,
+ "train_loss": 5.351277679595947,
+ "train_acc": 0.00942,
+ "test_loss": 4.7706145118713374,
+ "test_acc": 0.01,
+ "lyapunov": 1.564519799273947,
+ "grad_norm": 0.8070388432556335,
+ "grad_max_sv": 0.08204491948708892,
+ "grad_min_sv": 1.474816693019578e-15,
+ "grad_condition": 81835653341.89993,
+ "lr": 0.0009164606203550494,
+ "time_sec": 132.19659543037415
+ },
+ {
+ "epoch": 29,
+ "train_loss": 5.322618664703369,
+ "train_acc": 0.00872,
+ "test_loss": 5.576576512145996,
+ "test_acc": 0.01,
+ "lyapunov": 1.5448476557841386,
+ "grad_norm": 1.8211987840238726,
+ "grad_max_sv": 0.006918648211285472,
+ "grad_min_sv": 3.854375422071664e-17,
+ "grad_condition": 6914688932.083499,
+ "lr": 0.0009105746045668516,
+ "time_sec": 132.10211896896362
+ },
+ {
+ "epoch": 30,
+ "train_loss": 5.332048937377929,
+ "train_acc": 0.00954,
+ "test_loss": 5.513208132934571,
+ "test_acc": 0.01,
+ "lyapunov": 1.550695708035813,
+ "grad_norm": 1.1118821287367113,
+ "grad_max_sv": 0.019531637569889425,
+ "grad_min_sv": 1.0689040165877983e-16,
+ "grad_condition": 19522880900.554432,
+ "lr": 0.0009045084971874733,
+ "time_sec": 132.11267638206482
+ },
+ {
+ "epoch": 31,
+ "train_loss": 5.326176876373291,
+ "train_acc": 0.00918,
+ "test_loss": 5.386148994445801,
+ "test_acc": 0.01,
+ "lyapunov": 1.5464019519288827,
+ "grad_norm": 0.5069935542454341,
+ "grad_max_sv": 0.054698918107897045,
+ "grad_min_sv": 3.7386723818325515e-15,
+ "grad_condition": 54294495664.74051,
+ "lr": 0.0008982649590120977,
+ "time_sec": 132.1673936843872
+ },
+ {
+ "epoch": 32,
+ "train_loss": 5.322083574829102,
+ "train_acc": 0.01,
+ "test_loss": 4.707043412780762,
+ "test_acc": 0.01,
+ "lyapunov": 1.544298157667565,
+ "grad_norm": 0.42554937796746406,
+ "grad_max_sv": 0.04392390437424183,
+ "grad_min_sv": 2.3012806918730416e-16,
+ "grad_condition": 43903285638.58012,
+ "lr": 0.0008918467286629196,
+ "time_sec": 132.18636798858643
+ },
+ {
+ "epoch": 33,
+ "train_loss": 5.328476766967773,
+ "train_acc": 0.00958,
+ "test_loss": 5.157709109497071,
+ "test_acc": 0.01,
+ "lyapunov": 1.5494323496318534,
+ "grad_norm": 0.3948590073220422,
+ "grad_max_sv": 0.046419868059456346,
+ "grad_min_sv": 3.920453121241332e-16,
+ "grad_condition": 46387197576.51258,
+ "lr": 0.0008852566213878943,
+ "time_sec": 132.14906311035156
+ },
+ {
+ "epoch": 34,
+ "train_loss": 5.335322699432373,
+ "train_acc": 0.00912,
+ "test_loss": 4.63318578491211,
+ "test_acc": 0.01,
+ "lyapunov": 1.5560249096292365,
+ "grad_norm": 0.3431205276749687,
+ "grad_max_sv": 0.006924860086292029,
+ "grad_min_sv": 0.0,
+ "grad_condition": 6924860086.292028,
+ "lr": 0.000878497527825878,
+ "time_sec": 132.08630466461182
+ },
+ {
+ "epoch": 35,
+ "train_loss": 5.323294322357178,
+ "train_acc": 0.00884,
+ "test_loss": 4.605205520629883,
+ "test_acc": 0.01,
+ "lyapunov": 1.5453313735439955,
+ "grad_norm": 0.3024735245825119,
+ "grad_max_sv": 0.028930858056992293,
+ "grad_min_sv": 0.0,
+ "grad_condition": 28930858056.9923,
+ "lr": 0.000871572412738697,
+ "time_sec": 132.11405229568481
+ },
+ {
+ "epoch": 36,
+ "train_loss": 5.324136592712402,
+ "train_acc": 0.00868,
+ "test_loss": 4.605186470031739,
+ "test_acc": 0.01,
+ "lyapunov": 1.5469522064604113,
+ "grad_norm": 0.361219602695028,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008644843137107055,
+ "time_sec": 132.07118153572083
+ },
+ {
+ "epoch": 37,
+ "train_loss": 5.3209700448608395,
+ "train_acc": 0.00892,
+ "test_loss": 4.665984559631347,
+ "test_acc": 0.01,
+ "lyapunov": 1.5437110970392252,
+ "grad_norm": 0.3116729659195542,
+ "grad_max_sv": 0.020941149955615402,
+ "grad_min_sv": 0.0,
+ "grad_condition": 20941149955.6154,
+ "lr": 0.0008572363398164014,
+ "time_sec": 132.09318017959595
+ },
+ {
+ "epoch": 38,
+ "train_loss": 5.325020372467041,
+ "train_acc": 0.00874,
+ "test_loss": 4.663543145751953,
+ "test_acc": 0.01,
+ "lyapunov": 1.5469195239074396,
+ "grad_norm": 0.305903104498294,
+ "grad_max_sv": 0.024645538488402962,
+ "grad_min_sv": 0.0,
+ "grad_condition": 24645538488.40296,
+ "lr": 0.0008498316702566826,
+ "time_sec": 132.18630456924438
+ },
+ {
+ "epoch": 39,
+ "train_loss": 5.326424997558593,
+ "train_acc": 0.00926,
+ "test_loss": 4.710470159912109,
+ "test_acc": 0.01,
+ "lyapunov": 1.5472500924868962,
+ "grad_norm": 0.3315518442712431,
+ "grad_max_sv": 0.03559725326485932,
+ "grad_min_sv": 4.71556170988084e-33,
+ "grad_condition": 35597253264.859314,
+ "lr": 0.0008422735529643442,
+ "time_sec": 132.1392993927002
+ },
+ {
+ "epoch": 40,
+ "train_loss": 5.33426462966919,
+ "train_acc": 0.0096,
+ "test_loss": 4.689337516784668,
+ "test_acc": 0.01,
+ "lyapunov": 1.555562095568918,
+ "grad_norm": 0.3795118996689083,
+ "grad_max_sv": 0.028565633855760098,
+ "grad_min_sv": 0.0,
+ "grad_condition": 28565633855.760094,
+ "lr": 0.0008345653031794289,
+ "time_sec": 132.12650513648987
+ },
+ {
+ "epoch": 41,
+ "train_loss": 5.329594454193115,
+ "train_acc": 0.00962,
+ "test_loss": 4.677967825317383,
+ "test_acc": 0.01,
+ "lyapunov": 1.5518201217626977,
+ "grad_norm": 0.35226874238427724,
+ "grad_max_sv": 0.031289939628914,
+ "grad_min_sv": 0.0,
+ "grad_condition": 31289939628.913994,
+ "lr": 0.0008267103019950526,
+ "time_sec": 132.1842393875122
+ },
+ {
+ "epoch": 42,
+ "train_loss": 5.334290416412354,
+ "train_acc": 0.00948,
+ "test_loss": 4.7127025581359865,
+ "test_acc": 0.01,
+ "lyapunov": 1.55599294903943,
+ "grad_norm": 0.3150010140468872,
+ "grad_max_sv": 0.008952232170850038,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8952232170.850039,
+ "lr": 0.0008187119948743447,
+ "time_sec": 132.16592741012573
+ },
+ {
+ "epoch": 43,
+ "train_loss": 5.330992495574951,
+ "train_acc": 0.00988,
+ "test_loss": 4.715853765869141,
+ "test_acc": 0.01,
+ "lyapunov": 1.5526615817223668,
+ "grad_norm": 0.32555598147833537,
+ "grad_max_sv": 0.025627513602375983,
+ "grad_min_sv": 0.0,
+ "grad_condition": 25627513602.375984,
+ "lr": 0.000810573890139155,
+ "time_sec": 132.1376314163208
+ },
+ {
+ "epoch": 44,
+ "train_loss": 5.342441840667725,
+ "train_acc": 0.009,
+ "test_loss": 4.814597158813476,
+ "test_acc": 0.01,
+ "lyapunov": 1.5608167011109764,
+ "grad_norm": 0.3705555621106487,
+ "grad_max_sv": 0.012277775909751654,
+ "grad_min_sv": 0.0,
+ "grad_condition": 12277775909.751654,
+ "lr": 0.0008022995574311873,
+ "time_sec": 132.10150909423828
+ },
+ {
+ "epoch": 45,
+ "train_loss": 5.330550760803223,
+ "train_acc": 0.00922,
+ "test_loss": 4.82506159362793,
+ "test_acc": 0.01,
+ "lyapunov": 1.552602043846989,
+ "grad_norm": 0.41377353743023604,
+ "grad_max_sv": 0.012684891000390053,
+ "grad_min_sv": 0.0,
+ "grad_condition": 12684891000.390053,
+ "lr": 0.0007938926261462363,
+ "time_sec": 132.13983154296875
+ },
+ {
+ "epoch": 46,
+ "train_loss": 5.346614602661133,
+ "train_acc": 0.00908,
+ "test_loss": 4.75941802444458,
+ "test_acc": 0.01,
+ "lyapunov": 1.565407470059212,
+ "grad_norm": 0.6666703677397586,
+ "grad_max_sv": 0.0006472387816756964,
+ "grad_min_sv": 0.0,
+ "grad_condition": 647238781.6756964,
+ "lr": 0.0007853567838422158,
+ "time_sec": 132.07343816757202
+ },
+ {
+ "epoch": 47,
+ "train_loss": 5.32947943145752,
+ "train_acc": 0.00898,
+ "test_loss": 4.822898616027832,
+ "test_acc": 0.01,
+ "lyapunov": 1.5532338082637933,
+ "grad_norm": 1.2230171967365666,
+ "grad_max_sv": 0.011994929099455477,
+ "grad_min_sv": 0.0,
+ "grad_condition": 11994929099.455475,
+ "lr": 0.0007766957746216719,
+ "time_sec": 132.13085794448853
+ },
+ {
+ "epoch": 48,
+ "train_loss": 5.3338893869018555,
+ "train_acc": 0.0092,
+ "test_loss": 4.843168624877929,
+ "test_acc": 0.01,
+ "lyapunov": 1.5537122622170412,
+ "grad_norm": 0.9355731457390791,
+ "grad_max_sv": 0.06068415185436606,
+ "grad_min_sv": 1.5809611954265782e-13,
+ "grad_condition": 46398377146.35246,
+ "lr": 0.0007679133974894982,
+ "time_sec": 132.11377477645874
+ },
+ {
+ "epoch": 49,
+ "train_loss": 5.340212641296387,
+ "train_acc": 0.00966,
+ "test_loss": 4.808492147827148,
+ "test_acc": 0.01,
+ "lyapunov": 1.556026118490702,
+ "grad_norm": 0.3770156243368251,
+ "grad_max_sv": 0.1463914191350341,
+ "grad_min_sv": 3.152568142733814e-13,
+ "grad_condition": 121760995460.97897,
+ "lr": 0.000759013504686565,
+ "time_sec": 132.2147512435913
+ },
+ {
+ "epoch": 50,
+ "train_loss": 5.332282363586426,
+ "train_acc": 0.0096,
+ "test_loss": 4.743034214782715,
+ "test_acc": 0.01,
+ "lyapunov": 1.5524532118111924,
+ "grad_norm": 0.3116530039130024,
+ "grad_max_sv": 0.10226385369896888,
+ "grad_min_sv": 3.0737180401130916e-15,
+ "grad_condition": 101953179254.12184,
+ "lr": 0.0007499999999999998,
+ "time_sec": 132.22958421707153
+ },
+ {
+ "epoch": 51,
+ "train_loss": 5.3305883631896975,
+ "train_acc": 0.00952,
+ "test_loss": 4.724603568267822,
+ "test_acc": 0.01,
+ "lyapunov": 1.5518521100968656,
+ "grad_norm": 0.3241210515609679,
+ "grad_max_sv": 0.08684249427169562,
+ "grad_min_sv": 6.328097683852358e-16,
+ "grad_condition": 86783867952.95651,
+ "lr": 0.0007408768370508575,
+ "time_sec": 132.19532179832458
+ },
+ {
+ "epoch": 52,
+ "train_loss": 5.332131455078125,
+ "train_acc": 0.00964,
+ "test_loss": 4.782391441345215,
+ "test_acc": 0.01,
+ "lyapunov": 1.5542255048556706,
+ "grad_norm": 0.32295260623787486,
+ "grad_max_sv": 0.077319351490587,
+ "grad_min_sv": 1.8882153881334225e-23,
+ "grad_condition": 77319351489.28442,
+ "lr": 0.0007316480175599307,
+ "time_sec": 132.21878457069397
+ },
+ {
+ "epoch": 53,
+ "train_loss": 5.333503689270019,
+ "train_acc": 0.00936,
+ "test_loss": 4.801981381225586,
+ "test_acc": 0.01,
+ "lyapunov": 1.5553877649404813,
+ "grad_norm": 0.31562374196715365,
+ "grad_max_sv": 0.06292690904811024,
+ "grad_min_sv": 1.0573404187094843e-32,
+ "grad_condition": 62926909048.110245,
+ "lr": 0.0007223175895924635,
+ "time_sec": 132.18660378456116
+ },
+ {
+ "epoch": 54,
+ "train_loss": 5.333852608795166,
+ "train_acc": 0.00896,
+ "test_loss": 4.810883659362793,
+ "test_acc": 0.01,
+ "lyapunov": 1.5559345386217318,
+ "grad_norm": 0.2781133113627033,
+ "grad_max_sv": 0.06129774982109666,
+ "grad_min_sv": 2.855284741973353e-38,
+ "grad_condition": 61297749821.09666,
+ "lr": 0.0007128896457825361,
+ "time_sec": 132.2198555469513
+ },
+ {
+ "epoch": 55,
+ "train_loss": 5.3339955087280275,
+ "train_acc": 0.00996,
+ "test_loss": 4.7569840606689455,
+ "test_acc": 0.01,
+ "lyapunov": 1.5569808833739336,
+ "grad_norm": 0.2566538491911281,
+ "grad_max_sv": 0.05556260636076331,
+ "grad_min_sv": 0.0,
+ "grad_condition": 55562606360.763306,
+ "lr": 0.0007033683215378998,
+ "time_sec": 132.21158051490784
+ },
+ {
+ "epoch": 56,
+ "train_loss": 5.3385576313781735,
+ "train_acc": 0.00902,
+ "test_loss": 4.754797148895264,
+ "test_acc": 0.01,
+ "lyapunov": 1.5597065461566075,
+ "grad_norm": 0.27047724542782614,
+ "grad_max_sv": 0.0640806739218533,
+ "grad_min_sv": 1.2193818893472967e-19,
+ "grad_condition": 64080664167.18032,
+ "lr": 0.0006937577932260512,
+ "time_sec": 132.19129037857056
+ },
+ {
+ "epoch": 57,
+ "train_loss": 5.334184418182373,
+ "train_acc": 0.0103,
+ "test_loss": 4.782689431762695,
+ "test_acc": 0.01,
+ "lyapunov": 1.556523521842859,
+ "grad_norm": 0.29259577039987816,
+ "grad_max_sv": 0.07542139226570725,
+ "grad_min_sv": 8.844145625485828e-17,
+ "grad_condition": 75415188010.71097,
+ "lr": 0.0006840622763423388,
+ "time_sec": 132.19539308547974
+ },
+ {
+ "epoch": 58,
+ "train_loss": 5.3342736126708985,
+ "train_acc": 0.00902,
+ "test_loss": 4.792922207641602,
+ "test_acc": 0.01,
+ "lyapunov": 1.556638328925423,
+ "grad_norm": 0.27651642414760924,
+ "grad_max_sv": 0.07381959799677133,
+ "grad_min_sv": 5.679191077750394e-25,
+ "grad_condition": 73819597996.72554,
+ "lr": 0.0006742860236609073,
+ "time_sec": 132.1646604537964
+ },
+ {
+ "epoch": 59,
+ "train_loss": 5.3365766784667965,
+ "train_acc": 0.00976,
+ "test_loss": 4.764654750061035,
+ "test_acc": 0.01,
+ "lyapunov": 1.559028771527283,
+ "grad_norm": 0.32368701389084115,
+ "grad_max_sv": 0.06830886630341411,
+ "grad_min_sv": 3.373213421233685e-18,
+ "grad_condition": 68308625699.52162,
+ "lr": 0.0006644333233692913,
+ "time_sec": 132.20315170288086
+ },
+ {
+ "epoch": 60,
+ "train_loss": 5.3372549061584476,
+ "train_acc": 0.00876,
+ "test_loss": 4.821174919128418,
+ "test_acc": 0.01,
+ "lyapunov": 1.5602548335824171,
+ "grad_norm": 0.3407373955115073,
+ "grad_max_sv": 0.05221205474808812,
+ "grad_min_sv": 0.0,
+ "grad_condition": 52212054748.08812,
+ "lr": 0.0006545084971874734,
+ "time_sec": 132.21871399879456
+ },
+ {
+ "epoch": 61,
+ "train_loss": 5.340573087158203,
+ "train_acc": 0.01004,
+ "test_loss": 4.814465225219727,
+ "test_acc": 0.01,
+ "lyapunov": 1.5639353786283137,
+ "grad_norm": 0.33445562902063697,
+ "grad_max_sv": 0.04306556633673608,
+ "grad_min_sv": 0.0,
+ "grad_condition": 43065566336.736084,
+ "lr": 0.0006445158984722354,
+ "time_sec": 132.16924214363098
+ },
+ {
+ "epoch": 62,
+ "train_loss": 5.343714674987793,
+ "train_acc": 0.0095,
+ "test_loss": 4.770381900024414,
+ "test_acc": 0.01,
+ "lyapunov": 1.566701197258347,
+ "grad_norm": 0.41600975854497274,
+ "grad_max_sv": 0.0407159102614969,
+ "grad_min_sv": 0.0,
+ "grad_condition": 40715910261.4969,
+ "lr": 0.0006344599103076324,
+ "time_sec": 132.14849257469177
+ },
+ {
+ "epoch": 63,
+ "train_loss": 5.340150414581299,
+ "train_acc": 0.00942,
+ "test_loss": 4.809834826660156,
+ "test_acc": 0.01,
+ "lyapunov": 1.5634946268232888,
+ "grad_norm": 0.4244404576721166,
+ "grad_max_sv": 0.046563083119690415,
+ "grad_min_sv": 0.0,
+ "grad_condition": 46563083119.690414,
+ "lr": 0.0006243449435824269,
+ "time_sec": 132.2440116405487
+ },
+ {
+ "epoch": 64,
+ "train_loss": 5.352264609527588,
+ "train_acc": 0.00968,
+ "test_loss": 4.719538593292237,
+ "test_acc": 0.01,
+ "lyapunov": 1.5730204283428924,
+ "grad_norm": 0.6484058447373605,
+ "grad_max_sv": 0.06881329002790153,
+ "grad_min_sv": 4.045636130762067e-11,
+ "grad_condition": 57057261120.16382,
+ "lr": 0.0006141754350553275,
+ "time_sec": 132.1377170085907
+ },
+ {
+ "epoch": 65,
+ "train_loss": 5.345465493011474,
+ "train_acc": 0.0095,
+ "test_loss": 4.807828170013428,
+ "test_acc": 0.01,
+ "lyapunov": 1.5668580141823616,
+ "grad_norm": 0.26811037405238153,
+ "grad_max_sv": 0.0895066935569048,
+ "grad_min_sv": 8.923440580685122e-16,
+ "grad_condition": 89405744261.32881,
+ "lr": 0.0006039558454088793,
+ "time_sec": 132.18963503837585
+ },
+ {
+ "epoch": 66,
+ "train_loss": 5.339095722351074,
+ "train_acc": 0.00992,
+ "test_loss": 4.79014116973877,
+ "test_acc": 0.01,
+ "lyapunov": 1.562422338044247,
+ "grad_norm": 0.2418134006072333,
+ "grad_max_sv": 0.04957848088815808,
+ "grad_min_sv": 0.0,
+ "grad_condition": 49578480888.15808,
+ "lr": 0.000593690657292862,
+ "time_sec": 132.18193554878235
+ },
+ {
+ "epoch": 67,
+ "train_loss": 5.339143208312988,
+ "train_acc": 0.00878,
+ "test_loss": 4.846720378875732,
+ "test_acc": 0.01,
+ "lyapunov": 1.5629626052153995,
+ "grad_norm": 0.23211875934280046,
+ "grad_max_sv": 0.04276521084830165,
+ "grad_min_sv": 0.0,
+ "grad_condition": 42765210848.30165,
+ "lr": 0.0005833843733580507,
+ "time_sec": 132.21098923683167
+ },
+ {
+ "epoch": 68,
+ "train_loss": 5.341660294799805,
+ "train_acc": 0.00926,
+ "test_loss": 4.93624571685791,
+ "test_acc": 0.01,
+ "lyapunov": 1.5647895671522525,
+ "grad_norm": 0.25226724531209027,
+ "grad_max_sv": 0.04243421019054949,
+ "grad_min_sv": 0.0,
+ "grad_condition": 42434210190.54949,
+ "lr": 0.0005730415142812054,
+ "time_sec": 132.18032026290894
+ },
+ {
+ "epoch": 69,
+ "train_loss": 5.3429354066467285,
+ "train_acc": 0.00964,
+ "test_loss": 4.963717977905273,
+ "test_acc": 0.01,
+ "lyapunov": 1.5658744921159866,
+ "grad_norm": 0.26387680813745,
+ "grad_max_sv": 0.044778031017631295,
+ "grad_min_sv": 0.0,
+ "grad_condition": 44778031017.63129,
+ "lr": 0.0005626666167821517,
+ "time_sec": 132.16022729873657
+ },
+ {
+ "epoch": 70,
+ "train_loss": 5.344523805389405,
+ "train_acc": 0.0091,
+ "test_loss": 4.810392481231689,
+ "test_acc": 0.01,
+ "lyapunov": 1.5665253672148565,
+ "grad_norm": 0.31439106456207916,
+ "grad_max_sv": 0.03966532703489065,
+ "grad_min_sv": 0.0,
+ "grad_condition": 39665327034.890656,
+ "lr": 0.0005522642316338265,
+ "time_sec": 132.1867744922638
+ },
+ {
+ "epoch": 71,
+ "train_loss": 5.346882275238037,
+ "train_acc": 0.00912,
+ "test_loss": 4.778971862792969,
+ "test_acc": 0.01,
+ "lyapunov": 1.568563460998828,
+ "grad_norm": 0.20952619953519083,
+ "grad_max_sv": 0.03776215887628496,
+ "grad_min_sv": 0.0,
+ "grad_condition": 37762158876.28496,
+ "lr": 0.0005418389216661573,
+ "time_sec": 132.18875670433044
+ },
+ {
+ "epoch": 72,
+ "train_loss": 5.353162684936524,
+ "train_acc": 0.00818,
+ "test_loss": 4.764224601745606,
+ "test_acc": 0.01,
+ "lyapunov": 1.5738632352760686,
+ "grad_norm": 0.21224191589739633,
+ "grad_max_sv": 0.02936461050994694,
+ "grad_min_sv": 0.0,
+ "grad_condition": 29364610509.94694,
+ "lr": 0.0005313952597646563,
+ "time_sec": 132.16054940223694
+ },
+ {
+ "epoch": 73,
+ "train_loss": 5.341572857055664,
+ "train_acc": 0.00934,
+ "test_loss": 4.764213945770264,
+ "test_acc": 0.01,
+ "lyapunov": 1.5656722372450183,
+ "grad_norm": 0.17131578138452824,
+ "grad_max_sv": 0.026255082851275802,
+ "grad_min_sv": 0.0,
+ "grad_condition": 26255082851.275803,
+ "lr": 0.0005209378268645994,
+ "time_sec": 132.11386466026306
+ },
+ {
+ "epoch": 74,
+ "train_loss": 5.34148181564331,
+ "train_acc": 0.00884,
+ "test_loss": 4.787430990600586,
+ "test_acc": 0.01,
+ "lyapunov": 1.5657289049509542,
+ "grad_norm": 0.20416273686306285,
+ "grad_max_sv": 0.03651727414689958,
+ "grad_min_sv": 0.0,
+ "grad_condition": 36517274146.89958,
+ "lr": 0.0005104712099416781,
+ "time_sec": 132.2018940448761
+ },
+ {
+ "epoch": 75,
+ "train_loss": 5.341119176330566,
+ "train_acc": 0.00948,
+ "test_loss": 4.769783227539063,
+ "test_acc": 0.01,
+ "lyapunov": 1.5654692183370176,
+ "grad_norm": 0.17080101166392242,
+ "grad_max_sv": 0.030799029115587472,
+ "grad_min_sv": 0.0,
+ "grad_condition": 30799029115.587475,
+ "lr": 0.0004999999999999996,
+ "time_sec": 132.12539839744568
+ },
+ {
+ "epoch": 76,
+ "train_loss": 5.345115729370117,
+ "train_acc": 0.00946,
+ "test_loss": 4.734894322967529,
+ "test_acc": 0.01,
+ "lyapunov": 1.5686149972174175,
+ "grad_norm": 0.18659944764551223,
+ "grad_max_sv": 0.012125130696222185,
+ "grad_min_sv": 0.0,
+ "grad_condition": 12125130696.222187,
+ "lr": 0.0004895287900583212,
+ "time_sec": 132.09123158454895
+ },
+ {
+ "epoch": 77,
+ "train_loss": 5.338459321289062,
+ "train_acc": 0.0094,
+ "test_loss": 4.7248460479736325,
+ "test_acc": 0.01,
+ "lyapunov": 1.5630621724116527,
+ "grad_norm": 0.176032379936258,
+ "grad_max_sv": 0.013429323118180037,
+ "grad_min_sv": 0.0,
+ "grad_condition": 13429323118.180037,
+ "lr": 0.0004790621731353997,
+ "time_sec": 132.07102465629578
+ },
+ {
+ "epoch": 78,
+ "train_loss": 5.345072369537354,
+ "train_acc": 0.00896,
+ "test_loss": 4.745542971801758,
+ "test_acc": 0.01,
+ "lyapunov": 1.5687669668051287,
+ "grad_norm": 0.2223520771526132,
+ "grad_max_sv": 0.00913866781629622,
+ "grad_min_sv": 0.0,
+ "grad_condition": 9138667816.29622,
+ "lr": 0.000468604740235343,
+ "time_sec": 132.31091713905334
+ },
+ {
+ "epoch": 79,
+ "train_loss": 5.338468246459961,
+ "train_acc": 0.00906,
+ "test_loss": 4.776708003234863,
+ "test_acc": 0.01,
+ "lyapunov": 1.5631554016981588,
+ "grad_norm": 0.18439021291098787,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00045816107833384175,
+ "time_sec": 132.1099407672882
+ },
+ {
+ "epoch": 80,
+ "train_loss": 5.3392803921508785,
+ "train_acc": 0.0085,
+ "test_loss": 4.756961068725586,
+ "test_acc": 0.01,
+ "lyapunov": 1.5640239118005308,
+ "grad_norm": 0.1670344381602521,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004477357683661729,
+ "time_sec": 132.07850074768066
+ },
+ {
+ "epoch": 81,
+ "train_loss": 5.338647942352295,
+ "train_acc": 0.00896,
+ "test_loss": 4.738301519775391,
+ "test_acc": 0.01,
+ "lyapunov": 1.563378708441849,
+ "grad_norm": 0.15920625845312916,
+ "grad_max_sv": 0.012282294360920787,
+ "grad_min_sv": 0.0,
+ "grad_condition": 12282294360.920788,
+ "lr": 0.00043733338321784746,
+ "time_sec": 132.09186792373657
+ },
+ {
+ "epoch": 82,
+ "train_loss": 5.339479166107178,
+ "train_acc": 0.0092,
+ "test_loss": 4.714014392089844,
+ "test_acc": 0.01,
+ "lyapunov": 1.5639294709086113,
+ "grad_norm": 0.1731138874132484,
+ "grad_max_sv": 0.03721864921972155,
+ "grad_min_sv": 0.0,
+ "grad_condition": 37218649219.72156,
+ "lr": 0.0004269584857187939,
+ "time_sec": 132.1542615890503
+ },
+ {
+ "epoch": 83,
+ "train_loss": 5.345089318237305,
+ "train_acc": 0.00928,
+ "test_loss": 4.7151237457275395,
+ "test_acc": 0.01,
+ "lyapunov": 1.5680857643751842,
+ "grad_norm": 0.1866415261285155,
+ "grad_max_sv": 0.03729230999015272,
+ "grad_min_sv": 0.0,
+ "grad_condition": 37292309990.152725,
+ "lr": 0.0004166156266419484,
+ "time_sec": 132.18493914604187
+ },
+ {
+ "epoch": 84,
+ "train_loss": 5.345381183319092,
+ "train_acc": 0.00918,
+ "test_loss": 4.68825431060791,
+ "test_acc": 0.01,
+ "lyapunov": 1.568592563309633,
+ "grad_norm": 0.1882901347639973,
+ "grad_max_sv": 0.021022121235728265,
+ "grad_min_sv": 0.0,
+ "grad_condition": 21022121235.728264,
+ "lr": 0.0004063093427071373,
+ "time_sec": 132.12367796897888
+ },
+ {
+ "epoch": 85,
+ "train_loss": 5.340999842681884,
+ "train_acc": 0.00992,
+ "test_loss": 4.716685279846192,
+ "test_acc": 0.01,
+ "lyapunov": 1.5657545608632706,
+ "grad_norm": 0.20177951961733773,
+ "grad_max_sv": 0.01230331021361053,
+ "grad_min_sv": 0.0,
+ "grad_condition": 12303310213.610529,
+ "lr": 0.0003960441545911199,
+ "time_sec": 132.0947766304016
+ },
+ {
+ "epoch": 86,
+ "train_loss": 5.344697039794922,
+ "train_acc": 0.00906,
+ "test_loss": 4.770621002197266,
+ "test_acc": 0.01,
+ "lyapunov": 1.5692900818632083,
+ "grad_norm": 0.20891700571465235,
+ "grad_max_sv": 0.013876684103161096,
+ "grad_min_sv": 0.0,
+ "grad_condition": 13876684103.161098,
+ "lr": 0.0003858245649446718,
+ "time_sec": 132.09650421142578
+ },
+ {
+ "epoch": 87,
+ "train_loss": 5.346022133178711,
+ "train_acc": 0.00958,
+ "test_loss": 4.825743739318848,
+ "test_acc": 0.01,
+ "lyapunov": 1.5695690389179513,
+ "grad_norm": 0.23167422762918993,
+ "grad_max_sv": 0.0037465339992195368,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3746533999.219537,
+ "lr": 0.00037565505641757235,
+ "time_sec": 132.0917444229126
+ },
+ {
+ "epoch": 88,
+ "train_loss": 5.346828841705323,
+ "train_acc": 0.00876,
+ "test_loss": 4.960531255340576,
+ "test_acc": 0.01,
+ "lyapunov": 1.5696865573258656,
+ "grad_norm": 0.1785675731490032,
+ "grad_max_sv": 0.005577366659417748,
+ "grad_min_sv": 0.0,
+ "grad_condition": 5577366659.417749,
+ "lr": 0.00036554008969236695,
+ "time_sec": 132.0870282649994
+ },
+ {
+ "epoch": 89,
+ "train_loss": 5.342154947357177,
+ "train_acc": 0.00878,
+ "test_loss": 4.975327129364014,
+ "test_acc": 0.01,
+ "lyapunov": 1.5665336716205567,
+ "grad_norm": 0.16793525655934358,
+ "grad_max_sv": 0.00797480964101851,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7974809641.018509,
+ "lr": 0.0003554841015277638,
+ "time_sec": 132.12742161750793
+ },
+ {
+ "epoch": 90,
+ "train_loss": 5.346710361175537,
+ "train_acc": 0.00918,
+ "test_loss": 4.953879835510254,
+ "test_acc": 0.01,
+ "lyapunov": 1.5700483614831324,
+ "grad_norm": 0.18433712454121046,
+ "grad_max_sv": 0.012014600727707148,
+ "grad_min_sv": 0.0,
+ "grad_condition": 12014600727.707148,
+ "lr": 0.000345491502812526,
+ "time_sec": 132.0858714580536
+ },
+ {
+ "epoch": 91,
+ "train_loss": 5.341808082733154,
+ "train_acc": 0.00856,
+ "test_loss": 5.010934870910645,
+ "test_acc": 0.01,
+ "lyapunov": 1.566529265754973,
+ "grad_norm": 0.1758408454253638,
+ "grad_max_sv": 0.003343093441799283,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3343093441.799283,
+ "lr": 0.0003355666766307081,
+ "time_sec": 132.0660150051117
+ },
+ {
+ "epoch": 92,
+ "train_loss": 5.351253204956055,
+ "train_acc": 0.00918,
+ "test_loss": 5.023424221801758,
+ "test_acc": 0.01,
+ "lyapunov": 1.5723978284069948,
+ "grad_norm": 0.17788255301821657,
+ "grad_max_sv": 0.014162034029141068,
+ "grad_min_sv": 0.0,
+ "grad_condition": 14162034029.141071,
+ "lr": 0.00032571397633909225,
+ "time_sec": 132.10221076011658
+ },
+ {
+ "epoch": 93,
+ "train_loss": 5.347586841278076,
+ "train_acc": 0.00884,
+ "test_loss": 4.963154336547851,
+ "test_acc": 0.01,
+ "lyapunov": 1.5719817017045472,
+ "grad_norm": 0.2369860248003482,
+ "grad_max_sv": 0.004905311437323689,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4905311437.323689,
+ "lr": 0.00031593772365766094,
+ "time_sec": 132.1323049068451
+ },
+ {
+ "epoch": 94,
+ "train_loss": 5.343141855926514,
+ "train_acc": 0.00848,
+ "test_loss": 4.921149578094482,
+ "test_acc": 0.01,
+ "lyapunov": 1.5679576765850682,
+ "grad_norm": 0.1602509536119079,
+ "grad_max_sv": 0.019888732209801675,
+ "grad_min_sv": 0.0,
+ "grad_condition": 19888732209.801674,
+ "lr": 0.0003062422067739483,
+ "time_sec": 132.1422688961029
+ },
+ {
+ "epoch": 95,
+ "train_loss": 5.343594031066894,
+ "train_acc": 0.00906,
+ "test_loss": 4.905448650360108,
+ "test_acc": 0.01,
+ "lyapunov": 1.5682554074260584,
+ "grad_norm": 0.17541418565565223,
+ "grad_max_sv": 0.009854677692055702,
+ "grad_min_sv": 0.0,
+ "grad_condition": 9854677692.055702,
+ "lr": 0.00029663167846209965,
+ "time_sec": 132.11462831497192
+ },
+ {
+ "epoch": 96,
+ "train_loss": 5.341661099700928,
+ "train_acc": 0.00938,
+ "test_loss": 4.896561671447754,
+ "test_acc": 0.01,
+ "lyapunov": 1.566467627539964,
+ "grad_norm": 0.18126299601196125,
+ "grad_max_sv": 0.013893446559086442,
+ "grad_min_sv": 0.0,
+ "grad_condition": 13893446559.086445,
+ "lr": 0.00028711035421746345,
+ "time_sec": 132.183189868927
+ },
+ {
+ "epoch": 97,
+ "train_loss": 5.341162901000977,
+ "train_acc": 0.00872,
+ "test_loss": 4.906980642700195,
+ "test_acc": 0.01,
+ "lyapunov": 1.5660171655132948,
+ "grad_norm": 0.18389173404235654,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00027768241040753615,
+ "time_sec": 132.1316442489624
+ },
+ {
+ "epoch": 98,
+ "train_loss": 5.340904234008789,
+ "train_acc": 0.0087,
+ "test_loss": 4.880604965209961,
+ "test_acc": 0.01,
+ "lyapunov": 1.5657722669489242,
+ "grad_norm": 0.16941469287847527,
+ "grad_max_sv": 0.0025681605096906424,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2568160509.6906424,
+ "lr": 0.00026835198244006903,
+ "time_sec": 132.0789442062378
+ },
+ {
+ "epoch": 99,
+ "train_loss": 5.342495626068115,
+ "train_acc": 0.00838,
+ "test_loss": 4.8667546737670895,
+ "test_acc": 0.01,
+ "lyapunov": 1.56737110986734,
+ "grad_norm": 0.2098824320936581,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002591231629491421,
+ "time_sec": 132.06338381767273
+ },
+ {
+ "epoch": 100,
+ "train_loss": 5.341140549468994,
+ "train_acc": 0.00882,
+ "test_loss": 4.923036535644531,
+ "test_acc": 0.01,
+ "lyapunov": 1.5660716353170097,
+ "grad_norm": 0.16309007942968,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002499999999999997,
+ "time_sec": 132.0798683166504
+ },
+ {
+ "epoch": 101,
+ "train_loss": 5.367573778076172,
+ "train_acc": 0.00942,
+ "test_loss": 4.8419834274291995,
+ "test_acc": 0.01,
+ "lyapunov": 1.5839073743356769,
+ "grad_norm": 0.17849770970668777,
+ "grad_max_sv": 0.006972884247079492,
+ "grad_min_sv": 0.0,
+ "grad_condition": 6972884247.079493,
+ "lr": 0.00024098649531343477,
+ "time_sec": 132.07039666175842
+ },
+ {
+ "epoch": 102,
+ "train_loss": 5.3430040219116215,
+ "train_acc": 0.00878,
+ "test_loss": 4.867986113739014,
+ "test_acc": 0.01,
+ "lyapunov": 1.5680094472587567,
+ "grad_norm": 0.17231990573343864,
+ "grad_max_sv": 0.002580128749832511,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2580128749.832511,
+ "lr": 0.0002320866025105016,
+ "time_sec": 132.0873384475708
+ },
+ {
+ "epoch": 103,
+ "train_loss": 5.342889985504151,
+ "train_acc": 0.00874,
+ "test_loss": 4.840346334075928,
+ "test_acc": 0.01,
+ "lyapunov": 1.5678095716954497,
+ "grad_norm": 0.18603931144131847,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002233042253783278,
+ "time_sec": 132.0669243335724
+ },
+ {
+ "epoch": 104,
+ "train_loss": 5.345595389709473,
+ "train_acc": 0.00906,
+ "test_loss": 4.82763256072998,
+ "test_acc": 0.01,
+ "lyapunov": 1.5700134941379127,
+ "grad_norm": 0.17962506167998699,
+ "grad_max_sv": 0.0006658073514699935,
+ "grad_min_sv": 0.0,
+ "grad_condition": 665807351.4699936,
+ "lr": 0.000214643216157784,
+ "time_sec": 132.0985701084137
+ },
+ {
+ "epoch": 105,
+ "train_loss": 5.354534033508301,
+ "train_acc": 0.00898,
+ "test_loss": 4.813229525756836,
+ "test_acc": 0.01,
+ "lyapunov": 1.5754887292452175,
+ "grad_norm": 0.2002013331480914,
+ "grad_max_sv": 0.004350297572091222,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4350297572.091222,
+ "lr": 0.00020610737385376332,
+ "time_sec": 132.09686851501465
+ },
+ {
+ "epoch": 106,
+ "train_loss": 5.3426032342529295,
+ "train_acc": 0.00804,
+ "test_loss": 4.823688924407959,
+ "test_acc": 0.01,
+ "lyapunov": 1.567502071485495,
+ "grad_norm": 0.177797147662824,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00019770044256881242,
+ "time_sec": 132.1264684200287
+ },
+ {
+ "epoch": 107,
+ "train_loss": 5.349622652893067,
+ "train_acc": 0.00884,
+ "test_loss": 4.844220027923584,
+ "test_acc": 0.01,
+ "lyapunov": 1.571947547176,
+ "grad_norm": 0.16292252305474791,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001894261098608447,
+ "time_sec": 132.10880613327026
+ },
+ {
+ "epoch": 108,
+ "train_loss": 5.345900168304444,
+ "train_acc": 0.00918,
+ "test_loss": 4.840348344421387,
+ "test_acc": 0.01,
+ "lyapunov": 1.5703127265281385,
+ "grad_norm": 0.17468920430563006,
+ "grad_max_sv": 0.0029470635578036307,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2947063557.803631,
+ "lr": 0.000181288005125655,
+ "time_sec": 132.11736822128296
+ },
+ {
+ "epoch": 109,
+ "train_loss": 5.345384422454834,
+ "train_acc": 0.00874,
+ "test_loss": 4.8622421981811526,
+ "test_acc": 0.01,
+ "lyapunov": 1.5698327935870042,
+ "grad_norm": 0.21177276682423293,
+ "grad_max_sv": 0.0007724121678620577,
+ "grad_min_sv": 0.0,
+ "grad_condition": 772412167.8620577,
+ "lr": 0.0001732896980049473,
+ "time_sec": 132.07746076583862
+ },
+ {
+ "epoch": 110,
+ "train_loss": 5.342875657653809,
+ "train_acc": 0.00912,
+ "test_loss": 4.856573393249512,
+ "test_acc": 0.01,
+ "lyapunov": 1.5677888875117387,
+ "grad_norm": 0.16084383685322373,
+ "grad_max_sv": 0.013493797415867448,
+ "grad_min_sv": 0.0,
+ "grad_condition": 13493797415.867447,
+ "lr": 0.00016543469682057076,
+ "time_sec": 132.08074021339417
+ },
+ {
+ "epoch": 111,
+ "train_loss": 5.355080330505371,
+ "train_acc": 0.00822,
+ "test_loss": 4.830239296722412,
+ "test_acc": 0.01,
+ "lyapunov": 1.5756983775312028,
+ "grad_norm": 0.1959747570871713,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00015772644703565552,
+ "time_sec": 132.07752227783203
+ },
+ {
+ "epoch": 112,
+ "train_loss": 5.342228624572754,
+ "train_acc": 0.00892,
+ "test_loss": 4.84301993560791,
+ "test_acc": 0.01,
+ "lyapunov": 1.5673401697212472,
+ "grad_norm": 0.14204259013530204,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00015016832974331713,
+ "time_sec": 132.06180357933044
+ },
+ {
+ "epoch": 113,
+ "train_loss": 5.3422714726257325,
+ "train_acc": 0.00928,
+ "test_loss": 4.821010319519043,
+ "test_acc": 0.01,
+ "lyapunov": 1.5673690311744084,
+ "grad_norm": 0.1572610072392831,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00014276366018359834,
+ "time_sec": 132.09343099594116
+ },
+ {
+ "epoch": 114,
+ "train_loss": 5.3444528672790526,
+ "train_acc": 0.0086,
+ "test_loss": 4.83043311843872,
+ "test_acc": 0.01,
+ "lyapunov": 1.5691952199277366,
+ "grad_norm": 0.15397404749427382,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00013551568628929425,
+ "time_sec": 132.07117557525635
+ },
+ {
+ "epoch": 115,
+ "train_loss": 5.342576068572998,
+ "train_acc": 0.00892,
+ "test_loss": 4.83036664352417,
+ "test_acc": 0.01,
+ "lyapunov": 1.5677011345353578,
+ "grad_norm": 0.13531666387620547,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00012842758726130276,
+ "time_sec": 132.1246190071106
+ },
+ {
+ "epoch": 116,
+ "train_loss": 5.342390079040527,
+ "train_acc": 0.009,
+ "test_loss": 4.818707986450195,
+ "test_acc": 0.01,
+ "lyapunov": 1.5674945427023845,
+ "grad_norm": 0.11755267765049923,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001215024721741218,
+ "time_sec": 132.10427331924438
+ },
+ {
+ "epoch": 117,
+ "train_loss": 5.346578267517089,
+ "train_acc": 0.00914,
+ "test_loss": 4.808753877258301,
+ "test_acc": 0.01,
+ "lyapunov": 1.571015379617891,
+ "grad_norm": 0.14739866079910954,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00011474337861210538,
+ "time_sec": 132.09667372703552
+ },
+ {
+ "epoch": 118,
+ "train_loss": 5.341421314849853,
+ "train_acc": 0.00888,
+ "test_loss": 4.8178321044921875,
+ "test_acc": 0.01,
+ "lyapunov": 1.5664617289667544,
+ "grad_norm": 0.15196598686273202,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010815327133708009,
+ "time_sec": 132.09818243980408
+ },
+ {
+ "epoch": 119,
+ "train_loss": 5.342278069915771,
+ "train_acc": 0.00846,
+ "test_loss": 4.809390866088867,
+ "test_acc": 0.01,
+ "lyapunov": 1.5673773797881572,
+ "grad_norm": 0.17015255493793316,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010173504098790182,
+ "time_sec": 132.13357877731323
+ },
+ {
+ "epoch": 120,
+ "train_loss": 5.341155296783447,
+ "train_acc": 0.00878,
+ "test_loss": 4.819783433532715,
+ "test_acc": 0.01,
+ "lyapunov": 1.56620217955021,
+ "grad_norm": 0.13456226708171515,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 132.0805094242096
+ },
+ {
+ "epoch": 121,
+ "train_loss": 5.344341220397949,
+ "train_acc": 0.00942,
+ "test_loss": 4.812504239654541,
+ "test_acc": 0.01,
+ "lyapunov": 1.5690714410503808,
+ "grad_norm": 0.15635175889858405,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 132.10770106315613
+ },
+ {
+ "epoch": 122,
+ "train_loss": 5.341316756591797,
+ "train_acc": 0.00872,
+ "test_loss": 4.791230865478516,
+ "test_acc": 0.01,
+ "lyapunov": 1.5663795004720273,
+ "grad_norm": 0.13120586242402146,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 132.12851881980896
+ },
+ {
+ "epoch": 123,
+ "train_loss": 5.343846289520264,
+ "train_acc": 0.00826,
+ "test_loss": 4.791252892303467,
+ "test_acc": 0.01,
+ "lyapunov": 1.5686628943514032,
+ "grad_norm": 0.12574649548787997,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 132.11882972717285
+ },
+ {
+ "epoch": 124,
+ "train_loss": 5.341886834716797,
+ "train_acc": 0.00924,
+ "test_loss": 4.7894229957580565,
+ "test_acc": 0.01,
+ "lyapunov": 1.566991005712153,
+ "grad_norm": 0.12125233233583547,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 132.1242277622223
+ },
+ {
+ "epoch": 125,
+ "train_loss": 5.341545905151367,
+ "train_acc": 0.00844,
+ "test_loss": 4.781455255126953,
+ "test_acc": 0.01,
+ "lyapunov": 1.566652334559604,
+ "grad_norm": 0.11877593044343822,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 132.1204969882965
+ },
+ {
+ "epoch": 126,
+ "train_loss": 5.343738833465576,
+ "train_acc": 0.0089,
+ "test_loss": 4.782108512115479,
+ "test_acc": 0.01,
+ "lyapunov": 1.5686877148840435,
+ "grad_norm": 0.14685494918897216,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 132.1582751274109
+ },
+ {
+ "epoch": 127,
+ "train_loss": 5.340985955505371,
+ "train_acc": 0.0095,
+ "test_loss": 4.780940398406982,
+ "test_acc": 0.01,
+ "lyapunov": 1.5660363987583639,
+ "grad_norm": 0.11589911056077733,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 132.11265683174133
+ },
+ {
+ "epoch": 128,
+ "train_loss": 5.343754200744629,
+ "train_acc": 0.00968,
+ "test_loss": 4.7895281066894535,
+ "test_acc": 0.01,
+ "lyapunov": 1.5686014985184535,
+ "grad_norm": 0.14358686229070586,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 132.08578968048096
+ },
+ {
+ "epoch": 129,
+ "train_loss": 5.345564033660889,
+ "train_acc": 0.00894,
+ "test_loss": 4.789863642883301,
+ "test_acc": 0.01,
+ "lyapunov": 1.5702618372714734,
+ "grad_norm": 0.15311883643219684,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 132.07862830162048
+ },
+ {
+ "epoch": 130,
+ "train_loss": 5.342584033355713,
+ "train_acc": 0.00908,
+ "test_loss": 4.779020539093017,
+ "test_acc": 0.01,
+ "lyapunov": 1.5677639367940175,
+ "grad_norm": 0.15329364714098923,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 132.16318249702454
+ },
+ {
+ "epoch": 131,
+ "train_loss": 5.341682634429931,
+ "train_acc": 0.00944,
+ "test_loss": 4.782007501220703,
+ "test_acc": 0.01,
+ "lyapunov": 1.5667803564949718,
+ "grad_norm": 0.13761474702045567,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 132.10979580879211
+ },
+ {
+ "epoch": 132,
+ "train_loss": 5.342693343200684,
+ "train_acc": 0.00874,
+ "test_loss": 4.785680311584473,
+ "test_acc": 0.01,
+ "lyapunov": 1.5677480008596045,
+ "grad_norm": 0.14227357176692468,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 132.14933609962463
+ },
+ {
+ "epoch": 133,
+ "train_loss": 5.339641748504639,
+ "train_acc": 0.00948,
+ "test_loss": 4.7827409004211425,
+ "test_acc": 0.01,
+ "lyapunov": 1.5646268839726363,
+ "grad_norm": 0.11276908599413558,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 132.07238721847534
+ },
+ {
+ "epoch": 134,
+ "train_loss": 5.341200107269287,
+ "train_acc": 0.00926,
+ "test_loss": 4.787122599792481,
+ "test_acc": 0.01,
+ "lyapunov": 1.566309593217757,
+ "grad_norm": 0.11577298218878175,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 132.08721160888672
+ },
+ {
+ "epoch": 135,
+ "train_loss": 5.341790512847901,
+ "train_acc": 0.0089,
+ "test_loss": 4.78599192199707,
+ "test_acc": 0.01,
+ "lyapunov": 1.5669051058152144,
+ "grad_norm": 0.11406538673568321,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 132.13204169273376
+ },
+ {
+ "epoch": 136,
+ "train_loss": 5.342709656066894,
+ "train_acc": 0.0095,
+ "test_loss": 4.784429030609131,
+ "test_acc": 0.01,
+ "lyapunov": 1.5678098799322573,
+ "grad_norm": 0.1301621255904577,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 132.10533571243286
+ },
+ {
+ "epoch": 137,
+ "train_loss": 5.341824940795899,
+ "train_acc": 0.00922,
+ "test_loss": 4.7872933067321775,
+ "test_acc": 0.01,
+ "lyapunov": 1.5669465708305768,
+ "grad_norm": 0.11590542924579983,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 132.09704732894897
+ },
+ {
+ "epoch": 138,
+ "train_loss": 5.341511313171386,
+ "train_acc": 0.00974,
+ "test_loss": 4.7792837577819824,
+ "test_acc": 0.01,
+ "lyapunov": 1.5666430996507026,
+ "grad_norm": 0.11256165029712978,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 132.12034392356873
+ },
+ {
+ "epoch": 139,
+ "train_loss": 5.341457148132324,
+ "train_acc": 0.00972,
+ "test_loss": 4.780789426422119,
+ "test_acc": 0.01,
+ "lyapunov": 1.5665654376949496,
+ "grad_norm": 0.10204898242159913,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 132.14241123199463
+ },
+ {
+ "epoch": 140,
+ "train_loss": 5.3405984710693355,
+ "train_acc": 0.00948,
+ "test_loss": 4.778655993652344,
+ "test_acc": 0.01,
+ "lyapunov": 1.5656854539271206,
+ "grad_norm": 0.12809073544865285,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 132.08009314537048
+ },
+ {
+ "epoch": 141,
+ "train_loss": 5.340534744262695,
+ "train_acc": 0.0091,
+ "test_loss": 4.780472738647461,
+ "test_acc": 0.01,
+ "lyapunov": 1.5655692928587384,
+ "grad_norm": 0.10313184635997721,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 132.0838325023651
+ },
+ {
+ "epoch": 142,
+ "train_loss": 5.340677046051026,
+ "train_acc": 0.00992,
+ "test_loss": 4.781814497375488,
+ "test_acc": 0.01,
+ "lyapunov": 1.5657385788915101,
+ "grad_norm": 0.10334450883525552,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 132.11706686019897
+ },
+ {
+ "epoch": 143,
+ "train_loss": 5.341100224914551,
+ "train_acc": 0.01,
+ "test_loss": 4.7812304672241215,
+ "test_acc": 0.01,
+ "lyapunov": 1.5661775379839455,
+ "grad_norm": 0.1264085338408933,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 132.12464785575867
+ },
+ {
+ "epoch": 144,
+ "train_loss": 5.341793058776855,
+ "train_acc": 0.01,
+ "test_loss": 4.78042247467041,
+ "test_acc": 0.01,
+ "lyapunov": 1.5669281586356785,
+ "grad_norm": 0.09436149541511535,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 132.1470422744751
+ },
+ {
+ "epoch": 145,
+ "train_loss": 5.349506974182129,
+ "train_acc": 0.01,
+ "test_loss": 4.78042266998291,
+ "test_acc": 0.01,
+ "lyapunov": 1.5731076300906404,
+ "grad_norm": 0.1178995174742038,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 132.09918355941772
+ },
+ {
+ "epoch": 146,
+ "train_loss": 5.342189108886719,
+ "train_acc": 0.01,
+ "test_loss": 4.781454308319092,
+ "test_acc": 0.01,
+ "lyapunov": 1.5673414352909683,
+ "grad_norm": 0.09081347881139741,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 132.10713911056519
+ },
+ {
+ "epoch": 147,
+ "train_loss": 5.341546408996582,
+ "train_acc": 0.01,
+ "test_loss": 4.781454162597656,
+ "test_acc": 0.01,
+ "lyapunov": 1.5666629228445574,
+ "grad_norm": 0.09019678612458548,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 132.1311194896698
+ },
+ {
+ "epoch": 148,
+ "train_loss": 5.341715382995606,
+ "train_acc": 0.01,
+ "test_loss": 4.782687770843506,
+ "test_acc": 0.01,
+ "lyapunov": 1.5668335332894874,
+ "grad_norm": 0.09070167126439822,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 132.13174676895142
+ },
+ {
+ "epoch": 149,
+ "train_loss": 5.342021694946289,
+ "train_acc": 0.01,
+ "test_loss": 4.782687942504883,
+ "test_acc": 0.01,
+ "lyapunov": 1.5671642540056077,
+ "grad_norm": 0.09082797851606526,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 132.09515190124512
+ },
+ {
+ "epoch": 150,
+ "train_loss": 5.339607263183594,
+ "train_acc": 0.01,
+ "test_loss": 4.782687832641601,
+ "test_acc": 0.01,
+ "lyapunov": 1.5645978752609409,
+ "grad_norm": 0.090368422289998,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0,
+ "time_sec": 132.06873154640198
+ }
+ ],
+ "16": [
+ {
+ "epoch": 1,
+ "train_loss": 5.170418347930908,
+ "train_acc": 0.01482,
+ "test_loss": 4.874806223297119,
+ "test_acc": 0.0107,
+ "lyapunov": 2.4393880626429683,
+ "grad_norm": 5.345734057581178,
+ "grad_max_sv": 4.483905690908432,
+ "grad_min_sv": 8.954973220731688e-08,
+ "grad_condition": 129025189.7290709,
+ "lr": 0.0009998903417374227,
+ "time_sec": 177.46578431129456
+ },
+ {
+ "epoch": 2,
+ "train_loss": 4.886182316741944,
+ "train_acc": 0.01718,
+ "test_loss": 4.80269637298584,
+ "test_acc": 0.0102,
+ "lyapunov": 1.9971744041613606,
+ "grad_norm": 3.4433992950689616,
+ "grad_max_sv": 2.739058768749237,
+ "grad_min_sv": 5.745658385736263e-08,
+ "grad_condition": 84538548.49489692,
+ "lr": 0.0009995614150494292,
+ "time_sec": 177.3906273841858
+ },
+ {
+ "epoch": 3,
+ "train_loss": 4.783107050323486,
+ "train_acc": 0.01528,
+ "test_loss": 4.738721482086182,
+ "test_acc": 0.01,
+ "lyapunov": 1.8048184826550886,
+ "grad_norm": 2.047885898328211,
+ "grad_max_sv": 1.4787879481911659,
+ "grad_min_sv": 3.2768289852033726e-08,
+ "grad_condition": 566050825.5696664,
+ "lr": 0.0009990133642141358,
+ "time_sec": 177.4175295829773
+ },
+ {
+ "epoch": 4,
+ "train_loss": 4.751416029052734,
+ "train_acc": 0.01606,
+ "test_loss": 4.630446166992187,
+ "test_acc": 0.01,
+ "lyapunov": 1.707960840991086,
+ "grad_norm": 1.4476075782979456,
+ "grad_max_sv": 0.836699303984642,
+ "grad_min_sv": 1.4332362594222718e-08,
+ "grad_condition": 24679971260.08811,
+ "lr": 0.0009982464296247522,
+ "time_sec": 177.5156271457672
+ },
+ {
+ "epoch": 5,
+ "train_loss": 4.7807122309875485,
+ "train_acc": 0.01428,
+ "test_loss": 4.622669477844238,
+ "test_acc": 0.01,
+ "lyapunov": 1.7041781695602496,
+ "grad_norm": 1.050316146928851,
+ "grad_max_sv": 0.498383151658345,
+ "grad_min_sv": 3.796087105340611e-11,
+ "grad_condition": 139863529616.57062,
+ "lr": 0.0009972609476841367,
+ "time_sec": 177.43440508842468
+ },
+ {
+ "epoch": 6,
+ "train_loss": 4.8388256774902345,
+ "train_acc": 0.01308,
+ "test_loss": 4.649810864257812,
+ "test_acc": 0.01,
+ "lyapunov": 1.6965309613196136,
+ "grad_norm": 0.6788898927695144,
+ "grad_max_sv": 0.42595611810684203,
+ "grad_min_sv": 1.5628448124239113e-12,
+ "grad_condition": 206494283007.18826,
+ "lr": 0.000996057350657239,
+ "time_sec": 177.44785737991333
+ },
+ {
+ "epoch": 7,
+ "train_loss": 4.8986459965515134,
+ "train_acc": 0.01186,
+ "test_loss": 4.708990380859375,
+ "test_acc": 0.01,
+ "lyapunov": 1.7017012535763518,
+ "grad_norm": 0.48731250728585107,
+ "grad_max_sv": 0.33343438915908336,
+ "grad_min_sv": 5.53908882765212e-13,
+ "grad_condition": 254093723126.4781,
+ "lr": 0.000994636166481494,
+ "time_sec": 177.37777757644653
+ },
+ {
+ "epoch": 8,
+ "train_loss": 4.943858919830323,
+ "train_acc": 0.01104,
+ "test_loss": 5.26636118927002,
+ "test_acc": 0.01,
+ "lyapunov": 1.7182561540237777,
+ "grad_norm": 0.48999999014626605,
+ "grad_max_sv": 0.25608402006328107,
+ "grad_min_sv": 9.286946471073546e-14,
+ "grad_condition": 242351728116.98883,
+ "lr": 0.0009929980185352525,
+ "time_sec": 177.387188911438
+ },
+ {
+ "epoch": 9,
+ "train_loss": 4.979513124542236,
+ "train_acc": 0.01144,
+ "test_loss": 5.497952555084228,
+ "test_acc": 0.01,
+ "lyapunov": 1.7062027213518576,
+ "grad_norm": 0.42079758157884545,
+ "grad_max_sv": 0.2485219370573759,
+ "grad_min_sv": 1.885935727798404e-14,
+ "grad_condition": 245798317000.96808,
+ "lr": 0.0009911436253643444,
+ "time_sec": 177.38124251365662
+ },
+ {
+ "epoch": 10,
+ "train_loss": 5.0166656953430175,
+ "train_acc": 0.01076,
+ "test_loss": 4.605617906188965,
+ "test_acc": 0.01,
+ "lyapunov": 1.6932507491172732,
+ "grad_norm": 0.420321050632811,
+ "grad_max_sv": 0.2404270452912897,
+ "grad_min_sv": 9.577507932467198e-25,
+ "grad_condition": 240427045291.03647,
+ "lr": 0.0009890738003669028,
+ "time_sec": 177.3316354751587
+ },
+ {
+ "epoch": 11,
+ "train_loss": 5.0578450691223145,
+ "train_acc": 0.0114,
+ "test_loss": 4.605764473724365,
+ "test_acc": 0.01,
+ "lyapunov": 1.6895873580137482,
+ "grad_norm": 0.49178900029145406,
+ "grad_max_sv": 0.26607779785990715,
+ "grad_min_sv": 5.082064100170326e-21,
+ "grad_condition": 266077796409.95917,
+ "lr": 0.00098678945143658,
+ "time_sec": 177.35666227340698
+ },
+ {
+ "epoch": 12,
+ "train_loss": 5.092576569976806,
+ "train_acc": 0.01182,
+ "test_loss": 4.60662777633667,
+ "test_acc": 0.01,
+ "lyapunov": 1.6848897119922102,
+ "grad_norm": 0.6934058402651867,
+ "grad_max_sv": 0.34772998839616776,
+ "grad_min_sv": 1.6804705504564466e-13,
+ "grad_condition": 311062929805.2175,
+ "lr": 0.0009842915805643154,
+ "time_sec": 177.45647644996643
+ },
+ {
+ "epoch": 13,
+ "train_loss": 5.15109172531128,
+ "train_acc": 0.01186,
+ "test_loss": 4.608129429626465,
+ "test_acc": 0.01,
+ "lyapunov": 1.7015191944663788,
+ "grad_norm": 0.6846074227630976,
+ "grad_max_sv": 0.32766890451312064,
+ "grad_min_sv": 2.4578391875654614e-18,
+ "grad_condition": 327668018219.02893,
+ "lr": 0.000981581283398829,
+ "time_sec": 177.36489033699036
+ },
+ {
+ "epoch": 14,
+ "train_loss": 5.2939554736328125,
+ "train_acc": 0.0105,
+ "test_loss": 5.4404556137084965,
+ "test_acc": 0.01,
+ "lyapunov": 1.733636704247321,
+ "grad_norm": 2.0585577176009484,
+ "grad_max_sv": 0.5351610340178012,
+ "grad_min_sv": 6.043698563311623e-09,
+ "grad_condition": 125123088585.82278,
+ "lr": 0.0009786597487660333,
+ "time_sec": 177.41271114349365
+ },
+ {
+ "epoch": 15,
+ "train_loss": 5.339356228485108,
+ "train_acc": 0.01,
+ "test_loss": 5.634622732543946,
+ "test_acc": 0.01,
+ "lyapunov": 1.7321220276605747,
+ "grad_norm": 1.2474576611019448,
+ "grad_max_sv": 0.5749046392738819,
+ "grad_min_sv": 7.0887550281236514e-09,
+ "grad_condition": 17881232094.586456,
+ "lr": 0.0009755282581475766,
+ "time_sec": 177.42803382873535
+ },
+ {
+ "epoch": 16,
+ "train_loss": 5.213154935302734,
+ "train_acc": 0.00934,
+ "test_loss": 5.393290295410156,
+ "test_acc": 0.01,
+ "lyapunov": 1.5737932243615465,
+ "grad_norm": 0.46647750812487915,
+ "grad_max_sv": 0.27153575848788025,
+ "grad_min_sv": 1.5242528473500716e-09,
+ "grad_condition": 77568831402.5238,
+ "lr": 0.0009721881851187403,
+ "time_sec": 177.44743824005127
+ },
+ {
+ "epoch": 17,
+ "train_loss": 5.262427766418457,
+ "train_acc": 0.01022,
+ "test_loss": 4.925324077606201,
+ "test_acc": 0.01,
+ "lyapunov": 1.5760375502164408,
+ "grad_norm": 0.6268713729269668,
+ "grad_max_sv": 0.37553633116185664,
+ "grad_min_sv": 3.283041272093994e-09,
+ "grad_condition": 31488669291.59237,
+ "lr": 0.0009686409947459456,
+ "time_sec": 177.47271943092346
+ },
+ {
+ "epoch": 18,
+ "train_loss": 5.289855928497315,
+ "train_acc": 0.009,
+ "test_loss": 5.166483688354492,
+ "test_acc": 0.01,
+ "lyapunov": 1.5759224303238226,
+ "grad_norm": 0.4193761222715419,
+ "grad_max_sv": 0.26443815175443885,
+ "grad_min_sv": 1.8233460938992724e-09,
+ "grad_condition": 83574980362.08054,
+ "lr": 0.0009648882429441254,
+ "time_sec": 177.47960138320923
+ },
+ {
+ "epoch": 19,
+ "train_loss": 5.3201322650146485,
+ "train_acc": 0.0104,
+ "test_loss": 5.085500339508057,
+ "test_acc": 0.01,
+ "lyapunov": 1.5752660103161316,
+ "grad_norm": 0.35145865174653673,
+ "grad_max_sv": 0.1685528600588441,
+ "grad_min_sv": 5.831233779827688e-12,
+ "grad_condition": 106917248964.36707,
+ "lr": 0.00096093157579425,
+ "time_sec": 177.47897052764893
+ },
+ {
+ "epoch": 20,
+ "train_loss": 5.3543471484375,
+ "train_acc": 0.00944,
+ "test_loss": 5.246659634399414,
+ "test_acc": 0.01,
+ "lyapunov": 1.575355000812989,
+ "grad_norm": 0.5222583225299012,
+ "grad_max_sv": 0.10507027432322502,
+ "grad_min_sv": 7.849948703277934e-12,
+ "grad_condition": 72947428086.86752,
+ "lr": 0.0009567727288213001,
+ "time_sec": 177.43105292320251
+ },
+ {
+ "epoch": 21,
+ "train_loss": 5.354224435882569,
+ "train_acc": 0.00964,
+ "test_loss": 5.22655355682373,
+ "test_acc": 0.01,
+ "lyapunov": 1.577795330520786,
+ "grad_norm": 1.7696193327514464,
+ "grad_max_sv": 0.04788816105574369,
+ "grad_min_sv": 3.098440861051027e-15,
+ "grad_condition": 47515160306.08334,
+ "lr": 0.0009524135262330095,
+ "time_sec": 177.38868117332458
+ },
+ {
+ "epoch": 22,
+ "train_loss": 5.359287767486572,
+ "train_acc": 0.00866,
+ "test_loss": 5.144994302368164,
+ "test_acc": 0.01,
+ "lyapunov": 1.5772388463130083,
+ "grad_norm": 0.521407113480236,
+ "grad_max_sv": 0.16268486455082892,
+ "grad_min_sv": 1.0480323490539272e-12,
+ "grad_condition": 114294670712.50664,
+ "lr": 0.0009478558801197061,
+ "time_sec": 177.4581241607666
+ },
+ {
+ "epoch": 23,
+ "train_loss": 5.359366517028809,
+ "train_acc": 0.00984,
+ "test_loss": 5.14449934387207,
+ "test_acc": 0.01,
+ "lyapunov": 1.5788166193705995,
+ "grad_norm": 0.47520625785430726,
+ "grad_max_sv": 0.14188788905739785,
+ "grad_min_sv": 7.763794243203392e-13,
+ "grad_condition": 90263258979.91963,
+ "lr": 0.000943101789615607,
+ "time_sec": 177.4587037563324
+ },
+ {
+ "epoch": 24,
+ "train_loss": 5.363788315887451,
+ "train_acc": 0.00998,
+ "test_loss": 5.219554689025879,
+ "test_acc": 0.01,
+ "lyapunov": 1.5823031307181434,
+ "grad_norm": 0.45933897983850147,
+ "grad_max_sv": 0.1220944058150053,
+ "grad_min_sv": 8.70957522797587e-13,
+ "grad_condition": 79316477379.01375,
+ "lr": 0.0009381533400219313,
+ "time_sec": 177.45913338661194
+ },
+ {
+ "epoch": 25,
+ "train_loss": 5.365634008026123,
+ "train_acc": 0.0094,
+ "test_loss": 5.931232183074951,
+ "test_acc": 0.01,
+ "lyapunov": 1.5886532437161107,
+ "grad_norm": 0.43344753842757794,
+ "grad_max_sv": 0.017200349643826485,
+ "grad_min_sv": 1.0856606585118899e-15,
+ "grad_condition": 17078915149.903616,
+ "lr": 0.0009330127018922189,
+ "time_sec": 177.41433334350586
+ },
+ {
+ "epoch": 26,
+ "train_loss": 5.356309142761231,
+ "train_acc": 0.00862,
+ "test_loss": 5.939939945220948,
+ "test_acc": 0.01,
+ "lyapunov": 1.5817654276138071,
+ "grad_norm": 0.3773119512884375,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000927682130080253,
+ "time_sec": 177.42445373535156
+ },
+ {
+ "epoch": 27,
+ "train_loss": 5.356818426208496,
+ "train_acc": 0.00902,
+ "test_loss": 6.903866325378418,
+ "test_acc": 0.01,
+ "lyapunov": 1.5823859988576006,
+ "grad_norm": 0.4182139130247132,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0009221639627510072,
+ "time_sec": 177.31799745559692
+ },
+ {
+ "epoch": 28,
+ "train_loss": 5.391271570739746,
+ "train_acc": 0.00976,
+ "test_loss": 5.460548217773438,
+ "test_acc": 0.01,
+ "lyapunov": 1.5841533107220973,
+ "grad_norm": 0.523477636772141,
+ "grad_max_sv": 0.3192333810031414,
+ "grad_min_sv": 2.9275436547182563e-09,
+ "grad_condition": 203519819.7178569,
+ "lr": 0.0009164606203550494,
+ "time_sec": 177.46226978302002
+ },
+ {
+ "epoch": 29,
+ "train_loss": 5.375988426361084,
+ "train_acc": 0.00942,
+ "test_loss": 5.342045057678223,
+ "test_acc": 0.01,
+ "lyapunov": 1.584143414521766,
+ "grad_norm": 0.4275297259535999,
+ "grad_max_sv": 0.29515107311308386,
+ "grad_min_sv": 1.5519966579252698e-09,
+ "grad_condition": 5083754884.994722,
+ "lr": 0.0009105746045668516,
+ "time_sec": 177.49048447608948
+ },
+ {
+ "epoch": 30,
+ "train_loss": 5.3762526119995115,
+ "train_acc": 0.00992,
+ "test_loss": 5.335840890502929,
+ "test_acc": 0.01,
+ "lyapunov": 1.5899017634599104,
+ "grad_norm": 0.46512305667247905,
+ "grad_max_sv": 0.24659424126148224,
+ "grad_min_sv": 2.2743761505509726e-12,
+ "grad_condition": 128688559196.96506,
+ "lr": 0.0009045084971874733,
+ "time_sec": 177.4821593761444
+ },
+ {
+ "epoch": 31,
+ "train_loss": 5.376188383178711,
+ "train_acc": 0.00954,
+ "test_loss": 5.376922852325439,
+ "test_acc": 0.01,
+ "lyapunov": 1.5906847974528437,
+ "grad_norm": 0.40698064884293045,
+ "grad_max_sv": 0.2344340980052948,
+ "grad_min_sv": 1.6077615594515009e-12,
+ "grad_condition": 119697955045.46411,
+ "lr": 0.0008982649590120977,
+ "time_sec": 177.51625323295593
+ },
+ {
+ "epoch": 32,
+ "train_loss": 5.373684441070557,
+ "train_acc": 0.00944,
+ "test_loss": 5.2473334838867185,
+ "test_acc": 0.01,
+ "lyapunov": 1.5879211066019199,
+ "grad_norm": 0.3720940356738668,
+ "grad_max_sv": 0.20825780294835566,
+ "grad_min_sv": 3.7871002154344376e-10,
+ "grad_condition": 69233328517.31859,
+ "lr": 0.0008918467286629196,
+ "time_sec": 177.5158429145813
+ },
+ {
+ "epoch": 33,
+ "train_loss": 5.369580058288574,
+ "train_acc": 0.00906,
+ "test_loss": 5.292366073608399,
+ "test_acc": 0.01,
+ "lyapunov": 1.5872128549439217,
+ "grad_norm": 0.36741579981339867,
+ "grad_max_sv": 0.16275404021143913,
+ "grad_min_sv": 3.5290433862002075e-13,
+ "grad_condition": 135525270524.32925,
+ "lr": 0.0008852566213878943,
+ "time_sec": 177.54218769073486
+ },
+ {
+ "epoch": 34,
+ "train_loss": 5.364965376129151,
+ "train_acc": 0.00946,
+ "test_loss": 5.301969288635254,
+ "test_acc": 0.01,
+ "lyapunov": 1.5879910906867298,
+ "grad_norm": 0.40385833520326136,
+ "grad_max_sv": 0.09459194829687476,
+ "grad_min_sv": 2.8168103316895143e-14,
+ "grad_condition": 90889833007.94754,
+ "lr": 0.000878497527825878,
+ "time_sec": 177.56994581222534
+ },
+ {
+ "epoch": 35,
+ "train_loss": 5.367663076019287,
+ "train_acc": 0.01036,
+ "test_loss": 5.347993537902832,
+ "test_acc": 0.01,
+ "lyapunov": 1.5875165621033105,
+ "grad_norm": 0.3132720633072883,
+ "grad_max_sv": 0.1425728589296341,
+ "grad_min_sv": 2.007235616198558e-14,
+ "grad_condition": 139708753283.34723,
+ "lr": 0.000871572412738697,
+ "time_sec": 177.49852347373962
+ },
+ {
+ "epoch": 36,
+ "train_loss": 5.370810558624267,
+ "train_acc": 0.01022,
+ "test_loss": 5.382797595214844,
+ "test_acc": 0.01,
+ "lyapunov": 1.5899634550294608,
+ "grad_norm": 0.30370352801828593,
+ "grad_max_sv": 0.16092172265052795,
+ "grad_min_sv": 4.485897177730539e-14,
+ "grad_condition": 154470905347.59918,
+ "lr": 0.0008644843137107055,
+ "time_sec": 177.4556074142456
+ },
+ {
+ "epoch": 37,
+ "train_loss": 5.384568545379639,
+ "train_acc": 0.01018,
+ "test_loss": 5.296823876953125,
+ "test_acc": 0.01,
+ "lyapunov": 1.5977905272217967,
+ "grad_norm": 0.266373358722962,
+ "grad_max_sv": 0.14979717023670674,
+ "grad_min_sv": 7.171554109546675e-14,
+ "grad_condition": 140879720678.9068,
+ "lr": 0.0008572363398164014,
+ "time_sec": 177.47119235992432
+ },
+ {
+ "epoch": 38,
+ "train_loss": 5.370039872131348,
+ "train_acc": 0.01028,
+ "test_loss": 5.444481262207031,
+ "test_acc": 0.01,
+ "lyapunov": 1.5899496447399755,
+ "grad_norm": 0.3096876275058644,
+ "grad_max_sv": 0.15369951017200947,
+ "grad_min_sv": 9.48148632228887e-14,
+ "grad_condition": 141735332362.74988,
+ "lr": 0.0008498316702566826,
+ "time_sec": 177.47467923164368
+ },
+ {
+ "epoch": 39,
+ "train_loss": 5.369657610778809,
+ "train_acc": 0.01024,
+ "test_loss": 5.390600685119629,
+ "test_acc": 0.01,
+ "lyapunov": 1.5896801790008155,
+ "grad_norm": 0.3108555116352423,
+ "grad_max_sv": 0.1614890903234482,
+ "grad_min_sv": 9.349701492890973e-14,
+ "grad_condition": 149566173130.64127,
+ "lr": 0.0008422735529643442,
+ "time_sec": 177.4328293800354
+ },
+ {
+ "epoch": 40,
+ "train_loss": 5.3822917242431645,
+ "train_acc": 0.0093,
+ "test_loss": 5.184299499511718,
+ "test_acc": 0.01,
+ "lyapunov": 1.6002484066102205,
+ "grad_norm": 0.24882538015615607,
+ "grad_max_sv": 0.04936090065166354,
+ "grad_min_sv": 6.934642584876431e-15,
+ "grad_condition": 48367763332.42686,
+ "lr": 0.0008345653031794289,
+ "time_sec": 177.37197065353394
+ },
+ {
+ "epoch": 41,
+ "train_loss": 5.373546744842529,
+ "train_acc": 0.00964,
+ "test_loss": 5.196872940063477,
+ "test_acc": 0.01,
+ "lyapunov": 1.5940455433047946,
+ "grad_norm": 0.2191391775580976,
+ "grad_max_sv": 0.09365939311683177,
+ "grad_min_sv": 1.5882716898553207e-15,
+ "grad_condition": 93493384840.27858,
+ "lr": 0.0008267103019950526,
+ "time_sec": 177.47450184822083
+ },
+ {
+ "epoch": 42,
+ "train_loss": 5.368149404144287,
+ "train_acc": 0.00874,
+ "test_loss": 5.14538009185791,
+ "test_acc": 0.01,
+ "lyapunov": 1.590694589383157,
+ "grad_norm": 0.22212098932442453,
+ "grad_max_sv": 0.10206865929067135,
+ "grad_min_sv": 2.3133067448522557e-15,
+ "grad_condition": 101840784421.61417,
+ "lr": 0.0008187119948743447,
+ "time_sec": 177.46074080467224
+ },
+ {
+ "epoch": 43,
+ "train_loss": 5.367429432983398,
+ "train_acc": 0.00892,
+ "test_loss": 5.233426832580567,
+ "test_acc": 0.01,
+ "lyapunov": 1.591343494327477,
+ "grad_norm": 0.23543493742380756,
+ "grad_max_sv": 0.08834987077862025,
+ "grad_min_sv": 5.952270134521069e-16,
+ "grad_condition": 88299394994.77124,
+ "lr": 0.000810573890139155,
+ "time_sec": 177.47843408584595
+ },
+ {
+ "epoch": 44,
+ "train_loss": 5.3674171057128905,
+ "train_acc": 0.00878,
+ "test_loss": 5.2093109710693355,
+ "test_acc": 0.01,
+ "lyapunov": 1.5915821013243303,
+ "grad_norm": 0.1990598758819041,
+ "grad_max_sv": 0.07391932224854827,
+ "grad_min_sv": 4.4595190727564784e-24,
+ "grad_condition": 73919322248.21725,
+ "lr": 0.0008022995574311873,
+ "time_sec": 177.49818992614746
+ },
+ {
+ "epoch": 45,
+ "train_loss": 5.367794494018555,
+ "train_acc": 0.00928,
+ "test_loss": 5.287538707733154,
+ "test_acc": 0.01,
+ "lyapunov": 1.5911102807125472,
+ "grad_norm": 0.23659112992785783,
+ "grad_max_sv": 0.0903646806254983,
+ "grad_min_sv": 2.044203469301876e-16,
+ "grad_condition": 90346621799.15851,
+ "lr": 0.0007938926261462363,
+ "time_sec": 177.41696000099182
+ },
+ {
+ "epoch": 46,
+ "train_loss": 5.376998851623535,
+ "train_acc": 0.00968,
+ "test_loss": 5.387116500854492,
+ "test_acc": 0.01,
+ "lyapunov": 1.5990899456736376,
+ "grad_norm": 0.2197692685737557,
+ "grad_max_sv": 0.09713525734841824,
+ "grad_min_sv": 1.4019481757585365e-15,
+ "grad_condition": 96996163686.28548,
+ "lr": 0.0007853567838422158,
+ "time_sec": 177.49049758911133
+ },
+ {
+ "epoch": 47,
+ "train_loss": 5.367403378448486,
+ "train_acc": 0.00904,
+ "test_loss": 5.152558483886719,
+ "test_acc": 0.01,
+ "lyapunov": 1.5909755915936912,
+ "grad_norm": 0.20354351323110018,
+ "grad_max_sv": 0.09671832993626595,
+ "grad_min_sv": 1.7095434307863795e-15,
+ "grad_condition": 96550067706.91704,
+ "lr": 0.0007766957746216719,
+ "time_sec": 177.440682888031
+ },
+ {
+ "epoch": 48,
+ "train_loss": 5.3691537622070316,
+ "train_acc": 0.009,
+ "test_loss": 5.103178468322754,
+ "test_acc": 0.01,
+ "lyapunov": 1.5926780014696633,
+ "grad_norm": 0.20080565969562386,
+ "grad_max_sv": 0.09486224502325058,
+ "grad_min_sv": 1.5909231309062707e-15,
+ "grad_condition": 94698098961.85327,
+ "lr": 0.0007679133974894982,
+ "time_sec": 177.45987153053284
+ },
+ {
+ "epoch": 49,
+ "train_loss": 5.367714106140137,
+ "train_acc": 0.0093,
+ "test_loss": 5.090968506622314,
+ "test_acc": 0.01,
+ "lyapunov": 1.5918231150683235,
+ "grad_norm": 0.21785142639292177,
+ "grad_max_sv": 0.08113837614655495,
+ "grad_min_sv": 1.754494669434441e-20,
+ "grad_condition": 81138374637.8342,
+ "lr": 0.000759013504686565,
+ "time_sec": 177.4056305885315
+ },
+ {
+ "epoch": 50,
+ "train_loss": 5.370782024841309,
+ "train_acc": 0.00932,
+ "test_loss": 5.1753190261840825,
+ "test_acc": 0.01,
+ "lyapunov": 1.5940865891059037,
+ "grad_norm": 0.20444563688390227,
+ "grad_max_sv": 0.07656172616407275,
+ "grad_min_sv": 2.696277782642207e-17,
+ "grad_condition": 76559876296.83813,
+ "lr": 0.0007499999999999998,
+ "time_sec": 177.39811301231384
+ },
+ {
+ "epoch": 51,
+ "train_loss": 5.368595368652343,
+ "train_acc": 0.0093,
+ "test_loss": 5.130212609863281,
+ "test_acc": 0.01,
+ "lyapunov": 1.5924014548206573,
+ "grad_norm": 0.2110899983642968,
+ "grad_max_sv": 0.09537852350622415,
+ "grad_min_sv": 2.1267942984928308e-15,
+ "grad_condition": 95172191574.00798,
+ "lr": 0.0007408768370508575,
+ "time_sec": 177.437908411026
+ },
+ {
+ "epoch": 52,
+ "train_loss": 5.368308511657715,
+ "train_acc": 0.0095,
+ "test_loss": 5.122430040740967,
+ "test_acc": 0.01,
+ "lyapunov": 1.5921837594503028,
+ "grad_norm": 0.22274269152603762,
+ "grad_max_sv": 0.09443439822643995,
+ "grad_min_sv": 1.7298829634439422e-15,
+ "grad_condition": 94273467470.68217,
+ "lr": 0.0007316480175599307,
+ "time_sec": 177.40578150749207
+ },
+ {
+ "epoch": 53,
+ "train_loss": 5.369929014434814,
+ "train_acc": 0.01008,
+ "test_loss": 5.085774603271484,
+ "test_acc": 0.01,
+ "lyapunov": 1.5937723787239446,
+ "grad_norm": 0.20295993227713832,
+ "grad_max_sv": 0.09454309139400721,
+ "grad_min_sv": 6.450947046344728e-16,
+ "grad_condition": 94479862712.68396,
+ "lr": 0.0007223175895924635,
+ "time_sec": 177.40152430534363
+ },
+ {
+ "epoch": 54,
+ "train_loss": 5.373923838806152,
+ "train_acc": 0.00952,
+ "test_loss": 5.077367216491699,
+ "test_acc": 0.01,
+ "lyapunov": 1.5964158435002007,
+ "grad_norm": 0.2154712788436217,
+ "grad_max_sv": 0.09458265658468008,
+ "grad_min_sv": 2.433638441241118e-15,
+ "grad_condition": 94352900611.06958,
+ "lr": 0.0007128896457825361,
+ "time_sec": 177.4158182144165
+ },
+ {
+ "epoch": 55,
+ "train_loss": 5.367228227386475,
+ "train_acc": 0.01046,
+ "test_loss": 5.130655932617188,
+ "test_acc": 0.01,
+ "lyapunov": 1.5918423345936534,
+ "grad_norm": 0.21491158085488357,
+ "grad_max_sv": 0.07526904288679362,
+ "grad_min_sv": 2.528540900743907e-16,
+ "grad_condition": 75246607455.27087,
+ "lr": 0.0007033683215378998,
+ "time_sec": 177.39575290679932
+ },
+ {
+ "epoch": 56,
+ "train_loss": 5.367513545684814,
+ "train_acc": 0.00982,
+ "test_loss": 5.064245509338379,
+ "test_acc": 0.01,
+ "lyapunov": 1.5908652431214862,
+ "grad_norm": 0.20945675875630285,
+ "grad_max_sv": 0.07764090299606323,
+ "grad_min_sv": 1.3979459340183045e-15,
+ "grad_condition": 77513163313.73227,
+ "lr": 0.0006937577932260512,
+ "time_sec": 177.41370344161987
+ },
+ {
+ "epoch": 57,
+ "train_loss": 5.378045714263916,
+ "train_acc": 0.0097,
+ "test_loss": 5.010745031738281,
+ "test_acc": 0.01,
+ "lyapunov": 1.5985675842865654,
+ "grad_norm": 0.21081504402843954,
+ "grad_max_sv": 0.08188115861266851,
+ "grad_min_sv": 5.212303423583328e-17,
+ "grad_condition": 81876236542.23714,
+ "lr": 0.0006840622763423388,
+ "time_sec": 177.4101119041443
+ },
+ {
+ "epoch": 58,
+ "train_loss": 5.369592454376221,
+ "train_acc": 0.00954,
+ "test_loss": 5.001489561462402,
+ "test_acc": 0.01,
+ "lyapunov": 1.594169369743913,
+ "grad_norm": 0.22207129747707732,
+ "grad_max_sv": 0.06061144880950451,
+ "grad_min_sv": 8.52425895192004e-34,
+ "grad_condition": 60611448809.5045,
+ "lr": 0.0006742860236609073,
+ "time_sec": 177.40956783294678
+ },
+ {
+ "epoch": 59,
+ "train_loss": 5.369317971343994,
+ "train_acc": 0.00942,
+ "test_loss": 5.000968522644043,
+ "test_acc": 0.01,
+ "lyapunov": 1.593946976429971,
+ "grad_norm": 0.21723304995593648,
+ "grad_max_sv": 0.06631144480779767,
+ "grad_min_sv": 5.644079889684282e-43,
+ "grad_condition": 66311444807.79767,
+ "lr": 0.0006644333233692913,
+ "time_sec": 177.41563248634338
+ },
+ {
+ "epoch": 60,
+ "train_loss": 5.367086203613281,
+ "train_acc": 0.00986,
+ "test_loss": 4.980809173583984,
+ "test_acc": 0.01,
+ "lyapunov": 1.5923281987304883,
+ "grad_norm": 0.22232157475356287,
+ "grad_max_sv": 0.05571612091735005,
+ "grad_min_sv": 0.0,
+ "grad_condition": 55716120917.35005,
+ "lr": 0.0006545084971874734,
+ "time_sec": 177.36889171600342
+ },
+ {
+ "epoch": 61,
+ "train_loss": 5.372129827270508,
+ "train_acc": 0.00924,
+ "test_loss": 5.0162686882019045,
+ "test_acc": 0.01,
+ "lyapunov": 1.5957943103502474,
+ "grad_norm": 0.2315139450623546,
+ "grad_max_sv": 0.05857418505474925,
+ "grad_min_sv": 3.503246160812043e-47,
+ "grad_condition": 58574185054.74925,
+ "lr": 0.0006445158984722354,
+ "time_sec": 177.3955101966858
+ },
+ {
+ "epoch": 62,
+ "train_loss": 5.376675976257324,
+ "train_acc": 0.01028,
+ "test_loss": 4.951765003204346,
+ "test_acc": 0.01,
+ "lyapunov": 1.5998592873668427,
+ "grad_norm": 0.23053009469996935,
+ "grad_max_sv": 0.049639166425913574,
+ "grad_min_sv": 3.503246160812043e-47,
+ "grad_condition": 49639166425.913574,
+ "lr": 0.0006344599103076324,
+ "time_sec": 177.38628578186035
+ },
+ {
+ "epoch": 63,
+ "train_loss": 5.3675309051513675,
+ "train_acc": 0.00898,
+ "test_loss": 4.976654839324951,
+ "test_acc": 0.01,
+ "lyapunov": 1.59307188481626,
+ "grad_norm": 0.247010688591046,
+ "grad_max_sv": 0.04920805087313056,
+ "grad_min_sv": 0.0,
+ "grad_condition": 49208050873.13057,
+ "lr": 0.0006243449435824269,
+ "time_sec": 177.40613865852356
+ },
+ {
+ "epoch": 64,
+ "train_loss": 5.367255066528321,
+ "train_acc": 0.0097,
+ "test_loss": 5.067697259521484,
+ "test_acc": 0.01,
+ "lyapunov": 1.5924071750372573,
+ "grad_norm": 0.2341571351131304,
+ "grad_max_sv": 0.05343637596815824,
+ "grad_min_sv": 0.0,
+ "grad_condition": 53436375968.15825,
+ "lr": 0.0006141754350553275,
+ "time_sec": 177.3703956604004
+ },
+ {
+ "epoch": 65,
+ "train_loss": 5.367540504302979,
+ "train_acc": 0.00908,
+ "test_loss": 4.9729307174682615,
+ "test_acc": 0.01,
+ "lyapunov": 1.5929816647258865,
+ "grad_norm": 0.23218078781210785,
+ "grad_max_sv": 0.05375193590298295,
+ "grad_min_sv": 0.0,
+ "grad_condition": 53751935902.98295,
+ "lr": 0.0006039558454088793,
+ "time_sec": 177.38945150375366
+ },
+ {
+ "epoch": 66,
+ "train_loss": 5.366137564239502,
+ "train_acc": 0.00936,
+ "test_loss": 4.934913189697266,
+ "test_acc": 0.01,
+ "lyapunov": 1.5917930770713045,
+ "grad_norm": 0.21702876886168843,
+ "grad_max_sv": 0.04379821689799428,
+ "grad_min_sv": 0.0,
+ "grad_condition": 43798216897.99428,
+ "lr": 0.000593690657292862,
+ "time_sec": 177.4724154472351
+ },
+ {
+ "epoch": 67,
+ "train_loss": 5.370335599822998,
+ "train_acc": 0.00978,
+ "test_loss": 4.938832836914062,
+ "test_acc": 0.01,
+ "lyapunov": 1.5958915979356108,
+ "grad_norm": 0.26747204938928953,
+ "grad_max_sv": 0.038104135124012825,
+ "grad_min_sv": 0.0,
+ "grad_condition": 38104135124.01283,
+ "lr": 0.0005833843733580507,
+ "time_sec": 177.42428302764893
+ },
+ {
+ "epoch": 68,
+ "train_loss": 5.367096372375488,
+ "train_acc": 0.00948,
+ "test_loss": 4.961852867126465,
+ "test_acc": 0.01,
+ "lyapunov": 1.5927841407258798,
+ "grad_norm": 0.24628304430345999,
+ "grad_max_sv": 0.037431048322469,
+ "grad_min_sv": 0.0,
+ "grad_condition": 37431048322.468994,
+ "lr": 0.0005730415142812054,
+ "time_sec": 177.35656356811523
+ },
+ {
+ "epoch": 69,
+ "train_loss": 5.367298457641602,
+ "train_acc": 0.00942,
+ "test_loss": 4.985350135040283,
+ "test_acc": 0.01,
+ "lyapunov": 1.5926642820353398,
+ "grad_norm": 0.26713274620852084,
+ "grad_max_sv": 0.0558107316493988,
+ "grad_min_sv": 0.0,
+ "grad_condition": 55810731649.3988,
+ "lr": 0.0005626666167821517,
+ "time_sec": 177.404226064682
+ },
+ {
+ "epoch": 70,
+ "train_loss": 5.370034771118164,
+ "train_acc": 0.01,
+ "test_loss": 4.9722988952636715,
+ "test_acc": 0.01,
+ "lyapunov": 1.5953361000246404,
+ "grad_norm": 0.2772668383220675,
+ "grad_max_sv": 0.059619830828160046,
+ "grad_min_sv": 0.0,
+ "grad_condition": 59619830828.16006,
+ "lr": 0.0005522642316338265,
+ "time_sec": 177.41033554077148
+ },
+ {
+ "epoch": 71,
+ "train_loss": 5.3663228466796875,
+ "train_acc": 0.0097,
+ "test_loss": 4.996751819610596,
+ "test_acc": 0.01,
+ "lyapunov": 1.592004930881588,
+ "grad_norm": 0.27122147817442865,
+ "grad_max_sv": 0.051365063060075045,
+ "grad_min_sv": 0.0,
+ "grad_condition": 51365063060.07505,
+ "lr": 0.0005418389216661573,
+ "time_sec": 177.41588258743286
+ },
+ {
+ "epoch": 72,
+ "train_loss": 5.3688113453674315,
+ "train_acc": 0.00906,
+ "test_loss": 4.95511130065918,
+ "test_acc": 0.01,
+ "lyapunov": 1.5943079513052236,
+ "grad_norm": 0.2940023518744728,
+ "grad_max_sv": 0.043863069359213115,
+ "grad_min_sv": 0.0,
+ "grad_condition": 43863069359.21311,
+ "lr": 0.0005313952597646563,
+ "time_sec": 177.4312937259674
+ },
+ {
+ "epoch": 73,
+ "train_loss": 5.369862328338623,
+ "train_acc": 0.00916,
+ "test_loss": 4.928821298217773,
+ "test_acc": 0.01,
+ "lyapunov": 1.5948649678388824,
+ "grad_norm": 0.337053679491892,
+ "grad_max_sv": 0.03650999316014349,
+ "grad_min_sv": 0.0,
+ "grad_condition": 36509993160.14349,
+ "lr": 0.0005209378268645994,
+ "time_sec": 177.47835731506348
+ },
+ {
+ "epoch": 74,
+ "train_loss": 5.366141536560058,
+ "train_acc": 0.00956,
+ "test_loss": 4.951869967651367,
+ "test_acc": 0.01,
+ "lyapunov": 1.591574984133396,
+ "grad_norm": 0.34688609459259695,
+ "grad_max_sv": 0.0532405337318778,
+ "grad_min_sv": 0.0,
+ "grad_condition": 53240533731.87779,
+ "lr": 0.0005104712099416781,
+ "time_sec": 177.39541888237
+ },
+ {
+ "epoch": 75,
+ "train_loss": 5.3659246875,
+ "train_acc": 0.00862,
+ "test_loss": 4.96804543762207,
+ "test_acc": 0.01,
+ "lyapunov": 1.5917583252767773,
+ "grad_norm": 0.49942333201069317,
+ "grad_max_sv": 0.04099391270428896,
+ "grad_min_sv": 0.0,
+ "grad_condition": 40993912704.288956,
+ "lr": 0.0004999999999999996,
+ "time_sec": 177.3808958530426
+ },
+ {
+ "epoch": 76,
+ "train_loss": 5.3697430253601075,
+ "train_acc": 0.00932,
+ "test_loss": 4.843025128173828,
+ "test_acc": 0.01,
+ "lyapunov": 1.5954608170272748,
+ "grad_norm": 0.5592194591464297,
+ "grad_max_sv": 0.03530313139781356,
+ "grad_min_sv": 0.0,
+ "grad_condition": 35303131397.81356,
+ "lr": 0.0004895287900583212,
+ "time_sec": 177.36198616027832
+ },
+ {
+ "epoch": 77,
+ "train_loss": 5.369125059814453,
+ "train_acc": 0.00908,
+ "test_loss": 4.996518075561523,
+ "test_acc": 0.01,
+ "lyapunov": 1.5947885577331113,
+ "grad_norm": 0.5290088024656862,
+ "grad_max_sv": 0.017188509553670885,
+ "grad_min_sv": 0.0,
+ "grad_condition": 17188509553.670883,
+ "lr": 0.0004790621731353997,
+ "time_sec": 177.27709126472473
+ },
+ {
+ "epoch": 78,
+ "train_loss": 5.368183317260742,
+ "train_acc": 0.01024,
+ "test_loss": 4.973466501617431,
+ "test_acc": 0.01,
+ "lyapunov": 1.5941324002297639,
+ "grad_norm": 0.6809743973398079,
+ "grad_max_sv": 0.029488482885062693,
+ "grad_min_sv": 0.0,
+ "grad_condition": 29488482885.062695,
+ "lr": 0.000468604740235343,
+ "time_sec": 177.3189423084259
+ },
+ {
+ "epoch": 79,
+ "train_loss": 5.367250970458985,
+ "train_acc": 0.00956,
+ "test_loss": 4.950716239929199,
+ "test_acc": 0.01,
+ "lyapunov": 1.5930783117518705,
+ "grad_norm": 1.411636125689672,
+ "grad_max_sv": 0.031192977959290148,
+ "grad_min_sv": 0.0,
+ "grad_condition": 31192977959.29015,
+ "lr": 0.00045816107833384175,
+ "time_sec": 177.3485884666443
+ },
+ {
+ "epoch": 80,
+ "train_loss": 5.366609226837158,
+ "train_acc": 0.01002,
+ "test_loss": 4.952863761901855,
+ "test_acc": 0.01,
+ "lyapunov": 1.5922869257914745,
+ "grad_norm": 1.0613102889069541,
+ "grad_max_sv": 0.042383548151701686,
+ "grad_min_sv": 0.0,
+ "grad_condition": 42383548151.70168,
+ "lr": 0.0004477357683661729,
+ "time_sec": 177.41135001182556
+ },
+ {
+ "epoch": 81,
+ "train_loss": 5.367390147705078,
+ "train_acc": 0.00896,
+ "test_loss": 4.965977513885498,
+ "test_acc": 0.01,
+ "lyapunov": 1.5931403121679946,
+ "grad_norm": 1.113579115473781,
+ "grad_max_sv": 0.039911494683474304,
+ "grad_min_sv": 0.0,
+ "grad_condition": 39911494683.474304,
+ "lr": 0.00043733338321784746,
+ "time_sec": 177.3696448802948
+ },
+ {
+ "epoch": 82,
+ "train_loss": 5.374857454833984,
+ "train_acc": 0.0098,
+ "test_loss": 4.912637939453125,
+ "test_acc": 0.01,
+ "lyapunov": 1.5992167480766315,
+ "grad_norm": 1.3681227141701577,
+ "grad_max_sv": 0.032051424495875835,
+ "grad_min_sv": 0.0,
+ "grad_condition": 32051424495.875835,
+ "lr": 0.0004269584857187939,
+ "time_sec": 177.33939170837402
+ },
+ {
+ "epoch": 83,
+ "train_loss": 5.365830071716308,
+ "train_acc": 0.01,
+ "test_loss": 4.93360542678833,
+ "test_acc": 0.01,
+ "lyapunov": 1.5919503589420367,
+ "grad_norm": 1.2908239754732598,
+ "grad_max_sv": 0.018338044127449393,
+ "grad_min_sv": 0.0,
+ "grad_condition": 18338044127.449394,
+ "lr": 0.0004166156266419484,
+ "time_sec": 177.30572271347046
+ },
+ {
+ "epoch": 84,
+ "train_loss": 5.369314513549805,
+ "train_acc": 0.01032,
+ "test_loss": 4.962402893066407,
+ "test_acc": 0.01,
+ "lyapunov": 1.5951606830977418,
+ "grad_norm": 1.2430323961128404,
+ "grad_max_sv": 0.014490698464214802,
+ "grad_min_sv": 0.0,
+ "grad_condition": 14490698464.214802,
+ "lr": 0.0004063093427071373,
+ "time_sec": 177.2841637134552
+ },
+ {
+ "epoch": 85,
+ "train_loss": 5.377282650604248,
+ "train_acc": 0.00908,
+ "test_loss": 4.969677833557129,
+ "test_acc": 0.01,
+ "lyapunov": 1.5993056263765106,
+ "grad_norm": 1.0935450948855057,
+ "grad_max_sv": 0.03076445385813713,
+ "grad_min_sv": 0.0,
+ "grad_condition": 30764453858.137135,
+ "lr": 0.0003960441545911199,
+ "time_sec": 177.35037755966187
+ },
+ {
+ "epoch": 86,
+ "train_loss": 5.365991982879638,
+ "train_acc": 0.00934,
+ "test_loss": 4.960339687347412,
+ "test_acc": 0.01,
+ "lyapunov": 1.591959211527539,
+ "grad_norm": 1.0249256686134756,
+ "grad_max_sv": 0.03798610083758831,
+ "grad_min_sv": 0.0,
+ "grad_condition": 37986100837.5883,
+ "lr": 0.0003858245649446718,
+ "time_sec": 177.35586881637573
+ },
+ {
+ "epoch": 87,
+ "train_loss": 5.36631558807373,
+ "train_acc": 0.00936,
+ "test_loss": 4.948922778320313,
+ "test_acc": 0.01,
+ "lyapunov": 1.5924714169538845,
+ "grad_norm": 0.8096413328413968,
+ "grad_max_sv": 0.033394893538206814,
+ "grad_min_sv": 0.0,
+ "grad_condition": 33394893538.206818,
+ "lr": 0.00037565505641757235,
+ "time_sec": 177.3941514492035
+ },
+ {
+ "epoch": 88,
+ "train_loss": 5.372631300354004,
+ "train_acc": 0.01006,
+ "test_loss": 4.890858795166015,
+ "test_acc": 0.01,
+ "lyapunov": 1.5971073076853057,
+ "grad_norm": 0.3735195103580093,
+ "grad_max_sv": 0.02607831247150898,
+ "grad_min_sv": 0.0,
+ "grad_condition": 26078312471.50898,
+ "lr": 0.00036554008969236695,
+ "time_sec": 177.28741931915283
+ },
+ {
+ "epoch": 89,
+ "train_loss": 5.367757025299072,
+ "train_acc": 0.0093,
+ "test_loss": 4.9563854202270505,
+ "test_acc": 0.01,
+ "lyapunov": 1.593846448242207,
+ "grad_norm": 0.4162028440796633,
+ "grad_max_sv": 0.030028719501569868,
+ "grad_min_sv": 0.0,
+ "grad_condition": 30028719501.569862,
+ "lr": 0.0003554841015277638,
+ "time_sec": 177.30004262924194
+ },
+ {
+ "epoch": 90,
+ "train_loss": 5.369390062561036,
+ "train_acc": 0.01028,
+ "test_loss": 4.903431629943848,
+ "test_acc": 0.01,
+ "lyapunov": 1.5944386360895297,
+ "grad_norm": 0.45537462137938906,
+ "grad_max_sv": 0.03309078188613057,
+ "grad_min_sv": 0.0,
+ "grad_condition": 33090781886.130573,
+ "lr": 0.000345491502812526,
+ "time_sec": 177.33181858062744
+ },
+ {
+ "epoch": 91,
+ "train_loss": 5.36617555480957,
+ "train_acc": 0.0097,
+ "test_loss": 4.973295672607422,
+ "test_acc": 0.01,
+ "lyapunov": 1.5924281744700868,
+ "grad_norm": 0.42959416759344066,
+ "grad_max_sv": 0.02529722950421274,
+ "grad_min_sv": 0.0,
+ "grad_condition": 25297229504.212738,
+ "lr": 0.0003355666766307081,
+ "time_sec": 177.29152536392212
+ },
+ {
+ "epoch": 92,
+ "train_loss": 5.3661282931518555,
+ "train_acc": 0.0106,
+ "test_loss": 4.874008221435547,
+ "test_acc": 0.01,
+ "lyapunov": 1.5923549528317074,
+ "grad_norm": 0.4739333324657675,
+ "grad_max_sv": 0.027486719330772756,
+ "grad_min_sv": 0.0,
+ "grad_condition": 27486719330.77276,
+ "lr": 0.00032571397633909225,
+ "time_sec": 177.3095293045044
+ },
+ {
+ "epoch": 93,
+ "train_loss": 5.36726612121582,
+ "train_acc": 0.00952,
+ "test_loss": 4.844555052947998,
+ "test_acc": 0.01,
+ "lyapunov": 1.5933535443547437,
+ "grad_norm": 0.4489090651028355,
+ "grad_max_sv": 0.027935726940631865,
+ "grad_min_sv": 0.0,
+ "grad_condition": 27935726940.631866,
+ "lr": 0.00031593772365766094,
+ "time_sec": 177.29880285263062
+ },
+ {
+ "epoch": 94,
+ "train_loss": 5.367507637634278,
+ "train_acc": 0.00938,
+ "test_loss": 4.85123999710083,
+ "test_acc": 0.01,
+ "lyapunov": 1.593514009509855,
+ "grad_norm": 0.49488308768779743,
+ "grad_max_sv": 0.03786678058095276,
+ "grad_min_sv": 0.0,
+ "grad_condition": 37866780580.95277,
+ "lr": 0.0003062422067739483,
+ "time_sec": 177.66627550125122
+ },
+ {
+ "epoch": 95,
+ "train_loss": 5.367161036987305,
+ "train_acc": 0.01,
+ "test_loss": 4.919075784301758,
+ "test_acc": 0.01,
+ "lyapunov": 1.593309577468716,
+ "grad_norm": 0.49632556697910357,
+ "grad_max_sv": 0.03764305226504803,
+ "grad_min_sv": 0.0,
+ "grad_condition": 37643052265.04803,
+ "lr": 0.00029663167846209965,
+ "time_sec": 177.35125970840454
+ },
+ {
+ "epoch": 96,
+ "train_loss": 5.368773625488282,
+ "train_acc": 0.00952,
+ "test_loss": 4.886889329528809,
+ "test_acc": 0.01,
+ "lyapunov": 1.5946083480439832,
+ "grad_norm": 0.5634579068593676,
+ "grad_max_sv": 0.033481535781174895,
+ "grad_min_sv": 0.0,
+ "grad_condition": 33481535781.174904,
+ "lr": 0.00028711035421746345,
+ "time_sec": 177.33729600906372
+ },
+ {
+ "epoch": 97,
+ "train_loss": 5.373278410797119,
+ "train_acc": 0.0092,
+ "test_loss": 4.919860540771484,
+ "test_acc": 0.01,
+ "lyapunov": 1.5970366150521866,
+ "grad_norm": 0.5241288299265501,
+ "grad_max_sv": 0.02991771958768368,
+ "grad_min_sv": 0.0,
+ "grad_condition": 29917719587.683678,
+ "lr": 0.00027768241040753615,
+ "time_sec": 177.3373203277588
+ },
+ {
+ "epoch": 98,
+ "train_loss": 5.367487851867676,
+ "train_acc": 0.00984,
+ "test_loss": 4.922154154968262,
+ "test_acc": 0.01,
+ "lyapunov": 1.5938531629874577,
+ "grad_norm": 0.6102489153602656,
+ "grad_max_sv": 0.02815253552980721,
+ "grad_min_sv": 0.0,
+ "grad_condition": 28152535529.807213,
+ "lr": 0.00026835198244006903,
+ "time_sec": 177.35172653198242
+ },
+ {
+ "epoch": 99,
+ "train_loss": 5.367893275756836,
+ "train_acc": 0.01038,
+ "test_loss": 4.930574498748779,
+ "test_acc": 0.01,
+ "lyapunov": 1.593941973908173,
+ "grad_norm": 0.5921377439478998,
+ "grad_max_sv": 0.03409935408271849,
+ "grad_min_sv": 0.0,
+ "grad_condition": 34099354082.718487,
+ "lr": 0.0002591231629491421,
+ "time_sec": 177.36736416816711
+ },
+ {
+ "epoch": 100,
+ "train_loss": 5.372079080200195,
+ "train_acc": 0.01062,
+ "test_loss": 4.915191829681397,
+ "test_acc": 0.01,
+ "lyapunov": 1.596833938832783,
+ "grad_norm": 0.5930918441111938,
+ "grad_max_sv": 0.033569992519915104,
+ "grad_min_sv": 0.0,
+ "grad_condition": 33569992519.915108,
+ "lr": 0.0002499999999999997,
+ "time_sec": 177.3853051662445
+ },
+ {
+ "epoch": 101,
+ "train_loss": 5.365807982940674,
+ "train_acc": 0.00976,
+ "test_loss": 4.926369466400146,
+ "test_acc": 0.01,
+ "lyapunov": 1.5920866029646696,
+ "grad_norm": 1.2269794373451623,
+ "grad_max_sv": 0.03278505662456155,
+ "grad_min_sv": 0.0,
+ "grad_condition": 32785056624.561546,
+ "lr": 0.00024098649531343477,
+ "time_sec": 177.41039776802063
+ },
+ {
+ "epoch": 102,
+ "train_loss": 5.3670011302185054,
+ "train_acc": 0.00968,
+ "test_loss": 5.182023647308349,
+ "test_acc": 0.01,
+ "lyapunov": 1.5932530469601722,
+ "grad_norm": 0.5812477341116522,
+ "grad_max_sv": 0.03314556856639683,
+ "grad_min_sv": 0.0,
+ "grad_condition": 33145568566.39683,
+ "lr": 0.0002320866025105016,
+ "time_sec": 177.37316060066223
+ },
+ {
+ "epoch": 103,
+ "train_loss": 5.371551856231689,
+ "train_acc": 0.01004,
+ "test_loss": 4.899476731109619,
+ "test_acc": 0.01,
+ "lyapunov": 1.5966654973261802,
+ "grad_norm": 0.610767105839377,
+ "grad_max_sv": 0.02582362242974341,
+ "grad_min_sv": 0.0,
+ "grad_condition": 25823622429.74341,
+ "lr": 0.0002233042253783278,
+ "time_sec": 177.36590600013733
+ },
+ {
+ "epoch": 104,
+ "train_loss": 5.368561768646241,
+ "train_acc": 0.00946,
+ "test_loss": 4.930848654174805,
+ "test_acc": 0.01,
+ "lyapunov": 1.5947173150908915,
+ "grad_norm": 0.6422628015235555,
+ "grad_max_sv": 0.025343496771529316,
+ "grad_min_sv": 0.0,
+ "grad_condition": 25343496771.529316,
+ "lr": 0.000214643216157784,
+ "time_sec": 177.3882737159729
+ },
+ {
+ "epoch": 105,
+ "train_loss": 5.36991615814209,
+ "train_acc": 0.0091,
+ "test_loss": 4.899362311553955,
+ "test_acc": 0.01,
+ "lyapunov": 1.5956382519753693,
+ "grad_norm": 0.5876379942472394,
+ "grad_max_sv": 0.02119842660613358,
+ "grad_min_sv": 0.0,
+ "grad_condition": 21198426606.133583,
+ "lr": 0.00020610737385376332,
+ "time_sec": 177.41758513450623
+ },
+ {
+ "epoch": 106,
+ "train_loss": 5.366515799407959,
+ "train_acc": 0.01026,
+ "test_loss": 4.887499784851074,
+ "test_acc": 0.01,
+ "lyapunov": 1.592897226743381,
+ "grad_norm": 0.6201818264513558,
+ "grad_max_sv": 0.0033281870651990174,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3328187065.1990175,
+ "lr": 0.00019770044256881242,
+ "time_sec": 177.3366186618805
+ },
+ {
+ "epoch": 107,
+ "train_loss": 5.368152584533691,
+ "train_acc": 0.00916,
+ "test_loss": 4.894157613372803,
+ "test_acc": 0.01,
+ "lyapunov": 1.5942484835529571,
+ "grad_norm": 0.7280576803690416,
+ "grad_max_sv": 0.027869051974266767,
+ "grad_min_sv": 0.0,
+ "grad_condition": 27869051974.266766,
+ "lr": 0.0001894261098608447,
+ "time_sec": 177.37792563438416
+ },
+ {
+ "epoch": 108,
+ "train_loss": 5.3665059283447265,
+ "train_acc": 0.00976,
+ "test_loss": 4.915471728515625,
+ "test_acc": 0.01,
+ "lyapunov": 1.592840023662733,
+ "grad_norm": 0.7424554492649038,
+ "grad_max_sv": 0.026440556207671762,
+ "grad_min_sv": 0.0,
+ "grad_condition": 26440556207.67176,
+ "lr": 0.000181288005125655,
+ "time_sec": 177.35853958129883
+ },
+ {
+ "epoch": 109,
+ "train_loss": 5.376394969329834,
+ "train_acc": 0.01022,
+ "test_loss": 4.922409371948242,
+ "test_acc": 0.01,
+ "lyapunov": 1.6003244386609559,
+ "grad_norm": 0.8040426103005965,
+ "grad_max_sv": 0.024923838768154384,
+ "grad_min_sv": 0.0,
+ "grad_condition": 24923838768.15438,
+ "lr": 0.0001732896980049473,
+ "time_sec": 177.31202268600464
+ },
+ {
+ "epoch": 110,
+ "train_loss": 5.376544867401123,
+ "train_acc": 0.01006,
+ "test_loss": 4.9106194869995115,
+ "test_acc": 0.01,
+ "lyapunov": 1.5990420381736268,
+ "grad_norm": 0.7808973134784486,
+ "grad_max_sv": 0.023315236158668994,
+ "grad_min_sv": 0.0,
+ "grad_condition": 23315236158.668995,
+ "lr": 0.00016543469682057076,
+ "time_sec": 177.3295497894287
+ },
+ {
+ "epoch": 111,
+ "train_loss": 5.366748910522461,
+ "train_acc": 0.01,
+ "test_loss": 4.904478953552246,
+ "test_acc": 0.01,
+ "lyapunov": 1.5930900046282717,
+ "grad_norm": 0.8315740534061841,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00015772644703565552,
+ "time_sec": 177.3059582710266
+ },
+ {
+ "epoch": 112,
+ "train_loss": 5.365462461242676,
+ "train_acc": 0.0097,
+ "test_loss": 4.909817778778076,
+ "test_acc": 0.01,
+ "lyapunov": 1.591839042770893,
+ "grad_norm": 1.0644316030188519,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00015016832974331713,
+ "time_sec": 177.3259735107422
+ },
+ {
+ "epoch": 113,
+ "train_loss": 5.366983929290772,
+ "train_acc": 0.01,
+ "test_loss": 4.893335526275635,
+ "test_acc": 0.01,
+ "lyapunov": 1.5934227226335373,
+ "grad_norm": 1.0331708046855217,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00014276366018359834,
+ "time_sec": 177.29799342155457
+ },
+ {
+ "epoch": 114,
+ "train_loss": 5.367780682678223,
+ "train_acc": 0.01,
+ "test_loss": 4.896582912445068,
+ "test_acc": 0.01,
+ "lyapunov": 1.5942320003533912,
+ "grad_norm": 1.09308769834869,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00013551568628929425,
+ "time_sec": 177.33024215698242
+ },
+ {
+ "epoch": 115,
+ "train_loss": 5.367718472900391,
+ "train_acc": 0.01,
+ "test_loss": 4.895343659973144,
+ "test_acc": 0.01,
+ "lyapunov": 1.5940615042396213,
+ "grad_norm": 1.2673802568939343,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00012842758726130276,
+ "time_sec": 177.3362259864807
+ },
+ {
+ "epoch": 116,
+ "train_loss": 5.3657911352539065,
+ "train_acc": 0.01,
+ "test_loss": 4.906929530334473,
+ "test_acc": 0.01,
+ "lyapunov": 1.5921993859283758,
+ "grad_norm": 1.2617224687326039,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001215024721741218,
+ "time_sec": 177.28457856178284
+ },
+ {
+ "epoch": 117,
+ "train_loss": 5.366755274505615,
+ "train_acc": 0.00962,
+ "test_loss": 4.891025592041015,
+ "test_acc": 0.01,
+ "lyapunov": 1.5932053120239922,
+ "grad_norm": 1.3667828520013348,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00011474337861210538,
+ "time_sec": 177.260840177536
+ },
+ {
+ "epoch": 118,
+ "train_loss": 5.369936829376221,
+ "train_acc": 0.00938,
+ "test_loss": 4.908762777709961,
+ "test_acc": 0.01,
+ "lyapunov": 1.5956426922927427,
+ "grad_norm": 1.4737347393486513,
+ "grad_max_sv": 0.002789213368669152,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2789213368.6691523,
+ "lr": 0.00010815327133708009,
+ "time_sec": 177.28786754608154
+ },
+ {
+ "epoch": 119,
+ "train_loss": 5.367702166290283,
+ "train_acc": 0.01006,
+ "test_loss": 4.900025549316406,
+ "test_acc": 0.01,
+ "lyapunov": 1.5938852357742426,
+ "grad_norm": 1.445693487120252,
+ "grad_max_sv": 0.004225540207698941,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4225540207.698941,
+ "lr": 0.00010173504098790182,
+ "time_sec": 177.32281279563904
+ },
+ {
+ "epoch": 120,
+ "train_loss": 5.366396225891113,
+ "train_acc": 0.01,
+ "test_loss": 4.875214715576172,
+ "test_acc": 0.01,
+ "lyapunov": 1.5928466237719408,
+ "grad_norm": 1.5218270915127643,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 177.28257083892822
+ },
+ {
+ "epoch": 121,
+ "train_loss": 5.366784219818115,
+ "train_acc": 0.01,
+ "test_loss": 4.868653475952148,
+ "test_acc": 0.01,
+ "lyapunov": 1.5932423071483213,
+ "grad_norm": 1.5915107890267433,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 177.2724094390869
+ },
+ {
+ "epoch": 122,
+ "train_loss": 5.3684937673950195,
+ "train_acc": 0.0095,
+ "test_loss": 4.872081127929688,
+ "test_acc": 0.01,
+ "lyapunov": 1.5947217929088855,
+ "grad_norm": 1.7802951927894717,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 177.29115104675293
+ },
+ {
+ "epoch": 123,
+ "train_loss": 5.368383057250977,
+ "train_acc": 0.00976,
+ "test_loss": 4.865282067871094,
+ "test_acc": 0.01,
+ "lyapunov": 1.5946415565202914,
+ "grad_norm": 1.8635884798014917,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 177.29619812965393
+ },
+ {
+ "epoch": 124,
+ "train_loss": 5.369555229797363,
+ "train_acc": 0.01,
+ "test_loss": 4.850182081604004,
+ "test_acc": 0.01,
+ "lyapunov": 1.595543795839295,
+ "grad_norm": 1.9786412883932707,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 177.28673815727234
+ },
+ {
+ "epoch": 125,
+ "train_loss": 5.366839987792969,
+ "train_acc": 0.0099,
+ "test_loss": 4.863481466674805,
+ "test_acc": 0.01,
+ "lyapunov": 1.5933110564566024,
+ "grad_norm": 1.981713372629457,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 177.54408073425293
+ },
+ {
+ "epoch": 126,
+ "train_loss": 5.367286334533691,
+ "train_acc": 0.00978,
+ "test_loss": 4.864164552307129,
+ "test_acc": 0.01,
+ "lyapunov": 1.593780165133269,
+ "grad_norm": 2.0792063115884303,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 177.27722811698914
+ },
+ {
+ "epoch": 127,
+ "train_loss": 5.377017222900391,
+ "train_acc": 0.00976,
+ "test_loss": 4.867053485107422,
+ "test_acc": 0.01,
+ "lyapunov": 1.5985291836511752,
+ "grad_norm": 1.8808489686841805,
+ "grad_max_sv": 0.0020057843998074532,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2005784399.8074532,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 177.32938599586487
+ },
+ {
+ "epoch": 128,
+ "train_loss": 5.3731236241149904,
+ "train_acc": 0.0099,
+ "test_loss": 4.862087628173828,
+ "test_acc": 0.01,
+ "lyapunov": 1.5972985928625707,
+ "grad_norm": 2.0544715272998646,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 177.26091361045837
+ },
+ {
+ "epoch": 129,
+ "train_loss": 5.366952188110352,
+ "train_acc": 0.00966,
+ "test_loss": 4.87226043548584,
+ "test_acc": 0.01,
+ "lyapunov": 1.5934485755003323,
+ "grad_norm": 2.0287817825331826,
+ "grad_max_sv": 0.0008733986876904964,
+ "grad_min_sv": 0.0,
+ "grad_condition": 873398687.6904964,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 177.30408883094788
+ },
+ {
+ "epoch": 130,
+ "train_loss": 5.36849506149292,
+ "train_acc": 0.01004,
+ "test_loss": 4.863279203796386,
+ "test_acc": 0.01,
+ "lyapunov": 1.594751832735203,
+ "grad_norm": 1.980669281269925,
+ "grad_max_sv": 0.010736069735139608,
+ "grad_min_sv": 0.0,
+ "grad_condition": 10736069735.139608,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 177.28869652748108
+ },
+ {
+ "epoch": 131,
+ "train_loss": 5.377595603637696,
+ "train_acc": 0.01,
+ "test_loss": 4.866737941741944,
+ "test_acc": 0.01,
+ "lyapunov": 1.5995000756305198,
+ "grad_norm": 2.154727256033659,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 177.257958650589
+ },
+ {
+ "epoch": 132,
+ "train_loss": 5.369090413818359,
+ "train_acc": 0.01,
+ "test_loss": 4.858406136322022,
+ "test_acc": 0.01,
+ "lyapunov": 1.5953167524484113,
+ "grad_norm": 2.191344847482899,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 177.27152252197266
+ },
+ {
+ "epoch": 133,
+ "train_loss": 5.3665374522399905,
+ "train_acc": 0.01,
+ "test_loss": 4.860008187866211,
+ "test_acc": 0.01,
+ "lyapunov": 1.5930466167152386,
+ "grad_norm": 2.0841828503003916,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 177.28846549987793
+ },
+ {
+ "epoch": 134,
+ "train_loss": 5.366383743286133,
+ "train_acc": 0.00974,
+ "test_loss": 4.848487128448486,
+ "test_acc": 0.01,
+ "lyapunov": 1.592855043118567,
+ "grad_norm": 2.195653914411608,
+ "grad_max_sv": 0.0033036706037819384,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3303670603.7819386,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 177.28988027572632
+ },
+ {
+ "epoch": 135,
+ "train_loss": 5.367761196746827,
+ "train_acc": 0.00998,
+ "test_loss": 4.859366925048828,
+ "test_acc": 0.01,
+ "lyapunov": 1.594165514802079,
+ "grad_norm": 2.1904859959999126,
+ "grad_max_sv": 0.0012543844059109688,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1254384405.9109688,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 177.2780725955963
+ },
+ {
+ "epoch": 136,
+ "train_loss": 5.366510193634033,
+ "train_acc": 0.01,
+ "test_loss": 4.8595954734802245,
+ "test_acc": 0.01,
+ "lyapunov": 1.5930009638257039,
+ "grad_norm": 2.1839168134099793,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 177.28521990776062
+ },
+ {
+ "epoch": 137,
+ "train_loss": 5.367833109741211,
+ "train_acc": 0.01,
+ "test_loss": 4.850632510375976,
+ "test_acc": 0.01,
+ "lyapunov": 1.5938955752745918,
+ "grad_norm": 2.14228114693839,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 177.32584595680237
+ },
+ {
+ "epoch": 138,
+ "train_loss": 5.378068528137207,
+ "train_acc": 0.01018,
+ "test_loss": 4.858175395202637,
+ "test_acc": 0.01,
+ "lyapunov": 1.5998802581406615,
+ "grad_norm": 2.218784068596557,
+ "grad_max_sv": 0.0014573325868695974,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1457332586.8695974,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 177.31577253341675
+ },
+ {
+ "epoch": 139,
+ "train_loss": 5.367863772277832,
+ "train_acc": 0.01034,
+ "test_loss": 4.8480802886962895,
+ "test_acc": 0.01,
+ "lyapunov": 1.5942664253132424,
+ "grad_norm": 2.2444364897318794,
+ "grad_max_sv": 0.012257534638047218,
+ "grad_min_sv": 0.0,
+ "grad_condition": 12257534638.047218,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 177.30443215370178
+ },
+ {
+ "epoch": 140,
+ "train_loss": 5.366426722717285,
+ "train_acc": 0.00962,
+ "test_loss": 4.848219221496582,
+ "test_acc": 0.01,
+ "lyapunov": 1.5928701375756422,
+ "grad_norm": 2.3192997356397203,
+ "grad_max_sv": 0.006218939693644643,
+ "grad_min_sv": 0.0,
+ "grad_condition": 6218939693.644643,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 177.33384609222412
+ },
+ {
+ "epoch": 141,
+ "train_loss": 5.36580462097168,
+ "train_acc": 0.00986,
+ "test_loss": 4.850540889739991,
+ "test_acc": 0.01,
+ "lyapunov": 1.592248017830617,
+ "grad_norm": 2.287220965288124,
+ "grad_max_sv": 0.0013559065759181977,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1355906575.9181976,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 177.32693576812744
+ },
+ {
+ "epoch": 142,
+ "train_loss": 5.3662375875854496,
+ "train_acc": 0.01,
+ "test_loss": 4.853694881439209,
+ "test_acc": 0.01,
+ "lyapunov": 1.5927291526209058,
+ "grad_norm": 2.302468482661773,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 177.3142066001892
+ },
+ {
+ "epoch": 143,
+ "train_loss": 5.372984427642822,
+ "train_acc": 0.01004,
+ "test_loss": 4.852922064208984,
+ "test_acc": 0.01,
+ "lyapunov": 1.597528722889893,
+ "grad_norm": 2.348373340052694,
+ "grad_max_sv": 0.0011802260298281908,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1180226029.8281908,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 177.3356897830963
+ },
+ {
+ "epoch": 144,
+ "train_loss": 5.368205472106934,
+ "train_acc": 0.00984,
+ "test_loss": 4.849281020355225,
+ "test_acc": 0.01,
+ "lyapunov": 1.594479467252941,
+ "grad_norm": 2.312922144804607,
+ "grad_max_sv": 0.0006380858831107616,
+ "grad_min_sv": 0.0,
+ "grad_condition": 638085883.1107616,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 177.28971314430237
+ },
+ {
+ "epoch": 145,
+ "train_loss": 5.366419898681641,
+ "train_acc": 0.01006,
+ "test_loss": 4.848984435272217,
+ "test_acc": 0.01,
+ "lyapunov": 1.592920510360347,
+ "grad_norm": 2.317195419975272,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 177.31689953804016
+ },
+ {
+ "epoch": 146,
+ "train_loss": 5.373454104766846,
+ "train_acc": 0.01,
+ "test_loss": 4.849994027709961,
+ "test_acc": 0.01,
+ "lyapunov": 1.598964246642559,
+ "grad_norm": 2.4233925402092833,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 177.32813477516174
+ },
+ {
+ "epoch": 147,
+ "train_loss": 5.3674054251098635,
+ "train_acc": 0.01,
+ "test_loss": 4.851546574401856,
+ "test_acc": 0.01,
+ "lyapunov": 1.5935643969289481,
+ "grad_norm": 2.3247951305562196,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 177.28444719314575
+ },
+ {
+ "epoch": 148,
+ "train_loss": 5.3666025303649905,
+ "train_acc": 0.01,
+ "test_loss": 4.8515466201782225,
+ "test_acc": 0.01,
+ "lyapunov": 1.5931046256019026,
+ "grad_norm": 2.3395920546004754,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 177.2980020046234
+ },
+ {
+ "epoch": 149,
+ "train_loss": 5.365688817749024,
+ "train_acc": 0.01,
+ "test_loss": 4.851546644592285,
+ "test_acc": 0.01,
+ "lyapunov": 1.5921499198659912,
+ "grad_norm": 2.4070679367245766,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 177.28436994552612
+ },
+ {
+ "epoch": 150,
+ "train_loss": 5.363941977539063,
+ "train_acc": 0.01,
+ "test_loss": 4.851546675109863,
+ "test_acc": 0.01,
+ "lyapunov": 1.5903311498329769,
+ "grad_norm": 2.3202323044197746,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0,
+ "time_sec": 177.27790570259094
+ }
+ ]
+ }
+} \ No newline at end of file