summaryrefslogtreecommitdiff
path: root/runs/depth_scaling_stable_init
diff options
context:
space:
mode:
Diffstat (limited to 'runs/depth_scaling_stable_init')
-rw-r--r--runs/depth_scaling_stable_init/cifar100_20260102-133755/config.json23
-rw-r--r--runs/depth_scaling_stable_init/cifar100_20260102-133755/results.json16822
2 files changed, 16845 insertions, 0 deletions
diff --git a/runs/depth_scaling_stable_init/cifar100_20260102-133755/config.json b/runs/depth_scaling_stable_init/cifar100_20260102-133755/config.json
new file mode 100644
index 0000000..a220257
--- /dev/null
+++ b/runs/depth_scaling_stable_init/cifar100_20260102-133755/config.json
@@ -0,0 +1,23 @@
+{
+ "dataset": "cifar100",
+ "depths": [
+ 4,
+ 8,
+ 12,
+ 16
+ ],
+ "T": 4,
+ "epochs": 150,
+ "batch_size": 128,
+ "lr": 0.001,
+ "lambda_reg": 0.1,
+ "lambda_target": -0.1,
+ "data_dir": "./data",
+ "out_dir": "runs/depth_scaling_stable_init",
+ "device": "cuda",
+ "seed": 42,
+ "no_progress": false,
+ "reg_type": "squared",
+ "warmup_epochs": 20,
+ "stable_init": true
+} \ No newline at end of file
diff --git a/runs/depth_scaling_stable_init/cifar100_20260102-133755/results.json b/runs/depth_scaling_stable_init/cifar100_20260102-133755/results.json
new file mode 100644
index 0000000..3de0e89
--- /dev/null
+++ b/runs/depth_scaling_stable_init/cifar100_20260102-133755/results.json
@@ -0,0 +1,16822 @@
+{
+ "vanilla": {
+ "4": [
+ {
+ "epoch": 1,
+ "train_loss": 3.8700216691589358,
+ "train_acc": 0.12266,
+ "test_loss": 3.471041242599487,
+ "test_acc": 0.1892,
+ "lyapunov": null,
+ "grad_norm": 5.871605597993606,
+ "grad_max_sv": 4.127117091417313,
+ "grad_min_sv": 1.0455270382792037e-07,
+ "grad_condition": 49062288.68792993,
+ "lr": 0.0009998903417374227,
+ "time_sec": 16.27198028564453
+ },
+ {
+ "epoch": 2,
+ "train_loss": 3.1769318112182616,
+ "train_acc": 0.22848,
+ "test_loss": 3.0822217151641844,
+ "test_acc": 0.2623,
+ "lyapunov": null,
+ "grad_norm": 4.062262644221631,
+ "grad_max_sv": 2.610152545571327,
+ "grad_min_sv": 7.51297792088955e-08,
+ "grad_condition": 5467508398.9579,
+ "lr": 0.0009995614150494292,
+ "time_sec": 15.849408626556396
+ },
+ {
+ "epoch": 3,
+ "train_loss": 2.7716760053253173,
+ "train_acc": 0.30112,
+ "test_loss": 2.786010754776001,
+ "test_acc": 0.3025,
+ "lyapunov": null,
+ "grad_norm": 3.306849913177874,
+ "grad_max_sv": 1.982076707482338,
+ "grad_min_sv": 6.276024400175828e-08,
+ "grad_condition": 35650611.42411845,
+ "lr": 0.0009990133642141358,
+ "time_sec": 15.585639715194702
+ },
+ {
+ "epoch": 4,
+ "train_loss": 2.52623803855896,
+ "train_acc": 0.34808,
+ "test_loss": 2.753477826690674,
+ "test_acc": 0.31,
+ "lyapunov": null,
+ "grad_norm": 2.9097492182391815,
+ "grad_max_sv": 1.6385449588298797,
+ "grad_min_sv": 5.4328751075694014e-08,
+ "grad_condition": 39318936.04767501,
+ "lr": 0.0009982464296247522,
+ "time_sec": 15.567962408065796
+ },
+ {
+ "epoch": 5,
+ "train_loss": 2.336665892715454,
+ "train_acc": 0.38814,
+ "test_loss": 2.762642176055908,
+ "test_acc": 0.3278,
+ "lyapunov": null,
+ "grad_norm": 2.633575942359962,
+ "grad_max_sv": 1.4780948996543883,
+ "grad_min_sv": 4.9716202832339465e-08,
+ "grad_condition": 36374716.14412971,
+ "lr": 0.0009972609476841367,
+ "time_sec": 15.589628219604492
+ },
+ {
+ "epoch": 6,
+ "train_loss": 2.1819915383148194,
+ "train_acc": 0.42402,
+ "test_loss": 2.879850026321411,
+ "test_acc": 0.3169,
+ "lyapunov": null,
+ "grad_norm": 2.4016337956595826,
+ "grad_max_sv": 1.2914279341697692,
+ "grad_min_sv": 4.639223961377947e-08,
+ "grad_condition": 67967054.09377375,
+ "lr": 0.000996057350657239,
+ "time_sec": 15.569096803665161
+ },
+ {
+ "epoch": 7,
+ "train_loss": 2.051711977081299,
+ "train_acc": 0.45262,
+ "test_loss": 2.3678430866241453,
+ "test_acc": 0.3932,
+ "lyapunov": null,
+ "grad_norm": 2.226191538130221,
+ "grad_max_sv": 1.1724753439426423,
+ "grad_min_sv": 4.296711672013842e-08,
+ "grad_condition": 36498738.129443035,
+ "lr": 0.000994636166481494,
+ "time_sec": 15.596983671188354
+ },
+ {
+ "epoch": 8,
+ "train_loss": 1.940541718597412,
+ "train_acc": 0.47698,
+ "test_loss": 2.2571875411987303,
+ "test_acc": 0.4255,
+ "lyapunov": null,
+ "grad_norm": 2.0805351562913987,
+ "grad_max_sv": 1.1051331430673599,
+ "grad_min_sv": 4.002405433189971e-08,
+ "grad_condition": 35597702.92584355,
+ "lr": 0.0009929980185352525,
+ "time_sec": 15.578535795211792
+ },
+ {
+ "epoch": 9,
+ "train_loss": 1.8394872580337525,
+ "train_acc": 0.49896,
+ "test_loss": 2.447062807273865,
+ "test_acc": 0.3908,
+ "lyapunov": null,
+ "grad_norm": 1.95549418174433,
+ "grad_max_sv": 0.9836901038885116,
+ "grad_min_sv": 3.7306198631681385e-08,
+ "grad_condition": 62081794.94354477,
+ "lr": 0.0009911436253643444,
+ "time_sec": 15.615386486053467
+ },
+ {
+ "epoch": 10,
+ "train_loss": 1.7619124493789673,
+ "train_acc": 0.51634,
+ "test_loss": 2.1738934711456297,
+ "test_acc": 0.4315,
+ "lyapunov": null,
+ "grad_norm": 1.8481164153982472,
+ "grad_max_sv": 0.9101693272590637,
+ "grad_min_sv": 3.497988239065109e-08,
+ "grad_condition": 46371834.68583612,
+ "lr": 0.0009890738003669028,
+ "time_sec": 15.591166496276855
+ },
+ {
+ "epoch": 11,
+ "train_loss": 1.6779080270385742,
+ "train_acc": 0.5374,
+ "test_loss": 2.1254464902877808,
+ "test_acc": 0.4554,
+ "lyapunov": null,
+ "grad_norm": 1.761015251152075,
+ "grad_max_sv": 0.8580568209290504,
+ "grad_min_sv": 3.36019686630884e-08,
+ "grad_condition": 43516726.56073545,
+ "lr": 0.00098678945143658,
+ "time_sec": 15.584970235824585
+ },
+ {
+ "epoch": 12,
+ "train_loss": 1.6224668700790406,
+ "train_acc": 0.5503,
+ "test_loss": 2.1070931062698364,
+ "test_acc": 0.4572,
+ "lyapunov": null,
+ "grad_norm": 1.6795284434799669,
+ "grad_max_sv": 0.8227274164557457,
+ "grad_min_sv": 3.2408061501065785e-08,
+ "grad_condition": 46743715.81403457,
+ "lr": 0.0009842915805643154,
+ "time_sec": 15.587612390518188
+ },
+ {
+ "epoch": 13,
+ "train_loss": 1.5589283563995362,
+ "train_acc": 0.56658,
+ "test_loss": 2.109080162811279,
+ "test_acc": 0.4555,
+ "lyapunov": null,
+ "grad_norm": 1.6107025543208409,
+ "grad_max_sv": 0.7555071026086807,
+ "grad_min_sv": 3.021804662181257e-08,
+ "grad_condition": 771669383.9576478,
+ "lr": 0.000981581283398829,
+ "time_sec": 15.570199012756348
+ },
+ {
+ "epoch": 14,
+ "train_loss": 1.5079251358795167,
+ "train_acc": 0.57552,
+ "test_loss": 2.0982689178466796,
+ "test_acc": 0.4612,
+ "lyapunov": null,
+ "grad_norm": 1.5561237300872648,
+ "grad_max_sv": 0.7464557528495789,
+ "grad_min_sv": 2.9360349014517782e-08,
+ "grad_condition": 57384357.84720645,
+ "lr": 0.0009786597487660333,
+ "time_sec": 15.58092999458313
+ },
+ {
+ "epoch": 15,
+ "train_loss": 1.4521892065048219,
+ "train_acc": 0.59046,
+ "test_loss": 2.311817477607727,
+ "test_acc": 0.4302,
+ "lyapunov": null,
+ "grad_norm": 1.5030460275712159,
+ "grad_max_sv": 0.6973782196640969,
+ "grad_min_sv": 2.806552138745477e-08,
+ "grad_condition": 50094988.442197144,
+ "lr": 0.0009755282581475766,
+ "time_sec": 15.59303069114685
+ },
+ {
+ "epoch": 16,
+ "train_loss": 1.4043401465606689,
+ "train_acc": 0.6018,
+ "test_loss": 1.9470401285171508,
+ "test_acc": 0.4966,
+ "lyapunov": null,
+ "grad_norm": 1.4501603734300015,
+ "grad_max_sv": 0.6692761570215225,
+ "grad_min_sv": 2.707263816043026e-08,
+ "grad_condition": 123937233.96376769,
+ "lr": 0.0009721881851187403,
+ "time_sec": 15.581094026565552
+ },
+ {
+ "epoch": 17,
+ "train_loss": 1.3696716709136962,
+ "train_acc": 0.61152,
+ "test_loss": 1.937501217842102,
+ "test_acc": 0.499,
+ "lyapunov": null,
+ "grad_norm": 1.4220829625575298,
+ "grad_max_sv": 0.6630528435111046,
+ "grad_min_sv": 2.6855075777043603e-08,
+ "grad_condition": 85926301.07871899,
+ "lr": 0.0009686409947459456,
+ "time_sec": 15.594961643218994
+ },
+ {
+ "epoch": 18,
+ "train_loss": 1.3274028357696532,
+ "train_acc": 0.62202,
+ "test_loss": 2.163087944793701,
+ "test_acc": 0.4562,
+ "lyapunov": null,
+ "grad_norm": 1.3749658522523285,
+ "grad_max_sv": 0.6294455677270889,
+ "grad_min_sv": 2.59231922022235e-08,
+ "grad_condition": 301195911.7425653,
+ "lr": 0.0009648882429441254,
+ "time_sec": 15.60923433303833
+ },
+ {
+ "epoch": 19,
+ "train_loss": 1.2825380062484741,
+ "train_acc": 0.63366,
+ "test_loss": 2.012470700645447,
+ "test_acc": 0.4881,
+ "lyapunov": null,
+ "grad_norm": 1.3365974210853477,
+ "grad_max_sv": 0.6173068635165692,
+ "grad_min_sv": 2.522445298643039e-08,
+ "grad_condition": 107736394.99929431,
+ "lr": 0.00096093157579425,
+ "time_sec": 15.59559416770935
+ },
+ {
+ "epoch": 20,
+ "train_loss": 1.2454956715774537,
+ "train_acc": 0.63962,
+ "test_loss": 1.862760306930542,
+ "test_acc": 0.5166,
+ "lyapunov": null,
+ "grad_norm": 1.3087654259412098,
+ "grad_max_sv": 0.583590354025364,
+ "grad_min_sv": 2.470869329140868e-08,
+ "grad_condition": 28538129.547009837,
+ "lr": 0.0009567727288213001,
+ "time_sec": 15.578768253326416
+ },
+ {
+ "epoch": 21,
+ "train_loss": 1.2203223657226563,
+ "train_acc": 0.64712,
+ "test_loss": 1.8641546312332153,
+ "test_acc": 0.5193,
+ "lyapunov": null,
+ "grad_norm": 1.2837238048732729,
+ "grad_max_sv": 0.5924517832696438,
+ "grad_min_sv": 2.4348954538039312e-08,
+ "grad_condition": 93781869.91679552,
+ "lr": 0.0009524135262330095,
+ "time_sec": 15.614121198654175
+ },
+ {
+ "epoch": 22,
+ "train_loss": 1.1865811985397339,
+ "train_acc": 0.65476,
+ "test_loss": 2.0345648471832276,
+ "test_acc": 0.4893,
+ "lyapunov": null,
+ "grad_norm": 1.2512260920694542,
+ "grad_max_sv": 0.5759196959435939,
+ "grad_min_sv": 2.384011341116654e-08,
+ "grad_condition": 30288258.368695997,
+ "lr": 0.0009478558801197061,
+ "time_sec": 15.612670183181763
+ },
+ {
+ "epoch": 23,
+ "train_loss": 1.1597199523544313,
+ "train_acc": 0.66328,
+ "test_loss": 1.7475012817382813,
+ "test_acc": 0.5456,
+ "lyapunov": null,
+ "grad_norm": 1.22099214296503,
+ "grad_max_sv": 0.550060736387968,
+ "grad_min_sv": 2.259520101161039e-08,
+ "grad_condition": 44796813.002676345,
+ "lr": 0.000943101789615607,
+ "time_sec": 15.634280920028687
+ },
+ {
+ "epoch": 24,
+ "train_loss": 1.1278974151992798,
+ "train_acc": 0.67306,
+ "test_loss": 1.9481268964767455,
+ "test_acc": 0.5126,
+ "lyapunov": null,
+ "grad_norm": 1.204438554486539,
+ "grad_max_sv": 0.5349243931472302,
+ "grad_min_sv": 2.225912898324439e-08,
+ "grad_condition": 183220898.93468145,
+ "lr": 0.0009381533400219313,
+ "time_sec": 15.649690389633179
+ },
+ {
+ "epoch": 25,
+ "train_loss": 1.096091796951294,
+ "train_acc": 0.68,
+ "test_loss": 2.0196787605285644,
+ "test_acc": 0.5038,
+ "lyapunov": null,
+ "grad_norm": 1.1805395110366357,
+ "grad_max_sv": 0.5209554739296436,
+ "grad_min_sv": 2.1478067243539635e-08,
+ "grad_condition": 4139399544.237787,
+ "lr": 0.0009330127018922189,
+ "time_sec": 15.62510895729065
+ },
+ {
+ "epoch": 26,
+ "train_loss": 1.0776387982559203,
+ "train_acc": 0.6821,
+ "test_loss": 1.9688811008453369,
+ "test_acc": 0.5111,
+ "lyapunov": null,
+ "grad_norm": 1.1581479939567827,
+ "grad_max_sv": 0.5094197139143943,
+ "grad_min_sv": 2.1775440942062298e-08,
+ "grad_condition": 34416173.97374034,
+ "lr": 0.000927682130080253,
+ "time_sec": 15.616900444030762
+ },
+ {
+ "epoch": 27,
+ "train_loss": 1.039057155227661,
+ "train_acc": 0.69314,
+ "test_loss": 1.9735270919799806,
+ "test_acc": 0.5109,
+ "lyapunov": null,
+ "grad_norm": 1.1358478872536777,
+ "grad_max_sv": 0.49843145087361335,
+ "grad_min_sv": 2.0908967124713685e-08,
+ "grad_condition": 147733329.90615898,
+ "lr": 0.0009221639627510072,
+ "time_sec": 15.589634418487549
+ },
+ {
+ "epoch": 28,
+ "train_loss": 1.0186366636657715,
+ "train_acc": 0.698,
+ "test_loss": 1.849167727470398,
+ "test_acc": 0.5327,
+ "lyapunov": null,
+ "grad_norm": 1.1179885484776635,
+ "grad_max_sv": 0.4846231251955032,
+ "grad_min_sv": 2.064624871154358e-08,
+ "grad_condition": 187535295.68791586,
+ "lr": 0.0009164606203550494,
+ "time_sec": 15.606561422348022
+ },
+ {
+ "epoch": 29,
+ "train_loss": 0.9894418817901611,
+ "train_acc": 0.70704,
+ "test_loss": 1.9159385116577148,
+ "test_acc": 0.5256,
+ "lyapunov": null,
+ "grad_norm": 1.1033010317922292,
+ "grad_max_sv": 0.49175669252872467,
+ "grad_min_sv": 2.0545614226596954e-08,
+ "grad_condition": 28139106.19650669,
+ "lr": 0.0009105746045668516,
+ "time_sec": 15.596401453018188
+ },
+ {
+ "epoch": 30,
+ "train_loss": 0.9679239891052246,
+ "train_acc": 0.7117,
+ "test_loss": 1.7626015129089356,
+ "test_acc": 0.5579,
+ "lyapunov": null,
+ "grad_norm": 1.0852050474778043,
+ "grad_max_sv": 0.4818247281014919,
+ "grad_min_sv": 2.036887303824564e-08,
+ "grad_condition": 39564164.33428894,
+ "lr": 0.0009045084971874733,
+ "time_sec": 15.594120025634766
+ },
+ {
+ "epoch": 31,
+ "train_loss": 0.9477154457473755,
+ "train_acc": 0.71644,
+ "test_loss": 2.001366552734375,
+ "test_acc": 0.5184,
+ "lyapunov": null,
+ "grad_norm": 1.0714526476916026,
+ "grad_max_sv": 0.45983982309699056,
+ "grad_min_sv": 1.9430452840446533e-08,
+ "grad_condition": 51624978.6905687,
+ "lr": 0.0008982649590120977,
+ "time_sec": 15.600859880447388
+ },
+ {
+ "epoch": 32,
+ "train_loss": 0.922220166015625,
+ "train_acc": 0.72322,
+ "test_loss": 1.8274271976470948,
+ "test_acc": 0.552,
+ "lyapunov": null,
+ "grad_norm": 1.0486432180828922,
+ "grad_max_sv": 0.4561096005141735,
+ "grad_min_sv": 1.9119260000893812e-08,
+ "grad_condition": 81358962.64807202,
+ "lr": 0.0008918467286629196,
+ "time_sec": 15.56894040107727
+ },
+ {
+ "epoch": 33,
+ "train_loss": 0.9045637095451355,
+ "train_acc": 0.72804,
+ "test_loss": 1.885004960823059,
+ "test_acc": 0.543,
+ "lyapunov": null,
+ "grad_norm": 1.0374896564588747,
+ "grad_max_sv": 0.4518023140728474,
+ "grad_min_sv": 1.917957178319829e-08,
+ "grad_condition": 182673348.7808311,
+ "lr": 0.0008852566213878943,
+ "time_sec": 15.568547010421753
+ },
+ {
+ "epoch": 34,
+ "train_loss": 0.8857564904785157,
+ "train_acc": 0.7319,
+ "test_loss": 1.9111962642669678,
+ "test_acc": 0.5412,
+ "lyapunov": null,
+ "grad_norm": 1.0274666482550194,
+ "grad_max_sv": 0.4493935935199261,
+ "grad_min_sv": 1.881604217469912e-08,
+ "grad_condition": 248617918.33796087,
+ "lr": 0.000878497527825878,
+ "time_sec": 15.588915586471558
+ },
+ {
+ "epoch": 35,
+ "train_loss": 0.8623492621994019,
+ "train_acc": 0.73752,
+ "test_loss": 1.9594444644927977,
+ "test_acc": 0.5265,
+ "lyapunov": null,
+ "grad_norm": 1.0169882023721266,
+ "grad_max_sv": 0.4450283505022526,
+ "grad_min_sv": 1.8621021413700588e-08,
+ "grad_condition": 51970835.60873811,
+ "lr": 0.000871572412738697,
+ "time_sec": 15.614988565444946
+ },
+ {
+ "epoch": 36,
+ "train_loss": 0.847761401977539,
+ "train_acc": 0.7438,
+ "test_loss": 1.8443275575637816,
+ "test_acc": 0.549,
+ "lyapunov": null,
+ "grad_norm": 0.9972656465889882,
+ "grad_max_sv": 0.42991913110017776,
+ "grad_min_sv": 1.8110683554228845e-08,
+ "grad_condition": 63643440.089395806,
+ "lr": 0.0008644843137107055,
+ "time_sec": 15.585567474365234
+ },
+ {
+ "epoch": 37,
+ "train_loss": 0.8332586885261536,
+ "train_acc": 0.74546,
+ "test_loss": 1.8331810934066772,
+ "test_acc": 0.5565,
+ "lyapunov": null,
+ "grad_norm": 0.986142343180959,
+ "grad_max_sv": 0.43020778223872186,
+ "grad_min_sv": 1.820308022093542e-08,
+ "grad_condition": 38440650.114556134,
+ "lr": 0.0008572363398164014,
+ "time_sec": 15.585892915725708
+ },
+ {
+ "epoch": 38,
+ "train_loss": 0.808667633934021,
+ "train_acc": 0.75458,
+ "test_loss": 1.8140192237854005,
+ "test_acc": 0.563,
+ "lyapunov": null,
+ "grad_norm": 0.9767417084572454,
+ "grad_max_sv": 0.43866117894649503,
+ "grad_min_sv": 1.805343496832229e-08,
+ "grad_condition": 246839591.75793108,
+ "lr": 0.0008498316702566826,
+ "time_sec": 15.576987028121948
+ },
+ {
+ "epoch": 39,
+ "train_loss": 0.7920477479743957,
+ "train_acc": 0.75774,
+ "test_loss": 1.998388723373413,
+ "test_acc": 0.5317,
+ "lyapunov": null,
+ "grad_norm": 0.9634949356985317,
+ "grad_max_sv": 0.41083301454782484,
+ "grad_min_sv": 1.7408181231248764e-08,
+ "grad_condition": 207856381.9830411,
+ "lr": 0.0008422735529643442,
+ "time_sec": 15.604882955551147
+ },
+ {
+ "epoch": 40,
+ "train_loss": 0.783684113292694,
+ "train_acc": 0.76062,
+ "test_loss": 1.8349973222732543,
+ "test_acc": 0.5584,
+ "lyapunov": null,
+ "grad_norm": 0.9543715044222432,
+ "grad_max_sv": 0.4067095577716827,
+ "grad_min_sv": 1.715405322372243e-08,
+ "grad_condition": 38065468.34049429,
+ "lr": 0.0008345653031794289,
+ "time_sec": 15.61448359489441
+ },
+ {
+ "epoch": 41,
+ "train_loss": 0.756040623588562,
+ "train_acc": 0.76704,
+ "test_loss": 1.8635019605636596,
+ "test_acc": 0.5623,
+ "lyapunov": null,
+ "grad_norm": 0.9400945005657612,
+ "grad_max_sv": 0.4006481133401394,
+ "grad_min_sv": 1.706379215496434e-08,
+ "grad_condition": 129917875.15326138,
+ "lr": 0.0008267103019950526,
+ "time_sec": 15.605446100234985
+ },
+ {
+ "epoch": 42,
+ "train_loss": 0.747281655292511,
+ "train_acc": 0.77008,
+ "test_loss": 1.804893379020691,
+ "test_acc": 0.5637,
+ "lyapunov": null,
+ "grad_norm": 0.9342754196581016,
+ "grad_max_sv": 0.4069997236132622,
+ "grad_min_sv": 1.690411219660258e-08,
+ "grad_condition": 833088985.4088073,
+ "lr": 0.0008187119948743447,
+ "time_sec": 15.598352432250977
+ },
+ {
+ "epoch": 43,
+ "train_loss": 0.7258966027832031,
+ "train_acc": 0.7753,
+ "test_loss": 1.808250590133667,
+ "test_acc": 0.5688,
+ "lyapunov": null,
+ "grad_norm": 0.916899863328162,
+ "grad_max_sv": 0.39457144513726233,
+ "grad_min_sv": 1.6684048499693294e-08,
+ "grad_condition": 39061518.56268385,
+ "lr": 0.000810573890139155,
+ "time_sec": 15.596754550933838
+ },
+ {
+ "epoch": 44,
+ "train_loss": 0.7053343192100525,
+ "train_acc": 0.78078,
+ "test_loss": 1.9365575828552246,
+ "test_acc": 0.5516,
+ "lyapunov": null,
+ "grad_norm": 0.909458464797614,
+ "grad_max_sv": 0.38970902636647226,
+ "grad_min_sv": 1.6407527701767232e-08,
+ "grad_condition": 42244499.19662833,
+ "lr": 0.0008022995574311873,
+ "time_sec": 15.606269836425781
+ },
+ {
+ "epoch": 45,
+ "train_loss": 0.6963989092254639,
+ "train_acc": 0.7839,
+ "test_loss": 1.8283310445785523,
+ "test_acc": 0.5639,
+ "lyapunov": null,
+ "grad_norm": 0.9004438327166017,
+ "grad_max_sv": 0.39948956444859507,
+ "grad_min_sv": 1.6195382334174836e-08,
+ "grad_condition": 362020379.02432,
+ "lr": 0.0007938926261462363,
+ "time_sec": 15.588224411010742
+ },
+ {
+ "epoch": 46,
+ "train_loss": 0.690151353931427,
+ "train_acc": 0.78312,
+ "test_loss": 1.838386841392517,
+ "test_acc": 0.5656,
+ "lyapunov": null,
+ "grad_norm": 0.8990022149636615,
+ "grad_max_sv": 0.3958965942263603,
+ "grad_min_sv": 1.6439048992683212e-08,
+ "grad_condition": 739976934.4713734,
+ "lr": 0.0007853567838422158,
+ "time_sec": 15.608047008514404
+ },
+ {
+ "epoch": 47,
+ "train_loss": 0.6644145600509643,
+ "train_acc": 0.79316,
+ "test_loss": 1.7317404174804687,
+ "test_acc": 0.5881,
+ "lyapunov": null,
+ "grad_norm": 0.8888942071856848,
+ "grad_max_sv": 0.3830097340047359,
+ "grad_min_sv": 1.5947025791551715e-08,
+ "grad_condition": 43737023.5418247,
+ "lr": 0.0007766957746216719,
+ "time_sec": 15.61106562614441
+ },
+ {
+ "epoch": 48,
+ "train_loss": 0.6501899867248535,
+ "train_acc": 0.7961,
+ "test_loss": 2.0301314384460447,
+ "test_acc": 0.5481,
+ "lyapunov": null,
+ "grad_norm": 0.8710848056333472,
+ "grad_max_sv": 0.37484541684389117,
+ "grad_min_sv": 1.568856004691144e-08,
+ "grad_condition": 71400760.33312531,
+ "lr": 0.0007679133974894982,
+ "time_sec": 15.616482496261597
+ },
+ {
+ "epoch": 49,
+ "train_loss": 0.6407210964202881,
+ "train_acc": 0.79878,
+ "test_loss": 1.8660895137786866,
+ "test_acc": 0.5703,
+ "lyapunov": null,
+ "grad_norm": 0.8631402634979823,
+ "grad_max_sv": 0.3794224761426449,
+ "grad_min_sv": 1.5698247981393855e-08,
+ "grad_condition": 48831357.42187855,
+ "lr": 0.000759013504686565,
+ "time_sec": 15.608244180679321
+ },
+ {
+ "epoch": 50,
+ "train_loss": 0.635532203464508,
+ "train_acc": 0.79966,
+ "test_loss": 1.8019765382766724,
+ "test_acc": 0.5773,
+ "lyapunov": null,
+ "grad_norm": 0.8639281681323187,
+ "grad_max_sv": 0.3756891183555126,
+ "grad_min_sv": 1.5385762375426383e-08,
+ "grad_condition": 443886531.5137703,
+ "lr": 0.0007499999999999998,
+ "time_sec": 15.595497369766235
+ },
+ {
+ "epoch": 51,
+ "train_loss": 0.6136586366081238,
+ "train_acc": 0.8078,
+ "test_loss": 1.985259211730957,
+ "test_acc": 0.5541,
+ "lyapunov": null,
+ "grad_norm": 0.8502360335489318,
+ "grad_max_sv": 0.38991634622216226,
+ "grad_min_sv": 1.589003087859586e-08,
+ "grad_condition": 36685688.17597731,
+ "lr": 0.0007408768370508575,
+ "time_sec": 15.606870174407959
+ },
+ {
+ "epoch": 52,
+ "train_loss": 0.6016868180465699,
+ "train_acc": 0.81054,
+ "test_loss": 1.9059622749328613,
+ "test_acc": 0.5677,
+ "lyapunov": null,
+ "grad_norm": 0.839451980682905,
+ "grad_max_sv": 0.3655779927968979,
+ "grad_min_sv": 1.50471602150537e-08,
+ "grad_condition": 68824107.55111663,
+ "lr": 0.0007316480175599307,
+ "time_sec": 15.595157861709595
+ },
+ {
+ "epoch": 53,
+ "train_loss": 0.5874249538040162,
+ "train_acc": 0.81406,
+ "test_loss": 1.9880520868301392,
+ "test_acc": 0.5586,
+ "lyapunov": null,
+ "grad_norm": 0.8317551917480781,
+ "grad_max_sv": 0.3655713267624378,
+ "grad_min_sv": 1.5141927978482016e-08,
+ "grad_condition": 349299867.91202754,
+ "lr": 0.0007223175895924635,
+ "time_sec": 15.589019060134888
+ },
+ {
+ "epoch": 54,
+ "train_loss": 0.577422985610962,
+ "train_acc": 0.8184,
+ "test_loss": 1.9396752899169922,
+ "test_acc": 0.5636,
+ "lyapunov": null,
+ "grad_norm": 0.8261938394130597,
+ "grad_max_sv": 0.3618521079421043,
+ "grad_min_sv": 1.4864520584507642e-08,
+ "grad_condition": 553216070.5433874,
+ "lr": 0.0007128896457825361,
+ "time_sec": 15.610572338104248
+ },
+ {
+ "epoch": 55,
+ "train_loss": 0.5702339578819275,
+ "train_acc": 0.81924,
+ "test_loss": 1.8778120471954345,
+ "test_acc": 0.5713,
+ "lyapunov": null,
+ "grad_norm": 0.8242148097122628,
+ "grad_max_sv": 0.36288107857108115,
+ "grad_min_sv": 1.4883936903103966e-08,
+ "grad_condition": 52140637.21728975,
+ "lr": 0.0007033683215378998,
+ "time_sec": 15.605257749557495
+ },
+ {
+ "epoch": 56,
+ "train_loss": 0.5589845707130432,
+ "train_acc": 0.82372,
+ "test_loss": 1.8699417673110963,
+ "test_acc": 0.5751,
+ "lyapunov": null,
+ "grad_norm": 0.8186771944690047,
+ "grad_max_sv": 0.346701592952013,
+ "grad_min_sv": 1.459523215271985e-08,
+ "grad_condition": 46853728.14353165,
+ "lr": 0.0006937577932260512,
+ "time_sec": 15.589865684509277
+ },
+ {
+ "epoch": 57,
+ "train_loss": 0.5443892800807952,
+ "train_acc": 0.82776,
+ "test_loss": 1.965821966934204,
+ "test_acc": 0.5664,
+ "lyapunov": null,
+ "grad_norm": 0.8036351010817813,
+ "grad_max_sv": 0.3483227726072073,
+ "grad_min_sv": 1.4410761232583335e-08,
+ "grad_condition": 73431270.59891501,
+ "lr": 0.0006840622763423388,
+ "time_sec": 15.590615510940552
+ },
+ {
+ "epoch": 58,
+ "train_loss": 0.5372896729660034,
+ "train_acc": 0.82954,
+ "test_loss": 1.876914355659485,
+ "test_acc": 0.5811,
+ "lyapunov": null,
+ "grad_norm": 0.7997423554449953,
+ "grad_max_sv": 0.34569344371557237,
+ "grad_min_sv": 1.4015608398366443e-08,
+ "grad_condition": 828306651.3532289,
+ "lr": 0.0006742860236609073,
+ "time_sec": 15.640390872955322
+ },
+ {
+ "epoch": 59,
+ "train_loss": 0.5291300660514832,
+ "train_acc": 0.83176,
+ "test_loss": 1.8113979286193849,
+ "test_acc": 0.5866,
+ "lyapunov": null,
+ "grad_norm": 0.7903239162734349,
+ "grad_max_sv": 0.34317835718393325,
+ "grad_min_sv": 1.4270118212610095e-08,
+ "grad_condition": 130381299.82028241,
+ "lr": 0.0006644333233692913,
+ "time_sec": 15.598358869552612
+ },
+ {
+ "epoch": 60,
+ "train_loss": 0.5121459530830383,
+ "train_acc": 0.83708,
+ "test_loss": 1.8623944423675538,
+ "test_acc": 0.5809,
+ "lyapunov": null,
+ "grad_norm": 0.7828571196598214,
+ "grad_max_sv": 0.33372929617762565,
+ "grad_min_sv": 1.3842122733448425e-08,
+ "grad_condition": 47391163.99310992,
+ "lr": 0.0006545084971874734,
+ "time_sec": 15.594441413879395
+ },
+ {
+ "epoch": 61,
+ "train_loss": 0.5045927854156494,
+ "train_acc": 0.83722,
+ "test_loss": 1.868363607597351,
+ "test_acc": 0.5833,
+ "lyapunov": null,
+ "grad_norm": 0.782632751951769,
+ "grad_max_sv": 0.3441222012042999,
+ "grad_min_sv": 1.4132956021933527e-08,
+ "grad_condition": 770221957.2190915,
+ "lr": 0.0006445158984722354,
+ "time_sec": 15.625693082809448
+ },
+ {
+ "epoch": 62,
+ "train_loss": 0.4909844134426117,
+ "train_acc": 0.84268,
+ "test_loss": 1.9616632486343384,
+ "test_acc": 0.5686,
+ "lyapunov": null,
+ "grad_norm": 0.7640706557919354,
+ "grad_max_sv": 0.3262421116232872,
+ "grad_min_sv": 1.3609901451661078e-08,
+ "grad_condition": 70578003.89460334,
+ "lr": 0.0006344599103076324,
+ "time_sec": 15.61337399482727
+ },
+ {
+ "epoch": 63,
+ "train_loss": 0.47858007513046263,
+ "train_acc": 0.84808,
+ "test_loss": 1.8504299934387207,
+ "test_acc": 0.5864,
+ "lyapunov": null,
+ "grad_norm": 0.7612944717059198,
+ "grad_max_sv": 0.3300259932875633,
+ "grad_min_sv": 1.34369991692607e-08,
+ "grad_condition": 1366561815.948382,
+ "lr": 0.0006243449435824269,
+ "time_sec": 15.618177652359009
+ },
+ {
+ "epoch": 64,
+ "train_loss": 0.47501785024642945,
+ "train_acc": 0.84756,
+ "test_loss": 1.8781955436706543,
+ "test_acc": 0.5869,
+ "lyapunov": null,
+ "grad_norm": 0.7572180647827939,
+ "grad_max_sv": 0.3278561718761921,
+ "grad_min_sv": 1.3324545805690896e-08,
+ "grad_condition": 581046380.377969,
+ "lr": 0.0006141754350553275,
+ "time_sec": 15.624166488647461
+ },
+ {
+ "epoch": 65,
+ "train_loss": 0.4702414323043823,
+ "train_acc": 0.84926,
+ "test_loss": 1.892370820426941,
+ "test_acc": 0.586,
+ "lyapunov": null,
+ "grad_norm": 0.7563650221448377,
+ "grad_max_sv": 0.3307614929974079,
+ "grad_min_sv": 1.3784487005921026e-08,
+ "grad_condition": 464200921.7045374,
+ "lr": 0.0006039558454088793,
+ "time_sec": 15.617845058441162
+ },
+ {
+ "epoch": 66,
+ "train_loss": 0.45756534008026123,
+ "train_acc": 0.85312,
+ "test_loss": 1.9519972061157227,
+ "test_acc": 0.5808,
+ "lyapunov": null,
+ "grad_norm": 0.7420841565788096,
+ "grad_max_sv": 0.33202062249183656,
+ "grad_min_sv": 1.338400364191486e-08,
+ "grad_condition": 499395104.1034541,
+ "lr": 0.000593690657292862,
+ "time_sec": 15.611196994781494
+ },
+ {
+ "epoch": 67,
+ "train_loss": 0.44467548862457273,
+ "train_acc": 0.85686,
+ "test_loss": 1.9216414470672607,
+ "test_acc": 0.5822,
+ "lyapunov": null,
+ "grad_norm": 0.7382025740357703,
+ "grad_max_sv": 0.3282777763903141,
+ "grad_min_sv": 1.3046149181881323e-08,
+ "grad_condition": 346705862.33150136,
+ "lr": 0.0005833843733580507,
+ "time_sec": 15.611254215240479
+ },
+ {
+ "epoch": 68,
+ "train_loss": 0.43985233959198,
+ "train_acc": 0.85918,
+ "test_loss": 1.8851093154907226,
+ "test_acc": 0.5926,
+ "lyapunov": null,
+ "grad_norm": 0.7289145095731725,
+ "grad_max_sv": 0.32352428287267687,
+ "grad_min_sv": 1.3040011394684428e-08,
+ "grad_condition": 442041574.8141201,
+ "lr": 0.0005730415142812054,
+ "time_sec": 15.625309467315674
+ },
+ {
+ "epoch": 69,
+ "train_loss": 0.4362604184055328,
+ "train_acc": 0.85998,
+ "test_loss": 1.8714712146759034,
+ "test_acc": 0.5926,
+ "lyapunov": null,
+ "grad_norm": 0.7311888404996788,
+ "grad_max_sv": 0.31886391565203664,
+ "grad_min_sv": 1.2968906573272102e-08,
+ "grad_condition": 3567171952.0862184,
+ "lr": 0.0005626666167821517,
+ "time_sec": 15.61151123046875
+ },
+ {
+ "epoch": 70,
+ "train_loss": 0.42215480308532716,
+ "train_acc": 0.86416,
+ "test_loss": 2.019381594085693,
+ "test_acc": 0.5791,
+ "lyapunov": null,
+ "grad_norm": 0.721768423243528,
+ "grad_max_sv": 0.3247049540281296,
+ "grad_min_sv": 1.2853580642424936e-08,
+ "grad_condition": 450059064.02256596,
+ "lr": 0.0005522642316338265,
+ "time_sec": 15.629756689071655
+ },
+ {
+ "epoch": 71,
+ "train_loss": 0.4138381930923462,
+ "train_acc": 0.8672,
+ "test_loss": 1.8805969470977784,
+ "test_acc": 0.5939,
+ "lyapunov": null,
+ "grad_norm": 0.7122183187054967,
+ "grad_max_sv": 0.31785007640719415,
+ "grad_min_sv": 1.2996066436378461e-08,
+ "grad_condition": 197171308.1464749,
+ "lr": 0.0005418389216661573,
+ "time_sec": 15.619616270065308
+ },
+ {
+ "epoch": 72,
+ "train_loss": 0.40292635828018186,
+ "train_acc": 0.86882,
+ "test_loss": 1.9322007545471191,
+ "test_acc": 0.5786,
+ "lyapunov": null,
+ "grad_norm": 0.7085910743884665,
+ "grad_max_sv": 0.3134432151913643,
+ "grad_min_sv": 1.2498033243762453e-08,
+ "grad_condition": 793091340.8871062,
+ "lr": 0.0005313952597646563,
+ "time_sec": 15.617356300354004
+ },
+ {
+ "epoch": 73,
+ "train_loss": 0.40141631307601927,
+ "train_acc": 0.86948,
+ "test_loss": 1.8957605976104737,
+ "test_acc": 0.599,
+ "lyapunov": null,
+ "grad_norm": 0.7091751625468098,
+ "grad_max_sv": 0.3174535669386387,
+ "grad_min_sv": 1.2447811244958862e-08,
+ "grad_condition": 249741254.61747846,
+ "lr": 0.0005209378268645994,
+ "time_sec": 15.621675968170166
+ },
+ {
+ "epoch": 74,
+ "train_loss": 0.3882115649795532,
+ "train_acc": 0.87366,
+ "test_loss": 1.98493223361969,
+ "test_acc": 0.5838,
+ "lyapunov": null,
+ "grad_norm": 0.6962545006972763,
+ "grad_max_sv": 0.31799899972975254,
+ "grad_min_sv": 1.2635416091113378e-08,
+ "grad_condition": 228682453.11998367,
+ "lr": 0.0005104712099416781,
+ "time_sec": 15.613324403762817
+ },
+ {
+ "epoch": 75,
+ "train_loss": 0.3784026951885223,
+ "train_acc": 0.8775,
+ "test_loss": 1.9258492612838745,
+ "test_acc": 0.5894,
+ "lyapunov": null,
+ "grad_norm": 0.6897862834083666,
+ "grad_max_sv": 0.3025407921522856,
+ "grad_min_sv": 1.191642424076822e-08,
+ "grad_condition": 517580765.4604114,
+ "lr": 0.0004999999999999996,
+ "time_sec": 15.604532957077026
+ },
+ {
+ "epoch": 76,
+ "train_loss": 0.3745850126075745,
+ "train_acc": 0.87942,
+ "test_loss": 1.8862019395828247,
+ "test_acc": 0.597,
+ "lyapunov": null,
+ "grad_norm": 0.6831871296489548,
+ "grad_max_sv": 0.30832933597266676,
+ "grad_min_sv": 1.2160173869495832e-08,
+ "grad_condition": 947775184.6338822,
+ "lr": 0.0004895287900583212,
+ "time_sec": 15.608951568603516
+ },
+ {
+ "epoch": 77,
+ "train_loss": 0.3610551133441925,
+ "train_acc": 0.88172,
+ "test_loss": 1.880063851928711,
+ "test_acc": 0.6012,
+ "lyapunov": null,
+ "grad_norm": 0.6743453354187542,
+ "grad_max_sv": 0.29855253025889394,
+ "grad_min_sv": 1.2030242225015767e-08,
+ "grad_condition": 516312299.61059207,
+ "lr": 0.0004790621731353997,
+ "time_sec": 15.615072250366211
+ },
+ {
+ "epoch": 78,
+ "train_loss": 0.3575943685531616,
+ "train_acc": 0.88478,
+ "test_loss": 1.9622120880126954,
+ "test_acc": 0.5938,
+ "lyapunov": null,
+ "grad_norm": 0.6751503647014531,
+ "grad_max_sv": 0.30869465619325637,
+ "grad_min_sv": 1.1962258270568903e-08,
+ "grad_condition": 156961942.34190208,
+ "lr": 0.000468604740235343,
+ "time_sec": 15.620108127593994
+ },
+ {
+ "epoch": 79,
+ "train_loss": 0.356780963382721,
+ "train_acc": 0.88514,
+ "test_loss": 1.9785774551391602,
+ "test_acc": 0.5895,
+ "lyapunov": null,
+ "grad_norm": 0.6750273249196351,
+ "grad_max_sv": 0.29922002404928205,
+ "grad_min_sv": 1.1769536231547029e-08,
+ "grad_condition": 159293637.70185965,
+ "lr": 0.00045816107833384175,
+ "time_sec": 15.615866899490356
+ },
+ {
+ "epoch": 80,
+ "train_loss": 0.34938912315368653,
+ "train_acc": 0.8876,
+ "test_loss": 1.9177911525726319,
+ "test_acc": 0.5916,
+ "lyapunov": null,
+ "grad_norm": 0.6633930537019016,
+ "grad_max_sv": 0.29133019372820856,
+ "grad_min_sv": 1.1681813408617736e-08,
+ "grad_condition": 263364196.96272945,
+ "lr": 0.0004477357683661729,
+ "time_sec": 15.618734359741211
+ },
+ {
+ "epoch": 81,
+ "train_loss": 0.34074662324905397,
+ "train_acc": 0.8899,
+ "test_loss": 1.947013536453247,
+ "test_acc": 0.5907,
+ "lyapunov": null,
+ "grad_norm": 0.6597022593428697,
+ "grad_max_sv": 0.29191571436822417,
+ "grad_min_sv": 1.156299900565089e-08,
+ "grad_condition": 1345147447.952278,
+ "lr": 0.00043733338321784746,
+ "time_sec": 15.646045923233032
+ },
+ {
+ "epoch": 82,
+ "train_loss": 0.33476794362068174,
+ "train_acc": 0.89196,
+ "test_loss": 1.995362993812561,
+ "test_acc": 0.5918,
+ "lyapunov": null,
+ "grad_norm": 0.6563550515125143,
+ "grad_max_sv": 0.28989207223057745,
+ "grad_min_sv": 1.1521310828500105e-08,
+ "grad_condition": 1549368517.9852664,
+ "lr": 0.0004269584857187939,
+ "time_sec": 15.651390075683594
+ },
+ {
+ "epoch": 83,
+ "train_loss": 0.32779589292526246,
+ "train_acc": 0.89466,
+ "test_loss": 1.9326098243713379,
+ "test_acc": 0.5984,
+ "lyapunov": null,
+ "grad_norm": 0.6471640564495617,
+ "grad_max_sv": 0.29146968461573125,
+ "grad_min_sv": 1.1487493853379327e-08,
+ "grad_condition": 92617304.39349434,
+ "lr": 0.0004166156266419484,
+ "time_sec": 15.611905336380005
+ },
+ {
+ "epoch": 84,
+ "train_loss": 0.3205149848842621,
+ "train_acc": 0.89636,
+ "test_loss": 2.084268938064575,
+ "test_acc": 0.5809,
+ "lyapunov": null,
+ "grad_norm": 0.6452842014274853,
+ "grad_max_sv": 0.2868046831339598,
+ "grad_min_sv": 1.1289359868812965e-08,
+ "grad_condition": 186807946.77140856,
+ "lr": 0.0004063093427071373,
+ "time_sec": 15.605120658874512
+ },
+ {
+ "epoch": 85,
+ "train_loss": 0.31429147192001344,
+ "train_acc": 0.89772,
+ "test_loss": 1.8867773443222047,
+ "test_acc": 0.6067,
+ "lyapunov": null,
+ "grad_norm": 0.6402388209165808,
+ "grad_max_sv": 0.29072388894855977,
+ "grad_min_sv": 1.1252009047418853e-08,
+ "grad_condition": 102815726.30519769,
+ "lr": 0.0003960441545911199,
+ "time_sec": 15.619008302688599
+ },
+ {
+ "epoch": 86,
+ "train_loss": 0.3057248209381104,
+ "train_acc": 0.90034,
+ "test_loss": 1.9401320112228393,
+ "test_acc": 0.5983,
+ "lyapunov": null,
+ "grad_norm": 0.6311267078269261,
+ "grad_max_sv": 0.2907364759594202,
+ "grad_min_sv": 1.1278600659490879e-08,
+ "grad_condition": 156533701.22010937,
+ "lr": 0.0003858245649446718,
+ "time_sec": 15.645244359970093
+ },
+ {
+ "epoch": 87,
+ "train_loss": 0.3014916487598419,
+ "train_acc": 0.9024,
+ "test_loss": 1.9676358179092408,
+ "test_acc": 0.5951,
+ "lyapunov": null,
+ "grad_norm": 0.6286377862812311,
+ "grad_max_sv": 0.29410710372030735,
+ "grad_min_sv": 1.117144211807558e-08,
+ "grad_condition": 1243341457.898049,
+ "lr": 0.00037565505641757235,
+ "time_sec": 15.613637685775757
+ },
+ {
+ "epoch": 88,
+ "train_loss": 0.2975629404449463,
+ "train_acc": 0.90206,
+ "test_loss": 1.9475040822982788,
+ "test_acc": 0.6007,
+ "lyapunov": null,
+ "grad_norm": 0.6288857771151286,
+ "grad_max_sv": 0.29210252575576306,
+ "grad_min_sv": 1.1327018099556787e-08,
+ "grad_condition": 449577659.23919934,
+ "lr": 0.00036554008969236695,
+ "time_sec": 15.627456188201904
+ },
+ {
+ "epoch": 89,
+ "train_loss": 0.2940291863822937,
+ "train_acc": 0.90424,
+ "test_loss": 1.9751218059539795,
+ "test_acc": 0.6041,
+ "lyapunov": null,
+ "grad_norm": 0.624248588717073,
+ "grad_max_sv": 0.27752059176564214,
+ "grad_min_sv": 1.0839235129161267e-08,
+ "grad_condition": 328108890.12738866,
+ "lr": 0.0003554841015277638,
+ "time_sec": 15.661294221878052
+ },
+ {
+ "epoch": 90,
+ "train_loss": 0.28330512808799746,
+ "train_acc": 0.90742,
+ "test_loss": 1.9922785207748412,
+ "test_acc": 0.6018,
+ "lyapunov": null,
+ "grad_norm": 0.6169602856180438,
+ "grad_max_sv": 0.2886409737169743,
+ "grad_min_sv": 1.0983499523081752e-08,
+ "grad_condition": 97610883.30544701,
+ "lr": 0.000345491502812526,
+ "time_sec": 15.610979795455933
+ },
+ {
+ "epoch": 91,
+ "train_loss": 0.2814662490653992,
+ "train_acc": 0.90908,
+ "test_loss": 1.9960870874404908,
+ "test_acc": 0.5995,
+ "lyapunov": null,
+ "grad_norm": 0.6132865794782463,
+ "grad_max_sv": 0.28339540734887125,
+ "grad_min_sv": 1.0941020271021395e-08,
+ "grad_condition": 145384408.70816708,
+ "lr": 0.0003355666766307081,
+ "time_sec": 15.639533281326294
+ },
+ {
+ "epoch": 92,
+ "train_loss": 0.2761197953605652,
+ "train_acc": 0.91006,
+ "test_loss": 1.993612285232544,
+ "test_acc": 0.6007,
+ "lyapunov": null,
+ "grad_norm": 0.6073672916952068,
+ "grad_max_sv": 0.2746456813067198,
+ "grad_min_sv": 1.0572886616905252e-08,
+ "grad_condition": 62093577.47245115,
+ "lr": 0.00032571397633909225,
+ "time_sec": 15.616953611373901
+ },
+ {
+ "epoch": 93,
+ "train_loss": 0.2773143856334686,
+ "train_acc": 0.90906,
+ "test_loss": 1.9627196998596192,
+ "test_acc": 0.5993,
+ "lyapunov": null,
+ "grad_norm": 0.6057396266879189,
+ "grad_max_sv": 0.27635425254702567,
+ "grad_min_sv": 1.0533270900208586e-08,
+ "grad_condition": 200919941.49428365,
+ "lr": 0.00031593772365766094,
+ "time_sec": 15.62587594985962
+ },
+ {
+ "epoch": 94,
+ "train_loss": 0.2620466177368164,
+ "train_acc": 0.91416,
+ "test_loss": 2.0111697412490845,
+ "test_acc": 0.602,
+ "lyapunov": null,
+ "grad_norm": 0.5926928515974628,
+ "grad_max_sv": 0.28529031090438367,
+ "grad_min_sv": 1.0650170428677317e-08,
+ "grad_condition": 743433094.0082552,
+ "lr": 0.0003062422067739483,
+ "time_sec": 15.626370191574097
+ },
+ {
+ "epoch": 95,
+ "train_loss": 0.2537871124172211,
+ "train_acc": 0.91762,
+ "test_loss": 1.9979699476242065,
+ "test_acc": 0.5996,
+ "lyapunov": null,
+ "grad_norm": 0.5795471657923094,
+ "grad_max_sv": 0.27274232916533947,
+ "grad_min_sv": 1.036865705178816e-08,
+ "grad_condition": 309294232.0879529,
+ "lr": 0.00029663167846209965,
+ "time_sec": 15.634578943252563
+ },
+ {
+ "epoch": 96,
+ "train_loss": 0.2604071279144287,
+ "train_acc": 0.91558,
+ "test_loss": 2.0250939807891846,
+ "test_acc": 0.5981,
+ "lyapunov": null,
+ "grad_norm": 0.5880459177262352,
+ "grad_max_sv": 0.27270981669425964,
+ "grad_min_sv": 1.0527747556186851e-08,
+ "grad_condition": 634008594.0035694,
+ "lr": 0.00028711035421746345,
+ "time_sec": 15.610902070999146
+ },
+ {
+ "epoch": 97,
+ "train_loss": 0.25580399082183836,
+ "train_acc": 0.91794,
+ "test_loss": 1.9363522800445556,
+ "test_acc": 0.611,
+ "lyapunov": null,
+ "grad_norm": 0.5834698969226986,
+ "grad_max_sv": 0.2803939372301102,
+ "grad_min_sv": 1.0679914613353353e-08,
+ "grad_condition": 719199780.3413004,
+ "lr": 0.00027768241040753615,
+ "time_sec": 15.64728569984436
+ },
+ {
+ "epoch": 98,
+ "train_loss": 0.24704306831359862,
+ "train_acc": 0.92026,
+ "test_loss": 1.959199716567993,
+ "test_acc": 0.6064,
+ "lyapunov": null,
+ "grad_norm": 0.5767069189645235,
+ "grad_max_sv": 0.2719736970961094,
+ "grad_min_sv": 1.0407105681484868e-08,
+ "grad_condition": 507738893.5347587,
+ "lr": 0.00026835198244006903,
+ "time_sec": 15.606433153152466
+ },
+ {
+ "epoch": 99,
+ "train_loss": 0.23963388308048247,
+ "train_acc": 0.92232,
+ "test_loss": 2.0193208892822265,
+ "test_acc": 0.604,
+ "lyapunov": null,
+ "grad_norm": 0.5636948581506628,
+ "grad_max_sv": 0.2563767429441214,
+ "grad_min_sv": 9.613457626483913e-09,
+ "grad_condition": 152598313.52871948,
+ "lr": 0.0002591231629491421,
+ "time_sec": 15.63752031326294
+ },
+ {
+ "epoch": 100,
+ "train_loss": 0.24343088443756103,
+ "train_acc": 0.92086,
+ "test_loss": 1.9747429904937743,
+ "test_acc": 0.6041,
+ "lyapunov": null,
+ "grad_norm": 0.5699300559096447,
+ "grad_max_sv": 0.270798621699214,
+ "grad_min_sv": 1.0453353890187232e-08,
+ "grad_condition": 2642582699.9195356,
+ "lr": 0.0002499999999999997,
+ "time_sec": 15.625839710235596
+ },
+ {
+ "epoch": 101,
+ "train_loss": 0.2352629409980774,
+ "train_acc": 0.92396,
+ "test_loss": 1.989087490463257,
+ "test_acc": 0.6026,
+ "lyapunov": null,
+ "grad_norm": 0.5635783773655396,
+ "grad_max_sv": 0.2760987766087055,
+ "grad_min_sv": 1.0676657122982158e-08,
+ "grad_condition": 230608448.0042146,
+ "lr": 0.00024098649531343477,
+ "time_sec": 15.618889093399048
+ },
+ {
+ "epoch": 102,
+ "train_loss": 0.23230449400901795,
+ "train_acc": 0.9242,
+ "test_loss": 2.011552722930908,
+ "test_acc": 0.6012,
+ "lyapunov": null,
+ "grad_norm": 0.5597262828511032,
+ "grad_max_sv": 0.2676333624869585,
+ "grad_min_sv": 1.013142310103167e-08,
+ "grad_condition": 765944599.5566685,
+ "lr": 0.0002320866025105016,
+ "time_sec": 15.619239091873169
+ },
+ {
+ "epoch": 103,
+ "train_loss": 0.22586535712242126,
+ "train_acc": 0.92702,
+ "test_loss": 1.984936227798462,
+ "test_acc": 0.6064,
+ "lyapunov": null,
+ "grad_norm": 0.5525662827107412,
+ "grad_max_sv": 0.26978373192250726,
+ "grad_min_sv": 1.0020810805059718e-08,
+ "grad_condition": 426927099.4434453,
+ "lr": 0.0002233042253783278,
+ "time_sec": 15.617717981338501
+ },
+ {
+ "epoch": 104,
+ "train_loss": 0.2259028799390793,
+ "train_acc": 0.92724,
+ "test_loss": 1.9414194402694702,
+ "test_acc": 0.6138,
+ "lyapunov": null,
+ "grad_norm": 0.5552198456176712,
+ "grad_max_sv": 0.2549734696745872,
+ "grad_min_sv": 9.559075114318542e-09,
+ "grad_condition": 2183845809.503984,
+ "lr": 0.000214643216157784,
+ "time_sec": 15.639457702636719
+ },
+ {
+ "epoch": 105,
+ "train_loss": 0.21585512964725495,
+ "train_acc": 0.93068,
+ "test_loss": 1.9875489110946656,
+ "test_acc": 0.606,
+ "lyapunov": null,
+ "grad_norm": 0.545110676363793,
+ "grad_max_sv": 0.2662647683173418,
+ "grad_min_sv": 9.966519613335139e-09,
+ "grad_condition": 304520020.74158037,
+ "lr": 0.00020610737385376332,
+ "time_sec": 15.633507013320923
+ },
+ {
+ "epoch": 106,
+ "train_loss": 0.2177306656885147,
+ "train_acc": 0.92888,
+ "test_loss": 2.001543083000183,
+ "test_acc": 0.6039,
+ "lyapunov": null,
+ "grad_norm": 0.550439381212866,
+ "grad_max_sv": 0.2616906825453043,
+ "grad_min_sv": 9.792636692686207e-09,
+ "grad_condition": 257664085.8931566,
+ "lr": 0.00019770044256881242,
+ "time_sec": 15.617624759674072
+ },
+ {
+ "epoch": 107,
+ "train_loss": 0.21544821160316469,
+ "train_acc": 0.93026,
+ "test_loss": 1.982275790977478,
+ "test_acc": 0.6101,
+ "lyapunov": null,
+ "grad_norm": 0.5459895500350969,
+ "grad_max_sv": 0.25458521842956544,
+ "grad_min_sv": 9.842609948471428e-09,
+ "grad_condition": 482597026.39869213,
+ "lr": 0.0001894261098608447,
+ "time_sec": 15.647446632385254
+ },
+ {
+ "epoch": 108,
+ "train_loss": 0.2111588809776306,
+ "train_acc": 0.93214,
+ "test_loss": 1.9962615560531616,
+ "test_acc": 0.6122,
+ "lyapunov": null,
+ "grad_norm": 0.5418984142700298,
+ "grad_max_sv": 0.2645403627306223,
+ "grad_min_sv": 9.923241169051967e-09,
+ "grad_condition": 365555925.75439864,
+ "lr": 0.000181288005125655,
+ "time_sec": 15.624069213867188
+ },
+ {
+ "epoch": 109,
+ "train_loss": 0.20284160462856293,
+ "train_acc": 0.9356,
+ "test_loss": 1.9948909492492677,
+ "test_acc": 0.6088,
+ "lyapunov": null,
+ "grad_norm": 0.528437343256151,
+ "grad_max_sv": 0.259377746284008,
+ "grad_min_sv": 9.446828402957103e-09,
+ "grad_condition": 445873699.40050447,
+ "lr": 0.0001732896980049473,
+ "time_sec": 15.619670867919922
+ },
+ {
+ "epoch": 110,
+ "train_loss": 0.20353743035316468,
+ "train_acc": 0.93482,
+ "test_loss": 1.986756645965576,
+ "test_acc": 0.6055,
+ "lyapunov": null,
+ "grad_norm": 0.5264966046483858,
+ "grad_max_sv": 0.2641640670597553,
+ "grad_min_sv": 9.887280825321421e-09,
+ "grad_condition": 138912649.1504107,
+ "lr": 0.00016543469682057076,
+ "time_sec": 15.631803512573242
+ },
+ {
+ "epoch": 111,
+ "train_loss": 0.20074854846000673,
+ "train_acc": 0.93586,
+ "test_loss": 1.9947669797897338,
+ "test_acc": 0.6121,
+ "lyapunov": null,
+ "grad_norm": 0.5275548784671268,
+ "grad_max_sv": 0.2535504408180714,
+ "grad_min_sv": 9.46079494620021e-09,
+ "grad_condition": 547036967.0533922,
+ "lr": 0.00015772644703565552,
+ "time_sec": 15.61940598487854
+ },
+ {
+ "epoch": 112,
+ "train_loss": 0.19321160237312318,
+ "train_acc": 0.9385,
+ "test_loss": 2.0327499378204346,
+ "test_acc": 0.6062,
+ "lyapunov": null,
+ "grad_norm": 0.5166537604057669,
+ "grad_max_sv": 0.25912084989249706,
+ "grad_min_sv": 9.35720720976474e-09,
+ "grad_condition": 95478514.06504653,
+ "lr": 0.00015016832974331713,
+ "time_sec": 15.630404233932495
+ },
+ {
+ "epoch": 113,
+ "train_loss": 0.19881929339408874,
+ "train_acc": 0.93676,
+ "test_loss": 1.9957002614974975,
+ "test_acc": 0.6131,
+ "lyapunov": null,
+ "grad_norm": 0.5256468964094271,
+ "grad_max_sv": 0.26186227425932884,
+ "grad_min_sv": 9.776758263992796e-09,
+ "grad_condition": 531930595.36185646,
+ "lr": 0.00014276366018359834,
+ "time_sec": 15.610270023345947
+ },
+ {
+ "epoch": 114,
+ "train_loss": 0.19278850085735322,
+ "train_acc": 0.93894,
+ "test_loss": 1.9826040161132812,
+ "test_acc": 0.6131,
+ "lyapunov": null,
+ "grad_norm": 0.5148800122190731,
+ "grad_max_sv": 0.2489961117506027,
+ "grad_min_sv": 9.322825122396599e-09,
+ "grad_condition": 159545806.21783024,
+ "lr": 0.00013551568628929425,
+ "time_sec": 15.641097784042358
+ },
+ {
+ "epoch": 115,
+ "train_loss": 0.18285285237312318,
+ "train_acc": 0.9414,
+ "test_loss": 1.991772039604187,
+ "test_acc": 0.6142,
+ "lyapunov": null,
+ "grad_norm": 0.5028991850276996,
+ "grad_max_sv": 0.25001580603420737,
+ "grad_min_sv": 9.509952834441983e-09,
+ "grad_condition": 842043304.8653241,
+ "lr": 0.00012842758726130276,
+ "time_sec": 15.624920845031738
+ },
+ {
+ "epoch": 116,
+ "train_loss": 0.18698999623775484,
+ "train_acc": 0.94058,
+ "test_loss": 2.0126701816558836,
+ "test_acc": 0.6119,
+ "lyapunov": null,
+ "grad_norm": 0.5095041564276453,
+ "grad_max_sv": 0.26496921889483926,
+ "grad_min_sv": 9.780998184343373e-09,
+ "grad_condition": 568079773.7667667,
+ "lr": 0.0001215024721741218,
+ "time_sec": 15.629492282867432
+ },
+ {
+ "epoch": 117,
+ "train_loss": 0.18326869733810425,
+ "train_acc": 0.94208,
+ "test_loss": 2.0141338161468507,
+ "test_acc": 0.6109,
+ "lyapunov": null,
+ "grad_norm": 0.5053898511223723,
+ "grad_max_sv": 0.25150991678237916,
+ "grad_min_sv": 9.336200610613604e-09,
+ "grad_condition": 1717749653.6011043,
+ "lr": 0.00011474337861210538,
+ "time_sec": 15.634049415588379
+ },
+ {
+ "epoch": 118,
+ "train_loss": 0.18224171819210053,
+ "train_acc": 0.94188,
+ "test_loss": 2.0296729431152345,
+ "test_acc": 0.6105,
+ "lyapunov": null,
+ "grad_norm": 0.5029285155771278,
+ "grad_max_sv": 0.23879224769771099,
+ "grad_min_sv": 8.82893005297973e-09,
+ "grad_condition": 239804345.46782646,
+ "lr": 0.00010815327133708009,
+ "time_sec": 15.628947496414185
+ },
+ {
+ "epoch": 119,
+ "train_loss": 0.18119296488761902,
+ "train_acc": 0.94198,
+ "test_loss": 2.0246818908691404,
+ "test_acc": 0.6087,
+ "lyapunov": null,
+ "grad_norm": 0.5032702983874193,
+ "grad_max_sv": 0.24678345806896687,
+ "grad_min_sv": 9.113220317789883e-09,
+ "grad_condition": 857312795.1343833,
+ "lr": 0.00010173504098790182,
+ "time_sec": 15.6134774684906
+ },
+ {
+ "epoch": 120,
+ "train_loss": 0.17719127690315248,
+ "train_acc": 0.9427,
+ "test_loss": 2.01081164188385,
+ "test_acc": 0.6174,
+ "lyapunov": null,
+ "grad_norm": 0.5004254149003725,
+ "grad_max_sv": 0.246440602093935,
+ "grad_min_sv": 9.41313048775233e-09,
+ "grad_condition": 138861626.69393042,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 15.636605978012085
+ },
+ {
+ "epoch": 121,
+ "train_loss": 0.17499777765274047,
+ "train_acc": 0.94382,
+ "test_loss": 1.9586133924484252,
+ "test_acc": 0.6191,
+ "lyapunov": null,
+ "grad_norm": 0.49798749889404575,
+ "grad_max_sv": 0.24333747774362563,
+ "grad_min_sv": 8.965640931665048e-09,
+ "grad_condition": 199036180.79499412,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 15.640979051589966
+ },
+ {
+ "epoch": 122,
+ "train_loss": 0.17186202396392822,
+ "train_acc": 0.94454,
+ "test_loss": 2.0166892234802245,
+ "test_acc": 0.6135,
+ "lyapunov": null,
+ "grad_norm": 0.49330378790067125,
+ "grad_max_sv": 0.25466611608862877,
+ "grad_min_sv": 9.453950847171378e-09,
+ "grad_condition": 478328271.5351636,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 15.646830320358276
+ },
+ {
+ "epoch": 123,
+ "train_loss": 0.16818810626506805,
+ "train_acc": 0.94736,
+ "test_loss": 2.019712274169922,
+ "test_acc": 0.6142,
+ "lyapunov": null,
+ "grad_norm": 0.48351538018550005,
+ "grad_max_sv": 0.23057686612010003,
+ "grad_min_sv": 8.829706591578778e-09,
+ "grad_condition": 119186809.27894473,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 15.61932897567749
+ },
+ {
+ "epoch": 124,
+ "train_loss": 0.1690133387851715,
+ "train_acc": 0.94626,
+ "test_loss": 2.0480916412353514,
+ "test_acc": 0.6128,
+ "lyapunov": null,
+ "grad_norm": 0.48572744080768737,
+ "grad_max_sv": 0.23872192315757274,
+ "grad_min_sv": 8.860755323661872e-09,
+ "grad_condition": 3145605466.955108,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 15.644042730331421
+ },
+ {
+ "epoch": 125,
+ "train_loss": 0.168843046336174,
+ "train_acc": 0.94632,
+ "test_loss": 2.0204298835754395,
+ "test_acc": 0.6129,
+ "lyapunov": null,
+ "grad_norm": 0.4870048472763099,
+ "grad_max_sv": 0.23674570098519326,
+ "grad_min_sv": 8.746680829206827e-09,
+ "grad_condition": 1043463046.0193933,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 15.637329578399658
+ },
+ {
+ "epoch": 126,
+ "train_loss": 0.1671668215227127,
+ "train_acc": 0.94594,
+ "test_loss": 2.002202911376953,
+ "test_acc": 0.6131,
+ "lyapunov": null,
+ "grad_norm": 0.48754920878473634,
+ "grad_max_sv": 0.24048108272254468,
+ "grad_min_sv": 9.09920443853407e-09,
+ "grad_condition": 222641480.08621296,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 15.630179405212402
+ },
+ {
+ "epoch": 127,
+ "train_loss": 0.1643574129629135,
+ "train_acc": 0.94886,
+ "test_loss": 1.9984551259994507,
+ "test_acc": 0.6156,
+ "lyapunov": null,
+ "grad_norm": 0.47845542032939736,
+ "grad_max_sv": 0.24418257176876068,
+ "grad_min_sv": 9.058184188338348e-09,
+ "grad_condition": 1384258325.8409991,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 15.670144081115723
+ },
+ {
+ "epoch": 128,
+ "train_loss": 0.16359006194114686,
+ "train_acc": 0.9479,
+ "test_loss": 2.0345991184234617,
+ "test_acc": 0.6179,
+ "lyapunov": null,
+ "grad_norm": 0.48011615670673446,
+ "grad_max_sv": 0.2456669148057699,
+ "grad_min_sv": 9.08018520576876e-09,
+ "grad_condition": 6539583536.661702,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 15.629289150238037
+ },
+ {
+ "epoch": 129,
+ "train_loss": 0.16212649368047713,
+ "train_acc": 0.94982,
+ "test_loss": 2.010682648849487,
+ "test_acc": 0.6175,
+ "lyapunov": null,
+ "grad_norm": 0.4761536550945564,
+ "grad_max_sv": 0.232033634185791,
+ "grad_min_sv": 8.589821504130924e-09,
+ "grad_condition": 3119446573.9156704,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 15.64078950881958
+ },
+ {
+ "epoch": 130,
+ "train_loss": 0.16086667060375215,
+ "train_acc": 0.94958,
+ "test_loss": 1.9803698434829713,
+ "test_acc": 0.6147,
+ "lyapunov": null,
+ "grad_norm": 0.47391205330881436,
+ "grad_max_sv": 0.2445445589721203,
+ "grad_min_sv": 8.864201939140243e-09,
+ "grad_condition": 1504896403.9424946,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 15.639111280441284
+ },
+ {
+ "epoch": 131,
+ "train_loss": 0.1630353739786148,
+ "train_acc": 0.94778,
+ "test_loss": 2.0161276233673098,
+ "test_acc": 0.6182,
+ "lyapunov": null,
+ "grad_norm": 0.47703771588416854,
+ "grad_max_sv": 0.24524084888398648,
+ "grad_min_sv": 8.949330069585661e-09,
+ "grad_condition": 366306191.4994844,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 15.648417472839355
+ },
+ {
+ "epoch": 132,
+ "train_loss": 0.1624550827550888,
+ "train_acc": 0.94854,
+ "test_loss": 2.0064841974258423,
+ "test_acc": 0.6153,
+ "lyapunov": null,
+ "grad_norm": 0.4818820971540279,
+ "grad_max_sv": 0.24392225965857506,
+ "grad_min_sv": 9.014241386749028e-09,
+ "grad_condition": 324500193.81381315,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 15.652456998825073
+ },
+ {
+ "epoch": 133,
+ "train_loss": 0.15666789950847626,
+ "train_acc": 0.95052,
+ "test_loss": 2.004924358177185,
+ "test_acc": 0.614,
+ "lyapunov": null,
+ "grad_norm": 0.4692967462799058,
+ "grad_max_sv": 0.23394662290811538,
+ "grad_min_sv": 8.633084696250959e-09,
+ "grad_condition": 738953051.583332,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 15.626720190048218
+ },
+ {
+ "epoch": 134,
+ "train_loss": 0.15714832616329194,
+ "train_acc": 0.951,
+ "test_loss": 1.9721798049926758,
+ "test_acc": 0.6189,
+ "lyapunov": null,
+ "grad_norm": 0.4708593375349624,
+ "grad_max_sv": 0.2399698007851839,
+ "grad_min_sv": 8.714008907333149e-09,
+ "grad_condition": 459943684.01348275,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 15.634363174438477
+ },
+ {
+ "epoch": 135,
+ "train_loss": 0.15481690949440002,
+ "train_acc": 0.95178,
+ "test_loss": 2.056765143966675,
+ "test_acc": 0.6141,
+ "lyapunov": null,
+ "grad_norm": 0.46512649923966126,
+ "grad_max_sv": 0.23735021129250528,
+ "grad_min_sv": 8.604525054706907e-09,
+ "grad_condition": 441311318.94657505,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 15.641301155090332
+ },
+ {
+ "epoch": 136,
+ "train_loss": 0.15590213608264922,
+ "train_acc": 0.95074,
+ "test_loss": 1.9664541049957276,
+ "test_acc": 0.615,
+ "lyapunov": null,
+ "grad_norm": 0.4718253897994526,
+ "grad_max_sv": 0.24445511549711227,
+ "grad_min_sv": 8.92059932467576e-09,
+ "grad_condition": 155779083.2595345,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 15.650960445404053
+ },
+ {
+ "epoch": 137,
+ "train_loss": 0.15185086236953735,
+ "train_acc": 0.95326,
+ "test_loss": 2.047826315307617,
+ "test_acc": 0.6137,
+ "lyapunov": null,
+ "grad_norm": 0.46215794046576214,
+ "grad_max_sv": 0.2249258290976286,
+ "grad_min_sv": 8.299157507572763e-09,
+ "grad_condition": 391195089.613189,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 15.619166374206543
+ },
+ {
+ "epoch": 138,
+ "train_loss": 0.15070438093185426,
+ "train_acc": 0.95262,
+ "test_loss": 2.030345579147339,
+ "test_acc": 0.6129,
+ "lyapunov": null,
+ "grad_norm": 0.4608066254891212,
+ "grad_max_sv": 0.234202978387475,
+ "grad_min_sv": 8.521646538895875e-09,
+ "grad_condition": 5129724937.383492,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 15.623726606369019
+ },
+ {
+ "epoch": 139,
+ "train_loss": 0.15612281042575837,
+ "train_acc": 0.95076,
+ "test_loss": 2.0557478452682494,
+ "test_acc": 0.612,
+ "lyapunov": null,
+ "grad_norm": 0.47103497229286695,
+ "grad_max_sv": 0.23263695724308492,
+ "grad_min_sv": 8.57658385075566e-09,
+ "grad_condition": 101811752.76010731,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 15.65443754196167
+ },
+ {
+ "epoch": 140,
+ "train_loss": 0.15597544308423997,
+ "train_acc": 0.95086,
+ "test_loss": 1.9863805370330812,
+ "test_acc": 0.6151,
+ "lyapunov": null,
+ "grad_norm": 0.46515955894700917,
+ "grad_max_sv": 0.22864672914147377,
+ "grad_min_sv": 8.669487886083091e-09,
+ "grad_condition": 2093311134.8373718,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 15.636597394943237
+ },
+ {
+ "epoch": 141,
+ "train_loss": 0.15137063200950623,
+ "train_acc": 0.95232,
+ "test_loss": 2.0044470993041994,
+ "test_acc": 0.6185,
+ "lyapunov": null,
+ "grad_norm": 0.4628286057156769,
+ "grad_max_sv": 0.24093721210956573,
+ "grad_min_sv": 8.729446927135563e-09,
+ "grad_condition": 3146827225.783096,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 15.6335289478302
+ },
+ {
+ "epoch": 142,
+ "train_loss": 0.15115962938308716,
+ "train_acc": 0.95278,
+ "test_loss": 1.9897070358276367,
+ "test_acc": 0.6186,
+ "lyapunov": null,
+ "grad_norm": 0.45849067649845243,
+ "grad_max_sv": 0.22538469620049,
+ "grad_min_sv": 8.402085760331798e-09,
+ "grad_condition": 1185010790.8687212,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 15.64037299156189
+ },
+ {
+ "epoch": 143,
+ "train_loss": 0.15024116450309755,
+ "train_acc": 0.95378,
+ "test_loss": 1.9762957132339478,
+ "test_acc": 0.62,
+ "lyapunov": null,
+ "grad_norm": 0.4584088819764392,
+ "grad_max_sv": 0.22209009900689125,
+ "grad_min_sv": 8.452660355321145e-09,
+ "grad_condition": 1556012288.1682973,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 15.659480571746826
+ },
+ {
+ "epoch": 144,
+ "train_loss": 0.1521627188205719,
+ "train_acc": 0.95232,
+ "test_loss": 2.0099195236206056,
+ "test_acc": 0.615,
+ "lyapunov": null,
+ "grad_norm": 0.46494782588161737,
+ "grad_max_sv": 0.238496233522892,
+ "grad_min_sv": 8.729236520774175e-09,
+ "grad_condition": 69857580.46396288,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 15.64352297782898
+ },
+ {
+ "epoch": 145,
+ "train_loss": 0.15200012585163117,
+ "train_acc": 0.95196,
+ "test_loss": 1.98911852684021,
+ "test_acc": 0.6161,
+ "lyapunov": null,
+ "grad_norm": 0.46350518405517277,
+ "grad_max_sv": 0.22944532111287116,
+ "grad_min_sv": 8.441616768887356e-09,
+ "grad_condition": 1044568693.4332545,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 15.670719385147095
+ },
+ {
+ "epoch": 146,
+ "train_loss": 0.1524506710958481,
+ "train_acc": 0.95248,
+ "test_loss": 1.9624867490768432,
+ "test_acc": 0.6194,
+ "lyapunov": null,
+ "grad_norm": 0.46296967599985495,
+ "grad_max_sv": 0.24031115397810937,
+ "grad_min_sv": 8.944420498528671e-09,
+ "grad_condition": 254633054.1592765,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 15.643468141555786
+ },
+ {
+ "epoch": 147,
+ "train_loss": 0.15344970943927766,
+ "train_acc": 0.95206,
+ "test_loss": 2.0164750316619875,
+ "test_acc": 0.6171,
+ "lyapunov": null,
+ "grad_norm": 0.4641053248109342,
+ "grad_max_sv": 0.24226672500371932,
+ "grad_min_sv": 8.89504937415242e-09,
+ "grad_condition": 221436071.47224984,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 15.642008066177368
+ },
+ {
+ "epoch": 148,
+ "train_loss": 0.15008926822185517,
+ "train_acc": 0.95316,
+ "test_loss": 2.007580140686035,
+ "test_acc": 0.6105,
+ "lyapunov": null,
+ "grad_norm": 0.4593316495579621,
+ "grad_max_sv": 0.23314933404326438,
+ "grad_min_sv": 8.37392370464738e-09,
+ "grad_condition": 1235759721.5215242,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 15.637904644012451
+ },
+ {
+ "epoch": 149,
+ "train_loss": 0.1545172585248947,
+ "train_acc": 0.95082,
+ "test_loss": 1.9932567636489869,
+ "test_acc": 0.6167,
+ "lyapunov": null,
+ "grad_norm": 0.46711595173344705,
+ "grad_max_sv": 0.24011613838374615,
+ "grad_min_sv": 9.01919292514708e-09,
+ "grad_condition": 533582982.17976344,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 15.649343013763428
+ },
+ {
+ "epoch": 150,
+ "train_loss": 0.15159378504276275,
+ "train_acc": 0.95298,
+ "test_loss": 1.981881332397461,
+ "test_acc": 0.6151,
+ "lyapunov": null,
+ "grad_norm": 0.4631918119140012,
+ "grad_max_sv": 0.23626054041087627,
+ "grad_min_sv": 8.505257114788459e-09,
+ "grad_condition": 368578452.6540891,
+ "lr": 0.0,
+ "time_sec": 15.655460119247437
+ }
+ ],
+ "8": [
+ {
+ "epoch": 1,
+ "train_loss": 4.193410815277099,
+ "train_acc": 0.07754,
+ "test_loss": 4.000027540588379,
+ "test_acc": 0.1084,
+ "lyapunov": null,
+ "grad_norm": 5.824766820168824,
+ "grad_max_sv": 4.574610841274262,
+ "grad_min_sv": 1.0190309995827818e-07,
+ "grad_condition": 64142283.19081552,
+ "lr": 0.0009998903417374227,
+ "time_sec": 32.83128619194031
+ },
+ {
+ "epoch": 2,
+ "train_loss": 3.561303809967041,
+ "train_acc": 0.15712,
+ "test_loss": 3.590533604812622,
+ "test_acc": 0.1573,
+ "lyapunov": null,
+ "grad_norm": 3.9411000996615257,
+ "grad_max_sv": 2.8509309351444245,
+ "grad_min_sv": 7.158311222943414e-08,
+ "grad_condition": 97792152.02989444,
+ "lr": 0.0009995614150494292,
+ "time_sec": 32.72442889213562
+ },
+ {
+ "epoch": 3,
+ "train_loss": 3.1933692501068114,
+ "train_acc": 0.21822,
+ "test_loss": 3.4406786922454833,
+ "test_acc": 0.1888,
+ "lyapunov": null,
+ "grad_norm": 2.91352219919842,
+ "grad_max_sv": 1.9122859120368958,
+ "grad_min_sv": 5.4513909730768975e-08,
+ "grad_condition": 41901882.724198125,
+ "lr": 0.0009990133642141358,
+ "time_sec": 32.71043276786804
+ },
+ {
+ "epoch": 4,
+ "train_loss": 2.9170604755401612,
+ "train_acc": 0.266,
+ "test_loss": 3.0161821269989013,
+ "test_acc": 0.2662,
+ "lyapunov": null,
+ "grad_norm": 2.4579814839971488,
+ "grad_max_sv": 1.375921016931534,
+ "grad_min_sv": 4.532563397940948e-08,
+ "grad_condition": 34954497.395048514,
+ "lr": 0.0009982464296247522,
+ "time_sec": 32.71440148353577
+ },
+ {
+ "epoch": 5,
+ "train_loss": 2.6815094689941406,
+ "train_acc": 0.31454,
+ "test_loss": 3.171553889846802,
+ "test_acc": 0.2379,
+ "lyapunov": null,
+ "grad_norm": 2.19104728864566,
+ "grad_max_sv": 1.1679374247789382,
+ "grad_min_sv": 4.075679240767016e-08,
+ "grad_condition": 34176946.0056582,
+ "lr": 0.0009972609476841367,
+ "time_sec": 32.70787262916565
+ },
+ {
+ "epoch": 6,
+ "train_loss": 2.512476542663574,
+ "train_acc": 0.34722,
+ "test_loss": 2.8388263694763185,
+ "test_acc": 0.2956,
+ "lyapunov": null,
+ "grad_norm": 2.024852807897748,
+ "grad_max_sv": 1.048439186811447,
+ "grad_min_sv": 3.766053036924344e-08,
+ "grad_condition": 110646045.40063909,
+ "lr": 0.000996057350657239,
+ "time_sec": 32.716644048690796
+ },
+ {
+ "epoch": 7,
+ "train_loss": 2.3700338256072997,
+ "train_acc": 0.37646,
+ "test_loss": 2.664342771148682,
+ "test_acc": 0.3267,
+ "lyapunov": null,
+ "grad_norm": 1.8863637744279735,
+ "grad_max_sv": 0.9381255134940147,
+ "grad_min_sv": 3.53045587958567e-08,
+ "grad_condition": 91691166.21261387,
+ "lr": 0.000994636166481494,
+ "time_sec": 32.70954084396362
+ },
+ {
+ "epoch": 8,
+ "train_loss": 2.241964275894165,
+ "train_acc": 0.40536,
+ "test_loss": 2.3703575309753417,
+ "test_acc": 0.3827,
+ "lyapunov": null,
+ "grad_norm": 1.79442458506404,
+ "grad_max_sv": 0.8764713048934937,
+ "grad_min_sv": 3.357538055498432e-08,
+ "grad_condition": 85483165.80410945,
+ "lr": 0.0009929980185352525,
+ "time_sec": 32.705676794052124
+ },
+ {
+ "epoch": 9,
+ "train_loss": 2.1290865299224855,
+ "train_acc": 0.43074,
+ "test_loss": 2.346775402069092,
+ "test_acc": 0.3898,
+ "lyapunov": null,
+ "grad_norm": 1.6946660597355347,
+ "grad_max_sv": 0.8082527592778206,
+ "grad_min_sv": 3.168056596919433e-08,
+ "grad_condition": 84022920.74591663,
+ "lr": 0.0009911436253643444,
+ "time_sec": 32.81319451332092
+ },
+ {
+ "epoch": 10,
+ "train_loss": 2.0410905982208254,
+ "train_acc": 0.45114,
+ "test_loss": 2.352191310119629,
+ "test_acc": 0.4016,
+ "lyapunov": null,
+ "grad_norm": 1.6077351393537498,
+ "grad_max_sv": 0.7309410408139229,
+ "grad_min_sv": 2.985739961935963e-08,
+ "grad_condition": 36398179.92957014,
+ "lr": 0.0009890738003669028,
+ "time_sec": 32.67559885978699
+ },
+ {
+ "epoch": 11,
+ "train_loss": 1.9488755139160157,
+ "train_acc": 0.47108,
+ "test_loss": 2.292022847747803,
+ "test_acc": 0.4149,
+ "lyapunov": null,
+ "grad_norm": 1.5472074192305951,
+ "grad_max_sv": 0.6999917805194855,
+ "grad_min_sv": 2.931911482484395e-08,
+ "grad_condition": 29185684.451776367,
+ "lr": 0.00098678945143658,
+ "time_sec": 32.67131185531616
+ },
+ {
+ "epoch": 12,
+ "train_loss": 1.8751110802459716,
+ "train_acc": 0.48868,
+ "test_loss": 2.234260977935791,
+ "test_acc": 0.4219,
+ "lyapunov": null,
+ "grad_norm": 1.477638716923594,
+ "grad_max_sv": 0.647687041759491,
+ "grad_min_sv": 2.7830199432477e-08,
+ "grad_condition": 45906260.41435587,
+ "lr": 0.0009842915805643154,
+ "time_sec": 32.67626142501831
+ },
+ {
+ "epoch": 13,
+ "train_loss": 1.8070984636688232,
+ "train_acc": 0.50424,
+ "test_loss": 2.1869627113342287,
+ "test_acc": 0.4348,
+ "lyapunov": null,
+ "grad_norm": 1.4268137700999757,
+ "grad_max_sv": 0.6230859503149986,
+ "grad_min_sv": 2.6403634246358056e-08,
+ "grad_condition": 81962325.61583482,
+ "lr": 0.000981581283398829,
+ "time_sec": 32.71280646324158
+ },
+ {
+ "epoch": 14,
+ "train_loss": 1.7594015161895753,
+ "train_acc": 0.51666,
+ "test_loss": 2.225412437438965,
+ "test_acc": 0.4269,
+ "lyapunov": null,
+ "grad_norm": 1.3750641538015655,
+ "grad_max_sv": 0.5909776814281941,
+ "grad_min_sv": 2.5812447444067965e-08,
+ "grad_condition": 110809015.48631673,
+ "lr": 0.0009786597487660333,
+ "time_sec": 32.71353602409363
+ },
+ {
+ "epoch": 15,
+ "train_loss": 1.7050045301437378,
+ "train_acc": 0.5265,
+ "test_loss": 2.2115724647521975,
+ "test_acc": 0.4374,
+ "lyapunov": null,
+ "grad_norm": 1.3299355868966125,
+ "grad_max_sv": 0.5802051067352295,
+ "grad_min_sv": 2.5246993384797634e-08,
+ "grad_condition": 26653204.194885753,
+ "lr": 0.0009755282581475766,
+ "time_sec": 32.709041357040405
+ },
+ {
+ "epoch": 16,
+ "train_loss": 1.6458034181976318,
+ "train_acc": 0.54052,
+ "test_loss": 2.3288159313201904,
+ "test_acc": 0.4224,
+ "lyapunov": null,
+ "grad_norm": 1.2807898189857698,
+ "grad_max_sv": 0.5446614563465119,
+ "grad_min_sv": 2.4021811557278783e-08,
+ "grad_condition": 91338509.7437632,
+ "lr": 0.0009721881851187403,
+ "time_sec": 32.697059869766235
+ },
+ {
+ "epoch": 17,
+ "train_loss": 1.5929106069946288,
+ "train_acc": 0.55406,
+ "test_loss": 2.1113224380493163,
+ "test_acc": 0.4616,
+ "lyapunov": null,
+ "grad_norm": 1.2337526465020512,
+ "grad_max_sv": 0.5095916628837586,
+ "grad_min_sv": 2.2903062109336237e-08,
+ "grad_condition": 57294649.60211961,
+ "lr": 0.0009686409947459456,
+ "time_sec": 32.683470726013184
+ },
+ {
+ "epoch": 18,
+ "train_loss": 1.5314323492813111,
+ "train_acc": 0.5677,
+ "test_loss": 2.091776432800293,
+ "test_acc": 0.47,
+ "lyapunov": null,
+ "grad_norm": 1.1978845665370097,
+ "grad_max_sv": 0.5015841260552406,
+ "grad_min_sv": 2.2305156793800408e-08,
+ "grad_condition": 29492886.216326892,
+ "lr": 0.0009648882429441254,
+ "time_sec": 32.737040281295776
+ },
+ {
+ "epoch": 19,
+ "train_loss": 1.5103012445449828,
+ "train_acc": 0.57236,
+ "test_loss": 2.0679006351470948,
+ "test_acc": 0.4779,
+ "lyapunov": null,
+ "grad_norm": 1.1728126223162796,
+ "grad_max_sv": 0.4839314170181751,
+ "grad_min_sv": 2.174818596739625e-08,
+ "grad_condition": 107997783.86314659,
+ "lr": 0.00096093157579425,
+ "time_sec": 32.67225241661072
+ },
+ {
+ "epoch": 20,
+ "train_loss": 1.4595962884140015,
+ "train_acc": 0.58662,
+ "test_loss": 2.1169062660217284,
+ "test_acc": 0.4706,
+ "lyapunov": null,
+ "grad_norm": 1.1438665670784203,
+ "grad_max_sv": 0.469496750831604,
+ "grad_min_sv": 2.1164104392623617e-08,
+ "grad_condition": 64696771.4776402,
+ "lr": 0.0009567727288213001,
+ "time_sec": 32.6800582408905
+ },
+ {
+ "epoch": 21,
+ "train_loss": 1.42210446144104,
+ "train_acc": 0.59338,
+ "test_loss": 2.0751025535583496,
+ "test_acc": 0.4744,
+ "lyapunov": null,
+ "grad_norm": 1.1159812479247186,
+ "grad_max_sv": 0.45728652998805047,
+ "grad_min_sv": 2.1470654895661135e-08,
+ "grad_condition": 28760658.649009824,
+ "lr": 0.0009524135262330095,
+ "time_sec": 32.680222272872925
+ },
+ {
+ "epoch": 22,
+ "train_loss": 1.3733370163345338,
+ "train_acc": 0.60568,
+ "test_loss": 2.1397033340454104,
+ "test_acc": 0.4725,
+ "lyapunov": null,
+ "grad_norm": 1.0820101912101088,
+ "grad_max_sv": 0.4380739636719227,
+ "grad_min_sv": 2.027442237706456e-08,
+ "grad_condition": 33804989.22411772,
+ "lr": 0.0009478558801197061,
+ "time_sec": 32.683854818344116
+ },
+ {
+ "epoch": 23,
+ "train_loss": 1.3259621669006347,
+ "train_acc": 0.61976,
+ "test_loss": 2.082161441612244,
+ "test_acc": 0.4868,
+ "lyapunov": null,
+ "grad_norm": 1.0590598804772053,
+ "grad_max_sv": 0.4320934973657131,
+ "grad_min_sv": 1.9754895681789452e-08,
+ "grad_condition": 49199633.36386584,
+ "lr": 0.000943101789615607,
+ "time_sec": 32.705042362213135
+ },
+ {
+ "epoch": 24,
+ "train_loss": 1.3155639976882934,
+ "train_acc": 0.62032,
+ "test_loss": 2.108880234527588,
+ "test_acc": 0.4823,
+ "lyapunov": null,
+ "grad_norm": 1.046890854380851,
+ "grad_max_sv": 0.42886915877461435,
+ "grad_min_sv": 1.9609551714372398e-08,
+ "grad_condition": 41053712.713573575,
+ "lr": 0.0009381533400219313,
+ "time_sec": 32.71632719039917
+ },
+ {
+ "epoch": 25,
+ "train_loss": 1.273603660621643,
+ "train_acc": 0.63364,
+ "test_loss": 2.0933273361206055,
+ "test_acc": 0.4852,
+ "lyapunov": null,
+ "grad_norm": 1.024436079028184,
+ "grad_max_sv": 0.41587754189968107,
+ "grad_min_sv": 1.9385000169652723e-08,
+ "grad_condition": 51992204.20794226,
+ "lr": 0.0009330127018922189,
+ "time_sec": 32.702069997787476
+ },
+ {
+ "epoch": 26,
+ "train_loss": 1.2419982319259644,
+ "train_acc": 0.6399,
+ "test_loss": 2.1144972944259646,
+ "test_acc": 0.4865,
+ "lyapunov": null,
+ "grad_norm": 1.0088705466095338,
+ "grad_max_sv": 0.39710880219936373,
+ "grad_min_sv": 1.870035526846392e-08,
+ "grad_condition": 181692609.81395656,
+ "lr": 0.000927682130080253,
+ "time_sec": 32.707526445388794
+ },
+ {
+ "epoch": 27,
+ "train_loss": 1.2189629228973389,
+ "train_acc": 0.6436,
+ "test_loss": 2.204226477432251,
+ "test_acc": 0.476,
+ "lyapunov": null,
+ "grad_norm": 0.9979053902708439,
+ "grad_max_sv": 0.3974333480000496,
+ "grad_min_sv": 1.8178674205185376e-08,
+ "grad_condition": 88033285.18865582,
+ "lr": 0.0009221639627510072,
+ "time_sec": 32.74215221405029
+ },
+ {
+ "epoch": 28,
+ "train_loss": 1.196308147392273,
+ "train_acc": 0.65004,
+ "test_loss": 2.3723191680908204,
+ "test_acc": 0.4591,
+ "lyapunov": null,
+ "grad_norm": 0.975077074369322,
+ "grad_max_sv": 0.40025187358260156,
+ "grad_min_sv": 1.829182182389033e-08,
+ "grad_condition": 38849966.98297453,
+ "lr": 0.0009164606203550494,
+ "time_sec": 32.70245599746704
+ },
+ {
+ "epoch": 29,
+ "train_loss": 1.1692425540161133,
+ "train_acc": 0.65714,
+ "test_loss": 2.2748174949645996,
+ "test_acc": 0.4746,
+ "lyapunov": null,
+ "grad_norm": 0.9656994259472406,
+ "grad_max_sv": 0.3973592549562454,
+ "grad_min_sv": 1.812226688574503e-08,
+ "grad_condition": 39408166.232041776,
+ "lr": 0.0009105746045668516,
+ "time_sec": 32.71292495727539
+ },
+ {
+ "epoch": 30,
+ "train_loss": 1.1311084144973755,
+ "train_acc": 0.66644,
+ "test_loss": 2.1602066425323487,
+ "test_acc": 0.4933,
+ "lyapunov": null,
+ "grad_norm": 0.9503788281741601,
+ "grad_max_sv": 0.3813568793237209,
+ "grad_min_sv": 1.7537509381174154e-08,
+ "grad_condition": 91136622.64604397,
+ "lr": 0.0009045084971874733,
+ "time_sec": 32.729275941848755
+ },
+ {
+ "epoch": 31,
+ "train_loss": 1.107859415283203,
+ "train_acc": 0.67202,
+ "test_loss": 2.088518197631836,
+ "test_acc": 0.5149,
+ "lyapunov": null,
+ "grad_norm": 0.946846205217341,
+ "grad_max_sv": 0.38662919625639913,
+ "grad_min_sv": 1.787647136014536e-08,
+ "grad_condition": 37247674.11503151,
+ "lr": 0.0008982649590120977,
+ "time_sec": 32.724801540374756
+ },
+ {
+ "epoch": 32,
+ "train_loss": 1.075172028541565,
+ "train_acc": 0.68254,
+ "test_loss": 2.11543652381897,
+ "test_acc": 0.5052,
+ "lyapunov": null,
+ "grad_norm": 0.919583751793241,
+ "grad_max_sv": 0.37590193301439284,
+ "grad_min_sv": 1.7335351598646298e-08,
+ "grad_condition": 32173699.63890195,
+ "lr": 0.0008918467286629196,
+ "time_sec": 32.70777225494385
+ },
+ {
+ "epoch": 33,
+ "train_loss": 1.0526020958709716,
+ "train_acc": 0.68626,
+ "test_loss": 2.283646846008301,
+ "test_acc": 0.4816,
+ "lyapunov": null,
+ "grad_norm": 0.9156820464594853,
+ "grad_max_sv": 0.37288443073630334,
+ "grad_min_sv": 1.682198175895211e-08,
+ "grad_condition": 41766926.72855186,
+ "lr": 0.0008852566213878943,
+ "time_sec": 32.71830630302429
+ },
+ {
+ "epoch": 34,
+ "train_loss": 1.0363747980117797,
+ "train_acc": 0.69038,
+ "test_loss": 2.207733528137207,
+ "test_acc": 0.4943,
+ "lyapunov": null,
+ "grad_norm": 0.9077261463073804,
+ "grad_max_sv": 0.3598011791706085,
+ "grad_min_sv": 1.6353098675377097e-08,
+ "grad_condition": 114742140.57000451,
+ "lr": 0.000878497527825878,
+ "time_sec": 32.70716309547424
+ },
+ {
+ "epoch": 35,
+ "train_loss": 1.0068622560119629,
+ "train_acc": 0.69648,
+ "test_loss": 2.274261113357544,
+ "test_acc": 0.489,
+ "lyapunov": null,
+ "grad_norm": 0.8883949473822523,
+ "grad_max_sv": 0.3505275271832943,
+ "grad_min_sv": 1.6455692852801463e-08,
+ "grad_condition": 31982637.47738139,
+ "lr": 0.000871572412738697,
+ "time_sec": 32.704782009124756
+ },
+ {
+ "epoch": 36,
+ "train_loss": 0.9864518771362305,
+ "train_acc": 0.7021,
+ "test_loss": 2.3541188930511474,
+ "test_acc": 0.4898,
+ "lyapunov": null,
+ "grad_norm": 0.8736045940658475,
+ "grad_max_sv": 0.3457980893552303,
+ "grad_min_sv": 1.5842762313145187e-08,
+ "grad_condition": 32188123.411770713,
+ "lr": 0.0008644843137107055,
+ "time_sec": 32.691269397735596
+ },
+ {
+ "epoch": 37,
+ "train_loss": 0.9681263439178467,
+ "train_acc": 0.7075,
+ "test_loss": 2.195126131439209,
+ "test_acc": 0.5033,
+ "lyapunov": null,
+ "grad_norm": 0.8711424558239054,
+ "grad_max_sv": 0.34736732244491575,
+ "grad_min_sv": 1.5827014727270993e-08,
+ "grad_condition": 66500862.978035614,
+ "lr": 0.0008572363398164014,
+ "time_sec": 32.69683265686035
+ },
+ {
+ "epoch": 38,
+ "train_loss": 0.9408467683601379,
+ "train_acc": 0.71608,
+ "test_loss": 2.1800164726257325,
+ "test_acc": 0.5109,
+ "lyapunov": null,
+ "grad_norm": 0.8497079289449048,
+ "grad_max_sv": 0.33491997644305227,
+ "grad_min_sv": 1.5505913916746828e-08,
+ "grad_condition": 37981645.21243934,
+ "lr": 0.0008498316702566826,
+ "time_sec": 32.67169213294983
+ },
+ {
+ "epoch": 39,
+ "train_loss": 0.9174955882263184,
+ "train_acc": 0.7231,
+ "test_loss": 2.332292454910278,
+ "test_acc": 0.4984,
+ "lyapunov": null,
+ "grad_norm": 0.8483669541798352,
+ "grad_max_sv": 0.3449387975037098,
+ "grad_min_sv": 1.5716625918760217e-08,
+ "grad_condition": 38753621.785681486,
+ "lr": 0.0008422735529643442,
+ "time_sec": 32.668078660964966
+ },
+ {
+ "epoch": 40,
+ "train_loss": 0.8970937779045105,
+ "train_acc": 0.72826,
+ "test_loss": 2.282168871688843,
+ "test_acc": 0.5053,
+ "lyapunov": null,
+ "grad_norm": 0.8354606142013189,
+ "grad_max_sv": 0.3270870424807072,
+ "grad_min_sv": 1.5267581635058926e-08,
+ "grad_condition": 95751205.07057047,
+ "lr": 0.0008345653031794289,
+ "time_sec": 32.70110583305359
+ },
+ {
+ "epoch": 41,
+ "train_loss": 0.8763418362236023,
+ "train_acc": 0.73382,
+ "test_loss": 2.3397656742095947,
+ "test_acc": 0.504,
+ "lyapunov": null,
+ "grad_norm": 0.8300379125306362,
+ "grad_max_sv": 0.33984693363308904,
+ "grad_min_sv": 1.5102269786126942e-08,
+ "grad_condition": 36575363.166415855,
+ "lr": 0.0008267103019950526,
+ "time_sec": 32.68285536766052
+ },
+ {
+ "epoch": 42,
+ "train_loss": 0.8614973092651367,
+ "train_acc": 0.73702,
+ "test_loss": 2.217091986083984,
+ "test_acc": 0.513,
+ "lyapunov": null,
+ "grad_norm": 0.8218045461669631,
+ "grad_max_sv": 0.32567850723862646,
+ "grad_min_sv": 1.507071445694397e-08,
+ "grad_condition": 48789917.15280264,
+ "lr": 0.0008187119948743447,
+ "time_sec": 32.685330867767334
+ },
+ {
+ "epoch": 43,
+ "train_loss": 0.8463610815429687,
+ "train_acc": 0.74162,
+ "test_loss": 2.238330067062378,
+ "test_acc": 0.5145,
+ "lyapunov": null,
+ "grad_norm": 0.8111621240187793,
+ "grad_max_sv": 0.3245612893253565,
+ "grad_min_sv": 1.4757356182567606e-08,
+ "grad_condition": 2265212011.074665,
+ "lr": 0.000810573890139155,
+ "time_sec": 32.6937038898468
+ },
+ {
+ "epoch": 44,
+ "train_loss": 0.8388264699935913,
+ "train_acc": 0.7425,
+ "test_loss": 2.2916201137542727,
+ "test_acc": 0.5146,
+ "lyapunov": null,
+ "grad_norm": 0.806013800687461,
+ "grad_max_sv": 0.3360877387225628,
+ "grad_min_sv": 1.4701122835053537e-08,
+ "grad_condition": 56062708.17707713,
+ "lr": 0.0008022995574311873,
+ "time_sec": 32.70379972457886
+ },
+ {
+ "epoch": 45,
+ "train_loss": 0.8080853428649902,
+ "train_acc": 0.75246,
+ "test_loss": 2.31492944984436,
+ "test_acc": 0.519,
+ "lyapunov": null,
+ "grad_norm": 0.7954463291291034,
+ "grad_max_sv": 0.3197424054145813,
+ "grad_min_sv": 1.4746050645180267e-08,
+ "grad_condition": 648957804.3057442,
+ "lr": 0.0007938926261462363,
+ "time_sec": 32.704816579818726
+ },
+ {
+ "epoch": 46,
+ "train_loss": 0.8025041796875,
+ "train_acc": 0.753,
+ "test_loss": 2.3807359542846678,
+ "test_acc": 0.5181,
+ "lyapunov": null,
+ "grad_norm": 0.7945005415191121,
+ "grad_max_sv": 0.31871558651328086,
+ "grad_min_sv": 1.4457539215806392e-08,
+ "grad_condition": 62012558.50813458,
+ "lr": 0.0007853567838422158,
+ "time_sec": 32.7154860496521
+ },
+ {
+ "epoch": 47,
+ "train_loss": 0.7847597545051574,
+ "train_acc": 0.75886,
+ "test_loss": 2.305859538269043,
+ "test_acc": 0.5185,
+ "lyapunov": null,
+ "grad_norm": 0.7791668550262338,
+ "grad_max_sv": 0.3171059262007475,
+ "grad_min_sv": 1.4160447076028148e-08,
+ "grad_condition": 51678874.24460314,
+ "lr": 0.0007766957746216719,
+ "time_sec": 32.71022868156433
+ },
+ {
+ "epoch": 48,
+ "train_loss": 0.7660661986160279,
+ "train_acc": 0.7635,
+ "test_loss": 2.373494161605835,
+ "test_acc": 0.5197,
+ "lyapunov": null,
+ "grad_norm": 0.7662493930118918,
+ "grad_max_sv": 0.3144552931189537,
+ "grad_min_sv": 1.4124776402668626e-08,
+ "grad_condition": 42937106.53672977,
+ "lr": 0.0007679133974894982,
+ "time_sec": 32.722716093063354
+ },
+ {
+ "epoch": 49,
+ "train_loss": 0.7557950233268738,
+ "train_acc": 0.76584,
+ "test_loss": 2.2862959323883056,
+ "test_acc": 0.5222,
+ "lyapunov": null,
+ "grad_norm": 0.7719008014476091,
+ "grad_max_sv": 0.3158703289926052,
+ "grad_min_sv": 1.4232268583103113e-08,
+ "grad_condition": 39203631.14441905,
+ "lr": 0.000759013504686565,
+ "time_sec": 32.71821331977844
+ },
+ {
+ "epoch": 50,
+ "train_loss": 0.7287120180892944,
+ "train_acc": 0.77398,
+ "test_loss": 2.2880530021667482,
+ "test_acc": 0.5331,
+ "lyapunov": null,
+ "grad_norm": 0.7580370777565381,
+ "grad_max_sv": 0.31812012754380703,
+ "grad_min_sv": 1.3956443738194491e-08,
+ "grad_condition": 56488826.56667278,
+ "lr": 0.0007499999999999998,
+ "time_sec": 32.74500012397766
+ },
+ {
+ "epoch": 51,
+ "train_loss": 0.7047131567382813,
+ "train_acc": 0.77944,
+ "test_loss": 2.3342226333618163,
+ "test_acc": 0.5242,
+ "lyapunov": null,
+ "grad_norm": 0.7467723064599141,
+ "grad_max_sv": 0.3062335759401321,
+ "grad_min_sv": 1.365980890968843e-08,
+ "grad_condition": 48288096.27243978,
+ "lr": 0.0007408768370508575,
+ "time_sec": 32.73174715042114
+ },
+ {
+ "epoch": 52,
+ "train_loss": 0.701608234500885,
+ "train_acc": 0.78146,
+ "test_loss": 2.4530138679504394,
+ "test_acc": 0.5151,
+ "lyapunov": null,
+ "grad_norm": 0.744474034267783,
+ "grad_max_sv": 0.31273389905691146,
+ "grad_min_sv": 1.386061017072393e-08,
+ "grad_condition": 128824936.60768087,
+ "lr": 0.0007316480175599307,
+ "time_sec": 32.70361828804016
+ },
+ {
+ "epoch": 53,
+ "train_loss": 0.6784094618415832,
+ "train_acc": 0.7874,
+ "test_loss": 2.3597243209838865,
+ "test_acc": 0.5275,
+ "lyapunov": null,
+ "grad_norm": 0.7374795544632287,
+ "grad_max_sv": 0.30512114986777306,
+ "grad_min_sv": 1.3410438691116578e-08,
+ "grad_condition": 185757572.3538422,
+ "lr": 0.0007223175895924635,
+ "time_sec": 32.71756291389465
+ },
+ {
+ "epoch": 54,
+ "train_loss": 0.6558182954406738,
+ "train_acc": 0.795,
+ "test_loss": 2.376951601028442,
+ "test_acc": 0.5316,
+ "lyapunov": null,
+ "grad_norm": 0.7251324903072741,
+ "grad_max_sv": 0.2987603921443224,
+ "grad_min_sv": 1.2931078906264214e-08,
+ "grad_condition": 35614928.216609366,
+ "lr": 0.0007128896457825361,
+ "time_sec": 32.73335146903992
+ },
+ {
+ "epoch": 55,
+ "train_loss": 0.6438722687911987,
+ "train_acc": 0.79842,
+ "test_loss": 2.4439307792663576,
+ "test_acc": 0.5237,
+ "lyapunov": null,
+ "grad_norm": 0.7208427013257759,
+ "grad_max_sv": 0.2992406666278839,
+ "grad_min_sv": 1.321393890141298e-08,
+ "grad_condition": 86775812.1538335,
+ "lr": 0.0007033683215378998,
+ "time_sec": 32.714346408843994
+ },
+ {
+ "epoch": 56,
+ "train_loss": 0.6417430144309998,
+ "train_acc": 0.7972,
+ "test_loss": 2.3790397010803224,
+ "test_acc": 0.5275,
+ "lyapunov": null,
+ "grad_norm": 0.7192864641522134,
+ "grad_max_sv": 0.2877038486301899,
+ "grad_min_sv": 1.3027487994767515e-08,
+ "grad_condition": 758527469.2650627,
+ "lr": 0.0006937577932260512,
+ "time_sec": 32.70229887962341
+ },
+ {
+ "epoch": 57,
+ "train_loss": 0.6262681634902955,
+ "train_acc": 0.803,
+ "test_loss": 2.401387868881226,
+ "test_acc": 0.5319,
+ "lyapunov": null,
+ "grad_norm": 0.7121380891152584,
+ "grad_max_sv": 0.2965920139104128,
+ "grad_min_sv": 1.279559212457454e-08,
+ "grad_condition": 184239403.66627008,
+ "lr": 0.0006840622763423388,
+ "time_sec": 32.71753239631653
+ },
+ {
+ "epoch": 58,
+ "train_loss": 0.6120203521347046,
+ "train_acc": 0.80732,
+ "test_loss": 2.503086555862427,
+ "test_acc": 0.5165,
+ "lyapunov": null,
+ "grad_norm": 0.7090038692309348,
+ "grad_max_sv": 0.2882195271551609,
+ "grad_min_sv": 1.2676824923812945e-08,
+ "grad_condition": 64942214.60915594,
+ "lr": 0.0006742860236609073,
+ "time_sec": 32.75395059585571
+ },
+ {
+ "epoch": 59,
+ "train_loss": 0.5998075243473053,
+ "train_acc": 0.81224,
+ "test_loss": 2.4825798515319826,
+ "test_acc": 0.5223,
+ "lyapunov": null,
+ "grad_norm": 0.7030307704517706,
+ "grad_max_sv": 0.28765259496867657,
+ "grad_min_sv": 1.2779274688370229e-08,
+ "grad_condition": 182642047.07290906,
+ "lr": 0.0006644333233692913,
+ "time_sec": 32.70982766151428
+ },
+ {
+ "epoch": 60,
+ "train_loss": 0.5948525179862976,
+ "train_acc": 0.81162,
+ "test_loss": 2.5030276454925535,
+ "test_acc": 0.5207,
+ "lyapunov": null,
+ "grad_norm": 0.7026252294626018,
+ "grad_max_sv": 0.2934992775321007,
+ "grad_min_sv": 1.284481914573185e-08,
+ "grad_condition": 541914476.4363593,
+ "lr": 0.0006545084971874734,
+ "time_sec": 32.69038796424866
+ },
+ {
+ "epoch": 61,
+ "train_loss": 0.572040382938385,
+ "train_acc": 0.81932,
+ "test_loss": 2.5733165519714354,
+ "test_acc": 0.5197,
+ "lyapunov": null,
+ "grad_norm": 0.6845429439823613,
+ "grad_max_sv": 0.28906508460640906,
+ "grad_min_sv": 1.2416446168797556e-08,
+ "grad_condition": 83143739.39889392,
+ "lr": 0.0006445158984722354,
+ "time_sec": 32.70990490913391
+ },
+ {
+ "epoch": 62,
+ "train_loss": 0.5523873634338379,
+ "train_acc": 0.82446,
+ "test_loss": 2.563892342758179,
+ "test_acc": 0.5248,
+ "lyapunov": null,
+ "grad_norm": 0.677689496712232,
+ "grad_max_sv": 0.2810227505862713,
+ "grad_min_sv": 1.2061726063945787e-08,
+ "grad_condition": 161335990.45839816,
+ "lr": 0.0006344599103076324,
+ "time_sec": 32.714717864990234
+ },
+ {
+ "epoch": 63,
+ "train_loss": 0.537570647277832,
+ "train_acc": 0.82928,
+ "test_loss": 2.5110877151489257,
+ "test_acc": 0.5309,
+ "lyapunov": null,
+ "grad_norm": 0.6752075838217867,
+ "grad_max_sv": 0.2918707847595215,
+ "grad_min_sv": 1.2428116336060669e-08,
+ "grad_condition": 62614290.824099444,
+ "lr": 0.0006243449435824269,
+ "time_sec": 32.73838663101196
+ },
+ {
+ "epoch": 64,
+ "train_loss": 0.525590337715149,
+ "train_acc": 0.83162,
+ "test_loss": 2.5260006717681884,
+ "test_acc": 0.5365,
+ "lyapunov": null,
+ "grad_norm": 0.6614195891575191,
+ "grad_max_sv": 0.2785448797047138,
+ "grad_min_sv": 1.2074160667119305e-08,
+ "grad_condition": 68726347.69115171,
+ "lr": 0.0006141754350553275,
+ "time_sec": 32.716681241989136
+ },
+ {
+ "epoch": 65,
+ "train_loss": 0.506968226633072,
+ "train_acc": 0.83974,
+ "test_loss": 2.4551146259307863,
+ "test_acc": 0.5332,
+ "lyapunov": null,
+ "grad_norm": 0.6515058246983421,
+ "grad_max_sv": 0.28096592277288435,
+ "grad_min_sv": 1.183612223995545e-08,
+ "grad_condition": 56796145.61117469,
+ "lr": 0.0006039558454088793,
+ "time_sec": 32.72992730140686
+ },
+ {
+ "epoch": 66,
+ "train_loss": 0.5121252582931518,
+ "train_acc": 0.8359,
+ "test_loss": 2.4647022022247316,
+ "test_acc": 0.5374,
+ "lyapunov": null,
+ "grad_norm": 0.6569185851243321,
+ "grad_max_sv": 0.2686118472367525,
+ "grad_min_sv": 1.1671607616763752e-08,
+ "grad_condition": 198976036.41965005,
+ "lr": 0.000593690657292862,
+ "time_sec": 32.737778425216675
+ },
+ {
+ "epoch": 67,
+ "train_loss": 0.5035950432968139,
+ "train_acc": 0.83814,
+ "test_loss": 2.5104728435516357,
+ "test_acc": 0.5334,
+ "lyapunov": null,
+ "grad_norm": 0.6543970572426195,
+ "grad_max_sv": 0.27697036042809486,
+ "grad_min_sv": 1.1793683101109492e-08,
+ "grad_condition": 2176927259.024586,
+ "lr": 0.0005833843733580507,
+ "time_sec": 32.73714327812195
+ },
+ {
+ "epoch": 68,
+ "train_loss": 0.4827924027252197,
+ "train_acc": 0.8449,
+ "test_loss": 2.483680333328247,
+ "test_acc": 0.5362,
+ "lyapunov": null,
+ "grad_norm": 0.6424274790982618,
+ "grad_max_sv": 0.26836494021117685,
+ "grad_min_sv": 1.1452091713826107e-08,
+ "grad_condition": 64248156.31133513,
+ "lr": 0.0005730415142812054,
+ "time_sec": 32.73483109474182
+ },
+ {
+ "epoch": 69,
+ "train_loss": 0.463097783498764,
+ "train_acc": 0.85106,
+ "test_loss": 2.5873930728912353,
+ "test_acc": 0.5352,
+ "lyapunov": null,
+ "grad_norm": 0.6283493250843613,
+ "grad_max_sv": 0.26704199202358725,
+ "grad_min_sv": 1.1449700967197662e-08,
+ "grad_condition": 133571192.62172851,
+ "lr": 0.0005626666167821517,
+ "time_sec": 32.76736545562744
+ },
+ {
+ "epoch": 70,
+ "train_loss": 0.45964255402565,
+ "train_acc": 0.8516,
+ "test_loss": 2.4906038509368895,
+ "test_acc": 0.5466,
+ "lyapunov": null,
+ "grad_norm": 0.6392818623657084,
+ "grad_max_sv": 0.2811981987208128,
+ "grad_min_sv": 1.1691557246645834e-08,
+ "grad_condition": 83552341.63512965,
+ "lr": 0.0005522642316338265,
+ "time_sec": 32.76137971878052
+ },
+ {
+ "epoch": 71,
+ "train_loss": 0.44885221929550173,
+ "train_acc": 0.85536,
+ "test_loss": 2.5581497470855714,
+ "test_acc": 0.5417,
+ "lyapunov": null,
+ "grad_norm": 0.627505222045094,
+ "grad_max_sv": 0.2669704511761665,
+ "grad_min_sv": 1.135505285909666e-08,
+ "grad_condition": 55019996.6299631,
+ "lr": 0.0005418389216661573,
+ "time_sec": 32.754613161087036
+ },
+ {
+ "epoch": 72,
+ "train_loss": 0.4373334138870239,
+ "train_acc": 0.85988,
+ "test_loss": 2.5293708190917967,
+ "test_acc": 0.5385,
+ "lyapunov": null,
+ "grad_norm": 0.6228439231508988,
+ "grad_max_sv": 0.27325935252010825,
+ "grad_min_sv": 1.1285354627535438e-08,
+ "grad_condition": 404302529.70424557,
+ "lr": 0.0005313952597646563,
+ "time_sec": 32.747488260269165
+ },
+ {
+ "epoch": 73,
+ "train_loss": 0.43413398032188416,
+ "train_acc": 0.86118,
+ "test_loss": 2.59562434463501,
+ "test_acc": 0.5355,
+ "lyapunov": null,
+ "grad_norm": 0.6246623504935193,
+ "grad_max_sv": 0.26360294707119464,
+ "grad_min_sv": 1.0827903220485963e-08,
+ "grad_condition": 202498413.83885324,
+ "lr": 0.0005209378268645994,
+ "time_sec": 32.75055932998657
+ },
+ {
+ "epoch": 74,
+ "train_loss": 0.42070443333625795,
+ "train_acc": 0.86404,
+ "test_loss": 2.620591529083252,
+ "test_acc": 0.5311,
+ "lyapunov": null,
+ "grad_norm": 0.6160094351570171,
+ "grad_max_sv": 0.2604650367051363,
+ "grad_min_sv": 1.0893297332399688e-08,
+ "grad_condition": 109053309.86634846,
+ "lr": 0.0005104712099416781,
+ "time_sec": 32.766777753829956
+ },
+ {
+ "epoch": 75,
+ "train_loss": 0.41482046060562133,
+ "train_acc": 0.86586,
+ "test_loss": 2.6253975078582763,
+ "test_acc": 0.5364,
+ "lyapunov": null,
+ "grad_norm": 0.614383474689519,
+ "grad_max_sv": 0.2657254245132208,
+ "grad_min_sv": 1.1066643729282667e-08,
+ "grad_condition": 1358046707.310991,
+ "lr": 0.0004999999999999996,
+ "time_sec": 32.753093004226685
+ },
+ {
+ "epoch": 76,
+ "train_loss": 0.40771523109436036,
+ "train_acc": 0.8674,
+ "test_loss": 2.7234753631591797,
+ "test_acc": 0.5307,
+ "lyapunov": null,
+ "grad_norm": 0.6089832611690313,
+ "grad_max_sv": 0.2631608698517084,
+ "grad_min_sv": 1.1065733136576827e-08,
+ "grad_condition": 124518956.20538023,
+ "lr": 0.0004895287900583212,
+ "time_sec": 32.7672004699707
+ },
+ {
+ "epoch": 77,
+ "train_loss": 0.3850809427070618,
+ "train_acc": 0.87682,
+ "test_loss": 2.6585358211517334,
+ "test_acc": 0.5378,
+ "lyapunov": null,
+ "grad_norm": 0.5905288728439135,
+ "grad_max_sv": 0.2512054055929184,
+ "grad_min_sv": 1.0597189950382891e-08,
+ "grad_condition": 141685910.93483096,
+ "lr": 0.0004790621731353997,
+ "time_sec": 32.75537824630737
+ },
+ {
+ "epoch": 78,
+ "train_loss": 0.3790111728191376,
+ "train_acc": 0.87892,
+ "test_loss": 2.6925399055480956,
+ "test_acc": 0.5368,
+ "lyapunov": null,
+ "grad_norm": 0.5936477423986493,
+ "grad_max_sv": 0.2708817757666111,
+ "grad_min_sv": 1.0561610550192946e-08,
+ "grad_condition": 244253851.38396016,
+ "lr": 0.000468604740235343,
+ "time_sec": 32.734121561050415
+ },
+ {
+ "epoch": 79,
+ "train_loss": 0.376044921131134,
+ "train_acc": 0.87726,
+ "test_loss": 2.6398166637420655,
+ "test_acc": 0.5322,
+ "lyapunov": null,
+ "grad_norm": 0.5949427297273714,
+ "grad_max_sv": 0.2605267588049173,
+ "grad_min_sv": 1.0820864476679404e-08,
+ "grad_condition": 62663126.18808526,
+ "lr": 0.00045816107833384175,
+ "time_sec": 32.72508406639099
+ },
+ {
+ "epoch": 80,
+ "train_loss": 0.3590127901649475,
+ "train_acc": 0.88356,
+ "test_loss": 2.6562103397369383,
+ "test_acc": 0.5313,
+ "lyapunov": null,
+ "grad_norm": 0.57614839106705,
+ "grad_max_sv": 0.2479171995073557,
+ "grad_min_sv": 1.0216514026700069e-08,
+ "grad_condition": 168918888.0387075,
+ "lr": 0.0004477357683661729,
+ "time_sec": 32.7580771446228
+ },
+ {
+ "epoch": 81,
+ "train_loss": 0.35495832427978513,
+ "train_acc": 0.88512,
+ "test_loss": 2.6037187816619873,
+ "test_acc": 0.5424,
+ "lyapunov": null,
+ "grad_norm": 0.5731602731960765,
+ "grad_max_sv": 0.2532364260405302,
+ "grad_min_sv": 1.0580176048897299e-08,
+ "grad_condition": 286643189.9936029,
+ "lr": 0.00043733338321784746,
+ "time_sec": 32.72826409339905
+ },
+ {
+ "epoch": 82,
+ "train_loss": 0.3466758195114136,
+ "train_acc": 0.88818,
+ "test_loss": 2.6409978286743163,
+ "test_acc": 0.5399,
+ "lyapunov": null,
+ "grad_norm": 0.5643305573749353,
+ "grad_max_sv": 0.25191599801182746,
+ "grad_min_sv": 9.937639448582419e-09,
+ "grad_condition": 418028032.15621006,
+ "lr": 0.0004269584857187939,
+ "time_sec": 32.73789381980896
+ },
+ {
+ "epoch": 83,
+ "train_loss": 0.337517634677887,
+ "train_acc": 0.89068,
+ "test_loss": 2.6804797424316407,
+ "test_acc": 0.5387,
+ "lyapunov": null,
+ "grad_norm": 0.5635653171134332,
+ "grad_max_sv": 0.24921411760151385,
+ "grad_min_sv": 1.007469917777351e-08,
+ "grad_condition": 232954348.7021001,
+ "lr": 0.0004166156266419484,
+ "time_sec": 32.75311326980591
+ },
+ {
+ "epoch": 84,
+ "train_loss": 0.32895935908317564,
+ "train_acc": 0.89278,
+ "test_loss": 2.670875820159912,
+ "test_acc": 0.5417,
+ "lyapunov": null,
+ "grad_norm": 0.5604425901768842,
+ "grad_max_sv": 0.25350802317261695,
+ "grad_min_sv": 1.0073376105132481e-08,
+ "grad_condition": 810741849.6024733,
+ "lr": 0.0004063093427071373,
+ "time_sec": 32.75568342208862
+ },
+ {
+ "epoch": 85,
+ "train_loss": 0.31874533922195436,
+ "train_acc": 0.89668,
+ "test_loss": 2.726188472366333,
+ "test_acc": 0.5437,
+ "lyapunov": null,
+ "grad_norm": 0.5474219905771217,
+ "grad_max_sv": 0.24635729603469372,
+ "grad_min_sv": 9.822750767244857e-09,
+ "grad_condition": 407705693.9191896,
+ "lr": 0.0003960441545911199,
+ "time_sec": 32.74805927276611
+ },
+ {
+ "epoch": 86,
+ "train_loss": 0.3149368803215027,
+ "train_acc": 0.89756,
+ "test_loss": 2.7214178714752197,
+ "test_acc": 0.5419,
+ "lyapunov": null,
+ "grad_norm": 0.5494081042104078,
+ "grad_max_sv": 0.2415832221508026,
+ "grad_min_sv": 9.84441673934286e-09,
+ "grad_condition": 259925587.23227444,
+ "lr": 0.0003858245649446718,
+ "time_sec": 32.80679273605347
+ },
+ {
+ "epoch": 87,
+ "train_loss": 0.3021876361656189,
+ "train_acc": 0.9004,
+ "test_loss": 2.7706982093811034,
+ "test_acc": 0.5429,
+ "lyapunov": null,
+ "grad_norm": 0.5427208210607071,
+ "grad_max_sv": 0.24498338885605336,
+ "grad_min_sv": 9.92075648437174e-09,
+ "grad_condition": 232757368.44567218,
+ "lr": 0.00037565505641757235,
+ "time_sec": 32.76810097694397
+ },
+ {
+ "epoch": 88,
+ "train_loss": 0.297262005405426,
+ "train_acc": 0.90436,
+ "test_loss": 2.736396257019043,
+ "test_acc": 0.5423,
+ "lyapunov": null,
+ "grad_norm": 0.5343970285585263,
+ "grad_max_sv": 0.24844259656965734,
+ "grad_min_sv": 9.910514466504247e-09,
+ "grad_condition": 1110263065.3705904,
+ "lr": 0.00036554008969236695,
+ "time_sec": 32.74753546714783
+ },
+ {
+ "epoch": 89,
+ "train_loss": 0.28578209706306457,
+ "train_acc": 0.90734,
+ "test_loss": 2.850689685058594,
+ "test_acc": 0.5399,
+ "lyapunov": null,
+ "grad_norm": 0.5254402888094797,
+ "grad_max_sv": 0.23409140817821025,
+ "grad_min_sv": 9.523284056017854e-09,
+ "grad_condition": 1231623659.8277283,
+ "lr": 0.0003554841015277638,
+ "time_sec": 32.79159116744995
+ },
+ {
+ "epoch": 90,
+ "train_loss": 0.2832814686203003,
+ "train_acc": 0.90616,
+ "test_loss": 2.8175382946014405,
+ "test_acc": 0.537,
+ "lyapunov": null,
+ "grad_norm": 0.5216211125471195,
+ "grad_max_sv": 0.23542476668953896,
+ "grad_min_sv": 9.459231551322244e-09,
+ "grad_condition": 1301223464.6618998,
+ "lr": 0.000345491502812526,
+ "time_sec": 32.78084850311279
+ },
+ {
+ "epoch": 91,
+ "train_loss": 0.28347388619422914,
+ "train_acc": 0.90788,
+ "test_loss": 2.831140581512451,
+ "test_acc": 0.5444,
+ "lyapunov": null,
+ "grad_norm": 0.5319613521776031,
+ "grad_max_sv": 0.23012890443205833,
+ "grad_min_sv": 9.377407441096135e-09,
+ "grad_condition": 228524276.50434837,
+ "lr": 0.0003355666766307081,
+ "time_sec": 32.71651744842529
+ },
+ {
+ "epoch": 92,
+ "train_loss": 0.27393528344631196,
+ "train_acc": 0.91052,
+ "test_loss": 2.775809415435791,
+ "test_acc": 0.545,
+ "lyapunov": null,
+ "grad_norm": 0.5149918732183307,
+ "grad_max_sv": 0.23977560102939605,
+ "grad_min_sv": 9.41244274865055e-09,
+ "grad_condition": 202495109.8759535,
+ "lr": 0.00032571397633909225,
+ "time_sec": 32.70667123794556
+ },
+ {
+ "epoch": 93,
+ "train_loss": 0.2638559838104248,
+ "train_acc": 0.9163,
+ "test_loss": 2.7468856441497804,
+ "test_acc": 0.5537,
+ "lyapunov": null,
+ "grad_norm": 0.5066198396238114,
+ "grad_max_sv": 0.23251476027071477,
+ "grad_min_sv": 9.16693782366737e-09,
+ "grad_condition": 232699226.05631667,
+ "lr": 0.00031593772365766094,
+ "time_sec": 32.71683645248413
+ },
+ {
+ "epoch": 94,
+ "train_loss": 0.25781995408058167,
+ "train_acc": 0.9156,
+ "test_loss": 2.771767431640625,
+ "test_acc": 0.5456,
+ "lyapunov": null,
+ "grad_norm": 0.5052996090758677,
+ "grad_max_sv": 0.23510573096573353,
+ "grad_min_sv": 8.963649589916433e-09,
+ "grad_condition": 1701543645.1210911,
+ "lr": 0.0003062422067739483,
+ "time_sec": 32.713576555252075
+ },
+ {
+ "epoch": 95,
+ "train_loss": 0.25086621726989744,
+ "train_acc": 0.91784,
+ "test_loss": 2.8765688217163086,
+ "test_acc": 0.5451,
+ "lyapunov": null,
+ "grad_norm": 0.49975532415921886,
+ "grad_max_sv": 0.236967783421278,
+ "grad_min_sv": 9.25259010277346e-09,
+ "grad_condition": 145241238.20565036,
+ "lr": 0.00029663167846209965,
+ "time_sec": 32.73633694648743
+ },
+ {
+ "epoch": 96,
+ "train_loss": 0.24672197101354598,
+ "train_acc": 0.91946,
+ "test_loss": 2.8446786346435546,
+ "test_acc": 0.5438,
+ "lyapunov": null,
+ "grad_norm": 0.49641090183932196,
+ "grad_max_sv": 0.22625510580837727,
+ "grad_min_sv": 8.7457359089553e-09,
+ "grad_condition": 1836850483.766,
+ "lr": 0.00028711035421746345,
+ "time_sec": 32.76619052886963
+ },
+ {
+ "epoch": 97,
+ "train_loss": 0.23921704626083373,
+ "train_acc": 0.92148,
+ "test_loss": 2.797951399230957,
+ "test_acc": 0.5532,
+ "lyapunov": null,
+ "grad_norm": 0.49423071935175245,
+ "grad_max_sv": 0.24016087874770164,
+ "grad_min_sv": 8.990743178508703e-09,
+ "grad_condition": 210059856.3178285,
+ "lr": 0.00027768241040753615,
+ "time_sec": 32.82350516319275
+ },
+ {
+ "epoch": 98,
+ "train_loss": 0.23695792595386506,
+ "train_acc": 0.9223,
+ "test_loss": 2.8982477020263673,
+ "test_acc": 0.5432,
+ "lyapunov": null,
+ "grad_norm": 0.4903348629723419,
+ "grad_max_sv": 0.22139078341424465,
+ "grad_min_sv": 8.704557989333561e-09,
+ "grad_condition": 233405578.91055053,
+ "lr": 0.00026835198244006903,
+ "time_sec": 32.75874900817871
+ },
+ {
+ "epoch": 99,
+ "train_loss": 0.22282506870508195,
+ "train_acc": 0.92698,
+ "test_loss": 2.896362300491333,
+ "test_acc": 0.544,
+ "lyapunov": null,
+ "grad_norm": 0.4754599951900147,
+ "grad_max_sv": 0.22327796779572964,
+ "grad_min_sv": 8.601119547287876e-09,
+ "grad_condition": 868925326.22085,
+ "lr": 0.0002591231629491421,
+ "time_sec": 32.74084424972534
+ },
+ {
+ "epoch": 100,
+ "train_loss": 0.22439868947982788,
+ "train_acc": 0.92668,
+ "test_loss": 2.888060118484497,
+ "test_acc": 0.553,
+ "lyapunov": null,
+ "grad_norm": 0.4789261726309551,
+ "grad_max_sv": 0.22355457432568074,
+ "grad_min_sv": 8.837810024564172e-09,
+ "grad_condition": 804604193.8746045,
+ "lr": 0.0002499999999999997,
+ "time_sec": 32.76948523521423
+ },
+ {
+ "epoch": 101,
+ "train_loss": 0.21471880633354187,
+ "train_acc": 0.93042,
+ "test_loss": 2.926622017288208,
+ "test_acc": 0.5459,
+ "lyapunov": null,
+ "grad_norm": 0.46758839629635496,
+ "grad_max_sv": 0.2257686872035265,
+ "grad_min_sv": 8.604181156836657e-09,
+ "grad_condition": 364480196.7882508,
+ "lr": 0.00024098649531343477,
+ "time_sec": 32.761115312576294
+ },
+ {
+ "epoch": 102,
+ "train_loss": 0.20999815567016603,
+ "train_acc": 0.93128,
+ "test_loss": 2.7882490966796873,
+ "test_acc": 0.5578,
+ "lyapunov": null,
+ "grad_norm": 0.46851254306004025,
+ "grad_max_sv": 0.21838495172560216,
+ "grad_min_sv": 8.37696591199713e-09,
+ "grad_condition": 1510396720.662658,
+ "lr": 0.0002320866025105016,
+ "time_sec": 32.72404432296753
+ },
+ {
+ "epoch": 103,
+ "train_loss": 0.20526846901893617,
+ "train_acc": 0.93262,
+ "test_loss": 2.8693388496398926,
+ "test_acc": 0.554,
+ "lyapunov": null,
+ "grad_norm": 0.4589602275699082,
+ "grad_max_sv": 0.22509709745645523,
+ "grad_min_sv": 8.420789482605027e-09,
+ "grad_condition": 1371218202.1419,
+ "lr": 0.0002233042253783278,
+ "time_sec": 32.752496004104614
+ },
+ {
+ "epoch": 104,
+ "train_loss": 0.20646339273929595,
+ "train_acc": 0.9335,
+ "test_loss": 2.89330929107666,
+ "test_acc": 0.5483,
+ "lyapunov": null,
+ "grad_norm": 0.46636768633733616,
+ "grad_max_sv": 0.22183220721781255,
+ "grad_min_sv": 8.39393208819329e-09,
+ "grad_condition": 1827094910.9746387,
+ "lr": 0.000214643216157784,
+ "time_sec": 32.74421238899231
+ },
+ {
+ "epoch": 105,
+ "train_loss": 0.20053612211227417,
+ "train_acc": 0.93402,
+ "test_loss": 2.904328105926514,
+ "test_acc": 0.5506,
+ "lyapunov": null,
+ "grad_norm": 0.45700070764272066,
+ "grad_max_sv": 0.21747002471238375,
+ "grad_min_sv": 8.216160540282366e-09,
+ "grad_condition": 1664593727.1128445,
+ "lr": 0.00020610737385376332,
+ "time_sec": 32.724817991256714
+ },
+ {
+ "epoch": 106,
+ "train_loss": 0.1944782396030426,
+ "train_acc": 0.9362,
+ "test_loss": 2.8657500442504884,
+ "test_acc": 0.5488,
+ "lyapunov": null,
+ "grad_norm": 0.44687014031192024,
+ "grad_max_sv": 0.2213790450245142,
+ "grad_min_sv": 8.454356608192382e-09,
+ "grad_condition": 127028340.10294946,
+ "lr": 0.00019770044256881242,
+ "time_sec": 32.7451388835907
+ },
+ {
+ "epoch": 107,
+ "train_loss": 0.19279775314331055,
+ "train_acc": 0.93688,
+ "test_loss": 2.898486404800415,
+ "test_acc": 0.5523,
+ "lyapunov": null,
+ "grad_norm": 0.44614463029775897,
+ "grad_max_sv": 0.2167466938495636,
+ "grad_min_sv": 8.415876304873615e-09,
+ "grad_condition": 262012758.78866345,
+ "lr": 0.0001894261098608447,
+ "time_sec": 32.76267623901367
+ },
+ {
+ "epoch": 108,
+ "train_loss": 0.1886401759147644,
+ "train_acc": 0.93904,
+ "test_loss": 2.833827450942993,
+ "test_acc": 0.5567,
+ "lyapunov": null,
+ "grad_norm": 0.4435964290199411,
+ "grad_max_sv": 0.2225849311798811,
+ "grad_min_sv": 8.340220883015782e-09,
+ "grad_condition": 118785929.89668731,
+ "lr": 0.000181288005125655,
+ "time_sec": 32.86235594749451
+ },
+ {
+ "epoch": 109,
+ "train_loss": 0.1890174783563614,
+ "train_acc": 0.93882,
+ "test_loss": 2.941585520553589,
+ "test_acc": 0.5491,
+ "lyapunov": null,
+ "grad_norm": 0.4464239579148638,
+ "grad_max_sv": 0.21364586874842645,
+ "grad_min_sv": 8.245146911967442e-09,
+ "grad_condition": 716792612.4830931,
+ "lr": 0.0001732896980049473,
+ "time_sec": 32.74325895309448
+ },
+ {
+ "epoch": 110,
+ "train_loss": 0.18055749108314514,
+ "train_acc": 0.94126,
+ "test_loss": 2.9359549655914305,
+ "test_acc": 0.5517,
+ "lyapunov": null,
+ "grad_norm": 0.4349334962787559,
+ "grad_max_sv": 0.2089217260479927,
+ "grad_min_sv": 8.043115946556504e-09,
+ "grad_condition": 2200871643.370809,
+ "lr": 0.00016543469682057076,
+ "time_sec": 32.756227016448975
+ },
+ {
+ "epoch": 111,
+ "train_loss": 0.17659846026420592,
+ "train_acc": 0.9445,
+ "test_loss": 2.904285785675049,
+ "test_acc": 0.5552,
+ "lyapunov": null,
+ "grad_norm": 0.4288194869102633,
+ "grad_max_sv": 0.2133932262659073,
+ "grad_min_sv": 7.951804889029523e-09,
+ "grad_condition": 127160230.15537345,
+ "lr": 0.00015772644703565552,
+ "time_sec": 32.73052453994751
+ },
+ {
+ "epoch": 112,
+ "train_loss": 0.17598180088996887,
+ "train_acc": 0.9431,
+ "test_loss": 2.916234812545776,
+ "test_acc": 0.5566,
+ "lyapunov": null,
+ "grad_norm": 0.43046200088706854,
+ "grad_max_sv": 0.21027521118521691,
+ "grad_min_sv": 8.006027082247107e-09,
+ "grad_condition": 1303838738.9934053,
+ "lr": 0.00015016832974331713,
+ "time_sec": 32.737369775772095
+ },
+ {
+ "epoch": 113,
+ "train_loss": 0.167477658700943,
+ "train_acc": 0.94562,
+ "test_loss": 2.930574794006348,
+ "test_acc": 0.5492,
+ "lyapunov": null,
+ "grad_norm": 0.4188552255465725,
+ "grad_max_sv": 0.2074826244264841,
+ "grad_min_sv": 7.807182782865966e-09,
+ "grad_condition": 1013028230.5722786,
+ "lr": 0.00014276366018359834,
+ "time_sec": 32.78035497665405
+ },
+ {
+ "epoch": 114,
+ "train_loss": 0.16470729023933411,
+ "train_acc": 0.94658,
+ "test_loss": 2.9235076808929445,
+ "test_acc": 0.55,
+ "lyapunov": null,
+ "grad_norm": 0.4196468917250276,
+ "grad_max_sv": 0.2061817307025194,
+ "grad_min_sv": 7.639872719872321e-09,
+ "grad_condition": 147774842.88971734,
+ "lr": 0.00013551568628929425,
+ "time_sec": 32.71555685997009
+ },
+ {
+ "epoch": 115,
+ "train_loss": 0.15979129463195801,
+ "train_acc": 0.95014,
+ "test_loss": 2.8977687450408935,
+ "test_acc": 0.5554,
+ "lyapunov": null,
+ "grad_norm": 0.4109842368882969,
+ "grad_max_sv": 0.20125124976038933,
+ "grad_min_sv": 7.641511092990049e-09,
+ "grad_condition": 152806383.8905374,
+ "lr": 0.00012842758726130276,
+ "time_sec": 32.74684023857117
+ },
+ {
+ "epoch": 116,
+ "train_loss": 0.15650701507091522,
+ "train_acc": 0.94994,
+ "test_loss": 2.963372290420532,
+ "test_acc": 0.5536,
+ "lyapunov": null,
+ "grad_norm": 0.40714256168185947,
+ "grad_max_sv": 0.21380255445837976,
+ "grad_min_sv": 7.601124127343262e-09,
+ "grad_condition": 187963441.14469656,
+ "lr": 0.0001215024721741218,
+ "time_sec": 32.740856885910034
+ },
+ {
+ "epoch": 117,
+ "train_loss": 0.15483391536712646,
+ "train_acc": 0.95134,
+ "test_loss": 2.9223466384887695,
+ "test_acc": 0.5589,
+ "lyapunov": null,
+ "grad_norm": 0.4061085309679021,
+ "grad_max_sv": 0.20323452018201352,
+ "grad_min_sv": 7.630000256912337e-09,
+ "grad_condition": 541093755.1409919,
+ "lr": 0.00011474337861210538,
+ "time_sec": 32.71646022796631
+ },
+ {
+ "epoch": 118,
+ "train_loss": 0.15986083958148956,
+ "train_acc": 0.9476,
+ "test_loss": 2.890314678955078,
+ "test_acc": 0.5619,
+ "lyapunov": null,
+ "grad_norm": 0.4176419876084519,
+ "grad_max_sv": 0.20986161157488822,
+ "grad_min_sv": 7.767054953627256e-09,
+ "grad_condition": 181416124.9826005,
+ "lr": 0.00010815327133708009,
+ "time_sec": 32.71689772605896
+ },
+ {
+ "epoch": 119,
+ "train_loss": 0.15443852434635164,
+ "train_acc": 0.95028,
+ "test_loss": 2.9833076015472413,
+ "test_acc": 0.5504,
+ "lyapunov": null,
+ "grad_norm": 0.4094461556500699,
+ "grad_max_sv": 0.20980317294597625,
+ "grad_min_sv": 7.66585938392992e-09,
+ "grad_condition": 1289363850.184981,
+ "lr": 0.00010173504098790182,
+ "time_sec": 32.76529359817505
+ },
+ {
+ "epoch": 120,
+ "train_loss": 0.1513664803981781,
+ "train_acc": 0.95076,
+ "test_loss": 2.9521168746948243,
+ "test_acc": 0.5535,
+ "lyapunov": null,
+ "grad_norm": 0.40458507675773164,
+ "grad_max_sv": 0.2091453868895769,
+ "grad_min_sv": 7.546225789991506e-09,
+ "grad_condition": 191790265.63931364,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 32.75906276702881
+ },
+ {
+ "epoch": 121,
+ "train_loss": 0.1482712536096573,
+ "train_acc": 0.95224,
+ "test_loss": 3.008343357849121,
+ "test_acc": 0.5524,
+ "lyapunov": null,
+ "grad_norm": 0.40250293552115596,
+ "grad_max_sv": 0.20429235510528088,
+ "grad_min_sv": 7.4167842699346915e-09,
+ "grad_condition": 1004863133.4087012,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 32.738195180892944
+ },
+ {
+ "epoch": 122,
+ "train_loss": 0.1433233982515335,
+ "train_acc": 0.95406,
+ "test_loss": 2.8811149784088137,
+ "test_acc": 0.5615,
+ "lyapunov": null,
+ "grad_norm": 0.3918685762307977,
+ "grad_max_sv": 0.21150657180696725,
+ "grad_min_sv": 7.566205814736106e-09,
+ "grad_condition": 4864615061.542827,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 32.760249853134155
+ },
+ {
+ "epoch": 123,
+ "train_loss": 0.140904153547287,
+ "train_acc": 0.95554,
+ "test_loss": 3.0434706832885743,
+ "test_acc": 0.5488,
+ "lyapunov": null,
+ "grad_norm": 0.39134340646439314,
+ "grad_max_sv": 0.21096068248152733,
+ "grad_min_sv": 7.420657745899582e-09,
+ "grad_condition": 474788541.70389444,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 32.84018850326538
+ },
+ {
+ "epoch": 124,
+ "train_loss": 0.1424632687997818,
+ "train_acc": 0.95448,
+ "test_loss": 3.006509048843384,
+ "test_acc": 0.5549,
+ "lyapunov": null,
+ "grad_norm": 0.3952350465926858,
+ "grad_max_sv": 0.20579442996531724,
+ "grad_min_sv": 7.2102639599776894e-09,
+ "grad_condition": 640121523.7171735,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 32.73241114616394
+ },
+ {
+ "epoch": 125,
+ "train_loss": 0.13608443251609803,
+ "train_acc": 0.95782,
+ "test_loss": 2.9692224075317384,
+ "test_acc": 0.5578,
+ "lyapunov": null,
+ "grad_norm": 0.38466881950137,
+ "grad_max_sv": 0.19782444536685945,
+ "grad_min_sv": 7.223557173946516e-09,
+ "grad_condition": 248263306.50433522,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 32.678467988967896
+ },
+ {
+ "epoch": 126,
+ "train_loss": 0.13552211750030518,
+ "train_acc": 0.95626,
+ "test_loss": 3.032096587371826,
+ "test_acc": 0.5536,
+ "lyapunov": null,
+ "grad_norm": 0.3837934860475664,
+ "grad_max_sv": 0.19592427872121335,
+ "grad_min_sv": 7.1880338589928525e-09,
+ "grad_condition": 1098788620.3456562,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 32.70717906951904
+ },
+ {
+ "epoch": 127,
+ "train_loss": 0.1351850691795349,
+ "train_acc": 0.95776,
+ "test_loss": 2.9195703174591063,
+ "test_acc": 0.5604,
+ "lyapunov": null,
+ "grad_norm": 0.3835199995919498,
+ "grad_max_sv": 0.19671063385903836,
+ "grad_min_sv": 7.301026294463924e-09,
+ "grad_condition": 998102013.5820692,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 32.741135597229004
+ },
+ {
+ "epoch": 128,
+ "train_loss": 0.13267261865139007,
+ "train_acc": 0.95764,
+ "test_loss": 2.9626207927703856,
+ "test_acc": 0.5545,
+ "lyapunov": null,
+ "grad_norm": 0.3832565427194031,
+ "grad_max_sv": 0.2010548248887062,
+ "grad_min_sv": 7.084323496310118e-09,
+ "grad_condition": 1908110316.0124466,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 32.724841356277466
+ },
+ {
+ "epoch": 129,
+ "train_loss": 0.13098865546941757,
+ "train_acc": 0.95846,
+ "test_loss": 3.011842226791382,
+ "test_acc": 0.5506,
+ "lyapunov": null,
+ "grad_norm": 0.37939468237880797,
+ "grad_max_sv": 0.20046190060675145,
+ "grad_min_sv": 7.379042803222838e-09,
+ "grad_condition": 356098689.45926607,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 32.721606492996216
+ },
+ {
+ "epoch": 130,
+ "train_loss": 0.12933046006202698,
+ "train_acc": 0.95886,
+ "test_loss": 3.0411768558502197,
+ "test_acc": 0.5527,
+ "lyapunov": null,
+ "grad_norm": 0.37924053294163973,
+ "grad_max_sv": 0.20988954231142998,
+ "grad_min_sv": 7.388776484596772e-09,
+ "grad_condition": 554124327.4297839,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 32.76217794418335
+ },
+ {
+ "epoch": 131,
+ "train_loss": 0.12891825794219972,
+ "train_acc": 0.95952,
+ "test_loss": 3.000077504730225,
+ "test_acc": 0.5546,
+ "lyapunov": null,
+ "grad_norm": 0.3741869428415791,
+ "grad_max_sv": 0.1881616409868002,
+ "grad_min_sv": 7.156842123405213e-09,
+ "grad_condition": 312499495.3085783,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 32.74306511878967
+ },
+ {
+ "epoch": 132,
+ "train_loss": 0.12583676107883454,
+ "train_acc": 0.96062,
+ "test_loss": 3.0664391510009765,
+ "test_acc": 0.5534,
+ "lyapunov": null,
+ "grad_norm": 0.3704229743876738,
+ "grad_max_sv": 0.19701430164277553,
+ "grad_min_sv": 7.223526106328419e-09,
+ "grad_condition": 1413194923.3587193,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 32.808775424957275
+ },
+ {
+ "epoch": 133,
+ "train_loss": 0.13008767341136931,
+ "train_acc": 0.95896,
+ "test_loss": 3.0139704319000242,
+ "test_acc": 0.5574,
+ "lyapunov": null,
+ "grad_norm": 0.3764215368002029,
+ "grad_max_sv": 0.18944438602775335,
+ "grad_min_sv": 7.082572564553764e-09,
+ "grad_condition": 874087736.501687,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 32.82065176963806
+ },
+ {
+ "epoch": 134,
+ "train_loss": 0.1276783154821396,
+ "train_acc": 0.95996,
+ "test_loss": 3.022883545303345,
+ "test_acc": 0.5532,
+ "lyapunov": null,
+ "grad_norm": 0.375861463579636,
+ "grad_max_sv": 0.20601846650242805,
+ "grad_min_sv": 6.996468762177945e-09,
+ "grad_condition": 1890410555.4428897,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 32.80414128303528
+ },
+ {
+ "epoch": 135,
+ "train_loss": 0.12308010986804963,
+ "train_acc": 0.9606,
+ "test_loss": 2.9876843898773195,
+ "test_acc": 0.5593,
+ "lyapunov": null,
+ "grad_norm": 0.36736730687062175,
+ "grad_max_sv": 0.19790339954197406,
+ "grad_min_sv": 7.039625574654928e-09,
+ "grad_condition": 157775177.85623857,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 32.851438760757446
+ },
+ {
+ "epoch": 136,
+ "train_loss": 0.12776446427345275,
+ "train_acc": 0.96144,
+ "test_loss": 3.0140146301269533,
+ "test_acc": 0.5535,
+ "lyapunov": null,
+ "grad_norm": 0.3714043891983977,
+ "grad_max_sv": 0.19383110255002975,
+ "grad_min_sv": 7.2285312062653555e-09,
+ "grad_condition": 999433479.7051426,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 32.794949769973755
+ },
+ {
+ "epoch": 137,
+ "train_loss": 0.12337936633110047,
+ "train_acc": 0.96152,
+ "test_loss": 2.9756490589141844,
+ "test_acc": 0.5589,
+ "lyapunov": null,
+ "grad_norm": 0.36599462716404635,
+ "grad_max_sv": 0.18621533513069152,
+ "grad_min_sv": 6.8799666707621e-09,
+ "grad_condition": 2633273626.2954164,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 32.78418707847595
+ },
+ {
+ "epoch": 138,
+ "train_loss": 0.12530339601516724,
+ "train_acc": 0.96096,
+ "test_loss": 2.9389760871887205,
+ "test_acc": 0.5643,
+ "lyapunov": null,
+ "grad_norm": 0.36857224147370304,
+ "grad_max_sv": 0.19519462659955025,
+ "grad_min_sv": 7.2010847566817904e-09,
+ "grad_condition": 1104132755.735764,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 32.72880840301514
+ },
+ {
+ "epoch": 139,
+ "train_loss": 0.12289305024623871,
+ "train_acc": 0.9611,
+ "test_loss": 3.0236512790679932,
+ "test_acc": 0.5543,
+ "lyapunov": null,
+ "grad_norm": 0.3682552501598832,
+ "grad_max_sv": 0.20100074261426926,
+ "grad_min_sv": 7.34378154774052e-09,
+ "grad_condition": 1520683884.3197339,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 32.78127360343933
+ },
+ {
+ "epoch": 140,
+ "train_loss": 0.12596595900058746,
+ "train_acc": 0.95946,
+ "test_loss": 2.973658073425293,
+ "test_acc": 0.561,
+ "lyapunov": null,
+ "grad_norm": 0.3717079213334779,
+ "grad_max_sv": 0.1950546268373728,
+ "grad_min_sv": 7.189997905268728e-09,
+ "grad_condition": 1974792452.4561849,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 32.781864643096924
+ },
+ {
+ "epoch": 141,
+ "train_loss": 0.12001886625289918,
+ "train_acc": 0.96264,
+ "test_loss": 2.990137744522095,
+ "test_acc": 0.5583,
+ "lyapunov": null,
+ "grad_norm": 0.3612101803004304,
+ "grad_max_sv": 0.19684142302721738,
+ "grad_min_sv": 7.084273648266673e-09,
+ "grad_condition": 1957601954.2835248,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 32.77344870567322
+ },
+ {
+ "epoch": 142,
+ "train_loss": 0.12250841891288758,
+ "train_acc": 0.96208,
+ "test_loss": 3.0072501789093016,
+ "test_acc": 0.557,
+ "lyapunov": null,
+ "grad_norm": 0.3656411150745857,
+ "grad_max_sv": 0.18694628309458494,
+ "grad_min_sv": 6.765250024683839e-09,
+ "grad_condition": 728041100.7004558,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 32.78335380554199
+ },
+ {
+ "epoch": 143,
+ "train_loss": 0.12062059470653534,
+ "train_acc": 0.96196,
+ "test_loss": 2.9649132221221923,
+ "test_acc": 0.5592,
+ "lyapunov": null,
+ "grad_norm": 0.36372343649597894,
+ "grad_max_sv": 0.19535562619566918,
+ "grad_min_sv": 6.99444468851753e-09,
+ "grad_condition": 1233101804.7440555,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 32.80367183685303
+ },
+ {
+ "epoch": 144,
+ "train_loss": 0.12207864775896073,
+ "train_acc": 0.96178,
+ "test_loss": 3.036870691680908,
+ "test_acc": 0.5574,
+ "lyapunov": null,
+ "grad_norm": 0.3636070415011162,
+ "grad_max_sv": 0.20035785287618638,
+ "grad_min_sv": 7.128019625154275e-09,
+ "grad_condition": 171713281.12199268,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 32.81153345108032
+ },
+ {
+ "epoch": 145,
+ "train_loss": 0.11943841837644577,
+ "train_acc": 0.96326,
+ "test_loss": 2.9936345024108886,
+ "test_acc": 0.5606,
+ "lyapunov": null,
+ "grad_norm": 0.3616987855339011,
+ "grad_max_sv": 0.19010693076997995,
+ "grad_min_sv": 6.951608487104404e-09,
+ "grad_condition": 4475866647.186778,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 32.77432584762573
+ },
+ {
+ "epoch": 146,
+ "train_loss": 0.12161365668535233,
+ "train_acc": 0.96184,
+ "test_loss": 3.0051653202056885,
+ "test_acc": 0.5534,
+ "lyapunov": null,
+ "grad_norm": 0.36606365240898514,
+ "grad_max_sv": 0.19566274229437114,
+ "grad_min_sv": 7.090793683911957e-09,
+ "grad_condition": 1292263099.7971816,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 32.722100257873535
+ },
+ {
+ "epoch": 147,
+ "train_loss": 0.11985450011253357,
+ "train_acc": 0.96366,
+ "test_loss": 2.9604510833740236,
+ "test_acc": 0.5575,
+ "lyapunov": null,
+ "grad_norm": 0.36142233410993513,
+ "grad_max_sv": 0.19281328432261943,
+ "grad_min_sv": 7.25558266457792e-09,
+ "grad_condition": 7387609214.887906,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 32.73111319541931
+ },
+ {
+ "epoch": 148,
+ "train_loss": 0.11937485624313354,
+ "train_acc": 0.96304,
+ "test_loss": 3.0363352073669434,
+ "test_acc": 0.555,
+ "lyapunov": null,
+ "grad_norm": 0.3611567529216887,
+ "grad_max_sv": 0.1957642961293459,
+ "grad_min_sv": 7.231622295303733e-09,
+ "grad_condition": 393022755.7130184,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 32.739211320877075
+ },
+ {
+ "epoch": 149,
+ "train_loss": 0.11994361319065094,
+ "train_acc": 0.96282,
+ "test_loss": 2.9720828590393067,
+ "test_acc": 0.5586,
+ "lyapunov": null,
+ "grad_norm": 0.36260803003121506,
+ "grad_max_sv": 0.19581739362329245,
+ "grad_min_sv": 6.825674283401049e-09,
+ "grad_condition": 640655030.4564087,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 32.73686075210571
+ },
+ {
+ "epoch": 150,
+ "train_loss": 0.12198109043121338,
+ "train_acc": 0.96096,
+ "test_loss": 3.0690538398742677,
+ "test_acc": 0.5514,
+ "lyapunov": null,
+ "grad_norm": 0.3640908774200121,
+ "grad_max_sv": 0.19363359715789558,
+ "grad_min_sv": 6.96894196785744e-09,
+ "grad_condition": 273507263.305566,
+ "lr": 0.0,
+ "time_sec": 32.99615716934204
+ }
+ ],
+ "12": [
+ {
+ "epoch": 1,
+ "train_loss": 4.494552028656006,
+ "train_acc": 0.03786,
+ "test_loss": 4.61479503326416,
+ "test_acc": 0.0201,
+ "lyapunov": null,
+ "grad_norm": 4.970128680900294,
+ "grad_max_sv": 4.1727720379829405,
+ "grad_min_sv": 8.289555068485832e-08,
+ "grad_condition": 76452781.51601897,
+ "lr": 0.0009998903417374227,
+ "time_sec": 49.85722231864929
+ },
+ {
+ "epoch": 2,
+ "train_loss": 3.9854862425994875,
+ "train_acc": 0.08822,
+ "test_loss": 4.992143798828125,
+ "test_acc": 0.0271,
+ "lyapunov": null,
+ "grad_norm": 3.054976721991771,
+ "grad_max_sv": 2.33364659845829,
+ "grad_min_sv": 4.921280333802791e-08,
+ "grad_condition": 63442313.555687234,
+ "lr": 0.0009995614150494292,
+ "time_sec": 49.82543992996216
+ },
+ {
+ "epoch": 3,
+ "train_loss": 3.6997953691101073,
+ "train_acc": 0.12854,
+ "test_loss": 4.995684532165527,
+ "test_acc": 0.0293,
+ "lyapunov": null,
+ "grad_norm": 2.062296620286874,
+ "grad_max_sv": 1.3390462696552277,
+ "grad_min_sv": 3.588550117061828e-08,
+ "grad_condition": 44525979.84656793,
+ "lr": 0.0009990133642141358,
+ "time_sec": 49.824538707733154
+ },
+ {
+ "epoch": 4,
+ "train_loss": 3.5368371379089356,
+ "train_acc": 0.15444,
+ "test_loss": 5.110721218109131,
+ "test_acc": 0.0304,
+ "lyapunov": null,
+ "grad_norm": 1.6796942132426855,
+ "grad_max_sv": 0.9513197481632233,
+ "grad_min_sv": 2.9029874798469635e-08,
+ "grad_condition": 38187587.0072392,
+ "lr": 0.0009982464296247522,
+ "time_sec": 49.857542514801025
+ },
+ {
+ "epoch": 5,
+ "train_loss": 3.4063741930389404,
+ "train_acc": 0.1804,
+ "test_loss": 4.820973803710937,
+ "test_acc": 0.0488,
+ "lyapunov": null,
+ "grad_norm": 1.5228591587706575,
+ "grad_max_sv": 0.8078360810875893,
+ "grad_min_sv": 2.6718039813911078e-08,
+ "grad_condition": 36188290.78873479,
+ "lr": 0.0009972609476841367,
+ "time_sec": 49.83380579948425
+ },
+ {
+ "epoch": 6,
+ "train_loss": 3.298316816482544,
+ "train_acc": 0.19704,
+ "test_loss": 4.687854388427734,
+ "test_acc": 0.063,
+ "lyapunov": null,
+ "grad_norm": 1.430907384491558,
+ "grad_max_sv": 0.7338306248188019,
+ "grad_min_sv": 2.5322855712328617e-08,
+ "grad_condition": 32479596.327881176,
+ "lr": 0.000996057350657239,
+ "time_sec": 49.85435748100281
+ },
+ {
+ "epoch": 7,
+ "train_loss": 3.212421199264526,
+ "train_acc": 0.21768,
+ "test_loss": 5.175653315734864,
+ "test_acc": 0.0504,
+ "lyapunov": null,
+ "grad_norm": 1.336875610023359,
+ "grad_max_sv": 0.649027307331562,
+ "grad_min_sv": 2.378195060326327e-08,
+ "grad_condition": 32637118.77699437,
+ "lr": 0.000994636166481494,
+ "time_sec": 49.8446729183197
+ },
+ {
+ "epoch": 8,
+ "train_loss": 3.138554875640869,
+ "train_acc": 0.22894,
+ "test_loss": 5.807579966735839,
+ "test_acc": 0.0462,
+ "lyapunov": null,
+ "grad_norm": 1.2679659601013358,
+ "grad_max_sv": 0.5943921484053135,
+ "grad_min_sv": 2.2575583161904557e-08,
+ "grad_condition": 97277800.55107144,
+ "lr": 0.0009929980185352525,
+ "time_sec": 49.8536856174469
+ },
+ {
+ "epoch": 9,
+ "train_loss": 3.0594152055358887,
+ "train_acc": 0.24342,
+ "test_loss": 5.896516481018066,
+ "test_acc": 0.0504,
+ "lyapunov": null,
+ "grad_norm": 1.1948384399270802,
+ "grad_max_sv": 0.5371919803321361,
+ "grad_min_sv": 2.1378302061947352e-08,
+ "grad_condition": 43411043.09074741,
+ "lr": 0.0009911436253643444,
+ "time_sec": 49.826568365097046
+ },
+ {
+ "epoch": 10,
+ "train_loss": 3.0018548110961913,
+ "train_acc": 0.25334,
+ "test_loss": 6.065813122558594,
+ "test_acc": 0.0461,
+ "lyapunov": null,
+ "grad_norm": 1.1307569845828864,
+ "grad_max_sv": 0.49591890424489976,
+ "grad_min_sv": 2.0269659145588648e-08,
+ "grad_condition": 137243724.22937468,
+ "lr": 0.0009890738003669028,
+ "time_sec": 49.83774471282959
+ },
+ {
+ "epoch": 11,
+ "train_loss": 2.955089698944092,
+ "train_acc": 0.2653,
+ "test_loss": 5.9151001647949215,
+ "test_acc": 0.0512,
+ "lyapunov": null,
+ "grad_norm": 1.067241785689624,
+ "grad_max_sv": 0.4469477400183678,
+ "grad_min_sv": 1.8805797574739103e-08,
+ "grad_condition": 39379357.71574137,
+ "lr": 0.00098678945143658,
+ "time_sec": 49.843921184539795
+ },
+ {
+ "epoch": 12,
+ "train_loss": 2.9137347607421873,
+ "train_acc": 0.27164,
+ "test_loss": 6.294404597473145,
+ "test_acc": 0.0476,
+ "lyapunov": null,
+ "grad_norm": 1.0355748395798314,
+ "grad_max_sv": 0.4451711155474186,
+ "grad_min_sv": 1.9072327144360128e-08,
+ "grad_condition": 11465758103.108255,
+ "lr": 0.0009842915805643154,
+ "time_sec": 49.864059925079346
+ },
+ {
+ "epoch": 13,
+ "train_loss": 2.8780907594299316,
+ "train_acc": 0.2771,
+ "test_loss": 5.592148977661132,
+ "test_acc": 0.0478,
+ "lyapunov": null,
+ "grad_norm": 0.9968605810380445,
+ "grad_max_sv": 0.42295421436429026,
+ "grad_min_sv": 1.8676737473244386e-08,
+ "grad_condition": 25252476.39695831,
+ "lr": 0.000981581283398829,
+ "time_sec": 49.83604097366333
+ },
+ {
+ "epoch": 14,
+ "train_loss": 2.83197486907959,
+ "train_acc": 0.28466,
+ "test_loss": 5.6323877784729,
+ "test_acc": 0.0609,
+ "lyapunov": null,
+ "grad_norm": 0.9600893848651761,
+ "grad_max_sv": 0.40282900631427765,
+ "grad_min_sv": 1.79312983100699e-08,
+ "grad_condition": 46420938.26971118,
+ "lr": 0.0009786597487660333,
+ "time_sec": 49.834007263183594
+ },
+ {
+ "epoch": 15,
+ "train_loss": 2.8022082035064697,
+ "train_acc": 0.29582,
+ "test_loss": 6.161382629394531,
+ "test_acc": 0.067,
+ "lyapunov": null,
+ "grad_norm": 0.9375482131775189,
+ "grad_max_sv": 0.38931420594453814,
+ "grad_min_sv": 1.7493153070535784e-08,
+ "grad_condition": 36503130.621698126,
+ "lr": 0.0009755282581475766,
+ "time_sec": 49.843669176101685
+ },
+ {
+ "epoch": 16,
+ "train_loss": 2.7717318687438963,
+ "train_acc": 0.29786,
+ "test_loss": 6.750612663269043,
+ "test_acc": 0.0319,
+ "lyapunov": null,
+ "grad_norm": 0.914689907325661,
+ "grad_max_sv": 0.3722547680139542,
+ "grad_min_sv": 1.6777755511981906e-08,
+ "grad_condition": 56626372.0449656,
+ "lr": 0.0009721881851187403,
+ "time_sec": 49.83157706260681
+ },
+ {
+ "epoch": 17,
+ "train_loss": 2.737800383453369,
+ "train_acc": 0.30562,
+ "test_loss": 6.416880516052246,
+ "test_acc": 0.0612,
+ "lyapunov": null,
+ "grad_norm": 0.8943352214027238,
+ "grad_max_sv": 0.35389882922172544,
+ "grad_min_sv": 1.6637817648601504e-08,
+ "grad_condition": 27086037.56335088,
+ "lr": 0.0009686409947459456,
+ "time_sec": 49.84391736984253
+ },
+ {
+ "epoch": 18,
+ "train_loss": 2.726037522125244,
+ "train_acc": 0.30952,
+ "test_loss": 6.604639881896973,
+ "test_acc": 0.0459,
+ "lyapunov": null,
+ "grad_norm": 0.8840199433360627,
+ "grad_max_sv": 0.35427382588386536,
+ "grad_min_sv": 1.631152495851218e-08,
+ "grad_condition": 30779446.928706445,
+ "lr": 0.0009648882429441254,
+ "time_sec": 49.85922360420227
+ },
+ {
+ "epoch": 19,
+ "train_loss": 2.6859044135284424,
+ "train_acc": 0.31622,
+ "test_loss": 5.795512687683106,
+ "test_acc": 0.057,
+ "lyapunov": null,
+ "grad_norm": 0.8549569769936459,
+ "grad_max_sv": 0.33466122299432755,
+ "grad_min_sv": 1.565257393698616e-08,
+ "grad_condition": 29386830.435270645,
+ "lr": 0.00096093157579425,
+ "time_sec": 49.82556509971619
+ },
+ {
+ "epoch": 20,
+ "train_loss": 2.6536119274902346,
+ "train_acc": 0.3221,
+ "test_loss": 6.344257983398437,
+ "test_acc": 0.044,
+ "lyapunov": null,
+ "grad_norm": 0.8449773123460955,
+ "grad_max_sv": 0.3348921127617359,
+ "grad_min_sv": 1.5790628153482257e-08,
+ "grad_condition": 98318741.07961987,
+ "lr": 0.0009567727288213001,
+ "time_sec": 49.83516526222229
+ },
+ {
+ "epoch": 21,
+ "train_loss": 2.6361696144104005,
+ "train_acc": 0.32656,
+ "test_loss": 7.515093251800537,
+ "test_acc": 0.0334,
+ "lyapunov": null,
+ "grad_norm": 0.8336479900582607,
+ "grad_max_sv": 0.3216260939836502,
+ "grad_min_sv": 1.536505757071538e-08,
+ "grad_condition": 26686558.28517064,
+ "lr": 0.0009524135262330095,
+ "time_sec": 49.80964422225952
+ },
+ {
+ "epoch": 22,
+ "train_loss": 2.609321441345215,
+ "train_acc": 0.33038,
+ "test_loss": 6.987834294128418,
+ "test_acc": 0.0336,
+ "lyapunov": null,
+ "grad_norm": 0.8111631557338365,
+ "grad_max_sv": 0.32318604178726673,
+ "grad_min_sv": 1.552950264216424e-08,
+ "grad_condition": 31459791.97556909,
+ "lr": 0.0009478558801197061,
+ "time_sec": 49.83420443534851
+ },
+ {
+ "epoch": 23,
+ "train_loss": 2.5819150804138182,
+ "train_acc": 0.33626,
+ "test_loss": 5.626160023498535,
+ "test_acc": 0.0597,
+ "lyapunov": null,
+ "grad_norm": 0.7975730239086433,
+ "grad_max_sv": 0.2971249621361494,
+ "grad_min_sv": 1.4598027968382166e-08,
+ "grad_condition": 29388140.880233955,
+ "lr": 0.000943101789615607,
+ "time_sec": 49.84738302230835
+ },
+ {
+ "epoch": 24,
+ "train_loss": 2.563654583282471,
+ "train_acc": 0.34112,
+ "test_loss": 8.088758407592774,
+ "test_acc": 0.0365,
+ "lyapunov": null,
+ "grad_norm": 0.7820981992902372,
+ "grad_max_sv": 0.30556059442460537,
+ "grad_min_sv": 1.4405372743275802e-08,
+ "grad_condition": 36896273.106267676,
+ "lr": 0.0009381533400219313,
+ "time_sec": 49.83872365951538
+ },
+ {
+ "epoch": 25,
+ "train_loss": 2.5395704370880128,
+ "train_acc": 0.3453,
+ "test_loss": 6.280784951782227,
+ "test_acc": 0.0419,
+ "lyapunov": null,
+ "grad_norm": 0.7796352290200003,
+ "grad_max_sv": 0.29107407070696356,
+ "grad_min_sv": 1.438702274536574e-08,
+ "grad_condition": 23506322.84645006,
+ "lr": 0.0009330127018922189,
+ "time_sec": 49.84307074546814
+ },
+ {
+ "epoch": 26,
+ "train_loss": 2.516899804611206,
+ "train_acc": 0.34914,
+ "test_loss": 6.8854626892089845,
+ "test_acc": 0.0472,
+ "lyapunov": null,
+ "grad_norm": 0.7654504890703723,
+ "grad_max_sv": 0.2898920584470034,
+ "grad_min_sv": 1.4131242567771985e-08,
+ "grad_condition": 36962656.131567374,
+ "lr": 0.000927682130080253,
+ "time_sec": 49.82866811752319
+ },
+ {
+ "epoch": 27,
+ "train_loss": 2.486618924636841,
+ "train_acc": 0.35846,
+ "test_loss": 6.096959390258789,
+ "test_acc": 0.0526,
+ "lyapunov": null,
+ "grad_norm": 0.7544470177982979,
+ "grad_max_sv": 0.2747815653681755,
+ "grad_min_sv": 1.4021938565811353e-08,
+ "grad_condition": 22894223.22709341,
+ "lr": 0.0009221639627510072,
+ "time_sec": 49.833322048187256
+ },
+ {
+ "epoch": 28,
+ "train_loss": 2.4692860332489013,
+ "train_acc": 0.35872,
+ "test_loss": 7.058197943115235,
+ "test_acc": 0.0368,
+ "lyapunov": null,
+ "grad_norm": 0.7556141642776453,
+ "grad_max_sv": 0.2829656444489956,
+ "grad_min_sv": 1.4026384997922747e-08,
+ "grad_condition": 24010034.28343827,
+ "lr": 0.0009164606203550494,
+ "time_sec": 49.853132247924805
+ },
+ {
+ "epoch": 29,
+ "train_loss": 2.458679496536255,
+ "train_acc": 0.36202,
+ "test_loss": 5.932370195007325,
+ "test_acc": 0.0515,
+ "lyapunov": null,
+ "grad_norm": 0.7489931312284205,
+ "grad_max_sv": 0.2846912644803524,
+ "grad_min_sv": 1.3950906180867743e-08,
+ "grad_condition": 759126756.028516,
+ "lr": 0.0009105746045668516,
+ "time_sec": 49.815508127212524
+ },
+ {
+ "epoch": 30,
+ "train_loss": 2.440240175704956,
+ "train_acc": 0.3643,
+ "test_loss": 5.7076008422851565,
+ "test_acc": 0.0545,
+ "lyapunov": null,
+ "grad_norm": 0.7451604093710013,
+ "grad_max_sv": 0.27726204246282576,
+ "grad_min_sv": 1.3802408763141649e-08,
+ "grad_condition": 25518721.12854769,
+ "lr": 0.0009045084971874733,
+ "time_sec": 49.83587169647217
+ },
+ {
+ "epoch": 31,
+ "train_loss": 2.413286708908081,
+ "train_acc": 0.37092,
+ "test_loss": 5.388267793273926,
+ "test_acc": 0.0567,
+ "lyapunov": null,
+ "grad_norm": 0.734602471620392,
+ "grad_max_sv": 0.2801205262541771,
+ "grad_min_sv": 1.3700489934209691e-08,
+ "grad_condition": 70621872.17100011,
+ "lr": 0.0008982649590120977,
+ "time_sec": 49.82285523414612
+ },
+ {
+ "epoch": 32,
+ "train_loss": 2.3982598586273194,
+ "train_acc": 0.37454,
+ "test_loss": 4.8633959762573244,
+ "test_acc": 0.0614,
+ "lyapunov": null,
+ "grad_norm": 0.7317568960693007,
+ "grad_max_sv": 0.27396991699934004,
+ "grad_min_sv": 1.3639147818100827e-08,
+ "grad_condition": 29568703.15011265,
+ "lr": 0.0008918467286629196,
+ "time_sec": 49.83714246749878
+ },
+ {
+ "epoch": 33,
+ "train_loss": 2.3700755281066894,
+ "train_acc": 0.37942,
+ "test_loss": 5.800725856018066,
+ "test_acc": 0.062,
+ "lyapunov": null,
+ "grad_norm": 0.7363325475877537,
+ "grad_max_sv": 0.27091147713363173,
+ "grad_min_sv": 1.3641409607467736e-08,
+ "grad_condition": 23422095.65938937,
+ "lr": 0.0008852566213878943,
+ "time_sec": 49.85065937042236
+ },
+ {
+ "epoch": 34,
+ "train_loss": 2.3484229640197753,
+ "train_acc": 0.38438,
+ "test_loss": 5.51493988494873,
+ "test_acc": 0.0489,
+ "lyapunov": null,
+ "grad_norm": 0.7318255060238914,
+ "grad_max_sv": 0.2700826805084944,
+ "grad_min_sv": 1.3733222553602431e-08,
+ "grad_condition": 23110083.817654673,
+ "lr": 0.000878497527825878,
+ "time_sec": 49.825148820877075
+ },
+ {
+ "epoch": 35,
+ "train_loss": 2.332993766708374,
+ "train_acc": 0.38728,
+ "test_loss": 6.365867942047119,
+ "test_acc": 0.0266,
+ "lyapunov": null,
+ "grad_norm": 0.7235217593940582,
+ "grad_max_sv": 0.26724731288850306,
+ "grad_min_sv": 1.3652239799766264e-08,
+ "grad_condition": 21635340.607584503,
+ "lr": 0.000871572412738697,
+ "time_sec": 49.830586194992065
+ },
+ {
+ "epoch": 36,
+ "train_loss": 2.306020415649414,
+ "train_acc": 0.39186,
+ "test_loss": 5.792026341247559,
+ "test_acc": 0.0452,
+ "lyapunov": null,
+ "grad_norm": 0.7128640395593397,
+ "grad_max_sv": 0.26750593855977056,
+ "grad_min_sv": 1.3493218886662105e-08,
+ "grad_condition": 28714487.625810385,
+ "lr": 0.0008644843137107055,
+ "time_sec": 49.84518265724182
+ },
+ {
+ "epoch": 37,
+ "train_loss": 2.2972560415649412,
+ "train_acc": 0.39398,
+ "test_loss": 6.719418971252441,
+ "test_acc": 0.0336,
+ "lyapunov": null,
+ "grad_norm": 0.7133630215784597,
+ "grad_max_sv": 0.2599464699625969,
+ "grad_min_sv": 1.321531789555408e-08,
+ "grad_condition": 23431301.61775563,
+ "lr": 0.0008572363398164014,
+ "time_sec": 49.80765676498413
+ },
+ {
+ "epoch": 38,
+ "train_loss": 2.2751118283843996,
+ "train_acc": 0.39982,
+ "test_loss": 5.9905416282653805,
+ "test_acc": 0.0405,
+ "lyapunov": null,
+ "grad_norm": 0.711317525951205,
+ "grad_max_sv": 0.25357839167118074,
+ "grad_min_sv": 1.3227913819857662e-08,
+ "grad_condition": 22136545.95270278,
+ "lr": 0.0008498316702566826,
+ "time_sec": 49.8195858001709
+ },
+ {
+ "epoch": 39,
+ "train_loss": 2.2572131638336184,
+ "train_acc": 0.40186,
+ "test_loss": 5.522994046783447,
+ "test_acc": 0.0292,
+ "lyapunov": null,
+ "grad_norm": 0.7046395490795619,
+ "grad_max_sv": 0.2534454546868801,
+ "grad_min_sv": 1.3053050565425828e-08,
+ "grad_condition": 23267030.12204785,
+ "lr": 0.0008422735529643442,
+ "time_sec": 49.82005977630615
+ },
+ {
+ "epoch": 40,
+ "train_loss": 2.247441282196045,
+ "train_acc": 0.40386,
+ "test_loss": 6.156334571838379,
+ "test_acc": 0.0459,
+ "lyapunov": null,
+ "grad_norm": 0.7028096798670115,
+ "grad_max_sv": 0.2492887545377016,
+ "grad_min_sv": 1.295731734268779e-08,
+ "grad_condition": 27228242.583258677,
+ "lr": 0.0008345653031794289,
+ "time_sec": 49.840070724487305
+ },
+ {
+ "epoch": 41,
+ "train_loss": 2.240987236175537,
+ "train_acc": 0.4064,
+ "test_loss": 6.480609422302246,
+ "test_acc": 0.03,
+ "lyapunov": null,
+ "grad_norm": 0.6963939273563242,
+ "grad_max_sv": 0.25355591997504234,
+ "grad_min_sv": 1.3210752133896442e-08,
+ "grad_condition": 51874622.58196541,
+ "lr": 0.0008267103019950526,
+ "time_sec": 49.89214468002319
+ },
+ {
+ "epoch": 42,
+ "train_loss": 2.2241448893737794,
+ "train_acc": 0.40938,
+ "test_loss": 7.472731929016113,
+ "test_acc": 0.0364,
+ "lyapunov": null,
+ "grad_norm": 0.6886576186838276,
+ "grad_max_sv": 0.24406687431037427,
+ "grad_min_sv": 1.2965910546614001e-08,
+ "grad_condition": 26237426.90185051,
+ "lr": 0.0008187119948743447,
+ "time_sec": 49.831929445266724
+ },
+ {
+ "epoch": 43,
+ "train_loss": 2.195390332183838,
+ "train_acc": 0.41482,
+ "test_loss": 6.986102354431153,
+ "test_acc": 0.0354,
+ "lyapunov": null,
+ "grad_norm": 0.692064929980546,
+ "grad_max_sv": 0.24136908873915672,
+ "grad_min_sv": 1.287102841251997e-08,
+ "grad_condition": 29191367.16539036,
+ "lr": 0.000810573890139155,
+ "time_sec": 49.820056438446045
+ },
+ {
+ "epoch": 44,
+ "train_loss": 2.1865518129730224,
+ "train_acc": 0.41708,
+ "test_loss": 6.7771270584106444,
+ "test_acc": 0.0393,
+ "lyapunov": null,
+ "grad_norm": 0.6868416402158027,
+ "grad_max_sv": 0.2486371211707592,
+ "grad_min_sv": 1.2717046270899201e-08,
+ "grad_condition": 39400931.65148838,
+ "lr": 0.0008022995574311873,
+ "time_sec": 49.82724571228027
+ },
+ {
+ "epoch": 45,
+ "train_loss": 2.176023401031494,
+ "train_acc": 0.41766,
+ "test_loss": 6.5321983726501465,
+ "test_acc": 0.0329,
+ "lyapunov": null,
+ "grad_norm": 0.688101634481696,
+ "grad_max_sv": 0.2483655706048012,
+ "grad_min_sv": 1.2939461641048311e-08,
+ "grad_condition": 24745167.039308526,
+ "lr": 0.0007938926261462363,
+ "time_sec": 49.83728241920471
+ },
+ {
+ "epoch": 46,
+ "train_loss": 2.157371569519043,
+ "train_acc": 0.42422,
+ "test_loss": 5.901077621459961,
+ "test_acc": 0.0536,
+ "lyapunov": null,
+ "grad_norm": 0.6810937554159694,
+ "grad_max_sv": 0.2453255333006382,
+ "grad_min_sv": 1.2790355725933455e-08,
+ "grad_condition": 42427572.437124,
+ "lr": 0.0007853567838422158,
+ "time_sec": 49.83260989189148
+ },
+ {
+ "epoch": 47,
+ "train_loss": 2.1449081243896484,
+ "train_acc": 0.42456,
+ "test_loss": 6.075893556213379,
+ "test_acc": 0.042,
+ "lyapunov": null,
+ "grad_norm": 0.677274699872145,
+ "grad_max_sv": 0.23359011709690095,
+ "grad_min_sv": 1.2604452173659019e-08,
+ "grad_condition": 23439756.57327797,
+ "lr": 0.0007766957746216719,
+ "time_sec": 49.81248760223389
+ },
+ {
+ "epoch": 48,
+ "train_loss": 2.121114821166992,
+ "train_acc": 0.43062,
+ "test_loss": 6.324017465209961,
+ "test_acc": 0.0699,
+ "lyapunov": null,
+ "grad_norm": 0.6768119432582711,
+ "grad_max_sv": 0.23583042696118356,
+ "grad_min_sv": 1.2428631641914211e-08,
+ "grad_condition": 26576129.087632615,
+ "lr": 0.0007679133974894982,
+ "time_sec": 49.85111737251282
+ },
+ {
+ "epoch": 49,
+ "train_loss": 2.1201681073760987,
+ "train_acc": 0.43092,
+ "test_loss": 5.493146458435058,
+ "test_acc": 0.0673,
+ "lyapunov": null,
+ "grad_norm": 0.6795448834334495,
+ "grad_max_sv": 0.24224164076149463,
+ "grad_min_sv": 1.2691686027133109e-08,
+ "grad_condition": 24348457.963241145,
+ "lr": 0.000759013504686565,
+ "time_sec": 49.81028628349304
+ },
+ {
+ "epoch": 50,
+ "train_loss": 2.082837229309082,
+ "train_acc": 0.4386,
+ "test_loss": 6.459659493255615,
+ "test_acc": 0.0616,
+ "lyapunov": null,
+ "grad_norm": 0.6728576224616372,
+ "grad_max_sv": 0.23022082336246968,
+ "grad_min_sv": 1.2368064503109899e-08,
+ "grad_condition": 23985269.670404635,
+ "lr": 0.0007499999999999998,
+ "time_sec": 49.82207798957825
+ },
+ {
+ "epoch": 51,
+ "train_loss": 2.0762338228607176,
+ "train_acc": 0.43984,
+ "test_loss": 6.028357986450195,
+ "test_acc": 0.0474,
+ "lyapunov": null,
+ "grad_norm": 0.671786463321322,
+ "grad_max_sv": 0.23933242298662663,
+ "grad_min_sv": 1.2453496028852485e-08,
+ "grad_condition": 27468424.752658807,
+ "lr": 0.0007408768370508575,
+ "time_sec": 49.839146852493286
+ },
+ {
+ "epoch": 52,
+ "train_loss": 2.068026172409058,
+ "train_acc": 0.44324,
+ "test_loss": 6.386326299285889,
+ "test_acc": 0.0521,
+ "lyapunov": null,
+ "grad_norm": 0.6708600139651663,
+ "grad_max_sv": 0.24169348366558552,
+ "grad_min_sv": 1.2435446072878164e-08,
+ "grad_condition": 53682617.89361428,
+ "lr": 0.0007316480175599307,
+ "time_sec": 49.84106373786926
+ },
+ {
+ "epoch": 53,
+ "train_loss": 2.0512850422668456,
+ "train_acc": 0.44514,
+ "test_loss": 5.693611965942383,
+ "test_acc": 0.0412,
+ "lyapunov": null,
+ "grad_norm": 0.6693562330574987,
+ "grad_max_sv": 0.23974683545529843,
+ "grad_min_sv": 1.2387516072631665e-08,
+ "grad_condition": 26566156.55520319,
+ "lr": 0.0007223175895924635,
+ "time_sec": 49.83973002433777
+ },
+ {
+ "epoch": 54,
+ "train_loss": 2.0340771446990966,
+ "train_acc": 0.45072,
+ "test_loss": 6.135411253356933,
+ "test_acc": 0.0562,
+ "lyapunov": null,
+ "grad_norm": 0.6690638479693323,
+ "grad_max_sv": 0.23783069401979445,
+ "grad_min_sv": 1.2572742053018614e-08,
+ "grad_condition": 21778321.765234537,
+ "lr": 0.0007128896457825361,
+ "time_sec": 49.87506914138794
+ },
+ {
+ "epoch": 55,
+ "train_loss": 2.0094136617279053,
+ "train_acc": 0.45566,
+ "test_loss": 5.745096834564209,
+ "test_acc": 0.0572,
+ "lyapunov": null,
+ "grad_norm": 0.6669166301057209,
+ "grad_max_sv": 0.23878032267093657,
+ "grad_min_sv": 1.231176157273639e-08,
+ "grad_condition": 29310923.371788334,
+ "lr": 0.0007033683215378998,
+ "time_sec": 49.82778191566467
+ },
+ {
+ "epoch": 56,
+ "train_loss": 2.0006568963241578,
+ "train_acc": 0.457,
+ "test_loss": 6.5824570434570315,
+ "test_acc": 0.0501,
+ "lyapunov": null,
+ "grad_norm": 0.6683455061699762,
+ "grad_max_sv": 0.23399036526679992,
+ "grad_min_sv": 1.2379160156672509e-08,
+ "grad_condition": 42922377.98757514,
+ "lr": 0.0006937577932260512,
+ "time_sec": 49.85116100311279
+ },
+ {
+ "epoch": 57,
+ "train_loss": 1.9894362976074218,
+ "train_acc": 0.45838,
+ "test_loss": 6.51012366104126,
+ "test_acc": 0.0442,
+ "lyapunov": null,
+ "grad_norm": 0.6646066170012002,
+ "grad_max_sv": 0.23274879157543182,
+ "grad_min_sv": 1.238940085523943e-08,
+ "grad_condition": 24070465.15252796,
+ "lr": 0.0006840622763423388,
+ "time_sec": 49.8274929523468
+ },
+ {
+ "epoch": 58,
+ "train_loss": 1.9678663694000245,
+ "train_acc": 0.46314,
+ "test_loss": 6.619851453399658,
+ "test_acc": 0.0576,
+ "lyapunov": null,
+ "grad_norm": 0.6643541450786883,
+ "grad_max_sv": 0.23393345512449742,
+ "grad_min_sv": 1.2389777363092103e-08,
+ "grad_condition": 38285129.517120846,
+ "lr": 0.0006742860236609073,
+ "time_sec": 49.837411880493164
+ },
+ {
+ "epoch": 59,
+ "train_loss": 1.965532445755005,
+ "train_acc": 0.46532,
+ "test_loss": 7.184655822753906,
+ "test_acc": 0.0412,
+ "lyapunov": null,
+ "grad_norm": 0.6645069826423124,
+ "grad_max_sv": 0.23921045735478402,
+ "grad_min_sv": 1.2522070774040328e-08,
+ "grad_condition": 95635689.47436689,
+ "lr": 0.0006644333233692913,
+ "time_sec": 49.82288122177124
+ },
+ {
+ "epoch": 60,
+ "train_loss": 1.9421441039657592,
+ "train_acc": 0.46942,
+ "test_loss": 6.0968818130493165,
+ "test_acc": 0.0396,
+ "lyapunov": null,
+ "grad_norm": 0.6647686483063734,
+ "grad_max_sv": 0.23022540807723998,
+ "grad_min_sv": 1.2435142121569597e-08,
+ "grad_condition": 36516212.89900361,
+ "lr": 0.0006545084971874734,
+ "time_sec": 49.836525440216064
+ },
+ {
+ "epoch": 61,
+ "train_loss": 1.9307384226989746,
+ "train_acc": 0.4713,
+ "test_loss": 7.351404643249512,
+ "test_acc": 0.0467,
+ "lyapunov": null,
+ "grad_norm": 0.6598071015542969,
+ "grad_max_sv": 0.23300293684005738,
+ "grad_min_sv": 1.2553449488250656e-08,
+ "grad_condition": 21336349.83542385,
+ "lr": 0.0006445158984722354,
+ "time_sec": 49.81679058074951
+ },
+ {
+ "epoch": 62,
+ "train_loss": 1.9107242463684082,
+ "train_acc": 0.47584,
+ "test_loss": 7.41353745803833,
+ "test_acc": 0.0564,
+ "lyapunov": null,
+ "grad_norm": 0.6632922829797736,
+ "grad_max_sv": 0.23702187687158585,
+ "grad_min_sv": 1.256866596290214e-08,
+ "grad_condition": 414252068.6680373,
+ "lr": 0.0006344599103076324,
+ "time_sec": 49.81079959869385
+ },
+ {
+ "epoch": 63,
+ "train_loss": 1.906180576171875,
+ "train_acc": 0.47704,
+ "test_loss": 8.345553895568848,
+ "test_acc": 0.0514,
+ "lyapunov": null,
+ "grad_norm": 0.6641303546175715,
+ "grad_max_sv": 0.23919319920241833,
+ "grad_min_sv": 1.2445030603269736e-08,
+ "grad_condition": 48181552.89073322,
+ "lr": 0.0006243449435824269,
+ "time_sec": 49.834824323654175
+ },
+ {
+ "epoch": 64,
+ "train_loss": 1.896571351852417,
+ "train_acc": 0.48022,
+ "test_loss": 7.706241481018067,
+ "test_acc": 0.0495,
+ "lyapunov": null,
+ "grad_norm": 0.6580911542263143,
+ "grad_max_sv": 0.233155807107687,
+ "grad_min_sv": 1.2258548102821176e-08,
+ "grad_condition": 147912368.09627536,
+ "lr": 0.0006141754350553275,
+ "time_sec": 49.827706813812256
+ },
+ {
+ "epoch": 65,
+ "train_loss": 1.8689342678833007,
+ "train_acc": 0.48694,
+ "test_loss": 7.604910266113281,
+ "test_acc": 0.068,
+ "lyapunov": null,
+ "grad_norm": 0.6601961376883955,
+ "grad_max_sv": 0.24266679622232915,
+ "grad_min_sv": 1.2337946858967385e-08,
+ "grad_condition": 109479288.75078002,
+ "lr": 0.0006039558454088793,
+ "time_sec": 49.847835063934326
+ },
+ {
+ "epoch": 66,
+ "train_loss": 1.8541412976837157,
+ "train_acc": 0.4913,
+ "test_loss": 7.621131346130371,
+ "test_acc": 0.0502,
+ "lyapunov": null,
+ "grad_norm": 0.6526859807082246,
+ "grad_max_sv": 0.22503522336483,
+ "grad_min_sv": 1.1999139423735094e-08,
+ "grad_condition": 27658012.606830657,
+ "lr": 0.000593690657292862,
+ "time_sec": 49.83453869819641
+ },
+ {
+ "epoch": 67,
+ "train_loss": 1.8500203356170655,
+ "train_acc": 0.4895,
+ "test_loss": 8.448241088867187,
+ "test_acc": 0.0602,
+ "lyapunov": null,
+ "grad_norm": 0.654584216781727,
+ "grad_max_sv": 0.23166645579040052,
+ "grad_min_sv": 1.2144356195328832e-08,
+ "grad_condition": 57526231.39027766,
+ "lr": 0.0005833843733580507,
+ "time_sec": 49.87798357009888
+ },
+ {
+ "epoch": 68,
+ "train_loss": 1.8333191384887695,
+ "train_acc": 0.49588,
+ "test_loss": 7.663671650695801,
+ "test_acc": 0.0539,
+ "lyapunov": null,
+ "grad_norm": 0.6550869721940646,
+ "grad_max_sv": 0.23333334550261497,
+ "grad_min_sv": 1.2233289833907257e-08,
+ "grad_condition": 24346438.395213075,
+ "lr": 0.0005730415142812054,
+ "time_sec": 49.82582187652588
+ },
+ {
+ "epoch": 69,
+ "train_loss": 1.8119923030090332,
+ "train_acc": 0.50032,
+ "test_loss": 7.175043432617188,
+ "test_acc": 0.0712,
+ "lyapunov": null,
+ "grad_norm": 0.6513215911180641,
+ "grad_max_sv": 0.2193699970841408,
+ "grad_min_sv": 1.1865115855103081e-08,
+ "grad_condition": 26929150.493882775,
+ "lr": 0.0005626666167821517,
+ "time_sec": 49.80794405937195
+ },
+ {
+ "epoch": 70,
+ "train_loss": 1.8089694079589844,
+ "train_acc": 0.49764,
+ "test_loss": 7.612014476013184,
+ "test_acc": 0.0538,
+ "lyapunov": null,
+ "grad_norm": 0.6557711961342083,
+ "grad_max_sv": 0.23481616117060183,
+ "grad_min_sv": 1.21222042414465e-08,
+ "grad_condition": 49730665.95439996,
+ "lr": 0.0005522642316338265,
+ "time_sec": 49.81162214279175
+ },
+ {
+ "epoch": 71,
+ "train_loss": 1.794535770225525,
+ "train_acc": 0.50302,
+ "test_loss": 8.002939363861085,
+ "test_acc": 0.054,
+ "lyapunov": null,
+ "grad_norm": 0.6530360122929442,
+ "grad_max_sv": 0.22891747988760472,
+ "grad_min_sv": 1.2135645938160522e-08,
+ "grad_condition": 30239652.54848214,
+ "lr": 0.0005418389216661573,
+ "time_sec": 49.83351969718933
+ },
+ {
+ "epoch": 72,
+ "train_loss": 1.7888313204574584,
+ "train_acc": 0.50272,
+ "test_loss": 7.378663352966308,
+ "test_acc": 0.0477,
+ "lyapunov": null,
+ "grad_norm": 0.6515803468137452,
+ "grad_max_sv": 0.223580015450716,
+ "grad_min_sv": 1.2234114341730384e-08,
+ "grad_condition": 31177170.11021496,
+ "lr": 0.0005313952597646563,
+ "time_sec": 49.80682587623596
+ },
+ {
+ "epoch": 73,
+ "train_loss": 1.7610743871688843,
+ "train_acc": 0.51094,
+ "test_loss": 7.5734631568908695,
+ "test_acc": 0.0456,
+ "lyapunov": null,
+ "grad_norm": 0.6471442109164438,
+ "grad_max_sv": 0.23298447765409946,
+ "grad_min_sv": 1.2235564984808267e-08,
+ "grad_condition": 30205955.557135515,
+ "lr": 0.0005209378268645994,
+ "time_sec": 49.8284707069397
+ },
+ {
+ "epoch": 74,
+ "train_loss": 1.743510553855896,
+ "train_acc": 0.51648,
+ "test_loss": 8.115744052124024,
+ "test_acc": 0.0597,
+ "lyapunov": null,
+ "grad_norm": 0.6470361414945306,
+ "grad_max_sv": 0.22419601753354074,
+ "grad_min_sv": 1.175036056857981e-08,
+ "grad_condition": 44883670.89626708,
+ "lr": 0.0005104712099416781,
+ "time_sec": 49.81434655189514
+ },
+ {
+ "epoch": 75,
+ "train_loss": 1.732315214996338,
+ "train_acc": 0.5162,
+ "test_loss": 8.69449387588501,
+ "test_acc": 0.0443,
+ "lyapunov": null,
+ "grad_norm": 0.6534168175273212,
+ "grad_max_sv": 0.22915640994906425,
+ "grad_min_sv": 1.2120835880813362e-08,
+ "grad_condition": 30203938.86272805,
+ "lr": 0.0004999999999999996,
+ "time_sec": 49.822524070739746
+ },
+ {
+ "epoch": 76,
+ "train_loss": 1.7280053578186034,
+ "train_acc": 0.51708,
+ "test_loss": 8.161399678039551,
+ "test_acc": 0.0506,
+ "lyapunov": null,
+ "grad_norm": 0.6519718595623971,
+ "grad_max_sv": 0.22868257723748683,
+ "grad_min_sv": 1.1916949028967227e-08,
+ "grad_condition": 27392099.189085342,
+ "lr": 0.0004895287900583212,
+ "time_sec": 49.806185245513916
+ },
+ {
+ "epoch": 77,
+ "train_loss": 1.707364101486206,
+ "train_acc": 0.52106,
+ "test_loss": 8.635691497802734,
+ "test_acc": 0.0553,
+ "lyapunov": null,
+ "grad_norm": 0.6489518165829526,
+ "grad_max_sv": 0.22707784324884414,
+ "grad_min_sv": 1.21318999957154e-08,
+ "grad_condition": 22161799.719214164,
+ "lr": 0.0004790621731353997,
+ "time_sec": 49.8337197303772
+ },
+ {
+ "epoch": 78,
+ "train_loss": 1.699185922279358,
+ "train_acc": 0.52508,
+ "test_loss": 8.116340428161621,
+ "test_acc": 0.059,
+ "lyapunov": null,
+ "grad_norm": 0.6466631616175401,
+ "grad_max_sv": 0.2242755901068449,
+ "grad_min_sv": 1.197350978088263e-08,
+ "grad_condition": 22907889.143189352,
+ "lr": 0.000468604740235343,
+ "time_sec": 49.84882068634033
+ },
+ {
+ "epoch": 79,
+ "train_loss": 1.6851876223754882,
+ "train_acc": 0.53002,
+ "test_loss": 7.6594300460815425,
+ "test_acc": 0.0668,
+ "lyapunov": null,
+ "grad_norm": 0.6508056360794745,
+ "grad_max_sv": 0.22947054952383042,
+ "grad_min_sv": 1.2146863270084962e-08,
+ "grad_condition": 50400181.57036874,
+ "lr": 0.00045816107833384175,
+ "time_sec": 49.81526827812195
+ },
+ {
+ "epoch": 80,
+ "train_loss": 1.6667000872421265,
+ "train_acc": 0.53166,
+ "test_loss": 7.577922117614746,
+ "test_acc": 0.0581,
+ "lyapunov": null,
+ "grad_norm": 0.6484594553766964,
+ "grad_max_sv": 0.22649560272693633,
+ "grad_min_sv": 1.2028468630853606e-08,
+ "grad_condition": 33979879.18367102,
+ "lr": 0.0004477357683661729,
+ "time_sec": 49.79970574378967
+ },
+ {
+ "epoch": 81,
+ "train_loss": 1.6529949746704102,
+ "train_acc": 0.53676,
+ "test_loss": 7.7760236434936525,
+ "test_acc": 0.061,
+ "lyapunov": null,
+ "grad_norm": 0.6501069318076672,
+ "grad_max_sv": 0.22972256727516652,
+ "grad_min_sv": 1.196574576337213e-08,
+ "grad_condition": 396215587.1427422,
+ "lr": 0.00043733338321784746,
+ "time_sec": 49.81192994117737
+ },
+ {
+ "epoch": 82,
+ "train_loss": 1.6425591729736329,
+ "train_acc": 0.53686,
+ "test_loss": 7.6887285552978515,
+ "test_acc": 0.0449,
+ "lyapunov": null,
+ "grad_norm": 0.6461003642754752,
+ "grad_max_sv": 0.23114448301494123,
+ "grad_min_sv": 1.2002917063394513e-08,
+ "grad_condition": 58155843.95520236,
+ "lr": 0.0004269584857187939,
+ "time_sec": 49.80897355079651
+ },
+ {
+ "epoch": 83,
+ "train_loss": 1.6318637802124023,
+ "train_acc": 0.54154,
+ "test_loss": 7.384182490539551,
+ "test_acc": 0.0735,
+ "lyapunov": null,
+ "grad_norm": 0.639611071259903,
+ "grad_max_sv": 0.22576675675809382,
+ "grad_min_sv": 1.1820984322299943e-08,
+ "grad_condition": 61458281.56309018,
+ "lr": 0.0004166156266419484,
+ "time_sec": 49.81825590133667
+ },
+ {
+ "epoch": 84,
+ "train_loss": 1.6224907682418823,
+ "train_acc": 0.54502,
+ "test_loss": 6.842728860473633,
+ "test_acc": 0.0545,
+ "lyapunov": null,
+ "grad_norm": 0.6421226956015884,
+ "grad_max_sv": 0.21887084767222403,
+ "grad_min_sv": 1.1874146338408664e-08,
+ "grad_condition": 36085101.45868175,
+ "lr": 0.0004063093427071373,
+ "time_sec": 49.907301902770996
+ },
+ {
+ "epoch": 85,
+ "train_loss": 1.6129507275390624,
+ "train_acc": 0.5441,
+ "test_loss": 8.217321695709229,
+ "test_acc": 0.0637,
+ "lyapunov": null,
+ "grad_norm": 0.6427366718485839,
+ "grad_max_sv": 0.23318556658923625,
+ "grad_min_sv": 1.2124754387304871e-08,
+ "grad_condition": 42339311.94718243,
+ "lr": 0.0003960441545911199,
+ "time_sec": 49.83733892440796
+ },
+ {
+ "epoch": 86,
+ "train_loss": 1.5975109223556518,
+ "train_acc": 0.54868,
+ "test_loss": 7.930374978637695,
+ "test_acc": 0.0457,
+ "lyapunov": null,
+ "grad_norm": 0.648213394339368,
+ "grad_max_sv": 0.23059269934892654,
+ "grad_min_sv": 1.2111861368707676e-08,
+ "grad_condition": 42084970.06037265,
+ "lr": 0.0003858245649446718,
+ "time_sec": 49.827972412109375
+ },
+ {
+ "epoch": 87,
+ "train_loss": 1.5812813794708251,
+ "train_acc": 0.55458,
+ "test_loss": 7.960672058105469,
+ "test_acc": 0.0501,
+ "lyapunov": null,
+ "grad_norm": 0.6429264180119875,
+ "grad_max_sv": 0.2283397376537323,
+ "grad_min_sv": 1.2037938704190233e-08,
+ "grad_condition": 24951514.668881785,
+ "lr": 0.00037565505641757235,
+ "time_sec": 49.82942318916321
+ },
+ {
+ "epoch": 88,
+ "train_loss": 1.573117269897461,
+ "train_acc": 0.55398,
+ "test_loss": 8.257780656433106,
+ "test_acc": 0.0591,
+ "lyapunov": null,
+ "grad_norm": 0.6443323703742537,
+ "grad_max_sv": 0.22722676433622838,
+ "grad_min_sv": 1.201048842325303e-08,
+ "grad_condition": 22188712.23632911,
+ "lr": 0.00036554008969236695,
+ "time_sec": 49.86358904838562
+ },
+ {
+ "epoch": 89,
+ "train_loss": 1.5576643622207642,
+ "train_acc": 0.55992,
+ "test_loss": 8.274403761291504,
+ "test_acc": 0.041,
+ "lyapunov": null,
+ "grad_norm": 0.6402469644123193,
+ "grad_max_sv": 0.22650128416717052,
+ "grad_min_sv": 1.1862416463004343e-08,
+ "grad_condition": 35019834.9168684,
+ "lr": 0.0003554841015277638,
+ "time_sec": 49.83419132232666
+ },
+ {
+ "epoch": 90,
+ "train_loss": 1.549127948036194,
+ "train_acc": 0.56466,
+ "test_loss": 7.301855851745605,
+ "test_acc": 0.0718,
+ "lyapunov": null,
+ "grad_norm": 0.6449275085704251,
+ "grad_max_sv": 0.22556735202670097,
+ "grad_min_sv": 1.1762558954631075e-08,
+ "grad_condition": 21940981.03509561,
+ "lr": 0.000345491502812526,
+ "time_sec": 49.81568884849548
+ },
+ {
+ "epoch": 91,
+ "train_loss": 1.5344566452407837,
+ "train_acc": 0.56436,
+ "test_loss": 8.916962014770508,
+ "test_acc": 0.0515,
+ "lyapunov": null,
+ "grad_norm": 0.6463598068323441,
+ "grad_max_sv": 0.23813196495175362,
+ "grad_min_sv": 1.2199751642932855e-08,
+ "grad_condition": 45733250.122319184,
+ "lr": 0.0003355666766307081,
+ "time_sec": 49.839728355407715
+ },
+ {
+ "epoch": 92,
+ "train_loss": 1.5208702486419678,
+ "train_acc": 0.56684,
+ "test_loss": 8.993258874511719,
+ "test_acc": 0.054,
+ "lyapunov": null,
+ "grad_norm": 0.6391383040365451,
+ "grad_max_sv": 0.22249663844704629,
+ "grad_min_sv": 1.166908096122965e-08,
+ "grad_condition": 28597379.63678825,
+ "lr": 0.00032571397633909225,
+ "time_sec": 49.850322008132935
+ },
+ {
+ "epoch": 93,
+ "train_loss": 1.5081010787582398,
+ "train_acc": 0.57028,
+ "test_loss": 9.433806256103516,
+ "test_acc": 0.0535,
+ "lyapunov": null,
+ "grad_norm": 0.6456709453433311,
+ "grad_max_sv": 0.23419931791722776,
+ "grad_min_sv": 1.195185940633392e-08,
+ "grad_condition": 29245401.732327044,
+ "lr": 0.00031593772365766094,
+ "time_sec": 49.83537983894348
+ },
+ {
+ "epoch": 94,
+ "train_loss": 1.4969723129653931,
+ "train_acc": 0.57362,
+ "test_loss": 8.755092433166505,
+ "test_acc": 0.0528,
+ "lyapunov": null,
+ "grad_norm": 0.6461658506271033,
+ "grad_max_sv": 0.22756082080304624,
+ "grad_min_sv": 1.1912134220692926e-08,
+ "grad_condition": 23423387.436489962,
+ "lr": 0.0003062422067739483,
+ "time_sec": 49.80311179161072
+ },
+ {
+ "epoch": 95,
+ "train_loss": 2.9494932527923585,
+ "train_acc": 0.411,
+ "test_loss": 4.676254756927491,
+ "test_acc": 0.0505,
+ "lyapunov": null,
+ "grad_norm": 0.8335419963078607,
+ "grad_max_sv": 0.3271928407251835,
+ "grad_min_sv": 1.4720300411941168e-08,
+ "grad_condition": 24067860.441598095,
+ "lr": 0.00029663167846209965,
+ "time_sec": 49.814762115478516
+ },
+ {
+ "epoch": 96,
+ "train_loss": 3.6572426443481447,
+ "train_acc": 0.1492,
+ "test_loss": 5.234876950836181,
+ "test_acc": 0.0688,
+ "lyapunov": null,
+ "grad_norm": 0.5523560840003197,
+ "grad_max_sv": 0.18005239982157945,
+ "grad_min_sv": 9.93911985318341e-09,
+ "grad_condition": 91354773.39239445,
+ "lr": 0.00028711035421746345,
+ "time_sec": 49.84577131271362
+ },
+ {
+ "epoch": 97,
+ "train_loss": 3.3812893244171143,
+ "train_acc": 0.19184,
+ "test_loss": 4.862454182434082,
+ "test_acc": 0.077,
+ "lyapunov": null,
+ "grad_norm": 0.5636212270422577,
+ "grad_max_sv": 0.18343333192169667,
+ "grad_min_sv": 1.0359513497038009e-08,
+ "grad_condition": 20784291.458693452,
+ "lr": 0.00027768241040753615,
+ "time_sec": 49.83091354370117
+ },
+ {
+ "epoch": 98,
+ "train_loss": 3.179550113220215,
+ "train_acc": 0.2255,
+ "test_loss": 4.858168863677979,
+ "test_acc": 0.0807,
+ "lyapunov": null,
+ "grad_norm": 0.5839200776735536,
+ "grad_max_sv": 0.18244810923933982,
+ "grad_min_sv": 1.037966059214135e-08,
+ "grad_condition": 22427331.372158233,
+ "lr": 0.00026835198244006903,
+ "time_sec": 49.867558002471924
+ },
+ {
+ "epoch": 99,
+ "train_loss": 3.02292495223999,
+ "train_acc": 0.25396,
+ "test_loss": 5.169387593078613,
+ "test_acc": 0.0881,
+ "lyapunov": null,
+ "grad_norm": 0.595907429260728,
+ "grad_max_sv": 0.1938932089135051,
+ "grad_min_sv": 1.105600735823442e-08,
+ "grad_condition": 39890639.04859903,
+ "lr": 0.0002591231629491421,
+ "time_sec": 49.82200026512146
+ },
+ {
+ "epoch": 100,
+ "train_loss": 2.9043469207000734,
+ "train_acc": 0.27584,
+ "test_loss": 4.884814841461182,
+ "test_acc": 0.0989,
+ "lyapunov": null,
+ "grad_norm": 0.5987053513470115,
+ "grad_max_sv": 0.1915395434945822,
+ "grad_min_sv": 1.0967718520123356e-08,
+ "grad_condition": 507391317.2637795,
+ "lr": 0.0002499999999999997,
+ "time_sec": 49.835878133773804
+ },
+ {
+ "epoch": 101,
+ "train_loss": 2.8044686096191405,
+ "train_acc": 0.29558,
+ "test_loss": 4.889270275497436,
+ "test_acc": 0.0981,
+ "lyapunov": null,
+ "grad_norm": 0.6096838460034203,
+ "grad_max_sv": 0.20316330213099718,
+ "grad_min_sv": 1.1341824002197854e-08,
+ "grad_condition": 19853325.836087834,
+ "lr": 0.00024098649531343477,
+ "time_sec": 49.85874676704407
+ },
+ {
+ "epoch": 102,
+ "train_loss": 2.697149913482666,
+ "train_acc": 0.3167,
+ "test_loss": 4.92620325088501,
+ "test_acc": 0.1009,
+ "lyapunov": null,
+ "grad_norm": 0.6154909980411829,
+ "grad_max_sv": 0.20256872698664666,
+ "grad_min_sv": 1.1648207248748933e-08,
+ "grad_condition": 19320886.90158599,
+ "lr": 0.0002320866025105016,
+ "time_sec": 50.07639527320862
+ },
+ {
+ "epoch": 103,
+ "train_loss": 2.618629614944458,
+ "train_acc": 0.33036,
+ "test_loss": 5.49400161895752,
+ "test_acc": 0.1068,
+ "lyapunov": null,
+ "grad_norm": 0.6217563116117207,
+ "grad_max_sv": 0.20746214482933284,
+ "grad_min_sv": 1.1507716859981975e-08,
+ "grad_condition": 25949652.78149998,
+ "lr": 0.0002233042253783278,
+ "time_sec": 49.818949460983276
+ },
+ {
+ "epoch": 104,
+ "train_loss": 2.540534757156372,
+ "train_acc": 0.34564,
+ "test_loss": 4.9159078086853025,
+ "test_acc": 0.1126,
+ "lyapunov": null,
+ "grad_norm": 0.6217698336501172,
+ "grad_max_sv": 0.20552988573908806,
+ "grad_min_sv": 1.1522777731975964e-08,
+ "grad_condition": 21899890.551626954,
+ "lr": 0.000214643216157784,
+ "time_sec": 49.87585234642029
+ },
+ {
+ "epoch": 105,
+ "train_loss": 2.479596985321045,
+ "train_acc": 0.35746,
+ "test_loss": 5.100056993484497,
+ "test_acc": 0.1253,
+ "lyapunov": null,
+ "grad_norm": 0.6287156405132894,
+ "grad_max_sv": 0.2140802226960659,
+ "grad_min_sv": 1.1805095190275949e-08,
+ "grad_condition": 26208309.323742133,
+ "lr": 0.00020610737385376332,
+ "time_sec": 49.82085204124451
+ },
+ {
+ "epoch": 106,
+ "train_loss": 2.415481425552368,
+ "train_acc": 0.36924,
+ "test_loss": 4.742834524536133,
+ "test_acc": 0.1225,
+ "lyapunov": null,
+ "grad_norm": 0.6282670457594898,
+ "grad_max_sv": 0.21101173125207423,
+ "grad_min_sv": 1.1938832567004453e-08,
+ "grad_condition": 33782298.89931901,
+ "lr": 0.00019770044256881242,
+ "time_sec": 49.805906534194946
+ },
+ {
+ "epoch": 107,
+ "train_loss": 2.3521559171295165,
+ "train_acc": 0.38442,
+ "test_loss": 5.213879206848144,
+ "test_acc": 0.1211,
+ "lyapunov": null,
+ "grad_norm": 0.6335700941216259,
+ "grad_max_sv": 0.21410419717431067,
+ "grad_min_sv": 1.1941749475385954e-08,
+ "grad_condition": 22110752.957356386,
+ "lr": 0.0001894261098608447,
+ "time_sec": 49.83317017555237
+ },
+ {
+ "epoch": 108,
+ "train_loss": 2.302857539215088,
+ "train_acc": 0.39628,
+ "test_loss": 5.207193740844726,
+ "test_acc": 0.1285,
+ "lyapunov": null,
+ "grad_norm": 0.6359374602349686,
+ "grad_max_sv": 0.21151717714965343,
+ "grad_min_sv": 1.187537558844376e-08,
+ "grad_condition": 37488925.60398644,
+ "lr": 0.000181288005125655,
+ "time_sec": 49.82870650291443
+ },
+ {
+ "epoch": 109,
+ "train_loss": 2.2536745275878904,
+ "train_acc": 0.40138,
+ "test_loss": 5.2042837226867675,
+ "test_acc": 0.1322,
+ "lyapunov": null,
+ "grad_norm": 0.6289692207235398,
+ "grad_max_sv": 0.20782952345907688,
+ "grad_min_sv": 1.1739032497459779e-08,
+ "grad_condition": 29358916.829315763,
+ "lr": 0.0001732896980049473,
+ "time_sec": 49.83245229721069
+ },
+ {
+ "epoch": 110,
+ "train_loss": 2.2073010168457032,
+ "train_acc": 0.40866,
+ "test_loss": 5.739359895324707,
+ "test_acc": 0.1227,
+ "lyapunov": null,
+ "grad_norm": 0.6385992521842959,
+ "grad_max_sv": 0.2127275388687849,
+ "grad_min_sv": 1.1950131779958628e-08,
+ "grad_condition": 28764337.97746384,
+ "lr": 0.00016543469682057076,
+ "time_sec": 49.83092474937439
+ },
+ {
+ "epoch": 111,
+ "train_loss": 2.1692623610687254,
+ "train_acc": 0.41942,
+ "test_loss": 6.2040216323852535,
+ "test_acc": 0.1309,
+ "lyapunov": null,
+ "grad_norm": 0.6444316866103925,
+ "grad_max_sv": 0.21499809809029102,
+ "grad_min_sv": 1.1752886208693526e-08,
+ "grad_condition": 31962706.67450107,
+ "lr": 0.00015772644703565552,
+ "time_sec": 49.85021710395813
+ },
+ {
+ "epoch": 112,
+ "train_loss": 2.1302712613677977,
+ "train_acc": 0.42516,
+ "test_loss": 5.75790121383667,
+ "test_acc": 0.1399,
+ "lyapunov": null,
+ "grad_norm": 0.6329896331917518,
+ "grad_max_sv": 0.21649966202676296,
+ "grad_min_sv": 1.2179612900176106e-08,
+ "grad_condition": 34093436.46700279,
+ "lr": 0.00015016832974331713,
+ "time_sec": 49.81994557380676
+ },
+ {
+ "epoch": 113,
+ "train_loss": 2.1065593459701537,
+ "train_acc": 0.43386,
+ "test_loss": 6.140606423950195,
+ "test_acc": 0.1364,
+ "lyapunov": null,
+ "grad_norm": 0.6373030825503643,
+ "grad_max_sv": 0.2152324143797159,
+ "grad_min_sv": 1.191059096350422e-08,
+ "grad_condition": 24786528.45697539,
+ "lr": 0.00014276366018359834,
+ "time_sec": 49.832173347473145
+ },
+ {
+ "epoch": 114,
+ "train_loss": 2.0826868451690674,
+ "train_acc": 0.43754,
+ "test_loss": 7.314329501342773,
+ "test_acc": 0.1193,
+ "lyapunov": null,
+ "grad_norm": 0.6350963671857877,
+ "grad_max_sv": 0.2231900453567505,
+ "grad_min_sv": 1.2137735866390998e-08,
+ "grad_condition": 27948227.054936886,
+ "lr": 0.00013551568628929425,
+ "time_sec": 49.82054424285889
+ },
+ {
+ "epoch": 115,
+ "train_loss": 2.057500901184082,
+ "train_acc": 0.44596,
+ "test_loss": 5.995877742004395,
+ "test_acc": 0.1372,
+ "lyapunov": null,
+ "grad_norm": 0.6319121818844147,
+ "grad_max_sv": 0.2083717118948698,
+ "grad_min_sv": 1.1799914823723556e-08,
+ "grad_condition": 35488295.07860346,
+ "lr": 0.00012842758726130276,
+ "time_sec": 49.81160569190979
+ },
+ {
+ "epoch": 116,
+ "train_loss": 2.027409094619751,
+ "train_acc": 0.452,
+ "test_loss": 7.286285119628906,
+ "test_acc": 0.122,
+ "lyapunov": null,
+ "grad_norm": 0.639785065376269,
+ "grad_max_sv": 0.2164283238351345,
+ "grad_min_sv": 1.1941236867721305e-08,
+ "grad_condition": 66360354.77809191,
+ "lr": 0.0001215024721741218,
+ "time_sec": 49.836623191833496
+ },
+ {
+ "epoch": 117,
+ "train_loss": 1.998638267250061,
+ "train_acc": 0.45694,
+ "test_loss": 6.76222890625,
+ "test_acc": 0.1205,
+ "lyapunov": null,
+ "grad_norm": 0.6411689060332757,
+ "grad_max_sv": 0.21728002466261387,
+ "grad_min_sv": 1.186145185405607e-08,
+ "grad_condition": 25472303.080288395,
+ "lr": 0.00011474337861210538,
+ "time_sec": 49.835474252700806
+ },
+ {
+ "epoch": 118,
+ "train_loss": 1.9871974803924561,
+ "train_acc": 0.46078,
+ "test_loss": 6.990749812316895,
+ "test_acc": 0.1306,
+ "lyapunov": null,
+ "grad_norm": 0.6401613879770299,
+ "grad_max_sv": 0.21996232829988002,
+ "grad_min_sv": 1.212309715947768e-08,
+ "grad_condition": 43599185.89621965,
+ "lr": 0.00010815327133708009,
+ "time_sec": 49.82992196083069
+ },
+ {
+ "epoch": 119,
+ "train_loss": 1.9558954917144775,
+ "train_acc": 0.46806,
+ "test_loss": 6.338745205688476,
+ "test_acc": 0.1423,
+ "lyapunov": null,
+ "grad_norm": 0.6380666956188763,
+ "grad_max_sv": 0.21726358123123646,
+ "grad_min_sv": 1.1924941875629536e-08,
+ "grad_condition": 23332267.546088994,
+ "lr": 0.00010173504098790182,
+ "time_sec": 49.8153715133667
+ },
+ {
+ "epoch": 120,
+ "train_loss": 1.9510743766784668,
+ "train_acc": 0.46974,
+ "test_loss": 6.733411245727539,
+ "test_acc": 0.1243,
+ "lyapunov": null,
+ "grad_norm": 0.6418284890195846,
+ "grad_max_sv": 0.22671268545091153,
+ "grad_min_sv": 1.199444485400214e-08,
+ "grad_condition": 24711059.275352217,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 49.81182289123535
+ },
+ {
+ "epoch": 121,
+ "train_loss": 1.9362508995819092,
+ "train_acc": 0.47356,
+ "test_loss": 6.134232345581054,
+ "test_acc": 0.1378,
+ "lyapunov": null,
+ "grad_norm": 0.6346296231277031,
+ "grad_max_sv": 0.21598901376128196,
+ "grad_min_sv": 1.1970328496480053e-08,
+ "grad_condition": 25346274.751641985,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 49.83584427833557
+ },
+ {
+ "epoch": 122,
+ "train_loss": 1.9162643937683106,
+ "train_acc": 0.4749,
+ "test_loss": 7.639575733947754,
+ "test_acc": 0.1265,
+ "lyapunov": null,
+ "grad_norm": 0.6378739210927734,
+ "grad_max_sv": 0.21739229559898376,
+ "grad_min_sv": 1.1819409628278932e-08,
+ "grad_condition": 181332693.33855394,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 49.82065296173096
+ },
+ {
+ "epoch": 123,
+ "train_loss": 1.9041280354309083,
+ "train_acc": 0.47994,
+ "test_loss": 6.308480444335937,
+ "test_acc": 0.1392,
+ "lyapunov": null,
+ "grad_norm": 0.6332843460906636,
+ "grad_max_sv": 0.21474863290786744,
+ "grad_min_sv": 1.1848325226493373e-08,
+ "grad_condition": 30395117.45243178,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 49.83568549156189
+ },
+ {
+ "epoch": 124,
+ "train_loss": 1.888980817489624,
+ "train_acc": 0.48018,
+ "test_loss": 6.931203792572021,
+ "test_acc": 0.1361,
+ "lyapunov": null,
+ "grad_norm": 0.6468989904611825,
+ "grad_max_sv": 0.22639431655406952,
+ "grad_min_sv": 1.2179835734427157e-08,
+ "grad_condition": 27031913.997842442,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 49.86228370666504
+ },
+ {
+ "epoch": 125,
+ "train_loss": 1.8688794164657592,
+ "train_acc": 0.48822,
+ "test_loss": 7.4782632530212405,
+ "test_acc": 0.132,
+ "lyapunov": null,
+ "grad_norm": 0.6436381282742432,
+ "grad_max_sv": 0.21808561868965626,
+ "grad_min_sv": 1.21570175322383e-08,
+ "grad_condition": 33380104.6057067,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 49.83109521865845
+ },
+ {
+ "epoch": 126,
+ "train_loss": 1.8640016136932374,
+ "train_acc": 0.491,
+ "test_loss": 6.5455432174682615,
+ "test_acc": 0.1403,
+ "lyapunov": null,
+ "grad_norm": 0.6367336212592833,
+ "grad_max_sv": 0.22216320559382438,
+ "grad_min_sv": 1.1826145895899032e-08,
+ "grad_condition": 33022831.75443542,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 49.83457159996033
+ },
+ {
+ "epoch": 127,
+ "train_loss": 1.8510954288101196,
+ "train_acc": 0.4882,
+ "test_loss": 7.0682084793090825,
+ "test_acc": 0.1326,
+ "lyapunov": null,
+ "grad_norm": 0.6431259646730736,
+ "grad_max_sv": 0.22209820635616778,
+ "grad_min_sv": 1.2136436526935524e-08,
+ "grad_condition": 66497220.94224206,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 49.83670258522034
+ },
+ {
+ "epoch": 128,
+ "train_loss": 1.8453027178573609,
+ "train_acc": 0.49042,
+ "test_loss": 6.2842555938720706,
+ "test_acc": 0.1305,
+ "lyapunov": null,
+ "grad_norm": 0.6383805845227949,
+ "grad_max_sv": 0.21130143105983734,
+ "grad_min_sv": 1.1917887206280842e-08,
+ "grad_condition": 43204631.05359116,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 49.81800961494446
+ },
+ {
+ "epoch": 129,
+ "train_loss": 1.8346676333618164,
+ "train_acc": 0.4945,
+ "test_loss": 6.274330713653565,
+ "test_acc": 0.1391,
+ "lyapunov": null,
+ "grad_norm": 0.6376052549176046,
+ "grad_max_sv": 0.2089413482695818,
+ "grad_min_sv": 1.1727769512470676e-08,
+ "grad_condition": 27159660.544945084,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 49.845595598220825
+ },
+ {
+ "epoch": 130,
+ "train_loss": 1.830022028465271,
+ "train_acc": 0.49474,
+ "test_loss": 6.249729978942871,
+ "test_acc": 0.1459,
+ "lyapunov": null,
+ "grad_norm": 0.6453711202585213,
+ "grad_max_sv": 0.2190984409302473,
+ "grad_min_sv": 1.2224324771881178e-08,
+ "grad_condition": 22960059.51271691,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 49.87020516395569
+ },
+ {
+ "epoch": 131,
+ "train_loss": 1.8177084483337402,
+ "train_acc": 0.49802,
+ "test_loss": 6.943641340637207,
+ "test_acc": 0.1332,
+ "lyapunov": null,
+ "grad_norm": 0.6440523788025603,
+ "grad_max_sv": 0.21554723903536796,
+ "grad_min_sv": 1.1872820722402811e-08,
+ "grad_condition": 25176936.12047171,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 49.89444398880005
+ },
+ {
+ "epoch": 132,
+ "train_loss": 1.8117612997817993,
+ "train_acc": 0.4992,
+ "test_loss": 7.735134202575684,
+ "test_acc": 0.1244,
+ "lyapunov": null,
+ "grad_norm": 0.6458623734804945,
+ "grad_max_sv": 0.2287333384156227,
+ "grad_min_sv": 1.2116058153988085e-08,
+ "grad_condition": 23082329.335862808,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 49.84588980674744
+ },
+ {
+ "epoch": 133,
+ "train_loss": 1.811845332069397,
+ "train_acc": 0.50014,
+ "test_loss": 7.118609297180176,
+ "test_acc": 0.1331,
+ "lyapunov": null,
+ "grad_norm": 0.638841020277806,
+ "grad_max_sv": 0.21471160911023618,
+ "grad_min_sv": 1.1894429352565794e-08,
+ "grad_condition": 24148328.84591496,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 49.831459283828735
+ },
+ {
+ "epoch": 134,
+ "train_loss": 1.8001032112121582,
+ "train_acc": 0.50294,
+ "test_loss": 7.107429740142822,
+ "test_acc": 0.1282,
+ "lyapunov": null,
+ "grad_norm": 0.6464497671620558,
+ "grad_max_sv": 0.23182750679552555,
+ "grad_min_sv": 1.2161121044212964e-08,
+ "grad_condition": 54577461.874021314,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 49.83904433250427
+ },
+ {
+ "epoch": 135,
+ "train_loss": 1.7929331283569336,
+ "train_acc": 0.50366,
+ "test_loss": 7.344893767547608,
+ "test_acc": 0.1271,
+ "lyapunov": null,
+ "grad_norm": 0.6435222264694869,
+ "grad_max_sv": 0.2192435622215271,
+ "grad_min_sv": 1.2271505814287487e-08,
+ "grad_condition": 22236846.49951817,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 49.82794523239136
+ },
+ {
+ "epoch": 136,
+ "train_loss": 1.8045927509307862,
+ "train_acc": 0.49886,
+ "test_loss": 8.085471559143066,
+ "test_acc": 0.1207,
+ "lyapunov": null,
+ "grad_norm": 0.6382347842581513,
+ "grad_max_sv": 0.22427703253924847,
+ "grad_min_sv": 1.216163273837223e-08,
+ "grad_condition": 28207277.011594873,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 49.88175678253174
+ },
+ {
+ "epoch": 137,
+ "train_loss": 1.7832990637588502,
+ "train_acc": 0.50496,
+ "test_loss": 6.688453459167481,
+ "test_acc": 0.1334,
+ "lyapunov": null,
+ "grad_norm": 0.6418151086385053,
+ "grad_max_sv": 0.21794002875685692,
+ "grad_min_sv": 1.2034389010318058e-08,
+ "grad_condition": 22793569.96555335,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 49.84071898460388
+ },
+ {
+ "epoch": 138,
+ "train_loss": 1.7905620854187012,
+ "train_acc": 0.50572,
+ "test_loss": 7.2380154365539555,
+ "test_acc": 0.129,
+ "lyapunov": null,
+ "grad_norm": 0.6407824951102813,
+ "grad_max_sv": 0.22645330876111985,
+ "grad_min_sv": 1.2214871658589033e-08,
+ "grad_condition": 20569116.284954578,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 49.84640121459961
+ },
+ {
+ "epoch": 139,
+ "train_loss": 1.788800776901245,
+ "train_acc": 0.50604,
+ "test_loss": 7.676028425598145,
+ "test_acc": 0.1308,
+ "lyapunov": null,
+ "grad_norm": 0.6393065831907885,
+ "grad_max_sv": 0.2201111435890198,
+ "grad_min_sv": 1.206703041933821e-08,
+ "grad_condition": 28068636.701712035,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 49.82333970069885
+ },
+ {
+ "epoch": 140,
+ "train_loss": 1.7775352002334595,
+ "train_acc": 0.50992,
+ "test_loss": 6.824903617858887,
+ "test_acc": 0.1382,
+ "lyapunov": null,
+ "grad_norm": 0.6429938723422318,
+ "grad_max_sv": 0.21460832096636295,
+ "grad_min_sv": 1.17411291786218e-08,
+ "grad_condition": 31960287.943684638,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 49.83107376098633
+ },
+ {
+ "epoch": 141,
+ "train_loss": 1.7772767013931274,
+ "train_acc": 0.50912,
+ "test_loss": 8.417906446838378,
+ "test_acc": 0.1201,
+ "lyapunov": null,
+ "grad_norm": 0.6414560412377437,
+ "grad_max_sv": 0.22789728231728076,
+ "grad_min_sv": 1.2347990069327964e-08,
+ "grad_condition": 21519591.2698054,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 49.830055475234985
+ },
+ {
+ "epoch": 142,
+ "train_loss": 1.7722079333496095,
+ "train_acc": 0.5074,
+ "test_loss": 7.479126264190674,
+ "test_acc": 0.1332,
+ "lyapunov": null,
+ "grad_norm": 0.6492349389016402,
+ "grad_max_sv": 0.23224957659840584,
+ "grad_min_sv": 1.2359584963816949e-08,
+ "grad_condition": 23310731.56809649,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 49.821824073791504
+ },
+ {
+ "epoch": 143,
+ "train_loss": 1.7706715833282471,
+ "train_acc": 0.50882,
+ "test_loss": 6.759830638885498,
+ "test_acc": 0.1312,
+ "lyapunov": null,
+ "grad_norm": 0.6386303224852788,
+ "grad_max_sv": 0.21973421648144723,
+ "grad_min_sv": 1.2129359658330508e-08,
+ "grad_condition": 22303453.162939433,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 49.82608699798584
+ },
+ {
+ "epoch": 144,
+ "train_loss": 1.770061126937866,
+ "train_acc": 0.51042,
+ "test_loss": 8.168591398620606,
+ "test_acc": 0.1265,
+ "lyapunov": null,
+ "grad_norm": 0.6443170070907279,
+ "grad_max_sv": 0.22507050447165966,
+ "grad_min_sv": 1.2152392936393141e-08,
+ "grad_condition": 22873019.852206793,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 49.8205029964447
+ },
+ {
+ "epoch": 145,
+ "train_loss": 1.7649179027938844,
+ "train_acc": 0.509,
+ "test_loss": 7.854398386383057,
+ "test_acc": 0.1211,
+ "lyapunov": null,
+ "grad_norm": 0.63938639247204,
+ "grad_max_sv": 0.22039102129638194,
+ "grad_min_sv": 1.1966107968386375e-08,
+ "grad_condition": 29791248.29023991,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 49.8352313041687
+ },
+ {
+ "epoch": 146,
+ "train_loss": 1.771636342201233,
+ "train_acc": 0.50926,
+ "test_loss": 7.595294637298584,
+ "test_acc": 0.1263,
+ "lyapunov": null,
+ "grad_norm": 0.6439134858087602,
+ "grad_max_sv": 0.22073593139648437,
+ "grad_min_sv": 1.1903592189027589e-08,
+ "grad_condition": 36630674.258442916,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 49.85316801071167
+ },
+ {
+ "epoch": 147,
+ "train_loss": 1.7654109023666382,
+ "train_acc": 0.50992,
+ "test_loss": 7.858496125793457,
+ "test_acc": 0.1228,
+ "lyapunov": null,
+ "grad_norm": 0.6452120448477214,
+ "grad_max_sv": 0.21640395522117614,
+ "grad_min_sv": 1.1791314735720703e-08,
+ "grad_condition": 36184836.96072569,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 49.80920720100403
+ },
+ {
+ "epoch": 148,
+ "train_loss": 1.76628436378479,
+ "train_acc": 0.50766,
+ "test_loss": 8.274021264648438,
+ "test_acc": 0.1088,
+ "lyapunov": null,
+ "grad_norm": 0.6448148716908921,
+ "grad_max_sv": 0.22330073527991773,
+ "grad_min_sv": 1.2051270137369841e-08,
+ "grad_condition": 21403660.781028073,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 49.84639763832092
+ },
+ {
+ "epoch": 149,
+ "train_loss": 1.7641568323135377,
+ "train_acc": 0.50932,
+ "test_loss": 7.1706701782226565,
+ "test_acc": 0.1418,
+ "lyapunov": null,
+ "grad_norm": 0.6419761185100763,
+ "grad_max_sv": 0.22420972734689712,
+ "grad_min_sv": 1.2012330221494726e-08,
+ "grad_condition": 44951323.39984313,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 49.835381269454956
+ },
+ {
+ "epoch": 150,
+ "train_loss": 1.7616498372650147,
+ "train_acc": 0.51152,
+ "test_loss": 7.837383623504639,
+ "test_acc": 0.1182,
+ "lyapunov": null,
+ "grad_norm": 0.6426676505435569,
+ "grad_max_sv": 0.21811567358672618,
+ "grad_min_sv": 1.1744335026014906e-08,
+ "grad_condition": 40653937.072005436,
+ "lr": 0.0,
+ "time_sec": 49.85364270210266
+ }
+ ],
+ "16": [
+ {
+ "epoch": 1,
+ "train_loss": 4.790666111755371,
+ "train_acc": 0.0165,
+ "test_loss": 4.9503300064086915,
+ "test_acc": 0.01,
+ "lyapunov": null,
+ "grad_norm": 5.291697588876432,
+ "grad_max_sv": 4.663330984115601,
+ "grad_min_sv": 7.994122603882659e-08,
+ "grad_condition": 204227559.8068969,
+ "lr": 0.0009998903417374227,
+ "time_sec": 66.97809171676636
+ },
+ {
+ "epoch": 2,
+ "train_loss": 4.437635167236328,
+ "train_acc": 0.03372,
+ "test_loss": 4.9434486038208005,
+ "test_acc": 0.0109,
+ "lyapunov": null,
+ "grad_norm": 3.3795440241281205,
+ "grad_max_sv": 2.9110051512718202,
+ "grad_min_sv": 5.2089944511252154e-08,
+ "grad_condition": 566186137.812573,
+ "lr": 0.0009995614150494292,
+ "time_sec": 66.91377472877502
+ },
+ {
+ "epoch": 3,
+ "train_loss": 4.26833670211792,
+ "train_acc": 0.04816,
+ "test_loss": 4.993957643127441,
+ "test_acc": 0.0118,
+ "lyapunov": null,
+ "grad_norm": 2.265691942587348,
+ "grad_max_sv": 1.775827443599701,
+ "grad_min_sv": 3.447322165783806e-08,
+ "grad_condition": 193597124.56597418,
+ "lr": 0.0009990133642141358,
+ "time_sec": 66.95397591590881
+ },
+ {
+ "epoch": 4,
+ "train_loss": 4.126825766448975,
+ "train_acc": 0.0657,
+ "test_loss": 5.033058495330811,
+ "test_acc": 0.0133,
+ "lyapunov": null,
+ "grad_norm": 1.503639209245557,
+ "grad_max_sv": 0.996296688914299,
+ "grad_min_sv": 2.3224798484378083e-08,
+ "grad_condition": 47352815.280070126,
+ "lr": 0.0009982464296247522,
+ "time_sec": 66.94082856178284
+ },
+ {
+ "epoch": 5,
+ "train_loss": 4.033032944335938,
+ "train_acc": 0.07788,
+ "test_loss": 5.366096397399902,
+ "test_acc": 0.0146,
+ "lyapunov": null,
+ "grad_norm": 1.2167707155197347,
+ "grad_max_sv": 0.7315087422728539,
+ "grad_min_sv": 1.914776174977151e-08,
+ "grad_condition": 65647468.63073953,
+ "lr": 0.0009972609476841367,
+ "time_sec": 66.9649748802185
+ },
+ {
+ "epoch": 6,
+ "train_loss": 3.9636214042663576,
+ "train_acc": 0.08816,
+ "test_loss": 5.34757041015625,
+ "test_acc": 0.0149,
+ "lyapunov": null,
+ "grad_norm": 1.109160273746945,
+ "grad_max_sv": 0.6089150205254554,
+ "grad_min_sv": 1.7710445950058773e-08,
+ "grad_condition": 77884060.5331116,
+ "lr": 0.000996057350657239,
+ "time_sec": 66.97061657905579
+ },
+ {
+ "epoch": 7,
+ "train_loss": 3.9122159162902834,
+ "train_acc": 0.09544,
+ "test_loss": 5.439447886657715,
+ "test_acc": 0.013,
+ "lyapunov": null,
+ "grad_norm": 1.0363457541084344,
+ "grad_max_sv": 0.5376138880848884,
+ "grad_min_sv": 1.6374132377761085e-08,
+ "grad_condition": 48186425.879532695,
+ "lr": 0.000994636166481494,
+ "time_sec": 67.02947664260864
+ },
+ {
+ "epoch": 8,
+ "train_loss": 3.860605283126831,
+ "train_acc": 0.10604,
+ "test_loss": 5.774677875518798,
+ "test_acc": 0.0152,
+ "lyapunov": null,
+ "grad_norm": 0.9855402112805093,
+ "grad_max_sv": 0.5275192707777023,
+ "grad_min_sv": 1.6650217127267554e-08,
+ "grad_condition": 36767266.40486912,
+ "lr": 0.0009929980185352525,
+ "time_sec": 66.97124218940735
+ },
+ {
+ "epoch": 9,
+ "train_loss": 3.8149237147521973,
+ "train_acc": 0.11454,
+ "test_loss": 5.3070202072143555,
+ "test_acc": 0.0222,
+ "lyapunov": null,
+ "grad_norm": 0.9330412728543993,
+ "grad_max_sv": 0.4647836610674858,
+ "grad_min_sv": 1.5222168972539585e-08,
+ "grad_condition": 49307207.804101914,
+ "lr": 0.0009911436253643444,
+ "time_sec": 67.01966977119446
+ },
+ {
+ "epoch": 10,
+ "train_loss": 3.7818530071258545,
+ "train_acc": 0.12014,
+ "test_loss": 5.634545847320557,
+ "test_acc": 0.0199,
+ "lyapunov": null,
+ "grad_norm": 0.8719008089031304,
+ "grad_max_sv": 0.40649077892303465,
+ "grad_min_sv": 1.4515182727992126e-08,
+ "grad_condition": 38341756.409908436,
+ "lr": 0.0009890738003669028,
+ "time_sec": 67.23870015144348
+ },
+ {
+ "epoch": 11,
+ "train_loss": 3.743896211090088,
+ "train_acc": 0.12462,
+ "test_loss": 5.8831702270507815,
+ "test_acc": 0.0241,
+ "lyapunov": null,
+ "grad_norm": 0.8436698179223415,
+ "grad_max_sv": 0.39998230785131456,
+ "grad_min_sv": 1.4137996530785845e-08,
+ "grad_condition": 231359110.35725895,
+ "lr": 0.00098678945143658,
+ "time_sec": 67.23693895339966
+ },
+ {
+ "epoch": 12,
+ "train_loss": 3.7158116050720214,
+ "train_acc": 0.12962,
+ "test_loss": 5.8489625442504884,
+ "test_acc": 0.0182,
+ "lyapunov": null,
+ "grad_norm": 0.8103156188684312,
+ "grad_max_sv": 0.36918022111058235,
+ "grad_min_sv": 1.3637384886633352e-08,
+ "grad_condition": 38409273.56149448,
+ "lr": 0.0009842915805643154,
+ "time_sec": 67.05321264266968
+ },
+ {
+ "epoch": 13,
+ "train_loss": 3.690355722808838,
+ "train_acc": 0.13444,
+ "test_loss": 5.952298941802979,
+ "test_acc": 0.0139,
+ "lyapunov": null,
+ "grad_norm": 0.7799393076966175,
+ "grad_max_sv": 0.3450939729809761,
+ "grad_min_sv": 1.3063578439224261e-08,
+ "grad_condition": 267805312.78349906,
+ "lr": 0.000981581283398829,
+ "time_sec": 67.01498341560364
+ },
+ {
+ "epoch": 14,
+ "train_loss": 3.660913709640503,
+ "train_acc": 0.13974,
+ "test_loss": 5.962563812255859,
+ "test_acc": 0.0157,
+ "lyapunov": null,
+ "grad_norm": 0.7562346727823589,
+ "grad_max_sv": 0.3272464439272881,
+ "grad_min_sv": 1.2569073787327411e-08,
+ "grad_condition": 28603602.411010243,
+ "lr": 0.0009786597487660333,
+ "time_sec": 67.02658581733704
+ },
+ {
+ "epoch": 15,
+ "train_loss": 3.6474139246368407,
+ "train_acc": 0.14148,
+ "test_loss": 6.562283952331543,
+ "test_acc": 0.0135,
+ "lyapunov": null,
+ "grad_norm": 0.7393349403998549,
+ "grad_max_sv": 0.33356437757611274,
+ "grad_min_sv": 1.2411575255055763e-08,
+ "grad_condition": 43624327.61961842,
+ "lr": 0.0009755282581475766,
+ "time_sec": 67.03324222564697
+ },
+ {
+ "epoch": 16,
+ "train_loss": 3.625168949737549,
+ "train_acc": 0.1432,
+ "test_loss": 6.292130155944824,
+ "test_acc": 0.0141,
+ "lyapunov": null,
+ "grad_norm": 0.7144248820011195,
+ "grad_max_sv": 0.31020588912069796,
+ "grad_min_sv": 1.2080284056414925e-08,
+ "grad_condition": 29549483.252300274,
+ "lr": 0.0009721881851187403,
+ "time_sec": 66.97783041000366
+ },
+ {
+ "epoch": 17,
+ "train_loss": 3.597680552520752,
+ "train_acc": 0.14858,
+ "test_loss": 6.235865226745606,
+ "test_acc": 0.0101,
+ "lyapunov": null,
+ "grad_norm": 0.6905264720289787,
+ "grad_max_sv": 0.2911532886326313,
+ "grad_min_sv": 1.1886577161446255e-08,
+ "grad_condition": 31227215.280764975,
+ "lr": 0.0009686409947459456,
+ "time_sec": 67.08970355987549
+ },
+ {
+ "epoch": 18,
+ "train_loss": 3.5831439966583254,
+ "train_acc": 0.1503,
+ "test_loss": 5.975571099853515,
+ "test_acc": 0.0174,
+ "lyapunov": null,
+ "grad_norm": 0.6807202195385632,
+ "grad_max_sv": 0.28772652372717855,
+ "grad_min_sv": 1.1393226486029751e-08,
+ "grad_condition": 137655636.45168823,
+ "lr": 0.0009648882429441254,
+ "time_sec": 66.99836611747742
+ },
+ {
+ "epoch": 19,
+ "train_loss": 3.5665633306121824,
+ "train_acc": 0.15322,
+ "test_loss": 5.7967665618896485,
+ "test_acc": 0.0147,
+ "lyapunov": null,
+ "grad_norm": 0.6692239217191613,
+ "grad_max_sv": 0.289702807366848,
+ "grad_min_sv": 1.1524174722138403e-08,
+ "grad_condition": 43837157.90767797,
+ "lr": 0.00096093157579425,
+ "time_sec": 66.98469638824463
+ },
+ {
+ "epoch": 20,
+ "train_loss": 3.5485270121765136,
+ "train_acc": 0.15842,
+ "test_loss": 6.38743748626709,
+ "test_acc": 0.0106,
+ "lyapunov": null,
+ "grad_norm": 0.6524234858247975,
+ "grad_max_sv": 0.2710107877850533,
+ "grad_min_sv": 1.1343318032097648e-08,
+ "grad_condition": 27194748.912352692,
+ "lr": 0.0009567727288213001,
+ "time_sec": 66.97950530052185
+ },
+ {
+ "epoch": 21,
+ "train_loss": 3.5387647283172607,
+ "train_acc": 0.15974,
+ "test_loss": 6.142497198486328,
+ "test_acc": 0.0122,
+ "lyapunov": null,
+ "grad_norm": 0.6404971752730705,
+ "grad_max_sv": 0.25612146519124507,
+ "grad_min_sv": 1.1065940866417101e-08,
+ "grad_condition": 27020698.902072392,
+ "lr": 0.0009524135262330095,
+ "time_sec": 67.06527757644653
+ },
+ {
+ "epoch": 22,
+ "train_loss": 3.5167810900115968,
+ "train_acc": 0.16126,
+ "test_loss": 5.6688673957824705,
+ "test_acc": 0.0192,
+ "lyapunov": null,
+ "grad_norm": 0.6273838486372684,
+ "grad_max_sv": 0.253273681178689,
+ "grad_min_sv": 1.0633086347869302e-08,
+ "grad_condition": 63663927.521495186,
+ "lr": 0.0009478558801197061,
+ "time_sec": 67.08625936508179
+ },
+ {
+ "epoch": 23,
+ "train_loss": 3.505348560180664,
+ "train_acc": 0.16408,
+ "test_loss": 6.704450527191162,
+ "test_acc": 0.0106,
+ "lyapunov": null,
+ "grad_norm": 0.6205013434735249,
+ "grad_max_sv": 0.24795704074203967,
+ "grad_min_sv": 1.0544875683748956e-08,
+ "grad_condition": 26930900.301938236,
+ "lr": 0.000943101789615607,
+ "time_sec": 67.07537865638733
+ },
+ {
+ "epoch": 24,
+ "train_loss": 3.487646808624268,
+ "train_acc": 0.16852,
+ "test_loss": 6.14088282699585,
+ "test_acc": 0.0215,
+ "lyapunov": null,
+ "grad_norm": 0.614195126220202,
+ "grad_max_sv": 0.24658647775650025,
+ "grad_min_sv": 1.0614721224211365e-08,
+ "grad_condition": 25409602.645818073,
+ "lr": 0.0009381533400219313,
+ "time_sec": 67.04035305976868
+ },
+ {
+ "epoch": 25,
+ "train_loss": 3.476624384918213,
+ "train_acc": 0.16722,
+ "test_loss": 6.3985797378540035,
+ "test_acc": 0.0153,
+ "lyapunov": null,
+ "grad_norm": 0.6065663518942211,
+ "grad_max_sv": 0.24001154042780398,
+ "grad_min_sv": 1.0449337081719356e-08,
+ "grad_condition": 26892625.00106412,
+ "lr": 0.0009330127018922189,
+ "time_sec": 66.98434329032898
+ },
+ {
+ "epoch": 26,
+ "train_loss": 3.451528890914917,
+ "train_acc": 0.17194,
+ "test_loss": 7.005337218475342,
+ "test_acc": 0.0161,
+ "lyapunov": null,
+ "grad_norm": 0.5958316341461533,
+ "grad_max_sv": 0.23011010847985744,
+ "grad_min_sv": 1.0420057322546583e-08,
+ "grad_condition": 25092916.983647533,
+ "lr": 0.000927682130080253,
+ "time_sec": 67.00863981246948
+ },
+ {
+ "epoch": 27,
+ "train_loss": 3.438732011184692,
+ "train_acc": 0.17512,
+ "test_loss": 6.713776673126221,
+ "test_acc": 0.0158,
+ "lyapunov": null,
+ "grad_norm": 0.5885432606585439,
+ "grad_max_sv": 0.22313685715198517,
+ "grad_min_sv": 1.0256330273961112e-08,
+ "grad_condition": 25498257.67463268,
+ "lr": 0.0009221639627510072,
+ "time_sec": 66.99373292922974
+ },
+ {
+ "epoch": 28,
+ "train_loss": 3.425728820877075,
+ "train_acc": 0.17648,
+ "test_loss": 6.706079711914063,
+ "test_acc": 0.0161,
+ "lyapunov": null,
+ "grad_norm": 0.5776306796513797,
+ "grad_max_sv": 0.21763003207743167,
+ "grad_min_sv": 1.0131521277489953e-08,
+ "grad_condition": 25502860.727228213,
+ "lr": 0.0009164606203550494,
+ "time_sec": 66.99960255622864
+ },
+ {
+ "epoch": 29,
+ "train_loss": 3.415288860321045,
+ "train_acc": 0.18104,
+ "test_loss": 7.00422691116333,
+ "test_acc": 0.0154,
+ "lyapunov": null,
+ "grad_norm": 0.5811456709025584,
+ "grad_max_sv": 0.2154564827680588,
+ "grad_min_sv": 1.0227832727971453e-08,
+ "grad_condition": 23155291.155594237,
+ "lr": 0.0009105746045668516,
+ "time_sec": 67.00278520584106
+ },
+ {
+ "epoch": 30,
+ "train_loss": 3.3993768449401855,
+ "train_acc": 0.18168,
+ "test_loss": 6.7661912048339845,
+ "test_acc": 0.0159,
+ "lyapunov": null,
+ "grad_norm": 0.5774334611780905,
+ "grad_max_sv": 0.21602067165076733,
+ "grad_min_sv": 9.999383252662363e-09,
+ "grad_condition": 46830102.49335132,
+ "lr": 0.0009045084971874733,
+ "time_sec": 67.01802110671997
+ },
+ {
+ "epoch": 31,
+ "train_loss": 3.39102335395813,
+ "train_acc": 0.183,
+ "test_loss": 6.575534628295898,
+ "test_acc": 0.0259,
+ "lyapunov": null,
+ "grad_norm": 0.5750391869831528,
+ "grad_max_sv": 0.21328589245676993,
+ "grad_min_sv": 1.0037052611266972e-08,
+ "grad_condition": 25219793.844095282,
+ "lr": 0.0008982649590120977,
+ "time_sec": 66.98685121536255
+ },
+ {
+ "epoch": 32,
+ "train_loss": 3.3709024705505373,
+ "train_acc": 0.1847,
+ "test_loss": 6.773156211090088,
+ "test_acc": 0.0241,
+ "lyapunov": null,
+ "grad_norm": 0.5682008127495727,
+ "grad_max_sv": 0.20905940011143684,
+ "grad_min_sv": 9.929261479690864e-09,
+ "grad_condition": 24026442.614084087,
+ "lr": 0.0008918467286629196,
+ "time_sec": 66.98118853569031
+ },
+ {
+ "epoch": 33,
+ "train_loss": 3.35322883605957,
+ "train_acc": 0.19048,
+ "test_loss": 6.544390415191651,
+ "test_acc": 0.0174,
+ "lyapunov": null,
+ "grad_norm": 0.5641011790857979,
+ "grad_max_sv": 0.21131759136915207,
+ "grad_min_sv": 9.970292436448092e-09,
+ "grad_condition": 108439933.80954358,
+ "lr": 0.0008852566213878943,
+ "time_sec": 67.0021116733551
+ },
+ {
+ "epoch": 34,
+ "train_loss": 3.346888256225586,
+ "train_acc": 0.1906,
+ "test_loss": 6.572783890533447,
+ "test_acc": 0.0249,
+ "lyapunov": null,
+ "grad_norm": 0.5631657519504247,
+ "grad_max_sv": 0.20612632147967816,
+ "grad_min_sv": 9.939895384558639e-09,
+ "grad_condition": 27859013.00420784,
+ "lr": 0.000878497527825878,
+ "time_sec": 66.99292349815369
+ },
+ {
+ "epoch": 35,
+ "train_loss": 3.3364852532958986,
+ "train_acc": 0.19192,
+ "test_loss": 6.624941380310059,
+ "test_acc": 0.0267,
+ "lyapunov": null,
+ "grad_norm": 0.5605769760458655,
+ "grad_max_sv": 0.20491612255573272,
+ "grad_min_sv": 9.870486683549728e-09,
+ "grad_condition": 23146292.907969765,
+ "lr": 0.000871572412738697,
+ "time_sec": 66.99680066108704
+ },
+ {
+ "epoch": 36,
+ "train_loss": 3.3320838648986815,
+ "train_acc": 0.19194,
+ "test_loss": 6.509025389099121,
+ "test_acc": 0.0338,
+ "lyapunov": null,
+ "grad_norm": 0.5514752672797416,
+ "grad_max_sv": 0.19631769321858883,
+ "grad_min_sv": 9.801347783389147e-09,
+ "grad_condition": 22925424.744912885,
+ "lr": 0.0008644843137107055,
+ "time_sec": 67.00271224975586
+ },
+ {
+ "epoch": 37,
+ "train_loss": 3.3248722314453123,
+ "train_acc": 0.19368,
+ "test_loss": 6.660050495910644,
+ "test_acc": 0.0232,
+ "lyapunov": null,
+ "grad_norm": 0.5549782000253485,
+ "grad_max_sv": 0.20016637705266477,
+ "grad_min_sv": 9.80520761806325e-09,
+ "grad_condition": 43150496.42441137,
+ "lr": 0.0008572363398164014,
+ "time_sec": 67.00392818450928
+ },
+ {
+ "epoch": 38,
+ "train_loss": 3.3040303685760497,
+ "train_acc": 0.1978,
+ "test_loss": 6.438115409851074,
+ "test_acc": 0.0278,
+ "lyapunov": null,
+ "grad_norm": 0.552679160616354,
+ "grad_max_sv": 0.20150073878467084,
+ "grad_min_sv": 9.978901688301178e-09,
+ "grad_condition": 24404614.851154737,
+ "lr": 0.0008498316702566826,
+ "time_sec": 66.97884392738342
+ },
+ {
+ "epoch": 39,
+ "train_loss": 3.295093801422119,
+ "train_acc": 0.2004,
+ "test_loss": 6.857768655395508,
+ "test_acc": 0.0356,
+ "lyapunov": null,
+ "grad_norm": 0.5456414300888803,
+ "grad_max_sv": 0.19542820267379285,
+ "grad_min_sv": 9.64108341980352e-09,
+ "grad_condition": 38418267.99625971,
+ "lr": 0.0008422735529643442,
+ "time_sec": 66.989262342453
+ },
+ {
+ "epoch": 40,
+ "train_loss": 3.2807973724365236,
+ "train_acc": 0.20254,
+ "test_loss": 7.183624605560302,
+ "test_acc": 0.0288,
+ "lyapunov": null,
+ "grad_norm": 0.5502236317298648,
+ "grad_max_sv": 0.20073941312730312,
+ "grad_min_sv": 9.736421222039659e-09,
+ "grad_condition": 23971099.963185668,
+ "lr": 0.0008345653031794289,
+ "time_sec": 67.05479025840759
+ },
+ {
+ "epoch": 41,
+ "train_loss": 3.27089994934082,
+ "train_acc": 0.20396,
+ "test_loss": 7.336966199493408,
+ "test_acc": 0.0235,
+ "lyapunov": null,
+ "grad_norm": 0.5476662910413355,
+ "grad_max_sv": 0.19763046652078628,
+ "grad_min_sv": 9.775574641435192e-09,
+ "grad_condition": 23640934.778466806,
+ "lr": 0.0008267103019950526,
+ "time_sec": 67.02259588241577
+ },
+ {
+ "epoch": 42,
+ "train_loss": 3.2620423323059082,
+ "train_acc": 0.20586,
+ "test_loss": 6.97865482788086,
+ "test_acc": 0.0258,
+ "lyapunov": null,
+ "grad_norm": 0.5434507884263167,
+ "grad_max_sv": 0.19267416559159756,
+ "grad_min_sv": 9.676590862622846e-09,
+ "grad_condition": 32692140.861607928,
+ "lr": 0.0008187119948743447,
+ "time_sec": 67.11938738822937
+ },
+ {
+ "epoch": 43,
+ "train_loss": 3.246746938018799,
+ "train_acc": 0.20984,
+ "test_loss": 7.017108020019531,
+ "test_acc": 0.027,
+ "lyapunov": null,
+ "grad_norm": 0.5396772430481056,
+ "grad_max_sv": 0.1911445375531912,
+ "grad_min_sv": 9.706909992468482e-09,
+ "grad_condition": 22347408.62738797,
+ "lr": 0.000810573890139155,
+ "time_sec": 67.11671566963196
+ },
+ {
+ "epoch": 44,
+ "train_loss": 3.2492278230285643,
+ "train_acc": 0.20804,
+ "test_loss": 6.893268182373047,
+ "test_acc": 0.0274,
+ "lyapunov": null,
+ "grad_norm": 0.5383084022428465,
+ "grad_max_sv": 0.18535939790308475,
+ "grad_min_sv": 9.539425227522713e-09,
+ "grad_condition": 74582506.47418927,
+ "lr": 0.0008022995574311873,
+ "time_sec": 67.00796937942505
+ },
+ {
+ "epoch": 45,
+ "train_loss": 3.2271074884796143,
+ "train_acc": 0.2125,
+ "test_loss": 6.6321695571899415,
+ "test_acc": 0.0298,
+ "lyapunov": null,
+ "grad_norm": 0.5350882941371298,
+ "grad_max_sv": 0.18614536896348,
+ "grad_min_sv": 9.520675481561152e-09,
+ "grad_condition": 519972815.1749519,
+ "lr": 0.0007938926261462363,
+ "time_sec": 67.05224251747131
+ },
+ {
+ "epoch": 46,
+ "train_loss": 3.223205012207031,
+ "train_acc": 0.21378,
+ "test_loss": 8.111690937805175,
+ "test_acc": 0.0245,
+ "lyapunov": null,
+ "grad_norm": 0.5313315491107766,
+ "grad_max_sv": 0.18769054301083088,
+ "grad_min_sv": 9.561545546987737e-09,
+ "grad_condition": 22558726.834869802,
+ "lr": 0.0007853567838422158,
+ "time_sec": 67.02692914009094
+ },
+ {
+ "epoch": 47,
+ "train_loss": 3.2102231874084475,
+ "train_acc": 0.21366,
+ "test_loss": 7.20476734161377,
+ "test_acc": 0.0268,
+ "lyapunov": null,
+ "grad_norm": 0.5300596779522426,
+ "grad_max_sv": 0.18552429899573325,
+ "grad_min_sv": 9.575782686233047e-09,
+ "grad_condition": 21495882.964656584,
+ "lr": 0.0007766957746216719,
+ "time_sec": 67.0929958820343
+ },
+ {
+ "epoch": 48,
+ "train_loss": 3.202328568191528,
+ "train_acc": 0.21738,
+ "test_loss": 7.143350020599366,
+ "test_acc": 0.0275,
+ "lyapunov": null,
+ "grad_norm": 0.5275781384357864,
+ "grad_max_sv": 0.18636706620454788,
+ "grad_min_sv": 9.551907610705345e-09,
+ "grad_condition": 33257654.14790963,
+ "lr": 0.0007679133974894982,
+ "time_sec": 67.10289525985718
+ },
+ {
+ "epoch": 49,
+ "train_loss": 3.1964333237457274,
+ "train_acc": 0.21696,
+ "test_loss": 7.0859999771118165,
+ "test_acc": 0.0354,
+ "lyapunov": null,
+ "grad_norm": 0.5290459768999093,
+ "grad_max_sv": 0.18547305800020694,
+ "grad_min_sv": 9.539052431978278e-09,
+ "grad_condition": 34652740.14328016,
+ "lr": 0.000759013504686565,
+ "time_sec": 67.11912679672241
+ },
+ {
+ "epoch": 50,
+ "train_loss": 3.1868507556152346,
+ "train_acc": 0.2195,
+ "test_loss": 7.204959943389893,
+ "test_acc": 0.0247,
+ "lyapunov": null,
+ "grad_norm": 0.5304998310773968,
+ "grad_max_sv": 0.1833030626177788,
+ "grad_min_sv": 9.589407306935527e-09,
+ "grad_condition": 93768948.14927751,
+ "lr": 0.0007499999999999998,
+ "time_sec": 67.06959462165833
+ },
+ {
+ "epoch": 51,
+ "train_loss": 3.1883190923309326,
+ "train_acc": 0.21784,
+ "test_loss": 7.328389108276367,
+ "test_acc": 0.0303,
+ "lyapunov": null,
+ "grad_norm": 0.5248467282170762,
+ "grad_max_sv": 0.18131516128778458,
+ "grad_min_sv": 9.465690375617952e-09,
+ "grad_condition": 47668215.59636396,
+ "lr": 0.0007408768370508575,
+ "time_sec": 67.01846742630005
+ },
+ {
+ "epoch": 52,
+ "train_loss": 3.1719473053741454,
+ "train_acc": 0.22166,
+ "test_loss": 8.36594852142334,
+ "test_acc": 0.025,
+ "lyapunov": null,
+ "grad_norm": 0.5248103969653446,
+ "grad_max_sv": 0.17532115392386913,
+ "grad_min_sv": 9.532304753867572e-09,
+ "grad_condition": 26041874.469802074,
+ "lr": 0.0007316480175599307,
+ "time_sec": 67.03516387939453
+ },
+ {
+ "epoch": 53,
+ "train_loss": 3.1698596488952635,
+ "train_acc": 0.22132,
+ "test_loss": 8.36387837677002,
+ "test_acc": 0.0251,
+ "lyapunov": null,
+ "grad_norm": 0.5233372908286834,
+ "grad_max_sv": 0.17466790974140167,
+ "grad_min_sv": 9.286205268632663e-09,
+ "grad_condition": 21363168.099911686,
+ "lr": 0.0007223175895924635,
+ "time_sec": 67.02187657356262
+ },
+ {
+ "epoch": 54,
+ "train_loss": 3.152655903167725,
+ "train_acc": 0.22722,
+ "test_loss": 8.196963485717774,
+ "test_acc": 0.0261,
+ "lyapunov": null,
+ "grad_norm": 0.5285400405038103,
+ "grad_max_sv": 0.17916450947523116,
+ "grad_min_sv": 9.4594759324218e-09,
+ "grad_condition": 82291006.99579689,
+ "lr": 0.0007128896457825361,
+ "time_sec": 66.97509050369263
+ },
+ {
+ "epoch": 55,
+ "train_loss": 3.1408946729278564,
+ "train_acc": 0.22896,
+ "test_loss": 8.031216970825195,
+ "test_acc": 0.0238,
+ "lyapunov": null,
+ "grad_norm": 0.5251164499697153,
+ "grad_max_sv": 0.17466633953154087,
+ "grad_min_sv": 9.452194638104316e-09,
+ "grad_condition": 22653052.01456701,
+ "lr": 0.0007033683215378998,
+ "time_sec": 67.00176858901978
+ },
+ {
+ "epoch": 56,
+ "train_loss": 3.1348105377960205,
+ "train_acc": 0.22832,
+ "test_loss": 8.950087960815429,
+ "test_acc": 0.0204,
+ "lyapunov": null,
+ "grad_norm": 0.5200008300943049,
+ "grad_max_sv": 0.17119008600711821,
+ "grad_min_sv": 9.414464659240895e-09,
+ "grad_condition": 31689823.38588159,
+ "lr": 0.0006937577932260512,
+ "time_sec": 66.97579646110535
+ },
+ {
+ "epoch": 57,
+ "train_loss": 3.1169134953308104,
+ "train_acc": 0.23282,
+ "test_loss": 8.065475146484374,
+ "test_acc": 0.0311,
+ "lyapunov": null,
+ "grad_norm": 0.5241244870526487,
+ "grad_max_sv": 0.17154259756207466,
+ "grad_min_sv": 9.529985643685902e-09,
+ "grad_condition": 28312826.48374013,
+ "lr": 0.0006840622763423388,
+ "time_sec": 66.9856812953949
+ },
+ {
+ "epoch": 58,
+ "train_loss": 3.1234397563171385,
+ "train_acc": 0.22962,
+ "test_loss": 8.583345112609864,
+ "test_acc": 0.0222,
+ "lyapunov": null,
+ "grad_norm": 0.5197452718406793,
+ "grad_max_sv": 0.17415275909006595,
+ "grad_min_sv": 9.31348687893685e-09,
+ "grad_condition": 21270072.13306666,
+ "lr": 0.0006742860236609073,
+ "time_sec": 66.99910068511963
+ },
+ {
+ "epoch": 59,
+ "train_loss": 3.1087922663879395,
+ "train_acc": 0.23302,
+ "test_loss": 8.37566005859375,
+ "test_acc": 0.0239,
+ "lyapunov": null,
+ "grad_norm": 0.5182628480059946,
+ "grad_max_sv": 0.17543886601924896,
+ "grad_min_sv": 9.358361164474304e-09,
+ "grad_condition": 31647391.583267204,
+ "lr": 0.0006644333233692913,
+ "time_sec": 66.97189855575562
+ },
+ {
+ "epoch": 60,
+ "train_loss": 3.0956507678985594,
+ "train_acc": 0.23662,
+ "test_loss": 7.7532292655944826,
+ "test_acc": 0.0248,
+ "lyapunov": null,
+ "grad_norm": 0.5195814358053482,
+ "grad_max_sv": 0.1776260558515787,
+ "grad_min_sv": 9.643665624392561e-09,
+ "grad_condition": 22666276.356990974,
+ "lr": 0.0006545084971874734,
+ "time_sec": 67.00041198730469
+ },
+ {
+ "epoch": 61,
+ "train_loss": 3.092038777694702,
+ "train_acc": 0.23596,
+ "test_loss": 7.946604266357422,
+ "test_acc": 0.0245,
+ "lyapunov": null,
+ "grad_norm": 0.5196921425232948,
+ "grad_max_sv": 0.17445886991918086,
+ "grad_min_sv": 9.508607204389285e-09,
+ "grad_condition": 21427055.017691903,
+ "lr": 0.0006445158984722354,
+ "time_sec": 67.06589937210083
+ },
+ {
+ "epoch": 62,
+ "train_loss": 3.079979831466675,
+ "train_acc": 0.23898,
+ "test_loss": 9.319492291259765,
+ "test_acc": 0.0213,
+ "lyapunov": null,
+ "grad_norm": 0.5186454829421666,
+ "grad_max_sv": 0.16986236572265626,
+ "grad_min_sv": 9.32054670874094e-09,
+ "grad_condition": 31246817.26616311,
+ "lr": 0.0006344599103076324,
+ "time_sec": 66.99018096923828
+ },
+ {
+ "epoch": 63,
+ "train_loss": 3.0727787420654296,
+ "train_acc": 0.23906,
+ "test_loss": 8.948303262329102,
+ "test_acc": 0.0269,
+ "lyapunov": null,
+ "grad_norm": 0.5175233947350019,
+ "grad_max_sv": 0.16513913124799728,
+ "grad_min_sv": 9.338011380810585e-09,
+ "grad_condition": 24005876.4941143,
+ "lr": 0.0006243449435824269,
+ "time_sec": 66.9405734539032
+ },
+ {
+ "epoch": 64,
+ "train_loss": 3.074298862915039,
+ "train_acc": 0.23708,
+ "test_loss": 9.195949301147461,
+ "test_acc": 0.0262,
+ "lyapunov": null,
+ "grad_norm": 0.5221855467062518,
+ "grad_max_sv": 0.17083160430192948,
+ "grad_min_sv": 9.452190228090296e-09,
+ "grad_condition": 48343788.07302423,
+ "lr": 0.0006141754350553275,
+ "time_sec": 67.0041880607605
+ },
+ {
+ "epoch": 65,
+ "train_loss": 3.0613560808563234,
+ "train_acc": 0.24008,
+ "test_loss": 8.735752813720703,
+ "test_acc": 0.0271,
+ "lyapunov": null,
+ "grad_norm": 0.5207095947451149,
+ "grad_max_sv": 0.1693739652633667,
+ "grad_min_sv": 9.425346239599897e-09,
+ "grad_condition": 23106579.847053923,
+ "lr": 0.0006039558454088793,
+ "time_sec": 66.9728434085846
+ },
+ {
+ "epoch": 66,
+ "train_loss": 3.050594620132446,
+ "train_acc": 0.243,
+ "test_loss": 8.672268884277344,
+ "test_acc": 0.0298,
+ "lyapunov": null,
+ "grad_norm": 0.5161820441185401,
+ "grad_max_sv": 0.1685989484190941,
+ "grad_min_sv": 9.325516864278071e-09,
+ "grad_condition": 20646125.746492933,
+ "lr": 0.000593690657292862,
+ "time_sec": 66.97670912742615
+ },
+ {
+ "epoch": 67,
+ "train_loss": 3.0404045782470703,
+ "train_acc": 0.2468,
+ "test_loss": 9.001078883361817,
+ "test_acc": 0.0227,
+ "lyapunov": null,
+ "grad_norm": 0.5184119200981759,
+ "grad_max_sv": 0.1701225485652685,
+ "grad_min_sv": 9.472868531257284e-09,
+ "grad_condition": 23517656.45251561,
+ "lr": 0.0005833843733580507,
+ "time_sec": 66.96425604820251
+ },
+ {
+ "epoch": 68,
+ "train_loss": 3.0347717694091796,
+ "train_acc": 0.24578,
+ "test_loss": 8.55764455871582,
+ "test_acc": 0.0204,
+ "lyapunov": null,
+ "grad_norm": 0.5177787618737804,
+ "grad_max_sv": 0.17245440557599068,
+ "grad_min_sv": 9.351008802005456e-09,
+ "grad_condition": 26504498.6419156,
+ "lr": 0.0005730415142812054,
+ "time_sec": 66.987557888031
+ },
+ {
+ "epoch": 69,
+ "train_loss": 3.0343177091979983,
+ "train_acc": 0.24472,
+ "test_loss": 8.6480171875,
+ "test_acc": 0.0252,
+ "lyapunov": null,
+ "grad_norm": 0.5144704452610198,
+ "grad_max_sv": 0.16564900018274784,
+ "grad_min_sv": 9.403833016452534e-09,
+ "grad_condition": 27296778.54875686,
+ "lr": 0.0005626666167821517,
+ "time_sec": 66.97946643829346
+ },
+ {
+ "epoch": 70,
+ "train_loss": 3.019142656097412,
+ "train_acc": 0.25006,
+ "test_loss": 8.915339315795899,
+ "test_acc": 0.0291,
+ "lyapunov": null,
+ "grad_norm": 0.5199788677371252,
+ "grad_max_sv": 0.16652515456080436,
+ "grad_min_sv": 9.64339011144677e-09,
+ "grad_condition": 23020050.410736304,
+ "lr": 0.0005522642316338265,
+ "time_sec": 66.97834086418152
+ },
+ {
+ "epoch": 71,
+ "train_loss": 3.0120436127471923,
+ "train_acc": 0.25124,
+ "test_loss": 9.489800686645507,
+ "test_acc": 0.0229,
+ "lyapunov": null,
+ "grad_norm": 0.5170392758240284,
+ "grad_max_sv": 0.16549308113753797,
+ "grad_min_sv": 9.466763362109277e-09,
+ "grad_condition": 23186013.564122196,
+ "lr": 0.0005418389216661573,
+ "time_sec": 66.98612070083618
+ },
+ {
+ "epoch": 72,
+ "train_loss": 3.005094768676758,
+ "train_acc": 0.25262,
+ "test_loss": 9.240029809570313,
+ "test_acc": 0.0228,
+ "lyapunov": null,
+ "grad_norm": 0.5193656479358113,
+ "grad_max_sv": 0.16801112554967404,
+ "grad_min_sv": 9.608471449040756e-09,
+ "grad_condition": 72045711.1919595,
+ "lr": 0.0005313952597646563,
+ "time_sec": 66.99170446395874
+ },
+ {
+ "epoch": 73,
+ "train_loss": 2.9903506928253174,
+ "train_acc": 0.25404,
+ "test_loss": 9.075869140625,
+ "test_acc": 0.0255,
+ "lyapunov": null,
+ "grad_norm": 0.517195719023633,
+ "grad_max_sv": 0.16475822702050208,
+ "grad_min_sv": 9.421488161853731e-09,
+ "grad_condition": 20088448.14143536,
+ "lr": 0.0005209378268645994,
+ "time_sec": 66.99337768554688
+ },
+ {
+ "epoch": 74,
+ "train_loss": 2.9886431184387208,
+ "train_acc": 0.25206,
+ "test_loss": 8.946782205200195,
+ "test_acc": 0.0216,
+ "lyapunov": null,
+ "grad_norm": 0.5156132053442515,
+ "grad_max_sv": 0.1671187650412321,
+ "grad_min_sv": 9.546754539679903e-09,
+ "grad_condition": 20526453.312863432,
+ "lr": 0.0005104712099416781,
+ "time_sec": 66.97370409965515
+ },
+ {
+ "epoch": 75,
+ "train_loss": 2.978247420654297,
+ "train_acc": 0.25748,
+ "test_loss": 8.795244805908203,
+ "test_acc": 0.0265,
+ "lyapunov": null,
+ "grad_norm": 0.5172367229977752,
+ "grad_max_sv": 0.16712253615260125,
+ "grad_min_sv": 9.516156018046784e-09,
+ "grad_condition": 30249731.938419342,
+ "lr": 0.0004999999999999996,
+ "time_sec": 67.0042519569397
+ },
+ {
+ "epoch": 76,
+ "train_loss": 2.975222046432495,
+ "train_acc": 0.2575,
+ "test_loss": 7.9467042022705074,
+ "test_acc": 0.0274,
+ "lyapunov": null,
+ "grad_norm": 0.5205213451239863,
+ "grad_max_sv": 0.16927127800881864,
+ "grad_min_sv": 9.570786241308582e-09,
+ "grad_condition": 21297706.844217338,
+ "lr": 0.0004895287900583212,
+ "time_sec": 66.98396968841553
+ },
+ {
+ "epoch": 77,
+ "train_loss": 2.9694722108459475,
+ "train_acc": 0.25688,
+ "test_loss": 8.63839992980957,
+ "test_acc": 0.027,
+ "lyapunov": null,
+ "grad_norm": 0.5171656548088565,
+ "grad_max_sv": 0.16773934625089168,
+ "grad_min_sv": 9.45730138160461e-09,
+ "grad_condition": 53792449.33116071,
+ "lr": 0.0004790621731353997,
+ "time_sec": 67.06471967697144
+ },
+ {
+ "epoch": 78,
+ "train_loss": 2.954387292098999,
+ "train_acc": 0.26136,
+ "test_loss": 8.785921076965332,
+ "test_acc": 0.0231,
+ "lyapunov": null,
+ "grad_norm": 0.5158257600732294,
+ "grad_max_sv": 0.16913142390549182,
+ "grad_min_sv": 9.432701836287194e-09,
+ "grad_condition": 22764076.692523666,
+ "lr": 0.000468604740235343,
+ "time_sec": 66.98979210853577
+ },
+ {
+ "epoch": 79,
+ "train_loss": 2.951801152191162,
+ "train_acc": 0.26352,
+ "test_loss": 8.070646887207031,
+ "test_acc": 0.0255,
+ "lyapunov": null,
+ "grad_norm": 0.5174682191745558,
+ "grad_max_sv": 0.16524536907672882,
+ "grad_min_sv": 9.502134473704515e-09,
+ "grad_condition": 19794117.95628558,
+ "lr": 0.00045816107833384175,
+ "time_sec": 67.00397682189941
+ },
+ {
+ "epoch": 80,
+ "train_loss": 2.945303405151367,
+ "train_acc": 0.25934,
+ "test_loss": 8.538162045288086,
+ "test_acc": 0.0261,
+ "lyapunov": null,
+ "grad_norm": 0.5164921536500987,
+ "grad_max_sv": 0.16473788283765317,
+ "grad_min_sv": 9.313295684654222e-09,
+ "grad_condition": 20076070.15299391,
+ "lr": 0.0004477357683661729,
+ "time_sec": 66.99750208854675
+ },
+ {
+ "epoch": 81,
+ "train_loss": 2.9330507093811033,
+ "train_acc": 0.26472,
+ "test_loss": 9.089803251647949,
+ "test_acc": 0.0256,
+ "lyapunov": null,
+ "grad_norm": 0.5182949552264074,
+ "grad_max_sv": 0.16235619597136974,
+ "grad_min_sv": 9.617397696282115e-09,
+ "grad_condition": 30543590.097258378,
+ "lr": 0.00043733338321784746,
+ "time_sec": 66.96942782402039
+ },
+ {
+ "epoch": 82,
+ "train_loss": 2.931871794204712,
+ "train_acc": 0.26478,
+ "test_loss": 9.64152674560547,
+ "test_acc": 0.0219,
+ "lyapunov": null,
+ "grad_norm": 0.5176276155464238,
+ "grad_max_sv": 0.16380822993814945,
+ "grad_min_sv": 9.444439504069369e-09,
+ "grad_condition": 55360326.762117185,
+ "lr": 0.0004269584857187939,
+ "time_sec": 66.98204827308655
+ },
+ {
+ "epoch": 83,
+ "train_loss": 2.9243045820617675,
+ "train_acc": 0.2654,
+ "test_loss": 8.998370599365234,
+ "test_acc": 0.0286,
+ "lyapunov": null,
+ "grad_norm": 0.5221359210821417,
+ "grad_max_sv": 0.16723665855824948,
+ "grad_min_sv": 9.730227464033181e-09,
+ "grad_condition": 37510081.93776859,
+ "lr": 0.0004166156266419484,
+ "time_sec": 67.03800463676453
+ },
+ {
+ "epoch": 84,
+ "train_loss": 2.910555010223389,
+ "train_acc": 0.26936,
+ "test_loss": 9.721973526000976,
+ "test_acc": 0.0313,
+ "lyapunov": null,
+ "grad_norm": 0.519552420362012,
+ "grad_max_sv": 0.16508992463350297,
+ "grad_min_sv": 9.647469361231953e-09,
+ "grad_condition": 55059867.79942672,
+ "lr": 0.0004063093427071373,
+ "time_sec": 67.02205467224121
+ },
+ {
+ "epoch": 85,
+ "train_loss": 2.908977954711914,
+ "train_acc": 0.26772,
+ "test_loss": 9.513397438049317,
+ "test_acc": 0.0262,
+ "lyapunov": null,
+ "grad_norm": 0.5225336336313486,
+ "grad_max_sv": 0.1674807954579592,
+ "grad_min_sv": 9.611194474665185e-09,
+ "grad_condition": 61660610.28358656,
+ "lr": 0.0003960441545911199,
+ "time_sec": 66.98397827148438
+ },
+ {
+ "epoch": 86,
+ "train_loss": 2.9070045388793946,
+ "train_acc": 0.26946,
+ "test_loss": 9.42815225982666,
+ "test_acc": 0.0253,
+ "lyapunov": null,
+ "grad_norm": 0.5163838704970162,
+ "grad_max_sv": 0.15979891866445542,
+ "grad_min_sv": 9.371719027900793e-09,
+ "grad_condition": 27067310.492935486,
+ "lr": 0.0003858245649446718,
+ "time_sec": 67.00940752029419
+ },
+ {
+ "epoch": 87,
+ "train_loss": 2.8997818164825437,
+ "train_acc": 0.27182,
+ "test_loss": 9.99990376586914,
+ "test_acc": 0.0235,
+ "lyapunov": null,
+ "grad_norm": 0.5185938331206461,
+ "grad_max_sv": 0.1670172270387411,
+ "grad_min_sv": 9.72940567521563e-09,
+ "grad_condition": 41690290.30450606,
+ "lr": 0.00037565505641757235,
+ "time_sec": 66.98136639595032
+ },
+ {
+ "epoch": 88,
+ "train_loss": 2.8861678593444826,
+ "train_acc": 0.27088,
+ "test_loss": 9.440834574890136,
+ "test_acc": 0.0223,
+ "lyapunov": null,
+ "grad_norm": 0.5210845021802476,
+ "grad_max_sv": 0.16573623865842818,
+ "grad_min_sv": 9.66025861803832e-09,
+ "grad_condition": 21401152.005565703,
+ "lr": 0.00036554008969236695,
+ "time_sec": 66.97698450088501
+ },
+ {
+ "epoch": 89,
+ "train_loss": 2.879338860092163,
+ "train_acc": 0.2741,
+ "test_loss": 9.169851208496095,
+ "test_acc": 0.0199,
+ "lyapunov": null,
+ "grad_norm": 0.5207447841157706,
+ "grad_max_sv": 0.16667181067168713,
+ "grad_min_sv": 9.689165991755289e-09,
+ "grad_condition": 26973958.650769584,
+ "lr": 0.0003554841015277638,
+ "time_sec": 67.01995515823364
+ },
+ {
+ "epoch": 90,
+ "train_loss": 2.8748147813415525,
+ "train_acc": 0.27324,
+ "test_loss": 10.077813652038575,
+ "test_acc": 0.022,
+ "lyapunov": null,
+ "grad_norm": 0.5199671563562479,
+ "grad_max_sv": 0.16343193501234055,
+ "grad_min_sv": 9.647999926754025e-09,
+ "grad_condition": 21023683.920218416,
+ "lr": 0.000345491502812526,
+ "time_sec": 67.06868648529053
+ },
+ {
+ "epoch": 91,
+ "train_loss": 2.8696892933654787,
+ "train_acc": 0.27466,
+ "test_loss": 9.565517497253419,
+ "test_acc": 0.0229,
+ "lyapunov": null,
+ "grad_norm": 0.5208386545074176,
+ "grad_max_sv": 0.16384688578546047,
+ "grad_min_sv": 9.741156603571e-09,
+ "grad_condition": 20234282.31156399,
+ "lr": 0.0003355666766307081,
+ "time_sec": 67.05189514160156
+ },
+ {
+ "epoch": 92,
+ "train_loss": 2.8643893748474123,
+ "train_acc": 0.27506,
+ "test_loss": 9.676446484375,
+ "test_acc": 0.0222,
+ "lyapunov": null,
+ "grad_norm": 0.5227536692673017,
+ "grad_max_sv": 0.16562484614551068,
+ "grad_min_sv": 9.696238559286918e-09,
+ "grad_condition": 19364268.060319778,
+ "lr": 0.00032571397633909225,
+ "time_sec": 67.04055285453796
+ },
+ {
+ "epoch": 93,
+ "train_loss": 2.9157111973571777,
+ "train_acc": 0.2694,
+ "test_loss": 10.502802850341796,
+ "test_acc": 0.016,
+ "lyapunov": null,
+ "grad_norm": 0.5304583427147314,
+ "grad_max_sv": 0.16479565128684043,
+ "grad_min_sv": 9.75800383412606e-09,
+ "grad_condition": 23919445.487485204,
+ "lr": 0.00031593772365766094,
+ "time_sec": 67.07202672958374
+ },
+ {
+ "epoch": 94,
+ "train_loss": 3.5718225437927247,
+ "train_acc": 0.14984,
+ "test_loss": 8.342486605834962,
+ "test_acc": 0.0173,
+ "lyapunov": null,
+ "grad_norm": 0.47865396629415263,
+ "grad_max_sv": 0.146741402707994,
+ "grad_min_sv": 8.774483893636553e-09,
+ "grad_condition": 22076860.426247958,
+ "lr": 0.0003062422067739483,
+ "time_sec": 66.99063777923584
+ },
+ {
+ "epoch": 95,
+ "train_loss": 3.3590557197570803,
+ "train_acc": 0.18824,
+ "test_loss": 9.117096383666992,
+ "test_acc": 0.018,
+ "lyapunov": null,
+ "grad_norm": 0.47849958749977733,
+ "grad_max_sv": 0.14531232379376888,
+ "grad_min_sv": 8.800075565473798e-09,
+ "grad_condition": 21940629.92360129,
+ "lr": 0.00029663167846209965,
+ "time_sec": 66.97514224052429
+ },
+ {
+ "epoch": 96,
+ "train_loss": 3.2702466972351076,
+ "train_acc": 0.2019,
+ "test_loss": 9.76727836151123,
+ "test_acc": 0.0196,
+ "lyapunov": null,
+ "grad_norm": 0.47937534710610474,
+ "grad_max_sv": 0.14464113656431438,
+ "grad_min_sv": 8.792039801926166e-09,
+ "grad_condition": 89660660.43121836,
+ "lr": 0.00028711035421746345,
+ "time_sec": 66.99873089790344
+ },
+ {
+ "epoch": 97,
+ "train_loss": 3.2227031265258788,
+ "train_acc": 0.21062,
+ "test_loss": 9.626097766113281,
+ "test_acc": 0.02,
+ "lyapunov": null,
+ "grad_norm": 0.4871680253381029,
+ "grad_max_sv": 0.15086784306913614,
+ "grad_min_sv": 9.198363076778903e-09,
+ "grad_condition": 18446455.013218474,
+ "lr": 0.00027768241040753615,
+ "time_sec": 67.01664638519287
+ },
+ {
+ "epoch": 98,
+ "train_loss": 3.1770834211730956,
+ "train_acc": 0.21918,
+ "test_loss": 9.366678713989257,
+ "test_acc": 0.0189,
+ "lyapunov": null,
+ "grad_norm": 0.48983757815120343,
+ "grad_max_sv": 0.14779492281377316,
+ "grad_min_sv": 9.026428729463909e-09,
+ "grad_condition": 18794227.40584495,
+ "lr": 0.00026835198244006903,
+ "time_sec": 66.9809033870697
+ },
+ {
+ "epoch": 99,
+ "train_loss": 3.154748341598511,
+ "train_acc": 0.22074,
+ "test_loss": 8.755814114379882,
+ "test_acc": 0.0203,
+ "lyapunov": null,
+ "grad_norm": 0.49142802947586006,
+ "grad_max_sv": 0.14894249550998212,
+ "grad_min_sv": 9.186921921030405e-09,
+ "grad_condition": 243665710.2249507,
+ "lr": 0.0002591231629491421,
+ "time_sec": 66.99194574356079
+ },
+ {
+ "epoch": 100,
+ "train_loss": 3.120311908035278,
+ "train_acc": 0.229,
+ "test_loss": 9.377279025268555,
+ "test_acc": 0.019,
+ "lyapunov": null,
+ "grad_norm": 0.49378455655907144,
+ "grad_max_sv": 0.1519782803952694,
+ "grad_min_sv": 9.117503733946376e-09,
+ "grad_condition": 21901137.13681825,
+ "lr": 0.0002499999999999997,
+ "time_sec": 66.99540328979492
+ },
+ {
+ "epoch": 101,
+ "train_loss": 3.102491766357422,
+ "train_acc": 0.23234,
+ "test_loss": 9.32430498046875,
+ "test_acc": 0.0219,
+ "lyapunov": null,
+ "grad_norm": 0.49627664046313075,
+ "grad_max_sv": 0.15419429913163185,
+ "grad_min_sv": 9.201821271620503e-09,
+ "grad_condition": 21776686.85204944,
+ "lr": 0.00024098649531343477,
+ "time_sec": 66.98357772827148
+ },
+ {
+ "epoch": 102,
+ "train_loss": 3.085017224731445,
+ "train_acc": 0.23322,
+ "test_loss": 9.753949787902831,
+ "test_acc": 0.0193,
+ "lyapunov": null,
+ "grad_norm": 0.49406280305370465,
+ "grad_max_sv": 0.15118828602135181,
+ "grad_min_sv": 9.171319623191288e-09,
+ "grad_condition": 24151283.383643005,
+ "lr": 0.0002320866025105016,
+ "time_sec": 66.97265934944153
+ },
+ {
+ "epoch": 103,
+ "train_loss": 3.066944828414917,
+ "train_acc": 0.23798,
+ "test_loss": 9.439580722045898,
+ "test_acc": 0.0198,
+ "lyapunov": null,
+ "grad_norm": 0.49800148183033643,
+ "grad_max_sv": 0.15005342811346054,
+ "grad_min_sv": 9.260063320998268e-09,
+ "grad_condition": 32769732.654720783,
+ "lr": 0.0002233042253783278,
+ "time_sec": 67.00615048408508
+ },
+ {
+ "epoch": 104,
+ "train_loss": 3.0457233097839356,
+ "train_acc": 0.24206,
+ "test_loss": 9.283833685302735,
+ "test_acc": 0.022,
+ "lyapunov": null,
+ "grad_norm": 0.5005816660320969,
+ "grad_max_sv": 0.15397185049951076,
+ "grad_min_sv": 9.2347574705276e-09,
+ "grad_condition": 39740043.841383025,
+ "lr": 0.000214643216157784,
+ "time_sec": 66.98598265647888
+ },
+ {
+ "epoch": 105,
+ "train_loss": 3.0319893937683107,
+ "train_acc": 0.24054,
+ "test_loss": 9.208142726135254,
+ "test_acc": 0.0215,
+ "lyapunov": null,
+ "grad_norm": 0.4998792272266736,
+ "grad_max_sv": 0.15734503231942654,
+ "grad_min_sv": 9.254817884274402e-09,
+ "grad_condition": 23445108.874561593,
+ "lr": 0.00020610737385376332,
+ "time_sec": 66.97633767127991
+ },
+ {
+ "epoch": 106,
+ "train_loss": 3.0231310614013673,
+ "train_acc": 0.2459,
+ "test_loss": 9.397696965026855,
+ "test_acc": 0.0216,
+ "lyapunov": null,
+ "grad_norm": 0.5036514636560196,
+ "grad_max_sv": 0.15039666295051574,
+ "grad_min_sv": 9.292655003714615e-09,
+ "grad_condition": 456660482.4660243,
+ "lr": 0.00019770044256881242,
+ "time_sec": 66.97969722747803
+ },
+ {
+ "epoch": 107,
+ "train_loss": 3.015210195846558,
+ "train_acc": 0.24924,
+ "test_loss": 9.136646028137207,
+ "test_acc": 0.0253,
+ "lyapunov": null,
+ "grad_norm": 0.5044102710994137,
+ "grad_max_sv": 0.15338496044278144,
+ "grad_min_sv": 9.416407534962313e-09,
+ "grad_condition": 29814119.267252993,
+ "lr": 0.0001894261098608447,
+ "time_sec": 66.9929895401001
+ },
+ {
+ "epoch": 108,
+ "train_loss": 2.992950742034912,
+ "train_acc": 0.25076,
+ "test_loss": 9.683133767700195,
+ "test_acc": 0.0206,
+ "lyapunov": null,
+ "grad_norm": 0.5024766427018658,
+ "grad_max_sv": 0.15207941457629204,
+ "grad_min_sv": 9.368817296961928e-09,
+ "grad_condition": 25707665.821010012,
+ "lr": 0.000181288005125655,
+ "time_sec": 67.04599475860596
+ },
+ {
+ "epoch": 109,
+ "train_loss": 2.9911826483917237,
+ "train_acc": 0.25182,
+ "test_loss": 9.541546542358398,
+ "test_acc": 0.0216,
+ "lyapunov": null,
+ "grad_norm": 0.5050428635829171,
+ "grad_max_sv": 0.1559975240379572,
+ "grad_min_sv": 9.425568786580741e-09,
+ "grad_condition": 29011942.837490637,
+ "lr": 0.0001732896980049473,
+ "time_sec": 66.9745888710022
+ },
+ {
+ "epoch": 110,
+ "train_loss": 2.9719406244659425,
+ "train_acc": 0.25626,
+ "test_loss": 9.304527082824707,
+ "test_acc": 0.0239,
+ "lyapunov": null,
+ "grad_norm": 0.50709757758927,
+ "grad_max_sv": 0.15366660207509994,
+ "grad_min_sv": 9.407841375375093e-09,
+ "grad_condition": 20259210.324132033,
+ "lr": 0.00016543469682057076,
+ "time_sec": 67.00725531578064
+ },
+ {
+ "epoch": 111,
+ "train_loss": 2.9610974934387206,
+ "train_acc": 0.25892,
+ "test_loss": 9.905137655639649,
+ "test_acc": 0.0233,
+ "lyapunov": null,
+ "grad_norm": 0.5069510646769094,
+ "grad_max_sv": 0.16044184900820255,
+ "grad_min_sv": 9.517911378487121e-09,
+ "grad_condition": 20572867.320830267,
+ "lr": 0.00015772644703565552,
+ "time_sec": 66.96853518486023
+ },
+ {
+ "epoch": 112,
+ "train_loss": 2.956413153839111,
+ "train_acc": 0.25946,
+ "test_loss": 10.164678506469727,
+ "test_acc": 0.0226,
+ "lyapunov": null,
+ "grad_norm": 0.5077720159938983,
+ "grad_max_sv": 0.15506692193448543,
+ "grad_min_sv": 9.397505702779529e-09,
+ "grad_condition": 22578916.073937874,
+ "lr": 0.00015016832974331713,
+ "time_sec": 67.01250433921814
+ },
+ {
+ "epoch": 113,
+ "train_loss": 2.9505707207489014,
+ "train_acc": 0.26056,
+ "test_loss": 9.862203175354004,
+ "test_acc": 0.0237,
+ "lyapunov": null,
+ "grad_norm": 0.508430292455553,
+ "grad_max_sv": 0.1596985150128603,
+ "grad_min_sv": 9.460744607170391e-09,
+ "grad_condition": 18853883.48562253,
+ "lr": 0.00014276366018359834,
+ "time_sec": 66.99557614326477
+ },
+ {
+ "epoch": 114,
+ "train_loss": 2.9415723051452636,
+ "train_acc": 0.2616,
+ "test_loss": 9.63483480834961,
+ "test_acc": 0.0232,
+ "lyapunov": null,
+ "grad_norm": 0.5104303932486228,
+ "grad_max_sv": 0.1552283179014921,
+ "grad_min_sv": 9.445251571464034e-09,
+ "grad_condition": 693766580.7640529,
+ "lr": 0.00013551568628929425,
+ "time_sec": 66.99906969070435
+ },
+ {
+ "epoch": 115,
+ "train_loss": 2.9388054510498045,
+ "train_acc": 0.26148,
+ "test_loss": 9.398469245910645,
+ "test_acc": 0.0231,
+ "lyapunov": null,
+ "grad_norm": 0.5141390434712518,
+ "grad_max_sv": 0.16008906662464142,
+ "grad_min_sv": 9.453520891100631e-09,
+ "grad_condition": 21355980.767428003,
+ "lr": 0.00012842758726130276,
+ "time_sec": 66.97847414016724
+ },
+ {
+ "epoch": 116,
+ "train_loss": 2.9283171284484864,
+ "train_acc": 0.26438,
+ "test_loss": 9.456967205810546,
+ "test_acc": 0.0244,
+ "lyapunov": null,
+ "grad_norm": 0.5133058115565678,
+ "grad_max_sv": 0.15975738912820817,
+ "grad_min_sv": 9.5292529520008e-09,
+ "grad_condition": 22298576.095964633,
+ "lr": 0.0001215024721741218,
+ "time_sec": 66.9903039932251
+ },
+ {
+ "epoch": 117,
+ "train_loss": 2.919693772506714,
+ "train_acc": 0.26682,
+ "test_loss": 9.649295095825195,
+ "test_acc": 0.0229,
+ "lyapunov": null,
+ "grad_norm": 0.5098040600332114,
+ "grad_max_sv": 0.15964976735413075,
+ "grad_min_sv": 9.535333161947435e-09,
+ "grad_condition": 18488699.782394268,
+ "lr": 0.00011474337861210538,
+ "time_sec": 66.98530316352844
+ },
+ {
+ "epoch": 118,
+ "train_loss": 2.9129154638671877,
+ "train_acc": 0.26648,
+ "test_loss": 9.582696447753905,
+ "test_acc": 0.0252,
+ "lyapunov": null,
+ "grad_norm": 0.5137327165981059,
+ "grad_max_sv": 0.15674266032874584,
+ "grad_min_sv": 9.422415092608106e-09,
+ "grad_condition": 21769035.1047443,
+ "lr": 0.00010815327133708009,
+ "time_sec": 67.0712718963623
+ },
+ {
+ "epoch": 119,
+ "train_loss": 2.90771673576355,
+ "train_acc": 0.26738,
+ "test_loss": 9.686517756652831,
+ "test_acc": 0.0223,
+ "lyapunov": null,
+ "grad_norm": 0.5112636160904589,
+ "grad_max_sv": 0.15690986551344394,
+ "grad_min_sv": 9.557581368002666e-09,
+ "grad_condition": 65271422.15119822,
+ "lr": 0.00010173504098790182,
+ "time_sec": 66.99134540557861
+ },
+ {
+ "epoch": 120,
+ "train_loss": 2.903361056442261,
+ "train_acc": 0.26626,
+ "test_loss": 9.534084574890137,
+ "test_acc": 0.025,
+ "lyapunov": null,
+ "grad_norm": 0.5139337490910202,
+ "grad_max_sv": 0.16002687215805053,
+ "grad_min_sv": 9.488575995753035e-09,
+ "grad_condition": 26500108.07568959,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 66.98560166358948
+ },
+ {
+ "epoch": 121,
+ "train_loss": 2.8838987274169923,
+ "train_acc": 0.27268,
+ "test_loss": 9.002799011230469,
+ "test_acc": 0.0286,
+ "lyapunov": null,
+ "grad_norm": 0.5181242234216702,
+ "grad_max_sv": 0.15681598484516143,
+ "grad_min_sv": 9.58419937996391e-09,
+ "grad_condition": 21911011.850442223,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 66.99542880058289
+ },
+ {
+ "epoch": 122,
+ "train_loss": 2.8907574623107912,
+ "train_acc": 0.27284,
+ "test_loss": 9.40299231262207,
+ "test_acc": 0.023,
+ "lyapunov": null,
+ "grad_norm": 0.5154755058010533,
+ "grad_max_sv": 0.16150307320058346,
+ "grad_min_sv": 9.692825331253373e-09,
+ "grad_condition": 20117302.380122818,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 66.98236727714539
+ },
+ {
+ "epoch": 123,
+ "train_loss": 2.8763803490448,
+ "train_acc": 0.2739,
+ "test_loss": 9.18796940612793,
+ "test_acc": 0.0263,
+ "lyapunov": null,
+ "grad_norm": 0.514194573203304,
+ "grad_max_sv": 0.15613614898175002,
+ "grad_min_sv": 9.584234908488477e-09,
+ "grad_condition": 18777275.99405461,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 66.99689793586731
+ },
+ {
+ "epoch": 124,
+ "train_loss": 2.8843617086029054,
+ "train_acc": 0.27144,
+ "test_loss": 9.370162466430664,
+ "test_acc": 0.0248,
+ "lyapunov": null,
+ "grad_norm": 0.5136262444075659,
+ "grad_max_sv": 0.15881695374846458,
+ "grad_min_sv": 9.587037638758567e-09,
+ "grad_condition": 18534833.152038723,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 66.98831605911255
+ },
+ {
+ "epoch": 125,
+ "train_loss": 2.8742648021697996,
+ "train_acc": 0.27246,
+ "test_loss": 9.4968570602417,
+ "test_acc": 0.0258,
+ "lyapunov": null,
+ "grad_norm": 0.5172296409721588,
+ "grad_max_sv": 0.15975196473300457,
+ "grad_min_sv": 9.493101107982404e-09,
+ "grad_condition": 20120176.988574862,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 66.98702692985535
+ },
+ {
+ "epoch": 126,
+ "train_loss": 2.868820255508423,
+ "train_acc": 0.27476,
+ "test_loss": 9.60731820678711,
+ "test_acc": 0.0243,
+ "lyapunov": null,
+ "grad_norm": 0.5204414887458292,
+ "grad_max_sv": 0.16092863790690898,
+ "grad_min_sv": 9.674041201446215e-09,
+ "grad_condition": 18855250.862980247,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 66.97707200050354
+ },
+ {
+ "epoch": 127,
+ "train_loss": 2.8692937660217286,
+ "train_acc": 0.27484,
+ "test_loss": 9.273512542724609,
+ "test_acc": 0.0252,
+ "lyapunov": null,
+ "grad_norm": 0.5162971653606119,
+ "grad_max_sv": 0.16184906139969826,
+ "grad_min_sv": 9.668298800447062e-09,
+ "grad_condition": 21519277.77695776,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 67.0102117061615
+ },
+ {
+ "epoch": 128,
+ "train_loss": 2.8623614330291747,
+ "train_acc": 0.27702,
+ "test_loss": 9.566067819213867,
+ "test_acc": 0.0239,
+ "lyapunov": null,
+ "grad_norm": 0.5161277911748794,
+ "grad_max_sv": 0.1572089247405529,
+ "grad_min_sv": 9.598460455964574e-09,
+ "grad_condition": 40264946.42458854,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 66.9910991191864
+ },
+ {
+ "epoch": 129,
+ "train_loss": 2.8542457569122313,
+ "train_acc": 0.27896,
+ "test_loss": 9.585708435058594,
+ "test_acc": 0.0242,
+ "lyapunov": null,
+ "grad_norm": 0.5185536839510844,
+ "grad_max_sv": 0.16669968273490668,
+ "grad_min_sv": 9.84268076209549e-09,
+ "grad_condition": 20409849.055229448,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 67.02374720573425
+ },
+ {
+ "epoch": 130,
+ "train_loss": 2.8572039877319337,
+ "train_acc": 0.27668,
+ "test_loss": 9.687789022827149,
+ "test_acc": 0.0255,
+ "lyapunov": null,
+ "grad_norm": 0.5186381052419109,
+ "grad_max_sv": 0.15739406496286393,
+ "grad_min_sv": 9.484110215923769e-09,
+ "grad_condition": 32956127.450649947,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 67.0042040348053
+ },
+ {
+ "epoch": 131,
+ "train_loss": 2.8510476612854005,
+ "train_acc": 0.27938,
+ "test_loss": 9.569248272705078,
+ "test_acc": 0.0242,
+ "lyapunov": null,
+ "grad_norm": 0.5207995350849649,
+ "grad_max_sv": 0.16004110053181647,
+ "grad_min_sv": 9.74696345579229e-09,
+ "grad_condition": 19170988.284027696,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 67.01241946220398
+ },
+ {
+ "epoch": 132,
+ "train_loss": 2.846966871871948,
+ "train_acc": 0.28012,
+ "test_loss": 9.591386764526368,
+ "test_acc": 0.0255,
+ "lyapunov": null,
+ "grad_norm": 0.5190948064684937,
+ "grad_max_sv": 0.16090917438268662,
+ "grad_min_sv": 9.59687692925204e-09,
+ "grad_condition": 19916201.19002537,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 66.99244403839111
+ },
+ {
+ "epoch": 133,
+ "train_loss": 2.849546993560791,
+ "train_acc": 0.2807,
+ "test_loss": 9.568466381835938,
+ "test_acc": 0.0256,
+ "lyapunov": null,
+ "grad_norm": 0.5185948998509293,
+ "grad_max_sv": 0.1592203661799431,
+ "grad_min_sv": 9.741048792588635e-09,
+ "grad_condition": 21889901.09234864,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 66.98589158058167
+ },
+ {
+ "epoch": 134,
+ "train_loss": 2.8438784635925294,
+ "train_acc": 0.28108,
+ "test_loss": 9.896654699707032,
+ "test_acc": 0.0239,
+ "lyapunov": null,
+ "grad_norm": 0.5160935862439748,
+ "grad_max_sv": 0.1570783667266369,
+ "grad_min_sv": 9.671757885201804e-09,
+ "grad_condition": 260951372.1762239,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 66.98548531532288
+ },
+ {
+ "epoch": 135,
+ "train_loss": 2.834603865356445,
+ "train_acc": 0.28228,
+ "test_loss": 9.507378176879882,
+ "test_acc": 0.0279,
+ "lyapunov": null,
+ "grad_norm": 0.5182545697342097,
+ "grad_max_sv": 0.16007349267601967,
+ "grad_min_sv": 9.658516472721423e-09,
+ "grad_condition": 19713617.954316415,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 67.04329872131348
+ },
+ {
+ "epoch": 136,
+ "train_loss": 2.839189874649048,
+ "train_acc": 0.28064,
+ "test_loss": 9.359465802001953,
+ "test_acc": 0.0248,
+ "lyapunov": null,
+ "grad_norm": 0.5169244988974169,
+ "grad_max_sv": 0.16038464941084385,
+ "grad_min_sv": 9.551935577917225e-09,
+ "grad_condition": 92654982.50365481,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 67.0141191482544
+ },
+ {
+ "epoch": 137,
+ "train_loss": 2.8397282981109617,
+ "train_acc": 0.28072,
+ "test_loss": 9.637136407470702,
+ "test_acc": 0.0232,
+ "lyapunov": null,
+ "grad_norm": 0.5171965418231472,
+ "grad_max_sv": 0.1600246898829937,
+ "grad_min_sv": 9.73793786961108e-09,
+ "grad_condition": 49688363.904323384,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 67.01152467727661
+ },
+ {
+ "epoch": 138,
+ "train_loss": 2.832450699005127,
+ "train_acc": 0.2818,
+ "test_loss": 9.6108934967041,
+ "test_acc": 0.0257,
+ "lyapunov": null,
+ "grad_norm": 0.5180887909699459,
+ "grad_max_sv": 0.15756660997867583,
+ "grad_min_sv": 9.721027080522582e-09,
+ "grad_condition": 111964333.48758218,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 66.98093700408936
+ },
+ {
+ "epoch": 139,
+ "train_loss": 2.831738001098633,
+ "train_acc": 0.28372,
+ "test_loss": 9.70671376953125,
+ "test_acc": 0.0243,
+ "lyapunov": null,
+ "grad_norm": 0.5175564205755943,
+ "grad_max_sv": 0.15984287559986116,
+ "grad_min_sv": 9.567414729211298e-09,
+ "grad_condition": 30908421.83810656,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 66.98836731910706
+ },
+ {
+ "epoch": 140,
+ "train_loss": 2.8314741302490236,
+ "train_acc": 0.2828,
+ "test_loss": 9.671274719238282,
+ "test_acc": 0.0253,
+ "lyapunov": null,
+ "grad_norm": 0.5195292394658827,
+ "grad_max_sv": 0.16055516712367535,
+ "grad_min_sv": 9.656845009232972e-09,
+ "grad_condition": 116770748.01439288,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 67.06937670707703
+ },
+ {
+ "epoch": 141,
+ "train_loss": 2.8331345532226564,
+ "train_acc": 0.28274,
+ "test_loss": 9.6149158203125,
+ "test_acc": 0.0254,
+ "lyapunov": null,
+ "grad_norm": 0.5200947221378508,
+ "grad_max_sv": 0.1620084557682276,
+ "grad_min_sv": 9.736931689749428e-09,
+ "grad_condition": 45631030.28761599,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 67.04308843612671
+ },
+ {
+ "epoch": 142,
+ "train_loss": 2.8309748402404784,
+ "train_acc": 0.28162,
+ "test_loss": 9.762360348510741,
+ "test_acc": 0.0236,
+ "lyapunov": null,
+ "grad_norm": 0.5193749464503752,
+ "grad_max_sv": 0.16398511864244938,
+ "grad_min_sv": 9.725219179967937e-09,
+ "grad_condition": 21389461.650285553,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 66.99746632575989
+ },
+ {
+ "epoch": 143,
+ "train_loss": 2.8280009740447998,
+ "train_acc": 0.28424,
+ "test_loss": 9.46468698425293,
+ "test_acc": 0.0236,
+ "lyapunov": null,
+ "grad_norm": 0.5183118315610563,
+ "grad_max_sv": 0.15934774614870548,
+ "grad_min_sv": 9.612720197615943e-09,
+ "grad_condition": 28184363.311956126,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 67.1207172870636
+ },
+ {
+ "epoch": 144,
+ "train_loss": 2.8344388133239744,
+ "train_acc": 0.27982,
+ "test_loss": 9.481146864318848,
+ "test_acc": 0.0253,
+ "lyapunov": null,
+ "grad_norm": 0.5191802199413043,
+ "grad_max_sv": 0.16139711774885654,
+ "grad_min_sv": 9.682644661057616e-09,
+ "grad_condition": 19530671.727896534,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 67.00769138336182
+ },
+ {
+ "epoch": 145,
+ "train_loss": 2.8336991081237795,
+ "train_acc": 0.28372,
+ "test_loss": 9.66582228088379,
+ "test_acc": 0.0261,
+ "lyapunov": null,
+ "grad_norm": 0.5185987884305854,
+ "grad_max_sv": 0.16210929341614247,
+ "grad_min_sv": 9.609004592014969e-09,
+ "grad_condition": 19136474.88235427,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 67.0150043964386
+ },
+ {
+ "epoch": 146,
+ "train_loss": 2.8299831028747557,
+ "train_acc": 0.28278,
+ "test_loss": 9.453235021972656,
+ "test_acc": 0.0257,
+ "lyapunov": null,
+ "grad_norm": 0.5191689479196915,
+ "grad_max_sv": 0.16032814532518386,
+ "grad_min_sv": 9.704305628868703e-09,
+ "grad_condition": 46973186.46224795,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 67.00002098083496
+ },
+ {
+ "epoch": 147,
+ "train_loss": 2.825070192184448,
+ "train_acc": 0.28334,
+ "test_loss": 9.736306394958497,
+ "test_acc": 0.0241,
+ "lyapunov": null,
+ "grad_norm": 0.5194004947332557,
+ "grad_max_sv": 0.15663104616105555,
+ "grad_min_sv": 9.712660245519977e-09,
+ "grad_condition": 19953974.129073095,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 67.0251133441925
+ },
+ {
+ "epoch": 148,
+ "train_loss": 2.8285147483825686,
+ "train_acc": 0.28494,
+ "test_loss": 9.718778967285155,
+ "test_acc": 0.0232,
+ "lyapunov": null,
+ "grad_norm": 0.519735769986064,
+ "grad_max_sv": 0.16175503246486186,
+ "grad_min_sv": 9.61004464027082e-09,
+ "grad_condition": 41640518.28457622,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 66.99386191368103
+ },
+ {
+ "epoch": 149,
+ "train_loss": 2.8338044094085695,
+ "train_acc": 0.2828,
+ "test_loss": 9.769097790527344,
+ "test_acc": 0.025,
+ "lyapunov": null,
+ "grad_norm": 0.518369855767956,
+ "grad_max_sv": 0.16054188311100007,
+ "grad_min_sv": 9.553421861929757e-09,
+ "grad_condition": 19432504.243999995,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 66.99177241325378
+ },
+ {
+ "epoch": 150,
+ "train_loss": 2.8278376667022704,
+ "train_acc": 0.28346,
+ "test_loss": 9.647385183715821,
+ "test_acc": 0.0242,
+ "lyapunov": null,
+ "grad_norm": 0.5190962063342817,
+ "grad_max_sv": 0.16339128278195858,
+ "grad_min_sv": 9.625854724415461e-09,
+ "grad_condition": 26849402.241447162,
+ "lr": 0.0,
+ "time_sec": 66.99396753311157
+ }
+ ]
+ },
+ "lyapunov": {
+ "4": [
+ {
+ "epoch": 1,
+ "train_loss": 4.0711297009277345,
+ "train_acc": 0.09922,
+ "test_loss": 3.9652711036682127,
+ "test_acc": 0.106,
+ "lyapunov": 2.009106175978775,
+ "grad_norm": 5.770356961936896,
+ "grad_max_sv": 4.216659033298493,
+ "grad_min_sv": 1.0549574099294467e-07,
+ "grad_condition": 83568782.62868212,
+ "lr": 0.0009998903417374227,
+ "time_sec": 41.888622999191284
+ },
+ {
+ "epoch": 2,
+ "train_loss": 3.7634158575439454,
+ "train_acc": 0.13558,
+ "test_loss": 4.481808354949951,
+ "test_acc": 0.0542,
+ "lyapunov": 1.6958206730425511,
+ "grad_norm": 3.6343119962391017,
+ "grad_max_sv": 2.4889110922813416,
+ "grad_min_sv": 6.732413328491837e-08,
+ "grad_condition": 91225677.18337384,
+ "lr": 0.0009995614150494292,
+ "time_sec": 41.84356164932251
+ },
+ {
+ "epoch": 3,
+ "train_loss": 3.6647304371643066,
+ "train_acc": 0.1493,
+ "test_loss": 4.3052373779296875,
+ "test_acc": 0.0762,
+ "lyapunov": 1.6261345663338975,
+ "grad_norm": 2.8093749766197624,
+ "grad_max_sv": 1.7556122809648513,
+ "grad_min_sv": 5.287189366841305e-08,
+ "grad_condition": 314142006.47060126,
+ "lr": 0.0009990133642141358,
+ "time_sec": 41.84758758544922
+ },
+ {
+ "epoch": 4,
+ "train_loss": 3.546524167175293,
+ "train_acc": 0.16742,
+ "test_loss": 5.702491674804688,
+ "test_acc": 0.0294,
+ "lyapunov": 1.5553575302938671,
+ "grad_norm": 2.385940862508357,
+ "grad_max_sv": 1.40236736536026,
+ "grad_min_sv": 4.480527846517646e-08,
+ "grad_condition": 43664896.37977407,
+ "lr": 0.0009982464296247522,
+ "time_sec": 41.83865737915039
+ },
+ {
+ "epoch": 5,
+ "train_loss": 3.4743005490112306,
+ "train_acc": 0.18312,
+ "test_loss": 8.196367356872559,
+ "test_acc": 0.019,
+ "lyapunov": 1.5279129725283065,
+ "grad_norm": 2.072916387891114,
+ "grad_max_sv": 1.1730020090937614,
+ "grad_min_sv": 3.8785105194172334e-08,
+ "grad_condition": 32346211.56806183,
+ "lr": 0.0009972609476841367,
+ "time_sec": 41.85976266860962
+ },
+ {
+ "epoch": 6,
+ "train_loss": 3.4256133052062987,
+ "train_acc": 0.19342,
+ "test_loss": 9.553438766479491,
+ "test_acc": 0.0187,
+ "lyapunov": 1.5210750066410854,
+ "grad_norm": 1.8439895228569763,
+ "grad_max_sv": 0.9858661040663719,
+ "grad_min_sv": 3.4533098991484934e-08,
+ "grad_condition": 35319864.79656621,
+ "lr": 0.000996057350657239,
+ "time_sec": 41.841728925704956
+ },
+ {
+ "epoch": 7,
+ "train_loss": 3.4064867937469483,
+ "train_acc": 0.2019,
+ "test_loss": 11.607983041381836,
+ "test_acc": 0.0152,
+ "lyapunov": 1.523884119280159,
+ "grad_norm": 1.687138246958699,
+ "grad_max_sv": 0.8869923338294029,
+ "grad_min_sv": 3.151686688296351e-08,
+ "grad_condition": 33789366.4765297,
+ "lr": 0.000994636166481494,
+ "time_sec": 41.84767436981201
+ },
+ {
+ "epoch": 8,
+ "train_loss": 3.434463021774292,
+ "train_acc": 0.19834,
+ "test_loss": 11.012699322509766,
+ "test_acc": 0.0218,
+ "lyapunov": 1.5377070940364048,
+ "grad_norm": 1.5753285999803672,
+ "grad_max_sv": 0.8568978801369667,
+ "grad_min_sv": 2.9292211212172958e-08,
+ "grad_condition": 38247647.23104979,
+ "lr": 0.0009929980185352525,
+ "time_sec": 41.83318567276001
+ },
+ {
+ "epoch": 9,
+ "train_loss": 3.4525474771118163,
+ "train_acc": 0.19694,
+ "test_loss": 13.244960899353027,
+ "test_acc": 0.0188,
+ "lyapunov": 1.5521414874459776,
+ "grad_norm": 1.4910263576831584,
+ "grad_max_sv": 0.7901037082076072,
+ "grad_min_sv": 2.7871724133082115e-08,
+ "grad_condition": 652853959.565771,
+ "lr": 0.0009911436253643444,
+ "time_sec": 41.85349941253662
+ },
+ {
+ "epoch": 10,
+ "train_loss": 3.4827073947906495,
+ "train_acc": 0.19456,
+ "test_loss": 13.097009005737304,
+ "test_acc": 0.0142,
+ "lyapunov": 1.54852739807285,
+ "grad_norm": 1.3918276084929038,
+ "grad_max_sv": 0.7072893396019936,
+ "grad_min_sv": 2.5679541396095296e-08,
+ "grad_condition": 39117704.605187416,
+ "lr": 0.0009890738003669028,
+ "time_sec": 41.853031635284424
+ },
+ {
+ "epoch": 11,
+ "train_loss": 3.502148910446167,
+ "train_acc": 0.19276,
+ "test_loss": 14.30014864807129,
+ "test_acc": 0.0163,
+ "lyapunov": 1.5574408672044955,
+ "grad_norm": 1.3267443475145169,
+ "grad_max_sv": 0.6856341227889061,
+ "grad_min_sv": 2.4468690279499938e-08,
+ "grad_condition": 36359188.54410316,
+ "lr": 0.00098678945143658,
+ "time_sec": 41.87047362327576
+ },
+ {
+ "epoch": 12,
+ "train_loss": 3.5455151155090334,
+ "train_acc": 0.1879,
+ "test_loss": 12.457445967102052,
+ "test_acc": 0.0197,
+ "lyapunov": 1.5671831793187525,
+ "grad_norm": 1.2480528019241246,
+ "grad_max_sv": 0.6239843934774398,
+ "grad_min_sv": 2.3005261242953905e-08,
+ "grad_condition": 526118663.91773003,
+ "lr": 0.0009842915805643154,
+ "time_sec": 41.888609409332275
+ },
+ {
+ "epoch": 13,
+ "train_loss": 3.6091552614593505,
+ "train_acc": 0.17994,
+ "test_loss": 12.732378463745118,
+ "test_acc": 0.0121,
+ "lyapunov": 1.568660382419596,
+ "grad_norm": 1.1583490651743926,
+ "grad_max_sv": 0.581366877257824,
+ "grad_min_sv": 2.1129029859068282e-08,
+ "grad_condition": 32416771.726506818,
+ "lr": 0.000981581283398829,
+ "time_sec": 41.91386127471924
+ },
+ {
+ "epoch": 14,
+ "train_loss": 3.791756629562378,
+ "train_acc": 0.15402,
+ "test_loss": 15.130843069458008,
+ "test_acc": 0.0119,
+ "lyapunov": 1.616871199034669,
+ "grad_norm": 1.087286539710877,
+ "grad_max_sv": 0.572893675416708,
+ "grad_min_sv": 1.9829283692818224e-08,
+ "grad_condition": 32374293.19268779,
+ "lr": 0.0009786597487660333,
+ "time_sec": 41.84876489639282
+ },
+ {
+ "epoch": 15,
+ "train_loss": 3.8399617958068846,
+ "train_acc": 0.14724,
+ "test_loss": 17.94291413269043,
+ "test_acc": 0.0166,
+ "lyapunov": 1.6528625835847977,
+ "grad_norm": 1.0379429629839805,
+ "grad_max_sv": 0.5574500106275082,
+ "grad_min_sv": 1.8863349182662857e-08,
+ "grad_condition": 39761225.70266014,
+ "lr": 0.0009755282581475766,
+ "time_sec": 41.82764172554016
+ },
+ {
+ "epoch": 16,
+ "train_loss": 3.8371740995025636,
+ "train_acc": 0.15152,
+ "test_loss": 13.5413774017334,
+ "test_acc": 0.01,
+ "lyapunov": 1.648486807218293,
+ "grad_norm": 0.9596716866271199,
+ "grad_max_sv": 0.5051649369299411,
+ "grad_min_sv": 1.7647910632856423e-08,
+ "grad_condition": 34020323.13172309,
+ "lr": 0.0009721881851187403,
+ "time_sec": 41.84924578666687
+ },
+ {
+ "epoch": 17,
+ "train_loss": 3.890597806930542,
+ "train_acc": 0.14732,
+ "test_loss": 14.242138269042968,
+ "test_acc": 0.0132,
+ "lyapunov": 1.6423247948936794,
+ "grad_norm": 0.8982590539538886,
+ "grad_max_sv": 0.46011053323745726,
+ "grad_min_sv": 1.6221578684992576e-08,
+ "grad_condition": 227922899.83540225,
+ "lr": 0.0009686409947459456,
+ "time_sec": 41.824068784713745
+ },
+ {
+ "epoch": 18,
+ "train_loss": 3.8945003430938723,
+ "train_acc": 0.14424,
+ "test_loss": 12.652154109191894,
+ "test_acc": 0.009,
+ "lyapunov": 1.6140738649441457,
+ "grad_norm": 0.8509250568629757,
+ "grad_max_sv": 0.4146191440522671,
+ "grad_min_sv": 1.5334739790484608e-08,
+ "grad_condition": 46249959.20615914,
+ "lr": 0.0009648882429441254,
+ "time_sec": 41.92591094970703
+ },
+ {
+ "epoch": 19,
+ "train_loss": 3.911494416732788,
+ "train_acc": 0.14534,
+ "test_loss": 10.313947262573242,
+ "test_acc": 0.01,
+ "lyapunov": 1.6057381596406708,
+ "grad_norm": 0.8291056062070911,
+ "grad_max_sv": 0.39902378544211387,
+ "grad_min_sv": 1.5037980047316603e-08,
+ "grad_condition": 51800842.237051465,
+ "lr": 0.00096093157579425,
+ "time_sec": 41.85994362831116
+ },
+ {
+ "epoch": 20,
+ "train_loss": 3.9858800520324706,
+ "train_acc": 0.13508,
+ "test_loss": 9.495584085083008,
+ "test_acc": 0.0117,
+ "lyapunov": 1.5699561761163385,
+ "grad_norm": 0.8464930976238112,
+ "grad_max_sv": 0.4136614315211773,
+ "grad_min_sv": 1.490709049438779e-08,
+ "grad_condition": 522735678.0721162,
+ "lr": 0.0009567727288213001,
+ "time_sec": 41.85805010795593
+ },
+ {
+ "epoch": 21,
+ "train_loss": 4.023155120925903,
+ "train_acc": 0.12818,
+ "test_loss": 10.004813737487792,
+ "test_acc": 0.0135,
+ "lyapunov": 1.5752095285888827,
+ "grad_norm": 0.8291979613527221,
+ "grad_max_sv": 0.38449598476290703,
+ "grad_min_sv": 1.4266561158826629e-08,
+ "grad_condition": 100203024.77550165,
+ "lr": 0.0009524135262330095,
+ "time_sec": 41.84737300872803
+ },
+ {
+ "epoch": 22,
+ "train_loss": 4.029212285461425,
+ "train_acc": 0.12438,
+ "test_loss": 12.173621334838867,
+ "test_acc": 0.01,
+ "lyapunov": 1.5598359254315077,
+ "grad_norm": 0.7501647761926934,
+ "grad_max_sv": 0.36557952016592027,
+ "grad_min_sv": 1.3507705134974124e-08,
+ "grad_condition": 32668036.703706127,
+ "lr": 0.0009478558801197061,
+ "time_sec": 41.83857583999634
+ },
+ {
+ "epoch": 23,
+ "train_loss": 4.038732503051758,
+ "train_acc": 0.12626,
+ "test_loss": 8.940043533325195,
+ "test_acc": 0.011,
+ "lyapunov": 1.5640881744492086,
+ "grad_norm": 0.7404717741571084,
+ "grad_max_sv": 0.36797516867518426,
+ "grad_min_sv": 1.314027773258175e-08,
+ "grad_condition": 31266761.905169785,
+ "lr": 0.000943101789615607,
+ "time_sec": 41.82795524597168
+ },
+ {
+ "epoch": 24,
+ "train_loss": 4.0988731300354,
+ "train_acc": 0.11452,
+ "test_loss": 12.849692756652832,
+ "test_acc": 0.0107,
+ "lyapunov": 1.550421966311267,
+ "grad_norm": 0.7098563411237487,
+ "grad_max_sv": 0.36257990449666977,
+ "grad_min_sv": 1.25359189376284e-08,
+ "grad_condition": 40983554.09727303,
+ "lr": 0.0009381533400219313,
+ "time_sec": 41.85472393035889
+ },
+ {
+ "epoch": 25,
+ "train_loss": 4.209664036712646,
+ "train_acc": 0.09956,
+ "test_loss": 13.292383435058595,
+ "test_acc": 0.01,
+ "lyapunov": 1.5532953726970935,
+ "grad_norm": 0.6761784984779601,
+ "grad_max_sv": 0.3498499631881714,
+ "grad_min_sv": 1.1860140708419564e-08,
+ "grad_condition": 35321140.57939846,
+ "lr": 0.0009330127018922189,
+ "time_sec": 41.83675241470337
+ },
+ {
+ "epoch": 26,
+ "train_loss": 4.387504685211182,
+ "train_acc": 0.06822,
+ "test_loss": 13.442844244384766,
+ "test_acc": 0.01,
+ "lyapunov": 1.5123424859303038,
+ "grad_norm": 0.613666343544254,
+ "grad_max_sv": 0.312596595287323,
+ "grad_min_sv": 9.974056802697362e-09,
+ "grad_condition": 73223482.84978306,
+ "lr": 0.000927682130080253,
+ "time_sec": 41.83025002479553
+ },
+ {
+ "epoch": 27,
+ "train_loss": 4.494176885528565,
+ "train_acc": 0.0543,
+ "test_loss": 11.84754227294922,
+ "test_acc": 0.0094,
+ "lyapunov": 1.4815948003393304,
+ "grad_norm": 0.5747479343845562,
+ "grad_max_sv": 0.3057863064110279,
+ "grad_min_sv": 8.438247317554826e-09,
+ "grad_condition": 38945619.0197791,
+ "lr": 0.0009221639627510072,
+ "time_sec": 41.84781360626221
+ },
+ {
+ "epoch": 28,
+ "train_loss": 4.46251156829834,
+ "train_acc": 0.05616,
+ "test_loss": 11.681759558105469,
+ "test_acc": 0.01,
+ "lyapunov": 1.4850436720396856,
+ "grad_norm": 0.5367103881878276,
+ "grad_max_sv": 0.27574604004621506,
+ "grad_min_sv": 7.970707525950527e-09,
+ "grad_condition": 43556131.981196605,
+ "lr": 0.0009164606203550494,
+ "time_sec": 41.85157370567322
+ },
+ {
+ "epoch": 29,
+ "train_loss": 4.478804314422607,
+ "train_acc": 0.05546,
+ "test_loss": 13.70535901184082,
+ "test_acc": 0.01,
+ "lyapunov": 1.4930339225417817,
+ "grad_norm": 0.4922959043886969,
+ "grad_max_sv": 0.26684653796255586,
+ "grad_min_sv": 7.476301915054772e-09,
+ "grad_condition": 50660877.44966361,
+ "lr": 0.0009105746045668516,
+ "time_sec": 41.84281659126282
+ },
+ {
+ "epoch": 30,
+ "train_loss": 4.461830242156982,
+ "train_acc": 0.05732,
+ "test_loss": 16.430956909179688,
+ "test_acc": 0.01,
+ "lyapunov": 1.4880318653857922,
+ "grad_norm": 0.463062312015885,
+ "grad_max_sv": 0.24580183289945126,
+ "grad_min_sv": 6.99083638443232e-09,
+ "grad_condition": 91544069.9810532,
+ "lr": 0.0009045084971874733,
+ "time_sec": 41.85340070724487
+ },
+ {
+ "epoch": 31,
+ "train_loss": 4.449828500366211,
+ "train_acc": 0.06014,
+ "test_loss": 16.980024148559572,
+ "test_acc": 0.01,
+ "lyapunov": 1.515285712068953,
+ "grad_norm": 0.46991707412670536,
+ "grad_max_sv": 0.24059981070458888,
+ "grad_min_sv": 7.035010417960619e-09,
+ "grad_condition": 75974624.60279362,
+ "lr": 0.0008982649590120977,
+ "time_sec": 41.8510844707489
+ },
+ {
+ "epoch": 32,
+ "train_loss": 4.437514468383789,
+ "train_acc": 0.06294,
+ "test_loss": 18.52886298980713,
+ "test_acc": 0.01,
+ "lyapunov": 1.5204427940461336,
+ "grad_norm": 0.45125734819245583,
+ "grad_max_sv": 0.22053336799144746,
+ "grad_min_sv": 6.6175200534590585e-09,
+ "grad_condition": 48917947.725726604,
+ "lr": 0.0008918467286629196,
+ "time_sec": 41.869179248809814
+ },
+ {
+ "epoch": 33,
+ "train_loss": 4.40278786529541,
+ "train_acc": 0.06556,
+ "test_loss": 18.846385064697266,
+ "test_acc": 0.01,
+ "lyapunov": 1.4883441946390645,
+ "grad_norm": 0.45666973025646995,
+ "grad_max_sv": 0.21949558071792125,
+ "grad_min_sv": 6.802780549985954e-09,
+ "grad_condition": 36143230.241273426,
+ "lr": 0.0008852566213878943,
+ "time_sec": 41.84911870956421
+ },
+ {
+ "epoch": 34,
+ "train_loss": 4.40820367401123,
+ "train_acc": 0.06462,
+ "test_loss": 20.250594232177736,
+ "test_acc": 0.01,
+ "lyapunov": 1.4780629108019192,
+ "grad_norm": 0.4533983560833586,
+ "grad_max_sv": 0.21924315206706524,
+ "grad_min_sv": 6.449878905967488e-09,
+ "grad_condition": 45022497.55124281,
+ "lr": 0.000878497527825878,
+ "time_sec": 41.82957434654236
+ },
+ {
+ "epoch": 35,
+ "train_loss": 4.416326632080078,
+ "train_acc": 0.06346,
+ "test_loss": 18.319365844726562,
+ "test_acc": 0.01,
+ "lyapunov": 1.4840021791970333,
+ "grad_norm": 0.44153691028523245,
+ "grad_max_sv": 0.20659824572503566,
+ "grad_min_sv": 6.229376612806869e-09,
+ "grad_condition": 59088146.05455335,
+ "lr": 0.000871572412738697,
+ "time_sec": 41.850478410720825
+ },
+ {
+ "epoch": 36,
+ "train_loss": 4.408258157043457,
+ "train_acc": 0.064,
+ "test_loss": 20.95832971191406,
+ "test_acc": 0.01,
+ "lyapunov": 1.479226511152809,
+ "grad_norm": 0.4410718020248668,
+ "grad_max_sv": 0.2093581147491932,
+ "grad_min_sv": 6.282209370940539e-09,
+ "grad_condition": 105188788.23632967,
+ "lr": 0.0008644843137107055,
+ "time_sec": 41.878541469573975
+ },
+ {
+ "epoch": 37,
+ "train_loss": 4.407336394348144,
+ "train_acc": 0.06656,
+ "test_loss": 16.102902310180664,
+ "test_acc": 0.01,
+ "lyapunov": 1.4862678380268615,
+ "grad_norm": 0.44349953997935043,
+ "grad_max_sv": 0.215363934263587,
+ "grad_min_sv": 6.384406239789975e-09,
+ "grad_condition": 37599506.61324627,
+ "lr": 0.0008572363398164014,
+ "time_sec": 41.84441637992859
+ },
+ {
+ "epoch": 38,
+ "train_loss": 4.39930072052002,
+ "train_acc": 0.06716,
+ "test_loss": 14.936711614990234,
+ "test_acc": 0.01,
+ "lyapunov": 1.4831183868296005,
+ "grad_norm": 0.45835307206344844,
+ "grad_max_sv": 0.22024714946746826,
+ "grad_min_sv": 6.405372059842263e-09,
+ "grad_condition": 66702014.21939925,
+ "lr": 0.0008498316702566826,
+ "time_sec": 41.848416805267334
+ },
+ {
+ "epoch": 39,
+ "train_loss": 4.400538181915283,
+ "train_acc": 0.06598,
+ "test_loss": 16.468564752197267,
+ "test_acc": 0.01,
+ "lyapunov": 1.4876915777430815,
+ "grad_norm": 0.4485664393328264,
+ "grad_max_sv": 0.22156519442796707,
+ "grad_min_sv": 6.4785729367994316e-09,
+ "grad_condition": 280429030.69459355,
+ "lr": 0.0008422735529643442,
+ "time_sec": 41.86299443244934
+ },
+ {
+ "epoch": 40,
+ "train_loss": 4.397091385955811,
+ "train_acc": 0.06734,
+ "test_loss": 18.54481873931885,
+ "test_acc": 0.01,
+ "lyapunov": 1.4808301129914305,
+ "grad_norm": 0.4299005955382572,
+ "grad_max_sv": 0.2034155208617449,
+ "grad_min_sv": 6.2005965799361015e-09,
+ "grad_condition": 44401112.87668381,
+ "lr": 0.0008345653031794289,
+ "time_sec": 41.8275043964386
+ },
+ {
+ "epoch": 41,
+ "train_loss": 4.386424259796143,
+ "train_acc": 0.06824,
+ "test_loss": 21.206073614501953,
+ "test_acc": 0.01,
+ "lyapunov": 1.4804525152801553,
+ "grad_norm": 0.4248718447548538,
+ "grad_max_sv": 0.20124743394553662,
+ "grad_min_sv": 6.046653282243408e-09,
+ "grad_condition": 40043238.334212705,
+ "lr": 0.0008267103019950526,
+ "time_sec": 41.85425305366516
+ },
+ {
+ "epoch": 42,
+ "train_loss": 4.386167093048096,
+ "train_acc": 0.0676,
+ "test_loss": 19.16770219116211,
+ "test_acc": 0.01,
+ "lyapunov": 1.4792915119234558,
+ "grad_norm": 0.4093890186492107,
+ "grad_max_sv": 0.1878580778837204,
+ "grad_min_sv": 5.876780584390673e-09,
+ "grad_condition": 44144026.50569831,
+ "lr": 0.0008187119948743447,
+ "time_sec": 41.865527868270874
+ },
+ {
+ "epoch": 43,
+ "train_loss": 4.397055397033691,
+ "train_acc": 0.06784,
+ "test_loss": 18.22021773529053,
+ "test_acc": 0.01,
+ "lyapunov": 1.4911047723287207,
+ "grad_norm": 0.42408941793691435,
+ "grad_max_sv": 0.1856762148439884,
+ "grad_min_sv": 5.8528611551061925e-09,
+ "grad_condition": 150471528.47198898,
+ "lr": 0.000810573890139155,
+ "time_sec": 41.851991176605225
+ },
+ {
+ "epoch": 44,
+ "train_loss": 4.418051720123291,
+ "train_acc": 0.06534,
+ "test_loss": 18.890657635498048,
+ "test_acc": 0.01,
+ "lyapunov": 1.506059860634377,
+ "grad_norm": 0.41379860519627926,
+ "grad_max_sv": 0.1912920583039522,
+ "grad_min_sv": 5.7118770109554354e-09,
+ "grad_condition": 70799416.84221649,
+ "lr": 0.0008022995574311873,
+ "time_sec": 41.855762004852295
+ },
+ {
+ "epoch": 45,
+ "train_loss": 4.555874091186523,
+ "train_acc": 0.05074,
+ "test_loss": 16.445907543945314,
+ "test_acc": 0.01,
+ "lyapunov": 1.5668693082716765,
+ "grad_norm": 0.421064301771623,
+ "grad_max_sv": 0.20280106514692306,
+ "grad_min_sv": 5.1596785455299e-09,
+ "grad_condition": 50522308.14501454,
+ "lr": 0.0007938926261462363,
+ "time_sec": 41.843982219696045
+ },
+ {
+ "epoch": 46,
+ "train_loss": 4.56307541015625,
+ "train_acc": 0.04834,
+ "test_loss": 15.170621519470215,
+ "test_acc": 0.01,
+ "lyapunov": 1.5478406470754873,
+ "grad_norm": 0.4022239019959698,
+ "grad_max_sv": 0.20177871510386466,
+ "grad_min_sv": 4.925644440934018e-09,
+ "grad_condition": 51504299.42247386,
+ "lr": 0.0007853567838422158,
+ "time_sec": 41.843809366226196
+ },
+ {
+ "epoch": 47,
+ "train_loss": 4.461052338867187,
+ "train_acc": 0.06168,
+ "test_loss": 13.590689770507813,
+ "test_acc": 0.01,
+ "lyapunov": 1.539207870698036,
+ "grad_norm": 0.39483180875809476,
+ "grad_max_sv": 0.18038341253995896,
+ "grad_min_sv": 5.225175523509984e-09,
+ "grad_condition": 48416053.199461475,
+ "lr": 0.0007766957746216719,
+ "time_sec": 41.86233711242676
+ },
+ {
+ "epoch": 48,
+ "train_loss": 4.483129704589844,
+ "train_acc": 0.06082,
+ "test_loss": 15.866412992858887,
+ "test_acc": 0.01,
+ "lyapunov": 1.5564451214602537,
+ "grad_norm": 0.4001213731670661,
+ "grad_max_sv": 0.17479643113911153,
+ "grad_min_sv": 4.983967312466309e-09,
+ "grad_condition": 45597451.14778058,
+ "lr": 0.0007679133974894982,
+ "time_sec": 41.860371828079224
+ },
+ {
+ "epoch": 49,
+ "train_loss": 4.563996811523437,
+ "train_acc": 0.05704,
+ "test_loss": 14.467741319274902,
+ "test_acc": 0.01,
+ "lyapunov": 1.7151714895692323,
+ "grad_norm": 0.35765858704843245,
+ "grad_max_sv": 0.17724147401750087,
+ "grad_min_sv": 4.611558551666846e-09,
+ "grad_condition": 3652674833.016098,
+ "lr": 0.000759013504686565,
+ "time_sec": 41.88652062416077
+ },
+ {
+ "epoch": 50,
+ "train_loss": 4.699548272705078,
+ "train_acc": 0.04798,
+ "test_loss": 14.650819215393067,
+ "test_acc": 0.01,
+ "lyapunov": 1.8773073610442375,
+ "grad_norm": 0.3237139765922586,
+ "grad_max_sv": 0.18019139617681504,
+ "grad_min_sv": 4.004119223688374e-09,
+ "grad_condition": 56553030.085173145,
+ "lr": 0.0007499999999999998,
+ "time_sec": 41.8651602268219
+ },
+ {
+ "epoch": 51,
+ "train_loss": 4.856528885040283,
+ "train_acc": 0.01108,
+ "test_loss": 13.696816278076172,
+ "test_acc": 0.01,
+ "lyapunov": 1.4683626176756057,
+ "grad_norm": 0.238328597603378,
+ "grad_max_sv": 0.17753527872264385,
+ "grad_min_sv": 2.2218590706860787e-10,
+ "grad_condition": 124996343340.03922,
+ "lr": 0.0007408768370508575,
+ "time_sec": 41.89140796661377
+ },
+ {
+ "epoch": 52,
+ "train_loss": 4.859013377990722,
+ "train_acc": 0.0091,
+ "test_loss": 13.624913540649414,
+ "test_acc": 0.01,
+ "lyapunov": 1.465970806453539,
+ "grad_norm": 0.16106795495349294,
+ "grad_max_sv": 0.1110096687451005,
+ "grad_min_sv": 6.2731757239434485e-15,
+ "grad_condition": 110304236489.90335,
+ "lr": 0.0007316480175599307,
+ "time_sec": 41.900989294052124
+ },
+ {
+ "epoch": 53,
+ "train_loss": 4.851568754730224,
+ "train_acc": 0.00906,
+ "test_loss": 15.073454458618164,
+ "test_acc": 0.01,
+ "lyapunov": 1.456499196684269,
+ "grad_norm": 0.1430055471916021,
+ "grad_max_sv": 0.09564914535731077,
+ "grad_min_sv": 1.5236447104070445e-15,
+ "grad_condition": 95502112628.56236,
+ "lr": 0.0007223175895924635,
+ "time_sec": 41.87765717506409
+ },
+ {
+ "epoch": 54,
+ "train_loss": 4.851486787261963,
+ "train_acc": 0.0096,
+ "test_loss": 15.396797889709473,
+ "test_acc": 0.01,
+ "lyapunov": 1.4582891162399136,
+ "grad_norm": 0.1275918494558622,
+ "grad_max_sv": 0.07877833610400557,
+ "grad_min_sv": 1.1071724086990746e-23,
+ "grad_condition": 78778336103.16934,
+ "lr": 0.0007128896457825361,
+ "time_sec": 41.84445524215698
+ },
+ {
+ "epoch": 55,
+ "train_loss": 4.850928226623535,
+ "train_acc": 0.00872,
+ "test_loss": 14.606024462890625,
+ "test_acc": 0.01,
+ "lyapunov": 1.4591175653135684,
+ "grad_norm": 0.12323118676067203,
+ "grad_max_sv": 0.07178116273134946,
+ "grad_min_sv": 2.5052708059998736e-20,
+ "grad_condition": 71781161032.94218,
+ "lr": 0.0007033683215378998,
+ "time_sec": 41.84666895866394
+ },
+ {
+ "epoch": 56,
+ "train_loss": 4.852352551269531,
+ "train_acc": 0.0098,
+ "test_loss": 14.902420947265625,
+ "test_acc": 0.01,
+ "lyapunov": 1.4618816878789527,
+ "grad_norm": 0.114352449118403,
+ "grad_max_sv": 0.06100161336362362,
+ "grad_min_sv": 6.896960539960325e-27,
+ "grad_condition": 61001613363.62309,
+ "lr": 0.0006937577932260512,
+ "time_sec": 41.880367279052734
+ },
+ {
+ "epoch": 57,
+ "train_loss": 4.852858272247315,
+ "train_acc": 0.01102,
+ "test_loss": 14.057881980895996,
+ "test_acc": 0.01,
+ "lyapunov": 1.4654078419556094,
+ "grad_norm": 0.10881533107486291,
+ "grad_max_sv": 0.05331473303958774,
+ "grad_min_sv": 1.4012984643248171e-46,
+ "grad_condition": 53314733039.58773,
+ "lr": 0.0006840622763423388,
+ "time_sec": 41.84727120399475
+ },
+ {
+ "epoch": 58,
+ "train_loss": 4.851343263397217,
+ "train_acc": 0.01044,
+ "test_loss": 14.620996353149414,
+ "test_acc": 0.01,
+ "lyapunov": 1.4605532884597778,
+ "grad_norm": 0.11574598071345925,
+ "grad_max_sv": 0.06319006895646453,
+ "grad_min_sv": 2.802712535772941e-41,
+ "grad_condition": 63190068956.46452,
+ "lr": 0.0006742860236609073,
+ "time_sec": 41.8674533367157
+ },
+ {
+ "epoch": 59,
+ "train_loss": 4.852657847747802,
+ "train_acc": 0.0102,
+ "test_loss": 14.391234281921387,
+ "test_acc": 0.01,
+ "lyapunov": 1.4630218619275885,
+ "grad_norm": 0.1117850897535104,
+ "grad_max_sv": 0.057737766206264494,
+ "grad_min_sv": 8.962900509942182e-33,
+ "grad_condition": 57737766206.2645,
+ "lr": 0.0006644333233692913,
+ "time_sec": 41.853941679000854
+ },
+ {
+ "epoch": 60,
+ "train_loss": 4.851071483917236,
+ "train_acc": 0.00948,
+ "test_loss": 14.590808624267579,
+ "test_acc": 0.01,
+ "lyapunov": 1.4618642052726063,
+ "grad_norm": 0.10400000692897449,
+ "grad_max_sv": 0.04577720589004457,
+ "grad_min_sv": 0.0,
+ "grad_condition": 45777205890.04457,
+ "lr": 0.0006545084971874734,
+ "time_sec": 41.848552227020264
+ },
+ {
+ "epoch": 61,
+ "train_loss": 4.852240568084717,
+ "train_acc": 0.0095,
+ "test_loss": 14.59047717590332,
+ "test_acc": 0.01,
+ "lyapunov": 1.4638908500866512,
+ "grad_norm": 0.10799934715249591,
+ "grad_max_sv": 0.05035868901759386,
+ "grad_min_sv": 0.0,
+ "grad_condition": 50358689017.59386,
+ "lr": 0.0006445158984722354,
+ "time_sec": 41.850308418273926
+ },
+ {
+ "epoch": 62,
+ "train_loss": 4.852433279266357,
+ "train_acc": 0.01012,
+ "test_loss": 15.986171211242675,
+ "test_acc": 0.01,
+ "lyapunov": 1.4649500645639952,
+ "grad_norm": 0.10733331744324738,
+ "grad_max_sv": 0.05229583606123924,
+ "grad_min_sv": 0.0,
+ "grad_condition": 52295836061.23924,
+ "lr": 0.0006344599103076324,
+ "time_sec": 41.855886936187744
+ },
+ {
+ "epoch": 63,
+ "train_loss": 4.85242006362915,
+ "train_acc": 0.00952,
+ "test_loss": 13.999450773620605,
+ "test_acc": 0.01,
+ "lyapunov": 1.4631946355180667,
+ "grad_norm": 0.10887508886634635,
+ "grad_max_sv": 0.05549173932522535,
+ "grad_min_sv": 0.0,
+ "grad_condition": 55491739325.22536,
+ "lr": 0.0006243449435824269,
+ "time_sec": 41.875603675842285
+ },
+ {
+ "epoch": 64,
+ "train_loss": 4.852031197509765,
+ "train_acc": 0.00988,
+ "test_loss": 13.823671005249023,
+ "test_acc": 0.01,
+ "lyapunov": 1.46498492947015,
+ "grad_norm": 0.10631816229605466,
+ "grad_max_sv": 0.050992762017995116,
+ "grad_min_sv": 0.0,
+ "grad_condition": 50992762017.99512,
+ "lr": 0.0006141754350553275,
+ "time_sec": 41.84609389305115
+ },
+ {
+ "epoch": 65,
+ "train_loss": 4.851191096801758,
+ "train_acc": 0.01018,
+ "test_loss": 13.375173307800292,
+ "test_acc": 0.01,
+ "lyapunov": 1.4641655095093085,
+ "grad_norm": 0.1010577343573765,
+ "grad_max_sv": 0.042480578925460574,
+ "grad_min_sv": 0.0,
+ "grad_condition": 42480578925.46058,
+ "lr": 0.0006039558454088793,
+ "time_sec": 41.83738660812378
+ },
+ {
+ "epoch": 66,
+ "train_loss": 4.852197050323486,
+ "train_acc": 0.00882,
+ "test_loss": 14.165961294555665,
+ "test_acc": 0.01,
+ "lyapunov": 1.4664015864472255,
+ "grad_norm": 0.09792907198844746,
+ "grad_max_sv": 0.036209277296438816,
+ "grad_min_sv": 0.0,
+ "grad_condition": 36209277296.43882,
+ "lr": 0.000593690657292862,
+ "time_sec": 41.797043323516846
+ },
+ {
+ "epoch": 67,
+ "train_loss": 4.85130561340332,
+ "train_acc": 0.0101,
+ "test_loss": 14.011718264770508,
+ "test_acc": 0.01,
+ "lyapunov": 1.4650892686965826,
+ "grad_norm": 0.09456101481889781,
+ "grad_max_sv": 0.02113236514851451,
+ "grad_min_sv": 0.0,
+ "grad_condition": 21132365148.514507,
+ "lr": 0.0005833843733580507,
+ "time_sec": 41.754011154174805
+ },
+ {
+ "epoch": 68,
+ "train_loss": 4.852421583099365,
+ "train_acc": 0.00954,
+ "test_loss": 13.768776727294922,
+ "test_acc": 0.01,
+ "lyapunov": 1.4679525093654233,
+ "grad_norm": 0.09464764660731555,
+ "grad_max_sv": 0.025787328323349356,
+ "grad_min_sv": 0.0,
+ "grad_condition": 25787328323.349358,
+ "lr": 0.0005730415142812054,
+ "time_sec": 42.026938676834106
+ },
+ {
+ "epoch": 69,
+ "train_loss": 4.85272935760498,
+ "train_acc": 0.00984,
+ "test_loss": 13.534171914672852,
+ "test_acc": 0.01,
+ "lyapunov": 1.4685536226653078,
+ "grad_norm": 0.09557086506346626,
+ "grad_max_sv": 0.026282459730282426,
+ "grad_min_sv": 0.0,
+ "grad_condition": 26282459730.282425,
+ "lr": 0.0005626666167821517,
+ "time_sec": 41.802675008773804
+ },
+ {
+ "epoch": 70,
+ "train_loss": 4.851980906524658,
+ "train_acc": 0.01004,
+ "test_loss": 13.33881396484375,
+ "test_acc": 0.01,
+ "lyapunov": 1.4669674391026997,
+ "grad_norm": 0.09715157690608033,
+ "grad_max_sv": 0.03565134848468006,
+ "grad_min_sv": 0.0,
+ "grad_condition": 35651348484.68006,
+ "lr": 0.0005522642316338265,
+ "time_sec": 41.813010931015015
+ },
+ {
+ "epoch": 71,
+ "train_loss": 4.85278720413208,
+ "train_acc": 0.01006,
+ "test_loss": 12.802179231262206,
+ "test_acc": 0.01,
+ "lyapunov": 1.468117561791559,
+ "grad_norm": 0.09992948652871142,
+ "grad_max_sv": 0.03685425859875977,
+ "grad_min_sv": 0.0,
+ "grad_condition": 36854258598.759766,
+ "lr": 0.0005418389216661573,
+ "time_sec": 41.84488320350647
+ },
+ {
+ "epoch": 72,
+ "train_loss": 4.851398905639648,
+ "train_acc": 0.00926,
+ "test_loss": 13.120699348449707,
+ "test_acc": 0.01,
+ "lyapunov": 1.4663349237588361,
+ "grad_norm": 0.0922810139338614,
+ "grad_max_sv": 0.021838864544406533,
+ "grad_min_sv": 0.0,
+ "grad_condition": 21838864544.406532,
+ "lr": 0.0005313952597646563,
+ "time_sec": 41.80693006515503
+ },
+ {
+ "epoch": 73,
+ "train_loss": 4.852625637207031,
+ "train_acc": 0.01006,
+ "test_loss": 14.170262338256835,
+ "test_acc": 0.01,
+ "lyapunov": 1.4684231619700752,
+ "grad_norm": 0.09725476129415889,
+ "grad_max_sv": 0.03474617879837751,
+ "grad_min_sv": 0.0,
+ "grad_condition": 34746178798.37752,
+ "lr": 0.0005209378268645994,
+ "time_sec": 41.80283856391907
+ },
+ {
+ "epoch": 74,
+ "train_loss": 4.854615002288818,
+ "train_acc": 0.01012,
+ "test_loss": 13.06523247833252,
+ "test_acc": 0.01,
+ "lyapunov": 1.4741113576132927,
+ "grad_norm": 0.09355435634576315,
+ "grad_max_sv": 0.026293953135609626,
+ "grad_min_sv": 0.0,
+ "grad_condition": 26293953135.609627,
+ "lr": 0.0005104712099416781,
+ "time_sec": 41.77813935279846
+ },
+ {
+ "epoch": 75,
+ "train_loss": 4.8521118782043455,
+ "train_acc": 0.01014,
+ "test_loss": 13.227028475952148,
+ "test_acc": 0.01,
+ "lyapunov": 1.4683185632881302,
+ "grad_norm": 0.09873531057612077,
+ "grad_max_sv": 0.029217457259073855,
+ "grad_min_sv": 0.0,
+ "grad_condition": 29217457259.073853,
+ "lr": 0.0004999999999999996,
+ "time_sec": 41.80186319351196
+ },
+ {
+ "epoch": 76,
+ "train_loss": 4.8521026638793945,
+ "train_acc": 0.00974,
+ "test_loss": 13.727623275756835,
+ "test_acc": 0.01,
+ "lyapunov": 1.4683916117529126,
+ "grad_norm": 0.09359089364340291,
+ "grad_max_sv": 0.019284735713154078,
+ "grad_min_sv": 0.0,
+ "grad_condition": 19284735713.154076,
+ "lr": 0.0004895287900583212,
+ "time_sec": 41.79860997200012
+ },
+ {
+ "epoch": 77,
+ "train_loss": 4.85240275100708,
+ "train_acc": 0.00924,
+ "test_loss": 13.845351657104493,
+ "test_acc": 0.01,
+ "lyapunov": 1.469331070285319,
+ "grad_norm": 0.09291177556896672,
+ "grad_max_sv": 0.02184786768630147,
+ "grad_min_sv": 0.0,
+ "grad_condition": 21847867686.30147,
+ "lr": 0.0004790621731353997,
+ "time_sec": 41.78152871131897
+ },
+ {
+ "epoch": 78,
+ "train_loss": 4.853202556762695,
+ "train_acc": 0.0094,
+ "test_loss": 12.943718765258788,
+ "test_acc": 0.01,
+ "lyapunov": 1.4710808498475252,
+ "grad_norm": 0.09560356806636944,
+ "grad_max_sv": 0.024571862118318678,
+ "grad_min_sv": 0.0,
+ "grad_condition": 24571862118.318676,
+ "lr": 0.000468604740235343,
+ "time_sec": 41.800830364227295
+ },
+ {
+ "epoch": 79,
+ "train_loss": 4.852821475524903,
+ "train_acc": 0.00916,
+ "test_loss": 13.06967273864746,
+ "test_acc": 0.01,
+ "lyapunov": 1.4714962222691996,
+ "grad_norm": 0.09286348407291162,
+ "grad_max_sv": 0.01579846618697047,
+ "grad_min_sv": 0.0,
+ "grad_condition": 15798466186.97047,
+ "lr": 0.00045816107833384175,
+ "time_sec": 41.79053092002869
+ },
+ {
+ "epoch": 80,
+ "train_loss": 4.852609764556885,
+ "train_acc": 0.00954,
+ "test_loss": 13.320957052612306,
+ "test_acc": 0.01,
+ "lyapunov": 1.4709682016421461,
+ "grad_norm": 0.09107911624268931,
+ "grad_max_sv": 0.013279847288504242,
+ "grad_min_sv": 0.0,
+ "grad_condition": 13279847288.504242,
+ "lr": 0.0004477357683661729,
+ "time_sec": 41.762046813964844
+ },
+ {
+ "epoch": 81,
+ "train_loss": 4.851465040130615,
+ "train_acc": 0.00952,
+ "test_loss": 13.012565188598632,
+ "test_acc": 0.01,
+ "lyapunov": 1.468221844004853,
+ "grad_norm": 0.09041003134861456,
+ "grad_max_sv": 0.007651371089741588,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7651371089.741588,
+ "lr": 0.00043733338321784746,
+ "time_sec": 41.751330614089966
+ },
+ {
+ "epoch": 82,
+ "train_loss": 4.852081020355224,
+ "train_acc": 0.00966,
+ "test_loss": 12.822627255249023,
+ "test_acc": 0.01,
+ "lyapunov": 1.4696848944324972,
+ "grad_norm": 0.09065480177880879,
+ "grad_max_sv": 0.01019995305687189,
+ "grad_min_sv": 0.0,
+ "grad_condition": 10199953056.871891,
+ "lr": 0.0004269584857187939,
+ "time_sec": 41.86999726295471
+ },
+ {
+ "epoch": 83,
+ "train_loss": 4.852022810516358,
+ "train_acc": 0.00996,
+ "test_loss": 12.253762084960938,
+ "test_acc": 0.01,
+ "lyapunov": 1.4689973016529132,
+ "grad_norm": 0.09460842094540753,
+ "grad_max_sv": 0.029235992394387723,
+ "grad_min_sv": 0.0,
+ "grad_condition": 29235992394.38772,
+ "lr": 0.0004166156266419484,
+ "time_sec": 41.76723504066467
+ },
+ {
+ "epoch": 84,
+ "train_loss": 4.852035647277832,
+ "train_acc": 0.01024,
+ "test_loss": 12.115891886901855,
+ "test_acc": 0.01,
+ "lyapunov": 1.4691770165167806,
+ "grad_norm": 0.09360646750239629,
+ "grad_max_sv": 0.019934501592069866,
+ "grad_min_sv": 0.0,
+ "grad_condition": 19934501592.069862,
+ "lr": 0.0004063093427071373,
+ "time_sec": 41.82295870780945
+ },
+ {
+ "epoch": 85,
+ "train_loss": 4.852076805419922,
+ "train_acc": 0.00986,
+ "test_loss": 12.878702352905274,
+ "test_acc": 0.01,
+ "lyapunov": 1.4699803453577145,
+ "grad_norm": 0.09050948837033777,
+ "grad_max_sv": 0.010260828444734216,
+ "grad_min_sv": 0.0,
+ "grad_condition": 10260828444.734217,
+ "lr": 0.0003960441545911199,
+ "time_sec": 41.740272521972656
+ },
+ {
+ "epoch": 86,
+ "train_loss": 4.853503344268799,
+ "train_acc": 0.00942,
+ "test_loss": 13.130225515747071,
+ "test_acc": 0.01,
+ "lyapunov": 1.473677592204355,
+ "grad_norm": 0.08911124738850405,
+ "grad_max_sv": 0.0034935059491544964,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3493505949.154496,
+ "lr": 0.0003858245649446718,
+ "time_sec": 41.71459937095642
+ },
+ {
+ "epoch": 87,
+ "train_loss": 4.852846223449707,
+ "train_acc": 0.0098,
+ "test_loss": 13.668508865356445,
+ "test_acc": 0.01,
+ "lyapunov": 1.4720799718671442,
+ "grad_norm": 0.09028155404620607,
+ "grad_max_sv": 0.008756613591685891,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8756613591.685892,
+ "lr": 0.00037565505641757235,
+ "time_sec": 41.74625873565674
+ },
+ {
+ "epoch": 88,
+ "train_loss": 4.852147266693115,
+ "train_acc": 0.01,
+ "test_loss": 13.016764665222167,
+ "test_acc": 0.01,
+ "lyapunov": 1.4709450503444428,
+ "grad_norm": 0.08907329873744592,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00036554008969236695,
+ "time_sec": 41.72583556175232
+ },
+ {
+ "epoch": 89,
+ "train_loss": 4.854143925933838,
+ "train_acc": 0.00968,
+ "test_loss": 13.080362130737305,
+ "test_acc": 0.01,
+ "lyapunov": 1.4749400249832427,
+ "grad_norm": 0.09887236057674029,
+ "grad_max_sv": 0.017000502441078424,
+ "grad_min_sv": 0.0,
+ "grad_condition": 17000502441.078424,
+ "lr": 0.0003554841015277638,
+ "time_sec": 41.776273250579834
+ },
+ {
+ "epoch": 90,
+ "train_loss": 4.852338234405518,
+ "train_acc": 0.00894,
+ "test_loss": 13.206872094726563,
+ "test_acc": 0.01,
+ "lyapunov": 1.470992279784454,
+ "grad_norm": 0.08990915500150026,
+ "grad_max_sv": 0.004822738515213132,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4822738515.213132,
+ "lr": 0.000345491502812526,
+ "time_sec": 41.74059700965881
+ },
+ {
+ "epoch": 91,
+ "train_loss": 4.854439675140381,
+ "train_acc": 0.0098,
+ "test_loss": 13.193742947387696,
+ "test_acc": 0.01,
+ "lyapunov": 1.4752069266555865,
+ "grad_norm": 0.09195463137068469,
+ "grad_max_sv": 0.016309724561870097,
+ "grad_min_sv": 0.0,
+ "grad_condition": 16309724561.870098,
+ "lr": 0.0003355666766307081,
+ "time_sec": 41.72685122489929
+ },
+ {
+ "epoch": 92,
+ "train_loss": 4.852755132141113,
+ "train_acc": 0.00966,
+ "test_loss": 12.651437782287598,
+ "test_acc": 0.01,
+ "lyapunov": 1.4722728369485996,
+ "grad_norm": 0.09031090314491075,
+ "grad_max_sv": 0.013889235025271774,
+ "grad_min_sv": 0.0,
+ "grad_condition": 13889235025.27177,
+ "lr": 0.00032571397633909225,
+ "time_sec": 41.76129865646362
+ },
+ {
+ "epoch": 93,
+ "train_loss": 4.852394995727539,
+ "train_acc": 0.00978,
+ "test_loss": 13.140398934936524,
+ "test_acc": 0.01,
+ "lyapunov": 1.4706439609112947,
+ "grad_norm": 0.09896021199497843,
+ "grad_max_sv": 0.012632346572354436,
+ "grad_min_sv": 0.0,
+ "grad_condition": 12632346572.354437,
+ "lr": 0.00031593772365766094,
+ "time_sec": 41.7473201751709
+ },
+ {
+ "epoch": 94,
+ "train_loss": 4.853237281036377,
+ "train_acc": 0.00878,
+ "test_loss": 12.807959544372558,
+ "test_acc": 0.01,
+ "lyapunov": 1.4736966973985248,
+ "grad_norm": 0.09036941229411612,
+ "grad_max_sv": 0.008218426816165447,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8218426816.165448,
+ "lr": 0.0003062422067739483,
+ "time_sec": 41.732847452163696
+ },
+ {
+ "epoch": 95,
+ "train_loss": 4.852389494171143,
+ "train_acc": 0.00908,
+ "test_loss": 12.560802192687989,
+ "test_acc": 0.01,
+ "lyapunov": 1.471325798412723,
+ "grad_norm": 0.08925054999698791,
+ "grad_max_sv": 0.00795787493698299,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7957874936.982989,
+ "lr": 0.00029663167846209965,
+ "time_sec": 41.743444204330444
+ },
+ {
+ "epoch": 96,
+ "train_loss": 4.852095717926026,
+ "train_acc": 0.00964,
+ "test_loss": 12.698743003845214,
+ "test_acc": 0.01,
+ "lyapunov": 1.4707305251484941,
+ "grad_norm": 0.08980211873044659,
+ "grad_max_sv": 0.006079048849642277,
+ "grad_min_sv": 0.0,
+ "grad_condition": 6079048849.642277,
+ "lr": 0.00028711035421746345,
+ "time_sec": 41.744508266448975
+ },
+ {
+ "epoch": 97,
+ "train_loss": 4.852325097198486,
+ "train_acc": 0.00998,
+ "test_loss": 12.385714389038085,
+ "test_acc": 0.01,
+ "lyapunov": 1.4707067143886596,
+ "grad_norm": 0.09303110633276697,
+ "grad_max_sv": 0.013369420357048512,
+ "grad_min_sv": 0.0,
+ "grad_condition": 13369420357.048512,
+ "lr": 0.00027768241040753615,
+ "time_sec": 41.777459383010864
+ },
+ {
+ "epoch": 98,
+ "train_loss": 4.852114578399658,
+ "train_acc": 0.00946,
+ "test_loss": 12.616465420532226,
+ "test_acc": 0.01,
+ "lyapunov": 1.4709890193646522,
+ "grad_norm": 0.08982717043210414,
+ "grad_max_sv": 0.011742619890719652,
+ "grad_min_sv": 0.0,
+ "grad_condition": 11742619890.719652,
+ "lr": 0.00026835198244006903,
+ "time_sec": 41.74090838432312
+ },
+ {
+ "epoch": 99,
+ "train_loss": 4.852081492767334,
+ "train_acc": 0.00914,
+ "test_loss": 12.773276670837403,
+ "test_acc": 0.01,
+ "lyapunov": 1.4708703545963062,
+ "grad_norm": 0.08820725715813042,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002591231629491421,
+ "time_sec": 41.70957374572754
+ },
+ {
+ "epoch": 100,
+ "train_loss": 4.852057821807861,
+ "train_acc": 0.00854,
+ "test_loss": 12.903013801574707,
+ "test_acc": 0.01,
+ "lyapunov": 1.470713365718227,
+ "grad_norm": 0.08831333485556404,
+ "grad_max_sv": 0.001176884165033698,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1176884165.033698,
+ "lr": 0.0002499999999999997,
+ "time_sec": 41.70664095878601
+ },
+ {
+ "epoch": 101,
+ "train_loss": 4.852297632446289,
+ "train_acc": 0.0088,
+ "test_loss": 12.991321166992188,
+ "test_acc": 0.01,
+ "lyapunov": 1.471470196838574,
+ "grad_norm": 0.08844546443228318,
+ "grad_max_sv": 0.0007792085409164429,
+ "grad_min_sv": 0.0,
+ "grad_condition": 779208540.9164429,
+ "lr": 0.00024098649531343477,
+ "time_sec": 41.72946095466614
+ },
+ {
+ "epoch": 102,
+ "train_loss": 4.85340077835083,
+ "train_acc": 0.00928,
+ "test_loss": 12.494372912597656,
+ "test_acc": 0.01,
+ "lyapunov": 1.4734248584493652,
+ "grad_norm": 0.0904122316991309,
+ "grad_max_sv": 0.01403848035261035,
+ "grad_min_sv": 0.0,
+ "grad_condition": 14038480352.610352,
+ "lr": 0.0002320866025105016,
+ "time_sec": 41.72011160850525
+ },
+ {
+ "epoch": 103,
+ "train_loss": 4.8527667138671875,
+ "train_acc": 0.00854,
+ "test_loss": 13.111592295837402,
+ "test_acc": 0.01,
+ "lyapunov": 1.4726007445084164,
+ "grad_norm": 0.08932121120200033,
+ "grad_max_sv": 0.004739455413073301,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4739455413.073301,
+ "lr": 0.0002233042253783278,
+ "time_sec": 41.74779987335205
+ },
+ {
+ "epoch": 104,
+ "train_loss": 4.852004501037598,
+ "train_acc": 0.00946,
+ "test_loss": 12.720405123901367,
+ "test_acc": 0.01,
+ "lyapunov": 1.4705228412242801,
+ "grad_norm": 0.08860158464501969,
+ "grad_max_sv": 0.006343359779566527,
+ "grad_min_sv": 0.0,
+ "grad_condition": 6343359779.566526,
+ "lr": 0.000214643216157784,
+ "time_sec": 41.75279927253723
+ },
+ {
+ "epoch": 105,
+ "train_loss": 4.852732130584717,
+ "train_acc": 0.00936,
+ "test_loss": 12.728569932556152,
+ "test_acc": 0.01,
+ "lyapunov": 1.4726796906317592,
+ "grad_norm": 0.08858840001436137,
+ "grad_max_sv": 0.0021229078993201256,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2122907899.3201256,
+ "lr": 0.00020610737385376332,
+ "time_sec": 41.71723484992981
+ },
+ {
+ "epoch": 106,
+ "train_loss": 4.852207695922852,
+ "train_acc": 0.00926,
+ "test_loss": 12.709718621826172,
+ "test_acc": 0.01,
+ "lyapunov": 1.4712865084333493,
+ "grad_norm": 0.08830963721683445,
+ "grad_max_sv": 0.0027129428926855326,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2712942892.6855326,
+ "lr": 0.00019770044256881242,
+ "time_sec": 41.71148443222046
+ },
+ {
+ "epoch": 107,
+ "train_loss": 4.85225803314209,
+ "train_acc": 0.00982,
+ "test_loss": 12.837951531982421,
+ "test_acc": 0.01,
+ "lyapunov": 1.4712638537902052,
+ "grad_norm": 0.08902472521530928,
+ "grad_max_sv": 0.008135201036930084,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8135201036.930084,
+ "lr": 0.0001894261098608447,
+ "time_sec": 41.72528624534607
+ },
+ {
+ "epoch": 108,
+ "train_loss": 4.852549499511719,
+ "train_acc": 0.00936,
+ "test_loss": 13.247559573364258,
+ "test_acc": 0.01,
+ "lyapunov": 1.4724893740680822,
+ "grad_norm": 0.08825387718460724,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000181288005125655,
+ "time_sec": 41.74774885177612
+ },
+ {
+ "epoch": 109,
+ "train_loss": 4.85227595916748,
+ "train_acc": 0.00946,
+ "test_loss": 13.13632116241455,
+ "test_acc": 0.01,
+ "lyapunov": 1.471560059910845,
+ "grad_norm": 0.08956498900691849,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001732896980049473,
+ "time_sec": 41.7323522567749
+ },
+ {
+ "epoch": 110,
+ "train_loss": 4.852233708801269,
+ "train_acc": 0.00902,
+ "test_loss": 13.550802612304688,
+ "test_acc": 0.01,
+ "lyapunov": 1.4712924996910193,
+ "grad_norm": 0.08901901086212888,
+ "grad_max_sv": 0.004322580248117447,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4322580248.117447,
+ "lr": 0.00016543469682057076,
+ "time_sec": 41.74680209159851
+ },
+ {
+ "epoch": 111,
+ "train_loss": 4.852689293060303,
+ "train_acc": 0.00916,
+ "test_loss": 13.372785118103028,
+ "test_acc": 0.01,
+ "lyapunov": 1.4729326292681877,
+ "grad_norm": 0.08862372209724671,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00015772644703565552,
+ "time_sec": 41.72367000579834
+ },
+ {
+ "epoch": 112,
+ "train_loss": 4.855245245056152,
+ "train_acc": 0.00918,
+ "test_loss": 13.167806037902832,
+ "test_acc": 0.01,
+ "lyapunov": 1.4768958594792945,
+ "grad_norm": 0.08841785458131039,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00015016832974331713,
+ "time_sec": 41.73188829421997
+ },
+ {
+ "epoch": 113,
+ "train_loss": 4.852458833618164,
+ "train_acc": 0.00882,
+ "test_loss": 13.374362356567383,
+ "test_acc": 0.01,
+ "lyapunov": 1.4722495371728297,
+ "grad_norm": 0.08871568614447918,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00014276366018359834,
+ "time_sec": 41.71817493438721
+ },
+ {
+ "epoch": 114,
+ "train_loss": 4.851942072448731,
+ "train_acc": 0.00902,
+ "test_loss": 13.413740673828125,
+ "test_acc": 0.01,
+ "lyapunov": 1.4704074313878404,
+ "grad_norm": 0.08870214010553126,
+ "grad_max_sv": 0.0019620250910520553,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1962025091.0520554,
+ "lr": 0.00013551568628929425,
+ "time_sec": 41.72637939453125
+ },
+ {
+ "epoch": 115,
+ "train_loss": 4.853842346343994,
+ "train_acc": 0.00876,
+ "test_loss": 13.078753887939452,
+ "test_acc": 0.01,
+ "lyapunov": 1.4757750683733264,
+ "grad_norm": 0.08934074054242225,
+ "grad_max_sv": 0.0054347761906683445,
+ "grad_min_sv": 0.0,
+ "grad_condition": 5434776190.6683445,
+ "lr": 0.00012842758726130276,
+ "time_sec": 41.711642265319824
+ },
+ {
+ "epoch": 116,
+ "train_loss": 4.852122984466552,
+ "train_acc": 0.0092,
+ "test_loss": 13.219519885253906,
+ "test_acc": 0.01,
+ "lyapunov": 1.4712010920809968,
+ "grad_norm": 0.08808712563631747,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001215024721741218,
+ "time_sec": 41.74567747116089
+ },
+ {
+ "epoch": 117,
+ "train_loss": 4.8583870220947265,
+ "train_acc": 0.00938,
+ "test_loss": 13.296599545288085,
+ "test_acc": 0.01,
+ "lyapunov": 1.4836899404940398,
+ "grad_norm": 0.08878474499083394,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00011474337861210538,
+ "time_sec": 41.72996282577515
+ },
+ {
+ "epoch": 118,
+ "train_loss": 4.8542758628845215,
+ "train_acc": 0.0095,
+ "test_loss": 13.232178741455078,
+ "test_acc": 0.01,
+ "lyapunov": 1.476102854284789,
+ "grad_norm": 0.08869739853760654,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010815327133708009,
+ "time_sec": 41.73535418510437
+ },
+ {
+ "epoch": 119,
+ "train_loss": 4.852905385437012,
+ "train_acc": 0.00894,
+ "test_loss": 13.59550298614502,
+ "test_acc": 0.01,
+ "lyapunov": 1.4737293317799678,
+ "grad_norm": 0.08826212131432655,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010173504098790182,
+ "time_sec": 41.72545409202576
+ },
+ {
+ "epoch": 120,
+ "train_loss": 4.852262009429932,
+ "train_acc": 0.0092,
+ "test_loss": 13.53664966430664,
+ "test_acc": 0.01,
+ "lyapunov": 1.471702798248252,
+ "grad_norm": 0.08816229564695008,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 41.747995376586914
+ },
+ {
+ "epoch": 121,
+ "train_loss": 4.852286165924072,
+ "train_acc": 0.00938,
+ "test_loss": 13.543427288818359,
+ "test_acc": 0.01,
+ "lyapunov": 1.4718451771284917,
+ "grad_norm": 0.0882556097544163,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 41.71251606941223
+ },
+ {
+ "epoch": 122,
+ "train_loss": 4.852815079193115,
+ "train_acc": 0.00866,
+ "test_loss": 13.50841277770996,
+ "test_acc": 0.01,
+ "lyapunov": 1.4734657941876774,
+ "grad_norm": 0.08834171363916951,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 41.828593492507935
+ },
+ {
+ "epoch": 123,
+ "train_loss": 4.8519872172546386,
+ "train_acc": 0.0097,
+ "test_loss": 13.492674378967285,
+ "test_acc": 0.01,
+ "lyapunov": 1.470838068696239,
+ "grad_norm": 0.08874014439548912,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 41.981213331222534
+ },
+ {
+ "epoch": 124,
+ "train_loss": 4.853034484252929,
+ "train_acc": 0.009,
+ "test_loss": 13.126736920166016,
+ "test_acc": 0.01,
+ "lyapunov": 1.4740290989351394,
+ "grad_norm": 0.08813885370977613,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 41.71132040023804
+ },
+ {
+ "epoch": 125,
+ "train_loss": 4.85233381652832,
+ "train_acc": 0.00952,
+ "test_loss": 13.397762631225586,
+ "test_acc": 0.01,
+ "lyapunov": 1.471941991230411,
+ "grad_norm": 0.08812641091996891,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 41.72543954849243
+ },
+ {
+ "epoch": 126,
+ "train_loss": 4.8525572804260255,
+ "train_acc": 0.0096,
+ "test_loss": 13.308763629150391,
+ "test_acc": 0.01,
+ "lyapunov": 1.472656028349991,
+ "grad_norm": 0.08840738704987161,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 41.72384238243103
+ },
+ {
+ "epoch": 127,
+ "train_loss": 4.855584846191406,
+ "train_acc": 0.00946,
+ "test_loss": 13.759437710571289,
+ "test_acc": 0.01,
+ "lyapunov": 1.4782639266279958,
+ "grad_norm": 0.08826506573029154,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 41.73837852478027
+ },
+ {
+ "epoch": 128,
+ "train_loss": 4.85253405090332,
+ "train_acc": 0.00946,
+ "test_loss": 13.737331958007813,
+ "test_acc": 0.01,
+ "lyapunov": 1.4725991725311864,
+ "grad_norm": 0.08806307055084844,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 41.761263847351074
+ },
+ {
+ "epoch": 129,
+ "train_loss": 4.852324590759277,
+ "train_acc": 0.01,
+ "test_loss": 13.721236633300782,
+ "test_acc": 0.01,
+ "lyapunov": 1.4719348380632717,
+ "grad_norm": 0.08813587403770864,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 41.74943208694458
+ },
+ {
+ "epoch": 130,
+ "train_loss": 4.85221561340332,
+ "train_acc": 0.00954,
+ "test_loss": 13.78914153137207,
+ "test_acc": 0.01,
+ "lyapunov": 1.4716954301385319,
+ "grad_norm": 0.08851547081560074,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 41.76015615463257
+ },
+ {
+ "epoch": 131,
+ "train_loss": 4.852464799957275,
+ "train_acc": 0.00878,
+ "test_loss": 13.605609268188477,
+ "test_acc": 0.01,
+ "lyapunov": 1.4723939121226826,
+ "grad_norm": 0.08823360335901036,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 41.77037334442139
+ },
+ {
+ "epoch": 132,
+ "train_loss": 4.852380610198975,
+ "train_acc": 0.00896,
+ "test_loss": 13.703162010192871,
+ "test_acc": 0.01,
+ "lyapunov": 1.4721423701557053,
+ "grad_norm": 0.08806535417914078,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 41.78282904624939
+ },
+ {
+ "epoch": 133,
+ "train_loss": 4.853441643676758,
+ "train_acc": 0.00924,
+ "test_loss": 13.780622036743164,
+ "test_acc": 0.01,
+ "lyapunov": 1.4737608521185872,
+ "grad_norm": 0.08786943886020787,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 41.94830918312073
+ },
+ {
+ "epoch": 134,
+ "train_loss": 4.8520362255859375,
+ "train_acc": 0.00954,
+ "test_loss": 13.83701887512207,
+ "test_acc": 0.01,
+ "lyapunov": 1.471004798284272,
+ "grad_norm": 0.08837937530648805,
+ "grad_max_sv": 0.000659800786525011,
+ "grad_min_sv": 0.0,
+ "grad_condition": 659800786.5250111,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 41.915955781936646
+ },
+ {
+ "epoch": 135,
+ "train_loss": 4.852150169067383,
+ "train_acc": 0.00958,
+ "test_loss": 13.836302838134765,
+ "test_acc": 0.01,
+ "lyapunov": 1.471451068473289,
+ "grad_norm": 0.0887060490050228,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 41.69927930831909
+ },
+ {
+ "epoch": 136,
+ "train_loss": 4.853155226898194,
+ "train_acc": 0.00916,
+ "test_loss": 13.758418685913085,
+ "test_acc": 0.01,
+ "lyapunov": 1.4742048859901136,
+ "grad_norm": 0.09745955508136325,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 41.71672034263611
+ },
+ {
+ "epoch": 137,
+ "train_loss": 4.85282894165039,
+ "train_acc": 0.00928,
+ "test_loss": 13.801075386047364,
+ "test_acc": 0.01,
+ "lyapunov": 1.4736028842608948,
+ "grad_norm": 0.08838780479254947,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 41.86513018608093
+ },
+ {
+ "epoch": 138,
+ "train_loss": 4.852049649047852,
+ "train_acc": 0.00982,
+ "test_loss": 13.844301895141601,
+ "test_acc": 0.01,
+ "lyapunov": 1.4711221602871596,
+ "grad_norm": 0.0886793780466303,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 41.807748317718506
+ },
+ {
+ "epoch": 139,
+ "train_loss": 4.853534520874024,
+ "train_acc": 0.01,
+ "test_loss": 13.770389680480957,
+ "test_acc": 0.01,
+ "lyapunov": 1.4747250278282653,
+ "grad_norm": 0.08808641740018294,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 41.780285596847534
+ },
+ {
+ "epoch": 140,
+ "train_loss": 4.851904624481201,
+ "train_acc": 0.0096,
+ "test_loss": 13.713402738952636,
+ "test_acc": 0.01,
+ "lyapunov": 1.4706565852055464,
+ "grad_norm": 0.08806158709361275,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 41.71153283119202
+ },
+ {
+ "epoch": 141,
+ "train_loss": 4.852294711456299,
+ "train_acc": 0.00974,
+ "test_loss": 13.674919595336915,
+ "test_acc": 0.01,
+ "lyapunov": 1.4719334886507,
+ "grad_norm": 0.08848605705342659,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 41.75360417366028
+ },
+ {
+ "epoch": 142,
+ "train_loss": 4.852051578979492,
+ "train_acc": 0.00986,
+ "test_loss": 13.683543762207032,
+ "test_acc": 0.01,
+ "lyapunov": 1.4711576669722262,
+ "grad_norm": 0.08814132937210956,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 41.73791003227234
+ },
+ {
+ "epoch": 143,
+ "train_loss": 4.852365187683105,
+ "train_acc": 0.00984,
+ "test_loss": 13.635780154418946,
+ "test_acc": 0.01,
+ "lyapunov": 1.4721494221016573,
+ "grad_norm": 0.08862731675513442,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 41.75744414329529
+ },
+ {
+ "epoch": 144,
+ "train_loss": 4.852421789550781,
+ "train_acc": 0.00964,
+ "test_loss": 13.633413438415527,
+ "test_acc": 0.01,
+ "lyapunov": 1.4723204545047888,
+ "grad_norm": 0.08863761801039138,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 41.74138283729553
+ },
+ {
+ "epoch": 145,
+ "train_loss": 4.852283345336914,
+ "train_acc": 0.00988,
+ "test_loss": 13.618844378662109,
+ "test_acc": 0.01,
+ "lyapunov": 1.471912037990892,
+ "grad_norm": 0.08829552590637708,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 41.73318958282471
+ },
+ {
+ "epoch": 146,
+ "train_loss": 4.852081503601074,
+ "train_acc": 0.00942,
+ "test_loss": 13.636005783081055,
+ "test_acc": 0.01,
+ "lyapunov": 1.4712535944741096,
+ "grad_norm": 0.0881891115278494,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 41.7281494140625
+ },
+ {
+ "epoch": 147,
+ "train_loss": 4.851804008331299,
+ "train_acc": 0.00964,
+ "test_loss": 13.61884249420166,
+ "test_acc": 0.01,
+ "lyapunov": 1.4703791028703266,
+ "grad_norm": 0.08816211822553004,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 41.74032163619995
+ },
+ {
+ "epoch": 148,
+ "train_loss": 4.8529896348571775,
+ "train_acc": 0.0097,
+ "test_loss": 13.650962756347656,
+ "test_acc": 0.01,
+ "lyapunov": 1.4741563284793473,
+ "grad_norm": 0.08847924183215054,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 41.70267343521118
+ },
+ {
+ "epoch": 149,
+ "train_loss": 4.851896666412354,
+ "train_acc": 0.01,
+ "test_loss": 13.636007565307617,
+ "test_acc": 0.01,
+ "lyapunov": 1.470671361669555,
+ "grad_norm": 0.08871972262513622,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 41.72864389419556
+ },
+ {
+ "epoch": 150,
+ "train_loss": 4.852557410736084,
+ "train_acc": 0.01,
+ "test_loss": 13.636007955932618,
+ "test_acc": 0.01,
+ "lyapunov": 1.4727459463012187,
+ "grad_norm": 0.08844840269295245,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0,
+ "time_sec": 41.74263858795166
+ }
+ ],
+ "8": [
+ {
+ "epoch": 1,
+ "train_loss": 4.735240103759765,
+ "train_acc": 0.02524,
+ "test_loss": 4.866816416931153,
+ "test_acc": 0.0196,
+ "lyapunov": 2.026013672809162,
+ "grad_norm": 5.2515251679689285,
+ "grad_max_sv": 4.178838831186295,
+ "grad_min_sv": 9.041712029367321e-08,
+ "grad_condition": 179649161.33195654,
+ "lr": 0.0009998903417374227,
+ "time_sec": 87.18950843811035
+ },
+ {
+ "epoch": 2,
+ "train_loss": 4.5068304737854,
+ "train_acc": 0.03554,
+ "test_loss": 5.026126983642578,
+ "test_acc": 0.0173,
+ "lyapunov": 1.7496998066182636,
+ "grad_norm": 3.127286126154696,
+ "grad_max_sv": 2.359567102789879,
+ "grad_min_sv": 5.685370215550989e-08,
+ "grad_condition": 519592009.8775345,
+ "lr": 0.0009995614150494292,
+ "time_sec": 87.2297294139862
+ },
+ {
+ "epoch": 3,
+ "train_loss": 4.461366838684082,
+ "train_acc": 0.03612,
+ "test_loss": 4.588225796508789,
+ "test_acc": 0.0214,
+ "lyapunov": 1.5944948662882266,
+ "grad_norm": 1.7421788335036872,
+ "grad_max_sv": 1.159491127729416,
+ "grad_min_sv": 3.012503119736998e-08,
+ "grad_condition": 46872158.840100154,
+ "lr": 0.0009990133642141358,
+ "time_sec": 87.14756369590759
+ },
+ {
+ "epoch": 4,
+ "train_loss": 4.419443615722656,
+ "train_acc": 0.0416,
+ "test_loss": 5.286386401367188,
+ "test_acc": 0.01,
+ "lyapunov": 1.5645387861734765,
+ "grad_norm": 1.1211397301440151,
+ "grad_max_sv": 0.6769661128520965,
+ "grad_min_sv": 1.748986164784583e-08,
+ "grad_condition": 61425339.07877908,
+ "lr": 0.0009982464296247522,
+ "time_sec": 87.12213373184204
+ },
+ {
+ "epoch": 5,
+ "train_loss": 4.423492089996338,
+ "train_acc": 0.04338,
+ "test_loss": 6.2819957962036135,
+ "test_acc": 0.01,
+ "lyapunov": 1.5490608950100286,
+ "grad_norm": 0.8706870069158426,
+ "grad_max_sv": 0.5114456944167614,
+ "grad_min_sv": 1.31196238317699e-08,
+ "grad_condition": 53181583.053102724,
+ "lr": 0.0009972609476841367,
+ "time_sec": 87.13790082931519
+ },
+ {
+ "epoch": 6,
+ "train_loss": 4.523505429840088,
+ "train_acc": 0.03268,
+ "test_loss": 5.438013370513916,
+ "test_acc": 0.0125,
+ "lyapunov": 1.5594564731163747,
+ "grad_norm": 0.857804226532666,
+ "grad_max_sv": 0.49648181200027464,
+ "grad_min_sv": 1.1631784305188297e-08,
+ "grad_condition": 65912570.425740495,
+ "lr": 0.000996057350657239,
+ "time_sec": 87.11513113975525
+ },
+ {
+ "epoch": 7,
+ "train_loss": 4.491675056762696,
+ "train_acc": 0.03868,
+ "test_loss": 4.85823662109375,
+ "test_acc": 0.01,
+ "lyapunov": 1.5649392903613313,
+ "grad_norm": 0.922475970431733,
+ "grad_max_sv": 0.5282619304955005,
+ "grad_min_sv": 1.3700025544571837e-08,
+ "grad_condition": 115221136.73324652,
+ "lr": 0.000994636166481494,
+ "time_sec": 87.11052560806274
+ },
+ {
+ "epoch": 8,
+ "train_loss": 4.458245279388428,
+ "train_acc": 0.04286,
+ "test_loss": 5.0693019569396975,
+ "test_acc": 0.01,
+ "lyapunov": 1.564261608416467,
+ "grad_norm": 0.8247796151577914,
+ "grad_max_sv": 0.4666087761521339,
+ "grad_min_sv": 1.2590186138083937e-08,
+ "grad_condition": 80951881.02073678,
+ "lr": 0.0009929980185352525,
+ "time_sec": 87.10055899620056
+ },
+ {
+ "epoch": 9,
+ "train_loss": 4.479283211364746,
+ "train_acc": 0.04164,
+ "test_loss": 4.6463909927368165,
+ "test_acc": 0.01,
+ "lyapunov": 1.5368007479421317,
+ "grad_norm": 0.7899216729609227,
+ "grad_max_sv": 0.41627604588866235,
+ "grad_min_sv": 1.04147358570561e-08,
+ "grad_condition": 47679788.12689672,
+ "lr": 0.0009911436253643444,
+ "time_sec": 87.12877798080444
+ },
+ {
+ "epoch": 10,
+ "train_loss": 4.452324397583008,
+ "train_acc": 0.0458,
+ "test_loss": 4.653008950805664,
+ "test_acc": 0.01,
+ "lyapunov": 1.5427158729499564,
+ "grad_norm": 0.693102659392051,
+ "grad_max_sv": 0.39028600230813026,
+ "grad_min_sv": 9.917548506044316e-09,
+ "grad_condition": 50871255.950711094,
+ "lr": 0.0009890738003669028,
+ "time_sec": 87.09939312934875
+ },
+ {
+ "epoch": 11,
+ "train_loss": 4.498550581054688,
+ "train_acc": 0.04238,
+ "test_loss": 4.798313717651367,
+ "test_acc": 0.01,
+ "lyapunov": 1.562767594061849,
+ "grad_norm": 0.7157991404315234,
+ "grad_max_sv": 0.3735340617597103,
+ "grad_min_sv": 9.18097689817099e-09,
+ "grad_condition": 76046170.48271176,
+ "lr": 0.00098678945143658,
+ "time_sec": 87.10426044464111
+ },
+ {
+ "epoch": 12,
+ "train_loss": 4.4704539869689945,
+ "train_acc": 0.04582,
+ "test_loss": 4.7863667205810545,
+ "test_acc": 0.01,
+ "lyapunov": 1.5232323402029169,
+ "grad_norm": 0.6028364454937816,
+ "grad_max_sv": 0.332496403157711,
+ "grad_min_sv": 8.755317024156106e-09,
+ "grad_condition": 43134971.96461357,
+ "lr": 0.0009842915805643154,
+ "time_sec": 87.09469079971313
+ },
+ {
+ "epoch": 13,
+ "train_loss": 4.537702497558594,
+ "train_acc": 0.03896,
+ "test_loss": 4.654966796875,
+ "test_acc": 0.01,
+ "lyapunov": 1.54529083567812,
+ "grad_norm": 0.6292726486160667,
+ "grad_max_sv": 0.3057276763021946,
+ "grad_min_sv": 6.5090396415661e-09,
+ "grad_condition": 700356710.9321487,
+ "lr": 0.000981581283398829,
+ "time_sec": 87.09531950950623
+ },
+ {
+ "epoch": 14,
+ "train_loss": 4.620839001159668,
+ "train_acc": 0.0303,
+ "test_loss": 4.868439013671875,
+ "test_acc": 0.01,
+ "lyapunov": 1.5458131620036366,
+ "grad_norm": 0.5338695301373511,
+ "grad_max_sv": 0.29795307405292987,
+ "grad_min_sv": 5.120543077052897e-09,
+ "grad_condition": 339314023.7111832,
+ "lr": 0.0009786597487660333,
+ "time_sec": 87.12465906143188
+ },
+ {
+ "epoch": 15,
+ "train_loss": 4.513916426849366,
+ "train_acc": 0.04438,
+ "test_loss": 4.835803776550293,
+ "test_acc": 0.01,
+ "lyapunov": 1.5507933197119046,
+ "grad_norm": 0.6007957930506477,
+ "grad_max_sv": 0.3038324311375618,
+ "grad_min_sv": 6.934315210233022e-09,
+ "grad_condition": 198097346.8229193,
+ "lr": 0.0009755282581475766,
+ "time_sec": 87.08587527275085
+ },
+ {
+ "epoch": 16,
+ "train_loss": 4.492137908630371,
+ "train_acc": 0.04818,
+ "test_loss": 4.887235678100586,
+ "test_acc": 0.01,
+ "lyapunov": 1.5494948896910528,
+ "grad_norm": 0.5976636149826597,
+ "grad_max_sv": 0.30106121934950353,
+ "grad_min_sv": 7.290029437057033e-09,
+ "grad_condition": 63284303.580263734,
+ "lr": 0.0009721881851187403,
+ "time_sec": 87.09524250030518
+ },
+ {
+ "epoch": 17,
+ "train_loss": 4.575829989471435,
+ "train_acc": 0.03854,
+ "test_loss": 4.948842854309082,
+ "test_acc": 0.01,
+ "lyapunov": 1.53777074539448,
+ "grad_norm": 0.5014123935951768,
+ "grad_max_sv": 0.29032444581389427,
+ "grad_min_sv": 5.414256840086118e-09,
+ "grad_condition": 69838858.70858149,
+ "lr": 0.0009686409947459456,
+ "time_sec": 87.14909029006958
+ },
+ {
+ "epoch": 18,
+ "train_loss": 4.597054883728028,
+ "train_acc": 0.03624,
+ "test_loss": 4.844102088165283,
+ "test_acc": 0.01,
+ "lyapunov": 1.5350244057452893,
+ "grad_norm": 0.5123739316899657,
+ "grad_max_sv": 0.26398728154599665,
+ "grad_min_sv": 5.243455172138089e-09,
+ "grad_condition": 119920046.5630234,
+ "lr": 0.0009648882429441254,
+ "time_sec": 87.09620761871338
+ },
+ {
+ "epoch": 19,
+ "train_loss": 4.620368363647461,
+ "train_acc": 0.03384,
+ "test_loss": 4.720510952758789,
+ "test_acc": 0.01,
+ "lyapunov": 1.5356951705025286,
+ "grad_norm": 0.47243607957213,
+ "grad_max_sv": 0.24507929012179375,
+ "grad_min_sv": 5.088020715859898e-09,
+ "grad_condition": 57785330.0936975,
+ "lr": 0.00096093157579425,
+ "time_sec": 87.11660838127136
+ },
+ {
+ "epoch": 20,
+ "train_loss": 4.613923555145264,
+ "train_acc": 0.03756,
+ "test_loss": 5.093030418395996,
+ "test_acc": 0.01,
+ "lyapunov": 1.5330088199556942,
+ "grad_norm": 0.5270298408202432,
+ "grad_max_sv": 0.2416334819048643,
+ "grad_min_sv": 4.882703122420853e-09,
+ "grad_condition": 311593743.69228464,
+ "lr": 0.0009567727288213001,
+ "time_sec": 87.09937357902527
+ },
+ {
+ "epoch": 21,
+ "train_loss": 4.636924856567383,
+ "train_acc": 0.036,
+ "test_loss": 5.04784955368042,
+ "test_acc": 0.01,
+ "lyapunov": 1.5540363645309683,
+ "grad_norm": 0.526606906737193,
+ "grad_max_sv": 0.24690264500677586,
+ "grad_min_sv": 5.1651495895903985e-09,
+ "grad_condition": 691559676.1292815,
+ "lr": 0.0009524135262330095,
+ "time_sec": 87.11412358283997
+ },
+ {
+ "epoch": 22,
+ "train_loss": 4.679128698577881,
+ "train_acc": 0.02896,
+ "test_loss": 4.895172619628906,
+ "test_acc": 0.01,
+ "lyapunov": 1.547908184778355,
+ "grad_norm": 0.44727272149588615,
+ "grad_max_sv": 0.24925720058381556,
+ "grad_min_sv": 4.642139438126858e-09,
+ "grad_condition": 66478210.43898354,
+ "lr": 0.0009478558801197061,
+ "time_sec": 87.11094355583191
+ },
+ {
+ "epoch": 23,
+ "train_loss": 4.662371476287841,
+ "train_acc": 0.03188,
+ "test_loss": 4.795903799438476,
+ "test_acc": 0.01,
+ "lyapunov": 1.5548140889848285,
+ "grad_norm": 0.5260267923584394,
+ "grad_max_sv": 0.23556945472955704,
+ "grad_min_sv": 4.337634041588854e-09,
+ "grad_condition": 1025805594.4440111,
+ "lr": 0.000943101789615607,
+ "time_sec": 87.11297392845154
+ },
+ {
+ "epoch": 24,
+ "train_loss": 4.6645262229919435,
+ "train_acc": 0.03214,
+ "test_loss": 5.057237059783936,
+ "test_acc": 0.01,
+ "lyapunov": 1.5496064592200471,
+ "grad_norm": 0.6505246940270789,
+ "grad_max_sv": 0.2576914459466934,
+ "grad_min_sv": 4.8245041350813974e-09,
+ "grad_condition": 94704831.81255548,
+ "lr": 0.0009381533400219313,
+ "time_sec": 87.10920405387878
+ },
+ {
+ "epoch": 25,
+ "train_loss": 4.654648971710205,
+ "train_acc": 0.0322,
+ "test_loss": 5.318339912414551,
+ "test_acc": 0.01,
+ "lyapunov": 1.565699156592874,
+ "grad_norm": 0.4161938321621143,
+ "grad_max_sv": 0.2134155698120594,
+ "grad_min_sv": 3.946434762314155e-09,
+ "grad_condition": 254671281.05499464,
+ "lr": 0.0009330127018922189,
+ "time_sec": 87.13201785087585
+ },
+ {
+ "epoch": 26,
+ "train_loss": 4.791520259552002,
+ "train_acc": 0.02372,
+ "test_loss": 4.959452788543701,
+ "test_acc": 0.01,
+ "lyapunov": 1.600033207012869,
+ "grad_norm": 0.9779964796296537,
+ "grad_max_sv": 0.2255085190758109,
+ "grad_min_sv": 3.1466205011160244e-09,
+ "grad_condition": 11039609220.08119,
+ "lr": 0.000927682130080253,
+ "time_sec": 87.18698191642761
+ },
+ {
+ "epoch": 27,
+ "train_loss": 4.69488529296875,
+ "train_acc": 0.03142,
+ "test_loss": 5.3654563461303715,
+ "test_acc": 0.01,
+ "lyapunov": 1.5987402142771066,
+ "grad_norm": 0.6442328720311332,
+ "grad_max_sv": 0.23703443501144647,
+ "grad_min_sv": 3.5609615074683707e-09,
+ "grad_condition": 1745246073.6363997,
+ "lr": 0.0009221639627510072,
+ "time_sec": 87.134925365448
+ },
+ {
+ "epoch": 28,
+ "train_loss": 4.606881724700928,
+ "train_acc": 0.03926,
+ "test_loss": 4.73573546295166,
+ "test_acc": 0.0103,
+ "lyapunov": 1.5937491731570506,
+ "grad_norm": 0.4194063933325514,
+ "grad_max_sv": 0.21865120753645897,
+ "grad_min_sv": 3.87901320235591e-09,
+ "grad_condition": 523863784.21676093,
+ "lr": 0.0009164606203550494,
+ "time_sec": 87.14774799346924
+ },
+ {
+ "epoch": 29,
+ "train_loss": 4.617493250274658,
+ "train_acc": 0.03728,
+ "test_loss": 4.662520077514649,
+ "test_acc": 0.01,
+ "lyapunov": 1.596246981559812,
+ "grad_norm": 0.3789306278435458,
+ "grad_max_sv": 0.19524494409561158,
+ "grad_min_sv": 3.4768166591418737e-09,
+ "grad_condition": 236541357.234686,
+ "lr": 0.0009105746045668516,
+ "time_sec": 87.11421346664429
+ },
+ {
+ "epoch": 30,
+ "train_loss": 4.631677906799316,
+ "train_acc": 0.03778,
+ "test_loss": 6.121908515167236,
+ "test_acc": 0.01,
+ "lyapunov": 1.6226924099885593,
+ "grad_norm": 0.44716784199095383,
+ "grad_max_sv": 0.1934027548879385,
+ "grad_min_sv": 3.3855620726374116e-09,
+ "grad_condition": 581199629.6704518,
+ "lr": 0.0009045084971874733,
+ "time_sec": 87.11589574813843
+ },
+ {
+ "epoch": 31,
+ "train_loss": 4.7931158798217774,
+ "train_acc": 0.02286,
+ "test_loss": 4.620251409912109,
+ "test_acc": 0.0092,
+ "lyapunov": 1.6308694739475884,
+ "grad_norm": 0.550187770618441,
+ "grad_max_sv": 0.18949946835637094,
+ "grad_min_sv": 1.786556805578803e-09,
+ "grad_condition": 42877123442.64499,
+ "lr": 0.0008982649590120977,
+ "time_sec": 87.1836428642273
+ },
+ {
+ "epoch": 32,
+ "train_loss": 4.760539370574951,
+ "train_acc": 0.02752,
+ "test_loss": 4.657791676330566,
+ "test_acc": 0.01,
+ "lyapunov": 1.6191697065787547,
+ "grad_norm": 0.3614365919222485,
+ "grad_max_sv": 0.17497441843152045,
+ "grad_min_sv": 1.779506375100445e-09,
+ "grad_condition": 13836124253.01267,
+ "lr": 0.0008918467286629196,
+ "time_sec": 87.18445110321045
+ },
+ {
+ "epoch": 33,
+ "train_loss": 4.739889914245605,
+ "train_acc": 0.029,
+ "test_loss": 4.71790985031128,
+ "test_acc": 0.0111,
+ "lyapunov": 1.6113197523004867,
+ "grad_norm": 0.3353632004468733,
+ "grad_max_sv": 0.1673861812800169,
+ "grad_min_sv": 7.641599533418533e-10,
+ "grad_condition": 13965803361.130926,
+ "lr": 0.0008852566213878943,
+ "time_sec": 87.21766877174377
+ },
+ {
+ "epoch": 34,
+ "train_loss": 4.753917649078369,
+ "train_acc": 0.02908,
+ "test_loss": 6.4435778312683105,
+ "test_acc": 0.01,
+ "lyapunov": 1.6236087751510504,
+ "grad_norm": 0.32686722214079433,
+ "grad_max_sv": 0.16869123242795467,
+ "grad_min_sv": 5.19174209905656e-10,
+ "grad_condition": 25949866712.408104,
+ "lr": 0.000878497527825878,
+ "time_sec": 87.14275527000427
+ },
+ {
+ "epoch": 35,
+ "train_loss": 4.802844509124756,
+ "train_acc": 0.0244,
+ "test_loss": 6.557575407409668,
+ "test_acc": 0.01,
+ "lyapunov": 1.6418090259937375,
+ "grad_norm": 0.4988110566872576,
+ "grad_max_sv": 0.1611970603466034,
+ "grad_min_sv": 7.265029261023372e-10,
+ "grad_condition": 19350605239.471405,
+ "lr": 0.000871572412738697,
+ "time_sec": 87.16936993598938
+ },
+ {
+ "epoch": 36,
+ "train_loss": 4.776907616271973,
+ "train_acc": 0.02782,
+ "test_loss": 4.822451950073242,
+ "test_acc": 0.01,
+ "lyapunov": 1.649027470737467,
+ "grad_norm": 0.342256043849884,
+ "grad_max_sv": 0.15263066124171018,
+ "grad_min_sv": 1.2339334798351036e-10,
+ "grad_condition": 9338850661.261333,
+ "lr": 0.0008644843137107055,
+ "time_sec": 87.186208486557
+ },
+ {
+ "epoch": 37,
+ "train_loss": 4.772866481628418,
+ "train_acc": 0.0269,
+ "test_loss": 6.221601684570312,
+ "test_acc": 0.01,
+ "lyapunov": 1.6788606286963539,
+ "grad_norm": 0.6629649981625318,
+ "grad_max_sv": 0.17593900030478835,
+ "grad_min_sv": 2.304191549799707e-09,
+ "grad_condition": 9259298449.8995,
+ "lr": 0.0008572363398164014,
+ "time_sec": 87.18624091148376
+ },
+ {
+ "epoch": 38,
+ "train_loss": 4.77164099029541,
+ "train_acc": 0.02672,
+ "test_loss": 4.766420809936523,
+ "test_acc": 0.01,
+ "lyapunov": 1.7235305708692508,
+ "grad_norm": 0.3937581266699412,
+ "grad_max_sv": 0.17076923064887523,
+ "grad_min_sv": 4.0183006136103404e-10,
+ "grad_condition": 16063615551.021002,
+ "lr": 0.0008498316702566826,
+ "time_sec": 87.20626258850098
+ },
+ {
+ "epoch": 39,
+ "train_loss": 4.807452021179199,
+ "train_acc": 0.02832,
+ "test_loss": 4.899550021362304,
+ "test_acc": 0.01,
+ "lyapunov": 1.8249543252808358,
+ "grad_norm": 0.5715574182036978,
+ "grad_max_sv": 0.16177968972187956,
+ "grad_min_sv": 3.793029192220455e-10,
+ "grad_condition": 8307565763.804538,
+ "lr": 0.0008422735529643442,
+ "time_sec": 87.19903802871704
+ },
+ {
+ "epoch": 40,
+ "train_loss": 4.760174724121094,
+ "train_acc": 0.0279,
+ "test_loss": 5.857627616119385,
+ "test_acc": 0.01,
+ "lyapunov": 1.7056615718490327,
+ "grad_norm": 0.4256172750988047,
+ "grad_max_sv": 0.16561466939747332,
+ "grad_min_sv": 2.058724911119941e-09,
+ "grad_condition": 512180966.31238127,
+ "lr": 0.0008345653031794289,
+ "time_sec": 87.21863722801208
+ },
+ {
+ "epoch": 41,
+ "train_loss": 4.69559801071167,
+ "train_acc": 0.02966,
+ "test_loss": 5.604364262390137,
+ "test_acc": 0.01,
+ "lyapunov": 1.5935010431367722,
+ "grad_norm": 0.35011105073884097,
+ "grad_max_sv": 0.18168312907218934,
+ "grad_min_sv": 2.4247929442111626e-09,
+ "grad_condition": 93356754.736842,
+ "lr": 0.0008267103019950526,
+ "time_sec": 87.22393608093262
+ },
+ {
+ "epoch": 42,
+ "train_loss": 4.709802615814209,
+ "train_acc": 0.02616,
+ "test_loss": 4.870189538574219,
+ "test_acc": 0.01,
+ "lyapunov": 1.615870985228692,
+ "grad_norm": 0.31755349221985774,
+ "grad_max_sv": 0.17116790413856506,
+ "grad_min_sv": 2.5351133262074833e-09,
+ "grad_condition": 220960563.35692176,
+ "lr": 0.0008187119948743447,
+ "time_sec": 87.20640540122986
+ },
+ {
+ "epoch": 43,
+ "train_loss": 4.793043034057617,
+ "train_acc": 0.02262,
+ "test_loss": 5.881324156951904,
+ "test_acc": 0.01,
+ "lyapunov": 1.7521904277069795,
+ "grad_norm": 0.5590339405433944,
+ "grad_max_sv": 0.14497370515600777,
+ "grad_min_sv": 3.9279086975103414e-10,
+ "grad_condition": 19019670561.939625,
+ "lr": 0.000810573890139155,
+ "time_sec": 87.31258749961853
+ },
+ {
+ "epoch": 44,
+ "train_loss": 4.844116692810059,
+ "train_acc": 0.02276,
+ "test_loss": 5.395824824523926,
+ "test_acc": 0.01,
+ "lyapunov": 1.8710771832624664,
+ "grad_norm": 0.5293965973008694,
+ "grad_max_sv": 0.1555709108710289,
+ "grad_min_sv": 4.2711866910149697e-10,
+ "grad_condition": 14548258948.991043,
+ "lr": 0.0008022995574311873,
+ "time_sec": 87.18556952476501
+ },
+ {
+ "epoch": 45,
+ "train_loss": 4.8768616571044925,
+ "train_acc": 0.02038,
+ "test_loss": 4.61512779083252,
+ "test_acc": 0.01,
+ "lyapunov": 1.8506627338926505,
+ "grad_norm": 0.6998099846191761,
+ "grad_max_sv": 0.13765994729474187,
+ "grad_min_sv": 5.812380418716187e-11,
+ "grad_condition": 29846677946.806488,
+ "lr": 0.0007938926261462363,
+ "time_sec": 87.2240195274353
+ },
+ {
+ "epoch": 46,
+ "train_loss": 4.969230243377686,
+ "train_acc": 0.01168,
+ "test_loss": 7.386215936279297,
+ "test_acc": 0.01,
+ "lyapunov": 1.8457061924288034,
+ "grad_norm": 1.2406105764459343,
+ "grad_max_sv": 0.11906649246811866,
+ "grad_min_sv": 3.98718814026065e-11,
+ "grad_condition": 92245006784.32524,
+ "lr": 0.0007853567838422158,
+ "time_sec": 87.17690944671631
+ },
+ {
+ "epoch": 47,
+ "train_loss": 4.875964500274658,
+ "train_acc": 0.01072,
+ "test_loss": 6.527316121673584,
+ "test_acc": 0.01,
+ "lyapunov": 1.5310816859345302,
+ "grad_norm": 0.16182231228887384,
+ "grad_max_sv": 0.08984448052942753,
+ "grad_min_sv": 1.0441322375968024e-16,
+ "grad_condition": 89835727617.94872,
+ "lr": 0.0007766957746216719,
+ "time_sec": 87.1852126121521
+ },
+ {
+ "epoch": 48,
+ "train_loss": 4.875588766021728,
+ "train_acc": 0.00916,
+ "test_loss": 6.651647409820557,
+ "test_acc": 0.01,
+ "lyapunov": 1.5314356905724995,
+ "grad_norm": 0.17879068685955746,
+ "grad_max_sv": 0.09055437743663788,
+ "grad_min_sv": 2.807460538981671e-16,
+ "grad_condition": 90529399768.58862,
+ "lr": 0.0007679133974894982,
+ "time_sec": 87.19542217254639
+ },
+ {
+ "epoch": 49,
+ "train_loss": 4.874160293884278,
+ "train_acc": 0.00928,
+ "test_loss": 6.9806133621215825,
+ "test_acc": 0.01,
+ "lyapunov": 1.5310221773279293,
+ "grad_norm": 0.15914063982748972,
+ "grad_max_sv": 0.0841954169794917,
+ "grad_min_sv": 1.1028138256059021e-16,
+ "grad_condition": 84186278073.27275,
+ "lr": 0.000759013504686565,
+ "time_sec": 87.18294835090637
+ },
+ {
+ "epoch": 50,
+ "train_loss": 4.874967584228516,
+ "train_acc": 0.0088,
+ "test_loss": 7.2512130996704105,
+ "test_acc": 0.01,
+ "lyapunov": 1.531926109052985,
+ "grad_norm": 0.13359997166294424,
+ "grad_max_sv": 0.07885234858840703,
+ "grad_min_sv": 1.5449564137240798e-17,
+ "grad_condition": 78851261996.51497,
+ "lr": 0.0007499999999999998,
+ "time_sec": 87.1744954586029
+ },
+ {
+ "epoch": 51,
+ "train_loss": 4.873049064331055,
+ "train_acc": 0.00894,
+ "test_loss": 7.2680836700439455,
+ "test_acc": 0.01,
+ "lyapunov": 1.5300328816904132,
+ "grad_norm": 0.13566663059488987,
+ "grad_max_sv": 0.06801612647250295,
+ "grad_min_sv": 3.3721854663294077e-28,
+ "grad_condition": 68016126472.50293,
+ "lr": 0.0007408768370508575,
+ "time_sec": 87.2090744972229
+ },
+ {
+ "epoch": 52,
+ "train_loss": 4.8752045971679685,
+ "train_acc": 0.00998,
+ "test_loss": 7.319013902282715,
+ "test_acc": 0.01,
+ "lyapunov": 1.5358237284223746,
+ "grad_norm": 0.15295505609252377,
+ "grad_max_sv": 0.07399358823895455,
+ "grad_min_sv": 4.036005675649565e-34,
+ "grad_condition": 73993588238.95454,
+ "lr": 0.0007316480175599307,
+ "time_sec": 87.17916941642761
+ },
+ {
+ "epoch": 53,
+ "train_loss": 4.875089646759033,
+ "train_acc": 0.00932,
+ "test_loss": 6.708341079711914,
+ "test_acc": 0.01,
+ "lyapunov": 1.535219712025674,
+ "grad_norm": 0.15337946692641713,
+ "grad_max_sv": 0.0786401204764843,
+ "grad_min_sv": 9.418872962396182e-34,
+ "grad_condition": 78640120476.4843,
+ "lr": 0.0007223175895924635,
+ "time_sec": 87.19920134544373
+ },
+ {
+ "epoch": 54,
+ "train_loss": 4.8763134245300295,
+ "train_acc": 0.00954,
+ "test_loss": 7.893965859985352,
+ "test_acc": 0.01,
+ "lyapunov": 1.5382219912755826,
+ "grad_norm": 0.14430315662174414,
+ "grad_max_sv": 0.0842284008860588,
+ "grad_min_sv": 1.4016176262153585e-17,
+ "grad_condition": 84227307606.50656,
+ "lr": 0.0007128896457825361,
+ "time_sec": 87.16732549667358
+ },
+ {
+ "epoch": 55,
+ "train_loss": 4.880924655761719,
+ "train_acc": 0.00986,
+ "test_loss": 8.769433529663086,
+ "test_acc": 0.01,
+ "lyapunov": 1.5441064075435824,
+ "grad_norm": 0.16740838552751033,
+ "grad_max_sv": 0.08879097644239664,
+ "grad_min_sv": 3.0302474954849e-15,
+ "grad_condition": 88489187160.01863,
+ "lr": 0.0007033683215378998,
+ "time_sec": 87.23270034790039
+ },
+ {
+ "epoch": 56,
+ "train_loss": 4.880691115722656,
+ "train_acc": 0.00984,
+ "test_loss": 8.956744931030274,
+ "test_acc": 0.01,
+ "lyapunov": 1.5440428296623327,
+ "grad_norm": 0.169681128943872,
+ "grad_max_sv": 0.08683812469244004,
+ "grad_min_sv": 2.6780771295629216e-16,
+ "grad_condition": 86810744990.1141,
+ "lr": 0.0006937577932260512,
+ "time_sec": 87.5180823802948
+ },
+ {
+ "epoch": 57,
+ "train_loss": 4.875461320648193,
+ "train_acc": 0.00882,
+ "test_loss": 7.914718838500977,
+ "test_acc": 0.01,
+ "lyapunov": 1.5361771690266213,
+ "grad_norm": 0.13744745585086549,
+ "grad_max_sv": 0.08106257226318121,
+ "grad_min_sv": 4.602306454836924e-17,
+ "grad_condition": 81058882088.7789,
+ "lr": 0.0006840622763423388,
+ "time_sec": 87.23774647712708
+ },
+ {
+ "epoch": 58,
+ "train_loss": 4.876462248229981,
+ "train_acc": 0.0086,
+ "test_loss": 7.521480532836914,
+ "test_acc": 0.01,
+ "lyapunov": 1.5380861676867357,
+ "grad_norm": 0.1308094426729998,
+ "grad_max_sv": 0.07691145669668913,
+ "grad_min_sv": 5.2512441923478546e-21,
+ "grad_condition": 76911456255.58595,
+ "lr": 0.0006742860236609073,
+ "time_sec": 87.19443416595459
+ },
+ {
+ "epoch": 59,
+ "train_loss": 4.876125813751221,
+ "train_acc": 0.00958,
+ "test_loss": 9.108944590759277,
+ "test_acc": 0.01,
+ "lyapunov": 1.5374773286492622,
+ "grad_norm": 0.13065965995697965,
+ "grad_max_sv": 0.07693316899240017,
+ "grad_min_sv": 4.628041294277668e-28,
+ "grad_condition": 76933168992.40013,
+ "lr": 0.0006644333233692913,
+ "time_sec": 87.11430335044861
+ },
+ {
+ "epoch": 60,
+ "train_loss": 4.876531585845948,
+ "train_acc": 0.01002,
+ "test_loss": 8.708165438842773,
+ "test_acc": 0.01,
+ "lyapunov": 1.540081706193402,
+ "grad_norm": 0.12514364110494514,
+ "grad_max_sv": 0.04278304530307651,
+ "grad_min_sv": 5.111839701214236e-27,
+ "grad_condition": 42783045303.07613,
+ "lr": 0.0006545084971874734,
+ "time_sec": 87.08950901031494
+ },
+ {
+ "epoch": 61,
+ "train_loss": 4.876955277404785,
+ "train_acc": 0.00986,
+ "test_loss": 9.633759455871582,
+ "test_acc": 0.01,
+ "lyapunov": 1.5432406968777748,
+ "grad_norm": 0.13030696119131907,
+ "grad_max_sv": 0.01869940897449851,
+ "grad_min_sv": 0.0,
+ "grad_condition": 18699408974.498512,
+ "lr": 0.0006445158984722354,
+ "time_sec": 87.06369233131409
+ },
+ {
+ "epoch": 62,
+ "train_loss": 4.880256801300049,
+ "train_acc": 0.00914,
+ "test_loss": 8.106962710571288,
+ "test_acc": 0.01,
+ "lyapunov": 1.5493804704197838,
+ "grad_norm": 0.13707953455281482,
+ "grad_max_sv": 0.05703742457553744,
+ "grad_min_sv": 2.412788074144182e-18,
+ "grad_condition": 57037235841.35691,
+ "lr": 0.0006344599103076324,
+ "time_sec": 87.23956346511841
+ },
+ {
+ "epoch": 63,
+ "train_loss": 4.877262191009521,
+ "train_acc": 0.00972,
+ "test_loss": 9.24615108947754,
+ "test_acc": 0.01,
+ "lyapunov": 1.5415991502039879,
+ "grad_norm": 0.13665560919633327,
+ "grad_max_sv": 0.0726124294102192,
+ "grad_min_sv": 2.0682456318226844e-23,
+ "grad_condition": 72612429408.54066,
+ "lr": 0.0006243449435824269,
+ "time_sec": 87.23054909706116
+ },
+ {
+ "epoch": 64,
+ "train_loss": 4.87730983215332,
+ "train_acc": 0.00936,
+ "test_loss": 10.058143447875976,
+ "test_acc": 0.01,
+ "lyapunov": 1.5422342823594428,
+ "grad_norm": 0.12004208587403144,
+ "grad_max_sv": 0.06160930292680859,
+ "grad_min_sv": 0.0,
+ "grad_condition": 61609302926.80859,
+ "lr": 0.0006141754350553275,
+ "time_sec": 87.30030584335327
+ },
+ {
+ "epoch": 65,
+ "train_loss": 4.878948260040283,
+ "train_acc": 0.0093,
+ "test_loss": 9.260436712646484,
+ "test_acc": 0.01,
+ "lyapunov": 1.5483233312816571,
+ "grad_norm": 0.12423135486220072,
+ "grad_max_sv": 0.0546061669010669,
+ "grad_min_sv": 0.0,
+ "grad_condition": 54606166901.066895,
+ "lr": 0.0006039558454088793,
+ "time_sec": 87.31754422187805
+ },
+ {
+ "epoch": 66,
+ "train_loss": 4.881117270965576,
+ "train_acc": 0.00976,
+ "test_loss": 7.955686111450195,
+ "test_acc": 0.01,
+ "lyapunov": 1.5531517626989224,
+ "grad_norm": 0.1466609355894601,
+ "grad_max_sv": 0.05231738574802876,
+ "grad_min_sv": 0.0,
+ "grad_condition": 52317385748.02876,
+ "lr": 0.000593690657292862,
+ "time_sec": 87.25684475898743
+ },
+ {
+ "epoch": 67,
+ "train_loss": 4.87848960723877,
+ "train_acc": 0.0093,
+ "test_loss": 8.291721563720703,
+ "test_acc": 0.01,
+ "lyapunov": 1.5488468536635493,
+ "grad_norm": 0.13358884588524558,
+ "grad_max_sv": 0.046516909170895814,
+ "grad_min_sv": 0.0,
+ "grad_condition": 46516909170.89581,
+ "lr": 0.0005833843733580507,
+ "time_sec": 87.23024368286133
+ },
+ {
+ "epoch": 68,
+ "train_loss": 4.876251863098145,
+ "train_acc": 0.00948,
+ "test_loss": 8.313035414123535,
+ "test_acc": 0.01,
+ "lyapunov": 1.5433335642680488,
+ "grad_norm": 0.10782264609925914,
+ "grad_max_sv": 0.04402522062882781,
+ "grad_min_sv": 0.0,
+ "grad_condition": 44025220628.827805,
+ "lr": 0.0005730415142812054,
+ "time_sec": 87.16200470924377
+ },
+ {
+ "epoch": 69,
+ "train_loss": 4.877121996459961,
+ "train_acc": 0.00992,
+ "test_loss": 6.634935369110107,
+ "test_acc": 0.01,
+ "lyapunov": 1.5465551251950471,
+ "grad_norm": 0.10524482896626382,
+ "grad_max_sv": 0.03552310774102807,
+ "grad_min_sv": 0.0,
+ "grad_condition": 35523107741.02806,
+ "lr": 0.0005626666167821517,
+ "time_sec": 87.16768336296082
+ },
+ {
+ "epoch": 70,
+ "train_loss": 4.877148870697021,
+ "train_acc": 0.00924,
+ "test_loss": 5.170057612609863,
+ "test_acc": 0.01,
+ "lyapunov": 1.544044288223052,
+ "grad_norm": 0.12272040694034365,
+ "grad_max_sv": 0.042177446838468316,
+ "grad_min_sv": 0.0,
+ "grad_condition": 42177446838.46831,
+ "lr": 0.0005522642316338265,
+ "time_sec": 87.17852282524109
+ },
+ {
+ "epoch": 71,
+ "train_loss": 4.878114613800049,
+ "train_acc": 0.00918,
+ "test_loss": 5.881608570861816,
+ "test_acc": 0.01,
+ "lyapunov": 1.5485444328059321,
+ "grad_norm": 0.1267744759308649,
+ "grad_max_sv": 0.03348520016297698,
+ "grad_min_sv": 0.0,
+ "grad_condition": 33485200162.97698,
+ "lr": 0.0005418389216661573,
+ "time_sec": 87.12145924568176
+ },
+ {
+ "epoch": 72,
+ "train_loss": 4.877243146057129,
+ "train_acc": 0.00954,
+ "test_loss": 4.831268686676025,
+ "test_acc": 0.01,
+ "lyapunov": 1.5455416965362665,
+ "grad_norm": 0.11162604722177562,
+ "grad_max_sv": 0.04829189190641046,
+ "grad_min_sv": 0.0,
+ "grad_condition": 48291891906.41045,
+ "lr": 0.0005313952597646563,
+ "time_sec": 87.20591306686401
+ },
+ {
+ "epoch": 73,
+ "train_loss": 4.877523553466797,
+ "train_acc": 0.00916,
+ "test_loss": 5.21819946975708,
+ "test_acc": 0.01,
+ "lyapunov": 1.5469345262898204,
+ "grad_norm": 0.1695274830056392,
+ "grad_max_sv": 0.03528429148718715,
+ "grad_min_sv": 0.0,
+ "grad_condition": 35284291487.18715,
+ "lr": 0.0005209378268645994,
+ "time_sec": 87.15492391586304
+ },
+ {
+ "epoch": 74,
+ "train_loss": 4.878687818603516,
+ "train_acc": 0.00902,
+ "test_loss": 7.045982824707031,
+ "test_acc": 0.01,
+ "lyapunov": 1.548920457320445,
+ "grad_norm": 0.11876165619339213,
+ "grad_max_sv": 0.0398634166456759,
+ "grad_min_sv": 0.0,
+ "grad_condition": 39863416645.675896,
+ "lr": 0.0005104712099416781,
+ "time_sec": 87.20987892150879
+ },
+ {
+ "epoch": 75,
+ "train_loss": 4.8802404374694826,
+ "train_acc": 0.00952,
+ "test_loss": 5.816082705688476,
+ "test_acc": 0.01,
+ "lyapunov": 1.5510207057913856,
+ "grad_norm": 0.11814260313160607,
+ "grad_max_sv": 0.04241896355524659,
+ "grad_min_sv": 0.0,
+ "grad_condition": 42418963555.24659,
+ "lr": 0.0004999999999999996,
+ "time_sec": 87.17034125328064
+ },
+ {
+ "epoch": 76,
+ "train_loss": 4.877049774017334,
+ "train_acc": 0.01008,
+ "test_loss": 5.791509801483154,
+ "test_acc": 0.01,
+ "lyapunov": 1.545583454544282,
+ "grad_norm": 0.10644494843061181,
+ "grad_max_sv": 0.044637566059827806,
+ "grad_min_sv": 0.0,
+ "grad_condition": 44637566059.827805,
+ "lr": 0.0004895287900583212,
+ "time_sec": 87.17367744445801
+ },
+ {
+ "epoch": 77,
+ "train_loss": 4.876323641052246,
+ "train_acc": 0.00964,
+ "test_loss": 5.184193676757812,
+ "test_acc": 0.01,
+ "lyapunov": 1.5437548282506215,
+ "grad_norm": 0.10450293107653293,
+ "grad_max_sv": 0.04073738274164498,
+ "grad_min_sv": 0.0,
+ "grad_condition": 40737382741.64498,
+ "lr": 0.0004790621731353997,
+ "time_sec": 87.17853283882141
+ },
+ {
+ "epoch": 78,
+ "train_loss": 4.8809456416320804,
+ "train_acc": 0.00946,
+ "test_loss": 4.926686591339111,
+ "test_acc": 0.01,
+ "lyapunov": 1.5541882484465304,
+ "grad_norm": 0.12051319198728945,
+ "grad_max_sv": 0.033642015885561705,
+ "grad_min_sv": 0.0,
+ "grad_condition": 33642015885.561707,
+ "lr": 0.000468604740235343,
+ "time_sec": 87.15360975265503
+ },
+ {
+ "epoch": 79,
+ "train_loss": 4.878056556091309,
+ "train_acc": 0.00886,
+ "test_loss": 4.698637203979493,
+ "test_acc": 0.01,
+ "lyapunov": 1.5484835391154375,
+ "grad_norm": 0.11143972892340351,
+ "grad_max_sv": 0.03221007520332932,
+ "grad_min_sv": 0.0,
+ "grad_condition": 32210075203.329323,
+ "lr": 0.00045816107833384175,
+ "time_sec": 87.12274217605591
+ },
+ {
+ "epoch": 80,
+ "train_loss": 4.877688450622559,
+ "train_acc": 0.00998,
+ "test_loss": 4.708519946289062,
+ "test_acc": 0.01,
+ "lyapunov": 1.5479903696747996,
+ "grad_norm": 0.10853834057327462,
+ "grad_max_sv": 0.03808168638497591,
+ "grad_min_sv": 0.0,
+ "grad_condition": 38081686384.97591,
+ "lr": 0.0004477357683661729,
+ "time_sec": 87.16511940956116
+ },
+ {
+ "epoch": 81,
+ "train_loss": 4.877410650787353,
+ "train_acc": 0.00924,
+ "test_loss": 5.326217936706543,
+ "test_acc": 0.01,
+ "lyapunov": 1.5462311384318126,
+ "grad_norm": 0.1078272819076305,
+ "grad_max_sv": 0.0341941992752254,
+ "grad_min_sv": 0.0,
+ "grad_condition": 34194199275.225403,
+ "lr": 0.00043733338321784746,
+ "time_sec": 87.13259315490723
+ },
+ {
+ "epoch": 82,
+ "train_loss": 4.878852579498291,
+ "train_acc": 0.00992,
+ "test_loss": 5.124214416503906,
+ "test_acc": 0.01,
+ "lyapunov": 1.551578131783039,
+ "grad_norm": 0.11924540172549285,
+ "grad_max_sv": 0.032149143144488336,
+ "grad_min_sv": 0.0,
+ "grad_condition": 32149143144.488342,
+ "lr": 0.0004269584857187939,
+ "time_sec": 87.15441107749939
+ },
+ {
+ "epoch": 83,
+ "train_loss": 4.877541376647949,
+ "train_acc": 0.00962,
+ "test_loss": 5.2295348327636715,
+ "test_acc": 0.01,
+ "lyapunov": 1.5478261575064696,
+ "grad_norm": 0.1053498185299808,
+ "grad_max_sv": 0.026044291676953435,
+ "grad_min_sv": 0.0,
+ "grad_condition": 26044291676.953438,
+ "lr": 0.0004166156266419484,
+ "time_sec": 87.16295027732849
+ },
+ {
+ "epoch": 84,
+ "train_loss": 4.877119447631836,
+ "train_acc": 0.00984,
+ "test_loss": 5.116746160888672,
+ "test_acc": 0.01,
+ "lyapunov": 1.5470911304054358,
+ "grad_norm": 0.10156236054846617,
+ "grad_max_sv": 0.028701860643923282,
+ "grad_min_sv": 0.0,
+ "grad_condition": 28701860643.92328,
+ "lr": 0.0004063093427071373,
+ "time_sec": 87.13170576095581
+ },
+ {
+ "epoch": 85,
+ "train_loss": 4.878303242034912,
+ "train_acc": 0.01008,
+ "test_loss": 4.748899824523925,
+ "test_acc": 0.01,
+ "lyapunov": 1.5509575178556125,
+ "grad_norm": 0.1141388454907746,
+ "grad_max_sv": 0.033817021455615756,
+ "grad_min_sv": 0.0,
+ "grad_condition": 33817021455.61576,
+ "lr": 0.0003960441545911199,
+ "time_sec": 87.10089588165283
+ },
+ {
+ "epoch": 86,
+ "train_loss": 4.87876032699585,
+ "train_acc": 0.0097,
+ "test_loss": 4.651885162353516,
+ "test_acc": 0.01,
+ "lyapunov": 1.5511503161676705,
+ "grad_norm": 0.09785209813867382,
+ "grad_max_sv": 0.027630697237327695,
+ "grad_min_sv": 0.0,
+ "grad_condition": 27630697237.32769,
+ "lr": 0.0003858245649446718,
+ "time_sec": 87.0941972732544
+ },
+ {
+ "epoch": 87,
+ "train_loss": 4.877712865142822,
+ "train_acc": 0.00998,
+ "test_loss": 5.250769630432129,
+ "test_acc": 0.01,
+ "lyapunov": 1.548732325549016,
+ "grad_norm": 0.1974258085478382,
+ "grad_max_sv": 0.02602379145100713,
+ "grad_min_sv": 0.0,
+ "grad_condition": 26023791451.00713,
+ "lr": 0.00037565505641757235,
+ "time_sec": 87.11909556388855
+ },
+ {
+ "epoch": 88,
+ "train_loss": 4.877790277404785,
+ "train_acc": 0.00996,
+ "test_loss": 5.091197055053711,
+ "test_acc": 0.01,
+ "lyapunov": 1.5483774038227014,
+ "grad_norm": 0.10333331120218883,
+ "grad_max_sv": 0.03042559456080198,
+ "grad_min_sv": 0.0,
+ "grad_condition": 30425594560.801983,
+ "lr": 0.00036554008969236695,
+ "time_sec": 87.1078622341156
+ },
+ {
+ "epoch": 89,
+ "train_loss": 4.877677908020019,
+ "train_acc": 0.0099,
+ "test_loss": 5.058323477935791,
+ "test_acc": 0.01,
+ "lyapunov": 1.5483884863231494,
+ "grad_norm": 0.09905622622525881,
+ "grad_max_sv": 0.03069272106513381,
+ "grad_min_sv": 0.0,
+ "grad_condition": 30692721065.133812,
+ "lr": 0.0003554841015277638,
+ "time_sec": 87.05663800239563
+ },
+ {
+ "epoch": 90,
+ "train_loss": 4.881804440917969,
+ "train_acc": 0.0106,
+ "test_loss": 5.362990502166748,
+ "test_acc": 0.01,
+ "lyapunov": 1.553605647648082,
+ "grad_norm": 0.10267946386955158,
+ "grad_max_sv": 0.030273563507944346,
+ "grad_min_sv": 0.0,
+ "grad_condition": 30273563507.944347,
+ "lr": 0.000345491502812526,
+ "time_sec": 87.06899333000183
+ },
+ {
+ "epoch": 91,
+ "train_loss": 4.879398302917481,
+ "train_acc": 0.01,
+ "test_loss": 5.126827237701416,
+ "test_acc": 0.01,
+ "lyapunov": 1.5521758828321686,
+ "grad_norm": 0.12087522031268683,
+ "grad_max_sv": 0.03009325391612947,
+ "grad_min_sv": 0.0,
+ "grad_condition": 30093253916.129467,
+ "lr": 0.0003355666766307081,
+ "time_sec": 87.05256390571594
+ },
+ {
+ "epoch": 92,
+ "train_loss": 4.880291121673584,
+ "train_acc": 0.00988,
+ "test_loss": 5.26154695892334,
+ "test_acc": 0.01,
+ "lyapunov": 1.5549428770914102,
+ "grad_norm": 0.13231588784429352,
+ "grad_max_sv": 0.03350330209359527,
+ "grad_min_sv": 0.0,
+ "grad_condition": 33503302093.595264,
+ "lr": 0.00032571397633909225,
+ "time_sec": 87.10619926452637
+ },
+ {
+ "epoch": 93,
+ "train_loss": 4.8782078823852535,
+ "train_acc": 0.00968,
+ "test_loss": 5.271252917480469,
+ "test_acc": 0.01,
+ "lyapunov": 1.5495562916216643,
+ "grad_norm": 0.12175801600529883,
+ "grad_max_sv": 0.03186503546312451,
+ "grad_min_sv": 0.0,
+ "grad_condition": 31865035463.12451,
+ "lr": 0.00031593772365766094,
+ "time_sec": 87.12923264503479
+ },
+ {
+ "epoch": 94,
+ "train_loss": 4.87740290222168,
+ "train_acc": 0.00982,
+ "test_loss": 5.075842178344726,
+ "test_acc": 0.01,
+ "lyapunov": 1.547658307473068,
+ "grad_norm": 0.11436426699794455,
+ "grad_max_sv": 0.02530919690616429,
+ "grad_min_sv": 0.0,
+ "grad_condition": 25309196906.164288,
+ "lr": 0.0003062422067739483,
+ "time_sec": 87.08783769607544
+ },
+ {
+ "epoch": 95,
+ "train_loss": 4.877675037384034,
+ "train_acc": 0.00952,
+ "test_loss": 5.33029627532959,
+ "test_acc": 0.01,
+ "lyapunov": 1.5485165667960712,
+ "grad_norm": 0.10074303038813699,
+ "grad_max_sv": 0.03554986314848065,
+ "grad_min_sv": 0.0,
+ "grad_condition": 35549863148.48065,
+ "lr": 0.00029663167846209965,
+ "time_sec": 87.08289909362793
+ },
+ {
+ "epoch": 96,
+ "train_loss": 4.877177648620606,
+ "train_acc": 0.01022,
+ "test_loss": 5.369173509216308,
+ "test_acc": 0.01,
+ "lyapunov": 1.5468677212210262,
+ "grad_norm": 0.1013436246118025,
+ "grad_max_sv": 0.03922831532545388,
+ "grad_min_sv": 0.0,
+ "grad_condition": 39228315325.45387,
+ "lr": 0.00028711035421746345,
+ "time_sec": 87.09603428840637
+ },
+ {
+ "epoch": 97,
+ "train_loss": 4.881449295959473,
+ "train_acc": 0.00942,
+ "test_loss": 4.928601164245605,
+ "test_acc": 0.01,
+ "lyapunov": 1.5567159265508432,
+ "grad_norm": 0.10170216841041604,
+ "grad_max_sv": 0.021827650628983973,
+ "grad_min_sv": 0.0,
+ "grad_condition": 21827650628.98397,
+ "lr": 0.00027768241040753615,
+ "time_sec": 87.07169818878174
+ },
+ {
+ "epoch": 98,
+ "train_loss": 4.8775743408203125,
+ "train_acc": 0.00984,
+ "test_loss": 4.987854670715332,
+ "test_acc": 0.01,
+ "lyapunov": 1.548287238916168,
+ "grad_norm": 0.12626493811946907,
+ "grad_max_sv": 0.03011642089113593,
+ "grad_min_sv": 0.0,
+ "grad_condition": 30116420891.135933,
+ "lr": 0.00026835198244006903,
+ "time_sec": 87.164879322052
+ },
+ {
+ "epoch": 99,
+ "train_loss": 4.878459322357178,
+ "train_acc": 0.00968,
+ "test_loss": 4.931130755615234,
+ "test_acc": 0.01,
+ "lyapunov": 1.5513008421339343,
+ "grad_norm": 0.1050431882077805,
+ "grad_max_sv": 0.026918977173045276,
+ "grad_min_sv": 0.0,
+ "grad_condition": 26918977173.045277,
+ "lr": 0.0002591231629491421,
+ "time_sec": 87.06193971633911
+ },
+ {
+ "epoch": 100,
+ "train_loss": 4.877405020904541,
+ "train_acc": 0.00972,
+ "test_loss": 4.892998168182373,
+ "test_acc": 0.01,
+ "lyapunov": 1.5485746119638233,
+ "grad_norm": 0.10391039157029125,
+ "grad_max_sv": 0.009399653738364577,
+ "grad_min_sv": 0.0,
+ "grad_condition": 9399653738.364578,
+ "lr": 0.0002499999999999997,
+ "time_sec": 86.99319124221802
+ },
+ {
+ "epoch": 101,
+ "train_loss": 4.878013845367431,
+ "train_acc": 0.00972,
+ "test_loss": 4.892334498596192,
+ "test_acc": 0.01,
+ "lyapunov": 1.549886227568702,
+ "grad_norm": 0.10312805970588344,
+ "grad_max_sv": 0.020510493777692318,
+ "grad_min_sv": 0.0,
+ "grad_condition": 20510493777.692318,
+ "lr": 0.00024098649531343477,
+ "time_sec": 87.05790066719055
+ },
+ {
+ "epoch": 102,
+ "train_loss": 4.878095693969726,
+ "train_acc": 0.00976,
+ "test_loss": 4.820429385375976,
+ "test_acc": 0.01,
+ "lyapunov": 1.5501237391206004,
+ "grad_norm": 0.11558211080028734,
+ "grad_max_sv": 0.024952154234051706,
+ "grad_min_sv": 0.0,
+ "grad_condition": 24952154234.051704,
+ "lr": 0.0002320866025105016,
+ "time_sec": 87.05184125900269
+ },
+ {
+ "epoch": 103,
+ "train_loss": 4.878661685333252,
+ "train_acc": 0.01018,
+ "test_loss": 5.300121360015869,
+ "test_acc": 0.01,
+ "lyapunov": 1.551538582957919,
+ "grad_norm": 0.12567932831666664,
+ "grad_max_sv": 0.012993747182190419,
+ "grad_min_sv": 0.0,
+ "grad_condition": 12993747182.190418,
+ "lr": 0.0002233042253783278,
+ "time_sec": 87.06061792373657
+ },
+ {
+ "epoch": 104,
+ "train_loss": 4.877294933776856,
+ "train_acc": 0.0099,
+ "test_loss": 5.135670352172852,
+ "test_acc": 0.01,
+ "lyapunov": 1.5485212714470866,
+ "grad_norm": 0.09250410480818645,
+ "grad_max_sv": 0.004851618967950344,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4851618967.950345,
+ "lr": 0.000214643216157784,
+ "time_sec": 87.05238747596741
+ },
+ {
+ "epoch": 105,
+ "train_loss": 4.877063808746338,
+ "train_acc": 0.00988,
+ "test_loss": 5.725478736877442,
+ "test_acc": 0.01,
+ "lyapunov": 1.5481484466806397,
+ "grad_norm": 0.09550603539231842,
+ "grad_max_sv": 0.011385573633015155,
+ "grad_min_sv": 0.0,
+ "grad_condition": 11385573633.015156,
+ "lr": 0.00020610737385376332,
+ "time_sec": 87.0910587310791
+ },
+ {
+ "epoch": 106,
+ "train_loss": 4.877282638549804,
+ "train_acc": 0.00984,
+ "test_loss": 5.60465906829834,
+ "test_acc": 0.01,
+ "lyapunov": 1.5483009687165166,
+ "grad_norm": 0.10354511535570549,
+ "grad_max_sv": 0.02720399503596127,
+ "grad_min_sv": 0.0,
+ "grad_condition": 27203995035.961273,
+ "lr": 0.00019770044256881242,
+ "time_sec": 87.10812902450562
+ },
+ {
+ "epoch": 107,
+ "train_loss": 4.876681364440918,
+ "train_acc": 0.00976,
+ "test_loss": 5.2093520240783695,
+ "test_acc": 0.01,
+ "lyapunov": 1.5473160725420394,
+ "grad_norm": 0.09575843142426103,
+ "grad_max_sv": 0.007643958646804094,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7643958646.804095,
+ "lr": 0.0001894261098608447,
+ "time_sec": 87.00347948074341
+ },
+ {
+ "epoch": 108,
+ "train_loss": 4.878350821228027,
+ "train_acc": 0.01052,
+ "test_loss": 4.913621876525879,
+ "test_acc": 0.01,
+ "lyapunov": 1.5520180210737926,
+ "grad_norm": 0.1307850708492295,
+ "grad_max_sv": 0.016565991286188363,
+ "grad_min_sv": 0.0,
+ "grad_condition": 16565991286.188366,
+ "lr": 0.000181288005125655,
+ "time_sec": 87.0159866809845
+ },
+ {
+ "epoch": 109,
+ "train_loss": 4.876669662628174,
+ "train_acc": 0.01016,
+ "test_loss": 4.88301672668457,
+ "test_acc": 0.01,
+ "lyapunov": 1.5467288201422338,
+ "grad_norm": 0.09856162731459642,
+ "grad_max_sv": 0.014887689799070358,
+ "grad_min_sv": 0.0,
+ "grad_condition": 14887689799.070358,
+ "lr": 0.0001732896980049473,
+ "time_sec": 86.99599003791809
+ },
+ {
+ "epoch": 110,
+ "train_loss": 4.877418764038086,
+ "train_acc": 0.00988,
+ "test_loss": 5.01456753540039,
+ "test_acc": 0.01,
+ "lyapunov": 1.549457520170285,
+ "grad_norm": 0.11878011333313225,
+ "grad_max_sv": 0.005905823782086372,
+ "grad_min_sv": 0.0,
+ "grad_condition": 5905823782.086372,
+ "lr": 0.00016543469682057076,
+ "time_sec": 87.00050139427185
+ },
+ {
+ "epoch": 111,
+ "train_loss": 4.877375203704834,
+ "train_acc": 0.01016,
+ "test_loss": 4.923972444152832,
+ "test_acc": 0.01,
+ "lyapunov": 1.549215167074862,
+ "grad_norm": 0.11051840491520531,
+ "grad_max_sv": 0.007604151451960206,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7604151451.960205,
+ "lr": 0.00015772644703565552,
+ "time_sec": 87.03872609138489
+ },
+ {
+ "epoch": 112,
+ "train_loss": 4.87747160736084,
+ "train_acc": 0.0097,
+ "test_loss": 4.956568124389649,
+ "test_acc": 0.01,
+ "lyapunov": 1.5494032619554368,
+ "grad_norm": 0.11381662366828246,
+ "grad_max_sv": 0.01119147464632988,
+ "grad_min_sv": 0.0,
+ "grad_condition": 11191474646.32988,
+ "lr": 0.00015016832974331713,
+ "time_sec": 87.11299419403076
+ },
+ {
+ "epoch": 113,
+ "train_loss": 4.87979639755249,
+ "train_acc": 0.01012,
+ "test_loss": 4.926776232910156,
+ "test_acc": 0.01,
+ "lyapunov": 1.5544771361533942,
+ "grad_norm": 0.15709933765078352,
+ "grad_max_sv": 0.00347123583778739,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3471235837.78739,
+ "lr": 0.00014276366018359834,
+ "time_sec": 87.06232452392578
+ },
+ {
+ "epoch": 114,
+ "train_loss": 4.878047005310059,
+ "train_acc": 0.00952,
+ "test_loss": 4.92212592086792,
+ "test_acc": 0.01,
+ "lyapunov": 1.5507129702116826,
+ "grad_norm": 0.10294832245991155,
+ "grad_max_sv": 0.012609629379585385,
+ "grad_min_sv": 0.0,
+ "grad_condition": 12609629379.585384,
+ "lr": 0.00013551568628929425,
+ "time_sec": 87.06694340705872
+ },
+ {
+ "epoch": 115,
+ "train_loss": 4.877151131134033,
+ "train_acc": 0.0092,
+ "test_loss": 4.918728126525879,
+ "test_acc": 0.01,
+ "lyapunov": 1.548615127878116,
+ "grad_norm": 0.10263613090186025,
+ "grad_max_sv": 0.006314583634957671,
+ "grad_min_sv": 0.0,
+ "grad_condition": 6314583634.957671,
+ "lr": 0.00012842758726130276,
+ "time_sec": 87.03067350387573
+ },
+ {
+ "epoch": 116,
+ "train_loss": 4.87786820098877,
+ "train_acc": 0.00982,
+ "test_loss": 5.00487536239624,
+ "test_acc": 0.01,
+ "lyapunov": 1.5504866353691082,
+ "grad_norm": 0.12269127259842373,
+ "grad_max_sv": 0.014170486759394408,
+ "grad_min_sv": 0.0,
+ "grad_condition": 14170486759.39441,
+ "lr": 0.0001215024721741218,
+ "time_sec": 87.00306367874146
+ },
+ {
+ "epoch": 117,
+ "train_loss": 4.876784671478272,
+ "train_acc": 0.00974,
+ "test_loss": 5.023514326477051,
+ "test_acc": 0.01,
+ "lyapunov": 1.5474366047193326,
+ "grad_norm": 0.10427521316985092,
+ "grad_max_sv": 0.004411047184839844,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4411047184.839845,
+ "lr": 0.00011474337861210538,
+ "time_sec": 87.03306269645691
+ },
+ {
+ "epoch": 118,
+ "train_loss": 4.877164349365234,
+ "train_acc": 0.01002,
+ "test_loss": 4.991419695281983,
+ "test_acc": 0.01,
+ "lyapunov": 1.5484020453889658,
+ "grad_norm": 0.10471789513305493,
+ "grad_max_sv": 0.008587307529523969,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8587307529.523969,
+ "lr": 0.00010815327133708009,
+ "time_sec": 87.06011486053467
+ },
+ {
+ "epoch": 119,
+ "train_loss": 4.876861254577637,
+ "train_acc": 0.00988,
+ "test_loss": 5.089453727722168,
+ "test_acc": 0.01,
+ "lyapunov": 1.5475890602906952,
+ "grad_norm": 0.10992180658040822,
+ "grad_max_sv": 0.009593591233715415,
+ "grad_min_sv": 0.0,
+ "grad_condition": 9593591233.715414,
+ "lr": 0.00010173504098790182,
+ "time_sec": 87.0181610584259
+ },
+ {
+ "epoch": 120,
+ "train_loss": 4.87691458618164,
+ "train_acc": 0.00984,
+ "test_loss": 5.0014659088134765,
+ "test_acc": 0.01,
+ "lyapunov": 1.5480926106957829,
+ "grad_norm": 0.10767138662291806,
+ "grad_max_sv": 0.0038278432097285987,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3827843209.728598,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 86.99478530883789
+ },
+ {
+ "epoch": 121,
+ "train_loss": 4.877940362548828,
+ "train_acc": 0.00962,
+ "test_loss": 4.935777435302734,
+ "test_acc": 0.01,
+ "lyapunov": 1.5509431261540678,
+ "grad_norm": 0.13054112707845358,
+ "grad_max_sv": 0.006552627170458436,
+ "grad_min_sv": 0.0,
+ "grad_condition": 6552627170.458437,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 87.0364146232605
+ },
+ {
+ "epoch": 122,
+ "train_loss": 4.877626941223144,
+ "train_acc": 0.01018,
+ "test_loss": 4.956711478424072,
+ "test_acc": 0.01,
+ "lyapunov": 1.549799994434542,
+ "grad_norm": 0.12579422138988705,
+ "grad_max_sv": 0.012472250685095786,
+ "grad_min_sv": 0.0,
+ "grad_condition": 12472250685.095787,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 87.04438400268555
+ },
+ {
+ "epoch": 123,
+ "train_loss": 4.8773612213134765,
+ "train_acc": 0.01028,
+ "test_loss": 5.112759294128418,
+ "test_acc": 0.01,
+ "lyapunov": 1.5493231264831464,
+ "grad_norm": 0.11869948278714595,
+ "grad_max_sv": 0.006990070082247257,
+ "grad_min_sv": 0.0,
+ "grad_condition": 6990070082.247256,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 87.04442477226257
+ },
+ {
+ "epoch": 124,
+ "train_loss": 4.876904801330566,
+ "train_acc": 0.00974,
+ "test_loss": 5.0848597717285156,
+ "test_acc": 0.01,
+ "lyapunov": 1.547949957725642,
+ "grad_norm": 0.11622328135609243,
+ "grad_max_sv": 0.00592916551977396,
+ "grad_min_sv": 0.0,
+ "grad_condition": 5929165519.773959,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 87.02583312988281
+ },
+ {
+ "epoch": 125,
+ "train_loss": 4.876884867248535,
+ "train_acc": 0.00994,
+ "test_loss": 5.093001669311524,
+ "test_acc": 0.01,
+ "lyapunov": 1.5479519553196706,
+ "grad_norm": 0.11394234129927898,
+ "grad_max_sv": 0.003486808715388179,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3486808715.388179,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 87.01634311676025
+ },
+ {
+ "epoch": 126,
+ "train_loss": 4.87686362991333,
+ "train_acc": 0.00962,
+ "test_loss": 5.044818876647949,
+ "test_acc": 0.01,
+ "lyapunov": 1.5478015985635236,
+ "grad_norm": 0.11528475995319568,
+ "grad_max_sv": 0.01741538755595684,
+ "grad_min_sv": 0.0,
+ "grad_condition": 17415387555.95684,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 87.03749418258667
+ },
+ {
+ "epoch": 127,
+ "train_loss": 4.877244481811523,
+ "train_acc": 0.00992,
+ "test_loss": 5.0011329849243165,
+ "test_acc": 0.01,
+ "lyapunov": 1.5490661807682202,
+ "grad_norm": 0.11235050252375584,
+ "grad_max_sv": 0.0023714601527899505,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2371460152.7899504,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 87.06668877601624
+ },
+ {
+ "epoch": 128,
+ "train_loss": 4.877482815856934,
+ "train_acc": 0.01004,
+ "test_loss": 5.234975555419922,
+ "test_acc": 0.01,
+ "lyapunov": 1.549882313784431,
+ "grad_norm": 0.11546242652617031,
+ "grad_max_sv": 0.0007256413344293832,
+ "grad_min_sv": 0.0,
+ "grad_condition": 725641334.4293833,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 87.02991795539856
+ },
+ {
+ "epoch": 129,
+ "train_loss": 4.8767640072631835,
+ "train_acc": 0.01006,
+ "test_loss": 5.377161560821533,
+ "test_acc": 0.01,
+ "lyapunov": 1.5474718257289408,
+ "grad_norm": 0.12203371483427425,
+ "grad_max_sv": 0.016016411827877164,
+ "grad_min_sv": 0.0,
+ "grad_condition": 16016411827.877163,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 87.09737348556519
+ },
+ {
+ "epoch": 130,
+ "train_loss": 4.8772621307373045,
+ "train_acc": 0.00994,
+ "test_loss": 5.146733520507812,
+ "test_acc": 0.01,
+ "lyapunov": 1.5492317725325484,
+ "grad_norm": 0.13239853793431725,
+ "grad_max_sv": 0.007805489096790552,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7805489096.790552,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 87.02493596076965
+ },
+ {
+ "epoch": 131,
+ "train_loss": 4.878482946472168,
+ "train_acc": 0.01002,
+ "test_loss": 5.187312270355225,
+ "test_acc": 0.01,
+ "lyapunov": 1.5515824739280564,
+ "grad_norm": 0.13050261520417258,
+ "grad_max_sv": 0.003781923418864608,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3781923418.8646073,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 87.00766158103943
+ },
+ {
+ "epoch": 132,
+ "train_loss": 4.8773687062072755,
+ "train_acc": 0.01038,
+ "test_loss": 5.233526524353027,
+ "test_acc": 0.01,
+ "lyapunov": 1.5493864241768331,
+ "grad_norm": 0.13275623808990364,
+ "grad_max_sv": 0.00900785457342863,
+ "grad_min_sv": 0.0,
+ "grad_condition": 9007854573.42863,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 87.07332277297974
+ },
+ {
+ "epoch": 133,
+ "train_loss": 4.877119999389649,
+ "train_acc": 0.01,
+ "test_loss": 5.208364566040039,
+ "test_acc": 0.01,
+ "lyapunov": 1.5486897553324395,
+ "grad_norm": 0.13669667117137443,
+ "grad_max_sv": 0.0031375800725072624,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3137580072.507262,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 87.08415913581848
+ },
+ {
+ "epoch": 134,
+ "train_loss": 4.876680097198486,
+ "train_acc": 0.01026,
+ "test_loss": 5.228788011169434,
+ "test_acc": 0.01,
+ "lyapunov": 1.5476158646976246,
+ "grad_norm": 0.1315586247563803,
+ "grad_max_sv": 0.0019336893223226071,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1933689322.322607,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 87.04997158050537
+ },
+ {
+ "epoch": 135,
+ "train_loss": 4.877045626525879,
+ "train_acc": 0.00998,
+ "test_loss": 5.150844607543945,
+ "test_acc": 0.01,
+ "lyapunov": 1.5484065021700262,
+ "grad_norm": 0.16019208167708357,
+ "grad_max_sv": 0.0067828110419213775,
+ "grad_min_sv": 0.0,
+ "grad_condition": 6782811041.921377,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 87.07145261764526
+ },
+ {
+ "epoch": 136,
+ "train_loss": 4.877011717224121,
+ "train_acc": 0.00942,
+ "test_loss": 5.185321200561523,
+ "test_acc": 0.01,
+ "lyapunov": 1.5481893522355257,
+ "grad_norm": 0.16513336675938264,
+ "grad_max_sv": 0.006155044818297028,
+ "grad_min_sv": 0.0,
+ "grad_condition": 6155044818.297029,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 87.08501839637756
+ },
+ {
+ "epoch": 137,
+ "train_loss": 4.877299792480469,
+ "train_acc": 0.00994,
+ "test_loss": 5.153644463348389,
+ "test_acc": 0.01,
+ "lyapunov": 1.5492148905458962,
+ "grad_norm": 0.14657870229772474,
+ "grad_max_sv": 0.007406354090198875,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7406354090.1988735,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 87.17517495155334
+ },
+ {
+ "epoch": 138,
+ "train_loss": 4.877124798736572,
+ "train_acc": 0.01016,
+ "test_loss": 5.164669793701172,
+ "test_acc": 0.01,
+ "lyapunov": 1.548459598170522,
+ "grad_norm": 0.15457514508897918,
+ "grad_max_sv": 0.012952858628705145,
+ "grad_min_sv": 0.0,
+ "grad_condition": 12952858628.705143,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 87.19324207305908
+ },
+ {
+ "epoch": 139,
+ "train_loss": 4.877282972564697,
+ "train_acc": 0.00982,
+ "test_loss": 5.207451676940918,
+ "test_acc": 0.01,
+ "lyapunov": 1.5492830764302208,
+ "grad_norm": 0.18425099220738375,
+ "grad_max_sv": 0.0019508119206875564,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1950811920.6875565,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 87.13183116912842
+ },
+ {
+ "epoch": 140,
+ "train_loss": 4.877498146057129,
+ "train_acc": 0.00968,
+ "test_loss": 5.200590103149414,
+ "test_acc": 0.01,
+ "lyapunov": 1.5491700614504802,
+ "grad_norm": 0.1734732516042842,
+ "grad_max_sv": 0.01371888890862465,
+ "grad_min_sv": 0.0,
+ "grad_condition": 13718888908.62465,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 87.21231150627136
+ },
+ {
+ "epoch": 141,
+ "train_loss": 4.8770866912841795,
+ "train_acc": 0.00992,
+ "test_loss": 5.190837601470947,
+ "test_acc": 0.01,
+ "lyapunov": 1.548795386653422,
+ "grad_norm": 0.14753103772737095,
+ "grad_max_sv": 0.005145562486723066,
+ "grad_min_sv": 0.0,
+ "grad_condition": 5145562486.723065,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 87.26526665687561
+ },
+ {
+ "epoch": 142,
+ "train_loss": 4.8766608699035645,
+ "train_acc": 0.00968,
+ "test_loss": 5.162030874633789,
+ "test_acc": 0.01,
+ "lyapunov": 1.5475660821665889,
+ "grad_norm": 0.15219397900813178,
+ "grad_max_sv": 0.005608938308432699,
+ "grad_min_sv": 0.0,
+ "grad_condition": 5608938308.432698,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 87.12494492530823
+ },
+ {
+ "epoch": 143,
+ "train_loss": 4.8769151321411135,
+ "train_acc": 0.01004,
+ "test_loss": 5.153072937011719,
+ "test_acc": 0.01,
+ "lyapunov": 1.5482893115114373,
+ "grad_norm": 0.15346228098731488,
+ "grad_max_sv": 0.001303949998691678,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1303949998.691678,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 87.097491979599
+ },
+ {
+ "epoch": 144,
+ "train_loss": 4.877143389892578,
+ "train_acc": 0.0097,
+ "test_loss": 5.164535620117188,
+ "test_acc": 0.01,
+ "lyapunov": 1.5487491736936447,
+ "grad_norm": 0.15811775595604075,
+ "grad_max_sv": 0.008902552211657167,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8902552211.657166,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 87.06983470916748
+ },
+ {
+ "epoch": 145,
+ "train_loss": 4.876982822113037,
+ "train_acc": 0.00984,
+ "test_loss": 5.165194831848145,
+ "test_acc": 0.01,
+ "lyapunov": 1.5484599853720507,
+ "grad_norm": 0.1582019401241392,
+ "grad_max_sv": 0.004445526329800486,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4445526329.800487,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 87.08561754226685
+ },
+ {
+ "epoch": 146,
+ "train_loss": 4.876878872375488,
+ "train_acc": 0.00992,
+ "test_loss": 5.165199098205567,
+ "test_acc": 0.01,
+ "lyapunov": 1.5481780770489626,
+ "grad_norm": 0.16041164237051417,
+ "grad_max_sv": 0.003941980935633182,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3941980935.6331825,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 87.0421531200409
+ },
+ {
+ "epoch": 147,
+ "train_loss": 4.8771999089050295,
+ "train_acc": 0.01004,
+ "test_loss": 5.164550498199463,
+ "test_acc": 0.01,
+ "lyapunov": 1.5491338004846402,
+ "grad_norm": 0.16309259034155005,
+ "grad_max_sv": 0.004459652304649353,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4459652304.649353,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 87.06988906860352
+ },
+ {
+ "epoch": 148,
+ "train_loss": 4.876641088562011,
+ "train_acc": 0.00982,
+ "test_loss": 5.164551524353027,
+ "test_acc": 0.01,
+ "lyapunov": 1.5472115714226842,
+ "grad_norm": 0.15826813584085664,
+ "grad_max_sv": 0.008349275542423129,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8349275542.423129,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 87.10272812843323
+ },
+ {
+ "epoch": 149,
+ "train_loss": 4.877132370300293,
+ "train_acc": 0.01012,
+ "test_loss": 5.164552142333984,
+ "test_acc": 0.01,
+ "lyapunov": 1.5489305702926557,
+ "grad_norm": 0.15991562154962183,
+ "grad_max_sv": 0.0012625465169548988,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1262546516.9548988,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 87.08622741699219
+ },
+ {
+ "epoch": 150,
+ "train_loss": 4.876020973968505,
+ "train_acc": 0.0099,
+ "test_loss": 5.164552197265625,
+ "test_acc": 0.01,
+ "lyapunov": 1.545588637251988,
+ "grad_norm": 0.16382667555465003,
+ "grad_max_sv": 0.008686219714581967,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8686219714.581966,
+ "lr": 0.0,
+ "time_sec": 87.09966802597046
+ }
+ ],
+ "12": [
+ {
+ "epoch": 1,
+ "train_loss": 4.855030886230469,
+ "train_acc": 0.0148,
+ "test_loss": 4.869620406341553,
+ "test_acc": 0.01,
+ "lyapunov": 2.2862052685769316,
+ "grad_norm": 4.935339749560766,
+ "grad_max_sv": 4.1397371053695675,
+ "grad_min_sv": 8.49077093301176e-08,
+ "grad_condition": 60021939.87195291,
+ "lr": 0.0009998903417374227,
+ "time_sec": 132.66977620124817
+ },
+ {
+ "epoch": 2,
+ "train_loss": 4.676363162231445,
+ "train_acc": 0.01706,
+ "test_loss": 4.653746462249756,
+ "test_acc": 0.01,
+ "lyapunov": 1.9439213897870935,
+ "grad_norm": 2.813935189124443,
+ "grad_max_sv": 2.2243280917406083,
+ "grad_min_sv": 4.668241500582759e-08,
+ "grad_condition": 69883158.92021513,
+ "lr": 0.0009995614150494292,
+ "time_sec": 132.62859869003296
+ },
+ {
+ "epoch": 3,
+ "train_loss": 4.635125137634278,
+ "train_acc": 0.0156,
+ "test_loss": 4.85989921875,
+ "test_acc": 0.01,
+ "lyapunov": 1.709093817359651,
+ "grad_norm": 1.402581704275357,
+ "grad_max_sv": 1.0371076561510564,
+ "grad_min_sv": 1.9744334944187383e-08,
+ "grad_condition": 12965122527.521233,
+ "lr": 0.0009990133642141358,
+ "time_sec": 132.57633781433105
+ },
+ {
+ "epoch": 4,
+ "train_loss": 4.640354335479737,
+ "train_acc": 0.01534,
+ "test_loss": 4.637619474792481,
+ "test_acc": 0.01,
+ "lyapunov": 1.6715390605999685,
+ "grad_norm": 0.9398579368308534,
+ "grad_max_sv": 0.6633182838559151,
+ "grad_min_sv": 1.2069862256511819e-08,
+ "grad_condition": 8530355196.976077,
+ "lr": 0.0009982464296247522,
+ "time_sec": 132.54676032066345
+ },
+ {
+ "epoch": 5,
+ "train_loss": 4.64221305480957,
+ "train_acc": 0.01564,
+ "test_loss": 4.680573092651367,
+ "test_acc": 0.01,
+ "lyapunov": 1.657093484688293,
+ "grad_norm": 0.552135234831364,
+ "grad_max_sv": 0.3695975001901388,
+ "grad_min_sv": 2.375610143283509e-09,
+ "grad_condition": 53738580663.96106,
+ "lr": 0.0009972609476841367,
+ "time_sec": 132.5168435573578
+ },
+ {
+ "epoch": 6,
+ "train_loss": 4.6413539511108395,
+ "train_acc": 0.01584,
+ "test_loss": 5.049699407958984,
+ "test_acc": 0.0103,
+ "lyapunov": 1.6153722675255193,
+ "grad_norm": 0.5032723336212916,
+ "grad_max_sv": 0.3346161611378193,
+ "grad_min_sv": 1.7202862416924891e-09,
+ "grad_condition": 61330096051.013405,
+ "lr": 0.000996057350657239,
+ "time_sec": 132.53665018081665
+ },
+ {
+ "epoch": 7,
+ "train_loss": 4.6673028504943845,
+ "train_acc": 0.01474,
+ "test_loss": 4.570369634246826,
+ "test_acc": 0.0114,
+ "lyapunov": 1.6155120164841947,
+ "grad_norm": 0.406883512526028,
+ "grad_max_sv": 0.2576971501111984,
+ "grad_min_sv": 1.9000999133456468e-10,
+ "grad_condition": 77661364868.79805,
+ "lr": 0.000994636166481494,
+ "time_sec": 132.51018714904785
+ },
+ {
+ "epoch": 8,
+ "train_loss": 4.760079259643555,
+ "train_acc": 0.01052,
+ "test_loss": 4.907698545074463,
+ "test_acc": 0.01,
+ "lyapunov": 1.5642740458173825,
+ "grad_norm": 0.7987649812847755,
+ "grad_max_sv": 0.6862246070057154,
+ "grad_min_sv": 1.0877307097171696e-08,
+ "grad_condition": 32321166738.690815,
+ "lr": 0.0009929980185352525,
+ "time_sec": 132.5572907924652
+ },
+ {
+ "epoch": 9,
+ "train_loss": 4.772606210021973,
+ "train_acc": 0.00996,
+ "test_loss": 4.704743336486817,
+ "test_acc": 0.01,
+ "lyapunov": 1.5716174904952573,
+ "grad_norm": 0.8148548143851404,
+ "grad_max_sv": 0.6870301708579063,
+ "grad_min_sv": 1.1020205989789069e-08,
+ "grad_condition": 2417926250.6670694,
+ "lr": 0.0009911436253643444,
+ "time_sec": 132.52283430099487
+ },
+ {
+ "epoch": 10,
+ "train_loss": 4.773616914978027,
+ "train_acc": 0.01062,
+ "test_loss": 4.874710052490235,
+ "test_acc": 0.01,
+ "lyapunov": 1.562704872292326,
+ "grad_norm": 0.6675097799983111,
+ "grad_max_sv": 0.5464496180415154,
+ "grad_min_sv": 7.172653980753015e-09,
+ "grad_condition": 20965681724.308956,
+ "lr": 0.0009890738003669028,
+ "time_sec": 132.5459840297699
+ },
+ {
+ "epoch": 11,
+ "train_loss": 4.773348721618652,
+ "train_acc": 0.01024,
+ "test_loss": 4.6200670059204105,
+ "test_acc": 0.01,
+ "lyapunov": 1.562029262637848,
+ "grad_norm": 0.5488543058826973,
+ "grad_max_sv": 0.4311558365821838,
+ "grad_min_sv": 2.9074530078217566e-09,
+ "grad_condition": 49435903159.65074,
+ "lr": 0.00098678945143658,
+ "time_sec": 132.52372455596924
+ },
+ {
+ "epoch": 12,
+ "train_loss": 4.780688554229736,
+ "train_acc": 0.01046,
+ "test_loss": 4.7990555023193355,
+ "test_acc": 0.01,
+ "lyapunov": 1.557410420359248,
+ "grad_norm": 0.39735835708243683,
+ "grad_max_sv": 0.29783011190593245,
+ "grad_min_sv": 2.955632668999543e-10,
+ "grad_condition": 137320228990.74185,
+ "lr": 0.0009842915805643154,
+ "time_sec": 132.52459120750427
+ },
+ {
+ "epoch": 13,
+ "train_loss": 4.794568827362061,
+ "train_acc": 0.00944,
+ "test_loss": 4.6620225440979,
+ "test_acc": 0.01,
+ "lyapunov": 1.5579908677684071,
+ "grad_norm": 0.3760550232574214,
+ "grad_max_sv": 0.27942878790199754,
+ "grad_min_sv": 7.445462603040203e-10,
+ "grad_condition": 105013083205.519,
+ "lr": 0.000981581283398829,
+ "time_sec": 132.5209527015686
+ },
+ {
+ "epoch": 14,
+ "train_loss": 4.809564754486084,
+ "train_acc": 0.00862,
+ "test_loss": 4.655567189025879,
+ "test_acc": 0.01,
+ "lyapunov": 1.571449481007998,
+ "grad_norm": 0.33124516886493516,
+ "grad_max_sv": 0.21216185558587314,
+ "grad_min_sv": 5.858595327667813e-10,
+ "grad_condition": 110751878933.28384,
+ "lr": 0.0009786597487660333,
+ "time_sec": 132.577819108963
+ },
+ {
+ "epoch": 15,
+ "train_loss": 4.816427656860352,
+ "train_acc": 0.00936,
+ "test_loss": 4.6545363082885745,
+ "test_acc": 0.01,
+ "lyapunov": 1.5565597386006504,
+ "grad_norm": 0.2791973343426611,
+ "grad_max_sv": 0.1684179350733757,
+ "grad_min_sv": 6.917982259102923e-13,
+ "grad_condition": 127223674978.58926,
+ "lr": 0.0009755282581475766,
+ "time_sec": 132.58430194854736
+ },
+ {
+ "epoch": 16,
+ "train_loss": 4.829237567138672,
+ "train_acc": 0.00908,
+ "test_loss": 4.629003553771972,
+ "test_acc": 0.01,
+ "lyapunov": 1.5557427775219579,
+ "grad_norm": 0.2712716184485074,
+ "grad_max_sv": 0.1436759451404214,
+ "grad_min_sv": 3.50392380214562e-13,
+ "grad_condition": 118193912798.78633,
+ "lr": 0.0009721881851187403,
+ "time_sec": 132.49679327011108
+ },
+ {
+ "epoch": 17,
+ "train_loss": 4.842587297058105,
+ "train_acc": 0.00944,
+ "test_loss": 4.633112139892578,
+ "test_acc": 0.01,
+ "lyapunov": 1.554307114742601,
+ "grad_norm": 0.26245775185719383,
+ "grad_max_sv": 0.140065660700202,
+ "grad_min_sv": 2.6676405041443376e-15,
+ "grad_condition": 139703664535.0272,
+ "lr": 0.0009686409947459456,
+ "time_sec": 132.52488541603088
+ },
+ {
+ "epoch": 18,
+ "train_loss": 4.85334480545044,
+ "train_acc": 0.0098,
+ "test_loss": 4.6145305236816405,
+ "test_acc": 0.01,
+ "lyapunov": 1.5502319726187859,
+ "grad_norm": 0.20648576741983057,
+ "grad_max_sv": 0.11613305620849132,
+ "grad_min_sv": 2.4641309551932607e-14,
+ "grad_condition": 112456376406.20891,
+ "lr": 0.0009648882429441254,
+ "time_sec": 132.53546261787415
+ },
+ {
+ "epoch": 19,
+ "train_loss": 4.8756606997680665,
+ "train_acc": 0.00972,
+ "test_loss": 4.63894914932251,
+ "test_acc": 0.01,
+ "lyapunov": 1.5529851959184613,
+ "grad_norm": 0.29909579690838006,
+ "grad_max_sv": 0.2365069929510355,
+ "grad_min_sv": 8.824648532682828e-14,
+ "grad_condition": 223546987940.7954,
+ "lr": 0.00096093157579425,
+ "time_sec": 132.5408227443695
+ },
+ {
+ "epoch": 20,
+ "train_loss": 4.8827299949646,
+ "train_acc": 0.01024,
+ "test_loss": 4.622587729644775,
+ "test_acc": 0.01,
+ "lyapunov": 1.556399286555512,
+ "grad_norm": 0.15272550856176187,
+ "grad_max_sv": 0.08741383519954979,
+ "grad_min_sv": 8.699695565641333e-15,
+ "grad_condition": 85913025020.82304,
+ "lr": 0.0009567727288213001,
+ "time_sec": 132.51366233825684
+ },
+ {
+ "epoch": 21,
+ "train_loss": 4.884711999969483,
+ "train_acc": 0.00998,
+ "test_loss": 4.606764881896972,
+ "test_acc": 0.01,
+ "lyapunov": 1.5493811259184347,
+ "grad_norm": 0.2280734728397927,
+ "grad_max_sv": 0.17737758290022612,
+ "grad_min_sv": 1.7983389117226294e-14,
+ "grad_condition": 174310016585.06476,
+ "lr": 0.0009524135262330095,
+ "time_sec": 132.5240728855133
+ },
+ {
+ "epoch": 22,
+ "train_loss": 4.88518779006958,
+ "train_acc": 0.00898,
+ "test_loss": 4.625405541229248,
+ "test_acc": 0.01,
+ "lyapunov": 1.5538233515551634,
+ "grad_norm": 0.21224774170023955,
+ "grad_max_sv": 0.15938115157186986,
+ "grad_min_sv": 3.1749157935371154e-14,
+ "grad_condition": 154547913667.9044,
+ "lr": 0.0009478558801197061,
+ "time_sec": 132.49090003967285
+ },
+ {
+ "epoch": 23,
+ "train_loss": 4.87999728149414,
+ "train_acc": 0.01018,
+ "test_loss": 4.662280471801758,
+ "test_acc": 0.01,
+ "lyapunov": 1.5508448772723107,
+ "grad_norm": 0.15119163863092763,
+ "grad_max_sv": 0.08865232784301043,
+ "grad_min_sv": 7.005994597272193e-16,
+ "grad_condition": 88575401119.44853,
+ "lr": 0.000943101789615607,
+ "time_sec": 132.47974038124084
+ },
+ {
+ "epoch": 24,
+ "train_loss": 4.881147270202637,
+ "train_acc": 0.00976,
+ "test_loss": 4.615948718261719,
+ "test_acc": 0.01,
+ "lyapunov": 1.5512399081988713,
+ "grad_norm": 0.15770676446584825,
+ "grad_max_sv": 0.10294295214116574,
+ "grad_min_sv": 5.7741339454657465e-15,
+ "grad_condition": 102285384766.49887,
+ "lr": 0.0009381533400219313,
+ "time_sec": 132.52317762374878
+ },
+ {
+ "epoch": 25,
+ "train_loss": 4.880569260253906,
+ "train_acc": 0.00984,
+ "test_loss": 4.610492027282715,
+ "test_acc": 0.01,
+ "lyapunov": 1.5512746035900262,
+ "grad_norm": 0.14554815906091484,
+ "grad_max_sv": 0.08865004125982523,
+ "grad_min_sv": 2.6778839672578997e-16,
+ "grad_condition": 88627301882.68987,
+ "lr": 0.0009330127018922189,
+ "time_sec": 132.56079196929932
+ },
+ {
+ "epoch": 26,
+ "train_loss": 4.881224513397217,
+ "train_acc": 0.01002,
+ "test_loss": 4.747660410308838,
+ "test_acc": 0.01,
+ "lyapunov": 1.5542162702516522,
+ "grad_norm": 0.1391562981495577,
+ "grad_max_sv": 0.08203545394353569,
+ "grad_min_sv": 2.822381678288234e-15,
+ "grad_condition": 81722256507.78954,
+ "lr": 0.000927682130080253,
+ "time_sec": 132.5239975452423
+ },
+ {
+ "epoch": 27,
+ "train_loss": 4.881258678741455,
+ "train_acc": 0.0098,
+ "test_loss": 4.790026293182373,
+ "test_acc": 0.01,
+ "lyapunov": 1.5510657614149401,
+ "grad_norm": 0.14725967817424349,
+ "grad_max_sv": 0.09194991793483495,
+ "grad_min_sv": 4.568772527401975e-15,
+ "grad_condition": 91398390464.57925,
+ "lr": 0.0009221639627510072,
+ "time_sec": 132.526837348938
+ },
+ {
+ "epoch": 28,
+ "train_loss": 4.880898860931397,
+ "train_acc": 0.0102,
+ "test_loss": 4.802646064758301,
+ "test_acc": 0.01,
+ "lyapunov": 1.5514030862037482,
+ "grad_norm": 0.14347689217252269,
+ "grad_max_sv": 0.09245897587388754,
+ "grad_min_sv": 1.0843861076282981e-15,
+ "grad_condition": 92342187840.9415,
+ "lr": 0.0009164606203550494,
+ "time_sec": 132.5042200088501
+ },
+ {
+ "epoch": 29,
+ "train_loss": 4.880448774719238,
+ "train_acc": 0.01046,
+ "test_loss": 4.7516579360961915,
+ "test_acc": 0.01,
+ "lyapunov": 1.5519556474807623,
+ "grad_norm": 0.13309334546952373,
+ "grad_max_sv": 0.08154573319479823,
+ "grad_min_sv": 9.282067880476938e-16,
+ "grad_condition": 81454842058.19734,
+ "lr": 0.0009105746045668516,
+ "time_sec": 132.52633500099182
+ },
+ {
+ "epoch": 30,
+ "train_loss": 4.883071630401611,
+ "train_acc": 0.00954,
+ "test_loss": 4.771951943206787,
+ "test_acc": 0.01,
+ "lyapunov": 1.554316602399587,
+ "grad_norm": 0.14789859288021653,
+ "grad_max_sv": 0.09579872786998749,
+ "grad_min_sv": 3.051331237308755e-15,
+ "grad_condition": 95468711969.6211,
+ "lr": 0.0009045084971874733,
+ "time_sec": 132.5885534286499
+ },
+ {
+ "epoch": 31,
+ "train_loss": 4.881176261901856,
+ "train_acc": 0.00888,
+ "test_loss": 4.774106753540039,
+ "test_acc": 0.01,
+ "lyapunov": 1.5536001310933887,
+ "grad_norm": 0.13112482323923252,
+ "grad_max_sv": 0.07564891651272773,
+ "grad_min_sv": 2.107048715412855e-15,
+ "grad_condition": 75454097088.2188,
+ "lr": 0.0008982649590120977,
+ "time_sec": 132.49479031562805
+ },
+ {
+ "epoch": 32,
+ "train_loss": 4.880477762145996,
+ "train_acc": 0.00962,
+ "test_loss": 4.746245973968506,
+ "test_acc": 0.01,
+ "lyapunov": 1.5537874387658162,
+ "grad_norm": 0.12461403839681509,
+ "grad_max_sv": 0.062327271420508625,
+ "grad_min_sv": 1.0725391843424482e-20,
+ "grad_condition": 62327270693.35764,
+ "lr": 0.0008918467286629196,
+ "time_sec": 132.4852647781372
+ },
+ {
+ "epoch": 33,
+ "train_loss": 4.881243226470947,
+ "train_acc": 0.00888,
+ "test_loss": 4.736703532409668,
+ "test_acc": 0.01,
+ "lyapunov": 1.556170121788064,
+ "grad_norm": 0.1148317700659679,
+ "grad_max_sv": 0.05345285767689347,
+ "grad_min_sv": 0.0,
+ "grad_condition": 53452857676.89348,
+ "lr": 0.0008852566213878943,
+ "time_sec": 132.53890919685364
+ },
+ {
+ "epoch": 34,
+ "train_loss": 4.881585180969238,
+ "train_acc": 0.01008,
+ "test_loss": 4.703427969360352,
+ "test_acc": 0.01,
+ "lyapunov": 1.5578572292766912,
+ "grad_norm": 0.11335239335552806,
+ "grad_max_sv": 0.052668086066842076,
+ "grad_min_sv": 0.0,
+ "grad_condition": 52668086066.84208,
+ "lr": 0.000878497527825878,
+ "time_sec": 132.64637637138367
+ },
+ {
+ "epoch": 35,
+ "train_loss": 4.882511229858398,
+ "train_acc": 0.0097,
+ "test_loss": 4.681371363830566,
+ "test_acc": 0.01,
+ "lyapunov": 1.5592110135671122,
+ "grad_norm": 0.12058968555924836,
+ "grad_max_sv": 0.06217097630724311,
+ "grad_min_sv": 0.0,
+ "grad_condition": 62170976307.2431,
+ "lr": 0.000871572412738697,
+ "time_sec": 132.43680119514465
+ },
+ {
+ "epoch": 36,
+ "train_loss": 4.881192719268799,
+ "train_acc": 0.00946,
+ "test_loss": 4.697506471252441,
+ "test_acc": 0.01,
+ "lyapunov": 1.5561128973655993,
+ "grad_norm": 0.11655881819882306,
+ "grad_max_sv": 0.058859458193182945,
+ "grad_min_sv": 8.230737425630695e-40,
+ "grad_condition": 58859458193.182945,
+ "lr": 0.0008644843137107055,
+ "time_sec": 132.4848039150238
+ },
+ {
+ "epoch": 37,
+ "train_loss": 4.8825209786987305,
+ "train_acc": 0.00972,
+ "test_loss": 4.694917836761475,
+ "test_acc": 0.01,
+ "lyapunov": 1.5584492564506238,
+ "grad_norm": 0.13341533833277566,
+ "grad_max_sv": 0.07657676143571734,
+ "grad_min_sv": 1.687390330982044e-16,
+ "grad_condition": 76560751213.82744,
+ "lr": 0.0008572363398164014,
+ "time_sec": 132.51812028884888
+ },
+ {
+ "epoch": 38,
+ "train_loss": 4.882141689910888,
+ "train_acc": 0.01016,
+ "test_loss": 4.688916626739502,
+ "test_acc": 0.01,
+ "lyapunov": 1.5593435761263914,
+ "grad_norm": 0.11853299040694154,
+ "grad_max_sv": 0.055678781820461154,
+ "grad_min_sv": 6.767910398009686e-40,
+ "grad_condition": 55678781820.46116,
+ "lr": 0.0008498316702566826,
+ "time_sec": 132.56456470489502
+ },
+ {
+ "epoch": 39,
+ "train_loss": 4.8832370683288575,
+ "train_acc": 0.01006,
+ "test_loss": 4.7038502136230465,
+ "test_acc": 0.01,
+ "lyapunov": 1.5620976924286474,
+ "grad_norm": 0.11941743088728123,
+ "grad_max_sv": 0.05502237342298031,
+ "grad_min_sv": 8.246841147582715e-40,
+ "grad_condition": 55022373422.9803,
+ "lr": 0.0008422735529643442,
+ "time_sec": 132.5043168067932
+ },
+ {
+ "epoch": 40,
+ "train_loss": 4.884805080718994,
+ "train_acc": 0.00916,
+ "test_loss": 4.710450775146485,
+ "test_acc": 0.01,
+ "lyapunov": 1.5655303751416219,
+ "grad_norm": 0.12619034606889276,
+ "grad_max_sv": 0.06059649083763361,
+ "grad_min_sv": 2.3062997125157342e-34,
+ "grad_condition": 60596490837.63362,
+ "lr": 0.0008345653031794289,
+ "time_sec": 132.5351688861847
+ },
+ {
+ "epoch": 41,
+ "train_loss": 4.886436430511474,
+ "train_acc": 0.00842,
+ "test_loss": 4.693475389099121,
+ "test_acc": 0.01,
+ "lyapunov": 1.566963563794675,
+ "grad_norm": 0.13196364661308996,
+ "grad_max_sv": 0.06961128637194633,
+ "grad_min_sv": 1.1737794876080507e-22,
+ "grad_condition": 69611286362.64899,
+ "lr": 0.0008267103019950526,
+ "time_sec": 132.51111769676208
+ },
+ {
+ "epoch": 42,
+ "train_loss": 4.882716519012451,
+ "train_acc": 0.00938,
+ "test_loss": 4.694032908630371,
+ "test_acc": 0.01,
+ "lyapunov": 1.5620074573990024,
+ "grad_norm": 0.11781162776823918,
+ "grad_max_sv": 0.046270584035664794,
+ "grad_min_sv": 0.0,
+ "grad_condition": 46270584035.664795,
+ "lr": 0.0008187119948743447,
+ "time_sec": 132.5160994529724
+ },
+ {
+ "epoch": 43,
+ "train_loss": 4.8821180502319335,
+ "train_acc": 0.00952,
+ "test_loss": 4.7027722869873045,
+ "test_acc": 0.01,
+ "lyapunov": 1.561017348638276,
+ "grad_norm": 0.11312831534529132,
+ "grad_max_sv": 0.04106818297877908,
+ "grad_min_sv": 0.0,
+ "grad_condition": 41068182978.77908,
+ "lr": 0.000810573890139155,
+ "time_sec": 132.5087025165558
+ },
+ {
+ "epoch": 44,
+ "train_loss": 4.883875316619873,
+ "train_acc": 0.00868,
+ "test_loss": 4.726299923706055,
+ "test_acc": 0.01,
+ "lyapunov": 1.5633756574767326,
+ "grad_norm": 0.12667296790156193,
+ "grad_max_sv": 0.0658588983118534,
+ "grad_min_sv": 1.0092078216956858e-18,
+ "grad_condition": 65858810617.60825,
+ "lr": 0.0008022995574311873,
+ "time_sec": 132.5128674507141
+ },
+ {
+ "epoch": 45,
+ "train_loss": 4.883541934661865,
+ "train_acc": 0.00932,
+ "test_loss": 4.7017227630615235,
+ "test_acc": 0.01,
+ "lyapunov": 1.5632145856042652,
+ "grad_norm": 0.12309109072630019,
+ "grad_max_sv": 0.05839173295535147,
+ "grad_min_sv": 3.503246160812043e-47,
+ "grad_condition": 58391732955.35146,
+ "lr": 0.0007938926261462363,
+ "time_sec": 132.53016304969788
+ },
+ {
+ "epoch": 46,
+ "train_loss": 4.888793373718261,
+ "train_acc": 0.00888,
+ "test_loss": 4.696292651367187,
+ "test_acc": 0.01,
+ "lyapunov": 1.5750811136592076,
+ "grad_norm": 0.13746736535152312,
+ "grad_max_sv": 0.058484140876680614,
+ "grad_min_sv": 0.0,
+ "grad_condition": 58484140876.68062,
+ "lr": 0.0007853567838422158,
+ "time_sec": 132.50724458694458
+ },
+ {
+ "epoch": 47,
+ "train_loss": 4.883440639190674,
+ "train_acc": 0.00972,
+ "test_loss": 4.701148196411133,
+ "test_acc": 0.01,
+ "lyapunov": 1.564275365351411,
+ "grad_norm": 0.12158899868830998,
+ "grad_max_sv": 0.05122774885967374,
+ "grad_min_sv": 0.0,
+ "grad_condition": 51227748859.673744,
+ "lr": 0.0007766957746216719,
+ "time_sec": 132.50299715995789
+ },
+ {
+ "epoch": 48,
+ "train_loss": 4.884719120330811,
+ "train_acc": 0.00906,
+ "test_loss": 4.729176859283447,
+ "test_acc": 0.01,
+ "lyapunov": 1.5687132698800557,
+ "grad_norm": 0.12254448404539135,
+ "grad_max_sv": 0.040120215015485884,
+ "grad_min_sv": 0.0,
+ "grad_condition": 40120215015.485886,
+ "lr": 0.0007679133974894982,
+ "time_sec": 132.46641159057617
+ },
+ {
+ "epoch": 49,
+ "train_loss": 4.884110562133789,
+ "train_acc": 0.00872,
+ "test_loss": 4.725056867980957,
+ "test_acc": 0.01,
+ "lyapunov": 1.5669305754439604,
+ "grad_norm": 0.1149187900499572,
+ "grad_max_sv": 0.03382976925931871,
+ "grad_min_sv": 0.0,
+ "grad_condition": 33829769259.318707,
+ "lr": 0.000759013504686565,
+ "time_sec": 132.51045417785645
+ },
+ {
+ "epoch": 50,
+ "train_loss": 4.883614390563965,
+ "train_acc": 0.00966,
+ "test_loss": 4.709762881469727,
+ "test_acc": 0.01,
+ "lyapunov": 1.566156323608535,
+ "grad_norm": 0.12258255087018385,
+ "grad_max_sv": 0.034629582427442074,
+ "grad_min_sv": 0.0,
+ "grad_condition": 34629582427.44206,
+ "lr": 0.0007499999999999998,
+ "time_sec": 132.5417709350586
+ },
+ {
+ "epoch": 51,
+ "train_loss": 4.8839620613098145,
+ "train_acc": 0.0093,
+ "test_loss": 4.6980411888122555,
+ "test_acc": 0.01,
+ "lyapunov": 1.5664365087323786,
+ "grad_norm": 0.13769170593996222,
+ "grad_max_sv": 0.04753138842061162,
+ "grad_min_sv": 0.0,
+ "grad_condition": 47531388420.61162,
+ "lr": 0.0007408768370508575,
+ "time_sec": 132.5473415851593
+ },
+ {
+ "epoch": 52,
+ "train_loss": 4.883951457366943,
+ "train_acc": 0.0097,
+ "test_loss": 4.7330233673095705,
+ "test_acc": 0.01,
+ "lyapunov": 1.5676923822563933,
+ "grad_norm": 0.12914534017358148,
+ "grad_max_sv": 0.03236106717959046,
+ "grad_min_sv": 0.0,
+ "grad_condition": 32361067179.590466,
+ "lr": 0.0007316480175599307,
+ "time_sec": 132.50377297401428
+ },
+ {
+ "epoch": 53,
+ "train_loss": 4.883413257293701,
+ "train_acc": 0.00908,
+ "test_loss": 4.7225365089416504,
+ "test_acc": 0.01,
+ "lyapunov": 1.5648496943666501,
+ "grad_norm": 0.1255861922278266,
+ "grad_max_sv": 0.04178534299135208,
+ "grad_min_sv": 0.0,
+ "grad_condition": 41785342991.35208,
+ "lr": 0.0007223175895924635,
+ "time_sec": 132.52618622779846
+ },
+ {
+ "epoch": 54,
+ "train_loss": 4.8835242868041995,
+ "train_acc": 0.00984,
+ "test_loss": 4.827378164672852,
+ "test_acc": 0.01,
+ "lyapunov": 1.5652363522888144,
+ "grad_norm": 0.11717740789911417,
+ "grad_max_sv": 0.04349024128168821,
+ "grad_min_sv": 0.0,
+ "grad_condition": 43490241281.68822,
+ "lr": 0.0007128896457825361,
+ "time_sec": 132.49181389808655
+ },
+ {
+ "epoch": 55,
+ "train_loss": 4.885148456573487,
+ "train_acc": 0.00938,
+ "test_loss": 4.805696286010742,
+ "test_acc": 0.01,
+ "lyapunov": 1.5694574946942537,
+ "grad_norm": 0.11719591784462954,
+ "grad_max_sv": 0.027647955063730478,
+ "grad_min_sv": 0.0,
+ "grad_condition": 27647955063.73048,
+ "lr": 0.0007033683215378998,
+ "time_sec": 132.4630925655365
+ },
+ {
+ "epoch": 56,
+ "train_loss": 4.8840925729370115,
+ "train_acc": 0.00916,
+ "test_loss": 4.817810218048096,
+ "test_acc": 0.01,
+ "lyapunov": 1.5679599275369474,
+ "grad_norm": 0.10763202558448146,
+ "grad_max_sv": 0.024515782250091434,
+ "grad_min_sv": 0.0,
+ "grad_condition": 24515782250.09143,
+ "lr": 0.0006937577932260512,
+ "time_sec": 132.42955470085144
+ },
+ {
+ "epoch": 57,
+ "train_loss": 4.883760057678223,
+ "train_acc": 0.0095,
+ "test_loss": 4.856276947784424,
+ "test_acc": 0.01,
+ "lyapunov": 1.5672943607315688,
+ "grad_norm": 0.11038524447317109,
+ "grad_max_sv": 0.031160860368981958,
+ "grad_min_sv": 0.0,
+ "grad_condition": 31160860368.981956,
+ "lr": 0.0006840622763423388,
+ "time_sec": 132.52315950393677
+ },
+ {
+ "epoch": 58,
+ "train_loss": 4.884222667388916,
+ "train_acc": 0.00974,
+ "test_loss": 4.874290851593018,
+ "test_acc": 0.01,
+ "lyapunov": 1.567508033779271,
+ "grad_norm": 0.11849561013061653,
+ "grad_max_sv": 0.03593655498698354,
+ "grad_min_sv": 0.0,
+ "grad_condition": 35936554986.983536,
+ "lr": 0.0006742860236609073,
+ "time_sec": 132.47893905639648
+ },
+ {
+ "epoch": 59,
+ "train_loss": 4.88414927734375,
+ "train_acc": 0.00932,
+ "test_loss": 4.812584387207031,
+ "test_acc": 0.01,
+ "lyapunov": 1.5678569962606406,
+ "grad_norm": 0.11036912590820531,
+ "grad_max_sv": 0.028424020344391464,
+ "grad_min_sv": 0.0,
+ "grad_condition": 28424020344.391468,
+ "lr": 0.0006644333233692913,
+ "time_sec": 132.4449987411499
+ },
+ {
+ "epoch": 60,
+ "train_loss": 4.8860119464111325,
+ "train_acc": 0.00866,
+ "test_loss": 4.839297940826416,
+ "test_acc": 0.01,
+ "lyapunov": 1.5727104262622726,
+ "grad_norm": 0.12489417029089354,
+ "grad_max_sv": 0.0449837657622993,
+ "grad_min_sv": 0.0,
+ "grad_condition": 44983765762.2993,
+ "lr": 0.0006545084971874734,
+ "time_sec": 132.52293181419373
+ },
+ {
+ "epoch": 61,
+ "train_loss": 4.884305205383301,
+ "train_acc": 0.01046,
+ "test_loss": 4.857601212310791,
+ "test_acc": 0.01,
+ "lyapunov": 1.5686972680908944,
+ "grad_norm": 0.11135287490998455,
+ "grad_max_sv": 0.04157614354044199,
+ "grad_min_sv": 0.0,
+ "grad_condition": 41576143540.44199,
+ "lr": 0.0006445158984722354,
+ "time_sec": 132.51698970794678
+ },
+ {
+ "epoch": 62,
+ "train_loss": 4.884398639678955,
+ "train_acc": 0.00944,
+ "test_loss": 4.833207711791992,
+ "test_acc": 0.01,
+ "lyapunov": 1.5687918172163122,
+ "grad_norm": 0.11243013251101783,
+ "grad_max_sv": 0.043204908631742,
+ "grad_min_sv": 0.0,
+ "grad_condition": 43204908631.742004,
+ "lr": 0.0006344599103076324,
+ "time_sec": 132.51721620559692
+ },
+ {
+ "epoch": 63,
+ "train_loss": 4.884688519744873,
+ "train_acc": 0.00908,
+ "test_loss": 4.811236346435547,
+ "test_acc": 0.01,
+ "lyapunov": 1.570080169326509,
+ "grad_norm": 0.11662661682539925,
+ "grad_max_sv": 0.02772782016545534,
+ "grad_min_sv": 0.0,
+ "grad_condition": 27727820165.455345,
+ "lr": 0.0006243449435824269,
+ "time_sec": 132.50267052650452
+ },
+ {
+ "epoch": 64,
+ "train_loss": 4.8855357188415525,
+ "train_acc": 0.0096,
+ "test_loss": 4.834980075073243,
+ "test_acc": 0.01,
+ "lyapunov": 1.5721226451951829,
+ "grad_norm": 0.12180207356240787,
+ "grad_max_sv": 0.013557582441717387,
+ "grad_min_sv": 0.0,
+ "grad_condition": 13557582441.717386,
+ "lr": 0.0006141754350553275,
+ "time_sec": 132.6969666481018
+ },
+ {
+ "epoch": 65,
+ "train_loss": 4.884502696838379,
+ "train_acc": 0.00962,
+ "test_loss": 4.815651828765869,
+ "test_acc": 0.01,
+ "lyapunov": 1.5692061444987422,
+ "grad_norm": 0.13731619014897972,
+ "grad_max_sv": 0.036923335213214156,
+ "grad_min_sv": 0.0,
+ "grad_condition": 36923335213.21416,
+ "lr": 0.0006039558454088793,
+ "time_sec": 132.4734799861908
+ },
+ {
+ "epoch": 66,
+ "train_loss": 4.88990579711914,
+ "train_acc": 0.00978,
+ "test_loss": 4.791162698364258,
+ "test_acc": 0.01,
+ "lyapunov": 1.581291075862582,
+ "grad_norm": 0.14075282121769883,
+ "grad_max_sv": 0.039619889203459026,
+ "grad_min_sv": 0.0,
+ "grad_condition": 39619889203.45903,
+ "lr": 0.000593690657292862,
+ "time_sec": 132.52782583236694
+ },
+ {
+ "epoch": 67,
+ "train_loss": 4.888191639251709,
+ "train_acc": 0.00998,
+ "test_loss": 4.805363137054443,
+ "test_acc": 0.01,
+ "lyapunov": 1.5781969777153582,
+ "grad_norm": 0.11852732787787948,
+ "grad_max_sv": 0.03636179021559656,
+ "grad_min_sv": 0.0,
+ "grad_condition": 36361790215.59656,
+ "lr": 0.0005833843733580507,
+ "time_sec": 132.50655126571655
+ },
+ {
+ "epoch": 68,
+ "train_loss": 4.885113808746338,
+ "train_acc": 0.0092,
+ "test_loss": 4.790876692962646,
+ "test_acc": 0.01,
+ "lyapunov": 1.5712030659551206,
+ "grad_norm": 0.11464904106569235,
+ "grad_max_sv": 0.02942234524525702,
+ "grad_min_sv": 0.0,
+ "grad_condition": 29422345245.25702,
+ "lr": 0.0005730415142812054,
+ "time_sec": 132.44155955314636
+ },
+ {
+ "epoch": 69,
+ "train_loss": 4.886073732910156,
+ "train_acc": 0.00874,
+ "test_loss": 4.788568280029297,
+ "test_acc": 0.01,
+ "lyapunov": 1.5744608549205847,
+ "grad_norm": 0.11158557694696751,
+ "grad_max_sv": 0.004607879696413875,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4607879696.413875,
+ "lr": 0.0005626666167821517,
+ "time_sec": 132.44937348365784
+ },
+ {
+ "epoch": 70,
+ "train_loss": 4.885406183319092,
+ "train_acc": 0.00988,
+ "test_loss": 4.791419393157959,
+ "test_acc": 0.01,
+ "lyapunov": 1.5723789460823665,
+ "grad_norm": 0.1093341588876136,
+ "grad_max_sv": 0.013379927957430482,
+ "grad_min_sv": 0.0,
+ "grad_condition": 13379927957.430483,
+ "lr": 0.0005522642316338265,
+ "time_sec": 132.44818544387817
+ },
+ {
+ "epoch": 71,
+ "train_loss": 4.885112988128662,
+ "train_acc": 0.00898,
+ "test_loss": 4.807086729431153,
+ "test_acc": 0.01,
+ "lyapunov": 1.5718346922598836,
+ "grad_norm": 0.12168415122862028,
+ "grad_max_sv": 0.014193862210959196,
+ "grad_min_sv": 0.0,
+ "grad_condition": 14193862210.959198,
+ "lr": 0.0005418389216661573,
+ "time_sec": 132.46469593048096
+ },
+ {
+ "epoch": 72,
+ "train_loss": 4.888309308624268,
+ "train_acc": 0.00942,
+ "test_loss": 4.786458195495605,
+ "test_acc": 0.01,
+ "lyapunov": 1.5786126913012142,
+ "grad_norm": 0.1257472430943546,
+ "grad_max_sv": 0.00992818851955235,
+ "grad_min_sv": 0.0,
+ "grad_condition": 9928188519.55235,
+ "lr": 0.0005313952597646563,
+ "time_sec": 132.4868745803833
+ },
+ {
+ "epoch": 73,
+ "train_loss": 4.8883187344360355,
+ "train_acc": 0.01008,
+ "test_loss": 4.763764072418213,
+ "test_acc": 0.01,
+ "lyapunov": 1.5783945306792588,
+ "grad_norm": 0.16063770590325258,
+ "grad_max_sv": 0.02905639265663922,
+ "grad_min_sv": 0.0,
+ "grad_condition": 29056392656.63922,
+ "lr": 0.0005209378268645994,
+ "time_sec": 132.40988731384277
+ },
+ {
+ "epoch": 74,
+ "train_loss": 4.885095281524658,
+ "train_acc": 0.00904,
+ "test_loss": 4.771036297607422,
+ "test_acc": 0.01,
+ "lyapunov": 1.5722466762108571,
+ "grad_norm": 0.332703681561214,
+ "grad_max_sv": 0.009321404900401831,
+ "grad_min_sv": 0.0,
+ "grad_condition": 9321404900.40183,
+ "lr": 0.0005104712099416781,
+ "time_sec": 132.41944670677185
+ },
+ {
+ "epoch": 75,
+ "train_loss": 4.8858135334777835,
+ "train_acc": 0.00924,
+ "test_loss": 4.7793162803649905,
+ "test_acc": 0.01,
+ "lyapunov": 1.573599765367825,
+ "grad_norm": 0.3785245081976868,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004999999999999996,
+ "time_sec": 132.43439865112305
+ },
+ {
+ "epoch": 76,
+ "train_loss": 4.885755948486328,
+ "train_acc": 0.00894,
+ "test_loss": 4.775339208984375,
+ "test_acc": 0.01,
+ "lyapunov": 1.5738494380965562,
+ "grad_norm": 0.26809830726413736,
+ "grad_max_sv": 0.00972625520080328,
+ "grad_min_sv": 0.0,
+ "grad_condition": 9726255200.80328,
+ "lr": 0.0004895287900583212,
+ "time_sec": 132.4453580379486
+ },
+ {
+ "epoch": 77,
+ "train_loss": 4.886971358032227,
+ "train_acc": 0.0088,
+ "test_loss": 4.780246302032471,
+ "test_acc": 0.01,
+ "lyapunov": 1.576519505447134,
+ "grad_norm": 0.5857000867492739,
+ "grad_max_sv": 0.015286983083933591,
+ "grad_min_sv": 0.0,
+ "grad_condition": 15286983083.933594,
+ "lr": 0.0004790621731353997,
+ "time_sec": 132.4340922832489
+ },
+ {
+ "epoch": 78,
+ "train_loss": 4.8857606088256835,
+ "train_acc": 0.00878,
+ "test_loss": 4.796332804870605,
+ "test_acc": 0.01,
+ "lyapunov": 1.574093949764281,
+ "grad_norm": 0.19474925059694603,
+ "grad_max_sv": 0.007740102289244532,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7740102289.244532,
+ "lr": 0.000468604740235343,
+ "time_sec": 132.4252007007599
+ },
+ {
+ "epoch": 79,
+ "train_loss": 4.8854332868957515,
+ "train_acc": 0.00904,
+ "test_loss": 4.7431994110107425,
+ "test_acc": 0.01,
+ "lyapunov": 1.5728687746140657,
+ "grad_norm": 0.2002833929164076,
+ "grad_max_sv": 0.018612090731039643,
+ "grad_min_sv": 0.0,
+ "grad_condition": 18612090731.039646,
+ "lr": 0.00045816107833384175,
+ "time_sec": 132.41635990142822
+ },
+ {
+ "epoch": 80,
+ "train_loss": 4.88607871963501,
+ "train_acc": 0.00908,
+ "test_loss": 4.782230687713623,
+ "test_acc": 0.01,
+ "lyapunov": 1.5748912559445862,
+ "grad_norm": 0.2663292726664251,
+ "grad_max_sv": 0.0006320734973996878,
+ "grad_min_sv": 0.0,
+ "grad_condition": 632073497.3996878,
+ "lr": 0.0004477357683661729,
+ "time_sec": 132.3943703174591
+ },
+ {
+ "epoch": 81,
+ "train_loss": 4.885633817596435,
+ "train_acc": 0.00894,
+ "test_loss": 4.773731129455566,
+ "test_acc": 0.01,
+ "lyapunov": 1.5739493342616675,
+ "grad_norm": 0.19467627817910108,
+ "grad_max_sv": 0.004234243137761951,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4234243137.7619505,
+ "lr": 0.00043733338321784746,
+ "time_sec": 132.42148518562317
+ },
+ {
+ "epoch": 82,
+ "train_loss": 4.890183934631348,
+ "train_acc": 0.00922,
+ "test_loss": 4.80019803237915,
+ "test_acc": 0.01,
+ "lyapunov": 1.58174940356818,
+ "grad_norm": 0.2693904362677404,
+ "grad_max_sv": 0.023508542357012628,
+ "grad_min_sv": 0.0,
+ "grad_condition": 23508542357.01263,
+ "lr": 0.0004269584857187939,
+ "time_sec": 132.48368287086487
+ },
+ {
+ "epoch": 83,
+ "train_loss": 4.887686183624267,
+ "train_acc": 0.00988,
+ "test_loss": 4.6776658203125,
+ "test_acc": 0.01,
+ "lyapunov": 1.574008427922378,
+ "grad_norm": 0.2293228968062561,
+ "grad_max_sv": 0.06707085431553424,
+ "grad_min_sv": 5.322572622808566e-16,
+ "grad_condition": 67002509647.244484,
+ "lr": 0.0004166156266419484,
+ "time_sec": 132.49965047836304
+ },
+ {
+ "epoch": 84,
+ "train_loss": 4.887849067077637,
+ "train_acc": 0.01004,
+ "test_loss": 4.733781813049316,
+ "test_acc": 0.01,
+ "lyapunov": 1.573820165356102,
+ "grad_norm": 0.14901481902367925,
+ "grad_max_sv": 0.09299901695922017,
+ "grad_min_sv": 1.6405075679230025e-16,
+ "grad_condition": 92982403383.72546,
+ "lr": 0.0004063093427071373,
+ "time_sec": 132.49851322174072
+ },
+ {
+ "epoch": 85,
+ "train_loss": 4.891140226135254,
+ "train_acc": 0.00994,
+ "test_loss": 4.79980509262085,
+ "test_acc": 0.01,
+ "lyapunov": 1.5841534381632305,
+ "grad_norm": 0.14782164130887582,
+ "grad_max_sv": 0.07909845747053623,
+ "grad_min_sv": 4.4865151314265836e-26,
+ "grad_condition": 79098457470.53198,
+ "lr": 0.0003960441545911199,
+ "time_sec": 132.5316731929779
+ },
+ {
+ "epoch": 86,
+ "train_loss": 4.887021747589111,
+ "train_acc": 0.00944,
+ "test_loss": 4.776346062469482,
+ "test_acc": 0.01,
+ "lyapunov": 1.5762594874252749,
+ "grad_norm": 0.12848068900948553,
+ "grad_max_sv": 0.05206927340477705,
+ "grad_min_sv": 0.0,
+ "grad_condition": 52069273404.777054,
+ "lr": 0.0003858245649446718,
+ "time_sec": 132.53142595291138
+ },
+ {
+ "epoch": 87,
+ "train_loss": 4.889097787322998,
+ "train_acc": 0.00868,
+ "test_loss": 4.707060712432861,
+ "test_acc": 0.01,
+ "lyapunov": 1.5793669498180185,
+ "grad_norm": 0.1548551396628501,
+ "grad_max_sv": 0.07543672090396285,
+ "grad_min_sv": 1.994722925254039e-23,
+ "grad_condition": 75436720902.41975,
+ "lr": 0.00037565505641757235,
+ "time_sec": 132.56474471092224
+ },
+ {
+ "epoch": 88,
+ "train_loss": 4.887517103881836,
+ "train_acc": 0.00934,
+ "test_loss": 4.697494779968261,
+ "test_acc": 0.01,
+ "lyapunov": 1.5769202114675966,
+ "grad_norm": 0.12499428379004662,
+ "grad_max_sv": 0.06417224258184433,
+ "grad_min_sv": 3.819406582541987e-27,
+ "grad_condition": 64172242581.844055,
+ "lr": 0.00036554008969236695,
+ "time_sec": 132.5758376121521
+ },
+ {
+ "epoch": 89,
+ "train_loss": 4.889558787384034,
+ "train_acc": 0.00908,
+ "test_loss": 4.738901914978027,
+ "test_acc": 0.01,
+ "lyapunov": 1.5814725813048576,
+ "grad_norm": 0.1259682508249713,
+ "grad_max_sv": 0.05729179736226797,
+ "grad_min_sv": 0.0,
+ "grad_condition": 57291797362.26797,
+ "lr": 0.0003554841015277638,
+ "time_sec": 132.55631971359253
+ },
+ {
+ "epoch": 90,
+ "train_loss": 4.887118022155762,
+ "train_acc": 0.00926,
+ "test_loss": 4.745434680175781,
+ "test_acc": 0.01,
+ "lyapunov": 1.57591240881654,
+ "grad_norm": 0.12675049544335418,
+ "grad_max_sv": 0.0551216053776443,
+ "grad_min_sv": 0.0,
+ "grad_condition": 55121605377.64431,
+ "lr": 0.000345491502812526,
+ "time_sec": 132.52520608901978
+ },
+ {
+ "epoch": 91,
+ "train_loss": 4.886403057098389,
+ "train_acc": 0.01032,
+ "test_loss": 4.728809788513184,
+ "test_acc": 0.01,
+ "lyapunov": 1.575149437045807,
+ "grad_norm": 0.12166328349782148,
+ "grad_max_sv": 0.04358728057704866,
+ "grad_min_sv": 0.0,
+ "grad_condition": 43587280577.04866,
+ "lr": 0.0003355666766307081,
+ "time_sec": 132.5356101989746
+ },
+ {
+ "epoch": 92,
+ "train_loss": 4.886422184295654,
+ "train_acc": 0.00926,
+ "test_loss": 4.738454541015625,
+ "test_acc": 0.01,
+ "lyapunov": 1.5745899811425172,
+ "grad_norm": 0.11920532388570855,
+ "grad_max_sv": 0.05519997598603368,
+ "grad_min_sv": 0.0,
+ "grad_condition": 55199975986.033676,
+ "lr": 0.00032571397633909225,
+ "time_sec": 132.55407977104187
+ },
+ {
+ "epoch": 93,
+ "train_loss": 4.886163410339355,
+ "train_acc": 0.00948,
+ "test_loss": 4.729941507720947,
+ "test_acc": 0.01,
+ "lyapunov": 1.5739426192115336,
+ "grad_norm": 0.13075040975965602,
+ "grad_max_sv": 0.051908688899129626,
+ "grad_min_sv": 0.0,
+ "grad_condition": 51908688899.12963,
+ "lr": 0.00031593772365766094,
+ "time_sec": 132.55454182624817
+ },
+ {
+ "epoch": 94,
+ "train_loss": 4.889471523284912,
+ "train_acc": 0.00938,
+ "test_loss": 4.726048579406738,
+ "test_acc": 0.01,
+ "lyapunov": 1.5820539750711387,
+ "grad_norm": 0.13111792932705457,
+ "grad_max_sv": 0.04076082408428192,
+ "grad_min_sv": 0.0,
+ "grad_condition": 40760824084.28192,
+ "lr": 0.0003062422067739483,
+ "time_sec": 132.50855350494385
+ },
+ {
+ "epoch": 95,
+ "train_loss": 4.886597353057861,
+ "train_acc": 0.00966,
+ "test_loss": 4.721816172790527,
+ "test_acc": 0.01,
+ "lyapunov": 1.5761216878890991,
+ "grad_norm": 0.10242530878744271,
+ "grad_max_sv": 0.018115377286449075,
+ "grad_min_sv": 0.0,
+ "grad_condition": 18115377286.449074,
+ "lr": 0.00029663167846209965,
+ "time_sec": 132.52085852622986
+ },
+ {
+ "epoch": 96,
+ "train_loss": 4.8871041314697266,
+ "train_acc": 0.00878,
+ "test_loss": 4.708365040588379,
+ "test_acc": 0.01,
+ "lyapunov": 1.5773879777440025,
+ "grad_norm": 0.11832202769749675,
+ "grad_max_sv": 0.01925608702003956,
+ "grad_min_sv": 0.0,
+ "grad_condition": 19256087020.03956,
+ "lr": 0.00028711035421746345,
+ "time_sec": 132.48231029510498
+ },
+ {
+ "epoch": 97,
+ "train_loss": 4.885575797424316,
+ "train_acc": 0.00956,
+ "test_loss": 4.758969999694824,
+ "test_acc": 0.01,
+ "lyapunov": 1.5739980253112285,
+ "grad_norm": 0.102958848729015,
+ "grad_max_sv": 0.00836998880840838,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8369988808.4083805,
+ "lr": 0.00027768241040753615,
+ "time_sec": 132.4623761177063
+ },
+ {
+ "epoch": 98,
+ "train_loss": 4.885688443298339,
+ "train_acc": 0.00946,
+ "test_loss": 4.7685779739379885,
+ "test_acc": 0.01,
+ "lyapunov": 1.5737464616975516,
+ "grad_norm": 0.11414360687104802,
+ "grad_max_sv": 0.033959317160770296,
+ "grad_min_sv": 0.0,
+ "grad_condition": 33959317160.770294,
+ "lr": 0.00026835198244006903,
+ "time_sec": 132.65263080596924
+ },
+ {
+ "epoch": 99,
+ "train_loss": 4.888634443054199,
+ "train_acc": 0.00974,
+ "test_loss": 4.754720726013184,
+ "test_acc": 0.01,
+ "lyapunov": 1.5796314081572511,
+ "grad_norm": 0.11056614929218114,
+ "grad_max_sv": 0.034730975748971105,
+ "grad_min_sv": 0.0,
+ "grad_condition": 34730975748.9711,
+ "lr": 0.0002591231629491421,
+ "time_sec": 132.53659439086914
+ },
+ {
+ "epoch": 100,
+ "train_loss": 4.888005011444092,
+ "train_acc": 0.00978,
+ "test_loss": 4.7091091361999515,
+ "test_acc": 0.01,
+ "lyapunov": 1.5793088131853381,
+ "grad_norm": 0.11538715899109499,
+ "grad_max_sv": 0.027404929930344223,
+ "grad_min_sv": 0.0,
+ "grad_condition": 27404929930.344227,
+ "lr": 0.0002499999999999997,
+ "time_sec": 132.47063946723938
+ },
+ {
+ "epoch": 101,
+ "train_loss": 4.890101184844971,
+ "train_acc": 0.00978,
+ "test_loss": 4.713412440490723,
+ "test_acc": 0.01,
+ "lyapunov": 1.583473697037953,
+ "grad_norm": 0.14124961194918514,
+ "grad_max_sv": 0.030058392463251947,
+ "grad_min_sv": 0.0,
+ "grad_condition": 30058392463.251945,
+ "lr": 0.00024098649531343477,
+ "time_sec": 132.50555539131165
+ },
+ {
+ "epoch": 102,
+ "train_loss": 4.887625363464355,
+ "train_acc": 0.01148,
+ "test_loss": 4.7020545562744145,
+ "test_acc": 0.01,
+ "lyapunov": 1.579564877178358,
+ "grad_norm": 0.1297826697220666,
+ "grad_max_sv": 0.019950845977291465,
+ "grad_min_sv": 0.0,
+ "grad_condition": 19950845977.291466,
+ "lr": 0.0002320866025105016,
+ "time_sec": 132.43331456184387
+ },
+ {
+ "epoch": 103,
+ "train_loss": 4.889458109130859,
+ "train_acc": 0.00924,
+ "test_loss": 4.700020100402832,
+ "test_acc": 0.01,
+ "lyapunov": 1.5832947227351195,
+ "grad_norm": 0.16304165123375366,
+ "grad_max_sv": 0.00834191357716918,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8341913577.16918,
+ "lr": 0.0002233042253783278,
+ "time_sec": 132.42489337921143
+ },
+ {
+ "epoch": 104,
+ "train_loss": 4.888043740234375,
+ "train_acc": 0.00976,
+ "test_loss": 4.690122833251953,
+ "test_acc": 0.01,
+ "lyapunov": 1.580241550874832,
+ "grad_norm": 0.16164115490422049,
+ "grad_max_sv": 0.00892186602577567,
+ "grad_min_sv": 0.0,
+ "grad_condition": 8921866025.775671,
+ "lr": 0.000214643216157784,
+ "time_sec": 132.40913486480713
+ },
+ {
+ "epoch": 105,
+ "train_loss": 4.885801515350342,
+ "train_acc": 0.00962,
+ "test_loss": 4.70759442062378,
+ "test_acc": 0.01,
+ "lyapunov": 1.5747494935379613,
+ "grad_norm": 0.10757507074973427,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00020610737385376332,
+ "time_sec": 132.41837000846863
+ },
+ {
+ "epoch": 106,
+ "train_loss": 4.886232281951904,
+ "train_acc": 0.00966,
+ "test_loss": 4.676759211730957,
+ "test_acc": 0.01,
+ "lyapunov": 1.5755804490555279,
+ "grad_norm": 0.11054714782321104,
+ "grad_max_sv": 0.016818781569600105,
+ "grad_min_sv": 0.0,
+ "grad_condition": 16818781569.600103,
+ "lr": 0.00019770044256881242,
+ "time_sec": 132.38776516914368
+ },
+ {
+ "epoch": 107,
+ "train_loss": 4.889010899200439,
+ "train_acc": 0.00964,
+ "test_loss": 4.686521159362793,
+ "test_acc": 0.01,
+ "lyapunov": 1.5793325800420073,
+ "grad_norm": 0.5205851606002122,
+ "grad_max_sv": 0.027481868257746102,
+ "grad_min_sv": 0.0,
+ "grad_condition": 27481868257.7461,
+ "lr": 0.0001894261098608447,
+ "time_sec": 132.4469666481018
+ },
+ {
+ "epoch": 108,
+ "train_loss": 4.885496775512696,
+ "train_acc": 0.00916,
+ "test_loss": 4.701310534667969,
+ "test_acc": 0.01,
+ "lyapunov": 1.5739044819951362,
+ "grad_norm": 0.9976131592675321,
+ "grad_max_sv": 0.010380421532317996,
+ "grad_min_sv": 0.0,
+ "grad_condition": 10380421532.317997,
+ "lr": 0.000181288005125655,
+ "time_sec": 132.34952044487
+ },
+ {
+ "epoch": 109,
+ "train_loss": 4.88569960144043,
+ "train_acc": 0.00982,
+ "test_loss": 4.704411970520019,
+ "test_acc": 0.01,
+ "lyapunov": 1.574234271598289,
+ "grad_norm": 0.9761047066143378,
+ "grad_max_sv": 0.026565171172842385,
+ "grad_min_sv": 0.0,
+ "grad_condition": 26565171172.842384,
+ "lr": 0.0001732896980049473,
+ "time_sec": 132.45858502388
+ },
+ {
+ "epoch": 110,
+ "train_loss": 4.885857049255371,
+ "train_acc": 0.00906,
+ "test_loss": 4.700390522766114,
+ "test_acc": 0.01,
+ "lyapunov": 1.5747647572051533,
+ "grad_norm": 1.1449227675806375,
+ "grad_max_sv": 0.025618467247113585,
+ "grad_min_sv": 0.0,
+ "grad_condition": 25618467247.113586,
+ "lr": 0.00016543469682057076,
+ "time_sec": 132.4441635608673
+ },
+ {
+ "epoch": 111,
+ "train_loss": 4.886974509887695,
+ "train_acc": 0.00982,
+ "test_loss": 4.78629910736084,
+ "test_acc": 0.01,
+ "lyapunov": 1.5769317887933052,
+ "grad_norm": 0.9679265494141023,
+ "grad_max_sv": 0.03804315887391567,
+ "grad_min_sv": 0.0,
+ "grad_condition": 38043158873.91567,
+ "lr": 0.00015772644703565552,
+ "time_sec": 132.5875232219696
+ },
+ {
+ "epoch": 112,
+ "train_loss": 4.886453926544189,
+ "train_acc": 0.00974,
+ "test_loss": 4.8048784591674805,
+ "test_acc": 0.01,
+ "lyapunov": 1.5754460748809074,
+ "grad_norm": 0.8807920950548352,
+ "grad_max_sv": 0.03984132050536573,
+ "grad_min_sv": 0.0,
+ "grad_condition": 39841320505.36573,
+ "lr": 0.00015016832974331713,
+ "time_sec": 132.5120551586151
+ },
+ {
+ "epoch": 113,
+ "train_loss": 4.885906947784424,
+ "train_acc": 0.00966,
+ "test_loss": 4.798358418273926,
+ "test_acc": 0.01,
+ "lyapunov": 1.5747274245752398,
+ "grad_norm": 0.8637882261226464,
+ "grad_max_sv": 0.033320454647764564,
+ "grad_min_sv": 0.0,
+ "grad_condition": 33320454647.764565,
+ "lr": 0.00014276366018359834,
+ "time_sec": 132.50000762939453
+ },
+ {
+ "epoch": 114,
+ "train_loss": 4.885719304962159,
+ "train_acc": 0.00982,
+ "test_loss": 4.793103702545166,
+ "test_acc": 0.01,
+ "lyapunov": 1.5744778527628125,
+ "grad_norm": 0.782099951820462,
+ "grad_max_sv": 0.03417456489987671,
+ "grad_min_sv": 0.0,
+ "grad_condition": 34174564899.87671,
+ "lr": 0.00013551568628929425,
+ "time_sec": 132.49124789237976
+ },
+ {
+ "epoch": 115,
+ "train_loss": 4.8859512828063965,
+ "train_acc": 0.00934,
+ "test_loss": 4.802629745483398,
+ "test_acc": 0.01,
+ "lyapunov": 1.575113305960165,
+ "grad_norm": 0.7049115792540724,
+ "grad_max_sv": 0.018358896067366005,
+ "grad_min_sv": 0.0,
+ "grad_condition": 18358896067.366005,
+ "lr": 0.00012842758726130276,
+ "time_sec": 132.44965839385986
+ },
+ {
+ "epoch": 116,
+ "train_loss": 4.886716898498535,
+ "train_acc": 0.01,
+ "test_loss": 4.802504382324218,
+ "test_acc": 0.01,
+ "lyapunov": 1.5769645506158814,
+ "grad_norm": 0.7070432983143201,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001215024721741218,
+ "time_sec": 132.43424487113953
+ },
+ {
+ "epoch": 117,
+ "train_loss": 4.8879242680358885,
+ "train_acc": 0.00916,
+ "test_loss": 4.805041016387939,
+ "test_acc": 0.01,
+ "lyapunov": 1.5800700291343357,
+ "grad_norm": 0.7061830114700672,
+ "grad_max_sv": 0.02115973932668567,
+ "grad_min_sv": 0.0,
+ "grad_condition": 21159739326.68567,
+ "lr": 0.00011474337861210538,
+ "time_sec": 132.52493023872375
+ },
+ {
+ "epoch": 118,
+ "train_loss": 4.885882244415283,
+ "train_acc": 0.01036,
+ "test_loss": 4.74331266784668,
+ "test_acc": 0.01,
+ "lyapunov": 1.5747067300255035,
+ "grad_norm": 0.7245826894780792,
+ "grad_max_sv": 0.03378571714274585,
+ "grad_min_sv": 0.0,
+ "grad_condition": 33785717142.745857,
+ "lr": 0.00010815327133708009,
+ "time_sec": 132.48710799217224
+ },
+ {
+ "epoch": 119,
+ "train_loss": 4.886389665374756,
+ "train_acc": 0.00962,
+ "test_loss": 4.740865539550781,
+ "test_acc": 0.01,
+ "lyapunov": 1.5762843387511076,
+ "grad_norm": 0.7753676227893881,
+ "grad_max_sv": 0.03039190392009914,
+ "grad_min_sv": 0.0,
+ "grad_condition": 30391903920.09914,
+ "lr": 0.00010173504098790182,
+ "time_sec": 132.4465343952179
+ },
+ {
+ "epoch": 120,
+ "train_loss": 4.886249551086426,
+ "train_acc": 0.00964,
+ "test_loss": 4.7418055305480955,
+ "test_acc": 0.01,
+ "lyapunov": 1.5757878259624667,
+ "grad_norm": 0.7403330417590244,
+ "grad_max_sv": 0.03614077656529844,
+ "grad_min_sv": 0.0,
+ "grad_condition": 36140776565.29844,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 132.79633259773254
+ },
+ {
+ "epoch": 121,
+ "train_loss": 4.886320632019043,
+ "train_acc": 0.0099,
+ "test_loss": 4.7293956802368164,
+ "test_acc": 0.01,
+ "lyapunov": 1.5760322620191842,
+ "grad_norm": 0.7505635192152501,
+ "grad_max_sv": 0.026077959313988687,
+ "grad_min_sv": 0.0,
+ "grad_condition": 26077959313.988686,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 133.23189043998718
+ },
+ {
+ "epoch": 122,
+ "train_loss": 4.887943274230957,
+ "train_acc": 0.00948,
+ "test_loss": 4.919895000457764,
+ "test_acc": 0.01,
+ "lyapunov": 1.5784789354295072,
+ "grad_norm": 0.6996628561837273,
+ "grad_max_sv": 0.0160073421895504,
+ "grad_min_sv": 0.0,
+ "grad_condition": 16007342189.550396,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 132.61993741989136
+ },
+ {
+ "epoch": 123,
+ "train_loss": 4.886383193359375,
+ "train_acc": 0.01012,
+ "test_loss": 4.8154360328674315,
+ "test_acc": 0.01,
+ "lyapunov": 1.5765104918833583,
+ "grad_norm": 0.8202114075319168,
+ "grad_max_sv": 0.0287565924692899,
+ "grad_min_sv": 0.0,
+ "grad_condition": 28756592469.289906,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 132.69449758529663
+ },
+ {
+ "epoch": 124,
+ "train_loss": 4.885598735046386,
+ "train_acc": 0.01062,
+ "test_loss": 4.811818315124512,
+ "test_acc": 0.01,
+ "lyapunov": 1.5741741837138106,
+ "grad_norm": 0.7110817230064039,
+ "grad_max_sv": 0.04011002266779542,
+ "grad_min_sv": 0.0,
+ "grad_condition": 40110022667.795425,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 132.79418468475342
+ },
+ {
+ "epoch": 125,
+ "train_loss": 4.887531413879395,
+ "train_acc": 0.00998,
+ "test_loss": 4.798822694396972,
+ "test_acc": 0.01,
+ "lyapunov": 1.5775156819911869,
+ "grad_norm": 0.6755952206914222,
+ "grad_max_sv": 0.03821564754471183,
+ "grad_min_sv": 0.0,
+ "grad_condition": 38215647544.71183,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 132.56555151939392
+ },
+ {
+ "epoch": 126,
+ "train_loss": 4.885848933258057,
+ "train_acc": 0.0096,
+ "test_loss": 4.79271836013794,
+ "test_acc": 0.01,
+ "lyapunov": 1.5746296488720437,
+ "grad_norm": 0.783689796852182,
+ "grad_max_sv": 0.0219818449113518,
+ "grad_min_sv": 0.0,
+ "grad_condition": 21981844911.3518,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 132.44697856903076
+ },
+ {
+ "epoch": 127,
+ "train_loss": 4.885011657409668,
+ "train_acc": 0.0099,
+ "test_loss": 4.796478929901123,
+ "test_acc": 0.01,
+ "lyapunov": 1.5726598202420012,
+ "grad_norm": 0.746827927020454,
+ "grad_max_sv": 0.006885465793311596,
+ "grad_min_sv": 0.0,
+ "grad_condition": 6885465793.311597,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 132.4967279434204
+ },
+ {
+ "epoch": 128,
+ "train_loss": 4.885314655151367,
+ "train_acc": 0.00972,
+ "test_loss": 4.764711624908447,
+ "test_acc": 0.01,
+ "lyapunov": 1.5735664736584325,
+ "grad_norm": 0.7327332821536672,
+ "grad_max_sv": 0.000560962175950408,
+ "grad_min_sv": 0.0,
+ "grad_condition": 560962175.950408,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 132.5673258304596
+ },
+ {
+ "epoch": 129,
+ "train_loss": 4.886808303070068,
+ "train_acc": 0.00958,
+ "test_loss": 4.767883946990967,
+ "test_acc": 0.01,
+ "lyapunov": 1.5768778150343834,
+ "grad_norm": 0.7089376244924456,
+ "grad_max_sv": 0.0005988820921629667,
+ "grad_min_sv": 0.0,
+ "grad_condition": 598882092.1629667,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 132.46098804473877
+ },
+ {
+ "epoch": 130,
+ "train_loss": 4.886055064697266,
+ "train_acc": 0.00958,
+ "test_loss": 4.76520872039795,
+ "test_acc": 0.01,
+ "lyapunov": 1.575562137167167,
+ "grad_norm": 0.8017477597198375,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 132.55271816253662
+ },
+ {
+ "epoch": 131,
+ "train_loss": 4.8861244363403324,
+ "train_acc": 0.0098,
+ "test_loss": 4.774403156280518,
+ "test_acc": 0.01,
+ "lyapunov": 1.5755851704751134,
+ "grad_norm": 0.8346593666537984,
+ "grad_max_sv": 0.0012377811130136252,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1237781113.0136251,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 132.4554464817047
+ },
+ {
+ "epoch": 132,
+ "train_loss": 4.8852793449401855,
+ "train_acc": 0.00998,
+ "test_loss": 4.771010957336426,
+ "test_acc": 0.01,
+ "lyapunov": 1.573425286566205,
+ "grad_norm": 0.7375330331800295,
+ "grad_max_sv": 0.006311370152980089,
+ "grad_min_sv": 0.0,
+ "grad_condition": 6311370152.980089,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 132.4216513633728
+ },
+ {
+ "epoch": 133,
+ "train_loss": 4.884971447448731,
+ "train_acc": 0.00938,
+ "test_loss": 4.771634101104737,
+ "test_acc": 0.01,
+ "lyapunov": 1.572620025985991,
+ "grad_norm": 0.6774345796584929,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 132.4028835296631
+ },
+ {
+ "epoch": 134,
+ "train_loss": 4.885691842803955,
+ "train_acc": 0.01002,
+ "test_loss": 4.844159544372559,
+ "test_acc": 0.01,
+ "lyapunov": 1.57454265353015,
+ "grad_norm": 0.7944955115704805,
+ "grad_max_sv": 0.02395228371024132,
+ "grad_min_sv": 0.0,
+ "grad_condition": 23952283710.241318,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 132.41754722595215
+ },
+ {
+ "epoch": 135,
+ "train_loss": 4.8864432501220705,
+ "train_acc": 0.0101,
+ "test_loss": 4.844892832946777,
+ "test_acc": 0.01,
+ "lyapunov": 1.575845740945138,
+ "grad_norm": 0.7437160641154223,
+ "grad_max_sv": 0.020727850822731854,
+ "grad_min_sv": 0.0,
+ "grad_condition": 20727850822.731853,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 132.44422578811646
+ },
+ {
+ "epoch": 136,
+ "train_loss": 4.8851325263977055,
+ "train_acc": 0.0098,
+ "test_loss": 4.8378851570129395,
+ "test_acc": 0.01,
+ "lyapunov": 1.5731066611721694,
+ "grad_norm": 0.6658420197701125,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 132.38768362998962
+ },
+ {
+ "epoch": 137,
+ "train_loss": 4.885479872436523,
+ "train_acc": 0.01006,
+ "test_loss": 4.843586358642578,
+ "test_acc": 0.01,
+ "lyapunov": 1.5740535426932527,
+ "grad_norm": 0.7299510564419838,
+ "grad_max_sv": 0.003957807831466198,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3957807831.466198,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 132.38154101371765
+ },
+ {
+ "epoch": 138,
+ "train_loss": 4.884863400421143,
+ "train_acc": 0.01014,
+ "test_loss": 4.843053856658935,
+ "test_acc": 0.01,
+ "lyapunov": 1.5721587311581273,
+ "grad_norm": 0.6927716154040414,
+ "grad_max_sv": 0.017578842211514713,
+ "grad_min_sv": 0.0,
+ "grad_condition": 17578842211.51471,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 132.4182834625244
+ },
+ {
+ "epoch": 139,
+ "train_loss": 4.884934008331299,
+ "train_acc": 0.01022,
+ "test_loss": 4.844250295257568,
+ "test_acc": 0.01,
+ "lyapunov": 1.5725375057181434,
+ "grad_norm": 0.6981880900264675,
+ "grad_max_sv": 0.0031383157707750796,
+ "grad_min_sv": 0.0,
+ "grad_condition": 3138315770.7750797,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 132.41427326202393
+ },
+ {
+ "epoch": 140,
+ "train_loss": 4.885497499389649,
+ "train_acc": 0.00972,
+ "test_loss": 4.844135813903809,
+ "test_acc": 0.01,
+ "lyapunov": 1.574064860868332,
+ "grad_norm": 0.774635016593933,
+ "grad_max_sv": 0.005403042444959283,
+ "grad_min_sv": 0.0,
+ "grad_condition": 5403042444.959283,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 132.38426899909973
+ },
+ {
+ "epoch": 141,
+ "train_loss": 4.885045772247315,
+ "train_acc": 0.01014,
+ "test_loss": 4.8358864456176756,
+ "test_acc": 0.01,
+ "lyapunov": 1.5727792880724154,
+ "grad_norm": 0.7412742981630644,
+ "grad_max_sv": 0.011697014886885881,
+ "grad_min_sv": 0.0,
+ "grad_condition": 11697014886.885881,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 132.46910786628723
+ },
+ {
+ "epoch": 142,
+ "train_loss": 4.884702201538086,
+ "train_acc": 0.01002,
+ "test_loss": 4.838421836090088,
+ "test_acc": 0.01,
+ "lyapunov": 1.5717649999481942,
+ "grad_norm": 0.7113065718119301,
+ "grad_max_sv": 0.00798416011966765,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7984160119.66765,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 132.44912910461426
+ },
+ {
+ "epoch": 143,
+ "train_loss": 4.885199571380615,
+ "train_acc": 0.00982,
+ "test_loss": 4.841495401763916,
+ "test_acc": 0.01,
+ "lyapunov": 1.5731582995265951,
+ "grad_norm": 0.705829448061863,
+ "grad_max_sv": 0.021906211972236633,
+ "grad_min_sv": 0.0,
+ "grad_condition": 21906211972.236633,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 132.39459085464478
+ },
+ {
+ "epoch": 144,
+ "train_loss": 4.884931218566894,
+ "train_acc": 0.01002,
+ "test_loss": 4.842521714782714,
+ "test_acc": 0.01,
+ "lyapunov": 1.5725436259413619,
+ "grad_norm": 0.7770696416339791,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 132.33704686164856
+ },
+ {
+ "epoch": 145,
+ "train_loss": 4.885003453521729,
+ "train_acc": 0.01038,
+ "test_loss": 4.84215620880127,
+ "test_acc": 0.01,
+ "lyapunov": 1.5727140568101499,
+ "grad_norm": 0.7469803441120764,
+ "grad_max_sv": 0.007154888892546296,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7154888892.546295,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 132.3757495880127
+ },
+ {
+ "epoch": 146,
+ "train_loss": 4.885197346801758,
+ "train_acc": 0.00996,
+ "test_loss": 4.842266304016113,
+ "test_acc": 0.01,
+ "lyapunov": 1.5733027034403417,
+ "grad_norm": 0.7332908840273178,
+ "grad_max_sv": 0.0006548997946083546,
+ "grad_min_sv": 0.0,
+ "grad_condition": 654899794.6083546,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 132.45014452934265
+ },
+ {
+ "epoch": 147,
+ "train_loss": 4.885225572662353,
+ "train_acc": 0.01,
+ "test_loss": 4.841919314575195,
+ "test_acc": 0.01,
+ "lyapunov": 1.5734141430891384,
+ "grad_norm": 0.7407542017866708,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 132.37303113937378
+ },
+ {
+ "epoch": 148,
+ "train_loss": 4.885419764556885,
+ "train_acc": 0.01,
+ "test_loss": 4.841919337463379,
+ "test_acc": 0.01,
+ "lyapunov": 1.5739776710110247,
+ "grad_norm": 0.7868248231615788,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 132.36948442459106
+ },
+ {
+ "epoch": 149,
+ "train_loss": 4.884984393463135,
+ "train_acc": 0.01,
+ "test_loss": 4.841919581604004,
+ "test_acc": 0.01,
+ "lyapunov": 1.5726999001734703,
+ "grad_norm": 0.7663497621598592,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 132.3525311946869
+ },
+ {
+ "epoch": 150,
+ "train_loss": 4.8838786590576175,
+ "train_acc": 0.01,
+ "test_loss": 4.841919624328614,
+ "test_acc": 0.01,
+ "lyapunov": 1.5694036883161502,
+ "grad_norm": 0.6984069616734725,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0,
+ "time_sec": 132.51661276817322
+ }
+ ],
+ "16": [
+ {
+ "epoch": 1,
+ "train_loss": 4.785678502502441,
+ "train_acc": 0.01854,
+ "test_loss": 4.888219262695313,
+ "test_acc": 0.0096,
+ "lyapunov": 2.2034229628570245,
+ "grad_norm": 4.9662527525898525,
+ "grad_max_sv": 4.1295246422290806,
+ "grad_min_sv": 8.43239183145883e-08,
+ "grad_condition": 57848709.59664528,
+ "lr": 0.0009998903417374227,
+ "time_sec": 178.03496599197388
+ },
+ {
+ "epoch": 2,
+ "train_loss": 4.6398111044311525,
+ "train_acc": 0.0207,
+ "test_loss": 4.653040969085693,
+ "test_acc": 0.01,
+ "lyapunov": 1.9294306939215307,
+ "grad_norm": 3.0185365178654044,
+ "grad_max_sv": 2.4029204517602922,
+ "grad_min_sv": 5.100535853952426e-08,
+ "grad_condition": 482708945.8134031,
+ "lr": 0.0009995614150494292,
+ "time_sec": 178.04272985458374
+ },
+ {
+ "epoch": 3,
+ "train_loss": 4.587504278259277,
+ "train_acc": 0.01798,
+ "test_loss": 4.565644731140137,
+ "test_acc": 0.0158,
+ "lyapunov": 1.7756437584567253,
+ "grad_norm": 1.468640621914821,
+ "grad_max_sv": 0.8633963579282863,
+ "grad_min_sv": 1.4697805644365008e-08,
+ "grad_condition": 29354955308.653522,
+ "lr": 0.0009990133642141358,
+ "time_sec": 177.90911650657654
+ },
+ {
+ "epoch": 4,
+ "train_loss": 4.609674820861817,
+ "train_acc": 0.01586,
+ "test_loss": 5.16701375579834,
+ "test_acc": 0.0101,
+ "lyapunov": 1.7137653553272452,
+ "grad_norm": 0.7203838648352618,
+ "grad_max_sv": 0.5238488506525755,
+ "grad_min_sv": 2.2053512622504097e-09,
+ "grad_condition": 75198729364.04495,
+ "lr": 0.0009982464296247522,
+ "time_sec": 177.86139965057373
+ },
+ {
+ "epoch": 5,
+ "train_loss": 4.638868305969238,
+ "train_acc": 0.01426,
+ "test_loss": 5.560866254425049,
+ "test_acc": 0.01,
+ "lyapunov": 1.6978333834796915,
+ "grad_norm": 0.5502157339199643,
+ "grad_max_sv": 0.44361272603273394,
+ "grad_min_sv": 2.7029428141806377e-12,
+ "grad_condition": 181889969040.05048,
+ "lr": 0.0009972609476841367,
+ "time_sec": 177.9277467727661
+ },
+ {
+ "epoch": 6,
+ "train_loss": 4.669847656402588,
+ "train_acc": 0.01332,
+ "test_loss": 4.8178652496337895,
+ "test_acc": 0.01,
+ "lyapunov": 1.7381863307465069,
+ "grad_norm": 0.5563091323848212,
+ "grad_max_sv": 0.37752934321761134,
+ "grad_min_sv": 1.4602178925586487e-12,
+ "grad_condition": 201992262866.57877,
+ "lr": 0.000996057350657239,
+ "time_sec": 177.8438265323639
+ },
+ {
+ "epoch": 7,
+ "train_loss": 4.702823111572266,
+ "train_acc": 0.01186,
+ "test_loss": 4.627877201843262,
+ "test_acc": 0.01,
+ "lyapunov": 1.7552724058365883,
+ "grad_norm": 0.4233607461027203,
+ "grad_max_sv": 0.35499467700719833,
+ "grad_min_sv": 3.8501282054302263e-13,
+ "grad_condition": 282171382589.46027,
+ "lr": 0.000994636166481494,
+ "time_sec": 177.7493600845337
+ },
+ {
+ "epoch": 8,
+ "train_loss": 4.722017111511231,
+ "train_acc": 0.01098,
+ "test_loss": 6.090566035461426,
+ "test_acc": 0.01,
+ "lyapunov": 1.7357035292993725,
+ "grad_norm": 0.3850039806872663,
+ "grad_max_sv": 0.3226898044347763,
+ "grad_min_sv": 7.113592445244562e-14,
+ "grad_condition": 304348428639.08154,
+ "lr": 0.0009929980185352525,
+ "time_sec": 177.78767728805542
+ },
+ {
+ "epoch": 9,
+ "train_loss": 4.741448409118652,
+ "train_acc": 0.01154,
+ "test_loss": 5.83977333984375,
+ "test_acc": 0.01,
+ "lyapunov": 1.7204718992228398,
+ "grad_norm": 0.4078264807422899,
+ "grad_max_sv": 0.31335003934800626,
+ "grad_min_sv": 1.9402458265888006e-13,
+ "grad_condition": 298038507715.96027,
+ "lr": 0.0009911436253643444,
+ "time_sec": 177.80518293380737
+ },
+ {
+ "epoch": 10,
+ "train_loss": 4.747990810241699,
+ "train_acc": 0.01106,
+ "test_loss": 6.513046632385254,
+ "test_acc": 0.01,
+ "lyapunov": 1.6953654838035175,
+ "grad_norm": 0.4292578477364445,
+ "grad_max_sv": 0.3652988448739052,
+ "grad_min_sv": 1.2809375813436604e-13,
+ "grad_condition": 342642686942.9036,
+ "lr": 0.0009890738003669028,
+ "time_sec": 177.78542613983154
+ },
+ {
+ "epoch": 11,
+ "train_loss": 4.765809431610108,
+ "train_acc": 0.01214,
+ "test_loss": 7.22933176574707,
+ "test_acc": 0.01,
+ "lyapunov": 1.7186210655495333,
+ "grad_norm": 0.4487253545215033,
+ "grad_max_sv": 0.3868314690887928,
+ "grad_min_sv": 3.013939023123918e-13,
+ "grad_condition": 329330315777.6491,
+ "lr": 0.00098678945143658,
+ "time_sec": 177.81605434417725
+ },
+ {
+ "epoch": 12,
+ "train_loss": 4.784488880615235,
+ "train_acc": 0.00986,
+ "test_loss": 4.611177786254883,
+ "test_acc": 0.01,
+ "lyapunov": 1.652159307009119,
+ "grad_norm": 0.4707826268774683,
+ "grad_max_sv": 0.3026094869710505,
+ "grad_min_sv": 3.8656478774921674e-15,
+ "grad_condition": 301420540269.25793,
+ "lr": 0.0009842915805643154,
+ "time_sec": 177.8059630393982
+ },
+ {
+ "epoch": 13,
+ "train_loss": 4.809918058624268,
+ "train_acc": 0.00966,
+ "test_loss": 5.106430908203125,
+ "test_acc": 0.01,
+ "lyapunov": 1.6707328871997726,
+ "grad_norm": 0.667273831565697,
+ "grad_max_sv": 0.24273031912744045,
+ "grad_min_sv": 1.0572839902934006e-10,
+ "grad_condition": 229305129700.13013,
+ "lr": 0.000981581283398829,
+ "time_sec": 177.8098611831665
+ },
+ {
+ "epoch": 14,
+ "train_loss": 4.825652238159179,
+ "train_acc": 0.01056,
+ "test_loss": 10.256812258911133,
+ "test_acc": 0.01,
+ "lyapunov": 1.6938227213861998,
+ "grad_norm": 1.331380545313032,
+ "grad_max_sv": 0.26493136398494244,
+ "grad_min_sv": 2.65579091596793e-10,
+ "grad_condition": 237101921206.0838,
+ "lr": 0.0009786597487660333,
+ "time_sec": 177.74433708190918
+ },
+ {
+ "epoch": 15,
+ "train_loss": 4.858567563171387,
+ "train_acc": 0.01086,
+ "test_loss": 4.6056615829467775,
+ "test_acc": 0.01,
+ "lyapunov": 1.7649985844521876,
+ "grad_norm": 0.6838854666615405,
+ "grad_max_sv": 0.34980414882302285,
+ "grad_min_sv": 2.1796140399673834e-13,
+ "grad_condition": 312022583270.1326,
+ "lr": 0.0009755282581475766,
+ "time_sec": 177.7609293460846
+ },
+ {
+ "epoch": 16,
+ "train_loss": 4.88505381439209,
+ "train_acc": 0.01104,
+ "test_loss": 4.605761392211914,
+ "test_acc": 0.01,
+ "lyapunov": 1.8020565973218445,
+ "grad_norm": 0.5845356530706413,
+ "grad_max_sv": 0.2943306349217892,
+ "grad_min_sv": 4.369502606031448e-14,
+ "grad_condition": 287139369751.0244,
+ "lr": 0.0009721881851187403,
+ "time_sec": 177.8197786808014
+ },
+ {
+ "epoch": 17,
+ "train_loss": 4.893186149749756,
+ "train_acc": 0.01036,
+ "test_loss": 4.605876076507569,
+ "test_acc": 0.01,
+ "lyapunov": 1.7787105851161205,
+ "grad_norm": 0.4680659078828573,
+ "grad_max_sv": 0.2733098614960909,
+ "grad_min_sv": 4.296774163499721e-19,
+ "grad_condition": 273309717860.49023,
+ "lr": 0.0009686409947459456,
+ "time_sec": 177.79044127464294
+ },
+ {
+ "epoch": 18,
+ "train_loss": 4.893065974731445,
+ "train_acc": 0.0107,
+ "test_loss": 4.6065135696411135,
+ "test_acc": 0.01,
+ "lyapunov": 1.718729690822494,
+ "grad_norm": 0.5727929210621684,
+ "grad_max_sv": 0.30122888199985026,
+ "grad_min_sv": 4.424719830275789e-19,
+ "grad_condition": 301228714224.6802,
+ "lr": 0.0009648882429441254,
+ "time_sec": 177.80086708068848
+ },
+ {
+ "epoch": 19,
+ "train_loss": 4.88860928604126,
+ "train_acc": 0.01,
+ "test_loss": 4.702660593414307,
+ "test_acc": 0.01,
+ "lyapunov": 1.6696165498260342,
+ "grad_norm": 0.42342867331427436,
+ "grad_max_sv": 0.34960081316530706,
+ "grad_min_sv": 2.8274243075655694e-14,
+ "grad_condition": 340909047209.5011,
+ "lr": 0.00096093157579425,
+ "time_sec": 177.7979953289032
+ },
+ {
+ "epoch": 20,
+ "train_loss": 4.903309204711914,
+ "train_acc": 0.01068,
+ "test_loss": 5.4670142036437985,
+ "test_acc": 0.01,
+ "lyapunov": 1.6678839117059927,
+ "grad_norm": 0.5364190790754718,
+ "grad_max_sv": 0.3460624013096094,
+ "grad_min_sv": 1.5815154140131103e-14,
+ "grad_condition": 341291954932.3224,
+ "lr": 0.0009567727288213001,
+ "time_sec": 177.79369568824768
+ },
+ {
+ "epoch": 21,
+ "train_loss": 4.915025991210937,
+ "train_acc": 0.01106,
+ "test_loss": 4.692510232543945,
+ "test_acc": 0.01,
+ "lyapunov": 1.6982163163402197,
+ "grad_norm": 0.5511803995310802,
+ "grad_max_sv": 0.34619002789258957,
+ "grad_min_sv": 4.733950722420789e-14,
+ "grad_condition": 333444655591.8086,
+ "lr": 0.0009524135262330095,
+ "time_sec": 177.79608535766602
+ },
+ {
+ "epoch": 22,
+ "train_loss": 4.909840554809571,
+ "train_acc": 0.01084,
+ "test_loss": 4.6062485778808595,
+ "test_acc": 0.01,
+ "lyapunov": 1.6909822228619509,
+ "grad_norm": 0.4483805706207121,
+ "grad_max_sv": 0.3018789976027193,
+ "grad_min_sv": 3.421304159357815e-14,
+ "grad_condition": 293400173556.4137,
+ "lr": 0.0009478558801197061,
+ "time_sec": 177.81299710273743
+ },
+ {
+ "epoch": 23,
+ "train_loss": 4.909692084808349,
+ "train_acc": 0.01108,
+ "test_loss": 4.6094023056030275,
+ "test_acc": 0.01,
+ "lyapunov": 1.6835671846214157,
+ "grad_norm": 0.45426031851013016,
+ "grad_max_sv": 0.3322039857506752,
+ "grad_min_sv": 6.560297434150338e-15,
+ "grad_condition": 330632003336.626,
+ "lr": 0.000943101789615607,
+ "time_sec": 177.8134524822235
+ },
+ {
+ "epoch": 24,
+ "train_loss": 4.901827787475586,
+ "train_acc": 0.011,
+ "test_loss": 4.606396533203125,
+ "test_acc": 0.01,
+ "lyapunov": 1.6725571582384426,
+ "grad_norm": 0.5007132528772561,
+ "grad_max_sv": 0.3051792338490486,
+ "grad_min_sv": 2.976912647072195e-14,
+ "grad_condition": 299276387943.3783,
+ "lr": 0.0009381533400219313,
+ "time_sec": 177.7837200164795
+ },
+ {
+ "epoch": 25,
+ "train_loss": 4.899776871948243,
+ "train_acc": 0.0109,
+ "test_loss": 4.606364790344238,
+ "test_acc": 0.01,
+ "lyapunov": 1.6670247737099142,
+ "grad_norm": 0.4224268025378797,
+ "grad_max_sv": 0.2703032233530493,
+ "grad_min_sv": 5.37251515366592e-15,
+ "grad_condition": 268629366269.90933,
+ "lr": 0.0009330127018922189,
+ "time_sec": 177.82209467887878
+ },
+ {
+ "epoch": 26,
+ "train_loss": 4.896821321258545,
+ "train_acc": 0.0107,
+ "test_loss": 4.722185048675537,
+ "test_acc": 0.01,
+ "lyapunov": 1.6472089549769526,
+ "grad_norm": 0.48011762637076694,
+ "grad_max_sv": 0.2670708648860455,
+ "grad_min_sv": 3.756115387104417e-15,
+ "grad_condition": 266170283847.3038,
+ "lr": 0.000927682130080253,
+ "time_sec": 177.78438448905945
+ },
+ {
+ "epoch": 27,
+ "train_loss": 4.906476246490478,
+ "train_acc": 0.01086,
+ "test_loss": 5.412735247802734,
+ "test_acc": 0.01,
+ "lyapunov": 1.6813617880691958,
+ "grad_norm": 0.4406715400059857,
+ "grad_max_sv": 0.25074354074895383,
+ "grad_min_sv": 6.093407208933511e-20,
+ "grad_condition": 250743525278.97955,
+ "lr": 0.0009221639627510072,
+ "time_sec": 177.7901487350464
+ },
+ {
+ "epoch": 28,
+ "train_loss": 4.893644842224121,
+ "train_acc": 0.01172,
+ "test_loss": 5.005291435241699,
+ "test_acc": 0.01,
+ "lyapunov": 1.6454817526175847,
+ "grad_norm": 0.3605258439803559,
+ "grad_max_sv": 0.2296090517193079,
+ "grad_min_sv": 8.79898850927057e-21,
+ "grad_condition": 229609049604.029,
+ "lr": 0.0009164606203550494,
+ "time_sec": 177.8756561279297
+ },
+ {
+ "epoch": 29,
+ "train_loss": 4.886972426452637,
+ "train_acc": 0.01162,
+ "test_loss": 5.60837995223999,
+ "test_acc": 0.01,
+ "lyapunov": 1.6373517272417502,
+ "grad_norm": 0.35252531034326595,
+ "grad_max_sv": 0.2174192801117897,
+ "grad_min_sv": 1.7514629554834846e-20,
+ "grad_condition": 217419276581.3401,
+ "lr": 0.0009105746045668516,
+ "time_sec": 177.83988404273987
+ },
+ {
+ "epoch": 30,
+ "train_loss": 4.887171002197266,
+ "train_acc": 0.011,
+ "test_loss": 5.029856091308594,
+ "test_acc": 0.01,
+ "lyapunov": 1.6322715209268244,
+ "grad_norm": 0.3694860441565804,
+ "grad_max_sv": 0.1933195549994707,
+ "grad_min_sv": 2.0216060912179585e-20,
+ "grad_condition": 193319550988.26825,
+ "lr": 0.0009045084971874733,
+ "time_sec": 177.91060781478882
+ },
+ {
+ "epoch": 31,
+ "train_loss": 4.882497029418945,
+ "train_acc": 0.01094,
+ "test_loss": 4.946529456329346,
+ "test_acc": 0.01,
+ "lyapunov": 1.6160695430872691,
+ "grad_norm": 0.3009086445042491,
+ "grad_max_sv": 0.17770135290920736,
+ "grad_min_sv": 3.24419256482409e-21,
+ "grad_condition": 177701352269.52295,
+ "lr": 0.0008982649590120977,
+ "time_sec": 179.66105842590332
+ },
+ {
+ "epoch": 32,
+ "train_loss": 4.880725912780762,
+ "train_acc": 0.01128,
+ "test_loss": 5.578618463897705,
+ "test_acc": 0.01,
+ "lyapunov": 1.62386571232925,
+ "grad_norm": 0.36023587191613426,
+ "grad_max_sv": 0.1822029523551464,
+ "grad_min_sv": 3.6796007523380705e-21,
+ "grad_condition": 182202951444.53656,
+ "lr": 0.0008918467286629196,
+ "time_sec": 179.0988199710846
+ },
+ {
+ "epoch": 33,
+ "train_loss": 4.908818702850342,
+ "train_acc": 0.01182,
+ "test_loss": 4.791287840270996,
+ "test_acc": 0.01,
+ "lyapunov": 1.674632024886968,
+ "grad_norm": 2.355286231583665,
+ "grad_max_sv": 0.1451555678440961,
+ "grad_min_sv": 3.147262321441897e-13,
+ "grad_condition": 145124831420.269,
+ "lr": 0.0008852566213878943,
+ "time_sec": 177.81290411949158
+ },
+ {
+ "epoch": 34,
+ "train_loss": 4.966870961761475,
+ "train_acc": 0.00932,
+ "test_loss": 4.691395782470703,
+ "test_acc": 0.01,
+ "lyapunov": 1.7797045579651738,
+ "grad_norm": 0.4484129521918933,
+ "grad_max_sv": 0.14517696127295493,
+ "grad_min_sv": 1.115426717388758e-15,
+ "grad_condition": 144975581810.04208,
+ "lr": 0.000878497527825878,
+ "time_sec": 177.8652102947235
+ },
+ {
+ "epoch": 35,
+ "train_loss": 4.915819309997558,
+ "train_acc": 0.01472,
+ "test_loss": 4.624800839996338,
+ "test_acc": 0.01,
+ "lyapunov": 1.721020828122678,
+ "grad_norm": 1.0620945447138674,
+ "grad_max_sv": 0.19911672528833152,
+ "grad_min_sv": 1.9872991955575878e-10,
+ "grad_condition": 95641187798.97682,
+ "lr": 0.000871572412738697,
+ "time_sec": 177.88512420654297
+ },
+ {
+ "epoch": 36,
+ "train_loss": 4.9530413731384275,
+ "train_acc": 0.01452,
+ "test_loss": 4.789580516052246,
+ "test_acc": 0.0101,
+ "lyapunov": 1.8076083949764672,
+ "grad_norm": 0.5972631933008199,
+ "grad_max_sv": 0.19924248810857534,
+ "grad_min_sv": 3.440275442940527e-10,
+ "grad_condition": 148843110630.56686,
+ "lr": 0.0008644843137107055,
+ "time_sec": 177.85971999168396
+ },
+ {
+ "epoch": 37,
+ "train_loss": 4.963237725219726,
+ "train_acc": 0.01242,
+ "test_loss": 9.607163096618653,
+ "test_acc": 0.01,
+ "lyapunov": 1.7487757071814574,
+ "grad_norm": 0.5178441019436488,
+ "grad_max_sv": 0.2677606202661991,
+ "grad_min_sv": 1.2794001535597794e-09,
+ "grad_condition": 118342772090.25644,
+ "lr": 0.0008572363398164014,
+ "time_sec": 177.87799191474915
+ },
+ {
+ "epoch": 38,
+ "train_loss": 4.974736349639892,
+ "train_acc": 0.01056,
+ "test_loss": 4.772847597503662,
+ "test_acc": 0.01,
+ "lyapunov": 1.6420561239847442,
+ "grad_norm": 0.7737397356236614,
+ "grad_max_sv": 0.48621650636196134,
+ "grad_min_sv": 5.431396735144922e-09,
+ "grad_condition": 1130833560.0526097,
+ "lr": 0.0008498316702566826,
+ "time_sec": 177.84695863723755
+ },
+ {
+ "epoch": 39,
+ "train_loss": 4.914389076538086,
+ "train_acc": 0.00954,
+ "test_loss": 5.4321878707885745,
+ "test_acc": 0.01,
+ "lyapunov": 1.606756867959981,
+ "grad_norm": 0.6387073953630102,
+ "grad_max_sv": 0.28100625462830064,
+ "grad_min_sv": 1.1923785099299402e-09,
+ "grad_condition": 31042166964.6133,
+ "lr": 0.0008422735529643442,
+ "time_sec": 177.8997838497162
+ },
+ {
+ "epoch": 40,
+ "train_loss": 4.907334909515381,
+ "train_acc": 0.00932,
+ "test_loss": 5.197367625427246,
+ "test_acc": 0.01,
+ "lyapunov": 1.6101341015847443,
+ "grad_norm": 0.549617557037775,
+ "grad_max_sv": 0.21684555038809777,
+ "grad_min_sv": 1.6231511646555081e-12,
+ "grad_condition": 115360148938.91074,
+ "lr": 0.0008345653031794289,
+ "time_sec": 177.88523411750793
+ },
+ {
+ "epoch": 41,
+ "train_loss": 4.9172815733337405,
+ "train_acc": 0.00966,
+ "test_loss": 5.328871868896484,
+ "test_acc": 0.01,
+ "lyapunov": 1.6233936231154615,
+ "grad_norm": 0.6437990568107412,
+ "grad_max_sv": 0.23363575600087644,
+ "grad_min_sv": 5.030357610936974e-10,
+ "grad_condition": 138575586823.60834,
+ "lr": 0.0008267103019950526,
+ "time_sec": 177.87491416931152
+ },
+ {
+ "epoch": 42,
+ "train_loss": 4.910974921875,
+ "train_acc": 0.0094,
+ "test_loss": 5.260343148803711,
+ "test_acc": 0.01,
+ "lyapunov": 1.6119288898185087,
+ "grad_norm": 0.6213630809261163,
+ "grad_max_sv": 0.2208472192287445,
+ "grad_min_sv": 1.6566058977896803e-10,
+ "grad_condition": 142601015959.25623,
+ "lr": 0.0008187119948743447,
+ "time_sec": 177.85157465934753
+ },
+ {
+ "epoch": 43,
+ "train_loss": 4.910828229217529,
+ "train_acc": 0.0082,
+ "test_loss": 4.699688921356201,
+ "test_acc": 0.01,
+ "lyapunov": 1.6258944394948232,
+ "grad_norm": 0.4079357024315036,
+ "grad_max_sv": 0.15661620609462262,
+ "grad_min_sv": 1.7684309930750455e-15,
+ "grad_condition": 156350108060.72934,
+ "lr": 0.000810573890139155,
+ "time_sec": 177.86257314682007
+ },
+ {
+ "epoch": 44,
+ "train_loss": 4.896916885833741,
+ "train_acc": 0.00922,
+ "test_loss": 4.812428985595703,
+ "test_acc": 0.01,
+ "lyapunov": 1.5950726255431504,
+ "grad_norm": 0.4783756369080321,
+ "grad_max_sv": 0.14141971599310638,
+ "grad_min_sv": 1.3813946661647787e-39,
+ "grad_condition": 141419715993.10638,
+ "lr": 0.0008022995574311873,
+ "time_sec": 177.92987060546875
+ },
+ {
+ "epoch": 45,
+ "train_loss": 4.908877978973389,
+ "train_acc": 0.00912,
+ "test_loss": 4.708805274963379,
+ "test_acc": 0.01,
+ "lyapunov": 1.6267534076710186,
+ "grad_norm": 0.7771603049125322,
+ "grad_max_sv": 0.15806035809218882,
+ "grad_min_sv": 1.4034116208559716e-15,
+ "grad_condition": 157762251235.76987,
+ "lr": 0.0007938926261462363,
+ "time_sec": 177.94272303581238
+ },
+ {
+ "epoch": 46,
+ "train_loss": 4.90580543838501,
+ "train_acc": 0.00928,
+ "test_loss": 4.734797378540039,
+ "test_acc": 0.01,
+ "lyapunov": 1.6176637389775737,
+ "grad_norm": 0.6942542366402378,
+ "grad_max_sv": 0.15787413250654936,
+ "grad_min_sv": 7.864894789560978e-16,
+ "grad_condition": 157723200668.28387,
+ "lr": 0.0007853567838422158,
+ "time_sec": 177.97623896598816
+ },
+ {
+ "epoch": 47,
+ "train_loss": 4.8965187059021,
+ "train_acc": 0.00938,
+ "test_loss": 4.6579503898620604,
+ "test_acc": 0.01,
+ "lyapunov": 1.5973099085985851,
+ "grad_norm": 0.36353228305050295,
+ "grad_max_sv": 0.13088524471968413,
+ "grad_min_sv": 1.2231276530985221e-20,
+ "grad_condition": 130885242907.8948,
+ "lr": 0.0007766957746216719,
+ "time_sec": 177.95993542671204
+ },
+ {
+ "epoch": 48,
+ "train_loss": 4.8988071447753905,
+ "train_acc": 0.00944,
+ "test_loss": 4.662165933227539,
+ "test_acc": 0.01,
+ "lyapunov": 1.603416101402029,
+ "grad_norm": 0.3898458431943687,
+ "grad_max_sv": 0.1284548096358776,
+ "grad_min_sv": 1.1576870843401716e-38,
+ "grad_condition": 128454809635.87761,
+ "lr": 0.0007679133974894982,
+ "time_sec": 177.8052430152893
+ },
+ {
+ "epoch": 49,
+ "train_loss": 4.913481904144287,
+ "train_acc": 0.00918,
+ "test_loss": 4.763600569915772,
+ "test_acc": 0.01,
+ "lyapunov": 1.6402373295610824,
+ "grad_norm": 0.5994299094599757,
+ "grad_max_sv": 0.1396894573670579,
+ "grad_min_sv": 2.779377619525618e-15,
+ "grad_condition": 139046550095.99487,
+ "lr": 0.000759013504686565,
+ "time_sec": 177.86163926124573
+ },
+ {
+ "epoch": 50,
+ "train_loss": 4.906329712219239,
+ "train_acc": 0.00982,
+ "test_loss": 4.609917034912109,
+ "test_acc": 0.01,
+ "lyapunov": 1.6202878165427985,
+ "grad_norm": 0.6143555741962269,
+ "grad_max_sv": 0.15427468828856944,
+ "grad_min_sv": 1.5586657350285492e-15,
+ "grad_condition": 153998022994.1138,
+ "lr": 0.0007499999999999998,
+ "time_sec": 177.81070852279663
+ },
+ {
+ "epoch": 51,
+ "train_loss": 4.901778139953613,
+ "train_acc": 0.01,
+ "test_loss": 5.7906026428222654,
+ "test_acc": 0.01,
+ "lyapunov": 1.6095840150438,
+ "grad_norm": 0.4846890301599483,
+ "grad_max_sv": 0.10476460931822658,
+ "grad_min_sv": 6.919555377168684e-15,
+ "grad_condition": 103682757395.60971,
+ "lr": 0.0007408768370508575,
+ "time_sec": 177.827232837677
+ },
+ {
+ "epoch": 52,
+ "train_loss": 4.897733354492187,
+ "train_acc": 0.0102,
+ "test_loss": 5.14119333190918,
+ "test_acc": 0.01,
+ "lyapunov": 1.6018984003749954,
+ "grad_norm": 0.45183942591328674,
+ "grad_max_sv": 0.08775242893025278,
+ "grad_min_sv": 1.964503741104032e-16,
+ "grad_condition": 87731321318.76743,
+ "lr": 0.0007316480175599307,
+ "time_sec": 177.8825397491455
+ },
+ {
+ "epoch": 53,
+ "train_loss": 4.899286302947998,
+ "train_acc": 0.0105,
+ "test_loss": 5.116060150146485,
+ "test_acc": 0.01,
+ "lyapunov": 1.6068680664462507,
+ "grad_norm": 0.39046803319247386,
+ "grad_max_sv": 0.10442779418081045,
+ "grad_min_sv": 1.8704405143177693e-32,
+ "grad_condition": 104427794180.81046,
+ "lr": 0.0007223175895924635,
+ "time_sec": 177.85691237449646
+ },
+ {
+ "epoch": 54,
+ "train_loss": 4.900419689025879,
+ "train_acc": 0.00974,
+ "test_loss": 6.225739611816406,
+ "test_acc": 0.01,
+ "lyapunov": 1.611330489673273,
+ "grad_norm": 0.7830684513344699,
+ "grad_max_sv": 0.08616076316975523,
+ "grad_min_sv": 7.006492321624086e-47,
+ "grad_condition": 86160763169.75522,
+ "lr": 0.0007128896457825361,
+ "time_sec": 177.79533982276917
+ },
+ {
+ "epoch": 55,
+ "train_loss": 4.90022905456543,
+ "train_acc": 0.00872,
+ "test_loss": 4.660898509216309,
+ "test_acc": 0.01,
+ "lyapunov": 1.6107879657574626,
+ "grad_norm": 0.3602507862317559,
+ "grad_max_sv": 0.07782914067938691,
+ "grad_min_sv": 0.0,
+ "grad_condition": 77829140679.3869,
+ "lr": 0.0007033683215378998,
+ "time_sec": 177.81696367263794
+ },
+ {
+ "epoch": 56,
+ "train_loss": 4.899950318450927,
+ "train_acc": 0.009,
+ "test_loss": 4.8788808166503905,
+ "test_acc": 0.01,
+ "lyapunov": 1.608769400345395,
+ "grad_norm": 0.24016992273295382,
+ "grad_max_sv": 0.07058875868096948,
+ "grad_min_sv": 0.0,
+ "grad_condition": 70588758680.96948,
+ "lr": 0.0006937577932260512,
+ "time_sec": 177.81637740135193
+ },
+ {
+ "epoch": 57,
+ "train_loss": 4.904979566650391,
+ "train_acc": 0.01016,
+ "test_loss": 4.727262957763672,
+ "test_acc": 0.01,
+ "lyapunov": 1.6228536108265752,
+ "grad_norm": 0.25668226851580556,
+ "grad_max_sv": 0.08947733379900455,
+ "grad_min_sv": 3.709630814829091e-18,
+ "grad_condition": 89476902167.92735,
+ "lr": 0.0006840622763423388,
+ "time_sec": 177.7847032546997
+ },
+ {
+ "epoch": 58,
+ "train_loss": 4.91234857635498,
+ "train_acc": 0.00984,
+ "test_loss": 4.992978315734863,
+ "test_acc": 0.01,
+ "lyapunov": 1.6392204319424641,
+ "grad_norm": 0.2870713508381296,
+ "grad_max_sv": 0.08510738047771156,
+ "grad_min_sv": 5.680980030609821e-34,
+ "grad_condition": 85107380477.71156,
+ "lr": 0.0006742860236609073,
+ "time_sec": 177.93095755577087
+ },
+ {
+ "epoch": 59,
+ "train_loss": 4.895672921447754,
+ "train_acc": 0.00956,
+ "test_loss": 4.850344149017334,
+ "test_acc": 0.01,
+ "lyapunov": 1.6016130505315482,
+ "grad_norm": 0.21955395456353394,
+ "grad_max_sv": 0.04376054578460753,
+ "grad_min_sv": 0.0,
+ "grad_condition": 43760545784.60753,
+ "lr": 0.0006644333233692913,
+ "time_sec": 178.03867888450623
+ },
+ {
+ "epoch": 60,
+ "train_loss": 4.904327979278564,
+ "train_acc": 0.01052,
+ "test_loss": 5.107528366088867,
+ "test_acc": 0.01,
+ "lyapunov": 1.6214414124598588,
+ "grad_norm": 0.4134573581512024,
+ "grad_max_sv": 0.05148340538144112,
+ "grad_min_sv": 0.0,
+ "grad_condition": 51483405381.44112,
+ "lr": 0.0006545084971874734,
+ "time_sec": 177.95739769935608
+ },
+ {
+ "epoch": 61,
+ "train_loss": 4.898002865753174,
+ "train_acc": 0.0092,
+ "test_loss": 5.260837869262695,
+ "test_acc": 0.01,
+ "lyapunov": 1.6072155035975035,
+ "grad_norm": 0.21245422531513092,
+ "grad_max_sv": 0.06225627232342958,
+ "grad_min_sv": 0.0,
+ "grad_condition": 62256272323.42959,
+ "lr": 0.0006445158984722354,
+ "time_sec": 177.8253002166748
+ },
+ {
+ "epoch": 62,
+ "train_loss": 4.895106823730469,
+ "train_acc": 0.00882,
+ "test_loss": 4.800835796356202,
+ "test_acc": 0.01,
+ "lyapunov": 1.6004807888089543,
+ "grad_norm": 0.2174674542614135,
+ "grad_max_sv": 0.05514842057600618,
+ "grad_min_sv": 0.0,
+ "grad_condition": 55148420576.00618,
+ "lr": 0.0006344599103076324,
+ "time_sec": 177.72123980522156
+ },
+ {
+ "epoch": 63,
+ "train_loss": 4.899956417541504,
+ "train_acc": 0.0105,
+ "test_loss": 4.751542483520508,
+ "test_acc": 0.01,
+ "lyapunov": 1.6128623427637399,
+ "grad_norm": 0.40884851608059564,
+ "grad_max_sv": 0.05529614672996104,
+ "grad_min_sv": 0.0,
+ "grad_condition": 55296146729.96104,
+ "lr": 0.0006243449435824269,
+ "time_sec": 177.73331904411316
+ },
+ {
+ "epoch": 64,
+ "train_loss": 4.899741290130615,
+ "train_acc": 0.01012,
+ "test_loss": 4.856732801818848,
+ "test_acc": 0.01,
+ "lyapunov": 1.610243486931257,
+ "grad_norm": 0.2140046037475775,
+ "grad_max_sv": 0.04319468280300498,
+ "grad_min_sv": 1.2200012063541023e-32,
+ "grad_condition": 43194682803.00498,
+ "lr": 0.0006141754350553275,
+ "time_sec": 177.72633337974548
+ },
+ {
+ "epoch": 65,
+ "train_loss": 4.901744207763672,
+ "train_acc": 0.00894,
+ "test_loss": 5.05665267791748,
+ "test_acc": 0.01,
+ "lyapunov": 1.612555693482499,
+ "grad_norm": 0.41191406243662826,
+ "grad_max_sv": 0.06249867400620133,
+ "grad_min_sv": 9.569992363469874e-20,
+ "grad_condition": 62498664540.05955,
+ "lr": 0.0006039558454088793,
+ "time_sec": 177.71029257774353
+ },
+ {
+ "epoch": 66,
+ "train_loss": 4.905766971282959,
+ "train_acc": 0.00954,
+ "test_loss": 5.186077005767822,
+ "test_acc": 0.01,
+ "lyapunov": 1.6214341486201567,
+ "grad_norm": 0.4859633789458757,
+ "grad_max_sv": 0.0410848444327712,
+ "grad_min_sv": 0.0,
+ "grad_condition": 41084844432.7712,
+ "lr": 0.000593690657292862,
+ "time_sec": 177.8285129070282
+ },
+ {
+ "epoch": 67,
+ "train_loss": 4.905345126495361,
+ "train_acc": 0.00986,
+ "test_loss": 4.869504832458496,
+ "test_acc": 0.01,
+ "lyapunov": 1.6231126108437852,
+ "grad_norm": 0.39055695869151713,
+ "grad_max_sv": 0.04164083697833121,
+ "grad_min_sv": 1.4012984643248171e-46,
+ "grad_condition": 41640836978.3312,
+ "lr": 0.0005833843733580507,
+ "time_sec": 177.75302600860596
+ },
+ {
+ "epoch": 68,
+ "train_loss": 4.897688937835693,
+ "train_acc": 0.00942,
+ "test_loss": 4.753113725280762,
+ "test_acc": 0.01,
+ "lyapunov": 1.6065946210680715,
+ "grad_norm": 0.20313081565215924,
+ "grad_max_sv": 0.023377659870311616,
+ "grad_min_sv": 0.0,
+ "grad_condition": 23377659870.311615,
+ "lr": 0.0005730415142812054,
+ "time_sec": 177.63269519805908
+ },
+ {
+ "epoch": 69,
+ "train_loss": 4.898588792419433,
+ "train_acc": 0.01028,
+ "test_loss": 4.782024855804443,
+ "test_acc": 0.01,
+ "lyapunov": 1.6088185420121683,
+ "grad_norm": 0.17496031637798137,
+ "grad_max_sv": 0.026315743662416936,
+ "grad_min_sv": 0.0,
+ "grad_condition": 26315743662.416935,
+ "lr": 0.0005626666167821517,
+ "time_sec": 177.63309144973755
+ },
+ {
+ "epoch": 70,
+ "train_loss": 4.8972829446411135,
+ "train_acc": 0.00906,
+ "test_loss": 5.072041613769532,
+ "test_acc": 0.01,
+ "lyapunov": 1.606105865419978,
+ "grad_norm": 4.752321231571355,
+ "grad_max_sv": 0.01162667127500754,
+ "grad_min_sv": 0.0,
+ "grad_condition": 11626671275.007538,
+ "lr": 0.0005522642316338265,
+ "time_sec": 177.63151264190674
+ },
+ {
+ "epoch": 71,
+ "train_loss": 4.903229199066162,
+ "train_acc": 0.00974,
+ "test_loss": 4.996621307373047,
+ "test_acc": 0.01,
+ "lyapunov": 1.618955539315558,
+ "grad_norm": 8.808121966401492,
+ "grad_max_sv": 0.009761298389639706,
+ "grad_min_sv": 0.0,
+ "grad_condition": 9761298389.639706,
+ "lr": 0.0005418389216661573,
+ "time_sec": 177.6599452495575
+ },
+ {
+ "epoch": 72,
+ "train_loss": 4.906216805419922,
+ "train_acc": 0.00934,
+ "test_loss": 4.894567427062988,
+ "test_acc": 0.01,
+ "lyapunov": 1.628432136362471,
+ "grad_norm": 8.489795940827486,
+ "grad_max_sv": 0.016040445899125188,
+ "grad_min_sv": 0.0,
+ "grad_condition": 16040445899.125189,
+ "lr": 0.0005313952597646563,
+ "time_sec": 177.6416893005371
+ },
+ {
+ "epoch": 73,
+ "train_loss": 4.899343757019043,
+ "train_acc": 0.00984,
+ "test_loss": 4.877998015594482,
+ "test_acc": 0.01,
+ "lyapunov": 1.6116645827012903,
+ "grad_norm": 8.78253510980995,
+ "grad_max_sv": 0.011263658234383911,
+ "grad_min_sv": 0.0,
+ "grad_condition": 11263658234.383911,
+ "lr": 0.0005209378268645994,
+ "time_sec": 177.685124874115
+ },
+ {
+ "epoch": 74,
+ "train_loss": 4.909308713531495,
+ "train_acc": 0.0098,
+ "test_loss": 4.906534819030762,
+ "test_acc": 0.01,
+ "lyapunov": 1.6356849475284976,
+ "grad_norm": 8.739719950493322,
+ "grad_max_sv": 0.018200278421863912,
+ "grad_min_sv": 0.0,
+ "grad_condition": 18200278421.863914,
+ "lr": 0.0005104712099416781,
+ "time_sec": 177.67348718643188
+ },
+ {
+ "epoch": 75,
+ "train_loss": 4.896382185516358,
+ "train_acc": 0.00988,
+ "test_loss": 4.891489701843262,
+ "test_acc": 0.01,
+ "lyapunov": 1.6029227630561576,
+ "grad_norm": 8.719549027099202,
+ "grad_max_sv": 0.022427358670393006,
+ "grad_min_sv": 0.0,
+ "grad_condition": 22427358670.393005,
+ "lr": 0.0004999999999999996,
+ "time_sec": 177.7534384727478
+ },
+ {
+ "epoch": 76,
+ "train_loss": 4.899071414489746,
+ "train_acc": 0.00968,
+ "test_loss": 4.9015754707336425,
+ "test_acc": 0.01,
+ "lyapunov": 1.6096787852094607,
+ "grad_norm": 8.515820970435684,
+ "grad_max_sv": 0.009400015359278768,
+ "grad_min_sv": 0.0,
+ "grad_condition": 9400015359.278769,
+ "lr": 0.0004895287900583212,
+ "time_sec": 177.62656164169312
+ },
+ {
+ "epoch": 77,
+ "train_loss": 4.898522388305664,
+ "train_acc": 0.01038,
+ "test_loss": 5.091467515563965,
+ "test_acc": 0.01,
+ "lyapunov": 1.6093772655862677,
+ "grad_norm": 8.114992022856779,
+ "grad_max_sv": 0.018641287484206258,
+ "grad_min_sv": 0.0,
+ "grad_condition": 18641287484.20626,
+ "lr": 0.0004790621731353997,
+ "time_sec": 177.68832445144653
+ },
+ {
+ "epoch": 78,
+ "train_loss": 4.898501075897217,
+ "train_acc": 0.00976,
+ "test_loss": 5.021521907043457,
+ "test_acc": 0.01,
+ "lyapunov": 1.609497647761079,
+ "grad_norm": 8.539277939413502,
+ "grad_max_sv": 0.007715003727935254,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7715003727.935254,
+ "lr": 0.000468604740235343,
+ "time_sec": 177.67188620567322
+ },
+ {
+ "epoch": 79,
+ "train_loss": 4.89914041229248,
+ "train_acc": 0.00952,
+ "test_loss": 5.091536389160156,
+ "test_acc": 0.01,
+ "lyapunov": 1.6118732392025725,
+ "grad_norm": 8.137454688889077,
+ "grad_max_sv": 0.014247056667227299,
+ "grad_min_sv": 0.0,
+ "grad_condition": 14247056667.227299,
+ "lr": 0.00045816107833384175,
+ "time_sec": 177.66169714927673
+ },
+ {
+ "epoch": 80,
+ "train_loss": 4.896471509552002,
+ "train_acc": 0.00904,
+ "test_loss": 5.056171662139892,
+ "test_acc": 0.01,
+ "lyapunov": 1.6047609431664351,
+ "grad_norm": 8.176635016602376,
+ "grad_max_sv": 0.01795925593469292,
+ "grad_min_sv": 0.0,
+ "grad_condition": 17959255934.69292,
+ "lr": 0.0004477357683661729,
+ "time_sec": 177.69231700897217
+ },
+ {
+ "epoch": 81,
+ "train_loss": 4.902812586059571,
+ "train_acc": 0.00932,
+ "test_loss": 4.95149069366455,
+ "test_acc": 0.01,
+ "lyapunov": 1.6196627622979987,
+ "grad_norm": 7.929696982355576,
+ "grad_max_sv": 0.0070913337520323695,
+ "grad_min_sv": 0.0,
+ "grad_condition": 7091333752.03237,
+ "lr": 0.00043733338321784746,
+ "time_sec": 177.62628316879272
+ },
+ {
+ "epoch": 82,
+ "train_loss": 4.896946704254151,
+ "train_acc": 0.00924,
+ "test_loss": 5.036287983703613,
+ "test_acc": 0.01,
+ "lyapunov": 1.606176169632036,
+ "grad_norm": 7.888136562780922,
+ "grad_max_sv": 0.0152505733538419,
+ "grad_min_sv": 0.0,
+ "grad_condition": 15250573353.8419,
+ "lr": 0.0004269584857187939,
+ "time_sec": 177.6838881969452
+ },
+ {
+ "epoch": 83,
+ "train_loss": 4.903535429534912,
+ "train_acc": 0.00942,
+ "test_loss": 4.913862983703614,
+ "test_acc": 0.01,
+ "lyapunov": 1.6229887536114744,
+ "grad_norm": 5.821543829416724,
+ "grad_max_sv": 0.0042757402297866065,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4275740229.786606,
+ "lr": 0.0004166156266419484,
+ "time_sec": 177.63864398002625
+ },
+ {
+ "epoch": 84,
+ "train_loss": 4.900573203125,
+ "train_acc": 0.00922,
+ "test_loss": 4.881514458465576,
+ "test_acc": 0.01,
+ "lyapunov": 1.6157215519634354,
+ "grad_norm": 2.3035299291537767,
+ "grad_max_sv": 0.018527308432385325,
+ "grad_min_sv": 0.0,
+ "grad_condition": 18527308432.385326,
+ "lr": 0.0004063093427071373,
+ "time_sec": 177.61864590644836
+ },
+ {
+ "epoch": 85,
+ "train_loss": 4.902895740814209,
+ "train_acc": 0.00928,
+ "test_loss": 4.858868844604492,
+ "test_acc": 0.01,
+ "lyapunov": 1.6206753049665095,
+ "grad_norm": 0.12191327008361393,
+ "grad_max_sv": 0.011266671447083354,
+ "grad_min_sv": 0.0,
+ "grad_condition": 11266671447.083355,
+ "lr": 0.0003960441545911199,
+ "time_sec": 177.60221338272095
+ },
+ {
+ "epoch": 86,
+ "train_loss": 4.899129556274414,
+ "train_acc": 0.01002,
+ "test_loss": 4.940996123504639,
+ "test_acc": 0.01,
+ "lyapunov": 1.6121560679677198,
+ "grad_norm": 1.7402391187392277,
+ "grad_max_sv": 0.002565371198579669,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2565371198.579669,
+ "lr": 0.0003858245649446718,
+ "time_sec": 177.66662287712097
+ },
+ {
+ "epoch": 87,
+ "train_loss": 4.898443488616944,
+ "train_acc": 0.0105,
+ "test_loss": 4.900648780059814,
+ "test_acc": 0.01,
+ "lyapunov": 1.6101132055072833,
+ "grad_norm": 3.9387378230742067,
+ "grad_max_sv": 0.014504804974421859,
+ "grad_min_sv": 0.0,
+ "grad_condition": 14504804974.421856,
+ "lr": 0.00037565505641757235,
+ "time_sec": 177.92060565948486
+ },
+ {
+ "epoch": 88,
+ "train_loss": 4.903396017608642,
+ "train_acc": 0.01006,
+ "test_loss": 4.946898637390137,
+ "test_acc": 0.01,
+ "lyapunov": 1.6227889701228617,
+ "grad_norm": 3.523322793117835,
+ "grad_max_sv": 0.010716242669150233,
+ "grad_min_sv": 0.0,
+ "grad_condition": 10716242669.150234,
+ "lr": 0.00036554008969236695,
+ "time_sec": 177.71660375595093
+ },
+ {
+ "epoch": 89,
+ "train_loss": 4.898063175964356,
+ "train_acc": 0.00952,
+ "test_loss": 4.944628465270996,
+ "test_acc": 0.01,
+ "lyapunov": 1.6093785500587405,
+ "grad_norm": 3.442066441987714,
+ "grad_max_sv": 0.001931725861504674,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1931725861.5046737,
+ "lr": 0.0003554841015277638,
+ "time_sec": 177.85225415229797
+ },
+ {
+ "epoch": 90,
+ "train_loss": 4.897619627685547,
+ "train_acc": 0.00938,
+ "test_loss": 5.051801362609863,
+ "test_acc": 0.01,
+ "lyapunov": 1.608569312583455,
+ "grad_norm": 2.438214274664479,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000345491502812526,
+ "time_sec": 177.65104031562805
+ },
+ {
+ "epoch": 91,
+ "train_loss": 4.901775200042724,
+ "train_acc": 0.00952,
+ "test_loss": 4.932051847076416,
+ "test_acc": 0.01,
+ "lyapunov": 1.6196813135195876,
+ "grad_norm": 1.9676599328431443,
+ "grad_max_sv": 0.0042047965805977585,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4204796580.5977583,
+ "lr": 0.0003355666766307081,
+ "time_sec": 177.5405979156494
+ },
+ {
+ "epoch": 92,
+ "train_loss": 4.8983032328796385,
+ "train_acc": 0.0092,
+ "test_loss": 4.899715927886963,
+ "test_acc": 0.01,
+ "lyapunov": 1.6106610715846577,
+ "grad_norm": 1.4208199060741078,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00032571397633909225,
+ "time_sec": 177.52678775787354
+ },
+ {
+ "epoch": 93,
+ "train_loss": 4.899546262664795,
+ "train_acc": 0.00828,
+ "test_loss": 4.734424713134765,
+ "test_acc": 0.01,
+ "lyapunov": 1.6129982721470202,
+ "grad_norm": 0.7679133474898795,
+ "grad_max_sv": 0.001235782215371728,
+ "grad_min_sv": 0.0,
+ "grad_condition": 1235782215.371728,
+ "lr": 0.00031593772365766094,
+ "time_sec": 177.578599691391
+ },
+ {
+ "epoch": 94,
+ "train_loss": 4.897470514221191,
+ "train_acc": 0.00868,
+ "test_loss": 4.861271743774414,
+ "test_acc": 0.01,
+ "lyapunov": 1.6078075801624971,
+ "grad_norm": 0.5114523908732937,
+ "grad_max_sv": 0.010413796734064817,
+ "grad_min_sv": 0.0,
+ "grad_condition": 10413796734.064817,
+ "lr": 0.0003062422067739483,
+ "time_sec": 177.66828536987305
+ },
+ {
+ "epoch": 95,
+ "train_loss": 4.896396814422608,
+ "train_acc": 0.00902,
+ "test_loss": 4.879605053710938,
+ "test_acc": 0.01,
+ "lyapunov": 1.6050515763290094,
+ "grad_norm": 0.3961292769391823,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00029663167846209965,
+ "time_sec": 177.51401448249817
+ },
+ {
+ "epoch": 96,
+ "train_loss": 4.8946277626037595,
+ "train_acc": 0.00906,
+ "test_loss": 4.8813762161254886,
+ "test_acc": 0.01,
+ "lyapunov": 1.6007561808656854,
+ "grad_norm": 0.3223908585413378,
+ "grad_max_sv": 0.004684461047872901,
+ "grad_min_sv": 0.0,
+ "grad_condition": 4684461047.8729,
+ "lr": 0.00028711035421746345,
+ "time_sec": 177.507954120636
+ },
+ {
+ "epoch": 97,
+ "train_loss": 4.898638327026367,
+ "train_acc": 0.0089,
+ "test_loss": 4.8062256309509275,
+ "test_acc": 0.01,
+ "lyapunov": 1.6108122432933134,
+ "grad_norm": 0.26732308458116777,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00027768241040753615,
+ "time_sec": 177.541433095932
+ },
+ {
+ "epoch": 98,
+ "train_loss": 4.898670770721435,
+ "train_acc": 0.00952,
+ "test_loss": 4.863480428314209,
+ "test_acc": 0.01,
+ "lyapunov": 1.6111446103781386,
+ "grad_norm": 0.2214969265799768,
+ "grad_max_sv": 0.009903033776208759,
+ "grad_min_sv": 0.0,
+ "grad_condition": 9903033776.20876,
+ "lr": 0.00026835198244006903,
+ "time_sec": 177.60904955863953
+ },
+ {
+ "epoch": 99,
+ "train_loss": 4.897254006500244,
+ "train_acc": 0.00834,
+ "test_loss": 4.817773220062256,
+ "test_acc": 0.01,
+ "lyapunov": 1.607484469023507,
+ "grad_norm": 0.19294402621230472,
+ "grad_max_sv": 0.0008362619206309319,
+ "grad_min_sv": 0.0,
+ "grad_condition": 836261920.6309319,
+ "lr": 0.0002591231629491421,
+ "time_sec": 177.57478499412537
+ },
+ {
+ "epoch": 100,
+ "train_loss": 4.901547922363282,
+ "train_acc": 0.0089,
+ "test_loss": 4.874810285949707,
+ "test_acc": 0.01,
+ "lyapunov": 1.618047608134082,
+ "grad_norm": 0.48303744135317395,
+ "grad_max_sv": 0.0005853609647601843,
+ "grad_min_sv": 0.0,
+ "grad_condition": 585360964.7601843,
+ "lr": 0.0002499999999999997,
+ "time_sec": 177.57369899749756
+ },
+ {
+ "epoch": 101,
+ "train_loss": 4.900225694732666,
+ "train_acc": 0.0088,
+ "test_loss": 4.874546339416504,
+ "test_acc": 0.01,
+ "lyapunov": 1.6143963080842783,
+ "grad_norm": 0.10450627590873329,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00024098649531343477,
+ "time_sec": 177.6406271457672
+ },
+ {
+ "epoch": 102,
+ "train_loss": 4.897779517669678,
+ "train_acc": 0.00842,
+ "test_loss": 4.97530121307373,
+ "test_acc": 0.01,
+ "lyapunov": 1.6092621133760419,
+ "grad_norm": 0.11958307306926726,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002320866025105016,
+ "time_sec": 177.58187460899353
+ },
+ {
+ "epoch": 103,
+ "train_loss": 4.89978483215332,
+ "train_acc": 0.00836,
+ "test_loss": 4.904860715484619,
+ "test_acc": 0.01,
+ "lyapunov": 1.613416659862489,
+ "grad_norm": 0.11840174924430107,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002233042253783278,
+ "time_sec": 177.59923720359802
+ },
+ {
+ "epoch": 104,
+ "train_loss": 4.8979805488586425,
+ "train_acc": 0.0086,
+ "test_loss": 5.0884550689697265,
+ "test_acc": 0.01,
+ "lyapunov": 1.6097813783704167,
+ "grad_norm": 0.119936422604111,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000214643216157784,
+ "time_sec": 177.6080665588379
+ },
+ {
+ "epoch": 105,
+ "train_loss": 4.898741788330078,
+ "train_acc": 0.00866,
+ "test_loss": 4.9618072402954105,
+ "test_acc": 0.01,
+ "lyapunov": 1.6113920699604942,
+ "grad_norm": 0.152172750895754,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00020610737385376332,
+ "time_sec": 177.6668050289154
+ },
+ {
+ "epoch": 106,
+ "train_loss": 4.899783585510254,
+ "train_acc": 0.00854,
+ "test_loss": 4.853069065856934,
+ "test_acc": 0.01,
+ "lyapunov": 1.6142695355598273,
+ "grad_norm": 0.12651234741385065,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00019770044256881242,
+ "time_sec": 177.65955018997192
+ },
+ {
+ "epoch": 107,
+ "train_loss": 4.89967593460083,
+ "train_acc": 0.00888,
+ "test_loss": 4.81962833480835,
+ "test_acc": 0.01,
+ "lyapunov": 1.6138155131083924,
+ "grad_norm": 0.12897917774661904,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001894261098608447,
+ "time_sec": 178.0168354511261
+ },
+ {
+ "epoch": 108,
+ "train_loss": 4.898814065093994,
+ "train_acc": 0.00946,
+ "test_loss": 4.862646290588379,
+ "test_acc": 0.01,
+ "lyapunov": 1.6114065183702941,
+ "grad_norm": 0.12441425701414183,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000181288005125655,
+ "time_sec": 177.91981077194214
+ },
+ {
+ "epoch": 109,
+ "train_loss": 4.895898725891113,
+ "train_acc": 0.00866,
+ "test_loss": 4.898298935699463,
+ "test_acc": 0.01,
+ "lyapunov": 1.6044228336085444,
+ "grad_norm": 0.12735396729359733,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001732896980049473,
+ "time_sec": 177.5811812877655
+ },
+ {
+ "epoch": 110,
+ "train_loss": 4.897967128295899,
+ "train_acc": 0.0088,
+ "test_loss": 4.881989184570313,
+ "test_acc": 0.01,
+ "lyapunov": 1.610074214008458,
+ "grad_norm": 0.12498581799753569,
+ "grad_max_sv": 0.0005899489391595125,
+ "grad_min_sv": 0.0,
+ "grad_condition": 589948939.1595125,
+ "lr": 0.00016543469682057076,
+ "time_sec": 177.58177971839905
+ },
+ {
+ "epoch": 111,
+ "train_loss": 4.894624674987793,
+ "train_acc": 0.00892,
+ "test_loss": 4.883820623779297,
+ "test_acc": 0.01,
+ "lyapunov": 1.6010574471310277,
+ "grad_norm": 0.12140577807922988,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00015772644703565552,
+ "time_sec": 177.56197333335876
+ },
+ {
+ "epoch": 112,
+ "train_loss": 4.895216448974609,
+ "train_acc": 0.00852,
+ "test_loss": 4.954343832397461,
+ "test_acc": 0.01,
+ "lyapunov": 1.602743710093486,
+ "grad_norm": 0.1186981012224881,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00015016832974331713,
+ "time_sec": 177.6377820968628
+ },
+ {
+ "epoch": 113,
+ "train_loss": 4.89654906173706,
+ "train_acc": 0.00892,
+ "test_loss": 4.86073722076416,
+ "test_acc": 0.01,
+ "lyapunov": 1.6060491681403821,
+ "grad_norm": 0.13508163826012107,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00014276366018359834,
+ "time_sec": 177.58386063575745
+ },
+ {
+ "epoch": 114,
+ "train_loss": 4.8961822531127925,
+ "train_acc": 0.00894,
+ "test_loss": 4.85973716430664,
+ "test_acc": 0.01,
+ "lyapunov": 1.605295106578056,
+ "grad_norm": 0.1269661896874639,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00013551568628929425,
+ "time_sec": 177.66930723190308
+ },
+ {
+ "epoch": 115,
+ "train_loss": 4.899547542419434,
+ "train_acc": 0.00846,
+ "test_loss": 4.86928017654419,
+ "test_acc": 0.01,
+ "lyapunov": 1.611534357680689,
+ "grad_norm": 0.12942007445088913,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00012842758726130276,
+ "time_sec": 177.5964391231537
+ },
+ {
+ "epoch": 116,
+ "train_loss": 4.8983458253479,
+ "train_acc": 0.00896,
+ "test_loss": 4.843299571990967,
+ "test_acc": 0.01,
+ "lyapunov": 1.6105001826420464,
+ "grad_norm": 0.13930842303851845,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001215024721741218,
+ "time_sec": 177.61230850219727
+ },
+ {
+ "epoch": 117,
+ "train_loss": 4.896871134490967,
+ "train_acc": 0.00876,
+ "test_loss": 4.854955553436279,
+ "test_acc": 0.01,
+ "lyapunov": 1.6068359040238362,
+ "grad_norm": 0.14085548109201876,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00011474337861210538,
+ "time_sec": 177.60942769050598
+ },
+ {
+ "epoch": 118,
+ "train_loss": 4.895171242523193,
+ "train_acc": 0.00872,
+ "test_loss": 4.848788255310058,
+ "test_acc": 0.01,
+ "lyapunov": 1.6026884250323792,
+ "grad_norm": 0.14154856326059925,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010815327133708009,
+ "time_sec": 177.55690503120422
+ },
+ {
+ "epoch": 119,
+ "train_loss": 4.896756847839355,
+ "train_acc": 0.00832,
+ "test_loss": 4.8384888511657715,
+ "test_acc": 0.01,
+ "lyapunov": 1.6064672335944212,
+ "grad_norm": 0.13186296404041234,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010173504098790182,
+ "time_sec": 177.58031153678894
+ },
+ {
+ "epoch": 120,
+ "train_loss": 4.898055244140625,
+ "train_acc": 0.00912,
+ "test_loss": 4.863050064086914,
+ "test_acc": 0.01,
+ "lyapunov": 1.608289188131347,
+ "grad_norm": 0.13789827868104076,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.549150281252629e-05,
+ "time_sec": 177.57413148880005
+ },
+ {
+ "epoch": 121,
+ "train_loss": 4.895827691040039,
+ "train_acc": 0.00928,
+ "test_loss": 4.863882962799072,
+ "test_acc": 0.01,
+ "lyapunov": 1.6041748965792644,
+ "grad_norm": 0.1447753316018149,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.942539543314794e-05,
+ "time_sec": 177.61848878860474
+ },
+ {
+ "epoch": 122,
+ "train_loss": 4.894580706329346,
+ "train_acc": 0.0093,
+ "test_loss": 4.832992823791504,
+ "test_acc": 0.01,
+ "lyapunov": 1.6009809287917582,
+ "grad_norm": 0.13403320495860124,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.353937964495024e-05,
+ "time_sec": 177.63413906097412
+ },
+ {
+ "epoch": 123,
+ "train_loss": 4.896512101593018,
+ "train_acc": 0.00856,
+ "test_loss": 4.88107511138916,
+ "test_acc": 0.01,
+ "lyapunov": 1.6053285842661358,
+ "grad_norm": 0.1349040405870927,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.783603724899243e-05,
+ "time_sec": 177.86059856414795
+ },
+ {
+ "epoch": 124,
+ "train_loss": 4.902536525726318,
+ "train_acc": 0.00916,
+ "test_loss": 4.825576887512207,
+ "test_acc": 0.01,
+ "lyapunov": 1.618482659235025,
+ "grad_norm": 0.15260564991727005,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.231786991974666e-05,
+ "time_sec": 177.59844970703125
+ },
+ {
+ "epoch": 125,
+ "train_loss": 4.8969797262573245,
+ "train_acc": 0.00904,
+ "test_loss": 4.842672832489014,
+ "test_acc": 0.01,
+ "lyapunov": 1.607402919198546,
+ "grad_norm": 0.14681033483413716,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.698729810778072e-05,
+ "time_sec": 177.69832468032837
+ },
+ {
+ "epoch": 126,
+ "train_loss": 4.896537158660888,
+ "train_acc": 0.00922,
+ "test_loss": 4.80990348739624,
+ "test_acc": 0.01,
+ "lyapunov": 1.6063618071548773,
+ "grad_norm": 0.13507935123670756,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.184665997806817e-05,
+ "time_sec": 177.70786309242249
+ },
+ {
+ "epoch": 127,
+ "train_loss": 4.894742733154297,
+ "train_acc": 0.00798,
+ "test_loss": 4.8113509506225585,
+ "test_acc": 0.01,
+ "lyapunov": 1.6014454364776611,
+ "grad_norm": 0.1351277333350339,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.6898210384392595e-05,
+ "time_sec": 177.86230516433716
+ },
+ {
+ "epoch": 128,
+ "train_loss": 4.897651534729004,
+ "train_acc": 0.0094,
+ "test_loss": 4.849126397705078,
+ "test_acc": 0.01,
+ "lyapunov": 1.6088779442145695,
+ "grad_norm": 0.17636542409245334,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.214411988029363e-05,
+ "time_sec": 177.6271688938141
+ },
+ {
+ "epoch": 129,
+ "train_loss": 4.89603802230835,
+ "train_acc": 0.00886,
+ "test_loss": 4.837294686126709,
+ "test_acc": 0.01,
+ "lyapunov": 1.605165058694532,
+ "grad_norm": 0.1801255445906475,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.7586473766990294e-05,
+ "time_sec": 177.71211314201355
+ },
+ {
+ "epoch": 130,
+ "train_loss": 4.895125115509034,
+ "train_acc": 0.00866,
+ "test_loss": 4.808775178527832,
+ "test_acc": 0.01,
+ "lyapunov": 1.6025557109462025,
+ "grad_norm": 0.14181669608504024,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.32272711786996e-05,
+ "time_sec": 177.64269709587097
+ },
+ {
+ "epoch": 131,
+ "train_loss": 4.902938699340821,
+ "train_acc": 0.008,
+ "test_loss": 4.826445443725586,
+ "test_acc": 0.01,
+ "lyapunov": 1.6225644127487222,
+ "grad_norm": 0.15063649346643543,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.906842420574966e-05,
+ "time_sec": 177.69655632972717
+ },
+ {
+ "epoch": 132,
+ "train_loss": 4.895815797271728,
+ "train_acc": 0.00944,
+ "test_loss": 4.808843030548096,
+ "test_acc": 0.01,
+ "lyapunov": 1.6045795020544926,
+ "grad_norm": 0.13954946888706687,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.5111757055874305e-05,
+ "time_sec": 177.6466555595398
+ },
+ {
+ "epoch": 133,
+ "train_loss": 4.896005963287354,
+ "train_acc": 0.0088,
+ "test_loss": 4.82414176940918,
+ "test_acc": 0.01,
+ "lyapunov": 1.6050951605867547,
+ "grad_norm": 0.14029597054344972,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.1359005254054254e-05,
+ "time_sec": 177.6260485649109
+ },
+ {
+ "epoch": 134,
+ "train_loss": 4.898020515136719,
+ "train_acc": 0.00954,
+ "test_loss": 4.837333515167236,
+ "test_acc": 0.01,
+ "lyapunov": 1.609246312199956,
+ "grad_norm": 0.14357714581869627,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7811814881259484e-05,
+ "time_sec": 177.584956407547
+ },
+ {
+ "epoch": 135,
+ "train_loss": 4.895735731048584,
+ "train_acc": 0.0092,
+ "test_loss": 4.8159059692382815,
+ "test_acc": 0.01,
+ "lyapunov": 1.6042115407831528,
+ "grad_norm": 0.14076247756947305,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.4471741852423218e-05,
+ "time_sec": 177.55930995941162
+ },
+ {
+ "epoch": 136,
+ "train_loss": 4.899449185333252,
+ "train_acc": 0.01,
+ "test_loss": 4.8122740142822265,
+ "test_acc": 0.01,
+ "lyapunov": 1.61043234645863,
+ "grad_norm": 0.19068368741616817,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.1340251233966362e-05,
+ "time_sec": 177.60587310791016
+ },
+ {
+ "epoch": 137,
+ "train_loss": 4.895413861694336,
+ "train_acc": 0.0092,
+ "test_loss": 4.812394242858887,
+ "test_acc": 0.01,
+ "lyapunov": 1.6033874640379415,
+ "grad_norm": 0.5123554678520819,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.8418716601170932e-05,
+ "time_sec": 177.5866892337799
+ },
+ {
+ "epoch": 138,
+ "train_loss": 4.897919689941406,
+ "train_acc": 0.01,
+ "test_loss": 4.824399436187744,
+ "test_acc": 0.01,
+ "lyapunov": 1.60939773604693,
+ "grad_norm": 0.42554152230186504,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.570841943568445e-05,
+ "time_sec": 177.5575873851776
+ },
+ {
+ "epoch": 139,
+ "train_loss": 4.896585512237549,
+ "train_acc": 0.0096,
+ "test_loss": 4.813831822967529,
+ "test_acc": 0.01,
+ "lyapunov": 1.6059378885552096,
+ "grad_norm": 0.40395815580062067,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.3210548563419845e-05,
+ "time_sec": 177.5689401626587
+ },
+ {
+ "epoch": 140,
+ "train_loss": 4.896397541656494,
+ "train_acc": 0.01,
+ "test_loss": 4.813830749511719,
+ "test_acc": 0.01,
+ "lyapunov": 1.6058773750539326,
+ "grad_norm": 0.3517546520670756,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.0926199633097203e-05,
+ "time_sec": 177.56592845916748
+ },
+ {
+ "epoch": 141,
+ "train_loss": 4.897689798278809,
+ "train_acc": 0.00908,
+ "test_loss": 4.809725570678711,
+ "test_acc": 0.01,
+ "lyapunov": 1.6086021369070653,
+ "grad_norm": 0.34730980637645387,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.856374635655688e-06,
+ "time_sec": 177.57834815979004
+ },
+ {
+ "epoch": 142,
+ "train_loss": 4.897065491943359,
+ "train_acc": 0.00946,
+ "test_loss": 4.804353742218018,
+ "test_acc": 0.01,
+ "lyapunov": 1.6070060754371116,
+ "grad_norm": 0.34991199227840564,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.001981464747503e-06,
+ "time_sec": 177.5697898864746
+ },
+ {
+ "epoch": 143,
+ "train_loss": 4.895145080566406,
+ "train_acc": 0.00966,
+ "test_loss": 4.821014101409912,
+ "test_acc": 0.01,
+ "lyapunov": 1.6025798217110012,
+ "grad_norm": 0.3468579023438424,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.3638335185058295e-06,
+ "time_sec": 177.62174582481384
+ },
+ {
+ "epoch": 144,
+ "train_loss": 4.895165930786133,
+ "train_acc": 0.00984,
+ "test_loss": 4.800519823455811,
+ "test_acc": 0.01,
+ "lyapunov": 1.602697217860795,
+ "grad_norm": 0.34813989460737055,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.942649342761114e-06,
+ "time_sec": 177.58397316932678
+ },
+ {
+ "epoch": 145,
+ "train_loss": 4.896360063476562,
+ "train_acc": 0.01,
+ "test_loss": 4.800519633483887,
+ "test_acc": 0.01,
+ "lyapunov": 1.605867438913916,
+ "grad_norm": 0.3366340618642584,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.7390523158633524e-06,
+ "time_sec": 177.5893211364746
+ },
+ {
+ "epoch": 146,
+ "train_loss": 4.894688441314697,
+ "train_acc": 0.01,
+ "test_loss": 4.800520404052734,
+ "test_acc": 0.01,
+ "lyapunov": 1.6013682687374027,
+ "grad_norm": 0.3310266277326936,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.7535703752478133e-06,
+ "time_sec": 177.56866335868835
+ },
+ {
+ "epoch": 147,
+ "train_loss": 4.894518559265137,
+ "train_acc": 0.01,
+ "test_loss": 4.8005200927734375,
+ "test_acc": 0.01,
+ "lyapunov": 1.600981123307172,
+ "grad_norm": 0.3451840089468246,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.866357858642196e-07,
+ "time_sec": 177.56436419487
+ },
+ {
+ "epoch": 148,
+ "train_loss": 4.895737046356201,
+ "train_acc": 0.01,
+ "test_loss": 4.800520344543457,
+ "test_acc": 0.01,
+ "lyapunov": 1.6043054953865383,
+ "grad_norm": 0.3208172451267627,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.38584950570808e-07,
+ "time_sec": 177.5520420074463
+ },
+ {
+ "epoch": 149,
+ "train_loss": 4.894163135528564,
+ "train_acc": 0.01,
+ "test_loss": 4.800520320892334,
+ "test_acc": 0.01,
+ "lyapunov": 1.5999351096580097,
+ "grad_norm": 0.32420799089770896,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.096582625772501e-07,
+ "time_sec": 177.6083221435547
+ },
+ {
+ "epoch": 150,
+ "train_loss": 4.892976047668457,
+ "train_acc": 0.01,
+ "test_loss": 4.8005203384399415,
+ "test_acc": 0.01,
+ "lyapunov": 1.596442692724945,
+ "grad_norm": 0.32157877988197864,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0,
+ "time_sec": 177.66009068489075
+ }
+ ]
+ }
+} \ No newline at end of file