From cd99d6b874d9d09b3bb87b8485cc787885af71f1 Mon Sep 17 00:00:00 2001 From: YurenHao0426 Date: Tue, 13 Jan 2026 23:49:05 -0600 Subject: init commit --- .../cifar100_20260102-133755/config.json | 23 + .../cifar100_20260102-133755/results.json | 16822 +++++++++++++++++++ 2 files changed, 16845 insertions(+) create mode 100644 runs/depth_scaling_stable_init/cifar100_20260102-133755/config.json create mode 100644 runs/depth_scaling_stable_init/cifar100_20260102-133755/results.json (limited to 'runs/depth_scaling_stable_init/cifar100_20260102-133755') diff --git a/runs/depth_scaling_stable_init/cifar100_20260102-133755/config.json b/runs/depth_scaling_stable_init/cifar100_20260102-133755/config.json new file mode 100644 index 0000000..a220257 --- /dev/null +++ b/runs/depth_scaling_stable_init/cifar100_20260102-133755/config.json @@ -0,0 +1,23 @@ +{ + "dataset": "cifar100", + "depths": [ + 4, + 8, + 12, + 16 + ], + "T": 4, + "epochs": 150, + "batch_size": 128, + "lr": 0.001, + "lambda_reg": 0.1, + "lambda_target": -0.1, + "data_dir": "./data", + "out_dir": "runs/depth_scaling_stable_init", + "device": "cuda", + "seed": 42, + "no_progress": false, + "reg_type": "squared", + "warmup_epochs": 20, + "stable_init": true +} \ No newline at end of file diff --git a/runs/depth_scaling_stable_init/cifar100_20260102-133755/results.json b/runs/depth_scaling_stable_init/cifar100_20260102-133755/results.json new file mode 100644 index 0000000..3de0e89 --- /dev/null +++ b/runs/depth_scaling_stable_init/cifar100_20260102-133755/results.json @@ -0,0 +1,16822 @@ +{ + "vanilla": { + "4": [ + { + "epoch": 1, + "train_loss": 3.8700216691589358, + "train_acc": 0.12266, + "test_loss": 3.471041242599487, + "test_acc": 0.1892, + "lyapunov": null, + "grad_norm": 5.871605597993606, + "grad_max_sv": 4.127117091417313, + "grad_min_sv": 1.0455270382792037e-07, + "grad_condition": 49062288.68792993, + "lr": 0.0009998903417374227, + "time_sec": 16.27198028564453 + }, + { + "epoch": 2, + "train_loss": 3.1769318112182616, + "train_acc": 0.22848, + "test_loss": 3.0822217151641844, + "test_acc": 0.2623, + "lyapunov": null, + "grad_norm": 4.062262644221631, + "grad_max_sv": 2.610152545571327, + "grad_min_sv": 7.51297792088955e-08, + "grad_condition": 5467508398.9579, + "lr": 0.0009995614150494292, + "time_sec": 15.849408626556396 + }, + { + "epoch": 3, + "train_loss": 2.7716760053253173, + "train_acc": 0.30112, + "test_loss": 2.786010754776001, + "test_acc": 0.3025, + "lyapunov": null, + "grad_norm": 3.306849913177874, + "grad_max_sv": 1.982076707482338, + "grad_min_sv": 6.276024400175828e-08, + "grad_condition": 35650611.42411845, + "lr": 0.0009990133642141358, + "time_sec": 15.585639715194702 + }, + { + "epoch": 4, + "train_loss": 2.52623803855896, + "train_acc": 0.34808, + "test_loss": 2.753477826690674, + "test_acc": 0.31, + "lyapunov": null, + "grad_norm": 2.9097492182391815, + "grad_max_sv": 1.6385449588298797, + "grad_min_sv": 5.4328751075694014e-08, + "grad_condition": 39318936.04767501, + "lr": 0.0009982464296247522, + "time_sec": 15.567962408065796 + }, + { + "epoch": 5, + "train_loss": 2.336665892715454, + "train_acc": 0.38814, + "test_loss": 2.762642176055908, + "test_acc": 0.3278, + "lyapunov": null, + "grad_norm": 2.633575942359962, + "grad_max_sv": 1.4780948996543883, + "grad_min_sv": 4.9716202832339465e-08, + "grad_condition": 36374716.14412971, + "lr": 0.0009972609476841367, + "time_sec": 15.589628219604492 + }, + { + "epoch": 6, + "train_loss": 2.1819915383148194, + "train_acc": 0.42402, + "test_loss": 2.879850026321411, + "test_acc": 0.3169, + "lyapunov": null, + "grad_norm": 2.4016337956595826, + "grad_max_sv": 1.2914279341697692, + "grad_min_sv": 4.639223961377947e-08, + "grad_condition": 67967054.09377375, + "lr": 0.000996057350657239, + "time_sec": 15.569096803665161 + }, + { + "epoch": 7, + "train_loss": 2.051711977081299, + "train_acc": 0.45262, + "test_loss": 2.3678430866241453, + "test_acc": 0.3932, + "lyapunov": null, + "grad_norm": 2.226191538130221, + "grad_max_sv": 1.1724753439426423, + "grad_min_sv": 4.296711672013842e-08, + "grad_condition": 36498738.129443035, + "lr": 0.000994636166481494, + "time_sec": 15.596983671188354 + }, + { + "epoch": 8, + "train_loss": 1.940541718597412, + "train_acc": 0.47698, + "test_loss": 2.2571875411987303, + "test_acc": 0.4255, + "lyapunov": null, + "grad_norm": 2.0805351562913987, + "grad_max_sv": 1.1051331430673599, + "grad_min_sv": 4.002405433189971e-08, + "grad_condition": 35597702.92584355, + "lr": 0.0009929980185352525, + "time_sec": 15.578535795211792 + }, + { + "epoch": 9, + "train_loss": 1.8394872580337525, + "train_acc": 0.49896, + "test_loss": 2.447062807273865, + "test_acc": 0.3908, + "lyapunov": null, + "grad_norm": 1.95549418174433, + "grad_max_sv": 0.9836901038885116, + "grad_min_sv": 3.7306198631681385e-08, + "grad_condition": 62081794.94354477, + "lr": 0.0009911436253643444, + "time_sec": 15.615386486053467 + }, + { + "epoch": 10, + "train_loss": 1.7619124493789673, + "train_acc": 0.51634, + "test_loss": 2.1738934711456297, + "test_acc": 0.4315, + "lyapunov": null, + "grad_norm": 1.8481164153982472, + "grad_max_sv": 0.9101693272590637, + "grad_min_sv": 3.497988239065109e-08, + "grad_condition": 46371834.68583612, + "lr": 0.0009890738003669028, + "time_sec": 15.591166496276855 + }, + { + "epoch": 11, + "train_loss": 1.6779080270385742, + "train_acc": 0.5374, + "test_loss": 2.1254464902877808, + "test_acc": 0.4554, + "lyapunov": null, + "grad_norm": 1.761015251152075, + "grad_max_sv": 0.8580568209290504, + "grad_min_sv": 3.36019686630884e-08, + "grad_condition": 43516726.56073545, + "lr": 0.00098678945143658, + "time_sec": 15.584970235824585 + }, + { + "epoch": 12, + "train_loss": 1.6224668700790406, + "train_acc": 0.5503, + "test_loss": 2.1070931062698364, + "test_acc": 0.4572, + "lyapunov": null, + "grad_norm": 1.6795284434799669, + "grad_max_sv": 0.8227274164557457, + "grad_min_sv": 3.2408061501065785e-08, + "grad_condition": 46743715.81403457, + "lr": 0.0009842915805643154, + "time_sec": 15.587612390518188 + }, + { + "epoch": 13, + "train_loss": 1.5589283563995362, + "train_acc": 0.56658, + "test_loss": 2.109080162811279, + "test_acc": 0.4555, + "lyapunov": null, + "grad_norm": 1.6107025543208409, + "grad_max_sv": 0.7555071026086807, + "grad_min_sv": 3.021804662181257e-08, + "grad_condition": 771669383.9576478, + "lr": 0.000981581283398829, + "time_sec": 15.570199012756348 + }, + { + "epoch": 14, + "train_loss": 1.5079251358795167, + "train_acc": 0.57552, + "test_loss": 2.0982689178466796, + "test_acc": 0.4612, + "lyapunov": null, + "grad_norm": 1.5561237300872648, + "grad_max_sv": 0.7464557528495789, + "grad_min_sv": 2.9360349014517782e-08, + "grad_condition": 57384357.84720645, + "lr": 0.0009786597487660333, + "time_sec": 15.58092999458313 + }, + { + "epoch": 15, + "train_loss": 1.4521892065048219, + "train_acc": 0.59046, + "test_loss": 2.311817477607727, + "test_acc": 0.4302, + "lyapunov": null, + "grad_norm": 1.5030460275712159, + "grad_max_sv": 0.6973782196640969, + "grad_min_sv": 2.806552138745477e-08, + "grad_condition": 50094988.442197144, + "lr": 0.0009755282581475766, + "time_sec": 15.59303069114685 + }, + { + "epoch": 16, + "train_loss": 1.4043401465606689, + "train_acc": 0.6018, + "test_loss": 1.9470401285171508, + "test_acc": 0.4966, + "lyapunov": null, + "grad_norm": 1.4501603734300015, + "grad_max_sv": 0.6692761570215225, + "grad_min_sv": 2.707263816043026e-08, + "grad_condition": 123937233.96376769, + "lr": 0.0009721881851187403, + "time_sec": 15.581094026565552 + }, + { + "epoch": 17, + "train_loss": 1.3696716709136962, + "train_acc": 0.61152, + "test_loss": 1.937501217842102, + "test_acc": 0.499, + "lyapunov": null, + "grad_norm": 1.4220829625575298, + "grad_max_sv": 0.6630528435111046, + "grad_min_sv": 2.6855075777043603e-08, + "grad_condition": 85926301.07871899, + "lr": 0.0009686409947459456, + "time_sec": 15.594961643218994 + }, + { + "epoch": 18, + "train_loss": 1.3274028357696532, + "train_acc": 0.62202, + "test_loss": 2.163087944793701, + "test_acc": 0.4562, + "lyapunov": null, + "grad_norm": 1.3749658522523285, + "grad_max_sv": 0.6294455677270889, + "grad_min_sv": 2.59231922022235e-08, + "grad_condition": 301195911.7425653, + "lr": 0.0009648882429441254, + "time_sec": 15.60923433303833 + }, + { + "epoch": 19, + "train_loss": 1.2825380062484741, + "train_acc": 0.63366, + "test_loss": 2.012470700645447, + "test_acc": 0.4881, + "lyapunov": null, + "grad_norm": 1.3365974210853477, + "grad_max_sv": 0.6173068635165692, + "grad_min_sv": 2.522445298643039e-08, + "grad_condition": 107736394.99929431, + "lr": 0.00096093157579425, + "time_sec": 15.59559416770935 + }, + { + "epoch": 20, + "train_loss": 1.2454956715774537, + "train_acc": 0.63962, + "test_loss": 1.862760306930542, + "test_acc": 0.5166, + "lyapunov": null, + "grad_norm": 1.3087654259412098, + "grad_max_sv": 0.583590354025364, + "grad_min_sv": 2.470869329140868e-08, + "grad_condition": 28538129.547009837, + "lr": 0.0009567727288213001, + "time_sec": 15.578768253326416 + }, + { + "epoch": 21, + "train_loss": 1.2203223657226563, + "train_acc": 0.64712, + "test_loss": 1.8641546312332153, + "test_acc": 0.5193, + "lyapunov": null, + "grad_norm": 1.2837238048732729, + "grad_max_sv": 0.5924517832696438, + "grad_min_sv": 2.4348954538039312e-08, + "grad_condition": 93781869.91679552, + "lr": 0.0009524135262330095, + "time_sec": 15.614121198654175 + }, + { + "epoch": 22, + "train_loss": 1.1865811985397339, + "train_acc": 0.65476, + "test_loss": 2.0345648471832276, + "test_acc": 0.4893, + "lyapunov": null, + "grad_norm": 1.2512260920694542, + "grad_max_sv": 0.5759196959435939, + "grad_min_sv": 2.384011341116654e-08, + "grad_condition": 30288258.368695997, + "lr": 0.0009478558801197061, + "time_sec": 15.612670183181763 + }, + { + "epoch": 23, + "train_loss": 1.1597199523544313, + "train_acc": 0.66328, + "test_loss": 1.7475012817382813, + "test_acc": 0.5456, + "lyapunov": null, + "grad_norm": 1.22099214296503, + "grad_max_sv": 0.550060736387968, + "grad_min_sv": 2.259520101161039e-08, + "grad_condition": 44796813.002676345, + "lr": 0.000943101789615607, + "time_sec": 15.634280920028687 + }, + { + "epoch": 24, + "train_loss": 1.1278974151992798, + "train_acc": 0.67306, + "test_loss": 1.9481268964767455, + "test_acc": 0.5126, + "lyapunov": null, + "grad_norm": 1.204438554486539, + "grad_max_sv": 0.5349243931472302, + "grad_min_sv": 2.225912898324439e-08, + "grad_condition": 183220898.93468145, + "lr": 0.0009381533400219313, + "time_sec": 15.649690389633179 + }, + { + "epoch": 25, + "train_loss": 1.096091796951294, + "train_acc": 0.68, + "test_loss": 2.0196787605285644, + "test_acc": 0.5038, + "lyapunov": null, + "grad_norm": 1.1805395110366357, + "grad_max_sv": 0.5209554739296436, + "grad_min_sv": 2.1478067243539635e-08, + "grad_condition": 4139399544.237787, + "lr": 0.0009330127018922189, + "time_sec": 15.62510895729065 + }, + { + "epoch": 26, + "train_loss": 1.0776387982559203, + "train_acc": 0.6821, + "test_loss": 1.9688811008453369, + "test_acc": 0.5111, + "lyapunov": null, + "grad_norm": 1.1581479939567827, + "grad_max_sv": 0.5094197139143943, + "grad_min_sv": 2.1775440942062298e-08, + "grad_condition": 34416173.97374034, + "lr": 0.000927682130080253, + "time_sec": 15.616900444030762 + }, + { + "epoch": 27, + "train_loss": 1.039057155227661, + "train_acc": 0.69314, + "test_loss": 1.9735270919799806, + "test_acc": 0.5109, + "lyapunov": null, + "grad_norm": 1.1358478872536777, + "grad_max_sv": 0.49843145087361335, + "grad_min_sv": 2.0908967124713685e-08, + "grad_condition": 147733329.90615898, + "lr": 0.0009221639627510072, + "time_sec": 15.589634418487549 + }, + { + "epoch": 28, + "train_loss": 1.0186366636657715, + "train_acc": 0.698, + "test_loss": 1.849167727470398, + "test_acc": 0.5327, + "lyapunov": null, + "grad_norm": 1.1179885484776635, + "grad_max_sv": 0.4846231251955032, + "grad_min_sv": 2.064624871154358e-08, + "grad_condition": 187535295.68791586, + "lr": 0.0009164606203550494, + "time_sec": 15.606561422348022 + }, + { + "epoch": 29, + "train_loss": 0.9894418817901611, + "train_acc": 0.70704, + "test_loss": 1.9159385116577148, + "test_acc": 0.5256, + "lyapunov": null, + "grad_norm": 1.1033010317922292, + "grad_max_sv": 0.49175669252872467, + "grad_min_sv": 2.0545614226596954e-08, + "grad_condition": 28139106.19650669, + "lr": 0.0009105746045668516, + "time_sec": 15.596401453018188 + }, + { + "epoch": 30, + "train_loss": 0.9679239891052246, + "train_acc": 0.7117, + "test_loss": 1.7626015129089356, + "test_acc": 0.5579, + "lyapunov": null, + "grad_norm": 1.0852050474778043, + "grad_max_sv": 0.4818247281014919, + "grad_min_sv": 2.036887303824564e-08, + "grad_condition": 39564164.33428894, + "lr": 0.0009045084971874733, + "time_sec": 15.594120025634766 + }, + { + "epoch": 31, + "train_loss": 0.9477154457473755, + "train_acc": 0.71644, + "test_loss": 2.001366552734375, + "test_acc": 0.5184, + "lyapunov": null, + "grad_norm": 1.0714526476916026, + "grad_max_sv": 0.45983982309699056, + "grad_min_sv": 1.9430452840446533e-08, + "grad_condition": 51624978.6905687, + "lr": 0.0008982649590120977, + "time_sec": 15.600859880447388 + }, + { + "epoch": 32, + "train_loss": 0.922220166015625, + "train_acc": 0.72322, + "test_loss": 1.8274271976470948, + "test_acc": 0.552, + "lyapunov": null, + "grad_norm": 1.0486432180828922, + "grad_max_sv": 0.4561096005141735, + "grad_min_sv": 1.9119260000893812e-08, + "grad_condition": 81358962.64807202, + "lr": 0.0008918467286629196, + "time_sec": 15.56894040107727 + }, + { + "epoch": 33, + "train_loss": 0.9045637095451355, + "train_acc": 0.72804, + "test_loss": 1.885004960823059, + "test_acc": 0.543, + "lyapunov": null, + "grad_norm": 1.0374896564588747, + "grad_max_sv": 0.4518023140728474, + "grad_min_sv": 1.917957178319829e-08, + "grad_condition": 182673348.7808311, + "lr": 0.0008852566213878943, + "time_sec": 15.568547010421753 + }, + { + "epoch": 34, + "train_loss": 0.8857564904785157, + "train_acc": 0.7319, + "test_loss": 1.9111962642669678, + "test_acc": 0.5412, + "lyapunov": null, + "grad_norm": 1.0274666482550194, + "grad_max_sv": 0.4493935935199261, + "grad_min_sv": 1.881604217469912e-08, + "grad_condition": 248617918.33796087, + "lr": 0.000878497527825878, + "time_sec": 15.588915586471558 + }, + { + "epoch": 35, + "train_loss": 0.8623492621994019, + "train_acc": 0.73752, + "test_loss": 1.9594444644927977, + "test_acc": 0.5265, + "lyapunov": null, + "grad_norm": 1.0169882023721266, + "grad_max_sv": 0.4450283505022526, + "grad_min_sv": 1.8621021413700588e-08, + "grad_condition": 51970835.60873811, + "lr": 0.000871572412738697, + "time_sec": 15.614988565444946 + }, + { + "epoch": 36, + "train_loss": 0.847761401977539, + "train_acc": 0.7438, + "test_loss": 1.8443275575637816, + "test_acc": 0.549, + "lyapunov": null, + "grad_norm": 0.9972656465889882, + "grad_max_sv": 0.42991913110017776, + "grad_min_sv": 1.8110683554228845e-08, + "grad_condition": 63643440.089395806, + "lr": 0.0008644843137107055, + "time_sec": 15.585567474365234 + }, + { + "epoch": 37, + "train_loss": 0.8332586885261536, + "train_acc": 0.74546, + "test_loss": 1.8331810934066772, + "test_acc": 0.5565, + "lyapunov": null, + "grad_norm": 0.986142343180959, + "grad_max_sv": 0.43020778223872186, + "grad_min_sv": 1.820308022093542e-08, + "grad_condition": 38440650.114556134, + "lr": 0.0008572363398164014, + "time_sec": 15.585892915725708 + }, + { + "epoch": 38, + "train_loss": 0.808667633934021, + "train_acc": 0.75458, + "test_loss": 1.8140192237854005, + "test_acc": 0.563, + "lyapunov": null, + "grad_norm": 0.9767417084572454, + "grad_max_sv": 0.43866117894649503, + "grad_min_sv": 1.805343496832229e-08, + "grad_condition": 246839591.75793108, + "lr": 0.0008498316702566826, + "time_sec": 15.576987028121948 + }, + { + "epoch": 39, + "train_loss": 0.7920477479743957, + "train_acc": 0.75774, + "test_loss": 1.998388723373413, + "test_acc": 0.5317, + "lyapunov": null, + "grad_norm": 0.9634949356985317, + "grad_max_sv": 0.41083301454782484, + "grad_min_sv": 1.7408181231248764e-08, + "grad_condition": 207856381.9830411, + "lr": 0.0008422735529643442, + "time_sec": 15.604882955551147 + }, + { + "epoch": 40, + "train_loss": 0.783684113292694, + "train_acc": 0.76062, + "test_loss": 1.8349973222732543, + "test_acc": 0.5584, + "lyapunov": null, + "grad_norm": 0.9543715044222432, + "grad_max_sv": 0.4067095577716827, + "grad_min_sv": 1.715405322372243e-08, + "grad_condition": 38065468.34049429, + "lr": 0.0008345653031794289, + "time_sec": 15.61448359489441 + }, + { + "epoch": 41, + "train_loss": 0.756040623588562, + "train_acc": 0.76704, + "test_loss": 1.8635019605636596, + "test_acc": 0.5623, + "lyapunov": null, + "grad_norm": 0.9400945005657612, + "grad_max_sv": 0.4006481133401394, + "grad_min_sv": 1.706379215496434e-08, + "grad_condition": 129917875.15326138, + "lr": 0.0008267103019950526, + "time_sec": 15.605446100234985 + }, + { + "epoch": 42, + "train_loss": 0.747281655292511, + "train_acc": 0.77008, + "test_loss": 1.804893379020691, + "test_acc": 0.5637, + "lyapunov": null, + "grad_norm": 0.9342754196581016, + "grad_max_sv": 0.4069997236132622, + "grad_min_sv": 1.690411219660258e-08, + "grad_condition": 833088985.4088073, + "lr": 0.0008187119948743447, + "time_sec": 15.598352432250977 + }, + { + "epoch": 43, + "train_loss": 0.7258966027832031, + "train_acc": 0.7753, + "test_loss": 1.808250590133667, + "test_acc": 0.5688, + "lyapunov": null, + "grad_norm": 0.916899863328162, + "grad_max_sv": 0.39457144513726233, + "grad_min_sv": 1.6684048499693294e-08, + "grad_condition": 39061518.56268385, + "lr": 0.000810573890139155, + "time_sec": 15.596754550933838 + }, + { + "epoch": 44, + "train_loss": 0.7053343192100525, + "train_acc": 0.78078, + "test_loss": 1.9365575828552246, + "test_acc": 0.5516, + "lyapunov": null, + "grad_norm": 0.909458464797614, + "grad_max_sv": 0.38970902636647226, + "grad_min_sv": 1.6407527701767232e-08, + "grad_condition": 42244499.19662833, + "lr": 0.0008022995574311873, + "time_sec": 15.606269836425781 + }, + { + "epoch": 45, + "train_loss": 0.6963989092254639, + "train_acc": 0.7839, + "test_loss": 1.8283310445785523, + "test_acc": 0.5639, + "lyapunov": null, + "grad_norm": 0.9004438327166017, + "grad_max_sv": 0.39948956444859507, + "grad_min_sv": 1.6195382334174836e-08, + "grad_condition": 362020379.02432, + "lr": 0.0007938926261462363, + "time_sec": 15.588224411010742 + }, + { + "epoch": 46, + "train_loss": 0.690151353931427, + "train_acc": 0.78312, + "test_loss": 1.838386841392517, + "test_acc": 0.5656, + "lyapunov": null, + "grad_norm": 0.8990022149636615, + "grad_max_sv": 0.3958965942263603, + "grad_min_sv": 1.6439048992683212e-08, + "grad_condition": 739976934.4713734, + "lr": 0.0007853567838422158, + "time_sec": 15.608047008514404 + }, + { + "epoch": 47, + "train_loss": 0.6644145600509643, + "train_acc": 0.79316, + "test_loss": 1.7317404174804687, + "test_acc": 0.5881, + "lyapunov": null, + "grad_norm": 0.8888942071856848, + "grad_max_sv": 0.3830097340047359, + "grad_min_sv": 1.5947025791551715e-08, + "grad_condition": 43737023.5418247, + "lr": 0.0007766957746216719, + "time_sec": 15.61106562614441 + }, + { + "epoch": 48, + "train_loss": 0.6501899867248535, + "train_acc": 0.7961, + "test_loss": 2.0301314384460447, + "test_acc": 0.5481, + "lyapunov": null, + "grad_norm": 0.8710848056333472, + "grad_max_sv": 0.37484541684389117, + "grad_min_sv": 1.568856004691144e-08, + "grad_condition": 71400760.33312531, + "lr": 0.0007679133974894982, + "time_sec": 15.616482496261597 + }, + { + "epoch": 49, + "train_loss": 0.6407210964202881, + "train_acc": 0.79878, + "test_loss": 1.8660895137786866, + "test_acc": 0.5703, + "lyapunov": null, + "grad_norm": 0.8631402634979823, + "grad_max_sv": 0.3794224761426449, + "grad_min_sv": 1.5698247981393855e-08, + "grad_condition": 48831357.42187855, + "lr": 0.000759013504686565, + "time_sec": 15.608244180679321 + }, + { + "epoch": 50, + "train_loss": 0.635532203464508, + "train_acc": 0.79966, + "test_loss": 1.8019765382766724, + "test_acc": 0.5773, + "lyapunov": null, + "grad_norm": 0.8639281681323187, + "grad_max_sv": 0.3756891183555126, + "grad_min_sv": 1.5385762375426383e-08, + "grad_condition": 443886531.5137703, + "lr": 0.0007499999999999998, + "time_sec": 15.595497369766235 + }, + { + "epoch": 51, + "train_loss": 0.6136586366081238, + "train_acc": 0.8078, + "test_loss": 1.985259211730957, + "test_acc": 0.5541, + "lyapunov": null, + "grad_norm": 0.8502360335489318, + "grad_max_sv": 0.38991634622216226, + "grad_min_sv": 1.589003087859586e-08, + "grad_condition": 36685688.17597731, + "lr": 0.0007408768370508575, + "time_sec": 15.606870174407959 + }, + { + "epoch": 52, + "train_loss": 0.6016868180465699, + "train_acc": 0.81054, + "test_loss": 1.9059622749328613, + "test_acc": 0.5677, + "lyapunov": null, + "grad_norm": 0.839451980682905, + "grad_max_sv": 0.3655779927968979, + "grad_min_sv": 1.50471602150537e-08, + "grad_condition": 68824107.55111663, + "lr": 0.0007316480175599307, + "time_sec": 15.595157861709595 + }, + { + "epoch": 53, + "train_loss": 0.5874249538040162, + "train_acc": 0.81406, + "test_loss": 1.9880520868301392, + "test_acc": 0.5586, + "lyapunov": null, + "grad_norm": 0.8317551917480781, + "grad_max_sv": 0.3655713267624378, + "grad_min_sv": 1.5141927978482016e-08, + "grad_condition": 349299867.91202754, + "lr": 0.0007223175895924635, + "time_sec": 15.589019060134888 + }, + { + "epoch": 54, + "train_loss": 0.577422985610962, + "train_acc": 0.8184, + "test_loss": 1.9396752899169922, + "test_acc": 0.5636, + "lyapunov": null, + "grad_norm": 0.8261938394130597, + "grad_max_sv": 0.3618521079421043, + "grad_min_sv": 1.4864520584507642e-08, + "grad_condition": 553216070.5433874, + "lr": 0.0007128896457825361, + "time_sec": 15.610572338104248 + }, + { + "epoch": 55, + "train_loss": 0.5702339578819275, + "train_acc": 0.81924, + "test_loss": 1.8778120471954345, + "test_acc": 0.5713, + "lyapunov": null, + "grad_norm": 0.8242148097122628, + "grad_max_sv": 0.36288107857108115, + "grad_min_sv": 1.4883936903103966e-08, + "grad_condition": 52140637.21728975, + "lr": 0.0007033683215378998, + "time_sec": 15.605257749557495 + }, + { + "epoch": 56, + "train_loss": 0.5589845707130432, + "train_acc": 0.82372, + "test_loss": 1.8699417673110963, + "test_acc": 0.5751, + "lyapunov": null, + "grad_norm": 0.8186771944690047, + "grad_max_sv": 0.346701592952013, + "grad_min_sv": 1.459523215271985e-08, + "grad_condition": 46853728.14353165, + "lr": 0.0006937577932260512, + "time_sec": 15.589865684509277 + }, + { + "epoch": 57, + "train_loss": 0.5443892800807952, + "train_acc": 0.82776, + "test_loss": 1.965821966934204, + "test_acc": 0.5664, + "lyapunov": null, + "grad_norm": 0.8036351010817813, + "grad_max_sv": 0.3483227726072073, + "grad_min_sv": 1.4410761232583335e-08, + "grad_condition": 73431270.59891501, + "lr": 0.0006840622763423388, + "time_sec": 15.590615510940552 + }, + { + "epoch": 58, + "train_loss": 0.5372896729660034, + "train_acc": 0.82954, + "test_loss": 1.876914355659485, + "test_acc": 0.5811, + "lyapunov": null, + "grad_norm": 0.7997423554449953, + "grad_max_sv": 0.34569344371557237, + "grad_min_sv": 1.4015608398366443e-08, + "grad_condition": 828306651.3532289, + "lr": 0.0006742860236609073, + "time_sec": 15.640390872955322 + }, + { + "epoch": 59, + "train_loss": 0.5291300660514832, + "train_acc": 0.83176, + "test_loss": 1.8113979286193849, + "test_acc": 0.5866, + "lyapunov": null, + "grad_norm": 0.7903239162734349, + "grad_max_sv": 0.34317835718393325, + "grad_min_sv": 1.4270118212610095e-08, + "grad_condition": 130381299.82028241, + "lr": 0.0006644333233692913, + "time_sec": 15.598358869552612 + }, + { + "epoch": 60, + "train_loss": 0.5121459530830383, + "train_acc": 0.83708, + "test_loss": 1.8623944423675538, + "test_acc": 0.5809, + "lyapunov": null, + "grad_norm": 0.7828571196598214, + "grad_max_sv": 0.33372929617762565, + "grad_min_sv": 1.3842122733448425e-08, + "grad_condition": 47391163.99310992, + "lr": 0.0006545084971874734, + "time_sec": 15.594441413879395 + }, + { + "epoch": 61, + "train_loss": 0.5045927854156494, + "train_acc": 0.83722, + "test_loss": 1.868363607597351, + "test_acc": 0.5833, + "lyapunov": null, + "grad_norm": 0.782632751951769, + "grad_max_sv": 0.3441222012042999, + "grad_min_sv": 1.4132956021933527e-08, + "grad_condition": 770221957.2190915, + "lr": 0.0006445158984722354, + "time_sec": 15.625693082809448 + }, + { + "epoch": 62, + "train_loss": 0.4909844134426117, + "train_acc": 0.84268, + "test_loss": 1.9616632486343384, + "test_acc": 0.5686, + "lyapunov": null, + "grad_norm": 0.7640706557919354, + "grad_max_sv": 0.3262421116232872, + "grad_min_sv": 1.3609901451661078e-08, + "grad_condition": 70578003.89460334, + "lr": 0.0006344599103076324, + "time_sec": 15.61337399482727 + }, + { + "epoch": 63, + "train_loss": 0.47858007513046263, + "train_acc": 0.84808, + "test_loss": 1.8504299934387207, + "test_acc": 0.5864, + "lyapunov": null, + "grad_norm": 0.7612944717059198, + "grad_max_sv": 0.3300259932875633, + "grad_min_sv": 1.34369991692607e-08, + "grad_condition": 1366561815.948382, + "lr": 0.0006243449435824269, + "time_sec": 15.618177652359009 + }, + { + "epoch": 64, + "train_loss": 0.47501785024642945, + "train_acc": 0.84756, + "test_loss": 1.8781955436706543, + "test_acc": 0.5869, + "lyapunov": null, + "grad_norm": 0.7572180647827939, + "grad_max_sv": 0.3278561718761921, + "grad_min_sv": 1.3324545805690896e-08, + "grad_condition": 581046380.377969, + "lr": 0.0006141754350553275, + "time_sec": 15.624166488647461 + }, + { + "epoch": 65, + "train_loss": 0.4702414323043823, + "train_acc": 0.84926, + "test_loss": 1.892370820426941, + "test_acc": 0.586, + "lyapunov": null, + "grad_norm": 0.7563650221448377, + "grad_max_sv": 0.3307614929974079, + "grad_min_sv": 1.3784487005921026e-08, + "grad_condition": 464200921.7045374, + "lr": 0.0006039558454088793, + "time_sec": 15.617845058441162 + }, + { + "epoch": 66, + "train_loss": 0.45756534008026123, + "train_acc": 0.85312, + "test_loss": 1.9519972061157227, + "test_acc": 0.5808, + "lyapunov": null, + "grad_norm": 0.7420841565788096, + "grad_max_sv": 0.33202062249183656, + "grad_min_sv": 1.338400364191486e-08, + "grad_condition": 499395104.1034541, + "lr": 0.000593690657292862, + "time_sec": 15.611196994781494 + }, + { + "epoch": 67, + "train_loss": 0.44467548862457273, + "train_acc": 0.85686, + "test_loss": 1.9216414470672607, + "test_acc": 0.5822, + "lyapunov": null, + "grad_norm": 0.7382025740357703, + "grad_max_sv": 0.3282777763903141, + "grad_min_sv": 1.3046149181881323e-08, + "grad_condition": 346705862.33150136, + "lr": 0.0005833843733580507, + "time_sec": 15.611254215240479 + }, + { + "epoch": 68, + "train_loss": 0.43985233959198, + "train_acc": 0.85918, + "test_loss": 1.8851093154907226, + "test_acc": 0.5926, + "lyapunov": null, + "grad_norm": 0.7289145095731725, + "grad_max_sv": 0.32352428287267687, + "grad_min_sv": 1.3040011394684428e-08, + "grad_condition": 442041574.8141201, + "lr": 0.0005730415142812054, + "time_sec": 15.625309467315674 + }, + { + "epoch": 69, + "train_loss": 0.4362604184055328, + "train_acc": 0.85998, + "test_loss": 1.8714712146759034, + "test_acc": 0.5926, + "lyapunov": null, + "grad_norm": 0.7311888404996788, + "grad_max_sv": 0.31886391565203664, + "grad_min_sv": 1.2968906573272102e-08, + "grad_condition": 3567171952.0862184, + "lr": 0.0005626666167821517, + "time_sec": 15.61151123046875 + }, + { + "epoch": 70, + "train_loss": 0.42215480308532716, + "train_acc": 0.86416, + "test_loss": 2.019381594085693, + "test_acc": 0.5791, + "lyapunov": null, + "grad_norm": 0.721768423243528, + "grad_max_sv": 0.3247049540281296, + "grad_min_sv": 1.2853580642424936e-08, + "grad_condition": 450059064.02256596, + "lr": 0.0005522642316338265, + "time_sec": 15.629756689071655 + }, + { + "epoch": 71, + "train_loss": 0.4138381930923462, + "train_acc": 0.8672, + "test_loss": 1.8805969470977784, + "test_acc": 0.5939, + "lyapunov": null, + "grad_norm": 0.7122183187054967, + "grad_max_sv": 0.31785007640719415, + "grad_min_sv": 1.2996066436378461e-08, + "grad_condition": 197171308.1464749, + "lr": 0.0005418389216661573, + "time_sec": 15.619616270065308 + }, + { + "epoch": 72, + "train_loss": 0.40292635828018186, + "train_acc": 0.86882, + "test_loss": 1.9322007545471191, + "test_acc": 0.5786, + "lyapunov": null, + "grad_norm": 0.7085910743884665, + "grad_max_sv": 0.3134432151913643, + "grad_min_sv": 1.2498033243762453e-08, + "grad_condition": 793091340.8871062, + "lr": 0.0005313952597646563, + "time_sec": 15.617356300354004 + }, + { + "epoch": 73, + "train_loss": 0.40141631307601927, + "train_acc": 0.86948, + "test_loss": 1.8957605976104737, + "test_acc": 0.599, + "lyapunov": null, + "grad_norm": 0.7091751625468098, + "grad_max_sv": 0.3174535669386387, + "grad_min_sv": 1.2447811244958862e-08, + "grad_condition": 249741254.61747846, + "lr": 0.0005209378268645994, + "time_sec": 15.621675968170166 + }, + { + "epoch": 74, + "train_loss": 0.3882115649795532, + "train_acc": 0.87366, + "test_loss": 1.98493223361969, + "test_acc": 0.5838, + "lyapunov": null, + "grad_norm": 0.6962545006972763, + "grad_max_sv": 0.31799899972975254, + "grad_min_sv": 1.2635416091113378e-08, + "grad_condition": 228682453.11998367, + "lr": 0.0005104712099416781, + "time_sec": 15.613324403762817 + }, + { + "epoch": 75, + "train_loss": 0.3784026951885223, + "train_acc": 0.8775, + "test_loss": 1.9258492612838745, + "test_acc": 0.5894, + "lyapunov": null, + "grad_norm": 0.6897862834083666, + "grad_max_sv": 0.3025407921522856, + "grad_min_sv": 1.191642424076822e-08, + "grad_condition": 517580765.4604114, + "lr": 0.0004999999999999996, + "time_sec": 15.604532957077026 + }, + { + "epoch": 76, + "train_loss": 0.3745850126075745, + "train_acc": 0.87942, + "test_loss": 1.8862019395828247, + "test_acc": 0.597, + "lyapunov": null, + "grad_norm": 0.6831871296489548, + "grad_max_sv": 0.30832933597266676, + "grad_min_sv": 1.2160173869495832e-08, + "grad_condition": 947775184.6338822, + "lr": 0.0004895287900583212, + "time_sec": 15.608951568603516 + }, + { + "epoch": 77, + "train_loss": 0.3610551133441925, + "train_acc": 0.88172, + "test_loss": 1.880063851928711, + "test_acc": 0.6012, + "lyapunov": null, + "grad_norm": 0.6743453354187542, + "grad_max_sv": 0.29855253025889394, + "grad_min_sv": 1.2030242225015767e-08, + "grad_condition": 516312299.61059207, + "lr": 0.0004790621731353997, + "time_sec": 15.615072250366211 + }, + { + "epoch": 78, + "train_loss": 0.3575943685531616, + "train_acc": 0.88478, + "test_loss": 1.9622120880126954, + "test_acc": 0.5938, + "lyapunov": null, + "grad_norm": 0.6751503647014531, + "grad_max_sv": 0.30869465619325637, + "grad_min_sv": 1.1962258270568903e-08, + "grad_condition": 156961942.34190208, + "lr": 0.000468604740235343, + "time_sec": 15.620108127593994 + }, + { + "epoch": 79, + "train_loss": 0.356780963382721, + "train_acc": 0.88514, + "test_loss": 1.9785774551391602, + "test_acc": 0.5895, + "lyapunov": null, + "grad_norm": 0.6750273249196351, + "grad_max_sv": 0.29922002404928205, + "grad_min_sv": 1.1769536231547029e-08, + "grad_condition": 159293637.70185965, + "lr": 0.00045816107833384175, + "time_sec": 15.615866899490356 + }, + { + "epoch": 80, + "train_loss": 0.34938912315368653, + "train_acc": 0.8876, + "test_loss": 1.9177911525726319, + "test_acc": 0.5916, + "lyapunov": null, + "grad_norm": 0.6633930537019016, + "grad_max_sv": 0.29133019372820856, + "grad_min_sv": 1.1681813408617736e-08, + "grad_condition": 263364196.96272945, + "lr": 0.0004477357683661729, + "time_sec": 15.618734359741211 + }, + { + "epoch": 81, + "train_loss": 0.34074662324905397, + "train_acc": 0.8899, + "test_loss": 1.947013536453247, + "test_acc": 0.5907, + "lyapunov": null, + "grad_norm": 0.6597022593428697, + "grad_max_sv": 0.29191571436822417, + "grad_min_sv": 1.156299900565089e-08, + "grad_condition": 1345147447.952278, + "lr": 0.00043733338321784746, + "time_sec": 15.646045923233032 + }, + { + "epoch": 82, + "train_loss": 0.33476794362068174, + "train_acc": 0.89196, + "test_loss": 1.995362993812561, + "test_acc": 0.5918, + "lyapunov": null, + "grad_norm": 0.6563550515125143, + "grad_max_sv": 0.28989207223057745, + "grad_min_sv": 1.1521310828500105e-08, + "grad_condition": 1549368517.9852664, + "lr": 0.0004269584857187939, + "time_sec": 15.651390075683594 + }, + { + "epoch": 83, + "train_loss": 0.32779589292526246, + "train_acc": 0.89466, + "test_loss": 1.9326098243713379, + "test_acc": 0.5984, + "lyapunov": null, + "grad_norm": 0.6471640564495617, + "grad_max_sv": 0.29146968461573125, + "grad_min_sv": 1.1487493853379327e-08, + "grad_condition": 92617304.39349434, + "lr": 0.0004166156266419484, + "time_sec": 15.611905336380005 + }, + { + "epoch": 84, + "train_loss": 0.3205149848842621, + "train_acc": 0.89636, + "test_loss": 2.084268938064575, + "test_acc": 0.5809, + "lyapunov": null, + "grad_norm": 0.6452842014274853, + "grad_max_sv": 0.2868046831339598, + "grad_min_sv": 1.1289359868812965e-08, + "grad_condition": 186807946.77140856, + "lr": 0.0004063093427071373, + "time_sec": 15.605120658874512 + }, + { + "epoch": 85, + "train_loss": 0.31429147192001344, + "train_acc": 0.89772, + "test_loss": 1.8867773443222047, + "test_acc": 0.6067, + "lyapunov": null, + "grad_norm": 0.6402388209165808, + "grad_max_sv": 0.29072388894855977, + "grad_min_sv": 1.1252009047418853e-08, + "grad_condition": 102815726.30519769, + "lr": 0.0003960441545911199, + "time_sec": 15.619008302688599 + }, + { + "epoch": 86, + "train_loss": 0.3057248209381104, + "train_acc": 0.90034, + "test_loss": 1.9401320112228393, + "test_acc": 0.5983, + "lyapunov": null, + "grad_norm": 0.6311267078269261, + "grad_max_sv": 0.2907364759594202, + "grad_min_sv": 1.1278600659490879e-08, + "grad_condition": 156533701.22010937, + "lr": 0.0003858245649446718, + "time_sec": 15.645244359970093 + }, + { + "epoch": 87, + "train_loss": 0.3014916487598419, + "train_acc": 0.9024, + "test_loss": 1.9676358179092408, + "test_acc": 0.5951, + "lyapunov": null, + "grad_norm": 0.6286377862812311, + "grad_max_sv": 0.29410710372030735, + "grad_min_sv": 1.117144211807558e-08, + "grad_condition": 1243341457.898049, + "lr": 0.00037565505641757235, + "time_sec": 15.613637685775757 + }, + { + "epoch": 88, + "train_loss": 0.2975629404449463, + "train_acc": 0.90206, + "test_loss": 1.9475040822982788, + "test_acc": 0.6007, + "lyapunov": null, + "grad_norm": 0.6288857771151286, + "grad_max_sv": 0.29210252575576306, + "grad_min_sv": 1.1327018099556787e-08, + "grad_condition": 449577659.23919934, + "lr": 0.00036554008969236695, + "time_sec": 15.627456188201904 + }, + { + "epoch": 89, + "train_loss": 0.2940291863822937, + "train_acc": 0.90424, + "test_loss": 1.9751218059539795, + "test_acc": 0.6041, + "lyapunov": null, + "grad_norm": 0.624248588717073, + "grad_max_sv": 0.27752059176564214, + "grad_min_sv": 1.0839235129161267e-08, + "grad_condition": 328108890.12738866, + "lr": 0.0003554841015277638, + "time_sec": 15.661294221878052 + }, + { + "epoch": 90, + "train_loss": 0.28330512808799746, + "train_acc": 0.90742, + "test_loss": 1.9922785207748412, + "test_acc": 0.6018, + "lyapunov": null, + "grad_norm": 0.6169602856180438, + "grad_max_sv": 0.2886409737169743, + "grad_min_sv": 1.0983499523081752e-08, + "grad_condition": 97610883.30544701, + "lr": 0.000345491502812526, + "time_sec": 15.610979795455933 + }, + { + "epoch": 91, + "train_loss": 0.2814662490653992, + "train_acc": 0.90908, + "test_loss": 1.9960870874404908, + "test_acc": 0.5995, + "lyapunov": null, + "grad_norm": 0.6132865794782463, + "grad_max_sv": 0.28339540734887125, + "grad_min_sv": 1.0941020271021395e-08, + "grad_condition": 145384408.70816708, + "lr": 0.0003355666766307081, + "time_sec": 15.639533281326294 + }, + { + "epoch": 92, + "train_loss": 0.2761197953605652, + "train_acc": 0.91006, + "test_loss": 1.993612285232544, + "test_acc": 0.6007, + "lyapunov": null, + "grad_norm": 0.6073672916952068, + "grad_max_sv": 0.2746456813067198, + "grad_min_sv": 1.0572886616905252e-08, + "grad_condition": 62093577.47245115, + "lr": 0.00032571397633909225, + "time_sec": 15.616953611373901 + }, + { + "epoch": 93, + "train_loss": 0.2773143856334686, + "train_acc": 0.90906, + "test_loss": 1.9627196998596192, + "test_acc": 0.5993, + "lyapunov": null, + "grad_norm": 0.6057396266879189, + "grad_max_sv": 0.27635425254702567, + "grad_min_sv": 1.0533270900208586e-08, + "grad_condition": 200919941.49428365, + "lr": 0.00031593772365766094, + "time_sec": 15.62587594985962 + }, + { + "epoch": 94, + "train_loss": 0.2620466177368164, + "train_acc": 0.91416, + "test_loss": 2.0111697412490845, + "test_acc": 0.602, + "lyapunov": null, + "grad_norm": 0.5926928515974628, + "grad_max_sv": 0.28529031090438367, + "grad_min_sv": 1.0650170428677317e-08, + "grad_condition": 743433094.0082552, + "lr": 0.0003062422067739483, + "time_sec": 15.626370191574097 + }, + { + "epoch": 95, + "train_loss": 0.2537871124172211, + "train_acc": 0.91762, + "test_loss": 1.9979699476242065, + "test_acc": 0.5996, + "lyapunov": null, + "grad_norm": 0.5795471657923094, + "grad_max_sv": 0.27274232916533947, + "grad_min_sv": 1.036865705178816e-08, + "grad_condition": 309294232.0879529, + "lr": 0.00029663167846209965, + "time_sec": 15.634578943252563 + }, + { + "epoch": 96, + "train_loss": 0.2604071279144287, + "train_acc": 0.91558, + "test_loss": 2.0250939807891846, + "test_acc": 0.5981, + "lyapunov": null, + "grad_norm": 0.5880459177262352, + "grad_max_sv": 0.27270981669425964, + "grad_min_sv": 1.0527747556186851e-08, + "grad_condition": 634008594.0035694, + "lr": 0.00028711035421746345, + "time_sec": 15.610902070999146 + }, + { + "epoch": 97, + "train_loss": 0.25580399082183836, + "train_acc": 0.91794, + "test_loss": 1.9363522800445556, + "test_acc": 0.611, + "lyapunov": null, + "grad_norm": 0.5834698969226986, + "grad_max_sv": 0.2803939372301102, + "grad_min_sv": 1.0679914613353353e-08, + "grad_condition": 719199780.3413004, + "lr": 0.00027768241040753615, + "time_sec": 15.64728569984436 + }, + { + "epoch": 98, + "train_loss": 0.24704306831359862, + "train_acc": 0.92026, + "test_loss": 1.959199716567993, + "test_acc": 0.6064, + "lyapunov": null, + "grad_norm": 0.5767069189645235, + "grad_max_sv": 0.2719736970961094, + "grad_min_sv": 1.0407105681484868e-08, + "grad_condition": 507738893.5347587, + "lr": 0.00026835198244006903, + "time_sec": 15.606433153152466 + }, + { + "epoch": 99, + "train_loss": 0.23963388308048247, + "train_acc": 0.92232, + "test_loss": 2.0193208892822265, + "test_acc": 0.604, + "lyapunov": null, + "grad_norm": 0.5636948581506628, + "grad_max_sv": 0.2563767429441214, + "grad_min_sv": 9.613457626483913e-09, + "grad_condition": 152598313.52871948, + "lr": 0.0002591231629491421, + "time_sec": 15.63752031326294 + }, + { + "epoch": 100, + "train_loss": 0.24343088443756103, + "train_acc": 0.92086, + "test_loss": 1.9747429904937743, + "test_acc": 0.6041, + "lyapunov": null, + "grad_norm": 0.5699300559096447, + "grad_max_sv": 0.270798621699214, + "grad_min_sv": 1.0453353890187232e-08, + "grad_condition": 2642582699.9195356, + "lr": 0.0002499999999999997, + "time_sec": 15.625839710235596 + }, + { + "epoch": 101, + "train_loss": 0.2352629409980774, + "train_acc": 0.92396, + "test_loss": 1.989087490463257, + "test_acc": 0.6026, + "lyapunov": null, + "grad_norm": 0.5635783773655396, + "grad_max_sv": 0.2760987766087055, + "grad_min_sv": 1.0676657122982158e-08, + "grad_condition": 230608448.0042146, + "lr": 0.00024098649531343477, + "time_sec": 15.618889093399048 + }, + { + "epoch": 102, + "train_loss": 0.23230449400901795, + "train_acc": 0.9242, + "test_loss": 2.011552722930908, + "test_acc": 0.6012, + "lyapunov": null, + "grad_norm": 0.5597262828511032, + "grad_max_sv": 0.2676333624869585, + "grad_min_sv": 1.013142310103167e-08, + "grad_condition": 765944599.5566685, + "lr": 0.0002320866025105016, + "time_sec": 15.619239091873169 + }, + { + "epoch": 103, + "train_loss": 0.22586535712242126, + "train_acc": 0.92702, + "test_loss": 1.984936227798462, + "test_acc": 0.6064, + "lyapunov": null, + "grad_norm": 0.5525662827107412, + "grad_max_sv": 0.26978373192250726, + "grad_min_sv": 1.0020810805059718e-08, + "grad_condition": 426927099.4434453, + "lr": 0.0002233042253783278, + "time_sec": 15.617717981338501 + }, + { + "epoch": 104, + "train_loss": 0.2259028799390793, + "train_acc": 0.92724, + "test_loss": 1.9414194402694702, + "test_acc": 0.6138, + "lyapunov": null, + "grad_norm": 0.5552198456176712, + "grad_max_sv": 0.2549734696745872, + "grad_min_sv": 9.559075114318542e-09, + "grad_condition": 2183845809.503984, + "lr": 0.000214643216157784, + "time_sec": 15.639457702636719 + }, + { + "epoch": 105, + "train_loss": 0.21585512964725495, + "train_acc": 0.93068, + "test_loss": 1.9875489110946656, + "test_acc": 0.606, + "lyapunov": null, + "grad_norm": 0.545110676363793, + "grad_max_sv": 0.2662647683173418, + "grad_min_sv": 9.966519613335139e-09, + "grad_condition": 304520020.74158037, + "lr": 0.00020610737385376332, + "time_sec": 15.633507013320923 + }, + { + "epoch": 106, + "train_loss": 0.2177306656885147, + "train_acc": 0.92888, + "test_loss": 2.001543083000183, + "test_acc": 0.6039, + "lyapunov": null, + "grad_norm": 0.550439381212866, + "grad_max_sv": 0.2616906825453043, + "grad_min_sv": 9.792636692686207e-09, + "grad_condition": 257664085.8931566, + "lr": 0.00019770044256881242, + "time_sec": 15.617624759674072 + }, + { + "epoch": 107, + "train_loss": 0.21544821160316469, + "train_acc": 0.93026, + "test_loss": 1.982275790977478, + "test_acc": 0.6101, + "lyapunov": null, + "grad_norm": 0.5459895500350969, + "grad_max_sv": 0.25458521842956544, + "grad_min_sv": 9.842609948471428e-09, + "grad_condition": 482597026.39869213, + "lr": 0.0001894261098608447, + "time_sec": 15.647446632385254 + }, + { + "epoch": 108, + "train_loss": 0.2111588809776306, + "train_acc": 0.93214, + "test_loss": 1.9962615560531616, + "test_acc": 0.6122, + "lyapunov": null, + "grad_norm": 0.5418984142700298, + "grad_max_sv": 0.2645403627306223, + "grad_min_sv": 9.923241169051967e-09, + "grad_condition": 365555925.75439864, + "lr": 0.000181288005125655, + "time_sec": 15.624069213867188 + }, + { + "epoch": 109, + "train_loss": 0.20284160462856293, + "train_acc": 0.9356, + "test_loss": 1.9948909492492677, + "test_acc": 0.6088, + "lyapunov": null, + "grad_norm": 0.528437343256151, + "grad_max_sv": 0.259377746284008, + "grad_min_sv": 9.446828402957103e-09, + "grad_condition": 445873699.40050447, + "lr": 0.0001732896980049473, + "time_sec": 15.619670867919922 + }, + { + "epoch": 110, + "train_loss": 0.20353743035316468, + "train_acc": 0.93482, + "test_loss": 1.986756645965576, + "test_acc": 0.6055, + "lyapunov": null, + "grad_norm": 0.5264966046483858, + "grad_max_sv": 0.2641640670597553, + "grad_min_sv": 9.887280825321421e-09, + "grad_condition": 138912649.1504107, + "lr": 0.00016543469682057076, + "time_sec": 15.631803512573242 + }, + { + "epoch": 111, + "train_loss": 0.20074854846000673, + "train_acc": 0.93586, + "test_loss": 1.9947669797897338, + "test_acc": 0.6121, + "lyapunov": null, + "grad_norm": 0.5275548784671268, + "grad_max_sv": 0.2535504408180714, + "grad_min_sv": 9.46079494620021e-09, + "grad_condition": 547036967.0533922, + "lr": 0.00015772644703565552, + "time_sec": 15.61940598487854 + }, + { + "epoch": 112, + "train_loss": 0.19321160237312318, + "train_acc": 0.9385, + "test_loss": 2.0327499378204346, + "test_acc": 0.6062, + "lyapunov": null, + "grad_norm": 0.5166537604057669, + "grad_max_sv": 0.25912084989249706, + "grad_min_sv": 9.35720720976474e-09, + "grad_condition": 95478514.06504653, + "lr": 0.00015016832974331713, + "time_sec": 15.630404233932495 + }, + { + "epoch": 113, + "train_loss": 0.19881929339408874, + "train_acc": 0.93676, + "test_loss": 1.9957002614974975, + "test_acc": 0.6131, + "lyapunov": null, + "grad_norm": 0.5256468964094271, + "grad_max_sv": 0.26186227425932884, + "grad_min_sv": 9.776758263992796e-09, + "grad_condition": 531930595.36185646, + "lr": 0.00014276366018359834, + "time_sec": 15.610270023345947 + }, + { + "epoch": 114, + "train_loss": 0.19278850085735322, + "train_acc": 0.93894, + "test_loss": 1.9826040161132812, + "test_acc": 0.6131, + "lyapunov": null, + "grad_norm": 0.5148800122190731, + "grad_max_sv": 0.2489961117506027, + "grad_min_sv": 9.322825122396599e-09, + "grad_condition": 159545806.21783024, + "lr": 0.00013551568628929425, + "time_sec": 15.641097784042358 + }, + { + "epoch": 115, + "train_loss": 0.18285285237312318, + "train_acc": 0.9414, + "test_loss": 1.991772039604187, + "test_acc": 0.6142, + "lyapunov": null, + "grad_norm": 0.5028991850276996, + "grad_max_sv": 0.25001580603420737, + "grad_min_sv": 9.509952834441983e-09, + "grad_condition": 842043304.8653241, + "lr": 0.00012842758726130276, + "time_sec": 15.624920845031738 + }, + { + "epoch": 116, + "train_loss": 0.18698999623775484, + "train_acc": 0.94058, + "test_loss": 2.0126701816558836, + "test_acc": 0.6119, + "lyapunov": null, + "grad_norm": 0.5095041564276453, + "grad_max_sv": 0.26496921889483926, + "grad_min_sv": 9.780998184343373e-09, + "grad_condition": 568079773.7667667, + "lr": 0.0001215024721741218, + "time_sec": 15.629492282867432 + }, + { + "epoch": 117, + "train_loss": 0.18326869733810425, + "train_acc": 0.94208, + "test_loss": 2.0141338161468507, + "test_acc": 0.6109, + "lyapunov": null, + "grad_norm": 0.5053898511223723, + "grad_max_sv": 0.25150991678237916, + "grad_min_sv": 9.336200610613604e-09, + "grad_condition": 1717749653.6011043, + "lr": 0.00011474337861210538, + "time_sec": 15.634049415588379 + }, + { + "epoch": 118, + "train_loss": 0.18224171819210053, + "train_acc": 0.94188, + "test_loss": 2.0296729431152345, + "test_acc": 0.6105, + "lyapunov": null, + "grad_norm": 0.5029285155771278, + "grad_max_sv": 0.23879224769771099, + "grad_min_sv": 8.82893005297973e-09, + "grad_condition": 239804345.46782646, + "lr": 0.00010815327133708009, + "time_sec": 15.628947496414185 + }, + { + "epoch": 119, + "train_loss": 0.18119296488761902, + "train_acc": 0.94198, + "test_loss": 2.0246818908691404, + "test_acc": 0.6087, + "lyapunov": null, + "grad_norm": 0.5032702983874193, + "grad_max_sv": 0.24678345806896687, + "grad_min_sv": 9.113220317789883e-09, + "grad_condition": 857312795.1343833, + "lr": 0.00010173504098790182, + "time_sec": 15.6134774684906 + }, + { + "epoch": 120, + "train_loss": 0.17719127690315248, + "train_acc": 0.9427, + "test_loss": 2.01081164188385, + "test_acc": 0.6174, + "lyapunov": null, + "grad_norm": 0.5004254149003725, + "grad_max_sv": 0.246440602093935, + "grad_min_sv": 9.41313048775233e-09, + "grad_condition": 138861626.69393042, + "lr": 9.549150281252629e-05, + "time_sec": 15.636605978012085 + }, + { + "epoch": 121, + "train_loss": 0.17499777765274047, + "train_acc": 0.94382, + "test_loss": 1.9586133924484252, + "test_acc": 0.6191, + "lyapunov": null, + "grad_norm": 0.49798749889404575, + "grad_max_sv": 0.24333747774362563, + "grad_min_sv": 8.965640931665048e-09, + "grad_condition": 199036180.79499412, + "lr": 8.942539543314794e-05, + "time_sec": 15.640979051589966 + }, + { + "epoch": 122, + "train_loss": 0.17186202396392822, + "train_acc": 0.94454, + "test_loss": 2.0166892234802245, + "test_acc": 0.6135, + "lyapunov": null, + "grad_norm": 0.49330378790067125, + "grad_max_sv": 0.25466611608862877, + "grad_min_sv": 9.453950847171378e-09, + "grad_condition": 478328271.5351636, + "lr": 8.353937964495024e-05, + "time_sec": 15.646830320358276 + }, + { + "epoch": 123, + "train_loss": 0.16818810626506805, + "train_acc": 0.94736, + "test_loss": 2.019712274169922, + "test_acc": 0.6142, + "lyapunov": null, + "grad_norm": 0.48351538018550005, + "grad_max_sv": 0.23057686612010003, + "grad_min_sv": 8.829706591578778e-09, + "grad_condition": 119186809.27894473, + "lr": 7.783603724899243e-05, + "time_sec": 15.61932897567749 + }, + { + "epoch": 124, + "train_loss": 0.1690133387851715, + "train_acc": 0.94626, + "test_loss": 2.0480916412353514, + "test_acc": 0.6128, + "lyapunov": null, + "grad_norm": 0.48572744080768737, + "grad_max_sv": 0.23872192315757274, + "grad_min_sv": 8.860755323661872e-09, + "grad_condition": 3145605466.955108, + "lr": 7.231786991974666e-05, + "time_sec": 15.644042730331421 + }, + { + "epoch": 125, + "train_loss": 0.168843046336174, + "train_acc": 0.94632, + "test_loss": 2.0204298835754395, + "test_acc": 0.6129, + "lyapunov": null, + "grad_norm": 0.4870048472763099, + "grad_max_sv": 0.23674570098519326, + "grad_min_sv": 8.746680829206827e-09, + "grad_condition": 1043463046.0193933, + "lr": 6.698729810778072e-05, + "time_sec": 15.637329578399658 + }, + { + "epoch": 126, + "train_loss": 0.1671668215227127, + "train_acc": 0.94594, + "test_loss": 2.002202911376953, + "test_acc": 0.6131, + "lyapunov": null, + "grad_norm": 0.48754920878473634, + "grad_max_sv": 0.24048108272254468, + "grad_min_sv": 9.09920443853407e-09, + "grad_condition": 222641480.08621296, + "lr": 6.184665997806817e-05, + "time_sec": 15.630179405212402 + }, + { + "epoch": 127, + "train_loss": 0.1643574129629135, + "train_acc": 0.94886, + "test_loss": 1.9984551259994507, + "test_acc": 0.6156, + "lyapunov": null, + "grad_norm": 0.47845542032939736, + "grad_max_sv": 0.24418257176876068, + "grad_min_sv": 9.058184188338348e-09, + "grad_condition": 1384258325.8409991, + "lr": 5.6898210384392595e-05, + "time_sec": 15.670144081115723 + }, + { + "epoch": 128, + "train_loss": 0.16359006194114686, + "train_acc": 0.9479, + "test_loss": 2.0345991184234617, + "test_acc": 0.6179, + "lyapunov": null, + "grad_norm": 0.48011615670673446, + "grad_max_sv": 0.2456669148057699, + "grad_min_sv": 9.08018520576876e-09, + "grad_condition": 6539583536.661702, + "lr": 5.214411988029363e-05, + "time_sec": 15.629289150238037 + }, + { + "epoch": 129, + "train_loss": 0.16212649368047713, + "train_acc": 0.94982, + "test_loss": 2.010682648849487, + "test_acc": 0.6175, + "lyapunov": null, + "grad_norm": 0.4761536550945564, + "grad_max_sv": 0.232033634185791, + "grad_min_sv": 8.589821504130924e-09, + "grad_condition": 3119446573.9156704, + "lr": 4.7586473766990294e-05, + "time_sec": 15.64078950881958 + }, + { + "epoch": 130, + "train_loss": 0.16086667060375215, + "train_acc": 0.94958, + "test_loss": 1.9803698434829713, + "test_acc": 0.6147, + "lyapunov": null, + "grad_norm": 0.47391205330881436, + "grad_max_sv": 0.2445445589721203, + "grad_min_sv": 8.864201939140243e-09, + "grad_condition": 1504896403.9424946, + "lr": 4.32272711786996e-05, + "time_sec": 15.639111280441284 + }, + { + "epoch": 131, + "train_loss": 0.1630353739786148, + "train_acc": 0.94778, + "test_loss": 2.0161276233673098, + "test_acc": 0.6182, + "lyapunov": null, + "grad_norm": 0.47703771588416854, + "grad_max_sv": 0.24524084888398648, + "grad_min_sv": 8.949330069585661e-09, + "grad_condition": 366306191.4994844, + "lr": 3.906842420574966e-05, + "time_sec": 15.648417472839355 + }, + { + "epoch": 132, + "train_loss": 0.1624550827550888, + "train_acc": 0.94854, + "test_loss": 2.0064841974258423, + "test_acc": 0.6153, + "lyapunov": null, + "grad_norm": 0.4818820971540279, + "grad_max_sv": 0.24392225965857506, + "grad_min_sv": 9.014241386749028e-09, + "grad_condition": 324500193.81381315, + "lr": 3.5111757055874305e-05, + "time_sec": 15.652456998825073 + }, + { + "epoch": 133, + "train_loss": 0.15666789950847626, + "train_acc": 0.95052, + "test_loss": 2.004924358177185, + "test_acc": 0.614, + "lyapunov": null, + "grad_norm": 0.4692967462799058, + "grad_max_sv": 0.23394662290811538, + "grad_min_sv": 8.633084696250959e-09, + "grad_condition": 738953051.583332, + "lr": 3.1359005254054254e-05, + "time_sec": 15.626720190048218 + }, + { + "epoch": 134, + "train_loss": 0.15714832616329194, + "train_acc": 0.951, + "test_loss": 1.9721798049926758, + "test_acc": 0.6189, + "lyapunov": null, + "grad_norm": 0.4708593375349624, + "grad_max_sv": 0.2399698007851839, + "grad_min_sv": 8.714008907333149e-09, + "grad_condition": 459943684.01348275, + "lr": 2.7811814881259484e-05, + "time_sec": 15.634363174438477 + }, + { + "epoch": 135, + "train_loss": 0.15481690949440002, + "train_acc": 0.95178, + "test_loss": 2.056765143966675, + "test_acc": 0.6141, + "lyapunov": null, + "grad_norm": 0.46512649923966126, + "grad_max_sv": 0.23735021129250528, + "grad_min_sv": 8.604525054706907e-09, + "grad_condition": 441311318.94657505, + "lr": 2.4471741852423218e-05, + "time_sec": 15.641301155090332 + }, + { + "epoch": 136, + "train_loss": 0.15590213608264922, + "train_acc": 0.95074, + "test_loss": 1.9664541049957276, + "test_acc": 0.615, + "lyapunov": null, + "grad_norm": 0.4718253897994526, + "grad_max_sv": 0.24445511549711227, + "grad_min_sv": 8.92059932467576e-09, + "grad_condition": 155779083.2595345, + "lr": 2.1340251233966362e-05, + "time_sec": 15.650960445404053 + }, + { + "epoch": 137, + "train_loss": 0.15185086236953735, + "train_acc": 0.95326, + "test_loss": 2.047826315307617, + "test_acc": 0.6137, + "lyapunov": null, + "grad_norm": 0.46215794046576214, + "grad_max_sv": 0.2249258290976286, + "grad_min_sv": 8.299157507572763e-09, + "grad_condition": 391195089.613189, + "lr": 1.8418716601170932e-05, + "time_sec": 15.619166374206543 + }, + { + "epoch": 138, + "train_loss": 0.15070438093185426, + "train_acc": 0.95262, + "test_loss": 2.030345579147339, + "test_acc": 0.6129, + "lyapunov": null, + "grad_norm": 0.4608066254891212, + "grad_max_sv": 0.234202978387475, + "grad_min_sv": 8.521646538895875e-09, + "grad_condition": 5129724937.383492, + "lr": 1.570841943568445e-05, + "time_sec": 15.623726606369019 + }, + { + "epoch": 139, + "train_loss": 0.15612281042575837, + "train_acc": 0.95076, + "test_loss": 2.0557478452682494, + "test_acc": 0.612, + "lyapunov": null, + "grad_norm": 0.47103497229286695, + "grad_max_sv": 0.23263695724308492, + "grad_min_sv": 8.57658385075566e-09, + "grad_condition": 101811752.76010731, + "lr": 1.3210548563419845e-05, + "time_sec": 15.65443754196167 + }, + { + "epoch": 140, + "train_loss": 0.15597544308423997, + "train_acc": 0.95086, + "test_loss": 1.9863805370330812, + "test_acc": 0.6151, + "lyapunov": null, + "grad_norm": 0.46515955894700917, + "grad_max_sv": 0.22864672914147377, + "grad_min_sv": 8.669487886083091e-09, + "grad_condition": 2093311134.8373718, + "lr": 1.0926199633097203e-05, + "time_sec": 15.636597394943237 + }, + { + "epoch": 141, + "train_loss": 0.15137063200950623, + "train_acc": 0.95232, + "test_loss": 2.0044470993041994, + "test_acc": 0.6185, + "lyapunov": null, + "grad_norm": 0.4628286057156769, + "grad_max_sv": 0.24093721210956573, + "grad_min_sv": 8.729446927135563e-09, + "grad_condition": 3146827225.783096, + "lr": 8.856374635655688e-06, + "time_sec": 15.6335289478302 + }, + { + "epoch": 142, + "train_loss": 0.15115962938308716, + "train_acc": 0.95278, + "test_loss": 1.9897070358276367, + "test_acc": 0.6186, + "lyapunov": null, + "grad_norm": 0.45849067649845243, + "grad_max_sv": 0.22538469620049, + "grad_min_sv": 8.402085760331798e-09, + "grad_condition": 1185010790.8687212, + "lr": 7.001981464747503e-06, + "time_sec": 15.64037299156189 + }, + { + "epoch": 143, + "train_loss": 0.15024116450309755, + "train_acc": 0.95378, + "test_loss": 1.9762957132339478, + "test_acc": 0.62, + "lyapunov": null, + "grad_norm": 0.4584088819764392, + "grad_max_sv": 0.22209009900689125, + "grad_min_sv": 8.452660355321145e-09, + "grad_condition": 1556012288.1682973, + "lr": 5.3638335185058295e-06, + "time_sec": 15.659480571746826 + }, + { + "epoch": 144, + "train_loss": 0.1521627188205719, + "train_acc": 0.95232, + "test_loss": 2.0099195236206056, + "test_acc": 0.615, + "lyapunov": null, + "grad_norm": 0.46494782588161737, + "grad_max_sv": 0.238496233522892, + "grad_min_sv": 8.729236520774175e-09, + "grad_condition": 69857580.46396288, + "lr": 3.942649342761114e-06, + "time_sec": 15.64352297782898 + }, + { + "epoch": 145, + "train_loss": 0.15200012585163117, + "train_acc": 0.95196, + "test_loss": 1.98911852684021, + "test_acc": 0.6161, + "lyapunov": null, + "grad_norm": 0.46350518405517277, + "grad_max_sv": 0.22944532111287116, + "grad_min_sv": 8.441616768887356e-09, + "grad_condition": 1044568693.4332545, + "lr": 2.7390523158633524e-06, + "time_sec": 15.670719385147095 + }, + { + "epoch": 146, + "train_loss": 0.1524506710958481, + "train_acc": 0.95248, + "test_loss": 1.9624867490768432, + "test_acc": 0.6194, + "lyapunov": null, + "grad_norm": 0.46296967599985495, + "grad_max_sv": 0.24031115397810937, + "grad_min_sv": 8.944420498528671e-09, + "grad_condition": 254633054.1592765, + "lr": 1.7535703752478133e-06, + "time_sec": 15.643468141555786 + }, + { + "epoch": 147, + "train_loss": 0.15344970943927766, + "train_acc": 0.95206, + "test_loss": 2.0164750316619875, + "test_acc": 0.6171, + "lyapunov": null, + "grad_norm": 0.4641053248109342, + "grad_max_sv": 0.24226672500371932, + "grad_min_sv": 8.89504937415242e-09, + "grad_condition": 221436071.47224984, + "lr": 9.866357858642196e-07, + "time_sec": 15.642008066177368 + }, + { + "epoch": 148, + "train_loss": 0.15008926822185517, + "train_acc": 0.95316, + "test_loss": 2.007580140686035, + "test_acc": 0.6105, + "lyapunov": null, + "grad_norm": 0.4593316495579621, + "grad_max_sv": 0.23314933404326438, + "grad_min_sv": 8.37392370464738e-09, + "grad_condition": 1235759721.5215242, + "lr": 4.38584950570808e-07, + "time_sec": 15.637904644012451 + }, + { + "epoch": 149, + "train_loss": 0.1545172585248947, + "train_acc": 0.95082, + "test_loss": 1.9932567636489869, + "test_acc": 0.6167, + "lyapunov": null, + "grad_norm": 0.46711595173344705, + "grad_max_sv": 0.24011613838374615, + "grad_min_sv": 9.01919292514708e-09, + "grad_condition": 533582982.17976344, + "lr": 1.096582625772501e-07, + "time_sec": 15.649343013763428 + }, + { + "epoch": 150, + "train_loss": 0.15159378504276275, + "train_acc": 0.95298, + "test_loss": 1.981881332397461, + "test_acc": 0.6151, + "lyapunov": null, + "grad_norm": 0.4631918119140012, + "grad_max_sv": 0.23626054041087627, + "grad_min_sv": 8.505257114788459e-09, + "grad_condition": 368578452.6540891, + "lr": 0.0, + "time_sec": 15.655460119247437 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 4.193410815277099, + "train_acc": 0.07754, + "test_loss": 4.000027540588379, + "test_acc": 0.1084, + "lyapunov": null, + "grad_norm": 5.824766820168824, + "grad_max_sv": 4.574610841274262, + "grad_min_sv": 1.0190309995827818e-07, + "grad_condition": 64142283.19081552, + "lr": 0.0009998903417374227, + "time_sec": 32.83128619194031 + }, + { + "epoch": 2, + "train_loss": 3.561303809967041, + "train_acc": 0.15712, + "test_loss": 3.590533604812622, + "test_acc": 0.1573, + "lyapunov": null, + "grad_norm": 3.9411000996615257, + "grad_max_sv": 2.8509309351444245, + "grad_min_sv": 7.158311222943414e-08, + "grad_condition": 97792152.02989444, + "lr": 0.0009995614150494292, + "time_sec": 32.72442889213562 + }, + { + "epoch": 3, + "train_loss": 3.1933692501068114, + "train_acc": 0.21822, + "test_loss": 3.4406786922454833, + "test_acc": 0.1888, + "lyapunov": null, + "grad_norm": 2.91352219919842, + "grad_max_sv": 1.9122859120368958, + "grad_min_sv": 5.4513909730768975e-08, + "grad_condition": 41901882.724198125, + "lr": 0.0009990133642141358, + "time_sec": 32.71043276786804 + }, + { + "epoch": 4, + "train_loss": 2.9170604755401612, + "train_acc": 0.266, + "test_loss": 3.0161821269989013, + "test_acc": 0.2662, + "lyapunov": null, + "grad_norm": 2.4579814839971488, + "grad_max_sv": 1.375921016931534, + "grad_min_sv": 4.532563397940948e-08, + "grad_condition": 34954497.395048514, + "lr": 0.0009982464296247522, + "time_sec": 32.71440148353577 + }, + { + "epoch": 5, + "train_loss": 2.6815094689941406, + "train_acc": 0.31454, + "test_loss": 3.171553889846802, + "test_acc": 0.2379, + "lyapunov": null, + "grad_norm": 2.19104728864566, + "grad_max_sv": 1.1679374247789382, + "grad_min_sv": 4.075679240767016e-08, + "grad_condition": 34176946.0056582, + "lr": 0.0009972609476841367, + "time_sec": 32.70787262916565 + }, + { + "epoch": 6, + "train_loss": 2.512476542663574, + "train_acc": 0.34722, + "test_loss": 2.8388263694763185, + "test_acc": 0.2956, + "lyapunov": null, + "grad_norm": 2.024852807897748, + "grad_max_sv": 1.048439186811447, + "grad_min_sv": 3.766053036924344e-08, + "grad_condition": 110646045.40063909, + "lr": 0.000996057350657239, + "time_sec": 32.716644048690796 + }, + { + "epoch": 7, + "train_loss": 2.3700338256072997, + "train_acc": 0.37646, + "test_loss": 2.664342771148682, + "test_acc": 0.3267, + "lyapunov": null, + "grad_norm": 1.8863637744279735, + "grad_max_sv": 0.9381255134940147, + "grad_min_sv": 3.53045587958567e-08, + "grad_condition": 91691166.21261387, + "lr": 0.000994636166481494, + "time_sec": 32.70954084396362 + }, + { + "epoch": 8, + "train_loss": 2.241964275894165, + "train_acc": 0.40536, + "test_loss": 2.3703575309753417, + "test_acc": 0.3827, + "lyapunov": null, + "grad_norm": 1.79442458506404, + "grad_max_sv": 0.8764713048934937, + "grad_min_sv": 3.357538055498432e-08, + "grad_condition": 85483165.80410945, + "lr": 0.0009929980185352525, + "time_sec": 32.705676794052124 + }, + { + "epoch": 9, + "train_loss": 2.1290865299224855, + "train_acc": 0.43074, + "test_loss": 2.346775402069092, + "test_acc": 0.3898, + "lyapunov": null, + "grad_norm": 1.6946660597355347, + "grad_max_sv": 0.8082527592778206, + "grad_min_sv": 3.168056596919433e-08, + "grad_condition": 84022920.74591663, + "lr": 0.0009911436253643444, + "time_sec": 32.81319451332092 + }, + { + "epoch": 10, + "train_loss": 2.0410905982208254, + "train_acc": 0.45114, + "test_loss": 2.352191310119629, + "test_acc": 0.4016, + "lyapunov": null, + "grad_norm": 1.6077351393537498, + "grad_max_sv": 0.7309410408139229, + "grad_min_sv": 2.985739961935963e-08, + "grad_condition": 36398179.92957014, + "lr": 0.0009890738003669028, + "time_sec": 32.67559885978699 + }, + { + "epoch": 11, + "train_loss": 1.9488755139160157, + "train_acc": 0.47108, + "test_loss": 2.292022847747803, + "test_acc": 0.4149, + "lyapunov": null, + "grad_norm": 1.5472074192305951, + "grad_max_sv": 0.6999917805194855, + "grad_min_sv": 2.931911482484395e-08, + "grad_condition": 29185684.451776367, + "lr": 0.00098678945143658, + "time_sec": 32.67131185531616 + }, + { + "epoch": 12, + "train_loss": 1.8751110802459716, + "train_acc": 0.48868, + "test_loss": 2.234260977935791, + "test_acc": 0.4219, + "lyapunov": null, + "grad_norm": 1.477638716923594, + "grad_max_sv": 0.647687041759491, + "grad_min_sv": 2.7830199432477e-08, + "grad_condition": 45906260.41435587, + "lr": 0.0009842915805643154, + "time_sec": 32.67626142501831 + }, + { + "epoch": 13, + "train_loss": 1.8070984636688232, + "train_acc": 0.50424, + "test_loss": 2.1869627113342287, + "test_acc": 0.4348, + "lyapunov": null, + "grad_norm": 1.4268137700999757, + "grad_max_sv": 0.6230859503149986, + "grad_min_sv": 2.6403634246358056e-08, + "grad_condition": 81962325.61583482, + "lr": 0.000981581283398829, + "time_sec": 32.71280646324158 + }, + { + "epoch": 14, + "train_loss": 1.7594015161895753, + "train_acc": 0.51666, + "test_loss": 2.225412437438965, + "test_acc": 0.4269, + "lyapunov": null, + "grad_norm": 1.3750641538015655, + "grad_max_sv": 0.5909776814281941, + "grad_min_sv": 2.5812447444067965e-08, + "grad_condition": 110809015.48631673, + "lr": 0.0009786597487660333, + "time_sec": 32.71353602409363 + }, + { + "epoch": 15, + "train_loss": 1.7050045301437378, + "train_acc": 0.5265, + "test_loss": 2.2115724647521975, + "test_acc": 0.4374, + "lyapunov": null, + "grad_norm": 1.3299355868966125, + "grad_max_sv": 0.5802051067352295, + "grad_min_sv": 2.5246993384797634e-08, + "grad_condition": 26653204.194885753, + "lr": 0.0009755282581475766, + "time_sec": 32.709041357040405 + }, + { + "epoch": 16, + "train_loss": 1.6458034181976318, + "train_acc": 0.54052, + "test_loss": 2.3288159313201904, + "test_acc": 0.4224, + "lyapunov": null, + "grad_norm": 1.2807898189857698, + "grad_max_sv": 0.5446614563465119, + "grad_min_sv": 2.4021811557278783e-08, + "grad_condition": 91338509.7437632, + "lr": 0.0009721881851187403, + "time_sec": 32.697059869766235 + }, + { + "epoch": 17, + "train_loss": 1.5929106069946288, + "train_acc": 0.55406, + "test_loss": 2.1113224380493163, + "test_acc": 0.4616, + "lyapunov": null, + "grad_norm": 1.2337526465020512, + "grad_max_sv": 0.5095916628837586, + "grad_min_sv": 2.2903062109336237e-08, + "grad_condition": 57294649.60211961, + "lr": 0.0009686409947459456, + "time_sec": 32.683470726013184 + }, + { + "epoch": 18, + "train_loss": 1.5314323492813111, + "train_acc": 0.5677, + "test_loss": 2.091776432800293, + "test_acc": 0.47, + "lyapunov": null, + "grad_norm": 1.1978845665370097, + "grad_max_sv": 0.5015841260552406, + "grad_min_sv": 2.2305156793800408e-08, + "grad_condition": 29492886.216326892, + "lr": 0.0009648882429441254, + "time_sec": 32.737040281295776 + }, + { + "epoch": 19, + "train_loss": 1.5103012445449828, + "train_acc": 0.57236, + "test_loss": 2.0679006351470948, + "test_acc": 0.4779, + "lyapunov": null, + "grad_norm": 1.1728126223162796, + "grad_max_sv": 0.4839314170181751, + "grad_min_sv": 2.174818596739625e-08, + "grad_condition": 107997783.86314659, + "lr": 0.00096093157579425, + "time_sec": 32.67225241661072 + }, + { + "epoch": 20, + "train_loss": 1.4595962884140015, + "train_acc": 0.58662, + "test_loss": 2.1169062660217284, + "test_acc": 0.4706, + "lyapunov": null, + "grad_norm": 1.1438665670784203, + "grad_max_sv": 0.469496750831604, + "grad_min_sv": 2.1164104392623617e-08, + "grad_condition": 64696771.4776402, + "lr": 0.0009567727288213001, + "time_sec": 32.6800582408905 + }, + { + "epoch": 21, + "train_loss": 1.42210446144104, + "train_acc": 0.59338, + "test_loss": 2.0751025535583496, + "test_acc": 0.4744, + "lyapunov": null, + "grad_norm": 1.1159812479247186, + "grad_max_sv": 0.45728652998805047, + "grad_min_sv": 2.1470654895661135e-08, + "grad_condition": 28760658.649009824, + "lr": 0.0009524135262330095, + "time_sec": 32.680222272872925 + }, + { + "epoch": 22, + "train_loss": 1.3733370163345338, + "train_acc": 0.60568, + "test_loss": 2.1397033340454104, + "test_acc": 0.4725, + "lyapunov": null, + "grad_norm": 1.0820101912101088, + "grad_max_sv": 0.4380739636719227, + "grad_min_sv": 2.027442237706456e-08, + "grad_condition": 33804989.22411772, + "lr": 0.0009478558801197061, + "time_sec": 32.683854818344116 + }, + { + "epoch": 23, + "train_loss": 1.3259621669006347, + "train_acc": 0.61976, + "test_loss": 2.082161441612244, + "test_acc": 0.4868, + "lyapunov": null, + "grad_norm": 1.0590598804772053, + "grad_max_sv": 0.4320934973657131, + "grad_min_sv": 1.9754895681789452e-08, + "grad_condition": 49199633.36386584, + "lr": 0.000943101789615607, + "time_sec": 32.705042362213135 + }, + { + "epoch": 24, + "train_loss": 1.3155639976882934, + "train_acc": 0.62032, + "test_loss": 2.108880234527588, + "test_acc": 0.4823, + "lyapunov": null, + "grad_norm": 1.046890854380851, + "grad_max_sv": 0.42886915877461435, + "grad_min_sv": 1.9609551714372398e-08, + "grad_condition": 41053712.713573575, + "lr": 0.0009381533400219313, + "time_sec": 32.71632719039917 + }, + { + "epoch": 25, + "train_loss": 1.273603660621643, + "train_acc": 0.63364, + "test_loss": 2.0933273361206055, + "test_acc": 0.4852, + "lyapunov": null, + "grad_norm": 1.024436079028184, + "grad_max_sv": 0.41587754189968107, + "grad_min_sv": 1.9385000169652723e-08, + "grad_condition": 51992204.20794226, + "lr": 0.0009330127018922189, + "time_sec": 32.702069997787476 + }, + { + "epoch": 26, + "train_loss": 1.2419982319259644, + "train_acc": 0.6399, + "test_loss": 2.1144972944259646, + "test_acc": 0.4865, + "lyapunov": null, + "grad_norm": 1.0088705466095338, + "grad_max_sv": 0.39710880219936373, + "grad_min_sv": 1.870035526846392e-08, + "grad_condition": 181692609.81395656, + "lr": 0.000927682130080253, + "time_sec": 32.707526445388794 + }, + { + "epoch": 27, + "train_loss": 1.2189629228973389, + "train_acc": 0.6436, + "test_loss": 2.204226477432251, + "test_acc": 0.476, + "lyapunov": null, + "grad_norm": 0.9979053902708439, + "grad_max_sv": 0.3974333480000496, + "grad_min_sv": 1.8178674205185376e-08, + "grad_condition": 88033285.18865582, + "lr": 0.0009221639627510072, + "time_sec": 32.74215221405029 + }, + { + "epoch": 28, + "train_loss": 1.196308147392273, + "train_acc": 0.65004, + "test_loss": 2.3723191680908204, + "test_acc": 0.4591, + "lyapunov": null, + "grad_norm": 0.975077074369322, + "grad_max_sv": 0.40025187358260156, + "grad_min_sv": 1.829182182389033e-08, + "grad_condition": 38849966.98297453, + "lr": 0.0009164606203550494, + "time_sec": 32.70245599746704 + }, + { + "epoch": 29, + "train_loss": 1.1692425540161133, + "train_acc": 0.65714, + "test_loss": 2.2748174949645996, + "test_acc": 0.4746, + "lyapunov": null, + "grad_norm": 0.9656994259472406, + "grad_max_sv": 0.3973592549562454, + "grad_min_sv": 1.812226688574503e-08, + "grad_condition": 39408166.232041776, + "lr": 0.0009105746045668516, + "time_sec": 32.71292495727539 + }, + { + "epoch": 30, + "train_loss": 1.1311084144973755, + "train_acc": 0.66644, + "test_loss": 2.1602066425323487, + "test_acc": 0.4933, + "lyapunov": null, + "grad_norm": 0.9503788281741601, + "grad_max_sv": 0.3813568793237209, + "grad_min_sv": 1.7537509381174154e-08, + "grad_condition": 91136622.64604397, + "lr": 0.0009045084971874733, + "time_sec": 32.729275941848755 + }, + { + "epoch": 31, + "train_loss": 1.107859415283203, + "train_acc": 0.67202, + "test_loss": 2.088518197631836, + "test_acc": 0.5149, + "lyapunov": null, + "grad_norm": 0.946846205217341, + "grad_max_sv": 0.38662919625639913, + "grad_min_sv": 1.787647136014536e-08, + "grad_condition": 37247674.11503151, + "lr": 0.0008982649590120977, + "time_sec": 32.724801540374756 + }, + { + "epoch": 32, + "train_loss": 1.075172028541565, + "train_acc": 0.68254, + "test_loss": 2.11543652381897, + "test_acc": 0.5052, + "lyapunov": null, + "grad_norm": 0.919583751793241, + "grad_max_sv": 0.37590193301439284, + "grad_min_sv": 1.7335351598646298e-08, + "grad_condition": 32173699.63890195, + "lr": 0.0008918467286629196, + "time_sec": 32.70777225494385 + }, + { + "epoch": 33, + "train_loss": 1.0526020958709716, + "train_acc": 0.68626, + "test_loss": 2.283646846008301, + "test_acc": 0.4816, + "lyapunov": null, + "grad_norm": 0.9156820464594853, + "grad_max_sv": 0.37288443073630334, + "grad_min_sv": 1.682198175895211e-08, + "grad_condition": 41766926.72855186, + "lr": 0.0008852566213878943, + "time_sec": 32.71830630302429 + }, + { + "epoch": 34, + "train_loss": 1.0363747980117797, + "train_acc": 0.69038, + "test_loss": 2.207733528137207, + "test_acc": 0.4943, + "lyapunov": null, + "grad_norm": 0.9077261463073804, + "grad_max_sv": 0.3598011791706085, + "grad_min_sv": 1.6353098675377097e-08, + "grad_condition": 114742140.57000451, + "lr": 0.000878497527825878, + "time_sec": 32.70716309547424 + }, + { + "epoch": 35, + "train_loss": 1.0068622560119629, + "train_acc": 0.69648, + "test_loss": 2.274261113357544, + "test_acc": 0.489, + "lyapunov": null, + "grad_norm": 0.8883949473822523, + "grad_max_sv": 0.3505275271832943, + "grad_min_sv": 1.6455692852801463e-08, + "grad_condition": 31982637.47738139, + "lr": 0.000871572412738697, + "time_sec": 32.704782009124756 + }, + { + "epoch": 36, + "train_loss": 0.9864518771362305, + "train_acc": 0.7021, + "test_loss": 2.3541188930511474, + "test_acc": 0.4898, + "lyapunov": null, + "grad_norm": 0.8736045940658475, + "grad_max_sv": 0.3457980893552303, + "grad_min_sv": 1.5842762313145187e-08, + "grad_condition": 32188123.411770713, + "lr": 0.0008644843137107055, + "time_sec": 32.691269397735596 + }, + { + "epoch": 37, + "train_loss": 0.9681263439178467, + "train_acc": 0.7075, + "test_loss": 2.195126131439209, + "test_acc": 0.5033, + "lyapunov": null, + "grad_norm": 0.8711424558239054, + "grad_max_sv": 0.34736732244491575, + "grad_min_sv": 1.5827014727270993e-08, + "grad_condition": 66500862.978035614, + "lr": 0.0008572363398164014, + "time_sec": 32.69683265686035 + }, + { + "epoch": 38, + "train_loss": 0.9408467683601379, + "train_acc": 0.71608, + "test_loss": 2.1800164726257325, + "test_acc": 0.5109, + "lyapunov": null, + "grad_norm": 0.8497079289449048, + "grad_max_sv": 0.33491997644305227, + "grad_min_sv": 1.5505913916746828e-08, + "grad_condition": 37981645.21243934, + "lr": 0.0008498316702566826, + "time_sec": 32.67169213294983 + }, + { + "epoch": 39, + "train_loss": 0.9174955882263184, + "train_acc": 0.7231, + "test_loss": 2.332292454910278, + "test_acc": 0.4984, + "lyapunov": null, + "grad_norm": 0.8483669541798352, + "grad_max_sv": 0.3449387975037098, + "grad_min_sv": 1.5716625918760217e-08, + "grad_condition": 38753621.785681486, + "lr": 0.0008422735529643442, + "time_sec": 32.668078660964966 + }, + { + "epoch": 40, + "train_loss": 0.8970937779045105, + "train_acc": 0.72826, + "test_loss": 2.282168871688843, + "test_acc": 0.5053, + "lyapunov": null, + "grad_norm": 0.8354606142013189, + "grad_max_sv": 0.3270870424807072, + "grad_min_sv": 1.5267581635058926e-08, + "grad_condition": 95751205.07057047, + "lr": 0.0008345653031794289, + "time_sec": 32.70110583305359 + }, + { + "epoch": 41, + "train_loss": 0.8763418362236023, + "train_acc": 0.73382, + "test_loss": 2.3397656742095947, + "test_acc": 0.504, + "lyapunov": null, + "grad_norm": 0.8300379125306362, + "grad_max_sv": 0.33984693363308904, + "grad_min_sv": 1.5102269786126942e-08, + "grad_condition": 36575363.166415855, + "lr": 0.0008267103019950526, + "time_sec": 32.68285536766052 + }, + { + "epoch": 42, + "train_loss": 0.8614973092651367, + "train_acc": 0.73702, + "test_loss": 2.217091986083984, + "test_acc": 0.513, + "lyapunov": null, + "grad_norm": 0.8218045461669631, + "grad_max_sv": 0.32567850723862646, + "grad_min_sv": 1.507071445694397e-08, + "grad_condition": 48789917.15280264, + "lr": 0.0008187119948743447, + "time_sec": 32.685330867767334 + }, + { + "epoch": 43, + "train_loss": 0.8463610815429687, + "train_acc": 0.74162, + "test_loss": 2.238330067062378, + "test_acc": 0.5145, + "lyapunov": null, + "grad_norm": 0.8111621240187793, + "grad_max_sv": 0.3245612893253565, + "grad_min_sv": 1.4757356182567606e-08, + "grad_condition": 2265212011.074665, + "lr": 0.000810573890139155, + "time_sec": 32.6937038898468 + }, + { + "epoch": 44, + "train_loss": 0.8388264699935913, + "train_acc": 0.7425, + "test_loss": 2.2916201137542727, + "test_acc": 0.5146, + "lyapunov": null, + "grad_norm": 0.806013800687461, + "grad_max_sv": 0.3360877387225628, + "grad_min_sv": 1.4701122835053537e-08, + "grad_condition": 56062708.17707713, + "lr": 0.0008022995574311873, + "time_sec": 32.70379972457886 + }, + { + "epoch": 45, + "train_loss": 0.8080853428649902, + "train_acc": 0.75246, + "test_loss": 2.31492944984436, + "test_acc": 0.519, + "lyapunov": null, + "grad_norm": 0.7954463291291034, + "grad_max_sv": 0.3197424054145813, + "grad_min_sv": 1.4746050645180267e-08, + "grad_condition": 648957804.3057442, + "lr": 0.0007938926261462363, + "time_sec": 32.704816579818726 + }, + { + "epoch": 46, + "train_loss": 0.8025041796875, + "train_acc": 0.753, + "test_loss": 2.3807359542846678, + "test_acc": 0.5181, + "lyapunov": null, + "grad_norm": 0.7945005415191121, + "grad_max_sv": 0.31871558651328086, + "grad_min_sv": 1.4457539215806392e-08, + "grad_condition": 62012558.50813458, + "lr": 0.0007853567838422158, + "time_sec": 32.7154860496521 + }, + { + "epoch": 47, + "train_loss": 0.7847597545051574, + "train_acc": 0.75886, + "test_loss": 2.305859538269043, + "test_acc": 0.5185, + "lyapunov": null, + "grad_norm": 0.7791668550262338, + "grad_max_sv": 0.3171059262007475, + "grad_min_sv": 1.4160447076028148e-08, + "grad_condition": 51678874.24460314, + "lr": 0.0007766957746216719, + "time_sec": 32.71022868156433 + }, + { + "epoch": 48, + "train_loss": 0.7660661986160279, + "train_acc": 0.7635, + "test_loss": 2.373494161605835, + "test_acc": 0.5197, + "lyapunov": null, + "grad_norm": 0.7662493930118918, + "grad_max_sv": 0.3144552931189537, + "grad_min_sv": 1.4124776402668626e-08, + "grad_condition": 42937106.53672977, + "lr": 0.0007679133974894982, + "time_sec": 32.722716093063354 + }, + { + "epoch": 49, + "train_loss": 0.7557950233268738, + "train_acc": 0.76584, + "test_loss": 2.2862959323883056, + "test_acc": 0.5222, + "lyapunov": null, + "grad_norm": 0.7719008014476091, + "grad_max_sv": 0.3158703289926052, + "grad_min_sv": 1.4232268583103113e-08, + "grad_condition": 39203631.14441905, + "lr": 0.000759013504686565, + "time_sec": 32.71821331977844 + }, + { + "epoch": 50, + "train_loss": 0.7287120180892944, + "train_acc": 0.77398, + "test_loss": 2.2880530021667482, + "test_acc": 0.5331, + "lyapunov": null, + "grad_norm": 0.7580370777565381, + "grad_max_sv": 0.31812012754380703, + "grad_min_sv": 1.3956443738194491e-08, + "grad_condition": 56488826.56667278, + "lr": 0.0007499999999999998, + "time_sec": 32.74500012397766 + }, + { + "epoch": 51, + "train_loss": 0.7047131567382813, + "train_acc": 0.77944, + "test_loss": 2.3342226333618163, + "test_acc": 0.5242, + "lyapunov": null, + "grad_norm": 0.7467723064599141, + "grad_max_sv": 0.3062335759401321, + "grad_min_sv": 1.365980890968843e-08, + "grad_condition": 48288096.27243978, + "lr": 0.0007408768370508575, + "time_sec": 32.73174715042114 + }, + { + "epoch": 52, + "train_loss": 0.701608234500885, + "train_acc": 0.78146, + "test_loss": 2.4530138679504394, + "test_acc": 0.5151, + "lyapunov": null, + "grad_norm": 0.744474034267783, + "grad_max_sv": 0.31273389905691146, + "grad_min_sv": 1.386061017072393e-08, + "grad_condition": 128824936.60768087, + "lr": 0.0007316480175599307, + "time_sec": 32.70361828804016 + }, + { + "epoch": 53, + "train_loss": 0.6784094618415832, + "train_acc": 0.7874, + "test_loss": 2.3597243209838865, + "test_acc": 0.5275, + "lyapunov": null, + "grad_norm": 0.7374795544632287, + "grad_max_sv": 0.30512114986777306, + "grad_min_sv": 1.3410438691116578e-08, + "grad_condition": 185757572.3538422, + "lr": 0.0007223175895924635, + "time_sec": 32.71756291389465 + }, + { + "epoch": 54, + "train_loss": 0.6558182954406738, + "train_acc": 0.795, + "test_loss": 2.376951601028442, + "test_acc": 0.5316, + "lyapunov": null, + "grad_norm": 0.7251324903072741, + "grad_max_sv": 0.2987603921443224, + "grad_min_sv": 1.2931078906264214e-08, + "grad_condition": 35614928.216609366, + "lr": 0.0007128896457825361, + "time_sec": 32.73335146903992 + }, + { + "epoch": 55, + "train_loss": 0.6438722687911987, + "train_acc": 0.79842, + "test_loss": 2.4439307792663576, + "test_acc": 0.5237, + "lyapunov": null, + "grad_norm": 0.7208427013257759, + "grad_max_sv": 0.2992406666278839, + "grad_min_sv": 1.321393890141298e-08, + "grad_condition": 86775812.1538335, + "lr": 0.0007033683215378998, + "time_sec": 32.714346408843994 + }, + { + "epoch": 56, + "train_loss": 0.6417430144309998, + "train_acc": 0.7972, + "test_loss": 2.3790397010803224, + "test_acc": 0.5275, + "lyapunov": null, + "grad_norm": 0.7192864641522134, + "grad_max_sv": 0.2877038486301899, + "grad_min_sv": 1.3027487994767515e-08, + "grad_condition": 758527469.2650627, + "lr": 0.0006937577932260512, + "time_sec": 32.70229887962341 + }, + { + "epoch": 57, + "train_loss": 0.6262681634902955, + "train_acc": 0.803, + "test_loss": 2.401387868881226, + "test_acc": 0.5319, + "lyapunov": null, + "grad_norm": 0.7121380891152584, + "grad_max_sv": 0.2965920139104128, + "grad_min_sv": 1.279559212457454e-08, + "grad_condition": 184239403.66627008, + "lr": 0.0006840622763423388, + "time_sec": 32.71753239631653 + }, + { + "epoch": 58, + "train_loss": 0.6120203521347046, + "train_acc": 0.80732, + "test_loss": 2.503086555862427, + "test_acc": 0.5165, + "lyapunov": null, + "grad_norm": 0.7090038692309348, + "grad_max_sv": 0.2882195271551609, + "grad_min_sv": 1.2676824923812945e-08, + "grad_condition": 64942214.60915594, + "lr": 0.0006742860236609073, + "time_sec": 32.75395059585571 + }, + { + "epoch": 59, + "train_loss": 0.5998075243473053, + "train_acc": 0.81224, + "test_loss": 2.4825798515319826, + "test_acc": 0.5223, + "lyapunov": null, + "grad_norm": 0.7030307704517706, + "grad_max_sv": 0.28765259496867657, + "grad_min_sv": 1.2779274688370229e-08, + "grad_condition": 182642047.07290906, + "lr": 0.0006644333233692913, + "time_sec": 32.70982766151428 + }, + { + "epoch": 60, + "train_loss": 0.5948525179862976, + "train_acc": 0.81162, + "test_loss": 2.5030276454925535, + "test_acc": 0.5207, + "lyapunov": null, + "grad_norm": 0.7026252294626018, + "grad_max_sv": 0.2934992775321007, + "grad_min_sv": 1.284481914573185e-08, + "grad_condition": 541914476.4363593, + "lr": 0.0006545084971874734, + "time_sec": 32.69038796424866 + }, + { + "epoch": 61, + "train_loss": 0.572040382938385, + "train_acc": 0.81932, + "test_loss": 2.5733165519714354, + "test_acc": 0.5197, + "lyapunov": null, + "grad_norm": 0.6845429439823613, + "grad_max_sv": 0.28906508460640906, + "grad_min_sv": 1.2416446168797556e-08, + "grad_condition": 83143739.39889392, + "lr": 0.0006445158984722354, + "time_sec": 32.70990490913391 + }, + { + "epoch": 62, + "train_loss": 0.5523873634338379, + "train_acc": 0.82446, + "test_loss": 2.563892342758179, + "test_acc": 0.5248, + "lyapunov": null, + "grad_norm": 0.677689496712232, + "grad_max_sv": 0.2810227505862713, + "grad_min_sv": 1.2061726063945787e-08, + "grad_condition": 161335990.45839816, + "lr": 0.0006344599103076324, + "time_sec": 32.714717864990234 + }, + { + "epoch": 63, + "train_loss": 0.537570647277832, + "train_acc": 0.82928, + "test_loss": 2.5110877151489257, + "test_acc": 0.5309, + "lyapunov": null, + "grad_norm": 0.6752075838217867, + "grad_max_sv": 0.2918707847595215, + "grad_min_sv": 1.2428116336060669e-08, + "grad_condition": 62614290.824099444, + "lr": 0.0006243449435824269, + "time_sec": 32.73838663101196 + }, + { + "epoch": 64, + "train_loss": 0.525590337715149, + "train_acc": 0.83162, + "test_loss": 2.5260006717681884, + "test_acc": 0.5365, + "lyapunov": null, + "grad_norm": 0.6614195891575191, + "grad_max_sv": 0.2785448797047138, + "grad_min_sv": 1.2074160667119305e-08, + "grad_condition": 68726347.69115171, + "lr": 0.0006141754350553275, + "time_sec": 32.716681241989136 + }, + { + "epoch": 65, + "train_loss": 0.506968226633072, + "train_acc": 0.83974, + "test_loss": 2.4551146259307863, + "test_acc": 0.5332, + "lyapunov": null, + "grad_norm": 0.6515058246983421, + "grad_max_sv": 0.28096592277288435, + "grad_min_sv": 1.183612223995545e-08, + "grad_condition": 56796145.61117469, + "lr": 0.0006039558454088793, + "time_sec": 32.72992730140686 + }, + { + "epoch": 66, + "train_loss": 0.5121252582931518, + "train_acc": 0.8359, + "test_loss": 2.4647022022247316, + "test_acc": 0.5374, + "lyapunov": null, + "grad_norm": 0.6569185851243321, + "grad_max_sv": 0.2686118472367525, + "grad_min_sv": 1.1671607616763752e-08, + "grad_condition": 198976036.41965005, + "lr": 0.000593690657292862, + "time_sec": 32.737778425216675 + }, + { + "epoch": 67, + "train_loss": 0.5035950432968139, + "train_acc": 0.83814, + "test_loss": 2.5104728435516357, + "test_acc": 0.5334, + "lyapunov": null, + "grad_norm": 0.6543970572426195, + "grad_max_sv": 0.27697036042809486, + "grad_min_sv": 1.1793683101109492e-08, + "grad_condition": 2176927259.024586, + "lr": 0.0005833843733580507, + "time_sec": 32.73714327812195 + }, + { + "epoch": 68, + "train_loss": 0.4827924027252197, + "train_acc": 0.8449, + "test_loss": 2.483680333328247, + "test_acc": 0.5362, + "lyapunov": null, + "grad_norm": 0.6424274790982618, + "grad_max_sv": 0.26836494021117685, + "grad_min_sv": 1.1452091713826107e-08, + "grad_condition": 64248156.31133513, + "lr": 0.0005730415142812054, + "time_sec": 32.73483109474182 + }, + { + "epoch": 69, + "train_loss": 0.463097783498764, + "train_acc": 0.85106, + "test_loss": 2.5873930728912353, + "test_acc": 0.5352, + "lyapunov": null, + "grad_norm": 0.6283493250843613, + "grad_max_sv": 0.26704199202358725, + "grad_min_sv": 1.1449700967197662e-08, + "grad_condition": 133571192.62172851, + "lr": 0.0005626666167821517, + "time_sec": 32.76736545562744 + }, + { + "epoch": 70, + "train_loss": 0.45964255402565, + "train_acc": 0.8516, + "test_loss": 2.4906038509368895, + "test_acc": 0.5466, + "lyapunov": null, + "grad_norm": 0.6392818623657084, + "grad_max_sv": 0.2811981987208128, + "grad_min_sv": 1.1691557246645834e-08, + "grad_condition": 83552341.63512965, + "lr": 0.0005522642316338265, + "time_sec": 32.76137971878052 + }, + { + "epoch": 71, + "train_loss": 0.44885221929550173, + "train_acc": 0.85536, + "test_loss": 2.5581497470855714, + "test_acc": 0.5417, + "lyapunov": null, + "grad_norm": 0.627505222045094, + "grad_max_sv": 0.2669704511761665, + "grad_min_sv": 1.135505285909666e-08, + "grad_condition": 55019996.6299631, + "lr": 0.0005418389216661573, + "time_sec": 32.754613161087036 + }, + { + "epoch": 72, + "train_loss": 0.4373334138870239, + "train_acc": 0.85988, + "test_loss": 2.5293708190917967, + "test_acc": 0.5385, + "lyapunov": null, + "grad_norm": 0.6228439231508988, + "grad_max_sv": 0.27325935252010825, + "grad_min_sv": 1.1285354627535438e-08, + "grad_condition": 404302529.70424557, + "lr": 0.0005313952597646563, + "time_sec": 32.747488260269165 + }, + { + "epoch": 73, + "train_loss": 0.43413398032188416, + "train_acc": 0.86118, + "test_loss": 2.59562434463501, + "test_acc": 0.5355, + "lyapunov": null, + "grad_norm": 0.6246623504935193, + "grad_max_sv": 0.26360294707119464, + "grad_min_sv": 1.0827903220485963e-08, + "grad_condition": 202498413.83885324, + "lr": 0.0005209378268645994, + "time_sec": 32.75055932998657 + }, + { + "epoch": 74, + "train_loss": 0.42070443333625795, + "train_acc": 0.86404, + "test_loss": 2.620591529083252, + "test_acc": 0.5311, + "lyapunov": null, + "grad_norm": 0.6160094351570171, + "grad_max_sv": 0.2604650367051363, + "grad_min_sv": 1.0893297332399688e-08, + "grad_condition": 109053309.86634846, + "lr": 0.0005104712099416781, + "time_sec": 32.766777753829956 + }, + { + "epoch": 75, + "train_loss": 0.41482046060562133, + "train_acc": 0.86586, + "test_loss": 2.6253975078582763, + "test_acc": 0.5364, + "lyapunov": null, + "grad_norm": 0.614383474689519, + "grad_max_sv": 0.2657254245132208, + "grad_min_sv": 1.1066643729282667e-08, + "grad_condition": 1358046707.310991, + "lr": 0.0004999999999999996, + "time_sec": 32.753093004226685 + }, + { + "epoch": 76, + "train_loss": 0.40771523109436036, + "train_acc": 0.8674, + "test_loss": 2.7234753631591797, + "test_acc": 0.5307, + "lyapunov": null, + "grad_norm": 0.6089832611690313, + "grad_max_sv": 0.2631608698517084, + "grad_min_sv": 1.1065733136576827e-08, + "grad_condition": 124518956.20538023, + "lr": 0.0004895287900583212, + "time_sec": 32.7672004699707 + }, + { + "epoch": 77, + "train_loss": 0.3850809427070618, + "train_acc": 0.87682, + "test_loss": 2.6585358211517334, + "test_acc": 0.5378, + "lyapunov": null, + "grad_norm": 0.5905288728439135, + "grad_max_sv": 0.2512054055929184, + "grad_min_sv": 1.0597189950382891e-08, + "grad_condition": 141685910.93483096, + "lr": 0.0004790621731353997, + "time_sec": 32.75537824630737 + }, + { + "epoch": 78, + "train_loss": 0.3790111728191376, + "train_acc": 0.87892, + "test_loss": 2.6925399055480956, + "test_acc": 0.5368, + "lyapunov": null, + "grad_norm": 0.5936477423986493, + "grad_max_sv": 0.2708817757666111, + "grad_min_sv": 1.0561610550192946e-08, + "grad_condition": 244253851.38396016, + "lr": 0.000468604740235343, + "time_sec": 32.734121561050415 + }, + { + "epoch": 79, + "train_loss": 0.376044921131134, + "train_acc": 0.87726, + "test_loss": 2.6398166637420655, + "test_acc": 0.5322, + "lyapunov": null, + "grad_norm": 0.5949427297273714, + "grad_max_sv": 0.2605267588049173, + "grad_min_sv": 1.0820864476679404e-08, + "grad_condition": 62663126.18808526, + "lr": 0.00045816107833384175, + "time_sec": 32.72508406639099 + }, + { + "epoch": 80, + "train_loss": 0.3590127901649475, + "train_acc": 0.88356, + "test_loss": 2.6562103397369383, + "test_acc": 0.5313, + "lyapunov": null, + "grad_norm": 0.57614839106705, + "grad_max_sv": 0.2479171995073557, + "grad_min_sv": 1.0216514026700069e-08, + "grad_condition": 168918888.0387075, + "lr": 0.0004477357683661729, + "time_sec": 32.7580771446228 + }, + { + "epoch": 81, + "train_loss": 0.35495832427978513, + "train_acc": 0.88512, + "test_loss": 2.6037187816619873, + "test_acc": 0.5424, + "lyapunov": null, + "grad_norm": 0.5731602731960765, + "grad_max_sv": 0.2532364260405302, + "grad_min_sv": 1.0580176048897299e-08, + "grad_condition": 286643189.9936029, + "lr": 0.00043733338321784746, + "time_sec": 32.72826409339905 + }, + { + "epoch": 82, + "train_loss": 0.3466758195114136, + "train_acc": 0.88818, + "test_loss": 2.6409978286743163, + "test_acc": 0.5399, + "lyapunov": null, + "grad_norm": 0.5643305573749353, + "grad_max_sv": 0.25191599801182746, + "grad_min_sv": 9.937639448582419e-09, + "grad_condition": 418028032.15621006, + "lr": 0.0004269584857187939, + "time_sec": 32.73789381980896 + }, + { + "epoch": 83, + "train_loss": 0.337517634677887, + "train_acc": 0.89068, + "test_loss": 2.6804797424316407, + "test_acc": 0.5387, + "lyapunov": null, + "grad_norm": 0.5635653171134332, + "grad_max_sv": 0.24921411760151385, + "grad_min_sv": 1.007469917777351e-08, + "grad_condition": 232954348.7021001, + "lr": 0.0004166156266419484, + "time_sec": 32.75311326980591 + }, + { + "epoch": 84, + "train_loss": 0.32895935908317564, + "train_acc": 0.89278, + "test_loss": 2.670875820159912, + "test_acc": 0.5417, + "lyapunov": null, + "grad_norm": 0.5604425901768842, + "grad_max_sv": 0.25350802317261695, + "grad_min_sv": 1.0073376105132481e-08, + "grad_condition": 810741849.6024733, + "lr": 0.0004063093427071373, + "time_sec": 32.75568342208862 + }, + { + "epoch": 85, + "train_loss": 0.31874533922195436, + "train_acc": 0.89668, + "test_loss": 2.726188472366333, + "test_acc": 0.5437, + "lyapunov": null, + "grad_norm": 0.5474219905771217, + "grad_max_sv": 0.24635729603469372, + "grad_min_sv": 9.822750767244857e-09, + "grad_condition": 407705693.9191896, + "lr": 0.0003960441545911199, + "time_sec": 32.74805927276611 + }, + { + "epoch": 86, + "train_loss": 0.3149368803215027, + "train_acc": 0.89756, + "test_loss": 2.7214178714752197, + "test_acc": 0.5419, + "lyapunov": null, + "grad_norm": 0.5494081042104078, + "grad_max_sv": 0.2415832221508026, + "grad_min_sv": 9.84441673934286e-09, + "grad_condition": 259925587.23227444, + "lr": 0.0003858245649446718, + "time_sec": 32.80679273605347 + }, + { + "epoch": 87, + "train_loss": 0.3021876361656189, + "train_acc": 0.9004, + "test_loss": 2.7706982093811034, + "test_acc": 0.5429, + "lyapunov": null, + "grad_norm": 0.5427208210607071, + "grad_max_sv": 0.24498338885605336, + "grad_min_sv": 9.92075648437174e-09, + "grad_condition": 232757368.44567218, + "lr": 0.00037565505641757235, + "time_sec": 32.76810097694397 + }, + { + "epoch": 88, + "train_loss": 0.297262005405426, + "train_acc": 0.90436, + "test_loss": 2.736396257019043, + "test_acc": 0.5423, + "lyapunov": null, + "grad_norm": 0.5343970285585263, + "grad_max_sv": 0.24844259656965734, + "grad_min_sv": 9.910514466504247e-09, + "grad_condition": 1110263065.3705904, + "lr": 0.00036554008969236695, + "time_sec": 32.74753546714783 + }, + { + "epoch": 89, + "train_loss": 0.28578209706306457, + "train_acc": 0.90734, + "test_loss": 2.850689685058594, + "test_acc": 0.5399, + "lyapunov": null, + "grad_norm": 0.5254402888094797, + "grad_max_sv": 0.23409140817821025, + "grad_min_sv": 9.523284056017854e-09, + "grad_condition": 1231623659.8277283, + "lr": 0.0003554841015277638, + "time_sec": 32.79159116744995 + }, + { + "epoch": 90, + "train_loss": 0.2832814686203003, + "train_acc": 0.90616, + "test_loss": 2.8175382946014405, + "test_acc": 0.537, + "lyapunov": null, + "grad_norm": 0.5216211125471195, + "grad_max_sv": 0.23542476668953896, + "grad_min_sv": 9.459231551322244e-09, + "grad_condition": 1301223464.6618998, + "lr": 0.000345491502812526, + "time_sec": 32.78084850311279 + }, + { + "epoch": 91, + "train_loss": 0.28347388619422914, + "train_acc": 0.90788, + "test_loss": 2.831140581512451, + "test_acc": 0.5444, + "lyapunov": null, + "grad_norm": 0.5319613521776031, + "grad_max_sv": 0.23012890443205833, + "grad_min_sv": 9.377407441096135e-09, + "grad_condition": 228524276.50434837, + "lr": 0.0003355666766307081, + "time_sec": 32.71651744842529 + }, + { + "epoch": 92, + "train_loss": 0.27393528344631196, + "train_acc": 0.91052, + "test_loss": 2.775809415435791, + "test_acc": 0.545, + "lyapunov": null, + "grad_norm": 0.5149918732183307, + "grad_max_sv": 0.23977560102939605, + "grad_min_sv": 9.41244274865055e-09, + "grad_condition": 202495109.8759535, + "lr": 0.00032571397633909225, + "time_sec": 32.70667123794556 + }, + { + "epoch": 93, + "train_loss": 0.2638559838104248, + "train_acc": 0.9163, + "test_loss": 2.7468856441497804, + "test_acc": 0.5537, + "lyapunov": null, + "grad_norm": 0.5066198396238114, + "grad_max_sv": 0.23251476027071477, + "grad_min_sv": 9.16693782366737e-09, + "grad_condition": 232699226.05631667, + "lr": 0.00031593772365766094, + "time_sec": 32.71683645248413 + }, + { + "epoch": 94, + "train_loss": 0.25781995408058167, + "train_acc": 0.9156, + "test_loss": 2.771767431640625, + "test_acc": 0.5456, + "lyapunov": null, + "grad_norm": 0.5052996090758677, + "grad_max_sv": 0.23510573096573353, + "grad_min_sv": 8.963649589916433e-09, + "grad_condition": 1701543645.1210911, + "lr": 0.0003062422067739483, + "time_sec": 32.713576555252075 + }, + { + "epoch": 95, + "train_loss": 0.25086621726989744, + "train_acc": 0.91784, + "test_loss": 2.8765688217163086, + "test_acc": 0.5451, + "lyapunov": null, + "grad_norm": 0.49975532415921886, + "grad_max_sv": 0.236967783421278, + "grad_min_sv": 9.25259010277346e-09, + "grad_condition": 145241238.20565036, + "lr": 0.00029663167846209965, + "time_sec": 32.73633694648743 + }, + { + "epoch": 96, + "train_loss": 0.24672197101354598, + "train_acc": 0.91946, + "test_loss": 2.8446786346435546, + "test_acc": 0.5438, + "lyapunov": null, + "grad_norm": 0.49641090183932196, + "grad_max_sv": 0.22625510580837727, + "grad_min_sv": 8.7457359089553e-09, + "grad_condition": 1836850483.766, + "lr": 0.00028711035421746345, + "time_sec": 32.76619052886963 + }, + { + "epoch": 97, + "train_loss": 0.23921704626083373, + "train_acc": 0.92148, + "test_loss": 2.797951399230957, + "test_acc": 0.5532, + "lyapunov": null, + "grad_norm": 0.49423071935175245, + "grad_max_sv": 0.24016087874770164, + "grad_min_sv": 8.990743178508703e-09, + "grad_condition": 210059856.3178285, + "lr": 0.00027768241040753615, + "time_sec": 32.82350516319275 + }, + { + "epoch": 98, + "train_loss": 0.23695792595386506, + "train_acc": 0.9223, + "test_loss": 2.8982477020263673, + "test_acc": 0.5432, + "lyapunov": null, + "grad_norm": 0.4903348629723419, + "grad_max_sv": 0.22139078341424465, + "grad_min_sv": 8.704557989333561e-09, + "grad_condition": 233405578.91055053, + "lr": 0.00026835198244006903, + "time_sec": 32.75874900817871 + }, + { + "epoch": 99, + "train_loss": 0.22282506870508195, + "train_acc": 0.92698, + "test_loss": 2.896362300491333, + "test_acc": 0.544, + "lyapunov": null, + "grad_norm": 0.4754599951900147, + "grad_max_sv": 0.22327796779572964, + "grad_min_sv": 8.601119547287876e-09, + "grad_condition": 868925326.22085, + "lr": 0.0002591231629491421, + "time_sec": 32.74084424972534 + }, + { + "epoch": 100, + "train_loss": 0.22439868947982788, + "train_acc": 0.92668, + "test_loss": 2.888060118484497, + "test_acc": 0.553, + "lyapunov": null, + "grad_norm": 0.4789261726309551, + "grad_max_sv": 0.22355457432568074, + "grad_min_sv": 8.837810024564172e-09, + "grad_condition": 804604193.8746045, + "lr": 0.0002499999999999997, + "time_sec": 32.76948523521423 + }, + { + "epoch": 101, + "train_loss": 0.21471880633354187, + "train_acc": 0.93042, + "test_loss": 2.926622017288208, + "test_acc": 0.5459, + "lyapunov": null, + "grad_norm": 0.46758839629635496, + "grad_max_sv": 0.2257686872035265, + "grad_min_sv": 8.604181156836657e-09, + "grad_condition": 364480196.7882508, + "lr": 0.00024098649531343477, + "time_sec": 32.761115312576294 + }, + { + "epoch": 102, + "train_loss": 0.20999815567016603, + "train_acc": 0.93128, + "test_loss": 2.7882490966796873, + "test_acc": 0.5578, + "lyapunov": null, + "grad_norm": 0.46851254306004025, + "grad_max_sv": 0.21838495172560216, + "grad_min_sv": 8.37696591199713e-09, + "grad_condition": 1510396720.662658, + "lr": 0.0002320866025105016, + "time_sec": 32.72404432296753 + }, + { + "epoch": 103, + "train_loss": 0.20526846901893617, + "train_acc": 0.93262, + "test_loss": 2.8693388496398926, + "test_acc": 0.554, + "lyapunov": null, + "grad_norm": 0.4589602275699082, + "grad_max_sv": 0.22509709745645523, + "grad_min_sv": 8.420789482605027e-09, + "grad_condition": 1371218202.1419, + "lr": 0.0002233042253783278, + "time_sec": 32.752496004104614 + }, + { + "epoch": 104, + "train_loss": 0.20646339273929595, + "train_acc": 0.9335, + "test_loss": 2.89330929107666, + "test_acc": 0.5483, + "lyapunov": null, + "grad_norm": 0.46636768633733616, + "grad_max_sv": 0.22183220721781255, + "grad_min_sv": 8.39393208819329e-09, + "grad_condition": 1827094910.9746387, + "lr": 0.000214643216157784, + "time_sec": 32.74421238899231 + }, + { + "epoch": 105, + "train_loss": 0.20053612211227417, + "train_acc": 0.93402, + "test_loss": 2.904328105926514, + "test_acc": 0.5506, + "lyapunov": null, + "grad_norm": 0.45700070764272066, + "grad_max_sv": 0.21747002471238375, + "grad_min_sv": 8.216160540282366e-09, + "grad_condition": 1664593727.1128445, + "lr": 0.00020610737385376332, + "time_sec": 32.724817991256714 + }, + { + "epoch": 106, + "train_loss": 0.1944782396030426, + "train_acc": 0.9362, + "test_loss": 2.8657500442504884, + "test_acc": 0.5488, + "lyapunov": null, + "grad_norm": 0.44687014031192024, + "grad_max_sv": 0.2213790450245142, + "grad_min_sv": 8.454356608192382e-09, + "grad_condition": 127028340.10294946, + "lr": 0.00019770044256881242, + "time_sec": 32.7451388835907 + }, + { + "epoch": 107, + "train_loss": 0.19279775314331055, + "train_acc": 0.93688, + "test_loss": 2.898486404800415, + "test_acc": 0.5523, + "lyapunov": null, + "grad_norm": 0.44614463029775897, + "grad_max_sv": 0.2167466938495636, + "grad_min_sv": 8.415876304873615e-09, + "grad_condition": 262012758.78866345, + "lr": 0.0001894261098608447, + "time_sec": 32.76267623901367 + }, + { + "epoch": 108, + "train_loss": 0.1886401759147644, + "train_acc": 0.93904, + "test_loss": 2.833827450942993, + "test_acc": 0.5567, + "lyapunov": null, + "grad_norm": 0.4435964290199411, + "grad_max_sv": 0.2225849311798811, + "grad_min_sv": 8.340220883015782e-09, + "grad_condition": 118785929.89668731, + "lr": 0.000181288005125655, + "time_sec": 32.86235594749451 + }, + { + "epoch": 109, + "train_loss": 0.1890174783563614, + "train_acc": 0.93882, + "test_loss": 2.941585520553589, + "test_acc": 0.5491, + "lyapunov": null, + "grad_norm": 0.4464239579148638, + "grad_max_sv": 0.21364586874842645, + "grad_min_sv": 8.245146911967442e-09, + "grad_condition": 716792612.4830931, + "lr": 0.0001732896980049473, + "time_sec": 32.74325895309448 + }, + { + "epoch": 110, + "train_loss": 0.18055749108314514, + "train_acc": 0.94126, + "test_loss": 2.9359549655914305, + "test_acc": 0.5517, + "lyapunov": null, + "grad_norm": 0.4349334962787559, + "grad_max_sv": 0.2089217260479927, + "grad_min_sv": 8.043115946556504e-09, + "grad_condition": 2200871643.370809, + "lr": 0.00016543469682057076, + "time_sec": 32.756227016448975 + }, + { + "epoch": 111, + "train_loss": 0.17659846026420592, + "train_acc": 0.9445, + "test_loss": 2.904285785675049, + "test_acc": 0.5552, + "lyapunov": null, + "grad_norm": 0.4288194869102633, + "grad_max_sv": 0.2133932262659073, + "grad_min_sv": 7.951804889029523e-09, + "grad_condition": 127160230.15537345, + "lr": 0.00015772644703565552, + "time_sec": 32.73052453994751 + }, + { + "epoch": 112, + "train_loss": 0.17598180088996887, + "train_acc": 0.9431, + "test_loss": 2.916234812545776, + "test_acc": 0.5566, + "lyapunov": null, + "grad_norm": 0.43046200088706854, + "grad_max_sv": 0.21027521118521691, + "grad_min_sv": 8.006027082247107e-09, + "grad_condition": 1303838738.9934053, + "lr": 0.00015016832974331713, + "time_sec": 32.737369775772095 + }, + { + "epoch": 113, + "train_loss": 0.167477658700943, + "train_acc": 0.94562, + "test_loss": 2.930574794006348, + "test_acc": 0.5492, + "lyapunov": null, + "grad_norm": 0.4188552255465725, + "grad_max_sv": 0.2074826244264841, + "grad_min_sv": 7.807182782865966e-09, + "grad_condition": 1013028230.5722786, + "lr": 0.00014276366018359834, + "time_sec": 32.78035497665405 + }, + { + "epoch": 114, + "train_loss": 0.16470729023933411, + "train_acc": 0.94658, + "test_loss": 2.9235076808929445, + "test_acc": 0.55, + "lyapunov": null, + "grad_norm": 0.4196468917250276, + "grad_max_sv": 0.2061817307025194, + "grad_min_sv": 7.639872719872321e-09, + "grad_condition": 147774842.88971734, + "lr": 0.00013551568628929425, + "time_sec": 32.71555685997009 + }, + { + "epoch": 115, + "train_loss": 0.15979129463195801, + "train_acc": 0.95014, + "test_loss": 2.8977687450408935, + "test_acc": 0.5554, + "lyapunov": null, + "grad_norm": 0.4109842368882969, + "grad_max_sv": 0.20125124976038933, + "grad_min_sv": 7.641511092990049e-09, + "grad_condition": 152806383.8905374, + "lr": 0.00012842758726130276, + "time_sec": 32.74684023857117 + }, + { + "epoch": 116, + "train_loss": 0.15650701507091522, + "train_acc": 0.94994, + "test_loss": 2.963372290420532, + "test_acc": 0.5536, + "lyapunov": null, + "grad_norm": 0.40714256168185947, + "grad_max_sv": 0.21380255445837976, + "grad_min_sv": 7.601124127343262e-09, + "grad_condition": 187963441.14469656, + "lr": 0.0001215024721741218, + "time_sec": 32.740856885910034 + }, + { + "epoch": 117, + "train_loss": 0.15483391536712646, + "train_acc": 0.95134, + "test_loss": 2.9223466384887695, + "test_acc": 0.5589, + "lyapunov": null, + "grad_norm": 0.4061085309679021, + "grad_max_sv": 0.20323452018201352, + "grad_min_sv": 7.630000256912337e-09, + "grad_condition": 541093755.1409919, + "lr": 0.00011474337861210538, + "time_sec": 32.71646022796631 + }, + { + "epoch": 118, + "train_loss": 0.15986083958148956, + "train_acc": 0.9476, + "test_loss": 2.890314678955078, + "test_acc": 0.5619, + "lyapunov": null, + "grad_norm": 0.4176419876084519, + "grad_max_sv": 0.20986161157488822, + "grad_min_sv": 7.767054953627256e-09, + "grad_condition": 181416124.9826005, + "lr": 0.00010815327133708009, + "time_sec": 32.71689772605896 + }, + { + "epoch": 119, + "train_loss": 0.15443852434635164, + "train_acc": 0.95028, + "test_loss": 2.9833076015472413, + "test_acc": 0.5504, + "lyapunov": null, + "grad_norm": 0.4094461556500699, + "grad_max_sv": 0.20980317294597625, + "grad_min_sv": 7.66585938392992e-09, + "grad_condition": 1289363850.184981, + "lr": 0.00010173504098790182, + "time_sec": 32.76529359817505 + }, + { + "epoch": 120, + "train_loss": 0.1513664803981781, + "train_acc": 0.95076, + "test_loss": 2.9521168746948243, + "test_acc": 0.5535, + "lyapunov": null, + "grad_norm": 0.40458507675773164, + "grad_max_sv": 0.2091453868895769, + "grad_min_sv": 7.546225789991506e-09, + "grad_condition": 191790265.63931364, + "lr": 9.549150281252629e-05, + "time_sec": 32.75906276702881 + }, + { + "epoch": 121, + "train_loss": 0.1482712536096573, + "train_acc": 0.95224, + "test_loss": 3.008343357849121, + "test_acc": 0.5524, + "lyapunov": null, + "grad_norm": 0.40250293552115596, + "grad_max_sv": 0.20429235510528088, + "grad_min_sv": 7.4167842699346915e-09, + "grad_condition": 1004863133.4087012, + "lr": 8.942539543314794e-05, + "time_sec": 32.738195180892944 + }, + { + "epoch": 122, + "train_loss": 0.1433233982515335, + "train_acc": 0.95406, + "test_loss": 2.8811149784088137, + "test_acc": 0.5615, + "lyapunov": null, + "grad_norm": 0.3918685762307977, + "grad_max_sv": 0.21150657180696725, + "grad_min_sv": 7.566205814736106e-09, + "grad_condition": 4864615061.542827, + "lr": 8.353937964495024e-05, + "time_sec": 32.760249853134155 + }, + { + "epoch": 123, + "train_loss": 0.140904153547287, + "train_acc": 0.95554, + "test_loss": 3.0434706832885743, + "test_acc": 0.5488, + "lyapunov": null, + "grad_norm": 0.39134340646439314, + "grad_max_sv": 0.21096068248152733, + "grad_min_sv": 7.420657745899582e-09, + "grad_condition": 474788541.70389444, + "lr": 7.783603724899243e-05, + "time_sec": 32.84018850326538 + }, + { + "epoch": 124, + "train_loss": 0.1424632687997818, + "train_acc": 0.95448, + "test_loss": 3.006509048843384, + "test_acc": 0.5549, + "lyapunov": null, + "grad_norm": 0.3952350465926858, + "grad_max_sv": 0.20579442996531724, + "grad_min_sv": 7.2102639599776894e-09, + "grad_condition": 640121523.7171735, + "lr": 7.231786991974666e-05, + "time_sec": 32.73241114616394 + }, + { + "epoch": 125, + "train_loss": 0.13608443251609803, + "train_acc": 0.95782, + "test_loss": 2.9692224075317384, + "test_acc": 0.5578, + "lyapunov": null, + "grad_norm": 0.38466881950137, + "grad_max_sv": 0.19782444536685945, + "grad_min_sv": 7.223557173946516e-09, + "grad_condition": 248263306.50433522, + "lr": 6.698729810778072e-05, + "time_sec": 32.678467988967896 + }, + { + "epoch": 126, + "train_loss": 0.13552211750030518, + "train_acc": 0.95626, + "test_loss": 3.032096587371826, + "test_acc": 0.5536, + "lyapunov": null, + "grad_norm": 0.3837934860475664, + "grad_max_sv": 0.19592427872121335, + "grad_min_sv": 7.1880338589928525e-09, + "grad_condition": 1098788620.3456562, + "lr": 6.184665997806817e-05, + "time_sec": 32.70717906951904 + }, + { + "epoch": 127, + "train_loss": 0.1351850691795349, + "train_acc": 0.95776, + "test_loss": 2.9195703174591063, + "test_acc": 0.5604, + "lyapunov": null, + "grad_norm": 0.3835199995919498, + "grad_max_sv": 0.19671063385903836, + "grad_min_sv": 7.301026294463924e-09, + "grad_condition": 998102013.5820692, + "lr": 5.6898210384392595e-05, + "time_sec": 32.741135597229004 + }, + { + "epoch": 128, + "train_loss": 0.13267261865139007, + "train_acc": 0.95764, + "test_loss": 2.9626207927703856, + "test_acc": 0.5545, + "lyapunov": null, + "grad_norm": 0.3832565427194031, + "grad_max_sv": 0.2010548248887062, + "grad_min_sv": 7.084323496310118e-09, + "grad_condition": 1908110316.0124466, + "lr": 5.214411988029363e-05, + "time_sec": 32.724841356277466 + }, + { + "epoch": 129, + "train_loss": 0.13098865546941757, + "train_acc": 0.95846, + "test_loss": 3.011842226791382, + "test_acc": 0.5506, + "lyapunov": null, + "grad_norm": 0.37939468237880797, + "grad_max_sv": 0.20046190060675145, + "grad_min_sv": 7.379042803222838e-09, + "grad_condition": 356098689.45926607, + "lr": 4.7586473766990294e-05, + "time_sec": 32.721606492996216 + }, + { + "epoch": 130, + "train_loss": 0.12933046006202698, + "train_acc": 0.95886, + "test_loss": 3.0411768558502197, + "test_acc": 0.5527, + "lyapunov": null, + "grad_norm": 0.37924053294163973, + "grad_max_sv": 0.20988954231142998, + "grad_min_sv": 7.388776484596772e-09, + "grad_condition": 554124327.4297839, + "lr": 4.32272711786996e-05, + "time_sec": 32.76217794418335 + }, + { + "epoch": 131, + "train_loss": 0.12891825794219972, + "train_acc": 0.95952, + "test_loss": 3.000077504730225, + "test_acc": 0.5546, + "lyapunov": null, + "grad_norm": 0.3741869428415791, + "grad_max_sv": 0.1881616409868002, + "grad_min_sv": 7.156842123405213e-09, + "grad_condition": 312499495.3085783, + "lr": 3.906842420574966e-05, + "time_sec": 32.74306511878967 + }, + { + "epoch": 132, + "train_loss": 0.12583676107883454, + "train_acc": 0.96062, + "test_loss": 3.0664391510009765, + "test_acc": 0.5534, + "lyapunov": null, + "grad_norm": 0.3704229743876738, + "grad_max_sv": 0.19701430164277553, + "grad_min_sv": 7.223526106328419e-09, + "grad_condition": 1413194923.3587193, + "lr": 3.5111757055874305e-05, + "time_sec": 32.808775424957275 + }, + { + "epoch": 133, + "train_loss": 0.13008767341136931, + "train_acc": 0.95896, + "test_loss": 3.0139704319000242, + "test_acc": 0.5574, + "lyapunov": null, + "grad_norm": 0.3764215368002029, + "grad_max_sv": 0.18944438602775335, + "grad_min_sv": 7.082572564553764e-09, + "grad_condition": 874087736.501687, + "lr": 3.1359005254054254e-05, + "time_sec": 32.82065176963806 + }, + { + "epoch": 134, + "train_loss": 0.1276783154821396, + "train_acc": 0.95996, + "test_loss": 3.022883545303345, + "test_acc": 0.5532, + "lyapunov": null, + "grad_norm": 0.375861463579636, + "grad_max_sv": 0.20601846650242805, + "grad_min_sv": 6.996468762177945e-09, + "grad_condition": 1890410555.4428897, + "lr": 2.7811814881259484e-05, + "time_sec": 32.80414128303528 + }, + { + "epoch": 135, + "train_loss": 0.12308010986804963, + "train_acc": 0.9606, + "test_loss": 2.9876843898773195, + "test_acc": 0.5593, + "lyapunov": null, + "grad_norm": 0.36736730687062175, + "grad_max_sv": 0.19790339954197406, + "grad_min_sv": 7.039625574654928e-09, + "grad_condition": 157775177.85623857, + "lr": 2.4471741852423218e-05, + "time_sec": 32.851438760757446 + }, + { + "epoch": 136, + "train_loss": 0.12776446427345275, + "train_acc": 0.96144, + "test_loss": 3.0140146301269533, + "test_acc": 0.5535, + "lyapunov": null, + "grad_norm": 0.3714043891983977, + "grad_max_sv": 0.19383110255002975, + "grad_min_sv": 7.2285312062653555e-09, + "grad_condition": 999433479.7051426, + "lr": 2.1340251233966362e-05, + "time_sec": 32.794949769973755 + }, + { + "epoch": 137, + "train_loss": 0.12337936633110047, + "train_acc": 0.96152, + "test_loss": 2.9756490589141844, + "test_acc": 0.5589, + "lyapunov": null, + "grad_norm": 0.36599462716404635, + "grad_max_sv": 0.18621533513069152, + "grad_min_sv": 6.8799666707621e-09, + "grad_condition": 2633273626.2954164, + "lr": 1.8418716601170932e-05, + "time_sec": 32.78418707847595 + }, + { + "epoch": 138, + "train_loss": 0.12530339601516724, + "train_acc": 0.96096, + "test_loss": 2.9389760871887205, + "test_acc": 0.5643, + "lyapunov": null, + "grad_norm": 0.36857224147370304, + "grad_max_sv": 0.19519462659955025, + "grad_min_sv": 7.2010847566817904e-09, + "grad_condition": 1104132755.735764, + "lr": 1.570841943568445e-05, + "time_sec": 32.72880840301514 + }, + { + "epoch": 139, + "train_loss": 0.12289305024623871, + "train_acc": 0.9611, + "test_loss": 3.0236512790679932, + "test_acc": 0.5543, + "lyapunov": null, + "grad_norm": 0.3682552501598832, + "grad_max_sv": 0.20100074261426926, + "grad_min_sv": 7.34378154774052e-09, + "grad_condition": 1520683884.3197339, + "lr": 1.3210548563419845e-05, + "time_sec": 32.78127360343933 + }, + { + "epoch": 140, + "train_loss": 0.12596595900058746, + "train_acc": 0.95946, + "test_loss": 2.973658073425293, + "test_acc": 0.561, + "lyapunov": null, + "grad_norm": 0.3717079213334779, + "grad_max_sv": 0.1950546268373728, + "grad_min_sv": 7.189997905268728e-09, + "grad_condition": 1974792452.4561849, + "lr": 1.0926199633097203e-05, + "time_sec": 32.781864643096924 + }, + { + "epoch": 141, + "train_loss": 0.12001886625289918, + "train_acc": 0.96264, + "test_loss": 2.990137744522095, + "test_acc": 0.5583, + "lyapunov": null, + "grad_norm": 0.3612101803004304, + "grad_max_sv": 0.19684142302721738, + "grad_min_sv": 7.084273648266673e-09, + "grad_condition": 1957601954.2835248, + "lr": 8.856374635655688e-06, + "time_sec": 32.77344870567322 + }, + { + "epoch": 142, + "train_loss": 0.12250841891288758, + "train_acc": 0.96208, + "test_loss": 3.0072501789093016, + "test_acc": 0.557, + "lyapunov": null, + "grad_norm": 0.3656411150745857, + "grad_max_sv": 0.18694628309458494, + "grad_min_sv": 6.765250024683839e-09, + "grad_condition": 728041100.7004558, + "lr": 7.001981464747503e-06, + "time_sec": 32.78335380554199 + }, + { + "epoch": 143, + "train_loss": 0.12062059470653534, + "train_acc": 0.96196, + "test_loss": 2.9649132221221923, + "test_acc": 0.5592, + "lyapunov": null, + "grad_norm": 0.36372343649597894, + "grad_max_sv": 0.19535562619566918, + "grad_min_sv": 6.99444468851753e-09, + "grad_condition": 1233101804.7440555, + "lr": 5.3638335185058295e-06, + "time_sec": 32.80367183685303 + }, + { + "epoch": 144, + "train_loss": 0.12207864775896073, + "train_acc": 0.96178, + "test_loss": 3.036870691680908, + "test_acc": 0.5574, + "lyapunov": null, + "grad_norm": 0.3636070415011162, + "grad_max_sv": 0.20035785287618638, + "grad_min_sv": 7.128019625154275e-09, + "grad_condition": 171713281.12199268, + "lr": 3.942649342761114e-06, + "time_sec": 32.81153345108032 + }, + { + "epoch": 145, + "train_loss": 0.11943841837644577, + "train_acc": 0.96326, + "test_loss": 2.9936345024108886, + "test_acc": 0.5606, + "lyapunov": null, + "grad_norm": 0.3616987855339011, + "grad_max_sv": 0.19010693076997995, + "grad_min_sv": 6.951608487104404e-09, + "grad_condition": 4475866647.186778, + "lr": 2.7390523158633524e-06, + "time_sec": 32.77432584762573 + }, + { + "epoch": 146, + "train_loss": 0.12161365668535233, + "train_acc": 0.96184, + "test_loss": 3.0051653202056885, + "test_acc": 0.5534, + "lyapunov": null, + "grad_norm": 0.36606365240898514, + "grad_max_sv": 0.19566274229437114, + "grad_min_sv": 7.090793683911957e-09, + "grad_condition": 1292263099.7971816, + "lr": 1.7535703752478133e-06, + "time_sec": 32.722100257873535 + }, + { + "epoch": 147, + "train_loss": 0.11985450011253357, + "train_acc": 0.96366, + "test_loss": 2.9604510833740236, + "test_acc": 0.5575, + "lyapunov": null, + "grad_norm": 0.36142233410993513, + "grad_max_sv": 0.19281328432261943, + "grad_min_sv": 7.25558266457792e-09, + "grad_condition": 7387609214.887906, + "lr": 9.866357858642196e-07, + "time_sec": 32.73111319541931 + }, + { + "epoch": 148, + "train_loss": 0.11937485624313354, + "train_acc": 0.96304, + "test_loss": 3.0363352073669434, + "test_acc": 0.555, + "lyapunov": null, + "grad_norm": 0.3611567529216887, + "grad_max_sv": 0.1957642961293459, + "grad_min_sv": 7.231622295303733e-09, + "grad_condition": 393022755.7130184, + "lr": 4.38584950570808e-07, + "time_sec": 32.739211320877075 + }, + { + "epoch": 149, + "train_loss": 0.11994361319065094, + "train_acc": 0.96282, + "test_loss": 2.9720828590393067, + "test_acc": 0.5586, + "lyapunov": null, + "grad_norm": 0.36260803003121506, + "grad_max_sv": 0.19581739362329245, + "grad_min_sv": 6.825674283401049e-09, + "grad_condition": 640655030.4564087, + "lr": 1.096582625772501e-07, + "time_sec": 32.73686075210571 + }, + { + "epoch": 150, + "train_loss": 0.12198109043121338, + "train_acc": 0.96096, + "test_loss": 3.0690538398742677, + "test_acc": 0.5514, + "lyapunov": null, + "grad_norm": 0.3640908774200121, + "grad_max_sv": 0.19363359715789558, + "grad_min_sv": 6.96894196785744e-09, + "grad_condition": 273507263.305566, + "lr": 0.0, + "time_sec": 32.99615716934204 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 4.494552028656006, + "train_acc": 0.03786, + "test_loss": 4.61479503326416, + "test_acc": 0.0201, + "lyapunov": null, + "grad_norm": 4.970128680900294, + "grad_max_sv": 4.1727720379829405, + "grad_min_sv": 8.289555068485832e-08, + "grad_condition": 76452781.51601897, + "lr": 0.0009998903417374227, + "time_sec": 49.85722231864929 + }, + { + "epoch": 2, + "train_loss": 3.9854862425994875, + "train_acc": 0.08822, + "test_loss": 4.992143798828125, + "test_acc": 0.0271, + "lyapunov": null, + "grad_norm": 3.054976721991771, + "grad_max_sv": 2.33364659845829, + "grad_min_sv": 4.921280333802791e-08, + "grad_condition": 63442313.555687234, + "lr": 0.0009995614150494292, + "time_sec": 49.82543992996216 + }, + { + "epoch": 3, + "train_loss": 3.6997953691101073, + "train_acc": 0.12854, + "test_loss": 4.995684532165527, + "test_acc": 0.0293, + "lyapunov": null, + "grad_norm": 2.062296620286874, + "grad_max_sv": 1.3390462696552277, + "grad_min_sv": 3.588550117061828e-08, + "grad_condition": 44525979.84656793, + "lr": 0.0009990133642141358, + "time_sec": 49.824538707733154 + }, + { + "epoch": 4, + "train_loss": 3.5368371379089356, + "train_acc": 0.15444, + "test_loss": 5.110721218109131, + "test_acc": 0.0304, + "lyapunov": null, + "grad_norm": 1.6796942132426855, + "grad_max_sv": 0.9513197481632233, + "grad_min_sv": 2.9029874798469635e-08, + "grad_condition": 38187587.0072392, + "lr": 0.0009982464296247522, + "time_sec": 49.857542514801025 + }, + { + "epoch": 5, + "train_loss": 3.4063741930389404, + "train_acc": 0.1804, + "test_loss": 4.820973803710937, + "test_acc": 0.0488, + "lyapunov": null, + "grad_norm": 1.5228591587706575, + "grad_max_sv": 0.8078360810875893, + "grad_min_sv": 2.6718039813911078e-08, + "grad_condition": 36188290.78873479, + "lr": 0.0009972609476841367, + "time_sec": 49.83380579948425 + }, + { + "epoch": 6, + "train_loss": 3.298316816482544, + "train_acc": 0.19704, + "test_loss": 4.687854388427734, + "test_acc": 0.063, + "lyapunov": null, + "grad_norm": 1.430907384491558, + "grad_max_sv": 0.7338306248188019, + "grad_min_sv": 2.5322855712328617e-08, + "grad_condition": 32479596.327881176, + "lr": 0.000996057350657239, + "time_sec": 49.85435748100281 + }, + { + "epoch": 7, + "train_loss": 3.212421199264526, + "train_acc": 0.21768, + "test_loss": 5.175653315734864, + "test_acc": 0.0504, + "lyapunov": null, + "grad_norm": 1.336875610023359, + "grad_max_sv": 0.649027307331562, + "grad_min_sv": 2.378195060326327e-08, + "grad_condition": 32637118.77699437, + "lr": 0.000994636166481494, + "time_sec": 49.8446729183197 + }, + { + "epoch": 8, + "train_loss": 3.138554875640869, + "train_acc": 0.22894, + "test_loss": 5.807579966735839, + "test_acc": 0.0462, + "lyapunov": null, + "grad_norm": 1.2679659601013358, + "grad_max_sv": 0.5943921484053135, + "grad_min_sv": 2.2575583161904557e-08, + "grad_condition": 97277800.55107144, + "lr": 0.0009929980185352525, + "time_sec": 49.8536856174469 + }, + { + "epoch": 9, + "train_loss": 3.0594152055358887, + "train_acc": 0.24342, + "test_loss": 5.896516481018066, + "test_acc": 0.0504, + "lyapunov": null, + "grad_norm": 1.1948384399270802, + "grad_max_sv": 0.5371919803321361, + "grad_min_sv": 2.1378302061947352e-08, + "grad_condition": 43411043.09074741, + "lr": 0.0009911436253643444, + "time_sec": 49.826568365097046 + }, + { + "epoch": 10, + "train_loss": 3.0018548110961913, + "train_acc": 0.25334, + "test_loss": 6.065813122558594, + "test_acc": 0.0461, + "lyapunov": null, + "grad_norm": 1.1307569845828864, + "grad_max_sv": 0.49591890424489976, + "grad_min_sv": 2.0269659145588648e-08, + "grad_condition": 137243724.22937468, + "lr": 0.0009890738003669028, + "time_sec": 49.83774471282959 + }, + { + "epoch": 11, + "train_loss": 2.955089698944092, + "train_acc": 0.2653, + "test_loss": 5.9151001647949215, + "test_acc": 0.0512, + "lyapunov": null, + "grad_norm": 1.067241785689624, + "grad_max_sv": 0.4469477400183678, + "grad_min_sv": 1.8805797574739103e-08, + "grad_condition": 39379357.71574137, + "lr": 0.00098678945143658, + "time_sec": 49.843921184539795 + }, + { + "epoch": 12, + "train_loss": 2.9137347607421873, + "train_acc": 0.27164, + "test_loss": 6.294404597473145, + "test_acc": 0.0476, + "lyapunov": null, + "grad_norm": 1.0355748395798314, + "grad_max_sv": 0.4451711155474186, + "grad_min_sv": 1.9072327144360128e-08, + "grad_condition": 11465758103.108255, + "lr": 0.0009842915805643154, + "time_sec": 49.864059925079346 + }, + { + "epoch": 13, + "train_loss": 2.8780907594299316, + "train_acc": 0.2771, + "test_loss": 5.592148977661132, + "test_acc": 0.0478, + "lyapunov": null, + "grad_norm": 0.9968605810380445, + "grad_max_sv": 0.42295421436429026, + "grad_min_sv": 1.8676737473244386e-08, + "grad_condition": 25252476.39695831, + "lr": 0.000981581283398829, + "time_sec": 49.83604097366333 + }, + { + "epoch": 14, + "train_loss": 2.83197486907959, + "train_acc": 0.28466, + "test_loss": 5.6323877784729, + "test_acc": 0.0609, + "lyapunov": null, + "grad_norm": 0.9600893848651761, + "grad_max_sv": 0.40282900631427765, + "grad_min_sv": 1.79312983100699e-08, + "grad_condition": 46420938.26971118, + "lr": 0.0009786597487660333, + "time_sec": 49.834007263183594 + }, + { + "epoch": 15, + "train_loss": 2.8022082035064697, + "train_acc": 0.29582, + "test_loss": 6.161382629394531, + "test_acc": 0.067, + "lyapunov": null, + "grad_norm": 0.9375482131775189, + "grad_max_sv": 0.38931420594453814, + "grad_min_sv": 1.7493153070535784e-08, + "grad_condition": 36503130.621698126, + "lr": 0.0009755282581475766, + "time_sec": 49.843669176101685 + }, + { + "epoch": 16, + "train_loss": 2.7717318687438963, + "train_acc": 0.29786, + "test_loss": 6.750612663269043, + "test_acc": 0.0319, + "lyapunov": null, + "grad_norm": 0.914689907325661, + "grad_max_sv": 0.3722547680139542, + "grad_min_sv": 1.6777755511981906e-08, + "grad_condition": 56626372.0449656, + "lr": 0.0009721881851187403, + "time_sec": 49.83157706260681 + }, + { + "epoch": 17, + "train_loss": 2.737800383453369, + "train_acc": 0.30562, + "test_loss": 6.416880516052246, + "test_acc": 0.0612, + "lyapunov": null, + "grad_norm": 0.8943352214027238, + "grad_max_sv": 0.35389882922172544, + "grad_min_sv": 1.6637817648601504e-08, + "grad_condition": 27086037.56335088, + "lr": 0.0009686409947459456, + "time_sec": 49.84391736984253 + }, + { + "epoch": 18, + "train_loss": 2.726037522125244, + "train_acc": 0.30952, + "test_loss": 6.604639881896973, + "test_acc": 0.0459, + "lyapunov": null, + "grad_norm": 0.8840199433360627, + "grad_max_sv": 0.35427382588386536, + "grad_min_sv": 1.631152495851218e-08, + "grad_condition": 30779446.928706445, + "lr": 0.0009648882429441254, + "time_sec": 49.85922360420227 + }, + { + "epoch": 19, + "train_loss": 2.6859044135284424, + "train_acc": 0.31622, + "test_loss": 5.795512687683106, + "test_acc": 0.057, + "lyapunov": null, + "grad_norm": 0.8549569769936459, + "grad_max_sv": 0.33466122299432755, + "grad_min_sv": 1.565257393698616e-08, + "grad_condition": 29386830.435270645, + "lr": 0.00096093157579425, + "time_sec": 49.82556509971619 + }, + { + "epoch": 20, + "train_loss": 2.6536119274902346, + "train_acc": 0.3221, + "test_loss": 6.344257983398437, + "test_acc": 0.044, + "lyapunov": null, + "grad_norm": 0.8449773123460955, + "grad_max_sv": 0.3348921127617359, + "grad_min_sv": 1.5790628153482257e-08, + "grad_condition": 98318741.07961987, + "lr": 0.0009567727288213001, + "time_sec": 49.83516526222229 + }, + { + "epoch": 21, + "train_loss": 2.6361696144104005, + "train_acc": 0.32656, + "test_loss": 7.515093251800537, + "test_acc": 0.0334, + "lyapunov": null, + "grad_norm": 0.8336479900582607, + "grad_max_sv": 0.3216260939836502, + "grad_min_sv": 1.536505757071538e-08, + "grad_condition": 26686558.28517064, + "lr": 0.0009524135262330095, + "time_sec": 49.80964422225952 + }, + { + "epoch": 22, + "train_loss": 2.609321441345215, + "train_acc": 0.33038, + "test_loss": 6.987834294128418, + "test_acc": 0.0336, + "lyapunov": null, + "grad_norm": 0.8111631557338365, + "grad_max_sv": 0.32318604178726673, + "grad_min_sv": 1.552950264216424e-08, + "grad_condition": 31459791.97556909, + "lr": 0.0009478558801197061, + "time_sec": 49.83420443534851 + }, + { + "epoch": 23, + "train_loss": 2.5819150804138182, + "train_acc": 0.33626, + "test_loss": 5.626160023498535, + "test_acc": 0.0597, + "lyapunov": null, + "grad_norm": 0.7975730239086433, + "grad_max_sv": 0.2971249621361494, + "grad_min_sv": 1.4598027968382166e-08, + "grad_condition": 29388140.880233955, + "lr": 0.000943101789615607, + "time_sec": 49.84738302230835 + }, + { + "epoch": 24, + "train_loss": 2.563654583282471, + "train_acc": 0.34112, + "test_loss": 8.088758407592774, + "test_acc": 0.0365, + "lyapunov": null, + "grad_norm": 0.7820981992902372, + "grad_max_sv": 0.30556059442460537, + "grad_min_sv": 1.4405372743275802e-08, + "grad_condition": 36896273.106267676, + "lr": 0.0009381533400219313, + "time_sec": 49.83872365951538 + }, + { + "epoch": 25, + "train_loss": 2.5395704370880128, + "train_acc": 0.3453, + "test_loss": 6.280784951782227, + "test_acc": 0.0419, + "lyapunov": null, + "grad_norm": 0.7796352290200003, + "grad_max_sv": 0.29107407070696356, + "grad_min_sv": 1.438702274536574e-08, + "grad_condition": 23506322.84645006, + "lr": 0.0009330127018922189, + "time_sec": 49.84307074546814 + }, + { + "epoch": 26, + "train_loss": 2.516899804611206, + "train_acc": 0.34914, + "test_loss": 6.8854626892089845, + "test_acc": 0.0472, + "lyapunov": null, + "grad_norm": 0.7654504890703723, + "grad_max_sv": 0.2898920584470034, + "grad_min_sv": 1.4131242567771985e-08, + "grad_condition": 36962656.131567374, + "lr": 0.000927682130080253, + "time_sec": 49.82866811752319 + }, + { + "epoch": 27, + "train_loss": 2.486618924636841, + "train_acc": 0.35846, + "test_loss": 6.096959390258789, + "test_acc": 0.0526, + "lyapunov": null, + "grad_norm": 0.7544470177982979, + "grad_max_sv": 0.2747815653681755, + "grad_min_sv": 1.4021938565811353e-08, + "grad_condition": 22894223.22709341, + "lr": 0.0009221639627510072, + "time_sec": 49.833322048187256 + }, + { + "epoch": 28, + "train_loss": 2.4692860332489013, + "train_acc": 0.35872, + "test_loss": 7.058197943115235, + "test_acc": 0.0368, + "lyapunov": null, + "grad_norm": 0.7556141642776453, + "grad_max_sv": 0.2829656444489956, + "grad_min_sv": 1.4026384997922747e-08, + "grad_condition": 24010034.28343827, + "lr": 0.0009164606203550494, + "time_sec": 49.853132247924805 + }, + { + "epoch": 29, + "train_loss": 2.458679496536255, + "train_acc": 0.36202, + "test_loss": 5.932370195007325, + "test_acc": 0.0515, + "lyapunov": null, + "grad_norm": 0.7489931312284205, + "grad_max_sv": 0.2846912644803524, + "grad_min_sv": 1.3950906180867743e-08, + "grad_condition": 759126756.028516, + "lr": 0.0009105746045668516, + "time_sec": 49.815508127212524 + }, + { + "epoch": 30, + "train_loss": 2.440240175704956, + "train_acc": 0.3643, + "test_loss": 5.7076008422851565, + "test_acc": 0.0545, + "lyapunov": null, + "grad_norm": 0.7451604093710013, + "grad_max_sv": 0.27726204246282576, + "grad_min_sv": 1.3802408763141649e-08, + "grad_condition": 25518721.12854769, + "lr": 0.0009045084971874733, + "time_sec": 49.83587169647217 + }, + { + "epoch": 31, + "train_loss": 2.413286708908081, + "train_acc": 0.37092, + "test_loss": 5.388267793273926, + "test_acc": 0.0567, + "lyapunov": null, + "grad_norm": 0.734602471620392, + "grad_max_sv": 0.2801205262541771, + "grad_min_sv": 1.3700489934209691e-08, + "grad_condition": 70621872.17100011, + "lr": 0.0008982649590120977, + "time_sec": 49.82285523414612 + }, + { + "epoch": 32, + "train_loss": 2.3982598586273194, + "train_acc": 0.37454, + "test_loss": 4.8633959762573244, + "test_acc": 0.0614, + "lyapunov": null, + "grad_norm": 0.7317568960693007, + "grad_max_sv": 0.27396991699934004, + "grad_min_sv": 1.3639147818100827e-08, + "grad_condition": 29568703.15011265, + "lr": 0.0008918467286629196, + "time_sec": 49.83714246749878 + }, + { + "epoch": 33, + "train_loss": 2.3700755281066894, + "train_acc": 0.37942, + "test_loss": 5.800725856018066, + "test_acc": 0.062, + "lyapunov": null, + "grad_norm": 0.7363325475877537, + "grad_max_sv": 0.27091147713363173, + "grad_min_sv": 1.3641409607467736e-08, + "grad_condition": 23422095.65938937, + "lr": 0.0008852566213878943, + "time_sec": 49.85065937042236 + }, + { + "epoch": 34, + "train_loss": 2.3484229640197753, + "train_acc": 0.38438, + "test_loss": 5.51493988494873, + "test_acc": 0.0489, + "lyapunov": null, + "grad_norm": 0.7318255060238914, + "grad_max_sv": 0.2700826805084944, + "grad_min_sv": 1.3733222553602431e-08, + "grad_condition": 23110083.817654673, + "lr": 0.000878497527825878, + "time_sec": 49.825148820877075 + }, + { + "epoch": 35, + "train_loss": 2.332993766708374, + "train_acc": 0.38728, + "test_loss": 6.365867942047119, + "test_acc": 0.0266, + "lyapunov": null, + "grad_norm": 0.7235217593940582, + "grad_max_sv": 0.26724731288850306, + "grad_min_sv": 1.3652239799766264e-08, + "grad_condition": 21635340.607584503, + "lr": 0.000871572412738697, + "time_sec": 49.830586194992065 + }, + { + "epoch": 36, + "train_loss": 2.306020415649414, + "train_acc": 0.39186, + "test_loss": 5.792026341247559, + "test_acc": 0.0452, + "lyapunov": null, + "grad_norm": 0.7128640395593397, + "grad_max_sv": 0.26750593855977056, + "grad_min_sv": 1.3493218886662105e-08, + "grad_condition": 28714487.625810385, + "lr": 0.0008644843137107055, + "time_sec": 49.84518265724182 + }, + { + "epoch": 37, + "train_loss": 2.2972560415649412, + "train_acc": 0.39398, + "test_loss": 6.719418971252441, + "test_acc": 0.0336, + "lyapunov": null, + "grad_norm": 0.7133630215784597, + "grad_max_sv": 0.2599464699625969, + "grad_min_sv": 1.321531789555408e-08, + "grad_condition": 23431301.61775563, + "lr": 0.0008572363398164014, + "time_sec": 49.80765676498413 + }, + { + "epoch": 38, + "train_loss": 2.2751118283843996, + "train_acc": 0.39982, + "test_loss": 5.9905416282653805, + "test_acc": 0.0405, + "lyapunov": null, + "grad_norm": 0.711317525951205, + "grad_max_sv": 0.25357839167118074, + "grad_min_sv": 1.3227913819857662e-08, + "grad_condition": 22136545.95270278, + "lr": 0.0008498316702566826, + "time_sec": 49.8195858001709 + }, + { + "epoch": 39, + "train_loss": 2.2572131638336184, + "train_acc": 0.40186, + "test_loss": 5.522994046783447, + "test_acc": 0.0292, + "lyapunov": null, + "grad_norm": 0.7046395490795619, + "grad_max_sv": 0.2534454546868801, + "grad_min_sv": 1.3053050565425828e-08, + "grad_condition": 23267030.12204785, + "lr": 0.0008422735529643442, + "time_sec": 49.82005977630615 + }, + { + "epoch": 40, + "train_loss": 2.247441282196045, + "train_acc": 0.40386, + "test_loss": 6.156334571838379, + "test_acc": 0.0459, + "lyapunov": null, + "grad_norm": 0.7028096798670115, + "grad_max_sv": 0.2492887545377016, + "grad_min_sv": 1.295731734268779e-08, + "grad_condition": 27228242.583258677, + "lr": 0.0008345653031794289, + "time_sec": 49.840070724487305 + }, + { + "epoch": 41, + "train_loss": 2.240987236175537, + "train_acc": 0.4064, + "test_loss": 6.480609422302246, + "test_acc": 0.03, + "lyapunov": null, + "grad_norm": 0.6963939273563242, + "grad_max_sv": 0.25355591997504234, + "grad_min_sv": 1.3210752133896442e-08, + "grad_condition": 51874622.58196541, + "lr": 0.0008267103019950526, + "time_sec": 49.89214468002319 + }, + { + "epoch": 42, + "train_loss": 2.2241448893737794, + "train_acc": 0.40938, + "test_loss": 7.472731929016113, + "test_acc": 0.0364, + "lyapunov": null, + "grad_norm": 0.6886576186838276, + "grad_max_sv": 0.24406687431037427, + "grad_min_sv": 1.2965910546614001e-08, + "grad_condition": 26237426.90185051, + "lr": 0.0008187119948743447, + "time_sec": 49.831929445266724 + }, + { + "epoch": 43, + "train_loss": 2.195390332183838, + "train_acc": 0.41482, + "test_loss": 6.986102354431153, + "test_acc": 0.0354, + "lyapunov": null, + "grad_norm": 0.692064929980546, + "grad_max_sv": 0.24136908873915672, + "grad_min_sv": 1.287102841251997e-08, + "grad_condition": 29191367.16539036, + "lr": 0.000810573890139155, + "time_sec": 49.820056438446045 + }, + { + "epoch": 44, + "train_loss": 2.1865518129730224, + "train_acc": 0.41708, + "test_loss": 6.7771270584106444, + "test_acc": 0.0393, + "lyapunov": null, + "grad_norm": 0.6868416402158027, + "grad_max_sv": 0.2486371211707592, + "grad_min_sv": 1.2717046270899201e-08, + "grad_condition": 39400931.65148838, + "lr": 0.0008022995574311873, + "time_sec": 49.82724571228027 + }, + { + "epoch": 45, + "train_loss": 2.176023401031494, + "train_acc": 0.41766, + "test_loss": 6.5321983726501465, + "test_acc": 0.0329, + "lyapunov": null, + "grad_norm": 0.688101634481696, + "grad_max_sv": 0.2483655706048012, + "grad_min_sv": 1.2939461641048311e-08, + "grad_condition": 24745167.039308526, + "lr": 0.0007938926261462363, + "time_sec": 49.83728241920471 + }, + { + "epoch": 46, + "train_loss": 2.157371569519043, + "train_acc": 0.42422, + "test_loss": 5.901077621459961, + "test_acc": 0.0536, + "lyapunov": null, + "grad_norm": 0.6810937554159694, + "grad_max_sv": 0.2453255333006382, + "grad_min_sv": 1.2790355725933455e-08, + "grad_condition": 42427572.437124, + "lr": 0.0007853567838422158, + "time_sec": 49.83260989189148 + }, + { + "epoch": 47, + "train_loss": 2.1449081243896484, + "train_acc": 0.42456, + "test_loss": 6.075893556213379, + "test_acc": 0.042, + "lyapunov": null, + "grad_norm": 0.677274699872145, + "grad_max_sv": 0.23359011709690095, + "grad_min_sv": 1.2604452173659019e-08, + "grad_condition": 23439756.57327797, + "lr": 0.0007766957746216719, + "time_sec": 49.81248760223389 + }, + { + "epoch": 48, + "train_loss": 2.121114821166992, + "train_acc": 0.43062, + "test_loss": 6.324017465209961, + "test_acc": 0.0699, + "lyapunov": null, + "grad_norm": 0.6768119432582711, + "grad_max_sv": 0.23583042696118356, + "grad_min_sv": 1.2428631641914211e-08, + "grad_condition": 26576129.087632615, + "lr": 0.0007679133974894982, + "time_sec": 49.85111737251282 + }, + { + "epoch": 49, + "train_loss": 2.1201681073760987, + "train_acc": 0.43092, + "test_loss": 5.493146458435058, + "test_acc": 0.0673, + "lyapunov": null, + "grad_norm": 0.6795448834334495, + "grad_max_sv": 0.24224164076149463, + "grad_min_sv": 1.2691686027133109e-08, + "grad_condition": 24348457.963241145, + "lr": 0.000759013504686565, + "time_sec": 49.81028628349304 + }, + { + "epoch": 50, + "train_loss": 2.082837229309082, + "train_acc": 0.4386, + "test_loss": 6.459659493255615, + "test_acc": 0.0616, + "lyapunov": null, + "grad_norm": 0.6728576224616372, + "grad_max_sv": 0.23022082336246968, + "grad_min_sv": 1.2368064503109899e-08, + "grad_condition": 23985269.670404635, + "lr": 0.0007499999999999998, + "time_sec": 49.82207798957825 + }, + { + "epoch": 51, + "train_loss": 2.0762338228607176, + "train_acc": 0.43984, + "test_loss": 6.028357986450195, + "test_acc": 0.0474, + "lyapunov": null, + "grad_norm": 0.671786463321322, + "grad_max_sv": 0.23933242298662663, + "grad_min_sv": 1.2453496028852485e-08, + "grad_condition": 27468424.752658807, + "lr": 0.0007408768370508575, + "time_sec": 49.839146852493286 + }, + { + "epoch": 52, + "train_loss": 2.068026172409058, + "train_acc": 0.44324, + "test_loss": 6.386326299285889, + "test_acc": 0.0521, + "lyapunov": null, + "grad_norm": 0.6708600139651663, + "grad_max_sv": 0.24169348366558552, + "grad_min_sv": 1.2435446072878164e-08, + "grad_condition": 53682617.89361428, + "lr": 0.0007316480175599307, + "time_sec": 49.84106373786926 + }, + { + "epoch": 53, + "train_loss": 2.0512850422668456, + "train_acc": 0.44514, + "test_loss": 5.693611965942383, + "test_acc": 0.0412, + "lyapunov": null, + "grad_norm": 0.6693562330574987, + "grad_max_sv": 0.23974683545529843, + "grad_min_sv": 1.2387516072631665e-08, + "grad_condition": 26566156.55520319, + "lr": 0.0007223175895924635, + "time_sec": 49.83973002433777 + }, + { + "epoch": 54, + "train_loss": 2.0340771446990966, + "train_acc": 0.45072, + "test_loss": 6.135411253356933, + "test_acc": 0.0562, + "lyapunov": null, + "grad_norm": 0.6690638479693323, + "grad_max_sv": 0.23783069401979445, + "grad_min_sv": 1.2572742053018614e-08, + "grad_condition": 21778321.765234537, + "lr": 0.0007128896457825361, + "time_sec": 49.87506914138794 + }, + { + "epoch": 55, + "train_loss": 2.0094136617279053, + "train_acc": 0.45566, + "test_loss": 5.745096834564209, + "test_acc": 0.0572, + "lyapunov": null, + "grad_norm": 0.6669166301057209, + "grad_max_sv": 0.23878032267093657, + "grad_min_sv": 1.231176157273639e-08, + "grad_condition": 29310923.371788334, + "lr": 0.0007033683215378998, + "time_sec": 49.82778191566467 + }, + { + "epoch": 56, + "train_loss": 2.0006568963241578, + "train_acc": 0.457, + "test_loss": 6.5824570434570315, + "test_acc": 0.0501, + "lyapunov": null, + "grad_norm": 0.6683455061699762, + "grad_max_sv": 0.23399036526679992, + "grad_min_sv": 1.2379160156672509e-08, + "grad_condition": 42922377.98757514, + "lr": 0.0006937577932260512, + "time_sec": 49.85116100311279 + }, + { + "epoch": 57, + "train_loss": 1.9894362976074218, + "train_acc": 0.45838, + "test_loss": 6.51012366104126, + "test_acc": 0.0442, + "lyapunov": null, + "grad_norm": 0.6646066170012002, + "grad_max_sv": 0.23274879157543182, + "grad_min_sv": 1.238940085523943e-08, + "grad_condition": 24070465.15252796, + "lr": 0.0006840622763423388, + "time_sec": 49.8274929523468 + }, + { + "epoch": 58, + "train_loss": 1.9678663694000245, + "train_acc": 0.46314, + "test_loss": 6.619851453399658, + "test_acc": 0.0576, + "lyapunov": null, + "grad_norm": 0.6643541450786883, + "grad_max_sv": 0.23393345512449742, + "grad_min_sv": 1.2389777363092103e-08, + "grad_condition": 38285129.517120846, + "lr": 0.0006742860236609073, + "time_sec": 49.837411880493164 + }, + { + "epoch": 59, + "train_loss": 1.965532445755005, + "train_acc": 0.46532, + "test_loss": 7.184655822753906, + "test_acc": 0.0412, + "lyapunov": null, + "grad_norm": 0.6645069826423124, + "grad_max_sv": 0.23921045735478402, + "grad_min_sv": 1.2522070774040328e-08, + "grad_condition": 95635689.47436689, + "lr": 0.0006644333233692913, + "time_sec": 49.82288122177124 + }, + { + "epoch": 60, + "train_loss": 1.9421441039657592, + "train_acc": 0.46942, + "test_loss": 6.0968818130493165, + "test_acc": 0.0396, + "lyapunov": null, + "grad_norm": 0.6647686483063734, + "grad_max_sv": 0.23022540807723998, + "grad_min_sv": 1.2435142121569597e-08, + "grad_condition": 36516212.89900361, + "lr": 0.0006545084971874734, + "time_sec": 49.836525440216064 + }, + { + "epoch": 61, + "train_loss": 1.9307384226989746, + "train_acc": 0.4713, + "test_loss": 7.351404643249512, + "test_acc": 0.0467, + "lyapunov": null, + "grad_norm": 0.6598071015542969, + "grad_max_sv": 0.23300293684005738, + "grad_min_sv": 1.2553449488250656e-08, + "grad_condition": 21336349.83542385, + "lr": 0.0006445158984722354, + "time_sec": 49.81679058074951 + }, + { + "epoch": 62, + "train_loss": 1.9107242463684082, + "train_acc": 0.47584, + "test_loss": 7.41353745803833, + "test_acc": 0.0564, + "lyapunov": null, + "grad_norm": 0.6632922829797736, + "grad_max_sv": 0.23702187687158585, + "grad_min_sv": 1.256866596290214e-08, + "grad_condition": 414252068.6680373, + "lr": 0.0006344599103076324, + "time_sec": 49.81079959869385 + }, + { + "epoch": 63, + "train_loss": 1.906180576171875, + "train_acc": 0.47704, + "test_loss": 8.345553895568848, + "test_acc": 0.0514, + "lyapunov": null, + "grad_norm": 0.6641303546175715, + "grad_max_sv": 0.23919319920241833, + "grad_min_sv": 1.2445030603269736e-08, + "grad_condition": 48181552.89073322, + "lr": 0.0006243449435824269, + "time_sec": 49.834824323654175 + }, + { + "epoch": 64, + "train_loss": 1.896571351852417, + "train_acc": 0.48022, + "test_loss": 7.706241481018067, + "test_acc": 0.0495, + "lyapunov": null, + "grad_norm": 0.6580911542263143, + "grad_max_sv": 0.233155807107687, + "grad_min_sv": 1.2258548102821176e-08, + "grad_condition": 147912368.09627536, + "lr": 0.0006141754350553275, + "time_sec": 49.827706813812256 + }, + { + "epoch": 65, + "train_loss": 1.8689342678833007, + "train_acc": 0.48694, + "test_loss": 7.604910266113281, + "test_acc": 0.068, + "lyapunov": null, + "grad_norm": 0.6601961376883955, + "grad_max_sv": 0.24266679622232915, + "grad_min_sv": 1.2337946858967385e-08, + "grad_condition": 109479288.75078002, + "lr": 0.0006039558454088793, + "time_sec": 49.847835063934326 + }, + { + "epoch": 66, + "train_loss": 1.8541412976837157, + "train_acc": 0.4913, + "test_loss": 7.621131346130371, + "test_acc": 0.0502, + "lyapunov": null, + "grad_norm": 0.6526859807082246, + "grad_max_sv": 0.22503522336483, + "grad_min_sv": 1.1999139423735094e-08, + "grad_condition": 27658012.606830657, + "lr": 0.000593690657292862, + "time_sec": 49.83453869819641 + }, + { + "epoch": 67, + "train_loss": 1.8500203356170655, + "train_acc": 0.4895, + "test_loss": 8.448241088867187, + "test_acc": 0.0602, + "lyapunov": null, + "grad_norm": 0.654584216781727, + "grad_max_sv": 0.23166645579040052, + "grad_min_sv": 1.2144356195328832e-08, + "grad_condition": 57526231.39027766, + "lr": 0.0005833843733580507, + "time_sec": 49.87798357009888 + }, + { + "epoch": 68, + "train_loss": 1.8333191384887695, + "train_acc": 0.49588, + "test_loss": 7.663671650695801, + "test_acc": 0.0539, + "lyapunov": null, + "grad_norm": 0.6550869721940646, + "grad_max_sv": 0.23333334550261497, + "grad_min_sv": 1.2233289833907257e-08, + "grad_condition": 24346438.395213075, + "lr": 0.0005730415142812054, + "time_sec": 49.82582187652588 + }, + { + "epoch": 69, + "train_loss": 1.8119923030090332, + "train_acc": 0.50032, + "test_loss": 7.175043432617188, + "test_acc": 0.0712, + "lyapunov": null, + "grad_norm": 0.6513215911180641, + "grad_max_sv": 0.2193699970841408, + "grad_min_sv": 1.1865115855103081e-08, + "grad_condition": 26929150.493882775, + "lr": 0.0005626666167821517, + "time_sec": 49.80794405937195 + }, + { + "epoch": 70, + "train_loss": 1.8089694079589844, + "train_acc": 0.49764, + "test_loss": 7.612014476013184, + "test_acc": 0.0538, + "lyapunov": null, + "grad_norm": 0.6557711961342083, + "grad_max_sv": 0.23481616117060183, + "grad_min_sv": 1.21222042414465e-08, + "grad_condition": 49730665.95439996, + "lr": 0.0005522642316338265, + "time_sec": 49.81162214279175 + }, + { + "epoch": 71, + "train_loss": 1.794535770225525, + "train_acc": 0.50302, + "test_loss": 8.002939363861085, + "test_acc": 0.054, + "lyapunov": null, + "grad_norm": 0.6530360122929442, + "grad_max_sv": 0.22891747988760472, + "grad_min_sv": 1.2135645938160522e-08, + "grad_condition": 30239652.54848214, + "lr": 0.0005418389216661573, + "time_sec": 49.83351969718933 + }, + { + "epoch": 72, + "train_loss": 1.7888313204574584, + "train_acc": 0.50272, + "test_loss": 7.378663352966308, + "test_acc": 0.0477, + "lyapunov": null, + "grad_norm": 0.6515803468137452, + "grad_max_sv": 0.223580015450716, + "grad_min_sv": 1.2234114341730384e-08, + "grad_condition": 31177170.11021496, + "lr": 0.0005313952597646563, + "time_sec": 49.80682587623596 + }, + { + "epoch": 73, + "train_loss": 1.7610743871688843, + "train_acc": 0.51094, + "test_loss": 7.5734631568908695, + "test_acc": 0.0456, + "lyapunov": null, + "grad_norm": 0.6471442109164438, + "grad_max_sv": 0.23298447765409946, + "grad_min_sv": 1.2235564984808267e-08, + "grad_condition": 30205955.557135515, + "lr": 0.0005209378268645994, + "time_sec": 49.8284707069397 + }, + { + "epoch": 74, + "train_loss": 1.743510553855896, + "train_acc": 0.51648, + "test_loss": 8.115744052124024, + "test_acc": 0.0597, + "lyapunov": null, + "grad_norm": 0.6470361414945306, + "grad_max_sv": 0.22419601753354074, + "grad_min_sv": 1.175036056857981e-08, + "grad_condition": 44883670.89626708, + "lr": 0.0005104712099416781, + "time_sec": 49.81434655189514 + }, + { + "epoch": 75, + "train_loss": 1.732315214996338, + "train_acc": 0.5162, + "test_loss": 8.69449387588501, + "test_acc": 0.0443, + "lyapunov": null, + "grad_norm": 0.6534168175273212, + "grad_max_sv": 0.22915640994906425, + "grad_min_sv": 1.2120835880813362e-08, + "grad_condition": 30203938.86272805, + "lr": 0.0004999999999999996, + "time_sec": 49.822524070739746 + }, + { + "epoch": 76, + "train_loss": 1.7280053578186034, + "train_acc": 0.51708, + "test_loss": 8.161399678039551, + "test_acc": 0.0506, + "lyapunov": null, + "grad_norm": 0.6519718595623971, + "grad_max_sv": 0.22868257723748683, + "grad_min_sv": 1.1916949028967227e-08, + "grad_condition": 27392099.189085342, + "lr": 0.0004895287900583212, + "time_sec": 49.806185245513916 + }, + { + "epoch": 77, + "train_loss": 1.707364101486206, + "train_acc": 0.52106, + "test_loss": 8.635691497802734, + "test_acc": 0.0553, + "lyapunov": null, + "grad_norm": 0.6489518165829526, + "grad_max_sv": 0.22707784324884414, + "grad_min_sv": 1.21318999957154e-08, + "grad_condition": 22161799.719214164, + "lr": 0.0004790621731353997, + "time_sec": 49.8337197303772 + }, + { + "epoch": 78, + "train_loss": 1.699185922279358, + "train_acc": 0.52508, + "test_loss": 8.116340428161621, + "test_acc": 0.059, + "lyapunov": null, + "grad_norm": 0.6466631616175401, + "grad_max_sv": 0.2242755901068449, + "grad_min_sv": 1.197350978088263e-08, + "grad_condition": 22907889.143189352, + "lr": 0.000468604740235343, + "time_sec": 49.84882068634033 + }, + { + "epoch": 79, + "train_loss": 1.6851876223754882, + "train_acc": 0.53002, + "test_loss": 7.6594300460815425, + "test_acc": 0.0668, + "lyapunov": null, + "grad_norm": 0.6508056360794745, + "grad_max_sv": 0.22947054952383042, + "grad_min_sv": 1.2146863270084962e-08, + "grad_condition": 50400181.57036874, + "lr": 0.00045816107833384175, + "time_sec": 49.81526827812195 + }, + { + "epoch": 80, + "train_loss": 1.6667000872421265, + "train_acc": 0.53166, + "test_loss": 7.577922117614746, + "test_acc": 0.0581, + "lyapunov": null, + "grad_norm": 0.6484594553766964, + "grad_max_sv": 0.22649560272693633, + "grad_min_sv": 1.2028468630853606e-08, + "grad_condition": 33979879.18367102, + "lr": 0.0004477357683661729, + "time_sec": 49.79970574378967 + }, + { + "epoch": 81, + "train_loss": 1.6529949746704102, + "train_acc": 0.53676, + "test_loss": 7.7760236434936525, + "test_acc": 0.061, + "lyapunov": null, + "grad_norm": 0.6501069318076672, + "grad_max_sv": 0.22972256727516652, + "grad_min_sv": 1.196574576337213e-08, + "grad_condition": 396215587.1427422, + "lr": 0.00043733338321784746, + "time_sec": 49.81192994117737 + }, + { + "epoch": 82, + "train_loss": 1.6425591729736329, + "train_acc": 0.53686, + "test_loss": 7.6887285552978515, + "test_acc": 0.0449, + "lyapunov": null, + "grad_norm": 0.6461003642754752, + "grad_max_sv": 0.23114448301494123, + "grad_min_sv": 1.2002917063394513e-08, + "grad_condition": 58155843.95520236, + "lr": 0.0004269584857187939, + "time_sec": 49.80897355079651 + }, + { + "epoch": 83, + "train_loss": 1.6318637802124023, + "train_acc": 0.54154, + "test_loss": 7.384182490539551, + "test_acc": 0.0735, + "lyapunov": null, + "grad_norm": 0.639611071259903, + "grad_max_sv": 0.22576675675809382, + "grad_min_sv": 1.1820984322299943e-08, + "grad_condition": 61458281.56309018, + "lr": 0.0004166156266419484, + "time_sec": 49.81825590133667 + }, + { + "epoch": 84, + "train_loss": 1.6224907682418823, + "train_acc": 0.54502, + "test_loss": 6.842728860473633, + "test_acc": 0.0545, + "lyapunov": null, + "grad_norm": 0.6421226956015884, + "grad_max_sv": 0.21887084767222403, + "grad_min_sv": 1.1874146338408664e-08, + "grad_condition": 36085101.45868175, + "lr": 0.0004063093427071373, + "time_sec": 49.907301902770996 + }, + { + "epoch": 85, + "train_loss": 1.6129507275390624, + "train_acc": 0.5441, + "test_loss": 8.217321695709229, + "test_acc": 0.0637, + "lyapunov": null, + "grad_norm": 0.6427366718485839, + "grad_max_sv": 0.23318556658923625, + "grad_min_sv": 1.2124754387304871e-08, + "grad_condition": 42339311.94718243, + "lr": 0.0003960441545911199, + "time_sec": 49.83733892440796 + }, + { + "epoch": 86, + "train_loss": 1.5975109223556518, + "train_acc": 0.54868, + "test_loss": 7.930374978637695, + "test_acc": 0.0457, + "lyapunov": null, + "grad_norm": 0.648213394339368, + "grad_max_sv": 0.23059269934892654, + "grad_min_sv": 1.2111861368707676e-08, + "grad_condition": 42084970.06037265, + "lr": 0.0003858245649446718, + "time_sec": 49.827972412109375 + }, + { + "epoch": 87, + "train_loss": 1.5812813794708251, + "train_acc": 0.55458, + "test_loss": 7.960672058105469, + "test_acc": 0.0501, + "lyapunov": null, + "grad_norm": 0.6429264180119875, + "grad_max_sv": 0.2283397376537323, + "grad_min_sv": 1.2037938704190233e-08, + "grad_condition": 24951514.668881785, + "lr": 0.00037565505641757235, + "time_sec": 49.82942318916321 + }, + { + "epoch": 88, + "train_loss": 1.573117269897461, + "train_acc": 0.55398, + "test_loss": 8.257780656433106, + "test_acc": 0.0591, + "lyapunov": null, + "grad_norm": 0.6443323703742537, + "grad_max_sv": 0.22722676433622838, + "grad_min_sv": 1.201048842325303e-08, + "grad_condition": 22188712.23632911, + "lr": 0.00036554008969236695, + "time_sec": 49.86358904838562 + }, + { + "epoch": 89, + "train_loss": 1.5576643622207642, + "train_acc": 0.55992, + "test_loss": 8.274403761291504, + "test_acc": 0.041, + "lyapunov": null, + "grad_norm": 0.6402469644123193, + "grad_max_sv": 0.22650128416717052, + "grad_min_sv": 1.1862416463004343e-08, + "grad_condition": 35019834.9168684, + "lr": 0.0003554841015277638, + "time_sec": 49.83419132232666 + }, + { + "epoch": 90, + "train_loss": 1.549127948036194, + "train_acc": 0.56466, + "test_loss": 7.301855851745605, + "test_acc": 0.0718, + "lyapunov": null, + "grad_norm": 0.6449275085704251, + "grad_max_sv": 0.22556735202670097, + "grad_min_sv": 1.1762558954631075e-08, + "grad_condition": 21940981.03509561, + "lr": 0.000345491502812526, + "time_sec": 49.81568884849548 + }, + { + "epoch": 91, + "train_loss": 1.5344566452407837, + "train_acc": 0.56436, + "test_loss": 8.916962014770508, + "test_acc": 0.0515, + "lyapunov": null, + "grad_norm": 0.6463598068323441, + "grad_max_sv": 0.23813196495175362, + "grad_min_sv": 1.2199751642932855e-08, + "grad_condition": 45733250.122319184, + "lr": 0.0003355666766307081, + "time_sec": 49.839728355407715 + }, + { + "epoch": 92, + "train_loss": 1.5208702486419678, + "train_acc": 0.56684, + "test_loss": 8.993258874511719, + "test_acc": 0.054, + "lyapunov": null, + "grad_norm": 0.6391383040365451, + "grad_max_sv": 0.22249663844704629, + "grad_min_sv": 1.166908096122965e-08, + "grad_condition": 28597379.63678825, + "lr": 0.00032571397633909225, + "time_sec": 49.850322008132935 + }, + { + "epoch": 93, + "train_loss": 1.5081010787582398, + "train_acc": 0.57028, + "test_loss": 9.433806256103516, + "test_acc": 0.0535, + "lyapunov": null, + "grad_norm": 0.6456709453433311, + "grad_max_sv": 0.23419931791722776, + "grad_min_sv": 1.195185940633392e-08, + "grad_condition": 29245401.732327044, + "lr": 0.00031593772365766094, + "time_sec": 49.83537983894348 + }, + { + "epoch": 94, + "train_loss": 1.4969723129653931, + "train_acc": 0.57362, + "test_loss": 8.755092433166505, + "test_acc": 0.0528, + "lyapunov": null, + "grad_norm": 0.6461658506271033, + "grad_max_sv": 0.22756082080304624, + "grad_min_sv": 1.1912134220692926e-08, + "grad_condition": 23423387.436489962, + "lr": 0.0003062422067739483, + "time_sec": 49.80311179161072 + }, + { + "epoch": 95, + "train_loss": 2.9494932527923585, + "train_acc": 0.411, + "test_loss": 4.676254756927491, + "test_acc": 0.0505, + "lyapunov": null, + "grad_norm": 0.8335419963078607, + "grad_max_sv": 0.3271928407251835, + "grad_min_sv": 1.4720300411941168e-08, + "grad_condition": 24067860.441598095, + "lr": 0.00029663167846209965, + "time_sec": 49.814762115478516 + }, + { + "epoch": 96, + "train_loss": 3.6572426443481447, + "train_acc": 0.1492, + "test_loss": 5.234876950836181, + "test_acc": 0.0688, + "lyapunov": null, + "grad_norm": 0.5523560840003197, + "grad_max_sv": 0.18005239982157945, + "grad_min_sv": 9.93911985318341e-09, + "grad_condition": 91354773.39239445, + "lr": 0.00028711035421746345, + "time_sec": 49.84577131271362 + }, + { + "epoch": 97, + "train_loss": 3.3812893244171143, + "train_acc": 0.19184, + "test_loss": 4.862454182434082, + "test_acc": 0.077, + "lyapunov": null, + "grad_norm": 0.5636212270422577, + "grad_max_sv": 0.18343333192169667, + "grad_min_sv": 1.0359513497038009e-08, + "grad_condition": 20784291.458693452, + "lr": 0.00027768241040753615, + "time_sec": 49.83091354370117 + }, + { + "epoch": 98, + "train_loss": 3.179550113220215, + "train_acc": 0.2255, + "test_loss": 4.858168863677979, + "test_acc": 0.0807, + "lyapunov": null, + "grad_norm": 0.5839200776735536, + "grad_max_sv": 0.18244810923933982, + "grad_min_sv": 1.037966059214135e-08, + "grad_condition": 22427331.372158233, + "lr": 0.00026835198244006903, + "time_sec": 49.867558002471924 + }, + { + "epoch": 99, + "train_loss": 3.02292495223999, + "train_acc": 0.25396, + "test_loss": 5.169387593078613, + "test_acc": 0.0881, + "lyapunov": null, + "grad_norm": 0.595907429260728, + "grad_max_sv": 0.1938932089135051, + "grad_min_sv": 1.105600735823442e-08, + "grad_condition": 39890639.04859903, + "lr": 0.0002591231629491421, + "time_sec": 49.82200026512146 + }, + { + "epoch": 100, + "train_loss": 2.9043469207000734, + "train_acc": 0.27584, + "test_loss": 4.884814841461182, + "test_acc": 0.0989, + "lyapunov": null, + "grad_norm": 0.5987053513470115, + "grad_max_sv": 0.1915395434945822, + "grad_min_sv": 1.0967718520123356e-08, + "grad_condition": 507391317.2637795, + "lr": 0.0002499999999999997, + "time_sec": 49.835878133773804 + }, + { + "epoch": 101, + "train_loss": 2.8044686096191405, + "train_acc": 0.29558, + "test_loss": 4.889270275497436, + "test_acc": 0.0981, + "lyapunov": null, + "grad_norm": 0.6096838460034203, + "grad_max_sv": 0.20316330213099718, + "grad_min_sv": 1.1341824002197854e-08, + "grad_condition": 19853325.836087834, + "lr": 0.00024098649531343477, + "time_sec": 49.85874676704407 + }, + { + "epoch": 102, + "train_loss": 2.697149913482666, + "train_acc": 0.3167, + "test_loss": 4.92620325088501, + "test_acc": 0.1009, + "lyapunov": null, + "grad_norm": 0.6154909980411829, + "grad_max_sv": 0.20256872698664666, + "grad_min_sv": 1.1648207248748933e-08, + "grad_condition": 19320886.90158599, + "lr": 0.0002320866025105016, + "time_sec": 50.07639527320862 + }, + { + "epoch": 103, + "train_loss": 2.618629614944458, + "train_acc": 0.33036, + "test_loss": 5.49400161895752, + "test_acc": 0.1068, + "lyapunov": null, + "grad_norm": 0.6217563116117207, + "grad_max_sv": 0.20746214482933284, + "grad_min_sv": 1.1507716859981975e-08, + "grad_condition": 25949652.78149998, + "lr": 0.0002233042253783278, + "time_sec": 49.818949460983276 + }, + { + "epoch": 104, + "train_loss": 2.540534757156372, + "train_acc": 0.34564, + "test_loss": 4.9159078086853025, + "test_acc": 0.1126, + "lyapunov": null, + "grad_norm": 0.6217698336501172, + "grad_max_sv": 0.20552988573908806, + "grad_min_sv": 1.1522777731975964e-08, + "grad_condition": 21899890.551626954, + "lr": 0.000214643216157784, + "time_sec": 49.87585234642029 + }, + { + "epoch": 105, + "train_loss": 2.479596985321045, + "train_acc": 0.35746, + "test_loss": 5.100056993484497, + "test_acc": 0.1253, + "lyapunov": null, + "grad_norm": 0.6287156405132894, + "grad_max_sv": 0.2140802226960659, + "grad_min_sv": 1.1805095190275949e-08, + "grad_condition": 26208309.323742133, + "lr": 0.00020610737385376332, + "time_sec": 49.82085204124451 + }, + { + "epoch": 106, + "train_loss": 2.415481425552368, + "train_acc": 0.36924, + "test_loss": 4.742834524536133, + "test_acc": 0.1225, + "lyapunov": null, + "grad_norm": 0.6282670457594898, + "grad_max_sv": 0.21101173125207423, + "grad_min_sv": 1.1938832567004453e-08, + "grad_condition": 33782298.89931901, + "lr": 0.00019770044256881242, + "time_sec": 49.805906534194946 + }, + { + "epoch": 107, + "train_loss": 2.3521559171295165, + "train_acc": 0.38442, + "test_loss": 5.213879206848144, + "test_acc": 0.1211, + "lyapunov": null, + "grad_norm": 0.6335700941216259, + "grad_max_sv": 0.21410419717431067, + "grad_min_sv": 1.1941749475385954e-08, + "grad_condition": 22110752.957356386, + "lr": 0.0001894261098608447, + "time_sec": 49.83317017555237 + }, + { + "epoch": 108, + "train_loss": 2.302857539215088, + "train_acc": 0.39628, + "test_loss": 5.207193740844726, + "test_acc": 0.1285, + "lyapunov": null, + "grad_norm": 0.6359374602349686, + "grad_max_sv": 0.21151717714965343, + "grad_min_sv": 1.187537558844376e-08, + "grad_condition": 37488925.60398644, + "lr": 0.000181288005125655, + "time_sec": 49.82870650291443 + }, + { + "epoch": 109, + "train_loss": 2.2536745275878904, + "train_acc": 0.40138, + "test_loss": 5.2042837226867675, + "test_acc": 0.1322, + "lyapunov": null, + "grad_norm": 0.6289692207235398, + "grad_max_sv": 0.20782952345907688, + "grad_min_sv": 1.1739032497459779e-08, + "grad_condition": 29358916.829315763, + "lr": 0.0001732896980049473, + "time_sec": 49.83245229721069 + }, + { + "epoch": 110, + "train_loss": 2.2073010168457032, + "train_acc": 0.40866, + "test_loss": 5.739359895324707, + "test_acc": 0.1227, + "lyapunov": null, + "grad_norm": 0.6385992521842959, + "grad_max_sv": 0.2127275388687849, + "grad_min_sv": 1.1950131779958628e-08, + "grad_condition": 28764337.97746384, + "lr": 0.00016543469682057076, + "time_sec": 49.83092474937439 + }, + { + "epoch": 111, + "train_loss": 2.1692623610687254, + "train_acc": 0.41942, + "test_loss": 6.2040216323852535, + "test_acc": 0.1309, + "lyapunov": null, + "grad_norm": 0.6444316866103925, + "grad_max_sv": 0.21499809809029102, + "grad_min_sv": 1.1752886208693526e-08, + "grad_condition": 31962706.67450107, + "lr": 0.00015772644703565552, + "time_sec": 49.85021710395813 + }, + { + "epoch": 112, + "train_loss": 2.1302712613677977, + "train_acc": 0.42516, + "test_loss": 5.75790121383667, + "test_acc": 0.1399, + "lyapunov": null, + "grad_norm": 0.6329896331917518, + "grad_max_sv": 0.21649966202676296, + "grad_min_sv": 1.2179612900176106e-08, + "grad_condition": 34093436.46700279, + "lr": 0.00015016832974331713, + "time_sec": 49.81994557380676 + }, + { + "epoch": 113, + "train_loss": 2.1065593459701537, + "train_acc": 0.43386, + "test_loss": 6.140606423950195, + "test_acc": 0.1364, + "lyapunov": null, + "grad_norm": 0.6373030825503643, + "grad_max_sv": 0.2152324143797159, + "grad_min_sv": 1.191059096350422e-08, + "grad_condition": 24786528.45697539, + "lr": 0.00014276366018359834, + "time_sec": 49.832173347473145 + }, + { + "epoch": 114, + "train_loss": 2.0826868451690674, + "train_acc": 0.43754, + "test_loss": 7.314329501342773, + "test_acc": 0.1193, + "lyapunov": null, + "grad_norm": 0.6350963671857877, + "grad_max_sv": 0.2231900453567505, + "grad_min_sv": 1.2137735866390998e-08, + "grad_condition": 27948227.054936886, + "lr": 0.00013551568628929425, + "time_sec": 49.82054424285889 + }, + { + "epoch": 115, + "train_loss": 2.057500901184082, + "train_acc": 0.44596, + "test_loss": 5.995877742004395, + "test_acc": 0.1372, + "lyapunov": null, + "grad_norm": 0.6319121818844147, + "grad_max_sv": 0.2083717118948698, + "grad_min_sv": 1.1799914823723556e-08, + "grad_condition": 35488295.07860346, + "lr": 0.00012842758726130276, + "time_sec": 49.81160569190979 + }, + { + "epoch": 116, + "train_loss": 2.027409094619751, + "train_acc": 0.452, + "test_loss": 7.286285119628906, + "test_acc": 0.122, + "lyapunov": null, + "grad_norm": 0.639785065376269, + "grad_max_sv": 0.2164283238351345, + "grad_min_sv": 1.1941236867721305e-08, + "grad_condition": 66360354.77809191, + "lr": 0.0001215024721741218, + "time_sec": 49.836623191833496 + }, + { + "epoch": 117, + "train_loss": 1.998638267250061, + "train_acc": 0.45694, + "test_loss": 6.76222890625, + "test_acc": 0.1205, + "lyapunov": null, + "grad_norm": 0.6411689060332757, + "grad_max_sv": 0.21728002466261387, + "grad_min_sv": 1.186145185405607e-08, + "grad_condition": 25472303.080288395, + "lr": 0.00011474337861210538, + "time_sec": 49.835474252700806 + }, + { + "epoch": 118, + "train_loss": 1.9871974803924561, + "train_acc": 0.46078, + "test_loss": 6.990749812316895, + "test_acc": 0.1306, + "lyapunov": null, + "grad_norm": 0.6401613879770299, + "grad_max_sv": 0.21996232829988002, + "grad_min_sv": 1.212309715947768e-08, + "grad_condition": 43599185.89621965, + "lr": 0.00010815327133708009, + "time_sec": 49.82992196083069 + }, + { + "epoch": 119, + "train_loss": 1.9558954917144775, + "train_acc": 0.46806, + "test_loss": 6.338745205688476, + "test_acc": 0.1423, + "lyapunov": null, + "grad_norm": 0.6380666956188763, + "grad_max_sv": 0.21726358123123646, + "grad_min_sv": 1.1924941875629536e-08, + "grad_condition": 23332267.546088994, + "lr": 0.00010173504098790182, + "time_sec": 49.8153715133667 + }, + { + "epoch": 120, + "train_loss": 1.9510743766784668, + "train_acc": 0.46974, + "test_loss": 6.733411245727539, + "test_acc": 0.1243, + "lyapunov": null, + "grad_norm": 0.6418284890195846, + "grad_max_sv": 0.22671268545091153, + "grad_min_sv": 1.199444485400214e-08, + "grad_condition": 24711059.275352217, + "lr": 9.549150281252629e-05, + "time_sec": 49.81182289123535 + }, + { + "epoch": 121, + "train_loss": 1.9362508995819092, + "train_acc": 0.47356, + "test_loss": 6.134232345581054, + "test_acc": 0.1378, + "lyapunov": null, + "grad_norm": 0.6346296231277031, + "grad_max_sv": 0.21598901376128196, + "grad_min_sv": 1.1970328496480053e-08, + "grad_condition": 25346274.751641985, + "lr": 8.942539543314794e-05, + "time_sec": 49.83584427833557 + }, + { + "epoch": 122, + "train_loss": 1.9162643937683106, + "train_acc": 0.4749, + "test_loss": 7.639575733947754, + "test_acc": 0.1265, + "lyapunov": null, + "grad_norm": 0.6378739210927734, + "grad_max_sv": 0.21739229559898376, + "grad_min_sv": 1.1819409628278932e-08, + "grad_condition": 181332693.33855394, + "lr": 8.353937964495024e-05, + "time_sec": 49.82065296173096 + }, + { + "epoch": 123, + "train_loss": 1.9041280354309083, + "train_acc": 0.47994, + "test_loss": 6.308480444335937, + "test_acc": 0.1392, + "lyapunov": null, + "grad_norm": 0.6332843460906636, + "grad_max_sv": 0.21474863290786744, + "grad_min_sv": 1.1848325226493373e-08, + "grad_condition": 30395117.45243178, + "lr": 7.783603724899243e-05, + "time_sec": 49.83568549156189 + }, + { + "epoch": 124, + "train_loss": 1.888980817489624, + "train_acc": 0.48018, + "test_loss": 6.931203792572021, + "test_acc": 0.1361, + "lyapunov": null, + "grad_norm": 0.6468989904611825, + "grad_max_sv": 0.22639431655406952, + "grad_min_sv": 1.2179835734427157e-08, + "grad_condition": 27031913.997842442, + "lr": 7.231786991974666e-05, + "time_sec": 49.86228370666504 + }, + { + "epoch": 125, + "train_loss": 1.8688794164657592, + "train_acc": 0.48822, + "test_loss": 7.4782632530212405, + "test_acc": 0.132, + "lyapunov": null, + "grad_norm": 0.6436381282742432, + "grad_max_sv": 0.21808561868965626, + "grad_min_sv": 1.21570175322383e-08, + "grad_condition": 33380104.6057067, + "lr": 6.698729810778072e-05, + "time_sec": 49.83109521865845 + }, + { + "epoch": 126, + "train_loss": 1.8640016136932374, + "train_acc": 0.491, + "test_loss": 6.5455432174682615, + "test_acc": 0.1403, + "lyapunov": null, + "grad_norm": 0.6367336212592833, + "grad_max_sv": 0.22216320559382438, + "grad_min_sv": 1.1826145895899032e-08, + "grad_condition": 33022831.75443542, + "lr": 6.184665997806817e-05, + "time_sec": 49.83457159996033 + }, + { + "epoch": 127, + "train_loss": 1.8510954288101196, + "train_acc": 0.4882, + "test_loss": 7.0682084793090825, + "test_acc": 0.1326, + "lyapunov": null, + "grad_norm": 0.6431259646730736, + "grad_max_sv": 0.22209820635616778, + "grad_min_sv": 1.2136436526935524e-08, + "grad_condition": 66497220.94224206, + "lr": 5.6898210384392595e-05, + "time_sec": 49.83670258522034 + }, + { + "epoch": 128, + "train_loss": 1.8453027178573609, + "train_acc": 0.49042, + "test_loss": 6.2842555938720706, + "test_acc": 0.1305, + "lyapunov": null, + "grad_norm": 0.6383805845227949, + "grad_max_sv": 0.21130143105983734, + "grad_min_sv": 1.1917887206280842e-08, + "grad_condition": 43204631.05359116, + "lr": 5.214411988029363e-05, + "time_sec": 49.81800961494446 + }, + { + "epoch": 129, + "train_loss": 1.8346676333618164, + "train_acc": 0.4945, + "test_loss": 6.274330713653565, + "test_acc": 0.1391, + "lyapunov": null, + "grad_norm": 0.6376052549176046, + "grad_max_sv": 0.2089413482695818, + "grad_min_sv": 1.1727769512470676e-08, + "grad_condition": 27159660.544945084, + "lr": 4.7586473766990294e-05, + "time_sec": 49.845595598220825 + }, + { + "epoch": 130, + "train_loss": 1.830022028465271, + "train_acc": 0.49474, + "test_loss": 6.249729978942871, + "test_acc": 0.1459, + "lyapunov": null, + "grad_norm": 0.6453711202585213, + "grad_max_sv": 0.2190984409302473, + "grad_min_sv": 1.2224324771881178e-08, + "grad_condition": 22960059.51271691, + "lr": 4.32272711786996e-05, + "time_sec": 49.87020516395569 + }, + { + "epoch": 131, + "train_loss": 1.8177084483337402, + "train_acc": 0.49802, + "test_loss": 6.943641340637207, + "test_acc": 0.1332, + "lyapunov": null, + "grad_norm": 0.6440523788025603, + "grad_max_sv": 0.21554723903536796, + "grad_min_sv": 1.1872820722402811e-08, + "grad_condition": 25176936.12047171, + "lr": 3.906842420574966e-05, + "time_sec": 49.89444398880005 + }, + { + "epoch": 132, + "train_loss": 1.8117612997817993, + "train_acc": 0.4992, + "test_loss": 7.735134202575684, + "test_acc": 0.1244, + "lyapunov": null, + "grad_norm": 0.6458623734804945, + "grad_max_sv": 0.2287333384156227, + "grad_min_sv": 1.2116058153988085e-08, + "grad_condition": 23082329.335862808, + "lr": 3.5111757055874305e-05, + "time_sec": 49.84588980674744 + }, + { + "epoch": 133, + "train_loss": 1.811845332069397, + "train_acc": 0.50014, + "test_loss": 7.118609297180176, + "test_acc": 0.1331, + "lyapunov": null, + "grad_norm": 0.638841020277806, + "grad_max_sv": 0.21471160911023618, + "grad_min_sv": 1.1894429352565794e-08, + "grad_condition": 24148328.84591496, + "lr": 3.1359005254054254e-05, + "time_sec": 49.831459283828735 + }, + { + "epoch": 134, + "train_loss": 1.8001032112121582, + "train_acc": 0.50294, + "test_loss": 7.107429740142822, + "test_acc": 0.1282, + "lyapunov": null, + "grad_norm": 0.6464497671620558, + "grad_max_sv": 0.23182750679552555, + "grad_min_sv": 1.2161121044212964e-08, + "grad_condition": 54577461.874021314, + "lr": 2.7811814881259484e-05, + "time_sec": 49.83904433250427 + }, + { + "epoch": 135, + "train_loss": 1.7929331283569336, + "train_acc": 0.50366, + "test_loss": 7.344893767547608, + "test_acc": 0.1271, + "lyapunov": null, + "grad_norm": 0.6435222264694869, + "grad_max_sv": 0.2192435622215271, + "grad_min_sv": 1.2271505814287487e-08, + "grad_condition": 22236846.49951817, + "lr": 2.4471741852423218e-05, + "time_sec": 49.82794523239136 + }, + { + "epoch": 136, + "train_loss": 1.8045927509307862, + "train_acc": 0.49886, + "test_loss": 8.085471559143066, + "test_acc": 0.1207, + "lyapunov": null, + "grad_norm": 0.6382347842581513, + "grad_max_sv": 0.22427703253924847, + "grad_min_sv": 1.216163273837223e-08, + "grad_condition": 28207277.011594873, + "lr": 2.1340251233966362e-05, + "time_sec": 49.88175678253174 + }, + { + "epoch": 137, + "train_loss": 1.7832990637588502, + "train_acc": 0.50496, + "test_loss": 6.688453459167481, + "test_acc": 0.1334, + "lyapunov": null, + "grad_norm": 0.6418151086385053, + "grad_max_sv": 0.21794002875685692, + "grad_min_sv": 1.2034389010318058e-08, + "grad_condition": 22793569.96555335, + "lr": 1.8418716601170932e-05, + "time_sec": 49.84071898460388 + }, + { + "epoch": 138, + "train_loss": 1.7905620854187012, + "train_acc": 0.50572, + "test_loss": 7.2380154365539555, + "test_acc": 0.129, + "lyapunov": null, + "grad_norm": 0.6407824951102813, + "grad_max_sv": 0.22645330876111985, + "grad_min_sv": 1.2214871658589033e-08, + "grad_condition": 20569116.284954578, + "lr": 1.570841943568445e-05, + "time_sec": 49.84640121459961 + }, + { + "epoch": 139, + "train_loss": 1.788800776901245, + "train_acc": 0.50604, + "test_loss": 7.676028425598145, + "test_acc": 0.1308, + "lyapunov": null, + "grad_norm": 0.6393065831907885, + "grad_max_sv": 0.2201111435890198, + "grad_min_sv": 1.206703041933821e-08, + "grad_condition": 28068636.701712035, + "lr": 1.3210548563419845e-05, + "time_sec": 49.82333970069885 + }, + { + "epoch": 140, + "train_loss": 1.7775352002334595, + "train_acc": 0.50992, + "test_loss": 6.824903617858887, + "test_acc": 0.1382, + "lyapunov": null, + "grad_norm": 0.6429938723422318, + "grad_max_sv": 0.21460832096636295, + "grad_min_sv": 1.17411291786218e-08, + "grad_condition": 31960287.943684638, + "lr": 1.0926199633097203e-05, + "time_sec": 49.83107376098633 + }, + { + "epoch": 141, + "train_loss": 1.7772767013931274, + "train_acc": 0.50912, + "test_loss": 8.417906446838378, + "test_acc": 0.1201, + "lyapunov": null, + "grad_norm": 0.6414560412377437, + "grad_max_sv": 0.22789728231728076, + "grad_min_sv": 1.2347990069327964e-08, + "grad_condition": 21519591.2698054, + "lr": 8.856374635655688e-06, + "time_sec": 49.830055475234985 + }, + { + "epoch": 142, + "train_loss": 1.7722079333496095, + "train_acc": 0.5074, + "test_loss": 7.479126264190674, + "test_acc": 0.1332, + "lyapunov": null, + "grad_norm": 0.6492349389016402, + "grad_max_sv": 0.23224957659840584, + "grad_min_sv": 1.2359584963816949e-08, + "grad_condition": 23310731.56809649, + "lr": 7.001981464747503e-06, + "time_sec": 49.821824073791504 + }, + { + "epoch": 143, + "train_loss": 1.7706715833282471, + "train_acc": 0.50882, + "test_loss": 6.759830638885498, + "test_acc": 0.1312, + "lyapunov": null, + "grad_norm": 0.6386303224852788, + "grad_max_sv": 0.21973421648144723, + "grad_min_sv": 1.2129359658330508e-08, + "grad_condition": 22303453.162939433, + "lr": 5.3638335185058295e-06, + "time_sec": 49.82608699798584 + }, + { + "epoch": 144, + "train_loss": 1.770061126937866, + "train_acc": 0.51042, + "test_loss": 8.168591398620606, + "test_acc": 0.1265, + "lyapunov": null, + "grad_norm": 0.6443170070907279, + "grad_max_sv": 0.22507050447165966, + "grad_min_sv": 1.2152392936393141e-08, + "grad_condition": 22873019.852206793, + "lr": 3.942649342761114e-06, + "time_sec": 49.8205029964447 + }, + { + "epoch": 145, + "train_loss": 1.7649179027938844, + "train_acc": 0.509, + "test_loss": 7.854398386383057, + "test_acc": 0.1211, + "lyapunov": null, + "grad_norm": 0.63938639247204, + "grad_max_sv": 0.22039102129638194, + "grad_min_sv": 1.1966107968386375e-08, + "grad_condition": 29791248.29023991, + "lr": 2.7390523158633524e-06, + "time_sec": 49.8352313041687 + }, + { + "epoch": 146, + "train_loss": 1.771636342201233, + "train_acc": 0.50926, + "test_loss": 7.595294637298584, + "test_acc": 0.1263, + "lyapunov": null, + "grad_norm": 0.6439134858087602, + "grad_max_sv": 0.22073593139648437, + "grad_min_sv": 1.1903592189027589e-08, + "grad_condition": 36630674.258442916, + "lr": 1.7535703752478133e-06, + "time_sec": 49.85316801071167 + }, + { + "epoch": 147, + "train_loss": 1.7654109023666382, + "train_acc": 0.50992, + "test_loss": 7.858496125793457, + "test_acc": 0.1228, + "lyapunov": null, + "grad_norm": 0.6452120448477214, + "grad_max_sv": 0.21640395522117614, + "grad_min_sv": 1.1791314735720703e-08, + "grad_condition": 36184836.96072569, + "lr": 9.866357858642196e-07, + "time_sec": 49.80920720100403 + }, + { + "epoch": 148, + "train_loss": 1.76628436378479, + "train_acc": 0.50766, + "test_loss": 8.274021264648438, + "test_acc": 0.1088, + "lyapunov": null, + "grad_norm": 0.6448148716908921, + "grad_max_sv": 0.22330073527991773, + "grad_min_sv": 1.2051270137369841e-08, + "grad_condition": 21403660.781028073, + "lr": 4.38584950570808e-07, + "time_sec": 49.84639763832092 + }, + { + "epoch": 149, + "train_loss": 1.7641568323135377, + "train_acc": 0.50932, + "test_loss": 7.1706701782226565, + "test_acc": 0.1418, + "lyapunov": null, + "grad_norm": 0.6419761185100763, + "grad_max_sv": 0.22420972734689712, + "grad_min_sv": 1.2012330221494726e-08, + "grad_condition": 44951323.39984313, + "lr": 1.096582625772501e-07, + "time_sec": 49.835381269454956 + }, + { + "epoch": 150, + "train_loss": 1.7616498372650147, + "train_acc": 0.51152, + "test_loss": 7.837383623504639, + "test_acc": 0.1182, + "lyapunov": null, + "grad_norm": 0.6426676505435569, + "grad_max_sv": 0.21811567358672618, + "grad_min_sv": 1.1744335026014906e-08, + "grad_condition": 40653937.072005436, + "lr": 0.0, + "time_sec": 49.85364270210266 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 4.790666111755371, + "train_acc": 0.0165, + "test_loss": 4.9503300064086915, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 5.291697588876432, + "grad_max_sv": 4.663330984115601, + "grad_min_sv": 7.994122603882659e-08, + "grad_condition": 204227559.8068969, + "lr": 0.0009998903417374227, + "time_sec": 66.97809171676636 + }, + { + "epoch": 2, + "train_loss": 4.437635167236328, + "train_acc": 0.03372, + "test_loss": 4.9434486038208005, + "test_acc": 0.0109, + "lyapunov": null, + "grad_norm": 3.3795440241281205, + "grad_max_sv": 2.9110051512718202, + "grad_min_sv": 5.2089944511252154e-08, + "grad_condition": 566186137.812573, + "lr": 0.0009995614150494292, + "time_sec": 66.91377472877502 + }, + { + "epoch": 3, + "train_loss": 4.26833670211792, + "train_acc": 0.04816, + "test_loss": 4.993957643127441, + "test_acc": 0.0118, + "lyapunov": null, + "grad_norm": 2.265691942587348, + "grad_max_sv": 1.775827443599701, + "grad_min_sv": 3.447322165783806e-08, + "grad_condition": 193597124.56597418, + "lr": 0.0009990133642141358, + "time_sec": 66.95397591590881 + }, + { + "epoch": 4, + "train_loss": 4.126825766448975, + "train_acc": 0.0657, + "test_loss": 5.033058495330811, + "test_acc": 0.0133, + "lyapunov": null, + "grad_norm": 1.503639209245557, + "grad_max_sv": 0.996296688914299, + "grad_min_sv": 2.3224798484378083e-08, + "grad_condition": 47352815.280070126, + "lr": 0.0009982464296247522, + "time_sec": 66.94082856178284 + }, + { + "epoch": 5, + "train_loss": 4.033032944335938, + "train_acc": 0.07788, + "test_loss": 5.366096397399902, + "test_acc": 0.0146, + "lyapunov": null, + "grad_norm": 1.2167707155197347, + "grad_max_sv": 0.7315087422728539, + "grad_min_sv": 1.914776174977151e-08, + "grad_condition": 65647468.63073953, + "lr": 0.0009972609476841367, + "time_sec": 66.9649748802185 + }, + { + "epoch": 6, + "train_loss": 3.9636214042663576, + "train_acc": 0.08816, + "test_loss": 5.34757041015625, + "test_acc": 0.0149, + "lyapunov": null, + "grad_norm": 1.109160273746945, + "grad_max_sv": 0.6089150205254554, + "grad_min_sv": 1.7710445950058773e-08, + "grad_condition": 77884060.5331116, + "lr": 0.000996057350657239, + "time_sec": 66.97061657905579 + }, + { + "epoch": 7, + "train_loss": 3.9122159162902834, + "train_acc": 0.09544, + "test_loss": 5.439447886657715, + "test_acc": 0.013, + "lyapunov": null, + "grad_norm": 1.0363457541084344, + "grad_max_sv": 0.5376138880848884, + "grad_min_sv": 1.6374132377761085e-08, + "grad_condition": 48186425.879532695, + "lr": 0.000994636166481494, + "time_sec": 67.02947664260864 + }, + { + "epoch": 8, + "train_loss": 3.860605283126831, + "train_acc": 0.10604, + "test_loss": 5.774677875518798, + "test_acc": 0.0152, + "lyapunov": null, + "grad_norm": 0.9855402112805093, + "grad_max_sv": 0.5275192707777023, + "grad_min_sv": 1.6650217127267554e-08, + "grad_condition": 36767266.40486912, + "lr": 0.0009929980185352525, + "time_sec": 66.97124218940735 + }, + { + "epoch": 9, + "train_loss": 3.8149237147521973, + "train_acc": 0.11454, + "test_loss": 5.3070202072143555, + "test_acc": 0.0222, + "lyapunov": null, + "grad_norm": 0.9330412728543993, + "grad_max_sv": 0.4647836610674858, + "grad_min_sv": 1.5222168972539585e-08, + "grad_condition": 49307207.804101914, + "lr": 0.0009911436253643444, + "time_sec": 67.01966977119446 + }, + { + "epoch": 10, + "train_loss": 3.7818530071258545, + "train_acc": 0.12014, + "test_loss": 5.634545847320557, + "test_acc": 0.0199, + "lyapunov": null, + "grad_norm": 0.8719008089031304, + "grad_max_sv": 0.40649077892303465, + "grad_min_sv": 1.4515182727992126e-08, + "grad_condition": 38341756.409908436, + "lr": 0.0009890738003669028, + "time_sec": 67.23870015144348 + }, + { + "epoch": 11, + "train_loss": 3.743896211090088, + "train_acc": 0.12462, + "test_loss": 5.8831702270507815, + "test_acc": 0.0241, + "lyapunov": null, + "grad_norm": 0.8436698179223415, + "grad_max_sv": 0.39998230785131456, + "grad_min_sv": 1.4137996530785845e-08, + "grad_condition": 231359110.35725895, + "lr": 0.00098678945143658, + "time_sec": 67.23693895339966 + }, + { + "epoch": 12, + "train_loss": 3.7158116050720214, + "train_acc": 0.12962, + "test_loss": 5.8489625442504884, + "test_acc": 0.0182, + "lyapunov": null, + "grad_norm": 0.8103156188684312, + "grad_max_sv": 0.36918022111058235, + "grad_min_sv": 1.3637384886633352e-08, + "grad_condition": 38409273.56149448, + "lr": 0.0009842915805643154, + "time_sec": 67.05321264266968 + }, + { + "epoch": 13, + "train_loss": 3.690355722808838, + "train_acc": 0.13444, + "test_loss": 5.952298941802979, + "test_acc": 0.0139, + "lyapunov": null, + "grad_norm": 0.7799393076966175, + "grad_max_sv": 0.3450939729809761, + "grad_min_sv": 1.3063578439224261e-08, + "grad_condition": 267805312.78349906, + "lr": 0.000981581283398829, + "time_sec": 67.01498341560364 + }, + { + "epoch": 14, + "train_loss": 3.660913709640503, + "train_acc": 0.13974, + "test_loss": 5.962563812255859, + "test_acc": 0.0157, + "lyapunov": null, + "grad_norm": 0.7562346727823589, + "grad_max_sv": 0.3272464439272881, + "grad_min_sv": 1.2569073787327411e-08, + "grad_condition": 28603602.411010243, + "lr": 0.0009786597487660333, + "time_sec": 67.02658581733704 + }, + { + "epoch": 15, + "train_loss": 3.6474139246368407, + "train_acc": 0.14148, + "test_loss": 6.562283952331543, + "test_acc": 0.0135, + "lyapunov": null, + "grad_norm": 0.7393349403998549, + "grad_max_sv": 0.33356437757611274, + "grad_min_sv": 1.2411575255055763e-08, + "grad_condition": 43624327.61961842, + "lr": 0.0009755282581475766, + "time_sec": 67.03324222564697 + }, + { + "epoch": 16, + "train_loss": 3.625168949737549, + "train_acc": 0.1432, + "test_loss": 6.292130155944824, + "test_acc": 0.0141, + "lyapunov": null, + "grad_norm": 0.7144248820011195, + "grad_max_sv": 0.31020588912069796, + "grad_min_sv": 1.2080284056414925e-08, + "grad_condition": 29549483.252300274, + "lr": 0.0009721881851187403, + "time_sec": 66.97783041000366 + }, + { + "epoch": 17, + "train_loss": 3.597680552520752, + "train_acc": 0.14858, + "test_loss": 6.235865226745606, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.6905264720289787, + "grad_max_sv": 0.2911532886326313, + "grad_min_sv": 1.1886577161446255e-08, + "grad_condition": 31227215.280764975, + "lr": 0.0009686409947459456, + "time_sec": 67.08970355987549 + }, + { + "epoch": 18, + "train_loss": 3.5831439966583254, + "train_acc": 0.1503, + "test_loss": 5.975571099853515, + "test_acc": 0.0174, + "lyapunov": null, + "grad_norm": 0.6807202195385632, + "grad_max_sv": 0.28772652372717855, + "grad_min_sv": 1.1393226486029751e-08, + "grad_condition": 137655636.45168823, + "lr": 0.0009648882429441254, + "time_sec": 66.99836611747742 + }, + { + "epoch": 19, + "train_loss": 3.5665633306121824, + "train_acc": 0.15322, + "test_loss": 5.7967665618896485, + "test_acc": 0.0147, + "lyapunov": null, + "grad_norm": 0.6692239217191613, + "grad_max_sv": 0.289702807366848, + "grad_min_sv": 1.1524174722138403e-08, + "grad_condition": 43837157.90767797, + "lr": 0.00096093157579425, + "time_sec": 66.98469638824463 + }, + { + "epoch": 20, + "train_loss": 3.5485270121765136, + "train_acc": 0.15842, + "test_loss": 6.38743748626709, + "test_acc": 0.0106, + "lyapunov": null, + "grad_norm": 0.6524234858247975, + "grad_max_sv": 0.2710107877850533, + "grad_min_sv": 1.1343318032097648e-08, + "grad_condition": 27194748.912352692, + "lr": 0.0009567727288213001, + "time_sec": 66.97950530052185 + }, + { + "epoch": 21, + "train_loss": 3.5387647283172607, + "train_acc": 0.15974, + "test_loss": 6.142497198486328, + "test_acc": 0.0122, + "lyapunov": null, + "grad_norm": 0.6404971752730705, + "grad_max_sv": 0.25612146519124507, + "grad_min_sv": 1.1065940866417101e-08, + "grad_condition": 27020698.902072392, + "lr": 0.0009524135262330095, + "time_sec": 67.06527757644653 + }, + { + "epoch": 22, + "train_loss": 3.5167810900115968, + "train_acc": 0.16126, + "test_loss": 5.6688673957824705, + "test_acc": 0.0192, + "lyapunov": null, + "grad_norm": 0.6273838486372684, + "grad_max_sv": 0.253273681178689, + "grad_min_sv": 1.0633086347869302e-08, + "grad_condition": 63663927.521495186, + "lr": 0.0009478558801197061, + "time_sec": 67.08625936508179 + }, + { + "epoch": 23, + "train_loss": 3.505348560180664, + "train_acc": 0.16408, + "test_loss": 6.704450527191162, + "test_acc": 0.0106, + "lyapunov": null, + "grad_norm": 0.6205013434735249, + "grad_max_sv": 0.24795704074203967, + "grad_min_sv": 1.0544875683748956e-08, + "grad_condition": 26930900.301938236, + "lr": 0.000943101789615607, + "time_sec": 67.07537865638733 + }, + { + "epoch": 24, + "train_loss": 3.487646808624268, + "train_acc": 0.16852, + "test_loss": 6.14088282699585, + "test_acc": 0.0215, + "lyapunov": null, + "grad_norm": 0.614195126220202, + "grad_max_sv": 0.24658647775650025, + "grad_min_sv": 1.0614721224211365e-08, + "grad_condition": 25409602.645818073, + "lr": 0.0009381533400219313, + "time_sec": 67.04035305976868 + }, + { + "epoch": 25, + "train_loss": 3.476624384918213, + "train_acc": 0.16722, + "test_loss": 6.3985797378540035, + "test_acc": 0.0153, + "lyapunov": null, + "grad_norm": 0.6065663518942211, + "grad_max_sv": 0.24001154042780398, + "grad_min_sv": 1.0449337081719356e-08, + "grad_condition": 26892625.00106412, + "lr": 0.0009330127018922189, + "time_sec": 66.98434329032898 + }, + { + "epoch": 26, + "train_loss": 3.451528890914917, + "train_acc": 0.17194, + "test_loss": 7.005337218475342, + "test_acc": 0.0161, + "lyapunov": null, + "grad_norm": 0.5958316341461533, + "grad_max_sv": 0.23011010847985744, + "grad_min_sv": 1.0420057322546583e-08, + "grad_condition": 25092916.983647533, + "lr": 0.000927682130080253, + "time_sec": 67.00863981246948 + }, + { + "epoch": 27, + "train_loss": 3.438732011184692, + "train_acc": 0.17512, + "test_loss": 6.713776673126221, + "test_acc": 0.0158, + "lyapunov": null, + "grad_norm": 0.5885432606585439, + "grad_max_sv": 0.22313685715198517, + "grad_min_sv": 1.0256330273961112e-08, + "grad_condition": 25498257.67463268, + "lr": 0.0009221639627510072, + "time_sec": 66.99373292922974 + }, + { + "epoch": 28, + "train_loss": 3.425728820877075, + "train_acc": 0.17648, + "test_loss": 6.706079711914063, + "test_acc": 0.0161, + "lyapunov": null, + "grad_norm": 0.5776306796513797, + "grad_max_sv": 0.21763003207743167, + "grad_min_sv": 1.0131521277489953e-08, + "grad_condition": 25502860.727228213, + "lr": 0.0009164606203550494, + "time_sec": 66.99960255622864 + }, + { + "epoch": 29, + "train_loss": 3.415288860321045, + "train_acc": 0.18104, + "test_loss": 7.00422691116333, + "test_acc": 0.0154, + "lyapunov": null, + "grad_norm": 0.5811456709025584, + "grad_max_sv": 0.2154564827680588, + "grad_min_sv": 1.0227832727971453e-08, + "grad_condition": 23155291.155594237, + "lr": 0.0009105746045668516, + "time_sec": 67.00278520584106 + }, + { + "epoch": 30, + "train_loss": 3.3993768449401855, + "train_acc": 0.18168, + "test_loss": 6.7661912048339845, + "test_acc": 0.0159, + "lyapunov": null, + "grad_norm": 0.5774334611780905, + "grad_max_sv": 0.21602067165076733, + "grad_min_sv": 9.999383252662363e-09, + "grad_condition": 46830102.49335132, + "lr": 0.0009045084971874733, + "time_sec": 67.01802110671997 + }, + { + "epoch": 31, + "train_loss": 3.39102335395813, + "train_acc": 0.183, + "test_loss": 6.575534628295898, + "test_acc": 0.0259, + "lyapunov": null, + "grad_norm": 0.5750391869831528, + "grad_max_sv": 0.21328589245676993, + "grad_min_sv": 1.0037052611266972e-08, + "grad_condition": 25219793.844095282, + "lr": 0.0008982649590120977, + "time_sec": 66.98685121536255 + }, + { + "epoch": 32, + "train_loss": 3.3709024705505373, + "train_acc": 0.1847, + "test_loss": 6.773156211090088, + "test_acc": 0.0241, + "lyapunov": null, + "grad_norm": 0.5682008127495727, + "grad_max_sv": 0.20905940011143684, + "grad_min_sv": 9.929261479690864e-09, + "grad_condition": 24026442.614084087, + "lr": 0.0008918467286629196, + "time_sec": 66.98118853569031 + }, + { + "epoch": 33, + "train_loss": 3.35322883605957, + "train_acc": 0.19048, + "test_loss": 6.544390415191651, + "test_acc": 0.0174, + "lyapunov": null, + "grad_norm": 0.5641011790857979, + "grad_max_sv": 0.21131759136915207, + "grad_min_sv": 9.970292436448092e-09, + "grad_condition": 108439933.80954358, + "lr": 0.0008852566213878943, + "time_sec": 67.0021116733551 + }, + { + "epoch": 34, + "train_loss": 3.346888256225586, + "train_acc": 0.1906, + "test_loss": 6.572783890533447, + "test_acc": 0.0249, + "lyapunov": null, + "grad_norm": 0.5631657519504247, + "grad_max_sv": 0.20612632147967816, + "grad_min_sv": 9.939895384558639e-09, + "grad_condition": 27859013.00420784, + "lr": 0.000878497527825878, + "time_sec": 66.99292349815369 + }, + { + "epoch": 35, + "train_loss": 3.3364852532958986, + "train_acc": 0.19192, + "test_loss": 6.624941380310059, + "test_acc": 0.0267, + "lyapunov": null, + "grad_norm": 0.5605769760458655, + "grad_max_sv": 0.20491612255573272, + "grad_min_sv": 9.870486683549728e-09, + "grad_condition": 23146292.907969765, + "lr": 0.000871572412738697, + "time_sec": 66.99680066108704 + }, + { + "epoch": 36, + "train_loss": 3.3320838648986815, + "train_acc": 0.19194, + "test_loss": 6.509025389099121, + "test_acc": 0.0338, + "lyapunov": null, + "grad_norm": 0.5514752672797416, + "grad_max_sv": 0.19631769321858883, + "grad_min_sv": 9.801347783389147e-09, + "grad_condition": 22925424.744912885, + "lr": 0.0008644843137107055, + "time_sec": 67.00271224975586 + }, + { + "epoch": 37, + "train_loss": 3.3248722314453123, + "train_acc": 0.19368, + "test_loss": 6.660050495910644, + "test_acc": 0.0232, + "lyapunov": null, + "grad_norm": 0.5549782000253485, + "grad_max_sv": 0.20016637705266477, + "grad_min_sv": 9.80520761806325e-09, + "grad_condition": 43150496.42441137, + "lr": 0.0008572363398164014, + "time_sec": 67.00392818450928 + }, + { + "epoch": 38, + "train_loss": 3.3040303685760497, + "train_acc": 0.1978, + "test_loss": 6.438115409851074, + "test_acc": 0.0278, + "lyapunov": null, + "grad_norm": 0.552679160616354, + "grad_max_sv": 0.20150073878467084, + "grad_min_sv": 9.978901688301178e-09, + "grad_condition": 24404614.851154737, + "lr": 0.0008498316702566826, + "time_sec": 66.97884392738342 + }, + { + "epoch": 39, + "train_loss": 3.295093801422119, + "train_acc": 0.2004, + "test_loss": 6.857768655395508, + "test_acc": 0.0356, + "lyapunov": null, + "grad_norm": 0.5456414300888803, + "grad_max_sv": 0.19542820267379285, + "grad_min_sv": 9.64108341980352e-09, + "grad_condition": 38418267.99625971, + "lr": 0.0008422735529643442, + "time_sec": 66.989262342453 + }, + { + "epoch": 40, + "train_loss": 3.2807973724365236, + "train_acc": 0.20254, + "test_loss": 7.183624605560302, + "test_acc": 0.0288, + "lyapunov": null, + "grad_norm": 0.5502236317298648, + "grad_max_sv": 0.20073941312730312, + "grad_min_sv": 9.736421222039659e-09, + "grad_condition": 23971099.963185668, + "lr": 0.0008345653031794289, + "time_sec": 67.05479025840759 + }, + { + "epoch": 41, + "train_loss": 3.27089994934082, + "train_acc": 0.20396, + "test_loss": 7.336966199493408, + "test_acc": 0.0235, + "lyapunov": null, + "grad_norm": 0.5476662910413355, + "grad_max_sv": 0.19763046652078628, + "grad_min_sv": 9.775574641435192e-09, + "grad_condition": 23640934.778466806, + "lr": 0.0008267103019950526, + "time_sec": 67.02259588241577 + }, + { + "epoch": 42, + "train_loss": 3.2620423323059082, + "train_acc": 0.20586, + "test_loss": 6.97865482788086, + "test_acc": 0.0258, + "lyapunov": null, + "grad_norm": 0.5434507884263167, + "grad_max_sv": 0.19267416559159756, + "grad_min_sv": 9.676590862622846e-09, + "grad_condition": 32692140.861607928, + "lr": 0.0008187119948743447, + "time_sec": 67.11938738822937 + }, + { + "epoch": 43, + "train_loss": 3.246746938018799, + "train_acc": 0.20984, + "test_loss": 7.017108020019531, + "test_acc": 0.027, + "lyapunov": null, + "grad_norm": 0.5396772430481056, + "grad_max_sv": 0.1911445375531912, + "grad_min_sv": 9.706909992468482e-09, + "grad_condition": 22347408.62738797, + "lr": 0.000810573890139155, + "time_sec": 67.11671566963196 + }, + { + "epoch": 44, + "train_loss": 3.2492278230285643, + "train_acc": 0.20804, + "test_loss": 6.893268182373047, + "test_acc": 0.0274, + "lyapunov": null, + "grad_norm": 0.5383084022428465, + "grad_max_sv": 0.18535939790308475, + "grad_min_sv": 9.539425227522713e-09, + "grad_condition": 74582506.47418927, + "lr": 0.0008022995574311873, + "time_sec": 67.00796937942505 + }, + { + "epoch": 45, + "train_loss": 3.2271074884796143, + "train_acc": 0.2125, + "test_loss": 6.6321695571899415, + "test_acc": 0.0298, + "lyapunov": null, + "grad_norm": 0.5350882941371298, + "grad_max_sv": 0.18614536896348, + "grad_min_sv": 9.520675481561152e-09, + "grad_condition": 519972815.1749519, + "lr": 0.0007938926261462363, + "time_sec": 67.05224251747131 + }, + { + "epoch": 46, + "train_loss": 3.223205012207031, + "train_acc": 0.21378, + "test_loss": 8.111690937805175, + "test_acc": 0.0245, + "lyapunov": null, + "grad_norm": 0.5313315491107766, + "grad_max_sv": 0.18769054301083088, + "grad_min_sv": 9.561545546987737e-09, + "grad_condition": 22558726.834869802, + "lr": 0.0007853567838422158, + "time_sec": 67.02692914009094 + }, + { + "epoch": 47, + "train_loss": 3.2102231874084475, + "train_acc": 0.21366, + "test_loss": 7.20476734161377, + "test_acc": 0.0268, + "lyapunov": null, + "grad_norm": 0.5300596779522426, + "grad_max_sv": 0.18552429899573325, + "grad_min_sv": 9.575782686233047e-09, + "grad_condition": 21495882.964656584, + "lr": 0.0007766957746216719, + "time_sec": 67.0929958820343 + }, + { + "epoch": 48, + "train_loss": 3.202328568191528, + "train_acc": 0.21738, + "test_loss": 7.143350020599366, + "test_acc": 0.0275, + "lyapunov": null, + "grad_norm": 0.5275781384357864, + "grad_max_sv": 0.18636706620454788, + "grad_min_sv": 9.551907610705345e-09, + "grad_condition": 33257654.14790963, + "lr": 0.0007679133974894982, + "time_sec": 67.10289525985718 + }, + { + "epoch": 49, + "train_loss": 3.1964333237457274, + "train_acc": 0.21696, + "test_loss": 7.0859999771118165, + "test_acc": 0.0354, + "lyapunov": null, + "grad_norm": 0.5290459768999093, + "grad_max_sv": 0.18547305800020694, + "grad_min_sv": 9.539052431978278e-09, + "grad_condition": 34652740.14328016, + "lr": 0.000759013504686565, + "time_sec": 67.11912679672241 + }, + { + "epoch": 50, + "train_loss": 3.1868507556152346, + "train_acc": 0.2195, + "test_loss": 7.204959943389893, + "test_acc": 0.0247, + "lyapunov": null, + "grad_norm": 0.5304998310773968, + "grad_max_sv": 0.1833030626177788, + "grad_min_sv": 9.589407306935527e-09, + "grad_condition": 93768948.14927751, + "lr": 0.0007499999999999998, + "time_sec": 67.06959462165833 + }, + { + "epoch": 51, + "train_loss": 3.1883190923309326, + "train_acc": 0.21784, + "test_loss": 7.328389108276367, + "test_acc": 0.0303, + "lyapunov": null, + "grad_norm": 0.5248467282170762, + "grad_max_sv": 0.18131516128778458, + "grad_min_sv": 9.465690375617952e-09, + "grad_condition": 47668215.59636396, + "lr": 0.0007408768370508575, + "time_sec": 67.01846742630005 + }, + { + "epoch": 52, + "train_loss": 3.1719473053741454, + "train_acc": 0.22166, + "test_loss": 8.36594852142334, + "test_acc": 0.025, + "lyapunov": null, + "grad_norm": 0.5248103969653446, + "grad_max_sv": 0.17532115392386913, + "grad_min_sv": 9.532304753867572e-09, + "grad_condition": 26041874.469802074, + "lr": 0.0007316480175599307, + "time_sec": 67.03516387939453 + }, + { + "epoch": 53, + "train_loss": 3.1698596488952635, + "train_acc": 0.22132, + "test_loss": 8.36387837677002, + "test_acc": 0.0251, + "lyapunov": null, + "grad_norm": 0.5233372908286834, + "grad_max_sv": 0.17466790974140167, + "grad_min_sv": 9.286205268632663e-09, + "grad_condition": 21363168.099911686, + "lr": 0.0007223175895924635, + "time_sec": 67.02187657356262 + }, + { + "epoch": 54, + "train_loss": 3.152655903167725, + "train_acc": 0.22722, + "test_loss": 8.196963485717774, + "test_acc": 0.0261, + "lyapunov": null, + "grad_norm": 0.5285400405038103, + "grad_max_sv": 0.17916450947523116, + "grad_min_sv": 9.4594759324218e-09, + "grad_condition": 82291006.99579689, + "lr": 0.0007128896457825361, + "time_sec": 66.97509050369263 + }, + { + "epoch": 55, + "train_loss": 3.1408946729278564, + "train_acc": 0.22896, + "test_loss": 8.031216970825195, + "test_acc": 0.0238, + "lyapunov": null, + "grad_norm": 0.5251164499697153, + "grad_max_sv": 0.17466633953154087, + "grad_min_sv": 9.452194638104316e-09, + "grad_condition": 22653052.01456701, + "lr": 0.0007033683215378998, + "time_sec": 67.00176858901978 + }, + { + "epoch": 56, + "train_loss": 3.1348105377960205, + "train_acc": 0.22832, + "test_loss": 8.950087960815429, + "test_acc": 0.0204, + "lyapunov": null, + "grad_norm": 0.5200008300943049, + "grad_max_sv": 0.17119008600711821, + "grad_min_sv": 9.414464659240895e-09, + "grad_condition": 31689823.38588159, + "lr": 0.0006937577932260512, + "time_sec": 66.97579646110535 + }, + { + "epoch": 57, + "train_loss": 3.1169134953308104, + "train_acc": 0.23282, + "test_loss": 8.065475146484374, + "test_acc": 0.0311, + "lyapunov": null, + "grad_norm": 0.5241244870526487, + "grad_max_sv": 0.17154259756207466, + "grad_min_sv": 9.529985643685902e-09, + "grad_condition": 28312826.48374013, + "lr": 0.0006840622763423388, + "time_sec": 66.9856812953949 + }, + { + "epoch": 58, + "train_loss": 3.1234397563171385, + "train_acc": 0.22962, + "test_loss": 8.583345112609864, + "test_acc": 0.0222, + "lyapunov": null, + "grad_norm": 0.5197452718406793, + "grad_max_sv": 0.17415275909006595, + "grad_min_sv": 9.31348687893685e-09, + "grad_condition": 21270072.13306666, + "lr": 0.0006742860236609073, + "time_sec": 66.99910068511963 + }, + { + "epoch": 59, + "train_loss": 3.1087922663879395, + "train_acc": 0.23302, + "test_loss": 8.37566005859375, + "test_acc": 0.0239, + "lyapunov": null, + "grad_norm": 0.5182628480059946, + "grad_max_sv": 0.17543886601924896, + "grad_min_sv": 9.358361164474304e-09, + "grad_condition": 31647391.583267204, + "lr": 0.0006644333233692913, + "time_sec": 66.97189855575562 + }, + { + "epoch": 60, + "train_loss": 3.0956507678985594, + "train_acc": 0.23662, + "test_loss": 7.7532292655944826, + "test_acc": 0.0248, + "lyapunov": null, + "grad_norm": 0.5195814358053482, + "grad_max_sv": 0.1776260558515787, + "grad_min_sv": 9.643665624392561e-09, + "grad_condition": 22666276.356990974, + "lr": 0.0006545084971874734, + "time_sec": 67.00041198730469 + }, + { + "epoch": 61, + "train_loss": 3.092038777694702, + "train_acc": 0.23596, + "test_loss": 7.946604266357422, + "test_acc": 0.0245, + "lyapunov": null, + "grad_norm": 0.5196921425232948, + "grad_max_sv": 0.17445886991918086, + "grad_min_sv": 9.508607204389285e-09, + "grad_condition": 21427055.017691903, + "lr": 0.0006445158984722354, + "time_sec": 67.06589937210083 + }, + { + "epoch": 62, + "train_loss": 3.079979831466675, + "train_acc": 0.23898, + "test_loss": 9.319492291259765, + "test_acc": 0.0213, + "lyapunov": null, + "grad_norm": 0.5186454829421666, + "grad_max_sv": 0.16986236572265626, + "grad_min_sv": 9.32054670874094e-09, + "grad_condition": 31246817.26616311, + "lr": 0.0006344599103076324, + "time_sec": 66.99018096923828 + }, + { + "epoch": 63, + "train_loss": 3.0727787420654296, + "train_acc": 0.23906, + "test_loss": 8.948303262329102, + "test_acc": 0.0269, + "lyapunov": null, + "grad_norm": 0.5175233947350019, + "grad_max_sv": 0.16513913124799728, + "grad_min_sv": 9.338011380810585e-09, + "grad_condition": 24005876.4941143, + "lr": 0.0006243449435824269, + "time_sec": 66.9405734539032 + }, + { + "epoch": 64, + "train_loss": 3.074298862915039, + "train_acc": 0.23708, + "test_loss": 9.195949301147461, + "test_acc": 0.0262, + "lyapunov": null, + "grad_norm": 0.5221855467062518, + "grad_max_sv": 0.17083160430192948, + "grad_min_sv": 9.452190228090296e-09, + "grad_condition": 48343788.07302423, + "lr": 0.0006141754350553275, + "time_sec": 67.0041880607605 + }, + { + "epoch": 65, + "train_loss": 3.0613560808563234, + "train_acc": 0.24008, + "test_loss": 8.735752813720703, + "test_acc": 0.0271, + "lyapunov": null, + "grad_norm": 0.5207095947451149, + "grad_max_sv": 0.1693739652633667, + "grad_min_sv": 9.425346239599897e-09, + "grad_condition": 23106579.847053923, + "lr": 0.0006039558454088793, + "time_sec": 66.9728434085846 + }, + { + "epoch": 66, + "train_loss": 3.050594620132446, + "train_acc": 0.243, + "test_loss": 8.672268884277344, + "test_acc": 0.0298, + "lyapunov": null, + "grad_norm": 0.5161820441185401, + "grad_max_sv": 0.1685989484190941, + "grad_min_sv": 9.325516864278071e-09, + "grad_condition": 20646125.746492933, + "lr": 0.000593690657292862, + "time_sec": 66.97670912742615 + }, + { + "epoch": 67, + "train_loss": 3.0404045782470703, + "train_acc": 0.2468, + "test_loss": 9.001078883361817, + "test_acc": 0.0227, + "lyapunov": null, + "grad_norm": 0.5184119200981759, + "grad_max_sv": 0.1701225485652685, + "grad_min_sv": 9.472868531257284e-09, + "grad_condition": 23517656.45251561, + "lr": 0.0005833843733580507, + "time_sec": 66.96425604820251 + }, + { + "epoch": 68, + "train_loss": 3.0347717694091796, + "train_acc": 0.24578, + "test_loss": 8.55764455871582, + "test_acc": 0.0204, + "lyapunov": null, + "grad_norm": 0.5177787618737804, + "grad_max_sv": 0.17245440557599068, + "grad_min_sv": 9.351008802005456e-09, + "grad_condition": 26504498.6419156, + "lr": 0.0005730415142812054, + "time_sec": 66.987557888031 + }, + { + "epoch": 69, + "train_loss": 3.0343177091979983, + "train_acc": 0.24472, + "test_loss": 8.6480171875, + "test_acc": 0.0252, + "lyapunov": null, + "grad_norm": 0.5144704452610198, + "grad_max_sv": 0.16564900018274784, + "grad_min_sv": 9.403833016452534e-09, + "grad_condition": 27296778.54875686, + "lr": 0.0005626666167821517, + "time_sec": 66.97946643829346 + }, + { + "epoch": 70, + "train_loss": 3.019142656097412, + "train_acc": 0.25006, + "test_loss": 8.915339315795899, + "test_acc": 0.0291, + "lyapunov": null, + "grad_norm": 0.5199788677371252, + "grad_max_sv": 0.16652515456080436, + "grad_min_sv": 9.64339011144677e-09, + "grad_condition": 23020050.410736304, + "lr": 0.0005522642316338265, + "time_sec": 66.97834086418152 + }, + { + "epoch": 71, + "train_loss": 3.0120436127471923, + "train_acc": 0.25124, + "test_loss": 9.489800686645507, + "test_acc": 0.0229, + "lyapunov": null, + "grad_norm": 0.5170392758240284, + "grad_max_sv": 0.16549308113753797, + "grad_min_sv": 9.466763362109277e-09, + "grad_condition": 23186013.564122196, + "lr": 0.0005418389216661573, + "time_sec": 66.98612070083618 + }, + { + "epoch": 72, + "train_loss": 3.005094768676758, + "train_acc": 0.25262, + "test_loss": 9.240029809570313, + "test_acc": 0.0228, + "lyapunov": null, + "grad_norm": 0.5193656479358113, + "grad_max_sv": 0.16801112554967404, + "grad_min_sv": 9.608471449040756e-09, + "grad_condition": 72045711.1919595, + "lr": 0.0005313952597646563, + "time_sec": 66.99170446395874 + }, + { + "epoch": 73, + "train_loss": 2.9903506928253174, + "train_acc": 0.25404, + "test_loss": 9.075869140625, + "test_acc": 0.0255, + "lyapunov": null, + "grad_norm": 0.517195719023633, + "grad_max_sv": 0.16475822702050208, + "grad_min_sv": 9.421488161853731e-09, + "grad_condition": 20088448.14143536, + "lr": 0.0005209378268645994, + "time_sec": 66.99337768554688 + }, + { + "epoch": 74, + "train_loss": 2.9886431184387208, + "train_acc": 0.25206, + "test_loss": 8.946782205200195, + "test_acc": 0.0216, + "lyapunov": null, + "grad_norm": 0.5156132053442515, + "grad_max_sv": 0.1671187650412321, + "grad_min_sv": 9.546754539679903e-09, + "grad_condition": 20526453.312863432, + "lr": 0.0005104712099416781, + "time_sec": 66.97370409965515 + }, + { + "epoch": 75, + "train_loss": 2.978247420654297, + "train_acc": 0.25748, + "test_loss": 8.795244805908203, + "test_acc": 0.0265, + "lyapunov": null, + "grad_norm": 0.5172367229977752, + "grad_max_sv": 0.16712253615260125, + "grad_min_sv": 9.516156018046784e-09, + "grad_condition": 30249731.938419342, + "lr": 0.0004999999999999996, + "time_sec": 67.0042519569397 + }, + { + "epoch": 76, + "train_loss": 2.975222046432495, + "train_acc": 0.2575, + "test_loss": 7.9467042022705074, + "test_acc": 0.0274, + "lyapunov": null, + "grad_norm": 0.5205213451239863, + "grad_max_sv": 0.16927127800881864, + "grad_min_sv": 9.570786241308582e-09, + "grad_condition": 21297706.844217338, + "lr": 0.0004895287900583212, + "time_sec": 66.98396968841553 + }, + { + "epoch": 77, + "train_loss": 2.9694722108459475, + "train_acc": 0.25688, + "test_loss": 8.63839992980957, + "test_acc": 0.027, + "lyapunov": null, + "grad_norm": 0.5171656548088565, + "grad_max_sv": 0.16773934625089168, + "grad_min_sv": 9.45730138160461e-09, + "grad_condition": 53792449.33116071, + "lr": 0.0004790621731353997, + "time_sec": 67.06471967697144 + }, + { + "epoch": 78, + "train_loss": 2.954387292098999, + "train_acc": 0.26136, + "test_loss": 8.785921076965332, + "test_acc": 0.0231, + "lyapunov": null, + "grad_norm": 0.5158257600732294, + "grad_max_sv": 0.16913142390549182, + "grad_min_sv": 9.432701836287194e-09, + "grad_condition": 22764076.692523666, + "lr": 0.000468604740235343, + "time_sec": 66.98979210853577 + }, + { + "epoch": 79, + "train_loss": 2.951801152191162, + "train_acc": 0.26352, + "test_loss": 8.070646887207031, + "test_acc": 0.0255, + "lyapunov": null, + "grad_norm": 0.5174682191745558, + "grad_max_sv": 0.16524536907672882, + "grad_min_sv": 9.502134473704515e-09, + "grad_condition": 19794117.95628558, + "lr": 0.00045816107833384175, + "time_sec": 67.00397682189941 + }, + { + "epoch": 80, + "train_loss": 2.945303405151367, + "train_acc": 0.25934, + "test_loss": 8.538162045288086, + "test_acc": 0.0261, + "lyapunov": null, + "grad_norm": 0.5164921536500987, + "grad_max_sv": 0.16473788283765317, + "grad_min_sv": 9.313295684654222e-09, + "grad_condition": 20076070.15299391, + "lr": 0.0004477357683661729, + "time_sec": 66.99750208854675 + }, + { + "epoch": 81, + "train_loss": 2.9330507093811033, + "train_acc": 0.26472, + "test_loss": 9.089803251647949, + "test_acc": 0.0256, + "lyapunov": null, + "grad_norm": 0.5182949552264074, + "grad_max_sv": 0.16235619597136974, + "grad_min_sv": 9.617397696282115e-09, + "grad_condition": 30543590.097258378, + "lr": 0.00043733338321784746, + "time_sec": 66.96942782402039 + }, + { + "epoch": 82, + "train_loss": 2.931871794204712, + "train_acc": 0.26478, + "test_loss": 9.64152674560547, + "test_acc": 0.0219, + "lyapunov": null, + "grad_norm": 0.5176276155464238, + "grad_max_sv": 0.16380822993814945, + "grad_min_sv": 9.444439504069369e-09, + "grad_condition": 55360326.762117185, + "lr": 0.0004269584857187939, + "time_sec": 66.98204827308655 + }, + { + "epoch": 83, + "train_loss": 2.9243045820617675, + "train_acc": 0.2654, + "test_loss": 8.998370599365234, + "test_acc": 0.0286, + "lyapunov": null, + "grad_norm": 0.5221359210821417, + "grad_max_sv": 0.16723665855824948, + "grad_min_sv": 9.730227464033181e-09, + "grad_condition": 37510081.93776859, + "lr": 0.0004166156266419484, + "time_sec": 67.03800463676453 + }, + { + "epoch": 84, + "train_loss": 2.910555010223389, + "train_acc": 0.26936, + "test_loss": 9.721973526000976, + "test_acc": 0.0313, + "lyapunov": null, + "grad_norm": 0.519552420362012, + "grad_max_sv": 0.16508992463350297, + "grad_min_sv": 9.647469361231953e-09, + "grad_condition": 55059867.79942672, + "lr": 0.0004063093427071373, + "time_sec": 67.02205467224121 + }, + { + "epoch": 85, + "train_loss": 2.908977954711914, + "train_acc": 0.26772, + "test_loss": 9.513397438049317, + "test_acc": 0.0262, + "lyapunov": null, + "grad_norm": 0.5225336336313486, + "grad_max_sv": 0.1674807954579592, + "grad_min_sv": 9.611194474665185e-09, + "grad_condition": 61660610.28358656, + "lr": 0.0003960441545911199, + "time_sec": 66.98397827148438 + }, + { + "epoch": 86, + "train_loss": 2.9070045388793946, + "train_acc": 0.26946, + "test_loss": 9.42815225982666, + "test_acc": 0.0253, + "lyapunov": null, + "grad_norm": 0.5163838704970162, + "grad_max_sv": 0.15979891866445542, + "grad_min_sv": 9.371719027900793e-09, + "grad_condition": 27067310.492935486, + "lr": 0.0003858245649446718, + "time_sec": 67.00940752029419 + }, + { + "epoch": 87, + "train_loss": 2.8997818164825437, + "train_acc": 0.27182, + "test_loss": 9.99990376586914, + "test_acc": 0.0235, + "lyapunov": null, + "grad_norm": 0.5185938331206461, + "grad_max_sv": 0.1670172270387411, + "grad_min_sv": 9.72940567521563e-09, + "grad_condition": 41690290.30450606, + "lr": 0.00037565505641757235, + "time_sec": 66.98136639595032 + }, + { + "epoch": 88, + "train_loss": 2.8861678593444826, + "train_acc": 0.27088, + "test_loss": 9.440834574890136, + "test_acc": 0.0223, + "lyapunov": null, + "grad_norm": 0.5210845021802476, + "grad_max_sv": 0.16573623865842818, + "grad_min_sv": 9.66025861803832e-09, + "grad_condition": 21401152.005565703, + "lr": 0.00036554008969236695, + "time_sec": 66.97698450088501 + }, + { + "epoch": 89, + "train_loss": 2.879338860092163, + "train_acc": 0.2741, + "test_loss": 9.169851208496095, + "test_acc": 0.0199, + "lyapunov": null, + "grad_norm": 0.5207447841157706, + "grad_max_sv": 0.16667181067168713, + "grad_min_sv": 9.689165991755289e-09, + "grad_condition": 26973958.650769584, + "lr": 0.0003554841015277638, + "time_sec": 67.01995515823364 + }, + { + "epoch": 90, + "train_loss": 2.8748147813415525, + "train_acc": 0.27324, + "test_loss": 10.077813652038575, + "test_acc": 0.022, + "lyapunov": null, + "grad_norm": 0.5199671563562479, + "grad_max_sv": 0.16343193501234055, + "grad_min_sv": 9.647999926754025e-09, + "grad_condition": 21023683.920218416, + "lr": 0.000345491502812526, + "time_sec": 67.06868648529053 + }, + { + "epoch": 91, + "train_loss": 2.8696892933654787, + "train_acc": 0.27466, + "test_loss": 9.565517497253419, + "test_acc": 0.0229, + "lyapunov": null, + "grad_norm": 0.5208386545074176, + "grad_max_sv": 0.16384688578546047, + "grad_min_sv": 9.741156603571e-09, + "grad_condition": 20234282.31156399, + "lr": 0.0003355666766307081, + "time_sec": 67.05189514160156 + }, + { + "epoch": 92, + "train_loss": 2.8643893748474123, + "train_acc": 0.27506, + "test_loss": 9.676446484375, + "test_acc": 0.0222, + "lyapunov": null, + "grad_norm": 0.5227536692673017, + "grad_max_sv": 0.16562484614551068, + "grad_min_sv": 9.696238559286918e-09, + "grad_condition": 19364268.060319778, + "lr": 0.00032571397633909225, + "time_sec": 67.04055285453796 + }, + { + "epoch": 93, + "train_loss": 2.9157111973571777, + "train_acc": 0.2694, + "test_loss": 10.502802850341796, + "test_acc": 0.016, + "lyapunov": null, + "grad_norm": 0.5304583427147314, + "grad_max_sv": 0.16479565128684043, + "grad_min_sv": 9.75800383412606e-09, + "grad_condition": 23919445.487485204, + "lr": 0.00031593772365766094, + "time_sec": 67.07202672958374 + }, + { + "epoch": 94, + "train_loss": 3.5718225437927247, + "train_acc": 0.14984, + "test_loss": 8.342486605834962, + "test_acc": 0.0173, + "lyapunov": null, + "grad_norm": 0.47865396629415263, + "grad_max_sv": 0.146741402707994, + "grad_min_sv": 8.774483893636553e-09, + "grad_condition": 22076860.426247958, + "lr": 0.0003062422067739483, + "time_sec": 66.99063777923584 + }, + { + "epoch": 95, + "train_loss": 3.3590557197570803, + "train_acc": 0.18824, + "test_loss": 9.117096383666992, + "test_acc": 0.018, + "lyapunov": null, + "grad_norm": 0.47849958749977733, + "grad_max_sv": 0.14531232379376888, + "grad_min_sv": 8.800075565473798e-09, + "grad_condition": 21940629.92360129, + "lr": 0.00029663167846209965, + "time_sec": 66.97514224052429 + }, + { + "epoch": 96, + "train_loss": 3.2702466972351076, + "train_acc": 0.2019, + "test_loss": 9.76727836151123, + "test_acc": 0.0196, + "lyapunov": null, + "grad_norm": 0.47937534710610474, + "grad_max_sv": 0.14464113656431438, + "grad_min_sv": 8.792039801926166e-09, + "grad_condition": 89660660.43121836, + "lr": 0.00028711035421746345, + "time_sec": 66.99873089790344 + }, + { + "epoch": 97, + "train_loss": 3.2227031265258788, + "train_acc": 0.21062, + "test_loss": 9.626097766113281, + "test_acc": 0.02, + "lyapunov": null, + "grad_norm": 0.4871680253381029, + "grad_max_sv": 0.15086784306913614, + "grad_min_sv": 9.198363076778903e-09, + "grad_condition": 18446455.013218474, + "lr": 0.00027768241040753615, + "time_sec": 67.01664638519287 + }, + { + "epoch": 98, + "train_loss": 3.1770834211730956, + "train_acc": 0.21918, + "test_loss": 9.366678713989257, + "test_acc": 0.0189, + "lyapunov": null, + "grad_norm": 0.48983757815120343, + "grad_max_sv": 0.14779492281377316, + "grad_min_sv": 9.026428729463909e-09, + "grad_condition": 18794227.40584495, + "lr": 0.00026835198244006903, + "time_sec": 66.9809033870697 + }, + { + "epoch": 99, + "train_loss": 3.154748341598511, + "train_acc": 0.22074, + "test_loss": 8.755814114379882, + "test_acc": 0.0203, + "lyapunov": null, + "grad_norm": 0.49142802947586006, + "grad_max_sv": 0.14894249550998212, + "grad_min_sv": 9.186921921030405e-09, + "grad_condition": 243665710.2249507, + "lr": 0.0002591231629491421, + "time_sec": 66.99194574356079 + }, + { + "epoch": 100, + "train_loss": 3.120311908035278, + "train_acc": 0.229, + "test_loss": 9.377279025268555, + "test_acc": 0.019, + "lyapunov": null, + "grad_norm": 0.49378455655907144, + "grad_max_sv": 0.1519782803952694, + "grad_min_sv": 9.117503733946376e-09, + "grad_condition": 21901137.13681825, + "lr": 0.0002499999999999997, + "time_sec": 66.99540328979492 + }, + { + "epoch": 101, + "train_loss": 3.102491766357422, + "train_acc": 0.23234, + "test_loss": 9.32430498046875, + "test_acc": 0.0219, + "lyapunov": null, + "grad_norm": 0.49627664046313075, + "grad_max_sv": 0.15419429913163185, + "grad_min_sv": 9.201821271620503e-09, + "grad_condition": 21776686.85204944, + "lr": 0.00024098649531343477, + "time_sec": 66.98357772827148 + }, + { + "epoch": 102, + "train_loss": 3.085017224731445, + "train_acc": 0.23322, + "test_loss": 9.753949787902831, + "test_acc": 0.0193, + "lyapunov": null, + "grad_norm": 0.49406280305370465, + "grad_max_sv": 0.15118828602135181, + "grad_min_sv": 9.171319623191288e-09, + "grad_condition": 24151283.383643005, + "lr": 0.0002320866025105016, + "time_sec": 66.97265934944153 + }, + { + "epoch": 103, + "train_loss": 3.066944828414917, + "train_acc": 0.23798, + "test_loss": 9.439580722045898, + "test_acc": 0.0198, + "lyapunov": null, + "grad_norm": 0.49800148183033643, + "grad_max_sv": 0.15005342811346054, + "grad_min_sv": 9.260063320998268e-09, + "grad_condition": 32769732.654720783, + "lr": 0.0002233042253783278, + "time_sec": 67.00615048408508 + }, + { + "epoch": 104, + "train_loss": 3.0457233097839356, + "train_acc": 0.24206, + "test_loss": 9.283833685302735, + "test_acc": 0.022, + "lyapunov": null, + "grad_norm": 0.5005816660320969, + "grad_max_sv": 0.15397185049951076, + "grad_min_sv": 9.2347574705276e-09, + "grad_condition": 39740043.841383025, + "lr": 0.000214643216157784, + "time_sec": 66.98598265647888 + }, + { + "epoch": 105, + "train_loss": 3.0319893937683107, + "train_acc": 0.24054, + "test_loss": 9.208142726135254, + "test_acc": 0.0215, + "lyapunov": null, + "grad_norm": 0.4998792272266736, + "grad_max_sv": 0.15734503231942654, + "grad_min_sv": 9.254817884274402e-09, + "grad_condition": 23445108.874561593, + "lr": 0.00020610737385376332, + "time_sec": 66.97633767127991 + }, + { + "epoch": 106, + "train_loss": 3.0231310614013673, + "train_acc": 0.2459, + "test_loss": 9.397696965026855, + "test_acc": 0.0216, + "lyapunov": null, + "grad_norm": 0.5036514636560196, + "grad_max_sv": 0.15039666295051574, + "grad_min_sv": 9.292655003714615e-09, + "grad_condition": 456660482.4660243, + "lr": 0.00019770044256881242, + "time_sec": 66.97969722747803 + }, + { + "epoch": 107, + "train_loss": 3.015210195846558, + "train_acc": 0.24924, + "test_loss": 9.136646028137207, + "test_acc": 0.0253, + "lyapunov": null, + "grad_norm": 0.5044102710994137, + "grad_max_sv": 0.15338496044278144, + "grad_min_sv": 9.416407534962313e-09, + "grad_condition": 29814119.267252993, + "lr": 0.0001894261098608447, + "time_sec": 66.9929895401001 + }, + { + "epoch": 108, + "train_loss": 2.992950742034912, + "train_acc": 0.25076, + "test_loss": 9.683133767700195, + "test_acc": 0.0206, + "lyapunov": null, + "grad_norm": 0.5024766427018658, + "grad_max_sv": 0.15207941457629204, + "grad_min_sv": 9.368817296961928e-09, + "grad_condition": 25707665.821010012, + "lr": 0.000181288005125655, + "time_sec": 67.04599475860596 + }, + { + "epoch": 109, + "train_loss": 2.9911826483917237, + "train_acc": 0.25182, + "test_loss": 9.541546542358398, + "test_acc": 0.0216, + "lyapunov": null, + "grad_norm": 0.5050428635829171, + "grad_max_sv": 0.1559975240379572, + "grad_min_sv": 9.425568786580741e-09, + "grad_condition": 29011942.837490637, + "lr": 0.0001732896980049473, + "time_sec": 66.9745888710022 + }, + { + "epoch": 110, + "train_loss": 2.9719406244659425, + "train_acc": 0.25626, + "test_loss": 9.304527082824707, + "test_acc": 0.0239, + "lyapunov": null, + "grad_norm": 0.50709757758927, + "grad_max_sv": 0.15366660207509994, + "grad_min_sv": 9.407841375375093e-09, + "grad_condition": 20259210.324132033, + "lr": 0.00016543469682057076, + "time_sec": 67.00725531578064 + }, + { + "epoch": 111, + "train_loss": 2.9610974934387206, + "train_acc": 0.25892, + "test_loss": 9.905137655639649, + "test_acc": 0.0233, + "lyapunov": null, + "grad_norm": 0.5069510646769094, + "grad_max_sv": 0.16044184900820255, + "grad_min_sv": 9.517911378487121e-09, + "grad_condition": 20572867.320830267, + "lr": 0.00015772644703565552, + "time_sec": 66.96853518486023 + }, + { + "epoch": 112, + "train_loss": 2.956413153839111, + "train_acc": 0.25946, + "test_loss": 10.164678506469727, + "test_acc": 0.0226, + "lyapunov": null, + "grad_norm": 0.5077720159938983, + "grad_max_sv": 0.15506692193448543, + "grad_min_sv": 9.397505702779529e-09, + "grad_condition": 22578916.073937874, + "lr": 0.00015016832974331713, + "time_sec": 67.01250433921814 + }, + { + "epoch": 113, + "train_loss": 2.9505707207489014, + "train_acc": 0.26056, + "test_loss": 9.862203175354004, + "test_acc": 0.0237, + "lyapunov": null, + "grad_norm": 0.508430292455553, + "grad_max_sv": 0.1596985150128603, + "grad_min_sv": 9.460744607170391e-09, + "grad_condition": 18853883.48562253, + "lr": 0.00014276366018359834, + "time_sec": 66.99557614326477 + }, + { + "epoch": 114, + "train_loss": 2.9415723051452636, + "train_acc": 0.2616, + "test_loss": 9.63483480834961, + "test_acc": 0.0232, + "lyapunov": null, + "grad_norm": 0.5104303932486228, + "grad_max_sv": 0.1552283179014921, + "grad_min_sv": 9.445251571464034e-09, + "grad_condition": 693766580.7640529, + "lr": 0.00013551568628929425, + "time_sec": 66.99906969070435 + }, + { + "epoch": 115, + "train_loss": 2.9388054510498045, + "train_acc": 0.26148, + "test_loss": 9.398469245910645, + "test_acc": 0.0231, + "lyapunov": null, + "grad_norm": 0.5141390434712518, + "grad_max_sv": 0.16008906662464142, + "grad_min_sv": 9.453520891100631e-09, + "grad_condition": 21355980.767428003, + "lr": 0.00012842758726130276, + "time_sec": 66.97847414016724 + }, + { + "epoch": 116, + "train_loss": 2.9283171284484864, + "train_acc": 0.26438, + "test_loss": 9.456967205810546, + "test_acc": 0.0244, + "lyapunov": null, + "grad_norm": 0.5133058115565678, + "grad_max_sv": 0.15975738912820817, + "grad_min_sv": 9.5292529520008e-09, + "grad_condition": 22298576.095964633, + "lr": 0.0001215024721741218, + "time_sec": 66.9903039932251 + }, + { + "epoch": 117, + "train_loss": 2.919693772506714, + "train_acc": 0.26682, + "test_loss": 9.649295095825195, + "test_acc": 0.0229, + "lyapunov": null, + "grad_norm": 0.5098040600332114, + "grad_max_sv": 0.15964976735413075, + "grad_min_sv": 9.535333161947435e-09, + "grad_condition": 18488699.782394268, + "lr": 0.00011474337861210538, + "time_sec": 66.98530316352844 + }, + { + "epoch": 118, + "train_loss": 2.9129154638671877, + "train_acc": 0.26648, + "test_loss": 9.582696447753905, + "test_acc": 0.0252, + "lyapunov": null, + "grad_norm": 0.5137327165981059, + "grad_max_sv": 0.15674266032874584, + "grad_min_sv": 9.422415092608106e-09, + "grad_condition": 21769035.1047443, + "lr": 0.00010815327133708009, + "time_sec": 67.0712718963623 + }, + { + "epoch": 119, + "train_loss": 2.90771673576355, + "train_acc": 0.26738, + "test_loss": 9.686517756652831, + "test_acc": 0.0223, + "lyapunov": null, + "grad_norm": 0.5112636160904589, + "grad_max_sv": 0.15690986551344394, + "grad_min_sv": 9.557581368002666e-09, + "grad_condition": 65271422.15119822, + "lr": 0.00010173504098790182, + "time_sec": 66.99134540557861 + }, + { + "epoch": 120, + "train_loss": 2.903361056442261, + "train_acc": 0.26626, + "test_loss": 9.534084574890137, + "test_acc": 0.025, + "lyapunov": null, + "grad_norm": 0.5139337490910202, + "grad_max_sv": 0.16002687215805053, + "grad_min_sv": 9.488575995753035e-09, + "grad_condition": 26500108.07568959, + "lr": 9.549150281252629e-05, + "time_sec": 66.98560166358948 + }, + { + "epoch": 121, + "train_loss": 2.8838987274169923, + "train_acc": 0.27268, + "test_loss": 9.002799011230469, + "test_acc": 0.0286, + "lyapunov": null, + "grad_norm": 0.5181242234216702, + "grad_max_sv": 0.15681598484516143, + "grad_min_sv": 9.58419937996391e-09, + "grad_condition": 21911011.850442223, + "lr": 8.942539543314794e-05, + "time_sec": 66.99542880058289 + }, + { + "epoch": 122, + "train_loss": 2.8907574623107912, + "train_acc": 0.27284, + "test_loss": 9.40299231262207, + "test_acc": 0.023, + "lyapunov": null, + "grad_norm": 0.5154755058010533, + "grad_max_sv": 0.16150307320058346, + "grad_min_sv": 9.692825331253373e-09, + "grad_condition": 20117302.380122818, + "lr": 8.353937964495024e-05, + "time_sec": 66.98236727714539 + }, + { + "epoch": 123, + "train_loss": 2.8763803490448, + "train_acc": 0.2739, + "test_loss": 9.18796940612793, + "test_acc": 0.0263, + "lyapunov": null, + "grad_norm": 0.514194573203304, + "grad_max_sv": 0.15613614898175002, + "grad_min_sv": 9.584234908488477e-09, + "grad_condition": 18777275.99405461, + "lr": 7.783603724899243e-05, + "time_sec": 66.99689793586731 + }, + { + "epoch": 124, + "train_loss": 2.8843617086029054, + "train_acc": 0.27144, + "test_loss": 9.370162466430664, + "test_acc": 0.0248, + "lyapunov": null, + "grad_norm": 0.5136262444075659, + "grad_max_sv": 0.15881695374846458, + "grad_min_sv": 9.587037638758567e-09, + "grad_condition": 18534833.152038723, + "lr": 7.231786991974666e-05, + "time_sec": 66.98831605911255 + }, + { + "epoch": 125, + "train_loss": 2.8742648021697996, + "train_acc": 0.27246, + "test_loss": 9.4968570602417, + "test_acc": 0.0258, + "lyapunov": null, + "grad_norm": 0.5172296409721588, + "grad_max_sv": 0.15975196473300457, + "grad_min_sv": 9.493101107982404e-09, + "grad_condition": 20120176.988574862, + "lr": 6.698729810778072e-05, + "time_sec": 66.98702692985535 + }, + { + "epoch": 126, + "train_loss": 2.868820255508423, + "train_acc": 0.27476, + "test_loss": 9.60731820678711, + "test_acc": 0.0243, + "lyapunov": null, + "grad_norm": 0.5204414887458292, + "grad_max_sv": 0.16092863790690898, + "grad_min_sv": 9.674041201446215e-09, + "grad_condition": 18855250.862980247, + "lr": 6.184665997806817e-05, + "time_sec": 66.97707200050354 + }, + { + "epoch": 127, + "train_loss": 2.8692937660217286, + "train_acc": 0.27484, + "test_loss": 9.273512542724609, + "test_acc": 0.0252, + "lyapunov": null, + "grad_norm": 0.5162971653606119, + "grad_max_sv": 0.16184906139969826, + "grad_min_sv": 9.668298800447062e-09, + "grad_condition": 21519277.77695776, + "lr": 5.6898210384392595e-05, + "time_sec": 67.0102117061615 + }, + { + "epoch": 128, + "train_loss": 2.8623614330291747, + "train_acc": 0.27702, + "test_loss": 9.566067819213867, + "test_acc": 0.0239, + "lyapunov": null, + "grad_norm": 0.5161277911748794, + "grad_max_sv": 0.1572089247405529, + "grad_min_sv": 9.598460455964574e-09, + "grad_condition": 40264946.42458854, + "lr": 5.214411988029363e-05, + "time_sec": 66.9910991191864 + }, + { + "epoch": 129, + "train_loss": 2.8542457569122313, + "train_acc": 0.27896, + "test_loss": 9.585708435058594, + "test_acc": 0.0242, + "lyapunov": null, + "grad_norm": 0.5185536839510844, + "grad_max_sv": 0.16669968273490668, + "grad_min_sv": 9.84268076209549e-09, + "grad_condition": 20409849.055229448, + "lr": 4.7586473766990294e-05, + "time_sec": 67.02374720573425 + }, + { + "epoch": 130, + "train_loss": 2.8572039877319337, + "train_acc": 0.27668, + "test_loss": 9.687789022827149, + "test_acc": 0.0255, + "lyapunov": null, + "grad_norm": 0.5186381052419109, + "grad_max_sv": 0.15739406496286393, + "grad_min_sv": 9.484110215923769e-09, + "grad_condition": 32956127.450649947, + "lr": 4.32272711786996e-05, + "time_sec": 67.0042040348053 + }, + { + "epoch": 131, + "train_loss": 2.8510476612854005, + "train_acc": 0.27938, + "test_loss": 9.569248272705078, + "test_acc": 0.0242, + "lyapunov": null, + "grad_norm": 0.5207995350849649, + "grad_max_sv": 0.16004110053181647, + "grad_min_sv": 9.74696345579229e-09, + "grad_condition": 19170988.284027696, + "lr": 3.906842420574966e-05, + "time_sec": 67.01241946220398 + }, + { + "epoch": 132, + "train_loss": 2.846966871871948, + "train_acc": 0.28012, + "test_loss": 9.591386764526368, + "test_acc": 0.0255, + "lyapunov": null, + "grad_norm": 0.5190948064684937, + "grad_max_sv": 0.16090917438268662, + "grad_min_sv": 9.59687692925204e-09, + "grad_condition": 19916201.19002537, + "lr": 3.5111757055874305e-05, + "time_sec": 66.99244403839111 + }, + { + "epoch": 133, + "train_loss": 2.849546993560791, + "train_acc": 0.2807, + "test_loss": 9.568466381835938, + "test_acc": 0.0256, + "lyapunov": null, + "grad_norm": 0.5185948998509293, + "grad_max_sv": 0.1592203661799431, + "grad_min_sv": 9.741048792588635e-09, + "grad_condition": 21889901.09234864, + "lr": 3.1359005254054254e-05, + "time_sec": 66.98589158058167 + }, + { + "epoch": 134, + "train_loss": 2.8438784635925294, + "train_acc": 0.28108, + "test_loss": 9.896654699707032, + "test_acc": 0.0239, + "lyapunov": null, + "grad_norm": 0.5160935862439748, + "grad_max_sv": 0.1570783667266369, + "grad_min_sv": 9.671757885201804e-09, + "grad_condition": 260951372.1762239, + "lr": 2.7811814881259484e-05, + "time_sec": 66.98548531532288 + }, + { + "epoch": 135, + "train_loss": 2.834603865356445, + "train_acc": 0.28228, + "test_loss": 9.507378176879882, + "test_acc": 0.0279, + "lyapunov": null, + "grad_norm": 0.5182545697342097, + "grad_max_sv": 0.16007349267601967, + "grad_min_sv": 9.658516472721423e-09, + "grad_condition": 19713617.954316415, + "lr": 2.4471741852423218e-05, + "time_sec": 67.04329872131348 + }, + { + "epoch": 136, + "train_loss": 2.839189874649048, + "train_acc": 0.28064, + "test_loss": 9.359465802001953, + "test_acc": 0.0248, + "lyapunov": null, + "grad_norm": 0.5169244988974169, + "grad_max_sv": 0.16038464941084385, + "grad_min_sv": 9.551935577917225e-09, + "grad_condition": 92654982.50365481, + "lr": 2.1340251233966362e-05, + "time_sec": 67.0141191482544 + }, + { + "epoch": 137, + "train_loss": 2.8397282981109617, + "train_acc": 0.28072, + "test_loss": 9.637136407470702, + "test_acc": 0.0232, + "lyapunov": null, + "grad_norm": 0.5171965418231472, + "grad_max_sv": 0.1600246898829937, + "grad_min_sv": 9.73793786961108e-09, + "grad_condition": 49688363.904323384, + "lr": 1.8418716601170932e-05, + "time_sec": 67.01152467727661 + }, + { + "epoch": 138, + "train_loss": 2.832450699005127, + "train_acc": 0.2818, + "test_loss": 9.6108934967041, + "test_acc": 0.0257, + "lyapunov": null, + "grad_norm": 0.5180887909699459, + "grad_max_sv": 0.15756660997867583, + "grad_min_sv": 9.721027080522582e-09, + "grad_condition": 111964333.48758218, + "lr": 1.570841943568445e-05, + "time_sec": 66.98093700408936 + }, + { + "epoch": 139, + "train_loss": 2.831738001098633, + "train_acc": 0.28372, + "test_loss": 9.70671376953125, + "test_acc": 0.0243, + "lyapunov": null, + "grad_norm": 0.5175564205755943, + "grad_max_sv": 0.15984287559986116, + "grad_min_sv": 9.567414729211298e-09, + "grad_condition": 30908421.83810656, + "lr": 1.3210548563419845e-05, + "time_sec": 66.98836731910706 + }, + { + "epoch": 140, + "train_loss": 2.8314741302490236, + "train_acc": 0.2828, + "test_loss": 9.671274719238282, + "test_acc": 0.0253, + "lyapunov": null, + "grad_norm": 0.5195292394658827, + "grad_max_sv": 0.16055516712367535, + "grad_min_sv": 9.656845009232972e-09, + "grad_condition": 116770748.01439288, + "lr": 1.0926199633097203e-05, + "time_sec": 67.06937670707703 + }, + { + "epoch": 141, + "train_loss": 2.8331345532226564, + "train_acc": 0.28274, + "test_loss": 9.6149158203125, + "test_acc": 0.0254, + "lyapunov": null, + "grad_norm": 0.5200947221378508, + "grad_max_sv": 0.1620084557682276, + "grad_min_sv": 9.736931689749428e-09, + "grad_condition": 45631030.28761599, + "lr": 8.856374635655688e-06, + "time_sec": 67.04308843612671 + }, + { + "epoch": 142, + "train_loss": 2.8309748402404784, + "train_acc": 0.28162, + "test_loss": 9.762360348510741, + "test_acc": 0.0236, + "lyapunov": null, + "grad_norm": 0.5193749464503752, + "grad_max_sv": 0.16398511864244938, + "grad_min_sv": 9.725219179967937e-09, + "grad_condition": 21389461.650285553, + "lr": 7.001981464747503e-06, + "time_sec": 66.99746632575989 + }, + { + "epoch": 143, + "train_loss": 2.8280009740447998, + "train_acc": 0.28424, + "test_loss": 9.46468698425293, + "test_acc": 0.0236, + "lyapunov": null, + "grad_norm": 0.5183118315610563, + "grad_max_sv": 0.15934774614870548, + "grad_min_sv": 9.612720197615943e-09, + "grad_condition": 28184363.311956126, + "lr": 5.3638335185058295e-06, + "time_sec": 67.1207172870636 + }, + { + "epoch": 144, + "train_loss": 2.8344388133239744, + "train_acc": 0.27982, + "test_loss": 9.481146864318848, + "test_acc": 0.0253, + "lyapunov": null, + "grad_norm": 0.5191802199413043, + "grad_max_sv": 0.16139711774885654, + "grad_min_sv": 9.682644661057616e-09, + "grad_condition": 19530671.727896534, + "lr": 3.942649342761114e-06, + "time_sec": 67.00769138336182 + }, + { + "epoch": 145, + "train_loss": 2.8336991081237795, + "train_acc": 0.28372, + "test_loss": 9.66582228088379, + "test_acc": 0.0261, + "lyapunov": null, + "grad_norm": 0.5185987884305854, + "grad_max_sv": 0.16210929341614247, + "grad_min_sv": 9.609004592014969e-09, + "grad_condition": 19136474.88235427, + "lr": 2.7390523158633524e-06, + "time_sec": 67.0150043964386 + }, + { + "epoch": 146, + "train_loss": 2.8299831028747557, + "train_acc": 0.28278, + "test_loss": 9.453235021972656, + "test_acc": 0.0257, + "lyapunov": null, + "grad_norm": 0.5191689479196915, + "grad_max_sv": 0.16032814532518386, + "grad_min_sv": 9.704305628868703e-09, + "grad_condition": 46973186.46224795, + "lr": 1.7535703752478133e-06, + "time_sec": 67.00002098083496 + }, + { + "epoch": 147, + "train_loss": 2.825070192184448, + "train_acc": 0.28334, + "test_loss": 9.736306394958497, + "test_acc": 0.0241, + "lyapunov": null, + "grad_norm": 0.5194004947332557, + "grad_max_sv": 0.15663104616105555, + "grad_min_sv": 9.712660245519977e-09, + "grad_condition": 19953974.129073095, + "lr": 9.866357858642196e-07, + "time_sec": 67.0251133441925 + }, + { + "epoch": 148, + "train_loss": 2.8285147483825686, + "train_acc": 0.28494, + "test_loss": 9.718778967285155, + "test_acc": 0.0232, + "lyapunov": null, + "grad_norm": 0.519735769986064, + "grad_max_sv": 0.16175503246486186, + "grad_min_sv": 9.61004464027082e-09, + "grad_condition": 41640518.28457622, + "lr": 4.38584950570808e-07, + "time_sec": 66.99386191368103 + }, + { + "epoch": 149, + "train_loss": 2.8338044094085695, + "train_acc": 0.2828, + "test_loss": 9.769097790527344, + "test_acc": 0.025, + "lyapunov": null, + "grad_norm": 0.518369855767956, + "grad_max_sv": 0.16054188311100007, + "grad_min_sv": 9.553421861929757e-09, + "grad_condition": 19432504.243999995, + "lr": 1.096582625772501e-07, + "time_sec": 66.99177241325378 + }, + { + "epoch": 150, + "train_loss": 2.8278376667022704, + "train_acc": 0.28346, + "test_loss": 9.647385183715821, + "test_acc": 0.0242, + "lyapunov": null, + "grad_norm": 0.5190962063342817, + "grad_max_sv": 0.16339128278195858, + "grad_min_sv": 9.625854724415461e-09, + "grad_condition": 26849402.241447162, + "lr": 0.0, + "time_sec": 66.99396753311157 + } + ] + }, + "lyapunov": { + "4": [ + { + "epoch": 1, + "train_loss": 4.0711297009277345, + "train_acc": 0.09922, + "test_loss": 3.9652711036682127, + "test_acc": 0.106, + "lyapunov": 2.009106175978775, + "grad_norm": 5.770356961936896, + "grad_max_sv": 4.216659033298493, + "grad_min_sv": 1.0549574099294467e-07, + "grad_condition": 83568782.62868212, + "lr": 0.0009998903417374227, + "time_sec": 41.888622999191284 + }, + { + "epoch": 2, + "train_loss": 3.7634158575439454, + "train_acc": 0.13558, + "test_loss": 4.481808354949951, + "test_acc": 0.0542, + "lyapunov": 1.6958206730425511, + "grad_norm": 3.6343119962391017, + "grad_max_sv": 2.4889110922813416, + "grad_min_sv": 6.732413328491837e-08, + "grad_condition": 91225677.18337384, + "lr": 0.0009995614150494292, + "time_sec": 41.84356164932251 + }, + { + "epoch": 3, + "train_loss": 3.6647304371643066, + "train_acc": 0.1493, + "test_loss": 4.3052373779296875, + "test_acc": 0.0762, + "lyapunov": 1.6261345663338975, + "grad_norm": 2.8093749766197624, + "grad_max_sv": 1.7556122809648513, + "grad_min_sv": 5.287189366841305e-08, + "grad_condition": 314142006.47060126, + "lr": 0.0009990133642141358, + "time_sec": 41.84758758544922 + }, + { + "epoch": 4, + "train_loss": 3.546524167175293, + "train_acc": 0.16742, + "test_loss": 5.702491674804688, + "test_acc": 0.0294, + "lyapunov": 1.5553575302938671, + "grad_norm": 2.385940862508357, + "grad_max_sv": 1.40236736536026, + "grad_min_sv": 4.480527846517646e-08, + "grad_condition": 43664896.37977407, + "lr": 0.0009982464296247522, + "time_sec": 41.83865737915039 + }, + { + "epoch": 5, + "train_loss": 3.4743005490112306, + "train_acc": 0.18312, + "test_loss": 8.196367356872559, + "test_acc": 0.019, + "lyapunov": 1.5279129725283065, + "grad_norm": 2.072916387891114, + "grad_max_sv": 1.1730020090937614, + "grad_min_sv": 3.8785105194172334e-08, + "grad_condition": 32346211.56806183, + "lr": 0.0009972609476841367, + "time_sec": 41.85976266860962 + }, + { + "epoch": 6, + "train_loss": 3.4256133052062987, + "train_acc": 0.19342, + "test_loss": 9.553438766479491, + "test_acc": 0.0187, + "lyapunov": 1.5210750066410854, + "grad_norm": 1.8439895228569763, + "grad_max_sv": 0.9858661040663719, + "grad_min_sv": 3.4533098991484934e-08, + "grad_condition": 35319864.79656621, + "lr": 0.000996057350657239, + "time_sec": 41.841728925704956 + }, + { + "epoch": 7, + "train_loss": 3.4064867937469483, + "train_acc": 0.2019, + "test_loss": 11.607983041381836, + "test_acc": 0.0152, + "lyapunov": 1.523884119280159, + "grad_norm": 1.687138246958699, + "grad_max_sv": 0.8869923338294029, + "grad_min_sv": 3.151686688296351e-08, + "grad_condition": 33789366.4765297, + "lr": 0.000994636166481494, + "time_sec": 41.84767436981201 + }, + { + "epoch": 8, + "train_loss": 3.434463021774292, + "train_acc": 0.19834, + "test_loss": 11.012699322509766, + "test_acc": 0.0218, + "lyapunov": 1.5377070940364048, + "grad_norm": 1.5753285999803672, + "grad_max_sv": 0.8568978801369667, + "grad_min_sv": 2.9292211212172958e-08, + "grad_condition": 38247647.23104979, + "lr": 0.0009929980185352525, + "time_sec": 41.83318567276001 + }, + { + "epoch": 9, + "train_loss": 3.4525474771118163, + "train_acc": 0.19694, + "test_loss": 13.244960899353027, + "test_acc": 0.0188, + "lyapunov": 1.5521414874459776, + "grad_norm": 1.4910263576831584, + "grad_max_sv": 0.7901037082076072, + "grad_min_sv": 2.7871724133082115e-08, + "grad_condition": 652853959.565771, + "lr": 0.0009911436253643444, + "time_sec": 41.85349941253662 + }, + { + "epoch": 10, + "train_loss": 3.4827073947906495, + "train_acc": 0.19456, + "test_loss": 13.097009005737304, + "test_acc": 0.0142, + "lyapunov": 1.54852739807285, + "grad_norm": 1.3918276084929038, + "grad_max_sv": 0.7072893396019936, + "grad_min_sv": 2.5679541396095296e-08, + "grad_condition": 39117704.605187416, + "lr": 0.0009890738003669028, + "time_sec": 41.853031635284424 + }, + { + "epoch": 11, + "train_loss": 3.502148910446167, + "train_acc": 0.19276, + "test_loss": 14.30014864807129, + "test_acc": 0.0163, + "lyapunov": 1.5574408672044955, + "grad_norm": 1.3267443475145169, + "grad_max_sv": 0.6856341227889061, + "grad_min_sv": 2.4468690279499938e-08, + "grad_condition": 36359188.54410316, + "lr": 0.00098678945143658, + "time_sec": 41.87047362327576 + }, + { + "epoch": 12, + "train_loss": 3.5455151155090334, + "train_acc": 0.1879, + "test_loss": 12.457445967102052, + "test_acc": 0.0197, + "lyapunov": 1.5671831793187525, + "grad_norm": 1.2480528019241246, + "grad_max_sv": 0.6239843934774398, + "grad_min_sv": 2.3005261242953905e-08, + "grad_condition": 526118663.91773003, + "lr": 0.0009842915805643154, + "time_sec": 41.888609409332275 + }, + { + "epoch": 13, + "train_loss": 3.6091552614593505, + "train_acc": 0.17994, + "test_loss": 12.732378463745118, + "test_acc": 0.0121, + "lyapunov": 1.568660382419596, + "grad_norm": 1.1583490651743926, + "grad_max_sv": 0.581366877257824, + "grad_min_sv": 2.1129029859068282e-08, + "grad_condition": 32416771.726506818, + "lr": 0.000981581283398829, + "time_sec": 41.91386127471924 + }, + { + "epoch": 14, + "train_loss": 3.791756629562378, + "train_acc": 0.15402, + "test_loss": 15.130843069458008, + "test_acc": 0.0119, + "lyapunov": 1.616871199034669, + "grad_norm": 1.087286539710877, + "grad_max_sv": 0.572893675416708, + "grad_min_sv": 1.9829283692818224e-08, + "grad_condition": 32374293.19268779, + "lr": 0.0009786597487660333, + "time_sec": 41.84876489639282 + }, + { + "epoch": 15, + "train_loss": 3.8399617958068846, + "train_acc": 0.14724, + "test_loss": 17.94291413269043, + "test_acc": 0.0166, + "lyapunov": 1.6528625835847977, + "grad_norm": 1.0379429629839805, + "grad_max_sv": 0.5574500106275082, + "grad_min_sv": 1.8863349182662857e-08, + "grad_condition": 39761225.70266014, + "lr": 0.0009755282581475766, + "time_sec": 41.82764172554016 + }, + { + "epoch": 16, + "train_loss": 3.8371740995025636, + "train_acc": 0.15152, + "test_loss": 13.5413774017334, + "test_acc": 0.01, + "lyapunov": 1.648486807218293, + "grad_norm": 0.9596716866271199, + "grad_max_sv": 0.5051649369299411, + "grad_min_sv": 1.7647910632856423e-08, + "grad_condition": 34020323.13172309, + "lr": 0.0009721881851187403, + "time_sec": 41.84924578666687 + }, + { + "epoch": 17, + "train_loss": 3.890597806930542, + "train_acc": 0.14732, + "test_loss": 14.242138269042968, + "test_acc": 0.0132, + "lyapunov": 1.6423247948936794, + "grad_norm": 0.8982590539538886, + "grad_max_sv": 0.46011053323745726, + "grad_min_sv": 1.6221578684992576e-08, + "grad_condition": 227922899.83540225, + "lr": 0.0009686409947459456, + "time_sec": 41.824068784713745 + }, + { + "epoch": 18, + "train_loss": 3.8945003430938723, + "train_acc": 0.14424, + "test_loss": 12.652154109191894, + "test_acc": 0.009, + "lyapunov": 1.6140738649441457, + "grad_norm": 0.8509250568629757, + "grad_max_sv": 0.4146191440522671, + "grad_min_sv": 1.5334739790484608e-08, + "grad_condition": 46249959.20615914, + "lr": 0.0009648882429441254, + "time_sec": 41.92591094970703 + }, + { + "epoch": 19, + "train_loss": 3.911494416732788, + "train_acc": 0.14534, + "test_loss": 10.313947262573242, + "test_acc": 0.01, + "lyapunov": 1.6057381596406708, + "grad_norm": 0.8291056062070911, + "grad_max_sv": 0.39902378544211387, + "grad_min_sv": 1.5037980047316603e-08, + "grad_condition": 51800842.237051465, + "lr": 0.00096093157579425, + "time_sec": 41.85994362831116 + }, + { + "epoch": 20, + "train_loss": 3.9858800520324706, + "train_acc": 0.13508, + "test_loss": 9.495584085083008, + "test_acc": 0.0117, + "lyapunov": 1.5699561761163385, + "grad_norm": 0.8464930976238112, + "grad_max_sv": 0.4136614315211773, + "grad_min_sv": 1.490709049438779e-08, + "grad_condition": 522735678.0721162, + "lr": 0.0009567727288213001, + "time_sec": 41.85805010795593 + }, + { + "epoch": 21, + "train_loss": 4.023155120925903, + "train_acc": 0.12818, + "test_loss": 10.004813737487792, + "test_acc": 0.0135, + "lyapunov": 1.5752095285888827, + "grad_norm": 0.8291979613527221, + "grad_max_sv": 0.38449598476290703, + "grad_min_sv": 1.4266561158826629e-08, + "grad_condition": 100203024.77550165, + "lr": 0.0009524135262330095, + "time_sec": 41.84737300872803 + }, + { + "epoch": 22, + "train_loss": 4.029212285461425, + "train_acc": 0.12438, + "test_loss": 12.173621334838867, + "test_acc": 0.01, + "lyapunov": 1.5598359254315077, + "grad_norm": 0.7501647761926934, + "grad_max_sv": 0.36557952016592027, + "grad_min_sv": 1.3507705134974124e-08, + "grad_condition": 32668036.703706127, + "lr": 0.0009478558801197061, + "time_sec": 41.83857583999634 + }, + { + "epoch": 23, + "train_loss": 4.038732503051758, + "train_acc": 0.12626, + "test_loss": 8.940043533325195, + "test_acc": 0.011, + "lyapunov": 1.5640881744492086, + "grad_norm": 0.7404717741571084, + "grad_max_sv": 0.36797516867518426, + "grad_min_sv": 1.314027773258175e-08, + "grad_condition": 31266761.905169785, + "lr": 0.000943101789615607, + "time_sec": 41.82795524597168 + }, + { + "epoch": 24, + "train_loss": 4.0988731300354, + "train_acc": 0.11452, + "test_loss": 12.849692756652832, + "test_acc": 0.0107, + "lyapunov": 1.550421966311267, + "grad_norm": 0.7098563411237487, + "grad_max_sv": 0.36257990449666977, + "grad_min_sv": 1.25359189376284e-08, + "grad_condition": 40983554.09727303, + "lr": 0.0009381533400219313, + "time_sec": 41.85472393035889 + }, + { + "epoch": 25, + "train_loss": 4.209664036712646, + "train_acc": 0.09956, + "test_loss": 13.292383435058595, + "test_acc": 0.01, + "lyapunov": 1.5532953726970935, + "grad_norm": 0.6761784984779601, + "grad_max_sv": 0.3498499631881714, + "grad_min_sv": 1.1860140708419564e-08, + "grad_condition": 35321140.57939846, + "lr": 0.0009330127018922189, + "time_sec": 41.83675241470337 + }, + { + "epoch": 26, + "train_loss": 4.387504685211182, + "train_acc": 0.06822, + "test_loss": 13.442844244384766, + "test_acc": 0.01, + "lyapunov": 1.5123424859303038, + "grad_norm": 0.613666343544254, + "grad_max_sv": 0.312596595287323, + "grad_min_sv": 9.974056802697362e-09, + "grad_condition": 73223482.84978306, + "lr": 0.000927682130080253, + "time_sec": 41.83025002479553 + }, + { + "epoch": 27, + "train_loss": 4.494176885528565, + "train_acc": 0.0543, + "test_loss": 11.84754227294922, + "test_acc": 0.0094, + "lyapunov": 1.4815948003393304, + "grad_norm": 0.5747479343845562, + "grad_max_sv": 0.3057863064110279, + "grad_min_sv": 8.438247317554826e-09, + "grad_condition": 38945619.0197791, + "lr": 0.0009221639627510072, + "time_sec": 41.84781360626221 + }, + { + "epoch": 28, + "train_loss": 4.46251156829834, + "train_acc": 0.05616, + "test_loss": 11.681759558105469, + "test_acc": 0.01, + "lyapunov": 1.4850436720396856, + "grad_norm": 0.5367103881878276, + "grad_max_sv": 0.27574604004621506, + "grad_min_sv": 7.970707525950527e-09, + "grad_condition": 43556131.981196605, + "lr": 0.0009164606203550494, + "time_sec": 41.85157370567322 + }, + { + "epoch": 29, + "train_loss": 4.478804314422607, + "train_acc": 0.05546, + "test_loss": 13.70535901184082, + "test_acc": 0.01, + "lyapunov": 1.4930339225417817, + "grad_norm": 0.4922959043886969, + "grad_max_sv": 0.26684653796255586, + "grad_min_sv": 7.476301915054772e-09, + "grad_condition": 50660877.44966361, + "lr": 0.0009105746045668516, + "time_sec": 41.84281659126282 + }, + { + "epoch": 30, + "train_loss": 4.461830242156982, + "train_acc": 0.05732, + "test_loss": 16.430956909179688, + "test_acc": 0.01, + "lyapunov": 1.4880318653857922, + "grad_norm": 0.463062312015885, + "grad_max_sv": 0.24580183289945126, + "grad_min_sv": 6.99083638443232e-09, + "grad_condition": 91544069.9810532, + "lr": 0.0009045084971874733, + "time_sec": 41.85340070724487 + }, + { + "epoch": 31, + "train_loss": 4.449828500366211, + "train_acc": 0.06014, + "test_loss": 16.980024148559572, + "test_acc": 0.01, + "lyapunov": 1.515285712068953, + "grad_norm": 0.46991707412670536, + "grad_max_sv": 0.24059981070458888, + "grad_min_sv": 7.035010417960619e-09, + "grad_condition": 75974624.60279362, + "lr": 0.0008982649590120977, + "time_sec": 41.8510844707489 + }, + { + "epoch": 32, + "train_loss": 4.437514468383789, + "train_acc": 0.06294, + "test_loss": 18.52886298980713, + "test_acc": 0.01, + "lyapunov": 1.5204427940461336, + "grad_norm": 0.45125734819245583, + "grad_max_sv": 0.22053336799144746, + "grad_min_sv": 6.6175200534590585e-09, + "grad_condition": 48917947.725726604, + "lr": 0.0008918467286629196, + "time_sec": 41.869179248809814 + }, + { + "epoch": 33, + "train_loss": 4.40278786529541, + "train_acc": 0.06556, + "test_loss": 18.846385064697266, + "test_acc": 0.01, + "lyapunov": 1.4883441946390645, + "grad_norm": 0.45666973025646995, + "grad_max_sv": 0.21949558071792125, + "grad_min_sv": 6.802780549985954e-09, + "grad_condition": 36143230.241273426, + "lr": 0.0008852566213878943, + "time_sec": 41.84911870956421 + }, + { + "epoch": 34, + "train_loss": 4.40820367401123, + "train_acc": 0.06462, + "test_loss": 20.250594232177736, + "test_acc": 0.01, + "lyapunov": 1.4780629108019192, + "grad_norm": 0.4533983560833586, + "grad_max_sv": 0.21924315206706524, + "grad_min_sv": 6.449878905967488e-09, + "grad_condition": 45022497.55124281, + "lr": 0.000878497527825878, + "time_sec": 41.82957434654236 + }, + { + "epoch": 35, + "train_loss": 4.416326632080078, + "train_acc": 0.06346, + "test_loss": 18.319365844726562, + "test_acc": 0.01, + "lyapunov": 1.4840021791970333, + "grad_norm": 0.44153691028523245, + "grad_max_sv": 0.20659824572503566, + "grad_min_sv": 6.229376612806869e-09, + "grad_condition": 59088146.05455335, + "lr": 0.000871572412738697, + "time_sec": 41.850478410720825 + }, + { + "epoch": 36, + "train_loss": 4.408258157043457, + "train_acc": 0.064, + "test_loss": 20.95832971191406, + "test_acc": 0.01, + "lyapunov": 1.479226511152809, + "grad_norm": 0.4410718020248668, + "grad_max_sv": 0.2093581147491932, + "grad_min_sv": 6.282209370940539e-09, + "grad_condition": 105188788.23632967, + "lr": 0.0008644843137107055, + "time_sec": 41.878541469573975 + }, + { + "epoch": 37, + "train_loss": 4.407336394348144, + "train_acc": 0.06656, + "test_loss": 16.102902310180664, + "test_acc": 0.01, + "lyapunov": 1.4862678380268615, + "grad_norm": 0.44349953997935043, + "grad_max_sv": 0.215363934263587, + "grad_min_sv": 6.384406239789975e-09, + "grad_condition": 37599506.61324627, + "lr": 0.0008572363398164014, + "time_sec": 41.84441637992859 + }, + { + "epoch": 38, + "train_loss": 4.39930072052002, + "train_acc": 0.06716, + "test_loss": 14.936711614990234, + "test_acc": 0.01, + "lyapunov": 1.4831183868296005, + "grad_norm": 0.45835307206344844, + "grad_max_sv": 0.22024714946746826, + "grad_min_sv": 6.405372059842263e-09, + "grad_condition": 66702014.21939925, + "lr": 0.0008498316702566826, + "time_sec": 41.848416805267334 + }, + { + "epoch": 39, + "train_loss": 4.400538181915283, + "train_acc": 0.06598, + "test_loss": 16.468564752197267, + "test_acc": 0.01, + "lyapunov": 1.4876915777430815, + "grad_norm": 0.4485664393328264, + "grad_max_sv": 0.22156519442796707, + "grad_min_sv": 6.4785729367994316e-09, + "grad_condition": 280429030.69459355, + "lr": 0.0008422735529643442, + "time_sec": 41.86299443244934 + }, + { + "epoch": 40, + "train_loss": 4.397091385955811, + "train_acc": 0.06734, + "test_loss": 18.54481873931885, + "test_acc": 0.01, + "lyapunov": 1.4808301129914305, + "grad_norm": 0.4299005955382572, + "grad_max_sv": 0.2034155208617449, + "grad_min_sv": 6.2005965799361015e-09, + "grad_condition": 44401112.87668381, + "lr": 0.0008345653031794289, + "time_sec": 41.8275043964386 + }, + { + "epoch": 41, + "train_loss": 4.386424259796143, + "train_acc": 0.06824, + "test_loss": 21.206073614501953, + "test_acc": 0.01, + "lyapunov": 1.4804525152801553, + "grad_norm": 0.4248718447548538, + "grad_max_sv": 0.20124743394553662, + "grad_min_sv": 6.046653282243408e-09, + "grad_condition": 40043238.334212705, + "lr": 0.0008267103019950526, + "time_sec": 41.85425305366516 + }, + { + "epoch": 42, + "train_loss": 4.386167093048096, + "train_acc": 0.0676, + "test_loss": 19.16770219116211, + "test_acc": 0.01, + "lyapunov": 1.4792915119234558, + "grad_norm": 0.4093890186492107, + "grad_max_sv": 0.1878580778837204, + "grad_min_sv": 5.876780584390673e-09, + "grad_condition": 44144026.50569831, + "lr": 0.0008187119948743447, + "time_sec": 41.865527868270874 + }, + { + "epoch": 43, + "train_loss": 4.397055397033691, + "train_acc": 0.06784, + "test_loss": 18.22021773529053, + "test_acc": 0.01, + "lyapunov": 1.4911047723287207, + "grad_norm": 0.42408941793691435, + "grad_max_sv": 0.1856762148439884, + "grad_min_sv": 5.8528611551061925e-09, + "grad_condition": 150471528.47198898, + "lr": 0.000810573890139155, + "time_sec": 41.851991176605225 + }, + { + "epoch": 44, + "train_loss": 4.418051720123291, + "train_acc": 0.06534, + "test_loss": 18.890657635498048, + "test_acc": 0.01, + "lyapunov": 1.506059860634377, + "grad_norm": 0.41379860519627926, + "grad_max_sv": 0.1912920583039522, + "grad_min_sv": 5.7118770109554354e-09, + "grad_condition": 70799416.84221649, + "lr": 0.0008022995574311873, + "time_sec": 41.855762004852295 + }, + { + "epoch": 45, + "train_loss": 4.555874091186523, + "train_acc": 0.05074, + "test_loss": 16.445907543945314, + "test_acc": 0.01, + "lyapunov": 1.5668693082716765, + "grad_norm": 0.421064301771623, + "grad_max_sv": 0.20280106514692306, + "grad_min_sv": 5.1596785455299e-09, + "grad_condition": 50522308.14501454, + "lr": 0.0007938926261462363, + "time_sec": 41.843982219696045 + }, + { + "epoch": 46, + "train_loss": 4.56307541015625, + "train_acc": 0.04834, + "test_loss": 15.170621519470215, + "test_acc": 0.01, + "lyapunov": 1.5478406470754873, + "grad_norm": 0.4022239019959698, + "grad_max_sv": 0.20177871510386466, + "grad_min_sv": 4.925644440934018e-09, + "grad_condition": 51504299.42247386, + "lr": 0.0007853567838422158, + "time_sec": 41.843809366226196 + }, + { + "epoch": 47, + "train_loss": 4.461052338867187, + "train_acc": 0.06168, + "test_loss": 13.590689770507813, + "test_acc": 0.01, + "lyapunov": 1.539207870698036, + "grad_norm": 0.39483180875809476, + "grad_max_sv": 0.18038341253995896, + "grad_min_sv": 5.225175523509984e-09, + "grad_condition": 48416053.199461475, + "lr": 0.0007766957746216719, + "time_sec": 41.86233711242676 + }, + { + "epoch": 48, + "train_loss": 4.483129704589844, + "train_acc": 0.06082, + "test_loss": 15.866412992858887, + "test_acc": 0.01, + "lyapunov": 1.5564451214602537, + "grad_norm": 0.4001213731670661, + "grad_max_sv": 0.17479643113911153, + "grad_min_sv": 4.983967312466309e-09, + "grad_condition": 45597451.14778058, + "lr": 0.0007679133974894982, + "time_sec": 41.860371828079224 + }, + { + "epoch": 49, + "train_loss": 4.563996811523437, + "train_acc": 0.05704, + "test_loss": 14.467741319274902, + "test_acc": 0.01, + "lyapunov": 1.7151714895692323, + "grad_norm": 0.35765858704843245, + "grad_max_sv": 0.17724147401750087, + "grad_min_sv": 4.611558551666846e-09, + "grad_condition": 3652674833.016098, + "lr": 0.000759013504686565, + "time_sec": 41.88652062416077 + }, + { + "epoch": 50, + "train_loss": 4.699548272705078, + "train_acc": 0.04798, + "test_loss": 14.650819215393067, + "test_acc": 0.01, + "lyapunov": 1.8773073610442375, + "grad_norm": 0.3237139765922586, + "grad_max_sv": 0.18019139617681504, + "grad_min_sv": 4.004119223688374e-09, + "grad_condition": 56553030.085173145, + "lr": 0.0007499999999999998, + "time_sec": 41.8651602268219 + }, + { + "epoch": 51, + "train_loss": 4.856528885040283, + "train_acc": 0.01108, + "test_loss": 13.696816278076172, + "test_acc": 0.01, + "lyapunov": 1.4683626176756057, + "grad_norm": 0.238328597603378, + "grad_max_sv": 0.17753527872264385, + "grad_min_sv": 2.2218590706860787e-10, + "grad_condition": 124996343340.03922, + "lr": 0.0007408768370508575, + "time_sec": 41.89140796661377 + }, + { + "epoch": 52, + "train_loss": 4.859013377990722, + "train_acc": 0.0091, + "test_loss": 13.624913540649414, + "test_acc": 0.01, + "lyapunov": 1.465970806453539, + "grad_norm": 0.16106795495349294, + "grad_max_sv": 0.1110096687451005, + "grad_min_sv": 6.2731757239434485e-15, + "grad_condition": 110304236489.90335, + "lr": 0.0007316480175599307, + "time_sec": 41.900989294052124 + }, + { + "epoch": 53, + "train_loss": 4.851568754730224, + "train_acc": 0.00906, + "test_loss": 15.073454458618164, + "test_acc": 0.01, + "lyapunov": 1.456499196684269, + "grad_norm": 0.1430055471916021, + "grad_max_sv": 0.09564914535731077, + "grad_min_sv": 1.5236447104070445e-15, + "grad_condition": 95502112628.56236, + "lr": 0.0007223175895924635, + "time_sec": 41.87765717506409 + }, + { + "epoch": 54, + "train_loss": 4.851486787261963, + "train_acc": 0.0096, + "test_loss": 15.396797889709473, + "test_acc": 0.01, + "lyapunov": 1.4582891162399136, + "grad_norm": 0.1275918494558622, + "grad_max_sv": 0.07877833610400557, + "grad_min_sv": 1.1071724086990746e-23, + "grad_condition": 78778336103.16934, + "lr": 0.0007128896457825361, + "time_sec": 41.84445524215698 + }, + { + "epoch": 55, + "train_loss": 4.850928226623535, + "train_acc": 0.00872, + "test_loss": 14.606024462890625, + "test_acc": 0.01, + "lyapunov": 1.4591175653135684, + "grad_norm": 0.12323118676067203, + "grad_max_sv": 0.07178116273134946, + "grad_min_sv": 2.5052708059998736e-20, + "grad_condition": 71781161032.94218, + "lr": 0.0007033683215378998, + "time_sec": 41.84666895866394 + }, + { + "epoch": 56, + "train_loss": 4.852352551269531, + "train_acc": 0.0098, + "test_loss": 14.902420947265625, + "test_acc": 0.01, + "lyapunov": 1.4618816878789527, + "grad_norm": 0.114352449118403, + "grad_max_sv": 0.06100161336362362, + "grad_min_sv": 6.896960539960325e-27, + "grad_condition": 61001613363.62309, + "lr": 0.0006937577932260512, + "time_sec": 41.880367279052734 + }, + { + "epoch": 57, + "train_loss": 4.852858272247315, + "train_acc": 0.01102, + "test_loss": 14.057881980895996, + "test_acc": 0.01, + "lyapunov": 1.4654078419556094, + "grad_norm": 0.10881533107486291, + "grad_max_sv": 0.05331473303958774, + "grad_min_sv": 1.4012984643248171e-46, + "grad_condition": 53314733039.58773, + "lr": 0.0006840622763423388, + "time_sec": 41.84727120399475 + }, + { + "epoch": 58, + "train_loss": 4.851343263397217, + "train_acc": 0.01044, + "test_loss": 14.620996353149414, + "test_acc": 0.01, + "lyapunov": 1.4605532884597778, + "grad_norm": 0.11574598071345925, + "grad_max_sv": 0.06319006895646453, + "grad_min_sv": 2.802712535772941e-41, + "grad_condition": 63190068956.46452, + "lr": 0.0006742860236609073, + "time_sec": 41.8674533367157 + }, + { + "epoch": 59, + "train_loss": 4.852657847747802, + "train_acc": 0.0102, + "test_loss": 14.391234281921387, + "test_acc": 0.01, + "lyapunov": 1.4630218619275885, + "grad_norm": 0.1117850897535104, + "grad_max_sv": 0.057737766206264494, + "grad_min_sv": 8.962900509942182e-33, + "grad_condition": 57737766206.2645, + "lr": 0.0006644333233692913, + "time_sec": 41.853941679000854 + }, + { + "epoch": 60, + "train_loss": 4.851071483917236, + "train_acc": 0.00948, + "test_loss": 14.590808624267579, + "test_acc": 0.01, + "lyapunov": 1.4618642052726063, + "grad_norm": 0.10400000692897449, + "grad_max_sv": 0.04577720589004457, + "grad_min_sv": 0.0, + "grad_condition": 45777205890.04457, + "lr": 0.0006545084971874734, + "time_sec": 41.848552227020264 + }, + { + "epoch": 61, + "train_loss": 4.852240568084717, + "train_acc": 0.0095, + "test_loss": 14.59047717590332, + "test_acc": 0.01, + "lyapunov": 1.4638908500866512, + "grad_norm": 0.10799934715249591, + "grad_max_sv": 0.05035868901759386, + "grad_min_sv": 0.0, + "grad_condition": 50358689017.59386, + "lr": 0.0006445158984722354, + "time_sec": 41.850308418273926 + }, + { + "epoch": 62, + "train_loss": 4.852433279266357, + "train_acc": 0.01012, + "test_loss": 15.986171211242675, + "test_acc": 0.01, + "lyapunov": 1.4649500645639952, + "grad_norm": 0.10733331744324738, + "grad_max_sv": 0.05229583606123924, + "grad_min_sv": 0.0, + "grad_condition": 52295836061.23924, + "lr": 0.0006344599103076324, + "time_sec": 41.855886936187744 + }, + { + "epoch": 63, + "train_loss": 4.85242006362915, + "train_acc": 0.00952, + "test_loss": 13.999450773620605, + "test_acc": 0.01, + "lyapunov": 1.4631946355180667, + "grad_norm": 0.10887508886634635, + "grad_max_sv": 0.05549173932522535, + "grad_min_sv": 0.0, + "grad_condition": 55491739325.22536, + "lr": 0.0006243449435824269, + "time_sec": 41.875603675842285 + }, + { + "epoch": 64, + "train_loss": 4.852031197509765, + "train_acc": 0.00988, + "test_loss": 13.823671005249023, + "test_acc": 0.01, + "lyapunov": 1.46498492947015, + "grad_norm": 0.10631816229605466, + "grad_max_sv": 0.050992762017995116, + "grad_min_sv": 0.0, + "grad_condition": 50992762017.99512, + "lr": 0.0006141754350553275, + "time_sec": 41.84609389305115 + }, + { + "epoch": 65, + "train_loss": 4.851191096801758, + "train_acc": 0.01018, + "test_loss": 13.375173307800292, + "test_acc": 0.01, + "lyapunov": 1.4641655095093085, + "grad_norm": 0.1010577343573765, + "grad_max_sv": 0.042480578925460574, + "grad_min_sv": 0.0, + "grad_condition": 42480578925.46058, + "lr": 0.0006039558454088793, + "time_sec": 41.83738660812378 + }, + { + "epoch": 66, + "train_loss": 4.852197050323486, + "train_acc": 0.00882, + "test_loss": 14.165961294555665, + "test_acc": 0.01, + "lyapunov": 1.4664015864472255, + "grad_norm": 0.09792907198844746, + "grad_max_sv": 0.036209277296438816, + "grad_min_sv": 0.0, + "grad_condition": 36209277296.43882, + "lr": 0.000593690657292862, + "time_sec": 41.797043323516846 + }, + { + "epoch": 67, + "train_loss": 4.85130561340332, + "train_acc": 0.0101, + "test_loss": 14.011718264770508, + "test_acc": 0.01, + "lyapunov": 1.4650892686965826, + "grad_norm": 0.09456101481889781, + "grad_max_sv": 0.02113236514851451, + "grad_min_sv": 0.0, + "grad_condition": 21132365148.514507, + "lr": 0.0005833843733580507, + "time_sec": 41.754011154174805 + }, + { + "epoch": 68, + "train_loss": 4.852421583099365, + "train_acc": 0.00954, + "test_loss": 13.768776727294922, + "test_acc": 0.01, + "lyapunov": 1.4679525093654233, + "grad_norm": 0.09464764660731555, + "grad_max_sv": 0.025787328323349356, + "grad_min_sv": 0.0, + "grad_condition": 25787328323.349358, + "lr": 0.0005730415142812054, + "time_sec": 42.026938676834106 + }, + { + "epoch": 69, + "train_loss": 4.85272935760498, + "train_acc": 0.00984, + "test_loss": 13.534171914672852, + "test_acc": 0.01, + "lyapunov": 1.4685536226653078, + "grad_norm": 0.09557086506346626, + "grad_max_sv": 0.026282459730282426, + "grad_min_sv": 0.0, + "grad_condition": 26282459730.282425, + "lr": 0.0005626666167821517, + "time_sec": 41.802675008773804 + }, + { + "epoch": 70, + "train_loss": 4.851980906524658, + "train_acc": 0.01004, + "test_loss": 13.33881396484375, + "test_acc": 0.01, + "lyapunov": 1.4669674391026997, + "grad_norm": 0.09715157690608033, + "grad_max_sv": 0.03565134848468006, + "grad_min_sv": 0.0, + "grad_condition": 35651348484.68006, + "lr": 0.0005522642316338265, + "time_sec": 41.813010931015015 + }, + { + "epoch": 71, + "train_loss": 4.85278720413208, + "train_acc": 0.01006, + "test_loss": 12.802179231262206, + "test_acc": 0.01, + "lyapunov": 1.468117561791559, + "grad_norm": 0.09992948652871142, + "grad_max_sv": 0.03685425859875977, + "grad_min_sv": 0.0, + "grad_condition": 36854258598.759766, + "lr": 0.0005418389216661573, + "time_sec": 41.84488320350647 + }, + { + "epoch": 72, + "train_loss": 4.851398905639648, + "train_acc": 0.00926, + "test_loss": 13.120699348449707, + "test_acc": 0.01, + "lyapunov": 1.4663349237588361, + "grad_norm": 0.0922810139338614, + "grad_max_sv": 0.021838864544406533, + "grad_min_sv": 0.0, + "grad_condition": 21838864544.406532, + "lr": 0.0005313952597646563, + "time_sec": 41.80693006515503 + }, + { + "epoch": 73, + "train_loss": 4.852625637207031, + "train_acc": 0.01006, + "test_loss": 14.170262338256835, + "test_acc": 0.01, + "lyapunov": 1.4684231619700752, + "grad_norm": 0.09725476129415889, + "grad_max_sv": 0.03474617879837751, + "grad_min_sv": 0.0, + "grad_condition": 34746178798.37752, + "lr": 0.0005209378268645994, + "time_sec": 41.80283856391907 + }, + { + "epoch": 74, + "train_loss": 4.854615002288818, + "train_acc": 0.01012, + "test_loss": 13.06523247833252, + "test_acc": 0.01, + "lyapunov": 1.4741113576132927, + "grad_norm": 0.09355435634576315, + "grad_max_sv": 0.026293953135609626, + "grad_min_sv": 0.0, + "grad_condition": 26293953135.609627, + "lr": 0.0005104712099416781, + "time_sec": 41.77813935279846 + }, + { + "epoch": 75, + "train_loss": 4.8521118782043455, + "train_acc": 0.01014, + "test_loss": 13.227028475952148, + "test_acc": 0.01, + "lyapunov": 1.4683185632881302, + "grad_norm": 0.09873531057612077, + "grad_max_sv": 0.029217457259073855, + "grad_min_sv": 0.0, + "grad_condition": 29217457259.073853, + "lr": 0.0004999999999999996, + "time_sec": 41.80186319351196 + }, + { + "epoch": 76, + "train_loss": 4.8521026638793945, + "train_acc": 0.00974, + "test_loss": 13.727623275756835, + "test_acc": 0.01, + "lyapunov": 1.4683916117529126, + "grad_norm": 0.09359089364340291, + "grad_max_sv": 0.019284735713154078, + "grad_min_sv": 0.0, + "grad_condition": 19284735713.154076, + "lr": 0.0004895287900583212, + "time_sec": 41.79860997200012 + }, + { + "epoch": 77, + "train_loss": 4.85240275100708, + "train_acc": 0.00924, + "test_loss": 13.845351657104493, + "test_acc": 0.01, + "lyapunov": 1.469331070285319, + "grad_norm": 0.09291177556896672, + "grad_max_sv": 0.02184786768630147, + "grad_min_sv": 0.0, + "grad_condition": 21847867686.30147, + "lr": 0.0004790621731353997, + "time_sec": 41.78152871131897 + }, + { + "epoch": 78, + "train_loss": 4.853202556762695, + "train_acc": 0.0094, + "test_loss": 12.943718765258788, + "test_acc": 0.01, + "lyapunov": 1.4710808498475252, + "grad_norm": 0.09560356806636944, + "grad_max_sv": 0.024571862118318678, + "grad_min_sv": 0.0, + "grad_condition": 24571862118.318676, + "lr": 0.000468604740235343, + "time_sec": 41.800830364227295 + }, + { + "epoch": 79, + "train_loss": 4.852821475524903, + "train_acc": 0.00916, + "test_loss": 13.06967273864746, + "test_acc": 0.01, + "lyapunov": 1.4714962222691996, + "grad_norm": 0.09286348407291162, + "grad_max_sv": 0.01579846618697047, + "grad_min_sv": 0.0, + "grad_condition": 15798466186.97047, + "lr": 0.00045816107833384175, + "time_sec": 41.79053092002869 + }, + { + "epoch": 80, + "train_loss": 4.852609764556885, + "train_acc": 0.00954, + "test_loss": 13.320957052612306, + "test_acc": 0.01, + "lyapunov": 1.4709682016421461, + "grad_norm": 0.09107911624268931, + "grad_max_sv": 0.013279847288504242, + "grad_min_sv": 0.0, + "grad_condition": 13279847288.504242, + "lr": 0.0004477357683661729, + "time_sec": 41.762046813964844 + }, + { + "epoch": 81, + "train_loss": 4.851465040130615, + "train_acc": 0.00952, + "test_loss": 13.012565188598632, + "test_acc": 0.01, + "lyapunov": 1.468221844004853, + "grad_norm": 0.09041003134861456, + "grad_max_sv": 0.007651371089741588, + "grad_min_sv": 0.0, + "grad_condition": 7651371089.741588, + "lr": 0.00043733338321784746, + "time_sec": 41.751330614089966 + }, + { + "epoch": 82, + "train_loss": 4.852081020355224, + "train_acc": 0.00966, + "test_loss": 12.822627255249023, + "test_acc": 0.01, + "lyapunov": 1.4696848944324972, + "grad_norm": 0.09065480177880879, + "grad_max_sv": 0.01019995305687189, + "grad_min_sv": 0.0, + "grad_condition": 10199953056.871891, + "lr": 0.0004269584857187939, + "time_sec": 41.86999726295471 + }, + { + "epoch": 83, + "train_loss": 4.852022810516358, + "train_acc": 0.00996, + "test_loss": 12.253762084960938, + "test_acc": 0.01, + "lyapunov": 1.4689973016529132, + "grad_norm": 0.09460842094540753, + "grad_max_sv": 0.029235992394387723, + "grad_min_sv": 0.0, + "grad_condition": 29235992394.38772, + "lr": 0.0004166156266419484, + "time_sec": 41.76723504066467 + }, + { + "epoch": 84, + "train_loss": 4.852035647277832, + "train_acc": 0.01024, + "test_loss": 12.115891886901855, + "test_acc": 0.01, + "lyapunov": 1.4691770165167806, + "grad_norm": 0.09360646750239629, + "grad_max_sv": 0.019934501592069866, + "grad_min_sv": 0.0, + "grad_condition": 19934501592.069862, + "lr": 0.0004063093427071373, + "time_sec": 41.82295870780945 + }, + { + "epoch": 85, + "train_loss": 4.852076805419922, + "train_acc": 0.00986, + "test_loss": 12.878702352905274, + "test_acc": 0.01, + "lyapunov": 1.4699803453577145, + "grad_norm": 0.09050948837033777, + "grad_max_sv": 0.010260828444734216, + "grad_min_sv": 0.0, + "grad_condition": 10260828444.734217, + "lr": 0.0003960441545911199, + "time_sec": 41.740272521972656 + }, + { + "epoch": 86, + "train_loss": 4.853503344268799, + "train_acc": 0.00942, + "test_loss": 13.130225515747071, + "test_acc": 0.01, + "lyapunov": 1.473677592204355, + "grad_norm": 0.08911124738850405, + "grad_max_sv": 0.0034935059491544964, + "grad_min_sv": 0.0, + "grad_condition": 3493505949.154496, + "lr": 0.0003858245649446718, + "time_sec": 41.71459937095642 + }, + { + "epoch": 87, + "train_loss": 4.852846223449707, + "train_acc": 0.0098, + "test_loss": 13.668508865356445, + "test_acc": 0.01, + "lyapunov": 1.4720799718671442, + "grad_norm": 0.09028155404620607, + "grad_max_sv": 0.008756613591685891, + "grad_min_sv": 0.0, + "grad_condition": 8756613591.685892, + "lr": 0.00037565505641757235, + "time_sec": 41.74625873565674 + }, + { + "epoch": 88, + "train_loss": 4.852147266693115, + "train_acc": 0.01, + "test_loss": 13.016764665222167, + "test_acc": 0.01, + "lyapunov": 1.4709450503444428, + "grad_norm": 0.08907329873744592, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036554008969236695, + "time_sec": 41.72583556175232 + }, + { + "epoch": 89, + "train_loss": 4.854143925933838, + "train_acc": 0.00968, + "test_loss": 13.080362130737305, + "test_acc": 0.01, + "lyapunov": 1.4749400249832427, + "grad_norm": 0.09887236057674029, + "grad_max_sv": 0.017000502441078424, + "grad_min_sv": 0.0, + "grad_condition": 17000502441.078424, + "lr": 0.0003554841015277638, + "time_sec": 41.776273250579834 + }, + { + "epoch": 90, + "train_loss": 4.852338234405518, + "train_acc": 0.00894, + "test_loss": 13.206872094726563, + "test_acc": 0.01, + "lyapunov": 1.470992279784454, + "grad_norm": 0.08990915500150026, + "grad_max_sv": 0.004822738515213132, + "grad_min_sv": 0.0, + "grad_condition": 4822738515.213132, + "lr": 0.000345491502812526, + "time_sec": 41.74059700965881 + }, + { + "epoch": 91, + "train_loss": 4.854439675140381, + "train_acc": 0.0098, + "test_loss": 13.193742947387696, + "test_acc": 0.01, + "lyapunov": 1.4752069266555865, + "grad_norm": 0.09195463137068469, + "grad_max_sv": 0.016309724561870097, + "grad_min_sv": 0.0, + "grad_condition": 16309724561.870098, + "lr": 0.0003355666766307081, + "time_sec": 41.72685122489929 + }, + { + "epoch": 92, + "train_loss": 4.852755132141113, + "train_acc": 0.00966, + "test_loss": 12.651437782287598, + "test_acc": 0.01, + "lyapunov": 1.4722728369485996, + "grad_norm": 0.09031090314491075, + "grad_max_sv": 0.013889235025271774, + "grad_min_sv": 0.0, + "grad_condition": 13889235025.27177, + "lr": 0.00032571397633909225, + "time_sec": 41.76129865646362 + }, + { + "epoch": 93, + "train_loss": 4.852394995727539, + "train_acc": 0.00978, + "test_loss": 13.140398934936524, + "test_acc": 0.01, + "lyapunov": 1.4706439609112947, + "grad_norm": 0.09896021199497843, + "grad_max_sv": 0.012632346572354436, + "grad_min_sv": 0.0, + "grad_condition": 12632346572.354437, + "lr": 0.00031593772365766094, + "time_sec": 41.7473201751709 + }, + { + "epoch": 94, + "train_loss": 4.853237281036377, + "train_acc": 0.00878, + "test_loss": 12.807959544372558, + "test_acc": 0.01, + "lyapunov": 1.4736966973985248, + "grad_norm": 0.09036941229411612, + "grad_max_sv": 0.008218426816165447, + "grad_min_sv": 0.0, + "grad_condition": 8218426816.165448, + "lr": 0.0003062422067739483, + "time_sec": 41.732847452163696 + }, + { + "epoch": 95, + "train_loss": 4.852389494171143, + "train_acc": 0.00908, + "test_loss": 12.560802192687989, + "test_acc": 0.01, + "lyapunov": 1.471325798412723, + "grad_norm": 0.08925054999698791, + "grad_max_sv": 0.00795787493698299, + "grad_min_sv": 0.0, + "grad_condition": 7957874936.982989, + "lr": 0.00029663167846209965, + "time_sec": 41.743444204330444 + }, + { + "epoch": 96, + "train_loss": 4.852095717926026, + "train_acc": 0.00964, + "test_loss": 12.698743003845214, + "test_acc": 0.01, + "lyapunov": 1.4707305251484941, + "grad_norm": 0.08980211873044659, + "grad_max_sv": 0.006079048849642277, + "grad_min_sv": 0.0, + "grad_condition": 6079048849.642277, + "lr": 0.00028711035421746345, + "time_sec": 41.744508266448975 + }, + { + "epoch": 97, + "train_loss": 4.852325097198486, + "train_acc": 0.00998, + "test_loss": 12.385714389038085, + "test_acc": 0.01, + "lyapunov": 1.4707067143886596, + "grad_norm": 0.09303110633276697, + "grad_max_sv": 0.013369420357048512, + "grad_min_sv": 0.0, + "grad_condition": 13369420357.048512, + "lr": 0.00027768241040753615, + "time_sec": 41.777459383010864 + }, + { + "epoch": 98, + "train_loss": 4.852114578399658, + "train_acc": 0.00946, + "test_loss": 12.616465420532226, + "test_acc": 0.01, + "lyapunov": 1.4709890193646522, + "grad_norm": 0.08982717043210414, + "grad_max_sv": 0.011742619890719652, + "grad_min_sv": 0.0, + "grad_condition": 11742619890.719652, + "lr": 0.00026835198244006903, + "time_sec": 41.74090838432312 + }, + { + "epoch": 99, + "train_loss": 4.852081492767334, + "train_acc": 0.00914, + "test_loss": 12.773276670837403, + "test_acc": 0.01, + "lyapunov": 1.4708703545963062, + "grad_norm": 0.08820725715813042, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002591231629491421, + "time_sec": 41.70957374572754 + }, + { + "epoch": 100, + "train_loss": 4.852057821807861, + "train_acc": 0.00854, + "test_loss": 12.903013801574707, + "test_acc": 0.01, + "lyapunov": 1.470713365718227, + "grad_norm": 0.08831333485556404, + "grad_max_sv": 0.001176884165033698, + "grad_min_sv": 0.0, + "grad_condition": 1176884165.033698, + "lr": 0.0002499999999999997, + "time_sec": 41.70664095878601 + }, + { + "epoch": 101, + "train_loss": 4.852297632446289, + "train_acc": 0.0088, + "test_loss": 12.991321166992188, + "test_acc": 0.01, + "lyapunov": 1.471470196838574, + "grad_norm": 0.08844546443228318, + "grad_max_sv": 0.0007792085409164429, + "grad_min_sv": 0.0, + "grad_condition": 779208540.9164429, + "lr": 0.00024098649531343477, + "time_sec": 41.72946095466614 + }, + { + "epoch": 102, + "train_loss": 4.85340077835083, + "train_acc": 0.00928, + "test_loss": 12.494372912597656, + "test_acc": 0.01, + "lyapunov": 1.4734248584493652, + "grad_norm": 0.0904122316991309, + "grad_max_sv": 0.01403848035261035, + "grad_min_sv": 0.0, + "grad_condition": 14038480352.610352, + "lr": 0.0002320866025105016, + "time_sec": 41.72011160850525 + }, + { + "epoch": 103, + "train_loss": 4.8527667138671875, + "train_acc": 0.00854, + "test_loss": 13.111592295837402, + "test_acc": 0.01, + "lyapunov": 1.4726007445084164, + "grad_norm": 0.08932121120200033, + "grad_max_sv": 0.004739455413073301, + "grad_min_sv": 0.0, + "grad_condition": 4739455413.073301, + "lr": 0.0002233042253783278, + "time_sec": 41.74779987335205 + }, + { + "epoch": 104, + "train_loss": 4.852004501037598, + "train_acc": 0.00946, + "test_loss": 12.720405123901367, + "test_acc": 0.01, + "lyapunov": 1.4705228412242801, + "grad_norm": 0.08860158464501969, + "grad_max_sv": 0.006343359779566527, + "grad_min_sv": 0.0, + "grad_condition": 6343359779.566526, + "lr": 0.000214643216157784, + "time_sec": 41.75279927253723 + }, + { + "epoch": 105, + "train_loss": 4.852732130584717, + "train_acc": 0.00936, + "test_loss": 12.728569932556152, + "test_acc": 0.01, + "lyapunov": 1.4726796906317592, + "grad_norm": 0.08858840001436137, + "grad_max_sv": 0.0021229078993201256, + "grad_min_sv": 0.0, + "grad_condition": 2122907899.3201256, + "lr": 0.00020610737385376332, + "time_sec": 41.71723484992981 + }, + { + "epoch": 106, + "train_loss": 4.852207695922852, + "train_acc": 0.00926, + "test_loss": 12.709718621826172, + "test_acc": 0.01, + "lyapunov": 1.4712865084333493, + "grad_norm": 0.08830963721683445, + "grad_max_sv": 0.0027129428926855326, + "grad_min_sv": 0.0, + "grad_condition": 2712942892.6855326, + "lr": 0.00019770044256881242, + "time_sec": 41.71148443222046 + }, + { + "epoch": 107, + "train_loss": 4.85225803314209, + "train_acc": 0.00982, + "test_loss": 12.837951531982421, + "test_acc": 0.01, + "lyapunov": 1.4712638537902052, + "grad_norm": 0.08902472521530928, + "grad_max_sv": 0.008135201036930084, + "grad_min_sv": 0.0, + "grad_condition": 8135201036.930084, + "lr": 0.0001894261098608447, + "time_sec": 41.72528624534607 + }, + { + "epoch": 108, + "train_loss": 4.852549499511719, + "train_acc": 0.00936, + "test_loss": 13.247559573364258, + "test_acc": 0.01, + "lyapunov": 1.4724893740680822, + "grad_norm": 0.08825387718460724, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000181288005125655, + "time_sec": 41.74774885177612 + }, + { + "epoch": 109, + "train_loss": 4.85227595916748, + "train_acc": 0.00946, + "test_loss": 13.13632116241455, + "test_acc": 0.01, + "lyapunov": 1.471560059910845, + "grad_norm": 0.08956498900691849, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001732896980049473, + "time_sec": 41.7323522567749 + }, + { + "epoch": 110, + "train_loss": 4.852233708801269, + "train_acc": 0.00902, + "test_loss": 13.550802612304688, + "test_acc": 0.01, + "lyapunov": 1.4712924996910193, + "grad_norm": 0.08901901086212888, + "grad_max_sv": 0.004322580248117447, + "grad_min_sv": 0.0, + "grad_condition": 4322580248.117447, + "lr": 0.00016543469682057076, + "time_sec": 41.74680209159851 + }, + { + "epoch": 111, + "train_loss": 4.852689293060303, + "train_acc": 0.00916, + "test_loss": 13.372785118103028, + "test_acc": 0.01, + "lyapunov": 1.4729326292681877, + "grad_norm": 0.08862372209724671, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 41.72367000579834 + }, + { + "epoch": 112, + "train_loss": 4.855245245056152, + "train_acc": 0.00918, + "test_loss": 13.167806037902832, + "test_acc": 0.01, + "lyapunov": 1.4768958594792945, + "grad_norm": 0.08841785458131039, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 41.73188829421997 + }, + { + "epoch": 113, + "train_loss": 4.852458833618164, + "train_acc": 0.00882, + "test_loss": 13.374362356567383, + "test_acc": 0.01, + "lyapunov": 1.4722495371728297, + "grad_norm": 0.08871568614447918, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 41.71817493438721 + }, + { + "epoch": 114, + "train_loss": 4.851942072448731, + "train_acc": 0.00902, + "test_loss": 13.413740673828125, + "test_acc": 0.01, + "lyapunov": 1.4704074313878404, + "grad_norm": 0.08870214010553126, + "grad_max_sv": 0.0019620250910520553, + "grad_min_sv": 0.0, + "grad_condition": 1962025091.0520554, + "lr": 0.00013551568628929425, + "time_sec": 41.72637939453125 + }, + { + "epoch": 115, + "train_loss": 4.853842346343994, + "train_acc": 0.00876, + "test_loss": 13.078753887939452, + "test_acc": 0.01, + "lyapunov": 1.4757750683733264, + "grad_norm": 0.08934074054242225, + "grad_max_sv": 0.0054347761906683445, + "grad_min_sv": 0.0, + "grad_condition": 5434776190.6683445, + "lr": 0.00012842758726130276, + "time_sec": 41.711642265319824 + }, + { + "epoch": 116, + "train_loss": 4.852122984466552, + "train_acc": 0.0092, + "test_loss": 13.219519885253906, + "test_acc": 0.01, + "lyapunov": 1.4712010920809968, + "grad_norm": 0.08808712563631747, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 41.74567747116089 + }, + { + "epoch": 117, + "train_loss": 4.8583870220947265, + "train_acc": 0.00938, + "test_loss": 13.296599545288085, + "test_acc": 0.01, + "lyapunov": 1.4836899404940398, + "grad_norm": 0.08878474499083394, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 41.72996282577515 + }, + { + "epoch": 118, + "train_loss": 4.8542758628845215, + "train_acc": 0.0095, + "test_loss": 13.232178741455078, + "test_acc": 0.01, + "lyapunov": 1.476102854284789, + "grad_norm": 0.08869739853760654, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010815327133708009, + "time_sec": 41.73535418510437 + }, + { + "epoch": 119, + "train_loss": 4.852905385437012, + "train_acc": 0.00894, + "test_loss": 13.59550298614502, + "test_acc": 0.01, + "lyapunov": 1.4737293317799678, + "grad_norm": 0.08826212131432655, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010173504098790182, + "time_sec": 41.72545409202576 + }, + { + "epoch": 120, + "train_loss": 4.852262009429932, + "train_acc": 0.0092, + "test_loss": 13.53664966430664, + "test_acc": 0.01, + "lyapunov": 1.471702798248252, + "grad_norm": 0.08816229564695008, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 41.747995376586914 + }, + { + "epoch": 121, + "train_loss": 4.852286165924072, + "train_acc": 0.00938, + "test_loss": 13.543427288818359, + "test_acc": 0.01, + "lyapunov": 1.4718451771284917, + "grad_norm": 0.0882556097544163, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 41.71251606941223 + }, + { + "epoch": 122, + "train_loss": 4.852815079193115, + "train_acc": 0.00866, + "test_loss": 13.50841277770996, + "test_acc": 0.01, + "lyapunov": 1.4734657941876774, + "grad_norm": 0.08834171363916951, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 41.828593492507935 + }, + { + "epoch": 123, + "train_loss": 4.8519872172546386, + "train_acc": 0.0097, + "test_loss": 13.492674378967285, + "test_acc": 0.01, + "lyapunov": 1.470838068696239, + "grad_norm": 0.08874014439548912, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 41.981213331222534 + }, + { + "epoch": 124, + "train_loss": 4.853034484252929, + "train_acc": 0.009, + "test_loss": 13.126736920166016, + "test_acc": 0.01, + "lyapunov": 1.4740290989351394, + "grad_norm": 0.08813885370977613, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 41.71132040023804 + }, + { + "epoch": 125, + "train_loss": 4.85233381652832, + "train_acc": 0.00952, + "test_loss": 13.397762631225586, + "test_acc": 0.01, + "lyapunov": 1.471941991230411, + "grad_norm": 0.08812641091996891, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 41.72543954849243 + }, + { + "epoch": 126, + "train_loss": 4.8525572804260255, + "train_acc": 0.0096, + "test_loss": 13.308763629150391, + "test_acc": 0.01, + "lyapunov": 1.472656028349991, + "grad_norm": 0.08840738704987161, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 41.72384238243103 + }, + { + "epoch": 127, + "train_loss": 4.855584846191406, + "train_acc": 0.00946, + "test_loss": 13.759437710571289, + "test_acc": 0.01, + "lyapunov": 1.4782639266279958, + "grad_norm": 0.08826506573029154, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 41.73837852478027 + }, + { + "epoch": 128, + "train_loss": 4.85253405090332, + "train_acc": 0.00946, + "test_loss": 13.737331958007813, + "test_acc": 0.01, + "lyapunov": 1.4725991725311864, + "grad_norm": 0.08806307055084844, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 41.761263847351074 + }, + { + "epoch": 129, + "train_loss": 4.852324590759277, + "train_acc": 0.01, + "test_loss": 13.721236633300782, + "test_acc": 0.01, + "lyapunov": 1.4719348380632717, + "grad_norm": 0.08813587403770864, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 41.74943208694458 + }, + { + "epoch": 130, + "train_loss": 4.85221561340332, + "train_acc": 0.00954, + "test_loss": 13.78914153137207, + "test_acc": 0.01, + "lyapunov": 1.4716954301385319, + "grad_norm": 0.08851547081560074, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 41.76015615463257 + }, + { + "epoch": 131, + "train_loss": 4.852464799957275, + "train_acc": 0.00878, + "test_loss": 13.605609268188477, + "test_acc": 0.01, + "lyapunov": 1.4723939121226826, + "grad_norm": 0.08823360335901036, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 41.77037334442139 + }, + { + "epoch": 132, + "train_loss": 4.852380610198975, + "train_acc": 0.00896, + "test_loss": 13.703162010192871, + "test_acc": 0.01, + "lyapunov": 1.4721423701557053, + "grad_norm": 0.08806535417914078, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 41.78282904624939 + }, + { + "epoch": 133, + "train_loss": 4.853441643676758, + "train_acc": 0.00924, + "test_loss": 13.780622036743164, + "test_acc": 0.01, + "lyapunov": 1.4737608521185872, + "grad_norm": 0.08786943886020787, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 41.94830918312073 + }, + { + "epoch": 134, + "train_loss": 4.8520362255859375, + "train_acc": 0.00954, + "test_loss": 13.83701887512207, + "test_acc": 0.01, + "lyapunov": 1.471004798284272, + "grad_norm": 0.08837937530648805, + "grad_max_sv": 0.000659800786525011, + "grad_min_sv": 0.0, + "grad_condition": 659800786.5250111, + "lr": 2.7811814881259484e-05, + "time_sec": 41.915955781936646 + }, + { + "epoch": 135, + "train_loss": 4.852150169067383, + "train_acc": 0.00958, + "test_loss": 13.836302838134765, + "test_acc": 0.01, + "lyapunov": 1.471451068473289, + "grad_norm": 0.0887060490050228, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 41.69927930831909 + }, + { + "epoch": 136, + "train_loss": 4.853155226898194, + "train_acc": 0.00916, + "test_loss": 13.758418685913085, + "test_acc": 0.01, + "lyapunov": 1.4742048859901136, + "grad_norm": 0.09745955508136325, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 41.71672034263611 + }, + { + "epoch": 137, + "train_loss": 4.85282894165039, + "train_acc": 0.00928, + "test_loss": 13.801075386047364, + "test_acc": 0.01, + "lyapunov": 1.4736028842608948, + "grad_norm": 0.08838780479254947, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 41.86513018608093 + }, + { + "epoch": 138, + "train_loss": 4.852049649047852, + "train_acc": 0.00982, + "test_loss": 13.844301895141601, + "test_acc": 0.01, + "lyapunov": 1.4711221602871596, + "grad_norm": 0.0886793780466303, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 41.807748317718506 + }, + { + "epoch": 139, + "train_loss": 4.853534520874024, + "train_acc": 0.01, + "test_loss": 13.770389680480957, + "test_acc": 0.01, + "lyapunov": 1.4747250278282653, + "grad_norm": 0.08808641740018294, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 41.780285596847534 + }, + { + "epoch": 140, + "train_loss": 4.851904624481201, + "train_acc": 0.0096, + "test_loss": 13.713402738952636, + "test_acc": 0.01, + "lyapunov": 1.4706565852055464, + "grad_norm": 0.08806158709361275, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 41.71153283119202 + }, + { + "epoch": 141, + "train_loss": 4.852294711456299, + "train_acc": 0.00974, + "test_loss": 13.674919595336915, + "test_acc": 0.01, + "lyapunov": 1.4719334886507, + "grad_norm": 0.08848605705342659, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 41.75360417366028 + }, + { + "epoch": 142, + "train_loss": 4.852051578979492, + "train_acc": 0.00986, + "test_loss": 13.683543762207032, + "test_acc": 0.01, + "lyapunov": 1.4711576669722262, + "grad_norm": 0.08814132937210956, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 41.73791003227234 + }, + { + "epoch": 143, + "train_loss": 4.852365187683105, + "train_acc": 0.00984, + "test_loss": 13.635780154418946, + "test_acc": 0.01, + "lyapunov": 1.4721494221016573, + "grad_norm": 0.08862731675513442, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 41.75744414329529 + }, + { + "epoch": 144, + "train_loss": 4.852421789550781, + "train_acc": 0.00964, + "test_loss": 13.633413438415527, + "test_acc": 0.01, + "lyapunov": 1.4723204545047888, + "grad_norm": 0.08863761801039138, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 41.74138283729553 + }, + { + "epoch": 145, + "train_loss": 4.852283345336914, + "train_acc": 0.00988, + "test_loss": 13.618844378662109, + "test_acc": 0.01, + "lyapunov": 1.471912037990892, + "grad_norm": 0.08829552590637708, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 41.73318958282471 + }, + { + "epoch": 146, + "train_loss": 4.852081503601074, + "train_acc": 0.00942, + "test_loss": 13.636005783081055, + "test_acc": 0.01, + "lyapunov": 1.4712535944741096, + "grad_norm": 0.0881891115278494, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 41.7281494140625 + }, + { + "epoch": 147, + "train_loss": 4.851804008331299, + "train_acc": 0.00964, + "test_loss": 13.61884249420166, + "test_acc": 0.01, + "lyapunov": 1.4703791028703266, + "grad_norm": 0.08816211822553004, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 41.74032163619995 + }, + { + "epoch": 148, + "train_loss": 4.8529896348571775, + "train_acc": 0.0097, + "test_loss": 13.650962756347656, + "test_acc": 0.01, + "lyapunov": 1.4741563284793473, + "grad_norm": 0.08847924183215054, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 41.70267343521118 + }, + { + "epoch": 149, + "train_loss": 4.851896666412354, + "train_acc": 0.01, + "test_loss": 13.636007565307617, + "test_acc": 0.01, + "lyapunov": 1.470671361669555, + "grad_norm": 0.08871972262513622, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 41.72864389419556 + }, + { + "epoch": 150, + "train_loss": 4.852557410736084, + "train_acc": 0.01, + "test_loss": 13.636007955932618, + "test_acc": 0.01, + "lyapunov": 1.4727459463012187, + "grad_norm": 0.08844840269295245, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 41.74263858795166 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 4.735240103759765, + "train_acc": 0.02524, + "test_loss": 4.866816416931153, + "test_acc": 0.0196, + "lyapunov": 2.026013672809162, + "grad_norm": 5.2515251679689285, + "grad_max_sv": 4.178838831186295, + "grad_min_sv": 9.041712029367321e-08, + "grad_condition": 179649161.33195654, + "lr": 0.0009998903417374227, + "time_sec": 87.18950843811035 + }, + { + "epoch": 2, + "train_loss": 4.5068304737854, + "train_acc": 0.03554, + "test_loss": 5.026126983642578, + "test_acc": 0.0173, + "lyapunov": 1.7496998066182636, + "grad_norm": 3.127286126154696, + "grad_max_sv": 2.359567102789879, + "grad_min_sv": 5.685370215550989e-08, + "grad_condition": 519592009.8775345, + "lr": 0.0009995614150494292, + "time_sec": 87.2297294139862 + }, + { + "epoch": 3, + "train_loss": 4.461366838684082, + "train_acc": 0.03612, + "test_loss": 4.588225796508789, + "test_acc": 0.0214, + "lyapunov": 1.5944948662882266, + "grad_norm": 1.7421788335036872, + "grad_max_sv": 1.159491127729416, + "grad_min_sv": 3.012503119736998e-08, + "grad_condition": 46872158.840100154, + "lr": 0.0009990133642141358, + "time_sec": 87.14756369590759 + }, + { + "epoch": 4, + "train_loss": 4.419443615722656, + "train_acc": 0.0416, + "test_loss": 5.286386401367188, + "test_acc": 0.01, + "lyapunov": 1.5645387861734765, + "grad_norm": 1.1211397301440151, + "grad_max_sv": 0.6769661128520965, + "grad_min_sv": 1.748986164784583e-08, + "grad_condition": 61425339.07877908, + "lr": 0.0009982464296247522, + "time_sec": 87.12213373184204 + }, + { + "epoch": 5, + "train_loss": 4.423492089996338, + "train_acc": 0.04338, + "test_loss": 6.2819957962036135, + "test_acc": 0.01, + "lyapunov": 1.5490608950100286, + "grad_norm": 0.8706870069158426, + "grad_max_sv": 0.5114456944167614, + "grad_min_sv": 1.31196238317699e-08, + "grad_condition": 53181583.053102724, + "lr": 0.0009972609476841367, + "time_sec": 87.13790082931519 + }, + { + "epoch": 6, + "train_loss": 4.523505429840088, + "train_acc": 0.03268, + "test_loss": 5.438013370513916, + "test_acc": 0.0125, + "lyapunov": 1.5594564731163747, + "grad_norm": 0.857804226532666, + "grad_max_sv": 0.49648181200027464, + "grad_min_sv": 1.1631784305188297e-08, + "grad_condition": 65912570.425740495, + "lr": 0.000996057350657239, + "time_sec": 87.11513113975525 + }, + { + "epoch": 7, + "train_loss": 4.491675056762696, + "train_acc": 0.03868, + "test_loss": 4.85823662109375, + "test_acc": 0.01, + "lyapunov": 1.5649392903613313, + "grad_norm": 0.922475970431733, + "grad_max_sv": 0.5282619304955005, + "grad_min_sv": 1.3700025544571837e-08, + "grad_condition": 115221136.73324652, + "lr": 0.000994636166481494, + "time_sec": 87.11052560806274 + }, + { + "epoch": 8, + "train_loss": 4.458245279388428, + "train_acc": 0.04286, + "test_loss": 5.0693019569396975, + "test_acc": 0.01, + "lyapunov": 1.564261608416467, + "grad_norm": 0.8247796151577914, + "grad_max_sv": 0.4666087761521339, + "grad_min_sv": 1.2590186138083937e-08, + "grad_condition": 80951881.02073678, + "lr": 0.0009929980185352525, + "time_sec": 87.10055899620056 + }, + { + "epoch": 9, + "train_loss": 4.479283211364746, + "train_acc": 0.04164, + "test_loss": 4.6463909927368165, + "test_acc": 0.01, + "lyapunov": 1.5368007479421317, + "grad_norm": 0.7899216729609227, + "grad_max_sv": 0.41627604588866235, + "grad_min_sv": 1.04147358570561e-08, + "grad_condition": 47679788.12689672, + "lr": 0.0009911436253643444, + "time_sec": 87.12877798080444 + }, + { + "epoch": 10, + "train_loss": 4.452324397583008, + "train_acc": 0.0458, + "test_loss": 4.653008950805664, + "test_acc": 0.01, + "lyapunov": 1.5427158729499564, + "grad_norm": 0.693102659392051, + "grad_max_sv": 0.39028600230813026, + "grad_min_sv": 9.917548506044316e-09, + "grad_condition": 50871255.950711094, + "lr": 0.0009890738003669028, + "time_sec": 87.09939312934875 + }, + { + "epoch": 11, + "train_loss": 4.498550581054688, + "train_acc": 0.04238, + "test_loss": 4.798313717651367, + "test_acc": 0.01, + "lyapunov": 1.562767594061849, + "grad_norm": 0.7157991404315234, + "grad_max_sv": 0.3735340617597103, + "grad_min_sv": 9.18097689817099e-09, + "grad_condition": 76046170.48271176, + "lr": 0.00098678945143658, + "time_sec": 87.10426044464111 + }, + { + "epoch": 12, + "train_loss": 4.4704539869689945, + "train_acc": 0.04582, + "test_loss": 4.7863667205810545, + "test_acc": 0.01, + "lyapunov": 1.5232323402029169, + "grad_norm": 0.6028364454937816, + "grad_max_sv": 0.332496403157711, + "grad_min_sv": 8.755317024156106e-09, + "grad_condition": 43134971.96461357, + "lr": 0.0009842915805643154, + "time_sec": 87.09469079971313 + }, + { + "epoch": 13, + "train_loss": 4.537702497558594, + "train_acc": 0.03896, + "test_loss": 4.654966796875, + "test_acc": 0.01, + "lyapunov": 1.54529083567812, + "grad_norm": 0.6292726486160667, + "grad_max_sv": 0.3057276763021946, + "grad_min_sv": 6.5090396415661e-09, + "grad_condition": 700356710.9321487, + "lr": 0.000981581283398829, + "time_sec": 87.09531950950623 + }, + { + "epoch": 14, + "train_loss": 4.620839001159668, + "train_acc": 0.0303, + "test_loss": 4.868439013671875, + "test_acc": 0.01, + "lyapunov": 1.5458131620036366, + "grad_norm": 0.5338695301373511, + "grad_max_sv": 0.29795307405292987, + "grad_min_sv": 5.120543077052897e-09, + "grad_condition": 339314023.7111832, + "lr": 0.0009786597487660333, + "time_sec": 87.12465906143188 + }, + { + "epoch": 15, + "train_loss": 4.513916426849366, + "train_acc": 0.04438, + "test_loss": 4.835803776550293, + "test_acc": 0.01, + "lyapunov": 1.5507933197119046, + "grad_norm": 0.6007957930506477, + "grad_max_sv": 0.3038324311375618, + "grad_min_sv": 6.934315210233022e-09, + "grad_condition": 198097346.8229193, + "lr": 0.0009755282581475766, + "time_sec": 87.08587527275085 + }, + { + "epoch": 16, + "train_loss": 4.492137908630371, + "train_acc": 0.04818, + "test_loss": 4.887235678100586, + "test_acc": 0.01, + "lyapunov": 1.5494948896910528, + "grad_norm": 0.5976636149826597, + "grad_max_sv": 0.30106121934950353, + "grad_min_sv": 7.290029437057033e-09, + "grad_condition": 63284303.580263734, + "lr": 0.0009721881851187403, + "time_sec": 87.09524250030518 + }, + { + "epoch": 17, + "train_loss": 4.575829989471435, + "train_acc": 0.03854, + "test_loss": 4.948842854309082, + "test_acc": 0.01, + "lyapunov": 1.53777074539448, + "grad_norm": 0.5014123935951768, + "grad_max_sv": 0.29032444581389427, + "grad_min_sv": 5.414256840086118e-09, + "grad_condition": 69838858.70858149, + "lr": 0.0009686409947459456, + "time_sec": 87.14909029006958 + }, + { + "epoch": 18, + "train_loss": 4.597054883728028, + "train_acc": 0.03624, + "test_loss": 4.844102088165283, + "test_acc": 0.01, + "lyapunov": 1.5350244057452893, + "grad_norm": 0.5123739316899657, + "grad_max_sv": 0.26398728154599665, + "grad_min_sv": 5.243455172138089e-09, + "grad_condition": 119920046.5630234, + "lr": 0.0009648882429441254, + "time_sec": 87.09620761871338 + }, + { + "epoch": 19, + "train_loss": 4.620368363647461, + "train_acc": 0.03384, + "test_loss": 4.720510952758789, + "test_acc": 0.01, + "lyapunov": 1.5356951705025286, + "grad_norm": 0.47243607957213, + "grad_max_sv": 0.24507929012179375, + "grad_min_sv": 5.088020715859898e-09, + "grad_condition": 57785330.0936975, + "lr": 0.00096093157579425, + "time_sec": 87.11660838127136 + }, + { + "epoch": 20, + "train_loss": 4.613923555145264, + "train_acc": 0.03756, + "test_loss": 5.093030418395996, + "test_acc": 0.01, + "lyapunov": 1.5330088199556942, + "grad_norm": 0.5270298408202432, + "grad_max_sv": 0.2416334819048643, + "grad_min_sv": 4.882703122420853e-09, + "grad_condition": 311593743.69228464, + "lr": 0.0009567727288213001, + "time_sec": 87.09937357902527 + }, + { + "epoch": 21, + "train_loss": 4.636924856567383, + "train_acc": 0.036, + "test_loss": 5.04784955368042, + "test_acc": 0.01, + "lyapunov": 1.5540363645309683, + "grad_norm": 0.526606906737193, + "grad_max_sv": 0.24690264500677586, + "grad_min_sv": 5.1651495895903985e-09, + "grad_condition": 691559676.1292815, + "lr": 0.0009524135262330095, + "time_sec": 87.11412358283997 + }, + { + "epoch": 22, + "train_loss": 4.679128698577881, + "train_acc": 0.02896, + "test_loss": 4.895172619628906, + "test_acc": 0.01, + "lyapunov": 1.547908184778355, + "grad_norm": 0.44727272149588615, + "grad_max_sv": 0.24925720058381556, + "grad_min_sv": 4.642139438126858e-09, + "grad_condition": 66478210.43898354, + "lr": 0.0009478558801197061, + "time_sec": 87.11094355583191 + }, + { + "epoch": 23, + "train_loss": 4.662371476287841, + "train_acc": 0.03188, + "test_loss": 4.795903799438476, + "test_acc": 0.01, + "lyapunov": 1.5548140889848285, + "grad_norm": 0.5260267923584394, + "grad_max_sv": 0.23556945472955704, + "grad_min_sv": 4.337634041588854e-09, + "grad_condition": 1025805594.4440111, + "lr": 0.000943101789615607, + "time_sec": 87.11297392845154 + }, + { + "epoch": 24, + "train_loss": 4.6645262229919435, + "train_acc": 0.03214, + "test_loss": 5.057237059783936, + "test_acc": 0.01, + "lyapunov": 1.5496064592200471, + "grad_norm": 0.6505246940270789, + "grad_max_sv": 0.2576914459466934, + "grad_min_sv": 4.8245041350813974e-09, + "grad_condition": 94704831.81255548, + "lr": 0.0009381533400219313, + "time_sec": 87.10920405387878 + }, + { + "epoch": 25, + "train_loss": 4.654648971710205, + "train_acc": 0.0322, + "test_loss": 5.318339912414551, + "test_acc": 0.01, + "lyapunov": 1.565699156592874, + "grad_norm": 0.4161938321621143, + "grad_max_sv": 0.2134155698120594, + "grad_min_sv": 3.946434762314155e-09, + "grad_condition": 254671281.05499464, + "lr": 0.0009330127018922189, + "time_sec": 87.13201785087585 + }, + { + "epoch": 26, + "train_loss": 4.791520259552002, + "train_acc": 0.02372, + "test_loss": 4.959452788543701, + "test_acc": 0.01, + "lyapunov": 1.600033207012869, + "grad_norm": 0.9779964796296537, + "grad_max_sv": 0.2255085190758109, + "grad_min_sv": 3.1466205011160244e-09, + "grad_condition": 11039609220.08119, + "lr": 0.000927682130080253, + "time_sec": 87.18698191642761 + }, + { + "epoch": 27, + "train_loss": 4.69488529296875, + "train_acc": 0.03142, + "test_loss": 5.3654563461303715, + "test_acc": 0.01, + "lyapunov": 1.5987402142771066, + "grad_norm": 0.6442328720311332, + "grad_max_sv": 0.23703443501144647, + "grad_min_sv": 3.5609615074683707e-09, + "grad_condition": 1745246073.6363997, + "lr": 0.0009221639627510072, + "time_sec": 87.134925365448 + }, + { + "epoch": 28, + "train_loss": 4.606881724700928, + "train_acc": 0.03926, + "test_loss": 4.73573546295166, + "test_acc": 0.0103, + "lyapunov": 1.5937491731570506, + "grad_norm": 0.4194063933325514, + "grad_max_sv": 0.21865120753645897, + "grad_min_sv": 3.87901320235591e-09, + "grad_condition": 523863784.21676093, + "lr": 0.0009164606203550494, + "time_sec": 87.14774799346924 + }, + { + "epoch": 29, + "train_loss": 4.617493250274658, + "train_acc": 0.03728, + "test_loss": 4.662520077514649, + "test_acc": 0.01, + "lyapunov": 1.596246981559812, + "grad_norm": 0.3789306278435458, + "grad_max_sv": 0.19524494409561158, + "grad_min_sv": 3.4768166591418737e-09, + "grad_condition": 236541357.234686, + "lr": 0.0009105746045668516, + "time_sec": 87.11421346664429 + }, + { + "epoch": 30, + "train_loss": 4.631677906799316, + "train_acc": 0.03778, + "test_loss": 6.121908515167236, + "test_acc": 0.01, + "lyapunov": 1.6226924099885593, + "grad_norm": 0.44716784199095383, + "grad_max_sv": 0.1934027548879385, + "grad_min_sv": 3.3855620726374116e-09, + "grad_condition": 581199629.6704518, + "lr": 0.0009045084971874733, + "time_sec": 87.11589574813843 + }, + { + "epoch": 31, + "train_loss": 4.7931158798217774, + "train_acc": 0.02286, + "test_loss": 4.620251409912109, + "test_acc": 0.0092, + "lyapunov": 1.6308694739475884, + "grad_norm": 0.550187770618441, + "grad_max_sv": 0.18949946835637094, + "grad_min_sv": 1.786556805578803e-09, + "grad_condition": 42877123442.64499, + "lr": 0.0008982649590120977, + "time_sec": 87.1836428642273 + }, + { + "epoch": 32, + "train_loss": 4.760539370574951, + "train_acc": 0.02752, + "test_loss": 4.657791676330566, + "test_acc": 0.01, + "lyapunov": 1.6191697065787547, + "grad_norm": 0.3614365919222485, + "grad_max_sv": 0.17497441843152045, + "grad_min_sv": 1.779506375100445e-09, + "grad_condition": 13836124253.01267, + "lr": 0.0008918467286629196, + "time_sec": 87.18445110321045 + }, + { + "epoch": 33, + "train_loss": 4.739889914245605, + "train_acc": 0.029, + "test_loss": 4.71790985031128, + "test_acc": 0.0111, + "lyapunov": 1.6113197523004867, + "grad_norm": 0.3353632004468733, + "grad_max_sv": 0.1673861812800169, + "grad_min_sv": 7.641599533418533e-10, + "grad_condition": 13965803361.130926, + "lr": 0.0008852566213878943, + "time_sec": 87.21766877174377 + }, + { + "epoch": 34, + "train_loss": 4.753917649078369, + "train_acc": 0.02908, + "test_loss": 6.4435778312683105, + "test_acc": 0.01, + "lyapunov": 1.6236087751510504, + "grad_norm": 0.32686722214079433, + "grad_max_sv": 0.16869123242795467, + "grad_min_sv": 5.19174209905656e-10, + "grad_condition": 25949866712.408104, + "lr": 0.000878497527825878, + "time_sec": 87.14275527000427 + }, + { + "epoch": 35, + "train_loss": 4.802844509124756, + "train_acc": 0.0244, + "test_loss": 6.557575407409668, + "test_acc": 0.01, + "lyapunov": 1.6418090259937375, + "grad_norm": 0.4988110566872576, + "grad_max_sv": 0.1611970603466034, + "grad_min_sv": 7.265029261023372e-10, + "grad_condition": 19350605239.471405, + "lr": 0.000871572412738697, + "time_sec": 87.16936993598938 + }, + { + "epoch": 36, + "train_loss": 4.776907616271973, + "train_acc": 0.02782, + "test_loss": 4.822451950073242, + "test_acc": 0.01, + "lyapunov": 1.649027470737467, + "grad_norm": 0.342256043849884, + "grad_max_sv": 0.15263066124171018, + "grad_min_sv": 1.2339334798351036e-10, + "grad_condition": 9338850661.261333, + "lr": 0.0008644843137107055, + "time_sec": 87.186208486557 + }, + { + "epoch": 37, + "train_loss": 4.772866481628418, + "train_acc": 0.0269, + "test_loss": 6.221601684570312, + "test_acc": 0.01, + "lyapunov": 1.6788606286963539, + "grad_norm": 0.6629649981625318, + "grad_max_sv": 0.17593900030478835, + "grad_min_sv": 2.304191549799707e-09, + "grad_condition": 9259298449.8995, + "lr": 0.0008572363398164014, + "time_sec": 87.18624091148376 + }, + { + "epoch": 38, + "train_loss": 4.77164099029541, + "train_acc": 0.02672, + "test_loss": 4.766420809936523, + "test_acc": 0.01, + "lyapunov": 1.7235305708692508, + "grad_norm": 0.3937581266699412, + "grad_max_sv": 0.17076923064887523, + "grad_min_sv": 4.0183006136103404e-10, + "grad_condition": 16063615551.021002, + "lr": 0.0008498316702566826, + "time_sec": 87.20626258850098 + }, + { + "epoch": 39, + "train_loss": 4.807452021179199, + "train_acc": 0.02832, + "test_loss": 4.899550021362304, + "test_acc": 0.01, + "lyapunov": 1.8249543252808358, + "grad_norm": 0.5715574182036978, + "grad_max_sv": 0.16177968972187956, + "grad_min_sv": 3.793029192220455e-10, + "grad_condition": 8307565763.804538, + "lr": 0.0008422735529643442, + "time_sec": 87.19903802871704 + }, + { + "epoch": 40, + "train_loss": 4.760174724121094, + "train_acc": 0.0279, + "test_loss": 5.857627616119385, + "test_acc": 0.01, + "lyapunov": 1.7056615718490327, + "grad_norm": 0.4256172750988047, + "grad_max_sv": 0.16561466939747332, + "grad_min_sv": 2.058724911119941e-09, + "grad_condition": 512180966.31238127, + "lr": 0.0008345653031794289, + "time_sec": 87.21863722801208 + }, + { + "epoch": 41, + "train_loss": 4.69559801071167, + "train_acc": 0.02966, + "test_loss": 5.604364262390137, + "test_acc": 0.01, + "lyapunov": 1.5935010431367722, + "grad_norm": 0.35011105073884097, + "grad_max_sv": 0.18168312907218934, + "grad_min_sv": 2.4247929442111626e-09, + "grad_condition": 93356754.736842, + "lr": 0.0008267103019950526, + "time_sec": 87.22393608093262 + }, + { + "epoch": 42, + "train_loss": 4.709802615814209, + "train_acc": 0.02616, + "test_loss": 4.870189538574219, + "test_acc": 0.01, + "lyapunov": 1.615870985228692, + "grad_norm": 0.31755349221985774, + "grad_max_sv": 0.17116790413856506, + "grad_min_sv": 2.5351133262074833e-09, + "grad_condition": 220960563.35692176, + "lr": 0.0008187119948743447, + "time_sec": 87.20640540122986 + }, + { + "epoch": 43, + "train_loss": 4.793043034057617, + "train_acc": 0.02262, + "test_loss": 5.881324156951904, + "test_acc": 0.01, + "lyapunov": 1.7521904277069795, + "grad_norm": 0.5590339405433944, + "grad_max_sv": 0.14497370515600777, + "grad_min_sv": 3.9279086975103414e-10, + "grad_condition": 19019670561.939625, + "lr": 0.000810573890139155, + "time_sec": 87.31258749961853 + }, + { + "epoch": 44, + "train_loss": 4.844116692810059, + "train_acc": 0.02276, + "test_loss": 5.395824824523926, + "test_acc": 0.01, + "lyapunov": 1.8710771832624664, + "grad_norm": 0.5293965973008694, + "grad_max_sv": 0.1555709108710289, + "grad_min_sv": 4.2711866910149697e-10, + "grad_condition": 14548258948.991043, + "lr": 0.0008022995574311873, + "time_sec": 87.18556952476501 + }, + { + "epoch": 45, + "train_loss": 4.8768616571044925, + "train_acc": 0.02038, + "test_loss": 4.61512779083252, + "test_acc": 0.01, + "lyapunov": 1.8506627338926505, + "grad_norm": 0.6998099846191761, + "grad_max_sv": 0.13765994729474187, + "grad_min_sv": 5.812380418716187e-11, + "grad_condition": 29846677946.806488, + "lr": 0.0007938926261462363, + "time_sec": 87.2240195274353 + }, + { + "epoch": 46, + "train_loss": 4.969230243377686, + "train_acc": 0.01168, + "test_loss": 7.386215936279297, + "test_acc": 0.01, + "lyapunov": 1.8457061924288034, + "grad_norm": 1.2406105764459343, + "grad_max_sv": 0.11906649246811866, + "grad_min_sv": 3.98718814026065e-11, + "grad_condition": 92245006784.32524, + "lr": 0.0007853567838422158, + "time_sec": 87.17690944671631 + }, + { + "epoch": 47, + "train_loss": 4.875964500274658, + "train_acc": 0.01072, + "test_loss": 6.527316121673584, + "test_acc": 0.01, + "lyapunov": 1.5310816859345302, + "grad_norm": 0.16182231228887384, + "grad_max_sv": 0.08984448052942753, + "grad_min_sv": 1.0441322375968024e-16, + "grad_condition": 89835727617.94872, + "lr": 0.0007766957746216719, + "time_sec": 87.1852126121521 + }, + { + "epoch": 48, + "train_loss": 4.875588766021728, + "train_acc": 0.00916, + "test_loss": 6.651647409820557, + "test_acc": 0.01, + "lyapunov": 1.5314356905724995, + "grad_norm": 0.17879068685955746, + "grad_max_sv": 0.09055437743663788, + "grad_min_sv": 2.807460538981671e-16, + "grad_condition": 90529399768.58862, + "lr": 0.0007679133974894982, + "time_sec": 87.19542217254639 + }, + { + "epoch": 49, + "train_loss": 4.874160293884278, + "train_acc": 0.00928, + "test_loss": 6.9806133621215825, + "test_acc": 0.01, + "lyapunov": 1.5310221773279293, + "grad_norm": 0.15914063982748972, + "grad_max_sv": 0.0841954169794917, + "grad_min_sv": 1.1028138256059021e-16, + "grad_condition": 84186278073.27275, + "lr": 0.000759013504686565, + "time_sec": 87.18294835090637 + }, + { + "epoch": 50, + "train_loss": 4.874967584228516, + "train_acc": 0.0088, + "test_loss": 7.2512130996704105, + "test_acc": 0.01, + "lyapunov": 1.531926109052985, + "grad_norm": 0.13359997166294424, + "grad_max_sv": 0.07885234858840703, + "grad_min_sv": 1.5449564137240798e-17, + "grad_condition": 78851261996.51497, + "lr": 0.0007499999999999998, + "time_sec": 87.1744954586029 + }, + { + "epoch": 51, + "train_loss": 4.873049064331055, + "train_acc": 0.00894, + "test_loss": 7.2680836700439455, + "test_acc": 0.01, + "lyapunov": 1.5300328816904132, + "grad_norm": 0.13566663059488987, + "grad_max_sv": 0.06801612647250295, + "grad_min_sv": 3.3721854663294077e-28, + "grad_condition": 68016126472.50293, + "lr": 0.0007408768370508575, + "time_sec": 87.2090744972229 + }, + { + "epoch": 52, + "train_loss": 4.8752045971679685, + "train_acc": 0.00998, + "test_loss": 7.319013902282715, + "test_acc": 0.01, + "lyapunov": 1.5358237284223746, + "grad_norm": 0.15295505609252377, + "grad_max_sv": 0.07399358823895455, + "grad_min_sv": 4.036005675649565e-34, + "grad_condition": 73993588238.95454, + "lr": 0.0007316480175599307, + "time_sec": 87.17916941642761 + }, + { + "epoch": 53, + "train_loss": 4.875089646759033, + "train_acc": 0.00932, + "test_loss": 6.708341079711914, + "test_acc": 0.01, + "lyapunov": 1.535219712025674, + "grad_norm": 0.15337946692641713, + "grad_max_sv": 0.0786401204764843, + "grad_min_sv": 9.418872962396182e-34, + "grad_condition": 78640120476.4843, + "lr": 0.0007223175895924635, + "time_sec": 87.19920134544373 + }, + { + "epoch": 54, + "train_loss": 4.8763134245300295, + "train_acc": 0.00954, + "test_loss": 7.893965859985352, + "test_acc": 0.01, + "lyapunov": 1.5382219912755826, + "grad_norm": 0.14430315662174414, + "grad_max_sv": 0.0842284008860588, + "grad_min_sv": 1.4016176262153585e-17, + "grad_condition": 84227307606.50656, + "lr": 0.0007128896457825361, + "time_sec": 87.16732549667358 + }, + { + "epoch": 55, + "train_loss": 4.880924655761719, + "train_acc": 0.00986, + "test_loss": 8.769433529663086, + "test_acc": 0.01, + "lyapunov": 1.5441064075435824, + "grad_norm": 0.16740838552751033, + "grad_max_sv": 0.08879097644239664, + "grad_min_sv": 3.0302474954849e-15, + "grad_condition": 88489187160.01863, + "lr": 0.0007033683215378998, + "time_sec": 87.23270034790039 + }, + { + "epoch": 56, + "train_loss": 4.880691115722656, + "train_acc": 0.00984, + "test_loss": 8.956744931030274, + "test_acc": 0.01, + "lyapunov": 1.5440428296623327, + "grad_norm": 0.169681128943872, + "grad_max_sv": 0.08683812469244004, + "grad_min_sv": 2.6780771295629216e-16, + "grad_condition": 86810744990.1141, + "lr": 0.0006937577932260512, + "time_sec": 87.5180823802948 + }, + { + "epoch": 57, + "train_loss": 4.875461320648193, + "train_acc": 0.00882, + "test_loss": 7.914718838500977, + "test_acc": 0.01, + "lyapunov": 1.5361771690266213, + "grad_norm": 0.13744745585086549, + "grad_max_sv": 0.08106257226318121, + "grad_min_sv": 4.602306454836924e-17, + "grad_condition": 81058882088.7789, + "lr": 0.0006840622763423388, + "time_sec": 87.23774647712708 + }, + { + "epoch": 58, + "train_loss": 4.876462248229981, + "train_acc": 0.0086, + "test_loss": 7.521480532836914, + "test_acc": 0.01, + "lyapunov": 1.5380861676867357, + "grad_norm": 0.1308094426729998, + "grad_max_sv": 0.07691145669668913, + "grad_min_sv": 5.2512441923478546e-21, + "grad_condition": 76911456255.58595, + "lr": 0.0006742860236609073, + "time_sec": 87.19443416595459 + }, + { + "epoch": 59, + "train_loss": 4.876125813751221, + "train_acc": 0.00958, + "test_loss": 9.108944590759277, + "test_acc": 0.01, + "lyapunov": 1.5374773286492622, + "grad_norm": 0.13065965995697965, + "grad_max_sv": 0.07693316899240017, + "grad_min_sv": 4.628041294277668e-28, + "grad_condition": 76933168992.40013, + "lr": 0.0006644333233692913, + "time_sec": 87.11430335044861 + }, + { + "epoch": 60, + "train_loss": 4.876531585845948, + "train_acc": 0.01002, + "test_loss": 8.708165438842773, + "test_acc": 0.01, + "lyapunov": 1.540081706193402, + "grad_norm": 0.12514364110494514, + "grad_max_sv": 0.04278304530307651, + "grad_min_sv": 5.111839701214236e-27, + "grad_condition": 42783045303.07613, + "lr": 0.0006545084971874734, + "time_sec": 87.08950901031494 + }, + { + "epoch": 61, + "train_loss": 4.876955277404785, + "train_acc": 0.00986, + "test_loss": 9.633759455871582, + "test_acc": 0.01, + "lyapunov": 1.5432406968777748, + "grad_norm": 0.13030696119131907, + "grad_max_sv": 0.01869940897449851, + "grad_min_sv": 0.0, + "grad_condition": 18699408974.498512, + "lr": 0.0006445158984722354, + "time_sec": 87.06369233131409 + }, + { + "epoch": 62, + "train_loss": 4.880256801300049, + "train_acc": 0.00914, + "test_loss": 8.106962710571288, + "test_acc": 0.01, + "lyapunov": 1.5493804704197838, + "grad_norm": 0.13707953455281482, + "grad_max_sv": 0.05703742457553744, + "grad_min_sv": 2.412788074144182e-18, + "grad_condition": 57037235841.35691, + "lr": 0.0006344599103076324, + "time_sec": 87.23956346511841 + }, + { + "epoch": 63, + "train_loss": 4.877262191009521, + "train_acc": 0.00972, + "test_loss": 9.24615108947754, + "test_acc": 0.01, + "lyapunov": 1.5415991502039879, + "grad_norm": 0.13665560919633327, + "grad_max_sv": 0.0726124294102192, + "grad_min_sv": 2.0682456318226844e-23, + "grad_condition": 72612429408.54066, + "lr": 0.0006243449435824269, + "time_sec": 87.23054909706116 + }, + { + "epoch": 64, + "train_loss": 4.87730983215332, + "train_acc": 0.00936, + "test_loss": 10.058143447875976, + "test_acc": 0.01, + "lyapunov": 1.5422342823594428, + "grad_norm": 0.12004208587403144, + "grad_max_sv": 0.06160930292680859, + "grad_min_sv": 0.0, + "grad_condition": 61609302926.80859, + "lr": 0.0006141754350553275, + "time_sec": 87.30030584335327 + }, + { + "epoch": 65, + "train_loss": 4.878948260040283, + "train_acc": 0.0093, + "test_loss": 9.260436712646484, + "test_acc": 0.01, + "lyapunov": 1.5483233312816571, + "grad_norm": 0.12423135486220072, + "grad_max_sv": 0.0546061669010669, + "grad_min_sv": 0.0, + "grad_condition": 54606166901.066895, + "lr": 0.0006039558454088793, + "time_sec": 87.31754422187805 + }, + { + "epoch": 66, + "train_loss": 4.881117270965576, + "train_acc": 0.00976, + "test_loss": 7.955686111450195, + "test_acc": 0.01, + "lyapunov": 1.5531517626989224, + "grad_norm": 0.1466609355894601, + "grad_max_sv": 0.05231738574802876, + "grad_min_sv": 0.0, + "grad_condition": 52317385748.02876, + "lr": 0.000593690657292862, + "time_sec": 87.25684475898743 + }, + { + "epoch": 67, + "train_loss": 4.87848960723877, + "train_acc": 0.0093, + "test_loss": 8.291721563720703, + "test_acc": 0.01, + "lyapunov": 1.5488468536635493, + "grad_norm": 0.13358884588524558, + "grad_max_sv": 0.046516909170895814, + "grad_min_sv": 0.0, + "grad_condition": 46516909170.89581, + "lr": 0.0005833843733580507, + "time_sec": 87.23024368286133 + }, + { + "epoch": 68, + "train_loss": 4.876251863098145, + "train_acc": 0.00948, + "test_loss": 8.313035414123535, + "test_acc": 0.01, + "lyapunov": 1.5433335642680488, + "grad_norm": 0.10782264609925914, + "grad_max_sv": 0.04402522062882781, + "grad_min_sv": 0.0, + "grad_condition": 44025220628.827805, + "lr": 0.0005730415142812054, + "time_sec": 87.16200470924377 + }, + { + "epoch": 69, + "train_loss": 4.877121996459961, + "train_acc": 0.00992, + "test_loss": 6.634935369110107, + "test_acc": 0.01, + "lyapunov": 1.5465551251950471, + "grad_norm": 0.10524482896626382, + "grad_max_sv": 0.03552310774102807, + "grad_min_sv": 0.0, + "grad_condition": 35523107741.02806, + "lr": 0.0005626666167821517, + "time_sec": 87.16768336296082 + }, + { + "epoch": 70, + "train_loss": 4.877148870697021, + "train_acc": 0.00924, + "test_loss": 5.170057612609863, + "test_acc": 0.01, + "lyapunov": 1.544044288223052, + "grad_norm": 0.12272040694034365, + "grad_max_sv": 0.042177446838468316, + "grad_min_sv": 0.0, + "grad_condition": 42177446838.46831, + "lr": 0.0005522642316338265, + "time_sec": 87.17852282524109 + }, + { + "epoch": 71, + "train_loss": 4.878114613800049, + "train_acc": 0.00918, + "test_loss": 5.881608570861816, + "test_acc": 0.01, + "lyapunov": 1.5485444328059321, + "grad_norm": 0.1267744759308649, + "grad_max_sv": 0.03348520016297698, + "grad_min_sv": 0.0, + "grad_condition": 33485200162.97698, + "lr": 0.0005418389216661573, + "time_sec": 87.12145924568176 + }, + { + "epoch": 72, + "train_loss": 4.877243146057129, + "train_acc": 0.00954, + "test_loss": 4.831268686676025, + "test_acc": 0.01, + "lyapunov": 1.5455416965362665, + "grad_norm": 0.11162604722177562, + "grad_max_sv": 0.04829189190641046, + "grad_min_sv": 0.0, + "grad_condition": 48291891906.41045, + "lr": 0.0005313952597646563, + "time_sec": 87.20591306686401 + }, + { + "epoch": 73, + "train_loss": 4.877523553466797, + "train_acc": 0.00916, + "test_loss": 5.21819946975708, + "test_acc": 0.01, + "lyapunov": 1.5469345262898204, + "grad_norm": 0.1695274830056392, + "grad_max_sv": 0.03528429148718715, + "grad_min_sv": 0.0, + "grad_condition": 35284291487.18715, + "lr": 0.0005209378268645994, + "time_sec": 87.15492391586304 + }, + { + "epoch": 74, + "train_loss": 4.878687818603516, + "train_acc": 0.00902, + "test_loss": 7.045982824707031, + "test_acc": 0.01, + "lyapunov": 1.548920457320445, + "grad_norm": 0.11876165619339213, + "grad_max_sv": 0.0398634166456759, + "grad_min_sv": 0.0, + "grad_condition": 39863416645.675896, + "lr": 0.0005104712099416781, + "time_sec": 87.20987892150879 + }, + { + "epoch": 75, + "train_loss": 4.8802404374694826, + "train_acc": 0.00952, + "test_loss": 5.816082705688476, + "test_acc": 0.01, + "lyapunov": 1.5510207057913856, + "grad_norm": 0.11814260313160607, + "grad_max_sv": 0.04241896355524659, + "grad_min_sv": 0.0, + "grad_condition": 42418963555.24659, + "lr": 0.0004999999999999996, + "time_sec": 87.17034125328064 + }, + { + "epoch": 76, + "train_loss": 4.877049774017334, + "train_acc": 0.01008, + "test_loss": 5.791509801483154, + "test_acc": 0.01, + "lyapunov": 1.545583454544282, + "grad_norm": 0.10644494843061181, + "grad_max_sv": 0.044637566059827806, + "grad_min_sv": 0.0, + "grad_condition": 44637566059.827805, + "lr": 0.0004895287900583212, + "time_sec": 87.17367744445801 + }, + { + "epoch": 77, + "train_loss": 4.876323641052246, + "train_acc": 0.00964, + "test_loss": 5.184193676757812, + "test_acc": 0.01, + "lyapunov": 1.5437548282506215, + "grad_norm": 0.10450293107653293, + "grad_max_sv": 0.04073738274164498, + "grad_min_sv": 0.0, + "grad_condition": 40737382741.64498, + "lr": 0.0004790621731353997, + "time_sec": 87.17853283882141 + }, + { + "epoch": 78, + "train_loss": 4.8809456416320804, + "train_acc": 0.00946, + "test_loss": 4.926686591339111, + "test_acc": 0.01, + "lyapunov": 1.5541882484465304, + "grad_norm": 0.12051319198728945, + "grad_max_sv": 0.033642015885561705, + "grad_min_sv": 0.0, + "grad_condition": 33642015885.561707, + "lr": 0.000468604740235343, + "time_sec": 87.15360975265503 + }, + { + "epoch": 79, + "train_loss": 4.878056556091309, + "train_acc": 0.00886, + "test_loss": 4.698637203979493, + "test_acc": 0.01, + "lyapunov": 1.5484835391154375, + "grad_norm": 0.11143972892340351, + "grad_max_sv": 0.03221007520332932, + "grad_min_sv": 0.0, + "grad_condition": 32210075203.329323, + "lr": 0.00045816107833384175, + "time_sec": 87.12274217605591 + }, + { + "epoch": 80, + "train_loss": 4.877688450622559, + "train_acc": 0.00998, + "test_loss": 4.708519946289062, + "test_acc": 0.01, + "lyapunov": 1.5479903696747996, + "grad_norm": 0.10853834057327462, + "grad_max_sv": 0.03808168638497591, + "grad_min_sv": 0.0, + "grad_condition": 38081686384.97591, + "lr": 0.0004477357683661729, + "time_sec": 87.16511940956116 + }, + { + "epoch": 81, + "train_loss": 4.877410650787353, + "train_acc": 0.00924, + "test_loss": 5.326217936706543, + "test_acc": 0.01, + "lyapunov": 1.5462311384318126, + "grad_norm": 0.1078272819076305, + "grad_max_sv": 0.0341941992752254, + "grad_min_sv": 0.0, + "grad_condition": 34194199275.225403, + "lr": 0.00043733338321784746, + "time_sec": 87.13259315490723 + }, + { + "epoch": 82, + "train_loss": 4.878852579498291, + "train_acc": 0.00992, + "test_loss": 5.124214416503906, + "test_acc": 0.01, + "lyapunov": 1.551578131783039, + "grad_norm": 0.11924540172549285, + "grad_max_sv": 0.032149143144488336, + "grad_min_sv": 0.0, + "grad_condition": 32149143144.488342, + "lr": 0.0004269584857187939, + "time_sec": 87.15441107749939 + }, + { + "epoch": 83, + "train_loss": 4.877541376647949, + "train_acc": 0.00962, + "test_loss": 5.2295348327636715, + "test_acc": 0.01, + "lyapunov": 1.5478261575064696, + "grad_norm": 0.1053498185299808, + "grad_max_sv": 0.026044291676953435, + "grad_min_sv": 0.0, + "grad_condition": 26044291676.953438, + "lr": 0.0004166156266419484, + "time_sec": 87.16295027732849 + }, + { + "epoch": 84, + "train_loss": 4.877119447631836, + "train_acc": 0.00984, + "test_loss": 5.116746160888672, + "test_acc": 0.01, + "lyapunov": 1.5470911304054358, + "grad_norm": 0.10156236054846617, + "grad_max_sv": 0.028701860643923282, + "grad_min_sv": 0.0, + "grad_condition": 28701860643.92328, + "lr": 0.0004063093427071373, + "time_sec": 87.13170576095581 + }, + { + "epoch": 85, + "train_loss": 4.878303242034912, + "train_acc": 0.01008, + "test_loss": 4.748899824523925, + "test_acc": 0.01, + "lyapunov": 1.5509575178556125, + "grad_norm": 0.1141388454907746, + "grad_max_sv": 0.033817021455615756, + "grad_min_sv": 0.0, + "grad_condition": 33817021455.61576, + "lr": 0.0003960441545911199, + "time_sec": 87.10089588165283 + }, + { + "epoch": 86, + "train_loss": 4.87876032699585, + "train_acc": 0.0097, + "test_loss": 4.651885162353516, + "test_acc": 0.01, + "lyapunov": 1.5511503161676705, + "grad_norm": 0.09785209813867382, + "grad_max_sv": 0.027630697237327695, + "grad_min_sv": 0.0, + "grad_condition": 27630697237.32769, + "lr": 0.0003858245649446718, + "time_sec": 87.0941972732544 + }, + { + "epoch": 87, + "train_loss": 4.877712865142822, + "train_acc": 0.00998, + "test_loss": 5.250769630432129, + "test_acc": 0.01, + "lyapunov": 1.548732325549016, + "grad_norm": 0.1974258085478382, + "grad_max_sv": 0.02602379145100713, + "grad_min_sv": 0.0, + "grad_condition": 26023791451.00713, + "lr": 0.00037565505641757235, + "time_sec": 87.11909556388855 + }, + { + "epoch": 88, + "train_loss": 4.877790277404785, + "train_acc": 0.00996, + "test_loss": 5.091197055053711, + "test_acc": 0.01, + "lyapunov": 1.5483774038227014, + "grad_norm": 0.10333331120218883, + "grad_max_sv": 0.03042559456080198, + "grad_min_sv": 0.0, + "grad_condition": 30425594560.801983, + "lr": 0.00036554008969236695, + "time_sec": 87.1078622341156 + }, + { + "epoch": 89, + "train_loss": 4.877677908020019, + "train_acc": 0.0099, + "test_loss": 5.058323477935791, + "test_acc": 0.01, + "lyapunov": 1.5483884863231494, + "grad_norm": 0.09905622622525881, + "grad_max_sv": 0.03069272106513381, + "grad_min_sv": 0.0, + "grad_condition": 30692721065.133812, + "lr": 0.0003554841015277638, + "time_sec": 87.05663800239563 + }, + { + "epoch": 90, + "train_loss": 4.881804440917969, + "train_acc": 0.0106, + "test_loss": 5.362990502166748, + "test_acc": 0.01, + "lyapunov": 1.553605647648082, + "grad_norm": 0.10267946386955158, + "grad_max_sv": 0.030273563507944346, + "grad_min_sv": 0.0, + "grad_condition": 30273563507.944347, + "lr": 0.000345491502812526, + "time_sec": 87.06899333000183 + }, + { + "epoch": 91, + "train_loss": 4.879398302917481, + "train_acc": 0.01, + "test_loss": 5.126827237701416, + "test_acc": 0.01, + "lyapunov": 1.5521758828321686, + "grad_norm": 0.12087522031268683, + "grad_max_sv": 0.03009325391612947, + "grad_min_sv": 0.0, + "grad_condition": 30093253916.129467, + "lr": 0.0003355666766307081, + "time_sec": 87.05256390571594 + }, + { + "epoch": 92, + "train_loss": 4.880291121673584, + "train_acc": 0.00988, + "test_loss": 5.26154695892334, + "test_acc": 0.01, + "lyapunov": 1.5549428770914102, + "grad_norm": 0.13231588784429352, + "grad_max_sv": 0.03350330209359527, + "grad_min_sv": 0.0, + "grad_condition": 33503302093.595264, + "lr": 0.00032571397633909225, + "time_sec": 87.10619926452637 + }, + { + "epoch": 93, + "train_loss": 4.8782078823852535, + "train_acc": 0.00968, + "test_loss": 5.271252917480469, + "test_acc": 0.01, + "lyapunov": 1.5495562916216643, + "grad_norm": 0.12175801600529883, + "grad_max_sv": 0.03186503546312451, + "grad_min_sv": 0.0, + "grad_condition": 31865035463.12451, + "lr": 0.00031593772365766094, + "time_sec": 87.12923264503479 + }, + { + "epoch": 94, + "train_loss": 4.87740290222168, + "train_acc": 0.00982, + "test_loss": 5.075842178344726, + "test_acc": 0.01, + "lyapunov": 1.547658307473068, + "grad_norm": 0.11436426699794455, + "grad_max_sv": 0.02530919690616429, + "grad_min_sv": 0.0, + "grad_condition": 25309196906.164288, + "lr": 0.0003062422067739483, + "time_sec": 87.08783769607544 + }, + { + "epoch": 95, + "train_loss": 4.877675037384034, + "train_acc": 0.00952, + "test_loss": 5.33029627532959, + "test_acc": 0.01, + "lyapunov": 1.5485165667960712, + "grad_norm": 0.10074303038813699, + "grad_max_sv": 0.03554986314848065, + "grad_min_sv": 0.0, + "grad_condition": 35549863148.48065, + "lr": 0.00029663167846209965, + "time_sec": 87.08289909362793 + }, + { + "epoch": 96, + "train_loss": 4.877177648620606, + "train_acc": 0.01022, + "test_loss": 5.369173509216308, + "test_acc": 0.01, + "lyapunov": 1.5468677212210262, + "grad_norm": 0.1013436246118025, + "grad_max_sv": 0.03922831532545388, + "grad_min_sv": 0.0, + "grad_condition": 39228315325.45387, + "lr": 0.00028711035421746345, + "time_sec": 87.09603428840637 + }, + { + "epoch": 97, + "train_loss": 4.881449295959473, + "train_acc": 0.00942, + "test_loss": 4.928601164245605, + "test_acc": 0.01, + "lyapunov": 1.5567159265508432, + "grad_norm": 0.10170216841041604, + "grad_max_sv": 0.021827650628983973, + "grad_min_sv": 0.0, + "grad_condition": 21827650628.98397, + "lr": 0.00027768241040753615, + "time_sec": 87.07169818878174 + }, + { + "epoch": 98, + "train_loss": 4.8775743408203125, + "train_acc": 0.00984, + "test_loss": 4.987854670715332, + "test_acc": 0.01, + "lyapunov": 1.548287238916168, + "grad_norm": 0.12626493811946907, + "grad_max_sv": 0.03011642089113593, + "grad_min_sv": 0.0, + "grad_condition": 30116420891.135933, + "lr": 0.00026835198244006903, + "time_sec": 87.164879322052 + }, + { + "epoch": 99, + "train_loss": 4.878459322357178, + "train_acc": 0.00968, + "test_loss": 4.931130755615234, + "test_acc": 0.01, + "lyapunov": 1.5513008421339343, + "grad_norm": 0.1050431882077805, + "grad_max_sv": 0.026918977173045276, + "grad_min_sv": 0.0, + "grad_condition": 26918977173.045277, + "lr": 0.0002591231629491421, + "time_sec": 87.06193971633911 + }, + { + "epoch": 100, + "train_loss": 4.877405020904541, + "train_acc": 0.00972, + "test_loss": 4.892998168182373, + "test_acc": 0.01, + "lyapunov": 1.5485746119638233, + "grad_norm": 0.10391039157029125, + "grad_max_sv": 0.009399653738364577, + "grad_min_sv": 0.0, + "grad_condition": 9399653738.364578, + "lr": 0.0002499999999999997, + "time_sec": 86.99319124221802 + }, + { + "epoch": 101, + "train_loss": 4.878013845367431, + "train_acc": 0.00972, + "test_loss": 4.892334498596192, + "test_acc": 0.01, + "lyapunov": 1.549886227568702, + "grad_norm": 0.10312805970588344, + "grad_max_sv": 0.020510493777692318, + "grad_min_sv": 0.0, + "grad_condition": 20510493777.692318, + "lr": 0.00024098649531343477, + "time_sec": 87.05790066719055 + }, + { + "epoch": 102, + "train_loss": 4.878095693969726, + "train_acc": 0.00976, + "test_loss": 4.820429385375976, + "test_acc": 0.01, + "lyapunov": 1.5501237391206004, + "grad_norm": 0.11558211080028734, + "grad_max_sv": 0.024952154234051706, + "grad_min_sv": 0.0, + "grad_condition": 24952154234.051704, + "lr": 0.0002320866025105016, + "time_sec": 87.05184125900269 + }, + { + "epoch": 103, + "train_loss": 4.878661685333252, + "train_acc": 0.01018, + "test_loss": 5.300121360015869, + "test_acc": 0.01, + "lyapunov": 1.551538582957919, + "grad_norm": 0.12567932831666664, + "grad_max_sv": 0.012993747182190419, + "grad_min_sv": 0.0, + "grad_condition": 12993747182.190418, + "lr": 0.0002233042253783278, + "time_sec": 87.06061792373657 + }, + { + "epoch": 104, + "train_loss": 4.877294933776856, + "train_acc": 0.0099, + "test_loss": 5.135670352172852, + "test_acc": 0.01, + "lyapunov": 1.5485212714470866, + "grad_norm": 0.09250410480818645, + "grad_max_sv": 0.004851618967950344, + "grad_min_sv": 0.0, + "grad_condition": 4851618967.950345, + "lr": 0.000214643216157784, + "time_sec": 87.05238747596741 + }, + { + "epoch": 105, + "train_loss": 4.877063808746338, + "train_acc": 0.00988, + "test_loss": 5.725478736877442, + "test_acc": 0.01, + "lyapunov": 1.5481484466806397, + "grad_norm": 0.09550603539231842, + "grad_max_sv": 0.011385573633015155, + "grad_min_sv": 0.0, + "grad_condition": 11385573633.015156, + "lr": 0.00020610737385376332, + "time_sec": 87.0910587310791 + }, + { + "epoch": 106, + "train_loss": 4.877282638549804, + "train_acc": 0.00984, + "test_loss": 5.60465906829834, + "test_acc": 0.01, + "lyapunov": 1.5483009687165166, + "grad_norm": 0.10354511535570549, + "grad_max_sv": 0.02720399503596127, + "grad_min_sv": 0.0, + "grad_condition": 27203995035.961273, + "lr": 0.00019770044256881242, + "time_sec": 87.10812902450562 + }, + { + "epoch": 107, + "train_loss": 4.876681364440918, + "train_acc": 0.00976, + "test_loss": 5.2093520240783695, + "test_acc": 0.01, + "lyapunov": 1.5473160725420394, + "grad_norm": 0.09575843142426103, + "grad_max_sv": 0.007643958646804094, + "grad_min_sv": 0.0, + "grad_condition": 7643958646.804095, + "lr": 0.0001894261098608447, + "time_sec": 87.00347948074341 + }, + { + "epoch": 108, + "train_loss": 4.878350821228027, + "train_acc": 0.01052, + "test_loss": 4.913621876525879, + "test_acc": 0.01, + "lyapunov": 1.5520180210737926, + "grad_norm": 0.1307850708492295, + "grad_max_sv": 0.016565991286188363, + "grad_min_sv": 0.0, + "grad_condition": 16565991286.188366, + "lr": 0.000181288005125655, + "time_sec": 87.0159866809845 + }, + { + "epoch": 109, + "train_loss": 4.876669662628174, + "train_acc": 0.01016, + "test_loss": 4.88301672668457, + "test_acc": 0.01, + "lyapunov": 1.5467288201422338, + "grad_norm": 0.09856162731459642, + "grad_max_sv": 0.014887689799070358, + "grad_min_sv": 0.0, + "grad_condition": 14887689799.070358, + "lr": 0.0001732896980049473, + "time_sec": 86.99599003791809 + }, + { + "epoch": 110, + "train_loss": 4.877418764038086, + "train_acc": 0.00988, + "test_loss": 5.01456753540039, + "test_acc": 0.01, + "lyapunov": 1.549457520170285, + "grad_norm": 0.11878011333313225, + "grad_max_sv": 0.005905823782086372, + "grad_min_sv": 0.0, + "grad_condition": 5905823782.086372, + "lr": 0.00016543469682057076, + "time_sec": 87.00050139427185 + }, + { + "epoch": 111, + "train_loss": 4.877375203704834, + "train_acc": 0.01016, + "test_loss": 4.923972444152832, + "test_acc": 0.01, + "lyapunov": 1.549215167074862, + "grad_norm": 0.11051840491520531, + "grad_max_sv": 0.007604151451960206, + "grad_min_sv": 0.0, + "grad_condition": 7604151451.960205, + "lr": 0.00015772644703565552, + "time_sec": 87.03872609138489 + }, + { + "epoch": 112, + "train_loss": 4.87747160736084, + "train_acc": 0.0097, + "test_loss": 4.956568124389649, + "test_acc": 0.01, + "lyapunov": 1.5494032619554368, + "grad_norm": 0.11381662366828246, + "grad_max_sv": 0.01119147464632988, + "grad_min_sv": 0.0, + "grad_condition": 11191474646.32988, + "lr": 0.00015016832974331713, + "time_sec": 87.11299419403076 + }, + { + "epoch": 113, + "train_loss": 4.87979639755249, + "train_acc": 0.01012, + "test_loss": 4.926776232910156, + "test_acc": 0.01, + "lyapunov": 1.5544771361533942, + "grad_norm": 0.15709933765078352, + "grad_max_sv": 0.00347123583778739, + "grad_min_sv": 0.0, + "grad_condition": 3471235837.78739, + "lr": 0.00014276366018359834, + "time_sec": 87.06232452392578 + }, + { + "epoch": 114, + "train_loss": 4.878047005310059, + "train_acc": 0.00952, + "test_loss": 4.92212592086792, + "test_acc": 0.01, + "lyapunov": 1.5507129702116826, + "grad_norm": 0.10294832245991155, + "grad_max_sv": 0.012609629379585385, + "grad_min_sv": 0.0, + "grad_condition": 12609629379.585384, + "lr": 0.00013551568628929425, + "time_sec": 87.06694340705872 + }, + { + "epoch": 115, + "train_loss": 4.877151131134033, + "train_acc": 0.0092, + "test_loss": 4.918728126525879, + "test_acc": 0.01, + "lyapunov": 1.548615127878116, + "grad_norm": 0.10263613090186025, + "grad_max_sv": 0.006314583634957671, + "grad_min_sv": 0.0, + "grad_condition": 6314583634.957671, + "lr": 0.00012842758726130276, + "time_sec": 87.03067350387573 + }, + { + "epoch": 116, + "train_loss": 4.87786820098877, + "train_acc": 0.00982, + "test_loss": 5.00487536239624, + "test_acc": 0.01, + "lyapunov": 1.5504866353691082, + "grad_norm": 0.12269127259842373, + "grad_max_sv": 0.014170486759394408, + "grad_min_sv": 0.0, + "grad_condition": 14170486759.39441, + "lr": 0.0001215024721741218, + "time_sec": 87.00306367874146 + }, + { + "epoch": 117, + "train_loss": 4.876784671478272, + "train_acc": 0.00974, + "test_loss": 5.023514326477051, + "test_acc": 0.01, + "lyapunov": 1.5474366047193326, + "grad_norm": 0.10427521316985092, + "grad_max_sv": 0.004411047184839844, + "grad_min_sv": 0.0, + "grad_condition": 4411047184.839845, + "lr": 0.00011474337861210538, + "time_sec": 87.03306269645691 + }, + { + "epoch": 118, + "train_loss": 4.877164349365234, + "train_acc": 0.01002, + "test_loss": 4.991419695281983, + "test_acc": 0.01, + "lyapunov": 1.5484020453889658, + "grad_norm": 0.10471789513305493, + "grad_max_sv": 0.008587307529523969, + "grad_min_sv": 0.0, + "grad_condition": 8587307529.523969, + "lr": 0.00010815327133708009, + "time_sec": 87.06011486053467 + }, + { + "epoch": 119, + "train_loss": 4.876861254577637, + "train_acc": 0.00988, + "test_loss": 5.089453727722168, + "test_acc": 0.01, + "lyapunov": 1.5475890602906952, + "grad_norm": 0.10992180658040822, + "grad_max_sv": 0.009593591233715415, + "grad_min_sv": 0.0, + "grad_condition": 9593591233.715414, + "lr": 0.00010173504098790182, + "time_sec": 87.0181610584259 + }, + { + "epoch": 120, + "train_loss": 4.87691458618164, + "train_acc": 0.00984, + "test_loss": 5.0014659088134765, + "test_acc": 0.01, + "lyapunov": 1.5480926106957829, + "grad_norm": 0.10767138662291806, + "grad_max_sv": 0.0038278432097285987, + "grad_min_sv": 0.0, + "grad_condition": 3827843209.728598, + "lr": 9.549150281252629e-05, + "time_sec": 86.99478530883789 + }, + { + "epoch": 121, + "train_loss": 4.877940362548828, + "train_acc": 0.00962, + "test_loss": 4.935777435302734, + "test_acc": 0.01, + "lyapunov": 1.5509431261540678, + "grad_norm": 0.13054112707845358, + "grad_max_sv": 0.006552627170458436, + "grad_min_sv": 0.0, + "grad_condition": 6552627170.458437, + "lr": 8.942539543314794e-05, + "time_sec": 87.0364146232605 + }, + { + "epoch": 122, + "train_loss": 4.877626941223144, + "train_acc": 0.01018, + "test_loss": 4.956711478424072, + "test_acc": 0.01, + "lyapunov": 1.549799994434542, + "grad_norm": 0.12579422138988705, + "grad_max_sv": 0.012472250685095786, + "grad_min_sv": 0.0, + "grad_condition": 12472250685.095787, + "lr": 8.353937964495024e-05, + "time_sec": 87.04438400268555 + }, + { + "epoch": 123, + "train_loss": 4.8773612213134765, + "train_acc": 0.01028, + "test_loss": 5.112759294128418, + "test_acc": 0.01, + "lyapunov": 1.5493231264831464, + "grad_norm": 0.11869948278714595, + "grad_max_sv": 0.006990070082247257, + "grad_min_sv": 0.0, + "grad_condition": 6990070082.247256, + "lr": 7.783603724899243e-05, + "time_sec": 87.04442477226257 + }, + { + "epoch": 124, + "train_loss": 4.876904801330566, + "train_acc": 0.00974, + "test_loss": 5.0848597717285156, + "test_acc": 0.01, + "lyapunov": 1.547949957725642, + "grad_norm": 0.11622328135609243, + "grad_max_sv": 0.00592916551977396, + "grad_min_sv": 0.0, + "grad_condition": 5929165519.773959, + "lr": 7.231786991974666e-05, + "time_sec": 87.02583312988281 + }, + { + "epoch": 125, + "train_loss": 4.876884867248535, + "train_acc": 0.00994, + "test_loss": 5.093001669311524, + "test_acc": 0.01, + "lyapunov": 1.5479519553196706, + "grad_norm": 0.11394234129927898, + "grad_max_sv": 0.003486808715388179, + "grad_min_sv": 0.0, + "grad_condition": 3486808715.388179, + "lr": 6.698729810778072e-05, + "time_sec": 87.01634311676025 + }, + { + "epoch": 126, + "train_loss": 4.87686362991333, + "train_acc": 0.00962, + "test_loss": 5.044818876647949, + "test_acc": 0.01, + "lyapunov": 1.5478015985635236, + "grad_norm": 0.11528475995319568, + "grad_max_sv": 0.01741538755595684, + "grad_min_sv": 0.0, + "grad_condition": 17415387555.95684, + "lr": 6.184665997806817e-05, + "time_sec": 87.03749418258667 + }, + { + "epoch": 127, + "train_loss": 4.877244481811523, + "train_acc": 0.00992, + "test_loss": 5.0011329849243165, + "test_acc": 0.01, + "lyapunov": 1.5490661807682202, + "grad_norm": 0.11235050252375584, + "grad_max_sv": 0.0023714601527899505, + "grad_min_sv": 0.0, + "grad_condition": 2371460152.7899504, + "lr": 5.6898210384392595e-05, + "time_sec": 87.06668877601624 + }, + { + "epoch": 128, + "train_loss": 4.877482815856934, + "train_acc": 0.01004, + "test_loss": 5.234975555419922, + "test_acc": 0.01, + "lyapunov": 1.549882313784431, + "grad_norm": 0.11546242652617031, + "grad_max_sv": 0.0007256413344293832, + "grad_min_sv": 0.0, + "grad_condition": 725641334.4293833, + "lr": 5.214411988029363e-05, + "time_sec": 87.02991795539856 + }, + { + "epoch": 129, + "train_loss": 4.8767640072631835, + "train_acc": 0.01006, + "test_loss": 5.377161560821533, + "test_acc": 0.01, + "lyapunov": 1.5474718257289408, + "grad_norm": 0.12203371483427425, + "grad_max_sv": 0.016016411827877164, + "grad_min_sv": 0.0, + "grad_condition": 16016411827.877163, + "lr": 4.7586473766990294e-05, + "time_sec": 87.09737348556519 + }, + { + "epoch": 130, + "train_loss": 4.8772621307373045, + "train_acc": 0.00994, + "test_loss": 5.146733520507812, + "test_acc": 0.01, + "lyapunov": 1.5492317725325484, + "grad_norm": 0.13239853793431725, + "grad_max_sv": 0.007805489096790552, + "grad_min_sv": 0.0, + "grad_condition": 7805489096.790552, + "lr": 4.32272711786996e-05, + "time_sec": 87.02493596076965 + }, + { + "epoch": 131, + "train_loss": 4.878482946472168, + "train_acc": 0.01002, + "test_loss": 5.187312270355225, + "test_acc": 0.01, + "lyapunov": 1.5515824739280564, + "grad_norm": 0.13050261520417258, + "grad_max_sv": 0.003781923418864608, + "grad_min_sv": 0.0, + "grad_condition": 3781923418.8646073, + "lr": 3.906842420574966e-05, + "time_sec": 87.00766158103943 + }, + { + "epoch": 132, + "train_loss": 4.8773687062072755, + "train_acc": 0.01038, + "test_loss": 5.233526524353027, + "test_acc": 0.01, + "lyapunov": 1.5493864241768331, + "grad_norm": 0.13275623808990364, + "grad_max_sv": 0.00900785457342863, + "grad_min_sv": 0.0, + "grad_condition": 9007854573.42863, + "lr": 3.5111757055874305e-05, + "time_sec": 87.07332277297974 + }, + { + "epoch": 133, + "train_loss": 4.877119999389649, + "train_acc": 0.01, + "test_loss": 5.208364566040039, + "test_acc": 0.01, + "lyapunov": 1.5486897553324395, + "grad_norm": 0.13669667117137443, + "grad_max_sv": 0.0031375800725072624, + "grad_min_sv": 0.0, + "grad_condition": 3137580072.507262, + "lr": 3.1359005254054254e-05, + "time_sec": 87.08415913581848 + }, + { + "epoch": 134, + "train_loss": 4.876680097198486, + "train_acc": 0.01026, + "test_loss": 5.228788011169434, + "test_acc": 0.01, + "lyapunov": 1.5476158646976246, + "grad_norm": 0.1315586247563803, + "grad_max_sv": 0.0019336893223226071, + "grad_min_sv": 0.0, + "grad_condition": 1933689322.322607, + "lr": 2.7811814881259484e-05, + "time_sec": 87.04997158050537 + }, + { + "epoch": 135, + "train_loss": 4.877045626525879, + "train_acc": 0.00998, + "test_loss": 5.150844607543945, + "test_acc": 0.01, + "lyapunov": 1.5484065021700262, + "grad_norm": 0.16019208167708357, + "grad_max_sv": 0.0067828110419213775, + "grad_min_sv": 0.0, + "grad_condition": 6782811041.921377, + "lr": 2.4471741852423218e-05, + "time_sec": 87.07145261764526 + }, + { + "epoch": 136, + "train_loss": 4.877011717224121, + "train_acc": 0.00942, + "test_loss": 5.185321200561523, + "test_acc": 0.01, + "lyapunov": 1.5481893522355257, + "grad_norm": 0.16513336675938264, + "grad_max_sv": 0.006155044818297028, + "grad_min_sv": 0.0, + "grad_condition": 6155044818.297029, + "lr": 2.1340251233966362e-05, + "time_sec": 87.08501839637756 + }, + { + "epoch": 137, + "train_loss": 4.877299792480469, + "train_acc": 0.00994, + "test_loss": 5.153644463348389, + "test_acc": 0.01, + "lyapunov": 1.5492148905458962, + "grad_norm": 0.14657870229772474, + "grad_max_sv": 0.007406354090198875, + "grad_min_sv": 0.0, + "grad_condition": 7406354090.1988735, + "lr": 1.8418716601170932e-05, + "time_sec": 87.17517495155334 + }, + { + "epoch": 138, + "train_loss": 4.877124798736572, + "train_acc": 0.01016, + "test_loss": 5.164669793701172, + "test_acc": 0.01, + "lyapunov": 1.548459598170522, + "grad_norm": 0.15457514508897918, + "grad_max_sv": 0.012952858628705145, + "grad_min_sv": 0.0, + "grad_condition": 12952858628.705143, + "lr": 1.570841943568445e-05, + "time_sec": 87.19324207305908 + }, + { + "epoch": 139, + "train_loss": 4.877282972564697, + "train_acc": 0.00982, + "test_loss": 5.207451676940918, + "test_acc": 0.01, + "lyapunov": 1.5492830764302208, + "grad_norm": 0.18425099220738375, + "grad_max_sv": 0.0019508119206875564, + "grad_min_sv": 0.0, + "grad_condition": 1950811920.6875565, + "lr": 1.3210548563419845e-05, + "time_sec": 87.13183116912842 + }, + { + "epoch": 140, + "train_loss": 4.877498146057129, + "train_acc": 0.00968, + "test_loss": 5.200590103149414, + "test_acc": 0.01, + "lyapunov": 1.5491700614504802, + "grad_norm": 0.1734732516042842, + "grad_max_sv": 0.01371888890862465, + "grad_min_sv": 0.0, + "grad_condition": 13718888908.62465, + "lr": 1.0926199633097203e-05, + "time_sec": 87.21231150627136 + }, + { + "epoch": 141, + "train_loss": 4.8770866912841795, + "train_acc": 0.00992, + "test_loss": 5.190837601470947, + "test_acc": 0.01, + "lyapunov": 1.548795386653422, + "grad_norm": 0.14753103772737095, + "grad_max_sv": 0.005145562486723066, + "grad_min_sv": 0.0, + "grad_condition": 5145562486.723065, + "lr": 8.856374635655688e-06, + "time_sec": 87.26526665687561 + }, + { + "epoch": 142, + "train_loss": 4.8766608699035645, + "train_acc": 0.00968, + "test_loss": 5.162030874633789, + "test_acc": 0.01, + "lyapunov": 1.5475660821665889, + "grad_norm": 0.15219397900813178, + "grad_max_sv": 0.005608938308432699, + "grad_min_sv": 0.0, + "grad_condition": 5608938308.432698, + "lr": 7.001981464747503e-06, + "time_sec": 87.12494492530823 + }, + { + "epoch": 143, + "train_loss": 4.8769151321411135, + "train_acc": 0.01004, + "test_loss": 5.153072937011719, + "test_acc": 0.01, + "lyapunov": 1.5482893115114373, + "grad_norm": 0.15346228098731488, + "grad_max_sv": 0.001303949998691678, + "grad_min_sv": 0.0, + "grad_condition": 1303949998.691678, + "lr": 5.3638335185058295e-06, + "time_sec": 87.097491979599 + }, + { + "epoch": 144, + "train_loss": 4.877143389892578, + "train_acc": 0.0097, + "test_loss": 5.164535620117188, + "test_acc": 0.01, + "lyapunov": 1.5487491736936447, + "grad_norm": 0.15811775595604075, + "grad_max_sv": 0.008902552211657167, + "grad_min_sv": 0.0, + "grad_condition": 8902552211.657166, + "lr": 3.942649342761114e-06, + "time_sec": 87.06983470916748 + }, + { + "epoch": 145, + "train_loss": 4.876982822113037, + "train_acc": 0.00984, + "test_loss": 5.165194831848145, + "test_acc": 0.01, + "lyapunov": 1.5484599853720507, + "grad_norm": 0.1582019401241392, + "grad_max_sv": 0.004445526329800486, + "grad_min_sv": 0.0, + "grad_condition": 4445526329.800487, + "lr": 2.7390523158633524e-06, + "time_sec": 87.08561754226685 + }, + { + "epoch": 146, + "train_loss": 4.876878872375488, + "train_acc": 0.00992, + "test_loss": 5.165199098205567, + "test_acc": 0.01, + "lyapunov": 1.5481780770489626, + "grad_norm": 0.16041164237051417, + "grad_max_sv": 0.003941980935633182, + "grad_min_sv": 0.0, + "grad_condition": 3941980935.6331825, + "lr": 1.7535703752478133e-06, + "time_sec": 87.0421531200409 + }, + { + "epoch": 147, + "train_loss": 4.8771999089050295, + "train_acc": 0.01004, + "test_loss": 5.164550498199463, + "test_acc": 0.01, + "lyapunov": 1.5491338004846402, + "grad_norm": 0.16309259034155005, + "grad_max_sv": 0.004459652304649353, + "grad_min_sv": 0.0, + "grad_condition": 4459652304.649353, + "lr": 9.866357858642196e-07, + "time_sec": 87.06988906860352 + }, + { + "epoch": 148, + "train_loss": 4.876641088562011, + "train_acc": 0.00982, + "test_loss": 5.164551524353027, + "test_acc": 0.01, + "lyapunov": 1.5472115714226842, + "grad_norm": 0.15826813584085664, + "grad_max_sv": 0.008349275542423129, + "grad_min_sv": 0.0, + "grad_condition": 8349275542.423129, + "lr": 4.38584950570808e-07, + "time_sec": 87.10272812843323 + }, + { + "epoch": 149, + "train_loss": 4.877132370300293, + "train_acc": 0.01012, + "test_loss": 5.164552142333984, + "test_acc": 0.01, + "lyapunov": 1.5489305702926557, + "grad_norm": 0.15991562154962183, + "grad_max_sv": 0.0012625465169548988, + "grad_min_sv": 0.0, + "grad_condition": 1262546516.9548988, + "lr": 1.096582625772501e-07, + "time_sec": 87.08622741699219 + }, + { + "epoch": 150, + "train_loss": 4.876020973968505, + "train_acc": 0.0099, + "test_loss": 5.164552197265625, + "test_acc": 0.01, + "lyapunov": 1.545588637251988, + "grad_norm": 0.16382667555465003, + "grad_max_sv": 0.008686219714581967, + "grad_min_sv": 0.0, + "grad_condition": 8686219714.581966, + "lr": 0.0, + "time_sec": 87.09966802597046 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 4.855030886230469, + "train_acc": 0.0148, + "test_loss": 4.869620406341553, + "test_acc": 0.01, + "lyapunov": 2.2862052685769316, + "grad_norm": 4.935339749560766, + "grad_max_sv": 4.1397371053695675, + "grad_min_sv": 8.49077093301176e-08, + "grad_condition": 60021939.87195291, + "lr": 0.0009998903417374227, + "time_sec": 132.66977620124817 + }, + { + "epoch": 2, + "train_loss": 4.676363162231445, + "train_acc": 0.01706, + "test_loss": 4.653746462249756, + "test_acc": 0.01, + "lyapunov": 1.9439213897870935, + "grad_norm": 2.813935189124443, + "grad_max_sv": 2.2243280917406083, + "grad_min_sv": 4.668241500582759e-08, + "grad_condition": 69883158.92021513, + "lr": 0.0009995614150494292, + "time_sec": 132.62859869003296 + }, + { + "epoch": 3, + "train_loss": 4.635125137634278, + "train_acc": 0.0156, + "test_loss": 4.85989921875, + "test_acc": 0.01, + "lyapunov": 1.709093817359651, + "grad_norm": 1.402581704275357, + "grad_max_sv": 1.0371076561510564, + "grad_min_sv": 1.9744334944187383e-08, + "grad_condition": 12965122527.521233, + "lr": 0.0009990133642141358, + "time_sec": 132.57633781433105 + }, + { + "epoch": 4, + "train_loss": 4.640354335479737, + "train_acc": 0.01534, + "test_loss": 4.637619474792481, + "test_acc": 0.01, + "lyapunov": 1.6715390605999685, + "grad_norm": 0.9398579368308534, + "grad_max_sv": 0.6633182838559151, + "grad_min_sv": 1.2069862256511819e-08, + "grad_condition": 8530355196.976077, + "lr": 0.0009982464296247522, + "time_sec": 132.54676032066345 + }, + { + "epoch": 5, + "train_loss": 4.64221305480957, + "train_acc": 0.01564, + "test_loss": 4.680573092651367, + "test_acc": 0.01, + "lyapunov": 1.657093484688293, + "grad_norm": 0.552135234831364, + "grad_max_sv": 0.3695975001901388, + "grad_min_sv": 2.375610143283509e-09, + "grad_condition": 53738580663.96106, + "lr": 0.0009972609476841367, + "time_sec": 132.5168435573578 + }, + { + "epoch": 6, + "train_loss": 4.6413539511108395, + "train_acc": 0.01584, + "test_loss": 5.049699407958984, + "test_acc": 0.0103, + "lyapunov": 1.6153722675255193, + "grad_norm": 0.5032723336212916, + "grad_max_sv": 0.3346161611378193, + "grad_min_sv": 1.7202862416924891e-09, + "grad_condition": 61330096051.013405, + "lr": 0.000996057350657239, + "time_sec": 132.53665018081665 + }, + { + "epoch": 7, + "train_loss": 4.6673028504943845, + "train_acc": 0.01474, + "test_loss": 4.570369634246826, + "test_acc": 0.0114, + "lyapunov": 1.6155120164841947, + "grad_norm": 0.406883512526028, + "grad_max_sv": 0.2576971501111984, + "grad_min_sv": 1.9000999133456468e-10, + "grad_condition": 77661364868.79805, + "lr": 0.000994636166481494, + "time_sec": 132.51018714904785 + }, + { + "epoch": 8, + "train_loss": 4.760079259643555, + "train_acc": 0.01052, + "test_loss": 4.907698545074463, + "test_acc": 0.01, + "lyapunov": 1.5642740458173825, + "grad_norm": 0.7987649812847755, + "grad_max_sv": 0.6862246070057154, + "grad_min_sv": 1.0877307097171696e-08, + "grad_condition": 32321166738.690815, + "lr": 0.0009929980185352525, + "time_sec": 132.5572907924652 + }, + { + "epoch": 9, + "train_loss": 4.772606210021973, + "train_acc": 0.00996, + "test_loss": 4.704743336486817, + "test_acc": 0.01, + "lyapunov": 1.5716174904952573, + "grad_norm": 0.8148548143851404, + "grad_max_sv": 0.6870301708579063, + "grad_min_sv": 1.1020205989789069e-08, + "grad_condition": 2417926250.6670694, + "lr": 0.0009911436253643444, + "time_sec": 132.52283430099487 + }, + { + "epoch": 10, + "train_loss": 4.773616914978027, + "train_acc": 0.01062, + "test_loss": 4.874710052490235, + "test_acc": 0.01, + "lyapunov": 1.562704872292326, + "grad_norm": 0.6675097799983111, + "grad_max_sv": 0.5464496180415154, + "grad_min_sv": 7.172653980753015e-09, + "grad_condition": 20965681724.308956, + "lr": 0.0009890738003669028, + "time_sec": 132.5459840297699 + }, + { + "epoch": 11, + "train_loss": 4.773348721618652, + "train_acc": 0.01024, + "test_loss": 4.6200670059204105, + "test_acc": 0.01, + "lyapunov": 1.562029262637848, + "grad_norm": 0.5488543058826973, + "grad_max_sv": 0.4311558365821838, + "grad_min_sv": 2.9074530078217566e-09, + "grad_condition": 49435903159.65074, + "lr": 0.00098678945143658, + "time_sec": 132.52372455596924 + }, + { + "epoch": 12, + "train_loss": 4.780688554229736, + "train_acc": 0.01046, + "test_loss": 4.7990555023193355, + "test_acc": 0.01, + "lyapunov": 1.557410420359248, + "grad_norm": 0.39735835708243683, + "grad_max_sv": 0.29783011190593245, + "grad_min_sv": 2.955632668999543e-10, + "grad_condition": 137320228990.74185, + "lr": 0.0009842915805643154, + "time_sec": 132.52459120750427 + }, + { + "epoch": 13, + "train_loss": 4.794568827362061, + "train_acc": 0.00944, + "test_loss": 4.6620225440979, + "test_acc": 0.01, + "lyapunov": 1.5579908677684071, + "grad_norm": 0.3760550232574214, + "grad_max_sv": 0.27942878790199754, + "grad_min_sv": 7.445462603040203e-10, + "grad_condition": 105013083205.519, + "lr": 0.000981581283398829, + "time_sec": 132.5209527015686 + }, + { + "epoch": 14, + "train_loss": 4.809564754486084, + "train_acc": 0.00862, + "test_loss": 4.655567189025879, + "test_acc": 0.01, + "lyapunov": 1.571449481007998, + "grad_norm": 0.33124516886493516, + "grad_max_sv": 0.21216185558587314, + "grad_min_sv": 5.858595327667813e-10, + "grad_condition": 110751878933.28384, + "lr": 0.0009786597487660333, + "time_sec": 132.577819108963 + }, + { + "epoch": 15, + "train_loss": 4.816427656860352, + "train_acc": 0.00936, + "test_loss": 4.6545363082885745, + "test_acc": 0.01, + "lyapunov": 1.5565597386006504, + "grad_norm": 0.2791973343426611, + "grad_max_sv": 0.1684179350733757, + "grad_min_sv": 6.917982259102923e-13, + "grad_condition": 127223674978.58926, + "lr": 0.0009755282581475766, + "time_sec": 132.58430194854736 + }, + { + "epoch": 16, + "train_loss": 4.829237567138672, + "train_acc": 0.00908, + "test_loss": 4.629003553771972, + "test_acc": 0.01, + "lyapunov": 1.5557427775219579, + "grad_norm": 0.2712716184485074, + "grad_max_sv": 0.1436759451404214, + "grad_min_sv": 3.50392380214562e-13, + "grad_condition": 118193912798.78633, + "lr": 0.0009721881851187403, + "time_sec": 132.49679327011108 + }, + { + "epoch": 17, + "train_loss": 4.842587297058105, + "train_acc": 0.00944, + "test_loss": 4.633112139892578, + "test_acc": 0.01, + "lyapunov": 1.554307114742601, + "grad_norm": 0.26245775185719383, + "grad_max_sv": 0.140065660700202, + "grad_min_sv": 2.6676405041443376e-15, + "grad_condition": 139703664535.0272, + "lr": 0.0009686409947459456, + "time_sec": 132.52488541603088 + }, + { + "epoch": 18, + "train_loss": 4.85334480545044, + "train_acc": 0.0098, + "test_loss": 4.6145305236816405, + "test_acc": 0.01, + "lyapunov": 1.5502319726187859, + "grad_norm": 0.20648576741983057, + "grad_max_sv": 0.11613305620849132, + "grad_min_sv": 2.4641309551932607e-14, + "grad_condition": 112456376406.20891, + "lr": 0.0009648882429441254, + "time_sec": 132.53546261787415 + }, + { + "epoch": 19, + "train_loss": 4.8756606997680665, + "train_acc": 0.00972, + "test_loss": 4.63894914932251, + "test_acc": 0.01, + "lyapunov": 1.5529851959184613, + "grad_norm": 0.29909579690838006, + "grad_max_sv": 0.2365069929510355, + "grad_min_sv": 8.824648532682828e-14, + "grad_condition": 223546987940.7954, + "lr": 0.00096093157579425, + "time_sec": 132.5408227443695 + }, + { + "epoch": 20, + "train_loss": 4.8827299949646, + "train_acc": 0.01024, + "test_loss": 4.622587729644775, + "test_acc": 0.01, + "lyapunov": 1.556399286555512, + "grad_norm": 0.15272550856176187, + "grad_max_sv": 0.08741383519954979, + "grad_min_sv": 8.699695565641333e-15, + "grad_condition": 85913025020.82304, + "lr": 0.0009567727288213001, + "time_sec": 132.51366233825684 + }, + { + "epoch": 21, + "train_loss": 4.884711999969483, + "train_acc": 0.00998, + "test_loss": 4.606764881896972, + "test_acc": 0.01, + "lyapunov": 1.5493811259184347, + "grad_norm": 0.2280734728397927, + "grad_max_sv": 0.17737758290022612, + "grad_min_sv": 1.7983389117226294e-14, + "grad_condition": 174310016585.06476, + "lr": 0.0009524135262330095, + "time_sec": 132.5240728855133 + }, + { + "epoch": 22, + "train_loss": 4.88518779006958, + "train_acc": 0.00898, + "test_loss": 4.625405541229248, + "test_acc": 0.01, + "lyapunov": 1.5538233515551634, + "grad_norm": 0.21224774170023955, + "grad_max_sv": 0.15938115157186986, + "grad_min_sv": 3.1749157935371154e-14, + "grad_condition": 154547913667.9044, + "lr": 0.0009478558801197061, + "time_sec": 132.49090003967285 + }, + { + "epoch": 23, + "train_loss": 4.87999728149414, + "train_acc": 0.01018, + "test_loss": 4.662280471801758, + "test_acc": 0.01, + "lyapunov": 1.5508448772723107, + "grad_norm": 0.15119163863092763, + "grad_max_sv": 0.08865232784301043, + "grad_min_sv": 7.005994597272193e-16, + "grad_condition": 88575401119.44853, + "lr": 0.000943101789615607, + "time_sec": 132.47974038124084 + }, + { + "epoch": 24, + "train_loss": 4.881147270202637, + "train_acc": 0.00976, + "test_loss": 4.615948718261719, + "test_acc": 0.01, + "lyapunov": 1.5512399081988713, + "grad_norm": 0.15770676446584825, + "grad_max_sv": 0.10294295214116574, + "grad_min_sv": 5.7741339454657465e-15, + "grad_condition": 102285384766.49887, + "lr": 0.0009381533400219313, + "time_sec": 132.52317762374878 + }, + { + "epoch": 25, + "train_loss": 4.880569260253906, + "train_acc": 0.00984, + "test_loss": 4.610492027282715, + "test_acc": 0.01, + "lyapunov": 1.5512746035900262, + "grad_norm": 0.14554815906091484, + "grad_max_sv": 0.08865004125982523, + "grad_min_sv": 2.6778839672578997e-16, + "grad_condition": 88627301882.68987, + "lr": 0.0009330127018922189, + "time_sec": 132.56079196929932 + }, + { + "epoch": 26, + "train_loss": 4.881224513397217, + "train_acc": 0.01002, + "test_loss": 4.747660410308838, + "test_acc": 0.01, + "lyapunov": 1.5542162702516522, + "grad_norm": 0.1391562981495577, + "grad_max_sv": 0.08203545394353569, + "grad_min_sv": 2.822381678288234e-15, + "grad_condition": 81722256507.78954, + "lr": 0.000927682130080253, + "time_sec": 132.5239975452423 + }, + { + "epoch": 27, + "train_loss": 4.881258678741455, + "train_acc": 0.0098, + "test_loss": 4.790026293182373, + "test_acc": 0.01, + "lyapunov": 1.5510657614149401, + "grad_norm": 0.14725967817424349, + "grad_max_sv": 0.09194991793483495, + "grad_min_sv": 4.568772527401975e-15, + "grad_condition": 91398390464.57925, + "lr": 0.0009221639627510072, + "time_sec": 132.526837348938 + }, + { + "epoch": 28, + "train_loss": 4.880898860931397, + "train_acc": 0.0102, + "test_loss": 4.802646064758301, + "test_acc": 0.01, + "lyapunov": 1.5514030862037482, + "grad_norm": 0.14347689217252269, + "grad_max_sv": 0.09245897587388754, + "grad_min_sv": 1.0843861076282981e-15, + "grad_condition": 92342187840.9415, + "lr": 0.0009164606203550494, + "time_sec": 132.5042200088501 + }, + { + "epoch": 29, + "train_loss": 4.880448774719238, + "train_acc": 0.01046, + "test_loss": 4.7516579360961915, + "test_acc": 0.01, + "lyapunov": 1.5519556474807623, + "grad_norm": 0.13309334546952373, + "grad_max_sv": 0.08154573319479823, + "grad_min_sv": 9.282067880476938e-16, + "grad_condition": 81454842058.19734, + "lr": 0.0009105746045668516, + "time_sec": 132.52633500099182 + }, + { + "epoch": 30, + "train_loss": 4.883071630401611, + "train_acc": 0.00954, + "test_loss": 4.771951943206787, + "test_acc": 0.01, + "lyapunov": 1.554316602399587, + "grad_norm": 0.14789859288021653, + "grad_max_sv": 0.09579872786998749, + "grad_min_sv": 3.051331237308755e-15, + "grad_condition": 95468711969.6211, + "lr": 0.0009045084971874733, + "time_sec": 132.5885534286499 + }, + { + "epoch": 31, + "train_loss": 4.881176261901856, + "train_acc": 0.00888, + "test_loss": 4.774106753540039, + "test_acc": 0.01, + "lyapunov": 1.5536001310933887, + "grad_norm": 0.13112482323923252, + "grad_max_sv": 0.07564891651272773, + "grad_min_sv": 2.107048715412855e-15, + "grad_condition": 75454097088.2188, + "lr": 0.0008982649590120977, + "time_sec": 132.49479031562805 + }, + { + "epoch": 32, + "train_loss": 4.880477762145996, + "train_acc": 0.00962, + "test_loss": 4.746245973968506, + "test_acc": 0.01, + "lyapunov": 1.5537874387658162, + "grad_norm": 0.12461403839681509, + "grad_max_sv": 0.062327271420508625, + "grad_min_sv": 1.0725391843424482e-20, + "grad_condition": 62327270693.35764, + "lr": 0.0008918467286629196, + "time_sec": 132.4852647781372 + }, + { + "epoch": 33, + "train_loss": 4.881243226470947, + "train_acc": 0.00888, + "test_loss": 4.736703532409668, + "test_acc": 0.01, + "lyapunov": 1.556170121788064, + "grad_norm": 0.1148317700659679, + "grad_max_sv": 0.05345285767689347, + "grad_min_sv": 0.0, + "grad_condition": 53452857676.89348, + "lr": 0.0008852566213878943, + "time_sec": 132.53890919685364 + }, + { + "epoch": 34, + "train_loss": 4.881585180969238, + "train_acc": 0.01008, + "test_loss": 4.703427969360352, + "test_acc": 0.01, + "lyapunov": 1.5578572292766912, + "grad_norm": 0.11335239335552806, + "grad_max_sv": 0.052668086066842076, + "grad_min_sv": 0.0, + "grad_condition": 52668086066.84208, + "lr": 0.000878497527825878, + "time_sec": 132.64637637138367 + }, + { + "epoch": 35, + "train_loss": 4.882511229858398, + "train_acc": 0.0097, + "test_loss": 4.681371363830566, + "test_acc": 0.01, + "lyapunov": 1.5592110135671122, + "grad_norm": 0.12058968555924836, + "grad_max_sv": 0.06217097630724311, + "grad_min_sv": 0.0, + "grad_condition": 62170976307.2431, + "lr": 0.000871572412738697, + "time_sec": 132.43680119514465 + }, + { + "epoch": 36, + "train_loss": 4.881192719268799, + "train_acc": 0.00946, + "test_loss": 4.697506471252441, + "test_acc": 0.01, + "lyapunov": 1.5561128973655993, + "grad_norm": 0.11655881819882306, + "grad_max_sv": 0.058859458193182945, + "grad_min_sv": 8.230737425630695e-40, + "grad_condition": 58859458193.182945, + "lr": 0.0008644843137107055, + "time_sec": 132.4848039150238 + }, + { + "epoch": 37, + "train_loss": 4.8825209786987305, + "train_acc": 0.00972, + "test_loss": 4.694917836761475, + "test_acc": 0.01, + "lyapunov": 1.5584492564506238, + "grad_norm": 0.13341533833277566, + "grad_max_sv": 0.07657676143571734, + "grad_min_sv": 1.687390330982044e-16, + "grad_condition": 76560751213.82744, + "lr": 0.0008572363398164014, + "time_sec": 132.51812028884888 + }, + { + "epoch": 38, + "train_loss": 4.882141689910888, + "train_acc": 0.01016, + "test_loss": 4.688916626739502, + "test_acc": 0.01, + "lyapunov": 1.5593435761263914, + "grad_norm": 0.11853299040694154, + "grad_max_sv": 0.055678781820461154, + "grad_min_sv": 6.767910398009686e-40, + "grad_condition": 55678781820.46116, + "lr": 0.0008498316702566826, + "time_sec": 132.56456470489502 + }, + { + "epoch": 39, + "train_loss": 4.8832370683288575, + "train_acc": 0.01006, + "test_loss": 4.7038502136230465, + "test_acc": 0.01, + "lyapunov": 1.5620976924286474, + "grad_norm": 0.11941743088728123, + "grad_max_sv": 0.05502237342298031, + "grad_min_sv": 8.246841147582715e-40, + "grad_condition": 55022373422.9803, + "lr": 0.0008422735529643442, + "time_sec": 132.5043168067932 + }, + { + "epoch": 40, + "train_loss": 4.884805080718994, + "train_acc": 0.00916, + "test_loss": 4.710450775146485, + "test_acc": 0.01, + "lyapunov": 1.5655303751416219, + "grad_norm": 0.12619034606889276, + "grad_max_sv": 0.06059649083763361, + "grad_min_sv": 2.3062997125157342e-34, + "grad_condition": 60596490837.63362, + "lr": 0.0008345653031794289, + "time_sec": 132.5351688861847 + }, + { + "epoch": 41, + "train_loss": 4.886436430511474, + "train_acc": 0.00842, + "test_loss": 4.693475389099121, + "test_acc": 0.01, + "lyapunov": 1.566963563794675, + "grad_norm": 0.13196364661308996, + "grad_max_sv": 0.06961128637194633, + "grad_min_sv": 1.1737794876080507e-22, + "grad_condition": 69611286362.64899, + "lr": 0.0008267103019950526, + "time_sec": 132.51111769676208 + }, + { + "epoch": 42, + "train_loss": 4.882716519012451, + "train_acc": 0.00938, + "test_loss": 4.694032908630371, + "test_acc": 0.01, + "lyapunov": 1.5620074573990024, + "grad_norm": 0.11781162776823918, + "grad_max_sv": 0.046270584035664794, + "grad_min_sv": 0.0, + "grad_condition": 46270584035.664795, + "lr": 0.0008187119948743447, + "time_sec": 132.5160994529724 + }, + { + "epoch": 43, + "train_loss": 4.8821180502319335, + "train_acc": 0.00952, + "test_loss": 4.7027722869873045, + "test_acc": 0.01, + "lyapunov": 1.561017348638276, + "grad_norm": 0.11312831534529132, + "grad_max_sv": 0.04106818297877908, + "grad_min_sv": 0.0, + "grad_condition": 41068182978.77908, + "lr": 0.000810573890139155, + "time_sec": 132.5087025165558 + }, + { + "epoch": 44, + "train_loss": 4.883875316619873, + "train_acc": 0.00868, + "test_loss": 4.726299923706055, + "test_acc": 0.01, + "lyapunov": 1.5633756574767326, + "grad_norm": 0.12667296790156193, + "grad_max_sv": 0.0658588983118534, + "grad_min_sv": 1.0092078216956858e-18, + "grad_condition": 65858810617.60825, + "lr": 0.0008022995574311873, + "time_sec": 132.5128674507141 + }, + { + "epoch": 45, + "train_loss": 4.883541934661865, + "train_acc": 0.00932, + "test_loss": 4.7017227630615235, + "test_acc": 0.01, + "lyapunov": 1.5632145856042652, + "grad_norm": 0.12309109072630019, + "grad_max_sv": 0.05839173295535147, + "grad_min_sv": 3.503246160812043e-47, + "grad_condition": 58391732955.35146, + "lr": 0.0007938926261462363, + "time_sec": 132.53016304969788 + }, + { + "epoch": 46, + "train_loss": 4.888793373718261, + "train_acc": 0.00888, + "test_loss": 4.696292651367187, + "test_acc": 0.01, + "lyapunov": 1.5750811136592076, + "grad_norm": 0.13746736535152312, + "grad_max_sv": 0.058484140876680614, + "grad_min_sv": 0.0, + "grad_condition": 58484140876.68062, + "lr": 0.0007853567838422158, + "time_sec": 132.50724458694458 + }, + { + "epoch": 47, + "train_loss": 4.883440639190674, + "train_acc": 0.00972, + "test_loss": 4.701148196411133, + "test_acc": 0.01, + "lyapunov": 1.564275365351411, + "grad_norm": 0.12158899868830998, + "grad_max_sv": 0.05122774885967374, + "grad_min_sv": 0.0, + "grad_condition": 51227748859.673744, + "lr": 0.0007766957746216719, + "time_sec": 132.50299715995789 + }, + { + "epoch": 48, + "train_loss": 4.884719120330811, + "train_acc": 0.00906, + "test_loss": 4.729176859283447, + "test_acc": 0.01, + "lyapunov": 1.5687132698800557, + "grad_norm": 0.12254448404539135, + "grad_max_sv": 0.040120215015485884, + "grad_min_sv": 0.0, + "grad_condition": 40120215015.485886, + "lr": 0.0007679133974894982, + "time_sec": 132.46641159057617 + }, + { + "epoch": 49, + "train_loss": 4.884110562133789, + "train_acc": 0.00872, + "test_loss": 4.725056867980957, + "test_acc": 0.01, + "lyapunov": 1.5669305754439604, + "grad_norm": 0.1149187900499572, + "grad_max_sv": 0.03382976925931871, + "grad_min_sv": 0.0, + "grad_condition": 33829769259.318707, + "lr": 0.000759013504686565, + "time_sec": 132.51045417785645 + }, + { + "epoch": 50, + "train_loss": 4.883614390563965, + "train_acc": 0.00966, + "test_loss": 4.709762881469727, + "test_acc": 0.01, + "lyapunov": 1.566156323608535, + "grad_norm": 0.12258255087018385, + "grad_max_sv": 0.034629582427442074, + "grad_min_sv": 0.0, + "grad_condition": 34629582427.44206, + "lr": 0.0007499999999999998, + "time_sec": 132.5417709350586 + }, + { + "epoch": 51, + "train_loss": 4.8839620613098145, + "train_acc": 0.0093, + "test_loss": 4.6980411888122555, + "test_acc": 0.01, + "lyapunov": 1.5664365087323786, + "grad_norm": 0.13769170593996222, + "grad_max_sv": 0.04753138842061162, + "grad_min_sv": 0.0, + "grad_condition": 47531388420.61162, + "lr": 0.0007408768370508575, + "time_sec": 132.5473415851593 + }, + { + "epoch": 52, + "train_loss": 4.883951457366943, + "train_acc": 0.0097, + "test_loss": 4.7330233673095705, + "test_acc": 0.01, + "lyapunov": 1.5676923822563933, + "grad_norm": 0.12914534017358148, + "grad_max_sv": 0.03236106717959046, + "grad_min_sv": 0.0, + "grad_condition": 32361067179.590466, + "lr": 0.0007316480175599307, + "time_sec": 132.50377297401428 + }, + { + "epoch": 53, + "train_loss": 4.883413257293701, + "train_acc": 0.00908, + "test_loss": 4.7225365089416504, + "test_acc": 0.01, + "lyapunov": 1.5648496943666501, + "grad_norm": 0.1255861922278266, + "grad_max_sv": 0.04178534299135208, + "grad_min_sv": 0.0, + "grad_condition": 41785342991.35208, + "lr": 0.0007223175895924635, + "time_sec": 132.52618622779846 + }, + { + "epoch": 54, + "train_loss": 4.8835242868041995, + "train_acc": 0.00984, + "test_loss": 4.827378164672852, + "test_acc": 0.01, + "lyapunov": 1.5652363522888144, + "grad_norm": 0.11717740789911417, + "grad_max_sv": 0.04349024128168821, + "grad_min_sv": 0.0, + "grad_condition": 43490241281.68822, + "lr": 0.0007128896457825361, + "time_sec": 132.49181389808655 + }, + { + "epoch": 55, + "train_loss": 4.885148456573487, + "train_acc": 0.00938, + "test_loss": 4.805696286010742, + "test_acc": 0.01, + "lyapunov": 1.5694574946942537, + "grad_norm": 0.11719591784462954, + "grad_max_sv": 0.027647955063730478, + "grad_min_sv": 0.0, + "grad_condition": 27647955063.73048, + "lr": 0.0007033683215378998, + "time_sec": 132.4630925655365 + }, + { + "epoch": 56, + "train_loss": 4.8840925729370115, + "train_acc": 0.00916, + "test_loss": 4.817810218048096, + "test_acc": 0.01, + "lyapunov": 1.5679599275369474, + "grad_norm": 0.10763202558448146, + "grad_max_sv": 0.024515782250091434, + "grad_min_sv": 0.0, + "grad_condition": 24515782250.09143, + "lr": 0.0006937577932260512, + "time_sec": 132.42955470085144 + }, + { + "epoch": 57, + "train_loss": 4.883760057678223, + "train_acc": 0.0095, + "test_loss": 4.856276947784424, + "test_acc": 0.01, + "lyapunov": 1.5672943607315688, + "grad_norm": 0.11038524447317109, + "grad_max_sv": 0.031160860368981958, + "grad_min_sv": 0.0, + "grad_condition": 31160860368.981956, + "lr": 0.0006840622763423388, + "time_sec": 132.52315950393677 + }, + { + "epoch": 58, + "train_loss": 4.884222667388916, + "train_acc": 0.00974, + "test_loss": 4.874290851593018, + "test_acc": 0.01, + "lyapunov": 1.567508033779271, + "grad_norm": 0.11849561013061653, + "grad_max_sv": 0.03593655498698354, + "grad_min_sv": 0.0, + "grad_condition": 35936554986.983536, + "lr": 0.0006742860236609073, + "time_sec": 132.47893905639648 + }, + { + "epoch": 59, + "train_loss": 4.88414927734375, + "train_acc": 0.00932, + "test_loss": 4.812584387207031, + "test_acc": 0.01, + "lyapunov": 1.5678569962606406, + "grad_norm": 0.11036912590820531, + "grad_max_sv": 0.028424020344391464, + "grad_min_sv": 0.0, + "grad_condition": 28424020344.391468, + "lr": 0.0006644333233692913, + "time_sec": 132.4449987411499 + }, + { + "epoch": 60, + "train_loss": 4.8860119464111325, + "train_acc": 0.00866, + "test_loss": 4.839297940826416, + "test_acc": 0.01, + "lyapunov": 1.5727104262622726, + "grad_norm": 0.12489417029089354, + "grad_max_sv": 0.0449837657622993, + "grad_min_sv": 0.0, + "grad_condition": 44983765762.2993, + "lr": 0.0006545084971874734, + "time_sec": 132.52293181419373 + }, + { + "epoch": 61, + "train_loss": 4.884305205383301, + "train_acc": 0.01046, + "test_loss": 4.857601212310791, + "test_acc": 0.01, + "lyapunov": 1.5686972680908944, + "grad_norm": 0.11135287490998455, + "grad_max_sv": 0.04157614354044199, + "grad_min_sv": 0.0, + "grad_condition": 41576143540.44199, + "lr": 0.0006445158984722354, + "time_sec": 132.51698970794678 + }, + { + "epoch": 62, + "train_loss": 4.884398639678955, + "train_acc": 0.00944, + "test_loss": 4.833207711791992, + "test_acc": 0.01, + "lyapunov": 1.5687918172163122, + "grad_norm": 0.11243013251101783, + "grad_max_sv": 0.043204908631742, + "grad_min_sv": 0.0, + "grad_condition": 43204908631.742004, + "lr": 0.0006344599103076324, + "time_sec": 132.51721620559692 + }, + { + "epoch": 63, + "train_loss": 4.884688519744873, + "train_acc": 0.00908, + "test_loss": 4.811236346435547, + "test_acc": 0.01, + "lyapunov": 1.570080169326509, + "grad_norm": 0.11662661682539925, + "grad_max_sv": 0.02772782016545534, + "grad_min_sv": 0.0, + "grad_condition": 27727820165.455345, + "lr": 0.0006243449435824269, + "time_sec": 132.50267052650452 + }, + { + "epoch": 64, + "train_loss": 4.8855357188415525, + "train_acc": 0.0096, + "test_loss": 4.834980075073243, + "test_acc": 0.01, + "lyapunov": 1.5721226451951829, + "grad_norm": 0.12180207356240787, + "grad_max_sv": 0.013557582441717387, + "grad_min_sv": 0.0, + "grad_condition": 13557582441.717386, + "lr": 0.0006141754350553275, + "time_sec": 132.6969666481018 + }, + { + "epoch": 65, + "train_loss": 4.884502696838379, + "train_acc": 0.00962, + "test_loss": 4.815651828765869, + "test_acc": 0.01, + "lyapunov": 1.5692061444987422, + "grad_norm": 0.13731619014897972, + "grad_max_sv": 0.036923335213214156, + "grad_min_sv": 0.0, + "grad_condition": 36923335213.21416, + "lr": 0.0006039558454088793, + "time_sec": 132.4734799861908 + }, + { + "epoch": 66, + "train_loss": 4.88990579711914, + "train_acc": 0.00978, + "test_loss": 4.791162698364258, + "test_acc": 0.01, + "lyapunov": 1.581291075862582, + "grad_norm": 0.14075282121769883, + "grad_max_sv": 0.039619889203459026, + "grad_min_sv": 0.0, + "grad_condition": 39619889203.45903, + "lr": 0.000593690657292862, + "time_sec": 132.52782583236694 + }, + { + "epoch": 67, + "train_loss": 4.888191639251709, + "train_acc": 0.00998, + "test_loss": 4.805363137054443, + "test_acc": 0.01, + "lyapunov": 1.5781969777153582, + "grad_norm": 0.11852732787787948, + "grad_max_sv": 0.03636179021559656, + "grad_min_sv": 0.0, + "grad_condition": 36361790215.59656, + "lr": 0.0005833843733580507, + "time_sec": 132.50655126571655 + }, + { + "epoch": 68, + "train_loss": 4.885113808746338, + "train_acc": 0.0092, + "test_loss": 4.790876692962646, + "test_acc": 0.01, + "lyapunov": 1.5712030659551206, + "grad_norm": 0.11464904106569235, + "grad_max_sv": 0.02942234524525702, + "grad_min_sv": 0.0, + "grad_condition": 29422345245.25702, + "lr": 0.0005730415142812054, + "time_sec": 132.44155955314636 + }, + { + "epoch": 69, + "train_loss": 4.886073732910156, + "train_acc": 0.00874, + "test_loss": 4.788568280029297, + "test_acc": 0.01, + "lyapunov": 1.5744608549205847, + "grad_norm": 0.11158557694696751, + "grad_max_sv": 0.004607879696413875, + "grad_min_sv": 0.0, + "grad_condition": 4607879696.413875, + "lr": 0.0005626666167821517, + "time_sec": 132.44937348365784 + }, + { + "epoch": 70, + "train_loss": 4.885406183319092, + "train_acc": 0.00988, + "test_loss": 4.791419393157959, + "test_acc": 0.01, + "lyapunov": 1.5723789460823665, + "grad_norm": 0.1093341588876136, + "grad_max_sv": 0.013379927957430482, + "grad_min_sv": 0.0, + "grad_condition": 13379927957.430483, + "lr": 0.0005522642316338265, + "time_sec": 132.44818544387817 + }, + { + "epoch": 71, + "train_loss": 4.885112988128662, + "train_acc": 0.00898, + "test_loss": 4.807086729431153, + "test_acc": 0.01, + "lyapunov": 1.5718346922598836, + "grad_norm": 0.12168415122862028, + "grad_max_sv": 0.014193862210959196, + "grad_min_sv": 0.0, + "grad_condition": 14193862210.959198, + "lr": 0.0005418389216661573, + "time_sec": 132.46469593048096 + }, + { + "epoch": 72, + "train_loss": 4.888309308624268, + "train_acc": 0.00942, + "test_loss": 4.786458195495605, + "test_acc": 0.01, + "lyapunov": 1.5786126913012142, + "grad_norm": 0.1257472430943546, + "grad_max_sv": 0.00992818851955235, + "grad_min_sv": 0.0, + "grad_condition": 9928188519.55235, + "lr": 0.0005313952597646563, + "time_sec": 132.4868745803833 + }, + { + "epoch": 73, + "train_loss": 4.8883187344360355, + "train_acc": 0.01008, + "test_loss": 4.763764072418213, + "test_acc": 0.01, + "lyapunov": 1.5783945306792588, + "grad_norm": 0.16063770590325258, + "grad_max_sv": 0.02905639265663922, + "grad_min_sv": 0.0, + "grad_condition": 29056392656.63922, + "lr": 0.0005209378268645994, + "time_sec": 132.40988731384277 + }, + { + "epoch": 74, + "train_loss": 4.885095281524658, + "train_acc": 0.00904, + "test_loss": 4.771036297607422, + "test_acc": 0.01, + "lyapunov": 1.5722466762108571, + "grad_norm": 0.332703681561214, + "grad_max_sv": 0.009321404900401831, + "grad_min_sv": 0.0, + "grad_condition": 9321404900.40183, + "lr": 0.0005104712099416781, + "time_sec": 132.41944670677185 + }, + { + "epoch": 75, + "train_loss": 4.8858135334777835, + "train_acc": 0.00924, + "test_loss": 4.7793162803649905, + "test_acc": 0.01, + "lyapunov": 1.573599765367825, + "grad_norm": 0.3785245081976868, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004999999999999996, + "time_sec": 132.43439865112305 + }, + { + "epoch": 76, + "train_loss": 4.885755948486328, + "train_acc": 0.00894, + "test_loss": 4.775339208984375, + "test_acc": 0.01, + "lyapunov": 1.5738494380965562, + "grad_norm": 0.26809830726413736, + "grad_max_sv": 0.00972625520080328, + "grad_min_sv": 0.0, + "grad_condition": 9726255200.80328, + "lr": 0.0004895287900583212, + "time_sec": 132.4453580379486 + }, + { + "epoch": 77, + "train_loss": 4.886971358032227, + "train_acc": 0.0088, + "test_loss": 4.780246302032471, + "test_acc": 0.01, + "lyapunov": 1.576519505447134, + "grad_norm": 0.5857000867492739, + "grad_max_sv": 0.015286983083933591, + "grad_min_sv": 0.0, + "grad_condition": 15286983083.933594, + "lr": 0.0004790621731353997, + "time_sec": 132.4340922832489 + }, + { + "epoch": 78, + "train_loss": 4.8857606088256835, + "train_acc": 0.00878, + "test_loss": 4.796332804870605, + "test_acc": 0.01, + "lyapunov": 1.574093949764281, + "grad_norm": 0.19474925059694603, + "grad_max_sv": 0.007740102289244532, + "grad_min_sv": 0.0, + "grad_condition": 7740102289.244532, + "lr": 0.000468604740235343, + "time_sec": 132.4252007007599 + }, + { + "epoch": 79, + "train_loss": 4.8854332868957515, + "train_acc": 0.00904, + "test_loss": 4.7431994110107425, + "test_acc": 0.01, + "lyapunov": 1.5728687746140657, + "grad_norm": 0.2002833929164076, + "grad_max_sv": 0.018612090731039643, + "grad_min_sv": 0.0, + "grad_condition": 18612090731.039646, + "lr": 0.00045816107833384175, + "time_sec": 132.41635990142822 + }, + { + "epoch": 80, + "train_loss": 4.88607871963501, + "train_acc": 0.00908, + "test_loss": 4.782230687713623, + "test_acc": 0.01, + "lyapunov": 1.5748912559445862, + "grad_norm": 0.2663292726664251, + "grad_max_sv": 0.0006320734973996878, + "grad_min_sv": 0.0, + "grad_condition": 632073497.3996878, + "lr": 0.0004477357683661729, + "time_sec": 132.3943703174591 + }, + { + "epoch": 81, + "train_loss": 4.885633817596435, + "train_acc": 0.00894, + "test_loss": 4.773731129455566, + "test_acc": 0.01, + "lyapunov": 1.5739493342616675, + "grad_norm": 0.19467627817910108, + "grad_max_sv": 0.004234243137761951, + "grad_min_sv": 0.0, + "grad_condition": 4234243137.7619505, + "lr": 0.00043733338321784746, + "time_sec": 132.42148518562317 + }, + { + "epoch": 82, + "train_loss": 4.890183934631348, + "train_acc": 0.00922, + "test_loss": 4.80019803237915, + "test_acc": 0.01, + "lyapunov": 1.58174940356818, + "grad_norm": 0.2693904362677404, + "grad_max_sv": 0.023508542357012628, + "grad_min_sv": 0.0, + "grad_condition": 23508542357.01263, + "lr": 0.0004269584857187939, + "time_sec": 132.48368287086487 + }, + { + "epoch": 83, + "train_loss": 4.887686183624267, + "train_acc": 0.00988, + "test_loss": 4.6776658203125, + "test_acc": 0.01, + "lyapunov": 1.574008427922378, + "grad_norm": 0.2293228968062561, + "grad_max_sv": 0.06707085431553424, + "grad_min_sv": 5.322572622808566e-16, + "grad_condition": 67002509647.244484, + "lr": 0.0004166156266419484, + "time_sec": 132.49965047836304 + }, + { + "epoch": 84, + "train_loss": 4.887849067077637, + "train_acc": 0.01004, + "test_loss": 4.733781813049316, + "test_acc": 0.01, + "lyapunov": 1.573820165356102, + "grad_norm": 0.14901481902367925, + "grad_max_sv": 0.09299901695922017, + "grad_min_sv": 1.6405075679230025e-16, + "grad_condition": 92982403383.72546, + "lr": 0.0004063093427071373, + "time_sec": 132.49851322174072 + }, + { + "epoch": 85, + "train_loss": 4.891140226135254, + "train_acc": 0.00994, + "test_loss": 4.79980509262085, + "test_acc": 0.01, + "lyapunov": 1.5841534381632305, + "grad_norm": 0.14782164130887582, + "grad_max_sv": 0.07909845747053623, + "grad_min_sv": 4.4865151314265836e-26, + "grad_condition": 79098457470.53198, + "lr": 0.0003960441545911199, + "time_sec": 132.5316731929779 + }, + { + "epoch": 86, + "train_loss": 4.887021747589111, + "train_acc": 0.00944, + "test_loss": 4.776346062469482, + "test_acc": 0.01, + "lyapunov": 1.5762594874252749, + "grad_norm": 0.12848068900948553, + "grad_max_sv": 0.05206927340477705, + "grad_min_sv": 0.0, + "grad_condition": 52069273404.777054, + "lr": 0.0003858245649446718, + "time_sec": 132.53142595291138 + }, + { + "epoch": 87, + "train_loss": 4.889097787322998, + "train_acc": 0.00868, + "test_loss": 4.707060712432861, + "test_acc": 0.01, + "lyapunov": 1.5793669498180185, + "grad_norm": 0.1548551396628501, + "grad_max_sv": 0.07543672090396285, + "grad_min_sv": 1.994722925254039e-23, + "grad_condition": 75436720902.41975, + "lr": 0.00037565505641757235, + "time_sec": 132.56474471092224 + }, + { + "epoch": 88, + "train_loss": 4.887517103881836, + "train_acc": 0.00934, + "test_loss": 4.697494779968261, + "test_acc": 0.01, + "lyapunov": 1.5769202114675966, + "grad_norm": 0.12499428379004662, + "grad_max_sv": 0.06417224258184433, + "grad_min_sv": 3.819406582541987e-27, + "grad_condition": 64172242581.844055, + "lr": 0.00036554008969236695, + "time_sec": 132.5758376121521 + }, + { + "epoch": 89, + "train_loss": 4.889558787384034, + "train_acc": 0.00908, + "test_loss": 4.738901914978027, + "test_acc": 0.01, + "lyapunov": 1.5814725813048576, + "grad_norm": 0.1259682508249713, + "grad_max_sv": 0.05729179736226797, + "grad_min_sv": 0.0, + "grad_condition": 57291797362.26797, + "lr": 0.0003554841015277638, + "time_sec": 132.55631971359253 + }, + { + "epoch": 90, + "train_loss": 4.887118022155762, + "train_acc": 0.00926, + "test_loss": 4.745434680175781, + "test_acc": 0.01, + "lyapunov": 1.57591240881654, + "grad_norm": 0.12675049544335418, + "grad_max_sv": 0.0551216053776443, + "grad_min_sv": 0.0, + "grad_condition": 55121605377.64431, + "lr": 0.000345491502812526, + "time_sec": 132.52520608901978 + }, + { + "epoch": 91, + "train_loss": 4.886403057098389, + "train_acc": 0.01032, + "test_loss": 4.728809788513184, + "test_acc": 0.01, + "lyapunov": 1.575149437045807, + "grad_norm": 0.12166328349782148, + "grad_max_sv": 0.04358728057704866, + "grad_min_sv": 0.0, + "grad_condition": 43587280577.04866, + "lr": 0.0003355666766307081, + "time_sec": 132.5356101989746 + }, + { + "epoch": 92, + "train_loss": 4.886422184295654, + "train_acc": 0.00926, + "test_loss": 4.738454541015625, + "test_acc": 0.01, + "lyapunov": 1.5745899811425172, + "grad_norm": 0.11920532388570855, + "grad_max_sv": 0.05519997598603368, + "grad_min_sv": 0.0, + "grad_condition": 55199975986.033676, + "lr": 0.00032571397633909225, + "time_sec": 132.55407977104187 + }, + { + "epoch": 93, + "train_loss": 4.886163410339355, + "train_acc": 0.00948, + "test_loss": 4.729941507720947, + "test_acc": 0.01, + "lyapunov": 1.5739426192115336, + "grad_norm": 0.13075040975965602, + "grad_max_sv": 0.051908688899129626, + "grad_min_sv": 0.0, + "grad_condition": 51908688899.12963, + "lr": 0.00031593772365766094, + "time_sec": 132.55454182624817 + }, + { + "epoch": 94, + "train_loss": 4.889471523284912, + "train_acc": 0.00938, + "test_loss": 4.726048579406738, + "test_acc": 0.01, + "lyapunov": 1.5820539750711387, + "grad_norm": 0.13111792932705457, + "grad_max_sv": 0.04076082408428192, + "grad_min_sv": 0.0, + "grad_condition": 40760824084.28192, + "lr": 0.0003062422067739483, + "time_sec": 132.50855350494385 + }, + { + "epoch": 95, + "train_loss": 4.886597353057861, + "train_acc": 0.00966, + "test_loss": 4.721816172790527, + "test_acc": 0.01, + "lyapunov": 1.5761216878890991, + "grad_norm": 0.10242530878744271, + "grad_max_sv": 0.018115377286449075, + "grad_min_sv": 0.0, + "grad_condition": 18115377286.449074, + "lr": 0.00029663167846209965, + "time_sec": 132.52085852622986 + }, + { + "epoch": 96, + "train_loss": 4.8871041314697266, + "train_acc": 0.00878, + "test_loss": 4.708365040588379, + "test_acc": 0.01, + "lyapunov": 1.5773879777440025, + "grad_norm": 0.11832202769749675, + "grad_max_sv": 0.01925608702003956, + "grad_min_sv": 0.0, + "grad_condition": 19256087020.03956, + "lr": 0.00028711035421746345, + "time_sec": 132.48231029510498 + }, + { + "epoch": 97, + "train_loss": 4.885575797424316, + "train_acc": 0.00956, + "test_loss": 4.758969999694824, + "test_acc": 0.01, + "lyapunov": 1.5739980253112285, + "grad_norm": 0.102958848729015, + "grad_max_sv": 0.00836998880840838, + "grad_min_sv": 0.0, + "grad_condition": 8369988808.4083805, + "lr": 0.00027768241040753615, + "time_sec": 132.4623761177063 + }, + { + "epoch": 98, + "train_loss": 4.885688443298339, + "train_acc": 0.00946, + "test_loss": 4.7685779739379885, + "test_acc": 0.01, + "lyapunov": 1.5737464616975516, + "grad_norm": 0.11414360687104802, + "grad_max_sv": 0.033959317160770296, + "grad_min_sv": 0.0, + "grad_condition": 33959317160.770294, + "lr": 0.00026835198244006903, + "time_sec": 132.65263080596924 + }, + { + "epoch": 99, + "train_loss": 4.888634443054199, + "train_acc": 0.00974, + "test_loss": 4.754720726013184, + "test_acc": 0.01, + "lyapunov": 1.5796314081572511, + "grad_norm": 0.11056614929218114, + "grad_max_sv": 0.034730975748971105, + "grad_min_sv": 0.0, + "grad_condition": 34730975748.9711, + "lr": 0.0002591231629491421, + "time_sec": 132.53659439086914 + }, + { + "epoch": 100, + "train_loss": 4.888005011444092, + "train_acc": 0.00978, + "test_loss": 4.7091091361999515, + "test_acc": 0.01, + "lyapunov": 1.5793088131853381, + "grad_norm": 0.11538715899109499, + "grad_max_sv": 0.027404929930344223, + "grad_min_sv": 0.0, + "grad_condition": 27404929930.344227, + "lr": 0.0002499999999999997, + "time_sec": 132.47063946723938 + }, + { + "epoch": 101, + "train_loss": 4.890101184844971, + "train_acc": 0.00978, + "test_loss": 4.713412440490723, + "test_acc": 0.01, + "lyapunov": 1.583473697037953, + "grad_norm": 0.14124961194918514, + "grad_max_sv": 0.030058392463251947, + "grad_min_sv": 0.0, + "grad_condition": 30058392463.251945, + "lr": 0.00024098649531343477, + "time_sec": 132.50555539131165 + }, + { + "epoch": 102, + "train_loss": 4.887625363464355, + "train_acc": 0.01148, + "test_loss": 4.7020545562744145, + "test_acc": 0.01, + "lyapunov": 1.579564877178358, + "grad_norm": 0.1297826697220666, + "grad_max_sv": 0.019950845977291465, + "grad_min_sv": 0.0, + "grad_condition": 19950845977.291466, + "lr": 0.0002320866025105016, + "time_sec": 132.43331456184387 + }, + { + "epoch": 103, + "train_loss": 4.889458109130859, + "train_acc": 0.00924, + "test_loss": 4.700020100402832, + "test_acc": 0.01, + "lyapunov": 1.5832947227351195, + "grad_norm": 0.16304165123375366, + "grad_max_sv": 0.00834191357716918, + "grad_min_sv": 0.0, + "grad_condition": 8341913577.16918, + "lr": 0.0002233042253783278, + "time_sec": 132.42489337921143 + }, + { + "epoch": 104, + "train_loss": 4.888043740234375, + "train_acc": 0.00976, + "test_loss": 4.690122833251953, + "test_acc": 0.01, + "lyapunov": 1.580241550874832, + "grad_norm": 0.16164115490422049, + "grad_max_sv": 0.00892186602577567, + "grad_min_sv": 0.0, + "grad_condition": 8921866025.775671, + "lr": 0.000214643216157784, + "time_sec": 132.40913486480713 + }, + { + "epoch": 105, + "train_loss": 4.885801515350342, + "train_acc": 0.00962, + "test_loss": 4.70759442062378, + "test_acc": 0.01, + "lyapunov": 1.5747494935379613, + "grad_norm": 0.10757507074973427, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376332, + "time_sec": 132.41837000846863 + }, + { + "epoch": 106, + "train_loss": 4.886232281951904, + "train_acc": 0.00966, + "test_loss": 4.676759211730957, + "test_acc": 0.01, + "lyapunov": 1.5755804490555279, + "grad_norm": 0.11054714782321104, + "grad_max_sv": 0.016818781569600105, + "grad_min_sv": 0.0, + "grad_condition": 16818781569.600103, + "lr": 0.00019770044256881242, + "time_sec": 132.38776516914368 + }, + { + "epoch": 107, + "train_loss": 4.889010899200439, + "train_acc": 0.00964, + "test_loss": 4.686521159362793, + "test_acc": 0.01, + "lyapunov": 1.5793325800420073, + "grad_norm": 0.5205851606002122, + "grad_max_sv": 0.027481868257746102, + "grad_min_sv": 0.0, + "grad_condition": 27481868257.7461, + "lr": 0.0001894261098608447, + "time_sec": 132.4469666481018 + }, + { + "epoch": 108, + "train_loss": 4.885496775512696, + "train_acc": 0.00916, + "test_loss": 4.701310534667969, + "test_acc": 0.01, + "lyapunov": 1.5739044819951362, + "grad_norm": 0.9976131592675321, + "grad_max_sv": 0.010380421532317996, + "grad_min_sv": 0.0, + "grad_condition": 10380421532.317997, + "lr": 0.000181288005125655, + "time_sec": 132.34952044487 + }, + { + "epoch": 109, + "train_loss": 4.88569960144043, + "train_acc": 0.00982, + "test_loss": 4.704411970520019, + "test_acc": 0.01, + "lyapunov": 1.574234271598289, + "grad_norm": 0.9761047066143378, + "grad_max_sv": 0.026565171172842385, + "grad_min_sv": 0.0, + "grad_condition": 26565171172.842384, + "lr": 0.0001732896980049473, + "time_sec": 132.45858502388 + }, + { + "epoch": 110, + "train_loss": 4.885857049255371, + "train_acc": 0.00906, + "test_loss": 4.700390522766114, + "test_acc": 0.01, + "lyapunov": 1.5747647572051533, + "grad_norm": 1.1449227675806375, + "grad_max_sv": 0.025618467247113585, + "grad_min_sv": 0.0, + "grad_condition": 25618467247.113586, + "lr": 0.00016543469682057076, + "time_sec": 132.4441635608673 + }, + { + "epoch": 111, + "train_loss": 4.886974509887695, + "train_acc": 0.00982, + "test_loss": 4.78629910736084, + "test_acc": 0.01, + "lyapunov": 1.5769317887933052, + "grad_norm": 0.9679265494141023, + "grad_max_sv": 0.03804315887391567, + "grad_min_sv": 0.0, + "grad_condition": 38043158873.91567, + "lr": 0.00015772644703565552, + "time_sec": 132.5875232219696 + }, + { + "epoch": 112, + "train_loss": 4.886453926544189, + "train_acc": 0.00974, + "test_loss": 4.8048784591674805, + "test_acc": 0.01, + "lyapunov": 1.5754460748809074, + "grad_norm": 0.8807920950548352, + "grad_max_sv": 0.03984132050536573, + "grad_min_sv": 0.0, + "grad_condition": 39841320505.36573, + "lr": 0.00015016832974331713, + "time_sec": 132.5120551586151 + }, + { + "epoch": 113, + "train_loss": 4.885906947784424, + "train_acc": 0.00966, + "test_loss": 4.798358418273926, + "test_acc": 0.01, + "lyapunov": 1.5747274245752398, + "grad_norm": 0.8637882261226464, + "grad_max_sv": 0.033320454647764564, + "grad_min_sv": 0.0, + "grad_condition": 33320454647.764565, + "lr": 0.00014276366018359834, + "time_sec": 132.50000762939453 + }, + { + "epoch": 114, + "train_loss": 4.885719304962159, + "train_acc": 0.00982, + "test_loss": 4.793103702545166, + "test_acc": 0.01, + "lyapunov": 1.5744778527628125, + "grad_norm": 0.782099951820462, + "grad_max_sv": 0.03417456489987671, + "grad_min_sv": 0.0, + "grad_condition": 34174564899.87671, + "lr": 0.00013551568628929425, + "time_sec": 132.49124789237976 + }, + { + "epoch": 115, + "train_loss": 4.8859512828063965, + "train_acc": 0.00934, + "test_loss": 4.802629745483398, + "test_acc": 0.01, + "lyapunov": 1.575113305960165, + "grad_norm": 0.7049115792540724, + "grad_max_sv": 0.018358896067366005, + "grad_min_sv": 0.0, + "grad_condition": 18358896067.366005, + "lr": 0.00012842758726130276, + "time_sec": 132.44965839385986 + }, + { + "epoch": 116, + "train_loss": 4.886716898498535, + "train_acc": 0.01, + "test_loss": 4.802504382324218, + "test_acc": 0.01, + "lyapunov": 1.5769645506158814, + "grad_norm": 0.7070432983143201, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 132.43424487113953 + }, + { + "epoch": 117, + "train_loss": 4.8879242680358885, + "train_acc": 0.00916, + "test_loss": 4.805041016387939, + "test_acc": 0.01, + "lyapunov": 1.5800700291343357, + "grad_norm": 0.7061830114700672, + "grad_max_sv": 0.02115973932668567, + "grad_min_sv": 0.0, + "grad_condition": 21159739326.68567, + "lr": 0.00011474337861210538, + "time_sec": 132.52493023872375 + }, + { + "epoch": 118, + "train_loss": 4.885882244415283, + "train_acc": 0.01036, + "test_loss": 4.74331266784668, + "test_acc": 0.01, + "lyapunov": 1.5747067300255035, + "grad_norm": 0.7245826894780792, + "grad_max_sv": 0.03378571714274585, + "grad_min_sv": 0.0, + "grad_condition": 33785717142.745857, + "lr": 0.00010815327133708009, + "time_sec": 132.48710799217224 + }, + { + "epoch": 119, + "train_loss": 4.886389665374756, + "train_acc": 0.00962, + "test_loss": 4.740865539550781, + "test_acc": 0.01, + "lyapunov": 1.5762843387511076, + "grad_norm": 0.7753676227893881, + "grad_max_sv": 0.03039190392009914, + "grad_min_sv": 0.0, + "grad_condition": 30391903920.09914, + "lr": 0.00010173504098790182, + "time_sec": 132.4465343952179 + }, + { + "epoch": 120, + "train_loss": 4.886249551086426, + "train_acc": 0.00964, + "test_loss": 4.7418055305480955, + "test_acc": 0.01, + "lyapunov": 1.5757878259624667, + "grad_norm": 0.7403330417590244, + "grad_max_sv": 0.03614077656529844, + "grad_min_sv": 0.0, + "grad_condition": 36140776565.29844, + "lr": 9.549150281252629e-05, + "time_sec": 132.79633259773254 + }, + { + "epoch": 121, + "train_loss": 4.886320632019043, + "train_acc": 0.0099, + "test_loss": 4.7293956802368164, + "test_acc": 0.01, + "lyapunov": 1.5760322620191842, + "grad_norm": 0.7505635192152501, + "grad_max_sv": 0.026077959313988687, + "grad_min_sv": 0.0, + "grad_condition": 26077959313.988686, + "lr": 8.942539543314794e-05, + "time_sec": 133.23189043998718 + }, + { + "epoch": 122, + "train_loss": 4.887943274230957, + "train_acc": 0.00948, + "test_loss": 4.919895000457764, + "test_acc": 0.01, + "lyapunov": 1.5784789354295072, + "grad_norm": 0.6996628561837273, + "grad_max_sv": 0.0160073421895504, + "grad_min_sv": 0.0, + "grad_condition": 16007342189.550396, + "lr": 8.353937964495024e-05, + "time_sec": 132.61993741989136 + }, + { + "epoch": 123, + "train_loss": 4.886383193359375, + "train_acc": 0.01012, + "test_loss": 4.8154360328674315, + "test_acc": 0.01, + "lyapunov": 1.5765104918833583, + "grad_norm": 0.8202114075319168, + "grad_max_sv": 0.0287565924692899, + "grad_min_sv": 0.0, + "grad_condition": 28756592469.289906, + "lr": 7.783603724899243e-05, + "time_sec": 132.69449758529663 + }, + { + "epoch": 124, + "train_loss": 4.885598735046386, + "train_acc": 0.01062, + "test_loss": 4.811818315124512, + "test_acc": 0.01, + "lyapunov": 1.5741741837138106, + "grad_norm": 0.7110817230064039, + "grad_max_sv": 0.04011002266779542, + "grad_min_sv": 0.0, + "grad_condition": 40110022667.795425, + "lr": 7.231786991974666e-05, + "time_sec": 132.79418468475342 + }, + { + "epoch": 125, + "train_loss": 4.887531413879395, + "train_acc": 0.00998, + "test_loss": 4.798822694396972, + "test_acc": 0.01, + "lyapunov": 1.5775156819911869, + "grad_norm": 0.6755952206914222, + "grad_max_sv": 0.03821564754471183, + "grad_min_sv": 0.0, + "grad_condition": 38215647544.71183, + "lr": 6.698729810778072e-05, + "time_sec": 132.56555151939392 + }, + { + "epoch": 126, + "train_loss": 4.885848933258057, + "train_acc": 0.0096, + "test_loss": 4.79271836013794, + "test_acc": 0.01, + "lyapunov": 1.5746296488720437, + "grad_norm": 0.783689796852182, + "grad_max_sv": 0.0219818449113518, + "grad_min_sv": 0.0, + "grad_condition": 21981844911.3518, + "lr": 6.184665997806817e-05, + "time_sec": 132.44697856903076 + }, + { + "epoch": 127, + "train_loss": 4.885011657409668, + "train_acc": 0.0099, + "test_loss": 4.796478929901123, + "test_acc": 0.01, + "lyapunov": 1.5726598202420012, + "grad_norm": 0.746827927020454, + "grad_max_sv": 0.006885465793311596, + "grad_min_sv": 0.0, + "grad_condition": 6885465793.311597, + "lr": 5.6898210384392595e-05, + "time_sec": 132.4967279434204 + }, + { + "epoch": 128, + "train_loss": 4.885314655151367, + "train_acc": 0.00972, + "test_loss": 4.764711624908447, + "test_acc": 0.01, + "lyapunov": 1.5735664736584325, + "grad_norm": 0.7327332821536672, + "grad_max_sv": 0.000560962175950408, + "grad_min_sv": 0.0, + "grad_condition": 560962175.950408, + "lr": 5.214411988029363e-05, + "time_sec": 132.5673258304596 + }, + { + "epoch": 129, + "train_loss": 4.886808303070068, + "train_acc": 0.00958, + "test_loss": 4.767883946990967, + "test_acc": 0.01, + "lyapunov": 1.5768778150343834, + "grad_norm": 0.7089376244924456, + "grad_max_sv": 0.0005988820921629667, + "grad_min_sv": 0.0, + "grad_condition": 598882092.1629667, + "lr": 4.7586473766990294e-05, + "time_sec": 132.46098804473877 + }, + { + "epoch": 130, + "train_loss": 4.886055064697266, + "train_acc": 0.00958, + "test_loss": 4.76520872039795, + "test_acc": 0.01, + "lyapunov": 1.575562137167167, + "grad_norm": 0.8017477597198375, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 132.55271816253662 + }, + { + "epoch": 131, + "train_loss": 4.8861244363403324, + "train_acc": 0.0098, + "test_loss": 4.774403156280518, + "test_acc": 0.01, + "lyapunov": 1.5755851704751134, + "grad_norm": 0.8346593666537984, + "grad_max_sv": 0.0012377811130136252, + "grad_min_sv": 0.0, + "grad_condition": 1237781113.0136251, + "lr": 3.906842420574966e-05, + "time_sec": 132.4554464817047 + }, + { + "epoch": 132, + "train_loss": 4.8852793449401855, + "train_acc": 0.00998, + "test_loss": 4.771010957336426, + "test_acc": 0.01, + "lyapunov": 1.573425286566205, + "grad_norm": 0.7375330331800295, + "grad_max_sv": 0.006311370152980089, + "grad_min_sv": 0.0, + "grad_condition": 6311370152.980089, + "lr": 3.5111757055874305e-05, + "time_sec": 132.4216513633728 + }, + { + "epoch": 133, + "train_loss": 4.884971447448731, + "train_acc": 0.00938, + "test_loss": 4.771634101104737, + "test_acc": 0.01, + "lyapunov": 1.572620025985991, + "grad_norm": 0.6774345796584929, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 132.4028835296631 + }, + { + "epoch": 134, + "train_loss": 4.885691842803955, + "train_acc": 0.01002, + "test_loss": 4.844159544372559, + "test_acc": 0.01, + "lyapunov": 1.57454265353015, + "grad_norm": 0.7944955115704805, + "grad_max_sv": 0.02395228371024132, + "grad_min_sv": 0.0, + "grad_condition": 23952283710.241318, + "lr": 2.7811814881259484e-05, + "time_sec": 132.41754722595215 + }, + { + "epoch": 135, + "train_loss": 4.8864432501220705, + "train_acc": 0.0101, + "test_loss": 4.844892832946777, + "test_acc": 0.01, + "lyapunov": 1.575845740945138, + "grad_norm": 0.7437160641154223, + "grad_max_sv": 0.020727850822731854, + "grad_min_sv": 0.0, + "grad_condition": 20727850822.731853, + "lr": 2.4471741852423218e-05, + "time_sec": 132.44422578811646 + }, + { + "epoch": 136, + "train_loss": 4.8851325263977055, + "train_acc": 0.0098, + "test_loss": 4.8378851570129395, + "test_acc": 0.01, + "lyapunov": 1.5731066611721694, + "grad_norm": 0.6658420197701125, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 132.38768362998962 + }, + { + "epoch": 137, + "train_loss": 4.885479872436523, + "train_acc": 0.01006, + "test_loss": 4.843586358642578, + "test_acc": 0.01, + "lyapunov": 1.5740535426932527, + "grad_norm": 0.7299510564419838, + "grad_max_sv": 0.003957807831466198, + "grad_min_sv": 0.0, + "grad_condition": 3957807831.466198, + "lr": 1.8418716601170932e-05, + "time_sec": 132.38154101371765 + }, + { + "epoch": 138, + "train_loss": 4.884863400421143, + "train_acc": 0.01014, + "test_loss": 4.843053856658935, + "test_acc": 0.01, + "lyapunov": 1.5721587311581273, + "grad_norm": 0.6927716154040414, + "grad_max_sv": 0.017578842211514713, + "grad_min_sv": 0.0, + "grad_condition": 17578842211.51471, + "lr": 1.570841943568445e-05, + "time_sec": 132.4182834625244 + }, + { + "epoch": 139, + "train_loss": 4.884934008331299, + "train_acc": 0.01022, + "test_loss": 4.844250295257568, + "test_acc": 0.01, + "lyapunov": 1.5725375057181434, + "grad_norm": 0.6981880900264675, + "grad_max_sv": 0.0031383157707750796, + "grad_min_sv": 0.0, + "grad_condition": 3138315770.7750797, + "lr": 1.3210548563419845e-05, + "time_sec": 132.41427326202393 + }, + { + "epoch": 140, + "train_loss": 4.885497499389649, + "train_acc": 0.00972, + "test_loss": 4.844135813903809, + "test_acc": 0.01, + "lyapunov": 1.574064860868332, + "grad_norm": 0.774635016593933, + "grad_max_sv": 0.005403042444959283, + "grad_min_sv": 0.0, + "grad_condition": 5403042444.959283, + "lr": 1.0926199633097203e-05, + "time_sec": 132.38426899909973 + }, + { + "epoch": 141, + "train_loss": 4.885045772247315, + "train_acc": 0.01014, + "test_loss": 4.8358864456176756, + "test_acc": 0.01, + "lyapunov": 1.5727792880724154, + "grad_norm": 0.7412742981630644, + "grad_max_sv": 0.011697014886885881, + "grad_min_sv": 0.0, + "grad_condition": 11697014886.885881, + "lr": 8.856374635655688e-06, + "time_sec": 132.46910786628723 + }, + { + "epoch": 142, + "train_loss": 4.884702201538086, + "train_acc": 0.01002, + "test_loss": 4.838421836090088, + "test_acc": 0.01, + "lyapunov": 1.5717649999481942, + "grad_norm": 0.7113065718119301, + "grad_max_sv": 0.00798416011966765, + "grad_min_sv": 0.0, + "grad_condition": 7984160119.66765, + "lr": 7.001981464747503e-06, + "time_sec": 132.44912910461426 + }, + { + "epoch": 143, + "train_loss": 4.885199571380615, + "train_acc": 0.00982, + "test_loss": 4.841495401763916, + "test_acc": 0.01, + "lyapunov": 1.5731582995265951, + "grad_norm": 0.705829448061863, + "grad_max_sv": 0.021906211972236633, + "grad_min_sv": 0.0, + "grad_condition": 21906211972.236633, + "lr": 5.3638335185058295e-06, + "time_sec": 132.39459085464478 + }, + { + "epoch": 144, + "train_loss": 4.884931218566894, + "train_acc": 0.01002, + "test_loss": 4.842521714782714, + "test_acc": 0.01, + "lyapunov": 1.5725436259413619, + "grad_norm": 0.7770696416339791, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 132.33704686164856 + }, + { + "epoch": 145, + "train_loss": 4.885003453521729, + "train_acc": 0.01038, + "test_loss": 4.84215620880127, + "test_acc": 0.01, + "lyapunov": 1.5727140568101499, + "grad_norm": 0.7469803441120764, + "grad_max_sv": 0.007154888892546296, + "grad_min_sv": 0.0, + "grad_condition": 7154888892.546295, + "lr": 2.7390523158633524e-06, + "time_sec": 132.3757495880127 + }, + { + "epoch": 146, + "train_loss": 4.885197346801758, + "train_acc": 0.00996, + "test_loss": 4.842266304016113, + "test_acc": 0.01, + "lyapunov": 1.5733027034403417, + "grad_norm": 0.7332908840273178, + "grad_max_sv": 0.0006548997946083546, + "grad_min_sv": 0.0, + "grad_condition": 654899794.6083546, + "lr": 1.7535703752478133e-06, + "time_sec": 132.45014452934265 + }, + { + "epoch": 147, + "train_loss": 4.885225572662353, + "train_acc": 0.01, + "test_loss": 4.841919314575195, + "test_acc": 0.01, + "lyapunov": 1.5734141430891384, + "grad_norm": 0.7407542017866708, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 132.37303113937378 + }, + { + "epoch": 148, + "train_loss": 4.885419764556885, + "train_acc": 0.01, + "test_loss": 4.841919337463379, + "test_acc": 0.01, + "lyapunov": 1.5739776710110247, + "grad_norm": 0.7868248231615788, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 132.36948442459106 + }, + { + "epoch": 149, + "train_loss": 4.884984393463135, + "train_acc": 0.01, + "test_loss": 4.841919581604004, + "test_acc": 0.01, + "lyapunov": 1.5726999001734703, + "grad_norm": 0.7663497621598592, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 132.3525311946869 + }, + { + "epoch": 150, + "train_loss": 4.8838786590576175, + "train_acc": 0.01, + "test_loss": 4.841919624328614, + "test_acc": 0.01, + "lyapunov": 1.5694036883161502, + "grad_norm": 0.6984069616734725, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 132.51661276817322 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 4.785678502502441, + "train_acc": 0.01854, + "test_loss": 4.888219262695313, + "test_acc": 0.0096, + "lyapunov": 2.2034229628570245, + "grad_norm": 4.9662527525898525, + "grad_max_sv": 4.1295246422290806, + "grad_min_sv": 8.43239183145883e-08, + "grad_condition": 57848709.59664528, + "lr": 0.0009998903417374227, + "time_sec": 178.03496599197388 + }, + { + "epoch": 2, + "train_loss": 4.6398111044311525, + "train_acc": 0.0207, + "test_loss": 4.653040969085693, + "test_acc": 0.01, + "lyapunov": 1.9294306939215307, + "grad_norm": 3.0185365178654044, + "grad_max_sv": 2.4029204517602922, + "grad_min_sv": 5.100535853952426e-08, + "grad_condition": 482708945.8134031, + "lr": 0.0009995614150494292, + "time_sec": 178.04272985458374 + }, + { + "epoch": 3, + "train_loss": 4.587504278259277, + "train_acc": 0.01798, + "test_loss": 4.565644731140137, + "test_acc": 0.0158, + "lyapunov": 1.7756437584567253, + "grad_norm": 1.468640621914821, + "grad_max_sv": 0.8633963579282863, + "grad_min_sv": 1.4697805644365008e-08, + "grad_condition": 29354955308.653522, + "lr": 0.0009990133642141358, + "time_sec": 177.90911650657654 + }, + { + "epoch": 4, + "train_loss": 4.609674820861817, + "train_acc": 0.01586, + "test_loss": 5.16701375579834, + "test_acc": 0.0101, + "lyapunov": 1.7137653553272452, + "grad_norm": 0.7203838648352618, + "grad_max_sv": 0.5238488506525755, + "grad_min_sv": 2.2053512622504097e-09, + "grad_condition": 75198729364.04495, + "lr": 0.0009982464296247522, + "time_sec": 177.86139965057373 + }, + { + "epoch": 5, + "train_loss": 4.638868305969238, + "train_acc": 0.01426, + "test_loss": 5.560866254425049, + "test_acc": 0.01, + "lyapunov": 1.6978333834796915, + "grad_norm": 0.5502157339199643, + "grad_max_sv": 0.44361272603273394, + "grad_min_sv": 2.7029428141806377e-12, + "grad_condition": 181889969040.05048, + "lr": 0.0009972609476841367, + "time_sec": 177.9277467727661 + }, + { + "epoch": 6, + "train_loss": 4.669847656402588, + "train_acc": 0.01332, + "test_loss": 4.8178652496337895, + "test_acc": 0.01, + "lyapunov": 1.7381863307465069, + "grad_norm": 0.5563091323848212, + "grad_max_sv": 0.37752934321761134, + "grad_min_sv": 1.4602178925586487e-12, + "grad_condition": 201992262866.57877, + "lr": 0.000996057350657239, + "time_sec": 177.8438265323639 + }, + { + "epoch": 7, + "train_loss": 4.702823111572266, + "train_acc": 0.01186, + "test_loss": 4.627877201843262, + "test_acc": 0.01, + "lyapunov": 1.7552724058365883, + "grad_norm": 0.4233607461027203, + "grad_max_sv": 0.35499467700719833, + "grad_min_sv": 3.8501282054302263e-13, + "grad_condition": 282171382589.46027, + "lr": 0.000994636166481494, + "time_sec": 177.7493600845337 + }, + { + "epoch": 8, + "train_loss": 4.722017111511231, + "train_acc": 0.01098, + "test_loss": 6.090566035461426, + "test_acc": 0.01, + "lyapunov": 1.7357035292993725, + "grad_norm": 0.3850039806872663, + "grad_max_sv": 0.3226898044347763, + "grad_min_sv": 7.113592445244562e-14, + "grad_condition": 304348428639.08154, + "lr": 0.0009929980185352525, + "time_sec": 177.78767728805542 + }, + { + "epoch": 9, + "train_loss": 4.741448409118652, + "train_acc": 0.01154, + "test_loss": 5.83977333984375, + "test_acc": 0.01, + "lyapunov": 1.7204718992228398, + "grad_norm": 0.4078264807422899, + "grad_max_sv": 0.31335003934800626, + "grad_min_sv": 1.9402458265888006e-13, + "grad_condition": 298038507715.96027, + "lr": 0.0009911436253643444, + "time_sec": 177.80518293380737 + }, + { + "epoch": 10, + "train_loss": 4.747990810241699, + "train_acc": 0.01106, + "test_loss": 6.513046632385254, + "test_acc": 0.01, + "lyapunov": 1.6953654838035175, + "grad_norm": 0.4292578477364445, + "grad_max_sv": 0.3652988448739052, + "grad_min_sv": 1.2809375813436604e-13, + "grad_condition": 342642686942.9036, + "lr": 0.0009890738003669028, + "time_sec": 177.78542613983154 + }, + { + "epoch": 11, + "train_loss": 4.765809431610108, + "train_acc": 0.01214, + "test_loss": 7.22933176574707, + "test_acc": 0.01, + "lyapunov": 1.7186210655495333, + "grad_norm": 0.4487253545215033, + "grad_max_sv": 0.3868314690887928, + "grad_min_sv": 3.013939023123918e-13, + "grad_condition": 329330315777.6491, + "lr": 0.00098678945143658, + "time_sec": 177.81605434417725 + }, + { + "epoch": 12, + "train_loss": 4.784488880615235, + "train_acc": 0.00986, + "test_loss": 4.611177786254883, + "test_acc": 0.01, + "lyapunov": 1.652159307009119, + "grad_norm": 0.4707826268774683, + "grad_max_sv": 0.3026094869710505, + "grad_min_sv": 3.8656478774921674e-15, + "grad_condition": 301420540269.25793, + "lr": 0.0009842915805643154, + "time_sec": 177.8059630393982 + }, + { + "epoch": 13, + "train_loss": 4.809918058624268, + "train_acc": 0.00966, + "test_loss": 5.106430908203125, + "test_acc": 0.01, + "lyapunov": 1.6707328871997726, + "grad_norm": 0.667273831565697, + "grad_max_sv": 0.24273031912744045, + "grad_min_sv": 1.0572839902934006e-10, + "grad_condition": 229305129700.13013, + "lr": 0.000981581283398829, + "time_sec": 177.8098611831665 + }, + { + "epoch": 14, + "train_loss": 4.825652238159179, + "train_acc": 0.01056, + "test_loss": 10.256812258911133, + "test_acc": 0.01, + "lyapunov": 1.6938227213861998, + "grad_norm": 1.331380545313032, + "grad_max_sv": 0.26493136398494244, + "grad_min_sv": 2.65579091596793e-10, + "grad_condition": 237101921206.0838, + "lr": 0.0009786597487660333, + "time_sec": 177.74433708190918 + }, + { + "epoch": 15, + "train_loss": 4.858567563171387, + "train_acc": 0.01086, + "test_loss": 4.6056615829467775, + "test_acc": 0.01, + "lyapunov": 1.7649985844521876, + "grad_norm": 0.6838854666615405, + "grad_max_sv": 0.34980414882302285, + "grad_min_sv": 2.1796140399673834e-13, + "grad_condition": 312022583270.1326, + "lr": 0.0009755282581475766, + "time_sec": 177.7609293460846 + }, + { + "epoch": 16, + "train_loss": 4.88505381439209, + "train_acc": 0.01104, + "test_loss": 4.605761392211914, + "test_acc": 0.01, + "lyapunov": 1.8020565973218445, + "grad_norm": 0.5845356530706413, + "grad_max_sv": 0.2943306349217892, + "grad_min_sv": 4.369502606031448e-14, + "grad_condition": 287139369751.0244, + "lr": 0.0009721881851187403, + "time_sec": 177.8197786808014 + }, + { + "epoch": 17, + "train_loss": 4.893186149749756, + "train_acc": 0.01036, + "test_loss": 4.605876076507569, + "test_acc": 0.01, + "lyapunov": 1.7787105851161205, + "grad_norm": 0.4680659078828573, + "grad_max_sv": 0.2733098614960909, + "grad_min_sv": 4.296774163499721e-19, + "grad_condition": 273309717860.49023, + "lr": 0.0009686409947459456, + "time_sec": 177.79044127464294 + }, + { + "epoch": 18, + "train_loss": 4.893065974731445, + "train_acc": 0.0107, + "test_loss": 4.6065135696411135, + "test_acc": 0.01, + "lyapunov": 1.718729690822494, + "grad_norm": 0.5727929210621684, + "grad_max_sv": 0.30122888199985026, + "grad_min_sv": 4.424719830275789e-19, + "grad_condition": 301228714224.6802, + "lr": 0.0009648882429441254, + "time_sec": 177.80086708068848 + }, + { + "epoch": 19, + "train_loss": 4.88860928604126, + "train_acc": 0.01, + "test_loss": 4.702660593414307, + "test_acc": 0.01, + "lyapunov": 1.6696165498260342, + "grad_norm": 0.42342867331427436, + "grad_max_sv": 0.34960081316530706, + "grad_min_sv": 2.8274243075655694e-14, + "grad_condition": 340909047209.5011, + "lr": 0.00096093157579425, + "time_sec": 177.7979953289032 + }, + { + "epoch": 20, + "train_loss": 4.903309204711914, + "train_acc": 0.01068, + "test_loss": 5.4670142036437985, + "test_acc": 0.01, + "lyapunov": 1.6678839117059927, + "grad_norm": 0.5364190790754718, + "grad_max_sv": 0.3460624013096094, + "grad_min_sv": 1.5815154140131103e-14, + "grad_condition": 341291954932.3224, + "lr": 0.0009567727288213001, + "time_sec": 177.79369568824768 + }, + { + "epoch": 21, + "train_loss": 4.915025991210937, + "train_acc": 0.01106, + "test_loss": 4.692510232543945, + "test_acc": 0.01, + "lyapunov": 1.6982163163402197, + "grad_norm": 0.5511803995310802, + "grad_max_sv": 0.34619002789258957, + "grad_min_sv": 4.733950722420789e-14, + "grad_condition": 333444655591.8086, + "lr": 0.0009524135262330095, + "time_sec": 177.79608535766602 + }, + { + "epoch": 22, + "train_loss": 4.909840554809571, + "train_acc": 0.01084, + "test_loss": 4.6062485778808595, + "test_acc": 0.01, + "lyapunov": 1.6909822228619509, + "grad_norm": 0.4483805706207121, + "grad_max_sv": 0.3018789976027193, + "grad_min_sv": 3.421304159357815e-14, + "grad_condition": 293400173556.4137, + "lr": 0.0009478558801197061, + "time_sec": 177.81299710273743 + }, + { + "epoch": 23, + "train_loss": 4.909692084808349, + "train_acc": 0.01108, + "test_loss": 4.6094023056030275, + "test_acc": 0.01, + "lyapunov": 1.6835671846214157, + "grad_norm": 0.45426031851013016, + "grad_max_sv": 0.3322039857506752, + "grad_min_sv": 6.560297434150338e-15, + "grad_condition": 330632003336.626, + "lr": 0.000943101789615607, + "time_sec": 177.8134524822235 + }, + { + "epoch": 24, + "train_loss": 4.901827787475586, + "train_acc": 0.011, + "test_loss": 4.606396533203125, + "test_acc": 0.01, + "lyapunov": 1.6725571582384426, + "grad_norm": 0.5007132528772561, + "grad_max_sv": 0.3051792338490486, + "grad_min_sv": 2.976912647072195e-14, + "grad_condition": 299276387943.3783, + "lr": 0.0009381533400219313, + "time_sec": 177.7837200164795 + }, + { + "epoch": 25, + "train_loss": 4.899776871948243, + "train_acc": 0.0109, + "test_loss": 4.606364790344238, + "test_acc": 0.01, + "lyapunov": 1.6670247737099142, + "grad_norm": 0.4224268025378797, + "grad_max_sv": 0.2703032233530493, + "grad_min_sv": 5.37251515366592e-15, + "grad_condition": 268629366269.90933, + "lr": 0.0009330127018922189, + "time_sec": 177.82209467887878 + }, + { + "epoch": 26, + "train_loss": 4.896821321258545, + "train_acc": 0.0107, + "test_loss": 4.722185048675537, + "test_acc": 0.01, + "lyapunov": 1.6472089549769526, + "grad_norm": 0.48011762637076694, + "grad_max_sv": 0.2670708648860455, + "grad_min_sv": 3.756115387104417e-15, + "grad_condition": 266170283847.3038, + "lr": 0.000927682130080253, + "time_sec": 177.78438448905945 + }, + { + "epoch": 27, + "train_loss": 4.906476246490478, + "train_acc": 0.01086, + "test_loss": 5.412735247802734, + "test_acc": 0.01, + "lyapunov": 1.6813617880691958, + "grad_norm": 0.4406715400059857, + "grad_max_sv": 0.25074354074895383, + "grad_min_sv": 6.093407208933511e-20, + "grad_condition": 250743525278.97955, + "lr": 0.0009221639627510072, + "time_sec": 177.7901487350464 + }, + { + "epoch": 28, + "train_loss": 4.893644842224121, + "train_acc": 0.01172, + "test_loss": 5.005291435241699, + "test_acc": 0.01, + "lyapunov": 1.6454817526175847, + "grad_norm": 0.3605258439803559, + "grad_max_sv": 0.2296090517193079, + "grad_min_sv": 8.79898850927057e-21, + "grad_condition": 229609049604.029, + "lr": 0.0009164606203550494, + "time_sec": 177.8756561279297 + }, + { + "epoch": 29, + "train_loss": 4.886972426452637, + "train_acc": 0.01162, + "test_loss": 5.60837995223999, + "test_acc": 0.01, + "lyapunov": 1.6373517272417502, + "grad_norm": 0.35252531034326595, + "grad_max_sv": 0.2174192801117897, + "grad_min_sv": 1.7514629554834846e-20, + "grad_condition": 217419276581.3401, + "lr": 0.0009105746045668516, + "time_sec": 177.83988404273987 + }, + { + "epoch": 30, + "train_loss": 4.887171002197266, + "train_acc": 0.011, + "test_loss": 5.029856091308594, + "test_acc": 0.01, + "lyapunov": 1.6322715209268244, + "grad_norm": 0.3694860441565804, + "grad_max_sv": 0.1933195549994707, + "grad_min_sv": 2.0216060912179585e-20, + "grad_condition": 193319550988.26825, + "lr": 0.0009045084971874733, + "time_sec": 177.91060781478882 + }, + { + "epoch": 31, + "train_loss": 4.882497029418945, + "train_acc": 0.01094, + "test_loss": 4.946529456329346, + "test_acc": 0.01, + "lyapunov": 1.6160695430872691, + "grad_norm": 0.3009086445042491, + "grad_max_sv": 0.17770135290920736, + "grad_min_sv": 3.24419256482409e-21, + "grad_condition": 177701352269.52295, + "lr": 0.0008982649590120977, + "time_sec": 179.66105842590332 + }, + { + "epoch": 32, + "train_loss": 4.880725912780762, + "train_acc": 0.01128, + "test_loss": 5.578618463897705, + "test_acc": 0.01, + "lyapunov": 1.62386571232925, + "grad_norm": 0.36023587191613426, + "grad_max_sv": 0.1822029523551464, + "grad_min_sv": 3.6796007523380705e-21, + "grad_condition": 182202951444.53656, + "lr": 0.0008918467286629196, + "time_sec": 179.0988199710846 + }, + { + "epoch": 33, + "train_loss": 4.908818702850342, + "train_acc": 0.01182, + "test_loss": 4.791287840270996, + "test_acc": 0.01, + "lyapunov": 1.674632024886968, + "grad_norm": 2.355286231583665, + "grad_max_sv": 0.1451555678440961, + "grad_min_sv": 3.147262321441897e-13, + "grad_condition": 145124831420.269, + "lr": 0.0008852566213878943, + "time_sec": 177.81290411949158 + }, + { + "epoch": 34, + "train_loss": 4.966870961761475, + "train_acc": 0.00932, + "test_loss": 4.691395782470703, + "test_acc": 0.01, + "lyapunov": 1.7797045579651738, + "grad_norm": 0.4484129521918933, + "grad_max_sv": 0.14517696127295493, + "grad_min_sv": 1.115426717388758e-15, + "grad_condition": 144975581810.04208, + "lr": 0.000878497527825878, + "time_sec": 177.8652102947235 + }, + { + "epoch": 35, + "train_loss": 4.915819309997558, + "train_acc": 0.01472, + "test_loss": 4.624800839996338, + "test_acc": 0.01, + "lyapunov": 1.721020828122678, + "grad_norm": 1.0620945447138674, + "grad_max_sv": 0.19911672528833152, + "grad_min_sv": 1.9872991955575878e-10, + "grad_condition": 95641187798.97682, + "lr": 0.000871572412738697, + "time_sec": 177.88512420654297 + }, + { + "epoch": 36, + "train_loss": 4.9530413731384275, + "train_acc": 0.01452, + "test_loss": 4.789580516052246, + "test_acc": 0.0101, + "lyapunov": 1.8076083949764672, + "grad_norm": 0.5972631933008199, + "grad_max_sv": 0.19924248810857534, + "grad_min_sv": 3.440275442940527e-10, + "grad_condition": 148843110630.56686, + "lr": 0.0008644843137107055, + "time_sec": 177.85971999168396 + }, + { + "epoch": 37, + "train_loss": 4.963237725219726, + "train_acc": 0.01242, + "test_loss": 9.607163096618653, + "test_acc": 0.01, + "lyapunov": 1.7487757071814574, + "grad_norm": 0.5178441019436488, + "grad_max_sv": 0.2677606202661991, + "grad_min_sv": 1.2794001535597794e-09, + "grad_condition": 118342772090.25644, + "lr": 0.0008572363398164014, + "time_sec": 177.87799191474915 + }, + { + "epoch": 38, + "train_loss": 4.974736349639892, + "train_acc": 0.01056, + "test_loss": 4.772847597503662, + "test_acc": 0.01, + "lyapunov": 1.6420561239847442, + "grad_norm": 0.7737397356236614, + "grad_max_sv": 0.48621650636196134, + "grad_min_sv": 5.431396735144922e-09, + "grad_condition": 1130833560.0526097, + "lr": 0.0008498316702566826, + "time_sec": 177.84695863723755 + }, + { + "epoch": 39, + "train_loss": 4.914389076538086, + "train_acc": 0.00954, + "test_loss": 5.4321878707885745, + "test_acc": 0.01, + "lyapunov": 1.606756867959981, + "grad_norm": 0.6387073953630102, + "grad_max_sv": 0.28100625462830064, + "grad_min_sv": 1.1923785099299402e-09, + "grad_condition": 31042166964.6133, + "lr": 0.0008422735529643442, + "time_sec": 177.8997838497162 + }, + { + "epoch": 40, + "train_loss": 4.907334909515381, + "train_acc": 0.00932, + "test_loss": 5.197367625427246, + "test_acc": 0.01, + "lyapunov": 1.6101341015847443, + "grad_norm": 0.549617557037775, + "grad_max_sv": 0.21684555038809777, + "grad_min_sv": 1.6231511646555081e-12, + "grad_condition": 115360148938.91074, + "lr": 0.0008345653031794289, + "time_sec": 177.88523411750793 + }, + { + "epoch": 41, + "train_loss": 4.9172815733337405, + "train_acc": 0.00966, + "test_loss": 5.328871868896484, + "test_acc": 0.01, + "lyapunov": 1.6233936231154615, + "grad_norm": 0.6437990568107412, + "grad_max_sv": 0.23363575600087644, + "grad_min_sv": 5.030357610936974e-10, + "grad_condition": 138575586823.60834, + "lr": 0.0008267103019950526, + "time_sec": 177.87491416931152 + }, + { + "epoch": 42, + "train_loss": 4.910974921875, + "train_acc": 0.0094, + "test_loss": 5.260343148803711, + "test_acc": 0.01, + "lyapunov": 1.6119288898185087, + "grad_norm": 0.6213630809261163, + "grad_max_sv": 0.2208472192287445, + "grad_min_sv": 1.6566058977896803e-10, + "grad_condition": 142601015959.25623, + "lr": 0.0008187119948743447, + "time_sec": 177.85157465934753 + }, + { + "epoch": 43, + "train_loss": 4.910828229217529, + "train_acc": 0.0082, + "test_loss": 4.699688921356201, + "test_acc": 0.01, + "lyapunov": 1.6258944394948232, + "grad_norm": 0.4079357024315036, + "grad_max_sv": 0.15661620609462262, + "grad_min_sv": 1.7684309930750455e-15, + "grad_condition": 156350108060.72934, + "lr": 0.000810573890139155, + "time_sec": 177.86257314682007 + }, + { + "epoch": 44, + "train_loss": 4.896916885833741, + "train_acc": 0.00922, + "test_loss": 4.812428985595703, + "test_acc": 0.01, + "lyapunov": 1.5950726255431504, + "grad_norm": 0.4783756369080321, + "grad_max_sv": 0.14141971599310638, + "grad_min_sv": 1.3813946661647787e-39, + "grad_condition": 141419715993.10638, + "lr": 0.0008022995574311873, + "time_sec": 177.92987060546875 + }, + { + "epoch": 45, + "train_loss": 4.908877978973389, + "train_acc": 0.00912, + "test_loss": 4.708805274963379, + "test_acc": 0.01, + "lyapunov": 1.6267534076710186, + "grad_norm": 0.7771603049125322, + "grad_max_sv": 0.15806035809218882, + "grad_min_sv": 1.4034116208559716e-15, + "grad_condition": 157762251235.76987, + "lr": 0.0007938926261462363, + "time_sec": 177.94272303581238 + }, + { + "epoch": 46, + "train_loss": 4.90580543838501, + "train_acc": 0.00928, + "test_loss": 4.734797378540039, + "test_acc": 0.01, + "lyapunov": 1.6176637389775737, + "grad_norm": 0.6942542366402378, + "grad_max_sv": 0.15787413250654936, + "grad_min_sv": 7.864894789560978e-16, + "grad_condition": 157723200668.28387, + "lr": 0.0007853567838422158, + "time_sec": 177.97623896598816 + }, + { + "epoch": 47, + "train_loss": 4.8965187059021, + "train_acc": 0.00938, + "test_loss": 4.6579503898620604, + "test_acc": 0.01, + "lyapunov": 1.5973099085985851, + "grad_norm": 0.36353228305050295, + "grad_max_sv": 0.13088524471968413, + "grad_min_sv": 1.2231276530985221e-20, + "grad_condition": 130885242907.8948, + "lr": 0.0007766957746216719, + "time_sec": 177.95993542671204 + }, + { + "epoch": 48, + "train_loss": 4.8988071447753905, + "train_acc": 0.00944, + "test_loss": 4.662165933227539, + "test_acc": 0.01, + "lyapunov": 1.603416101402029, + "grad_norm": 0.3898458431943687, + "grad_max_sv": 0.1284548096358776, + "grad_min_sv": 1.1576870843401716e-38, + "grad_condition": 128454809635.87761, + "lr": 0.0007679133974894982, + "time_sec": 177.8052430152893 + }, + { + "epoch": 49, + "train_loss": 4.913481904144287, + "train_acc": 0.00918, + "test_loss": 4.763600569915772, + "test_acc": 0.01, + "lyapunov": 1.6402373295610824, + "grad_norm": 0.5994299094599757, + "grad_max_sv": 0.1396894573670579, + "grad_min_sv": 2.779377619525618e-15, + "grad_condition": 139046550095.99487, + "lr": 0.000759013504686565, + "time_sec": 177.86163926124573 + }, + { + "epoch": 50, + "train_loss": 4.906329712219239, + "train_acc": 0.00982, + "test_loss": 4.609917034912109, + "test_acc": 0.01, + "lyapunov": 1.6202878165427985, + "grad_norm": 0.6143555741962269, + "grad_max_sv": 0.15427468828856944, + "grad_min_sv": 1.5586657350285492e-15, + "grad_condition": 153998022994.1138, + "lr": 0.0007499999999999998, + "time_sec": 177.81070852279663 + }, + { + "epoch": 51, + "train_loss": 4.901778139953613, + "train_acc": 0.01, + "test_loss": 5.7906026428222654, + "test_acc": 0.01, + "lyapunov": 1.6095840150438, + "grad_norm": 0.4846890301599483, + "grad_max_sv": 0.10476460931822658, + "grad_min_sv": 6.919555377168684e-15, + "grad_condition": 103682757395.60971, + "lr": 0.0007408768370508575, + "time_sec": 177.827232837677 + }, + { + "epoch": 52, + "train_loss": 4.897733354492187, + "train_acc": 0.0102, + "test_loss": 5.14119333190918, + "test_acc": 0.01, + "lyapunov": 1.6018984003749954, + "grad_norm": 0.45183942591328674, + "grad_max_sv": 0.08775242893025278, + "grad_min_sv": 1.964503741104032e-16, + "grad_condition": 87731321318.76743, + "lr": 0.0007316480175599307, + "time_sec": 177.8825397491455 + }, + { + "epoch": 53, + "train_loss": 4.899286302947998, + "train_acc": 0.0105, + "test_loss": 5.116060150146485, + "test_acc": 0.01, + "lyapunov": 1.6068680664462507, + "grad_norm": 0.39046803319247386, + "grad_max_sv": 0.10442779418081045, + "grad_min_sv": 1.8704405143177693e-32, + "grad_condition": 104427794180.81046, + "lr": 0.0007223175895924635, + "time_sec": 177.85691237449646 + }, + { + "epoch": 54, + "train_loss": 4.900419689025879, + "train_acc": 0.00974, + "test_loss": 6.225739611816406, + "test_acc": 0.01, + "lyapunov": 1.611330489673273, + "grad_norm": 0.7830684513344699, + "grad_max_sv": 0.08616076316975523, + "grad_min_sv": 7.006492321624086e-47, + "grad_condition": 86160763169.75522, + "lr": 0.0007128896457825361, + "time_sec": 177.79533982276917 + }, + { + "epoch": 55, + "train_loss": 4.90022905456543, + "train_acc": 0.00872, + "test_loss": 4.660898509216309, + "test_acc": 0.01, + "lyapunov": 1.6107879657574626, + "grad_norm": 0.3602507862317559, + "grad_max_sv": 0.07782914067938691, + "grad_min_sv": 0.0, + "grad_condition": 77829140679.3869, + "lr": 0.0007033683215378998, + "time_sec": 177.81696367263794 + }, + { + "epoch": 56, + "train_loss": 4.899950318450927, + "train_acc": 0.009, + "test_loss": 4.8788808166503905, + "test_acc": 0.01, + "lyapunov": 1.608769400345395, + "grad_norm": 0.24016992273295382, + "grad_max_sv": 0.07058875868096948, + "grad_min_sv": 0.0, + "grad_condition": 70588758680.96948, + "lr": 0.0006937577932260512, + "time_sec": 177.81637740135193 + }, + { + "epoch": 57, + "train_loss": 4.904979566650391, + "train_acc": 0.01016, + "test_loss": 4.727262957763672, + "test_acc": 0.01, + "lyapunov": 1.6228536108265752, + "grad_norm": 0.25668226851580556, + "grad_max_sv": 0.08947733379900455, + "grad_min_sv": 3.709630814829091e-18, + "grad_condition": 89476902167.92735, + "lr": 0.0006840622763423388, + "time_sec": 177.7847032546997 + }, + { + "epoch": 58, + "train_loss": 4.91234857635498, + "train_acc": 0.00984, + "test_loss": 4.992978315734863, + "test_acc": 0.01, + "lyapunov": 1.6392204319424641, + "grad_norm": 0.2870713508381296, + "grad_max_sv": 0.08510738047771156, + "grad_min_sv": 5.680980030609821e-34, + "grad_condition": 85107380477.71156, + "lr": 0.0006742860236609073, + "time_sec": 177.93095755577087 + }, + { + "epoch": 59, + "train_loss": 4.895672921447754, + "train_acc": 0.00956, + "test_loss": 4.850344149017334, + "test_acc": 0.01, + "lyapunov": 1.6016130505315482, + "grad_norm": 0.21955395456353394, + "grad_max_sv": 0.04376054578460753, + "grad_min_sv": 0.0, + "grad_condition": 43760545784.60753, + "lr": 0.0006644333233692913, + "time_sec": 178.03867888450623 + }, + { + "epoch": 60, + "train_loss": 4.904327979278564, + "train_acc": 0.01052, + "test_loss": 5.107528366088867, + "test_acc": 0.01, + "lyapunov": 1.6214414124598588, + "grad_norm": 0.4134573581512024, + "grad_max_sv": 0.05148340538144112, + "grad_min_sv": 0.0, + "grad_condition": 51483405381.44112, + "lr": 0.0006545084971874734, + "time_sec": 177.95739769935608 + }, + { + "epoch": 61, + "train_loss": 4.898002865753174, + "train_acc": 0.0092, + "test_loss": 5.260837869262695, + "test_acc": 0.01, + "lyapunov": 1.6072155035975035, + "grad_norm": 0.21245422531513092, + "grad_max_sv": 0.06225627232342958, + "grad_min_sv": 0.0, + "grad_condition": 62256272323.42959, + "lr": 0.0006445158984722354, + "time_sec": 177.8253002166748 + }, + { + "epoch": 62, + "train_loss": 4.895106823730469, + "train_acc": 0.00882, + "test_loss": 4.800835796356202, + "test_acc": 0.01, + "lyapunov": 1.6004807888089543, + "grad_norm": 0.2174674542614135, + "grad_max_sv": 0.05514842057600618, + "grad_min_sv": 0.0, + "grad_condition": 55148420576.00618, + "lr": 0.0006344599103076324, + "time_sec": 177.72123980522156 + }, + { + "epoch": 63, + "train_loss": 4.899956417541504, + "train_acc": 0.0105, + "test_loss": 4.751542483520508, + "test_acc": 0.01, + "lyapunov": 1.6128623427637399, + "grad_norm": 0.40884851608059564, + "grad_max_sv": 0.05529614672996104, + "grad_min_sv": 0.0, + "grad_condition": 55296146729.96104, + "lr": 0.0006243449435824269, + "time_sec": 177.73331904411316 + }, + { + "epoch": 64, + "train_loss": 4.899741290130615, + "train_acc": 0.01012, + "test_loss": 4.856732801818848, + "test_acc": 0.01, + "lyapunov": 1.610243486931257, + "grad_norm": 0.2140046037475775, + "grad_max_sv": 0.04319468280300498, + "grad_min_sv": 1.2200012063541023e-32, + "grad_condition": 43194682803.00498, + "lr": 0.0006141754350553275, + "time_sec": 177.72633337974548 + }, + { + "epoch": 65, + "train_loss": 4.901744207763672, + "train_acc": 0.00894, + "test_loss": 5.05665267791748, + "test_acc": 0.01, + "lyapunov": 1.612555693482499, + "grad_norm": 0.41191406243662826, + "grad_max_sv": 0.06249867400620133, + "grad_min_sv": 9.569992363469874e-20, + "grad_condition": 62498664540.05955, + "lr": 0.0006039558454088793, + "time_sec": 177.71029257774353 + }, + { + "epoch": 66, + "train_loss": 4.905766971282959, + "train_acc": 0.00954, + "test_loss": 5.186077005767822, + "test_acc": 0.01, + "lyapunov": 1.6214341486201567, + "grad_norm": 0.4859633789458757, + "grad_max_sv": 0.0410848444327712, + "grad_min_sv": 0.0, + "grad_condition": 41084844432.7712, + "lr": 0.000593690657292862, + "time_sec": 177.8285129070282 + }, + { + "epoch": 67, + "train_loss": 4.905345126495361, + "train_acc": 0.00986, + "test_loss": 4.869504832458496, + "test_acc": 0.01, + "lyapunov": 1.6231126108437852, + "grad_norm": 0.39055695869151713, + "grad_max_sv": 0.04164083697833121, + "grad_min_sv": 1.4012984643248171e-46, + "grad_condition": 41640836978.3312, + "lr": 0.0005833843733580507, + "time_sec": 177.75302600860596 + }, + { + "epoch": 68, + "train_loss": 4.897688937835693, + "train_acc": 0.00942, + "test_loss": 4.753113725280762, + "test_acc": 0.01, + "lyapunov": 1.6065946210680715, + "grad_norm": 0.20313081565215924, + "grad_max_sv": 0.023377659870311616, + "grad_min_sv": 0.0, + "grad_condition": 23377659870.311615, + "lr": 0.0005730415142812054, + "time_sec": 177.63269519805908 + }, + { + "epoch": 69, + "train_loss": 4.898588792419433, + "train_acc": 0.01028, + "test_loss": 4.782024855804443, + "test_acc": 0.01, + "lyapunov": 1.6088185420121683, + "grad_norm": 0.17496031637798137, + "grad_max_sv": 0.026315743662416936, + "grad_min_sv": 0.0, + "grad_condition": 26315743662.416935, + "lr": 0.0005626666167821517, + "time_sec": 177.63309144973755 + }, + { + "epoch": 70, + "train_loss": 4.8972829446411135, + "train_acc": 0.00906, + "test_loss": 5.072041613769532, + "test_acc": 0.01, + "lyapunov": 1.606105865419978, + "grad_norm": 4.752321231571355, + "grad_max_sv": 0.01162667127500754, + "grad_min_sv": 0.0, + "grad_condition": 11626671275.007538, + "lr": 0.0005522642316338265, + "time_sec": 177.63151264190674 + }, + { + "epoch": 71, + "train_loss": 4.903229199066162, + "train_acc": 0.00974, + "test_loss": 4.996621307373047, + "test_acc": 0.01, + "lyapunov": 1.618955539315558, + "grad_norm": 8.808121966401492, + "grad_max_sv": 0.009761298389639706, + "grad_min_sv": 0.0, + "grad_condition": 9761298389.639706, + "lr": 0.0005418389216661573, + "time_sec": 177.6599452495575 + }, + { + "epoch": 72, + "train_loss": 4.906216805419922, + "train_acc": 0.00934, + "test_loss": 4.894567427062988, + "test_acc": 0.01, + "lyapunov": 1.628432136362471, + "grad_norm": 8.489795940827486, + "grad_max_sv": 0.016040445899125188, + "grad_min_sv": 0.0, + "grad_condition": 16040445899.125189, + "lr": 0.0005313952597646563, + "time_sec": 177.6416893005371 + }, + { + "epoch": 73, + "train_loss": 4.899343757019043, + "train_acc": 0.00984, + "test_loss": 4.877998015594482, + "test_acc": 0.01, + "lyapunov": 1.6116645827012903, + "grad_norm": 8.78253510980995, + "grad_max_sv": 0.011263658234383911, + "grad_min_sv": 0.0, + "grad_condition": 11263658234.383911, + "lr": 0.0005209378268645994, + "time_sec": 177.685124874115 + }, + { + "epoch": 74, + "train_loss": 4.909308713531495, + "train_acc": 0.0098, + "test_loss": 4.906534819030762, + "test_acc": 0.01, + "lyapunov": 1.6356849475284976, + "grad_norm": 8.739719950493322, + "grad_max_sv": 0.018200278421863912, + "grad_min_sv": 0.0, + "grad_condition": 18200278421.863914, + "lr": 0.0005104712099416781, + "time_sec": 177.67348718643188 + }, + { + "epoch": 75, + "train_loss": 4.896382185516358, + "train_acc": 0.00988, + "test_loss": 4.891489701843262, + "test_acc": 0.01, + "lyapunov": 1.6029227630561576, + "grad_norm": 8.719549027099202, + "grad_max_sv": 0.022427358670393006, + "grad_min_sv": 0.0, + "grad_condition": 22427358670.393005, + "lr": 0.0004999999999999996, + "time_sec": 177.7534384727478 + }, + { + "epoch": 76, + "train_loss": 4.899071414489746, + "train_acc": 0.00968, + "test_loss": 4.9015754707336425, + "test_acc": 0.01, + "lyapunov": 1.6096787852094607, + "grad_norm": 8.515820970435684, + "grad_max_sv": 0.009400015359278768, + "grad_min_sv": 0.0, + "grad_condition": 9400015359.278769, + "lr": 0.0004895287900583212, + "time_sec": 177.62656164169312 + }, + { + "epoch": 77, + "train_loss": 4.898522388305664, + "train_acc": 0.01038, + "test_loss": 5.091467515563965, + "test_acc": 0.01, + "lyapunov": 1.6093772655862677, + "grad_norm": 8.114992022856779, + "grad_max_sv": 0.018641287484206258, + "grad_min_sv": 0.0, + "grad_condition": 18641287484.20626, + "lr": 0.0004790621731353997, + "time_sec": 177.68832445144653 + }, + { + "epoch": 78, + "train_loss": 4.898501075897217, + "train_acc": 0.00976, + "test_loss": 5.021521907043457, + "test_acc": 0.01, + "lyapunov": 1.609497647761079, + "grad_norm": 8.539277939413502, + "grad_max_sv": 0.007715003727935254, + "grad_min_sv": 0.0, + "grad_condition": 7715003727.935254, + "lr": 0.000468604740235343, + "time_sec": 177.67188620567322 + }, + { + "epoch": 79, + "train_loss": 4.89914041229248, + "train_acc": 0.00952, + "test_loss": 5.091536389160156, + "test_acc": 0.01, + "lyapunov": 1.6118732392025725, + "grad_norm": 8.137454688889077, + "grad_max_sv": 0.014247056667227299, + "grad_min_sv": 0.0, + "grad_condition": 14247056667.227299, + "lr": 0.00045816107833384175, + "time_sec": 177.66169714927673 + }, + { + "epoch": 80, + "train_loss": 4.896471509552002, + "train_acc": 0.00904, + "test_loss": 5.056171662139892, + "test_acc": 0.01, + "lyapunov": 1.6047609431664351, + "grad_norm": 8.176635016602376, + "grad_max_sv": 0.01795925593469292, + "grad_min_sv": 0.0, + "grad_condition": 17959255934.69292, + "lr": 0.0004477357683661729, + "time_sec": 177.69231700897217 + }, + { + "epoch": 81, + "train_loss": 4.902812586059571, + "train_acc": 0.00932, + "test_loss": 4.95149069366455, + "test_acc": 0.01, + "lyapunov": 1.6196627622979987, + "grad_norm": 7.929696982355576, + "grad_max_sv": 0.0070913337520323695, + "grad_min_sv": 0.0, + "grad_condition": 7091333752.03237, + "lr": 0.00043733338321784746, + "time_sec": 177.62628316879272 + }, + { + "epoch": 82, + "train_loss": 4.896946704254151, + "train_acc": 0.00924, + "test_loss": 5.036287983703613, + "test_acc": 0.01, + "lyapunov": 1.606176169632036, + "grad_norm": 7.888136562780922, + "grad_max_sv": 0.0152505733538419, + "grad_min_sv": 0.0, + "grad_condition": 15250573353.8419, + "lr": 0.0004269584857187939, + "time_sec": 177.6838881969452 + }, + { + "epoch": 83, + "train_loss": 4.903535429534912, + "train_acc": 0.00942, + "test_loss": 4.913862983703614, + "test_acc": 0.01, + "lyapunov": 1.6229887536114744, + "grad_norm": 5.821543829416724, + "grad_max_sv": 0.0042757402297866065, + "grad_min_sv": 0.0, + "grad_condition": 4275740229.786606, + "lr": 0.0004166156266419484, + "time_sec": 177.63864398002625 + }, + { + "epoch": 84, + "train_loss": 4.900573203125, + "train_acc": 0.00922, + "test_loss": 4.881514458465576, + "test_acc": 0.01, + "lyapunov": 1.6157215519634354, + "grad_norm": 2.3035299291537767, + "grad_max_sv": 0.018527308432385325, + "grad_min_sv": 0.0, + "grad_condition": 18527308432.385326, + "lr": 0.0004063093427071373, + "time_sec": 177.61864590644836 + }, + { + "epoch": 85, + "train_loss": 4.902895740814209, + "train_acc": 0.00928, + "test_loss": 4.858868844604492, + "test_acc": 0.01, + "lyapunov": 1.6206753049665095, + "grad_norm": 0.12191327008361393, + "grad_max_sv": 0.011266671447083354, + "grad_min_sv": 0.0, + "grad_condition": 11266671447.083355, + "lr": 0.0003960441545911199, + "time_sec": 177.60221338272095 + }, + { + "epoch": 86, + "train_loss": 4.899129556274414, + "train_acc": 0.01002, + "test_loss": 4.940996123504639, + "test_acc": 0.01, + "lyapunov": 1.6121560679677198, + "grad_norm": 1.7402391187392277, + "grad_max_sv": 0.002565371198579669, + "grad_min_sv": 0.0, + "grad_condition": 2565371198.579669, + "lr": 0.0003858245649446718, + "time_sec": 177.66662287712097 + }, + { + "epoch": 87, + "train_loss": 4.898443488616944, + "train_acc": 0.0105, + "test_loss": 4.900648780059814, + "test_acc": 0.01, + "lyapunov": 1.6101132055072833, + "grad_norm": 3.9387378230742067, + "grad_max_sv": 0.014504804974421859, + "grad_min_sv": 0.0, + "grad_condition": 14504804974.421856, + "lr": 0.00037565505641757235, + "time_sec": 177.92060565948486 + }, + { + "epoch": 88, + "train_loss": 4.903396017608642, + "train_acc": 0.01006, + "test_loss": 4.946898637390137, + "test_acc": 0.01, + "lyapunov": 1.6227889701228617, + "grad_norm": 3.523322793117835, + "grad_max_sv": 0.010716242669150233, + "grad_min_sv": 0.0, + "grad_condition": 10716242669.150234, + "lr": 0.00036554008969236695, + "time_sec": 177.71660375595093 + }, + { + "epoch": 89, + "train_loss": 4.898063175964356, + "train_acc": 0.00952, + "test_loss": 4.944628465270996, + "test_acc": 0.01, + "lyapunov": 1.6093785500587405, + "grad_norm": 3.442066441987714, + "grad_max_sv": 0.001931725861504674, + "grad_min_sv": 0.0, + "grad_condition": 1931725861.5046737, + "lr": 0.0003554841015277638, + "time_sec": 177.85225415229797 + }, + { + "epoch": 90, + "train_loss": 4.897619627685547, + "train_acc": 0.00938, + "test_loss": 5.051801362609863, + "test_acc": 0.01, + "lyapunov": 1.608569312583455, + "grad_norm": 2.438214274664479, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000345491502812526, + "time_sec": 177.65104031562805 + }, + { + "epoch": 91, + "train_loss": 4.901775200042724, + "train_acc": 0.00952, + "test_loss": 4.932051847076416, + "test_acc": 0.01, + "lyapunov": 1.6196813135195876, + "grad_norm": 1.9676599328431443, + "grad_max_sv": 0.0042047965805977585, + "grad_min_sv": 0.0, + "grad_condition": 4204796580.5977583, + "lr": 0.0003355666766307081, + "time_sec": 177.5405979156494 + }, + { + "epoch": 92, + "train_loss": 4.8983032328796385, + "train_acc": 0.0092, + "test_loss": 4.899715927886963, + "test_acc": 0.01, + "lyapunov": 1.6106610715846577, + "grad_norm": 1.4208199060741078, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00032571397633909225, + "time_sec": 177.52678775787354 + }, + { + "epoch": 93, + "train_loss": 4.899546262664795, + "train_acc": 0.00828, + "test_loss": 4.734424713134765, + "test_acc": 0.01, + "lyapunov": 1.6129982721470202, + "grad_norm": 0.7679133474898795, + "grad_max_sv": 0.001235782215371728, + "grad_min_sv": 0.0, + "grad_condition": 1235782215.371728, + "lr": 0.00031593772365766094, + "time_sec": 177.578599691391 + }, + { + "epoch": 94, + "train_loss": 4.897470514221191, + "train_acc": 0.00868, + "test_loss": 4.861271743774414, + "test_acc": 0.01, + "lyapunov": 1.6078075801624971, + "grad_norm": 0.5114523908732937, + "grad_max_sv": 0.010413796734064817, + "grad_min_sv": 0.0, + "grad_condition": 10413796734.064817, + "lr": 0.0003062422067739483, + "time_sec": 177.66828536987305 + }, + { + "epoch": 95, + "train_loss": 4.896396814422608, + "train_acc": 0.00902, + "test_loss": 4.879605053710938, + "test_acc": 0.01, + "lyapunov": 1.6050515763290094, + "grad_norm": 0.3961292769391823, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00029663167846209965, + "time_sec": 177.51401448249817 + }, + { + "epoch": 96, + "train_loss": 4.8946277626037595, + "train_acc": 0.00906, + "test_loss": 4.8813762161254886, + "test_acc": 0.01, + "lyapunov": 1.6007561808656854, + "grad_norm": 0.3223908585413378, + "grad_max_sv": 0.004684461047872901, + "grad_min_sv": 0.0, + "grad_condition": 4684461047.8729, + "lr": 0.00028711035421746345, + "time_sec": 177.507954120636 + }, + { + "epoch": 97, + "train_loss": 4.898638327026367, + "train_acc": 0.0089, + "test_loss": 4.8062256309509275, + "test_acc": 0.01, + "lyapunov": 1.6108122432933134, + "grad_norm": 0.26732308458116777, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00027768241040753615, + "time_sec": 177.541433095932 + }, + { + "epoch": 98, + "train_loss": 4.898670770721435, + "train_acc": 0.00952, + "test_loss": 4.863480428314209, + "test_acc": 0.01, + "lyapunov": 1.6111446103781386, + "grad_norm": 0.2214969265799768, + "grad_max_sv": 0.009903033776208759, + "grad_min_sv": 0.0, + "grad_condition": 9903033776.20876, + "lr": 0.00026835198244006903, + "time_sec": 177.60904955863953 + }, + { + "epoch": 99, + "train_loss": 4.897254006500244, + "train_acc": 0.00834, + "test_loss": 4.817773220062256, + "test_acc": 0.01, + "lyapunov": 1.607484469023507, + "grad_norm": 0.19294402621230472, + "grad_max_sv": 0.0008362619206309319, + "grad_min_sv": 0.0, + "grad_condition": 836261920.6309319, + "lr": 0.0002591231629491421, + "time_sec": 177.57478499412537 + }, + { + "epoch": 100, + "train_loss": 4.901547922363282, + "train_acc": 0.0089, + "test_loss": 4.874810285949707, + "test_acc": 0.01, + "lyapunov": 1.618047608134082, + "grad_norm": 0.48303744135317395, + "grad_max_sv": 0.0005853609647601843, + "grad_min_sv": 0.0, + "grad_condition": 585360964.7601843, + "lr": 0.0002499999999999997, + "time_sec": 177.57369899749756 + }, + { + "epoch": 101, + "train_loss": 4.900225694732666, + "train_acc": 0.0088, + "test_loss": 4.874546339416504, + "test_acc": 0.01, + "lyapunov": 1.6143963080842783, + "grad_norm": 0.10450627590873329, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00024098649531343477, + "time_sec": 177.6406271457672 + }, + { + "epoch": 102, + "train_loss": 4.897779517669678, + "train_acc": 0.00842, + "test_loss": 4.97530121307373, + "test_acc": 0.01, + "lyapunov": 1.6092621133760419, + "grad_norm": 0.11958307306926726, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002320866025105016, + "time_sec": 177.58187460899353 + }, + { + "epoch": 103, + "train_loss": 4.89978483215332, + "train_acc": 0.00836, + "test_loss": 4.904860715484619, + "test_acc": 0.01, + "lyapunov": 1.613416659862489, + "grad_norm": 0.11840174924430107, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002233042253783278, + "time_sec": 177.59923720359802 + }, + { + "epoch": 104, + "train_loss": 4.8979805488586425, + "train_acc": 0.0086, + "test_loss": 5.0884550689697265, + "test_acc": 0.01, + "lyapunov": 1.6097813783704167, + "grad_norm": 0.119936422604111, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000214643216157784, + "time_sec": 177.6080665588379 + }, + { + "epoch": 105, + "train_loss": 4.898741788330078, + "train_acc": 0.00866, + "test_loss": 4.9618072402954105, + "test_acc": 0.01, + "lyapunov": 1.6113920699604942, + "grad_norm": 0.152172750895754, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376332, + "time_sec": 177.6668050289154 + }, + { + "epoch": 106, + "train_loss": 4.899783585510254, + "train_acc": 0.00854, + "test_loss": 4.853069065856934, + "test_acc": 0.01, + "lyapunov": 1.6142695355598273, + "grad_norm": 0.12651234741385065, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019770044256881242, + "time_sec": 177.65955018997192 + }, + { + "epoch": 107, + "train_loss": 4.89967593460083, + "train_acc": 0.00888, + "test_loss": 4.81962833480835, + "test_acc": 0.01, + "lyapunov": 1.6138155131083924, + "grad_norm": 0.12897917774661904, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001894261098608447, + "time_sec": 178.0168354511261 + }, + { + "epoch": 108, + "train_loss": 4.898814065093994, + "train_acc": 0.00946, + "test_loss": 4.862646290588379, + "test_acc": 0.01, + "lyapunov": 1.6114065183702941, + "grad_norm": 0.12441425701414183, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000181288005125655, + "time_sec": 177.91981077194214 + }, + { + "epoch": 109, + "train_loss": 4.895898725891113, + "train_acc": 0.00866, + "test_loss": 4.898298935699463, + "test_acc": 0.01, + "lyapunov": 1.6044228336085444, + "grad_norm": 0.12735396729359733, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001732896980049473, + "time_sec": 177.5811812877655 + }, + { + "epoch": 110, + "train_loss": 4.897967128295899, + "train_acc": 0.0088, + "test_loss": 4.881989184570313, + "test_acc": 0.01, + "lyapunov": 1.610074214008458, + "grad_norm": 0.12498581799753569, + "grad_max_sv": 0.0005899489391595125, + "grad_min_sv": 0.0, + "grad_condition": 589948939.1595125, + "lr": 0.00016543469682057076, + "time_sec": 177.58177971839905 + }, + { + "epoch": 111, + "train_loss": 4.894624674987793, + "train_acc": 0.00892, + "test_loss": 4.883820623779297, + "test_acc": 0.01, + "lyapunov": 1.6010574471310277, + "grad_norm": 0.12140577807922988, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 177.56197333335876 + }, + { + "epoch": 112, + "train_loss": 4.895216448974609, + "train_acc": 0.00852, + "test_loss": 4.954343832397461, + "test_acc": 0.01, + "lyapunov": 1.602743710093486, + "grad_norm": 0.1186981012224881, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 177.6377820968628 + }, + { + "epoch": 113, + "train_loss": 4.89654906173706, + "train_acc": 0.00892, + "test_loss": 4.86073722076416, + "test_acc": 0.01, + "lyapunov": 1.6060491681403821, + "grad_norm": 0.13508163826012107, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 177.58386063575745 + }, + { + "epoch": 114, + "train_loss": 4.8961822531127925, + "train_acc": 0.00894, + "test_loss": 4.85973716430664, + "test_acc": 0.01, + "lyapunov": 1.605295106578056, + "grad_norm": 0.1269661896874639, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00013551568628929425, + "time_sec": 177.66930723190308 + }, + { + "epoch": 115, + "train_loss": 4.899547542419434, + "train_acc": 0.00846, + "test_loss": 4.86928017654419, + "test_acc": 0.01, + "lyapunov": 1.611534357680689, + "grad_norm": 0.12942007445088913, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 177.5964391231537 + }, + { + "epoch": 116, + "train_loss": 4.8983458253479, + "train_acc": 0.00896, + "test_loss": 4.843299571990967, + "test_acc": 0.01, + "lyapunov": 1.6105001826420464, + "grad_norm": 0.13930842303851845, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 177.61230850219727 + }, + { + "epoch": 117, + "train_loss": 4.896871134490967, + "train_acc": 0.00876, + "test_loss": 4.854955553436279, + "test_acc": 0.01, + "lyapunov": 1.6068359040238362, + "grad_norm": 0.14085548109201876, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 177.60942769050598 + }, + { + "epoch": 118, + "train_loss": 4.895171242523193, + "train_acc": 0.00872, + "test_loss": 4.848788255310058, + "test_acc": 0.01, + "lyapunov": 1.6026884250323792, + "grad_norm": 0.14154856326059925, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010815327133708009, + "time_sec": 177.55690503120422 + }, + { + "epoch": 119, + "train_loss": 4.896756847839355, + "train_acc": 0.00832, + "test_loss": 4.8384888511657715, + "test_acc": 0.01, + "lyapunov": 1.6064672335944212, + "grad_norm": 0.13186296404041234, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010173504098790182, + "time_sec": 177.58031153678894 + }, + { + "epoch": 120, + "train_loss": 4.898055244140625, + "train_acc": 0.00912, + "test_loss": 4.863050064086914, + "test_acc": 0.01, + "lyapunov": 1.608289188131347, + "grad_norm": 0.13789827868104076, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 177.57413148880005 + }, + { + "epoch": 121, + "train_loss": 4.895827691040039, + "train_acc": 0.00928, + "test_loss": 4.863882962799072, + "test_acc": 0.01, + "lyapunov": 1.6041748965792644, + "grad_norm": 0.1447753316018149, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 177.61848878860474 + }, + { + "epoch": 122, + "train_loss": 4.894580706329346, + "train_acc": 0.0093, + "test_loss": 4.832992823791504, + "test_acc": 0.01, + "lyapunov": 1.6009809287917582, + "grad_norm": 0.13403320495860124, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 177.63413906097412 + }, + { + "epoch": 123, + "train_loss": 4.896512101593018, + "train_acc": 0.00856, + "test_loss": 4.88107511138916, + "test_acc": 0.01, + "lyapunov": 1.6053285842661358, + "grad_norm": 0.1349040405870927, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 177.86059856414795 + }, + { + "epoch": 124, + "train_loss": 4.902536525726318, + "train_acc": 0.00916, + "test_loss": 4.825576887512207, + "test_acc": 0.01, + "lyapunov": 1.618482659235025, + "grad_norm": 0.15260564991727005, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 177.59844970703125 + }, + { + "epoch": 125, + "train_loss": 4.8969797262573245, + "train_acc": 0.00904, + "test_loss": 4.842672832489014, + "test_acc": 0.01, + "lyapunov": 1.607402919198546, + "grad_norm": 0.14681033483413716, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 177.69832468032837 + }, + { + "epoch": 126, + "train_loss": 4.896537158660888, + "train_acc": 0.00922, + "test_loss": 4.80990348739624, + "test_acc": 0.01, + "lyapunov": 1.6063618071548773, + "grad_norm": 0.13507935123670756, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 177.70786309242249 + }, + { + "epoch": 127, + "train_loss": 4.894742733154297, + "train_acc": 0.00798, + "test_loss": 4.8113509506225585, + "test_acc": 0.01, + "lyapunov": 1.6014454364776611, + "grad_norm": 0.1351277333350339, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 177.86230516433716 + }, + { + "epoch": 128, + "train_loss": 4.897651534729004, + "train_acc": 0.0094, + "test_loss": 4.849126397705078, + "test_acc": 0.01, + "lyapunov": 1.6088779442145695, + "grad_norm": 0.17636542409245334, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 177.6271688938141 + }, + { + "epoch": 129, + "train_loss": 4.89603802230835, + "train_acc": 0.00886, + "test_loss": 4.837294686126709, + "test_acc": 0.01, + "lyapunov": 1.605165058694532, + "grad_norm": 0.1801255445906475, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 177.71211314201355 + }, + { + "epoch": 130, + "train_loss": 4.895125115509034, + "train_acc": 0.00866, + "test_loss": 4.808775178527832, + "test_acc": 0.01, + "lyapunov": 1.6025557109462025, + "grad_norm": 0.14181669608504024, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 177.64269709587097 + }, + { + "epoch": 131, + "train_loss": 4.902938699340821, + "train_acc": 0.008, + "test_loss": 4.826445443725586, + "test_acc": 0.01, + "lyapunov": 1.6225644127487222, + "grad_norm": 0.15063649346643543, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 177.69655632972717 + }, + { + "epoch": 132, + "train_loss": 4.895815797271728, + "train_acc": 0.00944, + "test_loss": 4.808843030548096, + "test_acc": 0.01, + "lyapunov": 1.6045795020544926, + "grad_norm": 0.13954946888706687, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 177.6466555595398 + }, + { + "epoch": 133, + "train_loss": 4.896005963287354, + "train_acc": 0.0088, + "test_loss": 4.82414176940918, + "test_acc": 0.01, + "lyapunov": 1.6050951605867547, + "grad_norm": 0.14029597054344972, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 177.6260485649109 + }, + { + "epoch": 134, + "train_loss": 4.898020515136719, + "train_acc": 0.00954, + "test_loss": 4.837333515167236, + "test_acc": 0.01, + "lyapunov": 1.609246312199956, + "grad_norm": 0.14357714581869627, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 177.584956407547 + }, + { + "epoch": 135, + "train_loss": 4.895735731048584, + "train_acc": 0.0092, + "test_loss": 4.8159059692382815, + "test_acc": 0.01, + "lyapunov": 1.6042115407831528, + "grad_norm": 0.14076247756947305, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 177.55930995941162 + }, + { + "epoch": 136, + "train_loss": 4.899449185333252, + "train_acc": 0.01, + "test_loss": 4.8122740142822265, + "test_acc": 0.01, + "lyapunov": 1.61043234645863, + "grad_norm": 0.19068368741616817, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 177.60587310791016 + }, + { + "epoch": 137, + "train_loss": 4.895413861694336, + "train_acc": 0.0092, + "test_loss": 4.812394242858887, + "test_acc": 0.01, + "lyapunov": 1.6033874640379415, + "grad_norm": 0.5123554678520819, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 177.5866892337799 + }, + { + "epoch": 138, + "train_loss": 4.897919689941406, + "train_acc": 0.01, + "test_loss": 4.824399436187744, + "test_acc": 0.01, + "lyapunov": 1.60939773604693, + "grad_norm": 0.42554152230186504, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 177.5575873851776 + }, + { + "epoch": 139, + "train_loss": 4.896585512237549, + "train_acc": 0.0096, + "test_loss": 4.813831822967529, + "test_acc": 0.01, + "lyapunov": 1.6059378885552096, + "grad_norm": 0.40395815580062067, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 177.5689401626587 + }, + { + "epoch": 140, + "train_loss": 4.896397541656494, + "train_acc": 0.01, + "test_loss": 4.813830749511719, + "test_acc": 0.01, + "lyapunov": 1.6058773750539326, + "grad_norm": 0.3517546520670756, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 177.56592845916748 + }, + { + "epoch": 141, + "train_loss": 4.897689798278809, + "train_acc": 0.00908, + "test_loss": 4.809725570678711, + "test_acc": 0.01, + "lyapunov": 1.6086021369070653, + "grad_norm": 0.34730980637645387, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 177.57834815979004 + }, + { + "epoch": 142, + "train_loss": 4.897065491943359, + "train_acc": 0.00946, + "test_loss": 4.804353742218018, + "test_acc": 0.01, + "lyapunov": 1.6070060754371116, + "grad_norm": 0.34991199227840564, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 177.5697898864746 + }, + { + "epoch": 143, + "train_loss": 4.895145080566406, + "train_acc": 0.00966, + "test_loss": 4.821014101409912, + "test_acc": 0.01, + "lyapunov": 1.6025798217110012, + "grad_norm": 0.3468579023438424, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 177.62174582481384 + }, + { + "epoch": 144, + "train_loss": 4.895165930786133, + "train_acc": 0.00984, + "test_loss": 4.800519823455811, + "test_acc": 0.01, + "lyapunov": 1.602697217860795, + "grad_norm": 0.34813989460737055, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 177.58397316932678 + }, + { + "epoch": 145, + "train_loss": 4.896360063476562, + "train_acc": 0.01, + "test_loss": 4.800519633483887, + "test_acc": 0.01, + "lyapunov": 1.605867438913916, + "grad_norm": 0.3366340618642584, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 177.5893211364746 + }, + { + "epoch": 146, + "train_loss": 4.894688441314697, + "train_acc": 0.01, + "test_loss": 4.800520404052734, + "test_acc": 0.01, + "lyapunov": 1.6013682687374027, + "grad_norm": 0.3310266277326936, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 177.56866335868835 + }, + { + "epoch": 147, + "train_loss": 4.894518559265137, + "train_acc": 0.01, + "test_loss": 4.8005200927734375, + "test_acc": 0.01, + "lyapunov": 1.600981123307172, + "grad_norm": 0.3451840089468246, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 177.56436419487 + }, + { + "epoch": 148, + "train_loss": 4.895737046356201, + "train_acc": 0.01, + "test_loss": 4.800520344543457, + "test_acc": 0.01, + "lyapunov": 1.6043054953865383, + "grad_norm": 0.3208172451267627, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 177.5520420074463 + }, + { + "epoch": 149, + "train_loss": 4.894163135528564, + "train_acc": 0.01, + "test_loss": 4.800520320892334, + "test_acc": 0.01, + "lyapunov": 1.5999351096580097, + "grad_norm": 0.32420799089770896, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 177.6083221435547 + }, + { + "epoch": 150, + "train_loss": 4.892976047668457, + "train_acc": 0.01, + "test_loss": 4.8005203384399415, + "test_acc": 0.01, + "lyapunov": 1.596442692724945, + "grad_norm": 0.32157877988197864, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 177.66009068489075 + } + ] + } +} \ No newline at end of file -- cgit v1.2.3