diff options
| author | YurenHao0426 <blackhao0426@gmail.com> | 2026-01-13 23:49:05 -0600 |
|---|---|---|
| committer | YurenHao0426 <blackhao0426@gmail.com> | 2026-01-13 23:49:05 -0600 |
| commit | cd99d6b874d9d09b3bb87b8485cc787885af71f1 (patch) | |
| tree | 59a233959932ca0e4f12f196275e07fcf443b33f /runs/depth_scaling/cifar100_20251230-213033 | |
init commit
Diffstat (limited to 'runs/depth_scaling/cifar100_20251230-213033')
| -rw-r--r-- | runs/depth_scaling/cifar100_20251230-213033/config.json | 21 | ||||
| -rw-r--r-- | runs/depth_scaling/cifar100_20251230-213033/results.json | 21026 |
2 files changed, 21047 insertions, 0 deletions
diff --git a/runs/depth_scaling/cifar100_20251230-213033/config.json b/runs/depth_scaling/cifar100_20251230-213033/config.json new file mode 100644 index 0000000..1ccfe37 --- /dev/null +++ b/runs/depth_scaling/cifar100_20251230-213033/config.json @@ -0,0 +1,21 @@ +{ + "dataset": "cifar100", + "depths": [ + 4, + 8, + 12, + 16, + 20 + ], + "T": 4, + "epochs": 150, + "batch_size": 128, + "lr": 0.001, + "lambda_reg": 0.3, + "lambda_target": -0.1, + "data_dir": "./data", + "out_dir": "runs/depth_scaling", + "device": "cuda", + "seed": 42, + "no_progress": false +}
\ No newline at end of file diff --git a/runs/depth_scaling/cifar100_20251230-213033/results.json b/runs/depth_scaling/cifar100_20251230-213033/results.json new file mode 100644 index 0000000..160dc74 --- /dev/null +++ b/runs/depth_scaling/cifar100_20251230-213033/results.json @@ -0,0 +1,21026 @@ +{ + "vanilla": { + "4": [ + { + "epoch": 1, + "train_loss": 4.346117241363525, + "train_acc": 0.09834, + "test_loss": 3.550243005371094, + "test_acc": 0.1705, + "lyapunov": null, + "grad_norm": 6.371099905681965, + "grad_max_sv": 5.004546135663986, + "grad_min_sv": 1.1479638856171093e-07, + "grad_condition": 101906528.03771546, + "lr": 0.0009998903417374227, + "time_sec": 16.05687952041626 + }, + { + "epoch": 2, + "train_loss": 3.5102988652038576, + "train_acc": 0.18534, + "test_loss": 3.5716390384674073, + "test_acc": 0.2002, + "lyapunov": null, + "grad_norm": 4.572810771811442, + "grad_max_sv": 3.3247465908527376, + "grad_min_sv": 8.398422393085526e-08, + "grad_condition": 76227232.13894418, + "lr": 0.0009995614150494292, + "time_sec": 15.448272466659546 + }, + { + "epoch": 3, + "train_loss": 3.054396768722534, + "train_acc": 0.25274, + "test_loss": 2.993664514160156, + "test_acc": 0.2763, + "lyapunov": null, + "grad_norm": 3.5860981037463016, + "grad_max_sv": 2.402756503224373, + "grad_min_sv": 6.775348947440918e-08, + "grad_condition": 42769838.6817436, + "lr": 0.0009990133642141358, + "time_sec": 15.465861558914185 + }, + { + "epoch": 4, + "train_loss": 2.722675824432373, + "train_acc": 0.3136, + "test_loss": 2.728995104598999, + "test_acc": 0.3281, + "lyapunov": null, + "grad_norm": 2.9852975671602957, + "grad_max_sv": 1.8682193964719773, + "grad_min_sv": 5.5938930086305014e-08, + "grad_condition": 328348281.0445617, + "lr": 0.0009982464296247522, + "time_sec": 15.43475079536438 + }, + { + "epoch": 5, + "train_loss": 2.508175393676758, + "train_acc": 0.3569, + "test_loss": 3.419650896835327, + "test_acc": 0.2461, + "lyapunov": null, + "grad_norm": 2.6358092556880783, + "grad_max_sv": 1.6064732760190963, + "grad_min_sv": 4.9754905795396096e-08, + "grad_condition": 44385388.81342572, + "lr": 0.0009972609476841367, + "time_sec": 15.444115400314331 + }, + { + "epoch": 6, + "train_loss": 2.3319723847961424, + "train_acc": 0.39276, + "test_loss": 2.5260577701568603, + "test_acc": 0.373, + "lyapunov": null, + "grad_norm": 2.4120452283895926, + "grad_max_sv": 1.3716692090034486, + "grad_min_sv": 4.6226219474476696e-08, + "grad_condition": 36175494.06179842, + "lr": 0.000996057350657239, + "time_sec": 15.43784475326538 + }, + { + "epoch": 7, + "train_loss": 2.190326895675659, + "train_acc": 0.42378, + "test_loss": 2.579724459838867, + "test_acc": 0.3695, + "lyapunov": null, + "grad_norm": 2.2437900964501787, + "grad_max_sv": 1.2385427325963974, + "grad_min_sv": 4.28970178392718e-08, + "grad_condition": 190661418.56414273, + "lr": 0.000994636166481494, + "time_sec": 15.455140829086304 + }, + { + "epoch": 8, + "train_loss": 2.070303360748291, + "train_acc": 0.44962, + "test_loss": 2.7414955226898194, + "test_acc": 0.3392, + "lyapunov": null, + "grad_norm": 2.0940271772848607, + "grad_max_sv": 1.1511073380708694, + "grad_min_sv": 4.056795894439441e-08, + "grad_condition": 707337590.06387, + "lr": 0.0009929980185352525, + "time_sec": 15.463218450546265 + }, + { + "epoch": 9, + "train_loss": 1.9642453713607788, + "train_acc": 0.47356, + "test_loss": 2.222684016609192, + "test_acc": 0.4312, + "lyapunov": null, + "grad_norm": 1.964494515952547, + "grad_max_sv": 1.0273158520460128, + "grad_min_sv": 3.78966669392633e-08, + "grad_condition": 428475326.2676049, + "lr": 0.0009911436253643444, + "time_sec": 15.443583011627197 + }, + { + "epoch": 10, + "train_loss": 1.8679190033721924, + "train_acc": 0.49384, + "test_loss": 2.2569959682464598, + "test_acc": 0.4227, + "lyapunov": null, + "grad_norm": 1.863426925292341, + "grad_max_sv": 0.9406855523586273, + "grad_min_sv": 3.563859525823609e-08, + "grad_condition": 44606817.73724544, + "lr": 0.0009890738003669028, + "time_sec": 15.442885637283325 + }, + { + "epoch": 11, + "train_loss": 1.7814382321929931, + "train_acc": 0.51302, + "test_loss": 2.504388472366333, + "test_acc": 0.3946, + "lyapunov": null, + "grad_norm": 1.7723102238636992, + "grad_max_sv": 0.8945659548044205, + "grad_min_sv": 3.425328631706526e-08, + "grad_condition": 109308981.21335419, + "lr": 0.00098678945143658, + "time_sec": 15.459418535232544 + }, + { + "epoch": 12, + "train_loss": 1.7159840296936035, + "train_acc": 0.53146, + "test_loss": 2.508260029220581, + "test_acc": 0.3935, + "lyapunov": null, + "grad_norm": 1.686140929704303, + "grad_max_sv": 0.8295574262738228, + "grad_min_sv": 3.2012488864613386e-08, + "grad_condition": 89179142.85485055, + "lr": 0.0009842915805643154, + "time_sec": 15.439209461212158 + }, + { + "epoch": 13, + "train_loss": 1.6503846585845947, + "train_acc": 0.54474, + "test_loss": 2.1456974792480468, + "test_acc": 0.4502, + "lyapunov": null, + "grad_norm": 1.619802250264676, + "grad_max_sv": 0.7797225803136826, + "grad_min_sv": 3.0749212220730626e-08, + "grad_condition": 285444721.0869424, + "lr": 0.000981581283398829, + "time_sec": 15.433976173400879 + }, + { + "epoch": 14, + "train_loss": 1.5905582858276368, + "train_acc": 0.5585, + "test_loss": 2.3602350467681883, + "test_acc": 0.4172, + "lyapunov": null, + "grad_norm": 1.5586059487347217, + "grad_max_sv": 0.7570723682641983, + "grad_min_sv": 2.990113052159238e-08, + "grad_condition": 33337603.41083364, + "lr": 0.0009786597487660333, + "time_sec": 15.430689811706543 + }, + { + "epoch": 15, + "train_loss": 1.5257548734283448, + "train_acc": 0.57394, + "test_loss": 2.2596036737442016, + "test_acc": 0.4401, + "lyapunov": null, + "grad_norm": 1.494958992831554, + "grad_max_sv": 0.7011767938733101, + "grad_min_sv": 2.8093294829334425e-08, + "grad_condition": 215948380.66679326, + "lr": 0.0009755282581475766, + "time_sec": 15.445661544799805 + }, + { + "epoch": 16, + "train_loss": 1.4769169562911988, + "train_acc": 0.58454, + "test_loss": 2.1792555765151977, + "test_acc": 0.4464, + "lyapunov": null, + "grad_norm": 1.4433947117799557, + "grad_max_sv": 0.6677212715148926, + "grad_min_sv": 2.683760501054344e-08, + "grad_condition": 45818352.96134277, + "lr": 0.0009721881851187403, + "time_sec": 15.456706523895264 + }, + { + "epoch": 17, + "train_loss": 1.429377403755188, + "train_acc": 0.5973, + "test_loss": 1.954601181793213, + "test_acc": 0.4919, + "lyapunov": null, + "grad_norm": 1.402899746172417, + "grad_max_sv": 0.6569379523396492, + "grad_min_sv": 2.6772942612884876e-08, + "grad_condition": 33425629.606939513, + "lr": 0.0009686409947459456, + "time_sec": 15.437876462936401 + }, + { + "epoch": 18, + "train_loss": 1.3954533521652221, + "train_acc": 0.60348, + "test_loss": 2.0381541999816895, + "test_acc": 0.4877, + "lyapunov": null, + "grad_norm": 1.3646767773598742, + "grad_max_sv": 0.6277542792260646, + "grad_min_sv": 2.5360278501545055e-08, + "grad_condition": 1276893214.2885015, + "lr": 0.0009648882429441254, + "time_sec": 15.442293643951416 + }, + { + "epoch": 19, + "train_loss": 1.34601386013031, + "train_acc": 0.61788, + "test_loss": 2.016515805435181, + "test_acc": 0.4879, + "lyapunov": null, + "grad_norm": 1.3307426948998278, + "grad_max_sv": 0.6192222326993942, + "grad_min_sv": 2.5143750027184496e-08, + "grad_condition": 86894504.02450311, + "lr": 0.00096093157579425, + "time_sec": 15.452877044677734 + }, + { + "epoch": 20, + "train_loss": 1.3103528637313844, + "train_acc": 0.6263, + "test_loss": 1.9570331373214722, + "test_acc": 0.5034, + "lyapunov": null, + "grad_norm": 1.3019068672950393, + "grad_max_sv": 0.5866124749183654, + "grad_min_sv": 2.432551227254942e-08, + "grad_condition": 79675782.79073408, + "lr": 0.0009567727288213001, + "time_sec": 15.442177057266235 + }, + { + "epoch": 21, + "train_loss": 1.2698568128204346, + "train_acc": 0.6344, + "test_loss": 2.4308045747756957, + "test_acc": 0.4364, + "lyapunov": null, + "grad_norm": 1.268768380545349, + "grad_max_sv": 0.5797948583960533, + "grad_min_sv": 2.4104086050920348e-08, + "grad_condition": 252776511.74393004, + "lr": 0.0009524135262330095, + "time_sec": 15.434435844421387 + }, + { + "epoch": 22, + "train_loss": 1.2418579862976074, + "train_acc": 0.64312, + "test_loss": 2.0848071727752684, + "test_acc": 0.4867, + "lyapunov": null, + "grad_norm": 1.2415784803203374, + "grad_max_sv": 0.5592644922435284, + "grad_min_sv": 2.333180208254765e-08, + "grad_condition": 407593245.7962709, + "lr": 0.0009478558801197061, + "time_sec": 15.460945129394531 + }, + { + "epoch": 23, + "train_loss": 1.2006691330718995, + "train_acc": 0.65526, + "test_loss": 2.041600823402405, + "test_acc": 0.4981, + "lyapunov": null, + "grad_norm": 1.2102718857806654, + "grad_max_sv": 0.5479752145707607, + "grad_min_sv": 2.2646243507534748e-08, + "grad_condition": 185681115.951604, + "lr": 0.000943101789615607, + "time_sec": 15.44005274772644 + }, + { + "epoch": 24, + "train_loss": 1.172968614616394, + "train_acc": 0.66154, + "test_loss": 1.9552119861602784, + "test_acc": 0.513, + "lyapunov": null, + "grad_norm": 1.1987019399549284, + "grad_max_sv": 0.5312893047928811, + "grad_min_sv": 2.1980094488081857e-08, + "grad_condition": 1318897337.4819613, + "lr": 0.0009381533400219313, + "time_sec": 15.440562009811401 + }, + { + "epoch": 25, + "train_loss": 1.1449218238067627, + "train_acc": 0.6641, + "test_loss": 2.128752773284912, + "test_acc": 0.4906, + "lyapunov": null, + "grad_norm": 1.1778317272519585, + "grad_max_sv": 0.5174455069005489, + "grad_min_sv": 2.167262270237613e-08, + "grad_condition": 94067067.14088301, + "lr": 0.0009330127018922189, + "time_sec": 15.443851232528687 + }, + { + "epoch": 26, + "train_loss": 1.1113452094268799, + "train_acc": 0.67438, + "test_loss": 1.8866374584197998, + "test_acc": 0.5238, + "lyapunov": null, + "grad_norm": 1.1514970963524438, + "grad_max_sv": 0.5059572130441665, + "grad_min_sv": 2.105146406777836e-08, + "grad_condition": 50748348.81685668, + "lr": 0.000927682130080253, + "time_sec": 15.436878681182861 + }, + { + "epoch": 27, + "train_loss": 1.0829708759689332, + "train_acc": 0.68438, + "test_loss": 1.9943335615158082, + "test_acc": 0.5124, + "lyapunov": null, + "grad_norm": 1.1319771840855883, + "grad_max_sv": 0.4948433578014374, + "grad_min_sv": 2.0725160652934616e-08, + "grad_condition": 77507476.80554287, + "lr": 0.0009221639627510072, + "time_sec": 15.441301822662354 + }, + { + "epoch": 28, + "train_loss": 1.0513020403671265, + "train_acc": 0.6904, + "test_loss": 1.9359693916320801, + "test_acc": 0.5214, + "lyapunov": null, + "grad_norm": 1.1163749465170618, + "grad_max_sv": 0.48814368024468424, + "grad_min_sv": 2.0212865362197185e-08, + "grad_condition": 298941066.3217323, + "lr": 0.0009164606203550494, + "time_sec": 15.441382646560669 + }, + { + "epoch": 29, + "train_loss": 1.029607636756897, + "train_acc": 0.69482, + "test_loss": 1.8560630758285523, + "test_acc": 0.5431, + "lyapunov": null, + "grad_norm": 1.0928580221633342, + "grad_max_sv": 0.5047290526330471, + "grad_min_sv": 2.040681175013992e-08, + "grad_condition": 48855533.517919585, + "lr": 0.0009105746045668516, + "time_sec": 15.460914373397827 + }, + { + "epoch": 30, + "train_loss": 1.0061684103393556, + "train_acc": 0.70324, + "test_loss": 1.8417754476547241, + "test_acc": 0.5501, + "lyapunov": null, + "grad_norm": 1.0821004976322715, + "grad_max_sv": 0.4740450643002987, + "grad_min_sv": 1.9723761995882327e-08, + "grad_condition": 57054017.19113614, + "lr": 0.0009045084971874733, + "time_sec": 15.458839178085327 + }, + { + "epoch": 31, + "train_loss": 0.9935745064163208, + "train_acc": 0.70312, + "test_loss": 1.9427630338668824, + "test_acc": 0.522, + "lyapunov": null, + "grad_norm": 1.0722093249603526, + "grad_max_sv": 0.46733852848410606, + "grad_min_sv": 1.9939205435706707e-08, + "grad_condition": 112229781.98396464, + "lr": 0.0008982649590120977, + "time_sec": 15.452664375305176 + }, + { + "epoch": 32, + "train_loss": 0.9721898876953124, + "train_acc": 0.70988, + "test_loss": 1.9291723361968993, + "test_acc": 0.5365, + "lyapunov": null, + "grad_norm": 1.0493640798096933, + "grad_max_sv": 0.451675596088171, + "grad_min_sv": 1.9157993355872065e-08, + "grad_condition": 369697835.9253775, + "lr": 0.0008918467286629196, + "time_sec": 15.447975158691406 + }, + { + "epoch": 33, + "train_loss": 0.9359502591705322, + "train_acc": 0.71948, + "test_loss": 1.8434128448486329, + "test_acc": 0.544, + "lyapunov": null, + "grad_norm": 1.0350388755850537, + "grad_max_sv": 0.4494323328137398, + "grad_min_sv": 1.8973058482987804e-08, + "grad_condition": 171928795.69725567, + "lr": 0.0008852566213878943, + "time_sec": 15.466245889663696 + }, + { + "epoch": 34, + "train_loss": 0.9224456702995301, + "train_acc": 0.72168, + "test_loss": 1.9599631881713868, + "test_acc": 0.5373, + "lyapunov": null, + "grad_norm": 1.0242311025233581, + "grad_max_sv": 0.44513428434729574, + "grad_min_sv": 1.8523945613654545e-08, + "grad_condition": 888195654.0727282, + "lr": 0.000878497527825878, + "time_sec": 15.461785316467285 + }, + { + "epoch": 35, + "train_loss": 0.9021567019844056, + "train_acc": 0.72618, + "test_loss": 1.9999154584884644, + "test_acc": 0.5252, + "lyapunov": null, + "grad_norm": 1.0039865896001459, + "grad_max_sv": 0.43928237855434416, + "grad_min_sv": 1.8592035315456722e-08, + "grad_condition": 59743908.57133106, + "lr": 0.000871572412738697, + "time_sec": 15.456985473632812 + }, + { + "epoch": 36, + "train_loss": 0.873283097190857, + "train_acc": 0.73628, + "test_loss": 1.982330265045166, + "test_acc": 0.5279, + "lyapunov": null, + "grad_norm": 0.9875825554026111, + "grad_max_sv": 0.42813498005270956, + "grad_min_sv": 1.7983777930719037e-08, + "grad_condition": 38527409.79900636, + "lr": 0.0008644843137107055, + "time_sec": 15.460105419158936 + }, + { + "epoch": 37, + "train_loss": 0.855709279346466, + "train_acc": 0.74242, + "test_loss": 1.9136155584335328, + "test_acc": 0.5472, + "lyapunov": null, + "grad_norm": 0.9742310219337682, + "grad_max_sv": 0.4270216949284077, + "grad_min_sv": 1.8125810764824114e-08, + "grad_condition": 40840950.73216411, + "lr": 0.0008572363398164014, + "time_sec": 15.459755897521973 + }, + { + "epoch": 38, + "train_loss": 0.8404359550476074, + "train_acc": 0.74404, + "test_loss": 1.9389733367919921, + "test_acc": 0.543, + "lyapunov": null, + "grad_norm": 0.9722202503028375, + "grad_max_sv": 0.42485796511173246, + "grad_min_sv": 1.783134123689578e-08, + "grad_condition": 35194167.51271446, + "lr": 0.0008498316702566826, + "time_sec": 15.465211629867554 + }, + { + "epoch": 39, + "train_loss": 0.8240101078987122, + "train_acc": 0.7481, + "test_loss": 1.8307217979431152, + "test_acc": 0.5614, + "lyapunov": null, + "grad_norm": 0.9595502877351665, + "grad_max_sv": 0.42209447696805, + "grad_min_sv": 1.767885368514355e-08, + "grad_condition": 49656386.85866156, + "lr": 0.0008422735529643442, + "time_sec": 15.455949544906616 + }, + { + "epoch": 40, + "train_loss": 0.8046207006645203, + "train_acc": 0.75466, + "test_loss": 1.850761813545227, + "test_acc": 0.5635, + "lyapunov": null, + "grad_norm": 0.9479757240987767, + "grad_max_sv": 0.4134661167860031, + "grad_min_sv": 1.7007238412025672e-08, + "grad_condition": 126702887.42727256, + "lr": 0.0008345653031794289, + "time_sec": 15.462433099746704 + }, + { + "epoch": 41, + "train_loss": 0.7895244974899291, + "train_acc": 0.7586, + "test_loss": 1.8032215663909912, + "test_acc": 0.5672, + "lyapunov": null, + "grad_norm": 0.9378242670136524, + "grad_max_sv": 0.3964280657470226, + "grad_min_sv": 1.6944396442897246e-08, + "grad_condition": 56052359.18882908, + "lr": 0.0008267103019950526, + "time_sec": 15.461899757385254 + }, + { + "epoch": 42, + "train_loss": 0.7817759350585938, + "train_acc": 0.76056, + "test_loss": 1.8505826110839845, + "test_acc": 0.5582, + "lyapunov": null, + "grad_norm": 0.9337187835649021, + "grad_max_sv": 0.40529350489377974, + "grad_min_sv": 1.6676117367206422e-08, + "grad_condition": 104849301.5445062, + "lr": 0.0008187119948743447, + "time_sec": 15.4581778049469 + }, + { + "epoch": 43, + "train_loss": 0.7522177431297302, + "train_acc": 0.77, + "test_loss": 1.8242130517959594, + "test_acc": 0.5664, + "lyapunov": null, + "grad_norm": 0.9099555522847652, + "grad_max_sv": 0.3934644728899002, + "grad_min_sv": 1.6434511908997028e-08, + "grad_condition": 61342068.969211556, + "lr": 0.000810573890139155, + "time_sec": 15.447810411453247 + }, + { + "epoch": 44, + "train_loss": 0.7323650365447998, + "train_acc": 0.77464, + "test_loss": 1.8068662160873412, + "test_acc": 0.5687, + "lyapunov": null, + "grad_norm": 0.9037556138602378, + "grad_max_sv": 0.38610322400927544, + "grad_min_sv": 1.6304181772903992e-08, + "grad_condition": 167736758.90882486, + "lr": 0.0008022995574311873, + "time_sec": 15.458601951599121 + }, + { + "epoch": 45, + "train_loss": 0.7159886347198486, + "train_acc": 0.77928, + "test_loss": 1.8823264539718627, + "test_acc": 0.5645, + "lyapunov": null, + "grad_norm": 0.8924866037240323, + "grad_max_sv": 0.3947519548237324, + "grad_min_sv": 1.6336485028634052e-08, + "grad_condition": 69167052.26120928, + "lr": 0.0007938926261462363, + "time_sec": 15.471583843231201 + }, + { + "epoch": 46, + "train_loss": 0.7136952446365357, + "train_acc": 0.78054, + "test_loss": 1.7574677402496337, + "test_acc": 0.5825, + "lyapunov": null, + "grad_norm": 0.8931942393361509, + "grad_max_sv": 0.37973910570144653, + "grad_min_sv": 1.6153765381235476e-08, + "grad_condition": 489329276.9292526, + "lr": 0.0007853567838422158, + "time_sec": 15.471785068511963 + }, + { + "epoch": 47, + "train_loss": 0.6837898429489135, + "train_acc": 0.78762, + "test_loss": 1.813544430541992, + "test_acc": 0.5725, + "lyapunov": null, + "grad_norm": 0.8815821036419627, + "grad_max_sv": 0.3751175247132778, + "grad_min_sv": 1.5766544728818e-08, + "grad_condition": 56980767.9665909, + "lr": 0.0007766957746216719, + "time_sec": 15.457926750183105 + }, + { + "epoch": 48, + "train_loss": 0.6856673602676392, + "train_acc": 0.78888, + "test_loss": 1.990400904083252, + "test_acc": 0.5508, + "lyapunov": null, + "grad_norm": 0.8744462547536074, + "grad_max_sv": 0.3799706071615219, + "grad_min_sv": 1.6096928557272904e-08, + "grad_condition": 303945380.88277286, + "lr": 0.0007679133974894982, + "time_sec": 15.456810712814331 + }, + { + "epoch": 49, + "train_loss": 0.667086083278656, + "train_acc": 0.792, + "test_loss": 1.8513258657455445, + "test_acc": 0.5727, + "lyapunov": null, + "grad_norm": 0.8677773875250141, + "grad_max_sv": 0.3783408857882023, + "grad_min_sv": 1.5666924351245835e-08, + "grad_condition": 353923080.3313891, + "lr": 0.000759013504686565, + "time_sec": 15.462752342224121 + }, + { + "epoch": 50, + "train_loss": 0.6466483051490783, + "train_acc": 0.79742, + "test_loss": 2.043276873779297, + "test_acc": 0.5419, + "lyapunov": null, + "grad_norm": 0.8555816651124006, + "grad_max_sv": 0.3675771526992321, + "grad_min_sv": 1.5045219146090152e-08, + "grad_condition": 536508015.45004594, + "lr": 0.0007499999999999998, + "time_sec": 15.458629846572876 + }, + { + "epoch": 51, + "train_loss": 0.6258693974494934, + "train_acc": 0.80236, + "test_loss": 1.954080751991272, + "test_acc": 0.5622, + "lyapunov": null, + "grad_norm": 0.8469179426728266, + "grad_max_sv": 0.377849230915308, + "grad_min_sv": 1.5333696528480045e-08, + "grad_condition": 117912957.37628272, + "lr": 0.0007408768370508575, + "time_sec": 15.46766972541809 + }, + { + "epoch": 52, + "train_loss": 0.6236670018768311, + "train_acc": 0.80516, + "test_loss": 1.8472453788757324, + "test_acc": 0.5858, + "lyapunov": null, + "grad_norm": 0.8404179479578597, + "grad_max_sv": 0.3541756056249142, + "grad_min_sv": 1.5022051764665422e-08, + "grad_condition": 129884434.5908782, + "lr": 0.0007316480175599307, + "time_sec": 15.461432695388794 + }, + { + "epoch": 53, + "train_loss": 0.6075375831794739, + "train_acc": 0.80952, + "test_loss": 1.9628248615264892, + "test_acc": 0.5673, + "lyapunov": null, + "grad_norm": 0.8367502172326149, + "grad_max_sv": 0.3639704927802086, + "grad_min_sv": 1.532564684603166e-08, + "grad_condition": 35699441.49240203, + "lr": 0.0007223175895924635, + "time_sec": 15.46337342262268 + }, + { + "epoch": 54, + "train_loss": 0.5996641965866089, + "train_acc": 0.81216, + "test_loss": 1.8179010778427125, + "test_acc": 0.5843, + "lyapunov": null, + "grad_norm": 0.8307418709294171, + "grad_max_sv": 0.3613003775477409, + "grad_min_sv": 1.4895932505510321e-08, + "grad_condition": 875528249.2472179, + "lr": 0.0007128896457825361, + "time_sec": 15.465355396270752 + }, + { + "epoch": 55, + "train_loss": 0.5882498831176758, + "train_acc": 0.81494, + "test_loss": 1.8813747344970704, + "test_acc": 0.582, + "lyapunov": null, + "grad_norm": 0.8235931888813899, + "grad_max_sv": 0.3551651187241077, + "grad_min_sv": 1.469800572865415e-08, + "grad_condition": 484027587.3941019, + "lr": 0.0007033683215378998, + "time_sec": 15.460170984268188 + }, + { + "epoch": 56, + "train_loss": 0.5707145217132569, + "train_acc": 0.82072, + "test_loss": 1.840101174545288, + "test_acc": 0.5813, + "lyapunov": null, + "grad_norm": 0.8086603393569909, + "grad_max_sv": 0.34960880503058434, + "grad_min_sv": 1.4356627959719037e-08, + "grad_condition": 198153063.82803452, + "lr": 0.0006937577932260512, + "time_sec": 15.455865383148193 + }, + { + "epoch": 57, + "train_loss": 0.5646172902584076, + "train_acc": 0.82002, + "test_loss": 1.8341705081939697, + "test_acc": 0.5873, + "lyapunov": null, + "grad_norm": 0.810642435475112, + "grad_max_sv": 0.3562955237925053, + "grad_min_sv": 1.4607543052502087e-08, + "grad_condition": 226679350.92895135, + "lr": 0.0006840622763423388, + "time_sec": 15.474364757537842 + }, + { + "epoch": 58, + "train_loss": 0.5469015620231629, + "train_acc": 0.82858, + "test_loss": 1.9427689083099364, + "test_acc": 0.5739, + "lyapunov": null, + "grad_norm": 0.7944800992028263, + "grad_max_sv": 0.33950445652008054, + "grad_min_sv": 1.368517551399162e-08, + "grad_condition": 347795127.79131866, + "lr": 0.0006742860236609073, + "time_sec": 15.464811563491821 + }, + { + "epoch": 59, + "train_loss": 0.5445322315883636, + "train_acc": 0.82716, + "test_loss": 1.8801843715667725, + "test_acc": 0.5792, + "lyapunov": null, + "grad_norm": 0.7916664309528131, + "grad_max_sv": 0.3434500187635422, + "grad_min_sv": 1.4393026628520266e-08, + "grad_condition": 315625887.3364844, + "lr": 0.0006644333233692913, + "time_sec": 15.463439702987671 + }, + { + "epoch": 60, + "train_loss": 0.5323922993850708, + "train_acc": 0.8299, + "test_loss": 1.9002599145889283, + "test_acc": 0.5809, + "lyapunov": null, + "grad_norm": 0.7870533377985126, + "grad_max_sv": 0.34093547612428665, + "grad_min_sv": 1.4214920851518542e-08, + "grad_condition": 91722689.16411342, + "lr": 0.0006545084971874734, + "time_sec": 15.450496912002563 + }, + { + "epoch": 61, + "train_loss": 0.519907633266449, + "train_acc": 0.83526, + "test_loss": 1.9299441148757934, + "test_acc": 0.5794, + "lyapunov": null, + "grad_norm": 0.7766553414478388, + "grad_max_sv": 0.3247631438076496, + "grad_min_sv": 1.3660971805162792e-08, + "grad_condition": 158255223.31341702, + "lr": 0.0006445158984722354, + "time_sec": 15.486064910888672 + }, + { + "epoch": 62, + "train_loss": 0.5158719365882873, + "train_acc": 0.83688, + "test_loss": 1.8924803583145142, + "test_acc": 0.5838, + "lyapunov": null, + "grad_norm": 0.7769879212152438, + "grad_max_sv": 0.34014692306518557, + "grad_min_sv": 1.4163850685366964e-08, + "grad_condition": 69424987.38028774, + "lr": 0.0006344599103076324, + "time_sec": 15.469778776168823 + }, + { + "epoch": 63, + "train_loss": 0.5016013371658326, + "train_acc": 0.83886, + "test_loss": 1.9557724254608155, + "test_acc": 0.578, + "lyapunov": null, + "grad_norm": 0.7667097633814496, + "grad_max_sv": 0.3396275587379932, + "grad_min_sv": 1.3258012922148093e-08, + "grad_condition": 246523332.7028369, + "lr": 0.0006243449435824269, + "time_sec": 15.490433692932129 + }, + { + "epoch": 64, + "train_loss": 0.4887677048301697, + "train_acc": 0.84204, + "test_loss": 1.919124504852295, + "test_acc": 0.5841, + "lyapunov": null, + "grad_norm": 0.7573654062297513, + "grad_max_sv": 0.32946483269333837, + "grad_min_sv": 1.3579194014026741e-08, + "grad_condition": 122613286.93525049, + "lr": 0.0006141754350553275, + "time_sec": 15.473332166671753 + }, + { + "epoch": 65, + "train_loss": 0.4757623895263672, + "train_acc": 0.84768, + "test_loss": 1.9984818859100342, + "test_acc": 0.5761, + "lyapunov": null, + "grad_norm": 0.748014318960053, + "grad_max_sv": 0.33319817706942556, + "grad_min_sv": 1.3326467683972414e-08, + "grad_condition": 623990635.8236978, + "lr": 0.0006039558454088793, + "time_sec": 15.485574960708618 + }, + { + "epoch": 66, + "train_loss": 0.4649162304496765, + "train_acc": 0.85152, + "test_loss": 1.9724672309875488, + "test_acc": 0.576, + "lyapunov": null, + "grad_norm": 0.7417116384839675, + "grad_max_sv": 0.3309340290725231, + "grad_min_sv": 1.334454621318426e-08, + "grad_condition": 142248731.7186973, + "lr": 0.000593690657292862, + "time_sec": 15.480328559875488 + }, + { + "epoch": 67, + "train_loss": 0.4583131973075867, + "train_acc": 0.85314, + "test_loss": 1.911379218673706, + "test_acc": 0.5815, + "lyapunov": null, + "grad_norm": 0.737726746568229, + "grad_max_sv": 0.32083366960287096, + "grad_min_sv": 1.2965913287477093e-08, + "grad_condition": 78597953.03928533, + "lr": 0.0005833843733580507, + "time_sec": 15.469099283218384 + }, + { + "epoch": 68, + "train_loss": 0.44331007887840274, + "train_acc": 0.85794, + "test_loss": 1.9728064548492432, + "test_acc": 0.5854, + "lyapunov": null, + "grad_norm": 0.7274207800935486, + "grad_max_sv": 0.3188414238393307, + "grad_min_sv": 1.2804001882360528e-08, + "grad_condition": 55555678.95357393, + "lr": 0.0005730415142812054, + "time_sec": 15.481547117233276 + }, + { + "epoch": 69, + "train_loss": 0.43979987537384035, + "train_acc": 0.85974, + "test_loss": 1.919715219116211, + "test_acc": 0.5884, + "lyapunov": null, + "grad_norm": 0.7242391218539499, + "grad_max_sv": 0.3140024244785309, + "grad_min_sv": 1.275962300552845e-08, + "grad_condition": 326554514.7187793, + "lr": 0.0005626666167821517, + "time_sec": 15.48648977279663 + }, + { + "epoch": 70, + "train_loss": 0.4322844411468506, + "train_acc": 0.86176, + "test_loss": 2.0117150314331056, + "test_acc": 0.5834, + "lyapunov": null, + "grad_norm": 0.7186156540948507, + "grad_max_sv": 0.31351484879851343, + "grad_min_sv": 1.2888502469096674e-08, + "grad_condition": 178788272.1664782, + "lr": 0.0005522642316338265, + "time_sec": 15.48006272315979 + }, + { + "epoch": 71, + "train_loss": 0.42623882338523866, + "train_acc": 0.86272, + "test_loss": 1.9539510818481445, + "test_acc": 0.5875, + "lyapunov": null, + "grad_norm": 0.7137008149677833, + "grad_max_sv": 0.31342701613903046, + "grad_min_sv": 1.2595162532727522e-08, + "grad_condition": 302205097.8444015, + "lr": 0.0005418389216661573, + "time_sec": 15.492274284362793 + }, + { + "epoch": 72, + "train_loss": 0.41300243412017823, + "train_acc": 0.86584, + "test_loss": 1.9104324056625366, + "test_acc": 0.5874, + "lyapunov": null, + "grad_norm": 0.7058331032866322, + "grad_max_sv": 0.3122198607772589, + "grad_min_sv": 1.2484183565045215e-08, + "grad_condition": 249411647.9543108, + "lr": 0.0005313952597646563, + "time_sec": 15.472809076309204 + }, + { + "epoch": 73, + "train_loss": 0.4090885982322693, + "train_acc": 0.86766, + "test_loss": 1.9304109241485596, + "test_acc": 0.5896, + "lyapunov": null, + "grad_norm": 0.7030000923329225, + "grad_max_sv": 0.3075466021895409, + "grad_min_sv": 1.252222159744791e-08, + "grad_condition": 331808797.86113906, + "lr": 0.0005209378268645994, + "time_sec": 15.497188806533813 + }, + { + "epoch": 74, + "train_loss": 0.40033238063812254, + "train_acc": 0.87144, + "test_loss": 1.985810231399536, + "test_acc": 0.5849, + "lyapunov": null, + "grad_norm": 0.6995855816146154, + "grad_max_sv": 0.31191978715360164, + "grad_min_sv": 1.2527367021682167e-08, + "grad_condition": 263818262.83558512, + "lr": 0.0005104712099416781, + "time_sec": 15.483733892440796 + }, + { + "epoch": 75, + "train_loss": 0.39340143531799315, + "train_acc": 0.87318, + "test_loss": 1.9034859148025514, + "test_acc": 0.5988, + "lyapunov": null, + "grad_norm": 0.6917443264462005, + "grad_max_sv": 0.3097103513777256, + "grad_min_sv": 1.2234487580323195e-08, + "grad_condition": 189402494.46869463, + "lr": 0.0004999999999999996, + "time_sec": 15.491854667663574 + }, + { + "epoch": 76, + "train_loss": 0.38218573943138123, + "train_acc": 0.87562, + "test_loss": 1.9674748405456544, + "test_acc": 0.5897, + "lyapunov": null, + "grad_norm": 0.6848552863949536, + "grad_max_sv": 0.306015183404088, + "grad_min_sv": 1.2231246879906843e-08, + "grad_condition": 67368302.47465871, + "lr": 0.0004895287900583212, + "time_sec": 15.475126504898071 + }, + { + "epoch": 77, + "train_loss": 0.37298857500076293, + "train_acc": 0.8782, + "test_loss": 1.9116508392333984, + "test_acc": 0.5973, + "lyapunov": null, + "grad_norm": 0.676733354734531, + "grad_max_sv": 0.30364411063492297, + "grad_min_sv": 1.2298366306937036e-08, + "grad_condition": 113213891.7010752, + "lr": 0.0004790621731353997, + "time_sec": 15.476521015167236 + }, + { + "epoch": 78, + "train_loss": 0.3701143793487549, + "train_acc": 0.88078, + "test_loss": 2.085685297012329, + "test_acc": 0.5795, + "lyapunov": null, + "grad_norm": 0.6755741762416969, + "grad_max_sv": 0.30699342787265776, + "grad_min_sv": 1.205234841629107e-08, + "grad_condition": 3030668677.964108, + "lr": 0.000468604740235343, + "time_sec": 15.484160423278809 + }, + { + "epoch": 79, + "train_loss": 0.36959360103607175, + "train_acc": 0.87916, + "test_loss": 1.9509956113815308, + "test_acc": 0.601, + "lyapunov": null, + "grad_norm": 0.6757618176434513, + "grad_max_sv": 0.3065595250576735, + "grad_min_sv": 1.2097158442331279e-08, + "grad_condition": 77210703.25088154, + "lr": 0.00045816107833384175, + "time_sec": 15.480469226837158 + }, + { + "epoch": 80, + "train_loss": 0.3621886194419861, + "train_acc": 0.88318, + "test_loss": 1.9287394012451171, + "test_acc": 0.5985, + "lyapunov": null, + "grad_norm": 0.6691339361755074, + "grad_max_sv": 0.3024368964135647, + "grad_min_sv": 1.2120088314785185e-08, + "grad_condition": 405016123.1402856, + "lr": 0.0004477357683661729, + "time_sec": 15.493567705154419 + }, + { + "epoch": 81, + "train_loss": 0.35030229503631594, + "train_acc": 0.88624, + "test_loss": 2.00673182220459, + "test_acc": 0.5919, + "lyapunov": null, + "grad_norm": 0.6596224304671231, + "grad_max_sv": 0.29136806540191174, + "grad_min_sv": 1.127730693450046e-08, + "grad_condition": 1639288832.1236253, + "lr": 0.00043733338321784746, + "time_sec": 15.493369817733765 + }, + { + "epoch": 82, + "train_loss": 0.34493877026557923, + "train_acc": 0.8872, + "test_loss": 2.030837797164917, + "test_acc": 0.5955, + "lyapunov": null, + "grad_norm": 0.656267153049647, + "grad_max_sv": 0.28955256529152396, + "grad_min_sv": 1.1868315586143104e-08, + "grad_condition": 869246762.0746359, + "lr": 0.0004269584857187939, + "time_sec": 15.51423978805542 + }, + { + "epoch": 83, + "train_loss": 0.33515030410289764, + "train_acc": 0.89166, + "test_loss": 2.0619586929321287, + "test_acc": 0.5889, + "lyapunov": null, + "grad_norm": 0.6433611607654642, + "grad_max_sv": 0.28342132121324537, + "grad_min_sv": 1.1435175364601923e-08, + "grad_condition": 62926422.11698373, + "lr": 0.0004166156266419484, + "time_sec": 15.476901769638062 + }, + { + "epoch": 84, + "train_loss": 0.33155179508209226, + "train_acc": 0.8925, + "test_loss": 2.021995645713806, + "test_acc": 0.5931, + "lyapunov": null, + "grad_norm": 0.6432295423646542, + "grad_max_sv": 0.29169376716017725, + "grad_min_sv": 1.1024380705050054e-08, + "grad_condition": 1442816426.8026254, + "lr": 0.0004063093427071373, + "time_sec": 15.489609479904175 + }, + { + "epoch": 85, + "train_loss": 0.32435158078193665, + "train_acc": 0.89488, + "test_loss": 2.013304320335388, + "test_acc": 0.5916, + "lyapunov": null, + "grad_norm": 0.6387569144998656, + "grad_max_sv": 0.29359805807471273, + "grad_min_sv": 1.1595539084474638e-08, + "grad_condition": 189598831.94028363, + "lr": 0.0003960441545911199, + "time_sec": 15.501060247421265 + }, + { + "epoch": 86, + "train_loss": 0.3179238869667053, + "train_acc": 0.89698, + "test_loss": 1.9903604904174805, + "test_acc": 0.5974, + "lyapunov": null, + "grad_norm": 0.6339090393643317, + "grad_max_sv": 0.2939893651753664, + "grad_min_sv": 1.1321056620980375e-08, + "grad_condition": 126309584.77428427, + "lr": 0.0003858245649446718, + "time_sec": 15.473534345626831 + }, + { + "epoch": 87, + "train_loss": 0.3082590392589569, + "train_acc": 0.90084, + "test_loss": 1.9719016357421875, + "test_acc": 0.5973, + "lyapunov": null, + "grad_norm": 0.6204648872897773, + "grad_max_sv": 0.2808060821145773, + "grad_min_sv": 1.1003370339922671e-08, + "grad_condition": 295054731.1552657, + "lr": 0.00037565505641757235, + "time_sec": 15.489596128463745 + }, + { + "epoch": 88, + "train_loss": 0.30407683875083924, + "train_acc": 0.9015, + "test_loss": 2.046679413032532, + "test_acc": 0.5983, + "lyapunov": null, + "grad_norm": 0.6232550099645187, + "grad_max_sv": 0.2919613588601351, + "grad_min_sv": 1.106688122280361e-08, + "grad_condition": 322143674.85252506, + "lr": 0.00036554008969236695, + "time_sec": 15.49986457824707 + }, + { + "epoch": 89, + "train_loss": 0.3027446964073181, + "train_acc": 0.90118, + "test_loss": 2.086252244949341, + "test_acc": 0.5888, + "lyapunov": null, + "grad_norm": 0.6190288324649083, + "grad_max_sv": 0.28052753023803234, + "grad_min_sv": 1.0900322809496467e-08, + "grad_condition": 566479183.315316, + "lr": 0.0003554841015277638, + "time_sec": 15.504590034484863 + }, + { + "epoch": 90, + "train_loss": 0.29228587161064146, + "train_acc": 0.9047, + "test_loss": 2.0138395809173586, + "test_acc": 0.5944, + "lyapunov": null, + "grad_norm": 0.6096912272320082, + "grad_max_sv": 0.28337894156575205, + "grad_min_sv": 1.0885550369042416e-08, + "grad_condition": 2055184394.3102565, + "lr": 0.000345491502812526, + "time_sec": 15.49034571647644 + }, + { + "epoch": 91, + "train_loss": 0.2902773824119568, + "train_acc": 0.9069, + "test_loss": 2.0066411319732667, + "test_acc": 0.6022, + "lyapunov": null, + "grad_norm": 0.6066794741118794, + "grad_max_sv": 0.27967384792864325, + "grad_min_sv": 1.113149796019841e-08, + "grad_condition": 126085093.27825883, + "lr": 0.0003355666766307081, + "time_sec": 15.486260652542114 + }, + { + "epoch": 92, + "train_loss": 0.2833449110221863, + "train_acc": 0.90814, + "test_loss": 2.077221655654907, + "test_acc": 0.5914, + "lyapunov": null, + "grad_norm": 0.6042052133918574, + "grad_max_sv": 0.27325271964073183, + "grad_min_sv": 1.057503346621057e-08, + "grad_condition": 3596600642.934755, + "lr": 0.00032571397633909225, + "time_sec": 15.505445957183838 + }, + { + "epoch": 93, + "train_loss": 0.275921519203186, + "train_acc": 0.91156, + "test_loss": 2.0253973026275633, + "test_acc": 0.6011, + "lyapunov": null, + "grad_norm": 0.596345487343705, + "grad_max_sv": 0.27955980561673643, + "grad_min_sv": 1.0745895713884512e-08, + "grad_condition": 99226565.9342475, + "lr": 0.00031593772365766094, + "time_sec": 15.494666337966919 + }, + { + "epoch": 94, + "train_loss": 0.27615388660430906, + "train_acc": 0.90982, + "test_loss": 2.0751438976287844, + "test_acc": 0.5926, + "lyapunov": null, + "grad_norm": 0.5987218023474344, + "grad_max_sv": 0.27597025111317636, + "grad_min_sv": 1.0580089662877434e-08, + "grad_condition": 377084496.3903383, + "lr": 0.0003062422067739483, + "time_sec": 15.47998309135437 + }, + { + "epoch": 95, + "train_loss": 0.26991701264381407, + "train_acc": 0.9106, + "test_loss": 2.065015655708313, + "test_acc": 0.5995, + "lyapunov": null, + "grad_norm": 0.591359331692498, + "grad_max_sv": 0.280801360309124, + "grad_min_sv": 1.058501965522929e-08, + "grad_condition": 177268235.5442259, + "lr": 0.00029663167846209965, + "time_sec": 15.503370761871338 + }, + { + "epoch": 96, + "train_loss": 0.26606324160575867, + "train_acc": 0.9137, + "test_loss": 2.0547151592254638, + "test_acc": 0.6024, + "lyapunov": null, + "grad_norm": 0.5902198713479344, + "grad_max_sv": 0.2709753967821598, + "grad_min_sv": 1.0618598106555168e-08, + "grad_condition": 842340240.5160465, + "lr": 0.00028711035421746345, + "time_sec": 15.498698949813843 + }, + { + "epoch": 97, + "train_loss": 0.25566293501853943, + "train_acc": 0.91732, + "test_loss": 2.007575707626343, + "test_acc": 0.5994, + "lyapunov": null, + "grad_norm": 0.5817467490050799, + "grad_max_sv": 0.2697387088090181, + "grad_min_sv": 1.025438704743524e-08, + "grad_condition": 463836797.56778467, + "lr": 0.00027768241040753615, + "time_sec": 15.489367485046387 + }, + { + "epoch": 98, + "train_loss": 0.2515622547864914, + "train_acc": 0.91842, + "test_loss": 2.04601014251709, + "test_acc": 0.6008, + "lyapunov": null, + "grad_norm": 0.5794799592204589, + "grad_max_sv": 0.26677791140973567, + "grad_min_sv": 1.029050446439174e-08, + "grad_condition": 588388249.9313815, + "lr": 0.00026835198244006903, + "time_sec": 15.474334001541138 + }, + { + "epoch": 99, + "train_loss": 0.24500514444351196, + "train_acc": 0.92196, + "test_loss": 2.086534292602539, + "test_acc": 0.6033, + "lyapunov": null, + "grad_norm": 0.5694490714138027, + "grad_max_sv": 0.2623301979154348, + "grad_min_sv": 9.966415031648947e-09, + "grad_condition": 1015125356.3291184, + "lr": 0.0002591231629491421, + "time_sec": 15.491194248199463 + }, + { + "epoch": 100, + "train_loss": 0.24579128606796263, + "train_acc": 0.92022, + "test_loss": 2.033238724517822, + "test_acc": 0.6073, + "lyapunov": null, + "grad_norm": 0.5680720755555388, + "grad_max_sv": 0.25963654592633245, + "grad_min_sv": 9.939859338002274e-09, + "grad_condition": 445557731.47806203, + "lr": 0.0002499999999999997, + "time_sec": 15.490838050842285 + }, + { + "epoch": 101, + "train_loss": 0.24127339096069336, + "train_acc": 0.92306, + "test_loss": 2.1002378002166746, + "test_acc": 0.6036, + "lyapunov": null, + "grad_norm": 0.5641906297524981, + "grad_max_sv": 0.27549757733941077, + "grad_min_sv": 1.0068470844863327e-08, + "grad_condition": 409101783.765684, + "lr": 0.00024098649531343477, + "time_sec": 15.490317106246948 + }, + { + "epoch": 102, + "train_loss": 0.2390659130167961, + "train_acc": 0.9225, + "test_loss": 2.0233927448272704, + "test_acc": 0.6081, + "lyapunov": null, + "grad_norm": 0.5658609942304538, + "grad_max_sv": 0.2694991033524275, + "grad_min_sv": 9.839277652549483e-09, + "grad_condition": 3844646046.5289702, + "lr": 0.0002320866025105016, + "time_sec": 15.493839740753174 + }, + { + "epoch": 103, + "train_loss": 0.23365470203876496, + "train_acc": 0.92546, + "test_loss": 2.007601522064209, + "test_acc": 0.6095, + "lyapunov": null, + "grad_norm": 0.5584257053092218, + "grad_max_sv": 0.2743960417807102, + "grad_min_sv": 1.0207792428690299e-08, + "grad_condition": 250547163.15828475, + "lr": 0.0002233042253783278, + "time_sec": 15.469611167907715 + }, + { + "epoch": 104, + "train_loss": 0.22797604578971864, + "train_acc": 0.92666, + "test_loss": 1.9921390232086182, + "test_acc": 0.6104, + "lyapunov": null, + "grad_norm": 0.5477060234172001, + "grad_max_sv": 0.2509814579039812, + "grad_min_sv": 9.610087979301102e-09, + "grad_condition": 2430635198.302944, + "lr": 0.000214643216157784, + "time_sec": 15.485874652862549 + }, + { + "epoch": 105, + "train_loss": 0.2194866455602646, + "train_acc": 0.92896, + "test_loss": 2.065049479866028, + "test_acc": 0.6048, + "lyapunov": null, + "grad_norm": 0.5427601977062464, + "grad_max_sv": 0.24938638992607592, + "grad_min_sv": 9.552283189700334e-09, + "grad_condition": 249820703.92123896, + "lr": 0.00020610737385376332, + "time_sec": 15.492459058761597 + }, + { + "epoch": 106, + "train_loss": 0.22127391705036165, + "train_acc": 0.9277, + "test_loss": 2.0674615295410157, + "test_acc": 0.6066, + "lyapunov": null, + "grad_norm": 0.545565415204051, + "grad_max_sv": 0.252237818390131, + "grad_min_sv": 9.870081852563286e-09, + "grad_condition": 1730317003.0799267, + "lr": 0.00019770044256881242, + "time_sec": 15.494806051254272 + }, + { + "epoch": 107, + "train_loss": 0.21957805599212646, + "train_acc": 0.92936, + "test_loss": 2.069959518432617, + "test_acc": 0.6059, + "lyapunov": null, + "grad_norm": 0.5427102510735407, + "grad_max_sv": 0.26037181839346885, + "grad_min_sv": 9.796433978262464e-09, + "grad_condition": 619659373.2197987, + "lr": 0.0001894261098608447, + "time_sec": 15.494577169418335 + }, + { + "epoch": 108, + "train_loss": 0.21802687605857848, + "train_acc": 0.92854, + "test_loss": 2.069862120437622, + "test_acc": 0.6064, + "lyapunov": null, + "grad_norm": 0.5412145734801318, + "grad_max_sv": 0.26357722133398054, + "grad_min_sv": 9.731102705856913e-09, + "grad_condition": 4896886016.781491, + "lr": 0.000181288005125655, + "time_sec": 15.492915630340576 + }, + { + "epoch": 109, + "train_loss": 0.2105085688495636, + "train_acc": 0.9329, + "test_loss": 2.0300133407592775, + "test_acc": 0.6118, + "lyapunov": null, + "grad_norm": 0.5316865416598037, + "grad_max_sv": 0.24584890641272067, + "grad_min_sv": 9.288343090713484e-09, + "grad_condition": 1467162755.386783, + "lr": 0.0001732896980049473, + "time_sec": 15.496263980865479 + }, + { + "epoch": 110, + "train_loss": 0.20778575693130494, + "train_acc": 0.9324, + "test_loss": 2.033147290420532, + "test_acc": 0.6113, + "lyapunov": null, + "grad_norm": 0.5310273370102141, + "grad_max_sv": 0.25715232640504837, + "grad_min_sv": 9.619756366117082e-09, + "grad_condition": 909703469.1889927, + "lr": 0.00016543469682057076, + "time_sec": 15.48079514503479 + }, + { + "epoch": 111, + "train_loss": 0.2022018117570877, + "train_acc": 0.93408, + "test_loss": 2.0903577659606936, + "test_acc": 0.6097, + "lyapunov": null, + "grad_norm": 0.5248885212713278, + "grad_max_sv": 0.25115896202623844, + "grad_min_sv": 9.449230327059423e-09, + "grad_condition": 654306379.114652, + "lr": 0.00015772644703565552, + "time_sec": 15.481376886367798 + }, + { + "epoch": 112, + "train_loss": 0.2012022008705139, + "train_acc": 0.93478, + "test_loss": 2.1256960330963133, + "test_acc": 0.6062, + "lyapunov": null, + "grad_norm": 0.5259715208516651, + "grad_max_sv": 0.25880570262670516, + "grad_min_sv": 9.483339922537942e-09, + "grad_condition": 3450539548.1120477, + "lr": 0.00015016832974331713, + "time_sec": 15.474645853042603 + }, + { + "epoch": 113, + "train_loss": 0.20022091041088105, + "train_acc": 0.9359, + "test_loss": 2.0813249099731443, + "test_acc": 0.6127, + "lyapunov": null, + "grad_norm": 0.518582122023061, + "grad_max_sv": 0.25183347687125207, + "grad_min_sv": 9.362834274724563e-09, + "grad_condition": 206343345.02075773, + "lr": 0.00014276366018359834, + "time_sec": 15.51976227760315 + }, + { + "epoch": 114, + "train_loss": 0.20003674240589142, + "train_acc": 0.93548, + "test_loss": 2.059957353401184, + "test_acc": 0.6113, + "lyapunov": null, + "grad_norm": 0.5204510649985771, + "grad_max_sv": 0.24840169511735438, + "grad_min_sv": 9.433198861711483e-09, + "grad_condition": 156281157.83753783, + "lr": 0.00013551568628929425, + "time_sec": 15.486659526824951 + }, + { + "epoch": 115, + "train_loss": 0.19450239594459534, + "train_acc": 0.9368, + "test_loss": 2.081795527267456, + "test_acc": 0.613, + "lyapunov": null, + "grad_norm": 0.513222572000434, + "grad_max_sv": 0.25595347620546816, + "grad_min_sv": 9.54867237041787e-09, + "grad_condition": 768174194.3770015, + "lr": 0.00012842758726130276, + "time_sec": 15.51030945777893 + }, + { + "epoch": 116, + "train_loss": 0.19022185802936553, + "train_acc": 0.93888, + "test_loss": 2.0910057247161866, + "test_acc": 0.6109, + "lyapunov": null, + "grad_norm": 0.509950221902217, + "grad_max_sv": 0.24649180248379707, + "grad_min_sv": 9.286189562706521e-09, + "grad_condition": 190506622.94702727, + "lr": 0.0001215024721741218, + "time_sec": 15.4960777759552 + }, + { + "epoch": 117, + "train_loss": 0.18697156070709228, + "train_acc": 0.9409, + "test_loss": 2.1048245140075683, + "test_acc": 0.6113, + "lyapunov": null, + "grad_norm": 0.5023066665762482, + "grad_max_sv": 0.24158176295459272, + "grad_min_sv": 9.132921396148092e-09, + "grad_condition": 4603577974.011314, + "lr": 0.00011474337861210538, + "time_sec": 15.499973773956299 + }, + { + "epoch": 118, + "train_loss": 0.1897142271566391, + "train_acc": 0.93756, + "test_loss": 2.0972971321105955, + "test_acc": 0.611, + "lyapunov": null, + "grad_norm": 0.5079589956238173, + "grad_max_sv": 0.23757222667336464, + "grad_min_sv": 8.902529727208147e-09, + "grad_condition": 203658547.6693558, + "lr": 0.00010815327133708009, + "time_sec": 15.504847049713135 + }, + { + "epoch": 119, + "train_loss": 0.1865368722629547, + "train_acc": 0.93914, + "test_loss": 2.071676664352417, + "test_acc": 0.6093, + "lyapunov": null, + "grad_norm": 0.503144489128604, + "grad_max_sv": 0.24214695654809476, + "grad_min_sv": 9.078004823076872e-09, + "grad_condition": 401272428.2934058, + "lr": 0.00010173504098790182, + "time_sec": 15.494940042495728 + }, + { + "epoch": 120, + "train_loss": 0.18263185959339143, + "train_acc": 0.9413, + "test_loss": 2.0995028049468996, + "test_acc": 0.61, + "lyapunov": null, + "grad_norm": 0.49963467133223916, + "grad_max_sv": 0.2448117069900036, + "grad_min_sv": 9.255170430218228e-09, + "grad_condition": 840960640.7523018, + "lr": 9.549150281252629e-05, + "time_sec": 15.50493049621582 + }, + { + "epoch": 121, + "train_loss": 0.17661990516662598, + "train_acc": 0.94376, + "test_loss": 2.0479217910766603, + "test_acc": 0.6139, + "lyapunov": null, + "grad_norm": 0.49017967274439106, + "grad_max_sv": 0.24487083926796913, + "grad_min_sv": 9.062790381261093e-09, + "grad_condition": 297900363.86286056, + "lr": 8.942539543314794e-05, + "time_sec": 15.500595331192017 + }, + { + "epoch": 122, + "train_loss": 0.17436686351299285, + "train_acc": 0.94568, + "test_loss": 2.1033685138702394, + "test_acc": 0.6076, + "lyapunov": null, + "grad_norm": 0.4850908453719191, + "grad_max_sv": 0.24267951920628547, + "grad_min_sv": 9.175133607909614e-09, + "grad_condition": 151651082.8966439, + "lr": 8.353937964495024e-05, + "time_sec": 15.500707149505615 + }, + { + "epoch": 123, + "train_loss": 0.17420966561317444, + "train_acc": 0.94574, + "test_loss": 2.0771576751708984, + "test_acc": 0.6091, + "lyapunov": null, + "grad_norm": 0.48697820878218756, + "grad_max_sv": 0.24934822954237462, + "grad_min_sv": 9.043736691862272e-09, + "grad_condition": 342563176.44086933, + "lr": 7.783603724899243e-05, + "time_sec": 15.506757974624634 + }, + { + "epoch": 124, + "train_loss": 0.1725812414932251, + "train_acc": 0.94486, + "test_loss": 2.135185445022583, + "test_acc": 0.608, + "lyapunov": null, + "grad_norm": 0.4844109930695783, + "grad_max_sv": 0.24152979552745818, + "grad_min_sv": 9.037162034160328e-09, + "grad_condition": 142594941.29597357, + "lr": 7.231786991974666e-05, + "time_sec": 15.495522499084473 + }, + { + "epoch": 125, + "train_loss": 0.17122176954269408, + "train_acc": 0.94558, + "test_loss": 2.1152863483428956, + "test_acc": 0.612, + "lyapunov": null, + "grad_norm": 0.4826385410866865, + "grad_max_sv": 0.24549916423857213, + "grad_min_sv": 8.782795131207118e-09, + "grad_condition": 1347993858.355885, + "lr": 6.698729810778072e-05, + "time_sec": 15.489627361297607 + }, + { + "epoch": 126, + "train_loss": 0.17058868828058243, + "train_acc": 0.94662, + "test_loss": 2.1105800861358643, + "test_acc": 0.6093, + "lyapunov": null, + "grad_norm": 0.48281055678110163, + "grad_max_sv": 0.24400779306888581, + "grad_min_sv": 8.881911921611655e-09, + "grad_condition": 907798367.550338, + "lr": 6.184665997806817e-05, + "time_sec": 15.487231254577637 + }, + { + "epoch": 127, + "train_loss": 0.16842705961704255, + "train_acc": 0.94676, + "test_loss": 2.075766274642944, + "test_acc": 0.6129, + "lyapunov": null, + "grad_norm": 0.4814153543267475, + "grad_max_sv": 0.24004302807152272, + "grad_min_sv": 8.701755094839368e-09, + "grad_condition": 2608046426.213746, + "lr": 5.6898210384392595e-05, + "time_sec": 15.498921394348145 + }, + { + "epoch": 128, + "train_loss": 0.16494292568683624, + "train_acc": 0.94768, + "test_loss": 2.151611907196045, + "test_acc": 0.6047, + "lyapunov": null, + "grad_norm": 0.4763822150733386, + "grad_max_sv": 0.22842325568199157, + "grad_min_sv": 8.631154578726818e-09, + "grad_condition": 260686423.05458745, + "lr": 5.214411988029363e-05, + "time_sec": 15.489452600479126 + }, + { + "epoch": 129, + "train_loss": 0.16430129640102387, + "train_acc": 0.94824, + "test_loss": 2.0951647556304933, + "test_acc": 0.6128, + "lyapunov": null, + "grad_norm": 0.4754481221102857, + "grad_max_sv": 0.23247553929686546, + "grad_min_sv": 8.414460946461547e-09, + "grad_condition": 437817787.9214033, + "lr": 4.7586473766990294e-05, + "time_sec": 15.491871118545532 + }, + { + "epoch": 130, + "train_loss": 0.16159661509513856, + "train_acc": 0.94926, + "test_loss": 2.0767082111358643, + "test_acc": 0.6156, + "lyapunov": null, + "grad_norm": 0.4695751355550292, + "grad_max_sv": 0.24420519769191742, + "grad_min_sv": 8.783045789696309e-09, + "grad_condition": 2887625517.4136095, + "lr": 4.32272711786996e-05, + "time_sec": 15.50525712966919 + }, + { + "epoch": 131, + "train_loss": 0.16233114049911498, + "train_acc": 0.94986, + "test_loss": 2.090193899154663, + "test_acc": 0.6138, + "lyapunov": null, + "grad_norm": 0.4718133586500909, + "grad_max_sv": 0.23811170123517514, + "grad_min_sv": 8.731167988607069e-09, + "grad_condition": 171473959.97673047, + "lr": 3.906842420574966e-05, + "time_sec": 15.489828824996948 + }, + { + "epoch": 132, + "train_loss": 0.16304145799160003, + "train_acc": 0.9489, + "test_loss": 2.0699268299102784, + "test_acc": 0.6176, + "lyapunov": null, + "grad_norm": 0.47181034193305915, + "grad_max_sv": 0.24468088522553444, + "grad_min_sv": 8.694641913677115e-09, + "grad_condition": 3950610050.0669045, + "lr": 3.5111757055874305e-05, + "time_sec": 15.489463329315186 + }, + { + "epoch": 133, + "train_loss": 0.16222090543746948, + "train_acc": 0.94862, + "test_loss": 2.0846460132598876, + "test_acc": 0.6154, + "lyapunov": null, + "grad_norm": 0.47432514605256276, + "grad_max_sv": 0.2351464234292507, + "grad_min_sv": 8.508125437679944e-09, + "grad_condition": 3262769680.1508665, + "lr": 3.1359005254054254e-05, + "time_sec": 15.493263721466064 + }, + { + "epoch": 134, + "train_loss": 0.1564504327917099, + "train_acc": 0.95064, + "test_loss": 2.039795367050171, + "test_acc": 0.616, + "lyapunov": null, + "grad_norm": 0.46132567077349346, + "grad_max_sv": 0.23477552309632302, + "grad_min_sv": 8.499829853240298e-09, + "grad_condition": 275652896.5549098, + "lr": 2.7811814881259484e-05, + "time_sec": 15.501915693283081 + }, + { + "epoch": 135, + "train_loss": 0.1633557910346985, + "train_acc": 0.94906, + "test_loss": 2.1431523998260498, + "test_acc": 0.6082, + "lyapunov": null, + "grad_norm": 0.4725347110912027, + "grad_max_sv": 0.2321782097220421, + "grad_min_sv": 8.273568699135141e-09, + "grad_condition": 719211854.1190578, + "lr": 2.4471741852423218e-05, + "time_sec": 15.49996304512024 + }, + { + "epoch": 136, + "train_loss": 0.1577922046995163, + "train_acc": 0.95056, + "test_loss": 2.039000785446167, + "test_acc": 0.6154, + "lyapunov": null, + "grad_norm": 0.46347763663429586, + "grad_max_sv": 0.23204916007816792, + "grad_min_sv": 8.698969911215922e-09, + "grad_condition": 2466699319.0239253, + "lr": 2.1340251233966362e-05, + "time_sec": 15.497424125671387 + }, + { + "epoch": 137, + "train_loss": 0.15701312964439393, + "train_acc": 0.94962, + "test_loss": 2.085305763244629, + "test_acc": 0.6149, + "lyapunov": null, + "grad_norm": 0.46705315608384584, + "grad_max_sv": 0.22602895461022854, + "grad_min_sv": 8.363478537018877e-09, + "grad_condition": 5418883019.032962, + "lr": 1.8418716601170932e-05, + "time_sec": 15.491859674453735 + }, + { + "epoch": 138, + "train_loss": 0.15615028873443604, + "train_acc": 0.95128, + "test_loss": 2.101923070907593, + "test_acc": 0.6133, + "lyapunov": null, + "grad_norm": 0.46267937397470993, + "grad_max_sv": 0.23617675378918648, + "grad_min_sv": 8.55792531187071e-09, + "grad_condition": 668785672.229811, + "lr": 1.570841943568445e-05, + "time_sec": 15.490991592407227 + }, + { + "epoch": 139, + "train_loss": 0.15497800857305527, + "train_acc": 0.95104, + "test_loss": 2.131324795150757, + "test_acc": 0.6096, + "lyapunov": null, + "grad_norm": 0.4627316674414162, + "grad_max_sv": 0.23336338251829147, + "grad_min_sv": 8.54283688542061e-09, + "grad_condition": 547232078.4054619, + "lr": 1.3210548563419845e-05, + "time_sec": 15.493245840072632 + }, + { + "epoch": 140, + "train_loss": 0.15815438273906707, + "train_acc": 0.95054, + "test_loss": 2.0743191734313964, + "test_acc": 0.6132, + "lyapunov": null, + "grad_norm": 0.46525185071118685, + "grad_max_sv": 0.23031578138470649, + "grad_min_sv": 8.578327668909771e-09, + "grad_condition": 1472538153.7679148, + "lr": 1.0926199633097203e-05, + "time_sec": 15.508398056030273 + }, + { + "epoch": 141, + "train_loss": 0.15565036369800567, + "train_acc": 0.95156, + "test_loss": 2.083190835571289, + "test_acc": 0.6143, + "lyapunov": null, + "grad_norm": 0.4634211187185363, + "grad_max_sv": 0.2209864068776369, + "grad_min_sv": 8.388305931458784e-09, + "grad_condition": 735187313.3407264, + "lr": 8.856374635655688e-06, + "time_sec": 15.477578163146973 + }, + { + "epoch": 142, + "train_loss": 0.1526834367275238, + "train_acc": 0.95296, + "test_loss": 2.0579229915618895, + "test_acc": 0.6125, + "lyapunov": null, + "grad_norm": 0.45577943773159835, + "grad_max_sv": 0.22755092419683934, + "grad_min_sv": 8.457177222030362e-09, + "grad_condition": 1934756909.5252705, + "lr": 7.001981464747503e-06, + "time_sec": 15.47980809211731 + }, + { + "epoch": 143, + "train_loss": 0.1551715327501297, + "train_acc": 0.95138, + "test_loss": 2.094068197631836, + "test_acc": 0.6117, + "lyapunov": null, + "grad_norm": 0.46037433954931045, + "grad_max_sv": 0.22780660428106786, + "grad_min_sv": 8.502836361531321e-09, + "grad_condition": 963929271.8099291, + "lr": 5.3638335185058295e-06, + "time_sec": 15.485134363174438 + }, + { + "epoch": 144, + "train_loss": 0.15432416381835937, + "train_acc": 0.95178, + "test_loss": 2.110651277923584, + "test_acc": 0.6145, + "lyapunov": null, + "grad_norm": 0.4613614148812742, + "grad_max_sv": 0.22735756635665894, + "grad_min_sv": 8.44454743694368e-09, + "grad_condition": 1076939620.5494838, + "lr": 3.942649342761114e-06, + "time_sec": 15.493315696716309 + }, + { + "epoch": 145, + "train_loss": 0.15650244321346282, + "train_acc": 0.95044, + "test_loss": 2.0880191951751708, + "test_acc": 0.6119, + "lyapunov": null, + "grad_norm": 0.4660268832705423, + "grad_max_sv": 0.23027937039732932, + "grad_min_sv": 8.513131491633477e-09, + "grad_condition": 297143450.17696226, + "lr": 2.7390523158633524e-06, + "time_sec": 15.480180501937866 + }, + { + "epoch": 146, + "train_loss": 0.15448970682621002, + "train_acc": 0.952, + "test_loss": 2.0194208770751954, + "test_acc": 0.621, + "lyapunov": null, + "grad_norm": 0.4600178145858194, + "grad_max_sv": 0.22371375933289528, + "grad_min_sv": 8.652061342297613e-09, + "grad_condition": 2586380341.3174944, + "lr": 1.7535703752478133e-06, + "time_sec": 15.502386331558228 + }, + { + "epoch": 147, + "train_loss": 0.15414279275417328, + "train_acc": 0.95114, + "test_loss": 2.1069964057922363, + "test_acc": 0.6142, + "lyapunov": null, + "grad_norm": 0.4616285885002781, + "grad_max_sv": 0.2342820342630148, + "grad_min_sv": 8.68108046944878e-09, + "grad_condition": 379507449.7225493, + "lr": 9.866357858642196e-07, + "time_sec": 15.488835096359253 + }, + { + "epoch": 148, + "train_loss": 0.15620617700576783, + "train_acc": 0.95078, + "test_loss": 2.1161761821746827, + "test_acc": 0.6085, + "lyapunov": null, + "grad_norm": 0.46475971700568747, + "grad_max_sv": 0.2303019493818283, + "grad_min_sv": 8.695906369591763e-09, + "grad_condition": 729395813.573787, + "lr": 4.38584950570808e-07, + "time_sec": 15.500977277755737 + }, + { + "epoch": 149, + "train_loss": 0.1530400000667572, + "train_acc": 0.95168, + "test_loss": 2.0760107112884523, + "test_acc": 0.6147, + "lyapunov": null, + "grad_norm": 0.4585791144767188, + "grad_max_sv": 0.23029794916510582, + "grad_min_sv": 8.466522902726702e-09, + "grad_condition": 540903237.1982462, + "lr": 1.096582625772501e-07, + "time_sec": 15.49415111541748 + }, + { + "epoch": 150, + "train_loss": 0.15208094583511353, + "train_acc": 0.95228, + "test_loss": 2.0765135959625245, + "test_acc": 0.6142, + "lyapunov": null, + "grad_norm": 0.45743890734329773, + "grad_max_sv": 0.23194126076996327, + "grad_min_sv": 8.657490525268864e-09, + "grad_condition": 1180436704.3069885, + "lr": 0.0, + "time_sec": 15.487801790237427 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 4.642479771652222, + "train_acc": 0.0563, + "test_loss": 4.471788549804687, + "test_acc": 0.0525, + "lyapunov": null, + "grad_norm": 6.299700683423435, + "grad_max_sv": 5.376748514175415, + "grad_min_sv": 1.0876815811078355e-07, + "grad_condition": 123806577.64929362, + "lr": 0.0009998903417374227, + "time_sec": 32.55821919441223 + }, + { + "epoch": 2, + "train_loss": 3.921236069869995, + "train_acc": 0.1164, + "test_loss": 4.031661200714112, + "test_acc": 0.0987, + "lyapunov": null, + "grad_norm": 4.744809408953577, + "grad_max_sv": 4.056096857786178, + "grad_min_sv": 8.545224932585138e-08, + "grad_condition": 432966802.88566554, + "lr": 0.0009995614150494292, + "time_sec": 32.52909827232361 + }, + { + "epoch": 3, + "train_loss": 3.563258330001831, + "train_acc": 0.16394, + "test_loss": 3.665959655380249, + "test_acc": 0.1478, + "lyapunov": null, + "grad_norm": 3.968544793489477, + "grad_max_sv": 3.2656030714511872, + "grad_min_sv": 7.328074659307404e-08, + "grad_condition": 54148101.24592471, + "lr": 0.0009990133642141358, + "time_sec": 32.514859199523926 + }, + { + "epoch": 4, + "train_loss": 3.30762485168457, + "train_acc": 0.20282, + "test_loss": 3.602442971038818, + "test_acc": 0.1715, + "lyapunov": null, + "grad_norm": 3.360539325527588, + "grad_max_sv": 2.5611240684986116, + "grad_min_sv": 6.275024531099404e-08, + "grad_condition": 48558402.55237199, + "lr": 0.0009982464296247522, + "time_sec": 32.511942863464355 + }, + { + "epoch": 5, + "train_loss": 3.070727022857666, + "train_acc": 0.2431, + "test_loss": 3.0896433425903322, + "test_acc": 0.2428, + "lyapunov": null, + "grad_norm": 2.8612981669887914, + "grad_max_sv": 2.039329302310944, + "grad_min_sv": 5.3213209671998385e-08, + "grad_condition": 45899387.46141158, + "lr": 0.0009972609476841367, + "time_sec": 32.535019874572754 + }, + { + "epoch": 6, + "train_loss": 2.873271194458008, + "train_acc": 0.2795, + "test_loss": 3.0904090099334716, + "test_acc": 0.2488, + "lyapunov": null, + "grad_norm": 2.4953735022476837, + "grad_max_sv": 1.6734129816293717, + "grad_min_sv": 4.6456209978895655e-08, + "grad_condition": 55631562.29872565, + "lr": 0.000996057350657239, + "time_sec": 32.5289192199707 + }, + { + "epoch": 7, + "train_loss": 2.698648819732666, + "train_acc": 0.31066, + "test_loss": 2.9098104148864747, + "test_acc": 0.2799, + "lyapunov": null, + "grad_norm": 2.1963953249289316, + "grad_max_sv": 1.3662363350391389, + "grad_min_sv": 4.123726340746203e-08, + "grad_condition": 175183802.14149565, + "lr": 0.000994636166481494, + "time_sec": 32.53304076194763 + }, + { + "epoch": 8, + "train_loss": 2.5489939933776857, + "train_acc": 0.3414, + "test_loss": 2.918805715942383, + "test_acc": 0.2796, + "lyapunov": null, + "grad_norm": 1.9702205989411337, + "grad_max_sv": 1.1486580684781074, + "grad_min_sv": 3.6719605156498857e-08, + "grad_condition": 45078452.49282994, + "lr": 0.0009929980185352525, + "time_sec": 32.52384686470032 + }, + { + "epoch": 9, + "train_loss": 2.429889005661011, + "train_acc": 0.36856, + "test_loss": 2.617208067703247, + "test_acc": 0.3352, + "lyapunov": null, + "grad_norm": 1.7958642065413024, + "grad_max_sv": 0.976833887398243, + "grad_min_sv": 3.4111676243397945e-08, + "grad_condition": 88392837.95669074, + "lr": 0.0009911436253643444, + "time_sec": 32.52341938018799 + }, + { + "epoch": 10, + "train_loss": 2.312202433395386, + "train_acc": 0.39006, + "test_loss": 2.6336415348052977, + "test_acc": 0.3376, + "lyapunov": null, + "grad_norm": 1.6688154279715788, + "grad_max_sv": 0.8335120677947998, + "grad_min_sv": 3.1057890326202656e-08, + "grad_condition": 43581868.8179111, + "lr": 0.0009890738003669028, + "time_sec": 32.53657627105713 + }, + { + "epoch": 11, + "train_loss": 2.2113982202911378, + "train_acc": 0.41394, + "test_loss": 2.4651415496826172, + "test_acc": 0.3668, + "lyapunov": null, + "grad_norm": 1.5852177586967415, + "grad_max_sv": 0.7658713042736054, + "grad_min_sv": 2.981889714037678e-08, + "grad_condition": 33093574.792371016, + "lr": 0.00098678945143658, + "time_sec": 32.52194833755493 + }, + { + "epoch": 12, + "train_loss": 2.1308777001190187, + "train_acc": 0.432, + "test_loss": 2.5040061386108396, + "test_acc": 0.3654, + "lyapunov": null, + "grad_norm": 1.5129835225343262, + "grad_max_sv": 0.6879909574985504, + "grad_min_sv": 2.8309841176854533e-08, + "grad_condition": 30209408.624890875, + "lr": 0.0009842915805643154, + "time_sec": 32.519477128982544 + }, + { + "epoch": 13, + "train_loss": 2.051232373428345, + "train_acc": 0.4496, + "test_loss": 2.3721223037719725, + "test_acc": 0.3951, + "lyapunov": null, + "grad_norm": 1.4527042328822815, + "grad_max_sv": 0.6657147958874703, + "grad_min_sv": 2.7529119311919813e-08, + "grad_condition": 32877524.0735294, + "lr": 0.000981581283398829, + "time_sec": 32.51488184928894 + }, + { + "epoch": 14, + "train_loss": 1.9786859475326537, + "train_acc": 0.46372, + "test_loss": 2.4099101028442385, + "test_acc": 0.3885, + "lyapunov": null, + "grad_norm": 1.3903946049407439, + "grad_max_sv": 0.619149561971426, + "grad_min_sv": 2.6381883344583912e-08, + "grad_condition": 32158488.579634093, + "lr": 0.0009786597487660333, + "time_sec": 32.53034734725952 + }, + { + "epoch": 15, + "train_loss": 1.9087054037857056, + "train_acc": 0.48146, + "test_loss": 2.356669859313965, + "test_acc": 0.4054, + "lyapunov": null, + "grad_norm": 1.3401497982688246, + "grad_max_sv": 0.5884689308702946, + "grad_min_sv": 2.5261919572860948e-08, + "grad_condition": 27243493.57243519, + "lr": 0.0009755282581475766, + "time_sec": 32.53805232048035 + }, + { + "epoch": 16, + "train_loss": 1.8580862741851807, + "train_acc": 0.4903, + "test_loss": 2.3727874526977537, + "test_acc": 0.3978, + "lyapunov": null, + "grad_norm": 1.2980660063098806, + "grad_max_sv": 0.5687403865158558, + "grad_min_sv": 2.4705210138753485e-08, + "grad_condition": 36506916.881677285, + "lr": 0.0009721881851187403, + "time_sec": 32.529054403305054 + }, + { + "epoch": 17, + "train_loss": 1.7838218069458007, + "train_acc": 0.50946, + "test_loss": 2.411915710067749, + "test_acc": 0.4013, + "lyapunov": null, + "grad_norm": 1.2536082066251264, + "grad_max_sv": 0.5238922812044621, + "grad_min_sv": 2.3606322296920722e-08, + "grad_condition": 36849925.4309851, + "lr": 0.0009686409947459456, + "time_sec": 32.526257038116455 + }, + { + "epoch": 18, + "train_loss": 1.7371992016983033, + "train_acc": 0.51958, + "test_loss": 2.2599031024932863, + "test_acc": 0.4264, + "lyapunov": null, + "grad_norm": 1.229284180873741, + "grad_max_sv": 0.5230717524886132, + "grad_min_sv": 2.312521401454104e-08, + "grad_condition": 49053511.209702894, + "lr": 0.0009648882429441254, + "time_sec": 32.5399911403656 + }, + { + "epoch": 19, + "train_loss": 1.6830381874847413, + "train_acc": 0.53178, + "test_loss": 2.1889729766845702, + "test_acc": 0.4447, + "lyapunov": null, + "grad_norm": 1.1785390649791196, + "grad_max_sv": 0.4872257113456726, + "grad_min_sv": 2.2137700339541766e-08, + "grad_condition": 138866163.95418012, + "lr": 0.00096093157579425, + "time_sec": 32.52653670310974 + }, + { + "epoch": 20, + "train_loss": 1.6344180388641358, + "train_acc": 0.54714, + "test_loss": 2.227257891082764, + "test_acc": 0.4375, + "lyapunov": null, + "grad_norm": 1.1489035121891145, + "grad_max_sv": 0.47284500747919084, + "grad_min_sv": 2.1496744417870418e-08, + "grad_condition": 29593450.061258078, + "lr": 0.0009567727288213001, + "time_sec": 32.52734684944153 + }, + { + "epoch": 21, + "train_loss": 1.5880603087615968, + "train_acc": 0.55388, + "test_loss": 2.109391535949707, + "test_acc": 0.4605, + "lyapunov": null, + "grad_norm": 1.1350345214433142, + "grad_max_sv": 0.47259567975997924, + "grad_min_sv": 2.13382750108293e-08, + "grad_condition": 39203948.276769534, + "lr": 0.0009524135262330095, + "time_sec": 32.51701855659485 + }, + { + "epoch": 22, + "train_loss": 1.5451898790740968, + "train_acc": 0.56776, + "test_loss": 2.1289856529235838, + "test_acc": 0.4622, + "lyapunov": null, + "grad_norm": 1.1083032352595108, + "grad_max_sv": 0.44387331902980803, + "grad_min_sv": 2.0636199499213248e-08, + "grad_condition": 31425874.99589374, + "lr": 0.0009478558801197061, + "time_sec": 32.51593995094299 + }, + { + "epoch": 23, + "train_loss": 1.4903677392959596, + "train_acc": 0.57754, + "test_loss": 2.133696251296997, + "test_acc": 0.4671, + "lyapunov": null, + "grad_norm": 1.0825668306165386, + "grad_max_sv": 0.4390222616493702, + "grad_min_sv": 2.047547279677986e-08, + "grad_condition": 129993822.14571199, + "lr": 0.000943101789615607, + "time_sec": 32.51069974899292 + }, + { + "epoch": 24, + "train_loss": 1.4748817832183838, + "train_acc": 0.58158, + "test_loss": 2.1626602745056154, + "test_acc": 0.4632, + "lyapunov": null, + "grad_norm": 1.0751338305034317, + "grad_max_sv": 0.43956650570034983, + "grad_min_sv": 2.0244324640261713e-08, + "grad_condition": 41342301.85017798, + "lr": 0.0009381533400219313, + "time_sec": 32.533777952194214 + }, + { + "epoch": 25, + "train_loss": 1.4211272861099242, + "train_acc": 0.5951, + "test_loss": 2.096311450576782, + "test_acc": 0.481, + "lyapunov": null, + "grad_norm": 1.0399638076679998, + "grad_max_sv": 0.42748609334230425, + "grad_min_sv": 1.9937479189824357e-08, + "grad_condition": 38871491.7985058, + "lr": 0.0009330127018922189, + "time_sec": 32.53145217895508 + }, + { + "epoch": 26, + "train_loss": 1.396544298095703, + "train_acc": 0.6008, + "test_loss": 2.1271941719055176, + "test_acc": 0.4714, + "lyapunov": null, + "grad_norm": 1.028506322176559, + "grad_max_sv": 0.4079991213977337, + "grad_min_sv": 1.9165852835345554e-08, + "grad_condition": 39309871.185656376, + "lr": 0.000927682130080253, + "time_sec": 32.53234934806824 + }, + { + "epoch": 27, + "train_loss": 1.361050274734497, + "train_acc": 0.60774, + "test_loss": 2.0897907325744627, + "test_acc": 0.4811, + "lyapunov": null, + "grad_norm": 1.009655904655981, + "grad_max_sv": 0.39270137771964075, + "grad_min_sv": 1.8564359835493426e-08, + "grad_condition": 28517922.90367631, + "lr": 0.0009221639627510072, + "time_sec": 32.54458284378052 + }, + { + "epoch": 28, + "train_loss": 1.3167539808654785, + "train_acc": 0.62254, + "test_loss": 2.2306322479248046, + "test_acc": 0.4663, + "lyapunov": null, + "grad_norm": 0.9884512545787755, + "grad_max_sv": 0.393748565018177, + "grad_min_sv": 1.8592529393846036e-08, + "grad_condition": 34171303.89028352, + "lr": 0.0009164606203550494, + "time_sec": 32.525365352630615 + }, + { + "epoch": 29, + "train_loss": 1.2844751734542847, + "train_acc": 0.62692, + "test_loss": 2.19309764251709, + "test_acc": 0.4751, + "lyapunov": null, + "grad_norm": 0.9700062599103884, + "grad_max_sv": 0.387305423617363, + "grad_min_sv": 1.7872535887364373e-08, + "grad_condition": 26903062.552241027, + "lr": 0.0009105746045668516, + "time_sec": 32.526561975479126 + }, + { + "epoch": 30, + "train_loss": 1.2640808475494385, + "train_acc": 0.63334, + "test_loss": 2.2757652931213377, + "test_acc": 0.4536, + "lyapunov": null, + "grad_norm": 0.9608534659761124, + "grad_max_sv": 0.39087340533733367, + "grad_min_sv": 1.800268759344359e-08, + "grad_condition": 33161981.652286977, + "lr": 0.0009045084971874733, + "time_sec": 32.51922965049744 + }, + { + "epoch": 31, + "train_loss": 1.2303438648223877, + "train_acc": 0.64076, + "test_loss": 2.1164483276367188, + "test_acc": 0.4864, + "lyapunov": null, + "grad_norm": 0.9467438832197973, + "grad_max_sv": 0.3729639552533627, + "grad_min_sv": 1.7477179434233213e-08, + "grad_condition": 28618454.375976466, + "lr": 0.0008982649590120977, + "time_sec": 32.51436138153076 + }, + { + "epoch": 32, + "train_loss": 1.2104430978012084, + "train_acc": 0.6455, + "test_loss": 2.2232689281463625, + "test_acc": 0.481, + "lyapunov": null, + "grad_norm": 0.9361931150490757, + "grad_max_sv": 0.37210237309336663, + "grad_min_sv": 1.7445883718214537e-08, + "grad_condition": 29250266.68112684, + "lr": 0.0008918467286629196, + "time_sec": 32.532060861587524 + }, + { + "epoch": 33, + "train_loss": 1.1789497135162355, + "train_acc": 0.65278, + "test_loss": 2.143947396850586, + "test_acc": 0.4907, + "lyapunov": null, + "grad_norm": 0.9196344126113596, + "grad_max_sv": 0.367071446031332, + "grad_min_sv": 1.6865934492071855e-08, + "grad_condition": 40056883.7628016, + "lr": 0.0008852566213878943, + "time_sec": 32.526479959487915 + }, + { + "epoch": 34, + "train_loss": 1.1554690090179442, + "train_acc": 0.65844, + "test_loss": 2.1499678684234618, + "test_acc": 0.4922, + "lyapunov": null, + "grad_norm": 0.9057802742532243, + "grad_max_sv": 0.3550798542797565, + "grad_min_sv": 1.6556807021315262e-08, + "grad_condition": 255610578.57101497, + "lr": 0.000878497527825878, + "time_sec": 32.53326392173767 + }, + { + "epoch": 35, + "train_loss": 1.1325925022506713, + "train_acc": 0.66696, + "test_loss": 2.187357851409912, + "test_acc": 0.498, + "lyapunov": null, + "grad_norm": 0.8980481880537616, + "grad_max_sv": 0.35023384541273117, + "grad_min_sv": 1.653067620913107e-08, + "grad_condition": 47664672.04568529, + "lr": 0.000871572412738697, + "time_sec": 32.529192209243774 + }, + { + "epoch": 36, + "train_loss": 1.1162108192062379, + "train_acc": 0.67076, + "test_loss": 2.078928050994873, + "test_acc": 0.5062, + "lyapunov": null, + "grad_norm": 0.8887291214894226, + "grad_max_sv": 0.34587462246418, + "grad_min_sv": 1.598691768550653e-08, + "grad_condition": 47253750.309311725, + "lr": 0.0008644843137107055, + "time_sec": 32.53391623497009 + }, + { + "epoch": 37, + "train_loss": 1.088490778541565, + "train_acc": 0.67814, + "test_loss": 2.117596751022339, + "test_acc": 0.5079, + "lyapunov": null, + "grad_norm": 0.8827902897341499, + "grad_max_sv": 0.3460941031575203, + "grad_min_sv": 1.613751039689776e-08, + "grad_condition": 120430106.41639173, + "lr": 0.0008572363398164014, + "time_sec": 32.52939796447754 + }, + { + "epoch": 38, + "train_loss": 1.0622543322944642, + "train_acc": 0.68324, + "test_loss": 2.2524201555252077, + "test_acc": 0.4904, + "lyapunov": null, + "grad_norm": 0.8643928358196139, + "grad_max_sv": 0.3311579547822475, + "grad_min_sv": 1.5921391385842476e-08, + "grad_condition": 28147641.32749777, + "lr": 0.0008498316702566826, + "time_sec": 32.51650023460388 + }, + { + "epoch": 39, + "train_loss": 1.0258385097503662, + "train_acc": 0.6921, + "test_loss": 2.215389312553406, + "test_acc": 0.4912, + "lyapunov": null, + "grad_norm": 0.8507960671612714, + "grad_max_sv": 0.3430253557860851, + "grad_min_sv": 1.6041156275514722e-08, + "grad_condition": 41417221.90444088, + "lr": 0.0008422735529643442, + "time_sec": 32.51078248023987 + }, + { + "epoch": 40, + "train_loss": 1.008150099067688, + "train_acc": 0.69894, + "test_loss": 2.285165777206421, + "test_acc": 0.4887, + "lyapunov": null, + "grad_norm": 0.8500378683317822, + "grad_max_sv": 0.33013429269194605, + "grad_min_sv": 1.547893761040184e-08, + "grad_condition": 735713799.268648, + "lr": 0.0008345653031794289, + "time_sec": 32.51578617095947 + }, + { + "epoch": 41, + "train_loss": 0.9898018364715576, + "train_acc": 0.70114, + "test_loss": 2.1710759185791018, + "test_acc": 0.5054, + "lyapunov": null, + "grad_norm": 0.845636323093009, + "grad_max_sv": 0.334617256373167, + "grad_min_sv": 1.552002822438614e-08, + "grad_condition": 178790285.2774743, + "lr": 0.0008267103019950526, + "time_sec": 32.55498909950256 + }, + { + "epoch": 42, + "train_loss": 0.9689999252319336, + "train_acc": 0.70992, + "test_loss": 2.1532568422317504, + "test_acc": 0.5088, + "lyapunov": null, + "grad_norm": 0.8290515928528267, + "grad_max_sv": 0.32156808376312257, + "grad_min_sv": 1.513711112358096e-08, + "grad_condition": 63393159.17157264, + "lr": 0.0008187119948743447, + "time_sec": 32.5278046131134 + }, + { + "epoch": 43, + "train_loss": 0.9382334645080567, + "train_acc": 0.7173, + "test_loss": 2.1617983654022215, + "test_acc": 0.5099, + "lyapunov": null, + "grad_norm": 0.8199573726083517, + "grad_max_sv": 0.3176788903772831, + "grad_min_sv": 1.4969858624924724e-08, + "grad_condition": 39337083.20882653, + "lr": 0.000810573890139155, + "time_sec": 32.54653334617615 + }, + { + "epoch": 44, + "train_loss": 0.9182830782318115, + "train_acc": 0.7211, + "test_loss": 2.2938510860443113, + "test_acc": 0.5032, + "lyapunov": null, + "grad_norm": 0.8158010406023241, + "grad_max_sv": 0.32802748009562493, + "grad_min_sv": 1.5100565674969203e-08, + "grad_condition": 67700595.0906401, + "lr": 0.0008022995574311873, + "time_sec": 32.530778884887695 + }, + { + "epoch": 45, + "train_loss": 0.89899619556427, + "train_acc": 0.72596, + "test_loss": 2.3243038515090944, + "test_acc": 0.4978, + "lyapunov": null, + "grad_norm": 0.8106149860815325, + "grad_max_sv": 0.31970001086592675, + "grad_min_sv": 1.444995242211311e-08, + "grad_condition": 61707891.58292439, + "lr": 0.0007938926261462363, + "time_sec": 32.53210163116455 + }, + { + "epoch": 46, + "train_loss": 0.8833617488861084, + "train_acc": 0.72982, + "test_loss": 2.3542774658203127, + "test_acc": 0.4957, + "lyapunov": null, + "grad_norm": 0.8034668926314622, + "grad_max_sv": 0.3169444307684898, + "grad_min_sv": 1.4620525734955046e-08, + "grad_condition": 2306938949.5105658, + "lr": 0.0007853567838422158, + "time_sec": 32.52321457862854 + }, + { + "epoch": 47, + "train_loss": 0.8611621459960938, + "train_acc": 0.73636, + "test_loss": 2.3614687870025635, + "test_acc": 0.5019, + "lyapunov": null, + "grad_norm": 0.7952702534581538, + "grad_max_sv": 0.3213916938751936, + "grad_min_sv": 1.4360261544471564e-08, + "grad_condition": 98833361.99001758, + "lr": 0.0007766957746216719, + "time_sec": 32.551071643829346 + }, + { + "epoch": 48, + "train_loss": 0.8414902052116394, + "train_acc": 0.74232, + "test_loss": 2.3029669830322264, + "test_acc": 0.5085, + "lyapunov": null, + "grad_norm": 0.784297561095192, + "grad_max_sv": 0.3114811100065708, + "grad_min_sv": 1.4304356266148232e-08, + "grad_condition": 35252220.65254038, + "lr": 0.0007679133974894982, + "time_sec": 32.53156328201294 + }, + { + "epoch": 49, + "train_loss": 0.8309669767951965, + "train_acc": 0.74656, + "test_loss": 2.286893635559082, + "test_acc": 0.5045, + "lyapunov": null, + "grad_norm": 0.7866799445354931, + "grad_max_sv": 0.31325423568487165, + "grad_min_sv": 1.420554635719537e-08, + "grad_condition": 245828981.88515216, + "lr": 0.000759013504686565, + "time_sec": 32.530038595199585 + }, + { + "epoch": 50, + "train_loss": 0.7998139995956421, + "train_acc": 0.75392, + "test_loss": 2.3185002082824706, + "test_acc": 0.5087, + "lyapunov": null, + "grad_norm": 0.7702444904048175, + "grad_max_sv": 0.3126057405024767, + "grad_min_sv": 1.4057572236413247e-08, + "grad_condition": 895759530.8359982, + "lr": 0.0007499999999999998, + "time_sec": 32.539623498916626 + }, + { + "epoch": 51, + "train_loss": 0.7901191444015503, + "train_acc": 0.75788, + "test_loss": 2.337850633239746, + "test_acc": 0.509, + "lyapunov": null, + "grad_norm": 0.7647274965495858, + "grad_max_sv": 0.3004269126802683, + "grad_min_sv": 1.4008410850752107e-08, + "grad_condition": 176379975.2857924, + "lr": 0.0007408768370508575, + "time_sec": 32.52524662017822 + }, + { + "epoch": 52, + "train_loss": 0.7781133801651001, + "train_acc": 0.76004, + "test_loss": 2.3018055530548094, + "test_acc": 0.5142, + "lyapunov": null, + "grad_norm": 0.7628575677364715, + "grad_max_sv": 0.3077410638332367, + "grad_min_sv": 1.3944687078052547e-08, + "grad_condition": 476227675.55278826, + "lr": 0.0007316480175599307, + "time_sec": 32.53758096694946 + }, + { + "epoch": 53, + "train_loss": 0.7562806001663208, + "train_acc": 0.7648, + "test_loss": 2.379827104949951, + "test_acc": 0.5063, + "lyapunov": null, + "grad_norm": 0.7526764366291289, + "grad_max_sv": 0.30248577073216437, + "grad_min_sv": 1.3496081205355803e-08, + "grad_condition": 1089676260.2113607, + "lr": 0.0007223175895924635, + "time_sec": 32.54466271400452 + }, + { + "epoch": 54, + "train_loss": 0.7475943574333191, + "train_acc": 0.76786, + "test_loss": 2.377075054550171, + "test_acc": 0.512, + "lyapunov": null, + "grad_norm": 0.750215382398683, + "grad_max_sv": 0.3043755616992712, + "grad_min_sv": 1.3518679307933379e-08, + "grad_condition": 37379268.11133198, + "lr": 0.0007128896457825361, + "time_sec": 32.53366780281067 + }, + { + "epoch": 55, + "train_loss": 0.7366778998947143, + "train_acc": 0.77304, + "test_loss": 2.4013710193634035, + "test_acc": 0.5052, + "lyapunov": null, + "grad_norm": 0.7465343546140976, + "grad_max_sv": 0.30028381906449797, + "grad_min_sv": 1.382671875327368e-08, + "grad_condition": 28698720.96166121, + "lr": 0.0007033683215378998, + "time_sec": 32.53609323501587 + }, + { + "epoch": 56, + "train_loss": 0.7091366660690308, + "train_acc": 0.77762, + "test_loss": 2.33411563911438, + "test_acc": 0.5126, + "lyapunov": null, + "grad_norm": 0.7380136003829837, + "grad_max_sv": 0.2953734669834375, + "grad_min_sv": 1.303365445352823e-08, + "grad_condition": 1175915690.269457, + "lr": 0.0006937577932260512, + "time_sec": 32.5473690032959 + }, + { + "epoch": 57, + "train_loss": 0.6999513886070251, + "train_acc": 0.78266, + "test_loss": 2.43815316696167, + "test_acc": 0.5107, + "lyapunov": null, + "grad_norm": 0.7328699359209336, + "grad_max_sv": 0.2920531783252954, + "grad_min_sv": 1.2993845399135451e-08, + "grad_condition": 152587828.403437, + "lr": 0.0006840622763423388, + "time_sec": 32.55185127258301 + }, + { + "epoch": 58, + "train_loss": 0.6799741724395751, + "train_acc": 0.78742, + "test_loss": 2.381142023277283, + "test_acc": 0.5177, + "lyapunov": null, + "grad_norm": 0.7278793670004745, + "grad_max_sv": 0.2917668532580137, + "grad_min_sv": 1.304645755725517e-08, + "grad_condition": 169810706.32481682, + "lr": 0.0006742860236609073, + "time_sec": 32.537921667099 + }, + { + "epoch": 59, + "train_loss": 0.6622171486473083, + "train_acc": 0.79306, + "test_loss": 2.350548614120483, + "test_acc": 0.5197, + "lyapunov": null, + "grad_norm": 0.7160794966099063, + "grad_max_sv": 0.28989222049713137, + "grad_min_sv": 1.3154668510517373e-08, + "grad_condition": 518100543.52278435, + "lr": 0.0006644333233692913, + "time_sec": 32.556652784347534 + }, + { + "epoch": 60, + "train_loss": 0.6548414518356324, + "train_acc": 0.79498, + "test_loss": 2.558105725860596, + "test_acc": 0.5026, + "lyapunov": null, + "grad_norm": 0.7139601066120349, + "grad_max_sv": 0.2839757200330496, + "grad_min_sv": 1.2719528911207812e-08, + "grad_condition": 106598497.36127238, + "lr": 0.0006545084971874734, + "time_sec": 32.54617619514465 + }, + { + "epoch": 61, + "train_loss": 0.6367912077522278, + "train_acc": 0.79956, + "test_loss": 2.549720768737793, + "test_acc": 0.503, + "lyapunov": null, + "grad_norm": 0.7072938119035849, + "grad_max_sv": 0.2815666403621435, + "grad_min_sv": 1.2655917643131925e-08, + "grad_condition": 351545390.3878931, + "lr": 0.0006445158984722354, + "time_sec": 32.52895545959473 + }, + { + "epoch": 62, + "train_loss": 0.6108809622764587, + "train_acc": 0.80962, + "test_loss": 2.4582517892837523, + "test_acc": 0.5155, + "lyapunov": null, + "grad_norm": 0.6871779503013541, + "grad_max_sv": 0.27853575013577936, + "grad_min_sv": 1.2499909360016991e-08, + "grad_condition": 84323115.24066128, + "lr": 0.0006344599103076324, + "time_sec": 32.53638219833374 + }, + { + "epoch": 63, + "train_loss": 0.6110955193519593, + "train_acc": 0.8082, + "test_loss": 2.421668832015991, + "test_acc": 0.5218, + "lyapunov": null, + "grad_norm": 0.6974575785480693, + "grad_max_sv": 0.29437441378831863, + "grad_min_sv": 1.2760532111023327e-08, + "grad_condition": 1141074655.802474, + "lr": 0.0006243449435824269, + "time_sec": 32.5341739654541 + }, + { + "epoch": 64, + "train_loss": 0.5902745287513733, + "train_acc": 0.81326, + "test_loss": 2.525721709823608, + "test_acc": 0.5137, + "lyapunov": null, + "grad_norm": 0.6819775061327956, + "grad_max_sv": 0.2760129250586033, + "grad_min_sv": 1.2472146640636617e-08, + "grad_condition": 153380994.2741132, + "lr": 0.0006141754350553275, + "time_sec": 32.54224371910095 + }, + { + "epoch": 65, + "train_loss": 0.5767888858222961, + "train_acc": 0.81892, + "test_loss": 2.5681256893157958, + "test_acc": 0.5109, + "lyapunov": null, + "grad_norm": 0.6842883453940269, + "grad_max_sv": 0.27693442031741144, + "grad_min_sv": 1.214616162405202e-08, + "grad_condition": 180936373.24743983, + "lr": 0.0006039558454088793, + "time_sec": 32.535571575164795 + }, + { + "epoch": 66, + "train_loss": 0.5719620153427124, + "train_acc": 0.81766, + "test_loss": 2.4380872802734377, + "test_acc": 0.5187, + "lyapunov": null, + "grad_norm": 0.6845868887152398, + "grad_max_sv": 0.2806558083742857, + "grad_min_sv": 1.2417019015428798e-08, + "grad_condition": 91981311.14124386, + "lr": 0.000593690657292862, + "time_sec": 32.537678956985474 + }, + { + "epoch": 67, + "train_loss": 0.5476583632850647, + "train_acc": 0.8273, + "test_loss": 2.4955981588363647, + "test_acc": 0.5183, + "lyapunov": null, + "grad_norm": 0.6627927561159936, + "grad_max_sv": 0.27053381204605104, + "grad_min_sv": 1.1682474739156678e-08, + "grad_condition": 119357334.07208268, + "lr": 0.0005833843733580507, + "time_sec": 32.53704595565796 + }, + { + "epoch": 68, + "train_loss": 0.5349030065536499, + "train_acc": 0.82988, + "test_loss": 2.576411254119873, + "test_acc": 0.5106, + "lyapunov": null, + "grad_norm": 0.6582392321316073, + "grad_max_sv": 0.27176710218191147, + "grad_min_sv": 1.180562275559377e-08, + "grad_condition": 846305950.6996868, + "lr": 0.0005730415142812054, + "time_sec": 32.54088878631592 + }, + { + "epoch": 69, + "train_loss": 0.5356097626113892, + "train_acc": 0.82918, + "test_loss": 2.5702699626922607, + "test_acc": 0.5154, + "lyapunov": null, + "grad_norm": 0.6641979366792015, + "grad_max_sv": 0.27518576607108114, + "grad_min_sv": 1.2052892484938627e-08, + "grad_condition": 130030350.74337718, + "lr": 0.0005626666167821517, + "time_sec": 32.54138922691345 + }, + { + "epoch": 70, + "train_loss": 0.513014861240387, + "train_acc": 0.8363, + "test_loss": 2.6079680850982667, + "test_acc": 0.5106, + "lyapunov": null, + "grad_norm": 0.6500943565960319, + "grad_max_sv": 0.2724282074719667, + "grad_min_sv": 1.178367022645465e-08, + "grad_condition": 673776556.319051, + "lr": 0.0005522642316338265, + "time_sec": 32.5693633556366 + }, + { + "epoch": 71, + "train_loss": 0.49603789474487303, + "train_acc": 0.84198, + "test_loss": 2.5577601636886595, + "test_acc": 0.5169, + "lyapunov": null, + "grad_norm": 0.6430240258167331, + "grad_max_sv": 0.27023660503327845, + "grad_min_sv": 1.1744692686443959e-08, + "grad_condition": 80314537.0435541, + "lr": 0.0005418389216661573, + "time_sec": 32.54641532897949 + }, + { + "epoch": 72, + "train_loss": 0.49025250810623167, + "train_acc": 0.8432, + "test_loss": 2.5663631786346435, + "test_acc": 0.5234, + "lyapunov": null, + "grad_norm": 0.643279476058677, + "grad_max_sv": 0.27230227626860143, + "grad_min_sv": 1.1624652314357053e-08, + "grad_condition": 62786442.37501116, + "lr": 0.0005313952597646563, + "time_sec": 32.54123497009277 + }, + { + "epoch": 73, + "train_loss": 0.48772711526870727, + "train_acc": 0.84528, + "test_loss": 2.648895852470398, + "test_acc": 0.5168, + "lyapunov": null, + "grad_norm": 0.6405905214601311, + "grad_max_sv": 0.2699441872537136, + "grad_min_sv": 1.1482883187884097e-08, + "grad_condition": 111834993.35897943, + "lr": 0.0005209378268645994, + "time_sec": 32.56350803375244 + }, + { + "epoch": 74, + "train_loss": 0.467068857088089, + "train_acc": 0.84904, + "test_loss": 2.6479972763061523, + "test_acc": 0.5139, + "lyapunov": null, + "grad_norm": 0.6363491242612465, + "grad_max_sv": 0.2783078793436289, + "grad_min_sv": 1.1536390146556913e-08, + "grad_condition": 219390233.59819812, + "lr": 0.0005104712099416781, + "time_sec": 32.546509981155396 + }, + { + "epoch": 75, + "train_loss": 0.4711385968875885, + "train_acc": 0.84816, + "test_loss": 2.608884352874756, + "test_acc": 0.5195, + "lyapunov": null, + "grad_norm": 0.6374082155755629, + "grad_max_sv": 0.26901070438325403, + "grad_min_sv": 1.1190769711073856e-08, + "grad_condition": 334559678.03980315, + "lr": 0.0004999999999999996, + "time_sec": 32.54527187347412 + }, + { + "epoch": 76, + "train_loss": 0.45760808762550353, + "train_acc": 0.85254, + "test_loss": 2.6803735092163086, + "test_acc": 0.5135, + "lyapunov": null, + "grad_norm": 0.6239727106157842, + "grad_max_sv": 0.2669793125241995, + "grad_min_sv": 1.1426927580722445e-08, + "grad_condition": 760532191.4933506, + "lr": 0.0004895287900583212, + "time_sec": 32.556286096572876 + }, + { + "epoch": 77, + "train_loss": 0.4403402804660797, + "train_acc": 0.85888, + "test_loss": 2.6952022495269774, + "test_acc": 0.5153, + "lyapunov": null, + "grad_norm": 0.6180261512024202, + "grad_max_sv": 0.2674210451543331, + "grad_min_sv": 1.1284923026578207e-08, + "grad_condition": 800342890.6120255, + "lr": 0.0004790621731353997, + "time_sec": 32.570063829422 + }, + { + "epoch": 78, + "train_loss": 0.43386900725364685, + "train_acc": 0.8609, + "test_loss": 2.6530003887176514, + "test_acc": 0.5232, + "lyapunov": null, + "grad_norm": 0.6088851948477753, + "grad_max_sv": 0.2547843284904957, + "grad_min_sv": 1.0926095429623917e-08, + "grad_condition": 95464128.01992908, + "lr": 0.000468604740235343, + "time_sec": 32.54688787460327 + }, + { + "epoch": 79, + "train_loss": 0.4240487690734863, + "train_acc": 0.8654, + "test_loss": 2.7931711376190185, + "test_acc": 0.5088, + "lyapunov": null, + "grad_norm": 0.5993382897461283, + "grad_max_sv": 0.24774248749017716, + "grad_min_sv": 1.07508628526291e-08, + "grad_condition": 623384828.9212538, + "lr": 0.00045816107833384175, + "time_sec": 32.54505252838135 + }, + { + "epoch": 80, + "train_loss": 0.4058323986816406, + "train_acc": 0.86904, + "test_loss": 2.6775668907165526, + "test_acc": 0.5171, + "lyapunov": null, + "grad_norm": 0.5885819627420461, + "grad_max_sv": 0.24584074690937996, + "grad_min_sv": 1.022559682466867e-08, + "grad_condition": 156757634.53668588, + "lr": 0.0004477357683661729, + "time_sec": 32.55807185173035 + }, + { + "epoch": 81, + "train_loss": 0.3943421869087219, + "train_acc": 0.87248, + "test_loss": 2.596042275619507, + "test_acc": 0.5241, + "lyapunov": null, + "grad_norm": 0.5915570736864834, + "grad_max_sv": 0.252938449382782, + "grad_min_sv": 1.0551333432320953e-08, + "grad_condition": 290621793.5733338, + "lr": 0.00043733338321784746, + "time_sec": 32.56740355491638 + }, + { + "epoch": 82, + "train_loss": 0.39024432485580446, + "train_acc": 0.87492, + "test_loss": 2.715544410324097, + "test_acc": 0.5245, + "lyapunov": null, + "grad_norm": 0.5825377843109248, + "grad_max_sv": 0.2532011177390814, + "grad_min_sv": 1.0358391808878986e-08, + "grad_condition": 412597611.83888507, + "lr": 0.0004269584857187939, + "time_sec": 32.55344319343567 + }, + { + "epoch": 83, + "train_loss": 0.3715799244689941, + "train_acc": 0.88012, + "test_loss": 2.6901692249298095, + "test_acc": 0.5264, + "lyapunov": null, + "grad_norm": 0.5717041976150569, + "grad_max_sv": 0.24421822614967822, + "grad_min_sv": 1.0306600353336345e-08, + "grad_condition": 329985889.12779623, + "lr": 0.0004166156266419484, + "time_sec": 32.559467792510986 + }, + { + "epoch": 84, + "train_loss": 0.3671589259147644, + "train_acc": 0.882, + "test_loss": 2.6448453563690184, + "test_acc": 0.5345, + "lyapunov": null, + "grad_norm": 0.5691852194449533, + "grad_max_sv": 0.24019994884729384, + "grad_min_sv": 9.989625743278551e-09, + "grad_condition": 122734290.43687347, + "lr": 0.0004063093427071373, + "time_sec": 32.583213567733765 + }, + { + "epoch": 85, + "train_loss": 0.35963713159561156, + "train_acc": 0.8824, + "test_loss": 2.718573891067505, + "test_acc": 0.5235, + "lyapunov": null, + "grad_norm": 0.5695765343654775, + "grad_max_sv": 0.24239672683179378, + "grad_min_sv": 1.0202618674231591e-08, + "grad_condition": 1852046324.0623333, + "lr": 0.0003960441545911199, + "time_sec": 32.562474727630615 + }, + { + "epoch": 86, + "train_loss": 0.35900317364692685, + "train_acc": 0.88314, + "test_loss": 2.690758750152588, + "test_acc": 0.5281, + "lyapunov": null, + "grad_norm": 0.5695226754489282, + "grad_max_sv": 0.2359969958662987, + "grad_min_sv": 9.85500920487603e-09, + "grad_condition": 394077563.11466306, + "lr": 0.0003858245649446718, + "time_sec": 32.56024169921875 + }, + { + "epoch": 87, + "train_loss": 0.34593051030158994, + "train_acc": 0.88774, + "test_loss": 2.6911534130096437, + "test_acc": 0.5276, + "lyapunov": null, + "grad_norm": 0.5605319049257929, + "grad_max_sv": 0.24156057350337506, + "grad_min_sv": 9.944241273420092e-09, + "grad_condition": 944172650.8084786, + "lr": 0.00037565505641757235, + "time_sec": 32.55394530296326 + }, + { + "epoch": 88, + "train_loss": 0.3350362122821808, + "train_acc": 0.89292, + "test_loss": 2.761347038269043, + "test_acc": 0.5248, + "lyapunov": null, + "grad_norm": 0.5537857918957506, + "grad_max_sv": 0.24467103444039823, + "grad_min_sv": 9.84480716557587e-09, + "grad_condition": 557423472.2448919, + "lr": 0.00036554008969236695, + "time_sec": 32.565001487731934 + }, + { + "epoch": 89, + "train_loss": 0.32590197957992556, + "train_acc": 0.89466, + "test_loss": 2.873864278793335, + "test_acc": 0.5155, + "lyapunov": null, + "grad_norm": 0.5519161551510952, + "grad_max_sv": 0.2400045834481716, + "grad_min_sv": 9.881915213807297e-09, + "grad_condition": 248477788.07047543, + "lr": 0.0003554841015277638, + "time_sec": 32.55529260635376 + }, + { + "epoch": 90, + "train_loss": 0.31863860460281374, + "train_acc": 0.89664, + "test_loss": 2.8045926555633547, + "test_acc": 0.5231, + "lyapunov": null, + "grad_norm": 0.5479641587602809, + "grad_max_sv": 0.24628719314932823, + "grad_min_sv": 1.0033076104122573e-08, + "grad_condition": 105371945.52289103, + "lr": 0.000345491502812526, + "time_sec": 32.55959415435791 + }, + { + "epoch": 91, + "train_loss": 0.31169461310863494, + "train_acc": 0.89832, + "test_loss": 2.764314810180664, + "test_acc": 0.5242, + "lyapunov": null, + "grad_norm": 0.5454170376093662, + "grad_max_sv": 0.24890379793941975, + "grad_min_sv": 9.700326364034394e-09, + "grad_condition": 77171376.4128032, + "lr": 0.0003355666766307081, + "time_sec": 32.56360149383545 + }, + { + "epoch": 92, + "train_loss": 0.3113831770801544, + "train_acc": 0.90008, + "test_loss": 2.778244842529297, + "test_acc": 0.5291, + "lyapunov": null, + "grad_norm": 0.5407137447043685, + "grad_max_sv": 0.23328636735677719, + "grad_min_sv": 9.360961983687077e-09, + "grad_condition": 128397939.07976246, + "lr": 0.00032571397633909225, + "time_sec": 32.571138858795166 + }, + { + "epoch": 93, + "train_loss": 0.30188457230567933, + "train_acc": 0.903, + "test_loss": 2.7606024471282957, + "test_acc": 0.5339, + "lyapunov": null, + "grad_norm": 0.5330386559824729, + "grad_max_sv": 0.24647361300885678, + "grad_min_sv": 9.782626700523788e-09, + "grad_condition": 930794659.3385656, + "lr": 0.00031593772365766094, + "time_sec": 32.56698513031006 + }, + { + "epoch": 94, + "train_loss": 0.2888755958557129, + "train_acc": 0.90584, + "test_loss": 2.8303293384552, + "test_acc": 0.5252, + "lyapunov": null, + "grad_norm": 0.5239071385040424, + "grad_max_sv": 0.24134295992553234, + "grad_min_sv": 9.665177403035685e-09, + "grad_condition": 341790086.36703265, + "lr": 0.0003062422067739483, + "time_sec": 32.560898303985596 + }, + { + "epoch": 95, + "train_loss": 0.2843299233055115, + "train_acc": 0.90856, + "test_loss": 2.878970125961304, + "test_acc": 0.5228, + "lyapunov": null, + "grad_norm": 0.5173032628331714, + "grad_max_sv": 0.22986819855868817, + "grad_min_sv": 9.369064224050081e-09, + "grad_condition": 493164980.6666913, + "lr": 0.00029663167846209965, + "time_sec": 32.586976528167725 + }, + { + "epoch": 96, + "train_loss": 0.280480184469223, + "train_acc": 0.9093, + "test_loss": 2.9630297519683837, + "test_acc": 0.5184, + "lyapunov": null, + "grad_norm": 0.5133233008116458, + "grad_max_sv": 0.22380913645029069, + "grad_min_sv": 9.095019559701712e-09, + "grad_condition": 693584615.2355412, + "lr": 0.00028711035421746345, + "time_sec": 32.56851410865784 + }, + { + "epoch": 97, + "train_loss": 0.2670245563793182, + "train_acc": 0.9139, + "test_loss": 2.9036443214416505, + "test_acc": 0.5232, + "lyapunov": null, + "grad_norm": 0.5060688229901619, + "grad_max_sv": 0.23383041098713875, + "grad_min_sv": 9.393182952245269e-09, + "grad_condition": 365456172.90854704, + "lr": 0.00027768241040753615, + "time_sec": 32.560548305511475 + }, + { + "epoch": 98, + "train_loss": 0.2613537116527557, + "train_acc": 0.91552, + "test_loss": 2.93895020904541, + "test_acc": 0.5186, + "lyapunov": null, + "grad_norm": 0.5033096276176704, + "grad_max_sv": 0.22504370659589767, + "grad_min_sv": 9.149747783043782e-09, + "grad_condition": 181789237.51414594, + "lr": 0.00026835198244006903, + "time_sec": 32.57581615447998 + }, + { + "epoch": 99, + "train_loss": 0.25923142310142516, + "train_acc": 0.91662, + "test_loss": 2.9681204444885254, + "test_acc": 0.519, + "lyapunov": null, + "grad_norm": 0.5005047043499057, + "grad_max_sv": 0.23424391224980354, + "grad_min_sv": 9.202334173646042e-09, + "grad_condition": 1390486041.6800082, + "lr": 0.0002591231629491421, + "time_sec": 32.568488359451294 + }, + { + "epoch": 100, + "train_loss": 0.2552828652858734, + "train_acc": 0.91668, + "test_loss": 2.9585084489822386, + "test_acc": 0.5195, + "lyapunov": null, + "grad_norm": 0.5000052829086656, + "grad_max_sv": 0.23269009366631507, + "grad_min_sv": 9.008429451874688e-09, + "grad_condition": 118235741.33881798, + "lr": 0.0002499999999999997, + "time_sec": 32.64319896697998 + }, + { + "epoch": 101, + "train_loss": 0.2504552359342575, + "train_acc": 0.92034, + "test_loss": 2.881327504348755, + "test_acc": 0.527, + "lyapunov": null, + "grad_norm": 0.4976095445457081, + "grad_max_sv": 0.23710807636380196, + "grad_min_sv": 8.987613531706572e-09, + "grad_condition": 188175820.91636205, + "lr": 0.00024098649531343477, + "time_sec": 32.56459856033325 + }, + { + "epoch": 102, + "train_loss": 0.24319207516670227, + "train_acc": 0.9211, + "test_loss": 2.8339650466918944, + "test_acc": 0.5304, + "lyapunov": null, + "grad_norm": 0.49020316429940586, + "grad_max_sv": 0.22668980285525323, + "grad_min_sv": 8.876688220674786e-09, + "grad_condition": 3067014755.4611425, + "lr": 0.0002320866025105016, + "time_sec": 32.56655430793762 + }, + { + "epoch": 103, + "train_loss": 0.23643713227272034, + "train_acc": 0.92328, + "test_loss": 2.8374974479675292, + "test_acc": 0.5312, + "lyapunov": null, + "grad_norm": 0.48382300142218854, + "grad_max_sv": 0.22789723835885525, + "grad_min_sv": 8.629146283113676e-09, + "grad_condition": 335837582.58375555, + "lr": 0.0002233042253783278, + "time_sec": 32.56167936325073 + }, + { + "epoch": 104, + "train_loss": 0.23221797705173491, + "train_acc": 0.92652, + "test_loss": 2.8848680614471434, + "test_acc": 0.5292, + "lyapunov": null, + "grad_norm": 0.47687316634744686, + "grad_max_sv": 0.21569081246852875, + "grad_min_sv": 8.62663665758762e-09, + "grad_condition": 1157675505.971954, + "lr": 0.000214643216157784, + "time_sec": 32.563629150390625 + }, + { + "epoch": 105, + "train_loss": 0.2289664591026306, + "train_acc": 0.9265, + "test_loss": 2.9271271530151366, + "test_acc": 0.5268, + "lyapunov": null, + "grad_norm": 0.47818041348027984, + "grad_max_sv": 0.21913939844816924, + "grad_min_sv": 8.707405810184226e-09, + "grad_condition": 207155237.78245467, + "lr": 0.00020610737385376332, + "time_sec": 32.56299424171448 + }, + { + "epoch": 106, + "train_loss": 0.22260613627433776, + "train_acc": 0.92814, + "test_loss": 2.8978806022644044, + "test_acc": 0.5295, + "lyapunov": null, + "grad_norm": 0.4722385726091627, + "grad_max_sv": 0.2149375133216381, + "grad_min_sv": 8.579168120879944e-09, + "grad_condition": 165117262.170354, + "lr": 0.00019770044256881242, + "time_sec": 32.58579874038696 + }, + { + "epoch": 107, + "train_loss": 0.21763298731803893, + "train_acc": 0.93018, + "test_loss": 2.908183602523804, + "test_acc": 0.5286, + "lyapunov": null, + "grad_norm": 0.4652522989647011, + "grad_max_sv": 0.22290415540337563, + "grad_min_sv": 8.928726000223541e-09, + "grad_condition": 479064684.028664, + "lr": 0.0001894261098608447, + "time_sec": 32.594443798065186 + }, + { + "epoch": 108, + "train_loss": 0.2121983386325836, + "train_acc": 0.9317, + "test_loss": 2.8597964405059813, + "test_acc": 0.5362, + "lyapunov": null, + "grad_norm": 0.45763107412030085, + "grad_max_sv": 0.21216899007558823, + "grad_min_sv": 8.420200893585924e-09, + "grad_condition": 688259775.9446552, + "lr": 0.000181288005125655, + "time_sec": 32.56038689613342 + }, + { + "epoch": 109, + "train_loss": 0.20583704056739807, + "train_acc": 0.93444, + "test_loss": 2.9211787143707277, + "test_acc": 0.5282, + "lyapunov": null, + "grad_norm": 0.4568920236456778, + "grad_max_sv": 0.22295879386365414, + "grad_min_sv": 8.673458856169048e-09, + "grad_condition": 89075535.84085791, + "lr": 0.0001732896980049473, + "time_sec": 32.575947761535645 + }, + { + "epoch": 110, + "train_loss": 0.21038897478103638, + "train_acc": 0.93206, + "test_loss": 2.9601449073791506, + "test_acc": 0.5279, + "lyapunov": null, + "grad_norm": 0.45979845223683363, + "grad_max_sv": 0.22593539729714393, + "grad_min_sv": 8.6531671937215e-09, + "grad_condition": 89403715.48231289, + "lr": 0.00016543469682057076, + "time_sec": 32.607563495635986 + }, + { + "epoch": 111, + "train_loss": 0.19834216837882995, + "train_acc": 0.93586, + "test_loss": 2.9055423223495485, + "test_acc": 0.5353, + "lyapunov": null, + "grad_norm": 0.44710603724659786, + "grad_max_sv": 0.2183500427752733, + "grad_min_sv": 8.1763572969476e-09, + "grad_condition": 161545447.91228038, + "lr": 0.00015772644703565552, + "time_sec": 32.57204461097717 + }, + { + "epoch": 112, + "train_loss": 0.19908358410835267, + "train_acc": 0.93552, + "test_loss": 2.994161311531067, + "test_acc": 0.5244, + "lyapunov": null, + "grad_norm": 0.4546597416131923, + "grad_max_sv": 0.21809808388352395, + "grad_min_sv": 8.425444494170043e-09, + "grad_condition": 140538020.508261, + "lr": 0.00015016832974331713, + "time_sec": 32.601916790008545 + }, + { + "epoch": 113, + "train_loss": 0.191571541864872, + "train_acc": 0.93866, + "test_loss": 2.986764238739014, + "test_acc": 0.5296, + "lyapunov": null, + "grad_norm": 0.4450596671055528, + "grad_max_sv": 0.21210374720394612, + "grad_min_sv": 8.032377695355725e-09, + "grad_condition": 1444127435.9832203, + "lr": 0.00014276366018359834, + "time_sec": 32.559205770492554 + }, + { + "epoch": 114, + "train_loss": 0.1893005026912689, + "train_acc": 0.93862, + "test_loss": 3.0139925247192383, + "test_acc": 0.5255, + "lyapunov": null, + "grad_norm": 0.4424054116910155, + "grad_max_sv": 0.21594099812209605, + "grad_min_sv": 8.292241756094332e-09, + "grad_condition": 1221030181.2962646, + "lr": 0.00013551568628929425, + "time_sec": 32.54303812980652 + }, + { + "epoch": 115, + "train_loss": 0.1869383985710144, + "train_acc": 0.94032, + "test_loss": 2.9447794439315795, + "test_acc": 0.5338, + "lyapunov": null, + "grad_norm": 0.44046789562845245, + "grad_max_sv": 0.22429420053958893, + "grad_min_sv": 8.562988351723532e-09, + "grad_condition": 109188406.44486985, + "lr": 0.00012842758726130276, + "time_sec": 32.57725954055786 + }, + { + "epoch": 116, + "train_loss": 0.18216380766868592, + "train_acc": 0.94282, + "test_loss": 2.9761684719085695, + "test_acc": 0.533, + "lyapunov": null, + "grad_norm": 0.43380483120573066, + "grad_max_sv": 0.21227659583091735, + "grad_min_sv": 8.084414394003703e-09, + "grad_condition": 442388430.74640197, + "lr": 0.0001215024721741218, + "time_sec": 32.56703448295593 + }, + { + "epoch": 117, + "train_loss": 0.18284838955402374, + "train_acc": 0.94104, + "test_loss": 2.988401131248474, + "test_acc": 0.5304, + "lyapunov": null, + "grad_norm": 0.43518014689479523, + "grad_max_sv": 0.20529667772352694, + "grad_min_sv": 8.008318215188027e-09, + "grad_condition": 525224592.1224529, + "lr": 0.00011474337861210538, + "time_sec": 32.56633758544922 + }, + { + "epoch": 118, + "train_loss": 0.17929271565437316, + "train_acc": 0.94202, + "test_loss": 2.969692068481445, + "test_acc": 0.531, + "lyapunov": null, + "grad_norm": 0.43166468988319484, + "grad_max_sv": 0.20995365753769873, + "grad_min_sv": 7.949281083993037e-09, + "grad_condition": 206686551.43998715, + "lr": 0.00010815327133708009, + "time_sec": 32.58298921585083 + }, + { + "epoch": 119, + "train_loss": 0.1746947413468361, + "train_acc": 0.94538, + "test_loss": 2.9470513034820556, + "test_acc": 0.5265, + "lyapunov": null, + "grad_norm": 0.4240479391496432, + "grad_max_sv": 0.21465191170573233, + "grad_min_sv": 8.01244074109808e-09, + "grad_condition": 266673927.46960324, + "lr": 0.00010173504098790182, + "time_sec": 32.58079934120178 + }, + { + "epoch": 120, + "train_loss": 0.17056026011943817, + "train_acc": 0.94666, + "test_loss": 2.9715382446289063, + "test_acc": 0.5374, + "lyapunov": null, + "grad_norm": 0.4216192661535551, + "grad_max_sv": 0.21133692860603331, + "grad_min_sv": 8.155698732288316e-09, + "grad_condition": 310751065.89462894, + "lr": 9.549150281252629e-05, + "time_sec": 32.567041635513306 + }, + { + "epoch": 121, + "train_loss": 0.16829824639320373, + "train_acc": 0.94648, + "test_loss": 3.087546385574341, + "test_acc": 0.5255, + "lyapunov": null, + "grad_norm": 0.4183748049917772, + "grad_max_sv": 0.20680695101618768, + "grad_min_sv": 7.995454154665922e-09, + "grad_condition": 1023933342.3354034, + "lr": 8.942539543314794e-05, + "time_sec": 32.589598178863525 + }, + { + "epoch": 122, + "train_loss": 0.16800043944358825, + "train_acc": 0.94632, + "test_loss": 2.9318422325134277, + "test_acc": 0.5338, + "lyapunov": null, + "grad_norm": 0.42099752391898676, + "grad_max_sv": 0.21042499877512455, + "grad_min_sv": 7.547093950439551e-09, + "grad_condition": 900826897.3857119, + "lr": 8.353937964495024e-05, + "time_sec": 32.595381021499634 + }, + { + "epoch": 123, + "train_loss": 0.16323296820640565, + "train_acc": 0.94816, + "test_loss": 3.0529399940490722, + "test_acc": 0.5285, + "lyapunov": null, + "grad_norm": 0.41313116824251195, + "grad_max_sv": 0.19900580085814, + "grad_min_sv": 7.892230206862915e-09, + "grad_condition": 209614816.18259263, + "lr": 7.783603724899243e-05, + "time_sec": 32.5691282749176 + }, + { + "epoch": 124, + "train_loss": 0.16248614077568055, + "train_acc": 0.94808, + "test_loss": 2.968647869491577, + "test_acc": 0.5376, + "lyapunov": null, + "grad_norm": 0.4109739294498664, + "grad_max_sv": 0.2045503228902817, + "grad_min_sv": 7.709402672934767e-09, + "grad_condition": 204317712.1943869, + "lr": 7.231786991974666e-05, + "time_sec": 32.56873893737793 + }, + { + "epoch": 125, + "train_loss": 0.16562083917617798, + "train_acc": 0.94652, + "test_loss": 2.990608223724365, + "test_acc": 0.5324, + "lyapunov": null, + "grad_norm": 0.41726227575170305, + "grad_max_sv": 0.21484395451843738, + "grad_min_sv": 8.067420890524312e-09, + "grad_condition": 451509267.6606773, + "lr": 6.698729810778072e-05, + "time_sec": 32.563942432403564 + }, + { + "epoch": 126, + "train_loss": 0.16248787566184997, + "train_acc": 0.94908, + "test_loss": 3.0610411296844484, + "test_acc": 0.5248, + "lyapunov": null, + "grad_norm": 0.41265591679124974, + "grad_max_sv": 0.20524860061705114, + "grad_min_sv": 7.563831366450003e-09, + "grad_condition": 115790817.80184206, + "lr": 6.184665997806817e-05, + "time_sec": 32.568299770355225 + }, + { + "epoch": 127, + "train_loss": 0.15771708325862885, + "train_acc": 0.95078, + "test_loss": 2.962667014122009, + "test_acc": 0.5409, + "lyapunov": null, + "grad_norm": 0.4075071230249109, + "grad_max_sv": 0.20769537538290023, + "grad_min_sv": 8.188405986597757e-09, + "grad_condition": 380886928.1801485, + "lr": 5.6898210384392595e-05, + "time_sec": 32.57155394554138 + }, + { + "epoch": 128, + "train_loss": 0.15537331622004508, + "train_acc": 0.95126, + "test_loss": 2.9610030857086183, + "test_acc": 0.5357, + "lyapunov": null, + "grad_norm": 0.4021889013709537, + "grad_max_sv": 0.19925076719373463, + "grad_min_sv": 7.527878987789033e-09, + "grad_condition": 171791225.70681745, + "lr": 5.214411988029363e-05, + "time_sec": 32.58445978164673 + }, + { + "epoch": 129, + "train_loss": 0.15362726456165313, + "train_acc": 0.9504, + "test_loss": 3.0267199047088624, + "test_acc": 0.5318, + "lyapunov": null, + "grad_norm": 0.40304342978976343, + "grad_max_sv": 0.2073110181838274, + "grad_min_sv": 7.651128650391566e-09, + "grad_condition": 655223821.7012879, + "lr": 4.7586473766990294e-05, + "time_sec": 32.58788251876831 + }, + { + "epoch": 130, + "train_loss": 0.15159179414272309, + "train_acc": 0.95296, + "test_loss": 3.075101675415039, + "test_acc": 0.5263, + "lyapunov": null, + "grad_norm": 0.3974054527380892, + "grad_max_sv": 0.20575362853705884, + "grad_min_sv": 7.740591648555672e-09, + "grad_condition": 144759180.06870463, + "lr": 4.32272711786996e-05, + "time_sec": 32.578858613967896 + }, + { + "epoch": 131, + "train_loss": 0.1488430485343933, + "train_acc": 0.95292, + "test_loss": 2.9862019886016844, + "test_acc": 0.5315, + "lyapunov": null, + "grad_norm": 0.3954060106149679, + "grad_max_sv": 0.20766182690858842, + "grad_min_sv": 7.58607175857344e-09, + "grad_condition": 425579805.0794872, + "lr": 3.906842420574966e-05, + "time_sec": 32.586265325546265 + }, + { + "epoch": 132, + "train_loss": 0.14661406512260436, + "train_acc": 0.95324, + "test_loss": 3.057056298828125, + "test_acc": 0.5262, + "lyapunov": null, + "grad_norm": 0.39095745142548216, + "grad_max_sv": 0.19490535818040372, + "grad_min_sv": 7.49121251628342e-09, + "grad_condition": 3507301112.9708757, + "lr": 3.5111757055874305e-05, + "time_sec": 32.574090003967285 + }, + { + "epoch": 133, + "train_loss": 0.1463806065893173, + "train_acc": 0.95318, + "test_loss": 3.0613175567626953, + "test_acc": 0.527, + "lyapunov": null, + "grad_norm": 0.3949318760097119, + "grad_max_sv": 0.2000393845140934, + "grad_min_sv": 7.511325199847929e-09, + "grad_condition": 264016430.37942663, + "lr": 3.1359005254054254e-05, + "time_sec": 32.57793402671814 + }, + { + "epoch": 134, + "train_loss": 0.14586117388010025, + "train_acc": 0.95352, + "test_loss": 3.0277784969329833, + "test_acc": 0.5333, + "lyapunov": null, + "grad_norm": 0.3915443650869973, + "grad_max_sv": 0.20002376139163972, + "grad_min_sv": 7.407051562673041e-09, + "grad_condition": 1569872714.1138968, + "lr": 2.7811814881259484e-05, + "time_sec": 32.58327078819275 + }, + { + "epoch": 135, + "train_loss": 0.14679538232803344, + "train_acc": 0.9531, + "test_loss": 3.02330316696167, + "test_acc": 0.5325, + "lyapunov": null, + "grad_norm": 0.39654447314663155, + "grad_max_sv": 0.2064110331237316, + "grad_min_sv": 8.009200439971707e-09, + "grad_condition": 408075856.5604743, + "lr": 2.4471741852423218e-05, + "time_sec": 32.57164478302002 + }, + { + "epoch": 136, + "train_loss": 0.14213005175113677, + "train_acc": 0.95606, + "test_loss": 3.066131346511841, + "test_acc": 0.5326, + "lyapunov": null, + "grad_norm": 0.386859099144263, + "grad_max_sv": 0.20008183866739274, + "grad_min_sv": 7.493826075335216e-09, + "grad_condition": 1294487907.3292127, + "lr": 2.1340251233966362e-05, + "time_sec": 32.59002447128296 + }, + { + "epoch": 137, + "train_loss": 0.14528326896190644, + "train_acc": 0.95314, + "test_loss": 2.9820048439025877, + "test_acc": 0.5384, + "lyapunov": null, + "grad_norm": 0.3940518150499405, + "grad_max_sv": 0.20172332599759102, + "grad_min_sv": 7.518978299708582e-09, + "grad_condition": 2050951064.0374703, + "lr": 1.8418716601170932e-05, + "time_sec": 32.582863569259644 + }, + { + "epoch": 138, + "train_loss": 0.14290555841445923, + "train_acc": 0.954, + "test_loss": 2.9484275436401366, + "test_acc": 0.5392, + "lyapunov": null, + "grad_norm": 0.3885095445150157, + "grad_max_sv": 0.1956668719649315, + "grad_min_sv": 7.481351363262425e-09, + "grad_condition": 817168787.737042, + "lr": 1.570841943568445e-05, + "time_sec": 32.56788969039917 + }, + { + "epoch": 139, + "train_loss": 0.1455221847629547, + "train_acc": 0.95376, + "test_loss": 2.9918841510772705, + "test_acc": 0.539, + "lyapunov": null, + "grad_norm": 0.39394584988421966, + "grad_max_sv": 0.1982663732022047, + "grad_min_sv": 7.502347731524073e-09, + "grad_condition": 1796580822.5410652, + "lr": 1.3210548563419845e-05, + "time_sec": 32.57190442085266 + }, + { + "epoch": 140, + "train_loss": 0.1442144584083557, + "train_acc": 0.95352, + "test_loss": 2.970733211517334, + "test_acc": 0.5376, + "lyapunov": null, + "grad_norm": 0.39260771988813964, + "grad_max_sv": 0.19792755618691443, + "grad_min_sv": 7.351794456978561e-09, + "grad_condition": 208762115.79842368, + "lr": 1.0926199633097203e-05, + "time_sec": 32.58234429359436 + }, + { + "epoch": 141, + "train_loss": 0.1421483956861496, + "train_acc": 0.95486, + "test_loss": 2.9954518421173097, + "test_acc": 0.5376, + "lyapunov": null, + "grad_norm": 0.3895044607831209, + "grad_max_sv": 0.19535492211580277, + "grad_min_sv": 7.2159212467261255e-09, + "grad_condition": 226711442.0952455, + "lr": 8.856374635655688e-06, + "time_sec": 32.580827951431274 + }, + { + "epoch": 142, + "train_loss": 0.14344135119915008, + "train_acc": 0.95412, + "test_loss": 3.0175164573669435, + "test_acc": 0.5347, + "lyapunov": null, + "grad_norm": 0.3912699552240718, + "grad_max_sv": 0.20520108379423618, + "grad_min_sv": 7.762914990688819e-09, + "grad_condition": 387803307.69275963, + "lr": 7.001981464747503e-06, + "time_sec": 32.58955121040344 + }, + { + "epoch": 143, + "train_loss": 0.145557352809906, + "train_acc": 0.95334, + "test_loss": 2.9905672885894776, + "test_acc": 0.5351, + "lyapunov": null, + "grad_norm": 0.3937145534468507, + "grad_max_sv": 0.19824392758309842, + "grad_min_sv": 7.470967854170812e-09, + "grad_condition": 615993628.5132923, + "lr": 5.3638335185058295e-06, + "time_sec": 32.584557056427 + }, + { + "epoch": 144, + "train_loss": 0.13792892556190492, + "train_acc": 0.9568, + "test_loss": 3.0243384300231932, + "test_acc": 0.5351, + "lyapunov": null, + "grad_norm": 0.38137874618156004, + "grad_max_sv": 0.20396318212151526, + "grad_min_sv": 7.759564610645975e-09, + "grad_condition": 401781652.79968464, + "lr": 3.942649342761114e-06, + "time_sec": 32.58082866668701 + }, + { + "epoch": 145, + "train_loss": 0.14240989098906517, + "train_acc": 0.95506, + "test_loss": 3.008878281021118, + "test_acc": 0.5332, + "lyapunov": null, + "grad_norm": 0.38824198485970274, + "grad_max_sv": 0.1965224850922823, + "grad_min_sv": 7.475432478099615e-09, + "grad_condition": 547980005.9847585, + "lr": 2.7390523158633524e-06, + "time_sec": 32.580146074295044 + }, + { + "epoch": 146, + "train_loss": 0.14141309247016906, + "train_acc": 0.95526, + "test_loss": 2.9967607612609863, + "test_acc": 0.5355, + "lyapunov": null, + "grad_norm": 0.3897738666220961, + "grad_max_sv": 0.20576116181910037, + "grad_min_sv": 7.723471491180578e-09, + "grad_condition": 174968319.88759154, + "lr": 1.7535703752478133e-06, + "time_sec": 32.57999658584595 + }, + { + "epoch": 147, + "train_loss": 0.14116668840408325, + "train_acc": 0.95622, + "test_loss": 3.015700612258911, + "test_acc": 0.5356, + "lyapunov": null, + "grad_norm": 0.38647682331651556, + "grad_max_sv": 0.20005690585821867, + "grad_min_sv": 7.458373789469112e-09, + "grad_condition": 559134109.3457831, + "lr": 9.866357858642196e-07, + "time_sec": 32.57423949241638 + }, + { + "epoch": 148, + "train_loss": 0.13872075388908386, + "train_acc": 0.95694, + "test_loss": 3.02675003452301, + "test_acc": 0.5311, + "lyapunov": null, + "grad_norm": 0.3834516001697345, + "grad_max_sv": 0.20063496865332126, + "grad_min_sv": 7.280352303873708e-09, + "grad_condition": 342935155.3336584, + "lr": 4.38584950570808e-07, + "time_sec": 32.59147930145264 + }, + { + "epoch": 149, + "train_loss": 0.14044044229030608, + "train_acc": 0.9558, + "test_loss": 3.0015827127456665, + "test_acc": 0.537, + "lyapunov": null, + "grad_norm": 0.38662537604202735, + "grad_max_sv": 0.1903643485158682, + "grad_min_sv": 7.2725075060480446e-09, + "grad_condition": 1114748941.7660475, + "lr": 1.096582625772501e-07, + "time_sec": 32.56627154350281 + }, + { + "epoch": 150, + "train_loss": 0.14047483313083647, + "train_acc": 0.95586, + "test_loss": 3.1137742416381835, + "test_acc": 0.5222, + "lyapunov": null, + "grad_norm": 0.38553295960146916, + "grad_max_sv": 0.2001470748335123, + "grad_min_sv": 7.337464655082695e-09, + "grad_condition": 1377858482.3116786, + "lr": 0.0, + "time_sec": 32.586660385131836 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 4.87748296585083, + "train_acc": 0.0306, + "test_loss": 4.82872876663208, + "test_acc": 0.0165, + "lyapunov": null, + "grad_norm": 5.932964620640208, + "grad_max_sv": 5.34441111087799, + "grad_min_sv": 9.95076935739192e-08, + "grad_condition": 162613846.39082906, + "lr": 0.0009998903417374227, + "time_sec": 49.64781618118286 + }, + { + "epoch": 2, + "train_loss": 4.325910377655029, + "train_acc": 0.05894, + "test_loss": 4.736625276947022, + "test_acc": 0.0233, + "lyapunov": null, + "grad_norm": 4.434671975936239, + "grad_max_sv": 3.9236845791339876, + "grad_min_sv": 7.506598741907622e-08, + "grad_condition": 326618949.3555427, + "lr": 0.0009995614150494292, + "time_sec": 49.66104316711426 + }, + { + "epoch": 3, + "train_loss": 4.033521332244873, + "train_acc": 0.08816, + "test_loss": 4.546054625701904, + "test_acc": 0.0313, + "lyapunov": null, + "grad_norm": 3.5972867305140204, + "grad_max_sv": 3.0456687450408935, + "grad_min_sv": 6.285284603370356e-08, + "grad_condition": 641155242.0675491, + "lr": 0.0009990133642141358, + "time_sec": 49.67153525352478 + }, + { + "epoch": 4, + "train_loss": 3.8378815770721437, + "train_acc": 0.11312, + "test_loss": 4.485385893249512, + "test_acc": 0.0421, + "lyapunov": null, + "grad_norm": 3.005868245561951, + "grad_max_sv": 2.4899374902248383, + "grad_min_sv": 5.274935636068179e-08, + "grad_condition": 56291013.628438115, + "lr": 0.0009982464296247522, + "time_sec": 49.65495419502258 + }, + { + "epoch": 5, + "train_loss": 3.6790373979949953, + "train_acc": 0.1354, + "test_loss": 4.809463809204102, + "test_acc": 0.0483, + "lyapunov": null, + "grad_norm": 2.481791347519261, + "grad_max_sv": 1.911762249469757, + "grad_min_sv": 4.251578253344768e-08, + "grad_condition": 59447447.39549043, + "lr": 0.0009972609476841367, + "time_sec": 49.609050989151 + }, + { + "epoch": 6, + "train_loss": 3.5471466955566404, + "train_acc": 0.1563, + "test_loss": 4.763859475708008, + "test_acc": 0.0562, + "lyapunov": null, + "grad_norm": 2.0531107778434636, + "grad_max_sv": 1.4932055324316025, + "grad_min_sv": 3.614347272584695e-08, + "grad_condition": 45442606.51570525, + "lr": 0.000996057350657239, + "time_sec": 49.593199491500854 + }, + { + "epoch": 7, + "train_loss": 3.4418113514709474, + "train_acc": 0.17478, + "test_loss": 4.615470837402344, + "test_acc": 0.061, + "lyapunov": null, + "grad_norm": 1.7367000738812381, + "grad_max_sv": 1.1847797572612762, + "grad_min_sv": 3.088092909442341e-08, + "grad_condition": 65255140.867708586, + "lr": 0.000994636166481494, + "time_sec": 49.60785531997681 + }, + { + "epoch": 8, + "train_loss": 3.354895782546997, + "train_acc": 0.18784, + "test_loss": 5.2386075889587405, + "test_acc": 0.0585, + "lyapunov": null, + "grad_norm": 1.5335851977180728, + "grad_max_sv": 0.9428193107247352, + "grad_min_sv": 2.6885542893373415e-08, + "grad_condition": 75909476.50814043, + "lr": 0.0009929980185352525, + "time_sec": 49.60816526412964 + }, + { + "epoch": 9, + "train_loss": 3.2788688597869875, + "train_acc": 0.20466, + "test_loss": 5.2327860107421875, + "test_acc": 0.0714, + "lyapunov": null, + "grad_norm": 1.374914600034168, + "grad_max_sv": 0.7664340496063232, + "grad_min_sv": 2.4066519885290737e-08, + "grad_condition": 51969313.05697616, + "lr": 0.0009911436253643444, + "time_sec": 49.62115836143494 + }, + { + "epoch": 10, + "train_loss": 3.214320725250244, + "train_acc": 0.21478, + "test_loss": 5.367890010070801, + "test_acc": 0.0635, + "lyapunov": null, + "grad_norm": 1.2723756047607861, + "grad_max_sv": 0.6678376257419586, + "grad_min_sv": 2.3140357913176147e-08, + "grad_condition": 33781734.36143675, + "lr": 0.0009890738003669028, + "time_sec": 49.653478384017944 + }, + { + "epoch": 11, + "train_loss": 3.157560857696533, + "train_acc": 0.22716, + "test_loss": 4.9893413871765135, + "test_acc": 0.0793, + "lyapunov": null, + "grad_norm": 1.1804196554033854, + "grad_max_sv": 0.5599115259945393, + "grad_min_sv": 2.0999575375824088e-08, + "grad_condition": 40003653.553005375, + "lr": 0.00098678945143658, + "time_sec": 49.64659833908081 + }, + { + "epoch": 12, + "train_loss": 3.10919125541687, + "train_acc": 0.23374, + "test_loss": 5.922018681335449, + "test_acc": 0.0572, + "lyapunov": null, + "grad_norm": 1.1127516543729237, + "grad_max_sv": 0.5103657670319081, + "grad_min_sv": 2.0326233945988648e-08, + "grad_condition": 31959597.02886455, + "lr": 0.0009842915805643154, + "time_sec": 49.6422758102417 + }, + { + "epoch": 13, + "train_loss": 3.0661709033203124, + "train_acc": 0.24498, + "test_loss": 5.5857378784179685, + "test_acc": 0.0641, + "lyapunov": null, + "grad_norm": 1.0572945850355566, + "grad_max_sv": 0.468644580245018, + "grad_min_sv": 1.9489185115739716e-08, + "grad_condition": 28974309.240684826, + "lr": 0.000981581283398829, + "time_sec": 49.644200801849365 + }, + { + "epoch": 14, + "train_loss": 3.031631886138916, + "train_acc": 0.2494, + "test_loss": 6.1126462295532225, + "test_acc": 0.0622, + "lyapunov": null, + "grad_norm": 1.0078886975437553, + "grad_max_sv": 0.4199274107813835, + "grad_min_sv": 1.78886194669714e-08, + "grad_condition": 58726821.90857921, + "lr": 0.0009786597487660333, + "time_sec": 49.64050054550171 + }, + { + "epoch": 15, + "train_loss": 2.9854307820892334, + "train_acc": 0.25912, + "test_loss": 6.682256416320801, + "test_acc": 0.0577, + "lyapunov": null, + "grad_norm": 0.9661185163428607, + "grad_max_sv": 0.4044369950890541, + "grad_min_sv": 1.7625257230091673e-08, + "grad_condition": 47054066.77256496, + "lr": 0.0009755282581475766, + "time_sec": 49.64783048629761 + }, + { + "epoch": 16, + "train_loss": 2.950966311187744, + "train_acc": 0.26442, + "test_loss": 6.452827975463867, + "test_acc": 0.0549, + "lyapunov": null, + "grad_norm": 0.9327205202160699, + "grad_max_sv": 0.38560108840465546, + "grad_min_sv": 1.7282875616189337e-08, + "grad_condition": 314726395.9437877, + "lr": 0.0009721881851187403, + "time_sec": 49.64088153839111 + }, + { + "epoch": 17, + "train_loss": 2.916735321044922, + "train_acc": 0.27246, + "test_loss": 6.896680711364746, + "test_acc": 0.0438, + "lyapunov": null, + "grad_norm": 0.8945744514519771, + "grad_max_sv": 0.354119461029768, + "grad_min_sv": 1.643565590847551e-08, + "grad_condition": 26255983.39074681, + "lr": 0.0009686409947459456, + "time_sec": 49.627718448638916 + }, + { + "epoch": 18, + "train_loss": 2.8857511570739747, + "train_acc": 0.27974, + "test_loss": 5.6459962882995605, + "test_acc": 0.0503, + "lyapunov": null, + "grad_norm": 0.8793484279442325, + "grad_max_sv": 0.35779951736330984, + "grad_min_sv": 1.628617940785393e-08, + "grad_condition": 111551423.90357837, + "lr": 0.0009648882429441254, + "time_sec": 49.611419677734375 + }, + { + "epoch": 19, + "train_loss": 2.850851222381592, + "train_acc": 0.28394, + "test_loss": 6.184397215270996, + "test_acc": 0.0477, + "lyapunov": null, + "grad_norm": 0.8560875588234809, + "grad_max_sv": 0.3290360912680626, + "grad_min_sv": 1.5741092075638452e-08, + "grad_condition": 33852379.436212204, + "lr": 0.00096093157579425, + "time_sec": 49.60723423957825 + }, + { + "epoch": 20, + "train_loss": 2.8297593169403075, + "train_acc": 0.2865, + "test_loss": 6.550658810424805, + "test_acc": 0.052, + "lyapunov": null, + "grad_norm": 0.8484343768951315, + "grad_max_sv": 0.3310988314449787, + "grad_min_sv": 1.579570341747605e-08, + "grad_condition": 26630780.62742402, + "lr": 0.0009567727288213001, + "time_sec": 49.63738775253296 + }, + { + "epoch": 21, + "train_loss": 2.8062883308410647, + "train_acc": 0.29554, + "test_loss": 6.611366340637207, + "test_acc": 0.0425, + "lyapunov": null, + "grad_norm": 0.8271444897566678, + "grad_max_sv": 0.31499212570488455, + "grad_min_sv": 1.5104316366393312e-08, + "grad_condition": 56385885.9009584, + "lr": 0.0009524135262330095, + "time_sec": 49.624245405197144 + }, + { + "epoch": 22, + "train_loss": 2.7797841816711424, + "train_acc": 0.29848, + "test_loss": 5.2575527236938475, + "test_acc": 0.0689, + "lyapunov": null, + "grad_norm": 0.8192773127159139, + "grad_max_sv": 0.3165230479091406, + "grad_min_sv": 1.5343957029956278e-08, + "grad_condition": 28932546.565699626, + "lr": 0.0009478558801197061, + "time_sec": 49.6358916759491 + }, + { + "epoch": 23, + "train_loss": 2.758929995956421, + "train_acc": 0.30298, + "test_loss": 5.9057046417236325, + "test_acc": 0.0483, + "lyapunov": null, + "grad_norm": 0.7977853555521689, + "grad_max_sv": 0.2981082580983639, + "grad_min_sv": 1.4607530535171166e-08, + "grad_condition": 23062158.33463922, + "lr": 0.000943101789615607, + "time_sec": 49.64936828613281 + }, + { + "epoch": 24, + "train_loss": 2.7243907251739503, + "train_acc": 0.30978, + "test_loss": 6.879129153442383, + "test_acc": 0.0503, + "lyapunov": null, + "grad_norm": 0.785562618961601, + "grad_max_sv": 0.3072618875652552, + "grad_min_sv": 1.4546391063907649e-08, + "grad_condition": 26103951.701446574, + "lr": 0.0009381533400219313, + "time_sec": 49.654170513153076 + }, + { + "epoch": 25, + "train_loss": 2.7052862129211426, + "train_acc": 0.31438, + "test_loss": 7.123418940734863, + "test_acc": 0.0498, + "lyapunov": null, + "grad_norm": 0.7800832079587465, + "grad_max_sv": 0.28868941627442835, + "grad_min_sv": 1.4423146366127071e-08, + "grad_condition": 25468875.32253523, + "lr": 0.0009330127018922189, + "time_sec": 49.644099712371826 + }, + { + "epoch": 26, + "train_loss": 2.6786952052307127, + "train_acc": 0.31786, + "test_loss": 6.8779948043823245, + "test_acc": 0.04, + "lyapunov": null, + "grad_norm": 0.7660717213990589, + "grad_max_sv": 0.28445089757442477, + "grad_min_sv": 1.4051416873800404e-08, + "grad_condition": 157008558.44244316, + "lr": 0.000927682130080253, + "time_sec": 49.6546745300293 + }, + { + "epoch": 27, + "train_loss": 2.650107885437012, + "train_acc": 0.3233, + "test_loss": 6.409167988586426, + "test_acc": 0.0663, + "lyapunov": null, + "grad_norm": 0.7553219053413048, + "grad_max_sv": 0.2734900705516338, + "grad_min_sv": 1.3975185350623143e-08, + "grad_condition": 26675374.92153287, + "lr": 0.0009221639627510072, + "time_sec": 49.651949882507324 + }, + { + "epoch": 28, + "train_loss": 2.6323010539245604, + "train_acc": 0.32642, + "test_loss": 6.348737354278565, + "test_acc": 0.0767, + "lyapunov": null, + "grad_norm": 0.7542460840346141, + "grad_max_sv": 0.28178194239735604, + "grad_min_sv": 1.4111558673673974e-08, + "grad_condition": 153191030.94962814, + "lr": 0.0009164606203550494, + "time_sec": 49.657703161239624 + }, + { + "epoch": 29, + "train_loss": 2.622528738861084, + "train_acc": 0.33052, + "test_loss": 5.323012785339356, + "test_acc": 0.0615, + "lyapunov": null, + "grad_norm": 0.7434329600183185, + "grad_max_sv": 0.28229105696082113, + "grad_min_sv": 1.3741382927194567e-08, + "grad_condition": 99920561.24148658, + "lr": 0.0009105746045668516, + "time_sec": 49.640869140625 + }, + { + "epoch": 30, + "train_loss": 2.589859499359131, + "train_acc": 0.3361, + "test_loss": 5.348752153015137, + "test_acc": 0.0806, + "lyapunov": null, + "grad_norm": 0.7401188593705409, + "grad_max_sv": 0.2747684422880411, + "grad_min_sv": 1.3880728885751203e-08, + "grad_condition": 23324413.51449412, + "lr": 0.0009045084971874733, + "time_sec": 49.62320137023926 + }, + { + "epoch": 31, + "train_loss": 2.574071376495361, + "train_acc": 0.33836, + "test_loss": 4.929797785949707, + "test_acc": 0.0696, + "lyapunov": null, + "grad_norm": 0.7328550694976608, + "grad_max_sv": 0.27694769613444803, + "grad_min_sv": 1.3843863291840286e-08, + "grad_condition": 27250825.622907154, + "lr": 0.0008982649590120977, + "time_sec": 49.61762976646423 + }, + { + "epoch": 32, + "train_loss": 2.5636251927185056, + "train_acc": 0.33996, + "test_loss": 4.977822930908203, + "test_acc": 0.0603, + "lyapunov": null, + "grad_norm": 0.72578993407064, + "grad_max_sv": 0.26916658468544485, + "grad_min_sv": 1.3664173616201313e-08, + "grad_condition": 37586474.04914663, + "lr": 0.0008918467286629196, + "time_sec": 49.59874439239502 + }, + { + "epoch": 33, + "train_loss": 2.534274593658447, + "train_acc": 0.34576, + "test_loss": 5.612884985351562, + "test_acc": 0.0648, + "lyapunov": null, + "grad_norm": 0.7195677912828391, + "grad_max_sv": 0.2578020472079515, + "grad_min_sv": 1.3214893858359833e-08, + "grad_condition": 31599310.228798192, + "lr": 0.0008852566213878943, + "time_sec": 49.60587477684021 + }, + { + "epoch": 34, + "train_loss": 2.5204806367492676, + "train_acc": 0.34968, + "test_loss": 5.823319554901123, + "test_acc": 0.0571, + "lyapunov": null, + "grad_norm": 0.7058229239582122, + "grad_max_sv": 0.2517259892076254, + "grad_min_sv": 1.3128194935319027e-08, + "grad_condition": 38016748.40510639, + "lr": 0.000878497527825878, + "time_sec": 49.63596320152283 + }, + { + "epoch": 35, + "train_loss": 2.4967036684417723, + "train_acc": 0.35386, + "test_loss": 5.568839009094238, + "test_acc": 0.0655, + "lyapunov": null, + "grad_norm": 0.7071521329332581, + "grad_max_sv": 0.2598913241177797, + "grad_min_sv": 1.3420283057063997e-08, + "grad_condition": 21475756.171551444, + "lr": 0.000871572412738697, + "time_sec": 49.64343976974487 + }, + { + "epoch": 36, + "train_loss": 2.483395898208618, + "train_acc": 0.356, + "test_loss": 5.925778231811523, + "test_acc": 0.0775, + "lyapunov": null, + "grad_norm": 0.7019030587227678, + "grad_max_sv": 0.2620332419872284, + "grad_min_sv": 1.330909059973906e-08, + "grad_condition": 39143745.76315293, + "lr": 0.0008644843137107055, + "time_sec": 49.633464097976685 + }, + { + "epoch": 37, + "train_loss": 2.455888598480225, + "train_acc": 0.3619, + "test_loss": 5.800891122436523, + "test_acc": 0.0522, + "lyapunov": null, + "grad_norm": 0.7041203727881495, + "grad_max_sv": 0.25247339606285096, + "grad_min_sv": 1.317027563119133e-08, + "grad_condition": 25971636.862640023, + "lr": 0.0008572363398164014, + "time_sec": 49.641075134277344 + }, + { + "epoch": 38, + "train_loss": 2.444258794937134, + "train_acc": 0.3643, + "test_loss": 6.3827191253662106, + "test_acc": 0.0512, + "lyapunov": null, + "grad_norm": 0.6991868964165402, + "grad_max_sv": 0.2449926756322384, + "grad_min_sv": 1.2983126976284787e-08, + "grad_condition": 22727640.443126805, + "lr": 0.0008498316702566826, + "time_sec": 49.6653778553009 + }, + { + "epoch": 39, + "train_loss": 2.427623992614746, + "train_acc": 0.36718, + "test_loss": 5.836345671081543, + "test_acc": 0.0532, + "lyapunov": null, + "grad_norm": 0.6944654131754266, + "grad_max_sv": 0.24421218782663345, + "grad_min_sv": 1.2779784830385666e-08, + "grad_condition": 26159365.26096248, + "lr": 0.0008422735529643442, + "time_sec": 49.65552568435669 + }, + { + "epoch": 40, + "train_loss": 2.4149912483215332, + "train_acc": 0.36854, + "test_loss": 5.969065676879882, + "test_acc": 0.0689, + "lyapunov": null, + "grad_norm": 0.6869986110904911, + "grad_max_sv": 0.23399859815835952, + "grad_min_sv": 1.2716373970489415e-08, + "grad_condition": 21923336.447286993, + "lr": 0.0008345653031794289, + "time_sec": 49.66923117637634 + }, + { + "epoch": 41, + "train_loss": 2.386474126663208, + "train_acc": 0.37558, + "test_loss": 6.019966047668457, + "test_acc": 0.0579, + "lyapunov": null, + "grad_norm": 0.68492309888036, + "grad_max_sv": 0.2508115164935589, + "grad_min_sv": 1.3077304128472633e-08, + "grad_condition": 23198341.25841063, + "lr": 0.0008267103019950526, + "time_sec": 49.620418071746826 + }, + { + "epoch": 42, + "train_loss": 2.3729596766662597, + "train_acc": 0.38002, + "test_loss": 6.315153423309326, + "test_acc": 0.0611, + "lyapunov": null, + "grad_norm": 0.6839063548904902, + "grad_max_sv": 0.24613724276423454, + "grad_min_sv": 1.2924071682296479e-08, + "grad_condition": 24553794.967906404, + "lr": 0.0008187119948743447, + "time_sec": 49.66134309768677 + }, + { + "epoch": 43, + "train_loss": 2.3540061936950685, + "train_acc": 0.38038, + "test_loss": 6.8890972946166995, + "test_acc": 0.052, + "lyapunov": null, + "grad_norm": 0.6797404469786038, + "grad_max_sv": 0.23774098604917526, + "grad_min_sv": 1.269067942399893e-08, + "grad_condition": 36055931.35688925, + "lr": 0.000810573890139155, + "time_sec": 49.60659217834473 + }, + { + "epoch": 44, + "train_loss": 2.3270812229919433, + "train_acc": 0.38584, + "test_loss": 6.7161765426635744, + "test_acc": 0.0423, + "lyapunov": null, + "grad_norm": 0.6759173721688353, + "grad_max_sv": 0.24107158593833447, + "grad_min_sv": 1.2535652725575997e-08, + "grad_condition": 27534242.15084389, + "lr": 0.0008022995574311873, + "time_sec": 49.602726459503174 + }, + { + "epoch": 45, + "train_loss": 2.3246476860046386, + "train_acc": 0.39008, + "test_loss": 6.29091294631958, + "test_acc": 0.0518, + "lyapunov": null, + "grad_norm": 0.6715272373280456, + "grad_max_sv": 0.23545034006237983, + "grad_min_sv": 1.2545344027503624e-08, + "grad_condition": 21225788.36034053, + "lr": 0.0007938926261462363, + "time_sec": 49.6089346408844 + }, + { + "epoch": 46, + "train_loss": 2.302794339752197, + "train_acc": 0.3932, + "test_loss": 6.331070534515381, + "test_acc": 0.0457, + "lyapunov": null, + "grad_norm": 0.6695288339948315, + "grad_max_sv": 0.2387615241110325, + "grad_min_sv": 1.267214993216914e-08, + "grad_condition": 21439809.063333027, + "lr": 0.0007853567838422158, + "time_sec": 49.6616952419281 + }, + { + "epoch": 47, + "train_loss": 2.2937580155944826, + "train_acc": 0.39494, + "test_loss": 6.747457525634766, + "test_acc": 0.0403, + "lyapunov": null, + "grad_norm": 0.6703150590025013, + "grad_max_sv": 0.23008973710238934, + "grad_min_sv": 1.243687924035175e-08, + "grad_condition": 21332244.897804268, + "lr": 0.0007766957746216719, + "time_sec": 49.64005661010742 + }, + { + "epoch": 48, + "train_loss": 2.271936141662598, + "train_acc": 0.40028, + "test_loss": 8.364392227172852, + "test_acc": 0.045, + "lyapunov": null, + "grad_norm": 0.6688819126115724, + "grad_max_sv": 0.23257951848208905, + "grad_min_sv": 1.2320799760989764e-08, + "grad_condition": 43562236.54403031, + "lr": 0.0007679133974894982, + "time_sec": 49.66763877868652 + }, + { + "epoch": 49, + "train_loss": 2.2604706730651856, + "train_acc": 0.40228, + "test_loss": 6.142012088012695, + "test_acc": 0.0648, + "lyapunov": null, + "grad_norm": 0.6643101794178548, + "grad_max_sv": 0.2336978729814291, + "grad_min_sv": 1.2540253756243568e-08, + "grad_condition": 33614084.08040741, + "lr": 0.000759013504686565, + "time_sec": 49.65048050880432 + }, + { + "epoch": 50, + "train_loss": 2.238395141143799, + "train_acc": 0.40952, + "test_loss": 7.636728004455566, + "test_acc": 0.0642, + "lyapunov": null, + "grad_norm": 0.6646450225062208, + "grad_max_sv": 0.23055841773748398, + "grad_min_sv": 1.2360750140105737e-08, + "grad_condition": 29243478.728895236, + "lr": 0.0007499999999999998, + "time_sec": 49.64303922653198 + }, + { + "epoch": 51, + "train_loss": 2.22945908203125, + "train_acc": 0.40844, + "test_loss": 6.013677481079101, + "test_acc": 0.0746, + "lyapunov": null, + "grad_norm": 0.6654733307343168, + "grad_max_sv": 0.23596662729978563, + "grad_min_sv": 1.2487093845048314e-08, + "grad_condition": 24754111.81759522, + "lr": 0.0007408768370508575, + "time_sec": 49.64409947395325 + }, + { + "epoch": 52, + "train_loss": 2.2170784504699705, + "train_acc": 0.40908, + "test_loss": 6.157418632507325, + "test_acc": 0.0702, + "lyapunov": null, + "grad_norm": 0.6594175681266546, + "grad_max_sv": 0.2355981681495905, + "grad_min_sv": 1.236185071251672e-08, + "grad_condition": 25757058.499904532, + "lr": 0.0007316480175599307, + "time_sec": 49.636614084243774 + }, + { + "epoch": 53, + "train_loss": 2.1939515002059937, + "train_acc": 0.41558, + "test_loss": 6.859078231048584, + "test_acc": 0.0569, + "lyapunov": null, + "grad_norm": 0.662946169812431, + "grad_max_sv": 0.23508151918649672, + "grad_min_sv": 1.2330145124361813e-08, + "grad_condition": 32594540.125570327, + "lr": 0.0007223175895924635, + "time_sec": 49.70306444168091 + }, + { + "epoch": 54, + "train_loss": 2.1878874357604983, + "train_acc": 0.41686, + "test_loss": 6.514185330963135, + "test_acc": 0.0579, + "lyapunov": null, + "grad_norm": 0.6592013207620988, + "grad_max_sv": 0.23284565843641758, + "grad_min_sv": 1.246490098361086e-08, + "grad_condition": 21669360.08749289, + "lr": 0.0007128896457825361, + "time_sec": 49.62425947189331 + }, + { + "epoch": 55, + "train_loss": 2.1700433895111084, + "train_acc": 0.42082, + "test_loss": 7.349776064300537, + "test_acc": 0.0557, + "lyapunov": null, + "grad_norm": 0.6591415320918335, + "grad_max_sv": 0.23167332261800766, + "grad_min_sv": 1.2205207861396006e-08, + "grad_condition": 238494592.31476593, + "lr": 0.0007033683215378998, + "time_sec": 49.62825536727905 + }, + { + "epoch": 56, + "train_loss": 2.153282830657959, + "train_acc": 0.4221, + "test_loss": 6.606533212280273, + "test_acc": 0.0616, + "lyapunov": null, + "grad_norm": 0.6581126496222481, + "grad_max_sv": 0.22157299481332302, + "grad_min_sv": 1.218345958564626e-08, + "grad_condition": 21160581.40499527, + "lr": 0.0006937577932260512, + "time_sec": 49.614638328552246 + }, + { + "epoch": 57, + "train_loss": 2.1483337621307372, + "train_acc": 0.42194, + "test_loss": 8.756062689208985, + "test_acc": 0.0525, + "lyapunov": null, + "grad_norm": 0.655149621093074, + "grad_max_sv": 0.23063393794000148, + "grad_min_sv": 1.2325510248545334e-08, + "grad_condition": 32561576.294376243, + "lr": 0.0006840622763423388, + "time_sec": 49.604514598846436 + }, + { + "epoch": 58, + "train_loss": 2.13039572971344, + "train_acc": 0.428, + "test_loss": 6.102099295043946, + "test_acc": 0.077, + "lyapunov": null, + "grad_norm": 0.6579204722244499, + "grad_max_sv": 0.22870929054915906, + "grad_min_sv": 1.2437226873385221e-08, + "grad_condition": 29029893.441014826, + "lr": 0.0006742860236609073, + "time_sec": 49.63142991065979 + }, + { + "epoch": 59, + "train_loss": 2.1072697998809815, + "train_acc": 0.4333, + "test_loss": 6.253016600799561, + "test_acc": 0.0479, + "lyapunov": null, + "grad_norm": 0.6541760692934044, + "grad_max_sv": 0.22985584288835526, + "grad_min_sv": 1.2442094027981244e-08, + "grad_condition": 231036397.09788594, + "lr": 0.0006644333233692913, + "time_sec": 49.64534831047058 + }, + { + "epoch": 60, + "train_loss": 2.1020205306243898, + "train_acc": 0.43472, + "test_loss": 5.772405567932129, + "test_acc": 0.0592, + "lyapunov": null, + "grad_norm": 0.6527505369999154, + "grad_max_sv": 0.22004029378294945, + "grad_min_sv": 1.217291406285792e-08, + "grad_condition": 24874942.26037088, + "lr": 0.0006545084971874734, + "time_sec": 49.647597312927246 + }, + { + "epoch": 61, + "train_loss": 2.0730964871215822, + "train_acc": 0.4414, + "test_loss": 7.9832359893798825, + "test_acc": 0.0641, + "lyapunov": null, + "grad_norm": 0.6546297418175855, + "grad_max_sv": 0.223886064812541, + "grad_min_sv": 1.2451116643275028e-08, + "grad_condition": 22916995.636865757, + "lr": 0.0006445158984722354, + "time_sec": 49.65083956718445 + }, + { + "epoch": 62, + "train_loss": 2.062996348876953, + "train_acc": 0.4436, + "test_loss": 7.34946787109375, + "test_acc": 0.044, + "lyapunov": null, + "grad_norm": 0.6483177973397803, + "grad_max_sv": 0.22704768665134906, + "grad_min_sv": 1.20682398005445e-08, + "grad_condition": 38390561.96495845, + "lr": 0.0006344599103076324, + "time_sec": 49.65266275405884 + }, + { + "epoch": 63, + "train_loss": 2.0523825840759278, + "train_acc": 0.44564, + "test_loss": 8.959309451293946, + "test_acc": 0.0413, + "lyapunov": null, + "grad_norm": 0.6488732278425234, + "grad_max_sv": 0.22664117477834225, + "grad_min_sv": 1.2159747242446172e-08, + "grad_condition": 31006507.26126058, + "lr": 0.0006243449435824269, + "time_sec": 49.65293788909912 + }, + { + "epoch": 64, + "train_loss": 2.0479974696350096, + "train_acc": 0.44714, + "test_loss": 8.05115908203125, + "test_acc": 0.0537, + "lyapunov": null, + "grad_norm": 0.6455494446410326, + "grad_max_sv": 0.2193945564329624, + "grad_min_sv": 1.2038907266117942e-08, + "grad_condition": 901694346.4545784, + "lr": 0.0006141754350553275, + "time_sec": 49.64103627204895 + }, + { + "epoch": 65, + "train_loss": 2.027272645950317, + "train_acc": 0.45036, + "test_loss": 8.782285342407226, + "test_acc": 0.0554, + "lyapunov": null, + "grad_norm": 0.6482083158352888, + "grad_max_sv": 0.2296803079545498, + "grad_min_sv": 1.2045603877547384e-08, + "grad_condition": 44744302.33572485, + "lr": 0.0006039558454088793, + "time_sec": 49.62383842468262 + }, + { + "epoch": 66, + "train_loss": 2.012310220794678, + "train_acc": 0.4561, + "test_loss": 8.360753945922852, + "test_acc": 0.0486, + "lyapunov": null, + "grad_norm": 0.6486341651257033, + "grad_max_sv": 0.21999806091189383, + "grad_min_sv": 1.2103176813549332e-08, + "grad_condition": 25365047.453725625, + "lr": 0.000593690657292862, + "time_sec": 49.620052099227905 + }, + { + "epoch": 67, + "train_loss": 2.2251435960388184, + "train_acc": 0.43342, + "test_loss": 4.351189101409912, + "test_acc": 0.0583, + "lyapunov": null, + "grad_norm": 0.6822841692183329, + "grad_max_sv": 0.23429610803723336, + "grad_min_sv": 1.2533971320831828e-08, + "grad_condition": 620776564.7686789, + "lr": 0.0005833843733580507, + "time_sec": 49.6039252281189 + }, + { + "epoch": 68, + "train_loss": 3.644752220916748, + "train_acc": 0.14882, + "test_loss": 4.446993719482422, + "test_acc": 0.1036, + "lyapunov": null, + "grad_norm": 0.5322357731359522, + "grad_max_sv": 0.1740941284224391, + "grad_min_sv": 9.981525750379916e-09, + "grad_condition": 19772886.771588072, + "lr": 0.0005730415142812054, + "time_sec": 49.6299045085907 + }, + { + "epoch": 69, + "train_loss": 3.1906630830383302, + "train_acc": 0.22138, + "test_loss": 4.447753040695191, + "test_acc": 0.1086, + "lyapunov": null, + "grad_norm": 0.5849582495428348, + "grad_max_sv": 0.19428364057093858, + "grad_min_sv": 1.0978856412879878e-08, + "grad_condition": 20893419.13528825, + "lr": 0.0005626666167821517, + "time_sec": 49.62305164337158 + }, + { + "epoch": 70, + "train_loss": 2.9685875498962404, + "train_acc": 0.26182, + "test_loss": 5.079945266723633, + "test_acc": 0.1082, + "lyapunov": null, + "grad_norm": 0.5988082474018407, + "grad_max_sv": 0.20677474029362203, + "grad_min_sv": 1.1152884460408074e-08, + "grad_condition": 28125873.10543083, + "lr": 0.0005522642316338265, + "time_sec": 49.63573360443115 + }, + { + "epoch": 71, + "train_loss": 2.8187981507110598, + "train_acc": 0.29056, + "test_loss": 5.128676221466065, + "test_acc": 0.1097, + "lyapunov": null, + "grad_norm": 0.6073589396586558, + "grad_max_sv": 0.19603765942156315, + "grad_min_sv": 1.1142021388854673e-08, + "grad_condition": 23682104.838631887, + "lr": 0.0005418389216661573, + "time_sec": 49.65342855453491 + }, + { + "epoch": 72, + "train_loss": 2.7264524671173094, + "train_acc": 0.30584, + "test_loss": 4.905041383361817, + "test_acc": 0.1255, + "lyapunov": null, + "grad_norm": 0.6147190521685049, + "grad_max_sv": 0.20450513996183872, + "grad_min_sv": 1.1536205649087527e-08, + "grad_condition": 28562481.748963058, + "lr": 0.0005313952597646563, + "time_sec": 49.65431094169617 + }, + { + "epoch": 73, + "train_loss": 2.6403448142242434, + "train_acc": 0.32094, + "test_loss": 5.800853311538696, + "test_acc": 0.107, + "lyapunov": null, + "grad_norm": 0.6247716864218055, + "grad_max_sv": 0.21473125889897346, + "grad_min_sv": 1.1889953104027295e-08, + "grad_condition": 65722876.53475368, + "lr": 0.0005209378268645994, + "time_sec": 49.64467167854309 + }, + { + "epoch": 74, + "train_loss": 2.5647068825531005, + "train_acc": 0.33604, + "test_loss": 6.016946387481689, + "test_acc": 0.1108, + "lyapunov": null, + "grad_norm": 0.6262187013652493, + "grad_max_sv": 0.21014209054410457, + "grad_min_sv": 1.1593367979512159e-08, + "grad_condition": 23978185.39414488, + "lr": 0.0005104712099416781, + "time_sec": 49.635523080825806 + }, + { + "epoch": 75, + "train_loss": 2.5212148859405517, + "train_acc": 0.34632, + "test_loss": 6.316108853149414, + "test_acc": 0.1027, + "lyapunov": null, + "grad_norm": 0.6347754908556336, + "grad_max_sv": 0.21141788363456726, + "grad_min_sv": 1.179611141682857e-08, + "grad_condition": 33522616.12577144, + "lr": 0.0004999999999999996, + "time_sec": 49.63302993774414 + }, + { + "epoch": 76, + "train_loss": 2.470890021209717, + "train_acc": 0.35636, + "test_loss": 6.3965694896698, + "test_acc": 0.106, + "lyapunov": null, + "grad_norm": 0.6330916660078362, + "grad_max_sv": 0.21149154454469682, + "grad_min_sv": 1.186264902419687e-08, + "grad_condition": 78784632.22578731, + "lr": 0.0004895287900583212, + "time_sec": 49.637208223342896 + }, + { + "epoch": 77, + "train_loss": 2.421552244262695, + "train_acc": 0.36788, + "test_loss": 6.69319435043335, + "test_acc": 0.1017, + "lyapunov": null, + "grad_norm": 0.634293677395214, + "grad_max_sv": 0.2066604733467102, + "grad_min_sv": 1.1785100880942756e-08, + "grad_condition": 59189077.883828625, + "lr": 0.0004790621731353997, + "time_sec": 49.63215613365173 + }, + { + "epoch": 78, + "train_loss": 2.3847443492126463, + "train_acc": 0.37546, + "test_loss": 7.132302479934692, + "test_acc": 0.0943, + "lyapunov": null, + "grad_norm": 0.6382190364657672, + "grad_max_sv": 0.20905729271471502, + "grad_min_sv": 1.1757649508170598e-08, + "grad_condition": 26167748.83618117, + "lr": 0.000468604740235343, + "time_sec": 49.61492323875427 + }, + { + "epoch": 79, + "train_loss": 2.3435024488830565, + "train_acc": 0.38554, + "test_loss": 7.740195120239258, + "test_acc": 0.0916, + "lyapunov": null, + "grad_norm": 0.6365390593800095, + "grad_max_sv": 0.214980835467577, + "grad_min_sv": 1.20849943802126e-08, + "grad_condition": 26878255.479230188, + "lr": 0.00045816107833384175, + "time_sec": 49.625444412231445 + }, + { + "epoch": 80, + "train_loss": 2.3083001178741456, + "train_acc": 0.39014, + "test_loss": 6.61783053894043, + "test_acc": 0.1104, + "lyapunov": null, + "grad_norm": 0.6406625014101909, + "grad_max_sv": 0.21362034603953362, + "grad_min_sv": 1.2048267306052906e-08, + "grad_condition": 20392384.690080393, + "lr": 0.0004477357683661729, + "time_sec": 49.60279703140259 + }, + { + "epoch": 81, + "train_loss": 2.2839368876647947, + "train_acc": 0.39676, + "test_loss": 6.873206716918945, + "test_acc": 0.1118, + "lyapunov": null, + "grad_norm": 0.640888071388829, + "grad_max_sv": 0.21525344289839268, + "grad_min_sv": 1.1972712192151457e-08, + "grad_condition": 50063258.30804229, + "lr": 0.00043733338321784746, + "time_sec": 49.61454939842224 + }, + { + "epoch": 82, + "train_loss": 2.256084364776611, + "train_acc": 0.40168, + "test_loss": 8.169263735961914, + "test_acc": 0.0948, + "lyapunov": null, + "grad_norm": 0.6434003244484818, + "grad_max_sv": 0.21655187159776687, + "grad_min_sv": 1.23490741438248e-08, + "grad_condition": 21577781.507507768, + "lr": 0.0004269584857187939, + "time_sec": 49.62588882446289 + }, + { + "epoch": 83, + "train_loss": 2.2249307306671144, + "train_acc": 0.40856, + "test_loss": 7.893931579589844, + "test_acc": 0.1041, + "lyapunov": null, + "grad_norm": 0.6443153342631529, + "grad_max_sv": 0.2138610877096653, + "grad_min_sv": 1.1779399097799904e-08, + "grad_condition": 37321529.4476779, + "lr": 0.0004166156266419484, + "time_sec": 49.63660502433777 + }, + { + "epoch": 84, + "train_loss": 2.208123627166748, + "train_acc": 0.4104, + "test_loss": 7.499340794372559, + "test_acc": 0.104, + "lyapunov": null, + "grad_norm": 0.6478863121733859, + "grad_max_sv": 0.21281871050596238, + "grad_min_sv": 1.2020403913903798e-08, + "grad_condition": 28996288.04674848, + "lr": 0.0004063093427071373, + "time_sec": 49.6533477306366 + }, + { + "epoch": 85, + "train_loss": 2.187458460845947, + "train_acc": 0.41414, + "test_loss": 7.118385442352295, + "test_acc": 0.1033, + "lyapunov": null, + "grad_norm": 0.6504270947812989, + "grad_max_sv": 0.22195289880037308, + "grad_min_sv": 1.2075933084054746e-08, + "grad_condition": 35680632.041642115, + "lr": 0.0003960441545911199, + "time_sec": 49.64801740646362 + }, + { + "epoch": 86, + "train_loss": 2.16914088722229, + "train_acc": 0.41866, + "test_loss": 8.384735362243653, + "test_acc": 0.0929, + "lyapunov": null, + "grad_norm": 0.6545464063385937, + "grad_max_sv": 0.22763431407511234, + "grad_min_sv": 1.2551986523431924e-08, + "grad_condition": 55796762.73182211, + "lr": 0.0003858245649446718, + "time_sec": 49.66041612625122 + }, + { + "epoch": 87, + "train_loss": 2.1368742782592776, + "train_acc": 0.42592, + "test_loss": 6.581503366088867, + "test_acc": 0.1232, + "lyapunov": null, + "grad_norm": 0.6536380667194897, + "grad_max_sv": 0.2278426967561245, + "grad_min_sv": 1.2359256434946175e-08, + "grad_condition": 24353654.705191635, + "lr": 0.00037565505641757235, + "time_sec": 49.66181540489197 + }, + { + "epoch": 88, + "train_loss": 2.1224456649780272, + "train_acc": 0.4304, + "test_loss": 7.7792722061157225, + "test_acc": 0.1034, + "lyapunov": null, + "grad_norm": 0.6522543248368956, + "grad_max_sv": 0.21917447336018087, + "grad_min_sv": 1.2232303508996622e-08, + "grad_condition": 23923683.00683912, + "lr": 0.00036554008969236695, + "time_sec": 49.64878726005554 + }, + { + "epoch": 89, + "train_loss": 2.099866188964844, + "train_acc": 0.4329, + "test_loss": 7.891568328857422, + "test_acc": 0.0965, + "lyapunov": null, + "grad_norm": 0.6502507826061058, + "grad_max_sv": 0.2151956543326378, + "grad_min_sv": 1.197734313118648e-08, + "grad_condition": 22524026.625488658, + "lr": 0.0003554841015277638, + "time_sec": 49.636536598205566 + }, + { + "epoch": 90, + "train_loss": 2.0865442153167724, + "train_acc": 0.43664, + "test_loss": 7.531399671936035, + "test_acc": 0.106, + "lyapunov": null, + "grad_norm": 0.6569777082536814, + "grad_max_sv": 0.2229558028280735, + "grad_min_sv": 1.218858882712226e-08, + "grad_condition": 23258750.132011104, + "lr": 0.000345491502812526, + "time_sec": 49.61567449569702 + }, + { + "epoch": 91, + "train_loss": 2.06498106628418, + "train_acc": 0.44214, + "test_loss": 8.12637159576416, + "test_acc": 0.0982, + "lyapunov": null, + "grad_norm": 0.6551117087544674, + "grad_max_sv": 0.2304719265550375, + "grad_min_sv": 1.2402068626238271e-08, + "grad_condition": 26484691.211153176, + "lr": 0.0003355666766307081, + "time_sec": 49.61532545089722 + }, + { + "epoch": 92, + "train_loss": 2.05007131362915, + "train_acc": 0.44468, + "test_loss": 8.683588043212891, + "test_acc": 0.0875, + "lyapunov": null, + "grad_norm": 0.6572758654097208, + "grad_max_sv": 0.2220118623226881, + "grad_min_sv": 1.228345688220056e-08, + "grad_condition": 43719860.633667246, + "lr": 0.00032571397633909225, + "time_sec": 49.61735486984253 + }, + { + "epoch": 93, + "train_loss": 2.0329663645935057, + "train_acc": 0.44968, + "test_loss": 8.036752981567382, + "test_acc": 0.0946, + "lyapunov": null, + "grad_norm": 0.6594762151865757, + "grad_max_sv": 0.23468641191720963, + "grad_min_sv": 1.2702623283789016e-08, + "grad_condition": 22758035.70513925, + "lr": 0.00031593772365766094, + "time_sec": 49.594003438949585 + }, + { + "epoch": 94, + "train_loss": 2.015877328491211, + "train_acc": 0.45332, + "test_loss": 6.995108350372314, + "test_acc": 0.1074, + "lyapunov": null, + "grad_norm": 0.652167332688343, + "grad_max_sv": 0.21848529055714608, + "grad_min_sv": 1.2157653033612048e-08, + "grad_condition": 31954927.567971922, + "lr": 0.0003062422067739483, + "time_sec": 49.64247727394104 + }, + { + "epoch": 95, + "train_loss": 1.9991163059997559, + "train_acc": 0.45638, + "test_loss": 7.588622467803955, + "test_acc": 0.1142, + "lyapunov": null, + "grad_norm": 0.6621803475520015, + "grad_max_sv": 0.21934038177132606, + "grad_min_sv": 1.2358172536697243e-08, + "grad_condition": 24385893.04871109, + "lr": 0.00029663167846209965, + "time_sec": 49.63428497314453 + }, + { + "epoch": 96, + "train_loss": 1.9834483330917358, + "train_acc": 0.45752, + "test_loss": 7.558978903198242, + "test_acc": 0.1094, + "lyapunov": null, + "grad_norm": 0.6668846817868389, + "grad_max_sv": 0.21797076910734176, + "grad_min_sv": 1.225281484884544e-08, + "grad_condition": 22333814.982193254, + "lr": 0.00028711035421746345, + "time_sec": 49.63755655288696 + }, + { + "epoch": 97, + "train_loss": 1.969242282485962, + "train_acc": 0.46376, + "test_loss": 7.394112825012207, + "test_acc": 0.1099, + "lyapunov": null, + "grad_norm": 0.6554699630149605, + "grad_max_sv": 0.2301444172859192, + "grad_min_sv": 1.2433391152755214e-08, + "grad_condition": 24491819.03636659, + "lr": 0.00027768241040753615, + "time_sec": 49.655335903167725 + }, + { + "epoch": 98, + "train_loss": 1.9529696557617187, + "train_acc": 0.46774, + "test_loss": 7.055284997558593, + "test_acc": 0.1162, + "lyapunov": null, + "grad_norm": 0.6640537000345971, + "grad_max_sv": 0.22325844801962375, + "grad_min_sv": 1.2163324900060778e-08, + "grad_condition": 52648989.07312742, + "lr": 0.00026835198244006903, + "time_sec": 49.669140100479126 + }, + { + "epoch": 99, + "train_loss": 1.939459365234375, + "train_acc": 0.46992, + "test_loss": 7.755525547790527, + "test_acc": 0.1106, + "lyapunov": null, + "grad_norm": 0.6598990438805343, + "grad_max_sv": 0.23020310550928116, + "grad_min_sv": 1.2323512080247845e-08, + "grad_condition": 26539045.73575706, + "lr": 0.0002591231629491421, + "time_sec": 49.658100605010986 + }, + { + "epoch": 100, + "train_loss": 1.9241277764892577, + "train_acc": 0.47272, + "test_loss": 6.962932342529297, + "test_acc": 0.1245, + "lyapunov": null, + "grad_norm": 0.6566318375145326, + "grad_max_sv": 0.228052269667387, + "grad_min_sv": 1.2546390118495231e-08, + "grad_condition": 21651299.709478803, + "lr": 0.0002499999999999997, + "time_sec": 49.63715100288391 + }, + { + "epoch": 101, + "train_loss": 1.9074506490325929, + "train_acc": 0.47786, + "test_loss": 7.837496071624756, + "test_acc": 0.1147, + "lyapunov": null, + "grad_norm": 0.6602483696560503, + "grad_max_sv": 0.2316434532403946, + "grad_min_sv": 1.2379145530871938e-08, + "grad_condition": 26011010.493026, + "lr": 0.00024098649531343477, + "time_sec": 49.64603877067566 + }, + { + "epoch": 102, + "train_loss": 1.8926145942687989, + "train_acc": 0.48072, + "test_loss": 8.698235131835938, + "test_acc": 0.0935, + "lyapunov": null, + "grad_norm": 0.6633351574173826, + "grad_max_sv": 0.22496680207550526, + "grad_min_sv": 1.2393885331918319e-08, + "grad_condition": 62142872.25343563, + "lr": 0.0002320866025105016, + "time_sec": 49.613752126693726 + }, + { + "epoch": 103, + "train_loss": 1.8847379415130616, + "train_acc": 0.48146, + "test_loss": 8.400778024291991, + "test_acc": 0.1064, + "lyapunov": null, + "grad_norm": 0.6628163988108642, + "grad_max_sv": 0.2389563336968422, + "grad_min_sv": 1.2502011579674024e-08, + "grad_condition": 561960509.0407003, + "lr": 0.0002233042253783278, + "time_sec": 49.64220905303955 + }, + { + "epoch": 104, + "train_loss": 1.864337573890686, + "train_acc": 0.48388, + "test_loss": 7.582353992080688, + "test_acc": 0.1105, + "lyapunov": null, + "grad_norm": 0.6662860681196462, + "grad_max_sv": 0.2305597063153982, + "grad_min_sv": 1.2549438151154835e-08, + "grad_condition": 28749280.670694787, + "lr": 0.000214643216157784, + "time_sec": 49.59931921958923 + }, + { + "epoch": 105, + "train_loss": 1.8436736141586303, + "train_acc": 0.49176, + "test_loss": 7.296687260437012, + "test_acc": 0.1222, + "lyapunov": null, + "grad_norm": 0.6651015349952935, + "grad_max_sv": 0.22770841754972934, + "grad_min_sv": 1.2484767888520238e-08, + "grad_condition": 223685448.9202466, + "lr": 0.00020610737385376332, + "time_sec": 49.59563899040222 + }, + { + "epoch": 106, + "train_loss": 1.841442982711792, + "train_acc": 0.49332, + "test_loss": 8.086389836120606, + "test_acc": 0.1055, + "lyapunov": null, + "grad_norm": 0.6642212770974275, + "grad_max_sv": 0.23377629406750203, + "grad_min_sv": 1.239430658661611e-08, + "grad_condition": 25560457.467378292, + "lr": 0.00019770044256881242, + "time_sec": 49.633612394332886 + }, + { + "epoch": 107, + "train_loss": 1.8276642670440675, + "train_acc": 0.49872, + "test_loss": 8.12283078918457, + "test_acc": 0.1035, + "lyapunov": null, + "grad_norm": 0.6635032674607848, + "grad_max_sv": 0.22688985653221608, + "grad_min_sv": 1.237523354902237e-08, + "grad_condition": 25808230.55779849, + "lr": 0.0001894261098608447, + "time_sec": 49.63720369338989 + }, + { + "epoch": 108, + "train_loss": 1.8169137536621094, + "train_acc": 0.49852, + "test_loss": 8.409533373260498, + "test_acc": 0.0987, + "lyapunov": null, + "grad_norm": 0.6667541497565868, + "grad_max_sv": 0.22939535826444626, + "grad_min_sv": 1.2364147994672892e-08, + "grad_condition": 124450338.46619192, + "lr": 0.000181288005125655, + "time_sec": 49.650787591934204 + }, + { + "epoch": 109, + "train_loss": 1.7991494818115235, + "train_acc": 0.50362, + "test_loss": 7.646248370361328, + "test_acc": 0.1117, + "lyapunov": null, + "grad_norm": 0.6718663681176132, + "grad_max_sv": 0.22661731615662575, + "grad_min_sv": 1.2321765009010166e-08, + "grad_condition": 38880987.41150442, + "lr": 0.0001732896980049473, + "time_sec": 49.649791955947876 + }, + { + "epoch": 110, + "train_loss": 1.8055472195053102, + "train_acc": 0.5002, + "test_loss": 7.981080414581299, + "test_acc": 0.1032, + "lyapunov": null, + "grad_norm": 0.66872350270792, + "grad_max_sv": 0.22803995087742807, + "grad_min_sv": 1.2362955611371421e-08, + "grad_condition": 262033827.92100912, + "lr": 0.00016543469682057076, + "time_sec": 49.647390365600586 + }, + { + "epoch": 111, + "train_loss": 1.7805239984130858, + "train_acc": 0.50612, + "test_loss": 8.953764317321777, + "test_acc": 0.098, + "lyapunov": null, + "grad_norm": 0.673049303663611, + "grad_max_sv": 0.23256770558655263, + "grad_min_sv": 1.2522076875409738e-08, + "grad_condition": 79448628.08930221, + "lr": 0.00015772644703565552, + "time_sec": 49.64419651031494 + }, + { + "epoch": 112, + "train_loss": 1.7635594388580322, + "train_acc": 0.51178, + "test_loss": 9.006199928283692, + "test_acc": 0.0944, + "lyapunov": null, + "grad_norm": 0.6690577762179267, + "grad_max_sv": 0.231477802246809, + "grad_min_sv": 1.2611339457110904e-08, + "grad_condition": 74574181.95014855, + "lr": 0.00015016832974331713, + "time_sec": 49.6623969078064 + }, + { + "epoch": 113, + "train_loss": 1.7649991600799562, + "train_acc": 0.50992, + "test_loss": 8.706898388671876, + "test_acc": 0.0957, + "lyapunov": null, + "grad_norm": 0.6698910233260391, + "grad_max_sv": 0.24120958633720874, + "grad_min_sv": 1.2578526964457382e-08, + "grad_condition": 53483669.38925791, + "lr": 0.00014276366018359834, + "time_sec": 49.66872000694275 + }, + { + "epoch": 114, + "train_loss": 1.7550373428726196, + "train_acc": 0.51416, + "test_loss": 9.079370852661134, + "test_acc": 0.0946, + "lyapunov": null, + "grad_norm": 0.6663575459996698, + "grad_max_sv": 0.22731570713222027, + "grad_min_sv": 1.247297455250762e-08, + "grad_condition": 42511186.51551006, + "lr": 0.00013551568628929425, + "time_sec": 49.61651134490967 + }, + { + "epoch": 115, + "train_loss": 1.7389271509552002, + "train_acc": 0.51604, + "test_loss": 8.636061263275147, + "test_acc": 0.1024, + "lyapunov": null, + "grad_norm": 0.6736568214282298, + "grad_max_sv": 0.23145201802253723, + "grad_min_sv": 1.2523735046232608e-08, + "grad_condition": 34281489.67578278, + "lr": 0.00012842758726130276, + "time_sec": 49.587687492370605 + }, + { + "epoch": 116, + "train_loss": 1.73655320854187, + "train_acc": 0.51642, + "test_loss": 9.354261597442626, + "test_acc": 0.0971, + "lyapunov": null, + "grad_norm": 0.6692761494554511, + "grad_max_sv": 0.23360017724335194, + "grad_min_sv": 1.2428947707143757e-08, + "grad_condition": 42706933.20787396, + "lr": 0.0001215024721741218, + "time_sec": 49.61284112930298 + }, + { + "epoch": 117, + "train_loss": 1.722219416847229, + "train_acc": 0.52034, + "test_loss": 9.05172070465088, + "test_acc": 0.0864, + "lyapunov": null, + "grad_norm": 0.6709665811373348, + "grad_max_sv": 0.23329499438405038, + "grad_min_sv": 1.2499731633086597e-08, + "grad_condition": 23426718.363504913, + "lr": 0.00011474337861210538, + "time_sec": 49.612444162368774 + }, + { + "epoch": 118, + "train_loss": 1.720088274269104, + "train_acc": 0.5212, + "test_loss": 8.445899168395997, + "test_acc": 0.1071, + "lyapunov": null, + "grad_norm": 0.6772013084899083, + "grad_max_sv": 0.23568132370710373, + "grad_min_sv": 1.26266935157604e-08, + "grad_condition": 30951096.93160528, + "lr": 0.00010815327133708009, + "time_sec": 49.616597414016724 + }, + { + "epoch": 119, + "train_loss": 1.7100347495269776, + "train_acc": 0.52412, + "test_loss": 7.941069074249268, + "test_acc": 0.116, + "lyapunov": null, + "grad_norm": 0.6653971862031371, + "grad_max_sv": 0.23134685456752777, + "grad_min_sv": 1.2402505802922015e-08, + "grad_condition": 22810188.64319814, + "lr": 0.00010173504098790182, + "time_sec": 49.63788056373596 + }, + { + "epoch": 120, + "train_loss": 1.700667360534668, + "train_acc": 0.52674, + "test_loss": 9.192179844665528, + "test_acc": 0.0952, + "lyapunov": null, + "grad_norm": 0.67019495782139, + "grad_max_sv": 0.23498024754226207, + "grad_min_sv": 1.2522474526766025e-08, + "grad_condition": 25575812.55122325, + "lr": 9.549150281252629e-05, + "time_sec": 49.633721113204956 + }, + { + "epoch": 121, + "train_loss": 1.6934022713470458, + "train_acc": 0.52622, + "test_loss": 8.246514013671876, + "test_acc": 0.1052, + "lyapunov": null, + "grad_norm": 0.67264731502187, + "grad_max_sv": 0.23390924520790576, + "grad_min_sv": 1.2629734989083596e-08, + "grad_condition": 75127709.41882512, + "lr": 8.942539543314794e-05, + "time_sec": 49.658979177474976 + }, + { + "epoch": 122, + "train_loss": 1.6853880523681641, + "train_acc": 0.52858, + "test_loss": 8.835922454071046, + "test_acc": 0.1015, + "lyapunov": null, + "grad_norm": 0.6681915576498015, + "grad_max_sv": 0.22805486135184766, + "grad_min_sv": 1.2523601156111397e-08, + "grad_condition": 22825184.37456271, + "lr": 8.353937964495024e-05, + "time_sec": 49.645174980163574 + }, + { + "epoch": 123, + "train_loss": 1.6754656018447875, + "train_acc": 0.52996, + "test_loss": 8.766720679473877, + "test_acc": 0.0969, + "lyapunov": null, + "grad_norm": 0.6635381868278838, + "grad_max_sv": 0.23943961299955846, + "grad_min_sv": 1.2716584071870152e-08, + "grad_condition": 25094494.26316102, + "lr": 7.783603724899243e-05, + "time_sec": 49.64848589897156 + }, + { + "epoch": 124, + "train_loss": 1.6794914197158815, + "train_acc": 0.53018, + "test_loss": 8.580409744262695, + "test_acc": 0.1045, + "lyapunov": null, + "grad_norm": 0.671245577708117, + "grad_max_sv": 0.23060270808637143, + "grad_min_sv": 1.234503174199486e-08, + "grad_condition": 63345986.58758273, + "lr": 7.231786991974666e-05, + "time_sec": 49.87266302108765 + }, + { + "epoch": 125, + "train_loss": 1.6680570980834961, + "train_acc": 0.53182, + "test_loss": 8.834838022613525, + "test_acc": 0.1023, + "lyapunov": null, + "grad_norm": 0.6759384740097162, + "grad_max_sv": 0.23802748061716555, + "grad_min_sv": 1.276443843678532e-08, + "grad_condition": 24804650.245445848, + "lr": 6.698729810778072e-05, + "time_sec": 49.65100860595703 + }, + { + "epoch": 126, + "train_loss": 1.6599959258651733, + "train_acc": 0.53514, + "test_loss": 8.445849030303956, + "test_acc": 0.0993, + "lyapunov": null, + "grad_norm": 0.6683123713335807, + "grad_max_sv": 0.23196808211505413, + "grad_min_sv": 1.239824619359009e-08, + "grad_condition": 24122291.210029412, + "lr": 6.184665997806817e-05, + "time_sec": 49.60801029205322 + }, + { + "epoch": 127, + "train_loss": 1.6581390426254272, + "train_acc": 0.53286, + "test_loss": 8.180217957305908, + "test_acc": 0.1144, + "lyapunov": null, + "grad_norm": 0.671697720762431, + "grad_max_sv": 0.23852520175278186, + "grad_min_sv": 1.290384490787444e-08, + "grad_condition": 30505273.567765664, + "lr": 5.6898210384392595e-05, + "time_sec": 49.62530255317688 + }, + { + "epoch": 128, + "train_loss": 1.6536951416015624, + "train_acc": 0.53944, + "test_loss": 9.100402154541015, + "test_acc": 0.0967, + "lyapunov": null, + "grad_norm": 0.667185365414166, + "grad_max_sv": 0.2322216048836708, + "grad_min_sv": 1.2572321161918864e-08, + "grad_condition": 23830602.615603756, + "lr": 5.214411988029363e-05, + "time_sec": 49.59242367744446 + }, + { + "epoch": 129, + "train_loss": 1.6502027558135985, + "train_acc": 0.53564, + "test_loss": 8.243769989013671, + "test_acc": 0.1101, + "lyapunov": null, + "grad_norm": 0.6719880999378245, + "grad_max_sv": 0.23203521333634852, + "grad_min_sv": 1.2620684003428195e-08, + "grad_condition": 74978797.83799863, + "lr": 4.7586473766990294e-05, + "time_sec": 49.60294818878174 + }, + { + "epoch": 130, + "train_loss": 1.6536482720565795, + "train_acc": 0.53586, + "test_loss": 8.237010109710694, + "test_acc": 0.1067, + "lyapunov": null, + "grad_norm": 0.6804852067291551, + "grad_max_sv": 0.2377860952168703, + "grad_min_sv": 1.2762065921406718e-08, + "grad_condition": 39212371.63315557, + "lr": 4.32272711786996e-05, + "time_sec": 49.597888708114624 + }, + { + "epoch": 131, + "train_loss": 1.639038058242798, + "train_acc": 0.54146, + "test_loss": 8.44538454055786, + "test_acc": 0.1063, + "lyapunov": null, + "grad_norm": 0.6724835885199256, + "grad_max_sv": 0.2353504840284586, + "grad_min_sv": 1.2740010607581453e-08, + "grad_condition": 26983674.320896793, + "lr": 3.906842420574966e-05, + "time_sec": 49.665122509002686 + }, + { + "epoch": 132, + "train_loss": 1.6450230081176758, + "train_acc": 0.53788, + "test_loss": 8.850830727386475, + "test_acc": 0.1028, + "lyapunov": null, + "grad_norm": 0.6728968812754041, + "grad_max_sv": 0.2380696687847376, + "grad_min_sv": 1.2689633881700357e-08, + "grad_condition": 85473852.69328196, + "lr": 3.5111757055874305e-05, + "time_sec": 49.62814116477966 + }, + { + "epoch": 133, + "train_loss": 1.6397483406066895, + "train_acc": 0.53942, + "test_loss": 8.841438789367675, + "test_acc": 0.0951, + "lyapunov": null, + "grad_norm": 0.6743180544065257, + "grad_max_sv": 0.23258159644901752, + "grad_min_sv": 1.2391172625816904e-08, + "grad_condition": 50130338.96886261, + "lr": 3.1359005254054254e-05, + "time_sec": 49.650676250457764 + }, + { + "epoch": 134, + "train_loss": 1.6300106893539428, + "train_acc": 0.54306, + "test_loss": 8.161712069702148, + "test_acc": 0.0977, + "lyapunov": null, + "grad_norm": 0.6697898119311428, + "grad_max_sv": 0.23791733495891093, + "grad_min_sv": 1.2599619581693533e-08, + "grad_condition": 33905362.44570724, + "lr": 2.7811814881259484e-05, + "time_sec": 49.678349018096924 + }, + { + "epoch": 135, + "train_loss": 1.6280161280059815, + "train_acc": 0.54206, + "test_loss": 8.8084473777771, + "test_acc": 0.099, + "lyapunov": null, + "grad_norm": 0.6685419282298722, + "grad_max_sv": 0.2294952504336834, + "grad_min_sv": 1.2453856032546007e-08, + "grad_condition": 28183066.52638216, + "lr": 2.4471741852423218e-05, + "time_sec": 49.63830757141113 + }, + { + "epoch": 136, + "train_loss": 1.6250385632324218, + "train_acc": 0.5424, + "test_loss": 9.245115556335449, + "test_acc": 0.0982, + "lyapunov": null, + "grad_norm": 0.673719312762165, + "grad_max_sv": 0.2436251524835825, + "grad_min_sv": 1.2834923374116514e-08, + "grad_condition": 22720217.479475908, + "lr": 2.1340251233966362e-05, + "time_sec": 49.68732476234436 + }, + { + "epoch": 137, + "train_loss": 1.6283387484741212, + "train_acc": 0.5456, + "test_loss": 8.400495840454102, + "test_acc": 0.1051, + "lyapunov": null, + "grad_norm": 0.6729648252425294, + "grad_max_sv": 0.228320786729455, + "grad_min_sv": 1.2201329287198082e-08, + "grad_condition": 29654367.28966447, + "lr": 1.8418716601170932e-05, + "time_sec": 49.65324902534485 + }, + { + "epoch": 138, + "train_loss": 1.6186187603378297, + "train_acc": 0.54454, + "test_loss": 8.544135133361817, + "test_acc": 0.1026, + "lyapunov": null, + "grad_norm": 0.6767335790557945, + "grad_max_sv": 0.24417912773787975, + "grad_min_sv": 1.2745562341653915e-08, + "grad_condition": 22462589.905390937, + "lr": 1.570841943568445e-05, + "time_sec": 49.62770223617554 + }, + { + "epoch": 139, + "train_loss": 1.614481148033142, + "train_acc": 0.54796, + "test_loss": 8.814221725463867, + "test_acc": 0.0977, + "lyapunov": null, + "grad_norm": 0.6703542181357327, + "grad_max_sv": 0.2325075563043356, + "grad_min_sv": 1.2578777475180657e-08, + "grad_condition": 21363698.231181078, + "lr": 1.3210548563419845e-05, + "time_sec": 49.592610120773315 + }, + { + "epoch": 140, + "train_loss": 1.6180111114883422, + "train_acc": 0.54492, + "test_loss": 8.483137963104248, + "test_acc": 0.1107, + "lyapunov": null, + "grad_norm": 0.6809540897117702, + "grad_max_sv": 0.2395390760153532, + "grad_min_sv": 1.2634957796686664e-08, + "grad_condition": 54098275.066982284, + "lr": 1.0926199633097203e-05, + "time_sec": 49.62364315986633 + }, + { + "epoch": 141, + "train_loss": 1.613265188369751, + "train_acc": 0.548, + "test_loss": 9.025719612884522, + "test_acc": 0.0959, + "lyapunov": null, + "grad_norm": 0.6738933430180942, + "grad_max_sv": 0.2385118592530489, + "grad_min_sv": 1.2675423211039316e-08, + "grad_condition": 24268524.45347375, + "lr": 8.856374635655688e-06, + "time_sec": 49.6093544960022 + }, + { + "epoch": 142, + "train_loss": 1.6109765142822265, + "train_acc": 0.54672, + "test_loss": 8.501644051361083, + "test_acc": 0.1071, + "lyapunov": null, + "grad_norm": 0.6688401906779454, + "grad_max_sv": 0.2420313537120819, + "grad_min_sv": 1.2541520851006016e-08, + "grad_condition": 34051323.70080558, + "lr": 7.001981464747503e-06, + "time_sec": 49.626237869262695 + }, + { + "epoch": 143, + "train_loss": 1.6083808990859985, + "train_acc": 0.5495, + "test_loss": 8.410878736114501, + "test_acc": 0.1029, + "lyapunov": null, + "grad_norm": 0.6694620190305317, + "grad_max_sv": 0.2360597461462021, + "grad_min_sv": 1.2411240957882486e-08, + "grad_condition": 256359120.1912489, + "lr": 5.3638335185058295e-06, + "time_sec": 49.64081525802612 + }, + { + "epoch": 144, + "train_loss": 1.6100667620468139, + "train_acc": 0.54798, + "test_loss": 8.832001342010498, + "test_acc": 0.1019, + "lyapunov": null, + "grad_norm": 0.6707738006928022, + "grad_max_sv": 0.23732503540813923, + "grad_min_sv": 1.258596476483298e-08, + "grad_condition": 24176116.650407396, + "lr": 3.942649342761114e-06, + "time_sec": 49.650325536727905 + }, + { + "epoch": 145, + "train_loss": 1.6037773385238647, + "train_acc": 0.54702, + "test_loss": 8.7359261428833, + "test_acc": 0.0989, + "lyapunov": null, + "grad_norm": 0.6690176163372957, + "grad_max_sv": 0.23970598317682743, + "grad_min_sv": 1.2538464763678369e-08, + "grad_condition": 33292646.116570044, + "lr": 2.7390523158633524e-06, + "time_sec": 49.64434027671814 + }, + { + "epoch": 146, + "train_loss": 1.6090083113098144, + "train_acc": 0.54738, + "test_loss": 8.776909831237793, + "test_acc": 0.1015, + "lyapunov": null, + "grad_norm": 0.6706150402911953, + "grad_max_sv": 0.2313551239669323, + "grad_min_sv": 1.2493580149597339e-08, + "grad_condition": 36814707.572352916, + "lr": 1.7535703752478133e-06, + "time_sec": 49.653162479400635 + }, + { + "epoch": 147, + "train_loss": 1.6126505808258056, + "train_acc": 0.54692, + "test_loss": 9.092076904296874, + "test_acc": 0.0975, + "lyapunov": null, + "grad_norm": 0.6703962324024396, + "grad_max_sv": 0.233590966463089, + "grad_min_sv": 1.2700339725724153e-08, + "grad_condition": 46904603.438913696, + "lr": 9.866357858642196e-07, + "time_sec": 49.64583897590637 + }, + { + "epoch": 148, + "train_loss": 1.6134785464096069, + "train_acc": 0.54594, + "test_loss": 8.983751535797118, + "test_acc": 0.0995, + "lyapunov": null, + "grad_norm": 0.674578489012928, + "grad_max_sv": 0.23970573469996453, + "grad_min_sv": 1.272608372571149e-08, + "grad_condition": 21842271.84696827, + "lr": 4.38584950570808e-07, + "time_sec": 49.64808487892151 + }, + { + "epoch": 149, + "train_loss": 1.6119013549423218, + "train_acc": 0.54862, + "test_loss": 8.56843572845459, + "test_acc": 0.1054, + "lyapunov": null, + "grad_norm": 0.6747520334683573, + "grad_max_sv": 0.2384514592587948, + "grad_min_sv": 1.2600235418935846e-08, + "grad_condition": 25340562.620727975, + "lr": 1.096582625772501e-07, + "time_sec": 49.64168334007263 + }, + { + "epoch": 150, + "train_loss": 1.6072704146957397, + "train_acc": 0.54742, + "test_loss": 8.887614213562012, + "test_acc": 0.1015, + "lyapunov": null, + "grad_norm": 0.6742776904392008, + "grad_max_sv": 0.24012672565877438, + "grad_min_sv": 1.2860058681840591e-08, + "grad_condition": 24539045.015578836, + "lr": 0.0, + "time_sec": 49.61355018615723 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 5.088581143493652, + "train_acc": 0.01332, + "test_loss": 4.951591259765625, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 5.595797699274781, + "grad_max_sv": 5.059777915477753, + "grad_min_sv": 8.380082079928463e-08, + "grad_condition": 144739678.32890567, + "lr": 0.0009998903417374227, + "time_sec": 66.76207876205444 + }, + { + "epoch": 2, + "train_loss": 4.727508141174316, + "train_acc": 0.0242, + "test_loss": 4.891763400268554, + "test_acc": 0.0104, + "lyapunov": null, + "grad_norm": 4.11050155163041, + "grad_max_sv": 3.698546850681305, + "grad_min_sv": 6.387429426490954e-08, + "grad_condition": 67471298.37535235, + "lr": 0.0009995614150494292, + "time_sec": 66.79832410812378 + }, + { + "epoch": 3, + "train_loss": 4.516627143707275, + "train_acc": 0.03364, + "test_loss": 5.023839845275879, + "test_acc": 0.0096, + "lyapunov": null, + "grad_norm": 3.230804659530269, + "grad_max_sv": 2.737754541635513, + "grad_min_sv": 4.854583614544161e-08, + "grad_condition": 87922174.2345469, + "lr": 0.0009990133642141358, + "time_sec": 66.76044511795044 + }, + { + "epoch": 4, + "train_loss": 4.37137044631958, + "train_acc": 0.04084, + "test_loss": 5.107725936889649, + "test_acc": 0.0103, + "lyapunov": null, + "grad_norm": 2.5815981982320455, + "grad_max_sv": 2.1624936670064927, + "grad_min_sv": 3.8690102244220983e-08, + "grad_condition": 66775302.44012289, + "lr": 0.0009982464296247522, + "time_sec": 66.69986486434937 + }, + { + "epoch": 5, + "train_loss": 4.2787111569213865, + "train_acc": 0.0499, + "test_loss": 5.093746864318848, + "test_acc": 0.0119, + "lyapunov": null, + "grad_norm": 2.0501754928637608, + "grad_max_sv": 1.6735655426979066, + "grad_min_sv": 3.02018420605954e-08, + "grad_condition": 83847616.58229446, + "lr": 0.0009972609476841367, + "time_sec": 66.70642113685608 + }, + { + "epoch": 6, + "train_loss": 4.173126724395752, + "train_acc": 0.06114, + "test_loss": 5.650288801574707, + "test_acc": 0.0115, + "lyapunov": null, + "grad_norm": 1.4461755519297805, + "grad_max_sv": 1.029741930961609, + "grad_min_sv": 2.1617413775709693e-08, + "grad_condition": 53690503.75103078, + "lr": 0.000996057350657239, + "time_sec": 66.68753027915955 + }, + { + "epoch": 7, + "train_loss": 4.093725746765137, + "train_acc": 0.07048, + "test_loss": 5.236350575256347, + "test_acc": 0.0131, + "lyapunov": null, + "grad_norm": 1.104296817764675, + "grad_max_sv": 0.6810471951961518, + "grad_min_sv": 1.7525281126307134e-08, + "grad_condition": 46908594.94631828, + "lr": 0.000994636166481494, + "time_sec": 66.73089575767517 + }, + { + "epoch": 8, + "train_loss": 4.031361261062622, + "train_acc": 0.08184, + "test_loss": 5.266020038604736, + "test_acc": 0.011, + "lyapunov": null, + "grad_norm": 0.9907154687339563, + "grad_max_sv": 0.5727237299084663, + "grad_min_sv": 1.568161453573136e-08, + "grad_condition": 205087186.79278168, + "lr": 0.0009929980185352525, + "time_sec": 66.74000144004822 + }, + { + "epoch": 9, + "train_loss": 3.9836690045166017, + "train_acc": 0.08876, + "test_loss": 5.373385707092285, + "test_acc": 0.0145, + "lyapunov": null, + "grad_norm": 0.9286442561107239, + "grad_max_sv": 0.49140588417649267, + "grad_min_sv": 1.4355377359054344e-08, + "grad_condition": 49567929.749295376, + "lr": 0.0009911436253643444, + "time_sec": 66.75752806663513 + }, + { + "epoch": 10, + "train_loss": 3.9524392292785646, + "train_acc": 0.09442, + "test_loss": 5.648289218139649, + "test_acc": 0.011, + "lyapunov": null, + "grad_norm": 0.8635186549937055, + "grad_max_sv": 0.44110502675175667, + "grad_min_sv": 1.380239241649539e-08, + "grad_condition": 160205558.71937332, + "lr": 0.0009890738003669028, + "time_sec": 66.74852681159973 + }, + { + "epoch": 11, + "train_loss": 3.9057430783081055, + "train_acc": 0.09904, + "test_loss": 5.593870043945312, + "test_acc": 0.0153, + "lyapunov": null, + "grad_norm": 0.8313455134497171, + "grad_max_sv": 0.4245350927114487, + "grad_min_sv": 1.3408236181761123e-08, + "grad_condition": 70475775.54279244, + "lr": 0.00098678945143658, + "time_sec": 66.72569394111633 + }, + { + "epoch": 12, + "train_loss": 3.879755588531494, + "train_acc": 0.1059, + "test_loss": 5.91184571685791, + "test_acc": 0.0122, + "lyapunov": null, + "grad_norm": 0.8098343665002108, + "grad_max_sv": 0.3995117902755737, + "grad_min_sv": 1.3223197731335352e-08, + "grad_condition": 2262455188.632939, + "lr": 0.0009842915805643154, + "time_sec": 66.74134874343872 + }, + { + "epoch": 13, + "train_loss": 3.8387034120178223, + "train_acc": 0.11128, + "test_loss": 5.55406644744873, + "test_acc": 0.0159, + "lyapunov": null, + "grad_norm": 0.7779364983364899, + "grad_max_sv": 0.36580874100327493, + "grad_min_sv": 1.2747200656137991e-08, + "grad_condition": 31403290.857171714, + "lr": 0.000981581283398829, + "time_sec": 66.71355533599854 + }, + { + "epoch": 14, + "train_loss": 3.8182811224365234, + "train_acc": 0.11366, + "test_loss": 5.846968073272705, + "test_acc": 0.0132, + "lyapunov": null, + "grad_norm": 0.7545251260271086, + "grad_max_sv": 0.34809157326817514, + "grad_min_sv": 1.2320788722597342e-08, + "grad_condition": 32144212.47563106, + "lr": 0.0009786597487660333, + "time_sec": 66.72689533233643 + }, + { + "epoch": 15, + "train_loss": 3.7967992616271973, + "train_acc": 0.11852, + "test_loss": 5.68047932510376, + "test_acc": 0.0155, + "lyapunov": null, + "grad_norm": 0.731162073111203, + "grad_max_sv": 0.3421657994389534, + "grad_min_sv": 1.1936111505433944e-08, + "grad_condition": 244312799.4199868, + "lr": 0.0009755282581475766, + "time_sec": 66.7026903629303 + }, + { + "epoch": 16, + "train_loss": 3.7741379774475097, + "train_acc": 0.12086, + "test_loss": 5.484867942047119, + "test_acc": 0.0182, + "lyapunov": null, + "grad_norm": 0.7090304412758509, + "grad_max_sv": 0.3223520040512085, + "grad_min_sv": 1.1672073835233832e-08, + "grad_condition": 31524319.78711735, + "lr": 0.0009721881851187403, + "time_sec": 66.739328622818 + }, + { + "epoch": 17, + "train_loss": 3.753197032470703, + "train_acc": 0.1256, + "test_loss": 6.568574522399902, + "test_acc": 0.0151, + "lyapunov": null, + "grad_norm": 0.6935882502734273, + "grad_max_sv": 0.3146128565073013, + "grad_min_sv": 1.1361096601426174e-08, + "grad_condition": 210125774.08050695, + "lr": 0.0009686409947459456, + "time_sec": 66.74520659446716 + }, + { + "epoch": 18, + "train_loss": 3.725816408157349, + "train_acc": 0.1287, + "test_loss": 6.34478737487793, + "test_acc": 0.0159, + "lyapunov": null, + "grad_norm": 0.6758795184950354, + "grad_max_sv": 0.30437840037047864, + "grad_min_sv": 1.1510641159673262e-08, + "grad_condition": 31558341.74036485, + "lr": 0.0009648882429441254, + "time_sec": 66.78180265426636 + }, + { + "epoch": 19, + "train_loss": 3.714654729003906, + "train_acc": 0.13168, + "test_loss": 6.368891102600098, + "test_acc": 0.016, + "lyapunov": null, + "grad_norm": 0.6618910868321934, + "grad_max_sv": 0.2960255391895771, + "grad_min_sv": 1.1117618592404455e-08, + "grad_condition": 30205848.660664685, + "lr": 0.00096093157579425, + "time_sec": 66.74912786483765 + }, + { + "epoch": 20, + "train_loss": 3.6946691497802733, + "train_acc": 0.13396, + "test_loss": 6.4278502319335935, + "test_acc": 0.0196, + "lyapunov": null, + "grad_norm": 0.6443454538226331, + "grad_max_sv": 0.28263592235744, + "grad_min_sv": 1.0974601266297567e-08, + "grad_condition": 85210724.40585044, + "lr": 0.0009567727288213001, + "time_sec": 66.75979924201965 + }, + { + "epoch": 21, + "train_loss": 3.678538037261963, + "train_acc": 0.1389, + "test_loss": 5.944661869812012, + "test_acc": 0.0147, + "lyapunov": null, + "grad_norm": 0.6338793846375858, + "grad_max_sv": 0.2817647561430931, + "grad_min_sv": 1.0979779263564637e-08, + "grad_condition": 31384399.636330932, + "lr": 0.0009524135262330095, + "time_sec": 66.75862097740173 + }, + { + "epoch": 22, + "train_loss": 3.6583445849609375, + "train_acc": 0.1389, + "test_loss": 6.617507224273681, + "test_acc": 0.0186, + "lyapunov": null, + "grad_norm": 0.6270968339485256, + "grad_max_sv": 0.2682405423372984, + "grad_min_sv": 1.0661627264374474e-08, + "grad_condition": 28199289.108431924, + "lr": 0.0009478558801197061, + "time_sec": 66.70150375366211 + }, + { + "epoch": 23, + "train_loss": 3.646308810348511, + "train_acc": 0.14268, + "test_loss": 6.335385469818116, + "test_acc": 0.0149, + "lyapunov": null, + "grad_norm": 0.6088892694217577, + "grad_max_sv": 0.25535150058567524, + "grad_min_sv": 1.0300061187296095e-08, + "grad_condition": 34795287.59915707, + "lr": 0.000943101789615607, + "time_sec": 66.70925712585449 + }, + { + "epoch": 24, + "train_loss": 3.6351177741241454, + "train_acc": 0.1426, + "test_loss": 6.3158514701843265, + "test_acc": 0.0177, + "lyapunov": null, + "grad_norm": 0.5964648659799031, + "grad_max_sv": 0.24951178021728992, + "grad_min_sv": 1.0093550447537458e-08, + "grad_condition": 51838350.11107895, + "lr": 0.0009381533400219313, + "time_sec": 66.70350575447083 + }, + { + "epoch": 25, + "train_loss": 3.6183255680847166, + "train_acc": 0.14644, + "test_loss": 6.721168376159668, + "test_acc": 0.0181, + "lyapunov": null, + "grad_norm": 0.5933387221507487, + "grad_max_sv": 0.25210563503205774, + "grad_min_sv": 1.0153997685290878e-08, + "grad_condition": 247394984.04080305, + "lr": 0.0009330127018922189, + "time_sec": 66.75347089767456 + }, + { + "epoch": 26, + "train_loss": 3.6071299158477785, + "train_acc": 0.14866, + "test_loss": 6.642034001922608, + "test_acc": 0.0181, + "lyapunov": null, + "grad_norm": 0.5954282647789416, + "grad_max_sv": 0.2547519262880087, + "grad_min_sv": 1.0135606323680157e-08, + "grad_condition": 28483815.51624248, + "lr": 0.000927682130080253, + "time_sec": 66.75868964195251 + }, + { + "epoch": 27, + "train_loss": 3.5931669886779787, + "train_acc": 0.1502, + "test_loss": 6.223846574401856, + "test_acc": 0.0213, + "lyapunov": null, + "grad_norm": 0.5877941221593797, + "grad_max_sv": 0.24717812985181808, + "grad_min_sv": 9.855245958201308e-09, + "grad_condition": 28193359.09622656, + "lr": 0.0009221639627510072, + "time_sec": 66.77666926383972 + }, + { + "epoch": 28, + "train_loss": 3.5780224719238283, + "train_acc": 0.15286, + "test_loss": 6.90847115020752, + "test_acc": 0.0196, + "lyapunov": null, + "grad_norm": 0.5733930952654505, + "grad_max_sv": 0.2419151894748211, + "grad_min_sv": 9.843924880792442e-09, + "grad_condition": 28364870.16247251, + "lr": 0.0009164606203550494, + "time_sec": 66.74913716316223 + }, + { + "epoch": 29, + "train_loss": 3.573341248779297, + "train_acc": 0.15312, + "test_loss": 6.439982345581055, + "test_acc": 0.021, + "lyapunov": null, + "grad_norm": 0.5679699095868811, + "grad_max_sv": 0.2286886375397444, + "grad_min_sv": 9.63519248414757e-09, + "grad_condition": 29833754.648618333, + "lr": 0.0009105746045668516, + "time_sec": 66.7665946483612 + }, + { + "epoch": 30, + "train_loss": 3.5598143620300293, + "train_acc": 0.1562, + "test_loss": 6.429332733154297, + "test_acc": 0.022, + "lyapunov": null, + "grad_norm": 0.5589691788337113, + "grad_max_sv": 0.227083408087492, + "grad_min_sv": 9.709436735172439e-09, + "grad_condition": 27930931.211393736, + "lr": 0.0009045084971874733, + "time_sec": 66.75674724578857 + }, + { + "epoch": 31, + "train_loss": 3.5470434929656984, + "train_acc": 0.16, + "test_loss": 6.6052438804626465, + "test_acc": 0.0237, + "lyapunov": null, + "grad_norm": 0.5612591002612681, + "grad_max_sv": 0.22930745929479598, + "grad_min_sv": 9.687322477525128e-09, + "grad_condition": 27425333.623921502, + "lr": 0.0008982649590120977, + "time_sec": 66.71509528160095 + }, + { + "epoch": 32, + "train_loss": 3.537414684448242, + "train_acc": 0.16062, + "test_loss": 6.011712426757812, + "test_acc": 0.0244, + "lyapunov": null, + "grad_norm": 0.5564909883403706, + "grad_max_sv": 0.22170890271663665, + "grad_min_sv": 9.485011626120255e-09, + "grad_condition": 25722607.460985243, + "lr": 0.0008918467286629196, + "time_sec": 66.73007607460022 + }, + { + "epoch": 33, + "train_loss": 3.5317853105163572, + "train_acc": 0.1603, + "test_loss": 6.360434799194336, + "test_acc": 0.0189, + "lyapunov": null, + "grad_norm": 0.550433878030662, + "grad_max_sv": 0.2289751097559929, + "grad_min_sv": 9.54062134832928e-09, + "grad_condition": 381531522.893629, + "lr": 0.0008852566213878943, + "time_sec": 66.71780228614807 + }, + { + "epoch": 34, + "train_loss": 3.5253816675567626, + "train_acc": 0.16216, + "test_loss": 6.247197938537598, + "test_acc": 0.0221, + "lyapunov": null, + "grad_norm": 0.5426800931973276, + "grad_max_sv": 0.21441863812506198, + "grad_min_sv": 9.316700774752996e-09, + "grad_condition": 26950152.667612456, + "lr": 0.000878497527825878, + "time_sec": 66.72579026222229 + }, + { + "epoch": 35, + "train_loss": 3.502744727020264, + "train_acc": 0.16578, + "test_loss": 6.571361762237549, + "test_acc": 0.0212, + "lyapunov": null, + "grad_norm": 0.5398257014810475, + "grad_max_sv": 0.20931940749287606, + "grad_min_sv": 9.403711298539009e-09, + "grad_condition": 25780458.398535747, + "lr": 0.000871572412738697, + "time_sec": 66.74532318115234 + }, + { + "epoch": 36, + "train_loss": 3.5064585032653808, + "train_acc": 0.1655, + "test_loss": 6.218161656951905, + "test_acc": 0.0264, + "lyapunov": null, + "grad_norm": 0.5305975593103218, + "grad_max_sv": 0.20301839672029018, + "grad_min_sv": 9.261498659651757e-09, + "grad_condition": 24222820.24324985, + "lr": 0.0008644843137107055, + "time_sec": 66.7688057422638 + }, + { + "epoch": 37, + "train_loss": 3.4891217603302, + "train_acc": 0.16706, + "test_loss": 6.142190956115723, + "test_acc": 0.0211, + "lyapunov": null, + "grad_norm": 0.5317318651110877, + "grad_max_sv": 0.20387103594839573, + "grad_min_sv": 9.19414472749791e-09, + "grad_condition": 41748735.80026223, + "lr": 0.0008572363398164014, + "time_sec": 66.75609850883484 + }, + { + "epoch": 38, + "train_loss": 3.4776386444854737, + "train_acc": 0.17062, + "test_loss": 6.417214579772949, + "test_acc": 0.0205, + "lyapunov": null, + "grad_norm": 0.5236386972874332, + "grad_max_sv": 0.20101286694407464, + "grad_min_sv": 9.154465988037152e-09, + "grad_condition": 37634567.23075999, + "lr": 0.0008498316702566826, + "time_sec": 66.79052495956421 + }, + { + "epoch": 39, + "train_loss": 3.46743884765625, + "train_acc": 0.16932, + "test_loss": 5.726113172912598, + "test_acc": 0.0248, + "lyapunov": null, + "grad_norm": 0.5210988175669885, + "grad_max_sv": 0.19942357540130615, + "grad_min_sv": 8.937806597608677e-09, + "grad_condition": 49428217.19173406, + "lr": 0.0008422735529643442, + "time_sec": 66.74242496490479 + }, + { + "epoch": 40, + "train_loss": 3.451697437210083, + "train_acc": 0.17372, + "test_loss": 6.044572091674804, + "test_acc": 0.0225, + "lyapunov": null, + "grad_norm": 0.5170646983548032, + "grad_max_sv": 0.19684507846832275, + "grad_min_sv": 9.003056534485909e-09, + "grad_condition": 138977031.8076538, + "lr": 0.0008345653031794289, + "time_sec": 66.70748567581177 + }, + { + "epoch": 41, + "train_loss": 3.4474837628173827, + "train_acc": 0.17626, + "test_loss": 5.9893402641296385, + "test_acc": 0.0219, + "lyapunov": null, + "grad_norm": 0.5155937638119307, + "grad_max_sv": 0.19306579753756523, + "grad_min_sv": 8.943595689384076e-09, + "grad_condition": 75805302.28035732, + "lr": 0.0008267103019950526, + "time_sec": 66.69197702407837 + }, + { + "epoch": 42, + "train_loss": 3.4423429164123536, + "train_acc": 0.17422, + "test_loss": 5.739228091430664, + "test_acc": 0.0203, + "lyapunov": null, + "grad_norm": 0.5099978166539899, + "grad_max_sv": 0.1884769570082426, + "grad_min_sv": 8.939715143152505e-09, + "grad_condition": 24445550.576415405, + "lr": 0.0008187119948743447, + "time_sec": 66.70687818527222 + }, + { + "epoch": 43, + "train_loss": 3.4337082667541505, + "train_acc": 0.1755, + "test_loss": 5.964181529998779, + "test_acc": 0.0177, + "lyapunov": null, + "grad_norm": 0.5104491505466159, + "grad_max_sv": 0.19002889432013034, + "grad_min_sv": 9.048546927015178e-09, + "grad_condition": 102521993.69997685, + "lr": 0.000810573890139155, + "time_sec": 66.7257513999939 + }, + { + "epoch": 44, + "train_loss": 3.420871334762573, + "train_acc": 0.17948, + "test_loss": 5.929026190948487, + "test_acc": 0.0244, + "lyapunov": null, + "grad_norm": 0.5050154925488476, + "grad_max_sv": 0.18516961708664895, + "grad_min_sv": 8.980576357564551e-09, + "grad_condition": 24771047.136464976, + "lr": 0.0008022995574311873, + "time_sec": 66.74575066566467 + }, + { + "epoch": 45, + "train_loss": 3.4096126289367676, + "train_acc": 0.18164, + "test_loss": 5.663789749145508, + "test_acc": 0.0195, + "lyapunov": null, + "grad_norm": 0.5049903163352594, + "grad_max_sv": 0.18273597210645676, + "grad_min_sv": 8.972159917797207e-09, + "grad_condition": 23794424.428349543, + "lr": 0.0007938926261462363, + "time_sec": 66.7593412399292 + }, + { + "epoch": 46, + "train_loss": 3.410715911254883, + "train_acc": 0.1807, + "test_loss": 5.895871440124512, + "test_acc": 0.018, + "lyapunov": null, + "grad_norm": 0.5025553542851052, + "grad_max_sv": 0.1833956018090248, + "grad_min_sv": 8.830828140959924e-09, + "grad_condition": 30936751.6432406, + "lr": 0.0007853567838422158, + "time_sec": 66.75630521774292 + }, + { + "epoch": 47, + "train_loss": 3.4009066193389894, + "train_acc": 0.18276, + "test_loss": 6.028702513122559, + "test_acc": 0.0196, + "lyapunov": null, + "grad_norm": 0.5031283438960251, + "grad_max_sv": 0.1799595769494772, + "grad_min_sv": 8.917869195879114e-09, + "grad_condition": 23059530.36595428, + "lr": 0.0007766957746216719, + "time_sec": 66.75422596931458 + }, + { + "epoch": 48, + "train_loss": 3.390701540603638, + "train_acc": 0.18414, + "test_loss": 6.1965219741821285, + "test_acc": 0.0191, + "lyapunov": null, + "grad_norm": 0.4978643158932146, + "grad_max_sv": 0.1835469003766775, + "grad_min_sv": 8.827262552163485e-09, + "grad_condition": 51184664.832447655, + "lr": 0.0007679133974894982, + "time_sec": 66.75912022590637 + }, + { + "epoch": 49, + "train_loss": 3.3818662035369873, + "train_acc": 0.185, + "test_loss": 5.9103582473754885, + "test_acc": 0.0216, + "lyapunov": null, + "grad_norm": 0.49852008894363287, + "grad_max_sv": 0.18433105908334255, + "grad_min_sv": 8.89238179827001e-09, + "grad_condition": 40247674.29131043, + "lr": 0.000759013504686565, + "time_sec": 66.705406665802 + }, + { + "epoch": 50, + "train_loss": 3.3789881330871583, + "train_acc": 0.18412, + "test_loss": 6.037129666137695, + "test_acc": 0.0221, + "lyapunov": null, + "grad_norm": 0.49658079337268785, + "grad_max_sv": 0.179146596416831, + "grad_min_sv": 8.88557344369545e-09, + "grad_condition": 24117261.20845995, + "lr": 0.0007499999999999998, + "time_sec": 66.72649240493774 + }, + { + "epoch": 51, + "train_loss": 3.368231953201294, + "train_acc": 0.18852, + "test_loss": 5.9292546646118165, + "test_acc": 0.022, + "lyapunov": null, + "grad_norm": 0.4961366760585921, + "grad_max_sv": 0.17853211835026742, + "grad_min_sv": 8.978999294084744e-09, + "grad_condition": 23793132.034851797, + "lr": 0.0007408768370508575, + "time_sec": 66.72111701965332 + }, + { + "epoch": 52, + "train_loss": 3.3652955891418457, + "train_acc": 0.18696, + "test_loss": 6.321981049346924, + "test_acc": 0.0194, + "lyapunov": null, + "grad_norm": 0.492099764209841, + "grad_max_sv": 0.16977054849267006, + "grad_min_sv": 8.831625028515866e-09, + "grad_condition": 22251962.97293579, + "lr": 0.0007316480175599307, + "time_sec": 66.76648426055908 + }, + { + "epoch": 53, + "train_loss": 3.348167460861206, + "train_acc": 0.19116, + "test_loss": 6.423485536193848, + "test_acc": 0.0194, + "lyapunov": null, + "grad_norm": 0.49189585228327304, + "grad_max_sv": 0.17462090440094472, + "grad_min_sv": 8.786478893248183e-09, + "grad_condition": 188050773.829039, + "lr": 0.0007223175895924635, + "time_sec": 66.76346206665039 + }, + { + "epoch": 54, + "train_loss": 3.348860473022461, + "train_acc": 0.1902, + "test_loss": 5.888034158325195, + "test_acc": 0.0208, + "lyapunov": null, + "grad_norm": 0.49279210316788963, + "grad_max_sv": 0.17498359829187393, + "grad_min_sv": 8.822100200367444e-09, + "grad_condition": 28219026.60736394, + "lr": 0.0007128896457825361, + "time_sec": 66.78646183013916 + }, + { + "epoch": 55, + "train_loss": 3.340097451171875, + "train_acc": 0.19068, + "test_loss": 6.104175454711914, + "test_acc": 0.0217, + "lyapunov": null, + "grad_norm": 0.48880812803196916, + "grad_max_sv": 0.16894785091280937, + "grad_min_sv": 8.688565139580718e-09, + "grad_condition": 29986515.161999334, + "lr": 0.0007033683215378998, + "time_sec": 66.76022791862488 + }, + { + "epoch": 56, + "train_loss": 3.3290103381347658, + "train_acc": 0.19526, + "test_loss": 6.31472435760498, + "test_acc": 0.021, + "lyapunov": null, + "grad_norm": 0.4920323275084941, + "grad_max_sv": 0.16673259809613228, + "grad_min_sv": 8.834232892440674e-09, + "grad_condition": 22477005.35692047, + "lr": 0.0006937577932260512, + "time_sec": 66.74644947052002 + }, + { + "epoch": 57, + "train_loss": 3.3146336823272704, + "train_acc": 0.19646, + "test_loss": 5.99189327545166, + "test_acc": 0.0226, + "lyapunov": null, + "grad_norm": 0.48946191063890415, + "grad_max_sv": 0.167069473862648, + "grad_min_sv": 8.78488659317167e-09, + "grad_condition": 21365105.05732888, + "lr": 0.0006840622763423388, + "time_sec": 66.73155951499939 + }, + { + "epoch": 58, + "train_loss": 3.304142900466919, + "train_acc": 0.19854, + "test_loss": 5.5838108703613285, + "test_acc": 0.0256, + "lyapunov": null, + "grad_norm": 0.4865732671541852, + "grad_max_sv": 0.16740650571882726, + "grad_min_sv": 8.786859095888389e-09, + "grad_condition": 22043022.83729876, + "lr": 0.0006742860236609073, + "time_sec": 66.7638807296753 + }, + { + "epoch": 59, + "train_loss": 3.306339856491089, + "train_acc": 0.19832, + "test_loss": 6.71665584564209, + "test_acc": 0.0226, + "lyapunov": null, + "grad_norm": 0.4874859882247268, + "grad_max_sv": 0.17165971212089062, + "grad_min_sv": 8.715364420430748e-09, + "grad_condition": 25734869.826652374, + "lr": 0.0006644333233692913, + "time_sec": 66.69665598869324 + }, + { + "epoch": 60, + "train_loss": 3.2998611443328856, + "train_acc": 0.19806, + "test_loss": 5.851872462463379, + "test_acc": 0.0215, + "lyapunov": null, + "grad_norm": 0.4884739100521322, + "grad_max_sv": 0.16974798031151295, + "grad_min_sv": 8.883696248074279e-09, + "grad_condition": 21737745.94010177, + "lr": 0.0006545084971874734, + "time_sec": 66.72846579551697 + }, + { + "epoch": 61, + "train_loss": 3.2928254180908203, + "train_acc": 0.19828, + "test_loss": 5.552249732971191, + "test_acc": 0.023, + "lyapunov": null, + "grad_norm": 0.49016744220935893, + "grad_max_sv": 0.16948793716728688, + "grad_min_sv": 8.760361631943159e-09, + "grad_condition": 27254819.27808509, + "lr": 0.0006445158984722354, + "time_sec": 66.78463363647461 + }, + { + "epoch": 62, + "train_loss": 3.275610556716919, + "train_acc": 0.20532, + "test_loss": 5.873171199035644, + "test_acc": 0.0219, + "lyapunov": null, + "grad_norm": 0.4866265828805679, + "grad_max_sv": 0.16542929150164126, + "grad_min_sv": 8.78843325786971e-09, + "grad_condition": 66183687.20952544, + "lr": 0.0006344599103076324, + "time_sec": 66.76870799064636 + }, + { + "epoch": 63, + "train_loss": 3.271966901855469, + "train_acc": 0.20438, + "test_loss": 5.9298525764465335, + "test_acc": 0.024, + "lyapunov": null, + "grad_norm": 0.4859022585476048, + "grad_max_sv": 0.16404966413974761, + "grad_min_sv": 8.811849419587681e-09, + "grad_condition": 22319350.467063613, + "lr": 0.0006243449435824269, + "time_sec": 66.73905062675476 + }, + { + "epoch": 64, + "train_loss": 3.266578521652222, + "train_acc": 0.2042, + "test_loss": 5.641555810546875, + "test_acc": 0.0272, + "lyapunov": null, + "grad_norm": 0.48486007197076664, + "grad_max_sv": 0.1655890803784132, + "grad_min_sv": 8.723941788413291e-09, + "grad_condition": 22305108.16299928, + "lr": 0.0006141754350553275, + "time_sec": 66.7476577758789 + }, + { + "epoch": 65, + "train_loss": 3.2511880633544923, + "train_acc": 0.2074, + "test_loss": 5.8412233901977535, + "test_acc": 0.024, + "lyapunov": null, + "grad_norm": 0.48754428036288966, + "grad_max_sv": 0.16739307381212712, + "grad_min_sv": 8.817329924526441e-09, + "grad_condition": 21968003.756148495, + "lr": 0.0006039558454088793, + "time_sec": 66.75903058052063 + }, + { + "epoch": 66, + "train_loss": 3.249825279388428, + "train_acc": 0.2102, + "test_loss": 5.375687086486816, + "test_acc": 0.0237, + "lyapunov": null, + "grad_norm": 0.4852656386861206, + "grad_max_sv": 0.16313621625304223, + "grad_min_sv": 8.705907367234644e-09, + "grad_condition": 22679705.957923576, + "lr": 0.000593690657292862, + "time_sec": 66.70783424377441 + }, + { + "epoch": 67, + "train_loss": 3.245251103134155, + "train_acc": 0.21036, + "test_loss": 6.777110389709472, + "test_acc": 0.0168, + "lyapunov": null, + "grad_norm": 0.4867378238882827, + "grad_max_sv": 0.1655280452221632, + "grad_min_sv": 8.915351975939679e-09, + "grad_condition": 110454092.86004348, + "lr": 0.0005833843733580507, + "time_sec": 66.69803929328918 + }, + { + "epoch": 68, + "train_loss": 3.2381321800231935, + "train_acc": 0.20952, + "test_loss": 6.102328826904297, + "test_acc": 0.0197, + "lyapunov": null, + "grad_norm": 0.48671688246611916, + "grad_max_sv": 0.1659169655293226, + "grad_min_sv": 8.76257463186536e-09, + "grad_condition": 44812459.07892763, + "lr": 0.0005730415142812054, + "time_sec": 66.69719409942627 + }, + { + "epoch": 69, + "train_loss": 3.2316595709991454, + "train_acc": 0.21144, + "test_loss": 5.602972175598144, + "test_acc": 0.0242, + "lyapunov": null, + "grad_norm": 0.4847784835340826, + "grad_max_sv": 0.1632793139666319, + "grad_min_sv": 8.814856525610204e-09, + "grad_condition": 107593372.59174109, + "lr": 0.0005626666167821517, + "time_sec": 66.68555569648743 + }, + { + "epoch": 70, + "train_loss": 3.21884576965332, + "train_acc": 0.21162, + "test_loss": 6.080870904541015, + "test_acc": 0.0219, + "lyapunov": null, + "grad_norm": 0.4868075160552665, + "grad_max_sv": 0.15996163412928582, + "grad_min_sv": 8.820852938351554e-09, + "grad_condition": 24906478.982524626, + "lr": 0.0005522642316338265, + "time_sec": 66.75078678131104 + }, + { + "epoch": 71, + "train_loss": 3.2169480547332765, + "train_acc": 0.2131, + "test_loss": 6.322179025268555, + "test_acc": 0.022, + "lyapunov": null, + "grad_norm": 0.48693869340308327, + "grad_max_sv": 0.16328724324703217, + "grad_min_sv": 8.897740871871563e-09, + "grad_condition": 21378151.74249644, + "lr": 0.0005418389216661573, + "time_sec": 66.82618498802185 + }, + { + "epoch": 72, + "train_loss": 3.209583250656128, + "train_acc": 0.21452, + "test_loss": 5.9164725677490235, + "test_acc": 0.0244, + "lyapunov": null, + "grad_norm": 0.48710676929190333, + "grad_max_sv": 0.1638231087476015, + "grad_min_sv": 8.895584530099753e-09, + "grad_condition": 26372411.903145302, + "lr": 0.0005313952597646563, + "time_sec": 66.76002073287964 + }, + { + "epoch": 73, + "train_loss": 3.206989998016357, + "train_acc": 0.2156, + "test_loss": 6.779888274383545, + "test_acc": 0.02, + "lyapunov": null, + "grad_norm": 0.4871385804296449, + "grad_max_sv": 0.16540717855095863, + "grad_min_sv": 8.919061500467506e-09, + "grad_condition": 24713788.997361727, + "lr": 0.0005209378268645994, + "time_sec": 66.79043841362 + }, + { + "epoch": 74, + "train_loss": 3.196985797729492, + "train_acc": 0.21718, + "test_loss": 6.031893154907227, + "test_acc": 0.0279, + "lyapunov": null, + "grad_norm": 0.4885299333145373, + "grad_max_sv": 0.1637456502765417, + "grad_min_sv": 8.884239661999249e-09, + "grad_condition": 31643344.54858377, + "lr": 0.0005104712099416781, + "time_sec": 66.7399845123291 + }, + { + "epoch": 75, + "train_loss": 3.1916642933654784, + "train_acc": 0.21804, + "test_loss": 6.505784149169922, + "test_acc": 0.0263, + "lyapunov": null, + "grad_norm": 0.48738903646108195, + "grad_max_sv": 0.16264366619288922, + "grad_min_sv": 8.976378307323785e-09, + "grad_condition": 23550016.098660976, + "lr": 0.0004999999999999996, + "time_sec": 66.73288559913635 + }, + { + "epoch": 76, + "train_loss": 3.1814585160827638, + "train_acc": 0.22052, + "test_loss": 6.48178818359375, + "test_acc": 0.0271, + "lyapunov": null, + "grad_norm": 0.4843426315380276, + "grad_max_sv": 0.16138911359012126, + "grad_min_sv": 8.912034432650984e-09, + "grad_condition": 23286891.30520594, + "lr": 0.0004895287900583212, + "time_sec": 66.69967555999756 + }, + { + "epoch": 77, + "train_loss": 3.1693101245117186, + "train_acc": 0.22188, + "test_loss": 6.60695295715332, + "test_acc": 0.0274, + "lyapunov": null, + "grad_norm": 0.48473864055458005, + "grad_max_sv": 0.16252022571861743, + "grad_min_sv": 8.865778075572983e-09, + "grad_condition": 20379861.793125592, + "lr": 0.0004790621731353997, + "time_sec": 66.73058843612671 + }, + { + "epoch": 78, + "train_loss": 3.172366504058838, + "train_acc": 0.22092, + "test_loss": 6.633734432983398, + "test_acc": 0.0249, + "lyapunov": null, + "grad_norm": 0.4834678400720691, + "grad_max_sv": 0.1624290570616722, + "grad_min_sv": 8.932120706961477e-09, + "grad_condition": 23408681.375307254, + "lr": 0.000468604740235343, + "time_sec": 66.69404172897339 + }, + { + "epoch": 79, + "train_loss": 3.1615784413146972, + "train_acc": 0.2258, + "test_loss": 6.273578634643554, + "test_acc": 0.0281, + "lyapunov": null, + "grad_norm": 0.48944403353102334, + "grad_max_sv": 0.16398866586387156, + "grad_min_sv": 8.946382384911189e-09, + "grad_condition": 22712578.898883633, + "lr": 0.00045816107833384175, + "time_sec": 66.7472972869873 + }, + { + "epoch": 80, + "train_loss": 3.1575608079528807, + "train_acc": 0.22382, + "test_loss": 6.2906877746582035, + "test_acc": 0.0273, + "lyapunov": null, + "grad_norm": 0.4897084401415468, + "grad_max_sv": 0.16338732056319713, + "grad_min_sv": 8.928839754715478e-09, + "grad_condition": 54043718.99023694, + "lr": 0.0004477357683661729, + "time_sec": 66.72847270965576 + }, + { + "epoch": 81, + "train_loss": 3.1497875170898437, + "train_acc": 0.22584, + "test_loss": 6.6115754776000975, + "test_acc": 0.0248, + "lyapunov": null, + "grad_norm": 0.48772100619317266, + "grad_max_sv": 0.15775733068585396, + "grad_min_sv": 9.009791279712686e-09, + "grad_condition": 20818306.202141248, + "lr": 0.00043733338321784746, + "time_sec": 66.74951100349426 + }, + { + "epoch": 82, + "train_loss": 3.150099751586914, + "train_acc": 0.22466, + "test_loss": 6.489882479858398, + "test_acc": 0.0283, + "lyapunov": null, + "grad_norm": 0.48649716303896257, + "grad_max_sv": 0.15712360739707948, + "grad_min_sv": 8.928376640099378e-09, + "grad_condition": 33122173.6130862, + "lr": 0.0004269584857187939, + "time_sec": 66.73039722442627 + }, + { + "epoch": 83, + "train_loss": 3.1423302052307127, + "train_acc": 0.22782, + "test_loss": 6.021305515289306, + "test_acc": 0.029, + "lyapunov": null, + "grad_norm": 0.48633742199561775, + "grad_max_sv": 0.1581266548484564, + "grad_min_sv": 8.888032958058456e-09, + "grad_condition": 115025831.2804152, + "lr": 0.0004166156266419484, + "time_sec": 66.74857115745544 + }, + { + "epoch": 84, + "train_loss": 3.128035169677734, + "train_acc": 0.22886, + "test_loss": 6.798161625671387, + "test_acc": 0.0261, + "lyapunov": null, + "grad_norm": 0.48802181363511177, + "grad_max_sv": 0.1612305197864771, + "grad_min_sv": 8.905917459056666e-09, + "grad_condition": 24037955.80487976, + "lr": 0.0004063093427071373, + "time_sec": 66.70986270904541 + }, + { + "epoch": 85, + "train_loss": 3.127580302810669, + "train_acc": 0.23112, + "test_loss": 6.7588252937316895, + "test_acc": 0.0261, + "lyapunov": null, + "grad_norm": 0.4875306431638057, + "grad_max_sv": 0.16091111600399016, + "grad_min_sv": 9.01161150146379e-09, + "grad_condition": 21073737.755382914, + "lr": 0.0003960441545911199, + "time_sec": 66.68802571296692 + }, + { + "epoch": 86, + "train_loss": 3.114855668182373, + "train_acc": 0.2308, + "test_loss": 6.564279100036621, + "test_acc": 0.0282, + "lyapunov": null, + "grad_norm": 0.48637730612121255, + "grad_max_sv": 0.15542719289660453, + "grad_min_sv": 8.93872263707518e-09, + "grad_condition": 21703985.404231258, + "lr": 0.0003858245649446718, + "time_sec": 66.6933023929596 + }, + { + "epoch": 87, + "train_loss": 3.1120968659210204, + "train_acc": 0.23044, + "test_loss": 6.98433928451538, + "test_acc": 0.0287, + "lyapunov": null, + "grad_norm": 0.4900107193499055, + "grad_max_sv": 0.16207418888807296, + "grad_min_sv": 8.972892097738883e-09, + "grad_condition": 47614869.04451983, + "lr": 0.00037565505641757235, + "time_sec": 66.71200680732727 + }, + { + "epoch": 88, + "train_loss": 3.105097593078613, + "train_acc": 0.23214, + "test_loss": 6.7922447959899905, + "test_acc": 0.0302, + "lyapunov": null, + "grad_norm": 0.4884472360111878, + "grad_max_sv": 0.15889082551002504, + "grad_min_sv": 8.899033936138335e-09, + "grad_condition": 25000729.654329486, + "lr": 0.00036554008969236695, + "time_sec": 66.7427408695221 + }, + { + "epoch": 89, + "train_loss": 3.0926671070098877, + "train_acc": 0.23664, + "test_loss": 6.916401704406738, + "test_acc": 0.0283, + "lyapunov": null, + "grad_norm": 0.49050493507655857, + "grad_max_sv": 0.16100925132632254, + "grad_min_sv": 9.010439719348006e-09, + "grad_condition": 21207674.720614858, + "lr": 0.0003554841015277638, + "time_sec": 66.76495027542114 + }, + { + "epoch": 90, + "train_loss": 3.090296846160889, + "train_acc": 0.23536, + "test_loss": 7.012615090179444, + "test_acc": 0.0308, + "lyapunov": null, + "grad_norm": 0.49019979842343425, + "grad_max_sv": 0.1572930809110403, + "grad_min_sv": 8.949024762796698e-09, + "grad_condition": 734920063.8359609, + "lr": 0.000345491502812526, + "time_sec": 66.73302173614502 + }, + { + "epoch": 91, + "train_loss": 3.085657378997803, + "train_acc": 0.23746, + "test_loss": 6.360618818664551, + "test_acc": 0.0363, + "lyapunov": null, + "grad_norm": 0.4915162849741807, + "grad_max_sv": 0.15855198130011558, + "grad_min_sv": 8.980356871329809e-09, + "grad_condition": 28731902.889844812, + "lr": 0.0003355666766307081, + "time_sec": 66.74396848678589 + }, + { + "epoch": 92, + "train_loss": 3.0831817041778566, + "train_acc": 0.2383, + "test_loss": 5.9396498611450195, + "test_acc": 0.0352, + "lyapunov": null, + "grad_norm": 0.49047678071806555, + "grad_max_sv": 0.15942419767379762, + "grad_min_sv": 9.062854348755588e-09, + "grad_condition": 57497218.341688454, + "lr": 0.00032571397633909225, + "time_sec": 66.77806997299194 + }, + { + "epoch": 93, + "train_loss": 3.071146830596924, + "train_acc": 0.23998, + "test_loss": 6.60078558807373, + "test_acc": 0.0328, + "lyapunov": null, + "grad_norm": 0.48952410405337216, + "grad_max_sv": 0.1553661532700062, + "grad_min_sv": 9.10862152092573e-09, + "grad_condition": 20074531.31734441, + "lr": 0.00031593772365766094, + "time_sec": 66.71407961845398 + }, + { + "epoch": 94, + "train_loss": 3.0655629290008544, + "train_acc": 0.23992, + "test_loss": 6.003435957336426, + "test_acc": 0.0378, + "lyapunov": null, + "grad_norm": 0.49221246193757373, + "grad_max_sv": 0.15908809714019298, + "grad_min_sv": 9.144222304358074e-09, + "grad_condition": 19907441.898985844, + "lr": 0.0003062422067739483, + "time_sec": 66.693532705307 + }, + { + "epoch": 95, + "train_loss": 3.060634704437256, + "train_acc": 0.23888, + "test_loss": 6.056681440734863, + "test_acc": 0.0373, + "lyapunov": null, + "grad_norm": 0.49339217556104, + "grad_max_sv": 0.15901063568890095, + "grad_min_sv": 9.065924972545547e-09, + "grad_condition": 29502219.759497046, + "lr": 0.00029663167846209965, + "time_sec": 66.70557427406311 + }, + { + "epoch": 96, + "train_loss": 3.061671485443115, + "train_acc": 0.24224, + "test_loss": 6.776474742126465, + "test_acc": 0.0353, + "lyapunov": null, + "grad_norm": 0.49062641992823525, + "grad_max_sv": 0.15993262231349945, + "grad_min_sv": 9.044680277306427e-09, + "grad_condition": 42484326.952753186, + "lr": 0.00028711035421746345, + "time_sec": 66.71291422843933 + }, + { + "epoch": 97, + "train_loss": 3.0552709561157227, + "train_acc": 0.24368, + "test_loss": 6.627662403869629, + "test_acc": 0.0312, + "lyapunov": null, + "grad_norm": 0.49312118223102674, + "grad_max_sv": 0.1586600374430418, + "grad_min_sv": 9.106857379315159e-09, + "grad_condition": 19815371.442228314, + "lr": 0.00027768241040753615, + "time_sec": 66.74342608451843 + }, + { + "epoch": 98, + "train_loss": 3.047260310974121, + "train_acc": 0.24534, + "test_loss": 6.661625199890136, + "test_acc": 0.0358, + "lyapunov": null, + "grad_norm": 0.4920094661808142, + "grad_max_sv": 0.1592965368181467, + "grad_min_sv": 9.102059620250124e-09, + "grad_condition": 78440147.91108674, + "lr": 0.00026835198244006903, + "time_sec": 66.75223684310913 + }, + { + "epoch": 99, + "train_loss": 3.046775559768677, + "train_acc": 0.24216, + "test_loss": 6.965150428771973, + "test_acc": 0.0306, + "lyapunov": null, + "grad_norm": 0.4926874565507386, + "grad_max_sv": 0.16148377656936647, + "grad_min_sv": 9.167028746162597e-09, + "grad_condition": 82327087.71133485, + "lr": 0.0002591231629491421, + "time_sec": 66.76156210899353 + }, + { + "epoch": 100, + "train_loss": 3.041998874053955, + "train_acc": 0.24108, + "test_loss": 6.647268369293213, + "test_acc": 0.0319, + "lyapunov": null, + "grad_norm": 0.49732363208650837, + "grad_max_sv": 0.15973055586218834, + "grad_min_sv": 9.144760823587283e-09, + "grad_condition": 19643395.96339509, + "lr": 0.0002499999999999997, + "time_sec": 66.74560022354126 + }, + { + "epoch": 101, + "train_loss": 3.0355277448272706, + "train_acc": 0.24656, + "test_loss": 6.661636563873291, + "test_acc": 0.0352, + "lyapunov": null, + "grad_norm": 0.4945949712556627, + "grad_max_sv": 0.16228868998587132, + "grad_min_sv": 9.097275698727314e-09, + "grad_condition": 29717156.96899251, + "lr": 0.00024098649531343477, + "time_sec": 66.74929976463318 + }, + { + "epoch": 102, + "train_loss": 3.028595997467041, + "train_acc": 0.24942, + "test_loss": 7.008212976837158, + "test_acc": 0.0297, + "lyapunov": null, + "grad_norm": 0.4951875945091829, + "grad_max_sv": 0.1601081270724535, + "grad_min_sv": 9.183049341776606e-09, + "grad_condition": 28833554.07107707, + "lr": 0.0002320866025105016, + "time_sec": 66.70356440544128 + }, + { + "epoch": 103, + "train_loss": 3.0245940507507325, + "train_acc": 0.24584, + "test_loss": 6.46308011932373, + "test_acc": 0.0341, + "lyapunov": null, + "grad_norm": 0.49371498929192353, + "grad_max_sv": 0.15619246214628218, + "grad_min_sv": 9.060142111202984e-09, + "grad_condition": 39182662.24958947, + "lr": 0.0002233042253783278, + "time_sec": 66.71340656280518 + }, + { + "epoch": 104, + "train_loss": 3.021408618774414, + "train_acc": 0.2456, + "test_loss": 6.825051796722412, + "test_acc": 0.0336, + "lyapunov": null, + "grad_norm": 0.4938389055758033, + "grad_max_sv": 0.1602877888828516, + "grad_min_sv": 9.021206631709689e-09, + "grad_condition": 22621712.521351572, + "lr": 0.000214643216157784, + "time_sec": 66.69873213768005 + }, + { + "epoch": 105, + "train_loss": 3.0085532719421386, + "train_acc": 0.25126, + "test_loss": 6.49373994140625, + "test_acc": 0.0345, + "lyapunov": null, + "grad_norm": 0.49734202210836465, + "grad_max_sv": 0.1637524042278528, + "grad_min_sv": 9.15554402847185e-09, + "grad_condition": 21636907.97691984, + "lr": 0.00020610737385376332, + "time_sec": 66.7116219997406 + }, + { + "epoch": 106, + "train_loss": 3.0132780470275877, + "train_acc": 0.24846, + "test_loss": 6.5495201698303225, + "test_acc": 0.0336, + "lyapunov": null, + "grad_norm": 0.4981310757648767, + "grad_max_sv": 0.15820327922701835, + "grad_min_sv": 9.158961136734866e-09, + "grad_condition": 20307530.065489154, + "lr": 0.00019770044256881242, + "time_sec": 66.74218201637268 + }, + { + "epoch": 107, + "train_loss": 3.0039769695281984, + "train_acc": 0.24998, + "test_loss": 6.218603918457031, + "test_acc": 0.0361, + "lyapunov": null, + "grad_norm": 0.4961392053949623, + "grad_max_sv": 0.1600139781832695, + "grad_min_sv": 9.131589118194228e-09, + "grad_condition": 36979479.48401734, + "lr": 0.0001894261098608447, + "time_sec": 66.80793809890747 + }, + { + "epoch": 108, + "train_loss": 3.001887908782959, + "train_acc": 0.2516, + "test_loss": 6.588950064086914, + "test_acc": 0.0328, + "lyapunov": null, + "grad_norm": 0.49597326074702125, + "grad_max_sv": 0.1588774763047695, + "grad_min_sv": 9.17765310692875e-09, + "grad_condition": 50896304.22255845, + "lr": 0.000181288005125655, + "time_sec": 66.76537990570068 + }, + { + "epoch": 109, + "train_loss": 2.9904132221221924, + "train_acc": 0.25664, + "test_loss": 6.382045315551758, + "test_acc": 0.0395, + "lyapunov": null, + "grad_norm": 0.4973619331899814, + "grad_max_sv": 0.1614119179546833, + "grad_min_sv": 9.145205881466722e-09, + "grad_condition": 19754492.90124496, + "lr": 0.0001732896980049473, + "time_sec": 66.78630447387695 + }, + { + "epoch": 110, + "train_loss": 2.989228514251709, + "train_acc": 0.25492, + "test_loss": 6.322301493072509, + "test_acc": 0.0369, + "lyapunov": null, + "grad_norm": 0.498337161336674, + "grad_max_sv": 0.15811876803636551, + "grad_min_sv": 9.229779307506902e-09, + "grad_condition": 19822899.140848357, + "lr": 0.00016543469682057076, + "time_sec": 66.75606536865234 + }, + { + "epoch": 111, + "train_loss": 2.984906556854248, + "train_acc": 0.25606, + "test_loss": 6.8701157440185545, + "test_acc": 0.0367, + "lyapunov": null, + "grad_norm": 0.49721550527739367, + "grad_max_sv": 0.16228222362697126, + "grad_min_sv": 9.23479824502943e-09, + "grad_condition": 293614052.48096585, + "lr": 0.00015772644703565552, + "time_sec": 66.73988127708435 + }, + { + "epoch": 112, + "train_loss": 2.9811305560302737, + "train_acc": 0.25646, + "test_loss": 7.038999290466308, + "test_acc": 0.0335, + "lyapunov": null, + "grad_norm": 0.4941490782513605, + "grad_max_sv": 0.15477370359003545, + "grad_min_sv": 9.218313174429171e-09, + "grad_condition": 164935506.24721447, + "lr": 0.00015016832974331713, + "time_sec": 66.71515774726868 + }, + { + "epoch": 113, + "train_loss": 2.9800968042755125, + "train_acc": 0.25398, + "test_loss": 6.309658117675781, + "test_acc": 0.0389, + "lyapunov": null, + "grad_norm": 0.49886850458670223, + "grad_max_sv": 0.16330830678343772, + "grad_min_sv": 9.236376152799153e-09, + "grad_condition": 21870251.37413417, + "lr": 0.00014276366018359834, + "time_sec": 66.71296858787537 + }, + { + "epoch": 114, + "train_loss": 2.9754512078094484, + "train_acc": 0.25594, + "test_loss": 6.60843113861084, + "test_acc": 0.0346, + "lyapunov": null, + "grad_norm": 0.4960627007320755, + "grad_max_sv": 0.1573273716494441, + "grad_min_sv": 9.209630175144312e-09, + "grad_condition": 21208142.4041068, + "lr": 0.00013551568628929425, + "time_sec": 66.73864150047302 + }, + { + "epoch": 115, + "train_loss": 2.973171382446289, + "train_acc": 0.25546, + "test_loss": 6.1580316360473635, + "test_acc": 0.0359, + "lyapunov": null, + "grad_norm": 0.4975170133978326, + "grad_max_sv": 0.16185041181743146, + "grad_min_sv": 9.172154036285463e-09, + "grad_condition": 23675277.644423716, + "lr": 0.00012842758726130276, + "time_sec": 66.7741425037384 + }, + { + "epoch": 116, + "train_loss": 2.9698315058135987, + "train_acc": 0.2585, + "test_loss": 6.728188695526123, + "test_acc": 0.0352, + "lyapunov": null, + "grad_norm": 0.49786156791485014, + "grad_max_sv": 0.1629601776599884, + "grad_min_sv": 9.141069147108882e-09, + "grad_condition": 42245446.81835711, + "lr": 0.0001215024721741218, + "time_sec": 66.85877132415771 + }, + { + "epoch": 117, + "train_loss": 2.96759364151001, + "train_acc": 0.25688, + "test_loss": 6.810253086853027, + "test_acc": 0.0317, + "lyapunov": null, + "grad_norm": 0.5004102922188621, + "grad_max_sv": 0.16316126510500908, + "grad_min_sv": 9.275286505516789e-09, + "grad_condition": 21737711.712548293, + "lr": 0.00011474337861210538, + "time_sec": 66.78435349464417 + }, + { + "epoch": 118, + "train_loss": 2.9639752848815917, + "train_acc": 0.25784, + "test_loss": 6.6183334121704105, + "test_acc": 0.037, + "lyapunov": null, + "grad_norm": 0.4993536159032588, + "grad_max_sv": 0.16331967823207377, + "grad_min_sv": 9.30454736036701e-09, + "grad_condition": 24980238.64283476, + "lr": 0.00010815327133708009, + "time_sec": 66.78651332855225 + }, + { + "epoch": 119, + "train_loss": 2.955244768218994, + "train_acc": 0.26012, + "test_loss": 7.170739624023438, + "test_acc": 0.03, + "lyapunov": null, + "grad_norm": 0.49772875386211013, + "grad_max_sv": 0.15745177641510963, + "grad_min_sv": 9.275912776773865e-09, + "grad_condition": 20252652.260798354, + "lr": 0.00010173504098790182, + "time_sec": 66.7590229511261 + }, + { + "epoch": 120, + "train_loss": 2.9573191987609864, + "train_acc": 0.25902, + "test_loss": 6.63704820098877, + "test_acc": 0.0341, + "lyapunov": null, + "grad_norm": 0.4996347696527594, + "grad_max_sv": 0.16082486175000668, + "grad_min_sv": 9.223728218710203e-09, + "grad_condition": 31826325.619799424, + "lr": 9.549150281252629e-05, + "time_sec": 66.7681827545166 + }, + { + "epoch": 121, + "train_loss": 2.9523595883178713, + "train_acc": 0.2618, + "test_loss": 6.729842405700683, + "test_acc": 0.036, + "lyapunov": null, + "grad_norm": 0.5013710314611776, + "grad_max_sv": 0.15908933244645596, + "grad_min_sv": 9.356316055253444e-09, + "grad_condition": 25691489.85231958, + "lr": 8.942539543314794e-05, + "time_sec": 66.74568009376526 + }, + { + "epoch": 122, + "train_loss": 2.9497915851593017, + "train_acc": 0.2617, + "test_loss": 6.87424278717041, + "test_acc": 0.033, + "lyapunov": null, + "grad_norm": 0.5005453549657005, + "grad_max_sv": 0.16275203377008438, + "grad_min_sv": 9.293272996112322e-09, + "grad_condition": 83221431.81677945, + "lr": 8.353937964495024e-05, + "time_sec": 66.74210405349731 + }, + { + "epoch": 123, + "train_loss": 2.9416942150115966, + "train_acc": 0.2643, + "test_loss": 6.686075965118408, + "test_acc": 0.0363, + "lyapunov": null, + "grad_norm": 0.5025049175782571, + "grad_max_sv": 0.15961344465613364, + "grad_min_sv": 9.371966801230425e-09, + "grad_condition": 35132803.96387108, + "lr": 7.783603724899243e-05, + "time_sec": 66.75957775115967 + }, + { + "epoch": 124, + "train_loss": 2.94895947555542, + "train_acc": 0.25956, + "test_loss": 6.959716784667969, + "test_acc": 0.0344, + "lyapunov": null, + "grad_norm": 0.5043618033931743, + "grad_max_sv": 0.16490019261837005, + "grad_min_sv": 9.45151938935851e-09, + "grad_condition": 20739176.963236075, + "lr": 7.231786991974666e-05, + "time_sec": 66.76986241340637 + }, + { + "epoch": 125, + "train_loss": 2.9465578133392336, + "train_acc": 0.2615, + "test_loss": 6.6146667854309085, + "test_acc": 0.0372, + "lyapunov": null, + "grad_norm": 0.50165695568463, + "grad_max_sv": 0.16004594042897224, + "grad_min_sv": 9.333669109823362e-09, + "grad_condition": 27696527.631483592, + "lr": 6.698729810778072e-05, + "time_sec": 66.79878735542297 + }, + { + "epoch": 126, + "train_loss": 2.944279951171875, + "train_acc": 0.25922, + "test_loss": 6.776188401794434, + "test_acc": 0.0359, + "lyapunov": null, + "grad_norm": 0.5004778327715103, + "grad_max_sv": 0.1615132074803114, + "grad_min_sv": 9.285796417901615e-09, + "grad_condition": 20380420.794493236, + "lr": 6.184665997806817e-05, + "time_sec": 66.81306886672974 + }, + { + "epoch": 127, + "train_loss": 2.9345046046447756, + "train_acc": 0.26554, + "test_loss": 6.409585705566406, + "test_acc": 0.0365, + "lyapunov": null, + "grad_norm": 0.5009056150070453, + "grad_max_sv": 0.16262583658099175, + "grad_min_sv": 9.41551325135681e-09, + "grad_condition": 92271454.95901966, + "lr": 5.6898210384392595e-05, + "time_sec": 66.77955317497253 + }, + { + "epoch": 128, + "train_loss": 2.9406036145782473, + "train_acc": 0.26226, + "test_loss": 6.883744766235352, + "test_acc": 0.0362, + "lyapunov": null, + "grad_norm": 0.5019103000513857, + "grad_max_sv": 0.15915893130004405, + "grad_min_sv": 9.27946301465532e-09, + "grad_condition": 26892136.241638493, + "lr": 5.214411988029363e-05, + "time_sec": 66.7971682548523 + }, + { + "epoch": 129, + "train_loss": 2.9357696857452393, + "train_acc": 0.26482, + "test_loss": 6.798914263916016, + "test_acc": 0.0371, + "lyapunov": null, + "grad_norm": 0.502875147430765, + "grad_max_sv": 0.16597487404942513, + "grad_min_sv": 9.331743605622833e-09, + "grad_condition": 21894734.234583445, + "lr": 4.7586473766990294e-05, + "time_sec": 66.76526641845703 + }, + { + "epoch": 130, + "train_loss": 2.931978320159912, + "train_acc": 0.2632, + "test_loss": 6.588931091308594, + "test_acc": 0.0383, + "lyapunov": null, + "grad_norm": 0.5024988425718886, + "grad_max_sv": 0.16058847755193711, + "grad_min_sv": 9.346998992854072e-09, + "grad_condition": 23689235.71364718, + "lr": 4.32272711786996e-05, + "time_sec": 66.73650169372559 + }, + { + "epoch": 131, + "train_loss": 2.9257036571502684, + "train_acc": 0.26346, + "test_loss": 6.79047756652832, + "test_acc": 0.037, + "lyapunov": null, + "grad_norm": 0.5025936155191698, + "grad_max_sv": 0.1606222338974476, + "grad_min_sv": 9.344622825535609e-09, + "grad_condition": 19448498.594337363, + "lr": 3.906842420574966e-05, + "time_sec": 66.72977805137634 + }, + { + "epoch": 132, + "train_loss": 2.9238443630981443, + "train_acc": 0.26652, + "test_loss": 6.582272483825683, + "test_acc": 0.0359, + "lyapunov": null, + "grad_norm": 0.5057115235264575, + "grad_max_sv": 0.1622081771492958, + "grad_min_sv": 9.322094066382264e-09, + "grad_condition": 110706873.75285177, + "lr": 3.5111757055874305e-05, + "time_sec": 66.74127459526062 + }, + { + "epoch": 133, + "train_loss": 2.9275563074493407, + "train_acc": 0.26798, + "test_loss": 6.701000856018067, + "test_acc": 0.0403, + "lyapunov": null, + "grad_norm": 0.5047358455148018, + "grad_max_sv": 0.1596795056015253, + "grad_min_sv": 9.385729068944748e-09, + "grad_condition": 24899256.961485635, + "lr": 3.1359005254054254e-05, + "time_sec": 66.78476786613464 + }, + { + "epoch": 134, + "train_loss": 2.922698397293091, + "train_acc": 0.2656, + "test_loss": 6.822336962890625, + "test_acc": 0.0348, + "lyapunov": null, + "grad_norm": 0.5011816329114258, + "grad_max_sv": 0.16208452992141248, + "grad_min_sv": 9.367489639533489e-09, + "grad_condition": 21334456.488015514, + "lr": 2.7811814881259484e-05, + "time_sec": 66.77467155456543 + }, + { + "epoch": 135, + "train_loss": 2.9318275360870363, + "train_acc": 0.26446, + "test_loss": 6.82299095916748, + "test_acc": 0.0375, + "lyapunov": null, + "grad_norm": 0.5036159796429942, + "grad_max_sv": 0.16086461171507835, + "grad_min_sv": 9.421430274825227e-09, + "grad_condition": 23697065.511433274, + "lr": 2.4471741852423218e-05, + "time_sec": 66.81163048744202 + }, + { + "epoch": 136, + "train_loss": 2.924918181915283, + "train_acc": 0.26562, + "test_loss": 6.8049731414794925, + "test_acc": 0.0379, + "lyapunov": null, + "grad_norm": 0.5025705246301901, + "grad_max_sv": 0.1608381040394306, + "grad_min_sv": 9.298360864606891e-09, + "grad_condition": 21070247.46761896, + "lr": 2.1340251233966362e-05, + "time_sec": 66.75751781463623 + }, + { + "epoch": 137, + "train_loss": 2.9179174461364745, + "train_acc": 0.267, + "test_loss": 7.41930817565918, + "test_acc": 0.0354, + "lyapunov": null, + "grad_norm": 0.5020038013732862, + "grad_max_sv": 0.16103104539215565, + "grad_min_sv": 9.377383154707264e-09, + "grad_condition": 25924694.766624488, + "lr": 1.8418716601170932e-05, + "time_sec": 66.75570106506348 + }, + { + "epoch": 138, + "train_loss": 2.923201954345703, + "train_acc": 0.26658, + "test_loss": 6.757112614440918, + "test_acc": 0.0368, + "lyapunov": null, + "grad_norm": 0.5024810225531171, + "grad_max_sv": 0.1589697927236557, + "grad_min_sv": 9.370084333437667e-09, + "grad_condition": 21088389.845349483, + "lr": 1.570841943568445e-05, + "time_sec": 66.72540855407715 + }, + { + "epoch": 139, + "train_loss": 2.91647822807312, + "train_acc": 0.26728, + "test_loss": 6.73676093826294, + "test_acc": 0.0367, + "lyapunov": null, + "grad_norm": 0.5029392119297419, + "grad_max_sv": 0.16374287530779838, + "grad_min_sv": 9.458621610947127e-09, + "grad_condition": 21151341.282133214, + "lr": 1.3210548563419845e-05, + "time_sec": 66.74242377281189 + }, + { + "epoch": 140, + "train_loss": 2.9202518330383302, + "train_acc": 0.2648, + "test_loss": 7.060108929443359, + "test_acc": 0.0321, + "lyapunov": null, + "grad_norm": 0.5033375321825745, + "grad_max_sv": 0.1628003478050232, + "grad_min_sv": 9.350477757699705e-09, + "grad_condition": 42538003.149772, + "lr": 1.0926199633097203e-05, + "time_sec": 66.72664403915405 + }, + { + "epoch": 141, + "train_loss": 2.9214018739318846, + "train_acc": 0.26676, + "test_loss": 7.03288666305542, + "test_acc": 0.0373, + "lyapunov": null, + "grad_norm": 0.5040934974077137, + "grad_max_sv": 0.1631232462823391, + "grad_min_sv": 9.429894434753727e-09, + "grad_condition": 22205151.285805613, + "lr": 8.856374635655688e-06, + "time_sec": 66.73880624771118 + }, + { + "epoch": 142, + "train_loss": 2.9171245983886718, + "train_acc": 0.26776, + "test_loss": 7.131447039031983, + "test_acc": 0.0347, + "lyapunov": null, + "grad_norm": 0.502296749693395, + "grad_max_sv": 0.16366422846913337, + "grad_min_sv": 9.319274187069571e-09, + "grad_condition": 23643079.173571, + "lr": 7.001981464747503e-06, + "time_sec": 66.7779552936554 + }, + { + "epoch": 143, + "train_loss": 2.922498332595825, + "train_acc": 0.26552, + "test_loss": 6.954830606079102, + "test_acc": 0.0348, + "lyapunov": null, + "grad_norm": 0.5043546674267846, + "grad_max_sv": 0.1646194864064455, + "grad_min_sv": 9.327249025914419e-09, + "grad_condition": 20109722.273851108, + "lr": 5.3638335185058295e-06, + "time_sec": 66.78727650642395 + }, + { + "epoch": 144, + "train_loss": 2.9214989219665526, + "train_acc": 0.26862, + "test_loss": 7.012627954101562, + "test_acc": 0.0377, + "lyapunov": null, + "grad_norm": 0.5036510560585029, + "grad_max_sv": 0.1648405112326145, + "grad_min_sv": 9.423214848702788e-09, + "grad_condition": 39000025.89670716, + "lr": 3.942649342761114e-06, + "time_sec": 66.78706383705139 + }, + { + "epoch": 145, + "train_loss": 2.922225288314819, + "train_acc": 0.2672, + "test_loss": 6.957889157104492, + "test_acc": 0.0364, + "lyapunov": null, + "grad_norm": 0.503867068026341, + "grad_max_sv": 0.16379656754434108, + "grad_min_sv": 9.359998385562173e-09, + "grad_condition": 77281010.69187385, + "lr": 2.7390523158633524e-06, + "time_sec": 66.7628915309906 + }, + { + "epoch": 146, + "train_loss": 2.9163033376312257, + "train_acc": 0.2685, + "test_loss": 6.855587731933594, + "test_acc": 0.0358, + "lyapunov": null, + "grad_norm": 0.5029204495133565, + "grad_max_sv": 0.16139821223914624, + "grad_min_sv": 9.274698062333719e-09, + "grad_condition": 20548752.94100132, + "lr": 1.7535703752478133e-06, + "time_sec": 66.76251316070557 + }, + { + "epoch": 147, + "train_loss": 2.9199572286987303, + "train_acc": 0.2662, + "test_loss": 7.004822827148438, + "test_acc": 0.0334, + "lyapunov": null, + "grad_norm": 0.5038995262415072, + "grad_max_sv": 0.15897907465696334, + "grad_min_sv": 9.380836815675586e-09, + "grad_condition": 19124324.302936584, + "lr": 9.866357858642196e-07, + "time_sec": 66.77228903770447 + }, + { + "epoch": 148, + "train_loss": 2.9100856079101565, + "train_acc": 0.26856, + "test_loss": 7.008816410064697, + "test_acc": 0.0333, + "lyapunov": null, + "grad_norm": 0.5033801740007838, + "grad_max_sv": 0.16318991631269456, + "grad_min_sv": 9.304624077298429e-09, + "grad_condition": 88163387.15126483, + "lr": 4.38584950570808e-07, + "time_sec": 66.73154377937317 + }, + { + "epoch": 149, + "train_loss": 2.918438820800781, + "train_acc": 0.26988, + "test_loss": 7.183802980041504, + "test_acc": 0.0335, + "lyapunov": null, + "grad_norm": 0.5034594519443074, + "grad_max_sv": 0.16287193521857263, + "grad_min_sv": 9.228533171673492e-09, + "grad_condition": 31684078.48425772, + "lr": 1.096582625772501e-07, + "time_sec": 66.71334385871887 + }, + { + "epoch": 150, + "train_loss": 2.9179681867980958, + "train_acc": 0.26896, + "test_loss": 7.132198828887939, + "test_acc": 0.0374, + "lyapunov": null, + "grad_norm": 0.5039379693049055, + "grad_max_sv": 0.16534604988992213, + "grad_min_sv": 9.358835868777949e-09, + "grad_condition": 24483022.85106538, + "lr": 0.0, + "time_sec": 66.76589560508728 + } + ], + "20": [ + { + "epoch": 1, + "train_loss": 5.21357828704834, + "train_acc": 0.00958, + "test_loss": 4.717830415344238, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 6.028281164907647, + "grad_max_sv": 5.586896324157715, + "grad_min_sv": 8.321505736708091e-08, + "grad_condition": 126391405.93672016, + "lr": 0.0009998903417374227, + "time_sec": 83.75971913337708 + }, + { + "epoch": 2, + "train_loss": 5.002406215209961, + "train_acc": 0.01054, + "test_loss": 4.706539186859131, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 4.942916858382687, + "grad_max_sv": 4.443458986282349, + "grad_min_sv": 6.176679956948483e-08, + "grad_condition": 368514713.27491444, + "lr": 0.0009995614150494292, + "time_sec": 83.72638368606567 + }, + { + "epoch": 3, + "train_loss": 4.941021067657471, + "train_acc": 0.0102, + "test_loss": 4.685369007110595, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 4.551335199238429, + "grad_max_sv": 4.130530917644501, + "grad_min_sv": 5.607447592093085e-08, + "grad_condition": 379082253.2858798, + "lr": 0.0009990133642141358, + "time_sec": 83.7252631187439 + }, + { + "epoch": 4, + "train_loss": 4.901978406677246, + "train_acc": 0.00948, + "test_loss": 4.704164950561523, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 4.292365216371512, + "grad_max_sv": 3.9344047129154207, + "grad_min_sv": 5.476369089318922e-08, + "grad_condition": 96219244.721114, + "lr": 0.0009982464296247522, + "time_sec": 83.74504327774048 + }, + { + "epoch": 5, + "train_loss": 4.875739136657715, + "train_acc": 0.00976, + "test_loss": 4.67882677154541, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 4.102770691913926, + "grad_max_sv": 3.7305591464042664, + "grad_min_sv": 5.105303844121778e-08, + "grad_condition": 114422829.17041938, + "lr": 0.0009972609476841367, + "time_sec": 83.7535228729248 + }, + { + "epoch": 6, + "train_loss": 4.854646638641357, + "train_acc": 0.01, + "test_loss": 4.6779319816589355, + "test_acc": 0.0094, + "lyapunov": null, + "grad_norm": 3.9533090018879022, + "grad_max_sv": 3.569680255651474, + "grad_min_sv": 4.9375477451096826e-08, + "grad_condition": 120982864.11796215, + "lr": 0.000996057350657239, + "time_sec": 83.76437997817993 + }, + { + "epoch": 7, + "train_loss": 4.843388534240723, + "train_acc": 0.0093, + "test_loss": 4.688051298522949, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 3.808254303294448, + "grad_max_sv": 3.401720005273819, + "grad_min_sv": 4.769865569742571e-08, + "grad_condition": 124322938.54178014, + "lr": 0.000994636166481494, + "time_sec": 83.73754358291626 + }, + { + "epoch": 8, + "train_loss": 4.831099078216552, + "train_acc": 0.0098, + "test_loss": 4.686168608093261, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 3.638633817460268, + "grad_max_sv": 3.29349827170372, + "grad_min_sv": 4.562366222038428e-08, + "grad_condition": 130991249.85200353, + "lr": 0.0009929980185352525, + "time_sec": 83.75114607810974 + }, + { + "epoch": 9, + "train_loss": 4.8127050201416015, + "train_acc": 0.01066, + "test_loss": 4.702382767486572, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 3.500656504897414, + "grad_max_sv": 3.2044365644454955, + "grad_min_sv": 4.392227098831691e-08, + "grad_condition": 228917141.42878217, + "lr": 0.0009911436253643444, + "time_sec": 83.75008654594421 + }, + { + "epoch": 10, + "train_loss": 4.809432870025635, + "train_acc": 0.00958, + "test_loss": 4.662561440277099, + "test_acc": 0.0105, + "lyapunov": null, + "grad_norm": 3.3981948131519792, + "grad_max_sv": 3.0618119478225707, + "grad_min_sv": 4.221159614070658e-08, + "grad_condition": 89285987.82360582, + "lr": 0.0009890738003669028, + "time_sec": 83.75357627868652 + }, + { + "epoch": 11, + "train_loss": 4.788434708251953, + "train_acc": 0.01052, + "test_loss": 4.672326850891113, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 3.239567320080417, + "grad_max_sv": 2.9396412312984466, + "grad_min_sv": 3.992155273024878e-08, + "grad_condition": 91783422.62374839, + "lr": 0.00098678945143658, + "time_sec": 83.73260736465454 + }, + { + "epoch": 12, + "train_loss": 4.779874237365723, + "train_acc": 0.01008, + "test_loss": 4.67001594543457, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 3.103566946411183, + "grad_max_sv": 2.861602544784546, + "grad_min_sv": 3.936066093057633e-08, + "grad_condition": 119851949.4663836, + "lr": 0.0009842915805643154, + "time_sec": 83.817462682724 + }, + { + "epoch": 13, + "train_loss": 4.770841501159668, + "train_acc": 0.00992, + "test_loss": 4.656426369476319, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 3.0009960370081323, + "grad_max_sv": 2.656493490934372, + "grad_min_sv": 3.707013069217946e-08, + "grad_condition": 498107586.22724324, + "lr": 0.000981581283398829, + "time_sec": 83.74097108840942 + }, + { + "epoch": 14, + "train_loss": 4.756785203857422, + "train_acc": 0.01042, + "test_loss": 4.675232955932617, + "test_acc": 0.0106, + "lyapunov": null, + "grad_norm": 2.8493309861575318, + "grad_max_sv": 2.5364737689495085, + "grad_min_sv": 3.586032745195311e-08, + "grad_condition": 113107959.8123773, + "lr": 0.0009786597487660333, + "time_sec": 83.73817372322083 + }, + { + "epoch": 15, + "train_loss": 4.754773846588135, + "train_acc": 0.00998, + "test_loss": 4.659816702270508, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 2.754495953066911, + "grad_max_sv": 2.477891582250595, + "grad_min_sv": 3.409575287799394e-08, + "grad_condition": 161602481.60469836, + "lr": 0.0009755282581475766, + "time_sec": 83.75961685180664 + }, + { + "epoch": 16, + "train_loss": 4.743301128997802, + "train_acc": 0.0101, + "test_loss": 4.649964485168457, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 2.6595920331694725, + "grad_max_sv": 2.3447550773620605, + "grad_min_sv": 3.222141393699474e-08, + "grad_condition": 183792258.0998055, + "lr": 0.0009721881851187403, + "time_sec": 83.78172135353088 + }, + { + "epoch": 17, + "train_loss": 4.733358394927978, + "train_acc": 0.01016, + "test_loss": 4.642168313598633, + "test_acc": 0.0103, + "lyapunov": null, + "grad_norm": 2.5896272478360634, + "grad_max_sv": 2.3136182010173796, + "grad_min_sv": 3.172710767995745e-08, + "grad_condition": 117247363.48613138, + "lr": 0.0009686409947459456, + "time_sec": 83.75683784484863 + }, + { + "epoch": 18, + "train_loss": 4.729640578918457, + "train_acc": 0.0106, + "test_loss": 4.654958557128906, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 2.5388744373274417, + "grad_max_sv": 2.2171274721622467, + "grad_min_sv": 3.0159331015910953e-08, + "grad_condition": 101838677.71373975, + "lr": 0.0009648882429441254, + "time_sec": 83.75490856170654 + }, + { + "epoch": 19, + "train_loss": 4.723793775634766, + "train_acc": 0.0104, + "test_loss": 4.653732388305664, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 2.4692592532468662, + "grad_max_sv": 2.1681156396865844, + "grad_min_sv": 2.978641970435847e-08, + "grad_condition": 233798757.5515837, + "lr": 0.00096093157579425, + "time_sec": 83.76724123954773 + }, + { + "epoch": 20, + "train_loss": 4.718724663238525, + "train_acc": 0.0102, + "test_loss": 4.649697755432129, + "test_acc": 0.0097, + "lyapunov": null, + "grad_norm": 2.427591699320917, + "grad_max_sv": 2.1466651976108553, + "grad_min_sv": 2.9465831946628997e-08, + "grad_condition": 88939856.59831895, + "lr": 0.0009567727288213001, + "time_sec": 83.74052405357361 + }, + { + "epoch": 21, + "train_loss": 4.712672980194092, + "train_acc": 0.01012, + "test_loss": 4.647871576690674, + "test_acc": 0.0094, + "lyapunov": null, + "grad_norm": 2.357057284901842, + "grad_max_sv": 2.1047394454479216, + "grad_min_sv": 2.8490478837239763e-08, + "grad_condition": 91579762.44536874, + "lr": 0.0009524135262330095, + "time_sec": 83.75857543945312 + }, + { + "epoch": 22, + "train_loss": 4.706978241882324, + "train_acc": 0.01024, + "test_loss": 4.648735240936279, + "test_acc": 0.0085, + "lyapunov": null, + "grad_norm": 2.2900045512493366, + "grad_max_sv": 2.081936264038086, + "grad_min_sv": 2.8080869171609457e-08, + "grad_condition": 136805304.6805451, + "lr": 0.0009478558801197061, + "time_sec": 83.75628423690796 + }, + { + "epoch": 23, + "train_loss": 4.700225740966797, + "train_acc": 0.00964, + "test_loss": 4.647530085754394, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 2.2107587083430276, + "grad_max_sv": 1.988323137164116, + "grad_min_sv": 2.6475746447984784e-08, + "grad_condition": 164008669.76777038, + "lr": 0.000943101789615607, + "time_sec": 83.77352237701416 + }, + { + "epoch": 24, + "train_loss": 4.692355620117188, + "train_acc": 0.0096, + "test_loss": 4.637314375305176, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 2.058860964349953, + "grad_max_sv": 1.8445529341697693, + "grad_min_sv": 2.4344878213344857e-08, + "grad_condition": 86439388.46384792, + "lr": 0.0009381533400219313, + "time_sec": 83.79498553276062 + }, + { + "epoch": 25, + "train_loss": 4.681464791564942, + "train_acc": 0.00928, + "test_loss": 4.623963987731933, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 1.887935665727307, + "grad_max_sv": 1.675812867283821, + "grad_min_sv": 2.197329014158589e-08, + "grad_condition": 136861974.56893334, + "lr": 0.0009330127018922189, + "time_sec": 83.75438261032104 + }, + { + "epoch": 26, + "train_loss": 4.666114781646728, + "train_acc": 0.00968, + "test_loss": 4.622957837677002, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 1.6987317795206707, + "grad_max_sv": 1.5008918464183807, + "grad_min_sv": 1.8850404182035874e-08, + "grad_condition": 396848763.8507156, + "lr": 0.000927682130080253, + "time_sec": 83.80677318572998 + }, + { + "epoch": 27, + "train_loss": 4.656886034545899, + "train_acc": 0.0103, + "test_loss": 4.618579483032226, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 1.49568981841554, + "grad_max_sv": 1.3568953216075896, + "grad_min_sv": 1.566217179560514e-08, + "grad_condition": 103503015.49660948, + "lr": 0.0009221639627510072, + "time_sec": 83.78064775466919 + }, + { + "epoch": 28, + "train_loss": 4.643399444732666, + "train_acc": 0.01056, + "test_loss": 4.614220301055909, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 1.3088039077662417, + "grad_max_sv": 1.1537246599793434, + "grad_min_sv": 1.2267503651797185e-08, + "grad_condition": 114843460.24858093, + "lr": 0.0009164606203550494, + "time_sec": 83.7792694568634 + }, + { + "epoch": 29, + "train_loss": 4.633547606048584, + "train_acc": 0.00896, + "test_loss": 4.611564260101319, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 1.0933490764935123, + "grad_max_sv": 0.9679391533136368, + "grad_min_sv": 7.642074995560522e-09, + "grad_condition": 804214751.6294578, + "lr": 0.0009105746045668516, + "time_sec": 83.83227157592773 + }, + { + "epoch": 30, + "train_loss": 4.624774245300293, + "train_acc": 0.00964, + "test_loss": 4.608921669769287, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.8837855695002744, + "grad_max_sv": 0.773915484547615, + "grad_min_sv": 2.366957635572509e-11, + "grad_condition": 237910863465.00665, + "lr": 0.0009045084971874733, + "time_sec": 83.80770468711853 + }, + { + "epoch": 31, + "train_loss": 4.618612337646485, + "train_acc": 0.01032, + "test_loss": 4.607751036071777, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.7415257832044893, + "grad_max_sv": 0.644972386956215, + "grad_min_sv": 3.660935201474329e-12, + "grad_condition": 261782379031.45782, + "lr": 0.0008982649590120977, + "time_sec": 83.79283952713013 + }, + { + "epoch": 32, + "train_loss": 4.616099582977295, + "train_acc": 0.0089, + "test_loss": 4.606554626464844, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.6524091899037507, + "grad_max_sv": 0.5655980415642261, + "grad_min_sv": 1.3079153537243355e-13, + "grad_condition": 507838982675.7344, + "lr": 0.0008918467286629196, + "time_sec": 83.77927327156067 + }, + { + "epoch": 33, + "train_loss": 4.613166402130127, + "train_acc": 0.00916, + "test_loss": 4.606206927490234, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.5720100552333853, + "grad_max_sv": 0.4838749781250954, + "grad_min_sv": 7.656531138726084e-14, + "grad_condition": 452556546253.1081, + "lr": 0.0008852566213878943, + "time_sec": 83.7956645488739 + }, + { + "epoch": 34, + "train_loss": 4.610275639953613, + "train_acc": 0.0096, + "test_loss": 4.605738200378418, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.4266452221992571, + "grad_max_sv": 0.36331126987934115, + "grad_min_sv": 5.44079975167954e-15, + "grad_condition": 361256197137.27747, + "lr": 0.000878497527825878, + "time_sec": 83.78154063224792 + }, + { + "epoch": 35, + "train_loss": 4.608961817626954, + "train_acc": 0.01014, + "test_loss": 4.605575282287598, + "test_acc": 0.0104, + "lyapunov": null, + "grad_norm": 0.32905926875005, + "grad_max_sv": 0.2839593421667814, + "grad_min_sv": 8.941027107756884e-17, + "grad_condition": 283933784815.36444, + "lr": 0.000871572412738697, + "time_sec": 83.76054668426514 + }, + { + "epoch": 36, + "train_loss": 4.608401114196777, + "train_acc": 0.00938, + "test_loss": 4.605348924255371, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 0.2743447711162471, + "grad_max_sv": 0.2315550185739994, + "grad_min_sv": 2.4262184593062427e-31, + "grad_condition": 231555018573.99936, + "lr": 0.0008644843137107055, + "time_sec": 83.76748013496399 + }, + { + "epoch": 37, + "train_loss": 4.6074152955627445, + "train_acc": 0.01014, + "test_loss": 4.605235860443115, + "test_acc": 0.0106, + "lyapunov": null, + "grad_norm": 0.22829204328314687, + "grad_max_sv": 0.19001176171004772, + "grad_min_sv": 0.0, + "grad_condition": 190011761710.0477, + "lr": 0.0008572363398164014, + "time_sec": 83.82857966423035 + }, + { + "epoch": 38, + "train_loss": 4.6074430204772945, + "train_acc": 0.00846, + "test_loss": 4.605340163421631, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2131689057955099, + "grad_max_sv": 0.17414189949631692, + "grad_min_sv": 0.0, + "grad_condition": 174141899496.3169, + "lr": 0.0008498316702566826, + "time_sec": 83.7941620349884 + }, + { + "epoch": 39, + "train_loss": 4.608160193786621, + "train_acc": 0.00878, + "test_loss": 4.605639952087403, + "test_acc": 0.009, + "lyapunov": null, + "grad_norm": 0.24317456921386985, + "grad_max_sv": 0.2019160557538271, + "grad_min_sv": 0.0, + "grad_condition": 201916055753.8271, + "lr": 0.0008422735529643442, + "time_sec": 83.80830645561218 + }, + { + "epoch": 40, + "train_loss": 4.606921190032959, + "train_acc": 0.00868, + "test_loss": 4.605219190216064, + "test_acc": 0.0097, + "lyapunov": null, + "grad_norm": 0.17887802551259574, + "grad_max_sv": 0.14444960467517376, + "grad_min_sv": 0.0, + "grad_condition": 144449604675.17377, + "lr": 0.0008345653031794289, + "time_sec": 83.76973342895508 + }, + { + "epoch": 41, + "train_loss": 4.606422245941162, + "train_acc": 0.00834, + "test_loss": 4.605222705078125, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.17289778065418965, + "grad_max_sv": 0.13819168899208306, + "grad_min_sv": 0.0, + "grad_condition": 138191688992.08307, + "lr": 0.0008267103019950526, + "time_sec": 83.74321436882019 + }, + { + "epoch": 42, + "train_loss": 4.606239071655273, + "train_acc": 0.01008, + "test_loss": 4.605207167053223, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.16994723888320276, + "grad_max_sv": 0.13730969540774823, + "grad_min_sv": 0.0, + "grad_condition": 137309695407.74821, + "lr": 0.0008187119948743447, + "time_sec": 83.7667281627655 + }, + { + "epoch": 43, + "train_loss": 4.606040752410888, + "train_acc": 0.00878, + "test_loss": 4.605204765319824, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.14038728911483775, + "grad_max_sv": 0.10907853152602912, + "grad_min_sv": 0.0, + "grad_condition": 109078531526.0291, + "lr": 0.000810573890139155, + "time_sec": 83.71949076652527 + }, + { + "epoch": 44, + "train_loss": 4.605822370910644, + "train_acc": 0.00892, + "test_loss": 4.605195722198486, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.11252097462442588, + "grad_max_sv": 0.05359459263272583, + "grad_min_sv": 0.0, + "grad_condition": 53594592632.72584, + "lr": 0.0008022995574311873, + "time_sec": 83.74685764312744 + }, + { + "epoch": 45, + "train_loss": 4.605744844055176, + "train_acc": 0.0091, + "test_loss": 4.605188182067871, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.09696133635132191, + "grad_max_sv": 0.02572248433716595, + "grad_min_sv": 0.0, + "grad_condition": 25722484337.16595, + "lr": 0.0007938926261462363, + "time_sec": 83.688485622406 + }, + { + "epoch": 46, + "train_loss": 4.605597140960693, + "train_acc": 0.00844, + "test_loss": 4.605181010437012, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.09018030151754076, + "grad_max_sv": 0.008408381370827556, + "grad_min_sv": 0.0, + "grad_condition": 8408381370.827555, + "lr": 0.0007853567838422158, + "time_sec": 83.6915934085846 + }, + { + "epoch": 47, + "train_loss": 4.605502964324951, + "train_acc": 0.00962, + "test_loss": 4.605176095581054, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.08904470683636952, + "grad_max_sv": 0.006156692747026682, + "grad_min_sv": 0.0, + "grad_condition": 6156692747.026682, + "lr": 0.0007766957746216719, + "time_sec": 83.68823766708374 + }, + { + "epoch": 48, + "train_loss": 4.605539189758301, + "train_acc": 0.00832, + "test_loss": 4.605174793243409, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.08881260926985375, + "grad_max_sv": 0.005750873032957316, + "grad_min_sv": 0.0, + "grad_condition": 5750873032.957315, + "lr": 0.0007679133974894982, + "time_sec": 83.71515822410583 + }, + { + "epoch": 49, + "train_loss": 4.605639272460937, + "train_acc": 0.00838, + "test_loss": 4.605174536132813, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.09166121492862447, + "grad_max_sv": 0.012213990930467844, + "grad_min_sv": 0.0, + "grad_condition": 12213990930.467844, + "lr": 0.000759013504686565, + "time_sec": 83.6816132068634 + }, + { + "epoch": 50, + "train_loss": 4.605558903808594, + "train_acc": 0.00886, + "test_loss": 4.605173831939697, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.09052173034897262, + "grad_max_sv": 0.015108420280739665, + "grad_min_sv": 0.0, + "grad_condition": 15108420280.739666, + "lr": 0.0007499999999999998, + "time_sec": 83.65550971031189 + }, + { + "epoch": 51, + "train_loss": 4.606378012390136, + "train_acc": 0.00982, + "test_loss": 4.605191948699951, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.13316554004595244, + "grad_max_sv": 0.08486739061772823, + "grad_min_sv": 5.639984459982783e-14, + "grad_condition": 78828935747.45195, + "lr": 0.0007408768370508575, + "time_sec": 83.73471426963806 + }, + { + "epoch": 52, + "train_loss": 4.548985960083008, + "train_acc": 0.01534, + "test_loss": 6.090479849243164, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.31291438549111006, + "grad_max_sv": 0.21921597719192504, + "grad_min_sv": 1.8728595782364096e-11, + "grad_condition": 72581711957.44724, + "lr": 0.0007316480175599307, + "time_sec": 83.83673882484436 + }, + { + "epoch": 53, + "train_loss": 4.517283289031982, + "train_acc": 0.01706, + "test_loss": 6.098530506896973, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.298946556890386, + "grad_max_sv": 0.21190068013966085, + "grad_min_sv": 3.1303262042079113e-12, + "grad_condition": 83525509037.16917, + "lr": 0.0007223175895924635, + "time_sec": 83.79953289031982 + }, + { + "epoch": 54, + "train_loss": 4.506922316894531, + "train_acc": 0.01826, + "test_loss": 6.029461811828614, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2872016386861535, + "grad_max_sv": 0.2001660715788603, + "grad_min_sv": 2.1477832165699736e-12, + "grad_condition": 93342369625.0347, + "lr": 0.0007128896457825361, + "time_sec": 83.83765316009521 + }, + { + "epoch": 55, + "train_loss": 4.500352125549316, + "train_acc": 0.01822, + "test_loss": 6.254561413574219, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2840675312383032, + "grad_max_sv": 0.19858233965933322, + "grad_min_sv": 2.2369640777182348e-12, + "grad_condition": 84452645725.82004, + "lr": 0.0007033683215378998, + "time_sec": 83.87366318702698 + }, + { + "epoch": 56, + "train_loss": 4.494334082946778, + "train_acc": 0.01898, + "test_loss": 6.176936679077149, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.28473204888904313, + "grad_max_sv": 0.20153928063809873, + "grad_min_sv": 2.5336075244057393e-12, + "grad_condition": 84473652713.76613, + "lr": 0.0006937577932260512, + "time_sec": 83.85195803642273 + }, + { + "epoch": 57, + "train_loss": 4.491042407073975, + "train_acc": 0.01962, + "test_loss": 6.597558038330078, + "test_acc": 0.009, + "lyapunov": null, + "grad_norm": 0.27666587557698485, + "grad_max_sv": 0.19496511965990065, + "grad_min_sv": 2.6691194986502985e-12, + "grad_condition": 76747509393.5625, + "lr": 0.0006840622763423388, + "time_sec": 83.8267707824707 + }, + { + "epoch": 58, + "train_loss": 4.48429320526123, + "train_acc": 0.0202, + "test_loss": 6.6381898071289065, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2720732789744726, + "grad_max_sv": 0.189533968269825, + "grad_min_sv": 2.6686336090421275e-12, + "grad_condition": 76958091069.54593, + "lr": 0.0006742860236609073, + "time_sec": 83.81882667541504 + }, + { + "epoch": 59, + "train_loss": 4.479027882080078, + "train_acc": 0.02112, + "test_loss": 6.593468840026856, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.28013135845208736, + "grad_max_sv": 0.1970901783555746, + "grad_min_sv": 3.427181970598606e-12, + "grad_condition": 77152467146.4727, + "lr": 0.0006644333233692913, + "time_sec": 83.80582737922668 + }, + { + "epoch": 60, + "train_loss": 4.455229897613525, + "train_acc": 0.02522, + "test_loss": 7.094032968139649, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2984456215457652, + "grad_max_sv": 0.20514705888926982, + "grad_min_sv": 1.3113472435618547e-11, + "grad_condition": 46710044351.44385, + "lr": 0.0006545084971874734, + "time_sec": 83.83238410949707 + }, + { + "epoch": 61, + "train_loss": 4.434012725677491, + "train_acc": 0.02664, + "test_loss": 7.727159403991699, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.31670091276798196, + "grad_max_sv": 0.22147773541510105, + "grad_min_sv": 2.0530699328249547e-10, + "grad_condition": 23070127911.0107, + "lr": 0.0006445158984722354, + "time_sec": 83.8679609298706 + }, + { + "epoch": 62, + "train_loss": 4.419747852783203, + "train_acc": 0.02636, + "test_loss": 7.459843544006348, + "test_acc": 0.0093, + "lyapunov": null, + "grad_norm": 0.3192666281191851, + "grad_max_sv": 0.22665422596037388, + "grad_min_sv": 2.7867287440722047e-10, + "grad_condition": 28668691596.510204, + "lr": 0.0006344599103076324, + "time_sec": 83.7790117263794 + }, + { + "epoch": 63, + "train_loss": 4.410167588043213, + "train_acc": 0.0297, + "test_loss": 6.561855883789063, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.30978499796993897, + "grad_max_sv": 0.21358359269797803, + "grad_min_sv": 1.0904945902848835e-10, + "grad_condition": 28758391079.590137, + "lr": 0.0006243449435824269, + "time_sec": 83.8552029132843 + }, + { + "epoch": 64, + "train_loss": 4.398182756958008, + "train_acc": 0.02932, + "test_loss": 7.0834544662475585, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.2981823968653719, + "grad_max_sv": 0.2038045074790716, + "grad_min_sv": 4.896934048336616e-10, + "grad_condition": 6480139621.348356, + "lr": 0.0006141754350553275, + "time_sec": 83.81044340133667 + }, + { + "epoch": 65, + "train_loss": 4.39155801651001, + "train_acc": 0.0299, + "test_loss": 6.743014807128906, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.2915326524043412, + "grad_max_sv": 0.19417541958391665, + "grad_min_sv": 1.18620941511223e-09, + "grad_condition": 1528876877.7676086, + "lr": 0.0006039558454088793, + "time_sec": 83.8169424533844 + }, + { + "epoch": 66, + "train_loss": 4.383871633453369, + "train_acc": 0.03122, + "test_loss": 6.343855700683593, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2920918221308499, + "grad_max_sv": 0.19423219338059425, + "grad_min_sv": 1.1915352001942714e-09, + "grad_condition": 890331184.9718037, + "lr": 0.000593690657292862, + "time_sec": 83.8088231086731 + }, + { + "epoch": 67, + "train_loss": 4.380996891784668, + "train_acc": 0.03214, + "test_loss": 6.3810079963684085, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.28877371474045604, + "grad_max_sv": 0.193271204829216, + "grad_min_sv": 1.6600884500828778e-09, + "grad_condition": 372383180.6138096, + "lr": 0.0005833843733580507, + "time_sec": 83.78432846069336 + }, + { + "epoch": 68, + "train_loss": 4.376522983703613, + "train_acc": 0.0316, + "test_loss": 6.291935075378418, + "test_acc": 0.0103, + "lyapunov": null, + "grad_norm": 0.2862661185936042, + "grad_max_sv": 0.18648179918527602, + "grad_min_sv": 1.468030542869361e-09, + "grad_condition": 2139805441.5710232, + "lr": 0.0005730415142812054, + "time_sec": 83.7891354560852 + }, + { + "epoch": 69, + "train_loss": 4.372224440612793, + "train_acc": 0.03352, + "test_loss": 6.681443427276611, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2796495478797956, + "grad_max_sv": 0.18046599105000496, + "grad_min_sv": 1.2168376441450828e-09, + "grad_condition": 721985908.0902131, + "lr": 0.0005626666167821517, + "time_sec": 83.80607604980469 + }, + { + "epoch": 70, + "train_loss": 4.369470675811767, + "train_acc": 0.03222, + "test_loss": 6.483533153533935, + "test_acc": 0.0103, + "lyapunov": null, + "grad_norm": 0.28218706578232045, + "grad_max_sv": 0.18038711175322533, + "grad_min_sv": 1.6886237430915884e-09, + "grad_condition": 284801174.2502399, + "lr": 0.0005522642316338265, + "time_sec": 83.80915093421936 + }, + { + "epoch": 71, + "train_loss": 4.36190840423584, + "train_acc": 0.03452, + "test_loss": 6.448402415466308, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.27607671132097, + "grad_max_sv": 0.17782694809138774, + "grad_min_sv": 1.594215062207787e-09, + "grad_condition": 2097996064.0572019, + "lr": 0.0005418389216661573, + "time_sec": 83.82332372665405 + }, + { + "epoch": 72, + "train_loss": 4.354908424377442, + "train_acc": 0.03596, + "test_loss": 6.558257571411133, + "test_acc": 0.0115, + "lyapunov": null, + "grad_norm": 0.2756995722839523, + "grad_max_sv": 0.16976643167436123, + "grad_min_sv": 1.6113121665065067e-09, + "grad_condition": 277986841.7750164, + "lr": 0.0005313952597646563, + "time_sec": 83.79193758964539 + }, + { + "epoch": 73, + "train_loss": 4.354222341156006, + "train_acc": 0.03476, + "test_loss": 6.309269012451172, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.26842599931569244, + "grad_max_sv": 0.1654328290373087, + "grad_min_sv": 1.5355291571898453e-09, + "grad_condition": 494546718.69761646, + "lr": 0.0005209378268645994, + "time_sec": 83.83719944953918 + }, + { + "epoch": 74, + "train_loss": 4.348915999755859, + "train_acc": 0.03656, + "test_loss": 6.48945037689209, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.2721751559070442, + "grad_max_sv": 0.1733177002519369, + "grad_min_sv": 1.6353850840794179e-09, + "grad_condition": 4394906218.143788, + "lr": 0.0005104712099416781, + "time_sec": 83.87231683731079 + }, + { + "epoch": 75, + "train_loss": 4.344389753723145, + "train_acc": 0.0362, + "test_loss": 6.536355171203613, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.2762971427042467, + "grad_max_sv": 0.17327322103083134, + "grad_min_sv": 1.6745484680748961e-09, + "grad_condition": 296861622.65127766, + "lr": 0.0004999999999999996, + "time_sec": 83.7963707447052 + }, + { + "epoch": 76, + "train_loss": 4.336879919433594, + "train_acc": 0.0385, + "test_loss": 6.207801509094239, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.27617831363540746, + "grad_max_sv": 0.17525496631860732, + "grad_min_sv": 1.712406004191272e-09, + "grad_condition": 355194777.2860588, + "lr": 0.0004895287900583212, + "time_sec": 83.78706455230713 + }, + { + "epoch": 77, + "train_loss": 4.334291800689697, + "train_acc": 0.03816, + "test_loss": 5.998904524230957, + "test_acc": 0.0103, + "lyapunov": null, + "grad_norm": 0.27646822759404405, + "grad_max_sv": 0.17449169531464576, + "grad_min_sv": 1.7281031508770487e-09, + "grad_condition": 617370975.1793921, + "lr": 0.0004790621731353997, + "time_sec": 83.79909944534302 + }, + { + "epoch": 78, + "train_loss": 4.33249505783081, + "train_acc": 0.0375, + "test_loss": 6.079836444854736, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.28240731905667205, + "grad_max_sv": 0.17906831130385398, + "grad_min_sv": 1.832980646302232e-09, + "grad_condition": 570608704.9054655, + "lr": 0.000468604740235343, + "time_sec": 83.78829288482666 + }, + { + "epoch": 79, + "train_loss": 4.327211993713379, + "train_acc": 0.0372, + "test_loss": 6.010349069976806, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.26579955843267283, + "grad_max_sv": 0.16206405386328698, + "grad_min_sv": 1.8076382385400804e-09, + "grad_condition": 680257720.1741323, + "lr": 0.00045816107833384175, + "time_sec": 83.79378890991211 + }, + { + "epoch": 80, + "train_loss": 4.325840251617431, + "train_acc": 0.0399, + "test_loss": 6.453493260192871, + "test_acc": 0.0104, + "lyapunov": null, + "grad_norm": 0.2678340843927439, + "grad_max_sv": 0.16088486537337304, + "grad_min_sv": 1.8230197001067525e-09, + "grad_condition": 491813566.00292075, + "lr": 0.0004477357683661729, + "time_sec": 83.77716493606567 + }, + { + "epoch": 81, + "train_loss": 4.324064207763672, + "train_acc": 0.03872, + "test_loss": 6.066691808319092, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.27284601483817317, + "grad_max_sv": 0.1656409576535225, + "grad_min_sv": 1.966192943528289e-09, + "grad_condition": 120565010.54568236, + "lr": 0.00043733338321784746, + "time_sec": 83.78050255775452 + }, + { + "epoch": 82, + "train_loss": 4.3167226469421385, + "train_acc": 0.04004, + "test_loss": 6.479253450012207, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.266468676835963, + "grad_max_sv": 0.16226925253868102, + "grad_min_sv": 1.8786357255094232e-09, + "grad_condition": 832620477.3818345, + "lr": 0.0004269584857187939, + "time_sec": 83.77594256401062 + }, + { + "epoch": 83, + "train_loss": 4.314026451263428, + "train_acc": 0.04066, + "test_loss": 6.491674769592285, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2618645063357135, + "grad_max_sv": 0.15328656397759916, + "grad_min_sv": 1.8954250842473375e-09, + "grad_condition": 324046081.6731597, + "lr": 0.0004166156266419484, + "time_sec": 83.79970407485962 + }, + { + "epoch": 84, + "train_loss": 4.307831993713379, + "train_acc": 0.04056, + "test_loss": 6.641959228515625, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 0.2686563253168225, + "grad_max_sv": 0.16125894524157047, + "grad_min_sv": 2.0374150564578254e-09, + "grad_condition": 160522665.97837877, + "lr": 0.0004063093427071373, + "time_sec": 83.82930493354797 + }, + { + "epoch": 85, + "train_loss": 4.308941020507812, + "train_acc": 0.0418, + "test_loss": 6.508579216003418, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 0.27160717763788633, + "grad_max_sv": 0.1655819222331047, + "grad_min_sv": 2.023065160186577e-09, + "grad_condition": 120462376.21506557, + "lr": 0.0003960441545911199, + "time_sec": 83.7900025844574 + }, + { + "epoch": 86, + "train_loss": 4.304050233764649, + "train_acc": 0.03994, + "test_loss": 6.396804527282715, + "test_acc": 0.0107, + "lyapunov": null, + "grad_norm": 0.2729810873547816, + "grad_max_sv": 0.16440293304622172, + "grad_min_sv": 2.151508744253905e-09, + "grad_condition": 132130608.9556226, + "lr": 0.0003858245649446718, + "time_sec": 83.80140709877014 + }, + { + "epoch": 87, + "train_loss": 4.299405968475342, + "train_acc": 0.04196, + "test_loss": 6.600989144897461, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2695479470251096, + "grad_max_sv": 0.1591991312801838, + "grad_min_sv": 1.9906060319194175e-09, + "grad_condition": 119698677.25192289, + "lr": 0.00037565505641757235, + "time_sec": 83.82861065864563 + }, + { + "epoch": 88, + "train_loss": 4.301599495544433, + "train_acc": 0.04232, + "test_loss": 6.554762725830078, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2647703969850391, + "grad_max_sv": 0.15560886412858962, + "grad_min_sv": 1.9747980002995937e-09, + "grad_condition": 122983202.1326602, + "lr": 0.00036554008969236695, + "time_sec": 83.82960343360901 + }, + { + "epoch": 89, + "train_loss": 4.297747989654541, + "train_acc": 0.04348, + "test_loss": 6.357062748718262, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.26734470016505596, + "grad_max_sv": 0.15722180251032114, + "grad_min_sv": 1.981925610086699e-09, + "grad_condition": 100233762.481437, + "lr": 0.0003554841015277638, + "time_sec": 83.85219097137451 + }, + { + "epoch": 90, + "train_loss": 4.294689517669678, + "train_acc": 0.04346, + "test_loss": 6.4904538467407225, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.26448991829060364, + "grad_max_sv": 0.1514646142721176, + "grad_min_sv": 2.0380848893969404e-09, + "grad_condition": 115297831.8608543, + "lr": 0.000345491502812526, + "time_sec": 83.78560423851013 + }, + { + "epoch": 91, + "train_loss": 4.288459105834961, + "train_acc": 0.04228, + "test_loss": 6.363833187866211, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2716021382283501, + "grad_max_sv": 0.16101026125252246, + "grad_min_sv": 2.0529807125135857e-09, + "grad_condition": 111422037.25124231, + "lr": 0.0003355666766307081, + "time_sec": 83.80491185188293 + }, + { + "epoch": 92, + "train_loss": 4.2877139868164065, + "train_acc": 0.04416, + "test_loss": 6.387586988067627, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2675364217657968, + "grad_max_sv": 0.1556147363036871, + "grad_min_sv": 2.072003611047757e-09, + "grad_condition": 100163844.77093126, + "lr": 0.00032571397633909225, + "time_sec": 83.80176591873169 + }, + { + "epoch": 93, + "train_loss": 4.286743914489746, + "train_acc": 0.04442, + "test_loss": 6.614454327392578, + "test_acc": 0.0097, + "lyapunov": null, + "grad_norm": 0.2696169338715711, + "grad_max_sv": 0.1587842211127281, + "grad_min_sv": 2.1451849420948964e-09, + "grad_condition": 175440678.68888003, + "lr": 0.00031593772365766094, + "time_sec": 83.81897950172424 + }, + { + "epoch": 94, + "train_loss": 4.281456643066406, + "train_acc": 0.04426, + "test_loss": 6.365528283691407, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.27294877944821766, + "grad_max_sv": 0.16244313083589076, + "grad_min_sv": 2.1448280498881368e-09, + "grad_condition": 93958550.86214396, + "lr": 0.0003062422067739483, + "time_sec": 83.78250980377197 + }, + { + "epoch": 95, + "train_loss": 4.280488971710205, + "train_acc": 0.04608, + "test_loss": 6.470796231842041, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 0.273056993639001, + "grad_max_sv": 0.16184688359498978, + "grad_min_sv": 2.2206805599250813e-09, + "grad_condition": 185414259.9896317, + "lr": 0.00029663167846209965, + "time_sec": 83.82439541816711 + }, + { + "epoch": 96, + "train_loss": 4.279716082458496, + "train_acc": 0.04314, + "test_loss": 6.52447133026123, + "test_acc": 0.0093, + "lyapunov": null, + "grad_norm": 0.27442923945512043, + "grad_max_sv": 0.1630928661674261, + "grad_min_sv": 2.3233001415073897e-09, + "grad_condition": 103462231.52886583, + "lr": 0.00028711035421746345, + "time_sec": 83.83807969093323 + }, + { + "epoch": 97, + "train_loss": 4.274856643218994, + "train_acc": 0.04572, + "test_loss": 6.772166311645508, + "test_acc": 0.0109, + "lyapunov": null, + "grad_norm": 0.2771278283509764, + "grad_max_sv": 0.17104111909866332, + "grad_min_sv": 2.4184343061159352e-09, + "grad_condition": 271014828.3038153, + "lr": 0.00027768241040753615, + "time_sec": 83.85514092445374 + }, + { + "epoch": 98, + "train_loss": 4.2779387315368655, + "train_acc": 0.04608, + "test_loss": 6.668636999511719, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.27463112819076785, + "grad_max_sv": 0.16144732832908631, + "grad_min_sv": 2.2677979229649758e-09, + "grad_condition": 4419130655.463402, + "lr": 0.00026835198244006903, + "time_sec": 83.83084058761597 + }, + { + "epoch": 99, + "train_loss": 4.276140930480957, + "train_acc": 0.04544, + "test_loss": 6.88837735748291, + "test_acc": 0.0107, + "lyapunov": null, + "grad_norm": 0.26886350994697167, + "grad_max_sv": 0.15219354666769505, + "grad_min_sv": 2.2166218230715296e-09, + "grad_condition": 103754705.283932, + "lr": 0.0002591231629491421, + "time_sec": 83.79713916778564 + }, + { + "epoch": 100, + "train_loss": 4.273054361877441, + "train_acc": 0.04564, + "test_loss": 6.783898326873779, + "test_acc": 0.0106, + "lyapunov": null, + "grad_norm": 0.26691489320326656, + "grad_max_sv": 0.14936545640230178, + "grad_min_sv": 2.2781338981925358e-09, + "grad_condition": 87358992.35708968, + "lr": 0.0002499999999999997, + "time_sec": 83.80319023132324 + }, + { + "epoch": 101, + "train_loss": 4.26914766998291, + "train_acc": 0.04564, + "test_loss": 6.513159948730468, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.26611169562468134, + "grad_max_sv": 0.15025373138487338, + "grad_min_sv": 2.2174503035848892e-09, + "grad_condition": 96439723.92469814, + "lr": 0.00024098649531343477, + "time_sec": 83.83437013626099 + }, + { + "epoch": 102, + "train_loss": 4.26979032119751, + "train_acc": 0.04642, + "test_loss": 6.493202007293701, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.26813810856759995, + "grad_max_sv": 0.1489817149937153, + "grad_min_sv": 2.380725915018811e-09, + "grad_condition": 76215277.93021134, + "lr": 0.0002320866025105016, + "time_sec": 83.80248379707336 + }, + { + "epoch": 103, + "train_loss": 4.260873723297119, + "train_acc": 0.04782, + "test_loss": 6.493594526672363, + "test_acc": 0.0111, + "lyapunov": null, + "grad_norm": 0.2688305350715821, + "grad_max_sv": 0.1512874387204647, + "grad_min_sv": 2.453062892919522e-09, + "grad_condition": 134347199.1051014, + "lr": 0.0002233042253783278, + "time_sec": 83.81874346733093 + }, + { + "epoch": 104, + "train_loss": 4.262198150939941, + "train_acc": 0.04738, + "test_loss": 6.605858857727051, + "test_acc": 0.0103, + "lyapunov": null, + "grad_norm": 0.27225916391154686, + "grad_max_sv": 0.15373125690966843, + "grad_min_sv": 2.44866176035783e-09, + "grad_condition": 419013949.5031613, + "lr": 0.000214643216157784, + "time_sec": 84.03694415092468 + }, + { + "epoch": 105, + "train_loss": 4.262576495056153, + "train_acc": 0.04672, + "test_loss": 6.746639459991455, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.2762952402363064, + "grad_max_sv": 0.15909811817109584, + "grad_min_sv": 2.4671919398103204e-09, + "grad_condition": 139499125.202051, + "lr": 0.00020610737385376332, + "time_sec": 83.83756351470947 + }, + { + "epoch": 106, + "train_loss": 4.256981732330322, + "train_acc": 0.04834, + "test_loss": 6.714322766113281, + "test_acc": 0.0106, + "lyapunov": null, + "grad_norm": 0.27463124817104645, + "grad_max_sv": 0.15689255371689798, + "grad_min_sv": 2.5142482939360944e-09, + "grad_condition": 118433721.44138017, + "lr": 0.00019770044256881242, + "time_sec": 83.83591985702515 + }, + { + "epoch": 107, + "train_loss": 4.2602463818359375, + "train_acc": 0.04698, + "test_loss": 6.657286577606201, + "test_acc": 0.0109, + "lyapunov": null, + "grad_norm": 0.2689041932222791, + "grad_max_sv": 0.15177576132118703, + "grad_min_sv": 2.4187723310364893e-09, + "grad_condition": 94992794.34351222, + "lr": 0.0001894261098608447, + "time_sec": 83.80453681945801 + }, + { + "epoch": 108, + "train_loss": 4.2544874598693845, + "train_acc": 0.04844, + "test_loss": 6.59372087097168, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.2710712522794079, + "grad_max_sv": 0.15038638189435005, + "grad_min_sv": 2.514627481589593e-09, + "grad_condition": 93107492.33691652, + "lr": 0.000181288005125655, + "time_sec": 83.77546954154968 + }, + { + "epoch": 109, + "train_loss": 4.253146978759766, + "train_acc": 0.04824, + "test_loss": 6.575524732208252, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 0.2727669683249611, + "grad_max_sv": 0.15002147294580936, + "grad_min_sv": 2.4739045799762604e-09, + "grad_condition": 125566166.74099617, + "lr": 0.0001732896980049473, + "time_sec": 83.82711911201477 + }, + { + "epoch": 110, + "train_loss": 4.250933767089844, + "train_acc": 0.04966, + "test_loss": 6.632392105102539, + "test_acc": 0.011, + "lyapunov": null, + "grad_norm": 0.27898350710296843, + "grad_max_sv": 0.15593392103910447, + "grad_min_sv": 2.5894539202545724e-09, + "grad_condition": 625752503.9437258, + "lr": 0.00016543469682057076, + "time_sec": 83.74293255805969 + }, + { + "epoch": 111, + "train_loss": 4.24997673614502, + "train_acc": 0.04972, + "test_loss": 6.568419965362549, + "test_acc": 0.0109, + "lyapunov": null, + "grad_norm": 0.27772763472261885, + "grad_max_sv": 0.15495621263980866, + "grad_min_sv": 2.661621495425592e-09, + "grad_condition": 70119073.46937823, + "lr": 0.00015772644703565552, + "time_sec": 83.79197788238525 + }, + { + "epoch": 112, + "train_loss": 4.249247148590088, + "train_acc": 0.0507, + "test_loss": 6.707973278045654, + "test_acc": 0.0093, + "lyapunov": null, + "grad_norm": 0.27686969610418316, + "grad_max_sv": 0.15229813233017922, + "grad_min_sv": 2.662702908856618e-09, + "grad_condition": 153958977.83635777, + "lr": 0.00015016832974331713, + "time_sec": 83.80273818969727 + }, + { + "epoch": 113, + "train_loss": 4.250667928771973, + "train_acc": 0.0492, + "test_loss": 6.8461118530273435, + "test_acc": 0.0096, + "lyapunov": null, + "grad_norm": 0.28055092675814575, + "grad_max_sv": 0.1576558079570532, + "grad_min_sv": 2.742332778221668e-09, + "grad_condition": 137456876.77179033, + "lr": 0.00014276366018359834, + "time_sec": 83.80364871025085 + }, + { + "epoch": 114, + "train_loss": 4.2449106436157225, + "train_acc": 0.05016, + "test_loss": 6.787322373962402, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.27979119322019597, + "grad_max_sv": 0.15479157418012618, + "grad_min_sv": 2.6695785599467614e-09, + "grad_condition": 81382647.58523288, + "lr": 0.00013551568628929425, + "time_sec": 83.82229542732239 + }, + { + "epoch": 115, + "train_loss": 4.244952727355957, + "train_acc": 0.05002, + "test_loss": 6.741559551239014, + "test_acc": 0.0092, + "lyapunov": null, + "grad_norm": 0.2773863197316903, + "grad_max_sv": 0.15171751268208028, + "grad_min_sv": 2.682797061023465e-09, + "grad_condition": 212074169.4590431, + "lr": 0.00012842758726130276, + "time_sec": 83.82812428474426 + }, + { + "epoch": 116, + "train_loss": 4.242339648132324, + "train_acc": 0.04982, + "test_loss": 6.755374185180664, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2805527611657844, + "grad_max_sv": 0.1574402242898941, + "grad_min_sv": 2.8019030511548804e-09, + "grad_condition": 238625880.71394747, + "lr": 0.0001215024721741218, + "time_sec": 83.79120373725891 + }, + { + "epoch": 117, + "train_loss": 4.240206247253418, + "train_acc": 0.04966, + "test_loss": 6.836046894073486, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.2758039178422697, + "grad_max_sv": 0.1517912581562996, + "grad_min_sv": 2.68810798897956e-09, + "grad_condition": 72825643.14736441, + "lr": 0.00011474337861210538, + "time_sec": 83.7668628692627 + }, + { + "epoch": 118, + "train_loss": 4.2366791255187985, + "train_acc": 0.05162, + "test_loss": 6.8930122108459475, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.28097411795628907, + "grad_max_sv": 0.15138982199132442, + "grad_min_sv": 2.6724390362123373e-09, + "grad_condition": 105031519.49257562, + "lr": 0.00010815327133708009, + "time_sec": 83.7777681350708 + }, + { + "epoch": 119, + "train_loss": 4.239317052307129, + "train_acc": 0.05098, + "test_loss": 6.895288885498047, + "test_acc": 0.0107, + "lyapunov": null, + "grad_norm": 0.28557653268704064, + "grad_max_sv": 0.15877793319523334, + "grad_min_sv": 2.852896488665657e-09, + "grad_condition": 130124221.77470978, + "lr": 0.00010173504098790182, + "time_sec": 83.770183801651 + }, + { + "epoch": 120, + "train_loss": 4.238326491088867, + "train_acc": 0.04944, + "test_loss": 6.971952970123291, + "test_acc": 0.0116, + "lyapunov": null, + "grad_norm": 0.28330987147198217, + "grad_max_sv": 0.15257025621831416, + "grad_min_sv": 2.890761002100062e-09, + "grad_condition": 92481164.9877267, + "lr": 9.549150281252629e-05, + "time_sec": 83.78682947158813 + }, + { + "epoch": 121, + "train_loss": 4.238821759033203, + "train_acc": 0.05118, + "test_loss": 6.903655708312988, + "test_acc": 0.0107, + "lyapunov": null, + "grad_norm": 0.2844816880687477, + "grad_max_sv": 0.15047130659222602, + "grad_min_sv": 2.9364908977515257e-09, + "grad_condition": 155468550.15943855, + "lr": 8.942539543314794e-05, + "time_sec": 83.74171853065491 + }, + { + "epoch": 122, + "train_loss": 4.231929050292969, + "train_acc": 0.05106, + "test_loss": 6.9859304649353025, + "test_acc": 0.011, + "lyapunov": null, + "grad_norm": 0.28661742540946805, + "grad_max_sv": 0.15440320819616318, + "grad_min_sv": 3.0144829410438945e-09, + "grad_condition": 58782400.13901849, + "lr": 8.353937964495024e-05, + "time_sec": 83.77999758720398 + }, + { + "epoch": 123, + "train_loss": 4.234138116607666, + "train_acc": 0.05334, + "test_loss": 6.891355895996094, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.28893265325047696, + "grad_max_sv": 0.15679317489266395, + "grad_min_sv": 3.0731328568706083e-09, + "grad_condition": 83816649.99544896, + "lr": 7.783603724899243e-05, + "time_sec": 83.76851487159729 + }, + { + "epoch": 124, + "train_loss": 4.229343013763428, + "train_acc": 0.05258, + "test_loss": 7.009951159667969, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.2863743887145036, + "grad_max_sv": 0.15191952474415302, + "grad_min_sv": 3.0230644397499785e-09, + "grad_condition": 211100331.6657278, + "lr": 7.231786991974666e-05, + "time_sec": 83.76139807701111 + }, + { + "epoch": 125, + "train_loss": 4.232501866760254, + "train_acc": 0.05186, + "test_loss": 6.96674277420044, + "test_acc": 0.0111, + "lyapunov": null, + "grad_norm": 0.2858550264764349, + "grad_max_sv": 0.15213587880134583, + "grad_min_sv": 3.046650505489357e-09, + "grad_condition": 63383717.426429704, + "lr": 6.698729810778072e-05, + "time_sec": 83.78086757659912 + }, + { + "epoch": 126, + "train_loss": 4.229700404968262, + "train_acc": 0.0524, + "test_loss": 7.008199283599853, + "test_acc": 0.0097, + "lyapunov": null, + "grad_norm": 0.2850115287876514, + "grad_max_sv": 0.14953349605202676, + "grad_min_sv": 2.9821331362644977e-09, + "grad_condition": 76613514.19037959, + "lr": 6.184665997806817e-05, + "time_sec": 83.765873670578 + }, + { + "epoch": 127, + "train_loss": 4.226065429992675, + "train_acc": 0.05148, + "test_loss": 6.9513890808105465, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.28929346428701186, + "grad_max_sv": 0.15673540011048318, + "grad_min_sv": 3.046475822998662e-09, + "grad_condition": 68840265.65077923, + "lr": 5.6898210384392595e-05, + "time_sec": 83.76980423927307 + }, + { + "epoch": 128, + "train_loss": 4.223751395874023, + "train_acc": 0.05446, + "test_loss": 6.981657604980469, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2886516286895676, + "grad_max_sv": 0.15273929238319398, + "grad_min_sv": 3.0959206469283186e-09, + "grad_condition": 61503758.19812535, + "lr": 5.214411988029363e-05, + "time_sec": 83.77617073059082 + }, + { + "epoch": 129, + "train_loss": 4.223811264648438, + "train_acc": 0.05404, + "test_loss": 6.9342261474609375, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.2869141420134922, + "grad_max_sv": 0.15136036798357963, + "grad_min_sv": 3.047223613023009e-09, + "grad_condition": 97351366.2154063, + "lr": 4.7586473766990294e-05, + "time_sec": 83.78148245811462 + }, + { + "epoch": 130, + "train_loss": 4.224827704467773, + "train_acc": 0.0532, + "test_loss": 7.028645568084717, + "test_acc": 0.0097, + "lyapunov": null, + "grad_norm": 0.2903989310802725, + "grad_max_sv": 0.15144419111311436, + "grad_min_sv": 3.1437888660390544e-09, + "grad_condition": 118830904.24527971, + "lr": 4.32272711786996e-05, + "time_sec": 83.79948663711548 + }, + { + "epoch": 131, + "train_loss": 4.221605782775879, + "train_acc": 0.05298, + "test_loss": 6.999451491546631, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.29092754210208693, + "grad_max_sv": 0.15410602577030658, + "grad_min_sv": 3.2033975992662445e-09, + "grad_condition": 57038304.52076046, + "lr": 3.906842420574966e-05, + "time_sec": 83.77110433578491 + }, + { + "epoch": 132, + "train_loss": 4.218992453613281, + "train_acc": 0.05284, + "test_loss": 7.0255691505432125, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.2914825249386215, + "grad_max_sv": 0.15589108187705278, + "grad_min_sv": 3.206146753816086e-09, + "grad_condition": 122587816.51957992, + "lr": 3.5111757055874305e-05, + "time_sec": 83.75379085540771 + }, + { + "epoch": 133, + "train_loss": 4.220229903869629, + "train_acc": 0.05394, + "test_loss": 6.9970667213439945, + "test_acc": 0.0106, + "lyapunov": null, + "grad_norm": 0.293170941298062, + "grad_max_sv": 0.15195444263517857, + "grad_min_sv": 3.1603012576666978e-09, + "grad_condition": 99833022.93899234, + "lr": 3.1359005254054254e-05, + "time_sec": 83.83364748954773 + }, + { + "epoch": 134, + "train_loss": 4.221537724761963, + "train_acc": 0.05412, + "test_loss": 7.081800342559815, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.29192289713649316, + "grad_max_sv": 0.1527898743748665, + "grad_min_sv": 3.242900753486211e-09, + "grad_condition": 53839731.29661299, + "lr": 2.7811814881259484e-05, + "time_sec": 83.77570366859436 + }, + { + "epoch": 135, + "train_loss": 4.224225687103272, + "train_acc": 0.0536, + "test_loss": 7.031653879547119, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.2928013245487039, + "grad_max_sv": 0.15023601055145264, + "grad_min_sv": 3.1499084042485583e-09, + "grad_condition": 56443800.83675871, + "lr": 2.4471741852423218e-05, + "time_sec": 83.79031038284302 + }, + { + "epoch": 136, + "train_loss": 4.2209420147705075, + "train_acc": 0.05542, + "test_loss": 7.0730202087402345, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.29383612459846997, + "grad_max_sv": 0.1526225544512272, + "grad_min_sv": 3.216327003211297e-09, + "grad_condition": 488112741.3165139, + "lr": 2.1340251233966362e-05, + "time_sec": 83.78721952438354 + }, + { + "epoch": 137, + "train_loss": 4.217904202728271, + "train_acc": 0.0547, + "test_loss": 7.029183413696289, + "test_acc": 0.0097, + "lyapunov": null, + "grad_norm": 0.29146081115101274, + "grad_max_sv": 0.14856699295341969, + "grad_min_sv": 3.193107374344084e-09, + "grad_condition": 54362425.00069554, + "lr": 1.8418716601170932e-05, + "time_sec": 83.76650714874268 + }, + { + "epoch": 138, + "train_loss": 4.222578598480225, + "train_acc": 0.05248, + "test_loss": 7.08011364440918, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.29305556036271213, + "grad_max_sv": 0.1505037024617195, + "grad_min_sv": 3.2047648587836542e-09, + "grad_condition": 326741808.1820611, + "lr": 1.570841943568445e-05, + "time_sec": 83.7816994190216 + }, + { + "epoch": 139, + "train_loss": 4.218749967193603, + "train_acc": 0.05366, + "test_loss": 7.0575081214904785, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.29397952766323676, + "grad_max_sv": 0.148932196572423, + "grad_min_sv": 3.2381111236823303e-09, + "grad_condition": 52412171.837261274, + "lr": 1.3210548563419845e-05, + "time_sec": 83.8086462020874 + }, + { + "epoch": 140, + "train_loss": 4.217845681304931, + "train_acc": 0.05502, + "test_loss": 7.102373625946045, + "test_acc": 0.0104, + "lyapunov": null, + "grad_norm": 0.2935367604869691, + "grad_max_sv": 0.14902403093874456, + "grad_min_sv": 3.2832004351335264e-09, + "grad_condition": 52749321.36829077, + "lr": 1.0926199633097203e-05, + "time_sec": 83.79147672653198 + }, + { + "epoch": 141, + "train_loss": 4.214903557434082, + "train_acc": 0.05414, + "test_loss": 7.033845091247558, + "test_acc": 0.0097, + "lyapunov": null, + "grad_norm": 0.29612387661640516, + "grad_max_sv": 0.15556762106716632, + "grad_min_sv": 3.2642252397602213e-09, + "grad_condition": 123272892.75406721, + "lr": 8.856374635655688e-06, + "time_sec": 83.81054306030273 + }, + { + "epoch": 142, + "train_loss": 4.215419233093262, + "train_acc": 0.05478, + "test_loss": 7.08431992111206, + "test_acc": 0.0097, + "lyapunov": null, + "grad_norm": 0.29494037543034185, + "grad_max_sv": 0.15155189596116542, + "grad_min_sv": 3.2587884789964106e-09, + "grad_condition": 76214087.81495127, + "lr": 7.001981464747503e-06, + "time_sec": 83.78057074546814 + }, + { + "epoch": 143, + "train_loss": 4.217841682281494, + "train_acc": 0.05398, + "test_loss": 7.037088000488281, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.2932160255751842, + "grad_max_sv": 0.14940347485244274, + "grad_min_sv": 3.258327102573233e-09, + "grad_condition": 73149202.84067681, + "lr": 5.3638335185058295e-06, + "time_sec": 83.79549980163574 + }, + { + "epoch": 144, + "train_loss": 4.215883382873535, + "train_acc": 0.0537, + "test_loss": 7.091348276519775, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 0.2950445450440956, + "grad_max_sv": 0.153789921104908, + "grad_min_sv": 3.312160905266648e-09, + "grad_condition": 52811849.90694652, + "lr": 3.942649342761114e-06, + "time_sec": 83.8086678981781 + }, + { + "epoch": 145, + "train_loss": 4.2175880349731445, + "train_acc": 0.05522, + "test_loss": 7.115469957733154, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 0.29403172002116806, + "grad_max_sv": 0.15080158710479735, + "grad_min_sv": 3.237252350907216e-09, + "grad_condition": 52283776.27412096, + "lr": 2.7390523158633524e-06, + "time_sec": 83.78764986991882 + }, + { + "epoch": 146, + "train_loss": 4.211100564270019, + "train_acc": 0.05546, + "test_loss": 7.0454746505737305, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.2953687426258213, + "grad_max_sv": 0.1488959614187479, + "grad_min_sv": 3.3052532932842382e-09, + "grad_condition": 57195017.16791941, + "lr": 1.7535703752478133e-06, + "time_sec": 83.81411933898926 + }, + { + "epoch": 147, + "train_loss": 4.215898538208008, + "train_acc": 0.0547, + "test_loss": 7.0791287528991695, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.29507184047055474, + "grad_max_sv": 0.1496420454233885, + "grad_min_sv": 3.2882809359756003e-09, + "grad_condition": 440797367.90569246, + "lr": 9.866357858642196e-07, + "time_sec": 83.83466935157776 + }, + { + "epoch": 148, + "train_loss": 4.21191631515503, + "train_acc": 0.05502, + "test_loss": 6.993793771362305, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.29572223257711466, + "grad_max_sv": 0.1509379804134369, + "grad_min_sv": 3.2624034737582796e-09, + "grad_condition": 53696330.15699832, + "lr": 4.38584950570808e-07, + "time_sec": 83.83085513114929 + }, + { + "epoch": 149, + "train_loss": 4.214856278686524, + "train_acc": 0.05504, + "test_loss": 7.080280429077148, + "test_acc": 0.0103, + "lyapunov": null, + "grad_norm": 0.29551682436364557, + "grad_max_sv": 0.1497094627469778, + "grad_min_sv": 3.273750590060409e-09, + "grad_condition": 73934031.32038581, + "lr": 1.096582625772501e-07, + "time_sec": 83.84602665901184 + }, + { + "epoch": 150, + "train_loss": 4.2193192990112305, + "train_acc": 0.0535, + "test_loss": 7.083986274719238, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.2957722763250381, + "grad_max_sv": 0.15103124249726535, + "grad_min_sv": 3.2879624276699325e-09, + "grad_condition": 65137818.05484857, + "lr": 0.0, + "time_sec": 83.81010937690735 + } + ] + }, + "lyapunov": { + "4": [ + { + "epoch": 1, + "train_loss": 8.745512613220216, + "train_acc": 0.02574, + "test_loss": 4.55846024017334, + "test_acc": 0.0339, + "lyapunov": 3.2288631459941035, + "grad_norm": 7.160399518281865, + "grad_max_sv": 5.050605493783951, + "grad_min_sv": 1.0948114780862107e-07, + "grad_condition": 174574426.40620375, + "lr": 0.0009998903417374227, + "time_sec": 38.78080153465271 + }, + { + "epoch": 2, + "train_loss": 6.857188781433106, + "train_acc": 0.03116, + "test_loss": 4.409567827606201, + "test_acc": 0.0498, + "lyapunov": 2.566672464160968, + "grad_norm": 4.581532406245075, + "grad_max_sv": 3.4727421343326568, + "grad_min_sv": 6.695858347782747e-08, + "grad_condition": 100510712.5879864, + "lr": 0.0009995614150494292, + "time_sec": 38.758466482162476 + }, + { + "epoch": 3, + "train_loss": 6.406850777893067, + "train_acc": 0.03836, + "test_loss": 4.3329737182617185, + "test_acc": 0.0541, + "lyapunov": 2.4151331805207237, + "grad_norm": 2.8463282070399885, + "grad_max_sv": 2.2940395712852477, + "grad_min_sv": 3.7823234264044994e-08, + "grad_condition": 106198851.94331202, + "lr": 0.0009990133642141358, + "time_sec": 38.77664065361023 + }, + { + "epoch": 4, + "train_loss": 6.1679999932861325, + "train_acc": 0.04216, + "test_loss": 4.314407443237305, + "test_acc": 0.0539, + "lyapunov": 2.324155716030189, + "grad_norm": 1.4958218707983646, + "grad_max_sv": 1.126097397506237, + "grad_min_sv": 1.8212272229894964e-08, + "grad_condition": 178099339.46093446, + "lr": 0.0009982464296247522, + "time_sec": 38.772703409194946 + }, + { + "epoch": 5, + "train_loss": 6.023621784973145, + "train_acc": 0.04472, + "test_loss": 4.327248037719727, + "test_acc": 0.0523, + "lyapunov": 2.24559463046091, + "grad_norm": 0.8361636453752828, + "grad_max_sv": 0.5582518823444843, + "grad_min_sv": 9.160982232525595e-09, + "grad_condition": 218277432.54054898, + "lr": 0.0009972609476841367, + "time_sec": 38.792168855667114 + }, + { + "epoch": 6, + "train_loss": 5.923550573730469, + "train_acc": 0.03788, + "test_loss": 4.373689149475098, + "test_acc": 0.0448, + "lyapunov": 2.143530731615813, + "grad_norm": 0.6125747823801606, + "grad_max_sv": 0.3806876644492149, + "grad_min_sv": 4.764090941352089e-09, + "grad_condition": 2115444033.3075993, + "lr": 0.000996057350657239, + "time_sec": 38.80649399757385 + }, + { + "epoch": 7, + "train_loss": 5.819468310699463, + "train_acc": 0.03402, + "test_loss": 4.396667736816406, + "test_acc": 0.0409, + "lyapunov": 2.047879105028899, + "grad_norm": 0.5012166631957408, + "grad_max_sv": 0.29988972246646883, + "grad_min_sv": 2.6462318619344118e-09, + "grad_condition": 1674717584.2678788, + "lr": 0.000994636166481494, + "time_sec": 38.8136990070343 + }, + { + "epoch": 8, + "train_loss": 5.776593683929443, + "train_acc": 0.02754, + "test_loss": 4.459617399597168, + "test_acc": 0.0288, + "lyapunov": 1.982207260168422, + "grad_norm": 0.48582047366784137, + "grad_max_sv": 0.2761614330112934, + "grad_min_sv": 2.1785290433868222e-10, + "grad_condition": 40862120030.312584, + "lr": 0.0009929980185352525, + "time_sec": 38.845232248306274 + }, + { + "epoch": 9, + "train_loss": 5.781761088104248, + "train_acc": 0.0231, + "test_loss": 4.675199285888672, + "test_acc": 0.0029, + "lyapunov": 1.954250096360131, + "grad_norm": 0.46266769063149876, + "grad_max_sv": 0.2622381761670113, + "grad_min_sv": 5.480658221434448e-10, + "grad_condition": 100986477853.47366, + "lr": 0.0009911436253643444, + "time_sec": 38.80020809173584 + }, + { + "epoch": 10, + "train_loss": 5.8479565664672855, + "train_acc": 0.01186, + "test_loss": 4.6061001365661625, + "test_acc": 0.01, + "lyapunov": 1.9396185356637705, + "grad_norm": 0.261511927042467, + "grad_max_sv": 0.09869588532019406, + "grad_min_sv": 2.728127020095826e-13, + "grad_condition": 88878548722.67065, + "lr": 0.0009890738003669028, + "time_sec": 38.743908405303955 + }, + { + "epoch": 11, + "train_loss": 5.8408165109252925, + "train_acc": 0.01034, + "test_loss": 4.6082617340087895, + "test_acc": 0.01, + "lyapunov": 1.9296608300465148, + "grad_norm": 0.2344195135575755, + "grad_max_sv": 0.08715516603551805, + "grad_min_sv": 2.4710747756651273e-15, + "grad_condition": 86872648368.75877, + "lr": 0.00098678945143658, + "time_sec": 38.751142263412476 + }, + { + "epoch": 12, + "train_loss": 5.84793187210083, + "train_acc": 0.00954, + "test_loss": 4.6062534797668455, + "test_acc": 0.01, + "lyapunov": 1.932467032881344, + "grad_norm": 0.24986425241000795, + "grad_max_sv": 0.07697397316806018, + "grad_min_sv": 3.503246160812043e-47, + "grad_condition": 76973973168.06018, + "lr": 0.0009842915805643154, + "time_sec": 38.75897789001465 + }, + { + "epoch": 13, + "train_loss": 5.845315325927734, + "train_acc": 0.01, + "test_loss": 4.606490065002442, + "test_acc": 0.01, + "lyapunov": 1.9308954513896153, + "grad_norm": 0.2234501732158856, + "grad_max_sv": 0.07171829692088068, + "grad_min_sv": 3.503246160812043e-47, + "grad_condition": 71718296920.88069, + "lr": 0.000981581283398829, + "time_sec": 38.77409482002258 + }, + { + "epoch": 14, + "train_loss": 5.844472907714843, + "train_acc": 0.00932, + "test_loss": 4.611052139282227, + "test_acc": 0.01, + "lyapunov": 1.9302553133586484, + "grad_norm": 0.2546366793913816, + "grad_max_sv": 0.0627493538428098, + "grad_min_sv": 5.442503105591157e-42, + "grad_condition": 62749353842.80979, + "lr": 0.0009786597487660333, + "time_sec": 38.75410294532776 + }, + { + "epoch": 15, + "train_loss": 5.839373329620361, + "train_acc": 0.01012, + "test_loss": 4.605493424987793, + "test_acc": 0.01, + "lyapunov": 1.9264278128323957, + "grad_norm": 0.33195464165742516, + "grad_max_sv": 0.0596250070258975, + "grad_min_sv": 1.1532839803575087e-39, + "grad_condition": 59625007025.89751, + "lr": 0.0009755282581475766, + "time_sec": 38.737260818481445 + }, + { + "epoch": 16, + "train_loss": 5.840845001983642, + "train_acc": 0.01006, + "test_loss": 4.606367964935303, + "test_acc": 0.01, + "lyapunov": 1.9284262577895923, + "grad_norm": 0.41972925674223915, + "grad_max_sv": 0.04947211216203869, + "grad_min_sv": 0.0, + "grad_condition": 49472112162.03868, + "lr": 0.0009721881851187403, + "time_sec": 38.72240591049194 + }, + { + "epoch": 17, + "train_loss": 5.838009662322998, + "train_acc": 0.01014, + "test_loss": 4.607442309570312, + "test_acc": 0.01, + "lyapunov": 1.927741524203659, + "grad_norm": 0.41171422252176765, + "grad_max_sv": 0.06055757296271622, + "grad_min_sv": 6.063498673792123e-17, + "grad_condition": 60551208649.85646, + "lr": 0.0009686409947459456, + "time_sec": 38.7178897857666 + }, + { + "epoch": 18, + "train_loss": 5.8419268412780765, + "train_acc": 0.00974, + "test_loss": 4.605891960144043, + "test_acc": 0.01, + "lyapunov": 1.9291500267775163, + "grad_norm": 0.3483236145113203, + "grad_max_sv": 0.03731603529304266, + "grad_min_sv": 6.04933030713951e-30, + "grad_condition": 37316035293.042656, + "lr": 0.0009648882429441254, + "time_sec": 38.760350704193115 + }, + { + "epoch": 19, + "train_loss": 5.826735510559082, + "train_acc": 0.01202, + "test_loss": 4.605664205932618, + "test_acc": 0.01, + "lyapunov": 1.9298754738419868, + "grad_norm": 0.3207639814137615, + "grad_max_sv": 0.06981198373250663, + "grad_min_sv": 1.9222199366026642e-14, + "grad_condition": 67062140845.185585, + "lr": 0.00096093157579425, + "time_sec": 38.76730132102966 + }, + { + "epoch": 20, + "train_loss": 5.84202998046875, + "train_acc": 0.00976, + "test_loss": 4.606653337097168, + "test_acc": 0.01, + "lyapunov": 1.9302551270750783, + "grad_norm": 0.20194476347748866, + "grad_max_sv": 0.03701699019875378, + "grad_min_sv": 0.0, + "grad_condition": 37016990198.75377, + "lr": 0.0009567727288213001, + "time_sec": 38.725250244140625 + }, + { + "epoch": 21, + "train_loss": 5.84192676071167, + "train_acc": 0.00982, + "test_loss": 4.614536486816406, + "test_acc": 0.01, + "lyapunov": 1.9300702325523358, + "grad_norm": 0.2358565070101103, + "grad_max_sv": 0.033911947428714485, + "grad_min_sv": 0.0, + "grad_condition": 33911947428.714485, + "lr": 0.0009524135262330095, + "time_sec": 38.72857594490051 + }, + { + "epoch": 22, + "train_loss": 5.839627782592774, + "train_acc": 0.00992, + "test_loss": 4.606048239898682, + "test_acc": 0.01, + "lyapunov": 1.9269078469947172, + "grad_norm": 0.17845225075047805, + "grad_max_sv": 0.025568678742274642, + "grad_min_sv": 0.0, + "grad_condition": 25568678742.274643, + "lr": 0.0009478558801197061, + "time_sec": 38.68861746788025 + }, + { + "epoch": 23, + "train_loss": 5.838393308258056, + "train_acc": 0.00958, + "test_loss": 4.586302839660645, + "test_acc": 0.0188, + "lyapunov": 1.9266618383510032, + "grad_norm": 0.13466647962688946, + "grad_max_sv": 0.01349067515693605, + "grad_min_sv": 0.0, + "grad_condition": 13490675156.936049, + "lr": 0.000943101789615607, + "time_sec": 38.702245473861694 + }, + { + "epoch": 24, + "train_loss": 5.835893999938965, + "train_acc": 0.0103, + "test_loss": 4.605248524475098, + "test_acc": 0.01, + "lyapunov": 1.9250504610788486, + "grad_norm": 0.1306925374207253, + "grad_max_sv": 0.021706052590161562, + "grad_min_sv": 4.2115888976736585e-17, + "grad_condition": 21702749025.936443, + "lr": 0.0009381533400219313, + "time_sec": 38.70141124725342 + }, + { + "epoch": 25, + "train_loss": 5.839240811767578, + "train_acc": 0.00906, + "test_loss": 4.605221250915528, + "test_acc": 0.01, + "lyapunov": 1.9273294420803295, + "grad_norm": 0.12078726665544544, + "grad_max_sv": 0.010838619247078896, + "grad_min_sv": 0.0, + "grad_condition": 10838619247.078896, + "lr": 0.0009330127018922189, + "time_sec": 38.68912363052368 + }, + { + "epoch": 26, + "train_loss": 5.832334176635742, + "train_acc": 0.00902, + "test_loss": 4.605214032745361, + "test_acc": 0.01, + "lyapunov": 1.92168139923564, + "grad_norm": 0.11780855950452304, + "grad_max_sv": 0.012504769628867507, + "grad_min_sv": 3.503246160812043e-47, + "grad_condition": 12504769628.867508, + "lr": 0.000927682130080253, + "time_sec": 38.69681906700134 + }, + { + "epoch": 27, + "train_loss": 5.832823591003418, + "train_acc": 0.00856, + "test_loss": 4.605198753356934, + "test_acc": 0.01, + "lyapunov": 1.9220849495104817, + "grad_norm": 0.1307395775308225, + "grad_max_sv": 0.00955222793854773, + "grad_min_sv": 0.0, + "grad_condition": 9552227938.54773, + "lr": 0.0009221639627510072, + "time_sec": 38.67968559265137 + }, + { + "epoch": 28, + "train_loss": 5.8319349609375, + "train_acc": 0.00908, + "test_loss": 4.60519333190918, + "test_acc": 0.01, + "lyapunov": 1.9214767400565964, + "grad_norm": 0.11312977194763361, + "grad_max_sv": 0.007689819484949112, + "grad_min_sv": 0.0, + "grad_condition": 7689819484.949112, + "lr": 0.0009164606203550494, + "time_sec": 38.693461418151855 + }, + { + "epoch": 29, + "train_loss": 5.832658680419922, + "train_acc": 0.0089, + "test_loss": 4.605188513946533, + "test_acc": 0.01, + "lyapunov": 1.9219111963306241, + "grad_norm": 0.1139488031414971, + "grad_max_sv": 0.009555681003257632, + "grad_min_sv": 0.0, + "grad_condition": 9555681003.257633, + "lr": 0.0009105746045668516, + "time_sec": 38.88858246803284 + }, + { + "epoch": 30, + "train_loss": 5.8301619506835936, + "train_acc": 0.00936, + "test_loss": 4.605182504272461, + "test_acc": 0.01, + "lyapunov": 1.9200728305465424, + "grad_norm": 0.10113831163550316, + "grad_max_sv": 0.004735648166388273, + "grad_min_sv": 0.0, + "grad_condition": 4735648166.388273, + "lr": 0.0009045084971874733, + "time_sec": 38.682101011276245 + }, + { + "epoch": 31, + "train_loss": 5.832088593292236, + "train_acc": 0.00848, + "test_loss": 4.60520027999878, + "test_acc": 0.01, + "lyapunov": 1.921536988309582, + "grad_norm": 0.11928153797201548, + "grad_max_sv": 0.005120814079418778, + "grad_min_sv": 0.0, + "grad_condition": 5120814079.418779, + "lr": 0.0008982649590120977, + "time_sec": 38.66986131668091 + }, + { + "epoch": 32, + "train_loss": 5.830597168426514, + "train_acc": 0.009, + "test_loss": 4.605257048797608, + "test_acc": 0.01, + "lyapunov": 1.9206426658898668, + "grad_norm": 0.09874780482605999, + "grad_max_sv": 0.0029883835930377247, + "grad_min_sv": 0.0, + "grad_condition": 2988383593.0377245, + "lr": 0.0008918467286629196, + "time_sec": 38.69553232192993 + }, + { + "epoch": 33, + "train_loss": 5.829611896514892, + "train_acc": 0.00884, + "test_loss": 4.60517430267334, + "test_acc": 0.01, + "lyapunov": 1.9195137139781357, + "grad_norm": 0.09972362630787891, + "grad_max_sv": 0.00664278594776988, + "grad_min_sv": 0.0, + "grad_condition": 6642785947.76988, + "lr": 0.0008852566213878943, + "time_sec": 38.67990040779114 + }, + { + "epoch": 34, + "train_loss": 5.828044633636474, + "train_acc": 0.0083, + "test_loss": 4.605173886871338, + "test_acc": 0.01, + "lyapunov": 1.918492463848475, + "grad_norm": 0.0974792016961528, + "grad_max_sv": 0.001599628059193492, + "grad_min_sv": 0.0, + "grad_condition": 1599628059.193492, + "lr": 0.000878497527825878, + "time_sec": 38.68664336204529 + }, + { + "epoch": 35, + "train_loss": 5.830746371154786, + "train_acc": 0.00894, + "test_loss": 4.6051726875305175, + "test_acc": 0.01, + "lyapunov": 1.920728165475304, + "grad_norm": 0.0938240145066066, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000871572412738697, + "time_sec": 38.67132115364075 + }, + { + "epoch": 36, + "train_loss": 5.829937998809815, + "train_acc": 0.00866, + "test_loss": 4.605172854614258, + "test_acc": 0.01, + "lyapunov": 1.920135024868314, + "grad_norm": 0.09205400750487011, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008644843137107055, + "time_sec": 38.64905834197998 + }, + { + "epoch": 37, + "train_loss": 5.829817896728516, + "train_acc": 0.00818, + "test_loss": 4.6051733100891115, + "test_acc": 0.01, + "lyapunov": 1.9200208934066851, + "grad_norm": 0.09228371311542864, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008572363398164014, + "time_sec": 38.657002210617065 + }, + { + "epoch": 38, + "train_loss": 5.831039802246094, + "train_acc": 0.0088, + "test_loss": 4.6051726837158204, + "test_acc": 0.01, + "lyapunov": 1.9210114238207296, + "grad_norm": 0.09181178733619569, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008498316702566826, + "time_sec": 38.66207027435303 + }, + { + "epoch": 39, + "train_loss": 5.829483923492432, + "train_acc": 0.00886, + "test_loss": 4.605172607421875, + "test_acc": 0.01, + "lyapunov": 1.919772486552558, + "grad_norm": 0.09053836987454536, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008422735529643442, + "time_sec": 38.67074227333069 + }, + { + "epoch": 40, + "train_loss": 5.829308145904541, + "train_acc": 0.00862, + "test_loss": 4.605172937774658, + "test_acc": 0.01, + "lyapunov": 1.9195958787522962, + "grad_norm": 0.09302966072405643, + "grad_max_sv": 0.0028064717072993515, + "grad_min_sv": 0.0, + "grad_condition": 2806471707.2993517, + "lr": 0.0008345653031794289, + "time_sec": 38.66209268569946 + }, + { + "epoch": 41, + "train_loss": 5.828913317565918, + "train_acc": 0.00894, + "test_loss": 4.605173394775391, + "test_acc": 0.01, + "lyapunov": 1.9192491733204677, + "grad_norm": 0.09010018258992165, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008267103019950526, + "time_sec": 38.68193006515503 + }, + { + "epoch": 42, + "train_loss": 5.83203209274292, + "train_acc": 0.0089, + "test_loss": 4.6051725547790525, + "test_acc": 0.01, + "lyapunov": 1.9218718840947846, + "grad_norm": 0.09554864716201418, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743447, + "time_sec": 38.67262053489685 + }, + { + "epoch": 43, + "train_loss": 5.836768571929932, + "train_acc": 0.00868, + "test_loss": 4.605172836303711, + "test_acc": 0.01, + "lyapunov": 1.9252831368800014, + "grad_norm": 0.11288803301983473, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000810573890139155, + "time_sec": 38.673030853271484 + }, + { + "epoch": 44, + "train_loss": 5.830244238128662, + "train_acc": 0.00862, + "test_loss": 4.605172270202637, + "test_acc": 0.01, + "lyapunov": 1.9203159440204005, + "grad_norm": 0.09075156234022023, + "grad_max_sv": 0.0006292640697211027, + "grad_min_sv": 0.0, + "grad_condition": 629264069.7211027, + "lr": 0.0008022995574311873, + "time_sec": 38.67639136314392 + }, + { + "epoch": 45, + "train_loss": 5.831813296051026, + "train_acc": 0.00798, + "test_loss": 4.605172733306885, + "test_acc": 0.01, + "lyapunov": 1.9216700673408216, + "grad_norm": 0.09800318179113622, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007938926261462363, + "time_sec": 38.66922402381897 + }, + { + "epoch": 46, + "train_loss": 5.829525221710205, + "train_acc": 0.0088, + "test_loss": 4.605172639465332, + "test_acc": 0.01, + "lyapunov": 1.9197535209948449, + "grad_norm": 0.09607771134569527, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007853567838422158, + "time_sec": 38.6734299659729 + }, + { + "epoch": 47, + "train_loss": 5.831378362731933, + "train_acc": 0.00896, + "test_loss": 4.605172109985352, + "test_acc": 0.01, + "lyapunov": 1.9213088927671427, + "grad_norm": 0.09002095025572443, + "grad_max_sv": 0.0022390282712876795, + "grad_min_sv": 0.0, + "grad_condition": 2239028271.2876797, + "lr": 0.0007766957746216719, + "time_sec": 38.681992530822754 + }, + { + "epoch": 48, + "train_loss": 5.8296267512512205, + "train_acc": 0.00852, + "test_loss": 4.605172399902344, + "test_acc": 0.01, + "lyapunov": 1.9198472441919625, + "grad_norm": 0.08948131522401738, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894982, + "time_sec": 38.69184613227844 + }, + { + "epoch": 49, + "train_loss": 5.82939344329834, + "train_acc": 0.009, + "test_loss": 4.6051721862792965, + "test_acc": 0.01, + "lyapunov": 1.919716474345273, + "grad_norm": 0.08962129117217822, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000759013504686565, + "time_sec": 38.66769075393677 + }, + { + "epoch": 50, + "train_loss": 5.829856867675781, + "train_acc": 0.00824, + "test_loss": 4.605171932983398, + "test_acc": 0.01, + "lyapunov": 1.9200777041027919, + "grad_norm": 0.08949650095695762, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007499999999999998, + "time_sec": 38.6767897605896 + }, + { + "epoch": 51, + "train_loss": 5.831189596557617, + "train_acc": 0.00886, + "test_loss": 4.605172845458984, + "test_acc": 0.01, + "lyapunov": 1.9211604323838374, + "grad_norm": 0.08928877604280225, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007408768370508575, + "time_sec": 38.669432640075684 + }, + { + "epoch": 52, + "train_loss": 5.827941221618652, + "train_acc": 0.00906, + "test_loss": 4.605172493743897, + "test_acc": 0.01, + "lyapunov": 1.9184872210787995, + "grad_norm": 0.08912832082902897, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007316480175599307, + "time_sec": 38.65984392166138 + }, + { + "epoch": 53, + "train_loss": 5.829616719360351, + "train_acc": 0.00856, + "test_loss": 4.6051721878051755, + "test_acc": 0.01, + "lyapunov": 1.9199278674772025, + "grad_norm": 0.08891740863163855, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007223175895924635, + "time_sec": 38.684584856033325 + }, + { + "epoch": 54, + "train_loss": 5.828832433013916, + "train_acc": 0.00888, + "test_loss": 4.605171940612793, + "test_acc": 0.01, + "lyapunov": 1.9193241215118058, + "grad_norm": 0.08862714787237397, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825361, + "time_sec": 38.6649751663208 + }, + { + "epoch": 55, + "train_loss": 5.829295374145508, + "train_acc": 0.00864, + "test_loss": 4.6051718048095704, + "test_acc": 0.01, + "lyapunov": 1.9196355620308605, + "grad_norm": 0.08936964720805882, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007033683215378998, + "time_sec": 38.66834211349487 + }, + { + "epoch": 56, + "train_loss": 5.831980644836426, + "train_acc": 0.00872, + "test_loss": 4.605172239685059, + "test_acc": 0.01, + "lyapunov": 1.9218218890602325, + "grad_norm": 0.08828331902779529, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006937577932260512, + "time_sec": 38.67644000053406 + }, + { + "epoch": 57, + "train_loss": 5.8291939093017575, + "train_acc": 0.00898, + "test_loss": 4.605171894836426, + "test_acc": 0.01, + "lyapunov": 1.9195057918958347, + "grad_norm": 0.08970762017367405, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423388, + "time_sec": 38.66079378128052 + }, + { + "epoch": 58, + "train_loss": 5.826841032867431, + "train_acc": 0.0085, + "test_loss": 4.605172017669678, + "test_acc": 0.01, + "lyapunov": 1.9176025924170415, + "grad_norm": 0.09048223717877525, + "grad_max_sv": 0.0014875998720526695, + "grad_min_sv": 0.0, + "grad_condition": 1487599872.0526695, + "lr": 0.0006742860236609073, + "time_sec": 38.66658973693848 + }, + { + "epoch": 59, + "train_loss": 5.835019799499512, + "train_acc": 0.00882, + "test_loss": 4.60517190322876, + "test_acc": 0.01, + "lyapunov": 1.9238726757371518, + "grad_norm": 0.09441160205385561, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006644333233692913, + "time_sec": 38.67969727516174 + }, + { + "epoch": 60, + "train_loss": 5.830721065979004, + "train_acc": 0.00836, + "test_loss": 4.605171463012695, + "test_acc": 0.01, + "lyapunov": 1.9208579142685132, + "grad_norm": 0.08921306700093072, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874734, + "time_sec": 38.663196325302124 + }, + { + "epoch": 61, + "train_loss": 5.829596945648193, + "train_acc": 0.00828, + "test_loss": 4.605171449279785, + "test_acc": 0.01, + "lyapunov": 1.9199584844472157, + "grad_norm": 0.08848056161918356, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006445158984722354, + "time_sec": 38.68021297454834 + }, + { + "epoch": 62, + "train_loss": 5.830569870300293, + "train_acc": 0.00824, + "test_loss": 4.605171228790283, + "test_acc": 0.01, + "lyapunov": 1.9206647436941982, + "grad_norm": 0.08839721397975912, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006344599103076324, + "time_sec": 38.675719022750854 + }, + { + "epoch": 63, + "train_loss": 5.8305546853637695, + "train_acc": 0.00854, + "test_loss": 4.605172233581543, + "test_acc": 0.01, + "lyapunov": 1.9206541834584892, + "grad_norm": 0.08903578043587344, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824269, + "time_sec": 38.658900022506714 + }, + { + "epoch": 64, + "train_loss": 5.836477585449218, + "train_acc": 0.00876, + "test_loss": 4.605171844482422, + "test_acc": 0.01, + "lyapunov": 1.9251100108446673, + "grad_norm": 0.09951449127834824, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006141754350553275, + "time_sec": 38.67370843887329 + }, + { + "epoch": 65, + "train_loss": 5.830157748260498, + "train_acc": 0.00854, + "test_loss": 4.605171319580078, + "test_acc": 0.01, + "lyapunov": 1.920334783661396, + "grad_norm": 0.09108085096662916, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006039558454088793, + "time_sec": 38.67955160140991 + }, + { + "epoch": 66, + "train_loss": 5.828997611694336, + "train_acc": 0.00866, + "test_loss": 4.605171671295166, + "test_acc": 0.01, + "lyapunov": 1.919463188751884, + "grad_norm": 0.08904439645709107, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000593690657292862, + "time_sec": 38.67839956283569 + }, + { + "epoch": 67, + "train_loss": 5.830838754272461, + "train_acc": 0.00868, + "test_loss": 4.605171606445312, + "test_acc": 0.01, + "lyapunov": 1.9207777364174727, + "grad_norm": 0.09755498438636814, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005833843733580507, + "time_sec": 38.67587614059448 + }, + { + "epoch": 68, + "train_loss": 5.827152337646484, + "train_acc": 0.00928, + "test_loss": 4.605171282958985, + "test_acc": 0.01, + "lyapunov": 1.9178936585136082, + "grad_norm": 0.08799438562008605, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005730415142812054, + "time_sec": 38.67634415626526 + }, + { + "epoch": 69, + "train_loss": 5.830286772155762, + "train_acc": 0.0096, + "test_loss": 4.605171063232422, + "test_acc": 0.01, + "lyapunov": 1.9204461242231872, + "grad_norm": 0.09070089337302271, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821517, + "time_sec": 38.678497076034546 + }, + { + "epoch": 70, + "train_loss": 5.832680291290283, + "train_acc": 0.0098, + "test_loss": 4.605171459197998, + "test_acc": 0.01, + "lyapunov": 1.9224533403621, + "grad_norm": 0.08827257843406246, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005522642316338265, + "time_sec": 38.66450572013855 + }, + { + "epoch": 71, + "train_loss": 5.830269169921875, + "train_acc": 0.00836, + "test_loss": 4.605171234130859, + "test_acc": 0.01, + "lyapunov": 1.9205291399260616, + "grad_norm": 0.08807564726395264, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005418389216661573, + "time_sec": 38.656336545944214 + }, + { + "epoch": 72, + "train_loss": 5.830037397460938, + "train_acc": 0.00858, + "test_loss": 4.605171022033692, + "test_acc": 0.01, + "lyapunov": 1.9203362114289229, + "grad_norm": 0.08760409668351568, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646563, + "time_sec": 38.68950128555298 + }, + { + "epoch": 73, + "train_loss": 5.83207408782959, + "train_acc": 0.00862, + "test_loss": 4.605171083068847, + "test_acc": 0.01, + "lyapunov": 1.922044792138707, + "grad_norm": 0.08837012490740455, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005209378268645994, + "time_sec": 38.678892612457275 + }, + { + "epoch": 74, + "train_loss": 5.830842367553711, + "train_acc": 0.00886, + "test_loss": 4.6051713088989255, + "test_acc": 0.01, + "lyapunov": 1.9209648620746935, + "grad_norm": 0.0881334492267735, + "grad_max_sv": 0.0016617819666862488, + "grad_min_sv": 0.0, + "grad_condition": 1661781966.6862488, + "lr": 0.0005104712099416781, + "time_sec": 38.66536831855774 + }, + { + "epoch": 75, + "train_loss": 5.831041750488281, + "train_acc": 0.00846, + "test_loss": 4.605171099853516, + "test_acc": 0.01, + "lyapunov": 1.9211621680832884, + "grad_norm": 0.08829717661983798, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004999999999999996, + "time_sec": 38.674325704574585 + }, + { + "epoch": 76, + "train_loss": 5.836333667144776, + "train_acc": 0.00864, + "test_loss": 4.605171186065673, + "test_acc": 0.01, + "lyapunov": 1.9246098906792644, + "grad_norm": 0.11366095758738136, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004895287900583212, + "time_sec": 38.687448501586914 + }, + { + "epoch": 77, + "train_loss": 5.835334293212891, + "train_acc": 0.0089, + "test_loss": 4.6051709121704105, + "test_acc": 0.01, + "lyapunov": 1.9234618140608453, + "grad_norm": 0.10831693857812812, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004790621731353997, + "time_sec": 38.65811228752136 + }, + { + "epoch": 78, + "train_loss": 5.827478051452637, + "train_acc": 0.00882, + "test_loss": 4.605171005249024, + "test_acc": 0.01, + "lyapunov": 1.9182067341206934, + "grad_norm": 0.08781347391325668, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000468604740235343, + "time_sec": 38.676063537597656 + }, + { + "epoch": 79, + "train_loss": 5.8290468742370605, + "train_acc": 0.00886, + "test_loss": 4.605171278381348, + "test_acc": 0.01, + "lyapunov": 1.919505515671752, + "grad_norm": 0.08854207911135165, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00045816107833384175, + "time_sec": 38.673518896102905 + }, + { + "epoch": 80, + "train_loss": 5.833914941253662, + "train_acc": 0.0089, + "test_loss": 4.605170984649658, + "test_acc": 0.01, + "lyapunov": 1.9234306675088986, + "grad_norm": 0.09381991898821151, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004477357683661729, + "time_sec": 38.672255754470825 + }, + { + "epoch": 81, + "train_loss": 5.829356372680664, + "train_acc": 0.00902, + "test_loss": 4.605171099853516, + "test_acc": 0.01, + "lyapunov": 1.919769955413116, + "grad_norm": 0.08816368922697575, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784746, + "time_sec": 38.67954111099243 + }, + { + "epoch": 82, + "train_loss": 5.831741758117675, + "train_acc": 0.00918, + "test_loss": 4.605171073913574, + "test_acc": 0.01, + "lyapunov": 1.921732059525102, + "grad_norm": 0.09264254493603952, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004269584857187939, + "time_sec": 38.673032999038696 + }, + { + "epoch": 83, + "train_loss": 5.834408538513183, + "train_acc": 0.0092, + "test_loss": 4.605170977020264, + "test_acc": 0.01, + "lyapunov": 1.9238771880069352, + "grad_norm": 0.08953937527623661, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004166156266419484, + "time_sec": 38.68673372268677 + }, + { + "epoch": 84, + "train_loss": 5.830432665252686, + "train_acc": 0.009, + "test_loss": 4.605170909118653, + "test_acc": 0.01, + "lyapunov": 1.920691382854491, + "grad_norm": 0.08848473612958971, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004063093427071373, + "time_sec": 38.663509130477905 + }, + { + "epoch": 85, + "train_loss": 5.83150433013916, + "train_acc": 0.00862, + "test_loss": 4.605170706176758, + "test_acc": 0.01, + "lyapunov": 1.921521064875376, + "grad_norm": 0.0878123084846611, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003960441545911199, + "time_sec": 38.6465003490448 + }, + { + "epoch": 86, + "train_loss": 5.831791127319336, + "train_acc": 0.00896, + "test_loss": 4.605170570373535, + "test_acc": 0.01, + "lyapunov": 1.9217873232443925, + "grad_norm": 0.0877757716455608, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003858245649446718, + "time_sec": 38.6744065284729 + }, + { + "epoch": 87, + "train_loss": 5.832627346191407, + "train_acc": 0.00878, + "test_loss": 4.605170877075195, + "test_acc": 0.01, + "lyapunov": 1.9224827862761515, + "grad_norm": 0.08827499584565024, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00037565505641757235, + "time_sec": 38.66921091079712 + }, + { + "epoch": 88, + "train_loss": 5.8317487963867185, + "train_acc": 0.00824, + "test_loss": 4.605170699310302, + "test_acc": 0.01, + "lyapunov": 1.921761295984468, + "grad_norm": 0.08846045903994489, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036554008969236695, + "time_sec": 38.67842221260071 + }, + { + "epoch": 89, + "train_loss": 5.8302451986694335, + "train_acc": 0.00862, + "test_loss": 4.605170578765869, + "test_acc": 0.01, + "lyapunov": 1.9205519287177668, + "grad_norm": 0.0880969562704879, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003554841015277638, + "time_sec": 38.66373419761658 + }, + { + "epoch": 90, + "train_loss": 5.828649435424805, + "train_acc": 0.00928, + "test_loss": 4.605170637512207, + "test_acc": 0.01, + "lyapunov": 1.919257033816384, + "grad_norm": 0.08878565745159492, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000345491502812526, + "time_sec": 38.68431329727173 + }, + { + "epoch": 91, + "train_loss": 5.830266084594727, + "train_acc": 0.0087, + "test_loss": 4.60517045211792, + "test_acc": 0.01, + "lyapunov": 1.920564612464222, + "grad_norm": 0.0883222592119473, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003355666766307081, + "time_sec": 38.67736315727234 + }, + { + "epoch": 92, + "train_loss": 5.831894824829101, + "train_acc": 0.00856, + "test_loss": 4.605170608520508, + "test_acc": 0.01, + "lyapunov": 1.9219116762166133, + "grad_norm": 0.08764554261224523, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00032571397633909225, + "time_sec": 38.67611908912659 + }, + { + "epoch": 93, + "train_loss": 5.82894446182251, + "train_acc": 0.00844, + "test_loss": 4.6051702972412105, + "test_acc": 0.01, + "lyapunov": 1.9194979228631919, + "grad_norm": 0.08833998566442527, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766094, + "time_sec": 38.69344687461853 + }, + { + "epoch": 94, + "train_loss": 5.837506525115967, + "train_acc": 0.00874, + "test_loss": 4.60517064819336, + "test_acc": 0.01, + "lyapunov": 1.9243434188920823, + "grad_norm": 0.11393882739366498, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003062422067739483, + "time_sec": 38.68289828300476 + }, + { + "epoch": 95, + "train_loss": 5.831888694152832, + "train_acc": 0.00764, + "test_loss": 4.605170504760742, + "test_acc": 0.01, + "lyapunov": 1.9216798833568993, + "grad_norm": 0.10076789355226513, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00029663167846209965, + "time_sec": 38.68230414390564 + }, + { + "epoch": 96, + "train_loss": 5.839447547912598, + "train_acc": 0.00876, + "test_loss": 4.605170679473877, + "test_acc": 0.01, + "lyapunov": 1.9261463017719787, + "grad_norm": 0.11376740734099834, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00028711035421746345, + "time_sec": 38.6755793094635 + }, + { + "epoch": 97, + "train_loss": 5.828961611328125, + "train_acc": 0.00828, + "test_loss": 4.605170320129394, + "test_acc": 0.01, + "lyapunov": 1.9195098590363018, + "grad_norm": 0.08840788709710101, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00027768241040753615, + "time_sec": 38.676655769348145 + }, + { + "epoch": 98, + "train_loss": 5.829206983032226, + "train_acc": 0.00852, + "test_loss": 4.605170263671875, + "test_acc": 0.01, + "lyapunov": 1.9197069199188896, + "grad_norm": 0.08784611697907319, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00026835198244006903, + "time_sec": 38.679508209228516 + }, + { + "epoch": 99, + "train_loss": 5.830749737243653, + "train_acc": 0.0086, + "test_loss": 4.605170584106445, + "test_acc": 0.01, + "lyapunov": 1.9209906048786916, + "grad_norm": 0.08837860643236768, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002591231629491421, + "time_sec": 38.6536865234375 + }, + { + "epoch": 100, + "train_loss": 5.833174273071289, + "train_acc": 0.00912, + "test_loss": 4.605170581054687, + "test_acc": 0.01, + "lyapunov": 1.923052377713001, + "grad_norm": 0.0880219202195275, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002499999999999997, + "time_sec": 38.669525146484375 + }, + { + "epoch": 101, + "train_loss": 5.832474216003418, + "train_acc": 0.00924, + "test_loss": 4.605170333862305, + "test_acc": 0.01, + "lyapunov": 1.9223707411295312, + "grad_norm": 0.088109218729273, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00024098649531343477, + "time_sec": 38.68469524383545 + }, + { + "epoch": 102, + "train_loss": 5.832093044128418, + "train_acc": 0.0085, + "test_loss": 4.6051706710815425, + "test_acc": 0.01, + "lyapunov": 1.9221026568156678, + "grad_norm": 0.08806360302850152, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002320866025105016, + "time_sec": 38.667779207229614 + }, + { + "epoch": 103, + "train_loss": 5.829613971557618, + "train_acc": 0.00884, + "test_loss": 4.605170641326905, + "test_acc": 0.01, + "lyapunov": 1.9200275365044088, + "grad_norm": 0.08827372352248057, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002233042253783278, + "time_sec": 38.67877268791199 + }, + { + "epoch": 104, + "train_loss": 5.829403175201416, + "train_acc": 0.0085, + "test_loss": 4.605170069885254, + "test_acc": 0.01, + "lyapunov": 1.9198780102498085, + "grad_norm": 0.08759321728417062, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000214643216157784, + "time_sec": 38.67757058143616 + }, + { + "epoch": 105, + "train_loss": 5.83223681137085, + "train_acc": 0.00838, + "test_loss": 4.605170602416992, + "test_acc": 0.01, + "lyapunov": 1.922215115993529, + "grad_norm": 0.08796326905677253, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376332, + "time_sec": 38.667465925216675 + }, + { + "epoch": 106, + "train_loss": 5.833028655090332, + "train_acc": 0.00824, + "test_loss": 4.605170317840576, + "test_acc": 0.01, + "lyapunov": 1.92289487815574, + "grad_norm": 0.08795960069436239, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019770044256881242, + "time_sec": 38.68554091453552 + }, + { + "epoch": 107, + "train_loss": 5.827796527557373, + "train_acc": 0.00876, + "test_loss": 4.605170085144043, + "test_acc": 0.01, + "lyapunov": 1.918589440453083, + "grad_norm": 0.08772654367791473, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001894261098608447, + "time_sec": 38.68501615524292 + }, + { + "epoch": 108, + "train_loss": 5.82904862991333, + "train_acc": 0.00916, + "test_loss": 4.605170137023926, + "test_acc": 0.01, + "lyapunov": 1.9196739556539395, + "grad_norm": 0.08791956109774068, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000181288005125655, + "time_sec": 38.68057060241699 + }, + { + "epoch": 109, + "train_loss": 5.830072443237305, + "train_acc": 0.00772, + "test_loss": 4.605170295715332, + "test_acc": 0.01, + "lyapunov": 1.9204182008953046, + "grad_norm": 0.08807291337304174, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001732896980049473, + "time_sec": 38.66407561302185 + }, + { + "epoch": 110, + "train_loss": 5.830760421295166, + "train_acc": 0.00882, + "test_loss": 4.605170086669922, + "test_acc": 0.01, + "lyapunov": 1.9210344882267516, + "grad_norm": 0.08829325644128909, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016543469682057076, + "time_sec": 38.66635870933533 + }, + { + "epoch": 111, + "train_loss": 5.844144050140381, + "train_acc": 0.00756, + "test_loss": 4.605170138549805, + "test_acc": 0.01, + "lyapunov": 1.9289683185879836, + "grad_norm": 0.08860258635222626, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 38.67165184020996 + }, + { + "epoch": 112, + "train_loss": 5.830768748779297, + "train_acc": 0.0085, + "test_loss": 4.605170237731934, + "test_acc": 0.01, + "lyapunov": 1.9210170031813405, + "grad_norm": 0.0882870971276682, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 38.67701458930969 + }, + { + "epoch": 113, + "train_loss": 5.8316661862182615, + "train_acc": 0.00856, + "test_loss": 4.605170329284668, + "test_acc": 0.01, + "lyapunov": 1.921789816883214, + "grad_norm": 0.08856537933077034, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 38.66913890838623 + }, + { + "epoch": 114, + "train_loss": 5.83167002532959, + "train_acc": 0.00886, + "test_loss": 4.60517038269043, + "test_acc": 0.01, + "lyapunov": 1.9217432996501094, + "grad_norm": 0.08829399946029161, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00013551568628929425, + "time_sec": 38.68831920623779 + }, + { + "epoch": 115, + "train_loss": 5.829227747192383, + "train_acc": 0.00872, + "test_loss": 4.605170357513428, + "test_acc": 0.01, + "lyapunov": 1.9198200571567505, + "grad_norm": 0.08820685400799948, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 38.898104667663574 + }, + { + "epoch": 116, + "train_loss": 5.826888065795899, + "train_acc": 0.0084, + "test_loss": 4.605169971466064, + "test_acc": 0.01, + "lyapunov": 1.9179128426724992, + "grad_norm": 0.08799764957632915, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 38.664024114608765 + }, + { + "epoch": 117, + "train_loss": 5.833059454956055, + "train_acc": 0.00838, + "test_loss": 4.605170207214355, + "test_acc": 0.01, + "lyapunov": 1.9228876301699587, + "grad_norm": 0.09229149137870292, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 38.66628289222717 + }, + { + "epoch": 118, + "train_loss": 5.834235620422363, + "train_acc": 0.00838, + "test_loss": 4.605170387268067, + "test_acc": 0.01, + "lyapunov": 1.9234702946889737, + "grad_norm": 0.11393843809281681, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010815327133708009, + "time_sec": 38.67253303527832 + }, + { + "epoch": 119, + "train_loss": 5.836164589385986, + "train_acc": 0.00878, + "test_loss": 4.605170240783691, + "test_acc": 0.01, + "lyapunov": 1.9253446165558017, + "grad_norm": 0.13051062587564605, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010173504098790182, + "time_sec": 38.675392627716064 + }, + { + "epoch": 120, + "train_loss": 5.833294369506836, + "train_acc": 0.00902, + "test_loss": 4.605170152282715, + "test_acc": 0.01, + "lyapunov": 1.9231391212214595, + "grad_norm": 0.09107209306940374, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 38.68769383430481 + }, + { + "epoch": 121, + "train_loss": 5.830208008880615, + "train_acc": 0.00872, + "test_loss": 4.605169981384277, + "test_acc": 0.01, + "lyapunov": 1.920601219777256, + "grad_norm": 0.08818902289292577, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 38.663066148757935 + }, + { + "epoch": 122, + "train_loss": 5.828988634338379, + "train_acc": 0.00866, + "test_loss": 4.6051700424194335, + "test_acc": 0.01, + "lyapunov": 1.9195775912545832, + "grad_norm": 0.08827912521059493, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 38.66604161262512 + }, + { + "epoch": 123, + "train_loss": 5.8335463383483885, + "train_acc": 0.0083, + "test_loss": 4.605170326995849, + "test_acc": 0.01, + "lyapunov": 1.9230621321426937, + "grad_norm": 0.09180967837607329, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 38.66097450256348 + }, + { + "epoch": 124, + "train_loss": 5.8313025344848635, + "train_acc": 0.009, + "test_loss": 4.605170251464844, + "test_acc": 0.01, + "lyapunov": 1.9215273033932347, + "grad_norm": 0.0880278926594288, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 38.678382396698 + }, + { + "epoch": 125, + "train_loss": 5.829151732025147, + "train_acc": 0.00856, + "test_loss": 4.605170100402832, + "test_acc": 0.01, + "lyapunov": 1.9196982078844933, + "grad_norm": 0.08802943628622184, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 38.651947021484375 + }, + { + "epoch": 126, + "train_loss": 5.828555057067871, + "train_acc": 0.00854, + "test_loss": 4.605170222473144, + "test_acc": 0.01, + "lyapunov": 1.9192795976043662, + "grad_norm": 0.088302392455243, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 38.67385935783386 + }, + { + "epoch": 127, + "train_loss": 5.829820846405029, + "train_acc": 0.00872, + "test_loss": 4.605170227050781, + "test_acc": 0.01, + "lyapunov": 1.9203001791254029, + "grad_norm": 0.0881103504591081, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 38.67335605621338 + }, + { + "epoch": 128, + "train_loss": 5.846653115692138, + "train_acc": 0.00814, + "test_loss": 4.605170144653321, + "test_acc": 0.01, + "lyapunov": 1.9271661183413338, + "grad_norm": 0.12434413440967498, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 38.651455879211426 + }, + { + "epoch": 129, + "train_loss": 5.8315210632324215, + "train_acc": 0.00858, + "test_loss": 4.6051701629638675, + "test_acc": 0.01, + "lyapunov": 1.9216848407559992, + "grad_norm": 0.09353770310247324, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 38.65707588195801 + }, + { + "epoch": 130, + "train_loss": 5.833166874389648, + "train_acc": 0.00868, + "test_loss": 4.605170000457764, + "test_acc": 0.01, + "lyapunov": 1.9230641779082511, + "grad_norm": 0.08835242150848918, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 38.65906548500061 + }, + { + "epoch": 131, + "train_loss": 5.82969641418457, + "train_acc": 0.00892, + "test_loss": 4.60517036895752, + "test_acc": 0.01, + "lyapunov": 1.9201975795619017, + "grad_norm": 0.08800100320314078, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 38.66576051712036 + }, + { + "epoch": 132, + "train_loss": 5.830922511901855, + "train_acc": 0.00898, + "test_loss": 4.605170082092285, + "test_acc": 0.01, + "lyapunov": 1.921166550472874, + "grad_norm": 0.08780352004054458, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 38.67506122589111 + }, + { + "epoch": 133, + "train_loss": 5.830705413360596, + "train_acc": 0.0089, + "test_loss": 4.605170077514648, + "test_acc": 0.01, + "lyapunov": 1.9210232758461057, + "grad_norm": 0.08765525433917719, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 38.66982293128967 + }, + { + "epoch": 134, + "train_loss": 5.828949987030029, + "train_acc": 0.0092, + "test_loss": 4.60517048034668, + "test_acc": 0.01, + "lyapunov": 1.9195570479268613, + "grad_norm": 0.0878219052630613, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 38.658127784729004 + }, + { + "epoch": 135, + "train_loss": 5.832552122955322, + "train_acc": 0.00898, + "test_loss": 4.605170314025879, + "test_acc": 0.01, + "lyapunov": 1.922510105935509, + "grad_norm": 0.08848585809638171, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 38.671475887298584 + }, + { + "epoch": 136, + "train_loss": 5.828762425842285, + "train_acc": 0.00862, + "test_loss": 4.605170394897461, + "test_acc": 0.01, + "lyapunov": 1.9194351151166364, + "grad_norm": 0.08813677537771221, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 38.67206072807312 + }, + { + "epoch": 137, + "train_loss": 5.830585724487305, + "train_acc": 0.0092, + "test_loss": 4.605170066833496, + "test_acc": 0.01, + "lyapunov": 1.920962211725962, + "grad_norm": 0.08822452447484254, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 38.67813777923584 + }, + { + "epoch": 138, + "train_loss": 5.8304260397338865, + "train_acc": 0.0081, + "test_loss": 4.605170138549805, + "test_acc": 0.01, + "lyapunov": 1.9208168641990409, + "grad_norm": 0.08849509125868348, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 38.67507195472717 + }, + { + "epoch": 139, + "train_loss": 5.829665904846191, + "train_acc": 0.00956, + "test_loss": 4.60517013092041, + "test_acc": 0.01, + "lyapunov": 1.9201480406324576, + "grad_norm": 0.08790362350901093, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 38.673912048339844 + }, + { + "epoch": 140, + "train_loss": 5.832476518859863, + "train_acc": 0.00906, + "test_loss": 4.6051704071044925, + "test_acc": 0.01, + "lyapunov": 1.9224549364250945, + "grad_norm": 0.08802773683248163, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 38.67948055267334 + }, + { + "epoch": 141, + "train_loss": 5.830304007110596, + "train_acc": 0.00992, + "test_loss": 4.605170399475098, + "test_acc": 0.01, + "lyapunov": 1.920735996702443, + "grad_norm": 0.0882868275030572, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 38.675227880477905 + }, + { + "epoch": 142, + "train_loss": 5.831250300292969, + "train_acc": 0.00984, + "test_loss": 4.605170373535156, + "test_acc": 0.01, + "lyapunov": 1.921463219710933, + "grad_norm": 0.08794004853752245, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 38.70003008842468 + }, + { + "epoch": 143, + "train_loss": 5.832011743011474, + "train_acc": 0.00878, + "test_loss": 4.605170379638672, + "test_acc": 0.01, + "lyapunov": 1.9220852223808502, + "grad_norm": 0.08842628454422183, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 38.69024062156677 + }, + { + "epoch": 144, + "train_loss": 5.829982127532959, + "train_acc": 0.0097, + "test_loss": 4.605170482635498, + "test_acc": 0.01, + "lyapunov": 1.9204687541708008, + "grad_norm": 0.08841994345313893, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 38.6822247505188 + }, + { + "epoch": 145, + "train_loss": 5.831171199645996, + "train_acc": 0.00958, + "test_loss": 4.605170204162597, + "test_acc": 0.01, + "lyapunov": 1.9213833555845958, + "grad_norm": 0.11341783409581589, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 38.68064069747925 + }, + { + "epoch": 146, + "train_loss": 5.832137032470703, + "train_acc": 0.00976, + "test_loss": 4.605170028686524, + "test_acc": 0.01, + "lyapunov": 1.9221693624925735, + "grad_norm": 0.08798089094104568, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 38.68038535118103 + }, + { + "epoch": 147, + "train_loss": 5.83251281906128, + "train_acc": 0.00974, + "test_loss": 4.605170251464844, + "test_acc": 0.01, + "lyapunov": 1.9224824981616282, + "grad_norm": 0.08796659107314206, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 38.673001766204834 + }, + { + "epoch": 148, + "train_loss": 5.829547540588379, + "train_acc": 0.01, + "test_loss": 4.60517032623291, + "test_acc": 0.01, + "lyapunov": 1.920109924757877, + "grad_norm": 0.08826415625381624, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 38.669779539108276 + }, + { + "epoch": 149, + "train_loss": 5.830913259735107, + "train_acc": 0.01, + "test_loss": 4.605170252227783, + "test_acc": 0.01, + "lyapunov": 1.9211858764024037, + "grad_norm": 0.08849620940008496, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 38.67606210708618 + }, + { + "epoch": 150, + "train_loss": 5.830235260314941, + "train_acc": 0.01, + "test_loss": 4.605170276641846, + "test_acc": 0.01, + "lyapunov": 1.9206774539654823, + "grad_norm": 0.08822638497198837, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 38.67439675331116 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 11.062658223266602, + "train_acc": 0.0191, + "test_loss": 4.636551777648926, + "test_acc": 0.0192, + "lyapunov": 4.093391669070934, + "grad_norm": 6.553327303351535, + "grad_max_sv": 5.005066078901291, + "grad_min_sv": 9.498946289543397e-08, + "grad_condition": 96914448.49987349, + "lr": 0.0009998903417374227, + "time_sec": 81.60158228874207 + }, + { + "epoch": 2, + "train_loss": 7.894516683044434, + "train_acc": 0.02232, + "test_loss": 4.509155606079101, + "test_acc": 0.0281, + "lyapunov": 3.109319945430512, + "grad_norm": 4.711594955608515, + "grad_max_sv": 3.8599576711654664, + "grad_min_sv": 5.844970047842041e-08, + "grad_condition": 1689973621.6123517, + "lr": 0.0009995614150494292, + "time_sec": 81.60659170150757 + }, + { + "epoch": 3, + "train_loss": 7.597164999084472, + "train_acc": 0.02292, + "test_loss": 4.547392833709717, + "test_acc": 0.0138, + "lyapunov": 3.040807009353052, + "grad_norm": 3.4020100363883277, + "grad_max_sv": 2.92706837952137, + "grad_min_sv": 3.304632755468228e-08, + "grad_condition": 5977960877.86062, + "lr": 0.0009990133642141358, + "time_sec": 81.63819622993469 + }, + { + "epoch": 4, + "train_loss": 7.466654327392578, + "train_acc": 0.02596, + "test_loss": 4.54970652999878, + "test_acc": 0.0152, + "lyapunov": 3.026890999825714, + "grad_norm": 2.184726348696494, + "grad_max_sv": 1.823475405573845, + "grad_min_sv": 1.0126577207033096e-08, + "grad_condition": 8307876314.683462, + "lr": 0.0009982464296247522, + "time_sec": 81.63975858688354 + }, + { + "epoch": 5, + "train_loss": 7.35825664352417, + "train_acc": 0.0249, + "test_loss": 4.575929130554199, + "test_acc": 0.013, + "lyapunov": 2.9873962725519827, + "grad_norm": 1.2137091228137746, + "grad_max_sv": 0.961378724873066, + "grad_min_sv": 6.631390698336963e-11, + "grad_condition": 115707330637.43631, + "lr": 0.0009972609476841367, + "time_sec": 81.71280694007874 + }, + { + "epoch": 6, + "train_loss": 7.152584227600098, + "train_acc": 0.02408, + "test_loss": 4.546905226135254, + "test_acc": 0.0165, + "lyapunov": 2.8627321110357102, + "grad_norm": 0.7830228200215259, + "grad_max_sv": 0.4966236546635628, + "grad_min_sv": 8.468786915770583e-12, + "grad_condition": 112190115201.81938, + "lr": 0.000996057350657239, + "time_sec": 81.67318558692932 + }, + { + "epoch": 7, + "train_loss": 6.736108720703125, + "train_acc": 0.02286, + "test_loss": 4.6234777084350585, + "test_acc": 0.01, + "lyapunov": 2.6260088990106607, + "grad_norm": 0.503721920030939, + "grad_max_sv": 0.28278580904006956, + "grad_min_sv": 1.9822557287658092e-12, + "grad_condition": 125105415477.25314, + "lr": 0.000994636166481494, + "time_sec": 81.64523100852966 + }, + { + "epoch": 8, + "train_loss": 6.564093143463134, + "train_acc": 0.02234, + "test_loss": 4.611732032775879, + "test_acc": 0.01, + "lyapunov": 2.514471580915134, + "grad_norm": 0.6828735354454265, + "grad_max_sv": 0.2100991995772347, + "grad_min_sv": 6.476987908912428e-13, + "grad_condition": 143664013250.37378, + "lr": 0.0009929980185352525, + "time_sec": 81.63371157646179 + }, + { + "epoch": 9, + "train_loss": 6.828797580261231, + "train_acc": 0.01912, + "test_loss": 4.606410037231445, + "test_acc": 0.01, + "lyapunov": 2.654179959041078, + "grad_norm": 1.0698865873419308, + "grad_max_sv": 0.16152255814522504, + "grad_min_sv": 1.6541991394265796e-13, + "grad_condition": 140818730869.57614, + "lr": 0.0009911436253643444, + "time_sec": 81.60695457458496 + }, + { + "epoch": 10, + "train_loss": 6.993563550720215, + "train_acc": 0.01038, + "test_loss": 4.6257774490356445, + "test_acc": 0.01, + "lyapunov": 2.7042983194141437, + "grad_norm": 0.6205939496010421, + "grad_max_sv": 0.10736188860610127, + "grad_min_sv": 7.417080745085988e-16, + "grad_condition": 107239971660.70801, + "lr": 0.0009890738003669028, + "time_sec": 81.59540891647339 + }, + { + "epoch": 11, + "train_loss": 6.5890699209594725, + "train_acc": 0.01018, + "test_loss": 4.605637271881103, + "test_acc": 0.01, + "lyapunov": 2.468636756053056, + "grad_norm": 0.39837773763043477, + "grad_max_sv": 0.06119964215904474, + "grad_min_sv": 3.8185383152851266e-45, + "grad_condition": 61199642159.044754, + "lr": 0.00098678945143658, + "time_sec": 81.5604145526886 + }, + { + "epoch": 12, + "train_loss": 6.5774819650268554, + "train_acc": 0.01, + "test_loss": 4.605390992736816, + "test_acc": 0.01, + "lyapunov": 2.4586855413968607, + "grad_norm": 0.7705617527781408, + "grad_max_sv": 0.00864509902894497, + "grad_min_sv": 0.0, + "grad_condition": 8645099028.94497, + "lr": 0.0009842915805643154, + "time_sec": 81.49474096298218 + }, + { + "epoch": 13, + "train_loss": 6.546455008239746, + "train_acc": 0.01002, + "test_loss": 4.605277996826172, + "test_acc": 0.01, + "lyapunov": 2.435590844020209, + "grad_norm": 0.5128829478227843, + "grad_max_sv": 0.004509441927075386, + "grad_min_sv": 0.0, + "grad_condition": 4509441927.075386, + "lr": 0.000981581283398829, + "time_sec": 81.4997489452362 + }, + { + "epoch": 14, + "train_loss": 6.575126316833496, + "train_acc": 0.00944, + "test_loss": 4.605232641601562, + "test_acc": 0.01, + "lyapunov": 2.451746358895851, + "grad_norm": 0.5181440557950673, + "grad_max_sv": 0.013719148561358451, + "grad_min_sv": 0.0, + "grad_condition": 13719148561.358452, + "lr": 0.0009786597487660333, + "time_sec": 81.5125732421875 + }, + { + "epoch": 15, + "train_loss": 6.587129125061035, + "train_acc": 0.0092, + "test_loss": 4.605205821228028, + "test_acc": 0.01, + "lyapunov": 2.453917900314721, + "grad_norm": 0.6398426435720163, + "grad_max_sv": 0.0049395252019166945, + "grad_min_sv": 0.0, + "grad_condition": 4939525201.916695, + "lr": 0.0009755282581475766, + "time_sec": 81.50915098190308 + }, + { + "epoch": 16, + "train_loss": 6.420363327789307, + "train_acc": 0.00962, + "test_loss": 4.605900651550293, + "test_acc": 0.01, + "lyapunov": 2.3524727979889306, + "grad_norm": 0.5507826914381541, + "grad_max_sv": 0.06663376707583665, + "grad_min_sv": 0.0, + "grad_condition": 66633767075.836655, + "lr": 0.0009721881851187403, + "time_sec": 81.59744453430176 + }, + { + "epoch": 17, + "train_loss": 6.291905773010254, + "train_acc": 0.00924, + "test_loss": 4.605198278045655, + "test_acc": 0.01, + "lyapunov": 2.2705817686017515, + "grad_norm": 0.20954429598020885, + "grad_max_sv": 0.007087096758186817, + "grad_min_sv": 0.0, + "grad_condition": 7087096758.186816, + "lr": 0.0009686409947459456, + "time_sec": 81.51701307296753 + }, + { + "epoch": 18, + "train_loss": 6.280198426513672, + "train_acc": 0.00956, + "test_loss": 4.605187928009033, + "test_acc": 0.01, + "lyapunov": 2.262371898612098, + "grad_norm": 0.15673318486817656, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009648882429441254, + "time_sec": 81.49850106239319 + }, + { + "epoch": 19, + "train_loss": 6.319409269714355, + "train_acc": 0.00894, + "test_loss": 4.605180485534668, + "test_acc": 0.01, + "lyapunov": 2.2773679802789712, + "grad_norm": 0.18004037135900994, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00096093157579425, + "time_sec": 81.52363634109497 + }, + { + "epoch": 20, + "train_loss": 6.279429423370361, + "train_acc": 0.0089, + "test_loss": 4.605177160644531, + "test_acc": 0.01, + "lyapunov": 2.261986050764313, + "grad_norm": 0.10793581510968044, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009567727288213001, + "time_sec": 81.49810361862183 + }, + { + "epoch": 21, + "train_loss": 6.277427138519287, + "train_acc": 0.00862, + "test_loss": 4.605176016998291, + "test_acc": 0.01, + "lyapunov": 2.2604778922732223, + "grad_norm": 0.1164667413797286, + "grad_max_sv": 0.005474003031849861, + "grad_min_sv": 0.0, + "grad_condition": 5474003031.849861, + "lr": 0.0009524135262330095, + "time_sec": 81.49689865112305 + }, + { + "epoch": 22, + "train_loss": 6.275057526855469, + "train_acc": 0.0092, + "test_loss": 4.605175686645508, + "test_acc": 0.01, + "lyapunov": 2.258924939748271, + "grad_norm": 0.11032559480193316, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009478558801197061, + "time_sec": 81.49366521835327 + }, + { + "epoch": 23, + "train_loss": 6.280477966156006, + "train_acc": 0.00834, + "test_loss": 4.60517352142334, + "test_acc": 0.01, + "lyapunov": 2.262287087452686, + "grad_norm": 0.11733428454185782, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000943101789615607, + "time_sec": 81.4926176071167 + }, + { + "epoch": 24, + "train_loss": 6.27477842300415, + "train_acc": 0.00888, + "test_loss": 4.6051733123779295, + "test_acc": 0.01, + "lyapunov": 2.2587200552606217, + "grad_norm": 0.09563398461056706, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009381533400219313, + "time_sec": 81.48560309410095 + }, + { + "epoch": 25, + "train_loss": 6.275597013549804, + "train_acc": 0.00864, + "test_loss": 4.605174243927002, + "test_acc": 0.01, + "lyapunov": 2.259342540560476, + "grad_norm": 0.10626239815682126, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009330127018922189, + "time_sec": 81.50195908546448 + }, + { + "epoch": 26, + "train_loss": 6.307570930175781, + "train_acc": 0.00846, + "test_loss": 4.6051738105773925, + "test_acc": 0.01, + "lyapunov": 2.2765520228754226, + "grad_norm": 0.15671024580485657, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000927682130080253, + "time_sec": 81.48380661010742 + }, + { + "epoch": 27, + "train_loss": 6.3007610939025875, + "train_acc": 0.00916, + "test_loss": 4.605174212646484, + "test_acc": 0.01, + "lyapunov": 2.2724761200682893, + "grad_norm": 0.15438417468612603, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009221639627510072, + "time_sec": 81.49885392189026 + }, + { + "epoch": 28, + "train_loss": 6.279321163024902, + "train_acc": 0.0084, + "test_loss": 4.605173818206787, + "test_acc": 0.01, + "lyapunov": 2.261768304478482, + "grad_norm": 0.12913751626297293, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009164606203550494, + "time_sec": 81.51960349082947 + }, + { + "epoch": 29, + "train_loss": 6.296547222290039, + "train_acc": 0.00844, + "test_loss": 4.605173532104492, + "test_acc": 0.01, + "lyapunov": 2.269540443444801, + "grad_norm": 0.1257561792074065, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009105746045668516, + "time_sec": 81.48529624938965 + }, + { + "epoch": 30, + "train_loss": 6.301725520019532, + "train_acc": 0.00894, + "test_loss": 4.605173407745362, + "test_acc": 0.01, + "lyapunov": 2.2715838626217657, + "grad_norm": 0.14077235565425347, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009045084971874733, + "time_sec": 81.47704434394836 + }, + { + "epoch": 31, + "train_loss": 6.279767997894287, + "train_acc": 0.0086, + "test_loss": 4.6051743087768555, + "test_acc": 0.01, + "lyapunov": 2.261623111222406, + "grad_norm": 0.11414807727359211, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008982649590120977, + "time_sec": 81.51038384437561 + }, + { + "epoch": 32, + "train_loss": 6.314449734039306, + "train_acc": 0.0091, + "test_loss": 4.605173248291016, + "test_acc": 0.01, + "lyapunov": 2.27814206686776, + "grad_norm": 0.15985043411867914, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008918467286629196, + "time_sec": 81.49317169189453 + }, + { + "epoch": 33, + "train_loss": 6.281702154998779, + "train_acc": 0.0086, + "test_loss": 4.605174011993408, + "test_acc": 0.01, + "lyapunov": 2.262753884810621, + "grad_norm": 0.12070866490334974, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008852566213878943, + "time_sec": 81.49454641342163 + }, + { + "epoch": 34, + "train_loss": 6.2773644987487796, + "train_acc": 0.00906, + "test_loss": 4.605173474121094, + "test_acc": 0.01, + "lyapunov": 2.260565836411303, + "grad_norm": 0.11129476697402911, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000878497527825878, + "time_sec": 81.58190107345581 + }, + { + "epoch": 35, + "train_loss": 6.309268474578857, + "train_acc": 0.00864, + "test_loss": 4.605172872161865, + "test_acc": 0.01, + "lyapunov": 2.277102802110755, + "grad_norm": 0.17254724942107424, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000871572412738697, + "time_sec": 81.51573705673218 + }, + { + "epoch": 36, + "train_loss": 6.2885913528442385, + "train_acc": 0.00894, + "test_loss": 4.605173197937011, + "test_acc": 0.01, + "lyapunov": 2.2663694641474263, + "grad_norm": 0.12446302100514797, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008644843137107055, + "time_sec": 81.4983901977539 + }, + { + "epoch": 37, + "train_loss": 6.314083187561035, + "train_acc": 0.00826, + "test_loss": 4.605172673034668, + "test_acc": 0.01, + "lyapunov": 2.2792197420164144, + "grad_norm": 0.19167369428125208, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008572363398164014, + "time_sec": 81.4910204410553 + }, + { + "epoch": 38, + "train_loss": 6.276701861419678, + "train_acc": 0.00804, + "test_loss": 4.605172772979737, + "test_acc": 0.01, + "lyapunov": 2.260084454055942, + "grad_norm": 0.10142640032392508, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008498316702566826, + "time_sec": 81.49372029304504 + }, + { + "epoch": 39, + "train_loss": 6.2982295426940915, + "train_acc": 0.00834, + "test_loss": 4.605172825622558, + "test_acc": 0.01, + "lyapunov": 2.271109230378095, + "grad_norm": 0.13881594105822967, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008422735529643442, + "time_sec": 81.50897860527039 + }, + { + "epoch": 40, + "train_loss": 6.282011164550782, + "train_acc": 0.00864, + "test_loss": 4.607664538574219, + "test_acc": 0.01, + "lyapunov": 2.263592470637368, + "grad_norm": 0.1022934137238382, + "grad_max_sv": 0.006253971112892031, + "grad_min_sv": 0.0, + "grad_condition": 6253971112.892032, + "lr": 0.0008345653031794289, + "time_sec": 81.51133847236633 + }, + { + "epoch": 41, + "train_loss": 6.283648276977539, + "train_acc": 0.00898, + "test_loss": 4.615698904418945, + "test_acc": 0.01, + "lyapunov": 2.2645610153217755, + "grad_norm": 0.12524739066407903, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008267103019950526, + "time_sec": 81.50317192077637 + }, + { + "epoch": 42, + "train_loss": 6.291501354827881, + "train_acc": 0.00914, + "test_loss": 4.605554750061035, + "test_acc": 0.01, + "lyapunov": 2.267925240499589, + "grad_norm": 0.1307307918214705, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743447, + "time_sec": 81.48968553543091 + }, + { + "epoch": 43, + "train_loss": 6.276330156860352, + "train_acc": 0.00896, + "test_loss": 4.605246144104004, + "test_acc": 0.01, + "lyapunov": 2.2598801464071054, + "grad_norm": 0.0933943349122675, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000810573890139155, + "time_sec": 81.50180649757385 + }, + { + "epoch": 44, + "train_loss": 6.2769957354736325, + "train_acc": 0.00898, + "test_loss": 4.60537618560791, + "test_acc": 0.01, + "lyapunov": 2.26023776756833, + "grad_norm": 0.10724706931673801, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008022995574311873, + "time_sec": 81.48934960365295 + }, + { + "epoch": 45, + "train_loss": 6.27975429473877, + "train_acc": 0.0095, + "test_loss": 4.605248934936523, + "test_acc": 0.01, + "lyapunov": 2.2623073298607945, + "grad_norm": 0.095192742319822, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007938926261462363, + "time_sec": 81.50000143051147 + }, + { + "epoch": 46, + "train_loss": 6.297380412445069, + "train_acc": 0.00876, + "test_loss": 4.6052475326538085, + "test_acc": 0.01, + "lyapunov": 2.271654522327511, + "grad_norm": 0.1534535578732401, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007853567838422158, + "time_sec": 81.47789859771729 + }, + { + "epoch": 47, + "train_loss": 6.282922696990966, + "train_acc": 0.0092, + "test_loss": 4.605248429107666, + "test_acc": 0.01, + "lyapunov": 2.264536363084603, + "grad_norm": 0.10842785613108402, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007766957746216719, + "time_sec": 81.48331236839294 + }, + { + "epoch": 48, + "train_loss": 6.280480013275146, + "train_acc": 0.00806, + "test_loss": 4.605249649047852, + "test_acc": 0.01, + "lyapunov": 2.2628020630468186, + "grad_norm": 0.09295297080650741, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894982, + "time_sec": 81.48791313171387 + }, + { + "epoch": 49, + "train_loss": 6.295236266479492, + "train_acc": 0.0081, + "test_loss": 4.605244645690918, + "test_acc": 0.01, + "lyapunov": 2.270114410868691, + "grad_norm": 0.14920321268372522, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000759013504686565, + "time_sec": 81.49582886695862 + }, + { + "epoch": 50, + "train_loss": 6.315434308013916, + "train_acc": 0.00828, + "test_loss": 4.605247691345215, + "test_acc": 0.01, + "lyapunov": 2.2807927832883945, + "grad_norm": 0.17847170404488147, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007499999999999998, + "time_sec": 81.49979019165039 + }, + { + "epoch": 51, + "train_loss": 6.302057292938232, + "train_acc": 0.009, + "test_loss": 4.605251131439209, + "test_acc": 0.01, + "lyapunov": 2.2735387291139957, + "grad_norm": 0.1418090218860237, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007408768370508575, + "time_sec": 81.49881410598755 + }, + { + "epoch": 52, + "train_loss": 6.278756464233399, + "train_acc": 0.00866, + "test_loss": 4.605250935363769, + "test_acc": 0.01, + "lyapunov": 2.2616379620778897, + "grad_norm": 0.09283264461248593, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007316480175599307, + "time_sec": 81.49807143211365 + }, + { + "epoch": 53, + "train_loss": 6.276537058105469, + "train_acc": 0.00894, + "test_loss": 4.605252996826172, + "test_acc": 0.01, + "lyapunov": 2.2600054393339035, + "grad_norm": 0.09889008649312356, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007223175895924635, + "time_sec": 81.50720810890198 + }, + { + "epoch": 54, + "train_loss": 6.2842115702819825, + "train_acc": 0.0088, + "test_loss": 4.60517135925293, + "test_acc": 0.01, + "lyapunov": 2.2653747550057024, + "grad_norm": 0.1176830015085984, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825361, + "time_sec": 81.49119186401367 + }, + { + "epoch": 55, + "train_loss": 6.280401730041504, + "train_acc": 0.00886, + "test_loss": 4.605172096252441, + "test_acc": 0.01, + "lyapunov": 2.262633579771232, + "grad_norm": 0.10354075360180534, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007033683215378998, + "time_sec": 81.49315738677979 + }, + { + "epoch": 56, + "train_loss": 6.316937896728516, + "train_acc": 0.00866, + "test_loss": 4.605172169494629, + "test_acc": 0.01, + "lyapunov": 2.2807149234635142, + "grad_norm": 0.15351000119410838, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006937577932260512, + "time_sec": 81.5045874118805 + }, + { + "epoch": 57, + "train_loss": 6.296867928161621, + "train_acc": 0.00924, + "test_loss": 4.605172319030761, + "test_acc": 0.01, + "lyapunov": 2.272276422861592, + "grad_norm": 0.14439465021569048, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423388, + "time_sec": 81.49606895446777 + }, + { + "epoch": 58, + "train_loss": 6.277121980133057, + "train_acc": 0.00822, + "test_loss": 4.605172018432617, + "test_acc": 0.01, + "lyapunov": 2.26043635926893, + "grad_norm": 0.09147768117276701, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006742860236609073, + "time_sec": 81.49943733215332 + }, + { + "epoch": 59, + "train_loss": 6.2761470947265625, + "train_acc": 0.00864, + "test_loss": 4.605172242736816, + "test_acc": 0.01, + "lyapunov": 2.2597581962185442, + "grad_norm": 0.0885807415167131, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006644333233692913, + "time_sec": 81.49118137359619 + }, + { + "epoch": 60, + "train_loss": 6.297447052307129, + "train_acc": 0.00916, + "test_loss": 4.605172019195557, + "test_acc": 0.01, + "lyapunov": 2.2733187815722298, + "grad_norm": 0.15437497590627458, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874734, + "time_sec": 81.49486422538757 + }, + { + "epoch": 61, + "train_loss": 6.3111451325988766, + "train_acc": 0.00872, + "test_loss": 4.605171881103516, + "test_acc": 0.01, + "lyapunov": 2.279795357638308, + "grad_norm": 0.1590526758324701, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006445158984722354, + "time_sec": 81.56430292129517 + }, + { + "epoch": 62, + "train_loss": 6.295817751617432, + "train_acc": 0.00874, + "test_loss": 4.605171612548828, + "test_acc": 0.01, + "lyapunov": 2.271848827981583, + "grad_norm": 0.1613023358766049, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006344599103076324, + "time_sec": 81.48160147666931 + }, + { + "epoch": 63, + "train_loss": 6.307024629974365, + "train_acc": 0.0085, + "test_loss": 4.605171653747559, + "test_acc": 0.01, + "lyapunov": 2.2748339487158735, + "grad_norm": 0.13676348001909264, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824269, + "time_sec": 81.48560905456543 + }, + { + "epoch": 64, + "train_loss": 6.277896643218994, + "train_acc": 0.00846, + "test_loss": 4.605171467590332, + "test_acc": 0.01, + "lyapunov": 2.261008509589583, + "grad_norm": 0.09063727687835958, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006141754350553275, + "time_sec": 81.4799861907959 + }, + { + "epoch": 65, + "train_loss": 6.285225621643066, + "train_acc": 0.00848, + "test_loss": 4.605171078491211, + "test_acc": 0.01, + "lyapunov": 2.2658682217073562, + "grad_norm": 0.10317682067163818, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006039558454088793, + "time_sec": 81.51162958145142 + }, + { + "epoch": 66, + "train_loss": 6.280715701446534, + "train_acc": 0.00842, + "test_loss": 4.605171147918701, + "test_acc": 0.01, + "lyapunov": 2.2628414155272267, + "grad_norm": 0.09673219941672938, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000593690657292862, + "time_sec": 81.47932028770447 + }, + { + "epoch": 67, + "train_loss": 6.277698368530274, + "train_acc": 0.00856, + "test_loss": 4.6051715675354, + "test_acc": 0.01, + "lyapunov": 2.26088782466586, + "grad_norm": 0.09056972140208994, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005833843733580507, + "time_sec": 81.48698115348816 + }, + { + "epoch": 68, + "train_loss": 6.30627403137207, + "train_acc": 0.00826, + "test_loss": 4.605171142578125, + "test_acc": 0.01, + "lyapunov": 2.2745680943169555, + "grad_norm": 0.13148861913625765, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005730415142812054, + "time_sec": 81.49131727218628 + }, + { + "epoch": 69, + "train_loss": 6.280330782623291, + "train_acc": 0.00892, + "test_loss": 4.605170972442627, + "test_acc": 0.01, + "lyapunov": 2.2627177104315797, + "grad_norm": 0.1124362788188755, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821517, + "time_sec": 83.16999244689941 + }, + { + "epoch": 70, + "train_loss": 6.28732081451416, + "train_acc": 0.00818, + "test_loss": 4.605170994567871, + "test_acc": 0.01, + "lyapunov": 2.2672290460532887, + "grad_norm": 0.10634119980305662, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005522642316338265, + "time_sec": 81.48939347267151 + }, + { + "epoch": 71, + "train_loss": 6.279782330627442, + "train_acc": 0.00912, + "test_loss": 4.605171276855469, + "test_acc": 0.01, + "lyapunov": 2.262383164652168, + "grad_norm": 0.10626668013646236, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005418389216661573, + "time_sec": 81.48840260505676 + }, + { + "epoch": 72, + "train_loss": 6.295553107910156, + "train_acc": 0.00816, + "test_loss": 4.605171234130859, + "test_acc": 0.01, + "lyapunov": 2.2699396323669903, + "grad_norm": 0.10087516213292237, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646563, + "time_sec": 81.66768407821655 + }, + { + "epoch": 73, + "train_loss": 6.279174601287842, + "train_acc": 0.00854, + "test_loss": 4.605171266174317, + "test_acc": 0.01, + "lyapunov": 2.261961253402788, + "grad_norm": 0.09224354382614662, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005209378268645994, + "time_sec": 81.47679734230042 + }, + { + "epoch": 74, + "train_loss": 6.282529046783448, + "train_acc": 0.00878, + "test_loss": 4.605171199035644, + "test_acc": 0.01, + "lyapunov": 2.263870295966068, + "grad_norm": 0.09731782277810722, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005104712099416781, + "time_sec": 81.49993348121643 + }, + { + "epoch": 75, + "train_loss": 6.277901949768067, + "train_acc": 0.0089, + "test_loss": 4.605170727539062, + "test_acc": 0.01, + "lyapunov": 2.261039003996593, + "grad_norm": 0.09211112509965803, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004999999999999996, + "time_sec": 81.50083065032959 + }, + { + "epoch": 76, + "train_loss": 6.340216960601807, + "train_acc": 0.00838, + "test_loss": 4.605170699310302, + "test_acc": 0.01, + "lyapunov": 2.2909446268740212, + "grad_norm": 0.23685392065021807, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004895287900583212, + "time_sec": 81.50020790100098 + }, + { + "epoch": 77, + "train_loss": 6.312104174957275, + "train_acc": 0.00864, + "test_loss": 4.605171252441406, + "test_acc": 0.01, + "lyapunov": 2.2805933543788197, + "grad_norm": 0.18831482170422406, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004790621731353997, + "time_sec": 81.49737644195557 + }, + { + "epoch": 78, + "train_loss": 6.2789193016052245, + "train_acc": 0.00852, + "test_loss": 4.605171314239502, + "test_acc": 0.01, + "lyapunov": 2.261766994090946, + "grad_norm": 0.0924358449039435, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000468604740235343, + "time_sec": 81.48207116127014 + }, + { + "epoch": 79, + "train_loss": 6.278578204803467, + "train_acc": 0.00926, + "test_loss": 4.6051709121704105, + "test_acc": 0.01, + "lyapunov": 2.2615611260504367, + "grad_norm": 0.106081439799758, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00045816107833384175, + "time_sec": 81.5153739452362 + }, + { + "epoch": 80, + "train_loss": 6.280757647094727, + "train_acc": 0.00926, + "test_loss": 4.605170848083496, + "test_acc": 0.01, + "lyapunov": 2.2630625789427694, + "grad_norm": 0.09000806752766331, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004477357683661729, + "time_sec": 81.48912286758423 + }, + { + "epoch": 81, + "train_loss": 6.281069091949463, + "train_acc": 0.00898, + "test_loss": 4.605170893859864, + "test_acc": 0.01, + "lyapunov": 2.263333380984528, + "grad_norm": 0.09221512328536063, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784746, + "time_sec": 81.5581386089325 + }, + { + "epoch": 82, + "train_loss": 6.27887787902832, + "train_acc": 0.0087, + "test_loss": 4.605170852661133, + "test_acc": 0.01, + "lyapunov": 2.261768191671737, + "grad_norm": 0.09223604647823178, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004269584857187939, + "time_sec": 81.48868751525879 + }, + { + "epoch": 83, + "train_loss": 6.283419313049317, + "train_acc": 0.00842, + "test_loss": 4.605170945739746, + "test_acc": 0.01, + "lyapunov": 2.2647099933965738, + "grad_norm": 0.11489596444213686, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004166156266419484, + "time_sec": 81.48753881454468 + }, + { + "epoch": 84, + "train_loss": 6.331098417663574, + "train_acc": 0.00886, + "test_loss": 4.605170746612549, + "test_acc": 0.01, + "lyapunov": 2.288768025005565, + "grad_norm": 0.21523480615204088, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004063093427071373, + "time_sec": 81.49917888641357 + }, + { + "epoch": 85, + "train_loss": 6.279946563415527, + "train_acc": 0.00858, + "test_loss": 4.605170806884765, + "test_acc": 0.01, + "lyapunov": 2.262576125162032, + "grad_norm": 0.09063877969543369, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003960441545911199, + "time_sec": 81.49754786491394 + }, + { + "epoch": 86, + "train_loss": 6.294878379211426, + "train_acc": 0.0082, + "test_loss": 4.605170738983154, + "test_acc": 0.01, + "lyapunov": 2.270076130967006, + "grad_norm": 0.11269347737073286, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003858245649446718, + "time_sec": 81.49726057052612 + }, + { + "epoch": 87, + "train_loss": 6.2920974577331545, + "train_acc": 0.009, + "test_loss": 4.6051703125, + "test_acc": 0.01, + "lyapunov": 2.2685716097312207, + "grad_norm": 0.14345779012680526, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00037565505641757235, + "time_sec": 81.51811003684998 + }, + { + "epoch": 88, + "train_loss": 6.280257380981445, + "train_acc": 0.00862, + "test_loss": 4.605170468139648, + "test_acc": 0.01, + "lyapunov": 2.262734867422782, + "grad_norm": 0.089208601870095, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036554008969236695, + "time_sec": 81.54773998260498 + }, + { + "epoch": 89, + "train_loss": 6.281720874176026, + "train_acc": 0.00798, + "test_loss": 4.605170385742188, + "test_acc": 0.01, + "lyapunov": 2.2637228892587333, + "grad_norm": 0.13294770236555567, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003554841015277638, + "time_sec": 81.49507021903992 + }, + { + "epoch": 90, + "train_loss": 6.282031690979004, + "train_acc": 0.00864, + "test_loss": 4.6051704216003415, + "test_acc": 0.01, + "lyapunov": 2.263972556804452, + "grad_norm": 0.09670924579322722, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000345491502812526, + "time_sec": 81.50043749809265 + }, + { + "epoch": 91, + "train_loss": 6.281220606231689, + "train_acc": 0.00882, + "test_loss": 4.605170685577392, + "test_acc": 0.01, + "lyapunov": 2.2634493798551047, + "grad_norm": 0.08948481670861189, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003355666766307081, + "time_sec": 81.50585508346558 + }, + { + "epoch": 92, + "train_loss": 6.279705551147461, + "train_acc": 0.00862, + "test_loss": 4.60517056274414, + "test_acc": 0.01, + "lyapunov": 2.2624147529797174, + "grad_norm": 0.09256700006903949, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00032571397633909225, + "time_sec": 81.51557660102844 + }, + { + "epoch": 93, + "train_loss": 6.281244622955322, + "train_acc": 0.0087, + "test_loss": 4.60517061920166, + "test_acc": 0.01, + "lyapunov": 2.2632562803185503, + "grad_norm": 0.11132757286060115, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766094, + "time_sec": 81.49661374092102 + }, + { + "epoch": 94, + "train_loss": 6.306097177734375, + "train_acc": 0.00858, + "test_loss": 4.605170388793946, + "test_acc": 0.01, + "lyapunov": 2.274985415856247, + "grad_norm": 0.14003151421649307, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003062422067739483, + "time_sec": 81.48347187042236 + }, + { + "epoch": 95, + "train_loss": 6.283950561676026, + "train_acc": 0.00878, + "test_loss": 4.605170606994629, + "test_acc": 0.01, + "lyapunov": 2.264391293001297, + "grad_norm": 0.11506545388832123, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00029663167846209965, + "time_sec": 81.5063374042511 + }, + { + "epoch": 96, + "train_loss": 6.302323147125244, + "train_acc": 0.00874, + "test_loss": 4.60517081451416, + "test_acc": 0.01, + "lyapunov": 2.274367270872111, + "grad_norm": 0.12307854636703328, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00028711035421746345, + "time_sec": 81.4797682762146 + }, + { + "epoch": 97, + "train_loss": 6.281584391479492, + "train_acc": 0.00864, + "test_loss": 4.605170351409912, + "test_acc": 0.01, + "lyapunov": 2.2636835014118866, + "grad_norm": 0.10251001946667801, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00027768241040753615, + "time_sec": 81.49354839324951 + }, + { + "epoch": 98, + "train_loss": 6.2782898904418944, + "train_acc": 0.00868, + "test_loss": 4.60517045135498, + "test_acc": 0.01, + "lyapunov": 2.261435853245923, + "grad_norm": 0.08854436555507054, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00026835198244006903, + "time_sec": 81.4875979423523 + }, + { + "epoch": 99, + "train_loss": 6.295129021606446, + "train_acc": 0.0082, + "test_loss": 4.605170526123047, + "test_acc": 0.01, + "lyapunov": 2.2712618536351585, + "grad_norm": 0.11715866448048785, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002591231629491421, + "time_sec": 81.48900055885315 + }, + { + "epoch": 100, + "train_loss": 6.278292948303223, + "train_acc": 0.00866, + "test_loss": 4.605170332336426, + "test_acc": 0.01, + "lyapunov": 2.2613569385255388, + "grad_norm": 0.09963153634244509, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002499999999999997, + "time_sec": 81.49986267089844 + }, + { + "epoch": 101, + "train_loss": 6.278483645935059, + "train_acc": 0.00804, + "test_loss": 4.60517053604126, + "test_acc": 0.01, + "lyapunov": 2.261537701272599, + "grad_norm": 0.08871006809333543, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00024098649531343477, + "time_sec": 81.51374125480652 + }, + { + "epoch": 102, + "train_loss": 6.280324393310547, + "train_acc": 0.00806, + "test_loss": 4.605170599365234, + "test_acc": 0.01, + "lyapunov": 2.262814277883076, + "grad_norm": 0.08821870247597413, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002320866025105016, + "time_sec": 81.50025415420532 + }, + { + "epoch": 103, + "train_loss": 6.2799532815551755, + "train_acc": 0.00876, + "test_loss": 4.605170227050781, + "test_acc": 0.01, + "lyapunov": 2.2625574236330777, + "grad_norm": 0.08935081241113577, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002233042253783278, + "time_sec": 81.50659584999084 + }, + { + "epoch": 104, + "train_loss": 6.298912643432617, + "train_acc": 0.00842, + "test_loss": 4.60517052154541, + "test_acc": 0.01, + "lyapunov": 2.2703244808079948, + "grad_norm": 0.11414965346863236, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000214643216157784, + "time_sec": 81.5045850276947 + }, + { + "epoch": 105, + "train_loss": 6.290122275390625, + "train_acc": 0.0086, + "test_loss": 4.605170248413086, + "test_acc": 0.01, + "lyapunov": 2.268586759981902, + "grad_norm": 0.09478727747372748, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376332, + "time_sec": 81.49806952476501 + }, + { + "epoch": 106, + "train_loss": 6.29548063659668, + "train_acc": 0.00866, + "test_loss": 4.605170534515381, + "test_acc": 0.01, + "lyapunov": 2.2701295159966746, + "grad_norm": 0.11489602174527157, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019770044256881242, + "time_sec": 81.48596048355103 + }, + { + "epoch": 107, + "train_loss": 6.282184426269532, + "train_acc": 0.0082, + "test_loss": 4.605170352172852, + "test_acc": 0.01, + "lyapunov": 2.2641438352482397, + "grad_norm": 0.08961045804319463, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001894261098608447, + "time_sec": 81.49523115158081 + }, + { + "epoch": 108, + "train_loss": 6.2777880932617185, + "train_acc": 0.00864, + "test_loss": 4.605170249938965, + "test_acc": 0.01, + "lyapunov": 2.2611292018305007, + "grad_norm": 0.08837496982685777, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000181288005125655, + "time_sec": 81.5235505104065 + }, + { + "epoch": 109, + "train_loss": 6.279533188171387, + "train_acc": 0.00846, + "test_loss": 4.6051705436706545, + "test_acc": 0.01, + "lyapunov": 2.2622785964585326, + "grad_norm": 0.09025198956904176, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001732896980049473, + "time_sec": 81.49149775505066 + }, + { + "epoch": 110, + "train_loss": 6.281950114135742, + "train_acc": 0.00808, + "test_loss": 4.605170324707031, + "test_acc": 0.01, + "lyapunov": 2.2638927835332767, + "grad_norm": 0.09569022356709349, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016543469682057076, + "time_sec": 81.48516082763672 + }, + { + "epoch": 111, + "train_loss": 6.28185485534668, + "train_acc": 0.00926, + "test_loss": 4.6051703125, + "test_acc": 0.01, + "lyapunov": 2.2638340045119185, + "grad_norm": 0.08892162931996153, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 81.49398422241211 + }, + { + "epoch": 112, + "train_loss": 6.310760371704101, + "train_acc": 0.0083, + "test_loss": 4.605170272064209, + "test_acc": 0.01, + "lyapunov": 2.2783618381870983, + "grad_norm": 0.14829000342501422, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 81.47959303855896 + }, + { + "epoch": 113, + "train_loss": 6.280448321685791, + "train_acc": 0.00868, + "test_loss": 4.605170561218261, + "test_acc": 0.01, + "lyapunov": 2.262940209235072, + "grad_norm": 0.08905882191321668, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 81.49572110176086 + }, + { + "epoch": 114, + "train_loss": 6.29521280166626, + "train_acc": 0.00898, + "test_loss": 4.6051701675415035, + "test_acc": 0.01, + "lyapunov": 2.2707663734855554, + "grad_norm": 0.10226349996651533, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00013551568628929425, + "time_sec": 81.48670983314514 + }, + { + "epoch": 115, + "train_loss": 6.2799824197387695, + "train_acc": 0.00898, + "test_loss": 4.605170332336426, + "test_acc": 0.01, + "lyapunov": 2.2626387176611233, + "grad_norm": 0.08828544817683198, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 81.48745203018188 + }, + { + "epoch": 116, + "train_loss": 6.2778549322509765, + "train_acc": 0.00826, + "test_loss": 4.6051702964782715, + "test_acc": 0.01, + "lyapunov": 2.26113668122255, + "grad_norm": 0.08806272896088922, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 81.54066944122314 + }, + { + "epoch": 117, + "train_loss": 6.279518751220703, + "train_acc": 0.00934, + "test_loss": 4.605170413208008, + "test_acc": 0.01, + "lyapunov": 2.2623144555884553, + "grad_norm": 0.0877771191158831, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 81.48839020729065 + }, + { + "epoch": 118, + "train_loss": 6.281088227996826, + "train_acc": 0.00902, + "test_loss": 4.605170362854004, + "test_acc": 0.01, + "lyapunov": 2.2633964198324685, + "grad_norm": 0.0880896864668632, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010815327133708009, + "time_sec": 81.50261282920837 + }, + { + "epoch": 119, + "train_loss": 6.282254580841064, + "train_acc": 0.00884, + "test_loss": 4.605170101165771, + "test_acc": 0.01, + "lyapunov": 2.264233167214162, + "grad_norm": 0.08831557648722567, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010173504098790182, + "time_sec": 81.52568435668945 + }, + { + "epoch": 120, + "train_loss": 6.277676391906739, + "train_acc": 0.0087, + "test_loss": 4.6051705383300785, + "test_acc": 0.01, + "lyapunov": 2.2610504279661057, + "grad_norm": 0.08852764058763012, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 81.50404500961304 + }, + { + "epoch": 121, + "train_loss": 6.282078470611572, + "train_acc": 0.00904, + "test_loss": 4.605170125579834, + "test_acc": 0.01, + "lyapunov": 2.264081825685623, + "grad_norm": 0.08733889209956962, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 81.49174380302429 + }, + { + "epoch": 122, + "train_loss": 6.280417911529541, + "train_acc": 0.00854, + "test_loss": 4.605170150756836, + "test_acc": 0.01, + "lyapunov": 2.2629349579286697, + "grad_norm": 0.08896774607886365, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 81.48855018615723 + }, + { + "epoch": 123, + "train_loss": 6.279605996398926, + "train_acc": 0.00798, + "test_loss": 4.605170092773437, + "test_acc": 0.01, + "lyapunov": 2.262386467755603, + "grad_norm": 0.08795933479592377, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 81.50146007537842 + }, + { + "epoch": 124, + "train_loss": 6.291684345397949, + "train_acc": 0.00856, + "test_loss": 4.6051700492858885, + "test_acc": 0.01, + "lyapunov": 2.2678240815087047, + "grad_norm": 0.11392589044407447, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 81.48491311073303 + }, + { + "epoch": 125, + "train_loss": 6.285427192077637, + "train_acc": 0.00888, + "test_loss": 4.605170321655273, + "test_acc": 0.01, + "lyapunov": 2.2660442904743086, + "grad_norm": 0.1133754054706649, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 81.49100470542908 + }, + { + "epoch": 126, + "train_loss": 6.280400201568604, + "train_acc": 0.00878, + "test_loss": 4.6051705368041995, + "test_acc": 0.01, + "lyapunov": 2.2629254120390128, + "grad_norm": 0.08821452866992016, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 81.49153852462769 + }, + { + "epoch": 127, + "train_loss": 6.279529089202881, + "train_acc": 0.0088, + "test_loss": 4.605170316314697, + "test_acc": 0.01, + "lyapunov": 2.2623902915993614, + "grad_norm": 0.08745608733781365, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 81.50230026245117 + }, + { + "epoch": 128, + "train_loss": 6.278408692016601, + "train_acc": 0.00888, + "test_loss": 4.605170304870605, + "test_acc": 0.01, + "lyapunov": 2.261508503228502, + "grad_norm": 0.08825893270809801, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 81.49138951301575 + }, + { + "epoch": 129, + "train_loss": 6.279044237976074, + "train_acc": 0.00934, + "test_loss": 4.605170484924316, + "test_acc": 0.01, + "lyapunov": 2.261979506753595, + "grad_norm": 0.08762519682827673, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 81.50332951545715 + }, + { + "epoch": 130, + "train_loss": 6.2814196604919434, + "train_acc": 0.00892, + "test_loss": 4.605170237731934, + "test_acc": 0.01, + "lyapunov": 2.263650309399266, + "grad_norm": 0.0879745908721408, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 81.48634791374207 + }, + { + "epoch": 131, + "train_loss": 6.279289369659423, + "train_acc": 0.00816, + "test_loss": 4.605170503234863, + "test_acc": 0.01, + "lyapunov": 2.2619674528956106, + "grad_norm": 0.08830358541425926, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 81.49762201309204 + }, + { + "epoch": 132, + "train_loss": 6.284051736145019, + "train_acc": 0.00918, + "test_loss": 4.605169993591309, + "test_acc": 0.01, + "lyapunov": 2.265367220734696, + "grad_norm": 0.09065551426084856, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 81.5026957988739 + }, + { + "epoch": 133, + "train_loss": 6.28203574508667, + "train_acc": 0.00886, + "test_loss": 4.60517046508789, + "test_acc": 0.01, + "lyapunov": 2.264016958148888, + "grad_norm": 0.08811709248877145, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 81.4884991645813 + }, + { + "epoch": 134, + "train_loss": 6.295380000305176, + "train_acc": 0.00924, + "test_loss": 4.6051701171875, + "test_acc": 0.01, + "lyapunov": 2.270651138652011, + "grad_norm": 0.09385452218544989, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 81.49120998382568 + }, + { + "epoch": 135, + "train_loss": 6.279313954925537, + "train_acc": 0.0096, + "test_loss": 4.605170198059082, + "test_acc": 0.01, + "lyapunov": 2.2621799277527557, + "grad_norm": 0.08809804121534516, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 81.503009557724 + }, + { + "epoch": 136, + "train_loss": 6.281174714050293, + "train_acc": 0.009, + "test_loss": 4.605170434570312, + "test_acc": 0.01, + "lyapunov": 2.263484787758049, + "grad_norm": 0.08787496788421857, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 81.49492454528809 + }, + { + "epoch": 137, + "train_loss": 6.2790307751464844, + "train_acc": 0.00906, + "test_loss": 4.605170115661621, + "test_acc": 0.01, + "lyapunov": 2.2619833738907524, + "grad_norm": 0.08850586212515105, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 81.51062154769897 + }, + { + "epoch": 138, + "train_loss": 6.278728715362549, + "train_acc": 0.0095, + "test_loss": 4.605170520019532, + "test_acc": 0.01, + "lyapunov": 2.2618095082090335, + "grad_norm": 0.08731291361885624, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 81.48903918266296 + }, + { + "epoch": 139, + "train_loss": 6.279946011657715, + "train_acc": 0.00924, + "test_loss": 4.605169985198975, + "test_acc": 0.01, + "lyapunov": 2.262684661104246, + "grad_norm": 0.08830501755378455, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 81.50976133346558 + }, + { + "epoch": 140, + "train_loss": 6.2800713043212895, + "train_acc": 0.0093, + "test_loss": 4.605170336914062, + "test_acc": 0.01, + "lyapunov": 2.2627302271020993, + "grad_norm": 0.08760865122091131, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 81.47953510284424 + }, + { + "epoch": 141, + "train_loss": 6.280382924652099, + "train_acc": 0.00976, + "test_loss": 4.605170390319824, + "test_acc": 0.01, + "lyapunov": 2.262962554116993, + "grad_norm": 0.08731546735423716, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 81.50757503509521 + }, + { + "epoch": 142, + "train_loss": 6.280370573883057, + "train_acc": 0.00936, + "test_loss": 4.605170272064209, + "test_acc": 0.01, + "lyapunov": 2.262975048226164, + "grad_norm": 0.08839664162758272, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 81.70762014389038 + }, + { + "epoch": 143, + "train_loss": 6.278507639923096, + "train_acc": 0.0095, + "test_loss": 4.6051704162597655, + "test_acc": 0.01, + "lyapunov": 2.261611500054674, + "grad_norm": 0.08694971985774991, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 81.48127150535583 + }, + { + "epoch": 144, + "train_loss": 6.281042174987793, + "train_acc": 0.00942, + "test_loss": 4.605170404815674, + "test_acc": 0.01, + "lyapunov": 2.263450643290644, + "grad_norm": 0.0881830241474449, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 81.58690285682678 + }, + { + "epoch": 145, + "train_loss": 6.278796115875244, + "train_acc": 0.01, + "test_loss": 4.605169946289062, + "test_acc": 0.01, + "lyapunov": 2.2618483887304124, + "grad_norm": 0.08774085138052039, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 81.47702813148499 + }, + { + "epoch": 146, + "train_loss": 6.28765030166626, + "train_acc": 0.01, + "test_loss": 4.605170179748535, + "test_acc": 0.01, + "lyapunov": 2.266257317169853, + "grad_norm": 0.0926994360583192, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 81.53279685974121 + }, + { + "epoch": 147, + "train_loss": 6.28031106124878, + "train_acc": 0.01, + "test_loss": 4.605170380401612, + "test_acc": 0.01, + "lyapunov": 2.2628798844564297, + "grad_norm": 0.08793782485118157, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 81.48903107643127 + }, + { + "epoch": 148, + "train_loss": 6.280096773681641, + "train_acc": 0.01, + "test_loss": 4.605170349884033, + "test_acc": 0.01, + "lyapunov": 2.2627320112779623, + "grad_norm": 0.08818349122842602, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 81.4692907333374 + }, + { + "epoch": 149, + "train_loss": 6.281090885467529, + "train_acc": 0.01, + "test_loss": 4.605170343017578, + "test_acc": 0.01, + "lyapunov": 2.263427186195198, + "grad_norm": 0.0872012744277379, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 81.53167700767517 + }, + { + "epoch": 150, + "train_loss": 6.279137640380859, + "train_acc": 0.01, + "test_loss": 4.605170111083984, + "test_acc": 0.01, + "lyapunov": 2.262077055318886, + "grad_norm": 0.08725575780836431, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 81.56354284286499 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 12.888672213134766, + "train_acc": 0.0157, + "test_loss": 4.668669903564453, + "test_acc": 0.0113, + "lyapunov": 4.721897013656928, + "grad_norm": 6.113449849588324, + "grad_max_sv": 4.916350275278091, + "grad_min_sv": 9.121745356832633e-08, + "grad_condition": 85604761.14095068, + "lr": 0.0009998903417374227, + "time_sec": 124.4171769618988 + }, + { + "epoch": 2, + "train_loss": 8.873665056762695, + "train_acc": 0.0172, + "test_loss": 4.618728218078613, + "test_acc": 0.0106, + "lyapunov": 3.5643789152355145, + "grad_norm": 4.270033727895912, + "grad_max_sv": 3.703069430589676, + "grad_min_sv": 4.972798216271515e-08, + "grad_condition": 4407702901.858317, + "lr": 0.0009995614150494292, + "time_sec": 124.48686790466309 + }, + { + "epoch": 3, + "train_loss": 8.600334560241699, + "train_acc": 0.01782, + "test_loss": 4.650051962280274, + "test_acc": 0.01, + "lyapunov": 3.4914282776815506, + "grad_norm": 3.3926839865294114, + "grad_max_sv": 2.9882367312908173, + "grad_min_sv": 1.3234509199243523e-08, + "grad_condition": 54857460231.037346, + "lr": 0.0009990133642141358, + "time_sec": 124.54058074951172 + }, + { + "epoch": 4, + "train_loss": 8.263027096862793, + "train_acc": 0.01714, + "test_loss": 4.599512353515625, + "test_acc": 0.0105, + "lyapunov": 3.3760591937452937, + "grad_norm": 2.278902599299841, + "grad_max_sv": 1.9339918196201324, + "grad_min_sv": 2.3884921456027857e-10, + "grad_condition": 107255985296.78781, + "lr": 0.0009982464296247522, + "time_sec": 124.56976628303528 + }, + { + "epoch": 5, + "train_loss": 8.014010938720704, + "train_acc": 0.01496, + "test_loss": 4.616816136169434, + "test_acc": 0.01, + "lyapunov": 3.2668096848461023, + "grad_norm": 1.8273408452911775, + "grad_max_sv": 1.1145809442189922, + "grad_min_sv": 1.2368932906215386e-11, + "grad_condition": 320257530150.4256, + "lr": 0.0009972609476841367, + "time_sec": 124.43335103988647 + }, + { + "epoch": 6, + "train_loss": 7.492105539398193, + "train_acc": 0.01378, + "test_loss": 4.617157006835938, + "test_acc": 0.01, + "lyapunov": 2.993205757702098, + "grad_norm": 1.155205925820389, + "grad_max_sv": 0.8030500062418355, + "grad_min_sv": 1.9935007673619705e-12, + "grad_condition": 394942710887.2484, + "lr": 0.000996057350657239, + "time_sec": 124.40957427024841 + }, + { + "epoch": 7, + "train_loss": 7.546499238586426, + "train_acc": 0.01474, + "test_loss": 4.614982270812988, + "test_acc": 0.01, + "lyapunov": 3.0089273160071017, + "grad_norm": 2.2107120727107343, + "grad_max_sv": 0.5263522088527679, + "grad_min_sv": 2.339208170494913e-12, + "grad_condition": 228093595550.92413, + "lr": 0.000994636166481494, + "time_sec": 124.44238233566284 + }, + { + "epoch": 8, + "train_loss": 7.431590474243164, + "train_acc": 0.01458, + "test_loss": 4.613349987792969, + "test_acc": 0.01, + "lyapunov": 2.9677638501462424, + "grad_norm": 1.4698803730862553, + "grad_max_sv": 0.3683710671344215, + "grad_min_sv": 1.0445961128587334e-12, + "grad_condition": 222600534264.8287, + "lr": 0.0009929980185352525, + "time_sec": 124.46612310409546 + }, + { + "epoch": 9, + "train_loss": 7.177635037078858, + "train_acc": 0.01324, + "test_loss": 4.612429743957519, + "test_acc": 0.01, + "lyapunov": 2.8310226979463, + "grad_norm": 1.4861384451742359, + "grad_max_sv": 0.32697355831472236, + "grad_min_sv": 7.011187907653872e-13, + "grad_condition": 236887025983.79956, + "lr": 0.0009911436253643444, + "time_sec": 124.47700262069702 + }, + { + "epoch": 10, + "train_loss": 7.269148045806885, + "train_acc": 0.01266, + "test_loss": 4.60582406539917, + "test_acc": 0.01, + "lyapunov": 2.8725382824383123, + "grad_norm": 2.342581709783361, + "grad_max_sv": 0.25737013639882206, + "grad_min_sv": 2.152763686233954e-13, + "grad_condition": 237339662745.88754, + "lr": 0.0009890738003669028, + "time_sec": 124.34593343734741 + }, + { + "epoch": 11, + "train_loss": 7.854859015350342, + "train_acc": 0.0135, + "test_loss": 4.610336604309082, + "test_acc": 0.01, + "lyapunov": 3.174172605699895, + "grad_norm": 2.7187327990789893, + "grad_max_sv": 0.20388649497181177, + "grad_min_sv": 8.088439153332857e-14, + "grad_condition": 191904183934.97748, + "lr": 0.00098678945143658, + "time_sec": 124.38984727859497 + }, + { + "epoch": 12, + "train_loss": 7.352457761230469, + "train_acc": 0.01424, + "test_loss": 4.6108569480896, + "test_acc": 0.01, + "lyapunov": 2.9249625279165596, + "grad_norm": 1.4927365138413504, + "grad_max_sv": 0.19409580584615468, + "grad_min_sv": 6.321730296975161e-14, + "grad_condition": 185278377907.65347, + "lr": 0.0009842915805643154, + "time_sec": 124.45291423797607 + }, + { + "epoch": 13, + "train_loss": 7.126369653930664, + "train_acc": 0.0127, + "test_loss": 4.606200820922852, + "test_acc": 0.01, + "lyapunov": 2.7892982831696416, + "grad_norm": 1.5745132805186597, + "grad_max_sv": 0.16401691318606026, + "grad_min_sv": 1.1404081781040362e-15, + "grad_condition": 163820543107.00018, + "lr": 0.000981581283398829, + "time_sec": 124.47300815582275 + }, + { + "epoch": 14, + "train_loss": 6.9970923039245605, + "train_acc": 0.0119, + "test_loss": 4.606117165374756, + "test_acc": 0.01, + "lyapunov": 2.7211814384021418, + "grad_norm": 0.8580084847133529, + "grad_max_sv": 0.13348757792264224, + "grad_min_sv": 3.507279862736168e-28, + "grad_condition": 133487577922.64218, + "lr": 0.0009786597487660333, + "time_sec": 124.41379904747009 + }, + { + "epoch": 15, + "train_loss": 7.052154786376953, + "train_acc": 0.0117, + "test_loss": 4.606044427490234, + "test_acc": 0.01, + "lyapunov": 2.753269191288277, + "grad_norm": 1.006394199833171, + "grad_max_sv": 0.12816582168452442, + "grad_min_sv": 4.518028483603919e-34, + "grad_condition": 128165821684.52441, + "lr": 0.0009755282581475766, + "time_sec": 124.34007215499878 + }, + { + "epoch": 16, + "train_loss": 7.258110624084472, + "train_acc": 0.0109, + "test_loss": 4.605929005432129, + "test_acc": 0.01, + "lyapunov": 2.862082756998594, + "grad_norm": 1.1482559574218805, + "grad_max_sv": 0.10950499838218093, + "grad_min_sv": 3.564320494794489e-35, + "grad_condition": 109504998382.18094, + "lr": 0.0009721881851187403, + "time_sec": 124.38707971572876 + }, + { + "epoch": 17, + "train_loss": 6.873683618774414, + "train_acc": 0.00996, + "test_loss": 4.61062957611084, + "test_acc": 0.01, + "lyapunov": 2.641120981377409, + "grad_norm": 2.0808485430057084, + "grad_max_sv": 0.05978809341322631, + "grad_min_sv": 2.4522723125684297e-46, + "grad_condition": 59788093413.2263, + "lr": 0.0009686409947459456, + "time_sec": 124.47280597686768 + }, + { + "epoch": 18, + "train_loss": 7.016553334655762, + "train_acc": 0.01398, + "test_loss": 4.622579546356201, + "test_acc": 0.01, + "lyapunov": 2.728775659180663, + "grad_norm": 1.2800257190104987, + "grad_max_sv": 0.1043331983499229, + "grad_min_sv": 3.1060564013215523e-18, + "grad_condition": 104332858891.6054, + "lr": 0.0009648882429441254, + "time_sec": 124.54543328285217 + }, + { + "epoch": 19, + "train_loss": 6.869653914642334, + "train_acc": 0.01194, + "test_loss": 4.643599758911133, + "test_acc": 0.01, + "lyapunov": 2.638523844501856, + "grad_norm": 0.5641956497166879, + "grad_max_sv": 0.06742433752388025, + "grad_min_sv": 9.779701625669289e-16, + "grad_condition": 67360221904.04246, + "lr": 0.00096093157579425, + "time_sec": 124.44028401374817 + }, + { + "epoch": 20, + "train_loss": 6.866667858276367, + "train_acc": 0.0096, + "test_loss": 4.634420860290527, + "test_acc": 0.01, + "lyapunov": 2.628649781731998, + "grad_norm": 0.5455051217507713, + "grad_max_sv": 0.028104651859030126, + "grad_min_sv": 0.0, + "grad_condition": 28104651859.03013, + "lr": 0.0009567727288213001, + "time_sec": 124.34887290000916 + }, + { + "epoch": 21, + "train_loss": 6.825957579650879, + "train_acc": 0.00936, + "test_loss": 4.642799243164062, + "test_acc": 0.01, + "lyapunov": 2.607143042337559, + "grad_norm": 0.5228902482624009, + "grad_max_sv": 0.029772339016199113, + "grad_min_sv": 0.0, + "grad_condition": 29772339016.19911, + "lr": 0.0009524135262330095, + "time_sec": 124.38223886489868 + }, + { + "epoch": 22, + "train_loss": 6.60694779296875, + "train_acc": 0.00934, + "test_loss": 4.642452531433105, + "test_acc": 0.01, + "lyapunov": 2.4819612728665246, + "grad_norm": 0.5929983668433683, + "grad_max_sv": 0.028571362840011716, + "grad_min_sv": 0.0, + "grad_condition": 28571362840.01172, + "lr": 0.0009478558801197061, + "time_sec": 124.46409487724304 + }, + { + "epoch": 23, + "train_loss": 6.587394898986816, + "train_acc": 0.00922, + "test_loss": 4.642014373779297, + "test_acc": 0.01, + "lyapunov": 2.46996273287117, + "grad_norm": 0.5937371167405978, + "grad_max_sv": 0.027252211095765234, + "grad_min_sv": 0.0, + "grad_condition": 27252211095.765236, + "lr": 0.000943101789615607, + "time_sec": 124.41273093223572 + }, + { + "epoch": 24, + "train_loss": 6.5855675335693356, + "train_acc": 0.00944, + "test_loss": 4.629414208984375, + "test_acc": 0.01, + "lyapunov": 2.468693129546807, + "grad_norm": 0.5173238649422355, + "grad_max_sv": 0.026766624441370367, + "grad_min_sv": 0.0, + "grad_condition": 26766624441.37037, + "lr": 0.0009381533400219313, + "time_sec": 124.34699821472168 + }, + { + "epoch": 25, + "train_loss": 6.599731462860108, + "train_acc": 0.00936, + "test_loss": 4.6412096755981445, + "test_acc": 0.01, + "lyapunov": 2.476690198454406, + "grad_norm": 0.5699426578758121, + "grad_max_sv": 0.025352103635668755, + "grad_min_sv": 0.0, + "grad_condition": 25352103635.668755, + "lr": 0.0009330127018922189, + "time_sec": 124.3536787033081 + }, + { + "epoch": 26, + "train_loss": 6.5942790597534175, + "train_acc": 0.00964, + "test_loss": 4.640745770263672, + "test_acc": 0.01, + "lyapunov": 2.4741494673902116, + "grad_norm": 0.546145353806512, + "grad_max_sv": 0.021123076300136746, + "grad_min_sv": 0.0, + "grad_condition": 21123076300.136745, + "lr": 0.000927682130080253, + "time_sec": 124.4051742553711 + }, + { + "epoch": 27, + "train_loss": 6.6229908557128905, + "train_acc": 0.00888, + "test_loss": 4.605336713409423, + "test_acc": 0.01, + "lyapunov": 2.4850437781390022, + "grad_norm": 0.6663677646075784, + "grad_max_sv": 0.011104274867102503, + "grad_min_sv": 0.0, + "grad_condition": 11104274867.102505, + "lr": 0.0009221639627510072, + "time_sec": 124.44045972824097 + }, + { + "epoch": 28, + "train_loss": 6.597202638854981, + "train_acc": 0.00916, + "test_loss": 4.605269973754883, + "test_acc": 0.01, + "lyapunov": 2.4748127710483874, + "grad_norm": 0.6602347286377247, + "grad_max_sv": 0.005200258875265718, + "grad_min_sv": 0.0, + "grad_condition": 5200258875.2657175, + "lr": 0.0009164606203550494, + "time_sec": 124.41216611862183 + }, + { + "epoch": 29, + "train_loss": 6.5781180551147465, + "train_acc": 0.00896, + "test_loss": 4.605207743072509, + "test_acc": 0.01, + "lyapunov": 2.463899161809546, + "grad_norm": 0.16963115020621336, + "grad_max_sv": 0.0064356182236224415, + "grad_min_sv": 0.0, + "grad_condition": 6435618223.622441, + "lr": 0.0009105746045668516, + "time_sec": 124.52706933021545 + }, + { + "epoch": 30, + "train_loss": 6.580226347045898, + "train_acc": 0.00922, + "test_loss": 4.605211033630371, + "test_acc": 0.01, + "lyapunov": 2.4648621435970295, + "grad_norm": 0.14897426222581245, + "grad_max_sv": 0.006681703682988882, + "grad_min_sv": 0.0, + "grad_condition": 6681703682.988882, + "lr": 0.0009045084971874733, + "time_sec": 124.31314778327942 + }, + { + "epoch": 31, + "train_loss": 6.580346279144287, + "train_acc": 0.00906, + "test_loss": 4.605202531433106, + "test_acc": 0.01, + "lyapunov": 2.4647859356287496, + "grad_norm": 0.13651802704858546, + "grad_max_sv": 0.0033354544546455147, + "grad_min_sv": 0.0, + "grad_condition": 3335454454.6455145, + "lr": 0.0008982649590120977, + "time_sec": 124.37081241607666 + }, + { + "epoch": 32, + "train_loss": 6.5977811730957034, + "train_acc": 0.00854, + "test_loss": 4.605187432861328, + "test_acc": 0.01, + "lyapunov": 2.4727761562523023, + "grad_norm": 0.12974748253445384, + "grad_max_sv": 0.002326939906924963, + "grad_min_sv": 0.0, + "grad_condition": 2326939906.924963, + "lr": 0.0008918467286629196, + "time_sec": 124.42768621444702 + }, + { + "epoch": 33, + "train_loss": 6.574522008514404, + "train_acc": 0.00888, + "test_loss": 4.60518201751709, + "test_acc": 0.01, + "lyapunov": 2.461720284903446, + "grad_norm": 0.10990146900045704, + "grad_max_sv": 0.0026134482119232415, + "grad_min_sv": 0.0, + "grad_condition": 2613448211.9232416, + "lr": 0.0008852566213878943, + "time_sec": 124.36949467658997 + }, + { + "epoch": 34, + "train_loss": 6.577264302215577, + "train_acc": 0.0092, + "test_loss": 4.605177014923096, + "test_acc": 0.01, + "lyapunov": 2.463475263941928, + "grad_norm": 0.12976444128871847, + "grad_max_sv": 0.0009734443388879299, + "grad_min_sv": 0.0, + "grad_condition": 973444338.8879299, + "lr": 0.000878497527825878, + "time_sec": 124.3325207233429 + }, + { + "epoch": 35, + "train_loss": 6.587216622314453, + "train_acc": 0.00888, + "test_loss": 4.636661901855469, + "test_acc": 0.01, + "lyapunov": 2.4681083863348605, + "grad_norm": 0.13220591916165889, + "grad_max_sv": 0.00457856860011816, + "grad_min_sv": 0.0, + "grad_condition": 4578568600.118161, + "lr": 0.000871572412738697, + "time_sec": 124.3110682964325 + }, + { + "epoch": 36, + "train_loss": 6.592979219360352, + "train_acc": 0.0092, + "test_loss": 4.6051753067016605, + "test_acc": 0.01, + "lyapunov": 2.4714617686503377, + "grad_norm": 0.1239857838330967, + "grad_max_sv": 0.0005948701407760381, + "grad_min_sv": 0.0, + "grad_condition": 594870140.7760382, + "lr": 0.0008644843137107055, + "time_sec": 124.4406750202179 + }, + { + "epoch": 37, + "train_loss": 6.613644898376465, + "train_acc": 0.00858, + "test_loss": 4.605174197387695, + "test_acc": 0.01, + "lyapunov": 2.48187786294981, + "grad_norm": 0.18028613006863556, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008572363398164014, + "time_sec": 124.42482614517212 + }, + { + "epoch": 38, + "train_loss": 6.598032460021972, + "train_acc": 0.00866, + "test_loss": 4.605173423004151, + "test_acc": 0.01, + "lyapunov": 2.4748510588770327, + "grad_norm": 0.17702039657703328, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008498316702566826, + "time_sec": 124.38127946853638 + }, + { + "epoch": 39, + "train_loss": 6.595033478546142, + "train_acc": 0.00904, + "test_loss": 4.605172880554199, + "test_acc": 0.01, + "lyapunov": 2.4724140514803055, + "grad_norm": 0.1406852681746766, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008422735529643442, + "time_sec": 124.27310037612915 + }, + { + "epoch": 40, + "train_loss": 6.607061416625976, + "train_acc": 0.00882, + "test_loss": 4.605173010253906, + "test_acc": 0.01, + "lyapunov": 2.4797774525859473, + "grad_norm": 0.1602364870035822, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008345653031794289, + "time_sec": 124.35175013542175 + }, + { + "epoch": 41, + "train_loss": 6.652051022644043, + "train_acc": 0.00868, + "test_loss": 4.60517377319336, + "test_acc": 0.01, + "lyapunov": 2.494590156218585, + "grad_norm": 0.1877202250366353, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008267103019950526, + "time_sec": 124.42674827575684 + }, + { + "epoch": 42, + "train_loss": 6.609013889770508, + "train_acc": 0.00818, + "test_loss": 4.60517264328003, + "test_acc": 0.01, + "lyapunov": 2.4807275219646563, + "grad_norm": 0.19291631462520265, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743447, + "time_sec": 124.38730263710022 + }, + { + "epoch": 43, + "train_loss": 6.573144034423828, + "train_acc": 0.0082, + "test_loss": 4.6051730613708495, + "test_acc": 0.01, + "lyapunov": 2.4609296730412242, + "grad_norm": 0.09628320238477034, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000810573890139155, + "time_sec": 124.36512160301208 + }, + { + "epoch": 44, + "train_loss": 6.575241811828613, + "train_acc": 0.00884, + "test_loss": 4.605172496032715, + "test_acc": 0.01, + "lyapunov": 2.462244158205779, + "grad_norm": 0.10484293099591814, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008022995574311873, + "time_sec": 124.30067491531372 + }, + { + "epoch": 45, + "train_loss": 6.594184577026367, + "train_acc": 0.00936, + "test_loss": 4.605172833251953, + "test_acc": 0.01, + "lyapunov": 2.4732542019670882, + "grad_norm": 0.16310890352013555, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007938926261462363, + "time_sec": 124.42177891731262 + }, + { + "epoch": 46, + "train_loss": 6.577082351989746, + "train_acc": 0.00882, + "test_loss": 4.605172598266601, + "test_acc": 0.01, + "lyapunov": 2.463544076665893, + "grad_norm": 0.10037821136236143, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007853567838422158, + "time_sec": 124.40465664863586 + }, + { + "epoch": 47, + "train_loss": 6.5774040518188475, + "train_acc": 0.00862, + "test_loss": 4.605172250366211, + "test_acc": 0.01, + "lyapunov": 2.4635354655478006, + "grad_norm": 0.1162215297313361, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007766957746216719, + "time_sec": 124.41038012504578 + }, + { + "epoch": 48, + "train_loss": 6.6083132769775395, + "train_acc": 0.0086, + "test_loss": 4.605171835327148, + "test_acc": 0.01, + "lyapunov": 2.4782137511026523, + "grad_norm": 0.17135162198913576, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894982, + "time_sec": 124.31084632873535 + }, + { + "epoch": 49, + "train_loss": 6.604438779449463, + "train_acc": 0.0088, + "test_loss": 4.60517212600708, + "test_acc": 0.01, + "lyapunov": 2.478019986311188, + "grad_norm": 0.16895443836343932, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000759013504686565, + "time_sec": 124.28308844566345 + }, + { + "epoch": 50, + "train_loss": 6.588782655029297, + "train_acc": 0.00888, + "test_loss": 4.605172025299073, + "test_acc": 0.01, + "lyapunov": 2.470017822197331, + "grad_norm": 0.12889442183383476, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007499999999999998, + "time_sec": 124.42897295951843 + }, + { + "epoch": 51, + "train_loss": 6.601284326782227, + "train_acc": 0.00796, + "test_loss": 4.6051717948913575, + "test_acc": 0.01, + "lyapunov": 2.4773334834886636, + "grad_norm": 0.17649093442856895, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007408768370508575, + "time_sec": 124.39905118942261 + }, + { + "epoch": 52, + "train_loss": 6.575957306518554, + "train_acc": 0.00918, + "test_loss": 4.6051720420837405, + "test_acc": 0.01, + "lyapunov": 2.46280481565334, + "grad_norm": 0.0968044467412458, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007316480175599307, + "time_sec": 124.42980766296387 + }, + { + "epoch": 53, + "train_loss": 6.587701625518799, + "train_acc": 0.00872, + "test_loss": 4.6051725509643555, + "test_acc": 0.01, + "lyapunov": 2.4698515999347657, + "grad_norm": 0.13994770283254052, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007223175895924635, + "time_sec": 124.28514337539673 + }, + { + "epoch": 54, + "train_loss": 6.578931684265137, + "train_acc": 0.00938, + "test_loss": 4.605171647644043, + "test_acc": 0.01, + "lyapunov": 2.464453091097, + "grad_norm": 0.104587329873943, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825361, + "time_sec": 124.3464949131012 + }, + { + "epoch": 55, + "train_loss": 6.610985378723145, + "train_acc": 0.00822, + "test_loss": 4.605172131347656, + "test_acc": 0.01, + "lyapunov": 2.4811968675354863, + "grad_norm": 0.23664084539084446, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007033683215378998, + "time_sec": 124.3919792175293 + }, + { + "epoch": 56, + "train_loss": 6.577887360839844, + "train_acc": 0.0089, + "test_loss": 4.605171892547608, + "test_acc": 0.01, + "lyapunov": 2.4638065877168076, + "grad_norm": 0.12418210732155195, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006937577932260512, + "time_sec": 124.42023730278015 + }, + { + "epoch": 57, + "train_loss": 6.575769240722656, + "train_acc": 0.00934, + "test_loss": 4.605171751403809, + "test_acc": 0.01, + "lyapunov": 2.4626593559294405, + "grad_norm": 0.08871385738467265, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423388, + "time_sec": 124.39303755760193 + }, + { + "epoch": 58, + "train_loss": 6.649054284973144, + "train_acc": 0.00788, + "test_loss": 4.6051721786499025, + "test_acc": 0.01, + "lyapunov": 2.4995590183131227, + "grad_norm": 0.26439944389263503, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006742860236609073, + "time_sec": 124.30309414863586 + }, + { + "epoch": 59, + "train_loss": 6.620378266906738, + "train_acc": 0.0087, + "test_loss": 4.605171722412109, + "test_acc": 0.01, + "lyapunov": 2.4861825994213524, + "grad_norm": 0.2011814553286534, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006644333233692913, + "time_sec": 124.40799474716187 + }, + { + "epoch": 60, + "train_loss": 6.615863608703613, + "train_acc": 0.00898, + "test_loss": 4.605171568298339, + "test_acc": 0.01, + "lyapunov": 2.4820322356260647, + "grad_norm": 0.16244295400836278, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874734, + "time_sec": 124.44055390357971 + }, + { + "epoch": 61, + "train_loss": 6.62539726638794, + "train_acc": 0.00854, + "test_loss": 4.605171578979492, + "test_acc": 0.01, + "lyapunov": 2.4873651598420596, + "grad_norm": 0.18579251012972714, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006445158984722354, + "time_sec": 124.47138166427612 + }, + { + "epoch": 62, + "train_loss": 6.591934550476074, + "train_acc": 0.00868, + "test_loss": 4.605171854400635, + "test_acc": 0.01, + "lyapunov": 2.471130254018642, + "grad_norm": 0.14241384092347348, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006344599103076324, + "time_sec": 124.35206151008606 + }, + { + "epoch": 63, + "train_loss": 6.607412483825684, + "train_acc": 0.00866, + "test_loss": 4.605171817779541, + "test_acc": 0.01, + "lyapunov": 2.4772931200159176, + "grad_norm": 0.12000050103102612, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824269, + "time_sec": 124.31255435943604 + }, + { + "epoch": 64, + "train_loss": 6.574604081420898, + "train_acc": 0.0084, + "test_loss": 4.60517174911499, + "test_acc": 0.01, + "lyapunov": 2.461947503297225, + "grad_norm": 0.11837720061951122, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006141754350553275, + "time_sec": 124.42598223686218 + }, + { + "epoch": 65, + "train_loss": 6.669198082733154, + "train_acc": 0.00846, + "test_loss": 4.605171404266358, + "test_acc": 0.01, + "lyapunov": 2.50827671865673, + "grad_norm": 0.3654068480597362, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006039558454088793, + "time_sec": 124.41292977333069 + }, + { + "epoch": 66, + "train_loss": 6.576071541442871, + "train_acc": 0.00868, + "test_loss": 4.60517176437378, + "test_acc": 0.01, + "lyapunov": 2.462862340995418, + "grad_norm": 0.0924056370989614, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000593690657292862, + "time_sec": 124.44835186004639 + }, + { + "epoch": 67, + "train_loss": 6.623493032073974, + "train_acc": 0.00798, + "test_loss": 4.605171159362793, + "test_acc": 0.01, + "lyapunov": 2.4856161059016157, + "grad_norm": 0.23515698863564433, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005833843733580507, + "time_sec": 124.32646751403809 + }, + { + "epoch": 68, + "train_loss": 6.58642106048584, + "train_acc": 0.00814, + "test_loss": 4.605171382141113, + "test_acc": 0.01, + "lyapunov": 2.4687487658332374, + "grad_norm": 0.10028160631921758, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005730415142812054, + "time_sec": 124.34812188148499 + }, + { + "epoch": 69, + "train_loss": 6.612601704254151, + "train_acc": 0.00846, + "test_loss": 4.605171432495117, + "test_acc": 0.01, + "lyapunov": 2.478518716514568, + "grad_norm": 0.16428393693339724, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821517, + "time_sec": 124.40169882774353 + }, + { + "epoch": 70, + "train_loss": 6.594199375915528, + "train_acc": 0.0078, + "test_loss": 4.605171556854248, + "test_acc": 0.01, + "lyapunov": 2.4733456675048986, + "grad_norm": 0.13222269600542105, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005522642316338265, + "time_sec": 124.43159890174866 + }, + { + "epoch": 71, + "train_loss": 6.584797274169921, + "train_acc": 0.00884, + "test_loss": 4.605171443176269, + "test_acc": 0.01, + "lyapunov": 2.468046905439528, + "grad_norm": 0.09698860702372256, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005418389216661573, + "time_sec": 124.38395667076111 + }, + { + "epoch": 72, + "train_loss": 6.62336443145752, + "train_acc": 0.00826, + "test_loss": 4.60517096862793, + "test_acc": 0.01, + "lyapunov": 2.486185181171388, + "grad_norm": 0.20758922397897858, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646563, + "time_sec": 124.28166174888611 + }, + { + "epoch": 73, + "train_loss": 6.624484212188721, + "train_acc": 0.00906, + "test_loss": 4.6051707977294924, + "test_acc": 0.01, + "lyapunov": 2.487110945879651, + "grad_norm": 0.19977656643109526, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005209378268645994, + "time_sec": 124.35272693634033 + }, + { + "epoch": 74, + "train_loss": 6.603300393676758, + "train_acc": 0.0091, + "test_loss": 4.605170932006836, + "test_acc": 0.01, + "lyapunov": 2.477061335083164, + "grad_norm": 0.16600248799904951, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005104712099416781, + "time_sec": 124.40994596481323 + }, + { + "epoch": 75, + "train_loss": 6.5982538143920895, + "train_acc": 0.00856, + "test_loss": 4.605171234130859, + "test_acc": 0.01, + "lyapunov": 2.473140881799371, + "grad_norm": 0.16128953646649988, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004999999999999996, + "time_sec": 124.43308448791504 + }, + { + "epoch": 76, + "train_loss": 6.592834194946289, + "train_acc": 0.00854, + "test_loss": 4.605171026611328, + "test_acc": 0.01, + "lyapunov": 2.47263060750254, + "grad_norm": 0.1340374980962284, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004895287900583212, + "time_sec": 124.34016180038452 + }, + { + "epoch": 77, + "train_loss": 6.584505953979492, + "train_acc": 0.00864, + "test_loss": 4.605171239471436, + "test_acc": 0.01, + "lyapunov": 2.4676697760286843, + "grad_norm": 0.11435356827937113, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004790621731353997, + "time_sec": 124.3169755935669 + }, + { + "epoch": 78, + "train_loss": 6.5763300253295895, + "train_acc": 0.00884, + "test_loss": 4.6051710525512695, + "test_acc": 0.01, + "lyapunov": 2.4630901801311755, + "grad_norm": 0.08961847488711042, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000468604740235343, + "time_sec": 124.3459620475769 + }, + { + "epoch": 79, + "train_loss": 6.575958716125489, + "train_acc": 0.00932, + "test_loss": 4.605170614624023, + "test_acc": 0.01, + "lyapunov": 2.462890618902338, + "grad_norm": 0.0894392700212742, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00045816107833384175, + "time_sec": 124.39721941947937 + }, + { + "epoch": 80, + "train_loss": 6.57727864440918, + "train_acc": 0.00828, + "test_loss": 4.6051712982177735, + "test_acc": 0.01, + "lyapunov": 2.4634996923949104, + "grad_norm": 0.09357159928827649, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004477357683661729, + "time_sec": 124.43293237686157 + }, + { + "epoch": 81, + "train_loss": 6.576623619689942, + "train_acc": 0.00858, + "test_loss": 4.60517075958252, + "test_acc": 0.01, + "lyapunov": 2.4632719782612207, + "grad_norm": 0.08778044836554635, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784746, + "time_sec": 124.33877468109131 + }, + { + "epoch": 82, + "train_loss": 6.706115616912842, + "train_acc": 0.00852, + "test_loss": 4.60517084274292, + "test_acc": 0.01, + "lyapunov": 2.5237014750995295, + "grad_norm": 0.35892654821663944, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004269584857187939, + "time_sec": 124.33198618888855 + }, + { + "epoch": 83, + "train_loss": 6.693132893981933, + "train_acc": 0.00928, + "test_loss": 4.605170736694336, + "test_acc": 0.01, + "lyapunov": 2.5217734712468998, + "grad_norm": 0.37154817796859707, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004166156266419484, + "time_sec": 124.33878684043884 + }, + { + "epoch": 84, + "train_loss": 6.673238817443847, + "train_acc": 0.00904, + "test_loss": 4.605171113586426, + "test_acc": 0.01, + "lyapunov": 2.5138309251926745, + "grad_norm": 0.48242670306903057, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004063093427071373, + "time_sec": 124.42056584358215 + }, + { + "epoch": 85, + "train_loss": 6.597096472473145, + "train_acc": 0.0083, + "test_loss": 4.605170780181885, + "test_acc": 0.01, + "lyapunov": 2.4718706601720943, + "grad_norm": 0.13232535416814104, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003960441545911199, + "time_sec": 124.43193411827087 + }, + { + "epoch": 86, + "train_loss": 6.575025537414551, + "train_acc": 0.00834, + "test_loss": 4.6051709815979, + "test_acc": 0.01, + "lyapunov": 2.4622172730048293, + "grad_norm": 0.11156499374939659, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003858245649446718, + "time_sec": 124.34226822853088 + }, + { + "epoch": 87, + "train_loss": 6.573478553161621, + "train_acc": 0.00842, + "test_loss": 4.605170571899414, + "test_acc": 0.01, + "lyapunov": 2.4612386501048835, + "grad_norm": 0.09079297617092336, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00037565505641757235, + "time_sec": 124.27930355072021 + }, + { + "epoch": 88, + "train_loss": 6.5734689576721195, + "train_acc": 0.00854, + "test_loss": 4.605170808410644, + "test_acc": 0.01, + "lyapunov": 2.461263867595312, + "grad_norm": 0.09120456341783888, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036554008969236695, + "time_sec": 124.38532066345215 + }, + { + "epoch": 89, + "train_loss": 6.578163130187988, + "train_acc": 0.00852, + "test_loss": 4.605170602416992, + "test_acc": 0.01, + "lyapunov": 2.4642753814492386, + "grad_norm": 0.09559837141233972, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003554841015277638, + "time_sec": 124.44146919250488 + }, + { + "epoch": 90, + "train_loss": 6.5798112936401365, + "train_acc": 0.0083, + "test_loss": 4.605170631408692, + "test_acc": 0.01, + "lyapunov": 2.4649541908517825, + "grad_norm": 0.09735485237927284, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000345491502812526, + "time_sec": 124.39319109916687 + }, + { + "epoch": 91, + "train_loss": 6.574903171081543, + "train_acc": 0.0083, + "test_loss": 4.605170557403564, + "test_acc": 0.01, + "lyapunov": 2.4621782180903207, + "grad_norm": 0.08981548140002098, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003355666766307081, + "time_sec": 124.35036778450012 + }, + { + "epoch": 92, + "train_loss": 6.5757408012390135, + "train_acc": 0.00836, + "test_loss": 4.605170684814453, + "test_acc": 0.01, + "lyapunov": 2.4627471470162083, + "grad_norm": 0.08817445544280453, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00032571397633909225, + "time_sec": 124.33928322792053 + }, + { + "epoch": 93, + "train_loss": 6.612554905395508, + "train_acc": 0.00834, + "test_loss": 4.605170486450195, + "test_acc": 0.01, + "lyapunov": 2.4806297959574044, + "grad_norm": 0.1882025016044833, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766094, + "time_sec": 124.40910911560059 + }, + { + "epoch": 94, + "train_loss": 6.595741138000489, + "train_acc": 0.00806, + "test_loss": 4.60517061920166, + "test_acc": 0.01, + "lyapunov": 2.472626593411731, + "grad_norm": 0.16104566409905433, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003062422067739483, + "time_sec": 124.41845726966858 + }, + { + "epoch": 95, + "train_loss": 6.5987700848388675, + "train_acc": 0.0085, + "test_loss": 4.605170571899414, + "test_acc": 0.01, + "lyapunov": 2.4736888725739306, + "grad_norm": 0.1552458690168984, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00029663167846209965, + "time_sec": 124.34644985198975 + }, + { + "epoch": 96, + "train_loss": 6.597373901672364, + "train_acc": 0.00828, + "test_loss": 4.6051704193115235, + "test_acc": 0.01, + "lyapunov": 2.473390321902302, + "grad_norm": 0.1443472451352086, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00028711035421746345, + "time_sec": 124.32696723937988 + }, + { + "epoch": 97, + "train_loss": 6.590096541442871, + "train_acc": 0.00862, + "test_loss": 4.6051705436706545, + "test_acc": 0.01, + "lyapunov": 2.4693754414463287, + "grad_norm": 0.11035396630097889, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00027768241040753615, + "time_sec": 124.30454087257385 + }, + { + "epoch": 98, + "train_loss": 6.70725288696289, + "train_acc": 0.00854, + "test_loss": 4.605170336151123, + "test_acc": 0.01, + "lyapunov": 2.529677952037138, + "grad_norm": 0.5122066284498856, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00026835198244006903, + "time_sec": 124.31350612640381 + }, + { + "epoch": 99, + "train_loss": 6.575984575958252, + "train_acc": 0.0085, + "test_loss": 4.60517036895752, + "test_acc": 0.01, + "lyapunov": 2.462917518737676, + "grad_norm": 0.08798552577224787, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002591231629491421, + "time_sec": 124.33125352859497 + }, + { + "epoch": 100, + "train_loss": 6.575890505371094, + "train_acc": 0.00856, + "test_loss": 4.605170387268067, + "test_acc": 0.01, + "lyapunov": 2.462910512524188, + "grad_norm": 0.08984849200071802, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002499999999999997, + "time_sec": 124.41467308998108 + }, + { + "epoch": 101, + "train_loss": 6.5755246405029295, + "train_acc": 0.00866, + "test_loss": 4.605170295715332, + "test_acc": 0.01, + "lyapunov": 2.4626409702593715, + "grad_norm": 0.08833234367069784, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00024098649531343477, + "time_sec": 124.4282865524292 + }, + { + "epoch": 102, + "train_loss": 6.578647835388184, + "train_acc": 0.00874, + "test_loss": 4.60517028503418, + "test_acc": 0.01, + "lyapunov": 2.4644368957070744, + "grad_norm": 0.0881800871840224, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002320866025105016, + "time_sec": 124.39285898208618 + }, + { + "epoch": 103, + "train_loss": 6.603837554931641, + "train_acc": 0.0081, + "test_loss": 4.605170309448242, + "test_acc": 0.01, + "lyapunov": 2.475680511016065, + "grad_norm": 0.12862246002842495, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002233042253783278, + "time_sec": 124.30171847343445 + }, + { + "epoch": 104, + "train_loss": 6.589783010559082, + "train_acc": 0.0087, + "test_loss": 4.605170768737793, + "test_acc": 0.01, + "lyapunov": 2.469147738898197, + "grad_norm": 0.1132666503606524, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000214643216157784, + "time_sec": 124.33115792274475 + }, + { + "epoch": 105, + "train_loss": 6.607209113769532, + "train_acc": 0.00868, + "test_loss": 4.605170411682129, + "test_acc": 0.01, + "lyapunov": 2.4791276979324457, + "grad_norm": 0.19473222939710866, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376332, + "time_sec": 124.42748808860779 + }, + { + "epoch": 106, + "train_loss": 6.605109618988037, + "train_acc": 0.00876, + "test_loss": 4.605170632171631, + "test_acc": 0.01, + "lyapunov": 2.4781547934198014, + "grad_norm": 0.19321601949412123, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019770044256881242, + "time_sec": 124.40237879753113 + }, + { + "epoch": 107, + "train_loss": 6.5744285192871095, + "train_acc": 0.0084, + "test_loss": 4.605170581054687, + "test_acc": 0.01, + "lyapunov": 2.461912363081637, + "grad_norm": 0.09153624986240072, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001894261098608447, + "time_sec": 124.35668659210205 + }, + { + "epoch": 108, + "train_loss": 6.591736253662109, + "train_acc": 0.009, + "test_loss": 4.605170578002929, + "test_acc": 0.01, + "lyapunov": 2.469679483672237, + "grad_norm": 0.17005631477257033, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000181288005125655, + "time_sec": 124.29520559310913 + }, + { + "epoch": 109, + "train_loss": 6.618268890991211, + "train_acc": 0.00898, + "test_loss": 4.605170452880859, + "test_acc": 0.01, + "lyapunov": 2.4846892923955113, + "grad_norm": 0.22506407024101205, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001732896980049473, + "time_sec": 124.44524145126343 + }, + { + "epoch": 110, + "train_loss": 6.588956251525879, + "train_acc": 0.0079, + "test_loss": 4.605170387268067, + "test_acc": 0.01, + "lyapunov": 2.4697647594734837, + "grad_norm": 0.1497151598092074, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016543469682057076, + "time_sec": 124.427237033844 + }, + { + "epoch": 111, + "train_loss": 6.597999030761719, + "train_acc": 0.0082, + "test_loss": 4.605170532226563, + "test_acc": 0.01, + "lyapunov": 2.47352661866971, + "grad_norm": 0.1265460364033806, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 124.4067976474762 + }, + { + "epoch": 112, + "train_loss": 6.581220099945068, + "train_acc": 0.00878, + "test_loss": 4.605170124816895, + "test_acc": 0.01, + "lyapunov": 2.466078118595016, + "grad_norm": 0.1166543211179088, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 124.3555097579956 + }, + { + "epoch": 113, + "train_loss": 6.5873154238891605, + "train_acc": 0.00902, + "test_loss": 4.605170477294922, + "test_acc": 0.01, + "lyapunov": 2.467848820454629, + "grad_norm": 0.11336040865405435, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 124.34751081466675 + }, + { + "epoch": 114, + "train_loss": 6.575267355041504, + "train_acc": 0.00892, + "test_loss": 4.60517041015625, + "test_acc": 0.01, + "lyapunov": 2.4624666978636056, + "grad_norm": 0.0882429459696398, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00013551568628929425, + "time_sec": 124.43968343734741 + }, + { + "epoch": 115, + "train_loss": 6.575747386169434, + "train_acc": 0.0087, + "test_loss": 4.60517027130127, + "test_acc": 0.01, + "lyapunov": 2.46279121481854, + "grad_norm": 0.08906865623909292, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 124.40401101112366 + }, + { + "epoch": 116, + "train_loss": 6.574066097106933, + "train_acc": 0.00888, + "test_loss": 4.605170015716553, + "test_acc": 0.01, + "lyapunov": 2.4617425267348816, + "grad_norm": 0.09299280580563789, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 124.43384170532227 + }, + { + "epoch": 117, + "train_loss": 6.575292884674072, + "train_acc": 0.00916, + "test_loss": 4.605170446777343, + "test_acc": 0.01, + "lyapunov": 2.462491541567361, + "grad_norm": 0.08789900440919356, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 124.31648087501526 + }, + { + "epoch": 118, + "train_loss": 6.578267410125733, + "train_acc": 0.00826, + "test_loss": 4.605170466613769, + "test_acc": 0.01, + "lyapunov": 2.4644045262690395, + "grad_norm": 0.10415607883931481, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010815327133708009, + "time_sec": 124.33564472198486 + }, + { + "epoch": 119, + "train_loss": 6.574555395050049, + "train_acc": 0.00854, + "test_loss": 4.605170401000977, + "test_acc": 0.01, + "lyapunov": 2.4620885909975643, + "grad_norm": 0.08778921241218508, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010173504098790182, + "time_sec": 124.65056228637695 + }, + { + "epoch": 120, + "train_loss": 6.583910481872558, + "train_acc": 0.00864, + "test_loss": 4.605170470428467, + "test_acc": 0.01, + "lyapunov": 2.467699810671989, + "grad_norm": 0.3040678237626765, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 124.44140434265137 + }, + { + "epoch": 121, + "train_loss": 6.586020791015625, + "train_acc": 0.00884, + "test_loss": 4.605170375823975, + "test_acc": 0.01, + "lyapunov": 2.467914994720303, + "grad_norm": 0.11635906922176238, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 124.43893909454346 + }, + { + "epoch": 122, + "train_loss": 6.576034954528809, + "train_acc": 0.0088, + "test_loss": 4.605170199584961, + "test_acc": 0.01, + "lyapunov": 2.463029363880987, + "grad_norm": 0.08771533827211757, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 124.32056403160095 + }, + { + "epoch": 123, + "train_loss": 6.574589498291016, + "train_acc": 0.00878, + "test_loss": 4.605170094299316, + "test_acc": 0.01, + "lyapunov": 2.4620493037621385, + "grad_norm": 0.08813480095873011, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 124.4015576839447 + }, + { + "epoch": 124, + "train_loss": 6.576157915649414, + "train_acc": 0.00904, + "test_loss": 4.605170024108887, + "test_acc": 0.01, + "lyapunov": 2.4630649205668806, + "grad_norm": 0.08749001934915172, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 124.42104578018188 + }, + { + "epoch": 125, + "train_loss": 6.579862565307617, + "train_acc": 0.00876, + "test_loss": 4.605170492553711, + "test_acc": 0.01, + "lyapunov": 2.465126996759868, + "grad_norm": 0.09372036345061274, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 124.4746482372284 + }, + { + "epoch": 126, + "train_loss": 6.577153359985352, + "train_acc": 0.00866, + "test_loss": 4.605170122528076, + "test_acc": 0.01, + "lyapunov": 2.463735998134174, + "grad_norm": 0.09613135620568294, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 124.38881230354309 + }, + { + "epoch": 127, + "train_loss": 6.574400754547119, + "train_acc": 0.0083, + "test_loss": 4.605170375823975, + "test_acc": 0.01, + "lyapunov": 2.4619021769374836, + "grad_norm": 0.08860379526254596, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 124.31344938278198 + }, + { + "epoch": 128, + "train_loss": 6.571165360717774, + "train_acc": 0.00878, + "test_loss": 4.605170154571534, + "test_acc": 0.01, + "lyapunov": 2.459857079074206, + "grad_norm": 0.08757319736074258, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 124.39138221740723 + }, + { + "epoch": 129, + "train_loss": 6.575437990264892, + "train_acc": 0.00846, + "test_loss": 4.605170350646973, + "test_acc": 0.01, + "lyapunov": 2.46259711831427, + "grad_norm": 0.08813574783200358, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 124.41060423851013 + }, + { + "epoch": 130, + "train_loss": 6.591315377197265, + "train_acc": 0.00954, + "test_loss": 4.605170065307617, + "test_acc": 0.01, + "lyapunov": 2.4702539943978, + "grad_norm": 0.11366316284903058, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 124.4502763748169 + }, + { + "epoch": 131, + "train_loss": 6.577392526092529, + "train_acc": 0.00946, + "test_loss": 4.60517007446289, + "test_acc": 0.01, + "lyapunov": 2.46386312401813, + "grad_norm": 0.08820500519427996, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 124.3550136089325 + }, + { + "epoch": 132, + "train_loss": 6.592328434906006, + "train_acc": 0.00882, + "test_loss": 4.6051704208374025, + "test_acc": 0.01, + "lyapunov": 2.4700996772102686, + "grad_norm": 0.114161955094371, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 124.37056255340576 + }, + { + "epoch": 133, + "train_loss": 6.588796159973144, + "train_acc": 0.00896, + "test_loss": 4.605170506286621, + "test_acc": 0.01, + "lyapunov": 2.468394133745862, + "grad_norm": 0.1295209594512649, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 124.36608004570007 + }, + { + "epoch": 134, + "train_loss": 6.576412990264893, + "train_acc": 0.00898, + "test_loss": 4.605170251464844, + "test_acc": 0.01, + "lyapunov": 2.4632679434383618, + "grad_norm": 0.08812453692162578, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 124.43608951568604 + }, + { + "epoch": 135, + "train_loss": 6.5760765690612795, + "train_acc": 0.00924, + "test_loss": 4.605169999694824, + "test_acc": 0.01, + "lyapunov": 2.463012531895162, + "grad_norm": 0.08722595509863246, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 124.46503901481628 + }, + { + "epoch": 136, + "train_loss": 6.575435556030273, + "train_acc": 0.00884, + "test_loss": 4.605170062255859, + "test_acc": 0.01, + "lyapunov": 2.4626583150585595, + "grad_norm": 0.08796433458523298, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 124.34801983833313 + }, + { + "epoch": 137, + "train_loss": 6.575190331268311, + "train_acc": 0.00934, + "test_loss": 4.6051701629638675, + "test_acc": 0.01, + "lyapunov": 2.4624439023644724, + "grad_norm": 0.08813731535348707, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 124.35173964500427 + }, + { + "epoch": 138, + "train_loss": 6.574904625091553, + "train_acc": 0.0089, + "test_loss": 4.60517007446289, + "test_acc": 0.01, + "lyapunov": 2.4622641213409735, + "grad_norm": 0.08807062213809792, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 124.40467262268066 + }, + { + "epoch": 139, + "train_loss": 6.5738159555053715, + "train_acc": 0.00926, + "test_loss": 4.605170321655273, + "test_acc": 0.01, + "lyapunov": 2.4615705336451223, + "grad_norm": 0.08717896516246301, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 124.4789035320282 + }, + { + "epoch": 140, + "train_loss": 6.575532109680176, + "train_acc": 0.00924, + "test_loss": 4.605170358276367, + "test_acc": 0.01, + "lyapunov": 2.4626962266614676, + "grad_norm": 0.0882680648293281, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 124.40317368507385 + }, + { + "epoch": 141, + "train_loss": 6.5800046757507324, + "train_acc": 0.00862, + "test_loss": 4.60517036895752, + "test_acc": 0.01, + "lyapunov": 2.4654090264264275, + "grad_norm": 0.11343015603036581, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 124.35891890525818 + }, + { + "epoch": 142, + "train_loss": 6.57490125793457, + "train_acc": 0.00948, + "test_loss": 4.6051704162597655, + "test_acc": 0.01, + "lyapunov": 2.462258317586406, + "grad_norm": 0.08755517239002598, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 124.29203748703003 + }, + { + "epoch": 143, + "train_loss": 6.576884376220703, + "train_acc": 0.00966, + "test_loss": 4.605170155334473, + "test_acc": 0.01, + "lyapunov": 2.4635954634917665, + "grad_norm": 0.08753943717047542, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 124.41098976135254 + }, + { + "epoch": 144, + "train_loss": 6.573677404937744, + "train_acc": 0.00962, + "test_loss": 4.60517022857666, + "test_acc": 0.01, + "lyapunov": 2.461500019673496, + "grad_norm": 0.08775396126300311, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 124.44748258590698 + }, + { + "epoch": 145, + "train_loss": 6.573780137023926, + "train_acc": 0.0092, + "test_loss": 4.605170056152343, + "test_acc": 0.01, + "lyapunov": 2.4615867387913073, + "grad_norm": 0.08734584455870835, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 124.4104528427124 + }, + { + "epoch": 146, + "train_loss": 6.574326271667481, + "train_acc": 0.00928, + "test_loss": 4.605170436859131, + "test_acc": 0.01, + "lyapunov": 2.4619192083168517, + "grad_norm": 0.08784696936548642, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 124.3491895198822 + }, + { + "epoch": 147, + "train_loss": 6.573583771209717, + "train_acc": 0.00938, + "test_loss": 4.605170133209229, + "test_acc": 0.01, + "lyapunov": 2.461428134947482, + "grad_norm": 0.08718184577116198, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 124.33614110946655 + }, + { + "epoch": 148, + "train_loss": 6.577077916870117, + "train_acc": 0.01, + "test_loss": 4.605170425415039, + "test_acc": 0.01, + "lyapunov": 2.4637341109078252, + "grad_norm": 0.08788027221282606, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 124.37565398216248 + }, + { + "epoch": 149, + "train_loss": 6.5732455339050295, + "train_acc": 0.01, + "test_loss": 4.605170333862305, + "test_acc": 0.01, + "lyapunov": 2.461217089382279, + "grad_norm": 0.08788179142338205, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 124.34460210800171 + }, + { + "epoch": 150, + "train_loss": 6.574304178619385, + "train_acc": 0.01, + "test_loss": 4.605170114135742, + "test_acc": 0.01, + "lyapunov": 2.4619127923570328, + "grad_norm": 0.08771827398079268, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 124.40945982933044 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 13.988400897827148, + "train_acc": 0.01438, + "test_loss": 4.683009733581543, + "test_acc": 0.0106, + "lyapunov": 5.045674181960123, + "grad_norm": 5.752499013515142, + "grad_max_sv": 4.6983559966087345, + "grad_min_sv": 8.501930549228987e-08, + "grad_condition": 317270864.69818985, + "lr": 0.0009998903417374227, + "time_sec": 167.40048050880432 + }, + { + "epoch": 2, + "train_loss": 9.313672403564453, + "train_acc": 0.01648, + "test_loss": 4.631449128723145, + "test_acc": 0.01, + "lyapunov": 3.775117972317864, + "grad_norm": 4.062466764062373, + "grad_max_sv": 3.613509923219681, + "grad_min_sv": 4.5653093948966327e-08, + "grad_condition": 646545370.9190311, + "lr": 0.0009995614150494292, + "time_sec": 167.42056441307068 + }, + { + "epoch": 3, + "train_loss": 9.2102595413208, + "train_acc": 0.01704, + "test_loss": 4.625689315795898, + "test_acc": 0.0099, + "lyapunov": 3.769411094353327, + "grad_norm": 3.2423057609153028, + "grad_max_sv": 2.773962843418121, + "grad_min_sv": 1.3365777420984947e-08, + "grad_condition": 79084430364.82771, + "lr": 0.0009990133642141358, + "time_sec": 167.40087485313416 + }, + { + "epoch": 4, + "train_loss": 8.593553448181153, + "train_acc": 0.01608, + "test_loss": 4.623868472290039, + "test_acc": 0.01, + "lyapunov": 3.5245635119240606, + "grad_norm": 2.236847501376478, + "grad_max_sv": 1.9526167243719101, + "grad_min_sv": 4.5824498221260444e-11, + "grad_condition": 250389376731.7333, + "lr": 0.0009982464296247522, + "time_sec": 167.34348464012146 + }, + { + "epoch": 5, + "train_loss": 7.8038157984924315, + "train_acc": 0.01666, + "test_loss": 4.618056827545166, + "test_acc": 0.01, + "lyapunov": 3.1676931515374145, + "grad_norm": 1.5048980928317333, + "grad_max_sv": 1.1324948772788048, + "grad_min_sv": 1.5125593644607378e-11, + "grad_condition": 218348544809.20728, + "lr": 0.0009972609476841367, + "time_sec": 167.4401364326477 + }, + { + "epoch": 6, + "train_loss": 7.634129183959961, + "train_acc": 0.01436, + "test_loss": 4.617713563537598, + "test_acc": 0.01, + "lyapunov": 3.0711578097184904, + "grad_norm": 1.9264530093156518, + "grad_max_sv": 0.7561077677975927, + "grad_min_sv": 2.3226373858483118e-12, + "grad_condition": 319185362917.36163, + "lr": 0.000996057350657239, + "time_sec": 167.3985676765442 + }, + { + "epoch": 7, + "train_loss": 7.547255232238769, + "train_acc": 0.01396, + "test_loss": 4.614803285980225, + "test_acc": 0.01, + "lyapunov": 3.0217712657226015, + "grad_norm": 1.075279960644913, + "grad_max_sv": 0.6469582007612514, + "grad_min_sv": 1.889760736503505e-12, + "grad_condition": 338582040139.5369, + "lr": 0.000994636166481494, + "time_sec": 167.22783827781677 + }, + { + "epoch": 8, + "train_loss": 7.305741961669922, + "train_acc": 0.01248, + "test_loss": 4.611902558898926, + "test_acc": 0.01, + "lyapunov": 2.8956392976024268, + "grad_norm": 1.304673575393078, + "grad_max_sv": 0.4924972869455814, + "grad_min_sv": 8.285040604573086e-13, + "grad_condition": 334051794817.99695, + "lr": 0.0009929980185352525, + "time_sec": 167.31978368759155 + }, + { + "epoch": 9, + "train_loss": 7.328730865783691, + "train_acc": 0.01336, + "test_loss": 4.606002921295166, + "test_acc": 0.01, + "lyapunov": 2.913580340192751, + "grad_norm": 1.4776699959663357, + "grad_max_sv": 0.3292516863617735, + "grad_min_sv": 5.235604182531881e-13, + "grad_condition": 246744375025.40308, + "lr": 0.0009911436253643444, + "time_sec": 167.3429365158081 + }, + { + "epoch": 10, + "train_loss": 7.308604444580078, + "train_acc": 0.01346, + "test_loss": 4.611476264953613, + "test_acc": 0.01, + "lyapunov": 2.900581695234684, + "grad_norm": 1.3123879020319187, + "grad_max_sv": 0.27272568672558684, + "grad_min_sv": 2.0496919726941882e-13, + "grad_condition": 238625164756.47662, + "lr": 0.0009890738003669028, + "time_sec": 167.2653293609619 + }, + { + "epoch": 11, + "train_loss": 7.490302003173828, + "train_acc": 0.01364, + "test_loss": 4.611579527282715, + "test_acc": 0.01, + "lyapunov": 3.0006146321211324, + "grad_norm": 2.2969507920003114, + "grad_max_sv": 0.19786488203932162, + "grad_min_sv": 8.37648333500382e-14, + "grad_condition": 183815724532.2033, + "lr": 0.00098678945143658, + "time_sec": 167.22061586380005 + }, + { + "epoch": 12, + "train_loss": 7.307793238525391, + "train_acc": 0.01262, + "test_loss": 4.606186763000489, + "test_acc": 0.01, + "lyapunov": 2.9112238219327025, + "grad_norm": 1.4729621434597777, + "grad_max_sv": 0.2151564534753561, + "grad_min_sv": 1.990284826719073e-14, + "grad_condition": 211594713734.62634, + "lr": 0.0009842915805643154, + "time_sec": 167.35631036758423 + }, + { + "epoch": 13, + "train_loss": 7.459832763977051, + "train_acc": 0.01172, + "test_loss": 4.606186486053467, + "test_acc": 0.01, + "lyapunov": 2.9779586944433736, + "grad_norm": 1.2584288878227161, + "grad_max_sv": 0.17604726925492287, + "grad_min_sv": 2.9740421215427092e-27, + "grad_condition": 176047269254.9224, + "lr": 0.000981581283398829, + "time_sec": 167.55029773712158 + }, + { + "epoch": 14, + "train_loss": 7.959970283813477, + "train_acc": 0.01162, + "test_loss": 4.606137133789063, + "test_acc": 0.01, + "lyapunov": 3.224144145960698, + "grad_norm": 1.3145379480759145, + "grad_max_sv": 0.16056990809738636, + "grad_min_sv": 6.069672152326662e-32, + "grad_condition": 160569908097.38638, + "lr": 0.0009786597487660333, + "time_sec": 167.2209074497223 + }, + { + "epoch": 15, + "train_loss": 7.6532865875244145, + "train_acc": 0.01084, + "test_loss": 4.606105514526368, + "test_acc": 0.01, + "lyapunov": 3.0689418846384036, + "grad_norm": 0.7741481577990978, + "grad_max_sv": 0.1402381032705307, + "grad_min_sv": 5.380285453775135e-40, + "grad_condition": 140238103270.5307, + "lr": 0.0009755282581475766, + "time_sec": 167.3077232837677 + }, + { + "epoch": 16, + "train_loss": 7.216664337158203, + "train_acc": 0.01118, + "test_loss": 4.606032288360596, + "test_acc": 0.01, + "lyapunov": 2.8502078891715126, + "grad_norm": 2.0735777194936222, + "grad_max_sv": 0.10496805571019649, + "grad_min_sv": 1.2874706397430962e-40, + "grad_condition": 104968055710.1965, + "lr": 0.0009721881851187403, + "time_sec": 167.3395276069641 + }, + { + "epoch": 17, + "train_loss": 8.192574862670899, + "train_acc": 0.01158, + "test_loss": 4.6059588500976565, + "test_acc": 0.01, + "lyapunov": 3.3359562454321194, + "grad_norm": 3.147348676481939, + "grad_max_sv": 0.09904798325151205, + "grad_min_sv": 3.313275631249688e-41, + "grad_condition": 99047983251.51205, + "lr": 0.0009686409947459456, + "time_sec": 167.2007658481598 + }, + { + "epoch": 18, + "train_loss": 7.947704606018067, + "train_acc": 0.01086, + "test_loss": 4.605810301208496, + "test_acc": 0.01, + "lyapunov": 3.2087259890173403, + "grad_norm": 1.1551680706222047, + "grad_max_sv": 0.0897066842764616, + "grad_min_sv": 3.5133705422167894e-42, + "grad_condition": 89706684276.4616, + "lr": 0.0009648882429441254, + "time_sec": 167.2022511959076 + }, + { + "epoch": 19, + "train_loss": 8.011894176635742, + "train_acc": 0.00998, + "test_loss": 4.610458689880371, + "test_acc": 0.01, + "lyapunov": 3.247671382201602, + "grad_norm": 0.789157877855446, + "grad_max_sv": 0.04834392946213484, + "grad_min_sv": 1.7516230804060213e-46, + "grad_condition": 48343929462.134834, + "lr": 0.00096093157579425, + "time_sec": 167.33806610107422 + }, + { + "epoch": 20, + "train_loss": 8.051023805236817, + "train_acc": 0.00904, + "test_loss": 4.610909297180176, + "test_acc": 0.01, + "lyapunov": 3.2383710405100947, + "grad_norm": 1.1273733660004814, + "grad_max_sv": 0.010316886380314827, + "grad_min_sv": 0.0, + "grad_condition": 10316886380.314827, + "lr": 0.0009567727288213001, + "time_sec": 167.29369735717773 + }, + { + "epoch": 21, + "train_loss": 7.128181716918945, + "train_acc": 0.00838, + "test_loss": 4.607191325378418, + "test_acc": 0.01, + "lyapunov": 2.7860927539103475, + "grad_norm": 1.0701329510796986, + "grad_max_sv": 0.014478291012346744, + "grad_min_sv": 0.0, + "grad_condition": 14478291012.346745, + "lr": 0.0009524135262330095, + "time_sec": 167.20805835723877 + }, + { + "epoch": 22, + "train_loss": 6.963491222686768, + "train_acc": 0.0091, + "test_loss": 4.607380027770996, + "test_acc": 0.01, + "lyapunov": 2.6966084769314818, + "grad_norm": 1.1730630244839415, + "grad_max_sv": 0.012138673383742572, + "grad_min_sv": 0.0, + "grad_condition": 12138673383.742573, + "lr": 0.0009478558801197061, + "time_sec": 167.22877049446106 + }, + { + "epoch": 23, + "train_loss": 6.875370686798096, + "train_acc": 0.00858, + "test_loss": 4.609367184448242, + "test_acc": 0.01, + "lyapunov": 2.6493814430578286, + "grad_norm": 1.3739908151868958, + "grad_max_sv": 0.011468294635415077, + "grad_min_sv": 0.0, + "grad_condition": 11468294635.415077, + "lr": 0.000943101789615607, + "time_sec": 167.56782293319702 + }, + { + "epoch": 24, + "train_loss": 7.175245254516602, + "train_acc": 0.00882, + "test_loss": 4.6075513046264645, + "test_acc": 0.01, + "lyapunov": 2.813519052837206, + "grad_norm": 1.9559849705093102, + "grad_max_sv": 0.011112797912210226, + "grad_min_sv": 0.0, + "grad_condition": 11112797912.210226, + "lr": 0.0009381533400219313, + "time_sec": 167.2002296447754 + }, + { + "epoch": 25, + "train_loss": 6.835657153320312, + "train_acc": 0.00898, + "test_loss": 4.609123987579346, + "test_acc": 0.01, + "lyapunov": 2.6257676047742216, + "grad_norm": 0.8499098981030252, + "grad_max_sv": 0.010097978403791785, + "grad_min_sv": 0.0, + "grad_condition": 10097978403.791786, + "lr": 0.0009330127018922189, + "time_sec": 167.22895908355713 + }, + { + "epoch": 26, + "train_loss": 6.806944010009766, + "train_acc": 0.00952, + "test_loss": 4.608995832824707, + "test_acc": 0.01, + "lyapunov": 2.608501203224787, + "grad_norm": 0.16959020377034753, + "grad_max_sv": 0.009534611040726304, + "grad_min_sv": 0.0, + "grad_condition": 9534611040.726305, + "lr": 0.000927682130080253, + "time_sec": 167.30368304252625 + }, + { + "epoch": 27, + "train_loss": 6.796024333190918, + "train_acc": 0.00918, + "test_loss": 4.608860453033447, + "test_acc": 0.01, + "lyapunov": 2.601986149083013, + "grad_norm": 0.10936615989500913, + "grad_max_sv": 0.003977444209158421, + "grad_min_sv": 0.0, + "grad_condition": 3977444209.1584206, + "lr": 0.0009221639627510072, + "time_sec": 167.31120085716248 + }, + { + "epoch": 28, + "train_loss": 6.799691816711426, + "train_acc": 0.00886, + "test_loss": 4.6074915008544925, + "test_acc": 0.01, + "lyapunov": 2.604261659905124, + "grad_norm": 0.09652074382540592, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009164606203550494, + "time_sec": 167.08661937713623 + }, + { + "epoch": 29, + "train_loss": 6.8092449851989745, + "train_acc": 0.00872, + "test_loss": 4.608655583190918, + "test_acc": 0.01, + "lyapunov": 2.608830842825458, + "grad_norm": 0.12376584460534797, + "grad_max_sv": 0.002880856767296791, + "grad_min_sv": 0.0, + "grad_condition": 2880856767.296791, + "lr": 0.0009105746045668516, + "time_sec": 167.20095920562744 + }, + { + "epoch": 30, + "train_loss": 6.801117441558838, + "train_acc": 0.00916, + "test_loss": 4.608566645812989, + "test_acc": 0.01, + "lyapunov": 2.605140414689203, + "grad_norm": 0.10511250252895085, + "grad_max_sv": 0.0030666613951325417, + "grad_min_sv": 0.0, + "grad_condition": 3066661395.1325417, + "lr": 0.0009045084971874733, + "time_sec": 167.22371792793274 + }, + { + "epoch": 31, + "train_loss": 6.818323947296142, + "train_acc": 0.00892, + "test_loss": 4.607396678161621, + "test_acc": 0.01, + "lyapunov": 2.6131436501622507, + "grad_norm": 0.17673479255010097, + "grad_max_sv": 0.001358983526006341, + "grad_min_sv": 0.0, + "grad_condition": 1358983526.006341, + "lr": 0.0008982649590120977, + "time_sec": 167.21490716934204 + }, + { + "epoch": 32, + "train_loss": 6.81385307510376, + "train_acc": 0.00854, + "test_loss": 4.608588083648682, + "test_acc": 0.01, + "lyapunov": 2.61087080828674, + "grad_norm": 0.1300116564110217, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008918467286629196, + "time_sec": 167.17329859733582 + }, + { + "epoch": 33, + "train_loss": 6.798595635375976, + "train_acc": 0.00848, + "test_loss": 7.428785041809082, + "test_acc": 0.01, + "lyapunov": 2.603473731623891, + "grad_norm": 0.10178851829698213, + "grad_max_sv": 0.0006682275328785181, + "grad_min_sv": 0.0, + "grad_condition": 668227532.8785181, + "lr": 0.0008852566213878943, + "time_sec": 167.23122191429138 + }, + { + "epoch": 34, + "train_loss": 6.79622100402832, + "train_acc": 0.0085, + "test_loss": 7.445402703094483, + "test_acc": 0.01, + "lyapunov": 2.602201823383341, + "grad_norm": 0.09821894401826198, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000878497527825878, + "time_sec": 167.51045203208923 + }, + { + "epoch": 35, + "train_loss": 6.800452690124512, + "train_acc": 0.0086, + "test_loss": 4.6083794067382815, + "test_acc": 0.01, + "lyapunov": 2.604824850321426, + "grad_norm": 0.09521574599597374, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000871572412738697, + "time_sec": 167.14473628997803 + }, + { + "epoch": 36, + "train_loss": 6.801179714050293, + "train_acc": 0.00882, + "test_loss": 4.608353971862793, + "test_acc": 0.01, + "lyapunov": 2.605245649357281, + "grad_norm": 0.09891258167661582, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008644843137107055, + "time_sec": 167.21640372276306 + }, + { + "epoch": 37, + "train_loss": 6.798632629699707, + "train_acc": 0.00856, + "test_loss": 4.608331527709961, + "test_acc": 0.01, + "lyapunov": 2.603703239079936, + "grad_norm": 0.09374120059954827, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008572363398164014, + "time_sec": 167.28665328025818 + }, + { + "epoch": 38, + "train_loss": 6.798052488708496, + "train_acc": 0.00864, + "test_loss": 4.608306627655029, + "test_acc": 0.01, + "lyapunov": 2.6033894985228243, + "grad_norm": 0.0928347460465077, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008498316702566826, + "time_sec": 167.22592282295227 + }, + { + "epoch": 39, + "train_loss": 6.797720238189697, + "train_acc": 0.00854, + "test_loss": 4.608331230163574, + "test_acc": 0.01, + "lyapunov": 2.6030823568553876, + "grad_norm": 0.1025783953694396, + "grad_max_sv": 0.000793654378503561, + "grad_min_sv": 0.0, + "grad_condition": 793654378.503561, + "lr": 0.0008422735529643442, + "time_sec": 167.11991024017334 + }, + { + "epoch": 40, + "train_loss": 6.796907914123535, + "train_acc": 0.00818, + "test_loss": 7.429255201721191, + "test_acc": 0.01, + "lyapunov": 2.6026227175427215, + "grad_norm": 0.09282398303274703, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008345653031794289, + "time_sec": 167.28346157073975 + }, + { + "epoch": 41, + "train_loss": 6.811164211883545, + "train_acc": 0.00882, + "test_loss": 4.7162436149597164, + "test_acc": 0.01, + "lyapunov": 2.608923517529617, + "grad_norm": 0.1222466987863888, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008267103019950526, + "time_sec": 167.2502682209015 + }, + { + "epoch": 42, + "train_loss": 6.810527358703613, + "train_acc": 0.00896, + "test_loss": 4.736723460388184, + "test_acc": 0.01, + "lyapunov": 2.6098364740991227, + "grad_norm": 0.12481417359397351, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743447, + "time_sec": 167.19833540916443 + }, + { + "epoch": 43, + "train_loss": 6.8037118544006345, + "train_acc": 0.0083, + "test_loss": 4.676154768371582, + "test_acc": 0.01, + "lyapunov": 2.606640679147237, + "grad_norm": 0.12856017826684152, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000810573890139155, + "time_sec": 167.17452216148376 + }, + { + "epoch": 44, + "train_loss": 6.794667855529785, + "train_acc": 0.00872, + "test_loss": 4.7420101188659665, + "test_acc": 0.01, + "lyapunov": 2.6012551680855127, + "grad_norm": 0.09209394266338691, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008022995574311873, + "time_sec": 167.27408933639526 + }, + { + "epoch": 45, + "train_loss": 6.7950104260253905, + "train_acc": 0.00898, + "test_loss": 4.896900399780273, + "test_acc": 0.01, + "lyapunov": 2.6014791181325303, + "grad_norm": 0.09205616000449629, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007938926261462363, + "time_sec": 167.31984734535217 + }, + { + "epoch": 46, + "train_loss": 6.819086815185547, + "train_acc": 0.00892, + "test_loss": 4.605172099304199, + "test_acc": 0.01, + "lyapunov": 2.612778242896585, + "grad_norm": 0.11562328930387418, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007853567838422158, + "time_sec": 167.12109279632568 + }, + { + "epoch": 47, + "train_loss": 6.798819590454102, + "train_acc": 0.00832, + "test_loss": 4.605172010803223, + "test_acc": 0.01, + "lyapunov": 2.6037960967139515, + "grad_norm": 0.09084227993519768, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007766957746216719, + "time_sec": 167.26839470863342 + }, + { + "epoch": 48, + "train_loss": 6.797002004394531, + "train_acc": 0.00882, + "test_loss": 4.6051717926025395, + "test_acc": 0.01, + "lyapunov": 2.6027391889820928, + "grad_norm": 0.09202982942979847, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894982, + "time_sec": 167.25185203552246 + }, + { + "epoch": 49, + "train_loss": 6.799232456512451, + "train_acc": 0.00864, + "test_loss": 4.605324877929688, + "test_acc": 0.01, + "lyapunov": 2.6040493954173134, + "grad_norm": 0.0929356327661651, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000759013504686565, + "time_sec": 167.24265789985657 + }, + { + "epoch": 50, + "train_loss": 6.812471532135009, + "train_acc": 0.00842, + "test_loss": 4.608313929748535, + "test_acc": 0.01, + "lyapunov": 2.6102352337459163, + "grad_norm": 0.11621130736417108, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007499999999999998, + "time_sec": 167.15211701393127 + }, + { + "epoch": 51, + "train_loss": 6.794671293334961, + "train_acc": 0.00842, + "test_loss": 4.605172332763672, + "test_acc": 0.01, + "lyapunov": 2.6012639694506556, + "grad_norm": 0.0930565557537395, + "grad_max_sv": 0.0036748358979821205, + "grad_min_sv": 0.0, + "grad_condition": 3674835897.9821205, + "lr": 0.0007408768370508575, + "time_sec": 167.3388113975525 + }, + { + "epoch": 52, + "train_loss": 6.799352421264649, + "train_acc": 0.00892, + "test_loss": 4.605172877502441, + "test_acc": 0.01, + "lyapunov": 2.6041594795558765, + "grad_norm": 0.09046235706111078, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007316480175599307, + "time_sec": 168.00543642044067 + }, + { + "epoch": 53, + "train_loss": 6.821222294006348, + "train_acc": 0.00822, + "test_loss": 4.605560771179199, + "test_acc": 0.01, + "lyapunov": 2.612406419061334, + "grad_norm": 0.10733736636185434, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007223175895924635, + "time_sec": 167.15741348266602 + }, + { + "epoch": 54, + "train_loss": 6.7975339453125, + "train_acc": 0.0087, + "test_loss": 4.605171894073487, + "test_acc": 0.01, + "lyapunov": 2.603086569729973, + "grad_norm": 0.09401396255246093, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825361, + "time_sec": 167.15016341209412 + }, + { + "epoch": 55, + "train_loss": 6.818788750457764, + "train_acc": 0.00834, + "test_loss": 4.60517187576294, + "test_acc": 0.01, + "lyapunov": 2.614099033653279, + "grad_norm": 0.10409203954293918, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007033683215378998, + "time_sec": 167.16365313529968 + }, + { + "epoch": 56, + "train_loss": 6.823291486663819, + "train_acc": 0.00896, + "test_loss": 4.605172322082519, + "test_acc": 0.01, + "lyapunov": 2.6149235838819345, + "grad_norm": 0.1215199933903174, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006937577932260512, + "time_sec": 167.22393465042114 + }, + { + "epoch": 57, + "train_loss": 6.812863822021485, + "train_acc": 0.00918, + "test_loss": 4.605172196197509, + "test_acc": 0.01, + "lyapunov": 2.6100745280380444, + "grad_norm": 0.11428618016798626, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423388, + "time_sec": 167.36779832839966 + }, + { + "epoch": 58, + "train_loss": 6.845285939025879, + "train_acc": 0.00852, + "test_loss": 4.605171984863281, + "test_acc": 0.01, + "lyapunov": 2.621920944784608, + "grad_norm": 0.16133795983355934, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006742860236609073, + "time_sec": 167.1204113960266 + }, + { + "epoch": 59, + "train_loss": 6.8284387295532225, + "train_acc": 0.00838, + "test_loss": 4.605172086334228, + "test_acc": 0.01, + "lyapunov": 2.619316293150568, + "grad_norm": 0.1660277007934849, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006644333233692913, + "time_sec": 167.1542353630066 + }, + { + "epoch": 60, + "train_loss": 6.853109035339355, + "train_acc": 0.00904, + "test_loss": 4.605171766662598, + "test_acc": 0.01, + "lyapunov": 2.626850544644134, + "grad_norm": 0.14505200146170139, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874734, + "time_sec": 167.25803112983704 + }, + { + "epoch": 61, + "train_loss": 6.8587484286499025, + "train_acc": 0.00894, + "test_loss": 4.605171794128418, + "test_acc": 0.01, + "lyapunov": 2.6341320041500396, + "grad_norm": 0.23780774328945256, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006445158984722354, + "time_sec": 167.1593141555786 + }, + { + "epoch": 62, + "train_loss": 6.856730157775879, + "train_acc": 0.00858, + "test_loss": 4.605171855926514, + "test_acc": 0.01, + "lyapunov": 2.6288814319064246, + "grad_norm": 0.19871702414437586, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006344599103076324, + "time_sec": 167.14994502067566 + }, + { + "epoch": 63, + "train_loss": 6.840637737731933, + "train_acc": 0.00874, + "test_loss": 4.60517123260498, + "test_acc": 0.01, + "lyapunov": 2.624538544803629, + "grad_norm": 0.2247756960679524, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824269, + "time_sec": 167.2067906856537 + }, + { + "epoch": 64, + "train_loss": 6.822744883117676, + "train_acc": 0.00848, + "test_loss": 4.60517158203125, + "test_acc": 0.01, + "lyapunov": 2.613635628424642, + "grad_norm": 0.1329153891377645, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006141754350553275, + "time_sec": 167.26912307739258 + }, + { + "epoch": 65, + "train_loss": 6.8317010522460935, + "train_acc": 0.00862, + "test_loss": 4.605171473693848, + "test_acc": 0.01, + "lyapunov": 2.6185932665529763, + "grad_norm": 0.13671337080211707, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006039558454088793, + "time_sec": 167.09261989593506 + }, + { + "epoch": 66, + "train_loss": 6.812226905822754, + "train_acc": 0.0088, + "test_loss": 4.605171728515625, + "test_acc": 0.01, + "lyapunov": 2.610206864374068, + "grad_norm": 0.12722937279819782, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000593690657292862, + "time_sec": 167.21893763542175 + }, + { + "epoch": 67, + "train_loss": 6.808111183776855, + "train_acc": 0.0093, + "test_loss": 4.6051715423583985, + "test_acc": 0.01, + "lyapunov": 2.6089447556859087, + "grad_norm": 0.15865472726238314, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005833843733580507, + "time_sec": 167.29591965675354 + }, + { + "epoch": 68, + "train_loss": 6.83726111694336, + "train_acc": 0.00862, + "test_loss": 4.605171617126465, + "test_acc": 0.01, + "lyapunov": 2.6234818724415185, + "grad_norm": 0.21106961802984933, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005730415142812054, + "time_sec": 167.22871494293213 + }, + { + "epoch": 69, + "train_loss": 6.833951936035156, + "train_acc": 0.00874, + "test_loss": 4.605171533203125, + "test_acc": 0.01, + "lyapunov": 2.6221561791646817, + "grad_norm": 0.23690960823937743, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821517, + "time_sec": 167.11618614196777 + }, + { + "epoch": 70, + "train_loss": 6.80746663269043, + "train_acc": 0.00868, + "test_loss": 4.6051711715698245, + "test_acc": 0.01, + "lyapunov": 2.608615706948673, + "grad_norm": 0.19368668238286113, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005522642316338265, + "time_sec": 167.25853991508484 + }, + { + "epoch": 71, + "train_loss": 6.840300604553223, + "train_acc": 0.00892, + "test_loss": 4.605171086120605, + "test_acc": 0.01, + "lyapunov": 2.6233106214372093, + "grad_norm": 0.21230815886405713, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005418389216661573, + "time_sec": 167.2756736278534 + }, + { + "epoch": 72, + "train_loss": 6.826620941162109, + "train_acc": 0.00886, + "test_loss": 4.605171425628662, + "test_acc": 0.01, + "lyapunov": 2.617017206328604, + "grad_norm": 0.16852859644395693, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646563, + "time_sec": 167.11485767364502 + }, + { + "epoch": 73, + "train_loss": 6.81151391418457, + "train_acc": 0.0083, + "test_loss": 4.605171309661865, + "test_acc": 0.01, + "lyapunov": 2.6109183840739454, + "grad_norm": 0.15884163876986282, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005209378268645994, + "time_sec": 167.23269772529602 + }, + { + "epoch": 74, + "train_loss": 6.803579806518555, + "train_acc": 0.00836, + "test_loss": 4.605171119689941, + "test_acc": 0.01, + "lyapunov": 2.606299752774446, + "grad_norm": 0.12416094470418608, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005104712099416781, + "time_sec": 167.30208802223206 + }, + { + "epoch": 75, + "train_loss": 6.85053612701416, + "train_acc": 0.00864, + "test_loss": 4.605171006774903, + "test_acc": 0.01, + "lyapunov": 2.6286537153336704, + "grad_norm": 0.19093915741238635, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004999999999999996, + "time_sec": 167.27450942993164 + }, + { + "epoch": 76, + "train_loss": 6.801593222961426, + "train_acc": 0.00904, + "test_loss": 4.605170780181885, + "test_acc": 0.01, + "lyapunov": 2.6054461362111905, + "grad_norm": 0.12884562844199357, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004895287900583212, + "time_sec": 167.09656834602356 + }, + { + "epoch": 77, + "train_loss": 6.796963772583008, + "train_acc": 0.00794, + "test_loss": 4.605171012878418, + "test_acc": 0.01, + "lyapunov": 2.6028354930145965, + "grad_norm": 0.09104303565016296, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004790621731353997, + "time_sec": 167.33878350257874 + }, + { + "epoch": 78, + "train_loss": 6.7984873474121095, + "train_acc": 0.00882, + "test_loss": 4.605170700073242, + "test_acc": 0.01, + "lyapunov": 2.603611297314734, + "grad_norm": 0.10157683305126329, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000468604740235343, + "time_sec": 167.25584626197815 + }, + { + "epoch": 79, + "train_loss": 6.820661872863769, + "train_acc": 0.00986, + "test_loss": 4.605170817565918, + "test_acc": 0.01, + "lyapunov": 2.612017824826643, + "grad_norm": 0.14611535298895395, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00045816107833384175, + "time_sec": 167.1672751903534 + }, + { + "epoch": 80, + "train_loss": 6.806377208557129, + "train_acc": 0.00852, + "test_loss": 4.605170895385742, + "test_acc": 0.01, + "lyapunov": 2.607236401809146, + "grad_norm": 0.10585908127422697, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004477357683661729, + "time_sec": 167.1809687614441 + }, + { + "epoch": 81, + "train_loss": 6.808554836425781, + "train_acc": 0.00942, + "test_loss": 4.605170629882813, + "test_acc": 0.01, + "lyapunov": 2.6088667123214058, + "grad_norm": 0.14379651420159803, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784746, + "time_sec": 167.25520253181458 + }, + { + "epoch": 82, + "train_loss": 6.8339071276855465, + "train_acc": 0.00906, + "test_loss": 4.605170634460449, + "test_acc": 0.01, + "lyapunov": 2.620855552766024, + "grad_norm": 0.23055639987610052, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004269584857187939, + "time_sec": 167.52204132080078 + }, + { + "epoch": 83, + "train_loss": 6.828104596252442, + "train_acc": 0.0093, + "test_loss": 4.605170736694336, + "test_acc": 0.01, + "lyapunov": 2.6192942519322076, + "grad_norm": 0.19017261102902538, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004166156266419484, + "time_sec": 167.1194040775299 + }, + { + "epoch": 84, + "train_loss": 6.808681617126465, + "train_acc": 0.0084, + "test_loss": 4.6051709182739256, + "test_acc": 0.01, + "lyapunov": 2.609468307641461, + "grad_norm": 0.15622504553249358, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004063093427071373, + "time_sec": 167.19974207878113 + }, + { + "epoch": 85, + "train_loss": 6.818397989654541, + "train_acc": 0.00824, + "test_loss": 4.605170721435547, + "test_acc": 0.01, + "lyapunov": 2.6138416312234787, + "grad_norm": 0.14833733270771185, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003960441545911199, + "time_sec": 167.2553927898407 + }, + { + "epoch": 86, + "train_loss": 6.799676761169434, + "train_acc": 0.00838, + "test_loss": 4.60517102508545, + "test_acc": 0.01, + "lyapunov": 2.604430999292437, + "grad_norm": 0.11142070053574807, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003858245649446718, + "time_sec": 167.18824887275696 + }, + { + "epoch": 87, + "train_loss": 6.818209040527344, + "train_acc": 0.00854, + "test_loss": 4.605170503997803, + "test_acc": 0.01, + "lyapunov": 2.6141847765354242, + "grad_norm": 0.14462203411441973, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00037565505641757235, + "time_sec": 167.1196677684784 + }, + { + "epoch": 88, + "train_loss": 6.874744393615723, + "train_acc": 0.00888, + "test_loss": 4.605170900726319, + "test_acc": 0.01, + "lyapunov": 2.6346183640267844, + "grad_norm": 0.20078574833508478, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036554008969236695, + "time_sec": 167.2573266029358 + }, + { + "epoch": 89, + "train_loss": 6.803292810211182, + "train_acc": 0.00886, + "test_loss": 4.60517081451416, + "test_acc": 0.01, + "lyapunov": 2.606465803082947, + "grad_norm": 0.12244758192489462, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003554841015277638, + "time_sec": 167.22969937324524 + }, + { + "epoch": 90, + "train_loss": 6.842185859069824, + "train_acc": 0.00942, + "test_loss": 4.605170654296875, + "test_acc": 0.01, + "lyapunov": 2.622050429853942, + "grad_norm": 0.1882414210254429, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000345491502812526, + "time_sec": 167.11765575408936 + }, + { + "epoch": 91, + "train_loss": 6.836290773010254, + "train_acc": 0.00882, + "test_loss": 4.605170703125, + "test_acc": 0.01, + "lyapunov": 2.619682075422438, + "grad_norm": 0.19767006125117328, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003355666766307081, + "time_sec": 167.22952795028687 + }, + { + "epoch": 92, + "train_loss": 6.791880859985351, + "train_acc": 0.00842, + "test_loss": 4.605170771789551, + "test_acc": 0.01, + "lyapunov": 2.5996962294859043, + "grad_norm": 0.08760976620030388, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00032571397633909225, + "time_sec": 167.26651191711426 + }, + { + "epoch": 93, + "train_loss": 6.80370014678955, + "train_acc": 0.00806, + "test_loss": 4.605170739746094, + "test_acc": 0.01, + "lyapunov": 2.606304941884697, + "grad_norm": 0.13940577534302254, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766094, + "time_sec": 167.17852663993835 + }, + { + "epoch": 94, + "train_loss": 6.83537752532959, + "train_acc": 0.00846, + "test_loss": 4.605170500183106, + "test_acc": 0.01, + "lyapunov": 2.623438694288054, + "grad_norm": 0.26310451945532815, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003062422067739483, + "time_sec": 167.17071175575256 + }, + { + "epoch": 95, + "train_loss": 6.799238587646484, + "train_acc": 0.00926, + "test_loss": 4.6051702911376955, + "test_acc": 0.01, + "lyapunov": 2.60419953631623, + "grad_norm": 0.10657735488339905, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00029663167846209965, + "time_sec": 167.223788022995 + }, + { + "epoch": 96, + "train_loss": 6.804974398498535, + "train_acc": 0.00916, + "test_loss": 4.605170680236816, + "test_acc": 0.01, + "lyapunov": 2.60721908383967, + "grad_norm": 0.17693273008046123, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00028711035421746345, + "time_sec": 167.2773995399475 + }, + { + "epoch": 97, + "train_loss": 6.8050346893310545, + "train_acc": 0.0086, + "test_loss": 4.605170379638672, + "test_acc": 0.01, + "lyapunov": 2.607598216332438, + "grad_norm": 0.1351166427526852, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00027768241040753615, + "time_sec": 167.0982165336609 + }, + { + "epoch": 98, + "train_loss": 6.814014775848388, + "train_acc": 0.00896, + "test_loss": 4.605170265960694, + "test_acc": 0.01, + "lyapunov": 2.611722286399978, + "grad_norm": 0.16300027920865434, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00026835198244006903, + "time_sec": 167.213885307312 + }, + { + "epoch": 99, + "train_loss": 6.810039446411133, + "train_acc": 0.00874, + "test_loss": 4.605170517730713, + "test_acc": 0.01, + "lyapunov": 2.609659137018501, + "grad_norm": 0.13742401941675986, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002591231629491421, + "time_sec": 167.23094940185547 + }, + { + "epoch": 100, + "train_loss": 6.818154907836914, + "train_acc": 0.00906, + "test_loss": 4.6051704177856445, + "test_acc": 0.01, + "lyapunov": 2.613592106363048, + "grad_norm": 0.13552057031594136, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002499999999999997, + "time_sec": 167.14863324165344 + }, + { + "epoch": 101, + "train_loss": 6.820175225524903, + "train_acc": 0.00914, + "test_loss": 4.605170472717285, + "test_acc": 0.01, + "lyapunov": 2.615781251731736, + "grad_norm": 0.1825661927434339, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00024098649531343477, + "time_sec": 167.13485431671143 + }, + { + "epoch": 102, + "train_loss": 6.843083056182861, + "train_acc": 0.00814, + "test_loss": 4.605170304107666, + "test_acc": 0.01, + "lyapunov": 2.6266718941271456, + "grad_norm": 0.28170773297668966, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002320866025105016, + "time_sec": 167.3005588054657 + }, + { + "epoch": 103, + "train_loss": 6.81555390625, + "train_acc": 0.0089, + "test_loss": 4.605170388793946, + "test_acc": 0.01, + "lyapunov": 2.6132783401957558, + "grad_norm": 0.20579070177059625, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002233042253783278, + "time_sec": 167.31917262077332 + }, + { + "epoch": 104, + "train_loss": 6.797420726623535, + "train_acc": 0.00826, + "test_loss": 4.60517056274414, + "test_acc": 0.01, + "lyapunov": 2.6031100310937827, + "grad_norm": 0.09877603372479003, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000214643216157784, + "time_sec": 167.13279914855957 + }, + { + "epoch": 105, + "train_loss": 6.825426294555664, + "train_acc": 0.00898, + "test_loss": 4.605170573425293, + "test_acc": 0.01, + "lyapunov": 2.6164557750877515, + "grad_norm": 0.23298022186302586, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376332, + "time_sec": 167.27876543998718 + }, + { + "epoch": 106, + "train_loss": 6.81034471786499, + "train_acc": 0.00862, + "test_loss": 4.605170178222656, + "test_acc": 0.01, + "lyapunov": 2.6101580525908017, + "grad_norm": 0.11576839370764984, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019770044256881242, + "time_sec": 167.24659395217896 + }, + { + "epoch": 107, + "train_loss": 6.8369368406677244, + "train_acc": 0.00846, + "test_loss": 4.605170590209961, + "test_acc": 0.01, + "lyapunov": 2.62125125931352, + "grad_norm": 0.1931519664931494, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001894261098608447, + "time_sec": 167.2057774066925 + }, + { + "epoch": 108, + "train_loss": 6.812288922576904, + "train_acc": 0.0088, + "test_loss": 4.605170223999023, + "test_acc": 0.01, + "lyapunov": 2.6103451739796593, + "grad_norm": 0.13299121884159582, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000181288005125655, + "time_sec": 167.10559225082397 + }, + { + "epoch": 109, + "train_loss": 6.797308649902344, + "train_acc": 0.00842, + "test_loss": 4.605170259094239, + "test_acc": 0.01, + "lyapunov": 2.6030520350122086, + "grad_norm": 0.09292253205333328, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001732896980049473, + "time_sec": 167.28680682182312 + }, + { + "epoch": 110, + "train_loss": 6.802461311950683, + "train_acc": 0.00886, + "test_loss": 4.605170384979248, + "test_acc": 0.01, + "lyapunov": 2.605947788414138, + "grad_norm": 0.09044100601755074, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016543469682057076, + "time_sec": 167.254047870636 + }, + { + "epoch": 111, + "train_loss": 6.800218295593262, + "train_acc": 0.00898, + "test_loss": 4.605170218658447, + "test_acc": 0.01, + "lyapunov": 2.6047815380193997, + "grad_norm": 0.09096765167841042, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 167.18093347549438 + }, + { + "epoch": 112, + "train_loss": 6.80289358581543, + "train_acc": 0.00846, + "test_loss": 4.605170321655273, + "test_acc": 0.01, + "lyapunov": 2.606188810085092, + "grad_norm": 0.11124745619391717, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 167.17500185966492 + }, + { + "epoch": 113, + "train_loss": 6.80328687286377, + "train_acc": 0.0083, + "test_loss": 4.605170209503174, + "test_acc": 0.01, + "lyapunov": 2.606580800717444, + "grad_norm": 0.1173945856600355, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 167.2652928829193 + }, + { + "epoch": 114, + "train_loss": 6.833984843902588, + "train_acc": 0.00896, + "test_loss": 4.605170062255859, + "test_acc": 0.01, + "lyapunov": 2.6208856666789337, + "grad_norm": 0.20744787133639947, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00013551568628929425, + "time_sec": 167.21882677078247 + }, + { + "epoch": 115, + "train_loss": 6.822520295410156, + "train_acc": 0.00838, + "test_loss": 4.605170328521728, + "test_acc": 0.01, + "lyapunov": 2.615956858295919, + "grad_norm": 0.14399695964710044, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 167.09929537773132 + }, + { + "epoch": 116, + "train_loss": 6.799036735839843, + "train_acc": 0.00894, + "test_loss": 4.605170152282715, + "test_acc": 0.01, + "lyapunov": 2.603793166787423, + "grad_norm": 0.10032145854595359, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 167.25386571884155 + }, + { + "epoch": 117, + "train_loss": 6.800587829284668, + "train_acc": 0.00834, + "test_loss": 4.605170477294922, + "test_acc": 0.01, + "lyapunov": 2.604958756805381, + "grad_norm": 0.11401729218950767, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 167.27676010131836 + }, + { + "epoch": 118, + "train_loss": 6.800997655029297, + "train_acc": 0.0088, + "test_loss": 4.605170313262939, + "test_acc": 0.01, + "lyapunov": 2.6053062838971464, + "grad_norm": 0.10865983471852475, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010815327133708009, + "time_sec": 167.16999578475952 + }, + { + "epoch": 119, + "train_loss": 6.800622797088623, + "train_acc": 0.0082, + "test_loss": 4.605170126342774, + "test_acc": 0.01, + "lyapunov": 2.604655019462566, + "grad_norm": 0.12369520749734833, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010173504098790182, + "time_sec": 167.13503623008728 + }, + { + "epoch": 120, + "train_loss": 6.795711727905274, + "train_acc": 0.00866, + "test_loss": 4.60517028503418, + "test_acc": 0.01, + "lyapunov": 2.602085701949761, + "grad_norm": 0.08734190443194187, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 167.28283619880676 + }, + { + "epoch": 121, + "train_loss": 6.796959948425293, + "train_acc": 0.0093, + "test_loss": 4.605170495605469, + "test_acc": 0.01, + "lyapunov": 2.6028400558949736, + "grad_norm": 0.08752194617001091, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 167.22894525527954 + }, + { + "epoch": 122, + "train_loss": 6.80965912033081, + "train_acc": 0.00928, + "test_loss": 4.605170267486573, + "test_acc": 0.01, + "lyapunov": 2.6096866935720224, + "grad_norm": 0.11691201011842964, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 167.16074228286743 + }, + { + "epoch": 123, + "train_loss": 6.817136254882812, + "train_acc": 0.00856, + "test_loss": 4.605170227050781, + "test_acc": 0.01, + "lyapunov": 2.6124652438151563, + "grad_norm": 0.1550769682935547, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 167.20862245559692 + }, + { + "epoch": 124, + "train_loss": 6.797611290588379, + "train_acc": 0.0096, + "test_loss": 4.605170072174072, + "test_acc": 0.01, + "lyapunov": 2.603274511864118, + "grad_norm": 0.10698377372823001, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 167.24812293052673 + }, + { + "epoch": 125, + "train_loss": 6.811994839477539, + "train_acc": 0.00868, + "test_loss": 4.605170003509522, + "test_acc": 0.01, + "lyapunov": 2.6103333463449307, + "grad_norm": 0.14234235939730758, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 167.15956830978394 + }, + { + "epoch": 126, + "train_loss": 6.799865046234131, + "train_acc": 0.00862, + "test_loss": 4.605170318603515, + "test_acc": 0.01, + "lyapunov": 2.604667879431449, + "grad_norm": 0.09265194462378636, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 167.1222221851349 + }, + { + "epoch": 127, + "train_loss": 6.804667163391113, + "train_acc": 0.00886, + "test_loss": 4.605170178985595, + "test_acc": 0.01, + "lyapunov": 2.60723816342366, + "grad_norm": 0.09360794490801955, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 167.1491777896881 + }, + { + "epoch": 128, + "train_loss": 6.803801723480225, + "train_acc": 0.0089, + "test_loss": 4.605170277404786, + "test_acc": 0.01, + "lyapunov": 2.606579548867462, + "grad_norm": 0.10479682515434138, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 167.26385951042175 + }, + { + "epoch": 129, + "train_loss": 6.7995252819824215, + "train_acc": 0.0085, + "test_loss": 4.605170484924316, + "test_acc": 0.01, + "lyapunov": 2.604231426478042, + "grad_norm": 0.08941205723411079, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 167.30450534820557 + }, + { + "epoch": 130, + "train_loss": 6.821313883209228, + "train_acc": 0.00852, + "test_loss": 4.605170134735108, + "test_acc": 0.01, + "lyapunov": 2.615080727335742, + "grad_norm": 0.1662641683208483, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 167.14770483970642 + }, + { + "epoch": 131, + "train_loss": 6.795292775421142, + "train_acc": 0.00846, + "test_loss": 4.605170323944092, + "test_acc": 0.01, + "lyapunov": 2.601862790944326, + "grad_norm": 0.11411966381332427, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 167.2135558128357 + }, + { + "epoch": 132, + "train_loss": 6.796047713775635, + "train_acc": 0.00904, + "test_loss": 4.6051700454711915, + "test_acc": 0.01, + "lyapunov": 2.602336645736109, + "grad_norm": 0.08834944397480328, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 167.23654413223267 + }, + { + "epoch": 133, + "train_loss": 6.799664002380371, + "train_acc": 0.00904, + "test_loss": 4.605170405578614, + "test_acc": 0.01, + "lyapunov": 2.6045111707409325, + "grad_norm": 0.08768823633488758, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 167.25386261940002 + }, + { + "epoch": 134, + "train_loss": 6.799534449920654, + "train_acc": 0.00966, + "test_loss": 4.605170095825195, + "test_acc": 0.01, + "lyapunov": 2.604433027374775, + "grad_norm": 0.08880059006188033, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 167.089768409729 + }, + { + "epoch": 135, + "train_loss": 6.816852741394043, + "train_acc": 0.00922, + "test_loss": 4.6051704139709475, + "test_acc": 0.01, + "lyapunov": 2.6120451417420525, + "grad_norm": 0.1344230192150204, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 167.21077299118042 + }, + { + "epoch": 136, + "train_loss": 6.79835750869751, + "train_acc": 0.01, + "test_loss": 4.60517020111084, + "test_acc": 0.01, + "lyapunov": 2.6037550874988136, + "grad_norm": 0.09237399837874004, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 167.25671005249023 + }, + { + "epoch": 137, + "train_loss": 6.799135870971679, + "train_acc": 0.00948, + "test_loss": 4.605170085144043, + "test_acc": 0.01, + "lyapunov": 2.6042151554771094, + "grad_norm": 0.08937220866741212, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 167.19218349456787 + }, + { + "epoch": 138, + "train_loss": 6.824215604553222, + "train_acc": 0.01, + "test_loss": 4.605170098876953, + "test_acc": 0.01, + "lyapunov": 2.616335995666816, + "grad_norm": 0.10994228945768546, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 167.09943842887878 + }, + { + "epoch": 139, + "train_loss": 6.802577704467773, + "train_acc": 0.01, + "test_loss": 4.605170218658447, + "test_acc": 0.01, + "lyapunov": 2.6062524855289313, + "grad_norm": 0.09042623460420336, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 167.20513486862183 + }, + { + "epoch": 140, + "train_loss": 6.7961073709106445, + "train_acc": 0.01, + "test_loss": 4.605170453643799, + "test_acc": 0.01, + "lyapunov": 2.602320309490194, + "grad_norm": 0.08815797205742677, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 167.25681805610657 + }, + { + "epoch": 141, + "train_loss": 6.797138239898682, + "train_acc": 0.01, + "test_loss": 4.605170432281494, + "test_acc": 0.01, + "lyapunov": 2.6029675891027426, + "grad_norm": 0.0879981627311107, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 167.06548428535461 + }, + { + "epoch": 142, + "train_loss": 6.801417353363037, + "train_acc": 0.01, + "test_loss": 4.605170329284668, + "test_acc": 0.01, + "lyapunov": 2.605164134593876, + "grad_norm": 0.08843743115572271, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 167.19282054901123 + }, + { + "epoch": 143, + "train_loss": 6.799633148193359, + "train_acc": 0.01, + "test_loss": 4.6051702880859375, + "test_acc": 0.01, + "lyapunov": 2.6045726491972006, + "grad_norm": 0.09210601924786092, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 167.22217631340027 + }, + { + "epoch": 144, + "train_loss": 6.799774599914551, + "train_acc": 0.01, + "test_loss": 4.605170209503174, + "test_acc": 0.01, + "lyapunov": 2.6046122669258995, + "grad_norm": 0.08889860655727871, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 167.18017983436584 + }, + { + "epoch": 145, + "train_loss": 6.7985524331665035, + "train_acc": 0.01, + "test_loss": 4.6051704223632814, + "test_acc": 0.01, + "lyapunov": 2.6038548361005076, + "grad_norm": 0.08800873662125164, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 167.10364723205566 + }, + { + "epoch": 146, + "train_loss": 6.797061258239746, + "train_acc": 0.01, + "test_loss": 4.605170094299316, + "test_acc": 0.01, + "lyapunov": 2.6029466247314685, + "grad_norm": 0.08767630908448117, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 167.13109254837036 + }, + { + "epoch": 147, + "train_loss": 6.7999437774658205, + "train_acc": 0.01, + "test_loss": 4.605170198059082, + "test_acc": 0.01, + "lyapunov": 2.6046864193723636, + "grad_norm": 0.08792294865681417, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 167.20970582962036 + }, + { + "epoch": 148, + "train_loss": 6.798582576293946, + "train_acc": 0.01, + "test_loss": 4.605170455932617, + "test_acc": 0.01, + "lyapunov": 2.6038761730389215, + "grad_norm": 0.09215822971292409, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 167.12604355812073 + }, + { + "epoch": 149, + "train_loss": 6.796307967529297, + "train_acc": 0.01, + "test_loss": 4.605170027923584, + "test_acc": 0.01, + "lyapunov": 2.6024758651128512, + "grad_norm": 0.08782242943220565, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 167.15288949012756 + }, + { + "epoch": 150, + "train_loss": 6.797921124420166, + "train_acc": 0.01, + "test_loss": 4.6051702972412105, + "test_acc": 0.01, + "lyapunov": 2.6034922130272515, + "grad_norm": 0.08768432297346943, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 167.14476084709167 + } + ], + "20": [ + { + "epoch": 1, + "train_loss": 15.093960892944336, + "train_acc": 0.01476, + "test_loss": 4.694812010192871, + "test_acc": 0.0101, + "lyapunov": 5.28920032362194, + "grad_norm": 5.920792423737725, + "grad_max_sv": 4.9676717877388, + "grad_min_sv": 8.119859199878787e-08, + "grad_condition": 1111289730.0106924, + "lr": 0.0009998903417374227, + "time_sec": 210.120050907135 + }, + { + "epoch": 2, + "train_loss": 9.793692145080566, + "train_acc": 0.01708, + "test_loss": 4.630818698120117, + "test_acc": 0.0101, + "lyapunov": 3.9491244813670283, + "grad_norm": 4.179099264712139, + "grad_max_sv": 3.6389390349388124, + "grad_min_sv": 4.435643456510846e-08, + "grad_condition": 1465465238.7805393, + "lr": 0.0009995614150494292, + "time_sec": 210.1432433128357 + }, + { + "epoch": 3, + "train_loss": 9.864517554931641, + "train_acc": 0.01526, + "test_loss": 4.635793448638916, + "test_acc": 0.01, + "lyapunov": 4.013264959120689, + "grad_norm": 3.461175130912805, + "grad_max_sv": 3.00231654047966, + "grad_min_sv": 7.094927521799298e-09, + "grad_condition": 151743845631.83978, + "lr": 0.0009990133642141358, + "time_sec": 210.18036890029907 + }, + { + "epoch": 4, + "train_loss": 9.012857937622071, + "train_acc": 0.01522, + "test_loss": 4.623633129882813, + "test_acc": 0.01, + "lyapunov": 3.700052426599176, + "grad_norm": 2.6286152850939577, + "grad_max_sv": 2.296706238389015, + "grad_min_sv": 3.159897203264806e-11, + "grad_condition": 343973728227.78937, + "lr": 0.0009982464296247522, + "time_sec": 210.1404571533203 + }, + { + "epoch": 5, + "train_loss": 8.190340083312988, + "train_acc": 0.0141, + "test_loss": 4.620581848144531, + "test_acc": 0.01, + "lyapunov": 3.3428353769395054, + "grad_norm": 1.8058911521537262, + "grad_max_sv": 1.3938701748847961, + "grad_min_sv": 9.547992879409192e-12, + "grad_condition": 323805955248.2424, + "lr": 0.0009972609476841367, + "time_sec": 210.12661004066467 + }, + { + "epoch": 6, + "train_loss": 7.759998917236328, + "train_acc": 0.01288, + "test_loss": 4.617343115997315, + "test_acc": 0.01, + "lyapunov": 3.1374943689312165, + "grad_norm": 1.7534337420481565, + "grad_max_sv": 0.9646675065159919, + "grad_min_sv": 2.9231036572180592e-12, + "grad_condition": 375265614590.23444, + "lr": 0.000996057350657239, + "time_sec": 210.0431251525879 + }, + { + "epoch": 7, + "train_loss": 7.5100171649169924, + "train_acc": 0.01298, + "test_loss": 4.613992894744873, + "test_acc": 0.01, + "lyapunov": 3.009886204434173, + "grad_norm": 1.2599904723678697, + "grad_max_sv": 0.683513353765011, + "grad_min_sv": 2.034050211148161e-12, + "grad_condition": 321368791479.6951, + "lr": 0.000994636166481494, + "time_sec": 210.03102850914001 + }, + { + "epoch": 8, + "train_loss": 7.526667755889893, + "train_acc": 0.0137, + "test_loss": 4.6132587142944335, + "test_acc": 0.01, + "lyapunov": 3.020487799973744, + "grad_norm": 1.4149077024298684, + "grad_max_sv": 0.43169260323047637, + "grad_min_sv": 1.314155534129329e-12, + "grad_condition": 228604061031.44318, + "lr": 0.0009929980185352525, + "time_sec": 210.09079957008362 + }, + { + "epoch": 9, + "train_loss": 7.424001091003418, + "train_acc": 0.0139, + "test_loss": 4.612518185424805, + "test_acc": 0.01, + "lyapunov": 2.9646140498578397, + "grad_norm": 1.4854391503992914, + "grad_max_sv": 0.39994182234216435, + "grad_min_sv": 7.056669271977351e-13, + "grad_condition": 272585344238.14337, + "lr": 0.0009911436253643444, + "time_sec": 210.04538559913635 + }, + { + "epoch": 10, + "train_loss": 7.422507609710693, + "train_acc": 0.01292, + "test_loss": 4.612365335083008, + "test_acc": 0.01, + "lyapunov": 2.9684851279344096, + "grad_norm": 1.4578891690299673, + "grad_max_sv": 0.3333915390074253, + "grad_min_sv": 5.315411665648874e-13, + "grad_condition": 252944829203.9721, + "lr": 0.0009890738003669028, + "time_sec": 210.01400017738342 + }, + { + "epoch": 11, + "train_loss": 7.279168519592285, + "train_acc": 0.01416, + "test_loss": 4.605921854400635, + "test_acc": 0.01, + "lyapunov": 2.8905254178644753, + "grad_norm": 1.1550117670507138, + "grad_max_sv": 0.26091913171112535, + "grad_min_sv": 1.5622282665285416e-13, + "grad_condition": 237845802721.57803, + "lr": 0.00098678945143658, + "time_sec": 210.0479826927185 + }, + { + "epoch": 12, + "train_loss": 7.238350921325684, + "train_acc": 0.01288, + "test_loss": 4.6059690254211425, + "test_acc": 0.01, + "lyapunov": 2.870093943212953, + "grad_norm": 1.2092537765879001, + "grad_max_sv": 0.2273966234177351, + "grad_min_sv": 2.126834221214877e-15, + "grad_condition": 226904883800.9376, + "lr": 0.0009842915805643154, + "time_sec": 210.02421975135803 + }, + { + "epoch": 13, + "train_loss": 7.237049304504395, + "train_acc": 0.0122, + "test_loss": 4.606073367309571, + "test_acc": 0.01, + "lyapunov": 2.8677229795919357, + "grad_norm": 1.945360181719986, + "grad_max_sv": 0.19105065988258402, + "grad_min_sv": 7.58301405160596e-16, + "grad_condition": 190882486106.46655, + "lr": 0.000981581283398829, + "time_sec": 209.9947109222412 + }, + { + "epoch": 14, + "train_loss": 7.725393817138672, + "train_acc": 0.01264, + "test_loss": 5.5369372573852536, + "test_acc": 0.0157, + "lyapunov": 3.1145479276661985, + "grad_norm": 3.5850673850910875, + "grad_max_sv": 0.13178386465706673, + "grad_min_sv": 1.7957017814409413e-15, + "grad_condition": 131460341909.11662, + "lr": 0.0009786597487660333, + "time_sec": 210.06614232063293 + }, + { + "epoch": 15, + "train_loss": 7.938173998718262, + "train_acc": 0.0112, + "test_loss": 4.605860107421875, + "test_acc": 0.01, + "lyapunov": 3.22320399442902, + "grad_norm": 1.470918431013692, + "grad_max_sv": 0.13412793046313495, + "grad_min_sv": 1.3123556012424532e-27, + "grad_condition": 134127930463.13481, + "lr": 0.0009755282581475766, + "time_sec": 210.01092720031738 + }, + { + "epoch": 16, + "train_loss": 7.877476094970703, + "train_acc": 0.01078, + "test_loss": 4.605639274597168, + "test_acc": 0.01, + "lyapunov": 3.1950507353028983, + "grad_norm": 1.136967603821004, + "grad_max_sv": 0.11695587523281574, + "grad_min_sv": 5.493959932514282e-37, + "grad_condition": 116955875232.81572, + "lr": 0.0009721881851187403, + "time_sec": 210.03272008895874 + }, + { + "epoch": 17, + "train_loss": 7.939653808288575, + "train_acc": 0.01054, + "test_loss": 4.60557441482544, + "test_acc": 0.01, + "lyapunov": 3.220062300982073, + "grad_norm": 1.7456145739471243, + "grad_max_sv": 0.09164720228873194, + "grad_min_sv": 2.1019476964872255e-46, + "grad_condition": 91647202288.73193, + "lr": 0.0009686409947459456, + "time_sec": 210.02848625183105 + }, + { + "epoch": 18, + "train_loss": 7.52693728515625, + "train_acc": 0.0113, + "test_loss": 4.605569499206543, + "test_acc": 0.01, + "lyapunov": 3.0156563999097976, + "grad_norm": 2.4071740405774276, + "grad_max_sv": 0.08130668587982655, + "grad_min_sv": 4.554220009055656e-46, + "grad_condition": 81306685879.82654, + "lr": 0.0009648882429441254, + "time_sec": 210.00972390174866 + }, + { + "epoch": 19, + "train_loss": 7.715430914611816, + "train_acc": 0.0111, + "test_loss": 4.605534184265137, + "test_acc": 0.01, + "lyapunov": 3.1088165675892547, + "grad_norm": 2.6762849936508677, + "grad_max_sv": 0.042965149600058795, + "grad_min_sv": 3.503246160812043e-47, + "grad_condition": 42965149600.05879, + "lr": 0.00096093157579425, + "time_sec": 209.9727280139923 + }, + { + "epoch": 20, + "train_loss": 7.460425003356933, + "train_acc": 0.0111, + "test_loss": 7.111512740325928, + "test_acc": 0.01, + "lyapunov": 2.9692358793809897, + "grad_norm": 2.853254134437055, + "grad_max_sv": 0.050038989260792734, + "grad_min_sv": 2.5374011942761624e-43, + "grad_condition": 50038989260.792725, + "lr": 0.0009567727288213001, + "time_sec": 210.01186299324036 + }, + { + "epoch": 21, + "train_loss": 7.205679086456299, + "train_acc": 0.0091, + "test_loss": 7.044362417602539, + "test_acc": 0.01, + "lyapunov": 2.8364865828658004, + "grad_norm": 3.3061229521295945, + "grad_max_sv": 0.02213773485273123, + "grad_min_sv": 0.0, + "grad_condition": 22137734852.731228, + "lr": 0.0009524135262330095, + "time_sec": 209.98502397537231 + }, + { + "epoch": 22, + "train_loss": 7.1949261268615725, + "train_acc": 0.0098, + "test_loss": 4.605458296203613, + "test_acc": 0.01, + "lyapunov": 2.8206752724659716, + "grad_norm": 6.972340571186882, + "grad_max_sv": 0.02202093116939068, + "grad_min_sv": 0.0, + "grad_condition": 22020931169.39068, + "lr": 0.0009478558801197061, + "time_sec": 209.94458675384521 + }, + { + "epoch": 23, + "train_loss": 7.115987669677734, + "train_acc": 0.00996, + "test_loss": 6.645735456848144, + "test_acc": 0.01, + "lyapunov": 2.7744642029637876, + "grad_norm": 7.989108672811228, + "grad_max_sv": 0.011007561534643173, + "grad_min_sv": 0.0, + "grad_condition": 11007561534.643173, + "lr": 0.000943101789615607, + "time_sec": 209.97865319252014 + }, + { + "epoch": 24, + "train_loss": 7.058884606628418, + "train_acc": 0.00872, + "test_loss": 6.569473106384278, + "test_acc": 0.01, + "lyapunov": 2.745215448881964, + "grad_norm": 5.5094378668531405, + "grad_max_sv": 0.01464888285845518, + "grad_min_sv": 0.0, + "grad_condition": 14648882858.455181, + "lr": 0.0009381533400219313, + "time_sec": 210.0189917087555 + }, + { + "epoch": 25, + "train_loss": 7.515213393859863, + "train_acc": 0.01036, + "test_loss": 4.605401533508301, + "test_acc": 0.01, + "lyapunov": 3.0008729113947097, + "grad_norm": 2.870644125398128, + "grad_max_sv": 0.07644851161090856, + "grad_min_sv": 3.1529215447308385e-46, + "grad_condition": 76448511610.90854, + "lr": 0.0009330127018922189, + "time_sec": 210.00069952011108 + }, + { + "epoch": 26, + "train_loss": 7.552015746002197, + "train_acc": 0.01018, + "test_loss": 4.605392645263672, + "test_acc": 0.01, + "lyapunov": 3.0268727373284148, + "grad_norm": 1.9702867287865506, + "grad_max_sv": 0.07252425029873848, + "grad_min_sv": 1.0509738482436128e-46, + "grad_condition": 72524250298.73848, + "lr": 0.000927682130080253, + "time_sec": 210.00505328178406 + }, + { + "epoch": 27, + "train_loss": 7.204120320739746, + "train_acc": 0.00916, + "test_loss": 4.605300965118408, + "test_acc": 0.01, + "lyapunov": 2.8272059610127793, + "grad_norm": 2.304850056236489, + "grad_max_sv": 0.002205173298716545, + "grad_min_sv": 0.0, + "grad_condition": 2205173298.716545, + "lr": 0.0009221639627510072, + "time_sec": 210.04179668426514 + }, + { + "epoch": 28, + "train_loss": 7.194927945556641, + "train_acc": 0.00832, + "test_loss": 5.018761894989014, + "test_acc": 0.01, + "lyapunov": 2.834069358723243, + "grad_norm": 2.6612819081862673, + "grad_max_sv": 0.007065491378307342, + "grad_min_sv": 0.0, + "grad_condition": 7065491378.307343, + "lr": 0.0009164606203550494, + "time_sec": 209.9864535331726 + }, + { + "epoch": 29, + "train_loss": 7.058241820373535, + "train_acc": 0.0089, + "test_loss": 4.605222779083252, + "test_acc": 0.01, + "lyapunov": 2.7548481247309224, + "grad_norm": 1.6469496155298196, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009105746045668516, + "time_sec": 209.949223279953 + }, + { + "epoch": 30, + "train_loss": 6.992346358947754, + "train_acc": 0.00846, + "test_loss": 5.288449756622314, + "test_acc": 0.01, + "lyapunov": 2.7193446976449485, + "grad_norm": 0.12148601528604053, + "grad_max_sv": 0.010588385537266732, + "grad_min_sv": 0.0, + "grad_condition": 10588385537.266731, + "lr": 0.0009045084971874733, + "time_sec": 209.9674859046936 + }, + { + "epoch": 31, + "train_loss": 6.981909171295166, + "train_acc": 0.0089, + "test_loss": 5.256688010406494, + "test_acc": 0.01, + "lyapunov": 2.713971863622251, + "grad_norm": 0.1172841827453055, + "grad_max_sv": 0.004473739862442016, + "grad_min_sv": 0.0, + "grad_condition": 4473739862.442017, + "lr": 0.0008982649590120977, + "time_sec": 210.0011682510376 + }, + { + "epoch": 32, + "train_loss": 6.981826614379883, + "train_acc": 0.00878, + "test_loss": 5.260603121185302, + "test_acc": 0.01, + "lyapunov": 2.714321748679861, + "grad_norm": 0.09952710953666385, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008918467286629196, + "time_sec": 209.97604823112488 + }, + { + "epoch": 33, + "train_loss": 6.99227462890625, + "train_acc": 0.00872, + "test_loss": 5.264018801879883, + "test_acc": 0.01, + "lyapunov": 2.7198148792052206, + "grad_norm": 0.10982760460792622, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008852566213878943, + "time_sec": 209.99684286117554 + }, + { + "epoch": 34, + "train_loss": 6.985566412353515, + "train_acc": 0.00828, + "test_loss": 5.252056950378418, + "test_acc": 0.01, + "lyapunov": 2.71640632646468, + "grad_norm": 0.0980287254251016, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000878497527825878, + "time_sec": 209.97523665428162 + }, + { + "epoch": 35, + "train_loss": 6.983518271942138, + "train_acc": 0.00802, + "test_loss": 5.235891506958008, + "test_acc": 0.01, + "lyapunov": 2.7152942220878113, + "grad_norm": 0.098301014644246, + "grad_max_sv": 0.010264468565583228, + "grad_min_sv": 0.0, + "grad_condition": 10264468565.58323, + "lr": 0.000871572412738697, + "time_sec": 209.92434358596802 + }, + { + "epoch": 36, + "train_loss": 7.056292109069824, + "train_acc": 0.00856, + "test_loss": 5.234983450317383, + "test_acc": 0.01, + "lyapunov": 2.7453303550515336, + "grad_norm": 0.16314843571536908, + "grad_max_sv": 0.004481474310159684, + "grad_min_sv": 0.0, + "grad_condition": 4481474310.159683, + "lr": 0.0008644843137107055, + "time_sec": 209.98300409317017 + }, + { + "epoch": 37, + "train_loss": 7.04465570388794, + "train_acc": 0.00922, + "test_loss": 4.60517428894043, + "test_acc": 0.01, + "lyapunov": 2.7430449416265463, + "grad_norm": 0.3622526875575334, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008572363398164014, + "time_sec": 209.93617868423462 + }, + { + "epoch": 38, + "train_loss": 6.99952162109375, + "train_acc": 0.00886, + "test_loss": 4.605173640441895, + "test_acc": 0.01, + "lyapunov": 2.7234638078743236, + "grad_norm": 0.13703797479309945, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008498316702566826, + "time_sec": 209.95248365402222 + }, + { + "epoch": 39, + "train_loss": 7.040763073120117, + "train_acc": 0.00844, + "test_loss": 4.605174145507813, + "test_acc": 0.01, + "lyapunov": 2.7378825531591233, + "grad_norm": 0.1820768645877041, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008422735529643442, + "time_sec": 209.9344642162323 + }, + { + "epoch": 40, + "train_loss": 7.0346226399230956, + "train_acc": 0.0086, + "test_loss": 4.6051736892700195, + "test_acc": 0.01, + "lyapunov": 2.7368516513453724, + "grad_norm": 0.16922090716634502, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008345653031794289, + "time_sec": 209.97976160049438 + }, + { + "epoch": 41, + "train_loss": 7.102251969604493, + "train_acc": 0.00846, + "test_loss": 4.605173461914062, + "test_acc": 0.01, + "lyapunov": 2.764533970362085, + "grad_norm": 0.2796669100517588, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008267103019950526, + "time_sec": 209.97592854499817 + }, + { + "epoch": 42, + "train_loss": 6.989806396331787, + "train_acc": 0.00866, + "test_loss": 4.605173326110839, + "test_acc": 0.01, + "lyapunov": 2.718248601459786, + "grad_norm": 0.11817449733439238, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743447, + "time_sec": 209.91329216957092 + }, + { + "epoch": 43, + "train_loss": 6.980831128997803, + "train_acc": 0.00798, + "test_loss": 4.605173022460938, + "test_acc": 0.01, + "lyapunov": 2.713783808071595, + "grad_norm": 0.09538783881391288, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000810573890139155, + "time_sec": 209.95550656318665 + }, + { + "epoch": 44, + "train_loss": 6.979222456054687, + "train_acc": 0.00884, + "test_loss": 4.605172604370117, + "test_acc": 0.01, + "lyapunov": 2.712872148474769, + "grad_norm": 0.0919946830154422, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008022995574311873, + "time_sec": 209.928706407547 + }, + { + "epoch": 45, + "train_loss": 6.981346151428222, + "train_acc": 0.00856, + "test_loss": 4.605171971130371, + "test_acc": 0.01, + "lyapunov": 2.7140665036028304, + "grad_norm": 0.09306477436154323, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007938926261462363, + "time_sec": 209.92562985420227 + }, + { + "epoch": 46, + "train_loss": 6.981760795288086, + "train_acc": 0.0086, + "test_loss": 4.605172605133057, + "test_acc": 0.01, + "lyapunov": 2.714427888850727, + "grad_norm": 0.08970786008826526, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007853567838422158, + "time_sec": 210.02350616455078 + }, + { + "epoch": 47, + "train_loss": 7.014443389587402, + "train_acc": 0.0088, + "test_loss": 4.605172411346436, + "test_acc": 0.01, + "lyapunov": 2.728213080969613, + "grad_norm": 0.1697709047839743, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007766957746216719, + "time_sec": 209.98714351654053 + }, + { + "epoch": 48, + "train_loss": 6.98308254486084, + "train_acc": 0.0088, + "test_loss": 4.605172724151611, + "test_acc": 0.01, + "lyapunov": 2.7148986033466467, + "grad_norm": 0.10089096056823664, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894982, + "time_sec": 209.9425868988037 + }, + { + "epoch": 49, + "train_loss": 6.981540090026855, + "train_acc": 0.00806, + "test_loss": 4.610235414886475, + "test_acc": 0.01, + "lyapunov": 2.714101230396944, + "grad_norm": 0.09707765972227518, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000759013504686565, + "time_sec": 210.01923370361328 + }, + { + "epoch": 50, + "train_loss": 7.012723862762451, + "train_acc": 0.0088, + "test_loss": 4.6051725616455075, + "test_acc": 0.01, + "lyapunov": 2.729266738037929, + "grad_norm": 0.1358370231708399, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007499999999999998, + "time_sec": 209.99068450927734 + }, + { + "epoch": 51, + "train_loss": 7.017712171630859, + "train_acc": 0.00878, + "test_loss": 4.60517274017334, + "test_acc": 0.01, + "lyapunov": 2.729401938445733, + "grad_norm": 0.13779403599934203, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007408768370508575, + "time_sec": 210.01132082939148 + }, + { + "epoch": 52, + "train_loss": 6.98579848815918, + "train_acc": 0.00862, + "test_loss": 4.605172367095947, + "test_acc": 0.01, + "lyapunov": 2.7164978974920406, + "grad_norm": 0.11440777465495124, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007316480175599307, + "time_sec": 209.96309852600098 + }, + { + "epoch": 53, + "train_loss": 6.980713491516113, + "train_acc": 0.0088, + "test_loss": 4.605172201538086, + "test_acc": 0.01, + "lyapunov": 2.7136193919364753, + "grad_norm": 0.0963297125293723, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007223175895924635, + "time_sec": 210.0020875930786 + }, + { + "epoch": 54, + "train_loss": 6.9838667016601566, + "train_acc": 0.00856, + "test_loss": 4.605172233581543, + "test_acc": 0.01, + "lyapunov": 2.715499324871756, + "grad_norm": 0.1368676120419564, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825361, + "time_sec": 209.94060635566711 + }, + { + "epoch": 55, + "train_loss": 6.983624946899414, + "train_acc": 0.00906, + "test_loss": 4.605171611022949, + "test_acc": 0.01, + "lyapunov": 2.7151694712431533, + "grad_norm": 0.1214142336589057, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007033683215378998, + "time_sec": 209.92118954658508 + }, + { + "epoch": 56, + "train_loss": 6.996163428649902, + "train_acc": 0.00826, + "test_loss": 4.60517228012085, + "test_acc": 0.01, + "lyapunov": 2.721804239560881, + "grad_norm": 0.13635707009394835, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006937577932260512, + "time_sec": 210.05888557434082 + }, + { + "epoch": 57, + "train_loss": 6.9852110571289066, + "train_acc": 0.00888, + "test_loss": 4.6051725509643555, + "test_acc": 0.01, + "lyapunov": 2.7162836719961727, + "grad_norm": 0.09827989868248155, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423388, + "time_sec": 210.03313207626343 + }, + { + "epoch": 58, + "train_loss": 6.990598773498535, + "train_acc": 0.0087, + "test_loss": 4.605171973419189, + "test_acc": 0.01, + "lyapunov": 2.718923308355424, + "grad_norm": 0.11245505032562926, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006742860236609073, + "time_sec": 210.20554780960083 + }, + { + "epoch": 59, + "train_loss": 6.990819956512452, + "train_acc": 0.00914, + "test_loss": 4.605172409057618, + "test_acc": 0.01, + "lyapunov": 2.719175950950369, + "grad_norm": 0.11267799994144367, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006644333233692913, + "time_sec": 210.00883507728577 + }, + { + "epoch": 60, + "train_loss": 7.063073814697265, + "train_acc": 0.00868, + "test_loss": 4.605172189331054, + "test_acc": 0.01, + "lyapunov": 2.7483064634415806, + "grad_norm": 0.18267690644430695, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874734, + "time_sec": 210.0396704673767 + }, + { + "epoch": 61, + "train_loss": 6.994184250183105, + "train_acc": 0.00868, + "test_loss": 4.605171653747559, + "test_acc": 0.01, + "lyapunov": 2.7201892951565325, + "grad_norm": 0.1215511744322559, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006445158984722354, + "time_sec": 210.01424837112427 + }, + { + "epoch": 62, + "train_loss": 7.032484904479981, + "train_acc": 0.00918, + "test_loss": 4.605172390747071, + "test_acc": 0.01, + "lyapunov": 2.7373275226339353, + "grad_norm": 0.20957283019702622, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006344599103076324, + "time_sec": 210.07943868637085 + }, + { + "epoch": 63, + "train_loss": 6.997943234863281, + "train_acc": 0.00816, + "test_loss": 4.6051715438842775, + "test_acc": 0.01, + "lyapunov": 2.722739946506822, + "grad_norm": 0.14325925108066898, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824269, + "time_sec": 210.0124545097351 + }, + { + "epoch": 64, + "train_loss": 7.036040018615723, + "train_acc": 0.00846, + "test_loss": 4.6051715461730955, + "test_acc": 0.01, + "lyapunov": 2.737502407234953, + "grad_norm": 0.1852649849094369, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006141754350553275, + "time_sec": 210.16446352005005 + }, + { + "epoch": 65, + "train_loss": 6.987151607818603, + "train_acc": 0.00856, + "test_loss": 4.605171313476562, + "test_acc": 0.01, + "lyapunov": 2.717369063126157, + "grad_norm": 0.11469395705842762, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006039558454088793, + "time_sec": 210.01318955421448 + }, + { + "epoch": 66, + "train_loss": 7.095058049316406, + "train_acc": 0.0084, + "test_loss": 4.605171440124511, + "test_acc": 0.01, + "lyapunov": 2.76260655432406, + "grad_norm": 0.38302198809757837, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000593690657292862, + "time_sec": 209.99922275543213 + }, + { + "epoch": 67, + "train_loss": 6.990951052246094, + "train_acc": 0.00822, + "test_loss": 4.60517152709961, + "test_acc": 0.01, + "lyapunov": 2.719036699865785, + "grad_norm": 0.12621463018935974, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005833843733580507, + "time_sec": 210.0219807624817 + }, + { + "epoch": 68, + "train_loss": 6.979004976806641, + "train_acc": 0.0089, + "test_loss": 4.6051711723327635, + "test_acc": 0.01, + "lyapunov": 2.7127806817174265, + "grad_norm": 0.0898257720991778, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005730415142812054, + "time_sec": 209.98719429969788 + }, + { + "epoch": 69, + "train_loss": 7.030236116638184, + "train_acc": 0.0085, + "test_loss": 4.605171342468262, + "test_acc": 0.01, + "lyapunov": 2.7335510912453733, + "grad_norm": 0.16033156081316657, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821517, + "time_sec": 210.08958458900452 + }, + { + "epoch": 70, + "train_loss": 7.039960643615722, + "train_acc": 0.00892, + "test_loss": 4.6051711669921875, + "test_acc": 0.01, + "lyapunov": 2.739665296681397, + "grad_norm": 0.22271149603025697, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005522642316338265, + "time_sec": 210.03332662582397 + }, + { + "epoch": 71, + "train_loss": 6.994076708221436, + "train_acc": 0.0088, + "test_loss": 4.605171272277832, + "test_acc": 0.01, + "lyapunov": 2.720922397530597, + "grad_norm": 0.1379622518868338, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005418389216661573, + "time_sec": 210.08726000785828 + }, + { + "epoch": 72, + "train_loss": 7.031296715240479, + "train_acc": 0.0093, + "test_loss": 4.605170808410644, + "test_acc": 0.01, + "lyapunov": 2.7340313668751044, + "grad_norm": 0.15171246429702803, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646563, + "time_sec": 209.98722290992737 + }, + { + "epoch": 73, + "train_loss": 7.004211445465088, + "train_acc": 0.00854, + "test_loss": 4.605171342468262, + "test_acc": 0.01, + "lyapunov": 2.723038975844908, + "grad_norm": 0.13946310624469108, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005209378268645994, + "time_sec": 210.0228340625763 + }, + { + "epoch": 74, + "train_loss": 7.004648984680176, + "train_acc": 0.00784, + "test_loss": 4.605171240234375, + "test_acc": 0.01, + "lyapunov": 2.7241133033771954, + "grad_norm": 0.14177753146701746, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005104712099416781, + "time_sec": 210.09978771209717 + }, + { + "epoch": 75, + "train_loss": 7.037411134338379, + "train_acc": 0.00828, + "test_loss": 4.605171034240723, + "test_acc": 0.01, + "lyapunov": 2.7407932879065005, + "grad_norm": 0.3048803615675911, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004999999999999996, + "time_sec": 209.95723867416382 + }, + { + "epoch": 76, + "train_loss": 7.073835411071777, + "train_acc": 0.00852, + "test_loss": 4.605171124267578, + "test_acc": 0.01, + "lyapunov": 2.7557388784940287, + "grad_norm": 0.3366831366752972, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004895287900583212, + "time_sec": 210.0526421070099 + }, + { + "epoch": 77, + "train_loss": 7.069385101013183, + "train_acc": 0.00882, + "test_loss": 4.605171006011963, + "test_acc": 0.01, + "lyapunov": 2.7532967996719244, + "grad_norm": 0.3023678187768571, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004790621731353997, + "time_sec": 210.00937223434448 + }, + { + "epoch": 78, + "train_loss": 7.039409867553711, + "train_acc": 0.00918, + "test_loss": 4.605171101379394, + "test_acc": 0.01, + "lyapunov": 2.7399997028243512, + "grad_norm": 0.2334340472843992, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000468604740235343, + "time_sec": 209.98830223083496 + }, + { + "epoch": 79, + "train_loss": 7.060353764648437, + "train_acc": 0.0089, + "test_loss": 4.605171464538574, + "test_acc": 0.01, + "lyapunov": 2.7474362892872843, + "grad_norm": 0.24607577443282014, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00045816107833384175, + "time_sec": 209.9931514263153 + }, + { + "epoch": 80, + "train_loss": 6.994573851013183, + "train_acc": 0.00838, + "test_loss": 4.605170816040039, + "test_acc": 0.01, + "lyapunov": 2.7213273816706276, + "grad_norm": 0.13316471216665574, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004477357683661729, + "time_sec": 210.0208034515381 + }, + { + "epoch": 81, + "train_loss": 6.987541461791992, + "train_acc": 0.00882, + "test_loss": 4.605170903778077, + "test_acc": 0.01, + "lyapunov": 2.7174221109551238, + "grad_norm": 0.103648369821384, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784746, + "time_sec": 209.98763418197632 + }, + { + "epoch": 82, + "train_loss": 7.037619709472656, + "train_acc": 0.009, + "test_loss": 4.60517109298706, + "test_acc": 0.01, + "lyapunov": 2.740689567897631, + "grad_norm": 0.2931576105004017, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004269584857187939, + "time_sec": 209.9937252998352 + }, + { + "epoch": 83, + "train_loss": 6.985121826171875, + "train_acc": 0.00916, + "test_loss": 4.605170684051513, + "test_acc": 0.01, + "lyapunov": 2.7163276074792417, + "grad_norm": 0.1492971550466505, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004166156266419484, + "time_sec": 209.95198678970337 + }, + { + "epoch": 84, + "train_loss": 7.066727964477539, + "train_acc": 0.00896, + "test_loss": 4.605170683288574, + "test_acc": 0.01, + "lyapunov": 2.7504812116208286, + "grad_norm": 0.2866450325163035, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004063093427071373, + "time_sec": 210.01719284057617 + }, + { + "epoch": 85, + "train_loss": 6.989573917999268, + "train_acc": 0.00868, + "test_loss": 4.605171029663086, + "test_acc": 0.01, + "lyapunov": 2.718881234488524, + "grad_norm": 0.17966945444038818, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003960441545911199, + "time_sec": 209.97075200080872 + }, + { + "epoch": 86, + "train_loss": 7.024203224792481, + "train_acc": 0.009, + "test_loss": 4.60517100982666, + "test_acc": 0.01, + "lyapunov": 2.7339598565455288, + "grad_norm": 0.22243544874027923, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003858245649446718, + "time_sec": 210.22112345695496 + }, + { + "epoch": 87, + "train_loss": 6.999354568481445, + "train_acc": 0.0089, + "test_loss": 4.605170932006836, + "test_acc": 0.01, + "lyapunov": 2.723075409984345, + "grad_norm": 0.18428974005449253, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00037565505641757235, + "time_sec": 210.0000035762787 + }, + { + "epoch": 88, + "train_loss": 6.986679251861572, + "train_acc": 0.0085, + "test_loss": 4.605170610046387, + "test_acc": 0.01, + "lyapunov": 2.7169672826976727, + "grad_norm": 0.12620646621233791, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036554008969236695, + "time_sec": 209.9843943119049 + }, + { + "epoch": 89, + "train_loss": 7.011478589172364, + "train_acc": 0.00836, + "test_loss": 4.605170822143554, + "test_acc": 0.01, + "lyapunov": 2.7271931854355365, + "grad_norm": 0.15417699872251808, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003554841015277638, + "time_sec": 209.97113156318665 + }, + { + "epoch": 90, + "train_loss": 7.101416894836426, + "train_acc": 0.00908, + "test_loss": 4.605170645141602, + "test_acc": 0.01, + "lyapunov": 2.7632448941545413, + "grad_norm": 0.31835714546200394, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000345491502812526, + "time_sec": 209.9718475341797 + }, + { + "epoch": 91, + "train_loss": 7.0410906286621096, + "train_acc": 0.00862, + "test_loss": 4.605170471191406, + "test_acc": 0.01, + "lyapunov": 2.7411284916236274, + "grad_norm": 0.3464519876405528, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003355666766307081, + "time_sec": 209.98472666740417 + }, + { + "epoch": 92, + "train_loss": 7.078473837890625, + "train_acc": 0.00868, + "test_loss": 4.605170490264893, + "test_acc": 0.01, + "lyapunov": 2.756490916547263, + "grad_norm": 0.3699213952956702, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00032571397633909225, + "time_sec": 209.99044036865234 + }, + { + "epoch": 93, + "train_loss": 6.9829315435791015, + "train_acc": 0.00898, + "test_loss": 4.605170346069336, + "test_acc": 0.01, + "lyapunov": 2.71514059576537, + "grad_norm": 0.0883076892297495, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766094, + "time_sec": 209.9776222705841 + }, + { + "epoch": 94, + "train_loss": 6.9855348080444335, + "train_acc": 0.00822, + "test_loss": 4.605170868682861, + "test_acc": 0.01, + "lyapunov": 2.7164944638986417, + "grad_norm": 0.1479238762597201, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003062422067739483, + "time_sec": 210.00643134117126 + }, + { + "epoch": 95, + "train_loss": 6.9874295346069335, + "train_acc": 0.00856, + "test_loss": 4.605170775604248, + "test_acc": 0.01, + "lyapunov": 2.7169240917391178, + "grad_norm": 0.15626938065528906, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00029663167846209965, + "time_sec": 209.99916791915894 + }, + { + "epoch": 96, + "train_loss": 6.983181795043945, + "train_acc": 0.00818, + "test_loss": 4.605170436096191, + "test_acc": 0.01, + "lyapunov": 2.7151255619800305, + "grad_norm": 0.12016550567041384, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00028711035421746345, + "time_sec": 210.07179808616638 + }, + { + "epoch": 97, + "train_loss": 6.9956132180786135, + "train_acc": 0.0088, + "test_loss": 4.6051704200744625, + "test_acc": 0.01, + "lyapunov": 2.7203723811127647, + "grad_norm": 0.14197786423069308, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00027768241040753615, + "time_sec": 209.9841606616974 + }, + { + "epoch": 98, + "train_loss": 6.9846799612426755, + "train_acc": 0.00844, + "test_loss": 4.605170723724365, + "test_acc": 0.01, + "lyapunov": 2.715931734465577, + "grad_norm": 0.1266081420314572, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00026835198244006903, + "time_sec": 209.96538734436035 + }, + { + "epoch": 99, + "train_loss": 7.002227352294922, + "train_acc": 0.0088, + "test_loss": 4.605170701599121, + "test_acc": 0.01, + "lyapunov": 2.7254832943382166, + "grad_norm": 0.30098740432801424, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002591231629491421, + "time_sec": 209.96611714363098 + }, + { + "epoch": 100, + "train_loss": 7.031358368072509, + "train_acc": 0.0084, + "test_loss": 4.605170401763916, + "test_acc": 0.01, + "lyapunov": 2.734792661179057, + "grad_norm": 0.22052159160290236, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002499999999999997, + "time_sec": 209.99191045761108 + }, + { + "epoch": 101, + "train_loss": 7.02535282836914, + "train_acc": 0.0089, + "test_loss": 4.605170426940918, + "test_acc": 0.01, + "lyapunov": 2.732613311094396, + "grad_norm": 0.1884414449751891, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00024098649531343477, + "time_sec": 209.96369862556458 + }, + { + "epoch": 102, + "train_loss": 6.979629467163086, + "train_acc": 0.00892, + "test_loss": 4.605170404052735, + "test_acc": 0.01, + "lyapunov": 2.713197677031807, + "grad_norm": 0.11445011044498424, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002320866025105016, + "time_sec": 209.94372940063477 + }, + { + "epoch": 103, + "train_loss": 6.992681996459961, + "train_acc": 0.00866, + "test_loss": 4.605170614624023, + "test_acc": 0.01, + "lyapunov": 2.7198261897582228, + "grad_norm": 0.11698623871801088, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002233042253783278, + "time_sec": 209.9833948612213 + }, + { + "epoch": 104, + "train_loss": 6.981217978515625, + "train_acc": 0.00812, + "test_loss": 4.605170754241944, + "test_acc": 0.01, + "lyapunov": 2.7141413487436825, + "grad_norm": 0.08755411353395318, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000214643216157784, + "time_sec": 210.01173162460327 + }, + { + "epoch": 105, + "train_loss": 6.981228657531738, + "train_acc": 0.00804, + "test_loss": 4.605170397949219, + "test_acc": 0.01, + "lyapunov": 2.7141372974571363, + "grad_norm": 0.09294871100024936, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376332, + "time_sec": 209.94330191612244 + }, + { + "epoch": 106, + "train_loss": 7.012609109344482, + "train_acc": 0.0086, + "test_loss": 4.605170350646973, + "test_acc": 0.01, + "lyapunov": 2.7288797901719426, + "grad_norm": 0.20993573311720926, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019770044256881242, + "time_sec": 210.00956416130066 + }, + { + "epoch": 107, + "train_loss": 7.00075564453125, + "train_acc": 0.00862, + "test_loss": 4.60517020111084, + "test_acc": 0.01, + "lyapunov": 2.7233152907827627, + "grad_norm": 0.15372921012205631, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001894261098608447, + "time_sec": 210.00604104995728 + }, + { + "epoch": 108, + "train_loss": 7.0513025799560545, + "train_acc": 0.00884, + "test_loss": 4.605170352172852, + "test_acc": 0.01, + "lyapunov": 2.7449967105065465, + "grad_norm": 0.27576954124117053, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000181288005125655, + "time_sec": 209.93969535827637 + }, + { + "epoch": 109, + "train_loss": 6.980083810424805, + "train_acc": 0.00836, + "test_loss": 4.605170263671875, + "test_acc": 0.01, + "lyapunov": 2.713495020366386, + "grad_norm": 0.08939231438623309, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001732896980049473, + "time_sec": 209.99505877494812 + }, + { + "epoch": 110, + "train_loss": 6.984004687805176, + "train_acc": 0.00854, + "test_loss": 4.60517056350708, + "test_acc": 0.01, + "lyapunov": 2.715787248538278, + "grad_norm": 0.09252734679044972, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016543469682057076, + "time_sec": 209.9858946800232 + }, + { + "epoch": 111, + "train_loss": 6.983103836517334, + "train_acc": 0.00846, + "test_loss": 4.6051701759338375, + "test_acc": 0.01, + "lyapunov": 2.715198960145721, + "grad_norm": 0.12412466148890375, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 209.98376154899597 + }, + { + "epoch": 112, + "train_loss": 7.001786309051513, + "train_acc": 0.00842, + "test_loss": 4.605170098876953, + "test_acc": 0.01, + "lyapunov": 2.7237192645402213, + "grad_norm": 0.2611435951973152, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 210.04836750030518 + }, + { + "epoch": 113, + "train_loss": 6.985844685974121, + "train_acc": 0.0083, + "test_loss": 4.605170079040527, + "test_acc": 0.01, + "lyapunov": 2.716268786993783, + "grad_norm": 0.12269496905075315, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 210.01298427581787 + }, + { + "epoch": 114, + "train_loss": 6.982051696472168, + "train_acc": 0.0086, + "test_loss": 4.605170341491699, + "test_acc": 0.01, + "lyapunov": 2.7146723093584066, + "grad_norm": 0.10102267353118359, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00013551568628929425, + "time_sec": 209.98340034484863 + }, + { + "epoch": 115, + "train_loss": 6.97831426361084, + "train_acc": 0.00934, + "test_loss": 4.60517028503418, + "test_acc": 0.01, + "lyapunov": 2.7124323881495638, + "grad_norm": 0.0910994755377039, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 209.99640536308289 + }, + { + "epoch": 116, + "train_loss": 6.9820148625183105, + "train_acc": 0.00932, + "test_loss": 4.605170400238037, + "test_acc": 0.01, + "lyapunov": 2.7146591920681926, + "grad_norm": 0.10075615501603827, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 209.9244248867035 + }, + { + "epoch": 117, + "train_loss": 6.9843703225708005, + "train_acc": 0.00914, + "test_loss": 4.605170434570312, + "test_acc": 0.01, + "lyapunov": 2.715647294393281, + "grad_norm": 0.11228216953551147, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 209.9830358028412 + }, + { + "epoch": 118, + "train_loss": 7.017746971740722, + "train_acc": 0.00848, + "test_loss": 4.605170096588135, + "test_acc": 0.01, + "lyapunov": 2.7295747071580814, + "grad_norm": 0.20995938315988794, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010815327133708009, + "time_sec": 209.98030400276184 + }, + { + "epoch": 119, + "train_loss": 6.992286892089844, + "train_acc": 0.00848, + "test_loss": 4.605170076751709, + "test_acc": 0.01, + "lyapunov": 2.7198437071212416, + "grad_norm": 0.13966024517159772, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010173504098790182, + "time_sec": 209.8962001800537 + }, + { + "epoch": 120, + "train_loss": 6.988741851654053, + "train_acc": 0.00882, + "test_loss": 4.605170139312744, + "test_acc": 0.01, + "lyapunov": 2.7180907177498272, + "grad_norm": 0.16074749971185626, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 210.00037145614624 + }, + { + "epoch": 121, + "train_loss": 6.9938799935913085, + "train_acc": 0.00866, + "test_loss": 4.605170372772217, + "test_acc": 0.01, + "lyapunov": 2.7198036820687297, + "grad_norm": 0.15994838954410112, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 210.0474226474762 + }, + { + "epoch": 122, + "train_loss": 7.0039596870422365, + "train_acc": 0.00892, + "test_loss": 4.6051700347900395, + "test_acc": 0.01, + "lyapunov": 2.7259010494212665, + "grad_norm": 0.09437754111929303, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 210.04152083396912 + }, + { + "epoch": 123, + "train_loss": 7.009052494049072, + "train_acc": 0.00872, + "test_loss": 4.605170434570312, + "test_acc": 0.01, + "lyapunov": 2.72874392755806, + "grad_norm": 0.10432489602660702, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 210.2749161720276 + }, + { + "epoch": 124, + "train_loss": 7.074693834838867, + "train_acc": 0.0093, + "test_loss": 4.605170128631592, + "test_acc": 0.01, + "lyapunov": 2.758679599103415, + "grad_norm": 0.22022455692760384, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 210.06590056419373 + }, + { + "epoch": 125, + "train_loss": 6.982606186523437, + "train_acc": 0.00892, + "test_loss": 4.605170491027832, + "test_acc": 0.01, + "lyapunov": 2.7148781255687897, + "grad_norm": 0.08823763166065995, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 210.01559233665466 + }, + { + "epoch": 126, + "train_loss": 6.982140954437256, + "train_acc": 0.0086, + "test_loss": 4.605170350646973, + "test_acc": 0.01, + "lyapunov": 2.7147414952592777, + "grad_norm": 0.10255408158855737, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 210.03672337532043 + }, + { + "epoch": 127, + "train_loss": 6.979871159973144, + "train_acc": 0.00872, + "test_loss": 4.605170230102539, + "test_acc": 0.01, + "lyapunov": 2.71336467369743, + "grad_norm": 0.08818157608440398, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 210.00639820098877 + }, + { + "epoch": 128, + "train_loss": 6.985049297180176, + "train_acc": 0.00864, + "test_loss": 4.605170027160645, + "test_acc": 0.01, + "lyapunov": 2.716455806551687, + "grad_norm": 0.08762261938563776, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 209.97323060035706 + }, + { + "epoch": 129, + "train_loss": 6.985287237243653, + "train_acc": 0.00956, + "test_loss": 4.605170120239258, + "test_acc": 0.01, + "lyapunov": 2.7165556063737406, + "grad_norm": 0.08764461237151443, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 210.0408091545105 + }, + { + "epoch": 130, + "train_loss": 7.065185516815186, + "train_acc": 0.00922, + "test_loss": 4.605170118713379, + "test_acc": 0.01, + "lyapunov": 2.756326196138816, + "grad_norm": 0.2237427649903656, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 210.05785131454468 + }, + { + "epoch": 131, + "train_loss": 7.003630043640137, + "train_acc": 0.00874, + "test_loss": 4.605170425415039, + "test_acc": 0.01, + "lyapunov": 2.7251280341916684, + "grad_norm": 0.11404915316549034, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 210.06771302223206 + }, + { + "epoch": 132, + "train_loss": 7.016419371795655, + "train_acc": 0.00874, + "test_loss": 4.605170411682129, + "test_acc": 0.01, + "lyapunov": 2.732408604048707, + "grad_norm": 0.09643363295807468, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 210.00194883346558 + }, + { + "epoch": 133, + "train_loss": 7.027043022460938, + "train_acc": 0.00868, + "test_loss": 4.605170454406738, + "test_acc": 0.01, + "lyapunov": 2.7380632366365787, + "grad_norm": 0.08968045213589285, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 210.257652759552 + }, + { + "epoch": 134, + "train_loss": 7.035782067260742, + "train_acc": 0.00788, + "test_loss": 4.605170135498047, + "test_acc": 0.01, + "lyapunov": 2.743028284033851, + "grad_norm": 0.09341294223256699, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 209.9916913509369 + }, + { + "epoch": 135, + "train_loss": 7.071151198425293, + "train_acc": 0.0096, + "test_loss": 4.605170458984375, + "test_acc": 0.01, + "lyapunov": 2.760085921153388, + "grad_norm": 0.09297571487706319, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 210.2266161441803 + }, + { + "epoch": 136, + "train_loss": 7.034707638702392, + "train_acc": 0.00916, + "test_loss": 4.605170063018798, + "test_acc": 0.01, + "lyapunov": 2.742517843880617, + "grad_norm": 0.08845657511108296, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 210.06171536445618 + }, + { + "epoch": 137, + "train_loss": 7.0274613586425785, + "train_acc": 0.00888, + "test_loss": 4.605170385742188, + "test_acc": 0.01, + "lyapunov": 2.7373946475250945, + "grad_norm": 0.10398852016478509, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 209.9369614124298 + }, + { + "epoch": 138, + "train_loss": 7.025472250366211, + "train_acc": 0.0095, + "test_loss": 4.605170440673828, + "test_acc": 0.01, + "lyapunov": 2.736402528670133, + "grad_norm": 0.09038559548514402, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 210.0793435573578 + }, + { + "epoch": 139, + "train_loss": 7.014701705322266, + "train_acc": 0.00924, + "test_loss": 4.605170342254639, + "test_acc": 0.01, + "lyapunov": 2.7315333481030084, + "grad_norm": 0.10172944851300819, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 210.09445595741272 + }, + { + "epoch": 140, + "train_loss": 7.003781777954101, + "train_acc": 0.00918, + "test_loss": 4.605170393371582, + "test_acc": 0.01, + "lyapunov": 2.7260687607328604, + "grad_norm": 0.08766437036057895, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 210.07793593406677 + }, + { + "epoch": 141, + "train_loss": 7.056627904968262, + "train_acc": 0.01, + "test_loss": 4.60516996383667, + "test_acc": 0.01, + "lyapunov": 2.7532575478029373, + "grad_norm": 0.09441259373264534, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 210.04277729988098 + }, + { + "epoch": 142, + "train_loss": 6.989320599212647, + "train_acc": 0.00982, + "test_loss": 4.605170464324951, + "test_acc": 0.01, + "lyapunov": 2.718763675836041, + "grad_norm": 0.08778246721140825, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 210.0390853881836 + }, + { + "epoch": 143, + "train_loss": 7.0194689248657225, + "train_acc": 0.01, + "test_loss": 4.605170278930664, + "test_acc": 0.01, + "lyapunov": 2.7337976069096714, + "grad_norm": 0.088168048948687, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 210.09060406684875 + }, + { + "epoch": 144, + "train_loss": 6.989500450592041, + "train_acc": 0.01, + "test_loss": 4.605170496368408, + "test_acc": 0.01, + "lyapunov": 2.71841098280514, + "grad_norm": 0.08876604826979184, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 210.08678889274597 + }, + { + "epoch": 145, + "train_loss": 6.977725113220215, + "train_acc": 0.01, + "test_loss": 4.605170376586914, + "test_acc": 0.01, + "lyapunov": 2.712189649986794, + "grad_norm": 0.08740841232989421, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 210.07671403884888 + }, + { + "epoch": 146, + "train_loss": 7.063753978881836, + "train_acc": 0.01, + "test_loss": 4.605170356750488, + "test_acc": 0.01, + "lyapunov": 2.7562683031077273, + "grad_norm": 0.08829447012972118, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 210.06147265434265 + }, + { + "epoch": 147, + "train_loss": 6.97903392501831, + "train_acc": 0.01, + "test_loss": 4.605170056915283, + "test_acc": 0.01, + "lyapunov": 2.712921044405769, + "grad_norm": 0.08792833595670006, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 210.12889552116394 + }, + { + "epoch": 148, + "train_loss": 7.024583773956299, + "train_acc": 0.01, + "test_loss": 4.605170234680176, + "test_acc": 0.01, + "lyapunov": 2.736283694386787, + "grad_norm": 0.08841220675764232, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 210.09635305404663 + }, + { + "epoch": 149, + "train_loss": 6.9777571395874025, + "train_acc": 0.01, + "test_loss": 4.605170068359375, + "test_acc": 0.01, + "lyapunov": 2.7121838078169564, + "grad_norm": 0.08769792454661404, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 210.0731065273285 + }, + { + "epoch": 150, + "train_loss": 6.9812114135742185, + "train_acc": 0.01, + "test_loss": 4.605170178985595, + "test_acc": 0.01, + "lyapunov": 2.71422858494322, + "grad_norm": 0.08799513594752054, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 210.09806776046753 + } + ] + } +}
\ No newline at end of file |
