diff options
| author | YurenHao0426 <blackhao0426@gmail.com> | 2026-01-13 23:49:05 -0600 |
|---|---|---|
| committer | YurenHao0426 <blackhao0426@gmail.com> | 2026-01-13 23:49:05 -0600 |
| commit | cd99d6b874d9d09b3bb87b8485cc787885af71f1 (patch) | |
| tree | 59a233959932ca0e4f12f196275e07fcf443b33f /runs/depth_scaling | |
init commit
Diffstat (limited to 'runs/depth_scaling')
| -rw-r--r-- | runs/depth_scaling/cifar100_20251230-213033/config.json | 21 | ||||
| -rw-r--r-- | runs/depth_scaling/cifar100_20251230-213033/results.json | 21026 | ||||
| -rw-r--r-- | runs/depth_scaling/cifar10_20251229-160504/config.json | 20 | ||||
| -rw-r--r-- | runs/depth_scaling/cifar10_20251229-160504/results.json | 11222 |
4 files changed, 32289 insertions, 0 deletions
diff --git a/runs/depth_scaling/cifar100_20251230-213033/config.json b/runs/depth_scaling/cifar100_20251230-213033/config.json new file mode 100644 index 0000000..1ccfe37 --- /dev/null +++ b/runs/depth_scaling/cifar100_20251230-213033/config.json @@ -0,0 +1,21 @@ +{ + "dataset": "cifar100", + "depths": [ + 4, + 8, + 12, + 16, + 20 + ], + "T": 4, + "epochs": 150, + "batch_size": 128, + "lr": 0.001, + "lambda_reg": 0.3, + "lambda_target": -0.1, + "data_dir": "./data", + "out_dir": "runs/depth_scaling", + "device": "cuda", + "seed": 42, + "no_progress": false +}
\ No newline at end of file diff --git a/runs/depth_scaling/cifar100_20251230-213033/results.json b/runs/depth_scaling/cifar100_20251230-213033/results.json new file mode 100644 index 0000000..160dc74 --- /dev/null +++ b/runs/depth_scaling/cifar100_20251230-213033/results.json @@ -0,0 +1,21026 @@ +{ + "vanilla": { + "4": [ + { + "epoch": 1, + "train_loss": 4.346117241363525, + "train_acc": 0.09834, + "test_loss": 3.550243005371094, + "test_acc": 0.1705, + "lyapunov": null, + "grad_norm": 6.371099905681965, + "grad_max_sv": 5.004546135663986, + "grad_min_sv": 1.1479638856171093e-07, + "grad_condition": 101906528.03771546, + "lr": 0.0009998903417374227, + "time_sec": 16.05687952041626 + }, + { + "epoch": 2, + "train_loss": 3.5102988652038576, + "train_acc": 0.18534, + "test_loss": 3.5716390384674073, + "test_acc": 0.2002, + "lyapunov": null, + "grad_norm": 4.572810771811442, + "grad_max_sv": 3.3247465908527376, + "grad_min_sv": 8.398422393085526e-08, + "grad_condition": 76227232.13894418, + "lr": 0.0009995614150494292, + "time_sec": 15.448272466659546 + }, + { + "epoch": 3, + "train_loss": 3.054396768722534, + "train_acc": 0.25274, + "test_loss": 2.993664514160156, + "test_acc": 0.2763, + "lyapunov": null, + "grad_norm": 3.5860981037463016, + "grad_max_sv": 2.402756503224373, + "grad_min_sv": 6.775348947440918e-08, + "grad_condition": 42769838.6817436, + "lr": 0.0009990133642141358, + "time_sec": 15.465861558914185 + }, + { + "epoch": 4, + "train_loss": 2.722675824432373, + "train_acc": 0.3136, + "test_loss": 2.728995104598999, + "test_acc": 0.3281, + "lyapunov": null, + "grad_norm": 2.9852975671602957, + "grad_max_sv": 1.8682193964719773, + "grad_min_sv": 5.5938930086305014e-08, + "grad_condition": 328348281.0445617, + "lr": 0.0009982464296247522, + "time_sec": 15.43475079536438 + }, + { + "epoch": 5, + "train_loss": 2.508175393676758, + "train_acc": 0.3569, + "test_loss": 3.419650896835327, + "test_acc": 0.2461, + "lyapunov": null, + "grad_norm": 2.6358092556880783, + "grad_max_sv": 1.6064732760190963, + "grad_min_sv": 4.9754905795396096e-08, + "grad_condition": 44385388.81342572, + "lr": 0.0009972609476841367, + "time_sec": 15.444115400314331 + }, + { + "epoch": 6, + "train_loss": 2.3319723847961424, + "train_acc": 0.39276, + "test_loss": 2.5260577701568603, + "test_acc": 0.373, + "lyapunov": null, + "grad_norm": 2.4120452283895926, + "grad_max_sv": 1.3716692090034486, + "grad_min_sv": 4.6226219474476696e-08, + "grad_condition": 36175494.06179842, + "lr": 0.000996057350657239, + "time_sec": 15.43784475326538 + }, + { + "epoch": 7, + "train_loss": 2.190326895675659, + "train_acc": 0.42378, + "test_loss": 2.579724459838867, + "test_acc": 0.3695, + "lyapunov": null, + "grad_norm": 2.2437900964501787, + "grad_max_sv": 1.2385427325963974, + "grad_min_sv": 4.28970178392718e-08, + "grad_condition": 190661418.56414273, + "lr": 0.000994636166481494, + "time_sec": 15.455140829086304 + }, + { + "epoch": 8, + "train_loss": 2.070303360748291, + "train_acc": 0.44962, + "test_loss": 2.7414955226898194, + "test_acc": 0.3392, + "lyapunov": null, + "grad_norm": 2.0940271772848607, + "grad_max_sv": 1.1511073380708694, + "grad_min_sv": 4.056795894439441e-08, + "grad_condition": 707337590.06387, + "lr": 0.0009929980185352525, + "time_sec": 15.463218450546265 + }, + { + "epoch": 9, + "train_loss": 1.9642453713607788, + "train_acc": 0.47356, + "test_loss": 2.222684016609192, + "test_acc": 0.4312, + "lyapunov": null, + "grad_norm": 1.964494515952547, + "grad_max_sv": 1.0273158520460128, + "grad_min_sv": 3.78966669392633e-08, + "grad_condition": 428475326.2676049, + "lr": 0.0009911436253643444, + "time_sec": 15.443583011627197 + }, + { + "epoch": 10, + "train_loss": 1.8679190033721924, + "train_acc": 0.49384, + "test_loss": 2.2569959682464598, + "test_acc": 0.4227, + "lyapunov": null, + "grad_norm": 1.863426925292341, + "grad_max_sv": 0.9406855523586273, + "grad_min_sv": 3.563859525823609e-08, + "grad_condition": 44606817.73724544, + "lr": 0.0009890738003669028, + "time_sec": 15.442885637283325 + }, + { + "epoch": 11, + "train_loss": 1.7814382321929931, + "train_acc": 0.51302, + "test_loss": 2.504388472366333, + "test_acc": 0.3946, + "lyapunov": null, + "grad_norm": 1.7723102238636992, + "grad_max_sv": 0.8945659548044205, + "grad_min_sv": 3.425328631706526e-08, + "grad_condition": 109308981.21335419, + "lr": 0.00098678945143658, + "time_sec": 15.459418535232544 + }, + { + "epoch": 12, + "train_loss": 1.7159840296936035, + "train_acc": 0.53146, + "test_loss": 2.508260029220581, + "test_acc": 0.3935, + "lyapunov": null, + "grad_norm": 1.686140929704303, + "grad_max_sv": 0.8295574262738228, + "grad_min_sv": 3.2012488864613386e-08, + "grad_condition": 89179142.85485055, + "lr": 0.0009842915805643154, + "time_sec": 15.439209461212158 + }, + { + "epoch": 13, + "train_loss": 1.6503846585845947, + "train_acc": 0.54474, + "test_loss": 2.1456974792480468, + "test_acc": 0.4502, + "lyapunov": null, + "grad_norm": 1.619802250264676, + "grad_max_sv": 0.7797225803136826, + "grad_min_sv": 3.0749212220730626e-08, + "grad_condition": 285444721.0869424, + "lr": 0.000981581283398829, + "time_sec": 15.433976173400879 + }, + { + "epoch": 14, + "train_loss": 1.5905582858276368, + "train_acc": 0.5585, + "test_loss": 2.3602350467681883, + "test_acc": 0.4172, + "lyapunov": null, + "grad_norm": 1.5586059487347217, + "grad_max_sv": 0.7570723682641983, + "grad_min_sv": 2.990113052159238e-08, + "grad_condition": 33337603.41083364, + "lr": 0.0009786597487660333, + "time_sec": 15.430689811706543 + }, + { + "epoch": 15, + "train_loss": 1.5257548734283448, + "train_acc": 0.57394, + "test_loss": 2.2596036737442016, + "test_acc": 0.4401, + "lyapunov": null, + "grad_norm": 1.494958992831554, + "grad_max_sv": 0.7011767938733101, + "grad_min_sv": 2.8093294829334425e-08, + "grad_condition": 215948380.66679326, + "lr": 0.0009755282581475766, + "time_sec": 15.445661544799805 + }, + { + "epoch": 16, + "train_loss": 1.4769169562911988, + "train_acc": 0.58454, + "test_loss": 2.1792555765151977, + "test_acc": 0.4464, + "lyapunov": null, + "grad_norm": 1.4433947117799557, + "grad_max_sv": 0.6677212715148926, + "grad_min_sv": 2.683760501054344e-08, + "grad_condition": 45818352.96134277, + "lr": 0.0009721881851187403, + "time_sec": 15.456706523895264 + }, + { + "epoch": 17, + "train_loss": 1.429377403755188, + "train_acc": 0.5973, + "test_loss": 1.954601181793213, + "test_acc": 0.4919, + "lyapunov": null, + "grad_norm": 1.402899746172417, + "grad_max_sv": 0.6569379523396492, + "grad_min_sv": 2.6772942612884876e-08, + "grad_condition": 33425629.606939513, + "lr": 0.0009686409947459456, + "time_sec": 15.437876462936401 + }, + { + "epoch": 18, + "train_loss": 1.3954533521652221, + "train_acc": 0.60348, + "test_loss": 2.0381541999816895, + "test_acc": 0.4877, + "lyapunov": null, + "grad_norm": 1.3646767773598742, + "grad_max_sv": 0.6277542792260646, + "grad_min_sv": 2.5360278501545055e-08, + "grad_condition": 1276893214.2885015, + "lr": 0.0009648882429441254, + "time_sec": 15.442293643951416 + }, + { + "epoch": 19, + "train_loss": 1.34601386013031, + "train_acc": 0.61788, + "test_loss": 2.016515805435181, + "test_acc": 0.4879, + "lyapunov": null, + "grad_norm": 1.3307426948998278, + "grad_max_sv": 0.6192222326993942, + "grad_min_sv": 2.5143750027184496e-08, + "grad_condition": 86894504.02450311, + "lr": 0.00096093157579425, + "time_sec": 15.452877044677734 + }, + { + "epoch": 20, + "train_loss": 1.3103528637313844, + "train_acc": 0.6263, + "test_loss": 1.9570331373214722, + "test_acc": 0.5034, + "lyapunov": null, + "grad_norm": 1.3019068672950393, + "grad_max_sv": 0.5866124749183654, + "grad_min_sv": 2.432551227254942e-08, + "grad_condition": 79675782.79073408, + "lr": 0.0009567727288213001, + "time_sec": 15.442177057266235 + }, + { + "epoch": 21, + "train_loss": 1.2698568128204346, + "train_acc": 0.6344, + "test_loss": 2.4308045747756957, + "test_acc": 0.4364, + "lyapunov": null, + "grad_norm": 1.268768380545349, + "grad_max_sv": 0.5797948583960533, + "grad_min_sv": 2.4104086050920348e-08, + "grad_condition": 252776511.74393004, + "lr": 0.0009524135262330095, + "time_sec": 15.434435844421387 + }, + { + "epoch": 22, + "train_loss": 1.2418579862976074, + "train_acc": 0.64312, + "test_loss": 2.0848071727752684, + "test_acc": 0.4867, + "lyapunov": null, + "grad_norm": 1.2415784803203374, + "grad_max_sv": 0.5592644922435284, + "grad_min_sv": 2.333180208254765e-08, + "grad_condition": 407593245.7962709, + "lr": 0.0009478558801197061, + "time_sec": 15.460945129394531 + }, + { + "epoch": 23, + "train_loss": 1.2006691330718995, + "train_acc": 0.65526, + "test_loss": 2.041600823402405, + "test_acc": 0.4981, + "lyapunov": null, + "grad_norm": 1.2102718857806654, + "grad_max_sv": 0.5479752145707607, + "grad_min_sv": 2.2646243507534748e-08, + "grad_condition": 185681115.951604, + "lr": 0.000943101789615607, + "time_sec": 15.44005274772644 + }, + { + "epoch": 24, + "train_loss": 1.172968614616394, + "train_acc": 0.66154, + "test_loss": 1.9552119861602784, + "test_acc": 0.513, + "lyapunov": null, + "grad_norm": 1.1987019399549284, + "grad_max_sv": 0.5312893047928811, + "grad_min_sv": 2.1980094488081857e-08, + "grad_condition": 1318897337.4819613, + "lr": 0.0009381533400219313, + "time_sec": 15.440562009811401 + }, + { + "epoch": 25, + "train_loss": 1.1449218238067627, + "train_acc": 0.6641, + "test_loss": 2.128752773284912, + "test_acc": 0.4906, + "lyapunov": null, + "grad_norm": 1.1778317272519585, + "grad_max_sv": 0.5174455069005489, + "grad_min_sv": 2.167262270237613e-08, + "grad_condition": 94067067.14088301, + "lr": 0.0009330127018922189, + "time_sec": 15.443851232528687 + }, + { + "epoch": 26, + "train_loss": 1.1113452094268799, + "train_acc": 0.67438, + "test_loss": 1.8866374584197998, + "test_acc": 0.5238, + "lyapunov": null, + "grad_norm": 1.1514970963524438, + "grad_max_sv": 0.5059572130441665, + "grad_min_sv": 2.105146406777836e-08, + "grad_condition": 50748348.81685668, + "lr": 0.000927682130080253, + "time_sec": 15.436878681182861 + }, + { + "epoch": 27, + "train_loss": 1.0829708759689332, + "train_acc": 0.68438, + "test_loss": 1.9943335615158082, + "test_acc": 0.5124, + "lyapunov": null, + "grad_norm": 1.1319771840855883, + "grad_max_sv": 0.4948433578014374, + "grad_min_sv": 2.0725160652934616e-08, + "grad_condition": 77507476.80554287, + "lr": 0.0009221639627510072, + "time_sec": 15.441301822662354 + }, + { + "epoch": 28, + "train_loss": 1.0513020403671265, + "train_acc": 0.6904, + "test_loss": 1.9359693916320801, + "test_acc": 0.5214, + "lyapunov": null, + "grad_norm": 1.1163749465170618, + "grad_max_sv": 0.48814368024468424, + "grad_min_sv": 2.0212865362197185e-08, + "grad_condition": 298941066.3217323, + "lr": 0.0009164606203550494, + "time_sec": 15.441382646560669 + }, + { + "epoch": 29, + "train_loss": 1.029607636756897, + "train_acc": 0.69482, + "test_loss": 1.8560630758285523, + "test_acc": 0.5431, + "lyapunov": null, + "grad_norm": 1.0928580221633342, + "grad_max_sv": 0.5047290526330471, + "grad_min_sv": 2.040681175013992e-08, + "grad_condition": 48855533.517919585, + "lr": 0.0009105746045668516, + "time_sec": 15.460914373397827 + }, + { + "epoch": 30, + "train_loss": 1.0061684103393556, + "train_acc": 0.70324, + "test_loss": 1.8417754476547241, + "test_acc": 0.5501, + "lyapunov": null, + "grad_norm": 1.0821004976322715, + "grad_max_sv": 0.4740450643002987, + "grad_min_sv": 1.9723761995882327e-08, + "grad_condition": 57054017.19113614, + "lr": 0.0009045084971874733, + "time_sec": 15.458839178085327 + }, + { + "epoch": 31, + "train_loss": 0.9935745064163208, + "train_acc": 0.70312, + "test_loss": 1.9427630338668824, + "test_acc": 0.522, + "lyapunov": null, + "grad_norm": 1.0722093249603526, + "grad_max_sv": 0.46733852848410606, + "grad_min_sv": 1.9939205435706707e-08, + "grad_condition": 112229781.98396464, + "lr": 0.0008982649590120977, + "time_sec": 15.452664375305176 + }, + { + "epoch": 32, + "train_loss": 0.9721898876953124, + "train_acc": 0.70988, + "test_loss": 1.9291723361968993, + "test_acc": 0.5365, + "lyapunov": null, + "grad_norm": 1.0493640798096933, + "grad_max_sv": 0.451675596088171, + "grad_min_sv": 1.9157993355872065e-08, + "grad_condition": 369697835.9253775, + "lr": 0.0008918467286629196, + "time_sec": 15.447975158691406 + }, + { + "epoch": 33, + "train_loss": 0.9359502591705322, + "train_acc": 0.71948, + "test_loss": 1.8434128448486329, + "test_acc": 0.544, + "lyapunov": null, + "grad_norm": 1.0350388755850537, + "grad_max_sv": 0.4494323328137398, + "grad_min_sv": 1.8973058482987804e-08, + "grad_condition": 171928795.69725567, + "lr": 0.0008852566213878943, + "time_sec": 15.466245889663696 + }, + { + "epoch": 34, + "train_loss": 0.9224456702995301, + "train_acc": 0.72168, + "test_loss": 1.9599631881713868, + "test_acc": 0.5373, + "lyapunov": null, + "grad_norm": 1.0242311025233581, + "grad_max_sv": 0.44513428434729574, + "grad_min_sv": 1.8523945613654545e-08, + "grad_condition": 888195654.0727282, + "lr": 0.000878497527825878, + "time_sec": 15.461785316467285 + }, + { + "epoch": 35, + "train_loss": 0.9021567019844056, + "train_acc": 0.72618, + "test_loss": 1.9999154584884644, + "test_acc": 0.5252, + "lyapunov": null, + "grad_norm": 1.0039865896001459, + "grad_max_sv": 0.43928237855434416, + "grad_min_sv": 1.8592035315456722e-08, + "grad_condition": 59743908.57133106, + "lr": 0.000871572412738697, + "time_sec": 15.456985473632812 + }, + { + "epoch": 36, + "train_loss": 0.873283097190857, + "train_acc": 0.73628, + "test_loss": 1.982330265045166, + "test_acc": 0.5279, + "lyapunov": null, + "grad_norm": 0.9875825554026111, + "grad_max_sv": 0.42813498005270956, + "grad_min_sv": 1.7983777930719037e-08, + "grad_condition": 38527409.79900636, + "lr": 0.0008644843137107055, + "time_sec": 15.460105419158936 + }, + { + "epoch": 37, + "train_loss": 0.855709279346466, + "train_acc": 0.74242, + "test_loss": 1.9136155584335328, + "test_acc": 0.5472, + "lyapunov": null, + "grad_norm": 0.9742310219337682, + "grad_max_sv": 0.4270216949284077, + "grad_min_sv": 1.8125810764824114e-08, + "grad_condition": 40840950.73216411, + "lr": 0.0008572363398164014, + "time_sec": 15.459755897521973 + }, + { + "epoch": 38, + "train_loss": 0.8404359550476074, + "train_acc": 0.74404, + "test_loss": 1.9389733367919921, + "test_acc": 0.543, + "lyapunov": null, + "grad_norm": 0.9722202503028375, + "grad_max_sv": 0.42485796511173246, + "grad_min_sv": 1.783134123689578e-08, + "grad_condition": 35194167.51271446, + "lr": 0.0008498316702566826, + "time_sec": 15.465211629867554 + }, + { + "epoch": 39, + "train_loss": 0.8240101078987122, + "train_acc": 0.7481, + "test_loss": 1.8307217979431152, + "test_acc": 0.5614, + "lyapunov": null, + "grad_norm": 0.9595502877351665, + "grad_max_sv": 0.42209447696805, + "grad_min_sv": 1.767885368514355e-08, + "grad_condition": 49656386.85866156, + "lr": 0.0008422735529643442, + "time_sec": 15.455949544906616 + }, + { + "epoch": 40, + "train_loss": 0.8046207006645203, + "train_acc": 0.75466, + "test_loss": 1.850761813545227, + "test_acc": 0.5635, + "lyapunov": null, + "grad_norm": 0.9479757240987767, + "grad_max_sv": 0.4134661167860031, + "grad_min_sv": 1.7007238412025672e-08, + "grad_condition": 126702887.42727256, + "lr": 0.0008345653031794289, + "time_sec": 15.462433099746704 + }, + { + "epoch": 41, + "train_loss": 0.7895244974899291, + "train_acc": 0.7586, + "test_loss": 1.8032215663909912, + "test_acc": 0.5672, + "lyapunov": null, + "grad_norm": 0.9378242670136524, + "grad_max_sv": 0.3964280657470226, + "grad_min_sv": 1.6944396442897246e-08, + "grad_condition": 56052359.18882908, + "lr": 0.0008267103019950526, + "time_sec": 15.461899757385254 + }, + { + "epoch": 42, + "train_loss": 0.7817759350585938, + "train_acc": 0.76056, + "test_loss": 1.8505826110839845, + "test_acc": 0.5582, + "lyapunov": null, + "grad_norm": 0.9337187835649021, + "grad_max_sv": 0.40529350489377974, + "grad_min_sv": 1.6676117367206422e-08, + "grad_condition": 104849301.5445062, + "lr": 0.0008187119948743447, + "time_sec": 15.4581778049469 + }, + { + "epoch": 43, + "train_loss": 0.7522177431297302, + "train_acc": 0.77, + "test_loss": 1.8242130517959594, + "test_acc": 0.5664, + "lyapunov": null, + "grad_norm": 0.9099555522847652, + "grad_max_sv": 0.3934644728899002, + "grad_min_sv": 1.6434511908997028e-08, + "grad_condition": 61342068.969211556, + "lr": 0.000810573890139155, + "time_sec": 15.447810411453247 + }, + { + "epoch": 44, + "train_loss": 0.7323650365447998, + "train_acc": 0.77464, + "test_loss": 1.8068662160873412, + "test_acc": 0.5687, + "lyapunov": null, + "grad_norm": 0.9037556138602378, + "grad_max_sv": 0.38610322400927544, + "grad_min_sv": 1.6304181772903992e-08, + "grad_condition": 167736758.90882486, + "lr": 0.0008022995574311873, + "time_sec": 15.458601951599121 + }, + { + "epoch": 45, + "train_loss": 0.7159886347198486, + "train_acc": 0.77928, + "test_loss": 1.8823264539718627, + "test_acc": 0.5645, + "lyapunov": null, + "grad_norm": 0.8924866037240323, + "grad_max_sv": 0.3947519548237324, + "grad_min_sv": 1.6336485028634052e-08, + "grad_condition": 69167052.26120928, + "lr": 0.0007938926261462363, + "time_sec": 15.471583843231201 + }, + { + "epoch": 46, + "train_loss": 0.7136952446365357, + "train_acc": 0.78054, + "test_loss": 1.7574677402496337, + "test_acc": 0.5825, + "lyapunov": null, + "grad_norm": 0.8931942393361509, + "grad_max_sv": 0.37973910570144653, + "grad_min_sv": 1.6153765381235476e-08, + "grad_condition": 489329276.9292526, + "lr": 0.0007853567838422158, + "time_sec": 15.471785068511963 + }, + { + "epoch": 47, + "train_loss": 0.6837898429489135, + "train_acc": 0.78762, + "test_loss": 1.813544430541992, + "test_acc": 0.5725, + "lyapunov": null, + "grad_norm": 0.8815821036419627, + "grad_max_sv": 0.3751175247132778, + "grad_min_sv": 1.5766544728818e-08, + "grad_condition": 56980767.9665909, + "lr": 0.0007766957746216719, + "time_sec": 15.457926750183105 + }, + { + "epoch": 48, + "train_loss": 0.6856673602676392, + "train_acc": 0.78888, + "test_loss": 1.990400904083252, + "test_acc": 0.5508, + "lyapunov": null, + "grad_norm": 0.8744462547536074, + "grad_max_sv": 0.3799706071615219, + "grad_min_sv": 1.6096928557272904e-08, + "grad_condition": 303945380.88277286, + "lr": 0.0007679133974894982, + "time_sec": 15.456810712814331 + }, + { + "epoch": 49, + "train_loss": 0.667086083278656, + "train_acc": 0.792, + "test_loss": 1.8513258657455445, + "test_acc": 0.5727, + "lyapunov": null, + "grad_norm": 0.8677773875250141, + "grad_max_sv": 0.3783408857882023, + "grad_min_sv": 1.5666924351245835e-08, + "grad_condition": 353923080.3313891, + "lr": 0.000759013504686565, + "time_sec": 15.462752342224121 + }, + { + "epoch": 50, + "train_loss": 0.6466483051490783, + "train_acc": 0.79742, + "test_loss": 2.043276873779297, + "test_acc": 0.5419, + "lyapunov": null, + "grad_norm": 0.8555816651124006, + "grad_max_sv": 0.3675771526992321, + "grad_min_sv": 1.5045219146090152e-08, + "grad_condition": 536508015.45004594, + "lr": 0.0007499999999999998, + "time_sec": 15.458629846572876 + }, + { + "epoch": 51, + "train_loss": 0.6258693974494934, + "train_acc": 0.80236, + "test_loss": 1.954080751991272, + "test_acc": 0.5622, + "lyapunov": null, + "grad_norm": 0.8469179426728266, + "grad_max_sv": 0.377849230915308, + "grad_min_sv": 1.5333696528480045e-08, + "grad_condition": 117912957.37628272, + "lr": 0.0007408768370508575, + "time_sec": 15.46766972541809 + }, + { + "epoch": 52, + "train_loss": 0.6236670018768311, + "train_acc": 0.80516, + "test_loss": 1.8472453788757324, + "test_acc": 0.5858, + "lyapunov": null, + "grad_norm": 0.8404179479578597, + "grad_max_sv": 0.3541756056249142, + "grad_min_sv": 1.5022051764665422e-08, + "grad_condition": 129884434.5908782, + "lr": 0.0007316480175599307, + "time_sec": 15.461432695388794 + }, + { + "epoch": 53, + "train_loss": 0.6075375831794739, + "train_acc": 0.80952, + "test_loss": 1.9628248615264892, + "test_acc": 0.5673, + "lyapunov": null, + "grad_norm": 0.8367502172326149, + "grad_max_sv": 0.3639704927802086, + "grad_min_sv": 1.532564684603166e-08, + "grad_condition": 35699441.49240203, + "lr": 0.0007223175895924635, + "time_sec": 15.46337342262268 + }, + { + "epoch": 54, + "train_loss": 0.5996641965866089, + "train_acc": 0.81216, + "test_loss": 1.8179010778427125, + "test_acc": 0.5843, + "lyapunov": null, + "grad_norm": 0.8307418709294171, + "grad_max_sv": 0.3613003775477409, + "grad_min_sv": 1.4895932505510321e-08, + "grad_condition": 875528249.2472179, + "lr": 0.0007128896457825361, + "time_sec": 15.465355396270752 + }, + { + "epoch": 55, + "train_loss": 0.5882498831176758, + "train_acc": 0.81494, + "test_loss": 1.8813747344970704, + "test_acc": 0.582, + "lyapunov": null, + "grad_norm": 0.8235931888813899, + "grad_max_sv": 0.3551651187241077, + "grad_min_sv": 1.469800572865415e-08, + "grad_condition": 484027587.3941019, + "lr": 0.0007033683215378998, + "time_sec": 15.460170984268188 + }, + { + "epoch": 56, + "train_loss": 0.5707145217132569, + "train_acc": 0.82072, + "test_loss": 1.840101174545288, + "test_acc": 0.5813, + "lyapunov": null, + "grad_norm": 0.8086603393569909, + "grad_max_sv": 0.34960880503058434, + "grad_min_sv": 1.4356627959719037e-08, + "grad_condition": 198153063.82803452, + "lr": 0.0006937577932260512, + "time_sec": 15.455865383148193 + }, + { + "epoch": 57, + "train_loss": 0.5646172902584076, + "train_acc": 0.82002, + "test_loss": 1.8341705081939697, + "test_acc": 0.5873, + "lyapunov": null, + "grad_norm": 0.810642435475112, + "grad_max_sv": 0.3562955237925053, + "grad_min_sv": 1.4607543052502087e-08, + "grad_condition": 226679350.92895135, + "lr": 0.0006840622763423388, + "time_sec": 15.474364757537842 + }, + { + "epoch": 58, + "train_loss": 0.5469015620231629, + "train_acc": 0.82858, + "test_loss": 1.9427689083099364, + "test_acc": 0.5739, + "lyapunov": null, + "grad_norm": 0.7944800992028263, + "grad_max_sv": 0.33950445652008054, + "grad_min_sv": 1.368517551399162e-08, + "grad_condition": 347795127.79131866, + "lr": 0.0006742860236609073, + "time_sec": 15.464811563491821 + }, + { + "epoch": 59, + "train_loss": 0.5445322315883636, + "train_acc": 0.82716, + "test_loss": 1.8801843715667725, + "test_acc": 0.5792, + "lyapunov": null, + "grad_norm": 0.7916664309528131, + "grad_max_sv": 0.3434500187635422, + "grad_min_sv": 1.4393026628520266e-08, + "grad_condition": 315625887.3364844, + "lr": 0.0006644333233692913, + "time_sec": 15.463439702987671 + }, + { + "epoch": 60, + "train_loss": 0.5323922993850708, + "train_acc": 0.8299, + "test_loss": 1.9002599145889283, + "test_acc": 0.5809, + "lyapunov": null, + "grad_norm": 0.7870533377985126, + "grad_max_sv": 0.34093547612428665, + "grad_min_sv": 1.4214920851518542e-08, + "grad_condition": 91722689.16411342, + "lr": 0.0006545084971874734, + "time_sec": 15.450496912002563 + }, + { + "epoch": 61, + "train_loss": 0.519907633266449, + "train_acc": 0.83526, + "test_loss": 1.9299441148757934, + "test_acc": 0.5794, + "lyapunov": null, + "grad_norm": 0.7766553414478388, + "grad_max_sv": 0.3247631438076496, + "grad_min_sv": 1.3660971805162792e-08, + "grad_condition": 158255223.31341702, + "lr": 0.0006445158984722354, + "time_sec": 15.486064910888672 + }, + { + "epoch": 62, + "train_loss": 0.5158719365882873, + "train_acc": 0.83688, + "test_loss": 1.8924803583145142, + "test_acc": 0.5838, + "lyapunov": null, + "grad_norm": 0.7769879212152438, + "grad_max_sv": 0.34014692306518557, + "grad_min_sv": 1.4163850685366964e-08, + "grad_condition": 69424987.38028774, + "lr": 0.0006344599103076324, + "time_sec": 15.469778776168823 + }, + { + "epoch": 63, + "train_loss": 0.5016013371658326, + "train_acc": 0.83886, + "test_loss": 1.9557724254608155, + "test_acc": 0.578, + "lyapunov": null, + "grad_norm": 0.7667097633814496, + "grad_max_sv": 0.3396275587379932, + "grad_min_sv": 1.3258012922148093e-08, + "grad_condition": 246523332.7028369, + "lr": 0.0006243449435824269, + "time_sec": 15.490433692932129 + }, + { + "epoch": 64, + "train_loss": 0.4887677048301697, + "train_acc": 0.84204, + "test_loss": 1.919124504852295, + "test_acc": 0.5841, + "lyapunov": null, + "grad_norm": 0.7573654062297513, + "grad_max_sv": 0.32946483269333837, + "grad_min_sv": 1.3579194014026741e-08, + "grad_condition": 122613286.93525049, + "lr": 0.0006141754350553275, + "time_sec": 15.473332166671753 + }, + { + "epoch": 65, + "train_loss": 0.4757623895263672, + "train_acc": 0.84768, + "test_loss": 1.9984818859100342, + "test_acc": 0.5761, + "lyapunov": null, + "grad_norm": 0.748014318960053, + "grad_max_sv": 0.33319817706942556, + "grad_min_sv": 1.3326467683972414e-08, + "grad_condition": 623990635.8236978, + "lr": 0.0006039558454088793, + "time_sec": 15.485574960708618 + }, + { + "epoch": 66, + "train_loss": 0.4649162304496765, + "train_acc": 0.85152, + "test_loss": 1.9724672309875488, + "test_acc": 0.576, + "lyapunov": null, + "grad_norm": 0.7417116384839675, + "grad_max_sv": 0.3309340290725231, + "grad_min_sv": 1.334454621318426e-08, + "grad_condition": 142248731.7186973, + "lr": 0.000593690657292862, + "time_sec": 15.480328559875488 + }, + { + "epoch": 67, + "train_loss": 0.4583131973075867, + "train_acc": 0.85314, + "test_loss": 1.911379218673706, + "test_acc": 0.5815, + "lyapunov": null, + "grad_norm": 0.737726746568229, + "grad_max_sv": 0.32083366960287096, + "grad_min_sv": 1.2965913287477093e-08, + "grad_condition": 78597953.03928533, + "lr": 0.0005833843733580507, + "time_sec": 15.469099283218384 + }, + { + "epoch": 68, + "train_loss": 0.44331007887840274, + "train_acc": 0.85794, + "test_loss": 1.9728064548492432, + "test_acc": 0.5854, + "lyapunov": null, + "grad_norm": 0.7274207800935486, + "grad_max_sv": 0.3188414238393307, + "grad_min_sv": 1.2804001882360528e-08, + "grad_condition": 55555678.95357393, + "lr": 0.0005730415142812054, + "time_sec": 15.481547117233276 + }, + { + "epoch": 69, + "train_loss": 0.43979987537384035, + "train_acc": 0.85974, + "test_loss": 1.919715219116211, + "test_acc": 0.5884, + "lyapunov": null, + "grad_norm": 0.7242391218539499, + "grad_max_sv": 0.3140024244785309, + "grad_min_sv": 1.275962300552845e-08, + "grad_condition": 326554514.7187793, + "lr": 0.0005626666167821517, + "time_sec": 15.48648977279663 + }, + { + "epoch": 70, + "train_loss": 0.4322844411468506, + "train_acc": 0.86176, + "test_loss": 2.0117150314331056, + "test_acc": 0.5834, + "lyapunov": null, + "grad_norm": 0.7186156540948507, + "grad_max_sv": 0.31351484879851343, + "grad_min_sv": 1.2888502469096674e-08, + "grad_condition": 178788272.1664782, + "lr": 0.0005522642316338265, + "time_sec": 15.48006272315979 + }, + { + "epoch": 71, + "train_loss": 0.42623882338523866, + "train_acc": 0.86272, + "test_loss": 1.9539510818481445, + "test_acc": 0.5875, + "lyapunov": null, + "grad_norm": 0.7137008149677833, + "grad_max_sv": 0.31342701613903046, + "grad_min_sv": 1.2595162532727522e-08, + "grad_condition": 302205097.8444015, + "lr": 0.0005418389216661573, + "time_sec": 15.492274284362793 + }, + { + "epoch": 72, + "train_loss": 0.41300243412017823, + "train_acc": 0.86584, + "test_loss": 1.9104324056625366, + "test_acc": 0.5874, + "lyapunov": null, + "grad_norm": 0.7058331032866322, + "grad_max_sv": 0.3122198607772589, + "grad_min_sv": 1.2484183565045215e-08, + "grad_condition": 249411647.9543108, + "lr": 0.0005313952597646563, + "time_sec": 15.472809076309204 + }, + { + "epoch": 73, + "train_loss": 0.4090885982322693, + "train_acc": 0.86766, + "test_loss": 1.9304109241485596, + "test_acc": 0.5896, + "lyapunov": null, + "grad_norm": 0.7030000923329225, + "grad_max_sv": 0.3075466021895409, + "grad_min_sv": 1.252222159744791e-08, + "grad_condition": 331808797.86113906, + "lr": 0.0005209378268645994, + "time_sec": 15.497188806533813 + }, + { + "epoch": 74, + "train_loss": 0.40033238063812254, + "train_acc": 0.87144, + "test_loss": 1.985810231399536, + "test_acc": 0.5849, + "lyapunov": null, + "grad_norm": 0.6995855816146154, + "grad_max_sv": 0.31191978715360164, + "grad_min_sv": 1.2527367021682167e-08, + "grad_condition": 263818262.83558512, + "lr": 0.0005104712099416781, + "time_sec": 15.483733892440796 + }, + { + "epoch": 75, + "train_loss": 0.39340143531799315, + "train_acc": 0.87318, + "test_loss": 1.9034859148025514, + "test_acc": 0.5988, + "lyapunov": null, + "grad_norm": 0.6917443264462005, + "grad_max_sv": 0.3097103513777256, + "grad_min_sv": 1.2234487580323195e-08, + "grad_condition": 189402494.46869463, + "lr": 0.0004999999999999996, + "time_sec": 15.491854667663574 + }, + { + "epoch": 76, + "train_loss": 0.38218573943138123, + "train_acc": 0.87562, + "test_loss": 1.9674748405456544, + "test_acc": 0.5897, + "lyapunov": null, + "grad_norm": 0.6848552863949536, + "grad_max_sv": 0.306015183404088, + "grad_min_sv": 1.2231246879906843e-08, + "grad_condition": 67368302.47465871, + "lr": 0.0004895287900583212, + "time_sec": 15.475126504898071 + }, + { + "epoch": 77, + "train_loss": 0.37298857500076293, + "train_acc": 0.8782, + "test_loss": 1.9116508392333984, + "test_acc": 0.5973, + "lyapunov": null, + "grad_norm": 0.676733354734531, + "grad_max_sv": 0.30364411063492297, + "grad_min_sv": 1.2298366306937036e-08, + "grad_condition": 113213891.7010752, + "lr": 0.0004790621731353997, + "time_sec": 15.476521015167236 + }, + { + "epoch": 78, + "train_loss": 0.3701143793487549, + "train_acc": 0.88078, + "test_loss": 2.085685297012329, + "test_acc": 0.5795, + "lyapunov": null, + "grad_norm": 0.6755741762416969, + "grad_max_sv": 0.30699342787265776, + "grad_min_sv": 1.205234841629107e-08, + "grad_condition": 3030668677.964108, + "lr": 0.000468604740235343, + "time_sec": 15.484160423278809 + }, + { + "epoch": 79, + "train_loss": 0.36959360103607175, + "train_acc": 0.87916, + "test_loss": 1.9509956113815308, + "test_acc": 0.601, + "lyapunov": null, + "grad_norm": 0.6757618176434513, + "grad_max_sv": 0.3065595250576735, + "grad_min_sv": 1.2097158442331279e-08, + "grad_condition": 77210703.25088154, + "lr": 0.00045816107833384175, + "time_sec": 15.480469226837158 + }, + { + "epoch": 80, + "train_loss": 0.3621886194419861, + "train_acc": 0.88318, + "test_loss": 1.9287394012451171, + "test_acc": 0.5985, + "lyapunov": null, + "grad_norm": 0.6691339361755074, + "grad_max_sv": 0.3024368964135647, + "grad_min_sv": 1.2120088314785185e-08, + "grad_condition": 405016123.1402856, + "lr": 0.0004477357683661729, + "time_sec": 15.493567705154419 + }, + { + "epoch": 81, + "train_loss": 0.35030229503631594, + "train_acc": 0.88624, + "test_loss": 2.00673182220459, + "test_acc": 0.5919, + "lyapunov": null, + "grad_norm": 0.6596224304671231, + "grad_max_sv": 0.29136806540191174, + "grad_min_sv": 1.127730693450046e-08, + "grad_condition": 1639288832.1236253, + "lr": 0.00043733338321784746, + "time_sec": 15.493369817733765 + }, + { + "epoch": 82, + "train_loss": 0.34493877026557923, + "train_acc": 0.8872, + "test_loss": 2.030837797164917, + "test_acc": 0.5955, + "lyapunov": null, + "grad_norm": 0.656267153049647, + "grad_max_sv": 0.28955256529152396, + "grad_min_sv": 1.1868315586143104e-08, + "grad_condition": 869246762.0746359, + "lr": 0.0004269584857187939, + "time_sec": 15.51423978805542 + }, + { + "epoch": 83, + "train_loss": 0.33515030410289764, + "train_acc": 0.89166, + "test_loss": 2.0619586929321287, + "test_acc": 0.5889, + "lyapunov": null, + "grad_norm": 0.6433611607654642, + "grad_max_sv": 0.28342132121324537, + "grad_min_sv": 1.1435175364601923e-08, + "grad_condition": 62926422.11698373, + "lr": 0.0004166156266419484, + "time_sec": 15.476901769638062 + }, + { + "epoch": 84, + "train_loss": 0.33155179508209226, + "train_acc": 0.8925, + "test_loss": 2.021995645713806, + "test_acc": 0.5931, + "lyapunov": null, + "grad_norm": 0.6432295423646542, + "grad_max_sv": 0.29169376716017725, + "grad_min_sv": 1.1024380705050054e-08, + "grad_condition": 1442816426.8026254, + "lr": 0.0004063093427071373, + "time_sec": 15.489609479904175 + }, + { + "epoch": 85, + "train_loss": 0.32435158078193665, + "train_acc": 0.89488, + "test_loss": 2.013304320335388, + "test_acc": 0.5916, + "lyapunov": null, + "grad_norm": 0.6387569144998656, + "grad_max_sv": 0.29359805807471273, + "grad_min_sv": 1.1595539084474638e-08, + "grad_condition": 189598831.94028363, + "lr": 0.0003960441545911199, + "time_sec": 15.501060247421265 + }, + { + "epoch": 86, + "train_loss": 0.3179238869667053, + "train_acc": 0.89698, + "test_loss": 1.9903604904174805, + "test_acc": 0.5974, + "lyapunov": null, + "grad_norm": 0.6339090393643317, + "grad_max_sv": 0.2939893651753664, + "grad_min_sv": 1.1321056620980375e-08, + "grad_condition": 126309584.77428427, + "lr": 0.0003858245649446718, + "time_sec": 15.473534345626831 + }, + { + "epoch": 87, + "train_loss": 0.3082590392589569, + "train_acc": 0.90084, + "test_loss": 1.9719016357421875, + "test_acc": 0.5973, + "lyapunov": null, + "grad_norm": 0.6204648872897773, + "grad_max_sv": 0.2808060821145773, + "grad_min_sv": 1.1003370339922671e-08, + "grad_condition": 295054731.1552657, + "lr": 0.00037565505641757235, + "time_sec": 15.489596128463745 + }, + { + "epoch": 88, + "train_loss": 0.30407683875083924, + "train_acc": 0.9015, + "test_loss": 2.046679413032532, + "test_acc": 0.5983, + "lyapunov": null, + "grad_norm": 0.6232550099645187, + "grad_max_sv": 0.2919613588601351, + "grad_min_sv": 1.106688122280361e-08, + "grad_condition": 322143674.85252506, + "lr": 0.00036554008969236695, + "time_sec": 15.49986457824707 + }, + { + "epoch": 89, + "train_loss": 0.3027446964073181, + "train_acc": 0.90118, + "test_loss": 2.086252244949341, + "test_acc": 0.5888, + "lyapunov": null, + "grad_norm": 0.6190288324649083, + "grad_max_sv": 0.28052753023803234, + "grad_min_sv": 1.0900322809496467e-08, + "grad_condition": 566479183.315316, + "lr": 0.0003554841015277638, + "time_sec": 15.504590034484863 + }, + { + "epoch": 90, + "train_loss": 0.29228587161064146, + "train_acc": 0.9047, + "test_loss": 2.0138395809173586, + "test_acc": 0.5944, + "lyapunov": null, + "grad_norm": 0.6096912272320082, + "grad_max_sv": 0.28337894156575205, + "grad_min_sv": 1.0885550369042416e-08, + "grad_condition": 2055184394.3102565, + "lr": 0.000345491502812526, + "time_sec": 15.49034571647644 + }, + { + "epoch": 91, + "train_loss": 0.2902773824119568, + "train_acc": 0.9069, + "test_loss": 2.0066411319732667, + "test_acc": 0.6022, + "lyapunov": null, + "grad_norm": 0.6066794741118794, + "grad_max_sv": 0.27967384792864325, + "grad_min_sv": 1.113149796019841e-08, + "grad_condition": 126085093.27825883, + "lr": 0.0003355666766307081, + "time_sec": 15.486260652542114 + }, + { + "epoch": 92, + "train_loss": 0.2833449110221863, + "train_acc": 0.90814, + "test_loss": 2.077221655654907, + "test_acc": 0.5914, + "lyapunov": null, + "grad_norm": 0.6042052133918574, + "grad_max_sv": 0.27325271964073183, + "grad_min_sv": 1.057503346621057e-08, + "grad_condition": 3596600642.934755, + "lr": 0.00032571397633909225, + "time_sec": 15.505445957183838 + }, + { + "epoch": 93, + "train_loss": 0.275921519203186, + "train_acc": 0.91156, + "test_loss": 2.0253973026275633, + "test_acc": 0.6011, + "lyapunov": null, + "grad_norm": 0.596345487343705, + "grad_max_sv": 0.27955980561673643, + "grad_min_sv": 1.0745895713884512e-08, + "grad_condition": 99226565.9342475, + "lr": 0.00031593772365766094, + "time_sec": 15.494666337966919 + }, + { + "epoch": 94, + "train_loss": 0.27615388660430906, + "train_acc": 0.90982, + "test_loss": 2.0751438976287844, + "test_acc": 0.5926, + "lyapunov": null, + "grad_norm": 0.5987218023474344, + "grad_max_sv": 0.27597025111317636, + "grad_min_sv": 1.0580089662877434e-08, + "grad_condition": 377084496.3903383, + "lr": 0.0003062422067739483, + "time_sec": 15.47998309135437 + }, + { + "epoch": 95, + "train_loss": 0.26991701264381407, + "train_acc": 0.9106, + "test_loss": 2.065015655708313, + "test_acc": 0.5995, + "lyapunov": null, + "grad_norm": 0.591359331692498, + "grad_max_sv": 0.280801360309124, + "grad_min_sv": 1.058501965522929e-08, + "grad_condition": 177268235.5442259, + "lr": 0.00029663167846209965, + "time_sec": 15.503370761871338 + }, + { + "epoch": 96, + "train_loss": 0.26606324160575867, + "train_acc": 0.9137, + "test_loss": 2.0547151592254638, + "test_acc": 0.6024, + "lyapunov": null, + "grad_norm": 0.5902198713479344, + "grad_max_sv": 0.2709753967821598, + "grad_min_sv": 1.0618598106555168e-08, + "grad_condition": 842340240.5160465, + "lr": 0.00028711035421746345, + "time_sec": 15.498698949813843 + }, + { + "epoch": 97, + "train_loss": 0.25566293501853943, + "train_acc": 0.91732, + "test_loss": 2.007575707626343, + "test_acc": 0.5994, + "lyapunov": null, + "grad_norm": 0.5817467490050799, + "grad_max_sv": 0.2697387088090181, + "grad_min_sv": 1.025438704743524e-08, + "grad_condition": 463836797.56778467, + "lr": 0.00027768241040753615, + "time_sec": 15.489367485046387 + }, + { + "epoch": 98, + "train_loss": 0.2515622547864914, + "train_acc": 0.91842, + "test_loss": 2.04601014251709, + "test_acc": 0.6008, + "lyapunov": null, + "grad_norm": 0.5794799592204589, + "grad_max_sv": 0.26677791140973567, + "grad_min_sv": 1.029050446439174e-08, + "grad_condition": 588388249.9313815, + "lr": 0.00026835198244006903, + "time_sec": 15.474334001541138 + }, + { + "epoch": 99, + "train_loss": 0.24500514444351196, + "train_acc": 0.92196, + "test_loss": 2.086534292602539, + "test_acc": 0.6033, + "lyapunov": null, + "grad_norm": 0.5694490714138027, + "grad_max_sv": 0.2623301979154348, + "grad_min_sv": 9.966415031648947e-09, + "grad_condition": 1015125356.3291184, + "lr": 0.0002591231629491421, + "time_sec": 15.491194248199463 + }, + { + "epoch": 100, + "train_loss": 0.24579128606796263, + "train_acc": 0.92022, + "test_loss": 2.033238724517822, + "test_acc": 0.6073, + "lyapunov": null, + "grad_norm": 0.5680720755555388, + "grad_max_sv": 0.25963654592633245, + "grad_min_sv": 9.939859338002274e-09, + "grad_condition": 445557731.47806203, + "lr": 0.0002499999999999997, + "time_sec": 15.490838050842285 + }, + { + "epoch": 101, + "train_loss": 0.24127339096069336, + "train_acc": 0.92306, + "test_loss": 2.1002378002166746, + "test_acc": 0.6036, + "lyapunov": null, + "grad_norm": 0.5641906297524981, + "grad_max_sv": 0.27549757733941077, + "grad_min_sv": 1.0068470844863327e-08, + "grad_condition": 409101783.765684, + "lr": 0.00024098649531343477, + "time_sec": 15.490317106246948 + }, + { + "epoch": 102, + "train_loss": 0.2390659130167961, + "train_acc": 0.9225, + "test_loss": 2.0233927448272704, + "test_acc": 0.6081, + "lyapunov": null, + "grad_norm": 0.5658609942304538, + "grad_max_sv": 0.2694991033524275, + "grad_min_sv": 9.839277652549483e-09, + "grad_condition": 3844646046.5289702, + "lr": 0.0002320866025105016, + "time_sec": 15.493839740753174 + }, + { + "epoch": 103, + "train_loss": 0.23365470203876496, + "train_acc": 0.92546, + "test_loss": 2.007601522064209, + "test_acc": 0.6095, + "lyapunov": null, + "grad_norm": 0.5584257053092218, + "grad_max_sv": 0.2743960417807102, + "grad_min_sv": 1.0207792428690299e-08, + "grad_condition": 250547163.15828475, + "lr": 0.0002233042253783278, + "time_sec": 15.469611167907715 + }, + { + "epoch": 104, + "train_loss": 0.22797604578971864, + "train_acc": 0.92666, + "test_loss": 1.9921390232086182, + "test_acc": 0.6104, + "lyapunov": null, + "grad_norm": 0.5477060234172001, + "grad_max_sv": 0.2509814579039812, + "grad_min_sv": 9.610087979301102e-09, + "grad_condition": 2430635198.302944, + "lr": 0.000214643216157784, + "time_sec": 15.485874652862549 + }, + { + "epoch": 105, + "train_loss": 0.2194866455602646, + "train_acc": 0.92896, + "test_loss": 2.065049479866028, + "test_acc": 0.6048, + "lyapunov": null, + "grad_norm": 0.5427601977062464, + "grad_max_sv": 0.24938638992607592, + "grad_min_sv": 9.552283189700334e-09, + "grad_condition": 249820703.92123896, + "lr": 0.00020610737385376332, + "time_sec": 15.492459058761597 + }, + { + "epoch": 106, + "train_loss": 0.22127391705036165, + "train_acc": 0.9277, + "test_loss": 2.0674615295410157, + "test_acc": 0.6066, + "lyapunov": null, + "grad_norm": 0.545565415204051, + "grad_max_sv": 0.252237818390131, + "grad_min_sv": 9.870081852563286e-09, + "grad_condition": 1730317003.0799267, + "lr": 0.00019770044256881242, + "time_sec": 15.494806051254272 + }, + { + "epoch": 107, + "train_loss": 0.21957805599212646, + "train_acc": 0.92936, + "test_loss": 2.069959518432617, + "test_acc": 0.6059, + "lyapunov": null, + "grad_norm": 0.5427102510735407, + "grad_max_sv": 0.26037181839346885, + "grad_min_sv": 9.796433978262464e-09, + "grad_condition": 619659373.2197987, + "lr": 0.0001894261098608447, + "time_sec": 15.494577169418335 + }, + { + "epoch": 108, + "train_loss": 0.21802687605857848, + "train_acc": 0.92854, + "test_loss": 2.069862120437622, + "test_acc": 0.6064, + "lyapunov": null, + "grad_norm": 0.5412145734801318, + "grad_max_sv": 0.26357722133398054, + "grad_min_sv": 9.731102705856913e-09, + "grad_condition": 4896886016.781491, + "lr": 0.000181288005125655, + "time_sec": 15.492915630340576 + }, + { + "epoch": 109, + "train_loss": 0.2105085688495636, + "train_acc": 0.9329, + "test_loss": 2.0300133407592775, + "test_acc": 0.6118, + "lyapunov": null, + "grad_norm": 0.5316865416598037, + "grad_max_sv": 0.24584890641272067, + "grad_min_sv": 9.288343090713484e-09, + "grad_condition": 1467162755.386783, + "lr": 0.0001732896980049473, + "time_sec": 15.496263980865479 + }, + { + "epoch": 110, + "train_loss": 0.20778575693130494, + "train_acc": 0.9324, + "test_loss": 2.033147290420532, + "test_acc": 0.6113, + "lyapunov": null, + "grad_norm": 0.5310273370102141, + "grad_max_sv": 0.25715232640504837, + "grad_min_sv": 9.619756366117082e-09, + "grad_condition": 909703469.1889927, + "lr": 0.00016543469682057076, + "time_sec": 15.48079514503479 + }, + { + "epoch": 111, + "train_loss": 0.2022018117570877, + "train_acc": 0.93408, + "test_loss": 2.0903577659606936, + "test_acc": 0.6097, + "lyapunov": null, + "grad_norm": 0.5248885212713278, + "grad_max_sv": 0.25115896202623844, + "grad_min_sv": 9.449230327059423e-09, + "grad_condition": 654306379.114652, + "lr": 0.00015772644703565552, + "time_sec": 15.481376886367798 + }, + { + "epoch": 112, + "train_loss": 0.2012022008705139, + "train_acc": 0.93478, + "test_loss": 2.1256960330963133, + "test_acc": 0.6062, + "lyapunov": null, + "grad_norm": 0.5259715208516651, + "grad_max_sv": 0.25880570262670516, + "grad_min_sv": 9.483339922537942e-09, + "grad_condition": 3450539548.1120477, + "lr": 0.00015016832974331713, + "time_sec": 15.474645853042603 + }, + { + "epoch": 113, + "train_loss": 0.20022091041088105, + "train_acc": 0.9359, + "test_loss": 2.0813249099731443, + "test_acc": 0.6127, + "lyapunov": null, + "grad_norm": 0.518582122023061, + "grad_max_sv": 0.25183347687125207, + "grad_min_sv": 9.362834274724563e-09, + "grad_condition": 206343345.02075773, + "lr": 0.00014276366018359834, + "time_sec": 15.51976227760315 + }, + { + "epoch": 114, + "train_loss": 0.20003674240589142, + "train_acc": 0.93548, + "test_loss": 2.059957353401184, + "test_acc": 0.6113, + "lyapunov": null, + "grad_norm": 0.5204510649985771, + "grad_max_sv": 0.24840169511735438, + "grad_min_sv": 9.433198861711483e-09, + "grad_condition": 156281157.83753783, + "lr": 0.00013551568628929425, + "time_sec": 15.486659526824951 + }, + { + "epoch": 115, + "train_loss": 0.19450239594459534, + "train_acc": 0.9368, + "test_loss": 2.081795527267456, + "test_acc": 0.613, + "lyapunov": null, + "grad_norm": 0.513222572000434, + "grad_max_sv": 0.25595347620546816, + "grad_min_sv": 9.54867237041787e-09, + "grad_condition": 768174194.3770015, + "lr": 0.00012842758726130276, + "time_sec": 15.51030945777893 + }, + { + "epoch": 116, + "train_loss": 0.19022185802936553, + "train_acc": 0.93888, + "test_loss": 2.0910057247161866, + "test_acc": 0.6109, + "lyapunov": null, + "grad_norm": 0.509950221902217, + "grad_max_sv": 0.24649180248379707, + "grad_min_sv": 9.286189562706521e-09, + "grad_condition": 190506622.94702727, + "lr": 0.0001215024721741218, + "time_sec": 15.4960777759552 + }, + { + "epoch": 117, + "train_loss": 0.18697156070709228, + "train_acc": 0.9409, + "test_loss": 2.1048245140075683, + "test_acc": 0.6113, + "lyapunov": null, + "grad_norm": 0.5023066665762482, + "grad_max_sv": 0.24158176295459272, + "grad_min_sv": 9.132921396148092e-09, + "grad_condition": 4603577974.011314, + "lr": 0.00011474337861210538, + "time_sec": 15.499973773956299 + }, + { + "epoch": 118, + "train_loss": 0.1897142271566391, + "train_acc": 0.93756, + "test_loss": 2.0972971321105955, + "test_acc": 0.611, + "lyapunov": null, + "grad_norm": 0.5079589956238173, + "grad_max_sv": 0.23757222667336464, + "grad_min_sv": 8.902529727208147e-09, + "grad_condition": 203658547.6693558, + "lr": 0.00010815327133708009, + "time_sec": 15.504847049713135 + }, + { + "epoch": 119, + "train_loss": 0.1865368722629547, + "train_acc": 0.93914, + "test_loss": 2.071676664352417, + "test_acc": 0.6093, + "lyapunov": null, + "grad_norm": 0.503144489128604, + "grad_max_sv": 0.24214695654809476, + "grad_min_sv": 9.078004823076872e-09, + "grad_condition": 401272428.2934058, + "lr": 0.00010173504098790182, + "time_sec": 15.494940042495728 + }, + { + "epoch": 120, + "train_loss": 0.18263185959339143, + "train_acc": 0.9413, + "test_loss": 2.0995028049468996, + "test_acc": 0.61, + "lyapunov": null, + "grad_norm": 0.49963467133223916, + "grad_max_sv": 0.2448117069900036, + "grad_min_sv": 9.255170430218228e-09, + "grad_condition": 840960640.7523018, + "lr": 9.549150281252629e-05, + "time_sec": 15.50493049621582 + }, + { + "epoch": 121, + "train_loss": 0.17661990516662598, + "train_acc": 0.94376, + "test_loss": 2.0479217910766603, + "test_acc": 0.6139, + "lyapunov": null, + "grad_norm": 0.49017967274439106, + "grad_max_sv": 0.24487083926796913, + "grad_min_sv": 9.062790381261093e-09, + "grad_condition": 297900363.86286056, + "lr": 8.942539543314794e-05, + "time_sec": 15.500595331192017 + }, + { + "epoch": 122, + "train_loss": 0.17436686351299285, + "train_acc": 0.94568, + "test_loss": 2.1033685138702394, + "test_acc": 0.6076, + "lyapunov": null, + "grad_norm": 0.4850908453719191, + "grad_max_sv": 0.24267951920628547, + "grad_min_sv": 9.175133607909614e-09, + "grad_condition": 151651082.8966439, + "lr": 8.353937964495024e-05, + "time_sec": 15.500707149505615 + }, + { + "epoch": 123, + "train_loss": 0.17420966561317444, + "train_acc": 0.94574, + "test_loss": 2.0771576751708984, + "test_acc": 0.6091, + "lyapunov": null, + "grad_norm": 0.48697820878218756, + "grad_max_sv": 0.24934822954237462, + "grad_min_sv": 9.043736691862272e-09, + "grad_condition": 342563176.44086933, + "lr": 7.783603724899243e-05, + "time_sec": 15.506757974624634 + }, + { + "epoch": 124, + "train_loss": 0.1725812414932251, + "train_acc": 0.94486, + "test_loss": 2.135185445022583, + "test_acc": 0.608, + "lyapunov": null, + "grad_norm": 0.4844109930695783, + "grad_max_sv": 0.24152979552745818, + "grad_min_sv": 9.037162034160328e-09, + "grad_condition": 142594941.29597357, + "lr": 7.231786991974666e-05, + "time_sec": 15.495522499084473 + }, + { + "epoch": 125, + "train_loss": 0.17122176954269408, + "train_acc": 0.94558, + "test_loss": 2.1152863483428956, + "test_acc": 0.612, + "lyapunov": null, + "grad_norm": 0.4826385410866865, + "grad_max_sv": 0.24549916423857213, + "grad_min_sv": 8.782795131207118e-09, + "grad_condition": 1347993858.355885, + "lr": 6.698729810778072e-05, + "time_sec": 15.489627361297607 + }, + { + "epoch": 126, + "train_loss": 0.17058868828058243, + "train_acc": 0.94662, + "test_loss": 2.1105800861358643, + "test_acc": 0.6093, + "lyapunov": null, + "grad_norm": 0.48281055678110163, + "grad_max_sv": 0.24400779306888581, + "grad_min_sv": 8.881911921611655e-09, + "grad_condition": 907798367.550338, + "lr": 6.184665997806817e-05, + "time_sec": 15.487231254577637 + }, + { + "epoch": 127, + "train_loss": 0.16842705961704255, + "train_acc": 0.94676, + "test_loss": 2.075766274642944, + "test_acc": 0.6129, + "lyapunov": null, + "grad_norm": 0.4814153543267475, + "grad_max_sv": 0.24004302807152272, + "grad_min_sv": 8.701755094839368e-09, + "grad_condition": 2608046426.213746, + "lr": 5.6898210384392595e-05, + "time_sec": 15.498921394348145 + }, + { + "epoch": 128, + "train_loss": 0.16494292568683624, + "train_acc": 0.94768, + "test_loss": 2.151611907196045, + "test_acc": 0.6047, + "lyapunov": null, + "grad_norm": 0.4763822150733386, + "grad_max_sv": 0.22842325568199157, + "grad_min_sv": 8.631154578726818e-09, + "grad_condition": 260686423.05458745, + "lr": 5.214411988029363e-05, + "time_sec": 15.489452600479126 + }, + { + "epoch": 129, + "train_loss": 0.16430129640102387, + "train_acc": 0.94824, + "test_loss": 2.0951647556304933, + "test_acc": 0.6128, + "lyapunov": null, + "grad_norm": 0.4754481221102857, + "grad_max_sv": 0.23247553929686546, + "grad_min_sv": 8.414460946461547e-09, + "grad_condition": 437817787.9214033, + "lr": 4.7586473766990294e-05, + "time_sec": 15.491871118545532 + }, + { + "epoch": 130, + "train_loss": 0.16159661509513856, + "train_acc": 0.94926, + "test_loss": 2.0767082111358643, + "test_acc": 0.6156, + "lyapunov": null, + "grad_norm": 0.4695751355550292, + "grad_max_sv": 0.24420519769191742, + "grad_min_sv": 8.783045789696309e-09, + "grad_condition": 2887625517.4136095, + "lr": 4.32272711786996e-05, + "time_sec": 15.50525712966919 + }, + { + "epoch": 131, + "train_loss": 0.16233114049911498, + "train_acc": 0.94986, + "test_loss": 2.090193899154663, + "test_acc": 0.6138, + "lyapunov": null, + "grad_norm": 0.4718133586500909, + "grad_max_sv": 0.23811170123517514, + "grad_min_sv": 8.731167988607069e-09, + "grad_condition": 171473959.97673047, + "lr": 3.906842420574966e-05, + "time_sec": 15.489828824996948 + }, + { + "epoch": 132, + "train_loss": 0.16304145799160003, + "train_acc": 0.9489, + "test_loss": 2.0699268299102784, + "test_acc": 0.6176, + "lyapunov": null, + "grad_norm": 0.47181034193305915, + "grad_max_sv": 0.24468088522553444, + "grad_min_sv": 8.694641913677115e-09, + "grad_condition": 3950610050.0669045, + "lr": 3.5111757055874305e-05, + "time_sec": 15.489463329315186 + }, + { + "epoch": 133, + "train_loss": 0.16222090543746948, + "train_acc": 0.94862, + "test_loss": 2.0846460132598876, + "test_acc": 0.6154, + "lyapunov": null, + "grad_norm": 0.47432514605256276, + "grad_max_sv": 0.2351464234292507, + "grad_min_sv": 8.508125437679944e-09, + "grad_condition": 3262769680.1508665, + "lr": 3.1359005254054254e-05, + "time_sec": 15.493263721466064 + }, + { + "epoch": 134, + "train_loss": 0.1564504327917099, + "train_acc": 0.95064, + "test_loss": 2.039795367050171, + "test_acc": 0.616, + "lyapunov": null, + "grad_norm": 0.46132567077349346, + "grad_max_sv": 0.23477552309632302, + "grad_min_sv": 8.499829853240298e-09, + "grad_condition": 275652896.5549098, + "lr": 2.7811814881259484e-05, + "time_sec": 15.501915693283081 + }, + { + "epoch": 135, + "train_loss": 0.1633557910346985, + "train_acc": 0.94906, + "test_loss": 2.1431523998260498, + "test_acc": 0.6082, + "lyapunov": null, + "grad_norm": 0.4725347110912027, + "grad_max_sv": 0.2321782097220421, + "grad_min_sv": 8.273568699135141e-09, + "grad_condition": 719211854.1190578, + "lr": 2.4471741852423218e-05, + "time_sec": 15.49996304512024 + }, + { + "epoch": 136, + "train_loss": 0.1577922046995163, + "train_acc": 0.95056, + "test_loss": 2.039000785446167, + "test_acc": 0.6154, + "lyapunov": null, + "grad_norm": 0.46347763663429586, + "grad_max_sv": 0.23204916007816792, + "grad_min_sv": 8.698969911215922e-09, + "grad_condition": 2466699319.0239253, + "lr": 2.1340251233966362e-05, + "time_sec": 15.497424125671387 + }, + { + "epoch": 137, + "train_loss": 0.15701312964439393, + "train_acc": 0.94962, + "test_loss": 2.085305763244629, + "test_acc": 0.6149, + "lyapunov": null, + "grad_norm": 0.46705315608384584, + "grad_max_sv": 0.22602895461022854, + "grad_min_sv": 8.363478537018877e-09, + "grad_condition": 5418883019.032962, + "lr": 1.8418716601170932e-05, + "time_sec": 15.491859674453735 + }, + { + "epoch": 138, + "train_loss": 0.15615028873443604, + "train_acc": 0.95128, + "test_loss": 2.101923070907593, + "test_acc": 0.6133, + "lyapunov": null, + "grad_norm": 0.46267937397470993, + "grad_max_sv": 0.23617675378918648, + "grad_min_sv": 8.55792531187071e-09, + "grad_condition": 668785672.229811, + "lr": 1.570841943568445e-05, + "time_sec": 15.490991592407227 + }, + { + "epoch": 139, + "train_loss": 0.15497800857305527, + "train_acc": 0.95104, + "test_loss": 2.131324795150757, + "test_acc": 0.6096, + "lyapunov": null, + "grad_norm": 0.4627316674414162, + "grad_max_sv": 0.23336338251829147, + "grad_min_sv": 8.54283688542061e-09, + "grad_condition": 547232078.4054619, + "lr": 1.3210548563419845e-05, + "time_sec": 15.493245840072632 + }, + { + "epoch": 140, + "train_loss": 0.15815438273906707, + "train_acc": 0.95054, + "test_loss": 2.0743191734313964, + "test_acc": 0.6132, + "lyapunov": null, + "grad_norm": 0.46525185071118685, + "grad_max_sv": 0.23031578138470649, + "grad_min_sv": 8.578327668909771e-09, + "grad_condition": 1472538153.7679148, + "lr": 1.0926199633097203e-05, + "time_sec": 15.508398056030273 + }, + { + "epoch": 141, + "train_loss": 0.15565036369800567, + "train_acc": 0.95156, + "test_loss": 2.083190835571289, + "test_acc": 0.6143, + "lyapunov": null, + "grad_norm": 0.4634211187185363, + "grad_max_sv": 0.2209864068776369, + "grad_min_sv": 8.388305931458784e-09, + "grad_condition": 735187313.3407264, + "lr": 8.856374635655688e-06, + "time_sec": 15.477578163146973 + }, + { + "epoch": 142, + "train_loss": 0.1526834367275238, + "train_acc": 0.95296, + "test_loss": 2.0579229915618895, + "test_acc": 0.6125, + "lyapunov": null, + "grad_norm": 0.45577943773159835, + "grad_max_sv": 0.22755092419683934, + "grad_min_sv": 8.457177222030362e-09, + "grad_condition": 1934756909.5252705, + "lr": 7.001981464747503e-06, + "time_sec": 15.47980809211731 + }, + { + "epoch": 143, + "train_loss": 0.1551715327501297, + "train_acc": 0.95138, + "test_loss": 2.094068197631836, + "test_acc": 0.6117, + "lyapunov": null, + "grad_norm": 0.46037433954931045, + "grad_max_sv": 0.22780660428106786, + "grad_min_sv": 8.502836361531321e-09, + "grad_condition": 963929271.8099291, + "lr": 5.3638335185058295e-06, + "time_sec": 15.485134363174438 + }, + { + "epoch": 144, + "train_loss": 0.15432416381835937, + "train_acc": 0.95178, + "test_loss": 2.110651277923584, + "test_acc": 0.6145, + "lyapunov": null, + "grad_norm": 0.4613614148812742, + "grad_max_sv": 0.22735756635665894, + "grad_min_sv": 8.44454743694368e-09, + "grad_condition": 1076939620.5494838, + "lr": 3.942649342761114e-06, + "time_sec": 15.493315696716309 + }, + { + "epoch": 145, + "train_loss": 0.15650244321346282, + "train_acc": 0.95044, + "test_loss": 2.0880191951751708, + "test_acc": 0.6119, + "lyapunov": null, + "grad_norm": 0.4660268832705423, + "grad_max_sv": 0.23027937039732932, + "grad_min_sv": 8.513131491633477e-09, + "grad_condition": 297143450.17696226, + "lr": 2.7390523158633524e-06, + "time_sec": 15.480180501937866 + }, + { + "epoch": 146, + "train_loss": 0.15448970682621002, + "train_acc": 0.952, + "test_loss": 2.0194208770751954, + "test_acc": 0.621, + "lyapunov": null, + "grad_norm": 0.4600178145858194, + "grad_max_sv": 0.22371375933289528, + "grad_min_sv": 8.652061342297613e-09, + "grad_condition": 2586380341.3174944, + "lr": 1.7535703752478133e-06, + "time_sec": 15.502386331558228 + }, + { + "epoch": 147, + "train_loss": 0.15414279275417328, + "train_acc": 0.95114, + "test_loss": 2.1069964057922363, + "test_acc": 0.6142, + "lyapunov": null, + "grad_norm": 0.4616285885002781, + "grad_max_sv": 0.2342820342630148, + "grad_min_sv": 8.68108046944878e-09, + "grad_condition": 379507449.7225493, + "lr": 9.866357858642196e-07, + "time_sec": 15.488835096359253 + }, + { + "epoch": 148, + "train_loss": 0.15620617700576783, + "train_acc": 0.95078, + "test_loss": 2.1161761821746827, + "test_acc": 0.6085, + "lyapunov": null, + "grad_norm": 0.46475971700568747, + "grad_max_sv": 0.2303019493818283, + "grad_min_sv": 8.695906369591763e-09, + "grad_condition": 729395813.573787, + "lr": 4.38584950570808e-07, + "time_sec": 15.500977277755737 + }, + { + "epoch": 149, + "train_loss": 0.1530400000667572, + "train_acc": 0.95168, + "test_loss": 2.0760107112884523, + "test_acc": 0.6147, + "lyapunov": null, + "grad_norm": 0.4585791144767188, + "grad_max_sv": 0.23029794916510582, + "grad_min_sv": 8.466522902726702e-09, + "grad_condition": 540903237.1982462, + "lr": 1.096582625772501e-07, + "time_sec": 15.49415111541748 + }, + { + "epoch": 150, + "train_loss": 0.15208094583511353, + "train_acc": 0.95228, + "test_loss": 2.0765135959625245, + "test_acc": 0.6142, + "lyapunov": null, + "grad_norm": 0.45743890734329773, + "grad_max_sv": 0.23194126076996327, + "grad_min_sv": 8.657490525268864e-09, + "grad_condition": 1180436704.3069885, + "lr": 0.0, + "time_sec": 15.487801790237427 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 4.642479771652222, + "train_acc": 0.0563, + "test_loss": 4.471788549804687, + "test_acc": 0.0525, + "lyapunov": null, + "grad_norm": 6.299700683423435, + "grad_max_sv": 5.376748514175415, + "grad_min_sv": 1.0876815811078355e-07, + "grad_condition": 123806577.64929362, + "lr": 0.0009998903417374227, + "time_sec": 32.55821919441223 + }, + { + "epoch": 2, + "train_loss": 3.921236069869995, + "train_acc": 0.1164, + "test_loss": 4.031661200714112, + "test_acc": 0.0987, + "lyapunov": null, + "grad_norm": 4.744809408953577, + "grad_max_sv": 4.056096857786178, + "grad_min_sv": 8.545224932585138e-08, + "grad_condition": 432966802.88566554, + "lr": 0.0009995614150494292, + "time_sec": 32.52909827232361 + }, + { + "epoch": 3, + "train_loss": 3.563258330001831, + "train_acc": 0.16394, + "test_loss": 3.665959655380249, + "test_acc": 0.1478, + "lyapunov": null, + "grad_norm": 3.968544793489477, + "grad_max_sv": 3.2656030714511872, + "grad_min_sv": 7.328074659307404e-08, + "grad_condition": 54148101.24592471, + "lr": 0.0009990133642141358, + "time_sec": 32.514859199523926 + }, + { + "epoch": 4, + "train_loss": 3.30762485168457, + "train_acc": 0.20282, + "test_loss": 3.602442971038818, + "test_acc": 0.1715, + "lyapunov": null, + "grad_norm": 3.360539325527588, + "grad_max_sv": 2.5611240684986116, + "grad_min_sv": 6.275024531099404e-08, + "grad_condition": 48558402.55237199, + "lr": 0.0009982464296247522, + "time_sec": 32.511942863464355 + }, + { + "epoch": 5, + "train_loss": 3.070727022857666, + "train_acc": 0.2431, + "test_loss": 3.0896433425903322, + "test_acc": 0.2428, + "lyapunov": null, + "grad_norm": 2.8612981669887914, + "grad_max_sv": 2.039329302310944, + "grad_min_sv": 5.3213209671998385e-08, + "grad_condition": 45899387.46141158, + "lr": 0.0009972609476841367, + "time_sec": 32.535019874572754 + }, + { + "epoch": 6, + "train_loss": 2.873271194458008, + "train_acc": 0.2795, + "test_loss": 3.0904090099334716, + "test_acc": 0.2488, + "lyapunov": null, + "grad_norm": 2.4953735022476837, + "grad_max_sv": 1.6734129816293717, + "grad_min_sv": 4.6456209978895655e-08, + "grad_condition": 55631562.29872565, + "lr": 0.000996057350657239, + "time_sec": 32.5289192199707 + }, + { + "epoch": 7, + "train_loss": 2.698648819732666, + "train_acc": 0.31066, + "test_loss": 2.9098104148864747, + "test_acc": 0.2799, + "lyapunov": null, + "grad_norm": 2.1963953249289316, + "grad_max_sv": 1.3662363350391389, + "grad_min_sv": 4.123726340746203e-08, + "grad_condition": 175183802.14149565, + "lr": 0.000994636166481494, + "time_sec": 32.53304076194763 + }, + { + "epoch": 8, + "train_loss": 2.5489939933776857, + "train_acc": 0.3414, + "test_loss": 2.918805715942383, + "test_acc": 0.2796, + "lyapunov": null, + "grad_norm": 1.9702205989411337, + "grad_max_sv": 1.1486580684781074, + "grad_min_sv": 3.6719605156498857e-08, + "grad_condition": 45078452.49282994, + "lr": 0.0009929980185352525, + "time_sec": 32.52384686470032 + }, + { + "epoch": 9, + "train_loss": 2.429889005661011, + "train_acc": 0.36856, + "test_loss": 2.617208067703247, + "test_acc": 0.3352, + "lyapunov": null, + "grad_norm": 1.7958642065413024, + "grad_max_sv": 0.976833887398243, + "grad_min_sv": 3.4111676243397945e-08, + "grad_condition": 88392837.95669074, + "lr": 0.0009911436253643444, + "time_sec": 32.52341938018799 + }, + { + "epoch": 10, + "train_loss": 2.312202433395386, + "train_acc": 0.39006, + "test_loss": 2.6336415348052977, + "test_acc": 0.3376, + "lyapunov": null, + "grad_norm": 1.6688154279715788, + "grad_max_sv": 0.8335120677947998, + "grad_min_sv": 3.1057890326202656e-08, + "grad_condition": 43581868.8179111, + "lr": 0.0009890738003669028, + "time_sec": 32.53657627105713 + }, + { + "epoch": 11, + "train_loss": 2.2113982202911378, + "train_acc": 0.41394, + "test_loss": 2.4651415496826172, + "test_acc": 0.3668, + "lyapunov": null, + "grad_norm": 1.5852177586967415, + "grad_max_sv": 0.7658713042736054, + "grad_min_sv": 2.981889714037678e-08, + "grad_condition": 33093574.792371016, + "lr": 0.00098678945143658, + "time_sec": 32.52194833755493 + }, + { + "epoch": 12, + "train_loss": 2.1308777001190187, + "train_acc": 0.432, + "test_loss": 2.5040061386108396, + "test_acc": 0.3654, + "lyapunov": null, + "grad_norm": 1.5129835225343262, + "grad_max_sv": 0.6879909574985504, + "grad_min_sv": 2.8309841176854533e-08, + "grad_condition": 30209408.624890875, + "lr": 0.0009842915805643154, + "time_sec": 32.519477128982544 + }, + { + "epoch": 13, + "train_loss": 2.051232373428345, + "train_acc": 0.4496, + "test_loss": 2.3721223037719725, + "test_acc": 0.3951, + "lyapunov": null, + "grad_norm": 1.4527042328822815, + "grad_max_sv": 0.6657147958874703, + "grad_min_sv": 2.7529119311919813e-08, + "grad_condition": 32877524.0735294, + "lr": 0.000981581283398829, + "time_sec": 32.51488184928894 + }, + { + "epoch": 14, + "train_loss": 1.9786859475326537, + "train_acc": 0.46372, + "test_loss": 2.4099101028442385, + "test_acc": 0.3885, + "lyapunov": null, + "grad_norm": 1.3903946049407439, + "grad_max_sv": 0.619149561971426, + "grad_min_sv": 2.6381883344583912e-08, + "grad_condition": 32158488.579634093, + "lr": 0.0009786597487660333, + "time_sec": 32.53034734725952 + }, + { + "epoch": 15, + "train_loss": 1.9087054037857056, + "train_acc": 0.48146, + "test_loss": 2.356669859313965, + "test_acc": 0.4054, + "lyapunov": null, + "grad_norm": 1.3401497982688246, + "grad_max_sv": 0.5884689308702946, + "grad_min_sv": 2.5261919572860948e-08, + "grad_condition": 27243493.57243519, + "lr": 0.0009755282581475766, + "time_sec": 32.53805232048035 + }, + { + "epoch": 16, + "train_loss": 1.8580862741851807, + "train_acc": 0.4903, + "test_loss": 2.3727874526977537, + "test_acc": 0.3978, + "lyapunov": null, + "grad_norm": 1.2980660063098806, + "grad_max_sv": 0.5687403865158558, + "grad_min_sv": 2.4705210138753485e-08, + "grad_condition": 36506916.881677285, + "lr": 0.0009721881851187403, + "time_sec": 32.529054403305054 + }, + { + "epoch": 17, + "train_loss": 1.7838218069458007, + "train_acc": 0.50946, + "test_loss": 2.411915710067749, + "test_acc": 0.4013, + "lyapunov": null, + "grad_norm": 1.2536082066251264, + "grad_max_sv": 0.5238922812044621, + "grad_min_sv": 2.3606322296920722e-08, + "grad_condition": 36849925.4309851, + "lr": 0.0009686409947459456, + "time_sec": 32.526257038116455 + }, + { + "epoch": 18, + "train_loss": 1.7371992016983033, + "train_acc": 0.51958, + "test_loss": 2.2599031024932863, + "test_acc": 0.4264, + "lyapunov": null, + "grad_norm": 1.229284180873741, + "grad_max_sv": 0.5230717524886132, + "grad_min_sv": 2.312521401454104e-08, + "grad_condition": 49053511.209702894, + "lr": 0.0009648882429441254, + "time_sec": 32.5399911403656 + }, + { + "epoch": 19, + "train_loss": 1.6830381874847413, + "train_acc": 0.53178, + "test_loss": 2.1889729766845702, + "test_acc": 0.4447, + "lyapunov": null, + "grad_norm": 1.1785390649791196, + "grad_max_sv": 0.4872257113456726, + "grad_min_sv": 2.2137700339541766e-08, + "grad_condition": 138866163.95418012, + "lr": 0.00096093157579425, + "time_sec": 32.52653670310974 + }, + { + "epoch": 20, + "train_loss": 1.6344180388641358, + "train_acc": 0.54714, + "test_loss": 2.227257891082764, + "test_acc": 0.4375, + "lyapunov": null, + "grad_norm": 1.1489035121891145, + "grad_max_sv": 0.47284500747919084, + "grad_min_sv": 2.1496744417870418e-08, + "grad_condition": 29593450.061258078, + "lr": 0.0009567727288213001, + "time_sec": 32.52734684944153 + }, + { + "epoch": 21, + "train_loss": 1.5880603087615968, + "train_acc": 0.55388, + "test_loss": 2.109391535949707, + "test_acc": 0.4605, + "lyapunov": null, + "grad_norm": 1.1350345214433142, + "grad_max_sv": 0.47259567975997924, + "grad_min_sv": 2.13382750108293e-08, + "grad_condition": 39203948.276769534, + "lr": 0.0009524135262330095, + "time_sec": 32.51701855659485 + }, + { + "epoch": 22, + "train_loss": 1.5451898790740968, + "train_acc": 0.56776, + "test_loss": 2.1289856529235838, + "test_acc": 0.4622, + "lyapunov": null, + "grad_norm": 1.1083032352595108, + "grad_max_sv": 0.44387331902980803, + "grad_min_sv": 2.0636199499213248e-08, + "grad_condition": 31425874.99589374, + "lr": 0.0009478558801197061, + "time_sec": 32.51593995094299 + }, + { + "epoch": 23, + "train_loss": 1.4903677392959596, + "train_acc": 0.57754, + "test_loss": 2.133696251296997, + "test_acc": 0.4671, + "lyapunov": null, + "grad_norm": 1.0825668306165386, + "grad_max_sv": 0.4390222616493702, + "grad_min_sv": 2.047547279677986e-08, + "grad_condition": 129993822.14571199, + "lr": 0.000943101789615607, + "time_sec": 32.51069974899292 + }, + { + "epoch": 24, + "train_loss": 1.4748817832183838, + "train_acc": 0.58158, + "test_loss": 2.1626602745056154, + "test_acc": 0.4632, + "lyapunov": null, + "grad_norm": 1.0751338305034317, + "grad_max_sv": 0.43956650570034983, + "grad_min_sv": 2.0244324640261713e-08, + "grad_condition": 41342301.85017798, + "lr": 0.0009381533400219313, + "time_sec": 32.533777952194214 + }, + { + "epoch": 25, + "train_loss": 1.4211272861099242, + "train_acc": 0.5951, + "test_loss": 2.096311450576782, + "test_acc": 0.481, + "lyapunov": null, + "grad_norm": 1.0399638076679998, + "grad_max_sv": 0.42748609334230425, + "grad_min_sv": 1.9937479189824357e-08, + "grad_condition": 38871491.7985058, + "lr": 0.0009330127018922189, + "time_sec": 32.53145217895508 + }, + { + "epoch": 26, + "train_loss": 1.396544298095703, + "train_acc": 0.6008, + "test_loss": 2.1271941719055176, + "test_acc": 0.4714, + "lyapunov": null, + "grad_norm": 1.028506322176559, + "grad_max_sv": 0.4079991213977337, + "grad_min_sv": 1.9165852835345554e-08, + "grad_condition": 39309871.185656376, + "lr": 0.000927682130080253, + "time_sec": 32.53234934806824 + }, + { + "epoch": 27, + "train_loss": 1.361050274734497, + "train_acc": 0.60774, + "test_loss": 2.0897907325744627, + "test_acc": 0.4811, + "lyapunov": null, + "grad_norm": 1.009655904655981, + "grad_max_sv": 0.39270137771964075, + "grad_min_sv": 1.8564359835493426e-08, + "grad_condition": 28517922.90367631, + "lr": 0.0009221639627510072, + "time_sec": 32.54458284378052 + }, + { + "epoch": 28, + "train_loss": 1.3167539808654785, + "train_acc": 0.62254, + "test_loss": 2.2306322479248046, + "test_acc": 0.4663, + "lyapunov": null, + "grad_norm": 0.9884512545787755, + "grad_max_sv": 0.393748565018177, + "grad_min_sv": 1.8592529393846036e-08, + "grad_condition": 34171303.89028352, + "lr": 0.0009164606203550494, + "time_sec": 32.525365352630615 + }, + { + "epoch": 29, + "train_loss": 1.2844751734542847, + "train_acc": 0.62692, + "test_loss": 2.19309764251709, + "test_acc": 0.4751, + "lyapunov": null, + "grad_norm": 0.9700062599103884, + "grad_max_sv": 0.387305423617363, + "grad_min_sv": 1.7872535887364373e-08, + "grad_condition": 26903062.552241027, + "lr": 0.0009105746045668516, + "time_sec": 32.526561975479126 + }, + { + "epoch": 30, + "train_loss": 1.2640808475494385, + "train_acc": 0.63334, + "test_loss": 2.2757652931213377, + "test_acc": 0.4536, + "lyapunov": null, + "grad_norm": 0.9608534659761124, + "grad_max_sv": 0.39087340533733367, + "grad_min_sv": 1.800268759344359e-08, + "grad_condition": 33161981.652286977, + "lr": 0.0009045084971874733, + "time_sec": 32.51922965049744 + }, + { + "epoch": 31, + "train_loss": 1.2303438648223877, + "train_acc": 0.64076, + "test_loss": 2.1164483276367188, + "test_acc": 0.4864, + "lyapunov": null, + "grad_norm": 0.9467438832197973, + "grad_max_sv": 0.3729639552533627, + "grad_min_sv": 1.7477179434233213e-08, + "grad_condition": 28618454.375976466, + "lr": 0.0008982649590120977, + "time_sec": 32.51436138153076 + }, + { + "epoch": 32, + "train_loss": 1.2104430978012084, + "train_acc": 0.6455, + "test_loss": 2.2232689281463625, + "test_acc": 0.481, + "lyapunov": null, + "grad_norm": 0.9361931150490757, + "grad_max_sv": 0.37210237309336663, + "grad_min_sv": 1.7445883718214537e-08, + "grad_condition": 29250266.68112684, + "lr": 0.0008918467286629196, + "time_sec": 32.532060861587524 + }, + { + "epoch": 33, + "train_loss": 1.1789497135162355, + "train_acc": 0.65278, + "test_loss": 2.143947396850586, + "test_acc": 0.4907, + "lyapunov": null, + "grad_norm": 0.9196344126113596, + "grad_max_sv": 0.367071446031332, + "grad_min_sv": 1.6865934492071855e-08, + "grad_condition": 40056883.7628016, + "lr": 0.0008852566213878943, + "time_sec": 32.526479959487915 + }, + { + "epoch": 34, + "train_loss": 1.1554690090179442, + "train_acc": 0.65844, + "test_loss": 2.1499678684234618, + "test_acc": 0.4922, + "lyapunov": null, + "grad_norm": 0.9057802742532243, + "grad_max_sv": 0.3550798542797565, + "grad_min_sv": 1.6556807021315262e-08, + "grad_condition": 255610578.57101497, + "lr": 0.000878497527825878, + "time_sec": 32.53326392173767 + }, + { + "epoch": 35, + "train_loss": 1.1325925022506713, + "train_acc": 0.66696, + "test_loss": 2.187357851409912, + "test_acc": 0.498, + "lyapunov": null, + "grad_norm": 0.8980481880537616, + "grad_max_sv": 0.35023384541273117, + "grad_min_sv": 1.653067620913107e-08, + "grad_condition": 47664672.04568529, + "lr": 0.000871572412738697, + "time_sec": 32.529192209243774 + }, + { + "epoch": 36, + "train_loss": 1.1162108192062379, + "train_acc": 0.67076, + "test_loss": 2.078928050994873, + "test_acc": 0.5062, + "lyapunov": null, + "grad_norm": 0.8887291214894226, + "grad_max_sv": 0.34587462246418, + "grad_min_sv": 1.598691768550653e-08, + "grad_condition": 47253750.309311725, + "lr": 0.0008644843137107055, + "time_sec": 32.53391623497009 + }, + { + "epoch": 37, + "train_loss": 1.088490778541565, + "train_acc": 0.67814, + "test_loss": 2.117596751022339, + "test_acc": 0.5079, + "lyapunov": null, + "grad_norm": 0.8827902897341499, + "grad_max_sv": 0.3460941031575203, + "grad_min_sv": 1.613751039689776e-08, + "grad_condition": 120430106.41639173, + "lr": 0.0008572363398164014, + "time_sec": 32.52939796447754 + }, + { + "epoch": 38, + "train_loss": 1.0622543322944642, + "train_acc": 0.68324, + "test_loss": 2.2524201555252077, + "test_acc": 0.4904, + "lyapunov": null, + "grad_norm": 0.8643928358196139, + "grad_max_sv": 0.3311579547822475, + "grad_min_sv": 1.5921391385842476e-08, + "grad_condition": 28147641.32749777, + "lr": 0.0008498316702566826, + "time_sec": 32.51650023460388 + }, + { + "epoch": 39, + "train_loss": 1.0258385097503662, + "train_acc": 0.6921, + "test_loss": 2.215389312553406, + "test_acc": 0.4912, + "lyapunov": null, + "grad_norm": 0.8507960671612714, + "grad_max_sv": 0.3430253557860851, + "grad_min_sv": 1.6041156275514722e-08, + "grad_condition": 41417221.90444088, + "lr": 0.0008422735529643442, + "time_sec": 32.51078248023987 + }, + { + "epoch": 40, + "train_loss": 1.008150099067688, + "train_acc": 0.69894, + "test_loss": 2.285165777206421, + "test_acc": 0.4887, + "lyapunov": null, + "grad_norm": 0.8500378683317822, + "grad_max_sv": 0.33013429269194605, + "grad_min_sv": 1.547893761040184e-08, + "grad_condition": 735713799.268648, + "lr": 0.0008345653031794289, + "time_sec": 32.51578617095947 + }, + { + "epoch": 41, + "train_loss": 0.9898018364715576, + "train_acc": 0.70114, + "test_loss": 2.1710759185791018, + "test_acc": 0.5054, + "lyapunov": null, + "grad_norm": 0.845636323093009, + "grad_max_sv": 0.334617256373167, + "grad_min_sv": 1.552002822438614e-08, + "grad_condition": 178790285.2774743, + "lr": 0.0008267103019950526, + "time_sec": 32.55498909950256 + }, + { + "epoch": 42, + "train_loss": 0.9689999252319336, + "train_acc": 0.70992, + "test_loss": 2.1532568422317504, + "test_acc": 0.5088, + "lyapunov": null, + "grad_norm": 0.8290515928528267, + "grad_max_sv": 0.32156808376312257, + "grad_min_sv": 1.513711112358096e-08, + "grad_condition": 63393159.17157264, + "lr": 0.0008187119948743447, + "time_sec": 32.5278046131134 + }, + { + "epoch": 43, + "train_loss": 0.9382334645080567, + "train_acc": 0.7173, + "test_loss": 2.1617983654022215, + "test_acc": 0.5099, + "lyapunov": null, + "grad_norm": 0.8199573726083517, + "grad_max_sv": 0.3176788903772831, + "grad_min_sv": 1.4969858624924724e-08, + "grad_condition": 39337083.20882653, + "lr": 0.000810573890139155, + "time_sec": 32.54653334617615 + }, + { + "epoch": 44, + "train_loss": 0.9182830782318115, + "train_acc": 0.7211, + "test_loss": 2.2938510860443113, + "test_acc": 0.5032, + "lyapunov": null, + "grad_norm": 0.8158010406023241, + "grad_max_sv": 0.32802748009562493, + "grad_min_sv": 1.5100565674969203e-08, + "grad_condition": 67700595.0906401, + "lr": 0.0008022995574311873, + "time_sec": 32.530778884887695 + }, + { + "epoch": 45, + "train_loss": 0.89899619556427, + "train_acc": 0.72596, + "test_loss": 2.3243038515090944, + "test_acc": 0.4978, + "lyapunov": null, + "grad_norm": 0.8106149860815325, + "grad_max_sv": 0.31970001086592675, + "grad_min_sv": 1.444995242211311e-08, + "grad_condition": 61707891.58292439, + "lr": 0.0007938926261462363, + "time_sec": 32.53210163116455 + }, + { + "epoch": 46, + "train_loss": 0.8833617488861084, + "train_acc": 0.72982, + "test_loss": 2.3542774658203127, + "test_acc": 0.4957, + "lyapunov": null, + "grad_norm": 0.8034668926314622, + "grad_max_sv": 0.3169444307684898, + "grad_min_sv": 1.4620525734955046e-08, + "grad_condition": 2306938949.5105658, + "lr": 0.0007853567838422158, + "time_sec": 32.52321457862854 + }, + { + "epoch": 47, + "train_loss": 0.8611621459960938, + "train_acc": 0.73636, + "test_loss": 2.3614687870025635, + "test_acc": 0.5019, + "lyapunov": null, + "grad_norm": 0.7952702534581538, + "grad_max_sv": 0.3213916938751936, + "grad_min_sv": 1.4360261544471564e-08, + "grad_condition": 98833361.99001758, + "lr": 0.0007766957746216719, + "time_sec": 32.551071643829346 + }, + { + "epoch": 48, + "train_loss": 0.8414902052116394, + "train_acc": 0.74232, + "test_loss": 2.3029669830322264, + "test_acc": 0.5085, + "lyapunov": null, + "grad_norm": 0.784297561095192, + "grad_max_sv": 0.3114811100065708, + "grad_min_sv": 1.4304356266148232e-08, + "grad_condition": 35252220.65254038, + "lr": 0.0007679133974894982, + "time_sec": 32.53156328201294 + }, + { + "epoch": 49, + "train_loss": 0.8309669767951965, + "train_acc": 0.74656, + "test_loss": 2.286893635559082, + "test_acc": 0.5045, + "lyapunov": null, + "grad_norm": 0.7866799445354931, + "grad_max_sv": 0.31325423568487165, + "grad_min_sv": 1.420554635719537e-08, + "grad_condition": 245828981.88515216, + "lr": 0.000759013504686565, + "time_sec": 32.530038595199585 + }, + { + "epoch": 50, + "train_loss": 0.7998139995956421, + "train_acc": 0.75392, + "test_loss": 2.3185002082824706, + "test_acc": 0.5087, + "lyapunov": null, + "grad_norm": 0.7702444904048175, + "grad_max_sv": 0.3126057405024767, + "grad_min_sv": 1.4057572236413247e-08, + "grad_condition": 895759530.8359982, + "lr": 0.0007499999999999998, + "time_sec": 32.539623498916626 + }, + { + "epoch": 51, + "train_loss": 0.7901191444015503, + "train_acc": 0.75788, + "test_loss": 2.337850633239746, + "test_acc": 0.509, + "lyapunov": null, + "grad_norm": 0.7647274965495858, + "grad_max_sv": 0.3004269126802683, + "grad_min_sv": 1.4008410850752107e-08, + "grad_condition": 176379975.2857924, + "lr": 0.0007408768370508575, + "time_sec": 32.52524662017822 + }, + { + "epoch": 52, + "train_loss": 0.7781133801651001, + "train_acc": 0.76004, + "test_loss": 2.3018055530548094, + "test_acc": 0.5142, + "lyapunov": null, + "grad_norm": 0.7628575677364715, + "grad_max_sv": 0.3077410638332367, + "grad_min_sv": 1.3944687078052547e-08, + "grad_condition": 476227675.55278826, + "lr": 0.0007316480175599307, + "time_sec": 32.53758096694946 + }, + { + "epoch": 53, + "train_loss": 0.7562806001663208, + "train_acc": 0.7648, + "test_loss": 2.379827104949951, + "test_acc": 0.5063, + "lyapunov": null, + "grad_norm": 0.7526764366291289, + "grad_max_sv": 0.30248577073216437, + "grad_min_sv": 1.3496081205355803e-08, + "grad_condition": 1089676260.2113607, + "lr": 0.0007223175895924635, + "time_sec": 32.54466271400452 + }, + { + "epoch": 54, + "train_loss": 0.7475943574333191, + "train_acc": 0.76786, + "test_loss": 2.377075054550171, + "test_acc": 0.512, + "lyapunov": null, + "grad_norm": 0.750215382398683, + "grad_max_sv": 0.3043755616992712, + "grad_min_sv": 1.3518679307933379e-08, + "grad_condition": 37379268.11133198, + "lr": 0.0007128896457825361, + "time_sec": 32.53366780281067 + }, + { + "epoch": 55, + "train_loss": 0.7366778998947143, + "train_acc": 0.77304, + "test_loss": 2.4013710193634035, + "test_acc": 0.5052, + "lyapunov": null, + "grad_norm": 0.7465343546140976, + "grad_max_sv": 0.30028381906449797, + "grad_min_sv": 1.382671875327368e-08, + "grad_condition": 28698720.96166121, + "lr": 0.0007033683215378998, + "time_sec": 32.53609323501587 + }, + { + "epoch": 56, + "train_loss": 0.7091366660690308, + "train_acc": 0.77762, + "test_loss": 2.33411563911438, + "test_acc": 0.5126, + "lyapunov": null, + "grad_norm": 0.7380136003829837, + "grad_max_sv": 0.2953734669834375, + "grad_min_sv": 1.303365445352823e-08, + "grad_condition": 1175915690.269457, + "lr": 0.0006937577932260512, + "time_sec": 32.5473690032959 + }, + { + "epoch": 57, + "train_loss": 0.6999513886070251, + "train_acc": 0.78266, + "test_loss": 2.43815316696167, + "test_acc": 0.5107, + "lyapunov": null, + "grad_norm": 0.7328699359209336, + "grad_max_sv": 0.2920531783252954, + "grad_min_sv": 1.2993845399135451e-08, + "grad_condition": 152587828.403437, + "lr": 0.0006840622763423388, + "time_sec": 32.55185127258301 + }, + { + "epoch": 58, + "train_loss": 0.6799741724395751, + "train_acc": 0.78742, + "test_loss": 2.381142023277283, + "test_acc": 0.5177, + "lyapunov": null, + "grad_norm": 0.7278793670004745, + "grad_max_sv": 0.2917668532580137, + "grad_min_sv": 1.304645755725517e-08, + "grad_condition": 169810706.32481682, + "lr": 0.0006742860236609073, + "time_sec": 32.537921667099 + }, + { + "epoch": 59, + "train_loss": 0.6622171486473083, + "train_acc": 0.79306, + "test_loss": 2.350548614120483, + "test_acc": 0.5197, + "lyapunov": null, + "grad_norm": 0.7160794966099063, + "grad_max_sv": 0.28989222049713137, + "grad_min_sv": 1.3154668510517373e-08, + "grad_condition": 518100543.52278435, + "lr": 0.0006644333233692913, + "time_sec": 32.556652784347534 + }, + { + "epoch": 60, + "train_loss": 0.6548414518356324, + "train_acc": 0.79498, + "test_loss": 2.558105725860596, + "test_acc": 0.5026, + "lyapunov": null, + "grad_norm": 0.7139601066120349, + "grad_max_sv": 0.2839757200330496, + "grad_min_sv": 1.2719528911207812e-08, + "grad_condition": 106598497.36127238, + "lr": 0.0006545084971874734, + "time_sec": 32.54617619514465 + }, + { + "epoch": 61, + "train_loss": 0.6367912077522278, + "train_acc": 0.79956, + "test_loss": 2.549720768737793, + "test_acc": 0.503, + "lyapunov": null, + "grad_norm": 0.7072938119035849, + "grad_max_sv": 0.2815666403621435, + "grad_min_sv": 1.2655917643131925e-08, + "grad_condition": 351545390.3878931, + "lr": 0.0006445158984722354, + "time_sec": 32.52895545959473 + }, + { + "epoch": 62, + "train_loss": 0.6108809622764587, + "train_acc": 0.80962, + "test_loss": 2.4582517892837523, + "test_acc": 0.5155, + "lyapunov": null, + "grad_norm": 0.6871779503013541, + "grad_max_sv": 0.27853575013577936, + "grad_min_sv": 1.2499909360016991e-08, + "grad_condition": 84323115.24066128, + "lr": 0.0006344599103076324, + "time_sec": 32.53638219833374 + }, + { + "epoch": 63, + "train_loss": 0.6110955193519593, + "train_acc": 0.8082, + "test_loss": 2.421668832015991, + "test_acc": 0.5218, + "lyapunov": null, + "grad_norm": 0.6974575785480693, + "grad_max_sv": 0.29437441378831863, + "grad_min_sv": 1.2760532111023327e-08, + "grad_condition": 1141074655.802474, + "lr": 0.0006243449435824269, + "time_sec": 32.5341739654541 + }, + { + "epoch": 64, + "train_loss": 0.5902745287513733, + "train_acc": 0.81326, + "test_loss": 2.525721709823608, + "test_acc": 0.5137, + "lyapunov": null, + "grad_norm": 0.6819775061327956, + "grad_max_sv": 0.2760129250586033, + "grad_min_sv": 1.2472146640636617e-08, + "grad_condition": 153380994.2741132, + "lr": 0.0006141754350553275, + "time_sec": 32.54224371910095 + }, + { + "epoch": 65, + "train_loss": 0.5767888858222961, + "train_acc": 0.81892, + "test_loss": 2.5681256893157958, + "test_acc": 0.5109, + "lyapunov": null, + "grad_norm": 0.6842883453940269, + "grad_max_sv": 0.27693442031741144, + "grad_min_sv": 1.214616162405202e-08, + "grad_condition": 180936373.24743983, + "lr": 0.0006039558454088793, + "time_sec": 32.535571575164795 + }, + { + "epoch": 66, + "train_loss": 0.5719620153427124, + "train_acc": 0.81766, + "test_loss": 2.4380872802734377, + "test_acc": 0.5187, + "lyapunov": null, + "grad_norm": 0.6845868887152398, + "grad_max_sv": 0.2806558083742857, + "grad_min_sv": 1.2417019015428798e-08, + "grad_condition": 91981311.14124386, + "lr": 0.000593690657292862, + "time_sec": 32.537678956985474 + }, + { + "epoch": 67, + "train_loss": 0.5476583632850647, + "train_acc": 0.8273, + "test_loss": 2.4955981588363647, + "test_acc": 0.5183, + "lyapunov": null, + "grad_norm": 0.6627927561159936, + "grad_max_sv": 0.27053381204605104, + "grad_min_sv": 1.1682474739156678e-08, + "grad_condition": 119357334.07208268, + "lr": 0.0005833843733580507, + "time_sec": 32.53704595565796 + }, + { + "epoch": 68, + "train_loss": 0.5349030065536499, + "train_acc": 0.82988, + "test_loss": 2.576411254119873, + "test_acc": 0.5106, + "lyapunov": null, + "grad_norm": 0.6582392321316073, + "grad_max_sv": 0.27176710218191147, + "grad_min_sv": 1.180562275559377e-08, + "grad_condition": 846305950.6996868, + "lr": 0.0005730415142812054, + "time_sec": 32.54088878631592 + }, + { + "epoch": 69, + "train_loss": 0.5356097626113892, + "train_acc": 0.82918, + "test_loss": 2.5702699626922607, + "test_acc": 0.5154, + "lyapunov": null, + "grad_norm": 0.6641979366792015, + "grad_max_sv": 0.27518576607108114, + "grad_min_sv": 1.2052892484938627e-08, + "grad_condition": 130030350.74337718, + "lr": 0.0005626666167821517, + "time_sec": 32.54138922691345 + }, + { + "epoch": 70, + "train_loss": 0.513014861240387, + "train_acc": 0.8363, + "test_loss": 2.6079680850982667, + "test_acc": 0.5106, + "lyapunov": null, + "grad_norm": 0.6500943565960319, + "grad_max_sv": 0.2724282074719667, + "grad_min_sv": 1.178367022645465e-08, + "grad_condition": 673776556.319051, + "lr": 0.0005522642316338265, + "time_sec": 32.5693633556366 + }, + { + "epoch": 71, + "train_loss": 0.49603789474487303, + "train_acc": 0.84198, + "test_loss": 2.5577601636886595, + "test_acc": 0.5169, + "lyapunov": null, + "grad_norm": 0.6430240258167331, + "grad_max_sv": 0.27023660503327845, + "grad_min_sv": 1.1744692686443959e-08, + "grad_condition": 80314537.0435541, + "lr": 0.0005418389216661573, + "time_sec": 32.54641532897949 + }, + { + "epoch": 72, + "train_loss": 0.49025250810623167, + "train_acc": 0.8432, + "test_loss": 2.5663631786346435, + "test_acc": 0.5234, + "lyapunov": null, + "grad_norm": 0.643279476058677, + "grad_max_sv": 0.27230227626860143, + "grad_min_sv": 1.1624652314357053e-08, + "grad_condition": 62786442.37501116, + "lr": 0.0005313952597646563, + "time_sec": 32.54123497009277 + }, + { + "epoch": 73, + "train_loss": 0.48772711526870727, + "train_acc": 0.84528, + "test_loss": 2.648895852470398, + "test_acc": 0.5168, + "lyapunov": null, + "grad_norm": 0.6405905214601311, + "grad_max_sv": 0.2699441872537136, + "grad_min_sv": 1.1482883187884097e-08, + "grad_condition": 111834993.35897943, + "lr": 0.0005209378268645994, + "time_sec": 32.56350803375244 + }, + { + "epoch": 74, + "train_loss": 0.467068857088089, + "train_acc": 0.84904, + "test_loss": 2.6479972763061523, + "test_acc": 0.5139, + "lyapunov": null, + "grad_norm": 0.6363491242612465, + "grad_max_sv": 0.2783078793436289, + "grad_min_sv": 1.1536390146556913e-08, + "grad_condition": 219390233.59819812, + "lr": 0.0005104712099416781, + "time_sec": 32.546509981155396 + }, + { + "epoch": 75, + "train_loss": 0.4711385968875885, + "train_acc": 0.84816, + "test_loss": 2.608884352874756, + "test_acc": 0.5195, + "lyapunov": null, + "grad_norm": 0.6374082155755629, + "grad_max_sv": 0.26901070438325403, + "grad_min_sv": 1.1190769711073856e-08, + "grad_condition": 334559678.03980315, + "lr": 0.0004999999999999996, + "time_sec": 32.54527187347412 + }, + { + "epoch": 76, + "train_loss": 0.45760808762550353, + "train_acc": 0.85254, + "test_loss": 2.6803735092163086, + "test_acc": 0.5135, + "lyapunov": null, + "grad_norm": 0.6239727106157842, + "grad_max_sv": 0.2669793125241995, + "grad_min_sv": 1.1426927580722445e-08, + "grad_condition": 760532191.4933506, + "lr": 0.0004895287900583212, + "time_sec": 32.556286096572876 + }, + { + "epoch": 77, + "train_loss": 0.4403402804660797, + "train_acc": 0.85888, + "test_loss": 2.6952022495269774, + "test_acc": 0.5153, + "lyapunov": null, + "grad_norm": 0.6180261512024202, + "grad_max_sv": 0.2674210451543331, + "grad_min_sv": 1.1284923026578207e-08, + "grad_condition": 800342890.6120255, + "lr": 0.0004790621731353997, + "time_sec": 32.570063829422 + }, + { + "epoch": 78, + "train_loss": 0.43386900725364685, + "train_acc": 0.8609, + "test_loss": 2.6530003887176514, + "test_acc": 0.5232, + "lyapunov": null, + "grad_norm": 0.6088851948477753, + "grad_max_sv": 0.2547843284904957, + "grad_min_sv": 1.0926095429623917e-08, + "grad_condition": 95464128.01992908, + "lr": 0.000468604740235343, + "time_sec": 32.54688787460327 + }, + { + "epoch": 79, + "train_loss": 0.4240487690734863, + "train_acc": 0.8654, + "test_loss": 2.7931711376190185, + "test_acc": 0.5088, + "lyapunov": null, + "grad_norm": 0.5993382897461283, + "grad_max_sv": 0.24774248749017716, + "grad_min_sv": 1.07508628526291e-08, + "grad_condition": 623384828.9212538, + "lr": 0.00045816107833384175, + "time_sec": 32.54505252838135 + }, + { + "epoch": 80, + "train_loss": 0.4058323986816406, + "train_acc": 0.86904, + "test_loss": 2.6775668907165526, + "test_acc": 0.5171, + "lyapunov": null, + "grad_norm": 0.5885819627420461, + "grad_max_sv": 0.24584074690937996, + "grad_min_sv": 1.022559682466867e-08, + "grad_condition": 156757634.53668588, + "lr": 0.0004477357683661729, + "time_sec": 32.55807185173035 + }, + { + "epoch": 81, + "train_loss": 0.3943421869087219, + "train_acc": 0.87248, + "test_loss": 2.596042275619507, + "test_acc": 0.5241, + "lyapunov": null, + "grad_norm": 0.5915570736864834, + "grad_max_sv": 0.252938449382782, + "grad_min_sv": 1.0551333432320953e-08, + "grad_condition": 290621793.5733338, + "lr": 0.00043733338321784746, + "time_sec": 32.56740355491638 + }, + { + "epoch": 82, + "train_loss": 0.39024432485580446, + "train_acc": 0.87492, + "test_loss": 2.715544410324097, + "test_acc": 0.5245, + "lyapunov": null, + "grad_norm": 0.5825377843109248, + "grad_max_sv": 0.2532011177390814, + "grad_min_sv": 1.0358391808878986e-08, + "grad_condition": 412597611.83888507, + "lr": 0.0004269584857187939, + "time_sec": 32.55344319343567 + }, + { + "epoch": 83, + "train_loss": 0.3715799244689941, + "train_acc": 0.88012, + "test_loss": 2.6901692249298095, + "test_acc": 0.5264, + "lyapunov": null, + "grad_norm": 0.5717041976150569, + "grad_max_sv": 0.24421822614967822, + "grad_min_sv": 1.0306600353336345e-08, + "grad_condition": 329985889.12779623, + "lr": 0.0004166156266419484, + "time_sec": 32.559467792510986 + }, + { + "epoch": 84, + "train_loss": 0.3671589259147644, + "train_acc": 0.882, + "test_loss": 2.6448453563690184, + "test_acc": 0.5345, + "lyapunov": null, + "grad_norm": 0.5691852194449533, + "grad_max_sv": 0.24019994884729384, + "grad_min_sv": 9.989625743278551e-09, + "grad_condition": 122734290.43687347, + "lr": 0.0004063093427071373, + "time_sec": 32.583213567733765 + }, + { + "epoch": 85, + "train_loss": 0.35963713159561156, + "train_acc": 0.8824, + "test_loss": 2.718573891067505, + "test_acc": 0.5235, + "lyapunov": null, + "grad_norm": 0.5695765343654775, + "grad_max_sv": 0.24239672683179378, + "grad_min_sv": 1.0202618674231591e-08, + "grad_condition": 1852046324.0623333, + "lr": 0.0003960441545911199, + "time_sec": 32.562474727630615 + }, + { + "epoch": 86, + "train_loss": 0.35900317364692685, + "train_acc": 0.88314, + "test_loss": 2.690758750152588, + "test_acc": 0.5281, + "lyapunov": null, + "grad_norm": 0.5695226754489282, + "grad_max_sv": 0.2359969958662987, + "grad_min_sv": 9.85500920487603e-09, + "grad_condition": 394077563.11466306, + "lr": 0.0003858245649446718, + "time_sec": 32.56024169921875 + }, + { + "epoch": 87, + "train_loss": 0.34593051030158994, + "train_acc": 0.88774, + "test_loss": 2.6911534130096437, + "test_acc": 0.5276, + "lyapunov": null, + "grad_norm": 0.5605319049257929, + "grad_max_sv": 0.24156057350337506, + "grad_min_sv": 9.944241273420092e-09, + "grad_condition": 944172650.8084786, + "lr": 0.00037565505641757235, + "time_sec": 32.55394530296326 + }, + { + "epoch": 88, + "train_loss": 0.3350362122821808, + "train_acc": 0.89292, + "test_loss": 2.761347038269043, + "test_acc": 0.5248, + "lyapunov": null, + "grad_norm": 0.5537857918957506, + "grad_max_sv": 0.24467103444039823, + "grad_min_sv": 9.84480716557587e-09, + "grad_condition": 557423472.2448919, + "lr": 0.00036554008969236695, + "time_sec": 32.565001487731934 + }, + { + "epoch": 89, + "train_loss": 0.32590197957992556, + "train_acc": 0.89466, + "test_loss": 2.873864278793335, + "test_acc": 0.5155, + "lyapunov": null, + "grad_norm": 0.5519161551510952, + "grad_max_sv": 0.2400045834481716, + "grad_min_sv": 9.881915213807297e-09, + "grad_condition": 248477788.07047543, + "lr": 0.0003554841015277638, + "time_sec": 32.55529260635376 + }, + { + "epoch": 90, + "train_loss": 0.31863860460281374, + "train_acc": 0.89664, + "test_loss": 2.8045926555633547, + "test_acc": 0.5231, + "lyapunov": null, + "grad_norm": 0.5479641587602809, + "grad_max_sv": 0.24628719314932823, + "grad_min_sv": 1.0033076104122573e-08, + "grad_condition": 105371945.52289103, + "lr": 0.000345491502812526, + "time_sec": 32.55959415435791 + }, + { + "epoch": 91, + "train_loss": 0.31169461310863494, + "train_acc": 0.89832, + "test_loss": 2.764314810180664, + "test_acc": 0.5242, + "lyapunov": null, + "grad_norm": 0.5454170376093662, + "grad_max_sv": 0.24890379793941975, + "grad_min_sv": 9.700326364034394e-09, + "grad_condition": 77171376.4128032, + "lr": 0.0003355666766307081, + "time_sec": 32.56360149383545 + }, + { + "epoch": 92, + "train_loss": 0.3113831770801544, + "train_acc": 0.90008, + "test_loss": 2.778244842529297, + "test_acc": 0.5291, + "lyapunov": null, + "grad_norm": 0.5407137447043685, + "grad_max_sv": 0.23328636735677719, + "grad_min_sv": 9.360961983687077e-09, + "grad_condition": 128397939.07976246, + "lr": 0.00032571397633909225, + "time_sec": 32.571138858795166 + }, + { + "epoch": 93, + "train_loss": 0.30188457230567933, + "train_acc": 0.903, + "test_loss": 2.7606024471282957, + "test_acc": 0.5339, + "lyapunov": null, + "grad_norm": 0.5330386559824729, + "grad_max_sv": 0.24647361300885678, + "grad_min_sv": 9.782626700523788e-09, + "grad_condition": 930794659.3385656, + "lr": 0.00031593772365766094, + "time_sec": 32.56698513031006 + }, + { + "epoch": 94, + "train_loss": 0.2888755958557129, + "train_acc": 0.90584, + "test_loss": 2.8303293384552, + "test_acc": 0.5252, + "lyapunov": null, + "grad_norm": 0.5239071385040424, + "grad_max_sv": 0.24134295992553234, + "grad_min_sv": 9.665177403035685e-09, + "grad_condition": 341790086.36703265, + "lr": 0.0003062422067739483, + "time_sec": 32.560898303985596 + }, + { + "epoch": 95, + "train_loss": 0.2843299233055115, + "train_acc": 0.90856, + "test_loss": 2.878970125961304, + "test_acc": 0.5228, + "lyapunov": null, + "grad_norm": 0.5173032628331714, + "grad_max_sv": 0.22986819855868817, + "grad_min_sv": 9.369064224050081e-09, + "grad_condition": 493164980.6666913, + "lr": 0.00029663167846209965, + "time_sec": 32.586976528167725 + }, + { + "epoch": 96, + "train_loss": 0.280480184469223, + "train_acc": 0.9093, + "test_loss": 2.9630297519683837, + "test_acc": 0.5184, + "lyapunov": null, + "grad_norm": 0.5133233008116458, + "grad_max_sv": 0.22380913645029069, + "grad_min_sv": 9.095019559701712e-09, + "grad_condition": 693584615.2355412, + "lr": 0.00028711035421746345, + "time_sec": 32.56851410865784 + }, + { + "epoch": 97, + "train_loss": 0.2670245563793182, + "train_acc": 0.9139, + "test_loss": 2.9036443214416505, + "test_acc": 0.5232, + "lyapunov": null, + "grad_norm": 0.5060688229901619, + "grad_max_sv": 0.23383041098713875, + "grad_min_sv": 9.393182952245269e-09, + "grad_condition": 365456172.90854704, + "lr": 0.00027768241040753615, + "time_sec": 32.560548305511475 + }, + { + "epoch": 98, + "train_loss": 0.2613537116527557, + "train_acc": 0.91552, + "test_loss": 2.93895020904541, + "test_acc": 0.5186, + "lyapunov": null, + "grad_norm": 0.5033096276176704, + "grad_max_sv": 0.22504370659589767, + "grad_min_sv": 9.149747783043782e-09, + "grad_condition": 181789237.51414594, + "lr": 0.00026835198244006903, + "time_sec": 32.57581615447998 + }, + { + "epoch": 99, + "train_loss": 0.25923142310142516, + "train_acc": 0.91662, + "test_loss": 2.9681204444885254, + "test_acc": 0.519, + "lyapunov": null, + "grad_norm": 0.5005047043499057, + "grad_max_sv": 0.23424391224980354, + "grad_min_sv": 9.202334173646042e-09, + "grad_condition": 1390486041.6800082, + "lr": 0.0002591231629491421, + "time_sec": 32.568488359451294 + }, + { + "epoch": 100, + "train_loss": 0.2552828652858734, + "train_acc": 0.91668, + "test_loss": 2.9585084489822386, + "test_acc": 0.5195, + "lyapunov": null, + "grad_norm": 0.5000052829086656, + "grad_max_sv": 0.23269009366631507, + "grad_min_sv": 9.008429451874688e-09, + "grad_condition": 118235741.33881798, + "lr": 0.0002499999999999997, + "time_sec": 32.64319896697998 + }, + { + "epoch": 101, + "train_loss": 0.2504552359342575, + "train_acc": 0.92034, + "test_loss": 2.881327504348755, + "test_acc": 0.527, + "lyapunov": null, + "grad_norm": 0.4976095445457081, + "grad_max_sv": 0.23710807636380196, + "grad_min_sv": 8.987613531706572e-09, + "grad_condition": 188175820.91636205, + "lr": 0.00024098649531343477, + "time_sec": 32.56459856033325 + }, + { + "epoch": 102, + "train_loss": 0.24319207516670227, + "train_acc": 0.9211, + "test_loss": 2.8339650466918944, + "test_acc": 0.5304, + "lyapunov": null, + "grad_norm": 0.49020316429940586, + "grad_max_sv": 0.22668980285525323, + "grad_min_sv": 8.876688220674786e-09, + "grad_condition": 3067014755.4611425, + "lr": 0.0002320866025105016, + "time_sec": 32.56655430793762 + }, + { + "epoch": 103, + "train_loss": 0.23643713227272034, + "train_acc": 0.92328, + "test_loss": 2.8374974479675292, + "test_acc": 0.5312, + "lyapunov": null, + "grad_norm": 0.48382300142218854, + "grad_max_sv": 0.22789723835885525, + "grad_min_sv": 8.629146283113676e-09, + "grad_condition": 335837582.58375555, + "lr": 0.0002233042253783278, + "time_sec": 32.56167936325073 + }, + { + "epoch": 104, + "train_loss": 0.23221797705173491, + "train_acc": 0.92652, + "test_loss": 2.8848680614471434, + "test_acc": 0.5292, + "lyapunov": null, + "grad_norm": 0.47687316634744686, + "grad_max_sv": 0.21569081246852875, + "grad_min_sv": 8.62663665758762e-09, + "grad_condition": 1157675505.971954, + "lr": 0.000214643216157784, + "time_sec": 32.563629150390625 + }, + { + "epoch": 105, + "train_loss": 0.2289664591026306, + "train_acc": 0.9265, + "test_loss": 2.9271271530151366, + "test_acc": 0.5268, + "lyapunov": null, + "grad_norm": 0.47818041348027984, + "grad_max_sv": 0.21913939844816924, + "grad_min_sv": 8.707405810184226e-09, + "grad_condition": 207155237.78245467, + "lr": 0.00020610737385376332, + "time_sec": 32.56299424171448 + }, + { + "epoch": 106, + "train_loss": 0.22260613627433776, + "train_acc": 0.92814, + "test_loss": 2.8978806022644044, + "test_acc": 0.5295, + "lyapunov": null, + "grad_norm": 0.4722385726091627, + "grad_max_sv": 0.2149375133216381, + "grad_min_sv": 8.579168120879944e-09, + "grad_condition": 165117262.170354, + "lr": 0.00019770044256881242, + "time_sec": 32.58579874038696 + }, + { + "epoch": 107, + "train_loss": 0.21763298731803893, + "train_acc": 0.93018, + "test_loss": 2.908183602523804, + "test_acc": 0.5286, + "lyapunov": null, + "grad_norm": 0.4652522989647011, + "grad_max_sv": 0.22290415540337563, + "grad_min_sv": 8.928726000223541e-09, + "grad_condition": 479064684.028664, + "lr": 0.0001894261098608447, + "time_sec": 32.594443798065186 + }, + { + "epoch": 108, + "train_loss": 0.2121983386325836, + "train_acc": 0.9317, + "test_loss": 2.8597964405059813, + "test_acc": 0.5362, + "lyapunov": null, + "grad_norm": 0.45763107412030085, + "grad_max_sv": 0.21216899007558823, + "grad_min_sv": 8.420200893585924e-09, + "grad_condition": 688259775.9446552, + "lr": 0.000181288005125655, + "time_sec": 32.56038689613342 + }, + { + "epoch": 109, + "train_loss": 0.20583704056739807, + "train_acc": 0.93444, + "test_loss": 2.9211787143707277, + "test_acc": 0.5282, + "lyapunov": null, + "grad_norm": 0.4568920236456778, + "grad_max_sv": 0.22295879386365414, + "grad_min_sv": 8.673458856169048e-09, + "grad_condition": 89075535.84085791, + "lr": 0.0001732896980049473, + "time_sec": 32.575947761535645 + }, + { + "epoch": 110, + "train_loss": 0.21038897478103638, + "train_acc": 0.93206, + "test_loss": 2.9601449073791506, + "test_acc": 0.5279, + "lyapunov": null, + "grad_norm": 0.45979845223683363, + "grad_max_sv": 0.22593539729714393, + "grad_min_sv": 8.6531671937215e-09, + "grad_condition": 89403715.48231289, + "lr": 0.00016543469682057076, + "time_sec": 32.607563495635986 + }, + { + "epoch": 111, + "train_loss": 0.19834216837882995, + "train_acc": 0.93586, + "test_loss": 2.9055423223495485, + "test_acc": 0.5353, + "lyapunov": null, + "grad_norm": 0.44710603724659786, + "grad_max_sv": 0.2183500427752733, + "grad_min_sv": 8.1763572969476e-09, + "grad_condition": 161545447.91228038, + "lr": 0.00015772644703565552, + "time_sec": 32.57204461097717 + }, + { + "epoch": 112, + "train_loss": 0.19908358410835267, + "train_acc": 0.93552, + "test_loss": 2.994161311531067, + "test_acc": 0.5244, + "lyapunov": null, + "grad_norm": 0.4546597416131923, + "grad_max_sv": 0.21809808388352395, + "grad_min_sv": 8.425444494170043e-09, + "grad_condition": 140538020.508261, + "lr": 0.00015016832974331713, + "time_sec": 32.601916790008545 + }, + { + "epoch": 113, + "train_loss": 0.191571541864872, + "train_acc": 0.93866, + "test_loss": 2.986764238739014, + "test_acc": 0.5296, + "lyapunov": null, + "grad_norm": 0.4450596671055528, + "grad_max_sv": 0.21210374720394612, + "grad_min_sv": 8.032377695355725e-09, + "grad_condition": 1444127435.9832203, + "lr": 0.00014276366018359834, + "time_sec": 32.559205770492554 + }, + { + "epoch": 114, + "train_loss": 0.1893005026912689, + "train_acc": 0.93862, + "test_loss": 3.0139925247192383, + "test_acc": 0.5255, + "lyapunov": null, + "grad_norm": 0.4424054116910155, + "grad_max_sv": 0.21594099812209605, + "grad_min_sv": 8.292241756094332e-09, + "grad_condition": 1221030181.2962646, + "lr": 0.00013551568628929425, + "time_sec": 32.54303812980652 + }, + { + "epoch": 115, + "train_loss": 0.1869383985710144, + "train_acc": 0.94032, + "test_loss": 2.9447794439315795, + "test_acc": 0.5338, + "lyapunov": null, + "grad_norm": 0.44046789562845245, + "grad_max_sv": 0.22429420053958893, + "grad_min_sv": 8.562988351723532e-09, + "grad_condition": 109188406.44486985, + "lr": 0.00012842758726130276, + "time_sec": 32.57725954055786 + }, + { + "epoch": 116, + "train_loss": 0.18216380766868592, + "train_acc": 0.94282, + "test_loss": 2.9761684719085695, + "test_acc": 0.533, + "lyapunov": null, + "grad_norm": 0.43380483120573066, + "grad_max_sv": 0.21227659583091735, + "grad_min_sv": 8.084414394003703e-09, + "grad_condition": 442388430.74640197, + "lr": 0.0001215024721741218, + "time_sec": 32.56703448295593 + }, + { + "epoch": 117, + "train_loss": 0.18284838955402374, + "train_acc": 0.94104, + "test_loss": 2.988401131248474, + "test_acc": 0.5304, + "lyapunov": null, + "grad_norm": 0.43518014689479523, + "grad_max_sv": 0.20529667772352694, + "grad_min_sv": 8.008318215188027e-09, + "grad_condition": 525224592.1224529, + "lr": 0.00011474337861210538, + "time_sec": 32.56633758544922 + }, + { + "epoch": 118, + "train_loss": 0.17929271565437316, + "train_acc": 0.94202, + "test_loss": 2.969692068481445, + "test_acc": 0.531, + "lyapunov": null, + "grad_norm": 0.43166468988319484, + "grad_max_sv": 0.20995365753769873, + "grad_min_sv": 7.949281083993037e-09, + "grad_condition": 206686551.43998715, + "lr": 0.00010815327133708009, + "time_sec": 32.58298921585083 + }, + { + "epoch": 119, + "train_loss": 0.1746947413468361, + "train_acc": 0.94538, + "test_loss": 2.9470513034820556, + "test_acc": 0.5265, + "lyapunov": null, + "grad_norm": 0.4240479391496432, + "grad_max_sv": 0.21465191170573233, + "grad_min_sv": 8.01244074109808e-09, + "grad_condition": 266673927.46960324, + "lr": 0.00010173504098790182, + "time_sec": 32.58079934120178 + }, + { + "epoch": 120, + "train_loss": 0.17056026011943817, + "train_acc": 0.94666, + "test_loss": 2.9715382446289063, + "test_acc": 0.5374, + "lyapunov": null, + "grad_norm": 0.4216192661535551, + "grad_max_sv": 0.21133692860603331, + "grad_min_sv": 8.155698732288316e-09, + "grad_condition": 310751065.89462894, + "lr": 9.549150281252629e-05, + "time_sec": 32.567041635513306 + }, + { + "epoch": 121, + "train_loss": 0.16829824639320373, + "train_acc": 0.94648, + "test_loss": 3.087546385574341, + "test_acc": 0.5255, + "lyapunov": null, + "grad_norm": 0.4183748049917772, + "grad_max_sv": 0.20680695101618768, + "grad_min_sv": 7.995454154665922e-09, + "grad_condition": 1023933342.3354034, + "lr": 8.942539543314794e-05, + "time_sec": 32.589598178863525 + }, + { + "epoch": 122, + "train_loss": 0.16800043944358825, + "train_acc": 0.94632, + "test_loss": 2.9318422325134277, + "test_acc": 0.5338, + "lyapunov": null, + "grad_norm": 0.42099752391898676, + "grad_max_sv": 0.21042499877512455, + "grad_min_sv": 7.547093950439551e-09, + "grad_condition": 900826897.3857119, + "lr": 8.353937964495024e-05, + "time_sec": 32.595381021499634 + }, + { + "epoch": 123, + "train_loss": 0.16323296820640565, + "train_acc": 0.94816, + "test_loss": 3.0529399940490722, + "test_acc": 0.5285, + "lyapunov": null, + "grad_norm": 0.41313116824251195, + "grad_max_sv": 0.19900580085814, + "grad_min_sv": 7.892230206862915e-09, + "grad_condition": 209614816.18259263, + "lr": 7.783603724899243e-05, + "time_sec": 32.5691282749176 + }, + { + "epoch": 124, + "train_loss": 0.16248614077568055, + "train_acc": 0.94808, + "test_loss": 2.968647869491577, + "test_acc": 0.5376, + "lyapunov": null, + "grad_norm": 0.4109739294498664, + "grad_max_sv": 0.2045503228902817, + "grad_min_sv": 7.709402672934767e-09, + "grad_condition": 204317712.1943869, + "lr": 7.231786991974666e-05, + "time_sec": 32.56873893737793 + }, + { + "epoch": 125, + "train_loss": 0.16562083917617798, + "train_acc": 0.94652, + "test_loss": 2.990608223724365, + "test_acc": 0.5324, + "lyapunov": null, + "grad_norm": 0.41726227575170305, + "grad_max_sv": 0.21484395451843738, + "grad_min_sv": 8.067420890524312e-09, + "grad_condition": 451509267.6606773, + "lr": 6.698729810778072e-05, + "time_sec": 32.563942432403564 + }, + { + "epoch": 126, + "train_loss": 0.16248787566184997, + "train_acc": 0.94908, + "test_loss": 3.0610411296844484, + "test_acc": 0.5248, + "lyapunov": null, + "grad_norm": 0.41265591679124974, + "grad_max_sv": 0.20524860061705114, + "grad_min_sv": 7.563831366450003e-09, + "grad_condition": 115790817.80184206, + "lr": 6.184665997806817e-05, + "time_sec": 32.568299770355225 + }, + { + "epoch": 127, + "train_loss": 0.15771708325862885, + "train_acc": 0.95078, + "test_loss": 2.962667014122009, + "test_acc": 0.5409, + "lyapunov": null, + "grad_norm": 0.4075071230249109, + "grad_max_sv": 0.20769537538290023, + "grad_min_sv": 8.188405986597757e-09, + "grad_condition": 380886928.1801485, + "lr": 5.6898210384392595e-05, + "time_sec": 32.57155394554138 + }, + { + "epoch": 128, + "train_loss": 0.15537331622004508, + "train_acc": 0.95126, + "test_loss": 2.9610030857086183, + "test_acc": 0.5357, + "lyapunov": null, + "grad_norm": 0.4021889013709537, + "grad_max_sv": 0.19925076719373463, + "grad_min_sv": 7.527878987789033e-09, + "grad_condition": 171791225.70681745, + "lr": 5.214411988029363e-05, + "time_sec": 32.58445978164673 + }, + { + "epoch": 129, + "train_loss": 0.15362726456165313, + "train_acc": 0.9504, + "test_loss": 3.0267199047088624, + "test_acc": 0.5318, + "lyapunov": null, + "grad_norm": 0.40304342978976343, + "grad_max_sv": 0.2073110181838274, + "grad_min_sv": 7.651128650391566e-09, + "grad_condition": 655223821.7012879, + "lr": 4.7586473766990294e-05, + "time_sec": 32.58788251876831 + }, + { + "epoch": 130, + "train_loss": 0.15159179414272309, + "train_acc": 0.95296, + "test_loss": 3.075101675415039, + "test_acc": 0.5263, + "lyapunov": null, + "grad_norm": 0.3974054527380892, + "grad_max_sv": 0.20575362853705884, + "grad_min_sv": 7.740591648555672e-09, + "grad_condition": 144759180.06870463, + "lr": 4.32272711786996e-05, + "time_sec": 32.578858613967896 + }, + { + "epoch": 131, + "train_loss": 0.1488430485343933, + "train_acc": 0.95292, + "test_loss": 2.9862019886016844, + "test_acc": 0.5315, + "lyapunov": null, + "grad_norm": 0.3954060106149679, + "grad_max_sv": 0.20766182690858842, + "grad_min_sv": 7.58607175857344e-09, + "grad_condition": 425579805.0794872, + "lr": 3.906842420574966e-05, + "time_sec": 32.586265325546265 + }, + { + "epoch": 132, + "train_loss": 0.14661406512260436, + "train_acc": 0.95324, + "test_loss": 3.057056298828125, + "test_acc": 0.5262, + "lyapunov": null, + "grad_norm": 0.39095745142548216, + "grad_max_sv": 0.19490535818040372, + "grad_min_sv": 7.49121251628342e-09, + "grad_condition": 3507301112.9708757, + "lr": 3.5111757055874305e-05, + "time_sec": 32.574090003967285 + }, + { + "epoch": 133, + "train_loss": 0.1463806065893173, + "train_acc": 0.95318, + "test_loss": 3.0613175567626953, + "test_acc": 0.527, + "lyapunov": null, + "grad_norm": 0.3949318760097119, + "grad_max_sv": 0.2000393845140934, + "grad_min_sv": 7.511325199847929e-09, + "grad_condition": 264016430.37942663, + "lr": 3.1359005254054254e-05, + "time_sec": 32.57793402671814 + }, + { + "epoch": 134, + "train_loss": 0.14586117388010025, + "train_acc": 0.95352, + "test_loss": 3.0277784969329833, + "test_acc": 0.5333, + "lyapunov": null, + "grad_norm": 0.3915443650869973, + "grad_max_sv": 0.20002376139163972, + "grad_min_sv": 7.407051562673041e-09, + "grad_condition": 1569872714.1138968, + "lr": 2.7811814881259484e-05, + "time_sec": 32.58327078819275 + }, + { + "epoch": 135, + "train_loss": 0.14679538232803344, + "train_acc": 0.9531, + "test_loss": 3.02330316696167, + "test_acc": 0.5325, + "lyapunov": null, + "grad_norm": 0.39654447314663155, + "grad_max_sv": 0.2064110331237316, + "grad_min_sv": 8.009200439971707e-09, + "grad_condition": 408075856.5604743, + "lr": 2.4471741852423218e-05, + "time_sec": 32.57164478302002 + }, + { + "epoch": 136, + "train_loss": 0.14213005175113677, + "train_acc": 0.95606, + "test_loss": 3.066131346511841, + "test_acc": 0.5326, + "lyapunov": null, + "grad_norm": 0.386859099144263, + "grad_max_sv": 0.20008183866739274, + "grad_min_sv": 7.493826075335216e-09, + "grad_condition": 1294487907.3292127, + "lr": 2.1340251233966362e-05, + "time_sec": 32.59002447128296 + }, + { + "epoch": 137, + "train_loss": 0.14528326896190644, + "train_acc": 0.95314, + "test_loss": 2.9820048439025877, + "test_acc": 0.5384, + "lyapunov": null, + "grad_norm": 0.3940518150499405, + "grad_max_sv": 0.20172332599759102, + "grad_min_sv": 7.518978299708582e-09, + "grad_condition": 2050951064.0374703, + "lr": 1.8418716601170932e-05, + "time_sec": 32.582863569259644 + }, + { + "epoch": 138, + "train_loss": 0.14290555841445923, + "train_acc": 0.954, + "test_loss": 2.9484275436401366, + "test_acc": 0.5392, + "lyapunov": null, + "grad_norm": 0.3885095445150157, + "grad_max_sv": 0.1956668719649315, + "grad_min_sv": 7.481351363262425e-09, + "grad_condition": 817168787.737042, + "lr": 1.570841943568445e-05, + "time_sec": 32.56788969039917 + }, + { + "epoch": 139, + "train_loss": 0.1455221847629547, + "train_acc": 0.95376, + "test_loss": 2.9918841510772705, + "test_acc": 0.539, + "lyapunov": null, + "grad_norm": 0.39394584988421966, + "grad_max_sv": 0.1982663732022047, + "grad_min_sv": 7.502347731524073e-09, + "grad_condition": 1796580822.5410652, + "lr": 1.3210548563419845e-05, + "time_sec": 32.57190442085266 + }, + { + "epoch": 140, + "train_loss": 0.1442144584083557, + "train_acc": 0.95352, + "test_loss": 2.970733211517334, + "test_acc": 0.5376, + "lyapunov": null, + "grad_norm": 0.39260771988813964, + "grad_max_sv": 0.19792755618691443, + "grad_min_sv": 7.351794456978561e-09, + "grad_condition": 208762115.79842368, + "lr": 1.0926199633097203e-05, + "time_sec": 32.58234429359436 + }, + { + "epoch": 141, + "train_loss": 0.1421483956861496, + "train_acc": 0.95486, + "test_loss": 2.9954518421173097, + "test_acc": 0.5376, + "lyapunov": null, + "grad_norm": 0.3895044607831209, + "grad_max_sv": 0.19535492211580277, + "grad_min_sv": 7.2159212467261255e-09, + "grad_condition": 226711442.0952455, + "lr": 8.856374635655688e-06, + "time_sec": 32.580827951431274 + }, + { + "epoch": 142, + "train_loss": 0.14344135119915008, + "train_acc": 0.95412, + "test_loss": 3.0175164573669435, + "test_acc": 0.5347, + "lyapunov": null, + "grad_norm": 0.3912699552240718, + "grad_max_sv": 0.20520108379423618, + "grad_min_sv": 7.762914990688819e-09, + "grad_condition": 387803307.69275963, + "lr": 7.001981464747503e-06, + "time_sec": 32.58955121040344 + }, + { + "epoch": 143, + "train_loss": 0.145557352809906, + "train_acc": 0.95334, + "test_loss": 2.9905672885894776, + "test_acc": 0.5351, + "lyapunov": null, + "grad_norm": 0.3937145534468507, + "grad_max_sv": 0.19824392758309842, + "grad_min_sv": 7.470967854170812e-09, + "grad_condition": 615993628.5132923, + "lr": 5.3638335185058295e-06, + "time_sec": 32.584557056427 + }, + { + "epoch": 144, + "train_loss": 0.13792892556190492, + "train_acc": 0.9568, + "test_loss": 3.0243384300231932, + "test_acc": 0.5351, + "lyapunov": null, + "grad_norm": 0.38137874618156004, + "grad_max_sv": 0.20396318212151526, + "grad_min_sv": 7.759564610645975e-09, + "grad_condition": 401781652.79968464, + "lr": 3.942649342761114e-06, + "time_sec": 32.58082866668701 + }, + { + "epoch": 145, + "train_loss": 0.14240989098906517, + "train_acc": 0.95506, + "test_loss": 3.008878281021118, + "test_acc": 0.5332, + "lyapunov": null, + "grad_norm": 0.38824198485970274, + "grad_max_sv": 0.1965224850922823, + "grad_min_sv": 7.475432478099615e-09, + "grad_condition": 547980005.9847585, + "lr": 2.7390523158633524e-06, + "time_sec": 32.580146074295044 + }, + { + "epoch": 146, + "train_loss": 0.14141309247016906, + "train_acc": 0.95526, + "test_loss": 2.9967607612609863, + "test_acc": 0.5355, + "lyapunov": null, + "grad_norm": 0.3897738666220961, + "grad_max_sv": 0.20576116181910037, + "grad_min_sv": 7.723471491180578e-09, + "grad_condition": 174968319.88759154, + "lr": 1.7535703752478133e-06, + "time_sec": 32.57999658584595 + }, + { + "epoch": 147, + "train_loss": 0.14116668840408325, + "train_acc": 0.95622, + "test_loss": 3.015700612258911, + "test_acc": 0.5356, + "lyapunov": null, + "grad_norm": 0.38647682331651556, + "grad_max_sv": 0.20005690585821867, + "grad_min_sv": 7.458373789469112e-09, + "grad_condition": 559134109.3457831, + "lr": 9.866357858642196e-07, + "time_sec": 32.57423949241638 + }, + { + "epoch": 148, + "train_loss": 0.13872075388908386, + "train_acc": 0.95694, + "test_loss": 3.02675003452301, + "test_acc": 0.5311, + "lyapunov": null, + "grad_norm": 0.3834516001697345, + "grad_max_sv": 0.20063496865332126, + "grad_min_sv": 7.280352303873708e-09, + "grad_condition": 342935155.3336584, + "lr": 4.38584950570808e-07, + "time_sec": 32.59147930145264 + }, + { + "epoch": 149, + "train_loss": 0.14044044229030608, + "train_acc": 0.9558, + "test_loss": 3.0015827127456665, + "test_acc": 0.537, + "lyapunov": null, + "grad_norm": 0.38662537604202735, + "grad_max_sv": 0.1903643485158682, + "grad_min_sv": 7.2725075060480446e-09, + "grad_condition": 1114748941.7660475, + "lr": 1.096582625772501e-07, + "time_sec": 32.56627154350281 + }, + { + "epoch": 150, + "train_loss": 0.14047483313083647, + "train_acc": 0.95586, + "test_loss": 3.1137742416381835, + "test_acc": 0.5222, + "lyapunov": null, + "grad_norm": 0.38553295960146916, + "grad_max_sv": 0.2001470748335123, + "grad_min_sv": 7.337464655082695e-09, + "grad_condition": 1377858482.3116786, + "lr": 0.0, + "time_sec": 32.586660385131836 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 4.87748296585083, + "train_acc": 0.0306, + "test_loss": 4.82872876663208, + "test_acc": 0.0165, + "lyapunov": null, + "grad_norm": 5.932964620640208, + "grad_max_sv": 5.34441111087799, + "grad_min_sv": 9.95076935739192e-08, + "grad_condition": 162613846.39082906, + "lr": 0.0009998903417374227, + "time_sec": 49.64781618118286 + }, + { + "epoch": 2, + "train_loss": 4.325910377655029, + "train_acc": 0.05894, + "test_loss": 4.736625276947022, + "test_acc": 0.0233, + "lyapunov": null, + "grad_norm": 4.434671975936239, + "grad_max_sv": 3.9236845791339876, + "grad_min_sv": 7.506598741907622e-08, + "grad_condition": 326618949.3555427, + "lr": 0.0009995614150494292, + "time_sec": 49.66104316711426 + }, + { + "epoch": 3, + "train_loss": 4.033521332244873, + "train_acc": 0.08816, + "test_loss": 4.546054625701904, + "test_acc": 0.0313, + "lyapunov": null, + "grad_norm": 3.5972867305140204, + "grad_max_sv": 3.0456687450408935, + "grad_min_sv": 6.285284603370356e-08, + "grad_condition": 641155242.0675491, + "lr": 0.0009990133642141358, + "time_sec": 49.67153525352478 + }, + { + "epoch": 4, + "train_loss": 3.8378815770721437, + "train_acc": 0.11312, + "test_loss": 4.485385893249512, + "test_acc": 0.0421, + "lyapunov": null, + "grad_norm": 3.005868245561951, + "grad_max_sv": 2.4899374902248383, + "grad_min_sv": 5.274935636068179e-08, + "grad_condition": 56291013.628438115, + "lr": 0.0009982464296247522, + "time_sec": 49.65495419502258 + }, + { + "epoch": 5, + "train_loss": 3.6790373979949953, + "train_acc": 0.1354, + "test_loss": 4.809463809204102, + "test_acc": 0.0483, + "lyapunov": null, + "grad_norm": 2.481791347519261, + "grad_max_sv": 1.911762249469757, + "grad_min_sv": 4.251578253344768e-08, + "grad_condition": 59447447.39549043, + "lr": 0.0009972609476841367, + "time_sec": 49.609050989151 + }, + { + "epoch": 6, + "train_loss": 3.5471466955566404, + "train_acc": 0.1563, + "test_loss": 4.763859475708008, + "test_acc": 0.0562, + "lyapunov": null, + "grad_norm": 2.0531107778434636, + "grad_max_sv": 1.4932055324316025, + "grad_min_sv": 3.614347272584695e-08, + "grad_condition": 45442606.51570525, + "lr": 0.000996057350657239, + "time_sec": 49.593199491500854 + }, + { + "epoch": 7, + "train_loss": 3.4418113514709474, + "train_acc": 0.17478, + "test_loss": 4.615470837402344, + "test_acc": 0.061, + "lyapunov": null, + "grad_norm": 1.7367000738812381, + "grad_max_sv": 1.1847797572612762, + "grad_min_sv": 3.088092909442341e-08, + "grad_condition": 65255140.867708586, + "lr": 0.000994636166481494, + "time_sec": 49.60785531997681 + }, + { + "epoch": 8, + "train_loss": 3.354895782546997, + "train_acc": 0.18784, + "test_loss": 5.2386075889587405, + "test_acc": 0.0585, + "lyapunov": null, + "grad_norm": 1.5335851977180728, + "grad_max_sv": 0.9428193107247352, + "grad_min_sv": 2.6885542893373415e-08, + "grad_condition": 75909476.50814043, + "lr": 0.0009929980185352525, + "time_sec": 49.60816526412964 + }, + { + "epoch": 9, + "train_loss": 3.2788688597869875, + "train_acc": 0.20466, + "test_loss": 5.2327860107421875, + "test_acc": 0.0714, + "lyapunov": null, + "grad_norm": 1.374914600034168, + "grad_max_sv": 0.7664340496063232, + "grad_min_sv": 2.4066519885290737e-08, + "grad_condition": 51969313.05697616, + "lr": 0.0009911436253643444, + "time_sec": 49.62115836143494 + }, + { + "epoch": 10, + "train_loss": 3.214320725250244, + "train_acc": 0.21478, + "test_loss": 5.367890010070801, + "test_acc": 0.0635, + "lyapunov": null, + "grad_norm": 1.2723756047607861, + "grad_max_sv": 0.6678376257419586, + "grad_min_sv": 2.3140357913176147e-08, + "grad_condition": 33781734.36143675, + "lr": 0.0009890738003669028, + "time_sec": 49.653478384017944 + }, + { + "epoch": 11, + "train_loss": 3.157560857696533, + "train_acc": 0.22716, + "test_loss": 4.9893413871765135, + "test_acc": 0.0793, + "lyapunov": null, + "grad_norm": 1.1804196554033854, + "grad_max_sv": 0.5599115259945393, + "grad_min_sv": 2.0999575375824088e-08, + "grad_condition": 40003653.553005375, + "lr": 0.00098678945143658, + "time_sec": 49.64659833908081 + }, + { + "epoch": 12, + "train_loss": 3.10919125541687, + "train_acc": 0.23374, + "test_loss": 5.922018681335449, + "test_acc": 0.0572, + "lyapunov": null, + "grad_norm": 1.1127516543729237, + "grad_max_sv": 0.5103657670319081, + "grad_min_sv": 2.0326233945988648e-08, + "grad_condition": 31959597.02886455, + "lr": 0.0009842915805643154, + "time_sec": 49.6422758102417 + }, + { + "epoch": 13, + "train_loss": 3.0661709033203124, + "train_acc": 0.24498, + "test_loss": 5.5857378784179685, + "test_acc": 0.0641, + "lyapunov": null, + "grad_norm": 1.0572945850355566, + "grad_max_sv": 0.468644580245018, + "grad_min_sv": 1.9489185115739716e-08, + "grad_condition": 28974309.240684826, + "lr": 0.000981581283398829, + "time_sec": 49.644200801849365 + }, + { + "epoch": 14, + "train_loss": 3.031631886138916, + "train_acc": 0.2494, + "test_loss": 6.1126462295532225, + "test_acc": 0.0622, + "lyapunov": null, + "grad_norm": 1.0078886975437553, + "grad_max_sv": 0.4199274107813835, + "grad_min_sv": 1.78886194669714e-08, + "grad_condition": 58726821.90857921, + "lr": 0.0009786597487660333, + "time_sec": 49.64050054550171 + }, + { + "epoch": 15, + "train_loss": 2.9854307820892334, + "train_acc": 0.25912, + "test_loss": 6.682256416320801, + "test_acc": 0.0577, + "lyapunov": null, + "grad_norm": 0.9661185163428607, + "grad_max_sv": 0.4044369950890541, + "grad_min_sv": 1.7625257230091673e-08, + "grad_condition": 47054066.77256496, + "lr": 0.0009755282581475766, + "time_sec": 49.64783048629761 + }, + { + "epoch": 16, + "train_loss": 2.950966311187744, + "train_acc": 0.26442, + "test_loss": 6.452827975463867, + "test_acc": 0.0549, + "lyapunov": null, + "grad_norm": 0.9327205202160699, + "grad_max_sv": 0.38560108840465546, + "grad_min_sv": 1.7282875616189337e-08, + "grad_condition": 314726395.9437877, + "lr": 0.0009721881851187403, + "time_sec": 49.64088153839111 + }, + { + "epoch": 17, + "train_loss": 2.916735321044922, + "train_acc": 0.27246, + "test_loss": 6.896680711364746, + "test_acc": 0.0438, + "lyapunov": null, + "grad_norm": 0.8945744514519771, + "grad_max_sv": 0.354119461029768, + "grad_min_sv": 1.643565590847551e-08, + "grad_condition": 26255983.39074681, + "lr": 0.0009686409947459456, + "time_sec": 49.627718448638916 + }, + { + "epoch": 18, + "train_loss": 2.8857511570739747, + "train_acc": 0.27974, + "test_loss": 5.6459962882995605, + "test_acc": 0.0503, + "lyapunov": null, + "grad_norm": 0.8793484279442325, + "grad_max_sv": 0.35779951736330984, + "grad_min_sv": 1.628617940785393e-08, + "grad_condition": 111551423.90357837, + "lr": 0.0009648882429441254, + "time_sec": 49.611419677734375 + }, + { + "epoch": 19, + "train_loss": 2.850851222381592, + "train_acc": 0.28394, + "test_loss": 6.184397215270996, + "test_acc": 0.0477, + "lyapunov": null, + "grad_norm": 0.8560875588234809, + "grad_max_sv": 0.3290360912680626, + "grad_min_sv": 1.5741092075638452e-08, + "grad_condition": 33852379.436212204, + "lr": 0.00096093157579425, + "time_sec": 49.60723423957825 + }, + { + "epoch": 20, + "train_loss": 2.8297593169403075, + "train_acc": 0.2865, + "test_loss": 6.550658810424805, + "test_acc": 0.052, + "lyapunov": null, + "grad_norm": 0.8484343768951315, + "grad_max_sv": 0.3310988314449787, + "grad_min_sv": 1.579570341747605e-08, + "grad_condition": 26630780.62742402, + "lr": 0.0009567727288213001, + "time_sec": 49.63738775253296 + }, + { + "epoch": 21, + "train_loss": 2.8062883308410647, + "train_acc": 0.29554, + "test_loss": 6.611366340637207, + "test_acc": 0.0425, + "lyapunov": null, + "grad_norm": 0.8271444897566678, + "grad_max_sv": 0.31499212570488455, + "grad_min_sv": 1.5104316366393312e-08, + "grad_condition": 56385885.9009584, + "lr": 0.0009524135262330095, + "time_sec": 49.624245405197144 + }, + { + "epoch": 22, + "train_loss": 2.7797841816711424, + "train_acc": 0.29848, + "test_loss": 5.2575527236938475, + "test_acc": 0.0689, + "lyapunov": null, + "grad_norm": 0.8192773127159139, + "grad_max_sv": 0.3165230479091406, + "grad_min_sv": 1.5343957029956278e-08, + "grad_condition": 28932546.565699626, + "lr": 0.0009478558801197061, + "time_sec": 49.6358916759491 + }, + { + "epoch": 23, + "train_loss": 2.758929995956421, + "train_acc": 0.30298, + "test_loss": 5.9057046417236325, + "test_acc": 0.0483, + "lyapunov": null, + "grad_norm": 0.7977853555521689, + "grad_max_sv": 0.2981082580983639, + "grad_min_sv": 1.4607530535171166e-08, + "grad_condition": 23062158.33463922, + "lr": 0.000943101789615607, + "time_sec": 49.64936828613281 + }, + { + "epoch": 24, + "train_loss": 2.7243907251739503, + "train_acc": 0.30978, + "test_loss": 6.879129153442383, + "test_acc": 0.0503, + "lyapunov": null, + "grad_norm": 0.785562618961601, + "grad_max_sv": 0.3072618875652552, + "grad_min_sv": 1.4546391063907649e-08, + "grad_condition": 26103951.701446574, + "lr": 0.0009381533400219313, + "time_sec": 49.654170513153076 + }, + { + "epoch": 25, + "train_loss": 2.7052862129211426, + "train_acc": 0.31438, + "test_loss": 7.123418940734863, + "test_acc": 0.0498, + "lyapunov": null, + "grad_norm": 0.7800832079587465, + "grad_max_sv": 0.28868941627442835, + "grad_min_sv": 1.4423146366127071e-08, + "grad_condition": 25468875.32253523, + "lr": 0.0009330127018922189, + "time_sec": 49.644099712371826 + }, + { + "epoch": 26, + "train_loss": 2.6786952052307127, + "train_acc": 0.31786, + "test_loss": 6.8779948043823245, + "test_acc": 0.04, + "lyapunov": null, + "grad_norm": 0.7660717213990589, + "grad_max_sv": 0.28445089757442477, + "grad_min_sv": 1.4051416873800404e-08, + "grad_condition": 157008558.44244316, + "lr": 0.000927682130080253, + "time_sec": 49.6546745300293 + }, + { + "epoch": 27, + "train_loss": 2.650107885437012, + "train_acc": 0.3233, + "test_loss": 6.409167988586426, + "test_acc": 0.0663, + "lyapunov": null, + "grad_norm": 0.7553219053413048, + "grad_max_sv": 0.2734900705516338, + "grad_min_sv": 1.3975185350623143e-08, + "grad_condition": 26675374.92153287, + "lr": 0.0009221639627510072, + "time_sec": 49.651949882507324 + }, + { + "epoch": 28, + "train_loss": 2.6323010539245604, + "train_acc": 0.32642, + "test_loss": 6.348737354278565, + "test_acc": 0.0767, + "lyapunov": null, + "grad_norm": 0.7542460840346141, + "grad_max_sv": 0.28178194239735604, + "grad_min_sv": 1.4111558673673974e-08, + "grad_condition": 153191030.94962814, + "lr": 0.0009164606203550494, + "time_sec": 49.657703161239624 + }, + { + "epoch": 29, + "train_loss": 2.622528738861084, + "train_acc": 0.33052, + "test_loss": 5.323012785339356, + "test_acc": 0.0615, + "lyapunov": null, + "grad_norm": 0.7434329600183185, + "grad_max_sv": 0.28229105696082113, + "grad_min_sv": 1.3741382927194567e-08, + "grad_condition": 99920561.24148658, + "lr": 0.0009105746045668516, + "time_sec": 49.640869140625 + }, + { + "epoch": 30, + "train_loss": 2.589859499359131, + "train_acc": 0.3361, + "test_loss": 5.348752153015137, + "test_acc": 0.0806, + "lyapunov": null, + "grad_norm": 0.7401188593705409, + "grad_max_sv": 0.2747684422880411, + "grad_min_sv": 1.3880728885751203e-08, + "grad_condition": 23324413.51449412, + "lr": 0.0009045084971874733, + "time_sec": 49.62320137023926 + }, + { + "epoch": 31, + "train_loss": 2.574071376495361, + "train_acc": 0.33836, + "test_loss": 4.929797785949707, + "test_acc": 0.0696, + "lyapunov": null, + "grad_norm": 0.7328550694976608, + "grad_max_sv": 0.27694769613444803, + "grad_min_sv": 1.3843863291840286e-08, + "grad_condition": 27250825.622907154, + "lr": 0.0008982649590120977, + "time_sec": 49.61762976646423 + }, + { + "epoch": 32, + "train_loss": 2.5636251927185056, + "train_acc": 0.33996, + "test_loss": 4.977822930908203, + "test_acc": 0.0603, + "lyapunov": null, + "grad_norm": 0.72578993407064, + "grad_max_sv": 0.26916658468544485, + "grad_min_sv": 1.3664173616201313e-08, + "grad_condition": 37586474.04914663, + "lr": 0.0008918467286629196, + "time_sec": 49.59874439239502 + }, + { + "epoch": 33, + "train_loss": 2.534274593658447, + "train_acc": 0.34576, + "test_loss": 5.612884985351562, + "test_acc": 0.0648, + "lyapunov": null, + "grad_norm": 0.7195677912828391, + "grad_max_sv": 0.2578020472079515, + "grad_min_sv": 1.3214893858359833e-08, + "grad_condition": 31599310.228798192, + "lr": 0.0008852566213878943, + "time_sec": 49.60587477684021 + }, + { + "epoch": 34, + "train_loss": 2.5204806367492676, + "train_acc": 0.34968, + "test_loss": 5.823319554901123, + "test_acc": 0.0571, + "lyapunov": null, + "grad_norm": 0.7058229239582122, + "grad_max_sv": 0.2517259892076254, + "grad_min_sv": 1.3128194935319027e-08, + "grad_condition": 38016748.40510639, + "lr": 0.000878497527825878, + "time_sec": 49.63596320152283 + }, + { + "epoch": 35, + "train_loss": 2.4967036684417723, + "train_acc": 0.35386, + "test_loss": 5.568839009094238, + "test_acc": 0.0655, + "lyapunov": null, + "grad_norm": 0.7071521329332581, + "grad_max_sv": 0.2598913241177797, + "grad_min_sv": 1.3420283057063997e-08, + "grad_condition": 21475756.171551444, + "lr": 0.000871572412738697, + "time_sec": 49.64343976974487 + }, + { + "epoch": 36, + "train_loss": 2.483395898208618, + "train_acc": 0.356, + "test_loss": 5.925778231811523, + "test_acc": 0.0775, + "lyapunov": null, + "grad_norm": 0.7019030587227678, + "grad_max_sv": 0.2620332419872284, + "grad_min_sv": 1.330909059973906e-08, + "grad_condition": 39143745.76315293, + "lr": 0.0008644843137107055, + "time_sec": 49.633464097976685 + }, + { + "epoch": 37, + "train_loss": 2.455888598480225, + "train_acc": 0.3619, + "test_loss": 5.800891122436523, + "test_acc": 0.0522, + "lyapunov": null, + "grad_norm": 0.7041203727881495, + "grad_max_sv": 0.25247339606285096, + "grad_min_sv": 1.317027563119133e-08, + "grad_condition": 25971636.862640023, + "lr": 0.0008572363398164014, + "time_sec": 49.641075134277344 + }, + { + "epoch": 38, + "train_loss": 2.444258794937134, + "train_acc": 0.3643, + "test_loss": 6.3827191253662106, + "test_acc": 0.0512, + "lyapunov": null, + "grad_norm": 0.6991868964165402, + "grad_max_sv": 0.2449926756322384, + "grad_min_sv": 1.2983126976284787e-08, + "grad_condition": 22727640.443126805, + "lr": 0.0008498316702566826, + "time_sec": 49.6653778553009 + }, + { + "epoch": 39, + "train_loss": 2.427623992614746, + "train_acc": 0.36718, + "test_loss": 5.836345671081543, + "test_acc": 0.0532, + "lyapunov": null, + "grad_norm": 0.6944654131754266, + "grad_max_sv": 0.24421218782663345, + "grad_min_sv": 1.2779784830385666e-08, + "grad_condition": 26159365.26096248, + "lr": 0.0008422735529643442, + "time_sec": 49.65552568435669 + }, + { + "epoch": 40, + "train_loss": 2.4149912483215332, + "train_acc": 0.36854, + "test_loss": 5.969065676879882, + "test_acc": 0.0689, + "lyapunov": null, + "grad_norm": 0.6869986110904911, + "grad_max_sv": 0.23399859815835952, + "grad_min_sv": 1.2716373970489415e-08, + "grad_condition": 21923336.447286993, + "lr": 0.0008345653031794289, + "time_sec": 49.66923117637634 + }, + { + "epoch": 41, + "train_loss": 2.386474126663208, + "train_acc": 0.37558, + "test_loss": 6.019966047668457, + "test_acc": 0.0579, + "lyapunov": null, + "grad_norm": 0.68492309888036, + "grad_max_sv": 0.2508115164935589, + "grad_min_sv": 1.3077304128472633e-08, + "grad_condition": 23198341.25841063, + "lr": 0.0008267103019950526, + "time_sec": 49.620418071746826 + }, + { + "epoch": 42, + "train_loss": 2.3729596766662597, + "train_acc": 0.38002, + "test_loss": 6.315153423309326, + "test_acc": 0.0611, + "lyapunov": null, + "grad_norm": 0.6839063548904902, + "grad_max_sv": 0.24613724276423454, + "grad_min_sv": 1.2924071682296479e-08, + "grad_condition": 24553794.967906404, + "lr": 0.0008187119948743447, + "time_sec": 49.66134309768677 + }, + { + "epoch": 43, + "train_loss": 2.3540061936950685, + "train_acc": 0.38038, + "test_loss": 6.8890972946166995, + "test_acc": 0.052, + "lyapunov": null, + "grad_norm": 0.6797404469786038, + "grad_max_sv": 0.23774098604917526, + "grad_min_sv": 1.269067942399893e-08, + "grad_condition": 36055931.35688925, + "lr": 0.000810573890139155, + "time_sec": 49.60659217834473 + }, + { + "epoch": 44, + "train_loss": 2.3270812229919433, + "train_acc": 0.38584, + "test_loss": 6.7161765426635744, + "test_acc": 0.0423, + "lyapunov": null, + "grad_norm": 0.6759173721688353, + "grad_max_sv": 0.24107158593833447, + "grad_min_sv": 1.2535652725575997e-08, + "grad_condition": 27534242.15084389, + "lr": 0.0008022995574311873, + "time_sec": 49.602726459503174 + }, + { + "epoch": 45, + "train_loss": 2.3246476860046386, + "train_acc": 0.39008, + "test_loss": 6.29091294631958, + "test_acc": 0.0518, + "lyapunov": null, + "grad_norm": 0.6715272373280456, + "grad_max_sv": 0.23545034006237983, + "grad_min_sv": 1.2545344027503624e-08, + "grad_condition": 21225788.36034053, + "lr": 0.0007938926261462363, + "time_sec": 49.6089346408844 + }, + { + "epoch": 46, + "train_loss": 2.302794339752197, + "train_acc": 0.3932, + "test_loss": 6.331070534515381, + "test_acc": 0.0457, + "lyapunov": null, + "grad_norm": 0.6695288339948315, + "grad_max_sv": 0.2387615241110325, + "grad_min_sv": 1.267214993216914e-08, + "grad_condition": 21439809.063333027, + "lr": 0.0007853567838422158, + "time_sec": 49.6616952419281 + }, + { + "epoch": 47, + "train_loss": 2.2937580155944826, + "train_acc": 0.39494, + "test_loss": 6.747457525634766, + "test_acc": 0.0403, + "lyapunov": null, + "grad_norm": 0.6703150590025013, + "grad_max_sv": 0.23008973710238934, + "grad_min_sv": 1.243687924035175e-08, + "grad_condition": 21332244.897804268, + "lr": 0.0007766957746216719, + "time_sec": 49.64005661010742 + }, + { + "epoch": 48, + "train_loss": 2.271936141662598, + "train_acc": 0.40028, + "test_loss": 8.364392227172852, + "test_acc": 0.045, + "lyapunov": null, + "grad_norm": 0.6688819126115724, + "grad_max_sv": 0.23257951848208905, + "grad_min_sv": 1.2320799760989764e-08, + "grad_condition": 43562236.54403031, + "lr": 0.0007679133974894982, + "time_sec": 49.66763877868652 + }, + { + "epoch": 49, + "train_loss": 2.2604706730651856, + "train_acc": 0.40228, + "test_loss": 6.142012088012695, + "test_acc": 0.0648, + "lyapunov": null, + "grad_norm": 0.6643101794178548, + "grad_max_sv": 0.2336978729814291, + "grad_min_sv": 1.2540253756243568e-08, + "grad_condition": 33614084.08040741, + "lr": 0.000759013504686565, + "time_sec": 49.65048050880432 + }, + { + "epoch": 50, + "train_loss": 2.238395141143799, + "train_acc": 0.40952, + "test_loss": 7.636728004455566, + "test_acc": 0.0642, + "lyapunov": null, + "grad_norm": 0.6646450225062208, + "grad_max_sv": 0.23055841773748398, + "grad_min_sv": 1.2360750140105737e-08, + "grad_condition": 29243478.728895236, + "lr": 0.0007499999999999998, + "time_sec": 49.64303922653198 + }, + { + "epoch": 51, + "train_loss": 2.22945908203125, + "train_acc": 0.40844, + "test_loss": 6.013677481079101, + "test_acc": 0.0746, + "lyapunov": null, + "grad_norm": 0.6654733307343168, + "grad_max_sv": 0.23596662729978563, + "grad_min_sv": 1.2487093845048314e-08, + "grad_condition": 24754111.81759522, + "lr": 0.0007408768370508575, + "time_sec": 49.64409947395325 + }, + { + "epoch": 52, + "train_loss": 2.2170784504699705, + "train_acc": 0.40908, + "test_loss": 6.157418632507325, + "test_acc": 0.0702, + "lyapunov": null, + "grad_norm": 0.6594175681266546, + "grad_max_sv": 0.2355981681495905, + "grad_min_sv": 1.236185071251672e-08, + "grad_condition": 25757058.499904532, + "lr": 0.0007316480175599307, + "time_sec": 49.636614084243774 + }, + { + "epoch": 53, + "train_loss": 2.1939515002059937, + "train_acc": 0.41558, + "test_loss": 6.859078231048584, + "test_acc": 0.0569, + "lyapunov": null, + "grad_norm": 0.662946169812431, + "grad_max_sv": 0.23508151918649672, + "grad_min_sv": 1.2330145124361813e-08, + "grad_condition": 32594540.125570327, + "lr": 0.0007223175895924635, + "time_sec": 49.70306444168091 + }, + { + "epoch": 54, + "train_loss": 2.1878874357604983, + "train_acc": 0.41686, + "test_loss": 6.514185330963135, + "test_acc": 0.0579, + "lyapunov": null, + "grad_norm": 0.6592013207620988, + "grad_max_sv": 0.23284565843641758, + "grad_min_sv": 1.246490098361086e-08, + "grad_condition": 21669360.08749289, + "lr": 0.0007128896457825361, + "time_sec": 49.62425947189331 + }, + { + "epoch": 55, + "train_loss": 2.1700433895111084, + "train_acc": 0.42082, + "test_loss": 7.349776064300537, + "test_acc": 0.0557, + "lyapunov": null, + "grad_norm": 0.6591415320918335, + "grad_max_sv": 0.23167332261800766, + "grad_min_sv": 1.2205207861396006e-08, + "grad_condition": 238494592.31476593, + "lr": 0.0007033683215378998, + "time_sec": 49.62825536727905 + }, + { + "epoch": 56, + "train_loss": 2.153282830657959, + "train_acc": 0.4221, + "test_loss": 6.606533212280273, + "test_acc": 0.0616, + "lyapunov": null, + "grad_norm": 0.6581126496222481, + "grad_max_sv": 0.22157299481332302, + "grad_min_sv": 1.218345958564626e-08, + "grad_condition": 21160581.40499527, + "lr": 0.0006937577932260512, + "time_sec": 49.614638328552246 + }, + { + "epoch": 57, + "train_loss": 2.1483337621307372, + "train_acc": 0.42194, + "test_loss": 8.756062689208985, + "test_acc": 0.0525, + "lyapunov": null, + "grad_norm": 0.655149621093074, + "grad_max_sv": 0.23063393794000148, + "grad_min_sv": 1.2325510248545334e-08, + "grad_condition": 32561576.294376243, + "lr": 0.0006840622763423388, + "time_sec": 49.604514598846436 + }, + { + "epoch": 58, + "train_loss": 2.13039572971344, + "train_acc": 0.428, + "test_loss": 6.102099295043946, + "test_acc": 0.077, + "lyapunov": null, + "grad_norm": 0.6579204722244499, + "grad_max_sv": 0.22870929054915906, + "grad_min_sv": 1.2437226873385221e-08, + "grad_condition": 29029893.441014826, + "lr": 0.0006742860236609073, + "time_sec": 49.63142991065979 + }, + { + "epoch": 59, + "train_loss": 2.1072697998809815, + "train_acc": 0.4333, + "test_loss": 6.253016600799561, + "test_acc": 0.0479, + "lyapunov": null, + "grad_norm": 0.6541760692934044, + "grad_max_sv": 0.22985584288835526, + "grad_min_sv": 1.2442094027981244e-08, + "grad_condition": 231036397.09788594, + "lr": 0.0006644333233692913, + "time_sec": 49.64534831047058 + }, + { + "epoch": 60, + "train_loss": 2.1020205306243898, + "train_acc": 0.43472, + "test_loss": 5.772405567932129, + "test_acc": 0.0592, + "lyapunov": null, + "grad_norm": 0.6527505369999154, + "grad_max_sv": 0.22004029378294945, + "grad_min_sv": 1.217291406285792e-08, + "grad_condition": 24874942.26037088, + "lr": 0.0006545084971874734, + "time_sec": 49.647597312927246 + }, + { + "epoch": 61, + "train_loss": 2.0730964871215822, + "train_acc": 0.4414, + "test_loss": 7.9832359893798825, + "test_acc": 0.0641, + "lyapunov": null, + "grad_norm": 0.6546297418175855, + "grad_max_sv": 0.223886064812541, + "grad_min_sv": 1.2451116643275028e-08, + "grad_condition": 22916995.636865757, + "lr": 0.0006445158984722354, + "time_sec": 49.65083956718445 + }, + { + "epoch": 62, + "train_loss": 2.062996348876953, + "train_acc": 0.4436, + "test_loss": 7.34946787109375, + "test_acc": 0.044, + "lyapunov": null, + "grad_norm": 0.6483177973397803, + "grad_max_sv": 0.22704768665134906, + "grad_min_sv": 1.20682398005445e-08, + "grad_condition": 38390561.96495845, + "lr": 0.0006344599103076324, + "time_sec": 49.65266275405884 + }, + { + "epoch": 63, + "train_loss": 2.0523825840759278, + "train_acc": 0.44564, + "test_loss": 8.959309451293946, + "test_acc": 0.0413, + "lyapunov": null, + "grad_norm": 0.6488732278425234, + "grad_max_sv": 0.22664117477834225, + "grad_min_sv": 1.2159747242446172e-08, + "grad_condition": 31006507.26126058, + "lr": 0.0006243449435824269, + "time_sec": 49.65293788909912 + }, + { + "epoch": 64, + "train_loss": 2.0479974696350096, + "train_acc": 0.44714, + "test_loss": 8.05115908203125, + "test_acc": 0.0537, + "lyapunov": null, + "grad_norm": 0.6455494446410326, + "grad_max_sv": 0.2193945564329624, + "grad_min_sv": 1.2038907266117942e-08, + "grad_condition": 901694346.4545784, + "lr": 0.0006141754350553275, + "time_sec": 49.64103627204895 + }, + { + "epoch": 65, + "train_loss": 2.027272645950317, + "train_acc": 0.45036, + "test_loss": 8.782285342407226, + "test_acc": 0.0554, + "lyapunov": null, + "grad_norm": 0.6482083158352888, + "grad_max_sv": 0.2296803079545498, + "grad_min_sv": 1.2045603877547384e-08, + "grad_condition": 44744302.33572485, + "lr": 0.0006039558454088793, + "time_sec": 49.62383842468262 + }, + { + "epoch": 66, + "train_loss": 2.012310220794678, + "train_acc": 0.4561, + "test_loss": 8.360753945922852, + "test_acc": 0.0486, + "lyapunov": null, + "grad_norm": 0.6486341651257033, + "grad_max_sv": 0.21999806091189383, + "grad_min_sv": 1.2103176813549332e-08, + "grad_condition": 25365047.453725625, + "lr": 0.000593690657292862, + "time_sec": 49.620052099227905 + }, + { + "epoch": 67, + "train_loss": 2.2251435960388184, + "train_acc": 0.43342, + "test_loss": 4.351189101409912, + "test_acc": 0.0583, + "lyapunov": null, + "grad_norm": 0.6822841692183329, + "grad_max_sv": 0.23429610803723336, + "grad_min_sv": 1.2533971320831828e-08, + "grad_condition": 620776564.7686789, + "lr": 0.0005833843733580507, + "time_sec": 49.6039252281189 + }, + { + "epoch": 68, + "train_loss": 3.644752220916748, + "train_acc": 0.14882, + "test_loss": 4.446993719482422, + "test_acc": 0.1036, + "lyapunov": null, + "grad_norm": 0.5322357731359522, + "grad_max_sv": 0.1740941284224391, + "grad_min_sv": 9.981525750379916e-09, + "grad_condition": 19772886.771588072, + "lr": 0.0005730415142812054, + "time_sec": 49.6299045085907 + }, + { + "epoch": 69, + "train_loss": 3.1906630830383302, + "train_acc": 0.22138, + "test_loss": 4.447753040695191, + "test_acc": 0.1086, + "lyapunov": null, + "grad_norm": 0.5849582495428348, + "grad_max_sv": 0.19428364057093858, + "grad_min_sv": 1.0978856412879878e-08, + "grad_condition": 20893419.13528825, + "lr": 0.0005626666167821517, + "time_sec": 49.62305164337158 + }, + { + "epoch": 70, + "train_loss": 2.9685875498962404, + "train_acc": 0.26182, + "test_loss": 5.079945266723633, + "test_acc": 0.1082, + "lyapunov": null, + "grad_norm": 0.5988082474018407, + "grad_max_sv": 0.20677474029362203, + "grad_min_sv": 1.1152884460408074e-08, + "grad_condition": 28125873.10543083, + "lr": 0.0005522642316338265, + "time_sec": 49.63573360443115 + }, + { + "epoch": 71, + "train_loss": 2.8187981507110598, + "train_acc": 0.29056, + "test_loss": 5.128676221466065, + "test_acc": 0.1097, + "lyapunov": null, + "grad_norm": 0.6073589396586558, + "grad_max_sv": 0.19603765942156315, + "grad_min_sv": 1.1142021388854673e-08, + "grad_condition": 23682104.838631887, + "lr": 0.0005418389216661573, + "time_sec": 49.65342855453491 + }, + { + "epoch": 72, + "train_loss": 2.7264524671173094, + "train_acc": 0.30584, + "test_loss": 4.905041383361817, + "test_acc": 0.1255, + "lyapunov": null, + "grad_norm": 0.6147190521685049, + "grad_max_sv": 0.20450513996183872, + "grad_min_sv": 1.1536205649087527e-08, + "grad_condition": 28562481.748963058, + "lr": 0.0005313952597646563, + "time_sec": 49.65431094169617 + }, + { + "epoch": 73, + "train_loss": 2.6403448142242434, + "train_acc": 0.32094, + "test_loss": 5.800853311538696, + "test_acc": 0.107, + "lyapunov": null, + "grad_norm": 0.6247716864218055, + "grad_max_sv": 0.21473125889897346, + "grad_min_sv": 1.1889953104027295e-08, + "grad_condition": 65722876.53475368, + "lr": 0.0005209378268645994, + "time_sec": 49.64467167854309 + }, + { + "epoch": 74, + "train_loss": 2.5647068825531005, + "train_acc": 0.33604, + "test_loss": 6.016946387481689, + "test_acc": 0.1108, + "lyapunov": null, + "grad_norm": 0.6262187013652493, + "grad_max_sv": 0.21014209054410457, + "grad_min_sv": 1.1593367979512159e-08, + "grad_condition": 23978185.39414488, + "lr": 0.0005104712099416781, + "time_sec": 49.635523080825806 + }, + { + "epoch": 75, + "train_loss": 2.5212148859405517, + "train_acc": 0.34632, + "test_loss": 6.316108853149414, + "test_acc": 0.1027, + "lyapunov": null, + "grad_norm": 0.6347754908556336, + "grad_max_sv": 0.21141788363456726, + "grad_min_sv": 1.179611141682857e-08, + "grad_condition": 33522616.12577144, + "lr": 0.0004999999999999996, + "time_sec": 49.63302993774414 + }, + { + "epoch": 76, + "train_loss": 2.470890021209717, + "train_acc": 0.35636, + "test_loss": 6.3965694896698, + "test_acc": 0.106, + "lyapunov": null, + "grad_norm": 0.6330916660078362, + "grad_max_sv": 0.21149154454469682, + "grad_min_sv": 1.186264902419687e-08, + "grad_condition": 78784632.22578731, + "lr": 0.0004895287900583212, + "time_sec": 49.637208223342896 + }, + { + "epoch": 77, + "train_loss": 2.421552244262695, + "train_acc": 0.36788, + "test_loss": 6.69319435043335, + "test_acc": 0.1017, + "lyapunov": null, + "grad_norm": 0.634293677395214, + "grad_max_sv": 0.2066604733467102, + "grad_min_sv": 1.1785100880942756e-08, + "grad_condition": 59189077.883828625, + "lr": 0.0004790621731353997, + "time_sec": 49.63215613365173 + }, + { + "epoch": 78, + "train_loss": 2.3847443492126463, + "train_acc": 0.37546, + "test_loss": 7.132302479934692, + "test_acc": 0.0943, + "lyapunov": null, + "grad_norm": 0.6382190364657672, + "grad_max_sv": 0.20905729271471502, + "grad_min_sv": 1.1757649508170598e-08, + "grad_condition": 26167748.83618117, + "lr": 0.000468604740235343, + "time_sec": 49.61492323875427 + }, + { + "epoch": 79, + "train_loss": 2.3435024488830565, + "train_acc": 0.38554, + "test_loss": 7.740195120239258, + "test_acc": 0.0916, + "lyapunov": null, + "grad_norm": 0.6365390593800095, + "grad_max_sv": 0.214980835467577, + "grad_min_sv": 1.20849943802126e-08, + "grad_condition": 26878255.479230188, + "lr": 0.00045816107833384175, + "time_sec": 49.625444412231445 + }, + { + "epoch": 80, + "train_loss": 2.3083001178741456, + "train_acc": 0.39014, + "test_loss": 6.61783053894043, + "test_acc": 0.1104, + "lyapunov": null, + "grad_norm": 0.6406625014101909, + "grad_max_sv": 0.21362034603953362, + "grad_min_sv": 1.2048267306052906e-08, + "grad_condition": 20392384.690080393, + "lr": 0.0004477357683661729, + "time_sec": 49.60279703140259 + }, + { + "epoch": 81, + "train_loss": 2.2839368876647947, + "train_acc": 0.39676, + "test_loss": 6.873206716918945, + "test_acc": 0.1118, + "lyapunov": null, + "grad_norm": 0.640888071388829, + "grad_max_sv": 0.21525344289839268, + "grad_min_sv": 1.1972712192151457e-08, + "grad_condition": 50063258.30804229, + "lr": 0.00043733338321784746, + "time_sec": 49.61454939842224 + }, + { + "epoch": 82, + "train_loss": 2.256084364776611, + "train_acc": 0.40168, + "test_loss": 8.169263735961914, + "test_acc": 0.0948, + "lyapunov": null, + "grad_norm": 0.6434003244484818, + "grad_max_sv": 0.21655187159776687, + "grad_min_sv": 1.23490741438248e-08, + "grad_condition": 21577781.507507768, + "lr": 0.0004269584857187939, + "time_sec": 49.62588882446289 + }, + { + "epoch": 83, + "train_loss": 2.2249307306671144, + "train_acc": 0.40856, + "test_loss": 7.893931579589844, + "test_acc": 0.1041, + "lyapunov": null, + "grad_norm": 0.6443153342631529, + "grad_max_sv": 0.2138610877096653, + "grad_min_sv": 1.1779399097799904e-08, + "grad_condition": 37321529.4476779, + "lr": 0.0004166156266419484, + "time_sec": 49.63660502433777 + }, + { + "epoch": 84, + "train_loss": 2.208123627166748, + "train_acc": 0.4104, + "test_loss": 7.499340794372559, + "test_acc": 0.104, + "lyapunov": null, + "grad_norm": 0.6478863121733859, + "grad_max_sv": 0.21281871050596238, + "grad_min_sv": 1.2020403913903798e-08, + "grad_condition": 28996288.04674848, + "lr": 0.0004063093427071373, + "time_sec": 49.6533477306366 + }, + { + "epoch": 85, + "train_loss": 2.187458460845947, + "train_acc": 0.41414, + "test_loss": 7.118385442352295, + "test_acc": 0.1033, + "lyapunov": null, + "grad_norm": 0.6504270947812989, + "grad_max_sv": 0.22195289880037308, + "grad_min_sv": 1.2075933084054746e-08, + "grad_condition": 35680632.041642115, + "lr": 0.0003960441545911199, + "time_sec": 49.64801740646362 + }, + { + "epoch": 86, + "train_loss": 2.16914088722229, + "train_acc": 0.41866, + "test_loss": 8.384735362243653, + "test_acc": 0.0929, + "lyapunov": null, + "grad_norm": 0.6545464063385937, + "grad_max_sv": 0.22763431407511234, + "grad_min_sv": 1.2551986523431924e-08, + "grad_condition": 55796762.73182211, + "lr": 0.0003858245649446718, + "time_sec": 49.66041612625122 + }, + { + "epoch": 87, + "train_loss": 2.1368742782592776, + "train_acc": 0.42592, + "test_loss": 6.581503366088867, + "test_acc": 0.1232, + "lyapunov": null, + "grad_norm": 0.6536380667194897, + "grad_max_sv": 0.2278426967561245, + "grad_min_sv": 1.2359256434946175e-08, + "grad_condition": 24353654.705191635, + "lr": 0.00037565505641757235, + "time_sec": 49.66181540489197 + }, + { + "epoch": 88, + "train_loss": 2.1224456649780272, + "train_acc": 0.4304, + "test_loss": 7.7792722061157225, + "test_acc": 0.1034, + "lyapunov": null, + "grad_norm": 0.6522543248368956, + "grad_max_sv": 0.21917447336018087, + "grad_min_sv": 1.2232303508996622e-08, + "grad_condition": 23923683.00683912, + "lr": 0.00036554008969236695, + "time_sec": 49.64878726005554 + }, + { + "epoch": 89, + "train_loss": 2.099866188964844, + "train_acc": 0.4329, + "test_loss": 7.891568328857422, + "test_acc": 0.0965, + "lyapunov": null, + "grad_norm": 0.6502507826061058, + "grad_max_sv": 0.2151956543326378, + "grad_min_sv": 1.197734313118648e-08, + "grad_condition": 22524026.625488658, + "lr": 0.0003554841015277638, + "time_sec": 49.636536598205566 + }, + { + "epoch": 90, + "train_loss": 2.0865442153167724, + "train_acc": 0.43664, + "test_loss": 7.531399671936035, + "test_acc": 0.106, + "lyapunov": null, + "grad_norm": 0.6569777082536814, + "grad_max_sv": 0.2229558028280735, + "grad_min_sv": 1.218858882712226e-08, + "grad_condition": 23258750.132011104, + "lr": 0.000345491502812526, + "time_sec": 49.61567449569702 + }, + { + "epoch": 91, + "train_loss": 2.06498106628418, + "train_acc": 0.44214, + "test_loss": 8.12637159576416, + "test_acc": 0.0982, + "lyapunov": null, + "grad_norm": 0.6551117087544674, + "grad_max_sv": 0.2304719265550375, + "grad_min_sv": 1.2402068626238271e-08, + "grad_condition": 26484691.211153176, + "lr": 0.0003355666766307081, + "time_sec": 49.61532545089722 + }, + { + "epoch": 92, + "train_loss": 2.05007131362915, + "train_acc": 0.44468, + "test_loss": 8.683588043212891, + "test_acc": 0.0875, + "lyapunov": null, + "grad_norm": 0.6572758654097208, + "grad_max_sv": 0.2220118623226881, + "grad_min_sv": 1.228345688220056e-08, + "grad_condition": 43719860.633667246, + "lr": 0.00032571397633909225, + "time_sec": 49.61735486984253 + }, + { + "epoch": 93, + "train_loss": 2.0329663645935057, + "train_acc": 0.44968, + "test_loss": 8.036752981567382, + "test_acc": 0.0946, + "lyapunov": null, + "grad_norm": 0.6594762151865757, + "grad_max_sv": 0.23468641191720963, + "grad_min_sv": 1.2702623283789016e-08, + "grad_condition": 22758035.70513925, + "lr": 0.00031593772365766094, + "time_sec": 49.594003438949585 + }, + { + "epoch": 94, + "train_loss": 2.015877328491211, + "train_acc": 0.45332, + "test_loss": 6.995108350372314, + "test_acc": 0.1074, + "lyapunov": null, + "grad_norm": 0.652167332688343, + "grad_max_sv": 0.21848529055714608, + "grad_min_sv": 1.2157653033612048e-08, + "grad_condition": 31954927.567971922, + "lr": 0.0003062422067739483, + "time_sec": 49.64247727394104 + }, + { + "epoch": 95, + "train_loss": 1.9991163059997559, + "train_acc": 0.45638, + "test_loss": 7.588622467803955, + "test_acc": 0.1142, + "lyapunov": null, + "grad_norm": 0.6621803475520015, + "grad_max_sv": 0.21934038177132606, + "grad_min_sv": 1.2358172536697243e-08, + "grad_condition": 24385893.04871109, + "lr": 0.00029663167846209965, + "time_sec": 49.63428497314453 + }, + { + "epoch": 96, + "train_loss": 1.9834483330917358, + "train_acc": 0.45752, + "test_loss": 7.558978903198242, + "test_acc": 0.1094, + "lyapunov": null, + "grad_norm": 0.6668846817868389, + "grad_max_sv": 0.21797076910734176, + "grad_min_sv": 1.225281484884544e-08, + "grad_condition": 22333814.982193254, + "lr": 0.00028711035421746345, + "time_sec": 49.63755655288696 + }, + { + "epoch": 97, + "train_loss": 1.969242282485962, + "train_acc": 0.46376, + "test_loss": 7.394112825012207, + "test_acc": 0.1099, + "lyapunov": null, + "grad_norm": 0.6554699630149605, + "grad_max_sv": 0.2301444172859192, + "grad_min_sv": 1.2433391152755214e-08, + "grad_condition": 24491819.03636659, + "lr": 0.00027768241040753615, + "time_sec": 49.655335903167725 + }, + { + "epoch": 98, + "train_loss": 1.9529696557617187, + "train_acc": 0.46774, + "test_loss": 7.055284997558593, + "test_acc": 0.1162, + "lyapunov": null, + "grad_norm": 0.6640537000345971, + "grad_max_sv": 0.22325844801962375, + "grad_min_sv": 1.2163324900060778e-08, + "grad_condition": 52648989.07312742, + "lr": 0.00026835198244006903, + "time_sec": 49.669140100479126 + }, + { + "epoch": 99, + "train_loss": 1.939459365234375, + "train_acc": 0.46992, + "test_loss": 7.755525547790527, + "test_acc": 0.1106, + "lyapunov": null, + "grad_norm": 0.6598990438805343, + "grad_max_sv": 0.23020310550928116, + "grad_min_sv": 1.2323512080247845e-08, + "grad_condition": 26539045.73575706, + "lr": 0.0002591231629491421, + "time_sec": 49.658100605010986 + }, + { + "epoch": 100, + "train_loss": 1.9241277764892577, + "train_acc": 0.47272, + "test_loss": 6.962932342529297, + "test_acc": 0.1245, + "lyapunov": null, + "grad_norm": 0.6566318375145326, + "grad_max_sv": 0.228052269667387, + "grad_min_sv": 1.2546390118495231e-08, + "grad_condition": 21651299.709478803, + "lr": 0.0002499999999999997, + "time_sec": 49.63715100288391 + }, + { + "epoch": 101, + "train_loss": 1.9074506490325929, + "train_acc": 0.47786, + "test_loss": 7.837496071624756, + "test_acc": 0.1147, + "lyapunov": null, + "grad_norm": 0.6602483696560503, + "grad_max_sv": 0.2316434532403946, + "grad_min_sv": 1.2379145530871938e-08, + "grad_condition": 26011010.493026, + "lr": 0.00024098649531343477, + "time_sec": 49.64603877067566 + }, + { + "epoch": 102, + "train_loss": 1.8926145942687989, + "train_acc": 0.48072, + "test_loss": 8.698235131835938, + "test_acc": 0.0935, + "lyapunov": null, + "grad_norm": 0.6633351574173826, + "grad_max_sv": 0.22496680207550526, + "grad_min_sv": 1.2393885331918319e-08, + "grad_condition": 62142872.25343563, + "lr": 0.0002320866025105016, + "time_sec": 49.613752126693726 + }, + { + "epoch": 103, + "train_loss": 1.8847379415130616, + "train_acc": 0.48146, + "test_loss": 8.400778024291991, + "test_acc": 0.1064, + "lyapunov": null, + "grad_norm": 0.6628163988108642, + "grad_max_sv": 0.2389563336968422, + "grad_min_sv": 1.2502011579674024e-08, + "grad_condition": 561960509.0407003, + "lr": 0.0002233042253783278, + "time_sec": 49.64220905303955 + }, + { + "epoch": 104, + "train_loss": 1.864337573890686, + "train_acc": 0.48388, + "test_loss": 7.582353992080688, + "test_acc": 0.1105, + "lyapunov": null, + "grad_norm": 0.6662860681196462, + "grad_max_sv": 0.2305597063153982, + "grad_min_sv": 1.2549438151154835e-08, + "grad_condition": 28749280.670694787, + "lr": 0.000214643216157784, + "time_sec": 49.59931921958923 + }, + { + "epoch": 105, + "train_loss": 1.8436736141586303, + "train_acc": 0.49176, + "test_loss": 7.296687260437012, + "test_acc": 0.1222, + "lyapunov": null, + "grad_norm": 0.6651015349952935, + "grad_max_sv": 0.22770841754972934, + "grad_min_sv": 1.2484767888520238e-08, + "grad_condition": 223685448.9202466, + "lr": 0.00020610737385376332, + "time_sec": 49.59563899040222 + }, + { + "epoch": 106, + "train_loss": 1.841442982711792, + "train_acc": 0.49332, + "test_loss": 8.086389836120606, + "test_acc": 0.1055, + "lyapunov": null, + "grad_norm": 0.6642212770974275, + "grad_max_sv": 0.23377629406750203, + "grad_min_sv": 1.239430658661611e-08, + "grad_condition": 25560457.467378292, + "lr": 0.00019770044256881242, + "time_sec": 49.633612394332886 + }, + { + "epoch": 107, + "train_loss": 1.8276642670440675, + "train_acc": 0.49872, + "test_loss": 8.12283078918457, + "test_acc": 0.1035, + "lyapunov": null, + "grad_norm": 0.6635032674607848, + "grad_max_sv": 0.22688985653221608, + "grad_min_sv": 1.237523354902237e-08, + "grad_condition": 25808230.55779849, + "lr": 0.0001894261098608447, + "time_sec": 49.63720369338989 + }, + { + "epoch": 108, + "train_loss": 1.8169137536621094, + "train_acc": 0.49852, + "test_loss": 8.409533373260498, + "test_acc": 0.0987, + "lyapunov": null, + "grad_norm": 0.6667541497565868, + "grad_max_sv": 0.22939535826444626, + "grad_min_sv": 1.2364147994672892e-08, + "grad_condition": 124450338.46619192, + "lr": 0.000181288005125655, + "time_sec": 49.650787591934204 + }, + { + "epoch": 109, + "train_loss": 1.7991494818115235, + "train_acc": 0.50362, + "test_loss": 7.646248370361328, + "test_acc": 0.1117, + "lyapunov": null, + "grad_norm": 0.6718663681176132, + "grad_max_sv": 0.22661731615662575, + "grad_min_sv": 1.2321765009010166e-08, + "grad_condition": 38880987.41150442, + "lr": 0.0001732896980049473, + "time_sec": 49.649791955947876 + }, + { + "epoch": 110, + "train_loss": 1.8055472195053102, + "train_acc": 0.5002, + "test_loss": 7.981080414581299, + "test_acc": 0.1032, + "lyapunov": null, + "grad_norm": 0.66872350270792, + "grad_max_sv": 0.22803995087742807, + "grad_min_sv": 1.2362955611371421e-08, + "grad_condition": 262033827.92100912, + "lr": 0.00016543469682057076, + "time_sec": 49.647390365600586 + }, + { + "epoch": 111, + "train_loss": 1.7805239984130858, + "train_acc": 0.50612, + "test_loss": 8.953764317321777, + "test_acc": 0.098, + "lyapunov": null, + "grad_norm": 0.673049303663611, + "grad_max_sv": 0.23256770558655263, + "grad_min_sv": 1.2522076875409738e-08, + "grad_condition": 79448628.08930221, + "lr": 0.00015772644703565552, + "time_sec": 49.64419651031494 + }, + { + "epoch": 112, + "train_loss": 1.7635594388580322, + "train_acc": 0.51178, + "test_loss": 9.006199928283692, + "test_acc": 0.0944, + "lyapunov": null, + "grad_norm": 0.6690577762179267, + "grad_max_sv": 0.231477802246809, + "grad_min_sv": 1.2611339457110904e-08, + "grad_condition": 74574181.95014855, + "lr": 0.00015016832974331713, + "time_sec": 49.6623969078064 + }, + { + "epoch": 113, + "train_loss": 1.7649991600799562, + "train_acc": 0.50992, + "test_loss": 8.706898388671876, + "test_acc": 0.0957, + "lyapunov": null, + "grad_norm": 0.6698910233260391, + "grad_max_sv": 0.24120958633720874, + "grad_min_sv": 1.2578526964457382e-08, + "grad_condition": 53483669.38925791, + "lr": 0.00014276366018359834, + "time_sec": 49.66872000694275 + }, + { + "epoch": 114, + "train_loss": 1.7550373428726196, + "train_acc": 0.51416, + "test_loss": 9.079370852661134, + "test_acc": 0.0946, + "lyapunov": null, + "grad_norm": 0.6663575459996698, + "grad_max_sv": 0.22731570713222027, + "grad_min_sv": 1.247297455250762e-08, + "grad_condition": 42511186.51551006, + "lr": 0.00013551568628929425, + "time_sec": 49.61651134490967 + }, + { + "epoch": 115, + "train_loss": 1.7389271509552002, + "train_acc": 0.51604, + "test_loss": 8.636061263275147, + "test_acc": 0.1024, + "lyapunov": null, + "grad_norm": 0.6736568214282298, + "grad_max_sv": 0.23145201802253723, + "grad_min_sv": 1.2523735046232608e-08, + "grad_condition": 34281489.67578278, + "lr": 0.00012842758726130276, + "time_sec": 49.587687492370605 + }, + { + "epoch": 116, + "train_loss": 1.73655320854187, + "train_acc": 0.51642, + "test_loss": 9.354261597442626, + "test_acc": 0.0971, + "lyapunov": null, + "grad_norm": 0.6692761494554511, + "grad_max_sv": 0.23360017724335194, + "grad_min_sv": 1.2428947707143757e-08, + "grad_condition": 42706933.20787396, + "lr": 0.0001215024721741218, + "time_sec": 49.61284112930298 + }, + { + "epoch": 117, + "train_loss": 1.722219416847229, + "train_acc": 0.52034, + "test_loss": 9.05172070465088, + "test_acc": 0.0864, + "lyapunov": null, + "grad_norm": 0.6709665811373348, + "grad_max_sv": 0.23329499438405038, + "grad_min_sv": 1.2499731633086597e-08, + "grad_condition": 23426718.363504913, + "lr": 0.00011474337861210538, + "time_sec": 49.612444162368774 + }, + { + "epoch": 118, + "train_loss": 1.720088274269104, + "train_acc": 0.5212, + "test_loss": 8.445899168395997, + "test_acc": 0.1071, + "lyapunov": null, + "grad_norm": 0.6772013084899083, + "grad_max_sv": 0.23568132370710373, + "grad_min_sv": 1.26266935157604e-08, + "grad_condition": 30951096.93160528, + "lr": 0.00010815327133708009, + "time_sec": 49.616597414016724 + }, + { + "epoch": 119, + "train_loss": 1.7100347495269776, + "train_acc": 0.52412, + "test_loss": 7.941069074249268, + "test_acc": 0.116, + "lyapunov": null, + "grad_norm": 0.6653971862031371, + "grad_max_sv": 0.23134685456752777, + "grad_min_sv": 1.2402505802922015e-08, + "grad_condition": 22810188.64319814, + "lr": 0.00010173504098790182, + "time_sec": 49.63788056373596 + }, + { + "epoch": 120, + "train_loss": 1.700667360534668, + "train_acc": 0.52674, + "test_loss": 9.192179844665528, + "test_acc": 0.0952, + "lyapunov": null, + "grad_norm": 0.67019495782139, + "grad_max_sv": 0.23498024754226207, + "grad_min_sv": 1.2522474526766025e-08, + "grad_condition": 25575812.55122325, + "lr": 9.549150281252629e-05, + "time_sec": 49.633721113204956 + }, + { + "epoch": 121, + "train_loss": 1.6934022713470458, + "train_acc": 0.52622, + "test_loss": 8.246514013671876, + "test_acc": 0.1052, + "lyapunov": null, + "grad_norm": 0.67264731502187, + "grad_max_sv": 0.23390924520790576, + "grad_min_sv": 1.2629734989083596e-08, + "grad_condition": 75127709.41882512, + "lr": 8.942539543314794e-05, + "time_sec": 49.658979177474976 + }, + { + "epoch": 122, + "train_loss": 1.6853880523681641, + "train_acc": 0.52858, + "test_loss": 8.835922454071046, + "test_acc": 0.1015, + "lyapunov": null, + "grad_norm": 0.6681915576498015, + "grad_max_sv": 0.22805486135184766, + "grad_min_sv": 1.2523601156111397e-08, + "grad_condition": 22825184.37456271, + "lr": 8.353937964495024e-05, + "time_sec": 49.645174980163574 + }, + { + "epoch": 123, + "train_loss": 1.6754656018447875, + "train_acc": 0.52996, + "test_loss": 8.766720679473877, + "test_acc": 0.0969, + "lyapunov": null, + "grad_norm": 0.6635381868278838, + "grad_max_sv": 0.23943961299955846, + "grad_min_sv": 1.2716584071870152e-08, + "grad_condition": 25094494.26316102, + "lr": 7.783603724899243e-05, + "time_sec": 49.64848589897156 + }, + { + "epoch": 124, + "train_loss": 1.6794914197158815, + "train_acc": 0.53018, + "test_loss": 8.580409744262695, + "test_acc": 0.1045, + "lyapunov": null, + "grad_norm": 0.671245577708117, + "grad_max_sv": 0.23060270808637143, + "grad_min_sv": 1.234503174199486e-08, + "grad_condition": 63345986.58758273, + "lr": 7.231786991974666e-05, + "time_sec": 49.87266302108765 + }, + { + "epoch": 125, + "train_loss": 1.6680570980834961, + "train_acc": 0.53182, + "test_loss": 8.834838022613525, + "test_acc": 0.1023, + "lyapunov": null, + "grad_norm": 0.6759384740097162, + "grad_max_sv": 0.23802748061716555, + "grad_min_sv": 1.276443843678532e-08, + "grad_condition": 24804650.245445848, + "lr": 6.698729810778072e-05, + "time_sec": 49.65100860595703 + }, + { + "epoch": 126, + "train_loss": 1.6599959258651733, + "train_acc": 0.53514, + "test_loss": 8.445849030303956, + "test_acc": 0.0993, + "lyapunov": null, + "grad_norm": 0.6683123713335807, + "grad_max_sv": 0.23196808211505413, + "grad_min_sv": 1.239824619359009e-08, + "grad_condition": 24122291.210029412, + "lr": 6.184665997806817e-05, + "time_sec": 49.60801029205322 + }, + { + "epoch": 127, + "train_loss": 1.6581390426254272, + "train_acc": 0.53286, + "test_loss": 8.180217957305908, + "test_acc": 0.1144, + "lyapunov": null, + "grad_norm": 0.671697720762431, + "grad_max_sv": 0.23852520175278186, + "grad_min_sv": 1.290384490787444e-08, + "grad_condition": 30505273.567765664, + "lr": 5.6898210384392595e-05, + "time_sec": 49.62530255317688 + }, + { + "epoch": 128, + "train_loss": 1.6536951416015624, + "train_acc": 0.53944, + "test_loss": 9.100402154541015, + "test_acc": 0.0967, + "lyapunov": null, + "grad_norm": 0.667185365414166, + "grad_max_sv": 0.2322216048836708, + "grad_min_sv": 1.2572321161918864e-08, + "grad_condition": 23830602.615603756, + "lr": 5.214411988029363e-05, + "time_sec": 49.59242367744446 + }, + { + "epoch": 129, + "train_loss": 1.6502027558135985, + "train_acc": 0.53564, + "test_loss": 8.243769989013671, + "test_acc": 0.1101, + "lyapunov": null, + "grad_norm": 0.6719880999378245, + "grad_max_sv": 0.23203521333634852, + "grad_min_sv": 1.2620684003428195e-08, + "grad_condition": 74978797.83799863, + "lr": 4.7586473766990294e-05, + "time_sec": 49.60294818878174 + }, + { + "epoch": 130, + "train_loss": 1.6536482720565795, + "train_acc": 0.53586, + "test_loss": 8.237010109710694, + "test_acc": 0.1067, + "lyapunov": null, + "grad_norm": 0.6804852067291551, + "grad_max_sv": 0.2377860952168703, + "grad_min_sv": 1.2762065921406718e-08, + "grad_condition": 39212371.63315557, + "lr": 4.32272711786996e-05, + "time_sec": 49.597888708114624 + }, + { + "epoch": 131, + "train_loss": 1.639038058242798, + "train_acc": 0.54146, + "test_loss": 8.44538454055786, + "test_acc": 0.1063, + "lyapunov": null, + "grad_norm": 0.6724835885199256, + "grad_max_sv": 0.2353504840284586, + "grad_min_sv": 1.2740010607581453e-08, + "grad_condition": 26983674.320896793, + "lr": 3.906842420574966e-05, + "time_sec": 49.665122509002686 + }, + { + "epoch": 132, + "train_loss": 1.6450230081176758, + "train_acc": 0.53788, + "test_loss": 8.850830727386475, + "test_acc": 0.1028, + "lyapunov": null, + "grad_norm": 0.6728968812754041, + "grad_max_sv": 0.2380696687847376, + "grad_min_sv": 1.2689633881700357e-08, + "grad_condition": 85473852.69328196, + "lr": 3.5111757055874305e-05, + "time_sec": 49.62814116477966 + }, + { + "epoch": 133, + "train_loss": 1.6397483406066895, + "train_acc": 0.53942, + "test_loss": 8.841438789367675, + "test_acc": 0.0951, + "lyapunov": null, + "grad_norm": 0.6743180544065257, + "grad_max_sv": 0.23258159644901752, + "grad_min_sv": 1.2391172625816904e-08, + "grad_condition": 50130338.96886261, + "lr": 3.1359005254054254e-05, + "time_sec": 49.650676250457764 + }, + { + "epoch": 134, + "train_loss": 1.6300106893539428, + "train_acc": 0.54306, + "test_loss": 8.161712069702148, + "test_acc": 0.0977, + "lyapunov": null, + "grad_norm": 0.6697898119311428, + "grad_max_sv": 0.23791733495891093, + "grad_min_sv": 1.2599619581693533e-08, + "grad_condition": 33905362.44570724, + "lr": 2.7811814881259484e-05, + "time_sec": 49.678349018096924 + }, + { + "epoch": 135, + "train_loss": 1.6280161280059815, + "train_acc": 0.54206, + "test_loss": 8.8084473777771, + "test_acc": 0.099, + "lyapunov": null, + "grad_norm": 0.6685419282298722, + "grad_max_sv": 0.2294952504336834, + "grad_min_sv": 1.2453856032546007e-08, + "grad_condition": 28183066.52638216, + "lr": 2.4471741852423218e-05, + "time_sec": 49.63830757141113 + }, + { + "epoch": 136, + "train_loss": 1.6250385632324218, + "train_acc": 0.5424, + "test_loss": 9.245115556335449, + "test_acc": 0.0982, + "lyapunov": null, + "grad_norm": 0.673719312762165, + "grad_max_sv": 0.2436251524835825, + "grad_min_sv": 1.2834923374116514e-08, + "grad_condition": 22720217.479475908, + "lr": 2.1340251233966362e-05, + "time_sec": 49.68732476234436 + }, + { + "epoch": 137, + "train_loss": 1.6283387484741212, + "train_acc": 0.5456, + "test_loss": 8.400495840454102, + "test_acc": 0.1051, + "lyapunov": null, + "grad_norm": 0.6729648252425294, + "grad_max_sv": 0.228320786729455, + "grad_min_sv": 1.2201329287198082e-08, + "grad_condition": 29654367.28966447, + "lr": 1.8418716601170932e-05, + "time_sec": 49.65324902534485 + }, + { + "epoch": 138, + "train_loss": 1.6186187603378297, + "train_acc": 0.54454, + "test_loss": 8.544135133361817, + "test_acc": 0.1026, + "lyapunov": null, + "grad_norm": 0.6767335790557945, + "grad_max_sv": 0.24417912773787975, + "grad_min_sv": 1.2745562341653915e-08, + "grad_condition": 22462589.905390937, + "lr": 1.570841943568445e-05, + "time_sec": 49.62770223617554 + }, + { + "epoch": 139, + "train_loss": 1.614481148033142, + "train_acc": 0.54796, + "test_loss": 8.814221725463867, + "test_acc": 0.0977, + "lyapunov": null, + "grad_norm": 0.6703542181357327, + "grad_max_sv": 0.2325075563043356, + "grad_min_sv": 1.2578777475180657e-08, + "grad_condition": 21363698.231181078, + "lr": 1.3210548563419845e-05, + "time_sec": 49.592610120773315 + }, + { + "epoch": 140, + "train_loss": 1.6180111114883422, + "train_acc": 0.54492, + "test_loss": 8.483137963104248, + "test_acc": 0.1107, + "lyapunov": null, + "grad_norm": 0.6809540897117702, + "grad_max_sv": 0.2395390760153532, + "grad_min_sv": 1.2634957796686664e-08, + "grad_condition": 54098275.066982284, + "lr": 1.0926199633097203e-05, + "time_sec": 49.62364315986633 + }, + { + "epoch": 141, + "train_loss": 1.613265188369751, + "train_acc": 0.548, + "test_loss": 9.025719612884522, + "test_acc": 0.0959, + "lyapunov": null, + "grad_norm": 0.6738933430180942, + "grad_max_sv": 0.2385118592530489, + "grad_min_sv": 1.2675423211039316e-08, + "grad_condition": 24268524.45347375, + "lr": 8.856374635655688e-06, + "time_sec": 49.6093544960022 + }, + { + "epoch": 142, + "train_loss": 1.6109765142822265, + "train_acc": 0.54672, + "test_loss": 8.501644051361083, + "test_acc": 0.1071, + "lyapunov": null, + "grad_norm": 0.6688401906779454, + "grad_max_sv": 0.2420313537120819, + "grad_min_sv": 1.2541520851006016e-08, + "grad_condition": 34051323.70080558, + "lr": 7.001981464747503e-06, + "time_sec": 49.626237869262695 + }, + { + "epoch": 143, + "train_loss": 1.6083808990859985, + "train_acc": 0.5495, + "test_loss": 8.410878736114501, + "test_acc": 0.1029, + "lyapunov": null, + "grad_norm": 0.6694620190305317, + "grad_max_sv": 0.2360597461462021, + "grad_min_sv": 1.2411240957882486e-08, + "grad_condition": 256359120.1912489, + "lr": 5.3638335185058295e-06, + "time_sec": 49.64081525802612 + }, + { + "epoch": 144, + "train_loss": 1.6100667620468139, + "train_acc": 0.54798, + "test_loss": 8.832001342010498, + "test_acc": 0.1019, + "lyapunov": null, + "grad_norm": 0.6707738006928022, + "grad_max_sv": 0.23732503540813923, + "grad_min_sv": 1.258596476483298e-08, + "grad_condition": 24176116.650407396, + "lr": 3.942649342761114e-06, + "time_sec": 49.650325536727905 + }, + { + "epoch": 145, + "train_loss": 1.6037773385238647, + "train_acc": 0.54702, + "test_loss": 8.7359261428833, + "test_acc": 0.0989, + "lyapunov": null, + "grad_norm": 0.6690176163372957, + "grad_max_sv": 0.23970598317682743, + "grad_min_sv": 1.2538464763678369e-08, + "grad_condition": 33292646.116570044, + "lr": 2.7390523158633524e-06, + "time_sec": 49.64434027671814 + }, + { + "epoch": 146, + "train_loss": 1.6090083113098144, + "train_acc": 0.54738, + "test_loss": 8.776909831237793, + "test_acc": 0.1015, + "lyapunov": null, + "grad_norm": 0.6706150402911953, + "grad_max_sv": 0.2313551239669323, + "grad_min_sv": 1.2493580149597339e-08, + "grad_condition": 36814707.572352916, + "lr": 1.7535703752478133e-06, + "time_sec": 49.653162479400635 + }, + { + "epoch": 147, + "train_loss": 1.6126505808258056, + "train_acc": 0.54692, + "test_loss": 9.092076904296874, + "test_acc": 0.0975, + "lyapunov": null, + "grad_norm": 0.6703962324024396, + "grad_max_sv": 0.233590966463089, + "grad_min_sv": 1.2700339725724153e-08, + "grad_condition": 46904603.438913696, + "lr": 9.866357858642196e-07, + "time_sec": 49.64583897590637 + }, + { + "epoch": 148, + "train_loss": 1.6134785464096069, + "train_acc": 0.54594, + "test_loss": 8.983751535797118, + "test_acc": 0.0995, + "lyapunov": null, + "grad_norm": 0.674578489012928, + "grad_max_sv": 0.23970573469996453, + "grad_min_sv": 1.272608372571149e-08, + "grad_condition": 21842271.84696827, + "lr": 4.38584950570808e-07, + "time_sec": 49.64808487892151 + }, + { + "epoch": 149, + "train_loss": 1.6119013549423218, + "train_acc": 0.54862, + "test_loss": 8.56843572845459, + "test_acc": 0.1054, + "lyapunov": null, + "grad_norm": 0.6747520334683573, + "grad_max_sv": 0.2384514592587948, + "grad_min_sv": 1.2600235418935846e-08, + "grad_condition": 25340562.620727975, + "lr": 1.096582625772501e-07, + "time_sec": 49.64168334007263 + }, + { + "epoch": 150, + "train_loss": 1.6072704146957397, + "train_acc": 0.54742, + "test_loss": 8.887614213562012, + "test_acc": 0.1015, + "lyapunov": null, + "grad_norm": 0.6742776904392008, + "grad_max_sv": 0.24012672565877438, + "grad_min_sv": 1.2860058681840591e-08, + "grad_condition": 24539045.015578836, + "lr": 0.0, + "time_sec": 49.61355018615723 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 5.088581143493652, + "train_acc": 0.01332, + "test_loss": 4.951591259765625, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 5.595797699274781, + "grad_max_sv": 5.059777915477753, + "grad_min_sv": 8.380082079928463e-08, + "grad_condition": 144739678.32890567, + "lr": 0.0009998903417374227, + "time_sec": 66.76207876205444 + }, + { + "epoch": 2, + "train_loss": 4.727508141174316, + "train_acc": 0.0242, + "test_loss": 4.891763400268554, + "test_acc": 0.0104, + "lyapunov": null, + "grad_norm": 4.11050155163041, + "grad_max_sv": 3.698546850681305, + "grad_min_sv": 6.387429426490954e-08, + "grad_condition": 67471298.37535235, + "lr": 0.0009995614150494292, + "time_sec": 66.79832410812378 + }, + { + "epoch": 3, + "train_loss": 4.516627143707275, + "train_acc": 0.03364, + "test_loss": 5.023839845275879, + "test_acc": 0.0096, + "lyapunov": null, + "grad_norm": 3.230804659530269, + "grad_max_sv": 2.737754541635513, + "grad_min_sv": 4.854583614544161e-08, + "grad_condition": 87922174.2345469, + "lr": 0.0009990133642141358, + "time_sec": 66.76044511795044 + }, + { + "epoch": 4, + "train_loss": 4.37137044631958, + "train_acc": 0.04084, + "test_loss": 5.107725936889649, + "test_acc": 0.0103, + "lyapunov": null, + "grad_norm": 2.5815981982320455, + "grad_max_sv": 2.1624936670064927, + "grad_min_sv": 3.8690102244220983e-08, + "grad_condition": 66775302.44012289, + "lr": 0.0009982464296247522, + "time_sec": 66.69986486434937 + }, + { + "epoch": 5, + "train_loss": 4.2787111569213865, + "train_acc": 0.0499, + "test_loss": 5.093746864318848, + "test_acc": 0.0119, + "lyapunov": null, + "grad_norm": 2.0501754928637608, + "grad_max_sv": 1.6735655426979066, + "grad_min_sv": 3.02018420605954e-08, + "grad_condition": 83847616.58229446, + "lr": 0.0009972609476841367, + "time_sec": 66.70642113685608 + }, + { + "epoch": 6, + "train_loss": 4.173126724395752, + "train_acc": 0.06114, + "test_loss": 5.650288801574707, + "test_acc": 0.0115, + "lyapunov": null, + "grad_norm": 1.4461755519297805, + "grad_max_sv": 1.029741930961609, + "grad_min_sv": 2.1617413775709693e-08, + "grad_condition": 53690503.75103078, + "lr": 0.000996057350657239, + "time_sec": 66.68753027915955 + }, + { + "epoch": 7, + "train_loss": 4.093725746765137, + "train_acc": 0.07048, + "test_loss": 5.236350575256347, + "test_acc": 0.0131, + "lyapunov": null, + "grad_norm": 1.104296817764675, + "grad_max_sv": 0.6810471951961518, + "grad_min_sv": 1.7525281126307134e-08, + "grad_condition": 46908594.94631828, + "lr": 0.000994636166481494, + "time_sec": 66.73089575767517 + }, + { + "epoch": 8, + "train_loss": 4.031361261062622, + "train_acc": 0.08184, + "test_loss": 5.266020038604736, + "test_acc": 0.011, + "lyapunov": null, + "grad_norm": 0.9907154687339563, + "grad_max_sv": 0.5727237299084663, + "grad_min_sv": 1.568161453573136e-08, + "grad_condition": 205087186.79278168, + "lr": 0.0009929980185352525, + "time_sec": 66.74000144004822 + }, + { + "epoch": 9, + "train_loss": 3.9836690045166017, + "train_acc": 0.08876, + "test_loss": 5.373385707092285, + "test_acc": 0.0145, + "lyapunov": null, + "grad_norm": 0.9286442561107239, + "grad_max_sv": 0.49140588417649267, + "grad_min_sv": 1.4355377359054344e-08, + "grad_condition": 49567929.749295376, + "lr": 0.0009911436253643444, + "time_sec": 66.75752806663513 + }, + { + "epoch": 10, + "train_loss": 3.9524392292785646, + "train_acc": 0.09442, + "test_loss": 5.648289218139649, + "test_acc": 0.011, + "lyapunov": null, + "grad_norm": 0.8635186549937055, + "grad_max_sv": 0.44110502675175667, + "grad_min_sv": 1.380239241649539e-08, + "grad_condition": 160205558.71937332, + "lr": 0.0009890738003669028, + "time_sec": 66.74852681159973 + }, + { + "epoch": 11, + "train_loss": 3.9057430783081055, + "train_acc": 0.09904, + "test_loss": 5.593870043945312, + "test_acc": 0.0153, + "lyapunov": null, + "grad_norm": 0.8313455134497171, + "grad_max_sv": 0.4245350927114487, + "grad_min_sv": 1.3408236181761123e-08, + "grad_condition": 70475775.54279244, + "lr": 0.00098678945143658, + "time_sec": 66.72569394111633 + }, + { + "epoch": 12, + "train_loss": 3.879755588531494, + "train_acc": 0.1059, + "test_loss": 5.91184571685791, + "test_acc": 0.0122, + "lyapunov": null, + "grad_norm": 0.8098343665002108, + "grad_max_sv": 0.3995117902755737, + "grad_min_sv": 1.3223197731335352e-08, + "grad_condition": 2262455188.632939, + "lr": 0.0009842915805643154, + "time_sec": 66.74134874343872 + }, + { + "epoch": 13, + "train_loss": 3.8387034120178223, + "train_acc": 0.11128, + "test_loss": 5.55406644744873, + "test_acc": 0.0159, + "lyapunov": null, + "grad_norm": 0.7779364983364899, + "grad_max_sv": 0.36580874100327493, + "grad_min_sv": 1.2747200656137991e-08, + "grad_condition": 31403290.857171714, + "lr": 0.000981581283398829, + "time_sec": 66.71355533599854 + }, + { + "epoch": 14, + "train_loss": 3.8182811224365234, + "train_acc": 0.11366, + "test_loss": 5.846968073272705, + "test_acc": 0.0132, + "lyapunov": null, + "grad_norm": 0.7545251260271086, + "grad_max_sv": 0.34809157326817514, + "grad_min_sv": 1.2320788722597342e-08, + "grad_condition": 32144212.47563106, + "lr": 0.0009786597487660333, + "time_sec": 66.72689533233643 + }, + { + "epoch": 15, + "train_loss": 3.7967992616271973, + "train_acc": 0.11852, + "test_loss": 5.68047932510376, + "test_acc": 0.0155, + "lyapunov": null, + "grad_norm": 0.731162073111203, + "grad_max_sv": 0.3421657994389534, + "grad_min_sv": 1.1936111505433944e-08, + "grad_condition": 244312799.4199868, + "lr": 0.0009755282581475766, + "time_sec": 66.7026903629303 + }, + { + "epoch": 16, + "train_loss": 3.7741379774475097, + "train_acc": 0.12086, + "test_loss": 5.484867942047119, + "test_acc": 0.0182, + "lyapunov": null, + "grad_norm": 0.7090304412758509, + "grad_max_sv": 0.3223520040512085, + "grad_min_sv": 1.1672073835233832e-08, + "grad_condition": 31524319.78711735, + "lr": 0.0009721881851187403, + "time_sec": 66.739328622818 + }, + { + "epoch": 17, + "train_loss": 3.753197032470703, + "train_acc": 0.1256, + "test_loss": 6.568574522399902, + "test_acc": 0.0151, + "lyapunov": null, + "grad_norm": 0.6935882502734273, + "grad_max_sv": 0.3146128565073013, + "grad_min_sv": 1.1361096601426174e-08, + "grad_condition": 210125774.08050695, + "lr": 0.0009686409947459456, + "time_sec": 66.74520659446716 + }, + { + "epoch": 18, + "train_loss": 3.725816408157349, + "train_acc": 0.1287, + "test_loss": 6.34478737487793, + "test_acc": 0.0159, + "lyapunov": null, + "grad_norm": 0.6758795184950354, + "grad_max_sv": 0.30437840037047864, + "grad_min_sv": 1.1510641159673262e-08, + "grad_condition": 31558341.74036485, + "lr": 0.0009648882429441254, + "time_sec": 66.78180265426636 + }, + { + "epoch": 19, + "train_loss": 3.714654729003906, + "train_acc": 0.13168, + "test_loss": 6.368891102600098, + "test_acc": 0.016, + "lyapunov": null, + "grad_norm": 0.6618910868321934, + "grad_max_sv": 0.2960255391895771, + "grad_min_sv": 1.1117618592404455e-08, + "grad_condition": 30205848.660664685, + "lr": 0.00096093157579425, + "time_sec": 66.74912786483765 + }, + { + "epoch": 20, + "train_loss": 3.6946691497802733, + "train_acc": 0.13396, + "test_loss": 6.4278502319335935, + "test_acc": 0.0196, + "lyapunov": null, + "grad_norm": 0.6443454538226331, + "grad_max_sv": 0.28263592235744, + "grad_min_sv": 1.0974601266297567e-08, + "grad_condition": 85210724.40585044, + "lr": 0.0009567727288213001, + "time_sec": 66.75979924201965 + }, + { + "epoch": 21, + "train_loss": 3.678538037261963, + "train_acc": 0.1389, + "test_loss": 5.944661869812012, + "test_acc": 0.0147, + "lyapunov": null, + "grad_norm": 0.6338793846375858, + "grad_max_sv": 0.2817647561430931, + "grad_min_sv": 1.0979779263564637e-08, + "grad_condition": 31384399.636330932, + "lr": 0.0009524135262330095, + "time_sec": 66.75862097740173 + }, + { + "epoch": 22, + "train_loss": 3.6583445849609375, + "train_acc": 0.1389, + "test_loss": 6.617507224273681, + "test_acc": 0.0186, + "lyapunov": null, + "grad_norm": 0.6270968339485256, + "grad_max_sv": 0.2682405423372984, + "grad_min_sv": 1.0661627264374474e-08, + "grad_condition": 28199289.108431924, + "lr": 0.0009478558801197061, + "time_sec": 66.70150375366211 + }, + { + "epoch": 23, + "train_loss": 3.646308810348511, + "train_acc": 0.14268, + "test_loss": 6.335385469818116, + "test_acc": 0.0149, + "lyapunov": null, + "grad_norm": 0.6088892694217577, + "grad_max_sv": 0.25535150058567524, + "grad_min_sv": 1.0300061187296095e-08, + "grad_condition": 34795287.59915707, + "lr": 0.000943101789615607, + "time_sec": 66.70925712585449 + }, + { + "epoch": 24, + "train_loss": 3.6351177741241454, + "train_acc": 0.1426, + "test_loss": 6.3158514701843265, + "test_acc": 0.0177, + "lyapunov": null, + "grad_norm": 0.5964648659799031, + "grad_max_sv": 0.24951178021728992, + "grad_min_sv": 1.0093550447537458e-08, + "grad_condition": 51838350.11107895, + "lr": 0.0009381533400219313, + "time_sec": 66.70350575447083 + }, + { + "epoch": 25, + "train_loss": 3.6183255680847166, + "train_acc": 0.14644, + "test_loss": 6.721168376159668, + "test_acc": 0.0181, + "lyapunov": null, + "grad_norm": 0.5933387221507487, + "grad_max_sv": 0.25210563503205774, + "grad_min_sv": 1.0153997685290878e-08, + "grad_condition": 247394984.04080305, + "lr": 0.0009330127018922189, + "time_sec": 66.75347089767456 + }, + { + "epoch": 26, + "train_loss": 3.6071299158477785, + "train_acc": 0.14866, + "test_loss": 6.642034001922608, + "test_acc": 0.0181, + "lyapunov": null, + "grad_norm": 0.5954282647789416, + "grad_max_sv": 0.2547519262880087, + "grad_min_sv": 1.0135606323680157e-08, + "grad_condition": 28483815.51624248, + "lr": 0.000927682130080253, + "time_sec": 66.75868964195251 + }, + { + "epoch": 27, + "train_loss": 3.5931669886779787, + "train_acc": 0.1502, + "test_loss": 6.223846574401856, + "test_acc": 0.0213, + "lyapunov": null, + "grad_norm": 0.5877941221593797, + "grad_max_sv": 0.24717812985181808, + "grad_min_sv": 9.855245958201308e-09, + "grad_condition": 28193359.09622656, + "lr": 0.0009221639627510072, + "time_sec": 66.77666926383972 + }, + { + "epoch": 28, + "train_loss": 3.5780224719238283, + "train_acc": 0.15286, + "test_loss": 6.90847115020752, + "test_acc": 0.0196, + "lyapunov": null, + "grad_norm": 0.5733930952654505, + "grad_max_sv": 0.2419151894748211, + "grad_min_sv": 9.843924880792442e-09, + "grad_condition": 28364870.16247251, + "lr": 0.0009164606203550494, + "time_sec": 66.74913716316223 + }, + { + "epoch": 29, + "train_loss": 3.573341248779297, + "train_acc": 0.15312, + "test_loss": 6.439982345581055, + "test_acc": 0.021, + "lyapunov": null, + "grad_norm": 0.5679699095868811, + "grad_max_sv": 0.2286886375397444, + "grad_min_sv": 9.63519248414757e-09, + "grad_condition": 29833754.648618333, + "lr": 0.0009105746045668516, + "time_sec": 66.7665946483612 + }, + { + "epoch": 30, + "train_loss": 3.5598143620300293, + "train_acc": 0.1562, + "test_loss": 6.429332733154297, + "test_acc": 0.022, + "lyapunov": null, + "grad_norm": 0.5589691788337113, + "grad_max_sv": 0.227083408087492, + "grad_min_sv": 9.709436735172439e-09, + "grad_condition": 27930931.211393736, + "lr": 0.0009045084971874733, + "time_sec": 66.75674724578857 + }, + { + "epoch": 31, + "train_loss": 3.5470434929656984, + "train_acc": 0.16, + "test_loss": 6.6052438804626465, + "test_acc": 0.0237, + "lyapunov": null, + "grad_norm": 0.5612591002612681, + "grad_max_sv": 0.22930745929479598, + "grad_min_sv": 9.687322477525128e-09, + "grad_condition": 27425333.623921502, + "lr": 0.0008982649590120977, + "time_sec": 66.71509528160095 + }, + { + "epoch": 32, + "train_loss": 3.537414684448242, + "train_acc": 0.16062, + "test_loss": 6.011712426757812, + "test_acc": 0.0244, + "lyapunov": null, + "grad_norm": 0.5564909883403706, + "grad_max_sv": 0.22170890271663665, + "grad_min_sv": 9.485011626120255e-09, + "grad_condition": 25722607.460985243, + "lr": 0.0008918467286629196, + "time_sec": 66.73007607460022 + }, + { + "epoch": 33, + "train_loss": 3.5317853105163572, + "train_acc": 0.1603, + "test_loss": 6.360434799194336, + "test_acc": 0.0189, + "lyapunov": null, + "grad_norm": 0.550433878030662, + "grad_max_sv": 0.2289751097559929, + "grad_min_sv": 9.54062134832928e-09, + "grad_condition": 381531522.893629, + "lr": 0.0008852566213878943, + "time_sec": 66.71780228614807 + }, + { + "epoch": 34, + "train_loss": 3.5253816675567626, + "train_acc": 0.16216, + "test_loss": 6.247197938537598, + "test_acc": 0.0221, + "lyapunov": null, + "grad_norm": 0.5426800931973276, + "grad_max_sv": 0.21441863812506198, + "grad_min_sv": 9.316700774752996e-09, + "grad_condition": 26950152.667612456, + "lr": 0.000878497527825878, + "time_sec": 66.72579026222229 + }, + { + "epoch": 35, + "train_loss": 3.502744727020264, + "train_acc": 0.16578, + "test_loss": 6.571361762237549, + "test_acc": 0.0212, + "lyapunov": null, + "grad_norm": 0.5398257014810475, + "grad_max_sv": 0.20931940749287606, + "grad_min_sv": 9.403711298539009e-09, + "grad_condition": 25780458.398535747, + "lr": 0.000871572412738697, + "time_sec": 66.74532318115234 + }, + { + "epoch": 36, + "train_loss": 3.5064585032653808, + "train_acc": 0.1655, + "test_loss": 6.218161656951905, + "test_acc": 0.0264, + "lyapunov": null, + "grad_norm": 0.5305975593103218, + "grad_max_sv": 0.20301839672029018, + "grad_min_sv": 9.261498659651757e-09, + "grad_condition": 24222820.24324985, + "lr": 0.0008644843137107055, + "time_sec": 66.7688057422638 + }, + { + "epoch": 37, + "train_loss": 3.4891217603302, + "train_acc": 0.16706, + "test_loss": 6.142190956115723, + "test_acc": 0.0211, + "lyapunov": null, + "grad_norm": 0.5317318651110877, + "grad_max_sv": 0.20387103594839573, + "grad_min_sv": 9.19414472749791e-09, + "grad_condition": 41748735.80026223, + "lr": 0.0008572363398164014, + "time_sec": 66.75609850883484 + }, + { + "epoch": 38, + "train_loss": 3.4776386444854737, + "train_acc": 0.17062, + "test_loss": 6.417214579772949, + "test_acc": 0.0205, + "lyapunov": null, + "grad_norm": 0.5236386972874332, + "grad_max_sv": 0.20101286694407464, + "grad_min_sv": 9.154465988037152e-09, + "grad_condition": 37634567.23075999, + "lr": 0.0008498316702566826, + "time_sec": 66.79052495956421 + }, + { + "epoch": 39, + "train_loss": 3.46743884765625, + "train_acc": 0.16932, + "test_loss": 5.726113172912598, + "test_acc": 0.0248, + "lyapunov": null, + "grad_norm": 0.5210988175669885, + "grad_max_sv": 0.19942357540130615, + "grad_min_sv": 8.937806597608677e-09, + "grad_condition": 49428217.19173406, + "lr": 0.0008422735529643442, + "time_sec": 66.74242496490479 + }, + { + "epoch": 40, + "train_loss": 3.451697437210083, + "train_acc": 0.17372, + "test_loss": 6.044572091674804, + "test_acc": 0.0225, + "lyapunov": null, + "grad_norm": 0.5170646983548032, + "grad_max_sv": 0.19684507846832275, + "grad_min_sv": 9.003056534485909e-09, + "grad_condition": 138977031.8076538, + "lr": 0.0008345653031794289, + "time_sec": 66.70748567581177 + }, + { + "epoch": 41, + "train_loss": 3.4474837628173827, + "train_acc": 0.17626, + "test_loss": 5.9893402641296385, + "test_acc": 0.0219, + "lyapunov": null, + "grad_norm": 0.5155937638119307, + "grad_max_sv": 0.19306579753756523, + "grad_min_sv": 8.943595689384076e-09, + "grad_condition": 75805302.28035732, + "lr": 0.0008267103019950526, + "time_sec": 66.69197702407837 + }, + { + "epoch": 42, + "train_loss": 3.4423429164123536, + "train_acc": 0.17422, + "test_loss": 5.739228091430664, + "test_acc": 0.0203, + "lyapunov": null, + "grad_norm": 0.5099978166539899, + "grad_max_sv": 0.1884769570082426, + "grad_min_sv": 8.939715143152505e-09, + "grad_condition": 24445550.576415405, + "lr": 0.0008187119948743447, + "time_sec": 66.70687818527222 + }, + { + "epoch": 43, + "train_loss": 3.4337082667541505, + "train_acc": 0.1755, + "test_loss": 5.964181529998779, + "test_acc": 0.0177, + "lyapunov": null, + "grad_norm": 0.5104491505466159, + "grad_max_sv": 0.19002889432013034, + "grad_min_sv": 9.048546927015178e-09, + "grad_condition": 102521993.69997685, + "lr": 0.000810573890139155, + "time_sec": 66.7257513999939 + }, + { + "epoch": 44, + "train_loss": 3.420871334762573, + "train_acc": 0.17948, + "test_loss": 5.929026190948487, + "test_acc": 0.0244, + "lyapunov": null, + "grad_norm": 0.5050154925488476, + "grad_max_sv": 0.18516961708664895, + "grad_min_sv": 8.980576357564551e-09, + "grad_condition": 24771047.136464976, + "lr": 0.0008022995574311873, + "time_sec": 66.74575066566467 + }, + { + "epoch": 45, + "train_loss": 3.4096126289367676, + "train_acc": 0.18164, + "test_loss": 5.663789749145508, + "test_acc": 0.0195, + "lyapunov": null, + "grad_norm": 0.5049903163352594, + "grad_max_sv": 0.18273597210645676, + "grad_min_sv": 8.972159917797207e-09, + "grad_condition": 23794424.428349543, + "lr": 0.0007938926261462363, + "time_sec": 66.7593412399292 + }, + { + "epoch": 46, + "train_loss": 3.410715911254883, + "train_acc": 0.1807, + "test_loss": 5.895871440124512, + "test_acc": 0.018, + "lyapunov": null, + "grad_norm": 0.5025553542851052, + "grad_max_sv": 0.1833956018090248, + "grad_min_sv": 8.830828140959924e-09, + "grad_condition": 30936751.6432406, + "lr": 0.0007853567838422158, + "time_sec": 66.75630521774292 + }, + { + "epoch": 47, + "train_loss": 3.4009066193389894, + "train_acc": 0.18276, + "test_loss": 6.028702513122559, + "test_acc": 0.0196, + "lyapunov": null, + "grad_norm": 0.5031283438960251, + "grad_max_sv": 0.1799595769494772, + "grad_min_sv": 8.917869195879114e-09, + "grad_condition": 23059530.36595428, + "lr": 0.0007766957746216719, + "time_sec": 66.75422596931458 + }, + { + "epoch": 48, + "train_loss": 3.390701540603638, + "train_acc": 0.18414, + "test_loss": 6.1965219741821285, + "test_acc": 0.0191, + "lyapunov": null, + "grad_norm": 0.4978643158932146, + "grad_max_sv": 0.1835469003766775, + "grad_min_sv": 8.827262552163485e-09, + "grad_condition": 51184664.832447655, + "lr": 0.0007679133974894982, + "time_sec": 66.75912022590637 + }, + { + "epoch": 49, + "train_loss": 3.3818662035369873, + "train_acc": 0.185, + "test_loss": 5.9103582473754885, + "test_acc": 0.0216, + "lyapunov": null, + "grad_norm": 0.49852008894363287, + "grad_max_sv": 0.18433105908334255, + "grad_min_sv": 8.89238179827001e-09, + "grad_condition": 40247674.29131043, + "lr": 0.000759013504686565, + "time_sec": 66.705406665802 + }, + { + "epoch": 50, + "train_loss": 3.3789881330871583, + "train_acc": 0.18412, + "test_loss": 6.037129666137695, + "test_acc": 0.0221, + "lyapunov": null, + "grad_norm": 0.49658079337268785, + "grad_max_sv": 0.179146596416831, + "grad_min_sv": 8.88557344369545e-09, + "grad_condition": 24117261.20845995, + "lr": 0.0007499999999999998, + "time_sec": 66.72649240493774 + }, + { + "epoch": 51, + "train_loss": 3.368231953201294, + "train_acc": 0.18852, + "test_loss": 5.9292546646118165, + "test_acc": 0.022, + "lyapunov": null, + "grad_norm": 0.4961366760585921, + "grad_max_sv": 0.17853211835026742, + "grad_min_sv": 8.978999294084744e-09, + "grad_condition": 23793132.034851797, + "lr": 0.0007408768370508575, + "time_sec": 66.72111701965332 + }, + { + "epoch": 52, + "train_loss": 3.3652955891418457, + "train_acc": 0.18696, + "test_loss": 6.321981049346924, + "test_acc": 0.0194, + "lyapunov": null, + "grad_norm": 0.492099764209841, + "grad_max_sv": 0.16977054849267006, + "grad_min_sv": 8.831625028515866e-09, + "grad_condition": 22251962.97293579, + "lr": 0.0007316480175599307, + "time_sec": 66.76648426055908 + }, + { + "epoch": 53, + "train_loss": 3.348167460861206, + "train_acc": 0.19116, + "test_loss": 6.423485536193848, + "test_acc": 0.0194, + "lyapunov": null, + "grad_norm": 0.49189585228327304, + "grad_max_sv": 0.17462090440094472, + "grad_min_sv": 8.786478893248183e-09, + "grad_condition": 188050773.829039, + "lr": 0.0007223175895924635, + "time_sec": 66.76346206665039 + }, + { + "epoch": 54, + "train_loss": 3.348860473022461, + "train_acc": 0.1902, + "test_loss": 5.888034158325195, + "test_acc": 0.0208, + "lyapunov": null, + "grad_norm": 0.49279210316788963, + "grad_max_sv": 0.17498359829187393, + "grad_min_sv": 8.822100200367444e-09, + "grad_condition": 28219026.60736394, + "lr": 0.0007128896457825361, + "time_sec": 66.78646183013916 + }, + { + "epoch": 55, + "train_loss": 3.340097451171875, + "train_acc": 0.19068, + "test_loss": 6.104175454711914, + "test_acc": 0.0217, + "lyapunov": null, + "grad_norm": 0.48880812803196916, + "grad_max_sv": 0.16894785091280937, + "grad_min_sv": 8.688565139580718e-09, + "grad_condition": 29986515.161999334, + "lr": 0.0007033683215378998, + "time_sec": 66.76022791862488 + }, + { + "epoch": 56, + "train_loss": 3.3290103381347658, + "train_acc": 0.19526, + "test_loss": 6.31472435760498, + "test_acc": 0.021, + "lyapunov": null, + "grad_norm": 0.4920323275084941, + "grad_max_sv": 0.16673259809613228, + "grad_min_sv": 8.834232892440674e-09, + "grad_condition": 22477005.35692047, + "lr": 0.0006937577932260512, + "time_sec": 66.74644947052002 + }, + { + "epoch": 57, + "train_loss": 3.3146336823272704, + "train_acc": 0.19646, + "test_loss": 5.99189327545166, + "test_acc": 0.0226, + "lyapunov": null, + "grad_norm": 0.48946191063890415, + "grad_max_sv": 0.167069473862648, + "grad_min_sv": 8.78488659317167e-09, + "grad_condition": 21365105.05732888, + "lr": 0.0006840622763423388, + "time_sec": 66.73155951499939 + }, + { + "epoch": 58, + "train_loss": 3.304142900466919, + "train_acc": 0.19854, + "test_loss": 5.5838108703613285, + "test_acc": 0.0256, + "lyapunov": null, + "grad_norm": 0.4865732671541852, + "grad_max_sv": 0.16740650571882726, + "grad_min_sv": 8.786859095888389e-09, + "grad_condition": 22043022.83729876, + "lr": 0.0006742860236609073, + "time_sec": 66.7638807296753 + }, + { + "epoch": 59, + "train_loss": 3.306339856491089, + "train_acc": 0.19832, + "test_loss": 6.71665584564209, + "test_acc": 0.0226, + "lyapunov": null, + "grad_norm": 0.4874859882247268, + "grad_max_sv": 0.17165971212089062, + "grad_min_sv": 8.715364420430748e-09, + "grad_condition": 25734869.826652374, + "lr": 0.0006644333233692913, + "time_sec": 66.69665598869324 + }, + { + "epoch": 60, + "train_loss": 3.2998611443328856, + "train_acc": 0.19806, + "test_loss": 5.851872462463379, + "test_acc": 0.0215, + "lyapunov": null, + "grad_norm": 0.4884739100521322, + "grad_max_sv": 0.16974798031151295, + "grad_min_sv": 8.883696248074279e-09, + "grad_condition": 21737745.94010177, + "lr": 0.0006545084971874734, + "time_sec": 66.72846579551697 + }, + { + "epoch": 61, + "train_loss": 3.2928254180908203, + "train_acc": 0.19828, + "test_loss": 5.552249732971191, + "test_acc": 0.023, + "lyapunov": null, + "grad_norm": 0.49016744220935893, + "grad_max_sv": 0.16948793716728688, + "grad_min_sv": 8.760361631943159e-09, + "grad_condition": 27254819.27808509, + "lr": 0.0006445158984722354, + "time_sec": 66.78463363647461 + }, + { + "epoch": 62, + "train_loss": 3.275610556716919, + "train_acc": 0.20532, + "test_loss": 5.873171199035644, + "test_acc": 0.0219, + "lyapunov": null, + "grad_norm": 0.4866265828805679, + "grad_max_sv": 0.16542929150164126, + "grad_min_sv": 8.78843325786971e-09, + "grad_condition": 66183687.20952544, + "lr": 0.0006344599103076324, + "time_sec": 66.76870799064636 + }, + { + "epoch": 63, + "train_loss": 3.271966901855469, + "train_acc": 0.20438, + "test_loss": 5.9298525764465335, + "test_acc": 0.024, + "lyapunov": null, + "grad_norm": 0.4859022585476048, + "grad_max_sv": 0.16404966413974761, + "grad_min_sv": 8.811849419587681e-09, + "grad_condition": 22319350.467063613, + "lr": 0.0006243449435824269, + "time_sec": 66.73905062675476 + }, + { + "epoch": 64, + "train_loss": 3.266578521652222, + "train_acc": 0.2042, + "test_loss": 5.641555810546875, + "test_acc": 0.0272, + "lyapunov": null, + "grad_norm": 0.48486007197076664, + "grad_max_sv": 0.1655890803784132, + "grad_min_sv": 8.723941788413291e-09, + "grad_condition": 22305108.16299928, + "lr": 0.0006141754350553275, + "time_sec": 66.7476577758789 + }, + { + "epoch": 65, + "train_loss": 3.2511880633544923, + "train_acc": 0.2074, + "test_loss": 5.8412233901977535, + "test_acc": 0.024, + "lyapunov": null, + "grad_norm": 0.48754428036288966, + "grad_max_sv": 0.16739307381212712, + "grad_min_sv": 8.817329924526441e-09, + "grad_condition": 21968003.756148495, + "lr": 0.0006039558454088793, + "time_sec": 66.75903058052063 + }, + { + "epoch": 66, + "train_loss": 3.249825279388428, + "train_acc": 0.2102, + "test_loss": 5.375687086486816, + "test_acc": 0.0237, + "lyapunov": null, + "grad_norm": 0.4852656386861206, + "grad_max_sv": 0.16313621625304223, + "grad_min_sv": 8.705907367234644e-09, + "grad_condition": 22679705.957923576, + "lr": 0.000593690657292862, + "time_sec": 66.70783424377441 + }, + { + "epoch": 67, + "train_loss": 3.245251103134155, + "train_acc": 0.21036, + "test_loss": 6.777110389709472, + "test_acc": 0.0168, + "lyapunov": null, + "grad_norm": 0.4867378238882827, + "grad_max_sv": 0.1655280452221632, + "grad_min_sv": 8.915351975939679e-09, + "grad_condition": 110454092.86004348, + "lr": 0.0005833843733580507, + "time_sec": 66.69803929328918 + }, + { + "epoch": 68, + "train_loss": 3.2381321800231935, + "train_acc": 0.20952, + "test_loss": 6.102328826904297, + "test_acc": 0.0197, + "lyapunov": null, + "grad_norm": 0.48671688246611916, + "grad_max_sv": 0.1659169655293226, + "grad_min_sv": 8.76257463186536e-09, + "grad_condition": 44812459.07892763, + "lr": 0.0005730415142812054, + "time_sec": 66.69719409942627 + }, + { + "epoch": 69, + "train_loss": 3.2316595709991454, + "train_acc": 0.21144, + "test_loss": 5.602972175598144, + "test_acc": 0.0242, + "lyapunov": null, + "grad_norm": 0.4847784835340826, + "grad_max_sv": 0.1632793139666319, + "grad_min_sv": 8.814856525610204e-09, + "grad_condition": 107593372.59174109, + "lr": 0.0005626666167821517, + "time_sec": 66.68555569648743 + }, + { + "epoch": 70, + "train_loss": 3.21884576965332, + "train_acc": 0.21162, + "test_loss": 6.080870904541015, + "test_acc": 0.0219, + "lyapunov": null, + "grad_norm": 0.4868075160552665, + "grad_max_sv": 0.15996163412928582, + "grad_min_sv": 8.820852938351554e-09, + "grad_condition": 24906478.982524626, + "lr": 0.0005522642316338265, + "time_sec": 66.75078678131104 + }, + { + "epoch": 71, + "train_loss": 3.2169480547332765, + "train_acc": 0.2131, + "test_loss": 6.322179025268555, + "test_acc": 0.022, + "lyapunov": null, + "grad_norm": 0.48693869340308327, + "grad_max_sv": 0.16328724324703217, + "grad_min_sv": 8.897740871871563e-09, + "grad_condition": 21378151.74249644, + "lr": 0.0005418389216661573, + "time_sec": 66.82618498802185 + }, + { + "epoch": 72, + "train_loss": 3.209583250656128, + "train_acc": 0.21452, + "test_loss": 5.9164725677490235, + "test_acc": 0.0244, + "lyapunov": null, + "grad_norm": 0.48710676929190333, + "grad_max_sv": 0.1638231087476015, + "grad_min_sv": 8.895584530099753e-09, + "grad_condition": 26372411.903145302, + "lr": 0.0005313952597646563, + "time_sec": 66.76002073287964 + }, + { + "epoch": 73, + "train_loss": 3.206989998016357, + "train_acc": 0.2156, + "test_loss": 6.779888274383545, + "test_acc": 0.02, + "lyapunov": null, + "grad_norm": 0.4871385804296449, + "grad_max_sv": 0.16540717855095863, + "grad_min_sv": 8.919061500467506e-09, + "grad_condition": 24713788.997361727, + "lr": 0.0005209378268645994, + "time_sec": 66.79043841362 + }, + { + "epoch": 74, + "train_loss": 3.196985797729492, + "train_acc": 0.21718, + "test_loss": 6.031893154907227, + "test_acc": 0.0279, + "lyapunov": null, + "grad_norm": 0.4885299333145373, + "grad_max_sv": 0.1637456502765417, + "grad_min_sv": 8.884239661999249e-09, + "grad_condition": 31643344.54858377, + "lr": 0.0005104712099416781, + "time_sec": 66.7399845123291 + }, + { + "epoch": 75, + "train_loss": 3.1916642933654784, + "train_acc": 0.21804, + "test_loss": 6.505784149169922, + "test_acc": 0.0263, + "lyapunov": null, + "grad_norm": 0.48738903646108195, + "grad_max_sv": 0.16264366619288922, + "grad_min_sv": 8.976378307323785e-09, + "grad_condition": 23550016.098660976, + "lr": 0.0004999999999999996, + "time_sec": 66.73288559913635 + }, + { + "epoch": 76, + "train_loss": 3.1814585160827638, + "train_acc": 0.22052, + "test_loss": 6.48178818359375, + "test_acc": 0.0271, + "lyapunov": null, + "grad_norm": 0.4843426315380276, + "grad_max_sv": 0.16138911359012126, + "grad_min_sv": 8.912034432650984e-09, + "grad_condition": 23286891.30520594, + "lr": 0.0004895287900583212, + "time_sec": 66.69967555999756 + }, + { + "epoch": 77, + "train_loss": 3.1693101245117186, + "train_acc": 0.22188, + "test_loss": 6.60695295715332, + "test_acc": 0.0274, + "lyapunov": null, + "grad_norm": 0.48473864055458005, + "grad_max_sv": 0.16252022571861743, + "grad_min_sv": 8.865778075572983e-09, + "grad_condition": 20379861.793125592, + "lr": 0.0004790621731353997, + "time_sec": 66.73058843612671 + }, + { + "epoch": 78, + "train_loss": 3.172366504058838, + "train_acc": 0.22092, + "test_loss": 6.633734432983398, + "test_acc": 0.0249, + "lyapunov": null, + "grad_norm": 0.4834678400720691, + "grad_max_sv": 0.1624290570616722, + "grad_min_sv": 8.932120706961477e-09, + "grad_condition": 23408681.375307254, + "lr": 0.000468604740235343, + "time_sec": 66.69404172897339 + }, + { + "epoch": 79, + "train_loss": 3.1615784413146972, + "train_acc": 0.2258, + "test_loss": 6.273578634643554, + "test_acc": 0.0281, + "lyapunov": null, + "grad_norm": 0.48944403353102334, + "grad_max_sv": 0.16398866586387156, + "grad_min_sv": 8.946382384911189e-09, + "grad_condition": 22712578.898883633, + "lr": 0.00045816107833384175, + "time_sec": 66.7472972869873 + }, + { + "epoch": 80, + "train_loss": 3.1575608079528807, + "train_acc": 0.22382, + "test_loss": 6.2906877746582035, + "test_acc": 0.0273, + "lyapunov": null, + "grad_norm": 0.4897084401415468, + "grad_max_sv": 0.16338732056319713, + "grad_min_sv": 8.928839754715478e-09, + "grad_condition": 54043718.99023694, + "lr": 0.0004477357683661729, + "time_sec": 66.72847270965576 + }, + { + "epoch": 81, + "train_loss": 3.1497875170898437, + "train_acc": 0.22584, + "test_loss": 6.6115754776000975, + "test_acc": 0.0248, + "lyapunov": null, + "grad_norm": 0.48772100619317266, + "grad_max_sv": 0.15775733068585396, + "grad_min_sv": 9.009791279712686e-09, + "grad_condition": 20818306.202141248, + "lr": 0.00043733338321784746, + "time_sec": 66.74951100349426 + }, + { + "epoch": 82, + "train_loss": 3.150099751586914, + "train_acc": 0.22466, + "test_loss": 6.489882479858398, + "test_acc": 0.0283, + "lyapunov": null, + "grad_norm": 0.48649716303896257, + "grad_max_sv": 0.15712360739707948, + "grad_min_sv": 8.928376640099378e-09, + "grad_condition": 33122173.6130862, + "lr": 0.0004269584857187939, + "time_sec": 66.73039722442627 + }, + { + "epoch": 83, + "train_loss": 3.1423302052307127, + "train_acc": 0.22782, + "test_loss": 6.021305515289306, + "test_acc": 0.029, + "lyapunov": null, + "grad_norm": 0.48633742199561775, + "grad_max_sv": 0.1581266548484564, + "grad_min_sv": 8.888032958058456e-09, + "grad_condition": 115025831.2804152, + "lr": 0.0004166156266419484, + "time_sec": 66.74857115745544 + }, + { + "epoch": 84, + "train_loss": 3.128035169677734, + "train_acc": 0.22886, + "test_loss": 6.798161625671387, + "test_acc": 0.0261, + "lyapunov": null, + "grad_norm": 0.48802181363511177, + "grad_max_sv": 0.1612305197864771, + "grad_min_sv": 8.905917459056666e-09, + "grad_condition": 24037955.80487976, + "lr": 0.0004063093427071373, + "time_sec": 66.70986270904541 + }, + { + "epoch": 85, + "train_loss": 3.127580302810669, + "train_acc": 0.23112, + "test_loss": 6.7588252937316895, + "test_acc": 0.0261, + "lyapunov": null, + "grad_norm": 0.4875306431638057, + "grad_max_sv": 0.16091111600399016, + "grad_min_sv": 9.01161150146379e-09, + "grad_condition": 21073737.755382914, + "lr": 0.0003960441545911199, + "time_sec": 66.68802571296692 + }, + { + "epoch": 86, + "train_loss": 3.114855668182373, + "train_acc": 0.2308, + "test_loss": 6.564279100036621, + "test_acc": 0.0282, + "lyapunov": null, + "grad_norm": 0.48637730612121255, + "grad_max_sv": 0.15542719289660453, + "grad_min_sv": 8.93872263707518e-09, + "grad_condition": 21703985.404231258, + "lr": 0.0003858245649446718, + "time_sec": 66.6933023929596 + }, + { + "epoch": 87, + "train_loss": 3.1120968659210204, + "train_acc": 0.23044, + "test_loss": 6.98433928451538, + "test_acc": 0.0287, + "lyapunov": null, + "grad_norm": 0.4900107193499055, + "grad_max_sv": 0.16207418888807296, + "grad_min_sv": 8.972892097738883e-09, + "grad_condition": 47614869.04451983, + "lr": 0.00037565505641757235, + "time_sec": 66.71200680732727 + }, + { + "epoch": 88, + "train_loss": 3.105097593078613, + "train_acc": 0.23214, + "test_loss": 6.7922447959899905, + "test_acc": 0.0302, + "lyapunov": null, + "grad_norm": 0.4884472360111878, + "grad_max_sv": 0.15889082551002504, + "grad_min_sv": 8.899033936138335e-09, + "grad_condition": 25000729.654329486, + "lr": 0.00036554008969236695, + "time_sec": 66.7427408695221 + }, + { + "epoch": 89, + "train_loss": 3.0926671070098877, + "train_acc": 0.23664, + "test_loss": 6.916401704406738, + "test_acc": 0.0283, + "lyapunov": null, + "grad_norm": 0.49050493507655857, + "grad_max_sv": 0.16100925132632254, + "grad_min_sv": 9.010439719348006e-09, + "grad_condition": 21207674.720614858, + "lr": 0.0003554841015277638, + "time_sec": 66.76495027542114 + }, + { + "epoch": 90, + "train_loss": 3.090296846160889, + "train_acc": 0.23536, + "test_loss": 7.012615090179444, + "test_acc": 0.0308, + "lyapunov": null, + "grad_norm": 0.49019979842343425, + "grad_max_sv": 0.1572930809110403, + "grad_min_sv": 8.949024762796698e-09, + "grad_condition": 734920063.8359609, + "lr": 0.000345491502812526, + "time_sec": 66.73302173614502 + }, + { + "epoch": 91, + "train_loss": 3.085657378997803, + "train_acc": 0.23746, + "test_loss": 6.360618818664551, + "test_acc": 0.0363, + "lyapunov": null, + "grad_norm": 0.4915162849741807, + "grad_max_sv": 0.15855198130011558, + "grad_min_sv": 8.980356871329809e-09, + "grad_condition": 28731902.889844812, + "lr": 0.0003355666766307081, + "time_sec": 66.74396848678589 + }, + { + "epoch": 92, + "train_loss": 3.0831817041778566, + "train_acc": 0.2383, + "test_loss": 5.9396498611450195, + "test_acc": 0.0352, + "lyapunov": null, + "grad_norm": 0.49047678071806555, + "grad_max_sv": 0.15942419767379762, + "grad_min_sv": 9.062854348755588e-09, + "grad_condition": 57497218.341688454, + "lr": 0.00032571397633909225, + "time_sec": 66.77806997299194 + }, + { + "epoch": 93, + "train_loss": 3.071146830596924, + "train_acc": 0.23998, + "test_loss": 6.60078558807373, + "test_acc": 0.0328, + "lyapunov": null, + "grad_norm": 0.48952410405337216, + "grad_max_sv": 0.1553661532700062, + "grad_min_sv": 9.10862152092573e-09, + "grad_condition": 20074531.31734441, + "lr": 0.00031593772365766094, + "time_sec": 66.71407961845398 + }, + { + "epoch": 94, + "train_loss": 3.0655629290008544, + "train_acc": 0.23992, + "test_loss": 6.003435957336426, + "test_acc": 0.0378, + "lyapunov": null, + "grad_norm": 0.49221246193757373, + "grad_max_sv": 0.15908809714019298, + "grad_min_sv": 9.144222304358074e-09, + "grad_condition": 19907441.898985844, + "lr": 0.0003062422067739483, + "time_sec": 66.693532705307 + }, + { + "epoch": 95, + "train_loss": 3.060634704437256, + "train_acc": 0.23888, + "test_loss": 6.056681440734863, + "test_acc": 0.0373, + "lyapunov": null, + "grad_norm": 0.49339217556104, + "grad_max_sv": 0.15901063568890095, + "grad_min_sv": 9.065924972545547e-09, + "grad_condition": 29502219.759497046, + "lr": 0.00029663167846209965, + "time_sec": 66.70557427406311 + }, + { + "epoch": 96, + "train_loss": 3.061671485443115, + "train_acc": 0.24224, + "test_loss": 6.776474742126465, + "test_acc": 0.0353, + "lyapunov": null, + "grad_norm": 0.49062641992823525, + "grad_max_sv": 0.15993262231349945, + "grad_min_sv": 9.044680277306427e-09, + "grad_condition": 42484326.952753186, + "lr": 0.00028711035421746345, + "time_sec": 66.71291422843933 + }, + { + "epoch": 97, + "train_loss": 3.0552709561157227, + "train_acc": 0.24368, + "test_loss": 6.627662403869629, + "test_acc": 0.0312, + "lyapunov": null, + "grad_norm": 0.49312118223102674, + "grad_max_sv": 0.1586600374430418, + "grad_min_sv": 9.106857379315159e-09, + "grad_condition": 19815371.442228314, + "lr": 0.00027768241040753615, + "time_sec": 66.74342608451843 + }, + { + "epoch": 98, + "train_loss": 3.047260310974121, + "train_acc": 0.24534, + "test_loss": 6.661625199890136, + "test_acc": 0.0358, + "lyapunov": null, + "grad_norm": 0.4920094661808142, + "grad_max_sv": 0.1592965368181467, + "grad_min_sv": 9.102059620250124e-09, + "grad_condition": 78440147.91108674, + "lr": 0.00026835198244006903, + "time_sec": 66.75223684310913 + }, + { + "epoch": 99, + "train_loss": 3.046775559768677, + "train_acc": 0.24216, + "test_loss": 6.965150428771973, + "test_acc": 0.0306, + "lyapunov": null, + "grad_norm": 0.4926874565507386, + "grad_max_sv": 0.16148377656936647, + "grad_min_sv": 9.167028746162597e-09, + "grad_condition": 82327087.71133485, + "lr": 0.0002591231629491421, + "time_sec": 66.76156210899353 + }, + { + "epoch": 100, + "train_loss": 3.041998874053955, + "train_acc": 0.24108, + "test_loss": 6.647268369293213, + "test_acc": 0.0319, + "lyapunov": null, + "grad_norm": 0.49732363208650837, + "grad_max_sv": 0.15973055586218834, + "grad_min_sv": 9.144760823587283e-09, + "grad_condition": 19643395.96339509, + "lr": 0.0002499999999999997, + "time_sec": 66.74560022354126 + }, + { + "epoch": 101, + "train_loss": 3.0355277448272706, + "train_acc": 0.24656, + "test_loss": 6.661636563873291, + "test_acc": 0.0352, + "lyapunov": null, + "grad_norm": 0.4945949712556627, + "grad_max_sv": 0.16228868998587132, + "grad_min_sv": 9.097275698727314e-09, + "grad_condition": 29717156.96899251, + "lr": 0.00024098649531343477, + "time_sec": 66.74929976463318 + }, + { + "epoch": 102, + "train_loss": 3.028595997467041, + "train_acc": 0.24942, + "test_loss": 7.008212976837158, + "test_acc": 0.0297, + "lyapunov": null, + "grad_norm": 0.4951875945091829, + "grad_max_sv": 0.1601081270724535, + "grad_min_sv": 9.183049341776606e-09, + "grad_condition": 28833554.07107707, + "lr": 0.0002320866025105016, + "time_sec": 66.70356440544128 + }, + { + "epoch": 103, + "train_loss": 3.0245940507507325, + "train_acc": 0.24584, + "test_loss": 6.46308011932373, + "test_acc": 0.0341, + "lyapunov": null, + "grad_norm": 0.49371498929192353, + "grad_max_sv": 0.15619246214628218, + "grad_min_sv": 9.060142111202984e-09, + "grad_condition": 39182662.24958947, + "lr": 0.0002233042253783278, + "time_sec": 66.71340656280518 + }, + { + "epoch": 104, + "train_loss": 3.021408618774414, + "train_acc": 0.2456, + "test_loss": 6.825051796722412, + "test_acc": 0.0336, + "lyapunov": null, + "grad_norm": 0.4938389055758033, + "grad_max_sv": 0.1602877888828516, + "grad_min_sv": 9.021206631709689e-09, + "grad_condition": 22621712.521351572, + "lr": 0.000214643216157784, + "time_sec": 66.69873213768005 + }, + { + "epoch": 105, + "train_loss": 3.0085532719421386, + "train_acc": 0.25126, + "test_loss": 6.49373994140625, + "test_acc": 0.0345, + "lyapunov": null, + "grad_norm": 0.49734202210836465, + "grad_max_sv": 0.1637524042278528, + "grad_min_sv": 9.15554402847185e-09, + "grad_condition": 21636907.97691984, + "lr": 0.00020610737385376332, + "time_sec": 66.7116219997406 + }, + { + "epoch": 106, + "train_loss": 3.0132780470275877, + "train_acc": 0.24846, + "test_loss": 6.5495201698303225, + "test_acc": 0.0336, + "lyapunov": null, + "grad_norm": 0.4981310757648767, + "grad_max_sv": 0.15820327922701835, + "grad_min_sv": 9.158961136734866e-09, + "grad_condition": 20307530.065489154, + "lr": 0.00019770044256881242, + "time_sec": 66.74218201637268 + }, + { + "epoch": 107, + "train_loss": 3.0039769695281984, + "train_acc": 0.24998, + "test_loss": 6.218603918457031, + "test_acc": 0.0361, + "lyapunov": null, + "grad_norm": 0.4961392053949623, + "grad_max_sv": 0.1600139781832695, + "grad_min_sv": 9.131589118194228e-09, + "grad_condition": 36979479.48401734, + "lr": 0.0001894261098608447, + "time_sec": 66.80793809890747 + }, + { + "epoch": 108, + "train_loss": 3.001887908782959, + "train_acc": 0.2516, + "test_loss": 6.588950064086914, + "test_acc": 0.0328, + "lyapunov": null, + "grad_norm": 0.49597326074702125, + "grad_max_sv": 0.1588774763047695, + "grad_min_sv": 9.17765310692875e-09, + "grad_condition": 50896304.22255845, + "lr": 0.000181288005125655, + "time_sec": 66.76537990570068 + }, + { + "epoch": 109, + "train_loss": 2.9904132221221924, + "train_acc": 0.25664, + "test_loss": 6.382045315551758, + "test_acc": 0.0395, + "lyapunov": null, + "grad_norm": 0.4973619331899814, + "grad_max_sv": 0.1614119179546833, + "grad_min_sv": 9.145205881466722e-09, + "grad_condition": 19754492.90124496, + "lr": 0.0001732896980049473, + "time_sec": 66.78630447387695 + }, + { + "epoch": 110, + "train_loss": 2.989228514251709, + "train_acc": 0.25492, + "test_loss": 6.322301493072509, + "test_acc": 0.0369, + "lyapunov": null, + "grad_norm": 0.498337161336674, + "grad_max_sv": 0.15811876803636551, + "grad_min_sv": 9.229779307506902e-09, + "grad_condition": 19822899.140848357, + "lr": 0.00016543469682057076, + "time_sec": 66.75606536865234 + }, + { + "epoch": 111, + "train_loss": 2.984906556854248, + "train_acc": 0.25606, + "test_loss": 6.8701157440185545, + "test_acc": 0.0367, + "lyapunov": null, + "grad_norm": 0.49721550527739367, + "grad_max_sv": 0.16228222362697126, + "grad_min_sv": 9.23479824502943e-09, + "grad_condition": 293614052.48096585, + "lr": 0.00015772644703565552, + "time_sec": 66.73988127708435 + }, + { + "epoch": 112, + "train_loss": 2.9811305560302737, + "train_acc": 0.25646, + "test_loss": 7.038999290466308, + "test_acc": 0.0335, + "lyapunov": null, + "grad_norm": 0.4941490782513605, + "grad_max_sv": 0.15477370359003545, + "grad_min_sv": 9.218313174429171e-09, + "grad_condition": 164935506.24721447, + "lr": 0.00015016832974331713, + "time_sec": 66.71515774726868 + }, + { + "epoch": 113, + "train_loss": 2.9800968042755125, + "train_acc": 0.25398, + "test_loss": 6.309658117675781, + "test_acc": 0.0389, + "lyapunov": null, + "grad_norm": 0.49886850458670223, + "grad_max_sv": 0.16330830678343772, + "grad_min_sv": 9.236376152799153e-09, + "grad_condition": 21870251.37413417, + "lr": 0.00014276366018359834, + "time_sec": 66.71296858787537 + }, + { + "epoch": 114, + "train_loss": 2.9754512078094484, + "train_acc": 0.25594, + "test_loss": 6.60843113861084, + "test_acc": 0.0346, + "lyapunov": null, + "grad_norm": 0.4960627007320755, + "grad_max_sv": 0.1573273716494441, + "grad_min_sv": 9.209630175144312e-09, + "grad_condition": 21208142.4041068, + "lr": 0.00013551568628929425, + "time_sec": 66.73864150047302 + }, + { + "epoch": 115, + "train_loss": 2.973171382446289, + "train_acc": 0.25546, + "test_loss": 6.1580316360473635, + "test_acc": 0.0359, + "lyapunov": null, + "grad_norm": 0.4975170133978326, + "grad_max_sv": 0.16185041181743146, + "grad_min_sv": 9.172154036285463e-09, + "grad_condition": 23675277.644423716, + "lr": 0.00012842758726130276, + "time_sec": 66.7741425037384 + }, + { + "epoch": 116, + "train_loss": 2.9698315058135987, + "train_acc": 0.2585, + "test_loss": 6.728188695526123, + "test_acc": 0.0352, + "lyapunov": null, + "grad_norm": 0.49786156791485014, + "grad_max_sv": 0.1629601776599884, + "grad_min_sv": 9.141069147108882e-09, + "grad_condition": 42245446.81835711, + "lr": 0.0001215024721741218, + "time_sec": 66.85877132415771 + }, + { + "epoch": 117, + "train_loss": 2.96759364151001, + "train_acc": 0.25688, + "test_loss": 6.810253086853027, + "test_acc": 0.0317, + "lyapunov": null, + "grad_norm": 0.5004102922188621, + "grad_max_sv": 0.16316126510500908, + "grad_min_sv": 9.275286505516789e-09, + "grad_condition": 21737711.712548293, + "lr": 0.00011474337861210538, + "time_sec": 66.78435349464417 + }, + { + "epoch": 118, + "train_loss": 2.9639752848815917, + "train_acc": 0.25784, + "test_loss": 6.6183334121704105, + "test_acc": 0.037, + "lyapunov": null, + "grad_norm": 0.4993536159032588, + "grad_max_sv": 0.16331967823207377, + "grad_min_sv": 9.30454736036701e-09, + "grad_condition": 24980238.64283476, + "lr": 0.00010815327133708009, + "time_sec": 66.78651332855225 + }, + { + "epoch": 119, + "train_loss": 2.955244768218994, + "train_acc": 0.26012, + "test_loss": 7.170739624023438, + "test_acc": 0.03, + "lyapunov": null, + "grad_norm": 0.49772875386211013, + "grad_max_sv": 0.15745177641510963, + "grad_min_sv": 9.275912776773865e-09, + "grad_condition": 20252652.260798354, + "lr": 0.00010173504098790182, + "time_sec": 66.7590229511261 + }, + { + "epoch": 120, + "train_loss": 2.9573191987609864, + "train_acc": 0.25902, + "test_loss": 6.63704820098877, + "test_acc": 0.0341, + "lyapunov": null, + "grad_norm": 0.4996347696527594, + "grad_max_sv": 0.16082486175000668, + "grad_min_sv": 9.223728218710203e-09, + "grad_condition": 31826325.619799424, + "lr": 9.549150281252629e-05, + "time_sec": 66.7681827545166 + }, + { + "epoch": 121, + "train_loss": 2.9523595883178713, + "train_acc": 0.2618, + "test_loss": 6.729842405700683, + "test_acc": 0.036, + "lyapunov": null, + "grad_norm": 0.5013710314611776, + "grad_max_sv": 0.15908933244645596, + "grad_min_sv": 9.356316055253444e-09, + "grad_condition": 25691489.85231958, + "lr": 8.942539543314794e-05, + "time_sec": 66.74568009376526 + }, + { + "epoch": 122, + "train_loss": 2.9497915851593017, + "train_acc": 0.2617, + "test_loss": 6.87424278717041, + "test_acc": 0.033, + "lyapunov": null, + "grad_norm": 0.5005453549657005, + "grad_max_sv": 0.16275203377008438, + "grad_min_sv": 9.293272996112322e-09, + "grad_condition": 83221431.81677945, + "lr": 8.353937964495024e-05, + "time_sec": 66.74210405349731 + }, + { + "epoch": 123, + "train_loss": 2.9416942150115966, + "train_acc": 0.2643, + "test_loss": 6.686075965118408, + "test_acc": 0.0363, + "lyapunov": null, + "grad_norm": 0.5025049175782571, + "grad_max_sv": 0.15961344465613364, + "grad_min_sv": 9.371966801230425e-09, + "grad_condition": 35132803.96387108, + "lr": 7.783603724899243e-05, + "time_sec": 66.75957775115967 + }, + { + "epoch": 124, + "train_loss": 2.94895947555542, + "train_acc": 0.25956, + "test_loss": 6.959716784667969, + "test_acc": 0.0344, + "lyapunov": null, + "grad_norm": 0.5043618033931743, + "grad_max_sv": 0.16490019261837005, + "grad_min_sv": 9.45151938935851e-09, + "grad_condition": 20739176.963236075, + "lr": 7.231786991974666e-05, + "time_sec": 66.76986241340637 + }, + { + "epoch": 125, + "train_loss": 2.9465578133392336, + "train_acc": 0.2615, + "test_loss": 6.6146667854309085, + "test_acc": 0.0372, + "lyapunov": null, + "grad_norm": 0.50165695568463, + "grad_max_sv": 0.16004594042897224, + "grad_min_sv": 9.333669109823362e-09, + "grad_condition": 27696527.631483592, + "lr": 6.698729810778072e-05, + "time_sec": 66.79878735542297 + }, + { + "epoch": 126, + "train_loss": 2.944279951171875, + "train_acc": 0.25922, + "test_loss": 6.776188401794434, + "test_acc": 0.0359, + "lyapunov": null, + "grad_norm": 0.5004778327715103, + "grad_max_sv": 0.1615132074803114, + "grad_min_sv": 9.285796417901615e-09, + "grad_condition": 20380420.794493236, + "lr": 6.184665997806817e-05, + "time_sec": 66.81306886672974 + }, + { + "epoch": 127, + "train_loss": 2.9345046046447756, + "train_acc": 0.26554, + "test_loss": 6.409585705566406, + "test_acc": 0.0365, + "lyapunov": null, + "grad_norm": 0.5009056150070453, + "grad_max_sv": 0.16262583658099175, + "grad_min_sv": 9.41551325135681e-09, + "grad_condition": 92271454.95901966, + "lr": 5.6898210384392595e-05, + "time_sec": 66.77955317497253 + }, + { + "epoch": 128, + "train_loss": 2.9406036145782473, + "train_acc": 0.26226, + "test_loss": 6.883744766235352, + "test_acc": 0.0362, + "lyapunov": null, + "grad_norm": 0.5019103000513857, + "grad_max_sv": 0.15915893130004405, + "grad_min_sv": 9.27946301465532e-09, + "grad_condition": 26892136.241638493, + "lr": 5.214411988029363e-05, + "time_sec": 66.7971682548523 + }, + { + "epoch": 129, + "train_loss": 2.9357696857452393, + "train_acc": 0.26482, + "test_loss": 6.798914263916016, + "test_acc": 0.0371, + "lyapunov": null, + "grad_norm": 0.502875147430765, + "grad_max_sv": 0.16597487404942513, + "grad_min_sv": 9.331743605622833e-09, + "grad_condition": 21894734.234583445, + "lr": 4.7586473766990294e-05, + "time_sec": 66.76526641845703 + }, + { + "epoch": 130, + "train_loss": 2.931978320159912, + "train_acc": 0.2632, + "test_loss": 6.588931091308594, + "test_acc": 0.0383, + "lyapunov": null, + "grad_norm": 0.5024988425718886, + "grad_max_sv": 0.16058847755193711, + "grad_min_sv": 9.346998992854072e-09, + "grad_condition": 23689235.71364718, + "lr": 4.32272711786996e-05, + "time_sec": 66.73650169372559 + }, + { + "epoch": 131, + "train_loss": 2.9257036571502684, + "train_acc": 0.26346, + "test_loss": 6.79047756652832, + "test_acc": 0.037, + "lyapunov": null, + "grad_norm": 0.5025936155191698, + "grad_max_sv": 0.1606222338974476, + "grad_min_sv": 9.344622825535609e-09, + "grad_condition": 19448498.594337363, + "lr": 3.906842420574966e-05, + "time_sec": 66.72977805137634 + }, + { + "epoch": 132, + "train_loss": 2.9238443630981443, + "train_acc": 0.26652, + "test_loss": 6.582272483825683, + "test_acc": 0.0359, + "lyapunov": null, + "grad_norm": 0.5057115235264575, + "grad_max_sv": 0.1622081771492958, + "grad_min_sv": 9.322094066382264e-09, + "grad_condition": 110706873.75285177, + "lr": 3.5111757055874305e-05, + "time_sec": 66.74127459526062 + }, + { + "epoch": 133, + "train_loss": 2.9275563074493407, + "train_acc": 0.26798, + "test_loss": 6.701000856018067, + "test_acc": 0.0403, + "lyapunov": null, + "grad_norm": 0.5047358455148018, + "grad_max_sv": 0.1596795056015253, + "grad_min_sv": 9.385729068944748e-09, + "grad_condition": 24899256.961485635, + "lr": 3.1359005254054254e-05, + "time_sec": 66.78476786613464 + }, + { + "epoch": 134, + "train_loss": 2.922698397293091, + "train_acc": 0.2656, + "test_loss": 6.822336962890625, + "test_acc": 0.0348, + "lyapunov": null, + "grad_norm": 0.5011816329114258, + "grad_max_sv": 0.16208452992141248, + "grad_min_sv": 9.367489639533489e-09, + "grad_condition": 21334456.488015514, + "lr": 2.7811814881259484e-05, + "time_sec": 66.77467155456543 + }, + { + "epoch": 135, + "train_loss": 2.9318275360870363, + "train_acc": 0.26446, + "test_loss": 6.82299095916748, + "test_acc": 0.0375, + "lyapunov": null, + "grad_norm": 0.5036159796429942, + "grad_max_sv": 0.16086461171507835, + "grad_min_sv": 9.421430274825227e-09, + "grad_condition": 23697065.511433274, + "lr": 2.4471741852423218e-05, + "time_sec": 66.81163048744202 + }, + { + "epoch": 136, + "train_loss": 2.924918181915283, + "train_acc": 0.26562, + "test_loss": 6.8049731414794925, + "test_acc": 0.0379, + "lyapunov": null, + "grad_norm": 0.5025705246301901, + "grad_max_sv": 0.1608381040394306, + "grad_min_sv": 9.298360864606891e-09, + "grad_condition": 21070247.46761896, + "lr": 2.1340251233966362e-05, + "time_sec": 66.75751781463623 + }, + { + "epoch": 137, + "train_loss": 2.9179174461364745, + "train_acc": 0.267, + "test_loss": 7.41930817565918, + "test_acc": 0.0354, + "lyapunov": null, + "grad_norm": 0.5020038013732862, + "grad_max_sv": 0.16103104539215565, + "grad_min_sv": 9.377383154707264e-09, + "grad_condition": 25924694.766624488, + "lr": 1.8418716601170932e-05, + "time_sec": 66.75570106506348 + }, + { + "epoch": 138, + "train_loss": 2.923201954345703, + "train_acc": 0.26658, + "test_loss": 6.757112614440918, + "test_acc": 0.0368, + "lyapunov": null, + "grad_norm": 0.5024810225531171, + "grad_max_sv": 0.1589697927236557, + "grad_min_sv": 9.370084333437667e-09, + "grad_condition": 21088389.845349483, + "lr": 1.570841943568445e-05, + "time_sec": 66.72540855407715 + }, + { + "epoch": 139, + "train_loss": 2.91647822807312, + "train_acc": 0.26728, + "test_loss": 6.73676093826294, + "test_acc": 0.0367, + "lyapunov": null, + "grad_norm": 0.5029392119297419, + "grad_max_sv": 0.16374287530779838, + "grad_min_sv": 9.458621610947127e-09, + "grad_condition": 21151341.282133214, + "lr": 1.3210548563419845e-05, + "time_sec": 66.74242377281189 + }, + { + "epoch": 140, + "train_loss": 2.9202518330383302, + "train_acc": 0.2648, + "test_loss": 7.060108929443359, + "test_acc": 0.0321, + "lyapunov": null, + "grad_norm": 0.5033375321825745, + "grad_max_sv": 0.1628003478050232, + "grad_min_sv": 9.350477757699705e-09, + "grad_condition": 42538003.149772, + "lr": 1.0926199633097203e-05, + "time_sec": 66.72664403915405 + }, + { + "epoch": 141, + "train_loss": 2.9214018739318846, + "train_acc": 0.26676, + "test_loss": 7.03288666305542, + "test_acc": 0.0373, + "lyapunov": null, + "grad_norm": 0.5040934974077137, + "grad_max_sv": 0.1631232462823391, + "grad_min_sv": 9.429894434753727e-09, + "grad_condition": 22205151.285805613, + "lr": 8.856374635655688e-06, + "time_sec": 66.73880624771118 + }, + { + "epoch": 142, + "train_loss": 2.9171245983886718, + "train_acc": 0.26776, + "test_loss": 7.131447039031983, + "test_acc": 0.0347, + "lyapunov": null, + "grad_norm": 0.502296749693395, + "grad_max_sv": 0.16366422846913337, + "grad_min_sv": 9.319274187069571e-09, + "grad_condition": 23643079.173571, + "lr": 7.001981464747503e-06, + "time_sec": 66.7779552936554 + }, + { + "epoch": 143, + "train_loss": 2.922498332595825, + "train_acc": 0.26552, + "test_loss": 6.954830606079102, + "test_acc": 0.0348, + "lyapunov": null, + "grad_norm": 0.5043546674267846, + "grad_max_sv": 0.1646194864064455, + "grad_min_sv": 9.327249025914419e-09, + "grad_condition": 20109722.273851108, + "lr": 5.3638335185058295e-06, + "time_sec": 66.78727650642395 + }, + { + "epoch": 144, + "train_loss": 2.9214989219665526, + "train_acc": 0.26862, + "test_loss": 7.012627954101562, + "test_acc": 0.0377, + "lyapunov": null, + "grad_norm": 0.5036510560585029, + "grad_max_sv": 0.1648405112326145, + "grad_min_sv": 9.423214848702788e-09, + "grad_condition": 39000025.89670716, + "lr": 3.942649342761114e-06, + "time_sec": 66.78706383705139 + }, + { + "epoch": 145, + "train_loss": 2.922225288314819, + "train_acc": 0.2672, + "test_loss": 6.957889157104492, + "test_acc": 0.0364, + "lyapunov": null, + "grad_norm": 0.503867068026341, + "grad_max_sv": 0.16379656754434108, + "grad_min_sv": 9.359998385562173e-09, + "grad_condition": 77281010.69187385, + "lr": 2.7390523158633524e-06, + "time_sec": 66.7628915309906 + }, + { + "epoch": 146, + "train_loss": 2.9163033376312257, + "train_acc": 0.2685, + "test_loss": 6.855587731933594, + "test_acc": 0.0358, + "lyapunov": null, + "grad_norm": 0.5029204495133565, + "grad_max_sv": 0.16139821223914624, + "grad_min_sv": 9.274698062333719e-09, + "grad_condition": 20548752.94100132, + "lr": 1.7535703752478133e-06, + "time_sec": 66.76251316070557 + }, + { + "epoch": 147, + "train_loss": 2.9199572286987303, + "train_acc": 0.2662, + "test_loss": 7.004822827148438, + "test_acc": 0.0334, + "lyapunov": null, + "grad_norm": 0.5038995262415072, + "grad_max_sv": 0.15897907465696334, + "grad_min_sv": 9.380836815675586e-09, + "grad_condition": 19124324.302936584, + "lr": 9.866357858642196e-07, + "time_sec": 66.77228903770447 + }, + { + "epoch": 148, + "train_loss": 2.9100856079101565, + "train_acc": 0.26856, + "test_loss": 7.008816410064697, + "test_acc": 0.0333, + "lyapunov": null, + "grad_norm": 0.5033801740007838, + "grad_max_sv": 0.16318991631269456, + "grad_min_sv": 9.304624077298429e-09, + "grad_condition": 88163387.15126483, + "lr": 4.38584950570808e-07, + "time_sec": 66.73154377937317 + }, + { + "epoch": 149, + "train_loss": 2.918438820800781, + "train_acc": 0.26988, + "test_loss": 7.183802980041504, + "test_acc": 0.0335, + "lyapunov": null, + "grad_norm": 0.5034594519443074, + "grad_max_sv": 0.16287193521857263, + "grad_min_sv": 9.228533171673492e-09, + "grad_condition": 31684078.48425772, + "lr": 1.096582625772501e-07, + "time_sec": 66.71334385871887 + }, + { + "epoch": 150, + "train_loss": 2.9179681867980958, + "train_acc": 0.26896, + "test_loss": 7.132198828887939, + "test_acc": 0.0374, + "lyapunov": null, + "grad_norm": 0.5039379693049055, + "grad_max_sv": 0.16534604988992213, + "grad_min_sv": 9.358835868777949e-09, + "grad_condition": 24483022.85106538, + "lr": 0.0, + "time_sec": 66.76589560508728 + } + ], + "20": [ + { + "epoch": 1, + "train_loss": 5.21357828704834, + "train_acc": 0.00958, + "test_loss": 4.717830415344238, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 6.028281164907647, + "grad_max_sv": 5.586896324157715, + "grad_min_sv": 8.321505736708091e-08, + "grad_condition": 126391405.93672016, + "lr": 0.0009998903417374227, + "time_sec": 83.75971913337708 + }, + { + "epoch": 2, + "train_loss": 5.002406215209961, + "train_acc": 0.01054, + "test_loss": 4.706539186859131, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 4.942916858382687, + "grad_max_sv": 4.443458986282349, + "grad_min_sv": 6.176679956948483e-08, + "grad_condition": 368514713.27491444, + "lr": 0.0009995614150494292, + "time_sec": 83.72638368606567 + }, + { + "epoch": 3, + "train_loss": 4.941021067657471, + "train_acc": 0.0102, + "test_loss": 4.685369007110595, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 4.551335199238429, + "grad_max_sv": 4.130530917644501, + "grad_min_sv": 5.607447592093085e-08, + "grad_condition": 379082253.2858798, + "lr": 0.0009990133642141358, + "time_sec": 83.7252631187439 + }, + { + "epoch": 4, + "train_loss": 4.901978406677246, + "train_acc": 0.00948, + "test_loss": 4.704164950561523, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 4.292365216371512, + "grad_max_sv": 3.9344047129154207, + "grad_min_sv": 5.476369089318922e-08, + "grad_condition": 96219244.721114, + "lr": 0.0009982464296247522, + "time_sec": 83.74504327774048 + }, + { + "epoch": 5, + "train_loss": 4.875739136657715, + "train_acc": 0.00976, + "test_loss": 4.67882677154541, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 4.102770691913926, + "grad_max_sv": 3.7305591464042664, + "grad_min_sv": 5.105303844121778e-08, + "grad_condition": 114422829.17041938, + "lr": 0.0009972609476841367, + "time_sec": 83.7535228729248 + }, + { + "epoch": 6, + "train_loss": 4.854646638641357, + "train_acc": 0.01, + "test_loss": 4.6779319816589355, + "test_acc": 0.0094, + "lyapunov": null, + "grad_norm": 3.9533090018879022, + "grad_max_sv": 3.569680255651474, + "grad_min_sv": 4.9375477451096826e-08, + "grad_condition": 120982864.11796215, + "lr": 0.000996057350657239, + "time_sec": 83.76437997817993 + }, + { + "epoch": 7, + "train_loss": 4.843388534240723, + "train_acc": 0.0093, + "test_loss": 4.688051298522949, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 3.808254303294448, + "grad_max_sv": 3.401720005273819, + "grad_min_sv": 4.769865569742571e-08, + "grad_condition": 124322938.54178014, + "lr": 0.000994636166481494, + "time_sec": 83.73754358291626 + }, + { + "epoch": 8, + "train_loss": 4.831099078216552, + "train_acc": 0.0098, + "test_loss": 4.686168608093261, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 3.638633817460268, + "grad_max_sv": 3.29349827170372, + "grad_min_sv": 4.562366222038428e-08, + "grad_condition": 130991249.85200353, + "lr": 0.0009929980185352525, + "time_sec": 83.75114607810974 + }, + { + "epoch": 9, + "train_loss": 4.8127050201416015, + "train_acc": 0.01066, + "test_loss": 4.702382767486572, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 3.500656504897414, + "grad_max_sv": 3.2044365644454955, + "grad_min_sv": 4.392227098831691e-08, + "grad_condition": 228917141.42878217, + "lr": 0.0009911436253643444, + "time_sec": 83.75008654594421 + }, + { + "epoch": 10, + "train_loss": 4.809432870025635, + "train_acc": 0.00958, + "test_loss": 4.662561440277099, + "test_acc": 0.0105, + "lyapunov": null, + "grad_norm": 3.3981948131519792, + "grad_max_sv": 3.0618119478225707, + "grad_min_sv": 4.221159614070658e-08, + "grad_condition": 89285987.82360582, + "lr": 0.0009890738003669028, + "time_sec": 83.75357627868652 + }, + { + "epoch": 11, + "train_loss": 4.788434708251953, + "train_acc": 0.01052, + "test_loss": 4.672326850891113, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 3.239567320080417, + "grad_max_sv": 2.9396412312984466, + "grad_min_sv": 3.992155273024878e-08, + "grad_condition": 91783422.62374839, + "lr": 0.00098678945143658, + "time_sec": 83.73260736465454 + }, + { + "epoch": 12, + "train_loss": 4.779874237365723, + "train_acc": 0.01008, + "test_loss": 4.67001594543457, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 3.103566946411183, + "grad_max_sv": 2.861602544784546, + "grad_min_sv": 3.936066093057633e-08, + "grad_condition": 119851949.4663836, + "lr": 0.0009842915805643154, + "time_sec": 83.817462682724 + }, + { + "epoch": 13, + "train_loss": 4.770841501159668, + "train_acc": 0.00992, + "test_loss": 4.656426369476319, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 3.0009960370081323, + "grad_max_sv": 2.656493490934372, + "grad_min_sv": 3.707013069217946e-08, + "grad_condition": 498107586.22724324, + "lr": 0.000981581283398829, + "time_sec": 83.74097108840942 + }, + { + "epoch": 14, + "train_loss": 4.756785203857422, + "train_acc": 0.01042, + "test_loss": 4.675232955932617, + "test_acc": 0.0106, + "lyapunov": null, + "grad_norm": 2.8493309861575318, + "grad_max_sv": 2.5364737689495085, + "grad_min_sv": 3.586032745195311e-08, + "grad_condition": 113107959.8123773, + "lr": 0.0009786597487660333, + "time_sec": 83.73817372322083 + }, + { + "epoch": 15, + "train_loss": 4.754773846588135, + "train_acc": 0.00998, + "test_loss": 4.659816702270508, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 2.754495953066911, + "grad_max_sv": 2.477891582250595, + "grad_min_sv": 3.409575287799394e-08, + "grad_condition": 161602481.60469836, + "lr": 0.0009755282581475766, + "time_sec": 83.75961685180664 + }, + { + "epoch": 16, + "train_loss": 4.743301128997802, + "train_acc": 0.0101, + "test_loss": 4.649964485168457, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 2.6595920331694725, + "grad_max_sv": 2.3447550773620605, + "grad_min_sv": 3.222141393699474e-08, + "grad_condition": 183792258.0998055, + "lr": 0.0009721881851187403, + "time_sec": 83.78172135353088 + }, + { + "epoch": 17, + "train_loss": 4.733358394927978, + "train_acc": 0.01016, + "test_loss": 4.642168313598633, + "test_acc": 0.0103, + "lyapunov": null, + "grad_norm": 2.5896272478360634, + "grad_max_sv": 2.3136182010173796, + "grad_min_sv": 3.172710767995745e-08, + "grad_condition": 117247363.48613138, + "lr": 0.0009686409947459456, + "time_sec": 83.75683784484863 + }, + { + "epoch": 18, + "train_loss": 4.729640578918457, + "train_acc": 0.0106, + "test_loss": 4.654958557128906, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 2.5388744373274417, + "grad_max_sv": 2.2171274721622467, + "grad_min_sv": 3.0159331015910953e-08, + "grad_condition": 101838677.71373975, + "lr": 0.0009648882429441254, + "time_sec": 83.75490856170654 + }, + { + "epoch": 19, + "train_loss": 4.723793775634766, + "train_acc": 0.0104, + "test_loss": 4.653732388305664, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 2.4692592532468662, + "grad_max_sv": 2.1681156396865844, + "grad_min_sv": 2.978641970435847e-08, + "grad_condition": 233798757.5515837, + "lr": 0.00096093157579425, + "time_sec": 83.76724123954773 + }, + { + "epoch": 20, + "train_loss": 4.718724663238525, + "train_acc": 0.0102, + "test_loss": 4.649697755432129, + "test_acc": 0.0097, + "lyapunov": null, + "grad_norm": 2.427591699320917, + "grad_max_sv": 2.1466651976108553, + "grad_min_sv": 2.9465831946628997e-08, + "grad_condition": 88939856.59831895, + "lr": 0.0009567727288213001, + "time_sec": 83.74052405357361 + }, + { + "epoch": 21, + "train_loss": 4.712672980194092, + "train_acc": 0.01012, + "test_loss": 4.647871576690674, + "test_acc": 0.0094, + "lyapunov": null, + "grad_norm": 2.357057284901842, + "grad_max_sv": 2.1047394454479216, + "grad_min_sv": 2.8490478837239763e-08, + "grad_condition": 91579762.44536874, + "lr": 0.0009524135262330095, + "time_sec": 83.75857543945312 + }, + { + "epoch": 22, + "train_loss": 4.706978241882324, + "train_acc": 0.01024, + "test_loss": 4.648735240936279, + "test_acc": 0.0085, + "lyapunov": null, + "grad_norm": 2.2900045512493366, + "grad_max_sv": 2.081936264038086, + "grad_min_sv": 2.8080869171609457e-08, + "grad_condition": 136805304.6805451, + "lr": 0.0009478558801197061, + "time_sec": 83.75628423690796 + }, + { + "epoch": 23, + "train_loss": 4.700225740966797, + "train_acc": 0.00964, + "test_loss": 4.647530085754394, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 2.2107587083430276, + "grad_max_sv": 1.988323137164116, + "grad_min_sv": 2.6475746447984784e-08, + "grad_condition": 164008669.76777038, + "lr": 0.000943101789615607, + "time_sec": 83.77352237701416 + }, + { + "epoch": 24, + "train_loss": 4.692355620117188, + "train_acc": 0.0096, + "test_loss": 4.637314375305176, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 2.058860964349953, + "grad_max_sv": 1.8445529341697693, + "grad_min_sv": 2.4344878213344857e-08, + "grad_condition": 86439388.46384792, + "lr": 0.0009381533400219313, + "time_sec": 83.79498553276062 + }, + { + "epoch": 25, + "train_loss": 4.681464791564942, + "train_acc": 0.00928, + "test_loss": 4.623963987731933, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 1.887935665727307, + "grad_max_sv": 1.675812867283821, + "grad_min_sv": 2.197329014158589e-08, + "grad_condition": 136861974.56893334, + "lr": 0.0009330127018922189, + "time_sec": 83.75438261032104 + }, + { + "epoch": 26, + "train_loss": 4.666114781646728, + "train_acc": 0.00968, + "test_loss": 4.622957837677002, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 1.6987317795206707, + "grad_max_sv": 1.5008918464183807, + "grad_min_sv": 1.8850404182035874e-08, + "grad_condition": 396848763.8507156, + "lr": 0.000927682130080253, + "time_sec": 83.80677318572998 + }, + { + "epoch": 27, + "train_loss": 4.656886034545899, + "train_acc": 0.0103, + "test_loss": 4.618579483032226, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 1.49568981841554, + "grad_max_sv": 1.3568953216075896, + "grad_min_sv": 1.566217179560514e-08, + "grad_condition": 103503015.49660948, + "lr": 0.0009221639627510072, + "time_sec": 83.78064775466919 + }, + { + "epoch": 28, + "train_loss": 4.643399444732666, + "train_acc": 0.01056, + "test_loss": 4.614220301055909, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 1.3088039077662417, + "grad_max_sv": 1.1537246599793434, + "grad_min_sv": 1.2267503651797185e-08, + "grad_condition": 114843460.24858093, + "lr": 0.0009164606203550494, + "time_sec": 83.7792694568634 + }, + { + "epoch": 29, + "train_loss": 4.633547606048584, + "train_acc": 0.00896, + "test_loss": 4.611564260101319, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 1.0933490764935123, + "grad_max_sv": 0.9679391533136368, + "grad_min_sv": 7.642074995560522e-09, + "grad_condition": 804214751.6294578, + "lr": 0.0009105746045668516, + "time_sec": 83.83227157592773 + }, + { + "epoch": 30, + "train_loss": 4.624774245300293, + "train_acc": 0.00964, + "test_loss": 4.608921669769287, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.8837855695002744, + "grad_max_sv": 0.773915484547615, + "grad_min_sv": 2.366957635572509e-11, + "grad_condition": 237910863465.00665, + "lr": 0.0009045084971874733, + "time_sec": 83.80770468711853 + }, + { + "epoch": 31, + "train_loss": 4.618612337646485, + "train_acc": 0.01032, + "test_loss": 4.607751036071777, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.7415257832044893, + "grad_max_sv": 0.644972386956215, + "grad_min_sv": 3.660935201474329e-12, + "grad_condition": 261782379031.45782, + "lr": 0.0008982649590120977, + "time_sec": 83.79283952713013 + }, + { + "epoch": 32, + "train_loss": 4.616099582977295, + "train_acc": 0.0089, + "test_loss": 4.606554626464844, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.6524091899037507, + "grad_max_sv": 0.5655980415642261, + "grad_min_sv": 1.3079153537243355e-13, + "grad_condition": 507838982675.7344, + "lr": 0.0008918467286629196, + "time_sec": 83.77927327156067 + }, + { + "epoch": 33, + "train_loss": 4.613166402130127, + "train_acc": 0.00916, + "test_loss": 4.606206927490234, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.5720100552333853, + "grad_max_sv": 0.4838749781250954, + "grad_min_sv": 7.656531138726084e-14, + "grad_condition": 452556546253.1081, + "lr": 0.0008852566213878943, + "time_sec": 83.7956645488739 + }, + { + "epoch": 34, + "train_loss": 4.610275639953613, + "train_acc": 0.0096, + "test_loss": 4.605738200378418, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.4266452221992571, + "grad_max_sv": 0.36331126987934115, + "grad_min_sv": 5.44079975167954e-15, + "grad_condition": 361256197137.27747, + "lr": 0.000878497527825878, + "time_sec": 83.78154063224792 + }, + { + "epoch": 35, + "train_loss": 4.608961817626954, + "train_acc": 0.01014, + "test_loss": 4.605575282287598, + "test_acc": 0.0104, + "lyapunov": null, + "grad_norm": 0.32905926875005, + "grad_max_sv": 0.2839593421667814, + "grad_min_sv": 8.941027107756884e-17, + "grad_condition": 283933784815.36444, + "lr": 0.000871572412738697, + "time_sec": 83.76054668426514 + }, + { + "epoch": 36, + "train_loss": 4.608401114196777, + "train_acc": 0.00938, + "test_loss": 4.605348924255371, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 0.2743447711162471, + "grad_max_sv": 0.2315550185739994, + "grad_min_sv": 2.4262184593062427e-31, + "grad_condition": 231555018573.99936, + "lr": 0.0008644843137107055, + "time_sec": 83.76748013496399 + }, + { + "epoch": 37, + "train_loss": 4.6074152955627445, + "train_acc": 0.01014, + "test_loss": 4.605235860443115, + "test_acc": 0.0106, + "lyapunov": null, + "grad_norm": 0.22829204328314687, + "grad_max_sv": 0.19001176171004772, + "grad_min_sv": 0.0, + "grad_condition": 190011761710.0477, + "lr": 0.0008572363398164014, + "time_sec": 83.82857966423035 + }, + { + "epoch": 38, + "train_loss": 4.6074430204772945, + "train_acc": 0.00846, + "test_loss": 4.605340163421631, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2131689057955099, + "grad_max_sv": 0.17414189949631692, + "grad_min_sv": 0.0, + "grad_condition": 174141899496.3169, + "lr": 0.0008498316702566826, + "time_sec": 83.7941620349884 + }, + { + "epoch": 39, + "train_loss": 4.608160193786621, + "train_acc": 0.00878, + "test_loss": 4.605639952087403, + "test_acc": 0.009, + "lyapunov": null, + "grad_norm": 0.24317456921386985, + "grad_max_sv": 0.2019160557538271, + "grad_min_sv": 0.0, + "grad_condition": 201916055753.8271, + "lr": 0.0008422735529643442, + "time_sec": 83.80830645561218 + }, + { + "epoch": 40, + "train_loss": 4.606921190032959, + "train_acc": 0.00868, + "test_loss": 4.605219190216064, + "test_acc": 0.0097, + "lyapunov": null, + "grad_norm": 0.17887802551259574, + "grad_max_sv": 0.14444960467517376, + "grad_min_sv": 0.0, + "grad_condition": 144449604675.17377, + "lr": 0.0008345653031794289, + "time_sec": 83.76973342895508 + }, + { + "epoch": 41, + "train_loss": 4.606422245941162, + "train_acc": 0.00834, + "test_loss": 4.605222705078125, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.17289778065418965, + "grad_max_sv": 0.13819168899208306, + "grad_min_sv": 0.0, + "grad_condition": 138191688992.08307, + "lr": 0.0008267103019950526, + "time_sec": 83.74321436882019 + }, + { + "epoch": 42, + "train_loss": 4.606239071655273, + "train_acc": 0.01008, + "test_loss": 4.605207167053223, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.16994723888320276, + "grad_max_sv": 0.13730969540774823, + "grad_min_sv": 0.0, + "grad_condition": 137309695407.74821, + "lr": 0.0008187119948743447, + "time_sec": 83.7667281627655 + }, + { + "epoch": 43, + "train_loss": 4.606040752410888, + "train_acc": 0.00878, + "test_loss": 4.605204765319824, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.14038728911483775, + "grad_max_sv": 0.10907853152602912, + "grad_min_sv": 0.0, + "grad_condition": 109078531526.0291, + "lr": 0.000810573890139155, + "time_sec": 83.71949076652527 + }, + { + "epoch": 44, + "train_loss": 4.605822370910644, + "train_acc": 0.00892, + "test_loss": 4.605195722198486, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.11252097462442588, + "grad_max_sv": 0.05359459263272583, + "grad_min_sv": 0.0, + "grad_condition": 53594592632.72584, + "lr": 0.0008022995574311873, + "time_sec": 83.74685764312744 + }, + { + "epoch": 45, + "train_loss": 4.605744844055176, + "train_acc": 0.0091, + "test_loss": 4.605188182067871, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.09696133635132191, + "grad_max_sv": 0.02572248433716595, + "grad_min_sv": 0.0, + "grad_condition": 25722484337.16595, + "lr": 0.0007938926261462363, + "time_sec": 83.688485622406 + }, + { + "epoch": 46, + "train_loss": 4.605597140960693, + "train_acc": 0.00844, + "test_loss": 4.605181010437012, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.09018030151754076, + "grad_max_sv": 0.008408381370827556, + "grad_min_sv": 0.0, + "grad_condition": 8408381370.827555, + "lr": 0.0007853567838422158, + "time_sec": 83.6915934085846 + }, + { + "epoch": 47, + "train_loss": 4.605502964324951, + "train_acc": 0.00962, + "test_loss": 4.605176095581054, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.08904470683636952, + "grad_max_sv": 0.006156692747026682, + "grad_min_sv": 0.0, + "grad_condition": 6156692747.026682, + "lr": 0.0007766957746216719, + "time_sec": 83.68823766708374 + }, + { + "epoch": 48, + "train_loss": 4.605539189758301, + "train_acc": 0.00832, + "test_loss": 4.605174793243409, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.08881260926985375, + "grad_max_sv": 0.005750873032957316, + "grad_min_sv": 0.0, + "grad_condition": 5750873032.957315, + "lr": 0.0007679133974894982, + "time_sec": 83.71515822410583 + }, + { + "epoch": 49, + "train_loss": 4.605639272460937, + "train_acc": 0.00838, + "test_loss": 4.605174536132813, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.09166121492862447, + "grad_max_sv": 0.012213990930467844, + "grad_min_sv": 0.0, + "grad_condition": 12213990930.467844, + "lr": 0.000759013504686565, + "time_sec": 83.6816132068634 + }, + { + "epoch": 50, + "train_loss": 4.605558903808594, + "train_acc": 0.00886, + "test_loss": 4.605173831939697, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.09052173034897262, + "grad_max_sv": 0.015108420280739665, + "grad_min_sv": 0.0, + "grad_condition": 15108420280.739666, + "lr": 0.0007499999999999998, + "time_sec": 83.65550971031189 + }, + { + "epoch": 51, + "train_loss": 4.606378012390136, + "train_acc": 0.00982, + "test_loss": 4.605191948699951, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.13316554004595244, + "grad_max_sv": 0.08486739061772823, + "grad_min_sv": 5.639984459982783e-14, + "grad_condition": 78828935747.45195, + "lr": 0.0007408768370508575, + "time_sec": 83.73471426963806 + }, + { + "epoch": 52, + "train_loss": 4.548985960083008, + "train_acc": 0.01534, + "test_loss": 6.090479849243164, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.31291438549111006, + "grad_max_sv": 0.21921597719192504, + "grad_min_sv": 1.8728595782364096e-11, + "grad_condition": 72581711957.44724, + "lr": 0.0007316480175599307, + "time_sec": 83.83673882484436 + }, + { + "epoch": 53, + "train_loss": 4.517283289031982, + "train_acc": 0.01706, + "test_loss": 6.098530506896973, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.298946556890386, + "grad_max_sv": 0.21190068013966085, + "grad_min_sv": 3.1303262042079113e-12, + "grad_condition": 83525509037.16917, + "lr": 0.0007223175895924635, + "time_sec": 83.79953289031982 + }, + { + "epoch": 54, + "train_loss": 4.506922316894531, + "train_acc": 0.01826, + "test_loss": 6.029461811828614, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2872016386861535, + "grad_max_sv": 0.2001660715788603, + "grad_min_sv": 2.1477832165699736e-12, + "grad_condition": 93342369625.0347, + "lr": 0.0007128896457825361, + "time_sec": 83.83765316009521 + }, + { + "epoch": 55, + "train_loss": 4.500352125549316, + "train_acc": 0.01822, + "test_loss": 6.254561413574219, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2840675312383032, + "grad_max_sv": 0.19858233965933322, + "grad_min_sv": 2.2369640777182348e-12, + "grad_condition": 84452645725.82004, + "lr": 0.0007033683215378998, + "time_sec": 83.87366318702698 + }, + { + "epoch": 56, + "train_loss": 4.494334082946778, + "train_acc": 0.01898, + "test_loss": 6.176936679077149, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.28473204888904313, + "grad_max_sv": 0.20153928063809873, + "grad_min_sv": 2.5336075244057393e-12, + "grad_condition": 84473652713.76613, + "lr": 0.0006937577932260512, + "time_sec": 83.85195803642273 + }, + { + "epoch": 57, + "train_loss": 4.491042407073975, + "train_acc": 0.01962, + "test_loss": 6.597558038330078, + "test_acc": 0.009, + "lyapunov": null, + "grad_norm": 0.27666587557698485, + "grad_max_sv": 0.19496511965990065, + "grad_min_sv": 2.6691194986502985e-12, + "grad_condition": 76747509393.5625, + "lr": 0.0006840622763423388, + "time_sec": 83.8267707824707 + }, + { + "epoch": 58, + "train_loss": 4.48429320526123, + "train_acc": 0.0202, + "test_loss": 6.6381898071289065, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2720732789744726, + "grad_max_sv": 0.189533968269825, + "grad_min_sv": 2.6686336090421275e-12, + "grad_condition": 76958091069.54593, + "lr": 0.0006742860236609073, + "time_sec": 83.81882667541504 + }, + { + "epoch": 59, + "train_loss": 4.479027882080078, + "train_acc": 0.02112, + "test_loss": 6.593468840026856, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.28013135845208736, + "grad_max_sv": 0.1970901783555746, + "grad_min_sv": 3.427181970598606e-12, + "grad_condition": 77152467146.4727, + "lr": 0.0006644333233692913, + "time_sec": 83.80582737922668 + }, + { + "epoch": 60, + "train_loss": 4.455229897613525, + "train_acc": 0.02522, + "test_loss": 7.094032968139649, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2984456215457652, + "grad_max_sv": 0.20514705888926982, + "grad_min_sv": 1.3113472435618547e-11, + "grad_condition": 46710044351.44385, + "lr": 0.0006545084971874734, + "time_sec": 83.83238410949707 + }, + { + "epoch": 61, + "train_loss": 4.434012725677491, + "train_acc": 0.02664, + "test_loss": 7.727159403991699, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.31670091276798196, + "grad_max_sv": 0.22147773541510105, + "grad_min_sv": 2.0530699328249547e-10, + "grad_condition": 23070127911.0107, + "lr": 0.0006445158984722354, + "time_sec": 83.8679609298706 + }, + { + "epoch": 62, + "train_loss": 4.419747852783203, + "train_acc": 0.02636, + "test_loss": 7.459843544006348, + "test_acc": 0.0093, + "lyapunov": null, + "grad_norm": 0.3192666281191851, + "grad_max_sv": 0.22665422596037388, + "grad_min_sv": 2.7867287440722047e-10, + "grad_condition": 28668691596.510204, + "lr": 0.0006344599103076324, + "time_sec": 83.7790117263794 + }, + { + "epoch": 63, + "train_loss": 4.410167588043213, + "train_acc": 0.0297, + "test_loss": 6.561855883789063, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.30978499796993897, + "grad_max_sv": 0.21358359269797803, + "grad_min_sv": 1.0904945902848835e-10, + "grad_condition": 28758391079.590137, + "lr": 0.0006243449435824269, + "time_sec": 83.8552029132843 + }, + { + "epoch": 64, + "train_loss": 4.398182756958008, + "train_acc": 0.02932, + "test_loss": 7.0834544662475585, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.2981823968653719, + "grad_max_sv": 0.2038045074790716, + "grad_min_sv": 4.896934048336616e-10, + "grad_condition": 6480139621.348356, + "lr": 0.0006141754350553275, + "time_sec": 83.81044340133667 + }, + { + "epoch": 65, + "train_loss": 4.39155801651001, + "train_acc": 0.0299, + "test_loss": 6.743014807128906, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.2915326524043412, + "grad_max_sv": 0.19417541958391665, + "grad_min_sv": 1.18620941511223e-09, + "grad_condition": 1528876877.7676086, + "lr": 0.0006039558454088793, + "time_sec": 83.8169424533844 + }, + { + "epoch": 66, + "train_loss": 4.383871633453369, + "train_acc": 0.03122, + "test_loss": 6.343855700683593, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2920918221308499, + "grad_max_sv": 0.19423219338059425, + "grad_min_sv": 1.1915352001942714e-09, + "grad_condition": 890331184.9718037, + "lr": 0.000593690657292862, + "time_sec": 83.8088231086731 + }, + { + "epoch": 67, + "train_loss": 4.380996891784668, + "train_acc": 0.03214, + "test_loss": 6.3810079963684085, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.28877371474045604, + "grad_max_sv": 0.193271204829216, + "grad_min_sv": 1.6600884500828778e-09, + "grad_condition": 372383180.6138096, + "lr": 0.0005833843733580507, + "time_sec": 83.78432846069336 + }, + { + "epoch": 68, + "train_loss": 4.376522983703613, + "train_acc": 0.0316, + "test_loss": 6.291935075378418, + "test_acc": 0.0103, + "lyapunov": null, + "grad_norm": 0.2862661185936042, + "grad_max_sv": 0.18648179918527602, + "grad_min_sv": 1.468030542869361e-09, + "grad_condition": 2139805441.5710232, + "lr": 0.0005730415142812054, + "time_sec": 83.7891354560852 + }, + { + "epoch": 69, + "train_loss": 4.372224440612793, + "train_acc": 0.03352, + "test_loss": 6.681443427276611, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2796495478797956, + "grad_max_sv": 0.18046599105000496, + "grad_min_sv": 1.2168376441450828e-09, + "grad_condition": 721985908.0902131, + "lr": 0.0005626666167821517, + "time_sec": 83.80607604980469 + }, + { + "epoch": 70, + "train_loss": 4.369470675811767, + "train_acc": 0.03222, + "test_loss": 6.483533153533935, + "test_acc": 0.0103, + "lyapunov": null, + "grad_norm": 0.28218706578232045, + "grad_max_sv": 0.18038711175322533, + "grad_min_sv": 1.6886237430915884e-09, + "grad_condition": 284801174.2502399, + "lr": 0.0005522642316338265, + "time_sec": 83.80915093421936 + }, + { + "epoch": 71, + "train_loss": 4.36190840423584, + "train_acc": 0.03452, + "test_loss": 6.448402415466308, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.27607671132097, + "grad_max_sv": 0.17782694809138774, + "grad_min_sv": 1.594215062207787e-09, + "grad_condition": 2097996064.0572019, + "lr": 0.0005418389216661573, + "time_sec": 83.82332372665405 + }, + { + "epoch": 72, + "train_loss": 4.354908424377442, + "train_acc": 0.03596, + "test_loss": 6.558257571411133, + "test_acc": 0.0115, + "lyapunov": null, + "grad_norm": 0.2756995722839523, + "grad_max_sv": 0.16976643167436123, + "grad_min_sv": 1.6113121665065067e-09, + "grad_condition": 277986841.7750164, + "lr": 0.0005313952597646563, + "time_sec": 83.79193758964539 + }, + { + "epoch": 73, + "train_loss": 4.354222341156006, + "train_acc": 0.03476, + "test_loss": 6.309269012451172, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.26842599931569244, + "grad_max_sv": 0.1654328290373087, + "grad_min_sv": 1.5355291571898453e-09, + "grad_condition": 494546718.69761646, + "lr": 0.0005209378268645994, + "time_sec": 83.83719944953918 + }, + { + "epoch": 74, + "train_loss": 4.348915999755859, + "train_acc": 0.03656, + "test_loss": 6.48945037689209, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.2721751559070442, + "grad_max_sv": 0.1733177002519369, + "grad_min_sv": 1.6353850840794179e-09, + "grad_condition": 4394906218.143788, + "lr": 0.0005104712099416781, + "time_sec": 83.87231683731079 + }, + { + "epoch": 75, + "train_loss": 4.344389753723145, + "train_acc": 0.0362, + "test_loss": 6.536355171203613, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.2762971427042467, + "grad_max_sv": 0.17327322103083134, + "grad_min_sv": 1.6745484680748961e-09, + "grad_condition": 296861622.65127766, + "lr": 0.0004999999999999996, + "time_sec": 83.7963707447052 + }, + { + "epoch": 76, + "train_loss": 4.336879919433594, + "train_acc": 0.0385, + "test_loss": 6.207801509094239, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.27617831363540746, + "grad_max_sv": 0.17525496631860732, + "grad_min_sv": 1.712406004191272e-09, + "grad_condition": 355194777.2860588, + "lr": 0.0004895287900583212, + "time_sec": 83.78706455230713 + }, + { + "epoch": 77, + "train_loss": 4.334291800689697, + "train_acc": 0.03816, + "test_loss": 5.998904524230957, + "test_acc": 0.0103, + "lyapunov": null, + "grad_norm": 0.27646822759404405, + "grad_max_sv": 0.17449169531464576, + "grad_min_sv": 1.7281031508770487e-09, + "grad_condition": 617370975.1793921, + "lr": 0.0004790621731353997, + "time_sec": 83.79909944534302 + }, + { + "epoch": 78, + "train_loss": 4.33249505783081, + "train_acc": 0.0375, + "test_loss": 6.079836444854736, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.28240731905667205, + "grad_max_sv": 0.17906831130385398, + "grad_min_sv": 1.832980646302232e-09, + "grad_condition": 570608704.9054655, + "lr": 0.000468604740235343, + "time_sec": 83.78829288482666 + }, + { + "epoch": 79, + "train_loss": 4.327211993713379, + "train_acc": 0.0372, + "test_loss": 6.010349069976806, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.26579955843267283, + "grad_max_sv": 0.16206405386328698, + "grad_min_sv": 1.8076382385400804e-09, + "grad_condition": 680257720.1741323, + "lr": 0.00045816107833384175, + "time_sec": 83.79378890991211 + }, + { + "epoch": 80, + "train_loss": 4.325840251617431, + "train_acc": 0.0399, + "test_loss": 6.453493260192871, + "test_acc": 0.0104, + "lyapunov": null, + "grad_norm": 0.2678340843927439, + "grad_max_sv": 0.16088486537337304, + "grad_min_sv": 1.8230197001067525e-09, + "grad_condition": 491813566.00292075, + "lr": 0.0004477357683661729, + "time_sec": 83.77716493606567 + }, + { + "epoch": 81, + "train_loss": 4.324064207763672, + "train_acc": 0.03872, + "test_loss": 6.066691808319092, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.27284601483817317, + "grad_max_sv": 0.1656409576535225, + "grad_min_sv": 1.966192943528289e-09, + "grad_condition": 120565010.54568236, + "lr": 0.00043733338321784746, + "time_sec": 83.78050255775452 + }, + { + "epoch": 82, + "train_loss": 4.3167226469421385, + "train_acc": 0.04004, + "test_loss": 6.479253450012207, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.266468676835963, + "grad_max_sv": 0.16226925253868102, + "grad_min_sv": 1.8786357255094232e-09, + "grad_condition": 832620477.3818345, + "lr": 0.0004269584857187939, + "time_sec": 83.77594256401062 + }, + { + "epoch": 83, + "train_loss": 4.314026451263428, + "train_acc": 0.04066, + "test_loss": 6.491674769592285, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2618645063357135, + "grad_max_sv": 0.15328656397759916, + "grad_min_sv": 1.8954250842473375e-09, + "grad_condition": 324046081.6731597, + "lr": 0.0004166156266419484, + "time_sec": 83.79970407485962 + }, + { + "epoch": 84, + "train_loss": 4.307831993713379, + "train_acc": 0.04056, + "test_loss": 6.641959228515625, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 0.2686563253168225, + "grad_max_sv": 0.16125894524157047, + "grad_min_sv": 2.0374150564578254e-09, + "grad_condition": 160522665.97837877, + "lr": 0.0004063093427071373, + "time_sec": 83.82930493354797 + }, + { + "epoch": 85, + "train_loss": 4.308941020507812, + "train_acc": 0.0418, + "test_loss": 6.508579216003418, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 0.27160717763788633, + "grad_max_sv": 0.1655819222331047, + "grad_min_sv": 2.023065160186577e-09, + "grad_condition": 120462376.21506557, + "lr": 0.0003960441545911199, + "time_sec": 83.7900025844574 + }, + { + "epoch": 86, + "train_loss": 4.304050233764649, + "train_acc": 0.03994, + "test_loss": 6.396804527282715, + "test_acc": 0.0107, + "lyapunov": null, + "grad_norm": 0.2729810873547816, + "grad_max_sv": 0.16440293304622172, + "grad_min_sv": 2.151508744253905e-09, + "grad_condition": 132130608.9556226, + "lr": 0.0003858245649446718, + "time_sec": 83.80140709877014 + }, + { + "epoch": 87, + "train_loss": 4.299405968475342, + "train_acc": 0.04196, + "test_loss": 6.600989144897461, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2695479470251096, + "grad_max_sv": 0.1591991312801838, + "grad_min_sv": 1.9906060319194175e-09, + "grad_condition": 119698677.25192289, + "lr": 0.00037565505641757235, + "time_sec": 83.82861065864563 + }, + { + "epoch": 88, + "train_loss": 4.301599495544433, + "train_acc": 0.04232, + "test_loss": 6.554762725830078, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2647703969850391, + "grad_max_sv": 0.15560886412858962, + "grad_min_sv": 1.9747980002995937e-09, + "grad_condition": 122983202.1326602, + "lr": 0.00036554008969236695, + "time_sec": 83.82960343360901 + }, + { + "epoch": 89, + "train_loss": 4.297747989654541, + "train_acc": 0.04348, + "test_loss": 6.357062748718262, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.26734470016505596, + "grad_max_sv": 0.15722180251032114, + "grad_min_sv": 1.981925610086699e-09, + "grad_condition": 100233762.481437, + "lr": 0.0003554841015277638, + "time_sec": 83.85219097137451 + }, + { + "epoch": 90, + "train_loss": 4.294689517669678, + "train_acc": 0.04346, + "test_loss": 6.4904538467407225, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.26448991829060364, + "grad_max_sv": 0.1514646142721176, + "grad_min_sv": 2.0380848893969404e-09, + "grad_condition": 115297831.8608543, + "lr": 0.000345491502812526, + "time_sec": 83.78560423851013 + }, + { + "epoch": 91, + "train_loss": 4.288459105834961, + "train_acc": 0.04228, + "test_loss": 6.363833187866211, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2716021382283501, + "grad_max_sv": 0.16101026125252246, + "grad_min_sv": 2.0529807125135857e-09, + "grad_condition": 111422037.25124231, + "lr": 0.0003355666766307081, + "time_sec": 83.80491185188293 + }, + { + "epoch": 92, + "train_loss": 4.2877139868164065, + "train_acc": 0.04416, + "test_loss": 6.387586988067627, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2675364217657968, + "grad_max_sv": 0.1556147363036871, + "grad_min_sv": 2.072003611047757e-09, + "grad_condition": 100163844.77093126, + "lr": 0.00032571397633909225, + "time_sec": 83.80176591873169 + }, + { + "epoch": 93, + "train_loss": 4.286743914489746, + "train_acc": 0.04442, + "test_loss": 6.614454327392578, + "test_acc": 0.0097, + "lyapunov": null, + "grad_norm": 0.2696169338715711, + "grad_max_sv": 0.1587842211127281, + "grad_min_sv": 2.1451849420948964e-09, + "grad_condition": 175440678.68888003, + "lr": 0.00031593772365766094, + "time_sec": 83.81897950172424 + }, + { + "epoch": 94, + "train_loss": 4.281456643066406, + "train_acc": 0.04426, + "test_loss": 6.365528283691407, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.27294877944821766, + "grad_max_sv": 0.16244313083589076, + "grad_min_sv": 2.1448280498881368e-09, + "grad_condition": 93958550.86214396, + "lr": 0.0003062422067739483, + "time_sec": 83.78250980377197 + }, + { + "epoch": 95, + "train_loss": 4.280488971710205, + "train_acc": 0.04608, + "test_loss": 6.470796231842041, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 0.273056993639001, + "grad_max_sv": 0.16184688359498978, + "grad_min_sv": 2.2206805599250813e-09, + "grad_condition": 185414259.9896317, + "lr": 0.00029663167846209965, + "time_sec": 83.82439541816711 + }, + { + "epoch": 96, + "train_loss": 4.279716082458496, + "train_acc": 0.04314, + "test_loss": 6.52447133026123, + "test_acc": 0.0093, + "lyapunov": null, + "grad_norm": 0.27442923945512043, + "grad_max_sv": 0.1630928661674261, + "grad_min_sv": 2.3233001415073897e-09, + "grad_condition": 103462231.52886583, + "lr": 0.00028711035421746345, + "time_sec": 83.83807969093323 + }, + { + "epoch": 97, + "train_loss": 4.274856643218994, + "train_acc": 0.04572, + "test_loss": 6.772166311645508, + "test_acc": 0.0109, + "lyapunov": null, + "grad_norm": 0.2771278283509764, + "grad_max_sv": 0.17104111909866332, + "grad_min_sv": 2.4184343061159352e-09, + "grad_condition": 271014828.3038153, + "lr": 0.00027768241040753615, + "time_sec": 83.85514092445374 + }, + { + "epoch": 98, + "train_loss": 4.2779387315368655, + "train_acc": 0.04608, + "test_loss": 6.668636999511719, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.27463112819076785, + "grad_max_sv": 0.16144732832908631, + "grad_min_sv": 2.2677979229649758e-09, + "grad_condition": 4419130655.463402, + "lr": 0.00026835198244006903, + "time_sec": 83.83084058761597 + }, + { + "epoch": 99, + "train_loss": 4.276140930480957, + "train_acc": 0.04544, + "test_loss": 6.88837735748291, + "test_acc": 0.0107, + "lyapunov": null, + "grad_norm": 0.26886350994697167, + "grad_max_sv": 0.15219354666769505, + "grad_min_sv": 2.2166218230715296e-09, + "grad_condition": 103754705.283932, + "lr": 0.0002591231629491421, + "time_sec": 83.79713916778564 + }, + { + "epoch": 100, + "train_loss": 4.273054361877441, + "train_acc": 0.04564, + "test_loss": 6.783898326873779, + "test_acc": 0.0106, + "lyapunov": null, + "grad_norm": 0.26691489320326656, + "grad_max_sv": 0.14936545640230178, + "grad_min_sv": 2.2781338981925358e-09, + "grad_condition": 87358992.35708968, + "lr": 0.0002499999999999997, + "time_sec": 83.80319023132324 + }, + { + "epoch": 101, + "train_loss": 4.26914766998291, + "train_acc": 0.04564, + "test_loss": 6.513159948730468, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.26611169562468134, + "grad_max_sv": 0.15025373138487338, + "grad_min_sv": 2.2174503035848892e-09, + "grad_condition": 96439723.92469814, + "lr": 0.00024098649531343477, + "time_sec": 83.83437013626099 + }, + { + "epoch": 102, + "train_loss": 4.26979032119751, + "train_acc": 0.04642, + "test_loss": 6.493202007293701, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.26813810856759995, + "grad_max_sv": 0.1489817149937153, + "grad_min_sv": 2.380725915018811e-09, + "grad_condition": 76215277.93021134, + "lr": 0.0002320866025105016, + "time_sec": 83.80248379707336 + }, + { + "epoch": 103, + "train_loss": 4.260873723297119, + "train_acc": 0.04782, + "test_loss": 6.493594526672363, + "test_acc": 0.0111, + "lyapunov": null, + "grad_norm": 0.2688305350715821, + "grad_max_sv": 0.1512874387204647, + "grad_min_sv": 2.453062892919522e-09, + "grad_condition": 134347199.1051014, + "lr": 0.0002233042253783278, + "time_sec": 83.81874346733093 + }, + { + "epoch": 104, + "train_loss": 4.262198150939941, + "train_acc": 0.04738, + "test_loss": 6.605858857727051, + "test_acc": 0.0103, + "lyapunov": null, + "grad_norm": 0.27225916391154686, + "grad_max_sv": 0.15373125690966843, + "grad_min_sv": 2.44866176035783e-09, + "grad_condition": 419013949.5031613, + "lr": 0.000214643216157784, + "time_sec": 84.03694415092468 + }, + { + "epoch": 105, + "train_loss": 4.262576495056153, + "train_acc": 0.04672, + "test_loss": 6.746639459991455, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.2762952402363064, + "grad_max_sv": 0.15909811817109584, + "grad_min_sv": 2.4671919398103204e-09, + "grad_condition": 139499125.202051, + "lr": 0.00020610737385376332, + "time_sec": 83.83756351470947 + }, + { + "epoch": 106, + "train_loss": 4.256981732330322, + "train_acc": 0.04834, + "test_loss": 6.714322766113281, + "test_acc": 0.0106, + "lyapunov": null, + "grad_norm": 0.27463124817104645, + "grad_max_sv": 0.15689255371689798, + "grad_min_sv": 2.5142482939360944e-09, + "grad_condition": 118433721.44138017, + "lr": 0.00019770044256881242, + "time_sec": 83.83591985702515 + }, + { + "epoch": 107, + "train_loss": 4.2602463818359375, + "train_acc": 0.04698, + "test_loss": 6.657286577606201, + "test_acc": 0.0109, + "lyapunov": null, + "grad_norm": 0.2689041932222791, + "grad_max_sv": 0.15177576132118703, + "grad_min_sv": 2.4187723310364893e-09, + "grad_condition": 94992794.34351222, + "lr": 0.0001894261098608447, + "time_sec": 83.80453681945801 + }, + { + "epoch": 108, + "train_loss": 4.2544874598693845, + "train_acc": 0.04844, + "test_loss": 6.59372087097168, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.2710712522794079, + "grad_max_sv": 0.15038638189435005, + "grad_min_sv": 2.514627481589593e-09, + "grad_condition": 93107492.33691652, + "lr": 0.000181288005125655, + "time_sec": 83.77546954154968 + }, + { + "epoch": 109, + "train_loss": 4.253146978759766, + "train_acc": 0.04824, + "test_loss": 6.575524732208252, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 0.2727669683249611, + "grad_max_sv": 0.15002147294580936, + "grad_min_sv": 2.4739045799762604e-09, + "grad_condition": 125566166.74099617, + "lr": 0.0001732896980049473, + "time_sec": 83.82711911201477 + }, + { + "epoch": 110, + "train_loss": 4.250933767089844, + "train_acc": 0.04966, + "test_loss": 6.632392105102539, + "test_acc": 0.011, + "lyapunov": null, + "grad_norm": 0.27898350710296843, + "grad_max_sv": 0.15593392103910447, + "grad_min_sv": 2.5894539202545724e-09, + "grad_condition": 625752503.9437258, + "lr": 0.00016543469682057076, + "time_sec": 83.74293255805969 + }, + { + "epoch": 111, + "train_loss": 4.24997673614502, + "train_acc": 0.04972, + "test_loss": 6.568419965362549, + "test_acc": 0.0109, + "lyapunov": null, + "grad_norm": 0.27772763472261885, + "grad_max_sv": 0.15495621263980866, + "grad_min_sv": 2.661621495425592e-09, + "grad_condition": 70119073.46937823, + "lr": 0.00015772644703565552, + "time_sec": 83.79197788238525 + }, + { + "epoch": 112, + "train_loss": 4.249247148590088, + "train_acc": 0.0507, + "test_loss": 6.707973278045654, + "test_acc": 0.0093, + "lyapunov": null, + "grad_norm": 0.27686969610418316, + "grad_max_sv": 0.15229813233017922, + "grad_min_sv": 2.662702908856618e-09, + "grad_condition": 153958977.83635777, + "lr": 0.00015016832974331713, + "time_sec": 83.80273818969727 + }, + { + "epoch": 113, + "train_loss": 4.250667928771973, + "train_acc": 0.0492, + "test_loss": 6.8461118530273435, + "test_acc": 0.0096, + "lyapunov": null, + "grad_norm": 0.28055092675814575, + "grad_max_sv": 0.1576558079570532, + "grad_min_sv": 2.742332778221668e-09, + "grad_condition": 137456876.77179033, + "lr": 0.00014276366018359834, + "time_sec": 83.80364871025085 + }, + { + "epoch": 114, + "train_loss": 4.2449106436157225, + "train_acc": 0.05016, + "test_loss": 6.787322373962402, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.27979119322019597, + "grad_max_sv": 0.15479157418012618, + "grad_min_sv": 2.6695785599467614e-09, + "grad_condition": 81382647.58523288, + "lr": 0.00013551568628929425, + "time_sec": 83.82229542732239 + }, + { + "epoch": 115, + "train_loss": 4.244952727355957, + "train_acc": 0.05002, + "test_loss": 6.741559551239014, + "test_acc": 0.0092, + "lyapunov": null, + "grad_norm": 0.2773863197316903, + "grad_max_sv": 0.15171751268208028, + "grad_min_sv": 2.682797061023465e-09, + "grad_condition": 212074169.4590431, + "lr": 0.00012842758726130276, + "time_sec": 83.82812428474426 + }, + { + "epoch": 116, + "train_loss": 4.242339648132324, + "train_acc": 0.04982, + "test_loss": 6.755374185180664, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2805527611657844, + "grad_max_sv": 0.1574402242898941, + "grad_min_sv": 2.8019030511548804e-09, + "grad_condition": 238625880.71394747, + "lr": 0.0001215024721741218, + "time_sec": 83.79120373725891 + }, + { + "epoch": 117, + "train_loss": 4.240206247253418, + "train_acc": 0.04966, + "test_loss": 6.836046894073486, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.2758039178422697, + "grad_max_sv": 0.1517912581562996, + "grad_min_sv": 2.68810798897956e-09, + "grad_condition": 72825643.14736441, + "lr": 0.00011474337861210538, + "time_sec": 83.7668628692627 + }, + { + "epoch": 118, + "train_loss": 4.2366791255187985, + "train_acc": 0.05162, + "test_loss": 6.8930122108459475, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.28097411795628907, + "grad_max_sv": 0.15138982199132442, + "grad_min_sv": 2.6724390362123373e-09, + "grad_condition": 105031519.49257562, + "lr": 0.00010815327133708009, + "time_sec": 83.7777681350708 + }, + { + "epoch": 119, + "train_loss": 4.239317052307129, + "train_acc": 0.05098, + "test_loss": 6.895288885498047, + "test_acc": 0.0107, + "lyapunov": null, + "grad_norm": 0.28557653268704064, + "grad_max_sv": 0.15877793319523334, + "grad_min_sv": 2.852896488665657e-09, + "grad_condition": 130124221.77470978, + "lr": 0.00010173504098790182, + "time_sec": 83.770183801651 + }, + { + "epoch": 120, + "train_loss": 4.238326491088867, + "train_acc": 0.04944, + "test_loss": 6.971952970123291, + "test_acc": 0.0116, + "lyapunov": null, + "grad_norm": 0.28330987147198217, + "grad_max_sv": 0.15257025621831416, + "grad_min_sv": 2.890761002100062e-09, + "grad_condition": 92481164.9877267, + "lr": 9.549150281252629e-05, + "time_sec": 83.78682947158813 + }, + { + "epoch": 121, + "train_loss": 4.238821759033203, + "train_acc": 0.05118, + "test_loss": 6.903655708312988, + "test_acc": 0.0107, + "lyapunov": null, + "grad_norm": 0.2844816880687477, + "grad_max_sv": 0.15047130659222602, + "grad_min_sv": 2.9364908977515257e-09, + "grad_condition": 155468550.15943855, + "lr": 8.942539543314794e-05, + "time_sec": 83.74171853065491 + }, + { + "epoch": 122, + "train_loss": 4.231929050292969, + "train_acc": 0.05106, + "test_loss": 6.9859304649353025, + "test_acc": 0.011, + "lyapunov": null, + "grad_norm": 0.28661742540946805, + "grad_max_sv": 0.15440320819616318, + "grad_min_sv": 3.0144829410438945e-09, + "grad_condition": 58782400.13901849, + "lr": 8.353937964495024e-05, + "time_sec": 83.77999758720398 + }, + { + "epoch": 123, + "train_loss": 4.234138116607666, + "train_acc": 0.05334, + "test_loss": 6.891355895996094, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.28893265325047696, + "grad_max_sv": 0.15679317489266395, + "grad_min_sv": 3.0731328568706083e-09, + "grad_condition": 83816649.99544896, + "lr": 7.783603724899243e-05, + "time_sec": 83.76851487159729 + }, + { + "epoch": 124, + "train_loss": 4.229343013763428, + "train_acc": 0.05258, + "test_loss": 7.009951159667969, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.2863743887145036, + "grad_max_sv": 0.15191952474415302, + "grad_min_sv": 3.0230644397499785e-09, + "grad_condition": 211100331.6657278, + "lr": 7.231786991974666e-05, + "time_sec": 83.76139807701111 + }, + { + "epoch": 125, + "train_loss": 4.232501866760254, + "train_acc": 0.05186, + "test_loss": 6.96674277420044, + "test_acc": 0.0111, + "lyapunov": null, + "grad_norm": 0.2858550264764349, + "grad_max_sv": 0.15213587880134583, + "grad_min_sv": 3.046650505489357e-09, + "grad_condition": 63383717.426429704, + "lr": 6.698729810778072e-05, + "time_sec": 83.78086757659912 + }, + { + "epoch": 126, + "train_loss": 4.229700404968262, + "train_acc": 0.0524, + "test_loss": 7.008199283599853, + "test_acc": 0.0097, + "lyapunov": null, + "grad_norm": 0.2850115287876514, + "grad_max_sv": 0.14953349605202676, + "grad_min_sv": 2.9821331362644977e-09, + "grad_condition": 76613514.19037959, + "lr": 6.184665997806817e-05, + "time_sec": 83.765873670578 + }, + { + "epoch": 127, + "train_loss": 4.226065429992675, + "train_acc": 0.05148, + "test_loss": 6.9513890808105465, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.28929346428701186, + "grad_max_sv": 0.15673540011048318, + "grad_min_sv": 3.046475822998662e-09, + "grad_condition": 68840265.65077923, + "lr": 5.6898210384392595e-05, + "time_sec": 83.76980423927307 + }, + { + "epoch": 128, + "train_loss": 4.223751395874023, + "train_acc": 0.05446, + "test_loss": 6.981657604980469, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.2886516286895676, + "grad_max_sv": 0.15273929238319398, + "grad_min_sv": 3.0959206469283186e-09, + "grad_condition": 61503758.19812535, + "lr": 5.214411988029363e-05, + "time_sec": 83.77617073059082 + }, + { + "epoch": 129, + "train_loss": 4.223811264648438, + "train_acc": 0.05404, + "test_loss": 6.9342261474609375, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.2869141420134922, + "grad_max_sv": 0.15136036798357963, + "grad_min_sv": 3.047223613023009e-09, + "grad_condition": 97351366.2154063, + "lr": 4.7586473766990294e-05, + "time_sec": 83.78148245811462 + }, + { + "epoch": 130, + "train_loss": 4.224827704467773, + "train_acc": 0.0532, + "test_loss": 7.028645568084717, + "test_acc": 0.0097, + "lyapunov": null, + "grad_norm": 0.2903989310802725, + "grad_max_sv": 0.15144419111311436, + "grad_min_sv": 3.1437888660390544e-09, + "grad_condition": 118830904.24527971, + "lr": 4.32272711786996e-05, + "time_sec": 83.79948663711548 + }, + { + "epoch": 131, + "train_loss": 4.221605782775879, + "train_acc": 0.05298, + "test_loss": 6.999451491546631, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.29092754210208693, + "grad_max_sv": 0.15410602577030658, + "grad_min_sv": 3.2033975992662445e-09, + "grad_condition": 57038304.52076046, + "lr": 3.906842420574966e-05, + "time_sec": 83.77110433578491 + }, + { + "epoch": 132, + "train_loss": 4.218992453613281, + "train_acc": 0.05284, + "test_loss": 7.0255691505432125, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.2914825249386215, + "grad_max_sv": 0.15589108187705278, + "grad_min_sv": 3.206146753816086e-09, + "grad_condition": 122587816.51957992, + "lr": 3.5111757055874305e-05, + "time_sec": 83.75379085540771 + }, + { + "epoch": 133, + "train_loss": 4.220229903869629, + "train_acc": 0.05394, + "test_loss": 6.9970667213439945, + "test_acc": 0.0106, + "lyapunov": null, + "grad_norm": 0.293170941298062, + "grad_max_sv": 0.15195444263517857, + "grad_min_sv": 3.1603012576666978e-09, + "grad_condition": 99833022.93899234, + "lr": 3.1359005254054254e-05, + "time_sec": 83.83364748954773 + }, + { + "epoch": 134, + "train_loss": 4.221537724761963, + "train_acc": 0.05412, + "test_loss": 7.081800342559815, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.29192289713649316, + "grad_max_sv": 0.1527898743748665, + "grad_min_sv": 3.242900753486211e-09, + "grad_condition": 53839731.29661299, + "lr": 2.7811814881259484e-05, + "time_sec": 83.77570366859436 + }, + { + "epoch": 135, + "train_loss": 4.224225687103272, + "train_acc": 0.0536, + "test_loss": 7.031653879547119, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.2928013245487039, + "grad_max_sv": 0.15023601055145264, + "grad_min_sv": 3.1499084042485583e-09, + "grad_condition": 56443800.83675871, + "lr": 2.4471741852423218e-05, + "time_sec": 83.79031038284302 + }, + { + "epoch": 136, + "train_loss": 4.2209420147705075, + "train_acc": 0.05542, + "test_loss": 7.0730202087402345, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.29383612459846997, + "grad_max_sv": 0.1526225544512272, + "grad_min_sv": 3.216327003211297e-09, + "grad_condition": 488112741.3165139, + "lr": 2.1340251233966362e-05, + "time_sec": 83.78721952438354 + }, + { + "epoch": 137, + "train_loss": 4.217904202728271, + "train_acc": 0.0547, + "test_loss": 7.029183413696289, + "test_acc": 0.0097, + "lyapunov": null, + "grad_norm": 0.29146081115101274, + "grad_max_sv": 0.14856699295341969, + "grad_min_sv": 3.193107374344084e-09, + "grad_condition": 54362425.00069554, + "lr": 1.8418716601170932e-05, + "time_sec": 83.76650714874268 + }, + { + "epoch": 138, + "train_loss": 4.222578598480225, + "train_acc": 0.05248, + "test_loss": 7.08011364440918, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 0.29305556036271213, + "grad_max_sv": 0.1505037024617195, + "grad_min_sv": 3.2047648587836542e-09, + "grad_condition": 326741808.1820611, + "lr": 1.570841943568445e-05, + "time_sec": 83.7816994190216 + }, + { + "epoch": 139, + "train_loss": 4.218749967193603, + "train_acc": 0.05366, + "test_loss": 7.0575081214904785, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.29397952766323676, + "grad_max_sv": 0.148932196572423, + "grad_min_sv": 3.2381111236823303e-09, + "grad_condition": 52412171.837261274, + "lr": 1.3210548563419845e-05, + "time_sec": 83.8086462020874 + }, + { + "epoch": 140, + "train_loss": 4.217845681304931, + "train_acc": 0.05502, + "test_loss": 7.102373625946045, + "test_acc": 0.0104, + "lyapunov": null, + "grad_norm": 0.2935367604869691, + "grad_max_sv": 0.14902403093874456, + "grad_min_sv": 3.2832004351335264e-09, + "grad_condition": 52749321.36829077, + "lr": 1.0926199633097203e-05, + "time_sec": 83.79147672653198 + }, + { + "epoch": 141, + "train_loss": 4.214903557434082, + "train_acc": 0.05414, + "test_loss": 7.033845091247558, + "test_acc": 0.0097, + "lyapunov": null, + "grad_norm": 0.29612387661640516, + "grad_max_sv": 0.15556762106716632, + "grad_min_sv": 3.2642252397602213e-09, + "grad_condition": 123272892.75406721, + "lr": 8.856374635655688e-06, + "time_sec": 83.81054306030273 + }, + { + "epoch": 142, + "train_loss": 4.215419233093262, + "train_acc": 0.05478, + "test_loss": 7.08431992111206, + "test_acc": 0.0097, + "lyapunov": null, + "grad_norm": 0.29494037543034185, + "grad_max_sv": 0.15155189596116542, + "grad_min_sv": 3.2587884789964106e-09, + "grad_condition": 76214087.81495127, + "lr": 7.001981464747503e-06, + "time_sec": 83.78057074546814 + }, + { + "epoch": 143, + "train_loss": 4.217841682281494, + "train_acc": 0.05398, + "test_loss": 7.037088000488281, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.2932160255751842, + "grad_max_sv": 0.14940347485244274, + "grad_min_sv": 3.258327102573233e-09, + "grad_condition": 73149202.84067681, + "lr": 5.3638335185058295e-06, + "time_sec": 83.79549980163574 + }, + { + "epoch": 144, + "train_loss": 4.215883382873535, + "train_acc": 0.0537, + "test_loss": 7.091348276519775, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 0.2950445450440956, + "grad_max_sv": 0.153789921104908, + "grad_min_sv": 3.312160905266648e-09, + "grad_condition": 52811849.90694652, + "lr": 3.942649342761114e-06, + "time_sec": 83.8086678981781 + }, + { + "epoch": 145, + "train_loss": 4.2175880349731445, + "train_acc": 0.05522, + "test_loss": 7.115469957733154, + "test_acc": 0.0098, + "lyapunov": null, + "grad_norm": 0.29403172002116806, + "grad_max_sv": 0.15080158710479735, + "grad_min_sv": 3.237252350907216e-09, + "grad_condition": 52283776.27412096, + "lr": 2.7390523158633524e-06, + "time_sec": 83.78764986991882 + }, + { + "epoch": 146, + "train_loss": 4.211100564270019, + "train_acc": 0.05546, + "test_loss": 7.0454746505737305, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.2953687426258213, + "grad_max_sv": 0.1488959614187479, + "grad_min_sv": 3.3052532932842382e-09, + "grad_condition": 57195017.16791941, + "lr": 1.7535703752478133e-06, + "time_sec": 83.81411933898926 + }, + { + "epoch": 147, + "train_loss": 4.215898538208008, + "train_acc": 0.0547, + "test_loss": 7.0791287528991695, + "test_acc": 0.0099, + "lyapunov": null, + "grad_norm": 0.29507184047055474, + "grad_max_sv": 0.1496420454233885, + "grad_min_sv": 3.2882809359756003e-09, + "grad_condition": 440797367.90569246, + "lr": 9.866357858642196e-07, + "time_sec": 83.83466935157776 + }, + { + "epoch": 148, + "train_loss": 4.21191631515503, + "train_acc": 0.05502, + "test_loss": 6.993793771362305, + "test_acc": 0.0102, + "lyapunov": null, + "grad_norm": 0.29572223257711466, + "grad_max_sv": 0.1509379804134369, + "grad_min_sv": 3.2624034737582796e-09, + "grad_condition": 53696330.15699832, + "lr": 4.38584950570808e-07, + "time_sec": 83.83085513114929 + }, + { + "epoch": 149, + "train_loss": 4.214856278686524, + "train_acc": 0.05504, + "test_loss": 7.080280429077148, + "test_acc": 0.0103, + "lyapunov": null, + "grad_norm": 0.29551682436364557, + "grad_max_sv": 0.1497094627469778, + "grad_min_sv": 3.273750590060409e-09, + "grad_condition": 73934031.32038581, + "lr": 1.096582625772501e-07, + "time_sec": 83.84602665901184 + }, + { + "epoch": 150, + "train_loss": 4.2193192990112305, + "train_acc": 0.0535, + "test_loss": 7.083986274719238, + "test_acc": 0.0101, + "lyapunov": null, + "grad_norm": 0.2957722763250381, + "grad_max_sv": 0.15103124249726535, + "grad_min_sv": 3.2879624276699325e-09, + "grad_condition": 65137818.05484857, + "lr": 0.0, + "time_sec": 83.81010937690735 + } + ] + }, + "lyapunov": { + "4": [ + { + "epoch": 1, + "train_loss": 8.745512613220216, + "train_acc": 0.02574, + "test_loss": 4.55846024017334, + "test_acc": 0.0339, + "lyapunov": 3.2288631459941035, + "grad_norm": 7.160399518281865, + "grad_max_sv": 5.050605493783951, + "grad_min_sv": 1.0948114780862107e-07, + "grad_condition": 174574426.40620375, + "lr": 0.0009998903417374227, + "time_sec": 38.78080153465271 + }, + { + "epoch": 2, + "train_loss": 6.857188781433106, + "train_acc": 0.03116, + "test_loss": 4.409567827606201, + "test_acc": 0.0498, + "lyapunov": 2.566672464160968, + "grad_norm": 4.581532406245075, + "grad_max_sv": 3.4727421343326568, + "grad_min_sv": 6.695858347782747e-08, + "grad_condition": 100510712.5879864, + "lr": 0.0009995614150494292, + "time_sec": 38.758466482162476 + }, + { + "epoch": 3, + "train_loss": 6.406850777893067, + "train_acc": 0.03836, + "test_loss": 4.3329737182617185, + "test_acc": 0.0541, + "lyapunov": 2.4151331805207237, + "grad_norm": 2.8463282070399885, + "grad_max_sv": 2.2940395712852477, + "grad_min_sv": 3.7823234264044994e-08, + "grad_condition": 106198851.94331202, + "lr": 0.0009990133642141358, + "time_sec": 38.77664065361023 + }, + { + "epoch": 4, + "train_loss": 6.1679999932861325, + "train_acc": 0.04216, + "test_loss": 4.314407443237305, + "test_acc": 0.0539, + "lyapunov": 2.324155716030189, + "grad_norm": 1.4958218707983646, + "grad_max_sv": 1.126097397506237, + "grad_min_sv": 1.8212272229894964e-08, + "grad_condition": 178099339.46093446, + "lr": 0.0009982464296247522, + "time_sec": 38.772703409194946 + }, + { + "epoch": 5, + "train_loss": 6.023621784973145, + "train_acc": 0.04472, + "test_loss": 4.327248037719727, + "test_acc": 0.0523, + "lyapunov": 2.24559463046091, + "grad_norm": 0.8361636453752828, + "grad_max_sv": 0.5582518823444843, + "grad_min_sv": 9.160982232525595e-09, + "grad_condition": 218277432.54054898, + "lr": 0.0009972609476841367, + "time_sec": 38.792168855667114 + }, + { + "epoch": 6, + "train_loss": 5.923550573730469, + "train_acc": 0.03788, + "test_loss": 4.373689149475098, + "test_acc": 0.0448, + "lyapunov": 2.143530731615813, + "grad_norm": 0.6125747823801606, + "grad_max_sv": 0.3806876644492149, + "grad_min_sv": 4.764090941352089e-09, + "grad_condition": 2115444033.3075993, + "lr": 0.000996057350657239, + "time_sec": 38.80649399757385 + }, + { + "epoch": 7, + "train_loss": 5.819468310699463, + "train_acc": 0.03402, + "test_loss": 4.396667736816406, + "test_acc": 0.0409, + "lyapunov": 2.047879105028899, + "grad_norm": 0.5012166631957408, + "grad_max_sv": 0.29988972246646883, + "grad_min_sv": 2.6462318619344118e-09, + "grad_condition": 1674717584.2678788, + "lr": 0.000994636166481494, + "time_sec": 38.8136990070343 + }, + { + "epoch": 8, + "train_loss": 5.776593683929443, + "train_acc": 0.02754, + "test_loss": 4.459617399597168, + "test_acc": 0.0288, + "lyapunov": 1.982207260168422, + "grad_norm": 0.48582047366784137, + "grad_max_sv": 0.2761614330112934, + "grad_min_sv": 2.1785290433868222e-10, + "grad_condition": 40862120030.312584, + "lr": 0.0009929980185352525, + "time_sec": 38.845232248306274 + }, + { + "epoch": 9, + "train_loss": 5.781761088104248, + "train_acc": 0.0231, + "test_loss": 4.675199285888672, + "test_acc": 0.0029, + "lyapunov": 1.954250096360131, + "grad_norm": 0.46266769063149876, + "grad_max_sv": 0.2622381761670113, + "grad_min_sv": 5.480658221434448e-10, + "grad_condition": 100986477853.47366, + "lr": 0.0009911436253643444, + "time_sec": 38.80020809173584 + }, + { + "epoch": 10, + "train_loss": 5.8479565664672855, + "train_acc": 0.01186, + "test_loss": 4.6061001365661625, + "test_acc": 0.01, + "lyapunov": 1.9396185356637705, + "grad_norm": 0.261511927042467, + "grad_max_sv": 0.09869588532019406, + "grad_min_sv": 2.728127020095826e-13, + "grad_condition": 88878548722.67065, + "lr": 0.0009890738003669028, + "time_sec": 38.743908405303955 + }, + { + "epoch": 11, + "train_loss": 5.8408165109252925, + "train_acc": 0.01034, + "test_loss": 4.6082617340087895, + "test_acc": 0.01, + "lyapunov": 1.9296608300465148, + "grad_norm": 0.2344195135575755, + "grad_max_sv": 0.08715516603551805, + "grad_min_sv": 2.4710747756651273e-15, + "grad_condition": 86872648368.75877, + "lr": 0.00098678945143658, + "time_sec": 38.751142263412476 + }, + { + "epoch": 12, + "train_loss": 5.84793187210083, + "train_acc": 0.00954, + "test_loss": 4.6062534797668455, + "test_acc": 0.01, + "lyapunov": 1.932467032881344, + "grad_norm": 0.24986425241000795, + "grad_max_sv": 0.07697397316806018, + "grad_min_sv": 3.503246160812043e-47, + "grad_condition": 76973973168.06018, + "lr": 0.0009842915805643154, + "time_sec": 38.75897789001465 + }, + { + "epoch": 13, + "train_loss": 5.845315325927734, + "train_acc": 0.01, + "test_loss": 4.606490065002442, + "test_acc": 0.01, + "lyapunov": 1.9308954513896153, + "grad_norm": 0.2234501732158856, + "grad_max_sv": 0.07171829692088068, + "grad_min_sv": 3.503246160812043e-47, + "grad_condition": 71718296920.88069, + "lr": 0.000981581283398829, + "time_sec": 38.77409482002258 + }, + { + "epoch": 14, + "train_loss": 5.844472907714843, + "train_acc": 0.00932, + "test_loss": 4.611052139282227, + "test_acc": 0.01, + "lyapunov": 1.9302553133586484, + "grad_norm": 0.2546366793913816, + "grad_max_sv": 0.0627493538428098, + "grad_min_sv": 5.442503105591157e-42, + "grad_condition": 62749353842.80979, + "lr": 0.0009786597487660333, + "time_sec": 38.75410294532776 + }, + { + "epoch": 15, + "train_loss": 5.839373329620361, + "train_acc": 0.01012, + "test_loss": 4.605493424987793, + "test_acc": 0.01, + "lyapunov": 1.9264278128323957, + "grad_norm": 0.33195464165742516, + "grad_max_sv": 0.0596250070258975, + "grad_min_sv": 1.1532839803575087e-39, + "grad_condition": 59625007025.89751, + "lr": 0.0009755282581475766, + "time_sec": 38.737260818481445 + }, + { + "epoch": 16, + "train_loss": 5.840845001983642, + "train_acc": 0.01006, + "test_loss": 4.606367964935303, + "test_acc": 0.01, + "lyapunov": 1.9284262577895923, + "grad_norm": 0.41972925674223915, + "grad_max_sv": 0.04947211216203869, + "grad_min_sv": 0.0, + "grad_condition": 49472112162.03868, + "lr": 0.0009721881851187403, + "time_sec": 38.72240591049194 + }, + { + "epoch": 17, + "train_loss": 5.838009662322998, + "train_acc": 0.01014, + "test_loss": 4.607442309570312, + "test_acc": 0.01, + "lyapunov": 1.927741524203659, + "grad_norm": 0.41171422252176765, + "grad_max_sv": 0.06055757296271622, + "grad_min_sv": 6.063498673792123e-17, + "grad_condition": 60551208649.85646, + "lr": 0.0009686409947459456, + "time_sec": 38.7178897857666 + }, + { + "epoch": 18, + "train_loss": 5.8419268412780765, + "train_acc": 0.00974, + "test_loss": 4.605891960144043, + "test_acc": 0.01, + "lyapunov": 1.9291500267775163, + "grad_norm": 0.3483236145113203, + "grad_max_sv": 0.03731603529304266, + "grad_min_sv": 6.04933030713951e-30, + "grad_condition": 37316035293.042656, + "lr": 0.0009648882429441254, + "time_sec": 38.760350704193115 + }, + { + "epoch": 19, + "train_loss": 5.826735510559082, + "train_acc": 0.01202, + "test_loss": 4.605664205932618, + "test_acc": 0.01, + "lyapunov": 1.9298754738419868, + "grad_norm": 0.3207639814137615, + "grad_max_sv": 0.06981198373250663, + "grad_min_sv": 1.9222199366026642e-14, + "grad_condition": 67062140845.185585, + "lr": 0.00096093157579425, + "time_sec": 38.76730132102966 + }, + { + "epoch": 20, + "train_loss": 5.84202998046875, + "train_acc": 0.00976, + "test_loss": 4.606653337097168, + "test_acc": 0.01, + "lyapunov": 1.9302551270750783, + "grad_norm": 0.20194476347748866, + "grad_max_sv": 0.03701699019875378, + "grad_min_sv": 0.0, + "grad_condition": 37016990198.75377, + "lr": 0.0009567727288213001, + "time_sec": 38.725250244140625 + }, + { + "epoch": 21, + "train_loss": 5.84192676071167, + "train_acc": 0.00982, + "test_loss": 4.614536486816406, + "test_acc": 0.01, + "lyapunov": 1.9300702325523358, + "grad_norm": 0.2358565070101103, + "grad_max_sv": 0.033911947428714485, + "grad_min_sv": 0.0, + "grad_condition": 33911947428.714485, + "lr": 0.0009524135262330095, + "time_sec": 38.72857594490051 + }, + { + "epoch": 22, + "train_loss": 5.839627782592774, + "train_acc": 0.00992, + "test_loss": 4.606048239898682, + "test_acc": 0.01, + "lyapunov": 1.9269078469947172, + "grad_norm": 0.17845225075047805, + "grad_max_sv": 0.025568678742274642, + "grad_min_sv": 0.0, + "grad_condition": 25568678742.274643, + "lr": 0.0009478558801197061, + "time_sec": 38.68861746788025 + }, + { + "epoch": 23, + "train_loss": 5.838393308258056, + "train_acc": 0.00958, + "test_loss": 4.586302839660645, + "test_acc": 0.0188, + "lyapunov": 1.9266618383510032, + "grad_norm": 0.13466647962688946, + "grad_max_sv": 0.01349067515693605, + "grad_min_sv": 0.0, + "grad_condition": 13490675156.936049, + "lr": 0.000943101789615607, + "time_sec": 38.702245473861694 + }, + { + "epoch": 24, + "train_loss": 5.835893999938965, + "train_acc": 0.0103, + "test_loss": 4.605248524475098, + "test_acc": 0.01, + "lyapunov": 1.9250504610788486, + "grad_norm": 0.1306925374207253, + "grad_max_sv": 0.021706052590161562, + "grad_min_sv": 4.2115888976736585e-17, + "grad_condition": 21702749025.936443, + "lr": 0.0009381533400219313, + "time_sec": 38.70141124725342 + }, + { + "epoch": 25, + "train_loss": 5.839240811767578, + "train_acc": 0.00906, + "test_loss": 4.605221250915528, + "test_acc": 0.01, + "lyapunov": 1.9273294420803295, + "grad_norm": 0.12078726665544544, + "grad_max_sv": 0.010838619247078896, + "grad_min_sv": 0.0, + "grad_condition": 10838619247.078896, + "lr": 0.0009330127018922189, + "time_sec": 38.68912363052368 + }, + { + "epoch": 26, + "train_loss": 5.832334176635742, + "train_acc": 0.00902, + "test_loss": 4.605214032745361, + "test_acc": 0.01, + "lyapunov": 1.92168139923564, + "grad_norm": 0.11780855950452304, + "grad_max_sv": 0.012504769628867507, + "grad_min_sv": 3.503246160812043e-47, + "grad_condition": 12504769628.867508, + "lr": 0.000927682130080253, + "time_sec": 38.69681906700134 + }, + { + "epoch": 27, + "train_loss": 5.832823591003418, + "train_acc": 0.00856, + "test_loss": 4.605198753356934, + "test_acc": 0.01, + "lyapunov": 1.9220849495104817, + "grad_norm": 0.1307395775308225, + "grad_max_sv": 0.00955222793854773, + "grad_min_sv": 0.0, + "grad_condition": 9552227938.54773, + "lr": 0.0009221639627510072, + "time_sec": 38.67968559265137 + }, + { + "epoch": 28, + "train_loss": 5.8319349609375, + "train_acc": 0.00908, + "test_loss": 4.60519333190918, + "test_acc": 0.01, + "lyapunov": 1.9214767400565964, + "grad_norm": 0.11312977194763361, + "grad_max_sv": 0.007689819484949112, + "grad_min_sv": 0.0, + "grad_condition": 7689819484.949112, + "lr": 0.0009164606203550494, + "time_sec": 38.693461418151855 + }, + { + "epoch": 29, + "train_loss": 5.832658680419922, + "train_acc": 0.0089, + "test_loss": 4.605188513946533, + "test_acc": 0.01, + "lyapunov": 1.9219111963306241, + "grad_norm": 0.1139488031414971, + "grad_max_sv": 0.009555681003257632, + "grad_min_sv": 0.0, + "grad_condition": 9555681003.257633, + "lr": 0.0009105746045668516, + "time_sec": 38.88858246803284 + }, + { + "epoch": 30, + "train_loss": 5.8301619506835936, + "train_acc": 0.00936, + "test_loss": 4.605182504272461, + "test_acc": 0.01, + "lyapunov": 1.9200728305465424, + "grad_norm": 0.10113831163550316, + "grad_max_sv": 0.004735648166388273, + "grad_min_sv": 0.0, + "grad_condition": 4735648166.388273, + "lr": 0.0009045084971874733, + "time_sec": 38.682101011276245 + }, + { + "epoch": 31, + "train_loss": 5.832088593292236, + "train_acc": 0.00848, + "test_loss": 4.60520027999878, + "test_acc": 0.01, + "lyapunov": 1.921536988309582, + "grad_norm": 0.11928153797201548, + "grad_max_sv": 0.005120814079418778, + "grad_min_sv": 0.0, + "grad_condition": 5120814079.418779, + "lr": 0.0008982649590120977, + "time_sec": 38.66986131668091 + }, + { + "epoch": 32, + "train_loss": 5.830597168426514, + "train_acc": 0.009, + "test_loss": 4.605257048797608, + "test_acc": 0.01, + "lyapunov": 1.9206426658898668, + "grad_norm": 0.09874780482605999, + "grad_max_sv": 0.0029883835930377247, + "grad_min_sv": 0.0, + "grad_condition": 2988383593.0377245, + "lr": 0.0008918467286629196, + "time_sec": 38.69553232192993 + }, + { + "epoch": 33, + "train_loss": 5.829611896514892, + "train_acc": 0.00884, + "test_loss": 4.60517430267334, + "test_acc": 0.01, + "lyapunov": 1.9195137139781357, + "grad_norm": 0.09972362630787891, + "grad_max_sv": 0.00664278594776988, + "grad_min_sv": 0.0, + "grad_condition": 6642785947.76988, + "lr": 0.0008852566213878943, + "time_sec": 38.67990040779114 + }, + { + "epoch": 34, + "train_loss": 5.828044633636474, + "train_acc": 0.0083, + "test_loss": 4.605173886871338, + "test_acc": 0.01, + "lyapunov": 1.918492463848475, + "grad_norm": 0.0974792016961528, + "grad_max_sv": 0.001599628059193492, + "grad_min_sv": 0.0, + "grad_condition": 1599628059.193492, + "lr": 0.000878497527825878, + "time_sec": 38.68664336204529 + }, + { + "epoch": 35, + "train_loss": 5.830746371154786, + "train_acc": 0.00894, + "test_loss": 4.6051726875305175, + "test_acc": 0.01, + "lyapunov": 1.920728165475304, + "grad_norm": 0.0938240145066066, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000871572412738697, + "time_sec": 38.67132115364075 + }, + { + "epoch": 36, + "train_loss": 5.829937998809815, + "train_acc": 0.00866, + "test_loss": 4.605172854614258, + "test_acc": 0.01, + "lyapunov": 1.920135024868314, + "grad_norm": 0.09205400750487011, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008644843137107055, + "time_sec": 38.64905834197998 + }, + { + "epoch": 37, + "train_loss": 5.829817896728516, + "train_acc": 0.00818, + "test_loss": 4.6051733100891115, + "test_acc": 0.01, + "lyapunov": 1.9200208934066851, + "grad_norm": 0.09228371311542864, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008572363398164014, + "time_sec": 38.657002210617065 + }, + { + "epoch": 38, + "train_loss": 5.831039802246094, + "train_acc": 0.0088, + "test_loss": 4.6051726837158204, + "test_acc": 0.01, + "lyapunov": 1.9210114238207296, + "grad_norm": 0.09181178733619569, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008498316702566826, + "time_sec": 38.66207027435303 + }, + { + "epoch": 39, + "train_loss": 5.829483923492432, + "train_acc": 0.00886, + "test_loss": 4.605172607421875, + "test_acc": 0.01, + "lyapunov": 1.919772486552558, + "grad_norm": 0.09053836987454536, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008422735529643442, + "time_sec": 38.67074227333069 + }, + { + "epoch": 40, + "train_loss": 5.829308145904541, + "train_acc": 0.00862, + "test_loss": 4.605172937774658, + "test_acc": 0.01, + "lyapunov": 1.9195958787522962, + "grad_norm": 0.09302966072405643, + "grad_max_sv": 0.0028064717072993515, + "grad_min_sv": 0.0, + "grad_condition": 2806471707.2993517, + "lr": 0.0008345653031794289, + "time_sec": 38.66209268569946 + }, + { + "epoch": 41, + "train_loss": 5.828913317565918, + "train_acc": 0.00894, + "test_loss": 4.605173394775391, + "test_acc": 0.01, + "lyapunov": 1.9192491733204677, + "grad_norm": 0.09010018258992165, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008267103019950526, + "time_sec": 38.68193006515503 + }, + { + "epoch": 42, + "train_loss": 5.83203209274292, + "train_acc": 0.0089, + "test_loss": 4.6051725547790525, + "test_acc": 0.01, + "lyapunov": 1.9218718840947846, + "grad_norm": 0.09554864716201418, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743447, + "time_sec": 38.67262053489685 + }, + { + "epoch": 43, + "train_loss": 5.836768571929932, + "train_acc": 0.00868, + "test_loss": 4.605172836303711, + "test_acc": 0.01, + "lyapunov": 1.9252831368800014, + "grad_norm": 0.11288803301983473, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000810573890139155, + "time_sec": 38.673030853271484 + }, + { + "epoch": 44, + "train_loss": 5.830244238128662, + "train_acc": 0.00862, + "test_loss": 4.605172270202637, + "test_acc": 0.01, + "lyapunov": 1.9203159440204005, + "grad_norm": 0.09075156234022023, + "grad_max_sv": 0.0006292640697211027, + "grad_min_sv": 0.0, + "grad_condition": 629264069.7211027, + "lr": 0.0008022995574311873, + "time_sec": 38.67639136314392 + }, + { + "epoch": 45, + "train_loss": 5.831813296051026, + "train_acc": 0.00798, + "test_loss": 4.605172733306885, + "test_acc": 0.01, + "lyapunov": 1.9216700673408216, + "grad_norm": 0.09800318179113622, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007938926261462363, + "time_sec": 38.66922402381897 + }, + { + "epoch": 46, + "train_loss": 5.829525221710205, + "train_acc": 0.0088, + "test_loss": 4.605172639465332, + "test_acc": 0.01, + "lyapunov": 1.9197535209948449, + "grad_norm": 0.09607771134569527, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007853567838422158, + "time_sec": 38.6734299659729 + }, + { + "epoch": 47, + "train_loss": 5.831378362731933, + "train_acc": 0.00896, + "test_loss": 4.605172109985352, + "test_acc": 0.01, + "lyapunov": 1.9213088927671427, + "grad_norm": 0.09002095025572443, + "grad_max_sv": 0.0022390282712876795, + "grad_min_sv": 0.0, + "grad_condition": 2239028271.2876797, + "lr": 0.0007766957746216719, + "time_sec": 38.681992530822754 + }, + { + "epoch": 48, + "train_loss": 5.8296267512512205, + "train_acc": 0.00852, + "test_loss": 4.605172399902344, + "test_acc": 0.01, + "lyapunov": 1.9198472441919625, + "grad_norm": 0.08948131522401738, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894982, + "time_sec": 38.69184613227844 + }, + { + "epoch": 49, + "train_loss": 5.82939344329834, + "train_acc": 0.009, + "test_loss": 4.6051721862792965, + "test_acc": 0.01, + "lyapunov": 1.919716474345273, + "grad_norm": 0.08962129117217822, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000759013504686565, + "time_sec": 38.66769075393677 + }, + { + "epoch": 50, + "train_loss": 5.829856867675781, + "train_acc": 0.00824, + "test_loss": 4.605171932983398, + "test_acc": 0.01, + "lyapunov": 1.9200777041027919, + "grad_norm": 0.08949650095695762, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007499999999999998, + "time_sec": 38.6767897605896 + }, + { + "epoch": 51, + "train_loss": 5.831189596557617, + "train_acc": 0.00886, + "test_loss": 4.605172845458984, + "test_acc": 0.01, + "lyapunov": 1.9211604323838374, + "grad_norm": 0.08928877604280225, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007408768370508575, + "time_sec": 38.669432640075684 + }, + { + "epoch": 52, + "train_loss": 5.827941221618652, + "train_acc": 0.00906, + "test_loss": 4.605172493743897, + "test_acc": 0.01, + "lyapunov": 1.9184872210787995, + "grad_norm": 0.08912832082902897, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007316480175599307, + "time_sec": 38.65984392166138 + }, + { + "epoch": 53, + "train_loss": 5.829616719360351, + "train_acc": 0.00856, + "test_loss": 4.6051721878051755, + "test_acc": 0.01, + "lyapunov": 1.9199278674772025, + "grad_norm": 0.08891740863163855, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007223175895924635, + "time_sec": 38.684584856033325 + }, + { + "epoch": 54, + "train_loss": 5.828832433013916, + "train_acc": 0.00888, + "test_loss": 4.605171940612793, + "test_acc": 0.01, + "lyapunov": 1.9193241215118058, + "grad_norm": 0.08862714787237397, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825361, + "time_sec": 38.6649751663208 + }, + { + "epoch": 55, + "train_loss": 5.829295374145508, + "train_acc": 0.00864, + "test_loss": 4.6051718048095704, + "test_acc": 0.01, + "lyapunov": 1.9196355620308605, + "grad_norm": 0.08936964720805882, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007033683215378998, + "time_sec": 38.66834211349487 + }, + { + "epoch": 56, + "train_loss": 5.831980644836426, + "train_acc": 0.00872, + "test_loss": 4.605172239685059, + "test_acc": 0.01, + "lyapunov": 1.9218218890602325, + "grad_norm": 0.08828331902779529, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006937577932260512, + "time_sec": 38.67644000053406 + }, + { + "epoch": 57, + "train_loss": 5.8291939093017575, + "train_acc": 0.00898, + "test_loss": 4.605171894836426, + "test_acc": 0.01, + "lyapunov": 1.9195057918958347, + "grad_norm": 0.08970762017367405, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423388, + "time_sec": 38.66079378128052 + }, + { + "epoch": 58, + "train_loss": 5.826841032867431, + "train_acc": 0.0085, + "test_loss": 4.605172017669678, + "test_acc": 0.01, + "lyapunov": 1.9176025924170415, + "grad_norm": 0.09048223717877525, + "grad_max_sv": 0.0014875998720526695, + "grad_min_sv": 0.0, + "grad_condition": 1487599872.0526695, + "lr": 0.0006742860236609073, + "time_sec": 38.66658973693848 + }, + { + "epoch": 59, + "train_loss": 5.835019799499512, + "train_acc": 0.00882, + "test_loss": 4.60517190322876, + "test_acc": 0.01, + "lyapunov": 1.9238726757371518, + "grad_norm": 0.09441160205385561, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006644333233692913, + "time_sec": 38.67969727516174 + }, + { + "epoch": 60, + "train_loss": 5.830721065979004, + "train_acc": 0.00836, + "test_loss": 4.605171463012695, + "test_acc": 0.01, + "lyapunov": 1.9208579142685132, + "grad_norm": 0.08921306700093072, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874734, + "time_sec": 38.663196325302124 + }, + { + "epoch": 61, + "train_loss": 5.829596945648193, + "train_acc": 0.00828, + "test_loss": 4.605171449279785, + "test_acc": 0.01, + "lyapunov": 1.9199584844472157, + "grad_norm": 0.08848056161918356, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006445158984722354, + "time_sec": 38.68021297454834 + }, + { + "epoch": 62, + "train_loss": 5.830569870300293, + "train_acc": 0.00824, + "test_loss": 4.605171228790283, + "test_acc": 0.01, + "lyapunov": 1.9206647436941982, + "grad_norm": 0.08839721397975912, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006344599103076324, + "time_sec": 38.675719022750854 + }, + { + "epoch": 63, + "train_loss": 5.8305546853637695, + "train_acc": 0.00854, + "test_loss": 4.605172233581543, + "test_acc": 0.01, + "lyapunov": 1.9206541834584892, + "grad_norm": 0.08903578043587344, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824269, + "time_sec": 38.658900022506714 + }, + { + "epoch": 64, + "train_loss": 5.836477585449218, + "train_acc": 0.00876, + "test_loss": 4.605171844482422, + "test_acc": 0.01, + "lyapunov": 1.9251100108446673, + "grad_norm": 0.09951449127834824, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006141754350553275, + "time_sec": 38.67370843887329 + }, + { + "epoch": 65, + "train_loss": 5.830157748260498, + "train_acc": 0.00854, + "test_loss": 4.605171319580078, + "test_acc": 0.01, + "lyapunov": 1.920334783661396, + "grad_norm": 0.09108085096662916, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006039558454088793, + "time_sec": 38.67955160140991 + }, + { + "epoch": 66, + "train_loss": 5.828997611694336, + "train_acc": 0.00866, + "test_loss": 4.605171671295166, + "test_acc": 0.01, + "lyapunov": 1.919463188751884, + "grad_norm": 0.08904439645709107, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000593690657292862, + "time_sec": 38.67839956283569 + }, + { + "epoch": 67, + "train_loss": 5.830838754272461, + "train_acc": 0.00868, + "test_loss": 4.605171606445312, + "test_acc": 0.01, + "lyapunov": 1.9207777364174727, + "grad_norm": 0.09755498438636814, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005833843733580507, + "time_sec": 38.67587614059448 + }, + { + "epoch": 68, + "train_loss": 5.827152337646484, + "train_acc": 0.00928, + "test_loss": 4.605171282958985, + "test_acc": 0.01, + "lyapunov": 1.9178936585136082, + "grad_norm": 0.08799438562008605, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005730415142812054, + "time_sec": 38.67634415626526 + }, + { + "epoch": 69, + "train_loss": 5.830286772155762, + "train_acc": 0.0096, + "test_loss": 4.605171063232422, + "test_acc": 0.01, + "lyapunov": 1.9204461242231872, + "grad_norm": 0.09070089337302271, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821517, + "time_sec": 38.678497076034546 + }, + { + "epoch": 70, + "train_loss": 5.832680291290283, + "train_acc": 0.0098, + "test_loss": 4.605171459197998, + "test_acc": 0.01, + "lyapunov": 1.9224533403621, + "grad_norm": 0.08827257843406246, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005522642316338265, + "time_sec": 38.66450572013855 + }, + { + "epoch": 71, + "train_loss": 5.830269169921875, + "train_acc": 0.00836, + "test_loss": 4.605171234130859, + "test_acc": 0.01, + "lyapunov": 1.9205291399260616, + "grad_norm": 0.08807564726395264, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005418389216661573, + "time_sec": 38.656336545944214 + }, + { + "epoch": 72, + "train_loss": 5.830037397460938, + "train_acc": 0.00858, + "test_loss": 4.605171022033692, + "test_acc": 0.01, + "lyapunov": 1.9203362114289229, + "grad_norm": 0.08760409668351568, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646563, + "time_sec": 38.68950128555298 + }, + { + "epoch": 73, + "train_loss": 5.83207408782959, + "train_acc": 0.00862, + "test_loss": 4.605171083068847, + "test_acc": 0.01, + "lyapunov": 1.922044792138707, + "grad_norm": 0.08837012490740455, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005209378268645994, + "time_sec": 38.678892612457275 + }, + { + "epoch": 74, + "train_loss": 5.830842367553711, + "train_acc": 0.00886, + "test_loss": 4.6051713088989255, + "test_acc": 0.01, + "lyapunov": 1.9209648620746935, + "grad_norm": 0.0881334492267735, + "grad_max_sv": 0.0016617819666862488, + "grad_min_sv": 0.0, + "grad_condition": 1661781966.6862488, + "lr": 0.0005104712099416781, + "time_sec": 38.66536831855774 + }, + { + "epoch": 75, + "train_loss": 5.831041750488281, + "train_acc": 0.00846, + "test_loss": 4.605171099853516, + "test_acc": 0.01, + "lyapunov": 1.9211621680832884, + "grad_norm": 0.08829717661983798, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004999999999999996, + "time_sec": 38.674325704574585 + }, + { + "epoch": 76, + "train_loss": 5.836333667144776, + "train_acc": 0.00864, + "test_loss": 4.605171186065673, + "test_acc": 0.01, + "lyapunov": 1.9246098906792644, + "grad_norm": 0.11366095758738136, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004895287900583212, + "time_sec": 38.687448501586914 + }, + { + "epoch": 77, + "train_loss": 5.835334293212891, + "train_acc": 0.0089, + "test_loss": 4.6051709121704105, + "test_acc": 0.01, + "lyapunov": 1.9234618140608453, + "grad_norm": 0.10831693857812812, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004790621731353997, + "time_sec": 38.65811228752136 + }, + { + "epoch": 78, + "train_loss": 5.827478051452637, + "train_acc": 0.00882, + "test_loss": 4.605171005249024, + "test_acc": 0.01, + "lyapunov": 1.9182067341206934, + "grad_norm": 0.08781347391325668, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000468604740235343, + "time_sec": 38.676063537597656 + }, + { + "epoch": 79, + "train_loss": 5.8290468742370605, + "train_acc": 0.00886, + "test_loss": 4.605171278381348, + "test_acc": 0.01, + "lyapunov": 1.919505515671752, + "grad_norm": 0.08854207911135165, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00045816107833384175, + "time_sec": 38.673518896102905 + }, + { + "epoch": 80, + "train_loss": 5.833914941253662, + "train_acc": 0.0089, + "test_loss": 4.605170984649658, + "test_acc": 0.01, + "lyapunov": 1.9234306675088986, + "grad_norm": 0.09381991898821151, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004477357683661729, + "time_sec": 38.672255754470825 + }, + { + "epoch": 81, + "train_loss": 5.829356372680664, + "train_acc": 0.00902, + "test_loss": 4.605171099853516, + "test_acc": 0.01, + "lyapunov": 1.919769955413116, + "grad_norm": 0.08816368922697575, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784746, + "time_sec": 38.67954111099243 + }, + { + "epoch": 82, + "train_loss": 5.831741758117675, + "train_acc": 0.00918, + "test_loss": 4.605171073913574, + "test_acc": 0.01, + "lyapunov": 1.921732059525102, + "grad_norm": 0.09264254493603952, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004269584857187939, + "time_sec": 38.673032999038696 + }, + { + "epoch": 83, + "train_loss": 5.834408538513183, + "train_acc": 0.0092, + "test_loss": 4.605170977020264, + "test_acc": 0.01, + "lyapunov": 1.9238771880069352, + "grad_norm": 0.08953937527623661, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004166156266419484, + "time_sec": 38.68673372268677 + }, + { + "epoch": 84, + "train_loss": 5.830432665252686, + "train_acc": 0.009, + "test_loss": 4.605170909118653, + "test_acc": 0.01, + "lyapunov": 1.920691382854491, + "grad_norm": 0.08848473612958971, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004063093427071373, + "time_sec": 38.663509130477905 + }, + { + "epoch": 85, + "train_loss": 5.83150433013916, + "train_acc": 0.00862, + "test_loss": 4.605170706176758, + "test_acc": 0.01, + "lyapunov": 1.921521064875376, + "grad_norm": 0.0878123084846611, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003960441545911199, + "time_sec": 38.6465003490448 + }, + { + "epoch": 86, + "train_loss": 5.831791127319336, + "train_acc": 0.00896, + "test_loss": 4.605170570373535, + "test_acc": 0.01, + "lyapunov": 1.9217873232443925, + "grad_norm": 0.0877757716455608, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003858245649446718, + "time_sec": 38.6744065284729 + }, + { + "epoch": 87, + "train_loss": 5.832627346191407, + "train_acc": 0.00878, + "test_loss": 4.605170877075195, + "test_acc": 0.01, + "lyapunov": 1.9224827862761515, + "grad_norm": 0.08827499584565024, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00037565505641757235, + "time_sec": 38.66921091079712 + }, + { + "epoch": 88, + "train_loss": 5.8317487963867185, + "train_acc": 0.00824, + "test_loss": 4.605170699310302, + "test_acc": 0.01, + "lyapunov": 1.921761295984468, + "grad_norm": 0.08846045903994489, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036554008969236695, + "time_sec": 38.67842221260071 + }, + { + "epoch": 89, + "train_loss": 5.8302451986694335, + "train_acc": 0.00862, + "test_loss": 4.605170578765869, + "test_acc": 0.01, + "lyapunov": 1.9205519287177668, + "grad_norm": 0.0880969562704879, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003554841015277638, + "time_sec": 38.66373419761658 + }, + { + "epoch": 90, + "train_loss": 5.828649435424805, + "train_acc": 0.00928, + "test_loss": 4.605170637512207, + "test_acc": 0.01, + "lyapunov": 1.919257033816384, + "grad_norm": 0.08878565745159492, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000345491502812526, + "time_sec": 38.68431329727173 + }, + { + "epoch": 91, + "train_loss": 5.830266084594727, + "train_acc": 0.0087, + "test_loss": 4.60517045211792, + "test_acc": 0.01, + "lyapunov": 1.920564612464222, + "grad_norm": 0.0883222592119473, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003355666766307081, + "time_sec": 38.67736315727234 + }, + { + "epoch": 92, + "train_loss": 5.831894824829101, + "train_acc": 0.00856, + "test_loss": 4.605170608520508, + "test_acc": 0.01, + "lyapunov": 1.9219116762166133, + "grad_norm": 0.08764554261224523, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00032571397633909225, + "time_sec": 38.67611908912659 + }, + { + "epoch": 93, + "train_loss": 5.82894446182251, + "train_acc": 0.00844, + "test_loss": 4.6051702972412105, + "test_acc": 0.01, + "lyapunov": 1.9194979228631919, + "grad_norm": 0.08833998566442527, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766094, + "time_sec": 38.69344687461853 + }, + { + "epoch": 94, + "train_loss": 5.837506525115967, + "train_acc": 0.00874, + "test_loss": 4.60517064819336, + "test_acc": 0.01, + "lyapunov": 1.9243434188920823, + "grad_norm": 0.11393882739366498, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003062422067739483, + "time_sec": 38.68289828300476 + }, + { + "epoch": 95, + "train_loss": 5.831888694152832, + "train_acc": 0.00764, + "test_loss": 4.605170504760742, + "test_acc": 0.01, + "lyapunov": 1.9216798833568993, + "grad_norm": 0.10076789355226513, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00029663167846209965, + "time_sec": 38.68230414390564 + }, + { + "epoch": 96, + "train_loss": 5.839447547912598, + "train_acc": 0.00876, + "test_loss": 4.605170679473877, + "test_acc": 0.01, + "lyapunov": 1.9261463017719787, + "grad_norm": 0.11376740734099834, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00028711035421746345, + "time_sec": 38.6755793094635 + }, + { + "epoch": 97, + "train_loss": 5.828961611328125, + "train_acc": 0.00828, + "test_loss": 4.605170320129394, + "test_acc": 0.01, + "lyapunov": 1.9195098590363018, + "grad_norm": 0.08840788709710101, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00027768241040753615, + "time_sec": 38.676655769348145 + }, + { + "epoch": 98, + "train_loss": 5.829206983032226, + "train_acc": 0.00852, + "test_loss": 4.605170263671875, + "test_acc": 0.01, + "lyapunov": 1.9197069199188896, + "grad_norm": 0.08784611697907319, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00026835198244006903, + "time_sec": 38.679508209228516 + }, + { + "epoch": 99, + "train_loss": 5.830749737243653, + "train_acc": 0.0086, + "test_loss": 4.605170584106445, + "test_acc": 0.01, + "lyapunov": 1.9209906048786916, + "grad_norm": 0.08837860643236768, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002591231629491421, + "time_sec": 38.6536865234375 + }, + { + "epoch": 100, + "train_loss": 5.833174273071289, + "train_acc": 0.00912, + "test_loss": 4.605170581054687, + "test_acc": 0.01, + "lyapunov": 1.923052377713001, + "grad_norm": 0.0880219202195275, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002499999999999997, + "time_sec": 38.669525146484375 + }, + { + "epoch": 101, + "train_loss": 5.832474216003418, + "train_acc": 0.00924, + "test_loss": 4.605170333862305, + "test_acc": 0.01, + "lyapunov": 1.9223707411295312, + "grad_norm": 0.088109218729273, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00024098649531343477, + "time_sec": 38.68469524383545 + }, + { + "epoch": 102, + "train_loss": 5.832093044128418, + "train_acc": 0.0085, + "test_loss": 4.6051706710815425, + "test_acc": 0.01, + "lyapunov": 1.9221026568156678, + "grad_norm": 0.08806360302850152, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002320866025105016, + "time_sec": 38.667779207229614 + }, + { + "epoch": 103, + "train_loss": 5.829613971557618, + "train_acc": 0.00884, + "test_loss": 4.605170641326905, + "test_acc": 0.01, + "lyapunov": 1.9200275365044088, + "grad_norm": 0.08827372352248057, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002233042253783278, + "time_sec": 38.67877268791199 + }, + { + "epoch": 104, + "train_loss": 5.829403175201416, + "train_acc": 0.0085, + "test_loss": 4.605170069885254, + "test_acc": 0.01, + "lyapunov": 1.9198780102498085, + "grad_norm": 0.08759321728417062, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000214643216157784, + "time_sec": 38.67757058143616 + }, + { + "epoch": 105, + "train_loss": 5.83223681137085, + "train_acc": 0.00838, + "test_loss": 4.605170602416992, + "test_acc": 0.01, + "lyapunov": 1.922215115993529, + "grad_norm": 0.08796326905677253, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376332, + "time_sec": 38.667465925216675 + }, + { + "epoch": 106, + "train_loss": 5.833028655090332, + "train_acc": 0.00824, + "test_loss": 4.605170317840576, + "test_acc": 0.01, + "lyapunov": 1.92289487815574, + "grad_norm": 0.08795960069436239, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019770044256881242, + "time_sec": 38.68554091453552 + }, + { + "epoch": 107, + "train_loss": 5.827796527557373, + "train_acc": 0.00876, + "test_loss": 4.605170085144043, + "test_acc": 0.01, + "lyapunov": 1.918589440453083, + "grad_norm": 0.08772654367791473, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001894261098608447, + "time_sec": 38.68501615524292 + }, + { + "epoch": 108, + "train_loss": 5.82904862991333, + "train_acc": 0.00916, + "test_loss": 4.605170137023926, + "test_acc": 0.01, + "lyapunov": 1.9196739556539395, + "grad_norm": 0.08791956109774068, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000181288005125655, + "time_sec": 38.68057060241699 + }, + { + "epoch": 109, + "train_loss": 5.830072443237305, + "train_acc": 0.00772, + "test_loss": 4.605170295715332, + "test_acc": 0.01, + "lyapunov": 1.9204182008953046, + "grad_norm": 0.08807291337304174, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001732896980049473, + "time_sec": 38.66407561302185 + }, + { + "epoch": 110, + "train_loss": 5.830760421295166, + "train_acc": 0.00882, + "test_loss": 4.605170086669922, + "test_acc": 0.01, + "lyapunov": 1.9210344882267516, + "grad_norm": 0.08829325644128909, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016543469682057076, + "time_sec": 38.66635870933533 + }, + { + "epoch": 111, + "train_loss": 5.844144050140381, + "train_acc": 0.00756, + "test_loss": 4.605170138549805, + "test_acc": 0.01, + "lyapunov": 1.9289683185879836, + "grad_norm": 0.08860258635222626, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 38.67165184020996 + }, + { + "epoch": 112, + "train_loss": 5.830768748779297, + "train_acc": 0.0085, + "test_loss": 4.605170237731934, + "test_acc": 0.01, + "lyapunov": 1.9210170031813405, + "grad_norm": 0.0882870971276682, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 38.67701458930969 + }, + { + "epoch": 113, + "train_loss": 5.8316661862182615, + "train_acc": 0.00856, + "test_loss": 4.605170329284668, + "test_acc": 0.01, + "lyapunov": 1.921789816883214, + "grad_norm": 0.08856537933077034, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 38.66913890838623 + }, + { + "epoch": 114, + "train_loss": 5.83167002532959, + "train_acc": 0.00886, + "test_loss": 4.60517038269043, + "test_acc": 0.01, + "lyapunov": 1.9217432996501094, + "grad_norm": 0.08829399946029161, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00013551568628929425, + "time_sec": 38.68831920623779 + }, + { + "epoch": 115, + "train_loss": 5.829227747192383, + "train_acc": 0.00872, + "test_loss": 4.605170357513428, + "test_acc": 0.01, + "lyapunov": 1.9198200571567505, + "grad_norm": 0.08820685400799948, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 38.898104667663574 + }, + { + "epoch": 116, + "train_loss": 5.826888065795899, + "train_acc": 0.0084, + "test_loss": 4.605169971466064, + "test_acc": 0.01, + "lyapunov": 1.9179128426724992, + "grad_norm": 0.08799764957632915, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 38.664024114608765 + }, + { + "epoch": 117, + "train_loss": 5.833059454956055, + "train_acc": 0.00838, + "test_loss": 4.605170207214355, + "test_acc": 0.01, + "lyapunov": 1.9228876301699587, + "grad_norm": 0.09229149137870292, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 38.66628289222717 + }, + { + "epoch": 118, + "train_loss": 5.834235620422363, + "train_acc": 0.00838, + "test_loss": 4.605170387268067, + "test_acc": 0.01, + "lyapunov": 1.9234702946889737, + "grad_norm": 0.11393843809281681, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010815327133708009, + "time_sec": 38.67253303527832 + }, + { + "epoch": 119, + "train_loss": 5.836164589385986, + "train_acc": 0.00878, + "test_loss": 4.605170240783691, + "test_acc": 0.01, + "lyapunov": 1.9253446165558017, + "grad_norm": 0.13051062587564605, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010173504098790182, + "time_sec": 38.675392627716064 + }, + { + "epoch": 120, + "train_loss": 5.833294369506836, + "train_acc": 0.00902, + "test_loss": 4.605170152282715, + "test_acc": 0.01, + "lyapunov": 1.9231391212214595, + "grad_norm": 0.09107209306940374, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 38.68769383430481 + }, + { + "epoch": 121, + "train_loss": 5.830208008880615, + "train_acc": 0.00872, + "test_loss": 4.605169981384277, + "test_acc": 0.01, + "lyapunov": 1.920601219777256, + "grad_norm": 0.08818902289292577, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 38.663066148757935 + }, + { + "epoch": 122, + "train_loss": 5.828988634338379, + "train_acc": 0.00866, + "test_loss": 4.6051700424194335, + "test_acc": 0.01, + "lyapunov": 1.9195775912545832, + "grad_norm": 0.08827912521059493, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 38.66604161262512 + }, + { + "epoch": 123, + "train_loss": 5.8335463383483885, + "train_acc": 0.0083, + "test_loss": 4.605170326995849, + "test_acc": 0.01, + "lyapunov": 1.9230621321426937, + "grad_norm": 0.09180967837607329, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 38.66097450256348 + }, + { + "epoch": 124, + "train_loss": 5.8313025344848635, + "train_acc": 0.009, + "test_loss": 4.605170251464844, + "test_acc": 0.01, + "lyapunov": 1.9215273033932347, + "grad_norm": 0.0880278926594288, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 38.678382396698 + }, + { + "epoch": 125, + "train_loss": 5.829151732025147, + "train_acc": 0.00856, + "test_loss": 4.605170100402832, + "test_acc": 0.01, + "lyapunov": 1.9196982078844933, + "grad_norm": 0.08802943628622184, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 38.651947021484375 + }, + { + "epoch": 126, + "train_loss": 5.828555057067871, + "train_acc": 0.00854, + "test_loss": 4.605170222473144, + "test_acc": 0.01, + "lyapunov": 1.9192795976043662, + "grad_norm": 0.088302392455243, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 38.67385935783386 + }, + { + "epoch": 127, + "train_loss": 5.829820846405029, + "train_acc": 0.00872, + "test_loss": 4.605170227050781, + "test_acc": 0.01, + "lyapunov": 1.9203001791254029, + "grad_norm": 0.0881103504591081, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 38.67335605621338 + }, + { + "epoch": 128, + "train_loss": 5.846653115692138, + "train_acc": 0.00814, + "test_loss": 4.605170144653321, + "test_acc": 0.01, + "lyapunov": 1.9271661183413338, + "grad_norm": 0.12434413440967498, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 38.651455879211426 + }, + { + "epoch": 129, + "train_loss": 5.8315210632324215, + "train_acc": 0.00858, + "test_loss": 4.6051701629638675, + "test_acc": 0.01, + "lyapunov": 1.9216848407559992, + "grad_norm": 0.09353770310247324, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 38.65707588195801 + }, + { + "epoch": 130, + "train_loss": 5.833166874389648, + "train_acc": 0.00868, + "test_loss": 4.605170000457764, + "test_acc": 0.01, + "lyapunov": 1.9230641779082511, + "grad_norm": 0.08835242150848918, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 38.65906548500061 + }, + { + "epoch": 131, + "train_loss": 5.82969641418457, + "train_acc": 0.00892, + "test_loss": 4.60517036895752, + "test_acc": 0.01, + "lyapunov": 1.9201975795619017, + "grad_norm": 0.08800100320314078, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 38.66576051712036 + }, + { + "epoch": 132, + "train_loss": 5.830922511901855, + "train_acc": 0.00898, + "test_loss": 4.605170082092285, + "test_acc": 0.01, + "lyapunov": 1.921166550472874, + "grad_norm": 0.08780352004054458, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 38.67506122589111 + }, + { + "epoch": 133, + "train_loss": 5.830705413360596, + "train_acc": 0.0089, + "test_loss": 4.605170077514648, + "test_acc": 0.01, + "lyapunov": 1.9210232758461057, + "grad_norm": 0.08765525433917719, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 38.66982293128967 + }, + { + "epoch": 134, + "train_loss": 5.828949987030029, + "train_acc": 0.0092, + "test_loss": 4.60517048034668, + "test_acc": 0.01, + "lyapunov": 1.9195570479268613, + "grad_norm": 0.0878219052630613, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 38.658127784729004 + }, + { + "epoch": 135, + "train_loss": 5.832552122955322, + "train_acc": 0.00898, + "test_loss": 4.605170314025879, + "test_acc": 0.01, + "lyapunov": 1.922510105935509, + "grad_norm": 0.08848585809638171, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 38.671475887298584 + }, + { + "epoch": 136, + "train_loss": 5.828762425842285, + "train_acc": 0.00862, + "test_loss": 4.605170394897461, + "test_acc": 0.01, + "lyapunov": 1.9194351151166364, + "grad_norm": 0.08813677537771221, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 38.67206072807312 + }, + { + "epoch": 137, + "train_loss": 5.830585724487305, + "train_acc": 0.0092, + "test_loss": 4.605170066833496, + "test_acc": 0.01, + "lyapunov": 1.920962211725962, + "grad_norm": 0.08822452447484254, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 38.67813777923584 + }, + { + "epoch": 138, + "train_loss": 5.8304260397338865, + "train_acc": 0.0081, + "test_loss": 4.605170138549805, + "test_acc": 0.01, + "lyapunov": 1.9208168641990409, + "grad_norm": 0.08849509125868348, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 38.67507195472717 + }, + { + "epoch": 139, + "train_loss": 5.829665904846191, + "train_acc": 0.00956, + "test_loss": 4.60517013092041, + "test_acc": 0.01, + "lyapunov": 1.9201480406324576, + "grad_norm": 0.08790362350901093, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 38.673912048339844 + }, + { + "epoch": 140, + "train_loss": 5.832476518859863, + "train_acc": 0.00906, + "test_loss": 4.6051704071044925, + "test_acc": 0.01, + "lyapunov": 1.9224549364250945, + "grad_norm": 0.08802773683248163, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 38.67948055267334 + }, + { + "epoch": 141, + "train_loss": 5.830304007110596, + "train_acc": 0.00992, + "test_loss": 4.605170399475098, + "test_acc": 0.01, + "lyapunov": 1.920735996702443, + "grad_norm": 0.0882868275030572, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 38.675227880477905 + }, + { + "epoch": 142, + "train_loss": 5.831250300292969, + "train_acc": 0.00984, + "test_loss": 4.605170373535156, + "test_acc": 0.01, + "lyapunov": 1.921463219710933, + "grad_norm": 0.08794004853752245, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 38.70003008842468 + }, + { + "epoch": 143, + "train_loss": 5.832011743011474, + "train_acc": 0.00878, + "test_loss": 4.605170379638672, + "test_acc": 0.01, + "lyapunov": 1.9220852223808502, + "grad_norm": 0.08842628454422183, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 38.69024062156677 + }, + { + "epoch": 144, + "train_loss": 5.829982127532959, + "train_acc": 0.0097, + "test_loss": 4.605170482635498, + "test_acc": 0.01, + "lyapunov": 1.9204687541708008, + "grad_norm": 0.08841994345313893, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 38.6822247505188 + }, + { + "epoch": 145, + "train_loss": 5.831171199645996, + "train_acc": 0.00958, + "test_loss": 4.605170204162597, + "test_acc": 0.01, + "lyapunov": 1.9213833555845958, + "grad_norm": 0.11341783409581589, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 38.68064069747925 + }, + { + "epoch": 146, + "train_loss": 5.832137032470703, + "train_acc": 0.00976, + "test_loss": 4.605170028686524, + "test_acc": 0.01, + "lyapunov": 1.9221693624925735, + "grad_norm": 0.08798089094104568, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 38.68038535118103 + }, + { + "epoch": 147, + "train_loss": 5.83251281906128, + "train_acc": 0.00974, + "test_loss": 4.605170251464844, + "test_acc": 0.01, + "lyapunov": 1.9224824981616282, + "grad_norm": 0.08796659107314206, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 38.673001766204834 + }, + { + "epoch": 148, + "train_loss": 5.829547540588379, + "train_acc": 0.01, + "test_loss": 4.60517032623291, + "test_acc": 0.01, + "lyapunov": 1.920109924757877, + "grad_norm": 0.08826415625381624, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 38.669779539108276 + }, + { + "epoch": 149, + "train_loss": 5.830913259735107, + "train_acc": 0.01, + "test_loss": 4.605170252227783, + "test_acc": 0.01, + "lyapunov": 1.9211858764024037, + "grad_norm": 0.08849620940008496, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 38.67606210708618 + }, + { + "epoch": 150, + "train_loss": 5.830235260314941, + "train_acc": 0.01, + "test_loss": 4.605170276641846, + "test_acc": 0.01, + "lyapunov": 1.9206774539654823, + "grad_norm": 0.08822638497198837, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 38.67439675331116 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 11.062658223266602, + "train_acc": 0.0191, + "test_loss": 4.636551777648926, + "test_acc": 0.0192, + "lyapunov": 4.093391669070934, + "grad_norm": 6.553327303351535, + "grad_max_sv": 5.005066078901291, + "grad_min_sv": 9.498946289543397e-08, + "grad_condition": 96914448.49987349, + "lr": 0.0009998903417374227, + "time_sec": 81.60158228874207 + }, + { + "epoch": 2, + "train_loss": 7.894516683044434, + "train_acc": 0.02232, + "test_loss": 4.509155606079101, + "test_acc": 0.0281, + "lyapunov": 3.109319945430512, + "grad_norm": 4.711594955608515, + "grad_max_sv": 3.8599576711654664, + "grad_min_sv": 5.844970047842041e-08, + "grad_condition": 1689973621.6123517, + "lr": 0.0009995614150494292, + "time_sec": 81.60659170150757 + }, + { + "epoch": 3, + "train_loss": 7.597164999084472, + "train_acc": 0.02292, + "test_loss": 4.547392833709717, + "test_acc": 0.0138, + "lyapunov": 3.040807009353052, + "grad_norm": 3.4020100363883277, + "grad_max_sv": 2.92706837952137, + "grad_min_sv": 3.304632755468228e-08, + "grad_condition": 5977960877.86062, + "lr": 0.0009990133642141358, + "time_sec": 81.63819622993469 + }, + { + "epoch": 4, + "train_loss": 7.466654327392578, + "train_acc": 0.02596, + "test_loss": 4.54970652999878, + "test_acc": 0.0152, + "lyapunov": 3.026890999825714, + "grad_norm": 2.184726348696494, + "grad_max_sv": 1.823475405573845, + "grad_min_sv": 1.0126577207033096e-08, + "grad_condition": 8307876314.683462, + "lr": 0.0009982464296247522, + "time_sec": 81.63975858688354 + }, + { + "epoch": 5, + "train_loss": 7.35825664352417, + "train_acc": 0.0249, + "test_loss": 4.575929130554199, + "test_acc": 0.013, + "lyapunov": 2.9873962725519827, + "grad_norm": 1.2137091228137746, + "grad_max_sv": 0.961378724873066, + "grad_min_sv": 6.631390698336963e-11, + "grad_condition": 115707330637.43631, + "lr": 0.0009972609476841367, + "time_sec": 81.71280694007874 + }, + { + "epoch": 6, + "train_loss": 7.152584227600098, + "train_acc": 0.02408, + "test_loss": 4.546905226135254, + "test_acc": 0.0165, + "lyapunov": 2.8627321110357102, + "grad_norm": 0.7830228200215259, + "grad_max_sv": 0.4966236546635628, + "grad_min_sv": 8.468786915770583e-12, + "grad_condition": 112190115201.81938, + "lr": 0.000996057350657239, + "time_sec": 81.67318558692932 + }, + { + "epoch": 7, + "train_loss": 6.736108720703125, + "train_acc": 0.02286, + "test_loss": 4.6234777084350585, + "test_acc": 0.01, + "lyapunov": 2.6260088990106607, + "grad_norm": 0.503721920030939, + "grad_max_sv": 0.28278580904006956, + "grad_min_sv": 1.9822557287658092e-12, + "grad_condition": 125105415477.25314, + "lr": 0.000994636166481494, + "time_sec": 81.64523100852966 + }, + { + "epoch": 8, + "train_loss": 6.564093143463134, + "train_acc": 0.02234, + "test_loss": 4.611732032775879, + "test_acc": 0.01, + "lyapunov": 2.514471580915134, + "grad_norm": 0.6828735354454265, + "grad_max_sv": 0.2100991995772347, + "grad_min_sv": 6.476987908912428e-13, + "grad_condition": 143664013250.37378, + "lr": 0.0009929980185352525, + "time_sec": 81.63371157646179 + }, + { + "epoch": 9, + "train_loss": 6.828797580261231, + "train_acc": 0.01912, + "test_loss": 4.606410037231445, + "test_acc": 0.01, + "lyapunov": 2.654179959041078, + "grad_norm": 1.0698865873419308, + "grad_max_sv": 0.16152255814522504, + "grad_min_sv": 1.6541991394265796e-13, + "grad_condition": 140818730869.57614, + "lr": 0.0009911436253643444, + "time_sec": 81.60695457458496 + }, + { + "epoch": 10, + "train_loss": 6.993563550720215, + "train_acc": 0.01038, + "test_loss": 4.6257774490356445, + "test_acc": 0.01, + "lyapunov": 2.7042983194141437, + "grad_norm": 0.6205939496010421, + "grad_max_sv": 0.10736188860610127, + "grad_min_sv": 7.417080745085988e-16, + "grad_condition": 107239971660.70801, + "lr": 0.0009890738003669028, + "time_sec": 81.59540891647339 + }, + { + "epoch": 11, + "train_loss": 6.5890699209594725, + "train_acc": 0.01018, + "test_loss": 4.605637271881103, + "test_acc": 0.01, + "lyapunov": 2.468636756053056, + "grad_norm": 0.39837773763043477, + "grad_max_sv": 0.06119964215904474, + "grad_min_sv": 3.8185383152851266e-45, + "grad_condition": 61199642159.044754, + "lr": 0.00098678945143658, + "time_sec": 81.5604145526886 + }, + { + "epoch": 12, + "train_loss": 6.5774819650268554, + "train_acc": 0.01, + "test_loss": 4.605390992736816, + "test_acc": 0.01, + "lyapunov": 2.4586855413968607, + "grad_norm": 0.7705617527781408, + "grad_max_sv": 0.00864509902894497, + "grad_min_sv": 0.0, + "grad_condition": 8645099028.94497, + "lr": 0.0009842915805643154, + "time_sec": 81.49474096298218 + }, + { + "epoch": 13, + "train_loss": 6.546455008239746, + "train_acc": 0.01002, + "test_loss": 4.605277996826172, + "test_acc": 0.01, + "lyapunov": 2.435590844020209, + "grad_norm": 0.5128829478227843, + "grad_max_sv": 0.004509441927075386, + "grad_min_sv": 0.0, + "grad_condition": 4509441927.075386, + "lr": 0.000981581283398829, + "time_sec": 81.4997489452362 + }, + { + "epoch": 14, + "train_loss": 6.575126316833496, + "train_acc": 0.00944, + "test_loss": 4.605232641601562, + "test_acc": 0.01, + "lyapunov": 2.451746358895851, + "grad_norm": 0.5181440557950673, + "grad_max_sv": 0.013719148561358451, + "grad_min_sv": 0.0, + "grad_condition": 13719148561.358452, + "lr": 0.0009786597487660333, + "time_sec": 81.5125732421875 + }, + { + "epoch": 15, + "train_loss": 6.587129125061035, + "train_acc": 0.0092, + "test_loss": 4.605205821228028, + "test_acc": 0.01, + "lyapunov": 2.453917900314721, + "grad_norm": 0.6398426435720163, + "grad_max_sv": 0.0049395252019166945, + "grad_min_sv": 0.0, + "grad_condition": 4939525201.916695, + "lr": 0.0009755282581475766, + "time_sec": 81.50915098190308 + }, + { + "epoch": 16, + "train_loss": 6.420363327789307, + "train_acc": 0.00962, + "test_loss": 4.605900651550293, + "test_acc": 0.01, + "lyapunov": 2.3524727979889306, + "grad_norm": 0.5507826914381541, + "grad_max_sv": 0.06663376707583665, + "grad_min_sv": 0.0, + "grad_condition": 66633767075.836655, + "lr": 0.0009721881851187403, + "time_sec": 81.59744453430176 + }, + { + "epoch": 17, + "train_loss": 6.291905773010254, + "train_acc": 0.00924, + "test_loss": 4.605198278045655, + "test_acc": 0.01, + "lyapunov": 2.2705817686017515, + "grad_norm": 0.20954429598020885, + "grad_max_sv": 0.007087096758186817, + "grad_min_sv": 0.0, + "grad_condition": 7087096758.186816, + "lr": 0.0009686409947459456, + "time_sec": 81.51701307296753 + }, + { + "epoch": 18, + "train_loss": 6.280198426513672, + "train_acc": 0.00956, + "test_loss": 4.605187928009033, + "test_acc": 0.01, + "lyapunov": 2.262371898612098, + "grad_norm": 0.15673318486817656, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009648882429441254, + "time_sec": 81.49850106239319 + }, + { + "epoch": 19, + "train_loss": 6.319409269714355, + "train_acc": 0.00894, + "test_loss": 4.605180485534668, + "test_acc": 0.01, + "lyapunov": 2.2773679802789712, + "grad_norm": 0.18004037135900994, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00096093157579425, + "time_sec": 81.52363634109497 + }, + { + "epoch": 20, + "train_loss": 6.279429423370361, + "train_acc": 0.0089, + "test_loss": 4.605177160644531, + "test_acc": 0.01, + "lyapunov": 2.261986050764313, + "grad_norm": 0.10793581510968044, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009567727288213001, + "time_sec": 81.49810361862183 + }, + { + "epoch": 21, + "train_loss": 6.277427138519287, + "train_acc": 0.00862, + "test_loss": 4.605176016998291, + "test_acc": 0.01, + "lyapunov": 2.2604778922732223, + "grad_norm": 0.1164667413797286, + "grad_max_sv": 0.005474003031849861, + "grad_min_sv": 0.0, + "grad_condition": 5474003031.849861, + "lr": 0.0009524135262330095, + "time_sec": 81.49689865112305 + }, + { + "epoch": 22, + "train_loss": 6.275057526855469, + "train_acc": 0.0092, + "test_loss": 4.605175686645508, + "test_acc": 0.01, + "lyapunov": 2.258924939748271, + "grad_norm": 0.11032559480193316, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009478558801197061, + "time_sec": 81.49366521835327 + }, + { + "epoch": 23, + "train_loss": 6.280477966156006, + "train_acc": 0.00834, + "test_loss": 4.60517352142334, + "test_acc": 0.01, + "lyapunov": 2.262287087452686, + "grad_norm": 0.11733428454185782, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000943101789615607, + "time_sec": 81.4926176071167 + }, + { + "epoch": 24, + "train_loss": 6.27477842300415, + "train_acc": 0.00888, + "test_loss": 4.6051733123779295, + "test_acc": 0.01, + "lyapunov": 2.2587200552606217, + "grad_norm": 0.09563398461056706, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009381533400219313, + "time_sec": 81.48560309410095 + }, + { + "epoch": 25, + "train_loss": 6.275597013549804, + "train_acc": 0.00864, + "test_loss": 4.605174243927002, + "test_acc": 0.01, + "lyapunov": 2.259342540560476, + "grad_norm": 0.10626239815682126, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009330127018922189, + "time_sec": 81.50195908546448 + }, + { + "epoch": 26, + "train_loss": 6.307570930175781, + "train_acc": 0.00846, + "test_loss": 4.6051738105773925, + "test_acc": 0.01, + "lyapunov": 2.2765520228754226, + "grad_norm": 0.15671024580485657, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000927682130080253, + "time_sec": 81.48380661010742 + }, + { + "epoch": 27, + "train_loss": 6.3007610939025875, + "train_acc": 0.00916, + "test_loss": 4.605174212646484, + "test_acc": 0.01, + "lyapunov": 2.2724761200682893, + "grad_norm": 0.15438417468612603, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009221639627510072, + "time_sec": 81.49885392189026 + }, + { + "epoch": 28, + "train_loss": 6.279321163024902, + "train_acc": 0.0084, + "test_loss": 4.605173818206787, + "test_acc": 0.01, + "lyapunov": 2.261768304478482, + "grad_norm": 0.12913751626297293, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009164606203550494, + "time_sec": 81.51960349082947 + }, + { + "epoch": 29, + "train_loss": 6.296547222290039, + "train_acc": 0.00844, + "test_loss": 4.605173532104492, + "test_acc": 0.01, + "lyapunov": 2.269540443444801, + "grad_norm": 0.1257561792074065, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009105746045668516, + "time_sec": 81.48529624938965 + }, + { + "epoch": 30, + "train_loss": 6.301725520019532, + "train_acc": 0.00894, + "test_loss": 4.605173407745362, + "test_acc": 0.01, + "lyapunov": 2.2715838626217657, + "grad_norm": 0.14077235565425347, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009045084971874733, + "time_sec": 81.47704434394836 + }, + { + "epoch": 31, + "train_loss": 6.279767997894287, + "train_acc": 0.0086, + "test_loss": 4.6051743087768555, + "test_acc": 0.01, + "lyapunov": 2.261623111222406, + "grad_norm": 0.11414807727359211, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008982649590120977, + "time_sec": 81.51038384437561 + }, + { + "epoch": 32, + "train_loss": 6.314449734039306, + "train_acc": 0.0091, + "test_loss": 4.605173248291016, + "test_acc": 0.01, + "lyapunov": 2.27814206686776, + "grad_norm": 0.15985043411867914, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008918467286629196, + "time_sec": 81.49317169189453 + }, + { + "epoch": 33, + "train_loss": 6.281702154998779, + "train_acc": 0.0086, + "test_loss": 4.605174011993408, + "test_acc": 0.01, + "lyapunov": 2.262753884810621, + "grad_norm": 0.12070866490334974, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008852566213878943, + "time_sec": 81.49454641342163 + }, + { + "epoch": 34, + "train_loss": 6.2773644987487796, + "train_acc": 0.00906, + "test_loss": 4.605173474121094, + "test_acc": 0.01, + "lyapunov": 2.260565836411303, + "grad_norm": 0.11129476697402911, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000878497527825878, + "time_sec": 81.58190107345581 + }, + { + "epoch": 35, + "train_loss": 6.309268474578857, + "train_acc": 0.00864, + "test_loss": 4.605172872161865, + "test_acc": 0.01, + "lyapunov": 2.277102802110755, + "grad_norm": 0.17254724942107424, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000871572412738697, + "time_sec": 81.51573705673218 + }, + { + "epoch": 36, + "train_loss": 6.2885913528442385, + "train_acc": 0.00894, + "test_loss": 4.605173197937011, + "test_acc": 0.01, + "lyapunov": 2.2663694641474263, + "grad_norm": 0.12446302100514797, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008644843137107055, + "time_sec": 81.4983901977539 + }, + { + "epoch": 37, + "train_loss": 6.314083187561035, + "train_acc": 0.00826, + "test_loss": 4.605172673034668, + "test_acc": 0.01, + "lyapunov": 2.2792197420164144, + "grad_norm": 0.19167369428125208, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008572363398164014, + "time_sec": 81.4910204410553 + }, + { + "epoch": 38, + "train_loss": 6.276701861419678, + "train_acc": 0.00804, + "test_loss": 4.605172772979737, + "test_acc": 0.01, + "lyapunov": 2.260084454055942, + "grad_norm": 0.10142640032392508, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008498316702566826, + "time_sec": 81.49372029304504 + }, + { + "epoch": 39, + "train_loss": 6.2982295426940915, + "train_acc": 0.00834, + "test_loss": 4.605172825622558, + "test_acc": 0.01, + "lyapunov": 2.271109230378095, + "grad_norm": 0.13881594105822967, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008422735529643442, + "time_sec": 81.50897860527039 + }, + { + "epoch": 40, + "train_loss": 6.282011164550782, + "train_acc": 0.00864, + "test_loss": 4.607664538574219, + "test_acc": 0.01, + "lyapunov": 2.263592470637368, + "grad_norm": 0.1022934137238382, + "grad_max_sv": 0.006253971112892031, + "grad_min_sv": 0.0, + "grad_condition": 6253971112.892032, + "lr": 0.0008345653031794289, + "time_sec": 81.51133847236633 + }, + { + "epoch": 41, + "train_loss": 6.283648276977539, + "train_acc": 0.00898, + "test_loss": 4.615698904418945, + "test_acc": 0.01, + "lyapunov": 2.2645610153217755, + "grad_norm": 0.12524739066407903, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008267103019950526, + "time_sec": 81.50317192077637 + }, + { + "epoch": 42, + "train_loss": 6.291501354827881, + "train_acc": 0.00914, + "test_loss": 4.605554750061035, + "test_acc": 0.01, + "lyapunov": 2.267925240499589, + "grad_norm": 0.1307307918214705, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743447, + "time_sec": 81.48968553543091 + }, + { + "epoch": 43, + "train_loss": 6.276330156860352, + "train_acc": 0.00896, + "test_loss": 4.605246144104004, + "test_acc": 0.01, + "lyapunov": 2.2598801464071054, + "grad_norm": 0.0933943349122675, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000810573890139155, + "time_sec": 81.50180649757385 + }, + { + "epoch": 44, + "train_loss": 6.2769957354736325, + "train_acc": 0.00898, + "test_loss": 4.60537618560791, + "test_acc": 0.01, + "lyapunov": 2.26023776756833, + "grad_norm": 0.10724706931673801, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008022995574311873, + "time_sec": 81.48934960365295 + }, + { + "epoch": 45, + "train_loss": 6.27975429473877, + "train_acc": 0.0095, + "test_loss": 4.605248934936523, + "test_acc": 0.01, + "lyapunov": 2.2623073298607945, + "grad_norm": 0.095192742319822, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007938926261462363, + "time_sec": 81.50000143051147 + }, + { + "epoch": 46, + "train_loss": 6.297380412445069, + "train_acc": 0.00876, + "test_loss": 4.6052475326538085, + "test_acc": 0.01, + "lyapunov": 2.271654522327511, + "grad_norm": 0.1534535578732401, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007853567838422158, + "time_sec": 81.47789859771729 + }, + { + "epoch": 47, + "train_loss": 6.282922696990966, + "train_acc": 0.0092, + "test_loss": 4.605248429107666, + "test_acc": 0.01, + "lyapunov": 2.264536363084603, + "grad_norm": 0.10842785613108402, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007766957746216719, + "time_sec": 81.48331236839294 + }, + { + "epoch": 48, + "train_loss": 6.280480013275146, + "train_acc": 0.00806, + "test_loss": 4.605249649047852, + "test_acc": 0.01, + "lyapunov": 2.2628020630468186, + "grad_norm": 0.09295297080650741, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894982, + "time_sec": 81.48791313171387 + }, + { + "epoch": 49, + "train_loss": 6.295236266479492, + "train_acc": 0.0081, + "test_loss": 4.605244645690918, + "test_acc": 0.01, + "lyapunov": 2.270114410868691, + "grad_norm": 0.14920321268372522, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000759013504686565, + "time_sec": 81.49582886695862 + }, + { + "epoch": 50, + "train_loss": 6.315434308013916, + "train_acc": 0.00828, + "test_loss": 4.605247691345215, + "test_acc": 0.01, + "lyapunov": 2.2807927832883945, + "grad_norm": 0.17847170404488147, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007499999999999998, + "time_sec": 81.49979019165039 + }, + { + "epoch": 51, + "train_loss": 6.302057292938232, + "train_acc": 0.009, + "test_loss": 4.605251131439209, + "test_acc": 0.01, + "lyapunov": 2.2735387291139957, + "grad_norm": 0.1418090218860237, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007408768370508575, + "time_sec": 81.49881410598755 + }, + { + "epoch": 52, + "train_loss": 6.278756464233399, + "train_acc": 0.00866, + "test_loss": 4.605250935363769, + "test_acc": 0.01, + "lyapunov": 2.2616379620778897, + "grad_norm": 0.09283264461248593, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007316480175599307, + "time_sec": 81.49807143211365 + }, + { + "epoch": 53, + "train_loss": 6.276537058105469, + "train_acc": 0.00894, + "test_loss": 4.605252996826172, + "test_acc": 0.01, + "lyapunov": 2.2600054393339035, + "grad_norm": 0.09889008649312356, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007223175895924635, + "time_sec": 81.50720810890198 + }, + { + "epoch": 54, + "train_loss": 6.2842115702819825, + "train_acc": 0.0088, + "test_loss": 4.60517135925293, + "test_acc": 0.01, + "lyapunov": 2.2653747550057024, + "grad_norm": 0.1176830015085984, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825361, + "time_sec": 81.49119186401367 + }, + { + "epoch": 55, + "train_loss": 6.280401730041504, + "train_acc": 0.00886, + "test_loss": 4.605172096252441, + "test_acc": 0.01, + "lyapunov": 2.262633579771232, + "grad_norm": 0.10354075360180534, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007033683215378998, + "time_sec": 81.49315738677979 + }, + { + "epoch": 56, + "train_loss": 6.316937896728516, + "train_acc": 0.00866, + "test_loss": 4.605172169494629, + "test_acc": 0.01, + "lyapunov": 2.2807149234635142, + "grad_norm": 0.15351000119410838, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006937577932260512, + "time_sec": 81.5045874118805 + }, + { + "epoch": 57, + "train_loss": 6.296867928161621, + "train_acc": 0.00924, + "test_loss": 4.605172319030761, + "test_acc": 0.01, + "lyapunov": 2.272276422861592, + "grad_norm": 0.14439465021569048, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423388, + "time_sec": 81.49606895446777 + }, + { + "epoch": 58, + "train_loss": 6.277121980133057, + "train_acc": 0.00822, + "test_loss": 4.605172018432617, + "test_acc": 0.01, + "lyapunov": 2.26043635926893, + "grad_norm": 0.09147768117276701, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006742860236609073, + "time_sec": 81.49943733215332 + }, + { + "epoch": 59, + "train_loss": 6.2761470947265625, + "train_acc": 0.00864, + "test_loss": 4.605172242736816, + "test_acc": 0.01, + "lyapunov": 2.2597581962185442, + "grad_norm": 0.0885807415167131, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006644333233692913, + "time_sec": 81.49118137359619 + }, + { + "epoch": 60, + "train_loss": 6.297447052307129, + "train_acc": 0.00916, + "test_loss": 4.605172019195557, + "test_acc": 0.01, + "lyapunov": 2.2733187815722298, + "grad_norm": 0.15437497590627458, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874734, + "time_sec": 81.49486422538757 + }, + { + "epoch": 61, + "train_loss": 6.3111451325988766, + "train_acc": 0.00872, + "test_loss": 4.605171881103516, + "test_acc": 0.01, + "lyapunov": 2.279795357638308, + "grad_norm": 0.1590526758324701, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006445158984722354, + "time_sec": 81.56430292129517 + }, + { + "epoch": 62, + "train_loss": 6.295817751617432, + "train_acc": 0.00874, + "test_loss": 4.605171612548828, + "test_acc": 0.01, + "lyapunov": 2.271848827981583, + "grad_norm": 0.1613023358766049, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006344599103076324, + "time_sec": 81.48160147666931 + }, + { + "epoch": 63, + "train_loss": 6.307024629974365, + "train_acc": 0.0085, + "test_loss": 4.605171653747559, + "test_acc": 0.01, + "lyapunov": 2.2748339487158735, + "grad_norm": 0.13676348001909264, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824269, + "time_sec": 81.48560905456543 + }, + { + "epoch": 64, + "train_loss": 6.277896643218994, + "train_acc": 0.00846, + "test_loss": 4.605171467590332, + "test_acc": 0.01, + "lyapunov": 2.261008509589583, + "grad_norm": 0.09063727687835958, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006141754350553275, + "time_sec": 81.4799861907959 + }, + { + "epoch": 65, + "train_loss": 6.285225621643066, + "train_acc": 0.00848, + "test_loss": 4.605171078491211, + "test_acc": 0.01, + "lyapunov": 2.2658682217073562, + "grad_norm": 0.10317682067163818, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006039558454088793, + "time_sec": 81.51162958145142 + }, + { + "epoch": 66, + "train_loss": 6.280715701446534, + "train_acc": 0.00842, + "test_loss": 4.605171147918701, + "test_acc": 0.01, + "lyapunov": 2.2628414155272267, + "grad_norm": 0.09673219941672938, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000593690657292862, + "time_sec": 81.47932028770447 + }, + { + "epoch": 67, + "train_loss": 6.277698368530274, + "train_acc": 0.00856, + "test_loss": 4.6051715675354, + "test_acc": 0.01, + "lyapunov": 2.26088782466586, + "grad_norm": 0.09056972140208994, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005833843733580507, + "time_sec": 81.48698115348816 + }, + { + "epoch": 68, + "train_loss": 6.30627403137207, + "train_acc": 0.00826, + "test_loss": 4.605171142578125, + "test_acc": 0.01, + "lyapunov": 2.2745680943169555, + "grad_norm": 0.13148861913625765, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005730415142812054, + "time_sec": 81.49131727218628 + }, + { + "epoch": 69, + "train_loss": 6.280330782623291, + "train_acc": 0.00892, + "test_loss": 4.605170972442627, + "test_acc": 0.01, + "lyapunov": 2.2627177104315797, + "grad_norm": 0.1124362788188755, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821517, + "time_sec": 83.16999244689941 + }, + { + "epoch": 70, + "train_loss": 6.28732081451416, + "train_acc": 0.00818, + "test_loss": 4.605170994567871, + "test_acc": 0.01, + "lyapunov": 2.2672290460532887, + "grad_norm": 0.10634119980305662, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005522642316338265, + "time_sec": 81.48939347267151 + }, + { + "epoch": 71, + "train_loss": 6.279782330627442, + "train_acc": 0.00912, + "test_loss": 4.605171276855469, + "test_acc": 0.01, + "lyapunov": 2.262383164652168, + "grad_norm": 0.10626668013646236, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005418389216661573, + "time_sec": 81.48840260505676 + }, + { + "epoch": 72, + "train_loss": 6.295553107910156, + "train_acc": 0.00816, + "test_loss": 4.605171234130859, + "test_acc": 0.01, + "lyapunov": 2.2699396323669903, + "grad_norm": 0.10087516213292237, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646563, + "time_sec": 81.66768407821655 + }, + { + "epoch": 73, + "train_loss": 6.279174601287842, + "train_acc": 0.00854, + "test_loss": 4.605171266174317, + "test_acc": 0.01, + "lyapunov": 2.261961253402788, + "grad_norm": 0.09224354382614662, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005209378268645994, + "time_sec": 81.47679734230042 + }, + { + "epoch": 74, + "train_loss": 6.282529046783448, + "train_acc": 0.00878, + "test_loss": 4.605171199035644, + "test_acc": 0.01, + "lyapunov": 2.263870295966068, + "grad_norm": 0.09731782277810722, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005104712099416781, + "time_sec": 81.49993348121643 + }, + { + "epoch": 75, + "train_loss": 6.277901949768067, + "train_acc": 0.0089, + "test_loss": 4.605170727539062, + "test_acc": 0.01, + "lyapunov": 2.261039003996593, + "grad_norm": 0.09211112509965803, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004999999999999996, + "time_sec": 81.50083065032959 + }, + { + "epoch": 76, + "train_loss": 6.340216960601807, + "train_acc": 0.00838, + "test_loss": 4.605170699310302, + "test_acc": 0.01, + "lyapunov": 2.2909446268740212, + "grad_norm": 0.23685392065021807, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004895287900583212, + "time_sec": 81.50020790100098 + }, + { + "epoch": 77, + "train_loss": 6.312104174957275, + "train_acc": 0.00864, + "test_loss": 4.605171252441406, + "test_acc": 0.01, + "lyapunov": 2.2805933543788197, + "grad_norm": 0.18831482170422406, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004790621731353997, + "time_sec": 81.49737644195557 + }, + { + "epoch": 78, + "train_loss": 6.2789193016052245, + "train_acc": 0.00852, + "test_loss": 4.605171314239502, + "test_acc": 0.01, + "lyapunov": 2.261766994090946, + "grad_norm": 0.0924358449039435, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000468604740235343, + "time_sec": 81.48207116127014 + }, + { + "epoch": 79, + "train_loss": 6.278578204803467, + "train_acc": 0.00926, + "test_loss": 4.6051709121704105, + "test_acc": 0.01, + "lyapunov": 2.2615611260504367, + "grad_norm": 0.106081439799758, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00045816107833384175, + "time_sec": 81.5153739452362 + }, + { + "epoch": 80, + "train_loss": 6.280757647094727, + "train_acc": 0.00926, + "test_loss": 4.605170848083496, + "test_acc": 0.01, + "lyapunov": 2.2630625789427694, + "grad_norm": 0.09000806752766331, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004477357683661729, + "time_sec": 81.48912286758423 + }, + { + "epoch": 81, + "train_loss": 6.281069091949463, + "train_acc": 0.00898, + "test_loss": 4.605170893859864, + "test_acc": 0.01, + "lyapunov": 2.263333380984528, + "grad_norm": 0.09221512328536063, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784746, + "time_sec": 81.5581386089325 + }, + { + "epoch": 82, + "train_loss": 6.27887787902832, + "train_acc": 0.0087, + "test_loss": 4.605170852661133, + "test_acc": 0.01, + "lyapunov": 2.261768191671737, + "grad_norm": 0.09223604647823178, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004269584857187939, + "time_sec": 81.48868751525879 + }, + { + "epoch": 83, + "train_loss": 6.283419313049317, + "train_acc": 0.00842, + "test_loss": 4.605170945739746, + "test_acc": 0.01, + "lyapunov": 2.2647099933965738, + "grad_norm": 0.11489596444213686, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004166156266419484, + "time_sec": 81.48753881454468 + }, + { + "epoch": 84, + "train_loss": 6.331098417663574, + "train_acc": 0.00886, + "test_loss": 4.605170746612549, + "test_acc": 0.01, + "lyapunov": 2.288768025005565, + "grad_norm": 0.21523480615204088, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004063093427071373, + "time_sec": 81.49917888641357 + }, + { + "epoch": 85, + "train_loss": 6.279946563415527, + "train_acc": 0.00858, + "test_loss": 4.605170806884765, + "test_acc": 0.01, + "lyapunov": 2.262576125162032, + "grad_norm": 0.09063877969543369, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003960441545911199, + "time_sec": 81.49754786491394 + }, + { + "epoch": 86, + "train_loss": 6.294878379211426, + "train_acc": 0.0082, + "test_loss": 4.605170738983154, + "test_acc": 0.01, + "lyapunov": 2.270076130967006, + "grad_norm": 0.11269347737073286, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003858245649446718, + "time_sec": 81.49726057052612 + }, + { + "epoch": 87, + "train_loss": 6.2920974577331545, + "train_acc": 0.009, + "test_loss": 4.6051703125, + "test_acc": 0.01, + "lyapunov": 2.2685716097312207, + "grad_norm": 0.14345779012680526, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00037565505641757235, + "time_sec": 81.51811003684998 + }, + { + "epoch": 88, + "train_loss": 6.280257380981445, + "train_acc": 0.00862, + "test_loss": 4.605170468139648, + "test_acc": 0.01, + "lyapunov": 2.262734867422782, + "grad_norm": 0.089208601870095, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036554008969236695, + "time_sec": 81.54773998260498 + }, + { + "epoch": 89, + "train_loss": 6.281720874176026, + "train_acc": 0.00798, + "test_loss": 4.605170385742188, + "test_acc": 0.01, + "lyapunov": 2.2637228892587333, + "grad_norm": 0.13294770236555567, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003554841015277638, + "time_sec": 81.49507021903992 + }, + { + "epoch": 90, + "train_loss": 6.282031690979004, + "train_acc": 0.00864, + "test_loss": 4.6051704216003415, + "test_acc": 0.01, + "lyapunov": 2.263972556804452, + "grad_norm": 0.09670924579322722, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000345491502812526, + "time_sec": 81.50043749809265 + }, + { + "epoch": 91, + "train_loss": 6.281220606231689, + "train_acc": 0.00882, + "test_loss": 4.605170685577392, + "test_acc": 0.01, + "lyapunov": 2.2634493798551047, + "grad_norm": 0.08948481670861189, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003355666766307081, + "time_sec": 81.50585508346558 + }, + { + "epoch": 92, + "train_loss": 6.279705551147461, + "train_acc": 0.00862, + "test_loss": 4.60517056274414, + "test_acc": 0.01, + "lyapunov": 2.2624147529797174, + "grad_norm": 0.09256700006903949, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00032571397633909225, + "time_sec": 81.51557660102844 + }, + { + "epoch": 93, + "train_loss": 6.281244622955322, + "train_acc": 0.0087, + "test_loss": 4.60517061920166, + "test_acc": 0.01, + "lyapunov": 2.2632562803185503, + "grad_norm": 0.11132757286060115, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766094, + "time_sec": 81.49661374092102 + }, + { + "epoch": 94, + "train_loss": 6.306097177734375, + "train_acc": 0.00858, + "test_loss": 4.605170388793946, + "test_acc": 0.01, + "lyapunov": 2.274985415856247, + "grad_norm": 0.14003151421649307, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003062422067739483, + "time_sec": 81.48347187042236 + }, + { + "epoch": 95, + "train_loss": 6.283950561676026, + "train_acc": 0.00878, + "test_loss": 4.605170606994629, + "test_acc": 0.01, + "lyapunov": 2.264391293001297, + "grad_norm": 0.11506545388832123, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00029663167846209965, + "time_sec": 81.5063374042511 + }, + { + "epoch": 96, + "train_loss": 6.302323147125244, + "train_acc": 0.00874, + "test_loss": 4.60517081451416, + "test_acc": 0.01, + "lyapunov": 2.274367270872111, + "grad_norm": 0.12307854636703328, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00028711035421746345, + "time_sec": 81.4797682762146 + }, + { + "epoch": 97, + "train_loss": 6.281584391479492, + "train_acc": 0.00864, + "test_loss": 4.605170351409912, + "test_acc": 0.01, + "lyapunov": 2.2636835014118866, + "grad_norm": 0.10251001946667801, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00027768241040753615, + "time_sec": 81.49354839324951 + }, + { + "epoch": 98, + "train_loss": 6.2782898904418944, + "train_acc": 0.00868, + "test_loss": 4.60517045135498, + "test_acc": 0.01, + "lyapunov": 2.261435853245923, + "grad_norm": 0.08854436555507054, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00026835198244006903, + "time_sec": 81.4875979423523 + }, + { + "epoch": 99, + "train_loss": 6.295129021606446, + "train_acc": 0.0082, + "test_loss": 4.605170526123047, + "test_acc": 0.01, + "lyapunov": 2.2712618536351585, + "grad_norm": 0.11715866448048785, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002591231629491421, + "time_sec": 81.48900055885315 + }, + { + "epoch": 100, + "train_loss": 6.278292948303223, + "train_acc": 0.00866, + "test_loss": 4.605170332336426, + "test_acc": 0.01, + "lyapunov": 2.2613569385255388, + "grad_norm": 0.09963153634244509, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002499999999999997, + "time_sec": 81.49986267089844 + }, + { + "epoch": 101, + "train_loss": 6.278483645935059, + "train_acc": 0.00804, + "test_loss": 4.60517053604126, + "test_acc": 0.01, + "lyapunov": 2.261537701272599, + "grad_norm": 0.08871006809333543, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00024098649531343477, + "time_sec": 81.51374125480652 + }, + { + "epoch": 102, + "train_loss": 6.280324393310547, + "train_acc": 0.00806, + "test_loss": 4.605170599365234, + "test_acc": 0.01, + "lyapunov": 2.262814277883076, + "grad_norm": 0.08821870247597413, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002320866025105016, + "time_sec": 81.50025415420532 + }, + { + "epoch": 103, + "train_loss": 6.2799532815551755, + "train_acc": 0.00876, + "test_loss": 4.605170227050781, + "test_acc": 0.01, + "lyapunov": 2.2625574236330777, + "grad_norm": 0.08935081241113577, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002233042253783278, + "time_sec": 81.50659584999084 + }, + { + "epoch": 104, + "train_loss": 6.298912643432617, + "train_acc": 0.00842, + "test_loss": 4.60517052154541, + "test_acc": 0.01, + "lyapunov": 2.2703244808079948, + "grad_norm": 0.11414965346863236, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000214643216157784, + "time_sec": 81.5045850276947 + }, + { + "epoch": 105, + "train_loss": 6.290122275390625, + "train_acc": 0.0086, + "test_loss": 4.605170248413086, + "test_acc": 0.01, + "lyapunov": 2.268586759981902, + "grad_norm": 0.09478727747372748, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376332, + "time_sec": 81.49806952476501 + }, + { + "epoch": 106, + "train_loss": 6.29548063659668, + "train_acc": 0.00866, + "test_loss": 4.605170534515381, + "test_acc": 0.01, + "lyapunov": 2.2701295159966746, + "grad_norm": 0.11489602174527157, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019770044256881242, + "time_sec": 81.48596048355103 + }, + { + "epoch": 107, + "train_loss": 6.282184426269532, + "train_acc": 0.0082, + "test_loss": 4.605170352172852, + "test_acc": 0.01, + "lyapunov": 2.2641438352482397, + "grad_norm": 0.08961045804319463, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001894261098608447, + "time_sec": 81.49523115158081 + }, + { + "epoch": 108, + "train_loss": 6.2777880932617185, + "train_acc": 0.00864, + "test_loss": 4.605170249938965, + "test_acc": 0.01, + "lyapunov": 2.2611292018305007, + "grad_norm": 0.08837496982685777, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000181288005125655, + "time_sec": 81.5235505104065 + }, + { + "epoch": 109, + "train_loss": 6.279533188171387, + "train_acc": 0.00846, + "test_loss": 4.6051705436706545, + "test_acc": 0.01, + "lyapunov": 2.2622785964585326, + "grad_norm": 0.09025198956904176, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001732896980049473, + "time_sec": 81.49149775505066 + }, + { + "epoch": 110, + "train_loss": 6.281950114135742, + "train_acc": 0.00808, + "test_loss": 4.605170324707031, + "test_acc": 0.01, + "lyapunov": 2.2638927835332767, + "grad_norm": 0.09569022356709349, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016543469682057076, + "time_sec": 81.48516082763672 + }, + { + "epoch": 111, + "train_loss": 6.28185485534668, + "train_acc": 0.00926, + "test_loss": 4.6051703125, + "test_acc": 0.01, + "lyapunov": 2.2638340045119185, + "grad_norm": 0.08892162931996153, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 81.49398422241211 + }, + { + "epoch": 112, + "train_loss": 6.310760371704101, + "train_acc": 0.0083, + "test_loss": 4.605170272064209, + "test_acc": 0.01, + "lyapunov": 2.2783618381870983, + "grad_norm": 0.14829000342501422, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 81.47959303855896 + }, + { + "epoch": 113, + "train_loss": 6.280448321685791, + "train_acc": 0.00868, + "test_loss": 4.605170561218261, + "test_acc": 0.01, + "lyapunov": 2.262940209235072, + "grad_norm": 0.08905882191321668, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 81.49572110176086 + }, + { + "epoch": 114, + "train_loss": 6.29521280166626, + "train_acc": 0.00898, + "test_loss": 4.6051701675415035, + "test_acc": 0.01, + "lyapunov": 2.2707663734855554, + "grad_norm": 0.10226349996651533, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00013551568628929425, + "time_sec": 81.48670983314514 + }, + { + "epoch": 115, + "train_loss": 6.2799824197387695, + "train_acc": 0.00898, + "test_loss": 4.605170332336426, + "test_acc": 0.01, + "lyapunov": 2.2626387176611233, + "grad_norm": 0.08828544817683198, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 81.48745203018188 + }, + { + "epoch": 116, + "train_loss": 6.2778549322509765, + "train_acc": 0.00826, + "test_loss": 4.6051702964782715, + "test_acc": 0.01, + "lyapunov": 2.26113668122255, + "grad_norm": 0.08806272896088922, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 81.54066944122314 + }, + { + "epoch": 117, + "train_loss": 6.279518751220703, + "train_acc": 0.00934, + "test_loss": 4.605170413208008, + "test_acc": 0.01, + "lyapunov": 2.2623144555884553, + "grad_norm": 0.0877771191158831, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 81.48839020729065 + }, + { + "epoch": 118, + "train_loss": 6.281088227996826, + "train_acc": 0.00902, + "test_loss": 4.605170362854004, + "test_acc": 0.01, + "lyapunov": 2.2633964198324685, + "grad_norm": 0.0880896864668632, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010815327133708009, + "time_sec": 81.50261282920837 + }, + { + "epoch": 119, + "train_loss": 6.282254580841064, + "train_acc": 0.00884, + "test_loss": 4.605170101165771, + "test_acc": 0.01, + "lyapunov": 2.264233167214162, + "grad_norm": 0.08831557648722567, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010173504098790182, + "time_sec": 81.52568435668945 + }, + { + "epoch": 120, + "train_loss": 6.277676391906739, + "train_acc": 0.0087, + "test_loss": 4.6051705383300785, + "test_acc": 0.01, + "lyapunov": 2.2610504279661057, + "grad_norm": 0.08852764058763012, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 81.50404500961304 + }, + { + "epoch": 121, + "train_loss": 6.282078470611572, + "train_acc": 0.00904, + "test_loss": 4.605170125579834, + "test_acc": 0.01, + "lyapunov": 2.264081825685623, + "grad_norm": 0.08733889209956962, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 81.49174380302429 + }, + { + "epoch": 122, + "train_loss": 6.280417911529541, + "train_acc": 0.00854, + "test_loss": 4.605170150756836, + "test_acc": 0.01, + "lyapunov": 2.2629349579286697, + "grad_norm": 0.08896774607886365, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 81.48855018615723 + }, + { + "epoch": 123, + "train_loss": 6.279605996398926, + "train_acc": 0.00798, + "test_loss": 4.605170092773437, + "test_acc": 0.01, + "lyapunov": 2.262386467755603, + "grad_norm": 0.08795933479592377, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 81.50146007537842 + }, + { + "epoch": 124, + "train_loss": 6.291684345397949, + "train_acc": 0.00856, + "test_loss": 4.6051700492858885, + "test_acc": 0.01, + "lyapunov": 2.2678240815087047, + "grad_norm": 0.11392589044407447, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 81.48491311073303 + }, + { + "epoch": 125, + "train_loss": 6.285427192077637, + "train_acc": 0.00888, + "test_loss": 4.605170321655273, + "test_acc": 0.01, + "lyapunov": 2.2660442904743086, + "grad_norm": 0.1133754054706649, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 81.49100470542908 + }, + { + "epoch": 126, + "train_loss": 6.280400201568604, + "train_acc": 0.00878, + "test_loss": 4.6051705368041995, + "test_acc": 0.01, + "lyapunov": 2.2629254120390128, + "grad_norm": 0.08821452866992016, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 81.49153852462769 + }, + { + "epoch": 127, + "train_loss": 6.279529089202881, + "train_acc": 0.0088, + "test_loss": 4.605170316314697, + "test_acc": 0.01, + "lyapunov": 2.2623902915993614, + "grad_norm": 0.08745608733781365, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 81.50230026245117 + }, + { + "epoch": 128, + "train_loss": 6.278408692016601, + "train_acc": 0.00888, + "test_loss": 4.605170304870605, + "test_acc": 0.01, + "lyapunov": 2.261508503228502, + "grad_norm": 0.08825893270809801, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 81.49138951301575 + }, + { + "epoch": 129, + "train_loss": 6.279044237976074, + "train_acc": 0.00934, + "test_loss": 4.605170484924316, + "test_acc": 0.01, + "lyapunov": 2.261979506753595, + "grad_norm": 0.08762519682827673, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 81.50332951545715 + }, + { + "epoch": 130, + "train_loss": 6.2814196604919434, + "train_acc": 0.00892, + "test_loss": 4.605170237731934, + "test_acc": 0.01, + "lyapunov": 2.263650309399266, + "grad_norm": 0.0879745908721408, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 81.48634791374207 + }, + { + "epoch": 131, + "train_loss": 6.279289369659423, + "train_acc": 0.00816, + "test_loss": 4.605170503234863, + "test_acc": 0.01, + "lyapunov": 2.2619674528956106, + "grad_norm": 0.08830358541425926, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 81.49762201309204 + }, + { + "epoch": 132, + "train_loss": 6.284051736145019, + "train_acc": 0.00918, + "test_loss": 4.605169993591309, + "test_acc": 0.01, + "lyapunov": 2.265367220734696, + "grad_norm": 0.09065551426084856, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 81.5026957988739 + }, + { + "epoch": 133, + "train_loss": 6.28203574508667, + "train_acc": 0.00886, + "test_loss": 4.60517046508789, + "test_acc": 0.01, + "lyapunov": 2.264016958148888, + "grad_norm": 0.08811709248877145, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 81.4884991645813 + }, + { + "epoch": 134, + "train_loss": 6.295380000305176, + "train_acc": 0.00924, + "test_loss": 4.6051701171875, + "test_acc": 0.01, + "lyapunov": 2.270651138652011, + "grad_norm": 0.09385452218544989, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 81.49120998382568 + }, + { + "epoch": 135, + "train_loss": 6.279313954925537, + "train_acc": 0.0096, + "test_loss": 4.605170198059082, + "test_acc": 0.01, + "lyapunov": 2.2621799277527557, + "grad_norm": 0.08809804121534516, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 81.503009557724 + }, + { + "epoch": 136, + "train_loss": 6.281174714050293, + "train_acc": 0.009, + "test_loss": 4.605170434570312, + "test_acc": 0.01, + "lyapunov": 2.263484787758049, + "grad_norm": 0.08787496788421857, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 81.49492454528809 + }, + { + "epoch": 137, + "train_loss": 6.2790307751464844, + "train_acc": 0.00906, + "test_loss": 4.605170115661621, + "test_acc": 0.01, + "lyapunov": 2.2619833738907524, + "grad_norm": 0.08850586212515105, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 81.51062154769897 + }, + { + "epoch": 138, + "train_loss": 6.278728715362549, + "train_acc": 0.0095, + "test_loss": 4.605170520019532, + "test_acc": 0.01, + "lyapunov": 2.2618095082090335, + "grad_norm": 0.08731291361885624, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 81.48903918266296 + }, + { + "epoch": 139, + "train_loss": 6.279946011657715, + "train_acc": 0.00924, + "test_loss": 4.605169985198975, + "test_acc": 0.01, + "lyapunov": 2.262684661104246, + "grad_norm": 0.08830501755378455, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 81.50976133346558 + }, + { + "epoch": 140, + "train_loss": 6.2800713043212895, + "train_acc": 0.0093, + "test_loss": 4.605170336914062, + "test_acc": 0.01, + "lyapunov": 2.2627302271020993, + "grad_norm": 0.08760865122091131, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 81.47953510284424 + }, + { + "epoch": 141, + "train_loss": 6.280382924652099, + "train_acc": 0.00976, + "test_loss": 4.605170390319824, + "test_acc": 0.01, + "lyapunov": 2.262962554116993, + "grad_norm": 0.08731546735423716, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 81.50757503509521 + }, + { + "epoch": 142, + "train_loss": 6.280370573883057, + "train_acc": 0.00936, + "test_loss": 4.605170272064209, + "test_acc": 0.01, + "lyapunov": 2.262975048226164, + "grad_norm": 0.08839664162758272, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 81.70762014389038 + }, + { + "epoch": 143, + "train_loss": 6.278507639923096, + "train_acc": 0.0095, + "test_loss": 4.6051704162597655, + "test_acc": 0.01, + "lyapunov": 2.261611500054674, + "grad_norm": 0.08694971985774991, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 81.48127150535583 + }, + { + "epoch": 144, + "train_loss": 6.281042174987793, + "train_acc": 0.00942, + "test_loss": 4.605170404815674, + "test_acc": 0.01, + "lyapunov": 2.263450643290644, + "grad_norm": 0.0881830241474449, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 81.58690285682678 + }, + { + "epoch": 145, + "train_loss": 6.278796115875244, + "train_acc": 0.01, + "test_loss": 4.605169946289062, + "test_acc": 0.01, + "lyapunov": 2.2618483887304124, + "grad_norm": 0.08774085138052039, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 81.47702813148499 + }, + { + "epoch": 146, + "train_loss": 6.28765030166626, + "train_acc": 0.01, + "test_loss": 4.605170179748535, + "test_acc": 0.01, + "lyapunov": 2.266257317169853, + "grad_norm": 0.0926994360583192, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 81.53279685974121 + }, + { + "epoch": 147, + "train_loss": 6.28031106124878, + "train_acc": 0.01, + "test_loss": 4.605170380401612, + "test_acc": 0.01, + "lyapunov": 2.2628798844564297, + "grad_norm": 0.08793782485118157, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 81.48903107643127 + }, + { + "epoch": 148, + "train_loss": 6.280096773681641, + "train_acc": 0.01, + "test_loss": 4.605170349884033, + "test_acc": 0.01, + "lyapunov": 2.2627320112779623, + "grad_norm": 0.08818349122842602, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 81.4692907333374 + }, + { + "epoch": 149, + "train_loss": 6.281090885467529, + "train_acc": 0.01, + "test_loss": 4.605170343017578, + "test_acc": 0.01, + "lyapunov": 2.263427186195198, + "grad_norm": 0.0872012744277379, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 81.53167700767517 + }, + { + "epoch": 150, + "train_loss": 6.279137640380859, + "train_acc": 0.01, + "test_loss": 4.605170111083984, + "test_acc": 0.01, + "lyapunov": 2.262077055318886, + "grad_norm": 0.08725575780836431, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 81.56354284286499 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 12.888672213134766, + "train_acc": 0.0157, + "test_loss": 4.668669903564453, + "test_acc": 0.0113, + "lyapunov": 4.721897013656928, + "grad_norm": 6.113449849588324, + "grad_max_sv": 4.916350275278091, + "grad_min_sv": 9.121745356832633e-08, + "grad_condition": 85604761.14095068, + "lr": 0.0009998903417374227, + "time_sec": 124.4171769618988 + }, + { + "epoch": 2, + "train_loss": 8.873665056762695, + "train_acc": 0.0172, + "test_loss": 4.618728218078613, + "test_acc": 0.0106, + "lyapunov": 3.5643789152355145, + "grad_norm": 4.270033727895912, + "grad_max_sv": 3.703069430589676, + "grad_min_sv": 4.972798216271515e-08, + "grad_condition": 4407702901.858317, + "lr": 0.0009995614150494292, + "time_sec": 124.48686790466309 + }, + { + "epoch": 3, + "train_loss": 8.600334560241699, + "train_acc": 0.01782, + "test_loss": 4.650051962280274, + "test_acc": 0.01, + "lyapunov": 3.4914282776815506, + "grad_norm": 3.3926839865294114, + "grad_max_sv": 2.9882367312908173, + "grad_min_sv": 1.3234509199243523e-08, + "grad_condition": 54857460231.037346, + "lr": 0.0009990133642141358, + "time_sec": 124.54058074951172 + }, + { + "epoch": 4, + "train_loss": 8.263027096862793, + "train_acc": 0.01714, + "test_loss": 4.599512353515625, + "test_acc": 0.0105, + "lyapunov": 3.3760591937452937, + "grad_norm": 2.278902599299841, + "grad_max_sv": 1.9339918196201324, + "grad_min_sv": 2.3884921456027857e-10, + "grad_condition": 107255985296.78781, + "lr": 0.0009982464296247522, + "time_sec": 124.56976628303528 + }, + { + "epoch": 5, + "train_loss": 8.014010938720704, + "train_acc": 0.01496, + "test_loss": 4.616816136169434, + "test_acc": 0.01, + "lyapunov": 3.2668096848461023, + "grad_norm": 1.8273408452911775, + "grad_max_sv": 1.1145809442189922, + "grad_min_sv": 1.2368932906215386e-11, + "grad_condition": 320257530150.4256, + "lr": 0.0009972609476841367, + "time_sec": 124.43335103988647 + }, + { + "epoch": 6, + "train_loss": 7.492105539398193, + "train_acc": 0.01378, + "test_loss": 4.617157006835938, + "test_acc": 0.01, + "lyapunov": 2.993205757702098, + "grad_norm": 1.155205925820389, + "grad_max_sv": 0.8030500062418355, + "grad_min_sv": 1.9935007673619705e-12, + "grad_condition": 394942710887.2484, + "lr": 0.000996057350657239, + "time_sec": 124.40957427024841 + }, + { + "epoch": 7, + "train_loss": 7.546499238586426, + "train_acc": 0.01474, + "test_loss": 4.614982270812988, + "test_acc": 0.01, + "lyapunov": 3.0089273160071017, + "grad_norm": 2.2107120727107343, + "grad_max_sv": 0.5263522088527679, + "grad_min_sv": 2.339208170494913e-12, + "grad_condition": 228093595550.92413, + "lr": 0.000994636166481494, + "time_sec": 124.44238233566284 + }, + { + "epoch": 8, + "train_loss": 7.431590474243164, + "train_acc": 0.01458, + "test_loss": 4.613349987792969, + "test_acc": 0.01, + "lyapunov": 2.9677638501462424, + "grad_norm": 1.4698803730862553, + "grad_max_sv": 0.3683710671344215, + "grad_min_sv": 1.0445961128587334e-12, + "grad_condition": 222600534264.8287, + "lr": 0.0009929980185352525, + "time_sec": 124.46612310409546 + }, + { + "epoch": 9, + "train_loss": 7.177635037078858, + "train_acc": 0.01324, + "test_loss": 4.612429743957519, + "test_acc": 0.01, + "lyapunov": 2.8310226979463, + "grad_norm": 1.4861384451742359, + "grad_max_sv": 0.32697355831472236, + "grad_min_sv": 7.011187907653872e-13, + "grad_condition": 236887025983.79956, + "lr": 0.0009911436253643444, + "time_sec": 124.47700262069702 + }, + { + "epoch": 10, + "train_loss": 7.269148045806885, + "train_acc": 0.01266, + "test_loss": 4.60582406539917, + "test_acc": 0.01, + "lyapunov": 2.8725382824383123, + "grad_norm": 2.342581709783361, + "grad_max_sv": 0.25737013639882206, + "grad_min_sv": 2.152763686233954e-13, + "grad_condition": 237339662745.88754, + "lr": 0.0009890738003669028, + "time_sec": 124.34593343734741 + }, + { + "epoch": 11, + "train_loss": 7.854859015350342, + "train_acc": 0.0135, + "test_loss": 4.610336604309082, + "test_acc": 0.01, + "lyapunov": 3.174172605699895, + "grad_norm": 2.7187327990789893, + "grad_max_sv": 0.20388649497181177, + "grad_min_sv": 8.088439153332857e-14, + "grad_condition": 191904183934.97748, + "lr": 0.00098678945143658, + "time_sec": 124.38984727859497 + }, + { + "epoch": 12, + "train_loss": 7.352457761230469, + "train_acc": 0.01424, + "test_loss": 4.6108569480896, + "test_acc": 0.01, + "lyapunov": 2.9249625279165596, + "grad_norm": 1.4927365138413504, + "grad_max_sv": 0.19409580584615468, + "grad_min_sv": 6.321730296975161e-14, + "grad_condition": 185278377907.65347, + "lr": 0.0009842915805643154, + "time_sec": 124.45291423797607 + }, + { + "epoch": 13, + "train_loss": 7.126369653930664, + "train_acc": 0.0127, + "test_loss": 4.606200820922852, + "test_acc": 0.01, + "lyapunov": 2.7892982831696416, + "grad_norm": 1.5745132805186597, + "grad_max_sv": 0.16401691318606026, + "grad_min_sv": 1.1404081781040362e-15, + "grad_condition": 163820543107.00018, + "lr": 0.000981581283398829, + "time_sec": 124.47300815582275 + }, + { + "epoch": 14, + "train_loss": 6.9970923039245605, + "train_acc": 0.0119, + "test_loss": 4.606117165374756, + "test_acc": 0.01, + "lyapunov": 2.7211814384021418, + "grad_norm": 0.8580084847133529, + "grad_max_sv": 0.13348757792264224, + "grad_min_sv": 3.507279862736168e-28, + "grad_condition": 133487577922.64218, + "lr": 0.0009786597487660333, + "time_sec": 124.41379904747009 + }, + { + "epoch": 15, + "train_loss": 7.052154786376953, + "train_acc": 0.0117, + "test_loss": 4.606044427490234, + "test_acc": 0.01, + "lyapunov": 2.753269191288277, + "grad_norm": 1.006394199833171, + "grad_max_sv": 0.12816582168452442, + "grad_min_sv": 4.518028483603919e-34, + "grad_condition": 128165821684.52441, + "lr": 0.0009755282581475766, + "time_sec": 124.34007215499878 + }, + { + "epoch": 16, + "train_loss": 7.258110624084472, + "train_acc": 0.0109, + "test_loss": 4.605929005432129, + "test_acc": 0.01, + "lyapunov": 2.862082756998594, + "grad_norm": 1.1482559574218805, + "grad_max_sv": 0.10950499838218093, + "grad_min_sv": 3.564320494794489e-35, + "grad_condition": 109504998382.18094, + "lr": 0.0009721881851187403, + "time_sec": 124.38707971572876 + }, + { + "epoch": 17, + "train_loss": 6.873683618774414, + "train_acc": 0.00996, + "test_loss": 4.61062957611084, + "test_acc": 0.01, + "lyapunov": 2.641120981377409, + "grad_norm": 2.0808485430057084, + "grad_max_sv": 0.05978809341322631, + "grad_min_sv": 2.4522723125684297e-46, + "grad_condition": 59788093413.2263, + "lr": 0.0009686409947459456, + "time_sec": 124.47280597686768 + }, + { + "epoch": 18, + "train_loss": 7.016553334655762, + "train_acc": 0.01398, + "test_loss": 4.622579546356201, + "test_acc": 0.01, + "lyapunov": 2.728775659180663, + "grad_norm": 1.2800257190104987, + "grad_max_sv": 0.1043331983499229, + "grad_min_sv": 3.1060564013215523e-18, + "grad_condition": 104332858891.6054, + "lr": 0.0009648882429441254, + "time_sec": 124.54543328285217 + }, + { + "epoch": 19, + "train_loss": 6.869653914642334, + "train_acc": 0.01194, + "test_loss": 4.643599758911133, + "test_acc": 0.01, + "lyapunov": 2.638523844501856, + "grad_norm": 0.5641956497166879, + "grad_max_sv": 0.06742433752388025, + "grad_min_sv": 9.779701625669289e-16, + "grad_condition": 67360221904.04246, + "lr": 0.00096093157579425, + "time_sec": 124.44028401374817 + }, + { + "epoch": 20, + "train_loss": 6.866667858276367, + "train_acc": 0.0096, + "test_loss": 4.634420860290527, + "test_acc": 0.01, + "lyapunov": 2.628649781731998, + "grad_norm": 0.5455051217507713, + "grad_max_sv": 0.028104651859030126, + "grad_min_sv": 0.0, + "grad_condition": 28104651859.03013, + "lr": 0.0009567727288213001, + "time_sec": 124.34887290000916 + }, + { + "epoch": 21, + "train_loss": 6.825957579650879, + "train_acc": 0.00936, + "test_loss": 4.642799243164062, + "test_acc": 0.01, + "lyapunov": 2.607143042337559, + "grad_norm": 0.5228902482624009, + "grad_max_sv": 0.029772339016199113, + "grad_min_sv": 0.0, + "grad_condition": 29772339016.19911, + "lr": 0.0009524135262330095, + "time_sec": 124.38223886489868 + }, + { + "epoch": 22, + "train_loss": 6.60694779296875, + "train_acc": 0.00934, + "test_loss": 4.642452531433105, + "test_acc": 0.01, + "lyapunov": 2.4819612728665246, + "grad_norm": 0.5929983668433683, + "grad_max_sv": 0.028571362840011716, + "grad_min_sv": 0.0, + "grad_condition": 28571362840.01172, + "lr": 0.0009478558801197061, + "time_sec": 124.46409487724304 + }, + { + "epoch": 23, + "train_loss": 6.587394898986816, + "train_acc": 0.00922, + "test_loss": 4.642014373779297, + "test_acc": 0.01, + "lyapunov": 2.46996273287117, + "grad_norm": 0.5937371167405978, + "grad_max_sv": 0.027252211095765234, + "grad_min_sv": 0.0, + "grad_condition": 27252211095.765236, + "lr": 0.000943101789615607, + "time_sec": 124.41273093223572 + }, + { + "epoch": 24, + "train_loss": 6.5855675335693356, + "train_acc": 0.00944, + "test_loss": 4.629414208984375, + "test_acc": 0.01, + "lyapunov": 2.468693129546807, + "grad_norm": 0.5173238649422355, + "grad_max_sv": 0.026766624441370367, + "grad_min_sv": 0.0, + "grad_condition": 26766624441.37037, + "lr": 0.0009381533400219313, + "time_sec": 124.34699821472168 + }, + { + "epoch": 25, + "train_loss": 6.599731462860108, + "train_acc": 0.00936, + "test_loss": 4.6412096755981445, + "test_acc": 0.01, + "lyapunov": 2.476690198454406, + "grad_norm": 0.5699426578758121, + "grad_max_sv": 0.025352103635668755, + "grad_min_sv": 0.0, + "grad_condition": 25352103635.668755, + "lr": 0.0009330127018922189, + "time_sec": 124.3536787033081 + }, + { + "epoch": 26, + "train_loss": 6.5942790597534175, + "train_acc": 0.00964, + "test_loss": 4.640745770263672, + "test_acc": 0.01, + "lyapunov": 2.4741494673902116, + "grad_norm": 0.546145353806512, + "grad_max_sv": 0.021123076300136746, + "grad_min_sv": 0.0, + "grad_condition": 21123076300.136745, + "lr": 0.000927682130080253, + "time_sec": 124.4051742553711 + }, + { + "epoch": 27, + "train_loss": 6.6229908557128905, + "train_acc": 0.00888, + "test_loss": 4.605336713409423, + "test_acc": 0.01, + "lyapunov": 2.4850437781390022, + "grad_norm": 0.6663677646075784, + "grad_max_sv": 0.011104274867102503, + "grad_min_sv": 0.0, + "grad_condition": 11104274867.102505, + "lr": 0.0009221639627510072, + "time_sec": 124.44045972824097 + }, + { + "epoch": 28, + "train_loss": 6.597202638854981, + "train_acc": 0.00916, + "test_loss": 4.605269973754883, + "test_acc": 0.01, + "lyapunov": 2.4748127710483874, + "grad_norm": 0.6602347286377247, + "grad_max_sv": 0.005200258875265718, + "grad_min_sv": 0.0, + "grad_condition": 5200258875.2657175, + "lr": 0.0009164606203550494, + "time_sec": 124.41216611862183 + }, + { + "epoch": 29, + "train_loss": 6.5781180551147465, + "train_acc": 0.00896, + "test_loss": 4.605207743072509, + "test_acc": 0.01, + "lyapunov": 2.463899161809546, + "grad_norm": 0.16963115020621336, + "grad_max_sv": 0.0064356182236224415, + "grad_min_sv": 0.0, + "grad_condition": 6435618223.622441, + "lr": 0.0009105746045668516, + "time_sec": 124.52706933021545 + }, + { + "epoch": 30, + "train_loss": 6.580226347045898, + "train_acc": 0.00922, + "test_loss": 4.605211033630371, + "test_acc": 0.01, + "lyapunov": 2.4648621435970295, + "grad_norm": 0.14897426222581245, + "grad_max_sv": 0.006681703682988882, + "grad_min_sv": 0.0, + "grad_condition": 6681703682.988882, + "lr": 0.0009045084971874733, + "time_sec": 124.31314778327942 + }, + { + "epoch": 31, + "train_loss": 6.580346279144287, + "train_acc": 0.00906, + "test_loss": 4.605202531433106, + "test_acc": 0.01, + "lyapunov": 2.4647859356287496, + "grad_norm": 0.13651802704858546, + "grad_max_sv": 0.0033354544546455147, + "grad_min_sv": 0.0, + "grad_condition": 3335454454.6455145, + "lr": 0.0008982649590120977, + "time_sec": 124.37081241607666 + }, + { + "epoch": 32, + "train_loss": 6.5977811730957034, + "train_acc": 0.00854, + "test_loss": 4.605187432861328, + "test_acc": 0.01, + "lyapunov": 2.4727761562523023, + "grad_norm": 0.12974748253445384, + "grad_max_sv": 0.002326939906924963, + "grad_min_sv": 0.0, + "grad_condition": 2326939906.924963, + "lr": 0.0008918467286629196, + "time_sec": 124.42768621444702 + }, + { + "epoch": 33, + "train_loss": 6.574522008514404, + "train_acc": 0.00888, + "test_loss": 4.60518201751709, + "test_acc": 0.01, + "lyapunov": 2.461720284903446, + "grad_norm": 0.10990146900045704, + "grad_max_sv": 0.0026134482119232415, + "grad_min_sv": 0.0, + "grad_condition": 2613448211.9232416, + "lr": 0.0008852566213878943, + "time_sec": 124.36949467658997 + }, + { + "epoch": 34, + "train_loss": 6.577264302215577, + "train_acc": 0.0092, + "test_loss": 4.605177014923096, + "test_acc": 0.01, + "lyapunov": 2.463475263941928, + "grad_norm": 0.12976444128871847, + "grad_max_sv": 0.0009734443388879299, + "grad_min_sv": 0.0, + "grad_condition": 973444338.8879299, + "lr": 0.000878497527825878, + "time_sec": 124.3325207233429 + }, + { + "epoch": 35, + "train_loss": 6.587216622314453, + "train_acc": 0.00888, + "test_loss": 4.636661901855469, + "test_acc": 0.01, + "lyapunov": 2.4681083863348605, + "grad_norm": 0.13220591916165889, + "grad_max_sv": 0.00457856860011816, + "grad_min_sv": 0.0, + "grad_condition": 4578568600.118161, + "lr": 0.000871572412738697, + "time_sec": 124.3110682964325 + }, + { + "epoch": 36, + "train_loss": 6.592979219360352, + "train_acc": 0.0092, + "test_loss": 4.6051753067016605, + "test_acc": 0.01, + "lyapunov": 2.4714617686503377, + "grad_norm": 0.1239857838330967, + "grad_max_sv": 0.0005948701407760381, + "grad_min_sv": 0.0, + "grad_condition": 594870140.7760382, + "lr": 0.0008644843137107055, + "time_sec": 124.4406750202179 + }, + { + "epoch": 37, + "train_loss": 6.613644898376465, + "train_acc": 0.00858, + "test_loss": 4.605174197387695, + "test_acc": 0.01, + "lyapunov": 2.48187786294981, + "grad_norm": 0.18028613006863556, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008572363398164014, + "time_sec": 124.42482614517212 + }, + { + "epoch": 38, + "train_loss": 6.598032460021972, + "train_acc": 0.00866, + "test_loss": 4.605173423004151, + "test_acc": 0.01, + "lyapunov": 2.4748510588770327, + "grad_norm": 0.17702039657703328, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008498316702566826, + "time_sec": 124.38127946853638 + }, + { + "epoch": 39, + "train_loss": 6.595033478546142, + "train_acc": 0.00904, + "test_loss": 4.605172880554199, + "test_acc": 0.01, + "lyapunov": 2.4724140514803055, + "grad_norm": 0.1406852681746766, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008422735529643442, + "time_sec": 124.27310037612915 + }, + { + "epoch": 40, + "train_loss": 6.607061416625976, + "train_acc": 0.00882, + "test_loss": 4.605173010253906, + "test_acc": 0.01, + "lyapunov": 2.4797774525859473, + "grad_norm": 0.1602364870035822, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008345653031794289, + "time_sec": 124.35175013542175 + }, + { + "epoch": 41, + "train_loss": 6.652051022644043, + "train_acc": 0.00868, + "test_loss": 4.60517377319336, + "test_acc": 0.01, + "lyapunov": 2.494590156218585, + "grad_norm": 0.1877202250366353, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008267103019950526, + "time_sec": 124.42674827575684 + }, + { + "epoch": 42, + "train_loss": 6.609013889770508, + "train_acc": 0.00818, + "test_loss": 4.60517264328003, + "test_acc": 0.01, + "lyapunov": 2.4807275219646563, + "grad_norm": 0.19291631462520265, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743447, + "time_sec": 124.38730263710022 + }, + { + "epoch": 43, + "train_loss": 6.573144034423828, + "train_acc": 0.0082, + "test_loss": 4.6051730613708495, + "test_acc": 0.01, + "lyapunov": 2.4609296730412242, + "grad_norm": 0.09628320238477034, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000810573890139155, + "time_sec": 124.36512160301208 + }, + { + "epoch": 44, + "train_loss": 6.575241811828613, + "train_acc": 0.00884, + "test_loss": 4.605172496032715, + "test_acc": 0.01, + "lyapunov": 2.462244158205779, + "grad_norm": 0.10484293099591814, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008022995574311873, + "time_sec": 124.30067491531372 + }, + { + "epoch": 45, + "train_loss": 6.594184577026367, + "train_acc": 0.00936, + "test_loss": 4.605172833251953, + "test_acc": 0.01, + "lyapunov": 2.4732542019670882, + "grad_norm": 0.16310890352013555, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007938926261462363, + "time_sec": 124.42177891731262 + }, + { + "epoch": 46, + "train_loss": 6.577082351989746, + "train_acc": 0.00882, + "test_loss": 4.605172598266601, + "test_acc": 0.01, + "lyapunov": 2.463544076665893, + "grad_norm": 0.10037821136236143, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007853567838422158, + "time_sec": 124.40465664863586 + }, + { + "epoch": 47, + "train_loss": 6.5774040518188475, + "train_acc": 0.00862, + "test_loss": 4.605172250366211, + "test_acc": 0.01, + "lyapunov": 2.4635354655478006, + "grad_norm": 0.1162215297313361, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007766957746216719, + "time_sec": 124.41038012504578 + }, + { + "epoch": 48, + "train_loss": 6.6083132769775395, + "train_acc": 0.0086, + "test_loss": 4.605171835327148, + "test_acc": 0.01, + "lyapunov": 2.4782137511026523, + "grad_norm": 0.17135162198913576, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894982, + "time_sec": 124.31084632873535 + }, + { + "epoch": 49, + "train_loss": 6.604438779449463, + "train_acc": 0.0088, + "test_loss": 4.60517212600708, + "test_acc": 0.01, + "lyapunov": 2.478019986311188, + "grad_norm": 0.16895443836343932, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000759013504686565, + "time_sec": 124.28308844566345 + }, + { + "epoch": 50, + "train_loss": 6.588782655029297, + "train_acc": 0.00888, + "test_loss": 4.605172025299073, + "test_acc": 0.01, + "lyapunov": 2.470017822197331, + "grad_norm": 0.12889442183383476, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007499999999999998, + "time_sec": 124.42897295951843 + }, + { + "epoch": 51, + "train_loss": 6.601284326782227, + "train_acc": 0.00796, + "test_loss": 4.6051717948913575, + "test_acc": 0.01, + "lyapunov": 2.4773334834886636, + "grad_norm": 0.17649093442856895, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007408768370508575, + "time_sec": 124.39905118942261 + }, + { + "epoch": 52, + "train_loss": 6.575957306518554, + "train_acc": 0.00918, + "test_loss": 4.6051720420837405, + "test_acc": 0.01, + "lyapunov": 2.46280481565334, + "grad_norm": 0.0968044467412458, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007316480175599307, + "time_sec": 124.42980766296387 + }, + { + "epoch": 53, + "train_loss": 6.587701625518799, + "train_acc": 0.00872, + "test_loss": 4.6051725509643555, + "test_acc": 0.01, + "lyapunov": 2.4698515999347657, + "grad_norm": 0.13994770283254052, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007223175895924635, + "time_sec": 124.28514337539673 + }, + { + "epoch": 54, + "train_loss": 6.578931684265137, + "train_acc": 0.00938, + "test_loss": 4.605171647644043, + "test_acc": 0.01, + "lyapunov": 2.464453091097, + "grad_norm": 0.104587329873943, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825361, + "time_sec": 124.3464949131012 + }, + { + "epoch": 55, + "train_loss": 6.610985378723145, + "train_acc": 0.00822, + "test_loss": 4.605172131347656, + "test_acc": 0.01, + "lyapunov": 2.4811968675354863, + "grad_norm": 0.23664084539084446, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007033683215378998, + "time_sec": 124.3919792175293 + }, + { + "epoch": 56, + "train_loss": 6.577887360839844, + "train_acc": 0.0089, + "test_loss": 4.605171892547608, + "test_acc": 0.01, + "lyapunov": 2.4638065877168076, + "grad_norm": 0.12418210732155195, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006937577932260512, + "time_sec": 124.42023730278015 + }, + { + "epoch": 57, + "train_loss": 6.575769240722656, + "train_acc": 0.00934, + "test_loss": 4.605171751403809, + "test_acc": 0.01, + "lyapunov": 2.4626593559294405, + "grad_norm": 0.08871385738467265, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423388, + "time_sec": 124.39303755760193 + }, + { + "epoch": 58, + "train_loss": 6.649054284973144, + "train_acc": 0.00788, + "test_loss": 4.6051721786499025, + "test_acc": 0.01, + "lyapunov": 2.4995590183131227, + "grad_norm": 0.26439944389263503, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006742860236609073, + "time_sec": 124.30309414863586 + }, + { + "epoch": 59, + "train_loss": 6.620378266906738, + "train_acc": 0.0087, + "test_loss": 4.605171722412109, + "test_acc": 0.01, + "lyapunov": 2.4861825994213524, + "grad_norm": 0.2011814553286534, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006644333233692913, + "time_sec": 124.40799474716187 + }, + { + "epoch": 60, + "train_loss": 6.615863608703613, + "train_acc": 0.00898, + "test_loss": 4.605171568298339, + "test_acc": 0.01, + "lyapunov": 2.4820322356260647, + "grad_norm": 0.16244295400836278, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874734, + "time_sec": 124.44055390357971 + }, + { + "epoch": 61, + "train_loss": 6.62539726638794, + "train_acc": 0.00854, + "test_loss": 4.605171578979492, + "test_acc": 0.01, + "lyapunov": 2.4873651598420596, + "grad_norm": 0.18579251012972714, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006445158984722354, + "time_sec": 124.47138166427612 + }, + { + "epoch": 62, + "train_loss": 6.591934550476074, + "train_acc": 0.00868, + "test_loss": 4.605171854400635, + "test_acc": 0.01, + "lyapunov": 2.471130254018642, + "grad_norm": 0.14241384092347348, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006344599103076324, + "time_sec": 124.35206151008606 + }, + { + "epoch": 63, + "train_loss": 6.607412483825684, + "train_acc": 0.00866, + "test_loss": 4.605171817779541, + "test_acc": 0.01, + "lyapunov": 2.4772931200159176, + "grad_norm": 0.12000050103102612, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824269, + "time_sec": 124.31255435943604 + }, + { + "epoch": 64, + "train_loss": 6.574604081420898, + "train_acc": 0.0084, + "test_loss": 4.60517174911499, + "test_acc": 0.01, + "lyapunov": 2.461947503297225, + "grad_norm": 0.11837720061951122, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006141754350553275, + "time_sec": 124.42598223686218 + }, + { + "epoch": 65, + "train_loss": 6.669198082733154, + "train_acc": 0.00846, + "test_loss": 4.605171404266358, + "test_acc": 0.01, + "lyapunov": 2.50827671865673, + "grad_norm": 0.3654068480597362, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006039558454088793, + "time_sec": 124.41292977333069 + }, + { + "epoch": 66, + "train_loss": 6.576071541442871, + "train_acc": 0.00868, + "test_loss": 4.60517176437378, + "test_acc": 0.01, + "lyapunov": 2.462862340995418, + "grad_norm": 0.0924056370989614, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000593690657292862, + "time_sec": 124.44835186004639 + }, + { + "epoch": 67, + "train_loss": 6.623493032073974, + "train_acc": 0.00798, + "test_loss": 4.605171159362793, + "test_acc": 0.01, + "lyapunov": 2.4856161059016157, + "grad_norm": 0.23515698863564433, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005833843733580507, + "time_sec": 124.32646751403809 + }, + { + "epoch": 68, + "train_loss": 6.58642106048584, + "train_acc": 0.00814, + "test_loss": 4.605171382141113, + "test_acc": 0.01, + "lyapunov": 2.4687487658332374, + "grad_norm": 0.10028160631921758, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005730415142812054, + "time_sec": 124.34812188148499 + }, + { + "epoch": 69, + "train_loss": 6.612601704254151, + "train_acc": 0.00846, + "test_loss": 4.605171432495117, + "test_acc": 0.01, + "lyapunov": 2.478518716514568, + "grad_norm": 0.16428393693339724, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821517, + "time_sec": 124.40169882774353 + }, + { + "epoch": 70, + "train_loss": 6.594199375915528, + "train_acc": 0.0078, + "test_loss": 4.605171556854248, + "test_acc": 0.01, + "lyapunov": 2.4733456675048986, + "grad_norm": 0.13222269600542105, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005522642316338265, + "time_sec": 124.43159890174866 + }, + { + "epoch": 71, + "train_loss": 6.584797274169921, + "train_acc": 0.00884, + "test_loss": 4.605171443176269, + "test_acc": 0.01, + "lyapunov": 2.468046905439528, + "grad_norm": 0.09698860702372256, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005418389216661573, + "time_sec": 124.38395667076111 + }, + { + "epoch": 72, + "train_loss": 6.62336443145752, + "train_acc": 0.00826, + "test_loss": 4.60517096862793, + "test_acc": 0.01, + "lyapunov": 2.486185181171388, + "grad_norm": 0.20758922397897858, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646563, + "time_sec": 124.28166174888611 + }, + { + "epoch": 73, + "train_loss": 6.624484212188721, + "train_acc": 0.00906, + "test_loss": 4.6051707977294924, + "test_acc": 0.01, + "lyapunov": 2.487110945879651, + "grad_norm": 0.19977656643109526, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005209378268645994, + "time_sec": 124.35272693634033 + }, + { + "epoch": 74, + "train_loss": 6.603300393676758, + "train_acc": 0.0091, + "test_loss": 4.605170932006836, + "test_acc": 0.01, + "lyapunov": 2.477061335083164, + "grad_norm": 0.16600248799904951, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005104712099416781, + "time_sec": 124.40994596481323 + }, + { + "epoch": 75, + "train_loss": 6.5982538143920895, + "train_acc": 0.00856, + "test_loss": 4.605171234130859, + "test_acc": 0.01, + "lyapunov": 2.473140881799371, + "grad_norm": 0.16128953646649988, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004999999999999996, + "time_sec": 124.43308448791504 + }, + { + "epoch": 76, + "train_loss": 6.592834194946289, + "train_acc": 0.00854, + "test_loss": 4.605171026611328, + "test_acc": 0.01, + "lyapunov": 2.47263060750254, + "grad_norm": 0.1340374980962284, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004895287900583212, + "time_sec": 124.34016180038452 + }, + { + "epoch": 77, + "train_loss": 6.584505953979492, + "train_acc": 0.00864, + "test_loss": 4.605171239471436, + "test_acc": 0.01, + "lyapunov": 2.4676697760286843, + "grad_norm": 0.11435356827937113, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004790621731353997, + "time_sec": 124.3169755935669 + }, + { + "epoch": 78, + "train_loss": 6.5763300253295895, + "train_acc": 0.00884, + "test_loss": 4.6051710525512695, + "test_acc": 0.01, + "lyapunov": 2.4630901801311755, + "grad_norm": 0.08961847488711042, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000468604740235343, + "time_sec": 124.3459620475769 + }, + { + "epoch": 79, + "train_loss": 6.575958716125489, + "train_acc": 0.00932, + "test_loss": 4.605170614624023, + "test_acc": 0.01, + "lyapunov": 2.462890618902338, + "grad_norm": 0.0894392700212742, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00045816107833384175, + "time_sec": 124.39721941947937 + }, + { + "epoch": 80, + "train_loss": 6.57727864440918, + "train_acc": 0.00828, + "test_loss": 4.6051712982177735, + "test_acc": 0.01, + "lyapunov": 2.4634996923949104, + "grad_norm": 0.09357159928827649, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004477357683661729, + "time_sec": 124.43293237686157 + }, + { + "epoch": 81, + "train_loss": 6.576623619689942, + "train_acc": 0.00858, + "test_loss": 4.60517075958252, + "test_acc": 0.01, + "lyapunov": 2.4632719782612207, + "grad_norm": 0.08778044836554635, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784746, + "time_sec": 124.33877468109131 + }, + { + "epoch": 82, + "train_loss": 6.706115616912842, + "train_acc": 0.00852, + "test_loss": 4.60517084274292, + "test_acc": 0.01, + "lyapunov": 2.5237014750995295, + "grad_norm": 0.35892654821663944, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004269584857187939, + "time_sec": 124.33198618888855 + }, + { + "epoch": 83, + "train_loss": 6.693132893981933, + "train_acc": 0.00928, + "test_loss": 4.605170736694336, + "test_acc": 0.01, + "lyapunov": 2.5217734712468998, + "grad_norm": 0.37154817796859707, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004166156266419484, + "time_sec": 124.33878684043884 + }, + { + "epoch": 84, + "train_loss": 6.673238817443847, + "train_acc": 0.00904, + "test_loss": 4.605171113586426, + "test_acc": 0.01, + "lyapunov": 2.5138309251926745, + "grad_norm": 0.48242670306903057, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004063093427071373, + "time_sec": 124.42056584358215 + }, + { + "epoch": 85, + "train_loss": 6.597096472473145, + "train_acc": 0.0083, + "test_loss": 4.605170780181885, + "test_acc": 0.01, + "lyapunov": 2.4718706601720943, + "grad_norm": 0.13232535416814104, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003960441545911199, + "time_sec": 124.43193411827087 + }, + { + "epoch": 86, + "train_loss": 6.575025537414551, + "train_acc": 0.00834, + "test_loss": 4.6051709815979, + "test_acc": 0.01, + "lyapunov": 2.4622172730048293, + "grad_norm": 0.11156499374939659, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003858245649446718, + "time_sec": 124.34226822853088 + }, + { + "epoch": 87, + "train_loss": 6.573478553161621, + "train_acc": 0.00842, + "test_loss": 4.605170571899414, + "test_acc": 0.01, + "lyapunov": 2.4612386501048835, + "grad_norm": 0.09079297617092336, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00037565505641757235, + "time_sec": 124.27930355072021 + }, + { + "epoch": 88, + "train_loss": 6.5734689576721195, + "train_acc": 0.00854, + "test_loss": 4.605170808410644, + "test_acc": 0.01, + "lyapunov": 2.461263867595312, + "grad_norm": 0.09120456341783888, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036554008969236695, + "time_sec": 124.38532066345215 + }, + { + "epoch": 89, + "train_loss": 6.578163130187988, + "train_acc": 0.00852, + "test_loss": 4.605170602416992, + "test_acc": 0.01, + "lyapunov": 2.4642753814492386, + "grad_norm": 0.09559837141233972, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003554841015277638, + "time_sec": 124.44146919250488 + }, + { + "epoch": 90, + "train_loss": 6.5798112936401365, + "train_acc": 0.0083, + "test_loss": 4.605170631408692, + "test_acc": 0.01, + "lyapunov": 2.4649541908517825, + "grad_norm": 0.09735485237927284, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000345491502812526, + "time_sec": 124.39319109916687 + }, + { + "epoch": 91, + "train_loss": 6.574903171081543, + "train_acc": 0.0083, + "test_loss": 4.605170557403564, + "test_acc": 0.01, + "lyapunov": 2.4621782180903207, + "grad_norm": 0.08981548140002098, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003355666766307081, + "time_sec": 124.35036778450012 + }, + { + "epoch": 92, + "train_loss": 6.5757408012390135, + "train_acc": 0.00836, + "test_loss": 4.605170684814453, + "test_acc": 0.01, + "lyapunov": 2.4627471470162083, + "grad_norm": 0.08817445544280453, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00032571397633909225, + "time_sec": 124.33928322792053 + }, + { + "epoch": 93, + "train_loss": 6.612554905395508, + "train_acc": 0.00834, + "test_loss": 4.605170486450195, + "test_acc": 0.01, + "lyapunov": 2.4806297959574044, + "grad_norm": 0.1882025016044833, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766094, + "time_sec": 124.40910911560059 + }, + { + "epoch": 94, + "train_loss": 6.595741138000489, + "train_acc": 0.00806, + "test_loss": 4.60517061920166, + "test_acc": 0.01, + "lyapunov": 2.472626593411731, + "grad_norm": 0.16104566409905433, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003062422067739483, + "time_sec": 124.41845726966858 + }, + { + "epoch": 95, + "train_loss": 6.5987700848388675, + "train_acc": 0.0085, + "test_loss": 4.605170571899414, + "test_acc": 0.01, + "lyapunov": 2.4736888725739306, + "grad_norm": 0.1552458690168984, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00029663167846209965, + "time_sec": 124.34644985198975 + }, + { + "epoch": 96, + "train_loss": 6.597373901672364, + "train_acc": 0.00828, + "test_loss": 4.6051704193115235, + "test_acc": 0.01, + "lyapunov": 2.473390321902302, + "grad_norm": 0.1443472451352086, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00028711035421746345, + "time_sec": 124.32696723937988 + }, + { + "epoch": 97, + "train_loss": 6.590096541442871, + "train_acc": 0.00862, + "test_loss": 4.6051705436706545, + "test_acc": 0.01, + "lyapunov": 2.4693754414463287, + "grad_norm": 0.11035396630097889, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00027768241040753615, + "time_sec": 124.30454087257385 + }, + { + "epoch": 98, + "train_loss": 6.70725288696289, + "train_acc": 0.00854, + "test_loss": 4.605170336151123, + "test_acc": 0.01, + "lyapunov": 2.529677952037138, + "grad_norm": 0.5122066284498856, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00026835198244006903, + "time_sec": 124.31350612640381 + }, + { + "epoch": 99, + "train_loss": 6.575984575958252, + "train_acc": 0.0085, + "test_loss": 4.60517036895752, + "test_acc": 0.01, + "lyapunov": 2.462917518737676, + "grad_norm": 0.08798552577224787, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002591231629491421, + "time_sec": 124.33125352859497 + }, + { + "epoch": 100, + "train_loss": 6.575890505371094, + "train_acc": 0.00856, + "test_loss": 4.605170387268067, + "test_acc": 0.01, + "lyapunov": 2.462910512524188, + "grad_norm": 0.08984849200071802, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002499999999999997, + "time_sec": 124.41467308998108 + }, + { + "epoch": 101, + "train_loss": 6.5755246405029295, + "train_acc": 0.00866, + "test_loss": 4.605170295715332, + "test_acc": 0.01, + "lyapunov": 2.4626409702593715, + "grad_norm": 0.08833234367069784, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00024098649531343477, + "time_sec": 124.4282865524292 + }, + { + "epoch": 102, + "train_loss": 6.578647835388184, + "train_acc": 0.00874, + "test_loss": 4.60517028503418, + "test_acc": 0.01, + "lyapunov": 2.4644368957070744, + "grad_norm": 0.0881800871840224, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002320866025105016, + "time_sec": 124.39285898208618 + }, + { + "epoch": 103, + "train_loss": 6.603837554931641, + "train_acc": 0.0081, + "test_loss": 4.605170309448242, + "test_acc": 0.01, + "lyapunov": 2.475680511016065, + "grad_norm": 0.12862246002842495, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002233042253783278, + "time_sec": 124.30171847343445 + }, + { + "epoch": 104, + "train_loss": 6.589783010559082, + "train_acc": 0.0087, + "test_loss": 4.605170768737793, + "test_acc": 0.01, + "lyapunov": 2.469147738898197, + "grad_norm": 0.1132666503606524, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000214643216157784, + "time_sec": 124.33115792274475 + }, + { + "epoch": 105, + "train_loss": 6.607209113769532, + "train_acc": 0.00868, + "test_loss": 4.605170411682129, + "test_acc": 0.01, + "lyapunov": 2.4791276979324457, + "grad_norm": 0.19473222939710866, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376332, + "time_sec": 124.42748808860779 + }, + { + "epoch": 106, + "train_loss": 6.605109618988037, + "train_acc": 0.00876, + "test_loss": 4.605170632171631, + "test_acc": 0.01, + "lyapunov": 2.4781547934198014, + "grad_norm": 0.19321601949412123, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019770044256881242, + "time_sec": 124.40237879753113 + }, + { + "epoch": 107, + "train_loss": 6.5744285192871095, + "train_acc": 0.0084, + "test_loss": 4.605170581054687, + "test_acc": 0.01, + "lyapunov": 2.461912363081637, + "grad_norm": 0.09153624986240072, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001894261098608447, + "time_sec": 124.35668659210205 + }, + { + "epoch": 108, + "train_loss": 6.591736253662109, + "train_acc": 0.009, + "test_loss": 4.605170578002929, + "test_acc": 0.01, + "lyapunov": 2.469679483672237, + "grad_norm": 0.17005631477257033, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000181288005125655, + "time_sec": 124.29520559310913 + }, + { + "epoch": 109, + "train_loss": 6.618268890991211, + "train_acc": 0.00898, + "test_loss": 4.605170452880859, + "test_acc": 0.01, + "lyapunov": 2.4846892923955113, + "grad_norm": 0.22506407024101205, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001732896980049473, + "time_sec": 124.44524145126343 + }, + { + "epoch": 110, + "train_loss": 6.588956251525879, + "train_acc": 0.0079, + "test_loss": 4.605170387268067, + "test_acc": 0.01, + "lyapunov": 2.4697647594734837, + "grad_norm": 0.1497151598092074, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016543469682057076, + "time_sec": 124.427237033844 + }, + { + "epoch": 111, + "train_loss": 6.597999030761719, + "train_acc": 0.0082, + "test_loss": 4.605170532226563, + "test_acc": 0.01, + "lyapunov": 2.47352661866971, + "grad_norm": 0.1265460364033806, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 124.4067976474762 + }, + { + "epoch": 112, + "train_loss": 6.581220099945068, + "train_acc": 0.00878, + "test_loss": 4.605170124816895, + "test_acc": 0.01, + "lyapunov": 2.466078118595016, + "grad_norm": 0.1166543211179088, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 124.3555097579956 + }, + { + "epoch": 113, + "train_loss": 6.5873154238891605, + "train_acc": 0.00902, + "test_loss": 4.605170477294922, + "test_acc": 0.01, + "lyapunov": 2.467848820454629, + "grad_norm": 0.11336040865405435, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 124.34751081466675 + }, + { + "epoch": 114, + "train_loss": 6.575267355041504, + "train_acc": 0.00892, + "test_loss": 4.60517041015625, + "test_acc": 0.01, + "lyapunov": 2.4624666978636056, + "grad_norm": 0.0882429459696398, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00013551568628929425, + "time_sec": 124.43968343734741 + }, + { + "epoch": 115, + "train_loss": 6.575747386169434, + "train_acc": 0.0087, + "test_loss": 4.60517027130127, + "test_acc": 0.01, + "lyapunov": 2.46279121481854, + "grad_norm": 0.08906865623909292, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 124.40401101112366 + }, + { + "epoch": 116, + "train_loss": 6.574066097106933, + "train_acc": 0.00888, + "test_loss": 4.605170015716553, + "test_acc": 0.01, + "lyapunov": 2.4617425267348816, + "grad_norm": 0.09299280580563789, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 124.43384170532227 + }, + { + "epoch": 117, + "train_loss": 6.575292884674072, + "train_acc": 0.00916, + "test_loss": 4.605170446777343, + "test_acc": 0.01, + "lyapunov": 2.462491541567361, + "grad_norm": 0.08789900440919356, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 124.31648087501526 + }, + { + "epoch": 118, + "train_loss": 6.578267410125733, + "train_acc": 0.00826, + "test_loss": 4.605170466613769, + "test_acc": 0.01, + "lyapunov": 2.4644045262690395, + "grad_norm": 0.10415607883931481, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010815327133708009, + "time_sec": 124.33564472198486 + }, + { + "epoch": 119, + "train_loss": 6.574555395050049, + "train_acc": 0.00854, + "test_loss": 4.605170401000977, + "test_acc": 0.01, + "lyapunov": 2.4620885909975643, + "grad_norm": 0.08778921241218508, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010173504098790182, + "time_sec": 124.65056228637695 + }, + { + "epoch": 120, + "train_loss": 6.583910481872558, + "train_acc": 0.00864, + "test_loss": 4.605170470428467, + "test_acc": 0.01, + "lyapunov": 2.467699810671989, + "grad_norm": 0.3040678237626765, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 124.44140434265137 + }, + { + "epoch": 121, + "train_loss": 6.586020791015625, + "train_acc": 0.00884, + "test_loss": 4.605170375823975, + "test_acc": 0.01, + "lyapunov": 2.467914994720303, + "grad_norm": 0.11635906922176238, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 124.43893909454346 + }, + { + "epoch": 122, + "train_loss": 6.576034954528809, + "train_acc": 0.0088, + "test_loss": 4.605170199584961, + "test_acc": 0.01, + "lyapunov": 2.463029363880987, + "grad_norm": 0.08771533827211757, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 124.32056403160095 + }, + { + "epoch": 123, + "train_loss": 6.574589498291016, + "train_acc": 0.00878, + "test_loss": 4.605170094299316, + "test_acc": 0.01, + "lyapunov": 2.4620493037621385, + "grad_norm": 0.08813480095873011, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 124.4015576839447 + }, + { + "epoch": 124, + "train_loss": 6.576157915649414, + "train_acc": 0.00904, + "test_loss": 4.605170024108887, + "test_acc": 0.01, + "lyapunov": 2.4630649205668806, + "grad_norm": 0.08749001934915172, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 124.42104578018188 + }, + { + "epoch": 125, + "train_loss": 6.579862565307617, + "train_acc": 0.00876, + "test_loss": 4.605170492553711, + "test_acc": 0.01, + "lyapunov": 2.465126996759868, + "grad_norm": 0.09372036345061274, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 124.4746482372284 + }, + { + "epoch": 126, + "train_loss": 6.577153359985352, + "train_acc": 0.00866, + "test_loss": 4.605170122528076, + "test_acc": 0.01, + "lyapunov": 2.463735998134174, + "grad_norm": 0.09613135620568294, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 124.38881230354309 + }, + { + "epoch": 127, + "train_loss": 6.574400754547119, + "train_acc": 0.0083, + "test_loss": 4.605170375823975, + "test_acc": 0.01, + "lyapunov": 2.4619021769374836, + "grad_norm": 0.08860379526254596, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 124.31344938278198 + }, + { + "epoch": 128, + "train_loss": 6.571165360717774, + "train_acc": 0.00878, + "test_loss": 4.605170154571534, + "test_acc": 0.01, + "lyapunov": 2.459857079074206, + "grad_norm": 0.08757319736074258, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 124.39138221740723 + }, + { + "epoch": 129, + "train_loss": 6.575437990264892, + "train_acc": 0.00846, + "test_loss": 4.605170350646973, + "test_acc": 0.01, + "lyapunov": 2.46259711831427, + "grad_norm": 0.08813574783200358, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 124.41060423851013 + }, + { + "epoch": 130, + "train_loss": 6.591315377197265, + "train_acc": 0.00954, + "test_loss": 4.605170065307617, + "test_acc": 0.01, + "lyapunov": 2.4702539943978, + "grad_norm": 0.11366316284903058, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 124.4502763748169 + }, + { + "epoch": 131, + "train_loss": 6.577392526092529, + "train_acc": 0.00946, + "test_loss": 4.60517007446289, + "test_acc": 0.01, + "lyapunov": 2.46386312401813, + "grad_norm": 0.08820500519427996, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 124.3550136089325 + }, + { + "epoch": 132, + "train_loss": 6.592328434906006, + "train_acc": 0.00882, + "test_loss": 4.6051704208374025, + "test_acc": 0.01, + "lyapunov": 2.4700996772102686, + "grad_norm": 0.114161955094371, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 124.37056255340576 + }, + { + "epoch": 133, + "train_loss": 6.588796159973144, + "train_acc": 0.00896, + "test_loss": 4.605170506286621, + "test_acc": 0.01, + "lyapunov": 2.468394133745862, + "grad_norm": 0.1295209594512649, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 124.36608004570007 + }, + { + "epoch": 134, + "train_loss": 6.576412990264893, + "train_acc": 0.00898, + "test_loss": 4.605170251464844, + "test_acc": 0.01, + "lyapunov": 2.4632679434383618, + "grad_norm": 0.08812453692162578, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 124.43608951568604 + }, + { + "epoch": 135, + "train_loss": 6.5760765690612795, + "train_acc": 0.00924, + "test_loss": 4.605169999694824, + "test_acc": 0.01, + "lyapunov": 2.463012531895162, + "grad_norm": 0.08722595509863246, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 124.46503901481628 + }, + { + "epoch": 136, + "train_loss": 6.575435556030273, + "train_acc": 0.00884, + "test_loss": 4.605170062255859, + "test_acc": 0.01, + "lyapunov": 2.4626583150585595, + "grad_norm": 0.08796433458523298, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 124.34801983833313 + }, + { + "epoch": 137, + "train_loss": 6.575190331268311, + "train_acc": 0.00934, + "test_loss": 4.6051701629638675, + "test_acc": 0.01, + "lyapunov": 2.4624439023644724, + "grad_norm": 0.08813731535348707, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 124.35173964500427 + }, + { + "epoch": 138, + "train_loss": 6.574904625091553, + "train_acc": 0.0089, + "test_loss": 4.60517007446289, + "test_acc": 0.01, + "lyapunov": 2.4622641213409735, + "grad_norm": 0.08807062213809792, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 124.40467262268066 + }, + { + "epoch": 139, + "train_loss": 6.5738159555053715, + "train_acc": 0.00926, + "test_loss": 4.605170321655273, + "test_acc": 0.01, + "lyapunov": 2.4615705336451223, + "grad_norm": 0.08717896516246301, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 124.4789035320282 + }, + { + "epoch": 140, + "train_loss": 6.575532109680176, + "train_acc": 0.00924, + "test_loss": 4.605170358276367, + "test_acc": 0.01, + "lyapunov": 2.4626962266614676, + "grad_norm": 0.0882680648293281, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 124.40317368507385 + }, + { + "epoch": 141, + "train_loss": 6.5800046757507324, + "train_acc": 0.00862, + "test_loss": 4.60517036895752, + "test_acc": 0.01, + "lyapunov": 2.4654090264264275, + "grad_norm": 0.11343015603036581, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 124.35891890525818 + }, + { + "epoch": 142, + "train_loss": 6.57490125793457, + "train_acc": 0.00948, + "test_loss": 4.6051704162597655, + "test_acc": 0.01, + "lyapunov": 2.462258317586406, + "grad_norm": 0.08755517239002598, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 124.29203748703003 + }, + { + "epoch": 143, + "train_loss": 6.576884376220703, + "train_acc": 0.00966, + "test_loss": 4.605170155334473, + "test_acc": 0.01, + "lyapunov": 2.4635954634917665, + "grad_norm": 0.08753943717047542, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 124.41098976135254 + }, + { + "epoch": 144, + "train_loss": 6.573677404937744, + "train_acc": 0.00962, + "test_loss": 4.60517022857666, + "test_acc": 0.01, + "lyapunov": 2.461500019673496, + "grad_norm": 0.08775396126300311, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 124.44748258590698 + }, + { + "epoch": 145, + "train_loss": 6.573780137023926, + "train_acc": 0.0092, + "test_loss": 4.605170056152343, + "test_acc": 0.01, + "lyapunov": 2.4615867387913073, + "grad_norm": 0.08734584455870835, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 124.4104528427124 + }, + { + "epoch": 146, + "train_loss": 6.574326271667481, + "train_acc": 0.00928, + "test_loss": 4.605170436859131, + "test_acc": 0.01, + "lyapunov": 2.4619192083168517, + "grad_norm": 0.08784696936548642, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 124.3491895198822 + }, + { + "epoch": 147, + "train_loss": 6.573583771209717, + "train_acc": 0.00938, + "test_loss": 4.605170133209229, + "test_acc": 0.01, + "lyapunov": 2.461428134947482, + "grad_norm": 0.08718184577116198, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 124.33614110946655 + }, + { + "epoch": 148, + "train_loss": 6.577077916870117, + "train_acc": 0.01, + "test_loss": 4.605170425415039, + "test_acc": 0.01, + "lyapunov": 2.4637341109078252, + "grad_norm": 0.08788027221282606, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 124.37565398216248 + }, + { + "epoch": 149, + "train_loss": 6.5732455339050295, + "train_acc": 0.01, + "test_loss": 4.605170333862305, + "test_acc": 0.01, + "lyapunov": 2.461217089382279, + "grad_norm": 0.08788179142338205, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 124.34460210800171 + }, + { + "epoch": 150, + "train_loss": 6.574304178619385, + "train_acc": 0.01, + "test_loss": 4.605170114135742, + "test_acc": 0.01, + "lyapunov": 2.4619127923570328, + "grad_norm": 0.08771827398079268, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 124.40945982933044 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 13.988400897827148, + "train_acc": 0.01438, + "test_loss": 4.683009733581543, + "test_acc": 0.0106, + "lyapunov": 5.045674181960123, + "grad_norm": 5.752499013515142, + "grad_max_sv": 4.6983559966087345, + "grad_min_sv": 8.501930549228987e-08, + "grad_condition": 317270864.69818985, + "lr": 0.0009998903417374227, + "time_sec": 167.40048050880432 + }, + { + "epoch": 2, + "train_loss": 9.313672403564453, + "train_acc": 0.01648, + "test_loss": 4.631449128723145, + "test_acc": 0.01, + "lyapunov": 3.775117972317864, + "grad_norm": 4.062466764062373, + "grad_max_sv": 3.613509923219681, + "grad_min_sv": 4.5653093948966327e-08, + "grad_condition": 646545370.9190311, + "lr": 0.0009995614150494292, + "time_sec": 167.42056441307068 + }, + { + "epoch": 3, + "train_loss": 9.2102595413208, + "train_acc": 0.01704, + "test_loss": 4.625689315795898, + "test_acc": 0.0099, + "lyapunov": 3.769411094353327, + "grad_norm": 3.2423057609153028, + "grad_max_sv": 2.773962843418121, + "grad_min_sv": 1.3365777420984947e-08, + "grad_condition": 79084430364.82771, + "lr": 0.0009990133642141358, + "time_sec": 167.40087485313416 + }, + { + "epoch": 4, + "train_loss": 8.593553448181153, + "train_acc": 0.01608, + "test_loss": 4.623868472290039, + "test_acc": 0.01, + "lyapunov": 3.5245635119240606, + "grad_norm": 2.236847501376478, + "grad_max_sv": 1.9526167243719101, + "grad_min_sv": 4.5824498221260444e-11, + "grad_condition": 250389376731.7333, + "lr": 0.0009982464296247522, + "time_sec": 167.34348464012146 + }, + { + "epoch": 5, + "train_loss": 7.8038157984924315, + "train_acc": 0.01666, + "test_loss": 4.618056827545166, + "test_acc": 0.01, + "lyapunov": 3.1676931515374145, + "grad_norm": 1.5048980928317333, + "grad_max_sv": 1.1324948772788048, + "grad_min_sv": 1.5125593644607378e-11, + "grad_condition": 218348544809.20728, + "lr": 0.0009972609476841367, + "time_sec": 167.4401364326477 + }, + { + "epoch": 6, + "train_loss": 7.634129183959961, + "train_acc": 0.01436, + "test_loss": 4.617713563537598, + "test_acc": 0.01, + "lyapunov": 3.0711578097184904, + "grad_norm": 1.9264530093156518, + "grad_max_sv": 0.7561077677975927, + "grad_min_sv": 2.3226373858483118e-12, + "grad_condition": 319185362917.36163, + "lr": 0.000996057350657239, + "time_sec": 167.3985676765442 + }, + { + "epoch": 7, + "train_loss": 7.547255232238769, + "train_acc": 0.01396, + "test_loss": 4.614803285980225, + "test_acc": 0.01, + "lyapunov": 3.0217712657226015, + "grad_norm": 1.075279960644913, + "grad_max_sv": 0.6469582007612514, + "grad_min_sv": 1.889760736503505e-12, + "grad_condition": 338582040139.5369, + "lr": 0.000994636166481494, + "time_sec": 167.22783827781677 + }, + { + "epoch": 8, + "train_loss": 7.305741961669922, + "train_acc": 0.01248, + "test_loss": 4.611902558898926, + "test_acc": 0.01, + "lyapunov": 2.8956392976024268, + "grad_norm": 1.304673575393078, + "grad_max_sv": 0.4924972869455814, + "grad_min_sv": 8.285040604573086e-13, + "grad_condition": 334051794817.99695, + "lr": 0.0009929980185352525, + "time_sec": 167.31978368759155 + }, + { + "epoch": 9, + "train_loss": 7.328730865783691, + "train_acc": 0.01336, + "test_loss": 4.606002921295166, + "test_acc": 0.01, + "lyapunov": 2.913580340192751, + "grad_norm": 1.4776699959663357, + "grad_max_sv": 0.3292516863617735, + "grad_min_sv": 5.235604182531881e-13, + "grad_condition": 246744375025.40308, + "lr": 0.0009911436253643444, + "time_sec": 167.3429365158081 + }, + { + "epoch": 10, + "train_loss": 7.308604444580078, + "train_acc": 0.01346, + "test_loss": 4.611476264953613, + "test_acc": 0.01, + "lyapunov": 2.900581695234684, + "grad_norm": 1.3123879020319187, + "grad_max_sv": 0.27272568672558684, + "grad_min_sv": 2.0496919726941882e-13, + "grad_condition": 238625164756.47662, + "lr": 0.0009890738003669028, + "time_sec": 167.2653293609619 + }, + { + "epoch": 11, + "train_loss": 7.490302003173828, + "train_acc": 0.01364, + "test_loss": 4.611579527282715, + "test_acc": 0.01, + "lyapunov": 3.0006146321211324, + "grad_norm": 2.2969507920003114, + "grad_max_sv": 0.19786488203932162, + "grad_min_sv": 8.37648333500382e-14, + "grad_condition": 183815724532.2033, + "lr": 0.00098678945143658, + "time_sec": 167.22061586380005 + }, + { + "epoch": 12, + "train_loss": 7.307793238525391, + "train_acc": 0.01262, + "test_loss": 4.606186763000489, + "test_acc": 0.01, + "lyapunov": 2.9112238219327025, + "grad_norm": 1.4729621434597777, + "grad_max_sv": 0.2151564534753561, + "grad_min_sv": 1.990284826719073e-14, + "grad_condition": 211594713734.62634, + "lr": 0.0009842915805643154, + "time_sec": 167.35631036758423 + }, + { + "epoch": 13, + "train_loss": 7.459832763977051, + "train_acc": 0.01172, + "test_loss": 4.606186486053467, + "test_acc": 0.01, + "lyapunov": 2.9779586944433736, + "grad_norm": 1.2584288878227161, + "grad_max_sv": 0.17604726925492287, + "grad_min_sv": 2.9740421215427092e-27, + "grad_condition": 176047269254.9224, + "lr": 0.000981581283398829, + "time_sec": 167.55029773712158 + }, + { + "epoch": 14, + "train_loss": 7.959970283813477, + "train_acc": 0.01162, + "test_loss": 4.606137133789063, + "test_acc": 0.01, + "lyapunov": 3.224144145960698, + "grad_norm": 1.3145379480759145, + "grad_max_sv": 0.16056990809738636, + "grad_min_sv": 6.069672152326662e-32, + "grad_condition": 160569908097.38638, + "lr": 0.0009786597487660333, + "time_sec": 167.2209074497223 + }, + { + "epoch": 15, + "train_loss": 7.6532865875244145, + "train_acc": 0.01084, + "test_loss": 4.606105514526368, + "test_acc": 0.01, + "lyapunov": 3.0689418846384036, + "grad_norm": 0.7741481577990978, + "grad_max_sv": 0.1402381032705307, + "grad_min_sv": 5.380285453775135e-40, + "grad_condition": 140238103270.5307, + "lr": 0.0009755282581475766, + "time_sec": 167.3077232837677 + }, + { + "epoch": 16, + "train_loss": 7.216664337158203, + "train_acc": 0.01118, + "test_loss": 4.606032288360596, + "test_acc": 0.01, + "lyapunov": 2.8502078891715126, + "grad_norm": 2.0735777194936222, + "grad_max_sv": 0.10496805571019649, + "grad_min_sv": 1.2874706397430962e-40, + "grad_condition": 104968055710.1965, + "lr": 0.0009721881851187403, + "time_sec": 167.3395276069641 + }, + { + "epoch": 17, + "train_loss": 8.192574862670899, + "train_acc": 0.01158, + "test_loss": 4.6059588500976565, + "test_acc": 0.01, + "lyapunov": 3.3359562454321194, + "grad_norm": 3.147348676481939, + "grad_max_sv": 0.09904798325151205, + "grad_min_sv": 3.313275631249688e-41, + "grad_condition": 99047983251.51205, + "lr": 0.0009686409947459456, + "time_sec": 167.2007658481598 + }, + { + "epoch": 18, + "train_loss": 7.947704606018067, + "train_acc": 0.01086, + "test_loss": 4.605810301208496, + "test_acc": 0.01, + "lyapunov": 3.2087259890173403, + "grad_norm": 1.1551680706222047, + "grad_max_sv": 0.0897066842764616, + "grad_min_sv": 3.5133705422167894e-42, + "grad_condition": 89706684276.4616, + "lr": 0.0009648882429441254, + "time_sec": 167.2022511959076 + }, + { + "epoch": 19, + "train_loss": 8.011894176635742, + "train_acc": 0.00998, + "test_loss": 4.610458689880371, + "test_acc": 0.01, + "lyapunov": 3.247671382201602, + "grad_norm": 0.789157877855446, + "grad_max_sv": 0.04834392946213484, + "grad_min_sv": 1.7516230804060213e-46, + "grad_condition": 48343929462.134834, + "lr": 0.00096093157579425, + "time_sec": 167.33806610107422 + }, + { + "epoch": 20, + "train_loss": 8.051023805236817, + "train_acc": 0.00904, + "test_loss": 4.610909297180176, + "test_acc": 0.01, + "lyapunov": 3.2383710405100947, + "grad_norm": 1.1273733660004814, + "grad_max_sv": 0.010316886380314827, + "grad_min_sv": 0.0, + "grad_condition": 10316886380.314827, + "lr": 0.0009567727288213001, + "time_sec": 167.29369735717773 + }, + { + "epoch": 21, + "train_loss": 7.128181716918945, + "train_acc": 0.00838, + "test_loss": 4.607191325378418, + "test_acc": 0.01, + "lyapunov": 2.7860927539103475, + "grad_norm": 1.0701329510796986, + "grad_max_sv": 0.014478291012346744, + "grad_min_sv": 0.0, + "grad_condition": 14478291012.346745, + "lr": 0.0009524135262330095, + "time_sec": 167.20805835723877 + }, + { + "epoch": 22, + "train_loss": 6.963491222686768, + "train_acc": 0.0091, + "test_loss": 4.607380027770996, + "test_acc": 0.01, + "lyapunov": 2.6966084769314818, + "grad_norm": 1.1730630244839415, + "grad_max_sv": 0.012138673383742572, + "grad_min_sv": 0.0, + "grad_condition": 12138673383.742573, + "lr": 0.0009478558801197061, + "time_sec": 167.22877049446106 + }, + { + "epoch": 23, + "train_loss": 6.875370686798096, + "train_acc": 0.00858, + "test_loss": 4.609367184448242, + "test_acc": 0.01, + "lyapunov": 2.6493814430578286, + "grad_norm": 1.3739908151868958, + "grad_max_sv": 0.011468294635415077, + "grad_min_sv": 0.0, + "grad_condition": 11468294635.415077, + "lr": 0.000943101789615607, + "time_sec": 167.56782293319702 + }, + { + "epoch": 24, + "train_loss": 7.175245254516602, + "train_acc": 0.00882, + "test_loss": 4.6075513046264645, + "test_acc": 0.01, + "lyapunov": 2.813519052837206, + "grad_norm": 1.9559849705093102, + "grad_max_sv": 0.011112797912210226, + "grad_min_sv": 0.0, + "grad_condition": 11112797912.210226, + "lr": 0.0009381533400219313, + "time_sec": 167.2002296447754 + }, + { + "epoch": 25, + "train_loss": 6.835657153320312, + "train_acc": 0.00898, + "test_loss": 4.609123987579346, + "test_acc": 0.01, + "lyapunov": 2.6257676047742216, + "grad_norm": 0.8499098981030252, + "grad_max_sv": 0.010097978403791785, + "grad_min_sv": 0.0, + "grad_condition": 10097978403.791786, + "lr": 0.0009330127018922189, + "time_sec": 167.22895908355713 + }, + { + "epoch": 26, + "train_loss": 6.806944010009766, + "train_acc": 0.00952, + "test_loss": 4.608995832824707, + "test_acc": 0.01, + "lyapunov": 2.608501203224787, + "grad_norm": 0.16959020377034753, + "grad_max_sv": 0.009534611040726304, + "grad_min_sv": 0.0, + "grad_condition": 9534611040.726305, + "lr": 0.000927682130080253, + "time_sec": 167.30368304252625 + }, + { + "epoch": 27, + "train_loss": 6.796024333190918, + "train_acc": 0.00918, + "test_loss": 4.608860453033447, + "test_acc": 0.01, + "lyapunov": 2.601986149083013, + "grad_norm": 0.10936615989500913, + "grad_max_sv": 0.003977444209158421, + "grad_min_sv": 0.0, + "grad_condition": 3977444209.1584206, + "lr": 0.0009221639627510072, + "time_sec": 167.31120085716248 + }, + { + "epoch": 28, + "train_loss": 6.799691816711426, + "train_acc": 0.00886, + "test_loss": 4.6074915008544925, + "test_acc": 0.01, + "lyapunov": 2.604261659905124, + "grad_norm": 0.09652074382540592, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009164606203550494, + "time_sec": 167.08661937713623 + }, + { + "epoch": 29, + "train_loss": 6.8092449851989745, + "train_acc": 0.00872, + "test_loss": 4.608655583190918, + "test_acc": 0.01, + "lyapunov": 2.608830842825458, + "grad_norm": 0.12376584460534797, + "grad_max_sv": 0.002880856767296791, + "grad_min_sv": 0.0, + "grad_condition": 2880856767.296791, + "lr": 0.0009105746045668516, + "time_sec": 167.20095920562744 + }, + { + "epoch": 30, + "train_loss": 6.801117441558838, + "train_acc": 0.00916, + "test_loss": 4.608566645812989, + "test_acc": 0.01, + "lyapunov": 2.605140414689203, + "grad_norm": 0.10511250252895085, + "grad_max_sv": 0.0030666613951325417, + "grad_min_sv": 0.0, + "grad_condition": 3066661395.1325417, + "lr": 0.0009045084971874733, + "time_sec": 167.22371792793274 + }, + { + "epoch": 31, + "train_loss": 6.818323947296142, + "train_acc": 0.00892, + "test_loss": 4.607396678161621, + "test_acc": 0.01, + "lyapunov": 2.6131436501622507, + "grad_norm": 0.17673479255010097, + "grad_max_sv": 0.001358983526006341, + "grad_min_sv": 0.0, + "grad_condition": 1358983526.006341, + "lr": 0.0008982649590120977, + "time_sec": 167.21490716934204 + }, + { + "epoch": 32, + "train_loss": 6.81385307510376, + "train_acc": 0.00854, + "test_loss": 4.608588083648682, + "test_acc": 0.01, + "lyapunov": 2.61087080828674, + "grad_norm": 0.1300116564110217, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008918467286629196, + "time_sec": 167.17329859733582 + }, + { + "epoch": 33, + "train_loss": 6.798595635375976, + "train_acc": 0.00848, + "test_loss": 7.428785041809082, + "test_acc": 0.01, + "lyapunov": 2.603473731623891, + "grad_norm": 0.10178851829698213, + "grad_max_sv": 0.0006682275328785181, + "grad_min_sv": 0.0, + "grad_condition": 668227532.8785181, + "lr": 0.0008852566213878943, + "time_sec": 167.23122191429138 + }, + { + "epoch": 34, + "train_loss": 6.79622100402832, + "train_acc": 0.0085, + "test_loss": 7.445402703094483, + "test_acc": 0.01, + "lyapunov": 2.602201823383341, + "grad_norm": 0.09821894401826198, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000878497527825878, + "time_sec": 167.51045203208923 + }, + { + "epoch": 35, + "train_loss": 6.800452690124512, + "train_acc": 0.0086, + "test_loss": 4.6083794067382815, + "test_acc": 0.01, + "lyapunov": 2.604824850321426, + "grad_norm": 0.09521574599597374, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000871572412738697, + "time_sec": 167.14473628997803 + }, + { + "epoch": 36, + "train_loss": 6.801179714050293, + "train_acc": 0.00882, + "test_loss": 4.608353971862793, + "test_acc": 0.01, + "lyapunov": 2.605245649357281, + "grad_norm": 0.09891258167661582, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008644843137107055, + "time_sec": 167.21640372276306 + }, + { + "epoch": 37, + "train_loss": 6.798632629699707, + "train_acc": 0.00856, + "test_loss": 4.608331527709961, + "test_acc": 0.01, + "lyapunov": 2.603703239079936, + "grad_norm": 0.09374120059954827, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008572363398164014, + "time_sec": 167.28665328025818 + }, + { + "epoch": 38, + "train_loss": 6.798052488708496, + "train_acc": 0.00864, + "test_loss": 4.608306627655029, + "test_acc": 0.01, + "lyapunov": 2.6033894985228243, + "grad_norm": 0.0928347460465077, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008498316702566826, + "time_sec": 167.22592282295227 + }, + { + "epoch": 39, + "train_loss": 6.797720238189697, + "train_acc": 0.00854, + "test_loss": 4.608331230163574, + "test_acc": 0.01, + "lyapunov": 2.6030823568553876, + "grad_norm": 0.1025783953694396, + "grad_max_sv": 0.000793654378503561, + "grad_min_sv": 0.0, + "grad_condition": 793654378.503561, + "lr": 0.0008422735529643442, + "time_sec": 167.11991024017334 + }, + { + "epoch": 40, + "train_loss": 6.796907914123535, + "train_acc": 0.00818, + "test_loss": 7.429255201721191, + "test_acc": 0.01, + "lyapunov": 2.6026227175427215, + "grad_norm": 0.09282398303274703, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008345653031794289, + "time_sec": 167.28346157073975 + }, + { + "epoch": 41, + "train_loss": 6.811164211883545, + "train_acc": 0.00882, + "test_loss": 4.7162436149597164, + "test_acc": 0.01, + "lyapunov": 2.608923517529617, + "grad_norm": 0.1222466987863888, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008267103019950526, + "time_sec": 167.2502682209015 + }, + { + "epoch": 42, + "train_loss": 6.810527358703613, + "train_acc": 0.00896, + "test_loss": 4.736723460388184, + "test_acc": 0.01, + "lyapunov": 2.6098364740991227, + "grad_norm": 0.12481417359397351, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743447, + "time_sec": 167.19833540916443 + }, + { + "epoch": 43, + "train_loss": 6.8037118544006345, + "train_acc": 0.0083, + "test_loss": 4.676154768371582, + "test_acc": 0.01, + "lyapunov": 2.606640679147237, + "grad_norm": 0.12856017826684152, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000810573890139155, + "time_sec": 167.17452216148376 + }, + { + "epoch": 44, + "train_loss": 6.794667855529785, + "train_acc": 0.00872, + "test_loss": 4.7420101188659665, + "test_acc": 0.01, + "lyapunov": 2.6012551680855127, + "grad_norm": 0.09209394266338691, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008022995574311873, + "time_sec": 167.27408933639526 + }, + { + "epoch": 45, + "train_loss": 6.7950104260253905, + "train_acc": 0.00898, + "test_loss": 4.896900399780273, + "test_acc": 0.01, + "lyapunov": 2.6014791181325303, + "grad_norm": 0.09205616000449629, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007938926261462363, + "time_sec": 167.31984734535217 + }, + { + "epoch": 46, + "train_loss": 6.819086815185547, + "train_acc": 0.00892, + "test_loss": 4.605172099304199, + "test_acc": 0.01, + "lyapunov": 2.612778242896585, + "grad_norm": 0.11562328930387418, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007853567838422158, + "time_sec": 167.12109279632568 + }, + { + "epoch": 47, + "train_loss": 6.798819590454102, + "train_acc": 0.00832, + "test_loss": 4.605172010803223, + "test_acc": 0.01, + "lyapunov": 2.6037960967139515, + "grad_norm": 0.09084227993519768, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007766957746216719, + "time_sec": 167.26839470863342 + }, + { + "epoch": 48, + "train_loss": 6.797002004394531, + "train_acc": 0.00882, + "test_loss": 4.6051717926025395, + "test_acc": 0.01, + "lyapunov": 2.6027391889820928, + "grad_norm": 0.09202982942979847, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894982, + "time_sec": 167.25185203552246 + }, + { + "epoch": 49, + "train_loss": 6.799232456512451, + "train_acc": 0.00864, + "test_loss": 4.605324877929688, + "test_acc": 0.01, + "lyapunov": 2.6040493954173134, + "grad_norm": 0.0929356327661651, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000759013504686565, + "time_sec": 167.24265789985657 + }, + { + "epoch": 50, + "train_loss": 6.812471532135009, + "train_acc": 0.00842, + "test_loss": 4.608313929748535, + "test_acc": 0.01, + "lyapunov": 2.6102352337459163, + "grad_norm": 0.11621130736417108, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007499999999999998, + "time_sec": 167.15211701393127 + }, + { + "epoch": 51, + "train_loss": 6.794671293334961, + "train_acc": 0.00842, + "test_loss": 4.605172332763672, + "test_acc": 0.01, + "lyapunov": 2.6012639694506556, + "grad_norm": 0.0930565557537395, + "grad_max_sv": 0.0036748358979821205, + "grad_min_sv": 0.0, + "grad_condition": 3674835897.9821205, + "lr": 0.0007408768370508575, + "time_sec": 167.3388113975525 + }, + { + "epoch": 52, + "train_loss": 6.799352421264649, + "train_acc": 0.00892, + "test_loss": 4.605172877502441, + "test_acc": 0.01, + "lyapunov": 2.6041594795558765, + "grad_norm": 0.09046235706111078, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007316480175599307, + "time_sec": 168.00543642044067 + }, + { + "epoch": 53, + "train_loss": 6.821222294006348, + "train_acc": 0.00822, + "test_loss": 4.605560771179199, + "test_acc": 0.01, + "lyapunov": 2.612406419061334, + "grad_norm": 0.10733736636185434, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007223175895924635, + "time_sec": 167.15741348266602 + }, + { + "epoch": 54, + "train_loss": 6.7975339453125, + "train_acc": 0.0087, + "test_loss": 4.605171894073487, + "test_acc": 0.01, + "lyapunov": 2.603086569729973, + "grad_norm": 0.09401396255246093, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825361, + "time_sec": 167.15016341209412 + }, + { + "epoch": 55, + "train_loss": 6.818788750457764, + "train_acc": 0.00834, + "test_loss": 4.60517187576294, + "test_acc": 0.01, + "lyapunov": 2.614099033653279, + "grad_norm": 0.10409203954293918, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007033683215378998, + "time_sec": 167.16365313529968 + }, + { + "epoch": 56, + "train_loss": 6.823291486663819, + "train_acc": 0.00896, + "test_loss": 4.605172322082519, + "test_acc": 0.01, + "lyapunov": 2.6149235838819345, + "grad_norm": 0.1215199933903174, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006937577932260512, + "time_sec": 167.22393465042114 + }, + { + "epoch": 57, + "train_loss": 6.812863822021485, + "train_acc": 0.00918, + "test_loss": 4.605172196197509, + "test_acc": 0.01, + "lyapunov": 2.6100745280380444, + "grad_norm": 0.11428618016798626, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423388, + "time_sec": 167.36779832839966 + }, + { + "epoch": 58, + "train_loss": 6.845285939025879, + "train_acc": 0.00852, + "test_loss": 4.605171984863281, + "test_acc": 0.01, + "lyapunov": 2.621920944784608, + "grad_norm": 0.16133795983355934, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006742860236609073, + "time_sec": 167.1204113960266 + }, + { + "epoch": 59, + "train_loss": 6.8284387295532225, + "train_acc": 0.00838, + "test_loss": 4.605172086334228, + "test_acc": 0.01, + "lyapunov": 2.619316293150568, + "grad_norm": 0.1660277007934849, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006644333233692913, + "time_sec": 167.1542353630066 + }, + { + "epoch": 60, + "train_loss": 6.853109035339355, + "train_acc": 0.00904, + "test_loss": 4.605171766662598, + "test_acc": 0.01, + "lyapunov": 2.626850544644134, + "grad_norm": 0.14505200146170139, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874734, + "time_sec": 167.25803112983704 + }, + { + "epoch": 61, + "train_loss": 6.8587484286499025, + "train_acc": 0.00894, + "test_loss": 4.605171794128418, + "test_acc": 0.01, + "lyapunov": 2.6341320041500396, + "grad_norm": 0.23780774328945256, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006445158984722354, + "time_sec": 167.1593141555786 + }, + { + "epoch": 62, + "train_loss": 6.856730157775879, + "train_acc": 0.00858, + "test_loss": 4.605171855926514, + "test_acc": 0.01, + "lyapunov": 2.6288814319064246, + "grad_norm": 0.19871702414437586, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006344599103076324, + "time_sec": 167.14994502067566 + }, + { + "epoch": 63, + "train_loss": 6.840637737731933, + "train_acc": 0.00874, + "test_loss": 4.60517123260498, + "test_acc": 0.01, + "lyapunov": 2.624538544803629, + "grad_norm": 0.2247756960679524, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824269, + "time_sec": 167.2067906856537 + }, + { + "epoch": 64, + "train_loss": 6.822744883117676, + "train_acc": 0.00848, + "test_loss": 4.60517158203125, + "test_acc": 0.01, + "lyapunov": 2.613635628424642, + "grad_norm": 0.1329153891377645, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006141754350553275, + "time_sec": 167.26912307739258 + }, + { + "epoch": 65, + "train_loss": 6.8317010522460935, + "train_acc": 0.00862, + "test_loss": 4.605171473693848, + "test_acc": 0.01, + "lyapunov": 2.6185932665529763, + "grad_norm": 0.13671337080211707, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006039558454088793, + "time_sec": 167.09261989593506 + }, + { + "epoch": 66, + "train_loss": 6.812226905822754, + "train_acc": 0.0088, + "test_loss": 4.605171728515625, + "test_acc": 0.01, + "lyapunov": 2.610206864374068, + "grad_norm": 0.12722937279819782, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000593690657292862, + "time_sec": 167.21893763542175 + }, + { + "epoch": 67, + "train_loss": 6.808111183776855, + "train_acc": 0.0093, + "test_loss": 4.6051715423583985, + "test_acc": 0.01, + "lyapunov": 2.6089447556859087, + "grad_norm": 0.15865472726238314, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005833843733580507, + "time_sec": 167.29591965675354 + }, + { + "epoch": 68, + "train_loss": 6.83726111694336, + "train_acc": 0.00862, + "test_loss": 4.605171617126465, + "test_acc": 0.01, + "lyapunov": 2.6234818724415185, + "grad_norm": 0.21106961802984933, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005730415142812054, + "time_sec": 167.22871494293213 + }, + { + "epoch": 69, + "train_loss": 6.833951936035156, + "train_acc": 0.00874, + "test_loss": 4.605171533203125, + "test_acc": 0.01, + "lyapunov": 2.6221561791646817, + "grad_norm": 0.23690960823937743, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821517, + "time_sec": 167.11618614196777 + }, + { + "epoch": 70, + "train_loss": 6.80746663269043, + "train_acc": 0.00868, + "test_loss": 4.6051711715698245, + "test_acc": 0.01, + "lyapunov": 2.608615706948673, + "grad_norm": 0.19368668238286113, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005522642316338265, + "time_sec": 167.25853991508484 + }, + { + "epoch": 71, + "train_loss": 6.840300604553223, + "train_acc": 0.00892, + "test_loss": 4.605171086120605, + "test_acc": 0.01, + "lyapunov": 2.6233106214372093, + "grad_norm": 0.21230815886405713, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005418389216661573, + "time_sec": 167.2756736278534 + }, + { + "epoch": 72, + "train_loss": 6.826620941162109, + "train_acc": 0.00886, + "test_loss": 4.605171425628662, + "test_acc": 0.01, + "lyapunov": 2.617017206328604, + "grad_norm": 0.16852859644395693, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646563, + "time_sec": 167.11485767364502 + }, + { + "epoch": 73, + "train_loss": 6.81151391418457, + "train_acc": 0.0083, + "test_loss": 4.605171309661865, + "test_acc": 0.01, + "lyapunov": 2.6109183840739454, + "grad_norm": 0.15884163876986282, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005209378268645994, + "time_sec": 167.23269772529602 + }, + { + "epoch": 74, + "train_loss": 6.803579806518555, + "train_acc": 0.00836, + "test_loss": 4.605171119689941, + "test_acc": 0.01, + "lyapunov": 2.606299752774446, + "grad_norm": 0.12416094470418608, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005104712099416781, + "time_sec": 167.30208802223206 + }, + { + "epoch": 75, + "train_loss": 6.85053612701416, + "train_acc": 0.00864, + "test_loss": 4.605171006774903, + "test_acc": 0.01, + "lyapunov": 2.6286537153336704, + "grad_norm": 0.19093915741238635, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004999999999999996, + "time_sec": 167.27450942993164 + }, + { + "epoch": 76, + "train_loss": 6.801593222961426, + "train_acc": 0.00904, + "test_loss": 4.605170780181885, + "test_acc": 0.01, + "lyapunov": 2.6054461362111905, + "grad_norm": 0.12884562844199357, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004895287900583212, + "time_sec": 167.09656834602356 + }, + { + "epoch": 77, + "train_loss": 6.796963772583008, + "train_acc": 0.00794, + "test_loss": 4.605171012878418, + "test_acc": 0.01, + "lyapunov": 2.6028354930145965, + "grad_norm": 0.09104303565016296, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004790621731353997, + "time_sec": 167.33878350257874 + }, + { + "epoch": 78, + "train_loss": 6.7984873474121095, + "train_acc": 0.00882, + "test_loss": 4.605170700073242, + "test_acc": 0.01, + "lyapunov": 2.603611297314734, + "grad_norm": 0.10157683305126329, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000468604740235343, + "time_sec": 167.25584626197815 + }, + { + "epoch": 79, + "train_loss": 6.820661872863769, + "train_acc": 0.00986, + "test_loss": 4.605170817565918, + "test_acc": 0.01, + "lyapunov": 2.612017824826643, + "grad_norm": 0.14611535298895395, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00045816107833384175, + "time_sec": 167.1672751903534 + }, + { + "epoch": 80, + "train_loss": 6.806377208557129, + "train_acc": 0.00852, + "test_loss": 4.605170895385742, + "test_acc": 0.01, + "lyapunov": 2.607236401809146, + "grad_norm": 0.10585908127422697, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004477357683661729, + "time_sec": 167.1809687614441 + }, + { + "epoch": 81, + "train_loss": 6.808554836425781, + "train_acc": 0.00942, + "test_loss": 4.605170629882813, + "test_acc": 0.01, + "lyapunov": 2.6088667123214058, + "grad_norm": 0.14379651420159803, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784746, + "time_sec": 167.25520253181458 + }, + { + "epoch": 82, + "train_loss": 6.8339071276855465, + "train_acc": 0.00906, + "test_loss": 4.605170634460449, + "test_acc": 0.01, + "lyapunov": 2.620855552766024, + "grad_norm": 0.23055639987610052, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004269584857187939, + "time_sec": 167.52204132080078 + }, + { + "epoch": 83, + "train_loss": 6.828104596252442, + "train_acc": 0.0093, + "test_loss": 4.605170736694336, + "test_acc": 0.01, + "lyapunov": 2.6192942519322076, + "grad_norm": 0.19017261102902538, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004166156266419484, + "time_sec": 167.1194040775299 + }, + { + "epoch": 84, + "train_loss": 6.808681617126465, + "train_acc": 0.0084, + "test_loss": 4.6051709182739256, + "test_acc": 0.01, + "lyapunov": 2.609468307641461, + "grad_norm": 0.15622504553249358, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004063093427071373, + "time_sec": 167.19974207878113 + }, + { + "epoch": 85, + "train_loss": 6.818397989654541, + "train_acc": 0.00824, + "test_loss": 4.605170721435547, + "test_acc": 0.01, + "lyapunov": 2.6138416312234787, + "grad_norm": 0.14833733270771185, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003960441545911199, + "time_sec": 167.2553927898407 + }, + { + "epoch": 86, + "train_loss": 6.799676761169434, + "train_acc": 0.00838, + "test_loss": 4.60517102508545, + "test_acc": 0.01, + "lyapunov": 2.604430999292437, + "grad_norm": 0.11142070053574807, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003858245649446718, + "time_sec": 167.18824887275696 + }, + { + "epoch": 87, + "train_loss": 6.818209040527344, + "train_acc": 0.00854, + "test_loss": 4.605170503997803, + "test_acc": 0.01, + "lyapunov": 2.6141847765354242, + "grad_norm": 0.14462203411441973, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00037565505641757235, + "time_sec": 167.1196677684784 + }, + { + "epoch": 88, + "train_loss": 6.874744393615723, + "train_acc": 0.00888, + "test_loss": 4.605170900726319, + "test_acc": 0.01, + "lyapunov": 2.6346183640267844, + "grad_norm": 0.20078574833508478, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036554008969236695, + "time_sec": 167.2573266029358 + }, + { + "epoch": 89, + "train_loss": 6.803292810211182, + "train_acc": 0.00886, + "test_loss": 4.60517081451416, + "test_acc": 0.01, + "lyapunov": 2.606465803082947, + "grad_norm": 0.12244758192489462, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003554841015277638, + "time_sec": 167.22969937324524 + }, + { + "epoch": 90, + "train_loss": 6.842185859069824, + "train_acc": 0.00942, + "test_loss": 4.605170654296875, + "test_acc": 0.01, + "lyapunov": 2.622050429853942, + "grad_norm": 0.1882414210254429, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000345491502812526, + "time_sec": 167.11765575408936 + }, + { + "epoch": 91, + "train_loss": 6.836290773010254, + "train_acc": 0.00882, + "test_loss": 4.605170703125, + "test_acc": 0.01, + "lyapunov": 2.619682075422438, + "grad_norm": 0.19767006125117328, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003355666766307081, + "time_sec": 167.22952795028687 + }, + { + "epoch": 92, + "train_loss": 6.791880859985351, + "train_acc": 0.00842, + "test_loss": 4.605170771789551, + "test_acc": 0.01, + "lyapunov": 2.5996962294859043, + "grad_norm": 0.08760976620030388, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00032571397633909225, + "time_sec": 167.26651191711426 + }, + { + "epoch": 93, + "train_loss": 6.80370014678955, + "train_acc": 0.00806, + "test_loss": 4.605170739746094, + "test_acc": 0.01, + "lyapunov": 2.606304941884697, + "grad_norm": 0.13940577534302254, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766094, + "time_sec": 167.17852663993835 + }, + { + "epoch": 94, + "train_loss": 6.83537752532959, + "train_acc": 0.00846, + "test_loss": 4.605170500183106, + "test_acc": 0.01, + "lyapunov": 2.623438694288054, + "grad_norm": 0.26310451945532815, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003062422067739483, + "time_sec": 167.17071175575256 + }, + { + "epoch": 95, + "train_loss": 6.799238587646484, + "train_acc": 0.00926, + "test_loss": 4.6051702911376955, + "test_acc": 0.01, + "lyapunov": 2.60419953631623, + "grad_norm": 0.10657735488339905, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00029663167846209965, + "time_sec": 167.223788022995 + }, + { + "epoch": 96, + "train_loss": 6.804974398498535, + "train_acc": 0.00916, + "test_loss": 4.605170680236816, + "test_acc": 0.01, + "lyapunov": 2.60721908383967, + "grad_norm": 0.17693273008046123, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00028711035421746345, + "time_sec": 167.2773995399475 + }, + { + "epoch": 97, + "train_loss": 6.8050346893310545, + "train_acc": 0.0086, + "test_loss": 4.605170379638672, + "test_acc": 0.01, + "lyapunov": 2.607598216332438, + "grad_norm": 0.1351166427526852, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00027768241040753615, + "time_sec": 167.0982165336609 + }, + { + "epoch": 98, + "train_loss": 6.814014775848388, + "train_acc": 0.00896, + "test_loss": 4.605170265960694, + "test_acc": 0.01, + "lyapunov": 2.611722286399978, + "grad_norm": 0.16300027920865434, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00026835198244006903, + "time_sec": 167.213885307312 + }, + { + "epoch": 99, + "train_loss": 6.810039446411133, + "train_acc": 0.00874, + "test_loss": 4.605170517730713, + "test_acc": 0.01, + "lyapunov": 2.609659137018501, + "grad_norm": 0.13742401941675986, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002591231629491421, + "time_sec": 167.23094940185547 + }, + { + "epoch": 100, + "train_loss": 6.818154907836914, + "train_acc": 0.00906, + "test_loss": 4.6051704177856445, + "test_acc": 0.01, + "lyapunov": 2.613592106363048, + "grad_norm": 0.13552057031594136, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002499999999999997, + "time_sec": 167.14863324165344 + }, + { + "epoch": 101, + "train_loss": 6.820175225524903, + "train_acc": 0.00914, + "test_loss": 4.605170472717285, + "test_acc": 0.01, + "lyapunov": 2.615781251731736, + "grad_norm": 0.1825661927434339, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00024098649531343477, + "time_sec": 167.13485431671143 + }, + { + "epoch": 102, + "train_loss": 6.843083056182861, + "train_acc": 0.00814, + "test_loss": 4.605170304107666, + "test_acc": 0.01, + "lyapunov": 2.6266718941271456, + "grad_norm": 0.28170773297668966, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002320866025105016, + "time_sec": 167.3005588054657 + }, + { + "epoch": 103, + "train_loss": 6.81555390625, + "train_acc": 0.0089, + "test_loss": 4.605170388793946, + "test_acc": 0.01, + "lyapunov": 2.6132783401957558, + "grad_norm": 0.20579070177059625, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002233042253783278, + "time_sec": 167.31917262077332 + }, + { + "epoch": 104, + "train_loss": 6.797420726623535, + "train_acc": 0.00826, + "test_loss": 4.60517056274414, + "test_acc": 0.01, + "lyapunov": 2.6031100310937827, + "grad_norm": 0.09877603372479003, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000214643216157784, + "time_sec": 167.13279914855957 + }, + { + "epoch": 105, + "train_loss": 6.825426294555664, + "train_acc": 0.00898, + "test_loss": 4.605170573425293, + "test_acc": 0.01, + "lyapunov": 2.6164557750877515, + "grad_norm": 0.23298022186302586, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376332, + "time_sec": 167.27876543998718 + }, + { + "epoch": 106, + "train_loss": 6.81034471786499, + "train_acc": 0.00862, + "test_loss": 4.605170178222656, + "test_acc": 0.01, + "lyapunov": 2.6101580525908017, + "grad_norm": 0.11576839370764984, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019770044256881242, + "time_sec": 167.24659395217896 + }, + { + "epoch": 107, + "train_loss": 6.8369368406677244, + "train_acc": 0.00846, + "test_loss": 4.605170590209961, + "test_acc": 0.01, + "lyapunov": 2.62125125931352, + "grad_norm": 0.1931519664931494, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001894261098608447, + "time_sec": 167.2057774066925 + }, + { + "epoch": 108, + "train_loss": 6.812288922576904, + "train_acc": 0.0088, + "test_loss": 4.605170223999023, + "test_acc": 0.01, + "lyapunov": 2.6103451739796593, + "grad_norm": 0.13299121884159582, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000181288005125655, + "time_sec": 167.10559225082397 + }, + { + "epoch": 109, + "train_loss": 6.797308649902344, + "train_acc": 0.00842, + "test_loss": 4.605170259094239, + "test_acc": 0.01, + "lyapunov": 2.6030520350122086, + "grad_norm": 0.09292253205333328, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001732896980049473, + "time_sec": 167.28680682182312 + }, + { + "epoch": 110, + "train_loss": 6.802461311950683, + "train_acc": 0.00886, + "test_loss": 4.605170384979248, + "test_acc": 0.01, + "lyapunov": 2.605947788414138, + "grad_norm": 0.09044100601755074, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016543469682057076, + "time_sec": 167.254047870636 + }, + { + "epoch": 111, + "train_loss": 6.800218295593262, + "train_acc": 0.00898, + "test_loss": 4.605170218658447, + "test_acc": 0.01, + "lyapunov": 2.6047815380193997, + "grad_norm": 0.09096765167841042, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 167.18093347549438 + }, + { + "epoch": 112, + "train_loss": 6.80289358581543, + "train_acc": 0.00846, + "test_loss": 4.605170321655273, + "test_acc": 0.01, + "lyapunov": 2.606188810085092, + "grad_norm": 0.11124745619391717, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 167.17500185966492 + }, + { + "epoch": 113, + "train_loss": 6.80328687286377, + "train_acc": 0.0083, + "test_loss": 4.605170209503174, + "test_acc": 0.01, + "lyapunov": 2.606580800717444, + "grad_norm": 0.1173945856600355, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 167.2652928829193 + }, + { + "epoch": 114, + "train_loss": 6.833984843902588, + "train_acc": 0.00896, + "test_loss": 4.605170062255859, + "test_acc": 0.01, + "lyapunov": 2.6208856666789337, + "grad_norm": 0.20744787133639947, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00013551568628929425, + "time_sec": 167.21882677078247 + }, + { + "epoch": 115, + "train_loss": 6.822520295410156, + "train_acc": 0.00838, + "test_loss": 4.605170328521728, + "test_acc": 0.01, + "lyapunov": 2.615956858295919, + "grad_norm": 0.14399695964710044, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 167.09929537773132 + }, + { + "epoch": 116, + "train_loss": 6.799036735839843, + "train_acc": 0.00894, + "test_loss": 4.605170152282715, + "test_acc": 0.01, + "lyapunov": 2.603793166787423, + "grad_norm": 0.10032145854595359, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 167.25386571884155 + }, + { + "epoch": 117, + "train_loss": 6.800587829284668, + "train_acc": 0.00834, + "test_loss": 4.605170477294922, + "test_acc": 0.01, + "lyapunov": 2.604958756805381, + "grad_norm": 0.11401729218950767, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 167.27676010131836 + }, + { + "epoch": 118, + "train_loss": 6.800997655029297, + "train_acc": 0.0088, + "test_loss": 4.605170313262939, + "test_acc": 0.01, + "lyapunov": 2.6053062838971464, + "grad_norm": 0.10865983471852475, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010815327133708009, + "time_sec": 167.16999578475952 + }, + { + "epoch": 119, + "train_loss": 6.800622797088623, + "train_acc": 0.0082, + "test_loss": 4.605170126342774, + "test_acc": 0.01, + "lyapunov": 2.604655019462566, + "grad_norm": 0.12369520749734833, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010173504098790182, + "time_sec": 167.13503623008728 + }, + { + "epoch": 120, + "train_loss": 6.795711727905274, + "train_acc": 0.00866, + "test_loss": 4.60517028503418, + "test_acc": 0.01, + "lyapunov": 2.602085701949761, + "grad_norm": 0.08734190443194187, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 167.28283619880676 + }, + { + "epoch": 121, + "train_loss": 6.796959948425293, + "train_acc": 0.0093, + "test_loss": 4.605170495605469, + "test_acc": 0.01, + "lyapunov": 2.6028400558949736, + "grad_norm": 0.08752194617001091, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 167.22894525527954 + }, + { + "epoch": 122, + "train_loss": 6.80965912033081, + "train_acc": 0.00928, + "test_loss": 4.605170267486573, + "test_acc": 0.01, + "lyapunov": 2.6096866935720224, + "grad_norm": 0.11691201011842964, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 167.16074228286743 + }, + { + "epoch": 123, + "train_loss": 6.817136254882812, + "train_acc": 0.00856, + "test_loss": 4.605170227050781, + "test_acc": 0.01, + "lyapunov": 2.6124652438151563, + "grad_norm": 0.1550769682935547, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 167.20862245559692 + }, + { + "epoch": 124, + "train_loss": 6.797611290588379, + "train_acc": 0.0096, + "test_loss": 4.605170072174072, + "test_acc": 0.01, + "lyapunov": 2.603274511864118, + "grad_norm": 0.10698377372823001, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 167.24812293052673 + }, + { + "epoch": 125, + "train_loss": 6.811994839477539, + "train_acc": 0.00868, + "test_loss": 4.605170003509522, + "test_acc": 0.01, + "lyapunov": 2.6103333463449307, + "grad_norm": 0.14234235939730758, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 167.15956830978394 + }, + { + "epoch": 126, + "train_loss": 6.799865046234131, + "train_acc": 0.00862, + "test_loss": 4.605170318603515, + "test_acc": 0.01, + "lyapunov": 2.604667879431449, + "grad_norm": 0.09265194462378636, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 167.1222221851349 + }, + { + "epoch": 127, + "train_loss": 6.804667163391113, + "train_acc": 0.00886, + "test_loss": 4.605170178985595, + "test_acc": 0.01, + "lyapunov": 2.60723816342366, + "grad_norm": 0.09360794490801955, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 167.1491777896881 + }, + { + "epoch": 128, + "train_loss": 6.803801723480225, + "train_acc": 0.0089, + "test_loss": 4.605170277404786, + "test_acc": 0.01, + "lyapunov": 2.606579548867462, + "grad_norm": 0.10479682515434138, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 167.26385951042175 + }, + { + "epoch": 129, + "train_loss": 6.7995252819824215, + "train_acc": 0.0085, + "test_loss": 4.605170484924316, + "test_acc": 0.01, + "lyapunov": 2.604231426478042, + "grad_norm": 0.08941205723411079, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 167.30450534820557 + }, + { + "epoch": 130, + "train_loss": 6.821313883209228, + "train_acc": 0.00852, + "test_loss": 4.605170134735108, + "test_acc": 0.01, + "lyapunov": 2.615080727335742, + "grad_norm": 0.1662641683208483, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 167.14770483970642 + }, + { + "epoch": 131, + "train_loss": 6.795292775421142, + "train_acc": 0.00846, + "test_loss": 4.605170323944092, + "test_acc": 0.01, + "lyapunov": 2.601862790944326, + "grad_norm": 0.11411966381332427, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 167.2135558128357 + }, + { + "epoch": 132, + "train_loss": 6.796047713775635, + "train_acc": 0.00904, + "test_loss": 4.6051700454711915, + "test_acc": 0.01, + "lyapunov": 2.602336645736109, + "grad_norm": 0.08834944397480328, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 167.23654413223267 + }, + { + "epoch": 133, + "train_loss": 6.799664002380371, + "train_acc": 0.00904, + "test_loss": 4.605170405578614, + "test_acc": 0.01, + "lyapunov": 2.6045111707409325, + "grad_norm": 0.08768823633488758, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 167.25386261940002 + }, + { + "epoch": 134, + "train_loss": 6.799534449920654, + "train_acc": 0.00966, + "test_loss": 4.605170095825195, + "test_acc": 0.01, + "lyapunov": 2.604433027374775, + "grad_norm": 0.08880059006188033, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 167.089768409729 + }, + { + "epoch": 135, + "train_loss": 6.816852741394043, + "train_acc": 0.00922, + "test_loss": 4.6051704139709475, + "test_acc": 0.01, + "lyapunov": 2.6120451417420525, + "grad_norm": 0.1344230192150204, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 167.21077299118042 + }, + { + "epoch": 136, + "train_loss": 6.79835750869751, + "train_acc": 0.01, + "test_loss": 4.60517020111084, + "test_acc": 0.01, + "lyapunov": 2.6037550874988136, + "grad_norm": 0.09237399837874004, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 167.25671005249023 + }, + { + "epoch": 137, + "train_loss": 6.799135870971679, + "train_acc": 0.00948, + "test_loss": 4.605170085144043, + "test_acc": 0.01, + "lyapunov": 2.6042151554771094, + "grad_norm": 0.08937220866741212, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 167.19218349456787 + }, + { + "epoch": 138, + "train_loss": 6.824215604553222, + "train_acc": 0.01, + "test_loss": 4.605170098876953, + "test_acc": 0.01, + "lyapunov": 2.616335995666816, + "grad_norm": 0.10994228945768546, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 167.09943842887878 + }, + { + "epoch": 139, + "train_loss": 6.802577704467773, + "train_acc": 0.01, + "test_loss": 4.605170218658447, + "test_acc": 0.01, + "lyapunov": 2.6062524855289313, + "grad_norm": 0.09042623460420336, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 167.20513486862183 + }, + { + "epoch": 140, + "train_loss": 6.7961073709106445, + "train_acc": 0.01, + "test_loss": 4.605170453643799, + "test_acc": 0.01, + "lyapunov": 2.602320309490194, + "grad_norm": 0.08815797205742677, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 167.25681805610657 + }, + { + "epoch": 141, + "train_loss": 6.797138239898682, + "train_acc": 0.01, + "test_loss": 4.605170432281494, + "test_acc": 0.01, + "lyapunov": 2.6029675891027426, + "grad_norm": 0.0879981627311107, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 167.06548428535461 + }, + { + "epoch": 142, + "train_loss": 6.801417353363037, + "train_acc": 0.01, + "test_loss": 4.605170329284668, + "test_acc": 0.01, + "lyapunov": 2.605164134593876, + "grad_norm": 0.08843743115572271, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 167.19282054901123 + }, + { + "epoch": 143, + "train_loss": 6.799633148193359, + "train_acc": 0.01, + "test_loss": 4.6051702880859375, + "test_acc": 0.01, + "lyapunov": 2.6045726491972006, + "grad_norm": 0.09210601924786092, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 167.22217631340027 + }, + { + "epoch": 144, + "train_loss": 6.799774599914551, + "train_acc": 0.01, + "test_loss": 4.605170209503174, + "test_acc": 0.01, + "lyapunov": 2.6046122669258995, + "grad_norm": 0.08889860655727871, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 167.18017983436584 + }, + { + "epoch": 145, + "train_loss": 6.7985524331665035, + "train_acc": 0.01, + "test_loss": 4.6051704223632814, + "test_acc": 0.01, + "lyapunov": 2.6038548361005076, + "grad_norm": 0.08800873662125164, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 167.10364723205566 + }, + { + "epoch": 146, + "train_loss": 6.797061258239746, + "train_acc": 0.01, + "test_loss": 4.605170094299316, + "test_acc": 0.01, + "lyapunov": 2.6029466247314685, + "grad_norm": 0.08767630908448117, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 167.13109254837036 + }, + { + "epoch": 147, + "train_loss": 6.7999437774658205, + "train_acc": 0.01, + "test_loss": 4.605170198059082, + "test_acc": 0.01, + "lyapunov": 2.6046864193723636, + "grad_norm": 0.08792294865681417, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 167.20970582962036 + }, + { + "epoch": 148, + "train_loss": 6.798582576293946, + "train_acc": 0.01, + "test_loss": 4.605170455932617, + "test_acc": 0.01, + "lyapunov": 2.6038761730389215, + "grad_norm": 0.09215822971292409, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 167.12604355812073 + }, + { + "epoch": 149, + "train_loss": 6.796307967529297, + "train_acc": 0.01, + "test_loss": 4.605170027923584, + "test_acc": 0.01, + "lyapunov": 2.6024758651128512, + "grad_norm": 0.08782242943220565, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 167.15288949012756 + }, + { + "epoch": 150, + "train_loss": 6.797921124420166, + "train_acc": 0.01, + "test_loss": 4.6051702972412105, + "test_acc": 0.01, + "lyapunov": 2.6034922130272515, + "grad_norm": 0.08768432297346943, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 167.14476084709167 + } + ], + "20": [ + { + "epoch": 1, + "train_loss": 15.093960892944336, + "train_acc": 0.01476, + "test_loss": 4.694812010192871, + "test_acc": 0.0101, + "lyapunov": 5.28920032362194, + "grad_norm": 5.920792423737725, + "grad_max_sv": 4.9676717877388, + "grad_min_sv": 8.119859199878787e-08, + "grad_condition": 1111289730.0106924, + "lr": 0.0009998903417374227, + "time_sec": 210.120050907135 + }, + { + "epoch": 2, + "train_loss": 9.793692145080566, + "train_acc": 0.01708, + "test_loss": 4.630818698120117, + "test_acc": 0.0101, + "lyapunov": 3.9491244813670283, + "grad_norm": 4.179099264712139, + "grad_max_sv": 3.6389390349388124, + "grad_min_sv": 4.435643456510846e-08, + "grad_condition": 1465465238.7805393, + "lr": 0.0009995614150494292, + "time_sec": 210.1432433128357 + }, + { + "epoch": 3, + "train_loss": 9.864517554931641, + "train_acc": 0.01526, + "test_loss": 4.635793448638916, + "test_acc": 0.01, + "lyapunov": 4.013264959120689, + "grad_norm": 3.461175130912805, + "grad_max_sv": 3.00231654047966, + "grad_min_sv": 7.094927521799298e-09, + "grad_condition": 151743845631.83978, + "lr": 0.0009990133642141358, + "time_sec": 210.18036890029907 + }, + { + "epoch": 4, + "train_loss": 9.012857937622071, + "train_acc": 0.01522, + "test_loss": 4.623633129882813, + "test_acc": 0.01, + "lyapunov": 3.700052426599176, + "grad_norm": 2.6286152850939577, + "grad_max_sv": 2.296706238389015, + "grad_min_sv": 3.159897203264806e-11, + "grad_condition": 343973728227.78937, + "lr": 0.0009982464296247522, + "time_sec": 210.1404571533203 + }, + { + "epoch": 5, + "train_loss": 8.190340083312988, + "train_acc": 0.0141, + "test_loss": 4.620581848144531, + "test_acc": 0.01, + "lyapunov": 3.3428353769395054, + "grad_norm": 1.8058911521537262, + "grad_max_sv": 1.3938701748847961, + "grad_min_sv": 9.547992879409192e-12, + "grad_condition": 323805955248.2424, + "lr": 0.0009972609476841367, + "time_sec": 210.12661004066467 + }, + { + "epoch": 6, + "train_loss": 7.759998917236328, + "train_acc": 0.01288, + "test_loss": 4.617343115997315, + "test_acc": 0.01, + "lyapunov": 3.1374943689312165, + "grad_norm": 1.7534337420481565, + "grad_max_sv": 0.9646675065159919, + "grad_min_sv": 2.9231036572180592e-12, + "grad_condition": 375265614590.23444, + "lr": 0.000996057350657239, + "time_sec": 210.0431251525879 + }, + { + "epoch": 7, + "train_loss": 7.5100171649169924, + "train_acc": 0.01298, + "test_loss": 4.613992894744873, + "test_acc": 0.01, + "lyapunov": 3.009886204434173, + "grad_norm": 1.2599904723678697, + "grad_max_sv": 0.683513353765011, + "grad_min_sv": 2.034050211148161e-12, + "grad_condition": 321368791479.6951, + "lr": 0.000994636166481494, + "time_sec": 210.03102850914001 + }, + { + "epoch": 8, + "train_loss": 7.526667755889893, + "train_acc": 0.0137, + "test_loss": 4.6132587142944335, + "test_acc": 0.01, + "lyapunov": 3.020487799973744, + "grad_norm": 1.4149077024298684, + "grad_max_sv": 0.43169260323047637, + "grad_min_sv": 1.314155534129329e-12, + "grad_condition": 228604061031.44318, + "lr": 0.0009929980185352525, + "time_sec": 210.09079957008362 + }, + { + "epoch": 9, + "train_loss": 7.424001091003418, + "train_acc": 0.0139, + "test_loss": 4.612518185424805, + "test_acc": 0.01, + "lyapunov": 2.9646140498578397, + "grad_norm": 1.4854391503992914, + "grad_max_sv": 0.39994182234216435, + "grad_min_sv": 7.056669271977351e-13, + "grad_condition": 272585344238.14337, + "lr": 0.0009911436253643444, + "time_sec": 210.04538559913635 + }, + { + "epoch": 10, + "train_loss": 7.422507609710693, + "train_acc": 0.01292, + "test_loss": 4.612365335083008, + "test_acc": 0.01, + "lyapunov": 2.9684851279344096, + "grad_norm": 1.4578891690299673, + "grad_max_sv": 0.3333915390074253, + "grad_min_sv": 5.315411665648874e-13, + "grad_condition": 252944829203.9721, + "lr": 0.0009890738003669028, + "time_sec": 210.01400017738342 + }, + { + "epoch": 11, + "train_loss": 7.279168519592285, + "train_acc": 0.01416, + "test_loss": 4.605921854400635, + "test_acc": 0.01, + "lyapunov": 2.8905254178644753, + "grad_norm": 1.1550117670507138, + "grad_max_sv": 0.26091913171112535, + "grad_min_sv": 1.5622282665285416e-13, + "grad_condition": 237845802721.57803, + "lr": 0.00098678945143658, + "time_sec": 210.0479826927185 + }, + { + "epoch": 12, + "train_loss": 7.238350921325684, + "train_acc": 0.01288, + "test_loss": 4.6059690254211425, + "test_acc": 0.01, + "lyapunov": 2.870093943212953, + "grad_norm": 1.2092537765879001, + "grad_max_sv": 0.2273966234177351, + "grad_min_sv": 2.126834221214877e-15, + "grad_condition": 226904883800.9376, + "lr": 0.0009842915805643154, + "time_sec": 210.02421975135803 + }, + { + "epoch": 13, + "train_loss": 7.237049304504395, + "train_acc": 0.0122, + "test_loss": 4.606073367309571, + "test_acc": 0.01, + "lyapunov": 2.8677229795919357, + "grad_norm": 1.945360181719986, + "grad_max_sv": 0.19105065988258402, + "grad_min_sv": 7.58301405160596e-16, + "grad_condition": 190882486106.46655, + "lr": 0.000981581283398829, + "time_sec": 209.9947109222412 + }, + { + "epoch": 14, + "train_loss": 7.725393817138672, + "train_acc": 0.01264, + "test_loss": 5.5369372573852536, + "test_acc": 0.0157, + "lyapunov": 3.1145479276661985, + "grad_norm": 3.5850673850910875, + "grad_max_sv": 0.13178386465706673, + "grad_min_sv": 1.7957017814409413e-15, + "grad_condition": 131460341909.11662, + "lr": 0.0009786597487660333, + "time_sec": 210.06614232063293 + }, + { + "epoch": 15, + "train_loss": 7.938173998718262, + "train_acc": 0.0112, + "test_loss": 4.605860107421875, + "test_acc": 0.01, + "lyapunov": 3.22320399442902, + "grad_norm": 1.470918431013692, + "grad_max_sv": 0.13412793046313495, + "grad_min_sv": 1.3123556012424532e-27, + "grad_condition": 134127930463.13481, + "lr": 0.0009755282581475766, + "time_sec": 210.01092720031738 + }, + { + "epoch": 16, + "train_loss": 7.877476094970703, + "train_acc": 0.01078, + "test_loss": 4.605639274597168, + "test_acc": 0.01, + "lyapunov": 3.1950507353028983, + "grad_norm": 1.136967603821004, + "grad_max_sv": 0.11695587523281574, + "grad_min_sv": 5.493959932514282e-37, + "grad_condition": 116955875232.81572, + "lr": 0.0009721881851187403, + "time_sec": 210.03272008895874 + }, + { + "epoch": 17, + "train_loss": 7.939653808288575, + "train_acc": 0.01054, + "test_loss": 4.60557441482544, + "test_acc": 0.01, + "lyapunov": 3.220062300982073, + "grad_norm": 1.7456145739471243, + "grad_max_sv": 0.09164720228873194, + "grad_min_sv": 2.1019476964872255e-46, + "grad_condition": 91647202288.73193, + "lr": 0.0009686409947459456, + "time_sec": 210.02848625183105 + }, + { + "epoch": 18, + "train_loss": 7.52693728515625, + "train_acc": 0.0113, + "test_loss": 4.605569499206543, + "test_acc": 0.01, + "lyapunov": 3.0156563999097976, + "grad_norm": 2.4071740405774276, + "grad_max_sv": 0.08130668587982655, + "grad_min_sv": 4.554220009055656e-46, + "grad_condition": 81306685879.82654, + "lr": 0.0009648882429441254, + "time_sec": 210.00972390174866 + }, + { + "epoch": 19, + "train_loss": 7.715430914611816, + "train_acc": 0.0111, + "test_loss": 4.605534184265137, + "test_acc": 0.01, + "lyapunov": 3.1088165675892547, + "grad_norm": 2.6762849936508677, + "grad_max_sv": 0.042965149600058795, + "grad_min_sv": 3.503246160812043e-47, + "grad_condition": 42965149600.05879, + "lr": 0.00096093157579425, + "time_sec": 209.9727280139923 + }, + { + "epoch": 20, + "train_loss": 7.460425003356933, + "train_acc": 0.0111, + "test_loss": 7.111512740325928, + "test_acc": 0.01, + "lyapunov": 2.9692358793809897, + "grad_norm": 2.853254134437055, + "grad_max_sv": 0.050038989260792734, + "grad_min_sv": 2.5374011942761624e-43, + "grad_condition": 50038989260.792725, + "lr": 0.0009567727288213001, + "time_sec": 210.01186299324036 + }, + { + "epoch": 21, + "train_loss": 7.205679086456299, + "train_acc": 0.0091, + "test_loss": 7.044362417602539, + "test_acc": 0.01, + "lyapunov": 2.8364865828658004, + "grad_norm": 3.3061229521295945, + "grad_max_sv": 0.02213773485273123, + "grad_min_sv": 0.0, + "grad_condition": 22137734852.731228, + "lr": 0.0009524135262330095, + "time_sec": 209.98502397537231 + }, + { + "epoch": 22, + "train_loss": 7.1949261268615725, + "train_acc": 0.0098, + "test_loss": 4.605458296203613, + "test_acc": 0.01, + "lyapunov": 2.8206752724659716, + "grad_norm": 6.972340571186882, + "grad_max_sv": 0.02202093116939068, + "grad_min_sv": 0.0, + "grad_condition": 22020931169.39068, + "lr": 0.0009478558801197061, + "time_sec": 209.94458675384521 + }, + { + "epoch": 23, + "train_loss": 7.115987669677734, + "train_acc": 0.00996, + "test_loss": 6.645735456848144, + "test_acc": 0.01, + "lyapunov": 2.7744642029637876, + "grad_norm": 7.989108672811228, + "grad_max_sv": 0.011007561534643173, + "grad_min_sv": 0.0, + "grad_condition": 11007561534.643173, + "lr": 0.000943101789615607, + "time_sec": 209.97865319252014 + }, + { + "epoch": 24, + "train_loss": 7.058884606628418, + "train_acc": 0.00872, + "test_loss": 6.569473106384278, + "test_acc": 0.01, + "lyapunov": 2.745215448881964, + "grad_norm": 5.5094378668531405, + "grad_max_sv": 0.01464888285845518, + "grad_min_sv": 0.0, + "grad_condition": 14648882858.455181, + "lr": 0.0009381533400219313, + "time_sec": 210.0189917087555 + }, + { + "epoch": 25, + "train_loss": 7.515213393859863, + "train_acc": 0.01036, + "test_loss": 4.605401533508301, + "test_acc": 0.01, + "lyapunov": 3.0008729113947097, + "grad_norm": 2.870644125398128, + "grad_max_sv": 0.07644851161090856, + "grad_min_sv": 3.1529215447308385e-46, + "grad_condition": 76448511610.90854, + "lr": 0.0009330127018922189, + "time_sec": 210.00069952011108 + }, + { + "epoch": 26, + "train_loss": 7.552015746002197, + "train_acc": 0.01018, + "test_loss": 4.605392645263672, + "test_acc": 0.01, + "lyapunov": 3.0268727373284148, + "grad_norm": 1.9702867287865506, + "grad_max_sv": 0.07252425029873848, + "grad_min_sv": 1.0509738482436128e-46, + "grad_condition": 72524250298.73848, + "lr": 0.000927682130080253, + "time_sec": 210.00505328178406 + }, + { + "epoch": 27, + "train_loss": 7.204120320739746, + "train_acc": 0.00916, + "test_loss": 4.605300965118408, + "test_acc": 0.01, + "lyapunov": 2.8272059610127793, + "grad_norm": 2.304850056236489, + "grad_max_sv": 0.002205173298716545, + "grad_min_sv": 0.0, + "grad_condition": 2205173298.716545, + "lr": 0.0009221639627510072, + "time_sec": 210.04179668426514 + }, + { + "epoch": 28, + "train_loss": 7.194927945556641, + "train_acc": 0.00832, + "test_loss": 5.018761894989014, + "test_acc": 0.01, + "lyapunov": 2.834069358723243, + "grad_norm": 2.6612819081862673, + "grad_max_sv": 0.007065491378307342, + "grad_min_sv": 0.0, + "grad_condition": 7065491378.307343, + "lr": 0.0009164606203550494, + "time_sec": 209.9864535331726 + }, + { + "epoch": 29, + "train_loss": 7.058241820373535, + "train_acc": 0.0089, + "test_loss": 4.605222779083252, + "test_acc": 0.01, + "lyapunov": 2.7548481247309224, + "grad_norm": 1.6469496155298196, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009105746045668516, + "time_sec": 209.949223279953 + }, + { + "epoch": 30, + "train_loss": 6.992346358947754, + "train_acc": 0.00846, + "test_loss": 5.288449756622314, + "test_acc": 0.01, + "lyapunov": 2.7193446976449485, + "grad_norm": 0.12148601528604053, + "grad_max_sv": 0.010588385537266732, + "grad_min_sv": 0.0, + "grad_condition": 10588385537.266731, + "lr": 0.0009045084971874733, + "time_sec": 209.9674859046936 + }, + { + "epoch": 31, + "train_loss": 6.981909171295166, + "train_acc": 0.0089, + "test_loss": 5.256688010406494, + "test_acc": 0.01, + "lyapunov": 2.713971863622251, + "grad_norm": 0.1172841827453055, + "grad_max_sv": 0.004473739862442016, + "grad_min_sv": 0.0, + "grad_condition": 4473739862.442017, + "lr": 0.0008982649590120977, + "time_sec": 210.0011682510376 + }, + { + "epoch": 32, + "train_loss": 6.981826614379883, + "train_acc": 0.00878, + "test_loss": 5.260603121185302, + "test_acc": 0.01, + "lyapunov": 2.714321748679861, + "grad_norm": 0.09952710953666385, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008918467286629196, + "time_sec": 209.97604823112488 + }, + { + "epoch": 33, + "train_loss": 6.99227462890625, + "train_acc": 0.00872, + "test_loss": 5.264018801879883, + "test_acc": 0.01, + "lyapunov": 2.7198148792052206, + "grad_norm": 0.10982760460792622, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008852566213878943, + "time_sec": 209.99684286117554 + }, + { + "epoch": 34, + "train_loss": 6.985566412353515, + "train_acc": 0.00828, + "test_loss": 5.252056950378418, + "test_acc": 0.01, + "lyapunov": 2.71640632646468, + "grad_norm": 0.0980287254251016, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000878497527825878, + "time_sec": 209.97523665428162 + }, + { + "epoch": 35, + "train_loss": 6.983518271942138, + "train_acc": 0.00802, + "test_loss": 5.235891506958008, + "test_acc": 0.01, + "lyapunov": 2.7152942220878113, + "grad_norm": 0.098301014644246, + "grad_max_sv": 0.010264468565583228, + "grad_min_sv": 0.0, + "grad_condition": 10264468565.58323, + "lr": 0.000871572412738697, + "time_sec": 209.92434358596802 + }, + { + "epoch": 36, + "train_loss": 7.056292109069824, + "train_acc": 0.00856, + "test_loss": 5.234983450317383, + "test_acc": 0.01, + "lyapunov": 2.7453303550515336, + "grad_norm": 0.16314843571536908, + "grad_max_sv": 0.004481474310159684, + "grad_min_sv": 0.0, + "grad_condition": 4481474310.159683, + "lr": 0.0008644843137107055, + "time_sec": 209.98300409317017 + }, + { + "epoch": 37, + "train_loss": 7.04465570388794, + "train_acc": 0.00922, + "test_loss": 4.60517428894043, + "test_acc": 0.01, + "lyapunov": 2.7430449416265463, + "grad_norm": 0.3622526875575334, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008572363398164014, + "time_sec": 209.93617868423462 + }, + { + "epoch": 38, + "train_loss": 6.99952162109375, + "train_acc": 0.00886, + "test_loss": 4.605173640441895, + "test_acc": 0.01, + "lyapunov": 2.7234638078743236, + "grad_norm": 0.13703797479309945, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008498316702566826, + "time_sec": 209.95248365402222 + }, + { + "epoch": 39, + "train_loss": 7.040763073120117, + "train_acc": 0.00844, + "test_loss": 4.605174145507813, + "test_acc": 0.01, + "lyapunov": 2.7378825531591233, + "grad_norm": 0.1820768645877041, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008422735529643442, + "time_sec": 209.9344642162323 + }, + { + "epoch": 40, + "train_loss": 7.0346226399230956, + "train_acc": 0.0086, + "test_loss": 4.6051736892700195, + "test_acc": 0.01, + "lyapunov": 2.7368516513453724, + "grad_norm": 0.16922090716634502, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008345653031794289, + "time_sec": 209.97976160049438 + }, + { + "epoch": 41, + "train_loss": 7.102251969604493, + "train_acc": 0.00846, + "test_loss": 4.605173461914062, + "test_acc": 0.01, + "lyapunov": 2.764533970362085, + "grad_norm": 0.2796669100517588, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008267103019950526, + "time_sec": 209.97592854499817 + }, + { + "epoch": 42, + "train_loss": 6.989806396331787, + "train_acc": 0.00866, + "test_loss": 4.605173326110839, + "test_acc": 0.01, + "lyapunov": 2.718248601459786, + "grad_norm": 0.11817449733439238, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743447, + "time_sec": 209.91329216957092 + }, + { + "epoch": 43, + "train_loss": 6.980831128997803, + "train_acc": 0.00798, + "test_loss": 4.605173022460938, + "test_acc": 0.01, + "lyapunov": 2.713783808071595, + "grad_norm": 0.09538783881391288, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000810573890139155, + "time_sec": 209.95550656318665 + }, + { + "epoch": 44, + "train_loss": 6.979222456054687, + "train_acc": 0.00884, + "test_loss": 4.605172604370117, + "test_acc": 0.01, + "lyapunov": 2.712872148474769, + "grad_norm": 0.0919946830154422, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008022995574311873, + "time_sec": 209.928706407547 + }, + { + "epoch": 45, + "train_loss": 6.981346151428222, + "train_acc": 0.00856, + "test_loss": 4.605171971130371, + "test_acc": 0.01, + "lyapunov": 2.7140665036028304, + "grad_norm": 0.09306477436154323, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007938926261462363, + "time_sec": 209.92562985420227 + }, + { + "epoch": 46, + "train_loss": 6.981760795288086, + "train_acc": 0.0086, + "test_loss": 4.605172605133057, + "test_acc": 0.01, + "lyapunov": 2.714427888850727, + "grad_norm": 0.08970786008826526, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007853567838422158, + "time_sec": 210.02350616455078 + }, + { + "epoch": 47, + "train_loss": 7.014443389587402, + "train_acc": 0.0088, + "test_loss": 4.605172411346436, + "test_acc": 0.01, + "lyapunov": 2.728213080969613, + "grad_norm": 0.1697709047839743, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007766957746216719, + "time_sec": 209.98714351654053 + }, + { + "epoch": 48, + "train_loss": 6.98308254486084, + "train_acc": 0.0088, + "test_loss": 4.605172724151611, + "test_acc": 0.01, + "lyapunov": 2.7148986033466467, + "grad_norm": 0.10089096056823664, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894982, + "time_sec": 209.9425868988037 + }, + { + "epoch": 49, + "train_loss": 6.981540090026855, + "train_acc": 0.00806, + "test_loss": 4.610235414886475, + "test_acc": 0.01, + "lyapunov": 2.714101230396944, + "grad_norm": 0.09707765972227518, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000759013504686565, + "time_sec": 210.01923370361328 + }, + { + "epoch": 50, + "train_loss": 7.012723862762451, + "train_acc": 0.0088, + "test_loss": 4.6051725616455075, + "test_acc": 0.01, + "lyapunov": 2.729266738037929, + "grad_norm": 0.1358370231708399, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007499999999999998, + "time_sec": 209.99068450927734 + }, + { + "epoch": 51, + "train_loss": 7.017712171630859, + "train_acc": 0.00878, + "test_loss": 4.60517274017334, + "test_acc": 0.01, + "lyapunov": 2.729401938445733, + "grad_norm": 0.13779403599934203, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007408768370508575, + "time_sec": 210.01132082939148 + }, + { + "epoch": 52, + "train_loss": 6.98579848815918, + "train_acc": 0.00862, + "test_loss": 4.605172367095947, + "test_acc": 0.01, + "lyapunov": 2.7164978974920406, + "grad_norm": 0.11440777465495124, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007316480175599307, + "time_sec": 209.96309852600098 + }, + { + "epoch": 53, + "train_loss": 6.980713491516113, + "train_acc": 0.0088, + "test_loss": 4.605172201538086, + "test_acc": 0.01, + "lyapunov": 2.7136193919364753, + "grad_norm": 0.0963297125293723, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007223175895924635, + "time_sec": 210.0020875930786 + }, + { + "epoch": 54, + "train_loss": 6.9838667016601566, + "train_acc": 0.00856, + "test_loss": 4.605172233581543, + "test_acc": 0.01, + "lyapunov": 2.715499324871756, + "grad_norm": 0.1368676120419564, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825361, + "time_sec": 209.94060635566711 + }, + { + "epoch": 55, + "train_loss": 6.983624946899414, + "train_acc": 0.00906, + "test_loss": 4.605171611022949, + "test_acc": 0.01, + "lyapunov": 2.7151694712431533, + "grad_norm": 0.1214142336589057, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007033683215378998, + "time_sec": 209.92118954658508 + }, + { + "epoch": 56, + "train_loss": 6.996163428649902, + "train_acc": 0.00826, + "test_loss": 4.60517228012085, + "test_acc": 0.01, + "lyapunov": 2.721804239560881, + "grad_norm": 0.13635707009394835, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006937577932260512, + "time_sec": 210.05888557434082 + }, + { + "epoch": 57, + "train_loss": 6.9852110571289066, + "train_acc": 0.00888, + "test_loss": 4.6051725509643555, + "test_acc": 0.01, + "lyapunov": 2.7162836719961727, + "grad_norm": 0.09827989868248155, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423388, + "time_sec": 210.03313207626343 + }, + { + "epoch": 58, + "train_loss": 6.990598773498535, + "train_acc": 0.0087, + "test_loss": 4.605171973419189, + "test_acc": 0.01, + "lyapunov": 2.718923308355424, + "grad_norm": 0.11245505032562926, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006742860236609073, + "time_sec": 210.20554780960083 + }, + { + "epoch": 59, + "train_loss": 6.990819956512452, + "train_acc": 0.00914, + "test_loss": 4.605172409057618, + "test_acc": 0.01, + "lyapunov": 2.719175950950369, + "grad_norm": 0.11267799994144367, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006644333233692913, + "time_sec": 210.00883507728577 + }, + { + "epoch": 60, + "train_loss": 7.063073814697265, + "train_acc": 0.00868, + "test_loss": 4.605172189331054, + "test_acc": 0.01, + "lyapunov": 2.7483064634415806, + "grad_norm": 0.18267690644430695, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874734, + "time_sec": 210.0396704673767 + }, + { + "epoch": 61, + "train_loss": 6.994184250183105, + "train_acc": 0.00868, + "test_loss": 4.605171653747559, + "test_acc": 0.01, + "lyapunov": 2.7201892951565325, + "grad_norm": 0.1215511744322559, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006445158984722354, + "time_sec": 210.01424837112427 + }, + { + "epoch": 62, + "train_loss": 7.032484904479981, + "train_acc": 0.00918, + "test_loss": 4.605172390747071, + "test_acc": 0.01, + "lyapunov": 2.7373275226339353, + "grad_norm": 0.20957283019702622, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006344599103076324, + "time_sec": 210.07943868637085 + }, + { + "epoch": 63, + "train_loss": 6.997943234863281, + "train_acc": 0.00816, + "test_loss": 4.6051715438842775, + "test_acc": 0.01, + "lyapunov": 2.722739946506822, + "grad_norm": 0.14325925108066898, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824269, + "time_sec": 210.0124545097351 + }, + { + "epoch": 64, + "train_loss": 7.036040018615723, + "train_acc": 0.00846, + "test_loss": 4.6051715461730955, + "test_acc": 0.01, + "lyapunov": 2.737502407234953, + "grad_norm": 0.1852649849094369, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006141754350553275, + "time_sec": 210.16446352005005 + }, + { + "epoch": 65, + "train_loss": 6.987151607818603, + "train_acc": 0.00856, + "test_loss": 4.605171313476562, + "test_acc": 0.01, + "lyapunov": 2.717369063126157, + "grad_norm": 0.11469395705842762, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006039558454088793, + "time_sec": 210.01318955421448 + }, + { + "epoch": 66, + "train_loss": 7.095058049316406, + "train_acc": 0.0084, + "test_loss": 4.605171440124511, + "test_acc": 0.01, + "lyapunov": 2.76260655432406, + "grad_norm": 0.38302198809757837, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000593690657292862, + "time_sec": 209.99922275543213 + }, + { + "epoch": 67, + "train_loss": 6.990951052246094, + "train_acc": 0.00822, + "test_loss": 4.60517152709961, + "test_acc": 0.01, + "lyapunov": 2.719036699865785, + "grad_norm": 0.12621463018935974, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005833843733580507, + "time_sec": 210.0219807624817 + }, + { + "epoch": 68, + "train_loss": 6.979004976806641, + "train_acc": 0.0089, + "test_loss": 4.6051711723327635, + "test_acc": 0.01, + "lyapunov": 2.7127806817174265, + "grad_norm": 0.0898257720991778, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005730415142812054, + "time_sec": 209.98719429969788 + }, + { + "epoch": 69, + "train_loss": 7.030236116638184, + "train_acc": 0.0085, + "test_loss": 4.605171342468262, + "test_acc": 0.01, + "lyapunov": 2.7335510912453733, + "grad_norm": 0.16033156081316657, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821517, + "time_sec": 210.08958458900452 + }, + { + "epoch": 70, + "train_loss": 7.039960643615722, + "train_acc": 0.00892, + "test_loss": 4.6051711669921875, + "test_acc": 0.01, + "lyapunov": 2.739665296681397, + "grad_norm": 0.22271149603025697, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005522642316338265, + "time_sec": 210.03332662582397 + }, + { + "epoch": 71, + "train_loss": 6.994076708221436, + "train_acc": 0.0088, + "test_loss": 4.605171272277832, + "test_acc": 0.01, + "lyapunov": 2.720922397530597, + "grad_norm": 0.1379622518868338, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005418389216661573, + "time_sec": 210.08726000785828 + }, + { + "epoch": 72, + "train_loss": 7.031296715240479, + "train_acc": 0.0093, + "test_loss": 4.605170808410644, + "test_acc": 0.01, + "lyapunov": 2.7340313668751044, + "grad_norm": 0.15171246429702803, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646563, + "time_sec": 209.98722290992737 + }, + { + "epoch": 73, + "train_loss": 7.004211445465088, + "train_acc": 0.00854, + "test_loss": 4.605171342468262, + "test_acc": 0.01, + "lyapunov": 2.723038975844908, + "grad_norm": 0.13946310624469108, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005209378268645994, + "time_sec": 210.0228340625763 + }, + { + "epoch": 74, + "train_loss": 7.004648984680176, + "train_acc": 0.00784, + "test_loss": 4.605171240234375, + "test_acc": 0.01, + "lyapunov": 2.7241133033771954, + "grad_norm": 0.14177753146701746, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005104712099416781, + "time_sec": 210.09978771209717 + }, + { + "epoch": 75, + "train_loss": 7.037411134338379, + "train_acc": 0.00828, + "test_loss": 4.605171034240723, + "test_acc": 0.01, + "lyapunov": 2.7407932879065005, + "grad_norm": 0.3048803615675911, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004999999999999996, + "time_sec": 209.95723867416382 + }, + { + "epoch": 76, + "train_loss": 7.073835411071777, + "train_acc": 0.00852, + "test_loss": 4.605171124267578, + "test_acc": 0.01, + "lyapunov": 2.7557388784940287, + "grad_norm": 0.3366831366752972, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004895287900583212, + "time_sec": 210.0526421070099 + }, + { + "epoch": 77, + "train_loss": 7.069385101013183, + "train_acc": 0.00882, + "test_loss": 4.605171006011963, + "test_acc": 0.01, + "lyapunov": 2.7532967996719244, + "grad_norm": 0.3023678187768571, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004790621731353997, + "time_sec": 210.00937223434448 + }, + { + "epoch": 78, + "train_loss": 7.039409867553711, + "train_acc": 0.00918, + "test_loss": 4.605171101379394, + "test_acc": 0.01, + "lyapunov": 2.7399997028243512, + "grad_norm": 0.2334340472843992, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000468604740235343, + "time_sec": 209.98830223083496 + }, + { + "epoch": 79, + "train_loss": 7.060353764648437, + "train_acc": 0.0089, + "test_loss": 4.605171464538574, + "test_acc": 0.01, + "lyapunov": 2.7474362892872843, + "grad_norm": 0.24607577443282014, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00045816107833384175, + "time_sec": 209.9931514263153 + }, + { + "epoch": 80, + "train_loss": 6.994573851013183, + "train_acc": 0.00838, + "test_loss": 4.605170816040039, + "test_acc": 0.01, + "lyapunov": 2.7213273816706276, + "grad_norm": 0.13316471216665574, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004477357683661729, + "time_sec": 210.0208034515381 + }, + { + "epoch": 81, + "train_loss": 6.987541461791992, + "train_acc": 0.00882, + "test_loss": 4.605170903778077, + "test_acc": 0.01, + "lyapunov": 2.7174221109551238, + "grad_norm": 0.103648369821384, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784746, + "time_sec": 209.98763418197632 + }, + { + "epoch": 82, + "train_loss": 7.037619709472656, + "train_acc": 0.009, + "test_loss": 4.60517109298706, + "test_acc": 0.01, + "lyapunov": 2.740689567897631, + "grad_norm": 0.2931576105004017, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004269584857187939, + "time_sec": 209.9937252998352 + }, + { + "epoch": 83, + "train_loss": 6.985121826171875, + "train_acc": 0.00916, + "test_loss": 4.605170684051513, + "test_acc": 0.01, + "lyapunov": 2.7163276074792417, + "grad_norm": 0.1492971550466505, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004166156266419484, + "time_sec": 209.95198678970337 + }, + { + "epoch": 84, + "train_loss": 7.066727964477539, + "train_acc": 0.00896, + "test_loss": 4.605170683288574, + "test_acc": 0.01, + "lyapunov": 2.7504812116208286, + "grad_norm": 0.2866450325163035, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004063093427071373, + "time_sec": 210.01719284057617 + }, + { + "epoch": 85, + "train_loss": 6.989573917999268, + "train_acc": 0.00868, + "test_loss": 4.605171029663086, + "test_acc": 0.01, + "lyapunov": 2.718881234488524, + "grad_norm": 0.17966945444038818, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003960441545911199, + "time_sec": 209.97075200080872 + }, + { + "epoch": 86, + "train_loss": 7.024203224792481, + "train_acc": 0.009, + "test_loss": 4.60517100982666, + "test_acc": 0.01, + "lyapunov": 2.7339598565455288, + "grad_norm": 0.22243544874027923, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003858245649446718, + "time_sec": 210.22112345695496 + }, + { + "epoch": 87, + "train_loss": 6.999354568481445, + "train_acc": 0.0089, + "test_loss": 4.605170932006836, + "test_acc": 0.01, + "lyapunov": 2.723075409984345, + "grad_norm": 0.18428974005449253, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00037565505641757235, + "time_sec": 210.0000035762787 + }, + { + "epoch": 88, + "train_loss": 6.986679251861572, + "train_acc": 0.0085, + "test_loss": 4.605170610046387, + "test_acc": 0.01, + "lyapunov": 2.7169672826976727, + "grad_norm": 0.12620646621233791, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036554008969236695, + "time_sec": 209.9843943119049 + }, + { + "epoch": 89, + "train_loss": 7.011478589172364, + "train_acc": 0.00836, + "test_loss": 4.605170822143554, + "test_acc": 0.01, + "lyapunov": 2.7271931854355365, + "grad_norm": 0.15417699872251808, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003554841015277638, + "time_sec": 209.97113156318665 + }, + { + "epoch": 90, + "train_loss": 7.101416894836426, + "train_acc": 0.00908, + "test_loss": 4.605170645141602, + "test_acc": 0.01, + "lyapunov": 2.7632448941545413, + "grad_norm": 0.31835714546200394, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000345491502812526, + "time_sec": 209.9718475341797 + }, + { + "epoch": 91, + "train_loss": 7.0410906286621096, + "train_acc": 0.00862, + "test_loss": 4.605170471191406, + "test_acc": 0.01, + "lyapunov": 2.7411284916236274, + "grad_norm": 0.3464519876405528, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003355666766307081, + "time_sec": 209.98472666740417 + }, + { + "epoch": 92, + "train_loss": 7.078473837890625, + "train_acc": 0.00868, + "test_loss": 4.605170490264893, + "test_acc": 0.01, + "lyapunov": 2.756490916547263, + "grad_norm": 0.3699213952956702, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00032571397633909225, + "time_sec": 209.99044036865234 + }, + { + "epoch": 93, + "train_loss": 6.9829315435791015, + "train_acc": 0.00898, + "test_loss": 4.605170346069336, + "test_acc": 0.01, + "lyapunov": 2.71514059576537, + "grad_norm": 0.0883076892297495, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766094, + "time_sec": 209.9776222705841 + }, + { + "epoch": 94, + "train_loss": 6.9855348080444335, + "train_acc": 0.00822, + "test_loss": 4.605170868682861, + "test_acc": 0.01, + "lyapunov": 2.7164944638986417, + "grad_norm": 0.1479238762597201, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003062422067739483, + "time_sec": 210.00643134117126 + }, + { + "epoch": 95, + "train_loss": 6.9874295346069335, + "train_acc": 0.00856, + "test_loss": 4.605170775604248, + "test_acc": 0.01, + "lyapunov": 2.7169240917391178, + "grad_norm": 0.15626938065528906, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00029663167846209965, + "time_sec": 209.99916791915894 + }, + { + "epoch": 96, + "train_loss": 6.983181795043945, + "train_acc": 0.00818, + "test_loss": 4.605170436096191, + "test_acc": 0.01, + "lyapunov": 2.7151255619800305, + "grad_norm": 0.12016550567041384, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00028711035421746345, + "time_sec": 210.07179808616638 + }, + { + "epoch": 97, + "train_loss": 6.9956132180786135, + "train_acc": 0.0088, + "test_loss": 4.6051704200744625, + "test_acc": 0.01, + "lyapunov": 2.7203723811127647, + "grad_norm": 0.14197786423069308, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00027768241040753615, + "time_sec": 209.9841606616974 + }, + { + "epoch": 98, + "train_loss": 6.9846799612426755, + "train_acc": 0.00844, + "test_loss": 4.605170723724365, + "test_acc": 0.01, + "lyapunov": 2.715931734465577, + "grad_norm": 0.1266081420314572, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00026835198244006903, + "time_sec": 209.96538734436035 + }, + { + "epoch": 99, + "train_loss": 7.002227352294922, + "train_acc": 0.0088, + "test_loss": 4.605170701599121, + "test_acc": 0.01, + "lyapunov": 2.7254832943382166, + "grad_norm": 0.30098740432801424, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002591231629491421, + "time_sec": 209.96611714363098 + }, + { + "epoch": 100, + "train_loss": 7.031358368072509, + "train_acc": 0.0084, + "test_loss": 4.605170401763916, + "test_acc": 0.01, + "lyapunov": 2.734792661179057, + "grad_norm": 0.22052159160290236, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002499999999999997, + "time_sec": 209.99191045761108 + }, + { + "epoch": 101, + "train_loss": 7.02535282836914, + "train_acc": 0.0089, + "test_loss": 4.605170426940918, + "test_acc": 0.01, + "lyapunov": 2.732613311094396, + "grad_norm": 0.1884414449751891, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00024098649531343477, + "time_sec": 209.96369862556458 + }, + { + "epoch": 102, + "train_loss": 6.979629467163086, + "train_acc": 0.00892, + "test_loss": 4.605170404052735, + "test_acc": 0.01, + "lyapunov": 2.713197677031807, + "grad_norm": 0.11445011044498424, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002320866025105016, + "time_sec": 209.94372940063477 + }, + { + "epoch": 103, + "train_loss": 6.992681996459961, + "train_acc": 0.00866, + "test_loss": 4.605170614624023, + "test_acc": 0.01, + "lyapunov": 2.7198261897582228, + "grad_norm": 0.11698623871801088, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002233042253783278, + "time_sec": 209.9833948612213 + }, + { + "epoch": 104, + "train_loss": 6.981217978515625, + "train_acc": 0.00812, + "test_loss": 4.605170754241944, + "test_acc": 0.01, + "lyapunov": 2.7141413487436825, + "grad_norm": 0.08755411353395318, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000214643216157784, + "time_sec": 210.01173162460327 + }, + { + "epoch": 105, + "train_loss": 6.981228657531738, + "train_acc": 0.00804, + "test_loss": 4.605170397949219, + "test_acc": 0.01, + "lyapunov": 2.7141372974571363, + "grad_norm": 0.09294871100024936, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376332, + "time_sec": 209.94330191612244 + }, + { + "epoch": 106, + "train_loss": 7.012609109344482, + "train_acc": 0.0086, + "test_loss": 4.605170350646973, + "test_acc": 0.01, + "lyapunov": 2.7288797901719426, + "grad_norm": 0.20993573311720926, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019770044256881242, + "time_sec": 210.00956416130066 + }, + { + "epoch": 107, + "train_loss": 7.00075564453125, + "train_acc": 0.00862, + "test_loss": 4.60517020111084, + "test_acc": 0.01, + "lyapunov": 2.7233152907827627, + "grad_norm": 0.15372921012205631, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001894261098608447, + "time_sec": 210.00604104995728 + }, + { + "epoch": 108, + "train_loss": 7.0513025799560545, + "train_acc": 0.00884, + "test_loss": 4.605170352172852, + "test_acc": 0.01, + "lyapunov": 2.7449967105065465, + "grad_norm": 0.27576954124117053, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000181288005125655, + "time_sec": 209.93969535827637 + }, + { + "epoch": 109, + "train_loss": 6.980083810424805, + "train_acc": 0.00836, + "test_loss": 4.605170263671875, + "test_acc": 0.01, + "lyapunov": 2.713495020366386, + "grad_norm": 0.08939231438623309, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001732896980049473, + "time_sec": 209.99505877494812 + }, + { + "epoch": 110, + "train_loss": 6.984004687805176, + "train_acc": 0.00854, + "test_loss": 4.60517056350708, + "test_acc": 0.01, + "lyapunov": 2.715787248538278, + "grad_norm": 0.09252734679044972, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016543469682057076, + "time_sec": 209.9858946800232 + }, + { + "epoch": 111, + "train_loss": 6.983103836517334, + "train_acc": 0.00846, + "test_loss": 4.6051701759338375, + "test_acc": 0.01, + "lyapunov": 2.715198960145721, + "grad_norm": 0.12412466148890375, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 209.98376154899597 + }, + { + "epoch": 112, + "train_loss": 7.001786309051513, + "train_acc": 0.00842, + "test_loss": 4.605170098876953, + "test_acc": 0.01, + "lyapunov": 2.7237192645402213, + "grad_norm": 0.2611435951973152, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 210.04836750030518 + }, + { + "epoch": 113, + "train_loss": 6.985844685974121, + "train_acc": 0.0083, + "test_loss": 4.605170079040527, + "test_acc": 0.01, + "lyapunov": 2.716268786993783, + "grad_norm": 0.12269496905075315, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 210.01298427581787 + }, + { + "epoch": 114, + "train_loss": 6.982051696472168, + "train_acc": 0.0086, + "test_loss": 4.605170341491699, + "test_acc": 0.01, + "lyapunov": 2.7146723093584066, + "grad_norm": 0.10102267353118359, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00013551568628929425, + "time_sec": 209.98340034484863 + }, + { + "epoch": 115, + "train_loss": 6.97831426361084, + "train_acc": 0.00934, + "test_loss": 4.60517028503418, + "test_acc": 0.01, + "lyapunov": 2.7124323881495638, + "grad_norm": 0.0910994755377039, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 209.99640536308289 + }, + { + "epoch": 116, + "train_loss": 6.9820148625183105, + "train_acc": 0.00932, + "test_loss": 4.605170400238037, + "test_acc": 0.01, + "lyapunov": 2.7146591920681926, + "grad_norm": 0.10075615501603827, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 209.9244248867035 + }, + { + "epoch": 117, + "train_loss": 6.9843703225708005, + "train_acc": 0.00914, + "test_loss": 4.605170434570312, + "test_acc": 0.01, + "lyapunov": 2.715647294393281, + "grad_norm": 0.11228216953551147, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 209.9830358028412 + }, + { + "epoch": 118, + "train_loss": 7.017746971740722, + "train_acc": 0.00848, + "test_loss": 4.605170096588135, + "test_acc": 0.01, + "lyapunov": 2.7295747071580814, + "grad_norm": 0.20995938315988794, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010815327133708009, + "time_sec": 209.98030400276184 + }, + { + "epoch": 119, + "train_loss": 6.992286892089844, + "train_acc": 0.00848, + "test_loss": 4.605170076751709, + "test_acc": 0.01, + "lyapunov": 2.7198437071212416, + "grad_norm": 0.13966024517159772, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010173504098790182, + "time_sec": 209.8962001800537 + }, + { + "epoch": 120, + "train_loss": 6.988741851654053, + "train_acc": 0.00882, + "test_loss": 4.605170139312744, + "test_acc": 0.01, + "lyapunov": 2.7180907177498272, + "grad_norm": 0.16074749971185626, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 210.00037145614624 + }, + { + "epoch": 121, + "train_loss": 6.9938799935913085, + "train_acc": 0.00866, + "test_loss": 4.605170372772217, + "test_acc": 0.01, + "lyapunov": 2.7198036820687297, + "grad_norm": 0.15994838954410112, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 210.0474226474762 + }, + { + "epoch": 122, + "train_loss": 7.0039596870422365, + "train_acc": 0.00892, + "test_loss": 4.6051700347900395, + "test_acc": 0.01, + "lyapunov": 2.7259010494212665, + "grad_norm": 0.09437754111929303, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 210.04152083396912 + }, + { + "epoch": 123, + "train_loss": 7.009052494049072, + "train_acc": 0.00872, + "test_loss": 4.605170434570312, + "test_acc": 0.01, + "lyapunov": 2.72874392755806, + "grad_norm": 0.10432489602660702, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 210.2749161720276 + }, + { + "epoch": 124, + "train_loss": 7.074693834838867, + "train_acc": 0.0093, + "test_loss": 4.605170128631592, + "test_acc": 0.01, + "lyapunov": 2.758679599103415, + "grad_norm": 0.22022455692760384, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 210.06590056419373 + }, + { + "epoch": 125, + "train_loss": 6.982606186523437, + "train_acc": 0.00892, + "test_loss": 4.605170491027832, + "test_acc": 0.01, + "lyapunov": 2.7148781255687897, + "grad_norm": 0.08823763166065995, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 210.01559233665466 + }, + { + "epoch": 126, + "train_loss": 6.982140954437256, + "train_acc": 0.0086, + "test_loss": 4.605170350646973, + "test_acc": 0.01, + "lyapunov": 2.7147414952592777, + "grad_norm": 0.10255408158855737, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 210.03672337532043 + }, + { + "epoch": 127, + "train_loss": 6.979871159973144, + "train_acc": 0.00872, + "test_loss": 4.605170230102539, + "test_acc": 0.01, + "lyapunov": 2.71336467369743, + "grad_norm": 0.08818157608440398, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 210.00639820098877 + }, + { + "epoch": 128, + "train_loss": 6.985049297180176, + "train_acc": 0.00864, + "test_loss": 4.605170027160645, + "test_acc": 0.01, + "lyapunov": 2.716455806551687, + "grad_norm": 0.08762261938563776, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 209.97323060035706 + }, + { + "epoch": 129, + "train_loss": 6.985287237243653, + "train_acc": 0.00956, + "test_loss": 4.605170120239258, + "test_acc": 0.01, + "lyapunov": 2.7165556063737406, + "grad_norm": 0.08764461237151443, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 210.0408091545105 + }, + { + "epoch": 130, + "train_loss": 7.065185516815186, + "train_acc": 0.00922, + "test_loss": 4.605170118713379, + "test_acc": 0.01, + "lyapunov": 2.756326196138816, + "grad_norm": 0.2237427649903656, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 210.05785131454468 + }, + { + "epoch": 131, + "train_loss": 7.003630043640137, + "train_acc": 0.00874, + "test_loss": 4.605170425415039, + "test_acc": 0.01, + "lyapunov": 2.7251280341916684, + "grad_norm": 0.11404915316549034, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 210.06771302223206 + }, + { + "epoch": 132, + "train_loss": 7.016419371795655, + "train_acc": 0.00874, + "test_loss": 4.605170411682129, + "test_acc": 0.01, + "lyapunov": 2.732408604048707, + "grad_norm": 0.09643363295807468, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 210.00194883346558 + }, + { + "epoch": 133, + "train_loss": 7.027043022460938, + "train_acc": 0.00868, + "test_loss": 4.605170454406738, + "test_acc": 0.01, + "lyapunov": 2.7380632366365787, + "grad_norm": 0.08968045213589285, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 210.257652759552 + }, + { + "epoch": 134, + "train_loss": 7.035782067260742, + "train_acc": 0.00788, + "test_loss": 4.605170135498047, + "test_acc": 0.01, + "lyapunov": 2.743028284033851, + "grad_norm": 0.09341294223256699, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 209.9916913509369 + }, + { + "epoch": 135, + "train_loss": 7.071151198425293, + "train_acc": 0.0096, + "test_loss": 4.605170458984375, + "test_acc": 0.01, + "lyapunov": 2.760085921153388, + "grad_norm": 0.09297571487706319, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 210.2266161441803 + }, + { + "epoch": 136, + "train_loss": 7.034707638702392, + "train_acc": 0.00916, + "test_loss": 4.605170063018798, + "test_acc": 0.01, + "lyapunov": 2.742517843880617, + "grad_norm": 0.08845657511108296, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 210.06171536445618 + }, + { + "epoch": 137, + "train_loss": 7.0274613586425785, + "train_acc": 0.00888, + "test_loss": 4.605170385742188, + "test_acc": 0.01, + "lyapunov": 2.7373946475250945, + "grad_norm": 0.10398852016478509, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 209.9369614124298 + }, + { + "epoch": 138, + "train_loss": 7.025472250366211, + "train_acc": 0.0095, + "test_loss": 4.605170440673828, + "test_acc": 0.01, + "lyapunov": 2.736402528670133, + "grad_norm": 0.09038559548514402, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 210.0793435573578 + }, + { + "epoch": 139, + "train_loss": 7.014701705322266, + "train_acc": 0.00924, + "test_loss": 4.605170342254639, + "test_acc": 0.01, + "lyapunov": 2.7315333481030084, + "grad_norm": 0.10172944851300819, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 210.09445595741272 + }, + { + "epoch": 140, + "train_loss": 7.003781777954101, + "train_acc": 0.00918, + "test_loss": 4.605170393371582, + "test_acc": 0.01, + "lyapunov": 2.7260687607328604, + "grad_norm": 0.08766437036057895, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 210.07793593406677 + }, + { + "epoch": 141, + "train_loss": 7.056627904968262, + "train_acc": 0.01, + "test_loss": 4.60516996383667, + "test_acc": 0.01, + "lyapunov": 2.7532575478029373, + "grad_norm": 0.09441259373264534, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 210.04277729988098 + }, + { + "epoch": 142, + "train_loss": 6.989320599212647, + "train_acc": 0.00982, + "test_loss": 4.605170464324951, + "test_acc": 0.01, + "lyapunov": 2.718763675836041, + "grad_norm": 0.08778246721140825, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 210.0390853881836 + }, + { + "epoch": 143, + "train_loss": 7.0194689248657225, + "train_acc": 0.01, + "test_loss": 4.605170278930664, + "test_acc": 0.01, + "lyapunov": 2.7337976069096714, + "grad_norm": 0.088168048948687, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 210.09060406684875 + }, + { + "epoch": 144, + "train_loss": 6.989500450592041, + "train_acc": 0.01, + "test_loss": 4.605170496368408, + "test_acc": 0.01, + "lyapunov": 2.71841098280514, + "grad_norm": 0.08876604826979184, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 210.08678889274597 + }, + { + "epoch": 145, + "train_loss": 6.977725113220215, + "train_acc": 0.01, + "test_loss": 4.605170376586914, + "test_acc": 0.01, + "lyapunov": 2.712189649986794, + "grad_norm": 0.08740841232989421, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 210.07671403884888 + }, + { + "epoch": 146, + "train_loss": 7.063753978881836, + "train_acc": 0.01, + "test_loss": 4.605170356750488, + "test_acc": 0.01, + "lyapunov": 2.7562683031077273, + "grad_norm": 0.08829447012972118, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 210.06147265434265 + }, + { + "epoch": 147, + "train_loss": 6.97903392501831, + "train_acc": 0.01, + "test_loss": 4.605170056915283, + "test_acc": 0.01, + "lyapunov": 2.712921044405769, + "grad_norm": 0.08792833595670006, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 210.12889552116394 + }, + { + "epoch": 148, + "train_loss": 7.024583773956299, + "train_acc": 0.01, + "test_loss": 4.605170234680176, + "test_acc": 0.01, + "lyapunov": 2.736283694386787, + "grad_norm": 0.08841220675764232, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 210.09635305404663 + }, + { + "epoch": 149, + "train_loss": 6.9777571395874025, + "train_acc": 0.01, + "test_loss": 4.605170068359375, + "test_acc": 0.01, + "lyapunov": 2.7121838078169564, + "grad_norm": 0.08769792454661404, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 210.0731065273285 + }, + { + "epoch": 150, + "train_loss": 6.9812114135742185, + "train_acc": 0.01, + "test_loss": 4.605170178985595, + "test_acc": 0.01, + "lyapunov": 2.71422858494322, + "grad_norm": 0.08799513594752054, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 210.09806776046753 + } + ] + } +}
\ No newline at end of file diff --git a/runs/depth_scaling/cifar10_20251229-160504/config.json b/runs/depth_scaling/cifar10_20251229-160504/config.json new file mode 100644 index 0000000..c87b8a8 --- /dev/null +++ b/runs/depth_scaling/cifar10_20251229-160504/config.json @@ -0,0 +1,20 @@ +{ + "dataset": "cifar10", + "depths": [ + 4, + 8, + 12, + 16 + ], + "T": 4, + "epochs": 100, + "batch_size": 128, + "lr": 0.001, + "lambda_reg": 0.3, + "lambda_target": -0.1, + "data_dir": "./data", + "out_dir": "runs/depth_scaling", + "device": "cuda", + "seed": 42, + "no_progress": false +}
\ No newline at end of file diff --git a/runs/depth_scaling/cifar10_20251229-160504/results.json b/runs/depth_scaling/cifar10_20251229-160504/results.json new file mode 100644 index 0000000..2e9b6eb --- /dev/null +++ b/runs/depth_scaling/cifar10_20251229-160504/results.json @@ -0,0 +1,11222 @@ +{ + "vanilla": { + "4": [ + { + "epoch": 1, + "train_loss": 1.87523081199646, + "train_acc": 0.3904, + "test_loss": 1.3005033981323242, + "test_acc": 0.538, + "lyapunov": null, + "grad_norm": 7.167065437345997, + "grad_max_sv": 6.2841449797153475, + "grad_min_sv": 2.820393511626662e-07, + "grad_condition": 22637653.325481158, + "lr": 0.0009997532801828658, + "time_sec": 17.83638072013855 + }, + { + "epoch": 2, + "train_loss": 1.330778917236328, + "train_acc": 0.53242, + "test_loss": 1.3051589399337769, + "test_acc": 0.5299, + "lyapunov": null, + "grad_norm": 5.684293544168513, + "grad_max_sv": 4.961454087495804, + "grad_min_sv": 2.2011614504435783e-07, + "grad_condition": 23000049.3006949, + "lr": 0.0009990133642141358, + "time_sec": 15.308318853378296 + }, + { + "epoch": 3, + "train_loss": 1.1224762370300292, + "train_acc": 0.59994, + "test_loss": 1.1229688482284546, + "test_acc": 0.6085, + "lyapunov": null, + "grad_norm": 4.767601837094887, + "grad_max_sv": 4.13027862906456, + "grad_min_sv": 1.9442289698190506e-07, + "grad_condition": 21218061.296424918, + "lr": 0.00099778098230154, + "time_sec": 15.306547403335571 + }, + { + "epoch": 4, + "train_loss": 0.9929985418510437, + "train_acc": 0.6506, + "test_loss": 1.0345463452339172, + "test_acc": 0.6476, + "lyapunov": null, + "grad_norm": 4.154534311876162, + "grad_max_sv": 3.4217750519514083, + "grad_min_sv": 1.738904227721605e-07, + "grad_condition": 19945043.08817544, + "lr": 0.000996057350657239, + "time_sec": 15.302969694137573 + }, + { + "epoch": 5, + "train_loss": 0.8976026094818115, + "train_acc": 0.68438, + "test_loss": 0.8756585054397583, + "test_acc": 0.6914, + "lyapunov": null, + "grad_norm": 3.6333960771107905, + "grad_max_sv": 2.9354925364255906, + "grad_min_sv": 1.6106242668456615e-07, + "grad_condition": 18489046.232839655, + "lr": 0.0009938441702975688, + "time_sec": 15.317728281021118 + }, + { + "epoch": 6, + "train_loss": 0.8413557116317749, + "train_acc": 0.70288, + "test_loss": 1.0890468210220337, + "test_acc": 0.6361, + "lyapunov": null, + "grad_norm": 3.416502916483722, + "grad_max_sv": 2.8772784233093263, + "grad_min_sv": 1.524946609876565e-07, + "grad_condition": 19017545.32666207, + "lr": 0.0009911436253643444, + "time_sec": 15.30530047416687 + }, + { + "epoch": 7, + "train_loss": 0.780380486125946, + "train_acc": 0.72624, + "test_loss": 0.7749503490447998, + "test_acc": 0.7328, + "lyapunov": null, + "grad_norm": 3.046069709126096, + "grad_max_sv": 2.3629971712827684, + "grad_min_sv": 1.380081055657456e-07, + "grad_condition": 17149009.230771504, + "lr": 0.0009879583809693736, + "time_sec": 15.307675838470459 + }, + { + "epoch": 8, + "train_loss": 0.7390781346511841, + "train_acc": 0.7414, + "test_loss": 0.7958005157470703, + "test_acc": 0.7277, + "lyapunov": null, + "grad_norm": 2.7435338958916513, + "grad_max_sv": 2.05181370973587, + "grad_min_sv": 1.2932217341443675e-07, + "grad_condition": 16036517.768211821, + "lr": 0.0009842915805643154, + "time_sec": 15.307319641113281 + }, + { + "epoch": 9, + "train_loss": 0.7052495925521851, + "train_acc": 0.75274, + "test_loss": 1.0447007677078246, + "test_acc": 0.6745, + "lyapunov": null, + "grad_norm": 2.552586529905072, + "grad_max_sv": 2.0337040573358536, + "grad_min_sv": 1.2101497901539914e-07, + "grad_condition": 16963155.872520845, + "lr": 0.0009801468428384714, + "time_sec": 15.290063619613647 + }, + { + "epoch": 10, + "train_loss": 0.6694383864402771, + "train_acc": 0.76588, + "test_loss": 0.9462176066398621, + "test_acc": 0.6842, + "lyapunov": null, + "grad_norm": 2.3520331395340692, + "grad_max_sv": 1.7684333354234696, + "grad_min_sv": 1.1190378259584577e-07, + "grad_condition": 15955738.307438832, + "lr": 0.0009755282581475767, + "time_sec": 15.305615901947021 + }, + { + "epoch": 11, + "train_loss": 0.6340117832756043, + "train_acc": 0.77878, + "test_loss": 0.7613432981491088, + "test_acc": 0.7377, + "lyapunov": null, + "grad_norm": 2.164571307713442, + "grad_max_sv": 1.7057331085205079, + "grad_min_sv": 1.0792852087604387e-07, + "grad_condition": 15783530.208328355, + "lr": 0.0009704403844771127, + "time_sec": 15.29656457901001 + }, + { + "epoch": 12, + "train_loss": 0.6060477030181884, + "train_acc": 0.78728, + "test_loss": 0.7971237164974213, + "test_acc": 0.729, + "lyapunov": null, + "grad_norm": 1.993298876301324, + "grad_max_sv": 1.514353270828724, + "grad_min_sv": 1.009763655801521e-07, + "grad_condition": 14944755.026175302, + "lr": 0.0009648882429441257, + "time_sec": 15.30236530303955 + }, + { + "epoch": 13, + "train_loss": 0.5870892490005493, + "train_acc": 0.79524, + "test_loss": 0.8448094959259034, + "test_acc": 0.7127, + "lyapunov": null, + "grad_norm": 1.8629217723116693, + "grad_max_sv": 1.3949483826756477, + "grad_min_sv": 9.635141964281502e-08, + "grad_condition": 14581029.38399595, + "lr": 0.0009588773128419905, + "time_sec": 15.315025806427002 + }, + { + "epoch": 14, + "train_loss": 0.5539195073699951, + "train_acc": 0.80644, + "test_loss": 0.7561563467979431, + "test_acc": 0.7394, + "lyapunov": null, + "grad_norm": 1.6986166991338625, + "grad_max_sv": 1.245494757592678, + "grad_min_sv": 8.711651755533012e-08, + "grad_condition": 14401234.8235637, + "lr": 0.0009524135262330098, + "time_sec": 15.308890104293823 + }, + { + "epoch": 15, + "train_loss": 0.5333379591941834, + "train_acc": 0.8143, + "test_loss": 0.6968033623695373, + "test_acc": 0.7569, + "lyapunov": null, + "grad_norm": 1.5656089916965232, + "grad_max_sv": 1.1909169003367424, + "grad_min_sv": 8.488269482853639e-08, + "grad_condition": 14106351.27298153, + "lr": 0.0009455032620941839, + "time_sec": 15.311123609542847 + }, + { + "epoch": 16, + "train_loss": 0.5167095581436157, + "train_acc": 0.82042, + "test_loss": 0.849514400100708, + "test_acc": 0.7133, + "lyapunov": null, + "grad_norm": 1.496171987836298, + "grad_max_sv": 1.0258999049663544, + "grad_min_sv": 8.006283778172473e-08, + "grad_condition": 12841377.110361751, + "lr": 0.0009381533400219318, + "time_sec": 15.310609817504883 + }, + { + "epoch": 17, + "train_loss": 0.49894729826927187, + "train_acc": 0.8262, + "test_loss": 0.7154086270809173, + "test_acc": 0.7552, + "lyapunov": null, + "grad_norm": 1.3884031919720434, + "grad_max_sv": 0.9819801226258278, + "grad_min_sv": 7.953692726658801e-08, + "grad_condition": 12477520.833613167, + "lr": 0.0009303710135019719, + "time_sec": 15.301868200302124 + }, + { + "epoch": 18, + "train_loss": 0.4833205630302429, + "train_acc": 0.83074, + "test_loss": 0.8212436129570008, + "test_acc": 0.7372, + "lyapunov": null, + "grad_norm": 1.322943153444315, + "grad_max_sv": 0.9954353883862496, + "grad_min_sv": 7.706266931251094e-08, + "grad_condition": 12928888.561653998, + "lr": 0.0009221639627510076, + "time_sec": 15.304028987884521 + }, + { + "epoch": 19, + "train_loss": 0.46378349807739255, + "train_acc": 0.8371, + "test_loss": 0.6447551451683045, + "test_acc": 0.789, + "lyapunov": null, + "grad_norm": 1.231933968586028, + "grad_max_sv": 0.7683330580592156, + "grad_min_sv": 6.892571695615856e-08, + "grad_condition": 11194075.895721275, + "lr": 0.000913540287137281, + "time_sec": 15.304960489273071 + }, + { + "epoch": 20, + "train_loss": 0.44474551233291626, + "train_acc": 0.84504, + "test_loss": 0.6990101715087891, + "test_acc": 0.7693, + "lyapunov": null, + "grad_norm": 1.1785280692983833, + "grad_max_sv": 0.8134334728121757, + "grad_min_sv": 6.934622298615523e-08, + "grad_condition": 11771827.214910198, + "lr": 0.0009045084971874739, + "time_sec": 15.309978008270264 + }, + { + "epoch": 21, + "train_loss": 0.4328971823978424, + "train_acc": 0.8493, + "test_loss": 0.605803295135498, + "test_acc": 0.7971, + "lyapunov": null, + "grad_norm": 1.1010893792673297, + "grad_max_sv": 0.74788568764925, + "grad_min_sv": 6.635127869358826e-08, + "grad_condition": 11337903.371089932, + "lr": 0.0008950775061878452, + "time_sec": 15.304766416549683 + }, + { + "epoch": 22, + "train_loss": 0.42013943620681765, + "train_acc": 0.85398, + "test_loss": 0.6351155483245849, + "test_acc": 0.7873, + "lyapunov": null, + "grad_norm": 1.050275059187082, + "grad_max_sv": 0.733056052774191, + "grad_min_sv": 6.172693325368073e-08, + "grad_condition": 11926578.893480929, + "lr": 0.0008852566213878947, + "time_sec": 15.304250001907349 + }, + { + "epoch": 23, + "train_loss": 0.4068706720542908, + "train_acc": 0.85872, + "test_loss": 0.6962938892364502, + "test_acc": 0.7771, + "lyapunov": null, + "grad_norm": 1.0041008989601972, + "grad_max_sv": 0.6977266952395439, + "grad_min_sv": 6.174876086006975e-08, + "grad_condition": 11375115.065625418, + "lr": 0.0008750555348152298, + "time_sec": 15.29546570777893 + }, + { + "epoch": 24, + "train_loss": 0.3927080359458923, + "train_acc": 0.86198, + "test_loss": 0.6316822688102722, + "test_acc": 0.797, + "lyapunov": null, + "grad_norm": 0.9591057928108919, + "grad_max_sv": 0.6601924143731595, + "grad_min_sv": 5.981677704269828e-08, + "grad_condition": 10958128.320144685, + "lr": 0.0008644843137107057, + "time_sec": 15.319843292236328 + }, + { + "epoch": 25, + "train_loss": 0.37991392849445343, + "train_acc": 0.8662, + "test_loss": 0.7685016389846802, + "test_acc": 0.7528, + "lyapunov": null, + "grad_norm": 0.9185108543931831, + "grad_max_sv": 0.5813446715474129, + "grad_min_sv": 5.7562914257403006e-08, + "grad_condition": 10132723.13073414, + "lr": 0.0008535533905932737, + "time_sec": 15.314316272735596 + }, + { + "epoch": 26, + "train_loss": 0.3740078569984436, + "train_acc": 0.86904, + "test_loss": 0.6302923937797547, + "test_acc": 0.7894, + "lyapunov": null, + "grad_norm": 0.896823092741051, + "grad_max_sv": 0.5897809371352196, + "grad_min_sv": 5.612208120453488e-08, + "grad_condition": 10555219.724126566, + "lr": 0.0008422735529643444, + "time_sec": 15.295911312103271 + }, + { + "epoch": 27, + "train_loss": 0.35986615454673765, + "train_acc": 0.8722, + "test_loss": 0.5293433817148209, + "test_acc": 0.8255, + "lyapunov": null, + "grad_norm": 0.8414160526480361, + "grad_max_sv": 0.5433246113359929, + "grad_min_sv": 5.460546566027347e-08, + "grad_condition": 10029361.12551422, + "lr": 0.0008306559326618259, + "time_sec": 15.296611309051514 + }, + { + "epoch": 28, + "train_loss": 0.34749350198745727, + "train_acc": 0.87846, + "test_loss": 0.6013012096405029, + "test_acc": 0.8077, + "lyapunov": null, + "grad_norm": 0.8012028361027335, + "grad_max_sv": 0.5324302047491074, + "grad_min_sv": 5.343053706141632e-08, + "grad_condition": 9995030.902296156, + "lr": 0.0008187119948743449, + "time_sec": 15.314170122146606 + }, + { + "epoch": 29, + "train_loss": 0.33312201313018797, + "train_acc": 0.88212, + "test_loss": 0.5545183982849121, + "test_acc": 0.8162, + "lyapunov": null, + "grad_norm": 0.7852771005330633, + "grad_max_sv": 0.5164767228066921, + "grad_min_sv": 5.198521888516439e-08, + "grad_condition": 10107248.49432898, + "lr": 0.0008064535268264883, + "time_sec": 15.311892986297607 + }, + { + "epoch": 30, + "train_loss": 0.3230313647842407, + "train_acc": 0.88538, + "test_loss": 0.658975659275055, + "test_acc": 0.7951, + "lyapunov": null, + "grad_norm": 0.7620779575769897, + "grad_max_sv": 0.5038670122623443, + "grad_min_sv": 5.0398949014152095e-08, + "grad_condition": 10038873.739317197, + "lr": 0.0007938926261462367, + "time_sec": 15.305739402770996 + }, + { + "epoch": 31, + "train_loss": 0.318023904876709, + "train_acc": 0.88796, + "test_loss": 0.6099616609573364, + "test_acc": 0.8127, + "lyapunov": null, + "grad_norm": 0.7501021639283835, + "grad_max_sv": 0.48214229866862296, + "grad_min_sv": 5.136175964537415e-08, + "grad_condition": 9343056.264591306, + "lr": 0.0007810416889260654, + "time_sec": 15.325766324996948 + }, + { + "epoch": 32, + "train_loss": 0.31232675287246703, + "train_acc": 0.89082, + "test_loss": 0.5936648756027222, + "test_acc": 0.8109, + "lyapunov": null, + "grad_norm": 0.7279129448401558, + "grad_max_sv": 0.4431505911052227, + "grad_min_sv": 4.812153910904726e-08, + "grad_condition": 9245973.275864627, + "lr": 0.0007679133974894983, + "time_sec": 15.317164897918701 + }, + { + "epoch": 33, + "train_loss": 0.29341697571754455, + "train_acc": 0.8967, + "test_loss": 0.5134524160385132, + "test_acc": 0.8357, + "lyapunov": null, + "grad_norm": 0.6884958324446571, + "grad_max_sv": 0.4426784858107567, + "grad_min_sv": 4.9337259699910875e-08, + "grad_condition": 9173234.108017813, + "lr": 0.0007545207078751857, + "time_sec": 15.312905311584473 + }, + { + "epoch": 34, + "train_loss": 0.2897170938873291, + "train_acc": 0.89828, + "test_loss": 0.5332132309913635, + "test_acc": 0.8335, + "lyapunov": null, + "grad_norm": 0.6750271636840882, + "grad_max_sv": 0.4532689817249775, + "grad_min_sv": 4.866335441278125e-08, + "grad_condition": 9412153.339201316, + "lr": 0.0007408768370508577, + "time_sec": 15.313745260238647 + }, + { + "epoch": 35, + "train_loss": 0.28602589085578917, + "train_acc": 0.89756, + "test_loss": 0.6111867341041565, + "test_acc": 0.8164, + "lyapunov": null, + "grad_norm": 0.6693786571127541, + "grad_max_sv": 0.4255728892982006, + "grad_min_sv": 4.737296563916971e-08, + "grad_condition": 9020003.170186436, + "lr": 0.0007269952498697734, + "time_sec": 15.32437539100647 + }, + { + "epoch": 36, + "train_loss": 0.2724088624763489, + "train_acc": 0.90408, + "test_loss": 0.5054482436180114, + "test_acc": 0.8387, + "lyapunov": null, + "grad_norm": 0.6416324201224461, + "grad_max_sv": 0.4291106700897217, + "grad_min_sv": 4.6136759568327077e-08, + "grad_condition": 9385408.654433403, + "lr": 0.0007128896457825364, + "time_sec": 15.322253704071045 + }, + { + "epoch": 37, + "train_loss": 0.26598569943904876, + "train_acc": 0.90576, + "test_loss": 0.5292941621780396, + "test_acc": 0.8315, + "lyapunov": null, + "grad_norm": 0.6311835178833255, + "grad_max_sv": 0.372799988463521, + "grad_min_sv": 4.42526025601353e-08, + "grad_condition": 8432960.688056583, + "lr": 0.0006985739453173903, + "time_sec": 15.330822467803955 + }, + { + "epoch": 38, + "train_loss": 0.2548411606884003, + "train_acc": 0.90972, + "test_loss": 0.5889158064842224, + "test_acc": 0.8304, + "lyapunov": null, + "grad_norm": 0.6075907586779873, + "grad_max_sv": 0.40464401319622995, + "grad_min_sv": 4.5029356776638e-08, + "grad_condition": 9144084.308266882, + "lr": 0.0006840622763423391, + "time_sec": 15.306779623031616 + }, + { + "epoch": 39, + "train_loss": 0.2488733386993408, + "train_acc": 0.91114, + "test_loss": 0.5380938538551331, + "test_acc": 0.8325, + "lyapunov": null, + "grad_norm": 0.6071846116294305, + "grad_max_sv": 0.3960565410554409, + "grad_min_sv": 4.6051877067299075e-08, + "grad_condition": 8601152.95310002, + "lr": 0.0006693689601226458, + "time_sec": 15.341014862060547 + }, + { + "epoch": 40, + "train_loss": 0.24494112944602967, + "train_acc": 0.91272, + "test_loss": 0.5513611147403717, + "test_acc": 0.8299, + "lyapunov": null, + "grad_norm": 0.592226155692726, + "grad_max_sv": 0.3729955680668354, + "grad_min_sv": 4.293505284636012e-08, + "grad_condition": 8794710.30872355, + "lr": 0.0006545084971874737, + "time_sec": 15.389995813369751 + }, + { + "epoch": 41, + "train_loss": 0.23727083059310913, + "train_acc": 0.9153, + "test_loss": 0.516801796245575, + "test_acc": 0.8461, + "lyapunov": null, + "grad_norm": 0.5812900748217327, + "grad_max_sv": 0.38579080179333686, + "grad_min_sv": 4.4259539766500214e-08, + "grad_condition": 8748753.244401883, + "lr": 0.0006394955530196147, + "time_sec": 15.318362474441528 + }, + { + "epoch": 42, + "train_loss": 0.22481181490898133, + "train_acc": 0.92022, + "test_loss": 0.5416705925941467, + "test_acc": 0.8322, + "lyapunov": null, + "grad_norm": 0.5619779097810216, + "grad_max_sv": 0.35356797464191914, + "grad_min_sv": 4.2614826689657547e-08, + "grad_condition": 8335709.16485816, + "lr": 0.0006243449435824273, + "time_sec": 15.315505743026733 + }, + { + "epoch": 43, + "train_loss": 0.22531912160873413, + "train_acc": 0.9199, + "test_loss": 0.5833574778556824, + "test_acc": 0.8338, + "lyapunov": null, + "grad_norm": 0.557199013327348, + "grad_max_sv": 0.33938006646931174, + "grad_min_sv": 4.300346327923421e-08, + "grad_condition": 7932422.911212927, + "lr": 0.0006090716206982714, + "time_sec": 15.32206392288208 + }, + { + "epoch": 44, + "train_loss": 0.216223452000618, + "train_acc": 0.92378, + "test_loss": 0.5012358224868775, + "test_acc": 0.8491, + "lyapunov": null, + "grad_norm": 0.5383308349401124, + "grad_max_sv": 0.3396204937249422, + "grad_min_sv": 4.201267005399245e-08, + "grad_condition": 8110585.992247519, + "lr": 0.0005936906572928625, + "time_sec": 15.314954042434692 + }, + { + "epoch": 45, + "train_loss": 0.21238275866508483, + "train_acc": 0.92506, + "test_loss": 0.5394745681762695, + "test_acc": 0.8426, + "lyapunov": null, + "grad_norm": 0.5338537929467614, + "grad_max_sv": 0.34414798244833944, + "grad_min_sv": 4.2673109312829635e-08, + "grad_condition": 8155102.629835799, + "lr": 0.0005782172325201156, + "time_sec": 15.313148975372314 + }, + { + "epoch": 46, + "train_loss": 0.2043999564409256, + "train_acc": 0.9264, + "test_loss": 0.4982535705089569, + "test_acc": 0.851, + "lyapunov": null, + "grad_norm": 0.518001070564685, + "grad_max_sv": 0.3181751623749733, + "grad_min_sv": 4.258852284166892e-08, + "grad_condition": 7586177.211236173, + "lr": 0.0005626666167821523, + "time_sec": 15.31693696975708 + }, + { + "epoch": 47, + "train_loss": 0.19748862716674806, + "train_acc": 0.93056, + "test_loss": 0.511198134803772, + "test_acc": 0.8512, + "lyapunov": null, + "grad_norm": 0.5066091467854666, + "grad_max_sv": 0.3097307480871677, + "grad_min_sv": 4.0578768167875976e-08, + "grad_condition": 7694719.511876054, + "lr": 0.0005470541566592572, + "time_sec": 15.311876773834229 + }, + { + "epoch": 48, + "train_loss": 0.18840614411354065, + "train_acc": 0.93296, + "test_loss": 0.5223799973011017, + "test_acc": 0.8486, + "lyapunov": null, + "grad_norm": 0.4947799501006328, + "grad_max_sv": 0.32398409508168696, + "grad_min_sv": 3.967475805666254e-08, + "grad_condition": 8181991.0382896485, + "lr": 0.0005313952597646569, + "time_sec": 15.324450016021729 + }, + { + "epoch": 49, + "train_loss": 0.1852111140346527, + "train_acc": 0.93434, + "test_loss": 0.5372783863067627, + "test_acc": 0.8442, + "lyapunov": null, + "grad_norm": 0.49013002688624263, + "grad_max_sv": 0.3128523100167513, + "grad_min_sv": 4.042725132435976e-08, + "grad_condition": 7786375.414612537, + "lr": 0.0005157053795390643, + "time_sec": 15.311121940612793 + }, + { + "epoch": 50, + "train_loss": 0.17850845782279967, + "train_acc": 0.9363, + "test_loss": 0.5162768915176391, + "test_acc": 0.8514, + "lyapunov": null, + "grad_norm": 0.4757476361255021, + "grad_max_sv": 0.3146433509886265, + "grad_min_sv": 3.966314778836022e-08, + "grad_condition": 7931529.673702802, + "lr": 0.0005000000000000002, + "time_sec": 15.3083016872406 + }, + { + "epoch": 51, + "train_loss": 0.17266313230514527, + "train_acc": 0.9392, + "test_loss": 0.5169307453155517, + "test_acc": 0.8514, + "lyapunov": null, + "grad_norm": 0.47267825902613214, + "grad_max_sv": 0.30655047073960306, + "grad_min_sv": 3.728870501262804e-08, + "grad_condition": 8340291.307145154, + "lr": 0.00048429462046093607, + "time_sec": 15.306477308273315 + }, + { + "epoch": 52, + "train_loss": 0.1663313666152954, + "train_acc": 0.94122, + "test_loss": 0.5442662063598633, + "test_acc": 0.8474, + "lyapunov": null, + "grad_norm": 0.46294043228921017, + "grad_max_sv": 0.31195108480751516, + "grad_min_sv": 3.8414651104545784e-08, + "grad_condition": 8124213.069898104, + "lr": 0.0004686047402353435, + "time_sec": 15.31308388710022 + }, + { + "epoch": 53, + "train_loss": 0.16149800906658174, + "train_acc": 0.94246, + "test_loss": 0.580558476114273, + "test_acc": 0.8416, + "lyapunov": null, + "grad_norm": 0.4519494684602909, + "grad_max_sv": 0.2916812110692263, + "grad_min_sv": 3.7287610199499e-08, + "grad_condition": 7889287.089630139, + "lr": 0.000452945843340743, + "time_sec": 15.30961537361145 + }, + { + "epoch": 54, + "train_loss": 0.16166152165412903, + "train_acc": 0.94208, + "test_loss": 0.5555281185150146, + "test_acc": 0.8473, + "lyapunov": null, + "grad_norm": 0.45553329333157905, + "grad_max_sv": 0.2948467206209898, + "grad_min_sv": 3.7315171308449634e-08, + "grad_condition": 7971105.5751351025, + "lr": 0.00043733338321784806, + "time_sec": 15.302156925201416 + }, + { + "epoch": 55, + "train_loss": 0.1565243923521042, + "train_acc": 0.94508, + "test_loss": 0.5074358646392823, + "test_acc": 0.8554, + "lyapunov": null, + "grad_norm": 0.4482394365745094, + "grad_max_sv": 0.2973413269966841, + "grad_min_sv": 3.757956048566768e-08, + "grad_condition": 8002347.089848238, + "lr": 0.0004217827674798847, + "time_sec": 15.313871145248413 + }, + { + "epoch": 56, + "train_loss": 0.14638519546031953, + "train_acc": 0.94786, + "test_loss": 0.4880453747272491, + "test_acc": 0.8653, + "lyapunov": null, + "grad_norm": 0.4314707571224286, + "grad_max_sv": 0.2860257361084223, + "grad_min_sv": 3.907978447514893e-08, + "grad_condition": 7325521.391552436, + "lr": 0.00040630934270713783, + "time_sec": 15.315257549285889 + }, + { + "epoch": 57, + "train_loss": 0.14646475307941437, + "train_acc": 0.94766, + "test_loss": 0.576962650680542, + "test_acc": 0.847, + "lyapunov": null, + "grad_norm": 0.4344661359835185, + "grad_max_sv": 0.27631179951131346, + "grad_min_sv": 3.824539080987677e-08, + "grad_condition": 7229591.786889655, + "lr": 0.000390928379301729, + "time_sec": 15.307274341583252 + }, + { + "epoch": 58, + "train_loss": 0.13712914622783662, + "train_acc": 0.95096, + "test_loss": 0.577113539648056, + "test_acc": 0.8499, + "lyapunov": null, + "grad_norm": 0.42148317642657124, + "grad_max_sv": 0.2975440930575132, + "grad_min_sv": 3.797022123386284e-08, + "grad_condition": 7915512.058803884, + "lr": 0.0003756550564175727, + "time_sec": 15.30914568901062 + }, + { + "epoch": 59, + "train_loss": 0.13448802095890044, + "train_acc": 0.95234, + "test_loss": 0.5032788132190704, + "test_acc": 0.8625, + "lyapunov": null, + "grad_norm": 0.4112977684378401, + "grad_max_sv": 0.2814919870346785, + "grad_min_sv": 3.85102704836271e-08, + "grad_condition": 7377336.951999759, + "lr": 0.00036050444698038553, + "time_sec": 15.317845106124878 + }, + { + "epoch": 60, + "train_loss": 0.13363940123558044, + "train_acc": 0.952, + "test_loss": 0.5432449889659882, + "test_acc": 0.854, + "lyapunov": null, + "grad_norm": 0.4126784436246539, + "grad_max_sv": 0.2804244253784418, + "grad_min_sv": 3.7023297405625045e-08, + "grad_condition": 7621956.91724248, + "lr": 0.00034549150281252655, + "time_sec": 15.322251796722412 + }, + { + "epoch": 61, + "train_loss": 0.12653651702404023, + "train_acc": 0.9556, + "test_loss": 0.49968673663139346, + "test_acc": 0.8678, + "lyapunov": null, + "grad_norm": 0.4007355103640766, + "grad_max_sv": 0.27012523673474786, + "grad_min_sv": 3.795508094484035e-08, + "grad_condition": 7141541.257203001, + "lr": 0.0003306310398773544, + "time_sec": 15.314436435699463 + }, + { + "epoch": 62, + "train_loss": 0.12188665760755539, + "train_acc": 0.9566, + "test_loss": 0.5593991501808167, + "test_acc": 0.8565, + "lyapunov": null, + "grad_norm": 0.3921398359098778, + "grad_max_sv": 0.27338829450309277, + "grad_min_sv": 3.639061785243314e-08, + "grad_condition": 7584044.263979311, + "lr": 0.00031593772365766127, + "time_sec": 15.302758693695068 + }, + { + "epoch": 63, + "train_loss": 0.1223608536529541, + "train_acc": 0.95622, + "test_loss": 0.5149862161636353, + "test_acc": 0.8612, + "lyapunov": null, + "grad_norm": 0.39447951861080405, + "grad_max_sv": 0.2628227811306715, + "grad_min_sv": 3.7084175330548416e-08, + "grad_condition": 7085494.638547185, + "lr": 0.0003014260546826097, + "time_sec": 15.300389051437378 + }, + { + "epoch": 64, + "train_loss": 0.11717436948299408, + "train_acc": 0.95768, + "test_loss": 0.5029231981754303, + "test_acc": 0.8645, + "lyapunov": null, + "grad_norm": 0.3837842917710247, + "grad_max_sv": 0.2503308400511742, + "grad_min_sv": 3.676226967286311e-08, + "grad_condition": 6852674.209660569, + "lr": 0.0002871103542174637, + "time_sec": 15.306849479675293 + }, + { + "epoch": 65, + "train_loss": 0.1104171419763565, + "train_acc": 0.96138, + "test_loss": 0.5105278373241424, + "test_acc": 0.8621, + "lyapunov": null, + "grad_norm": 0.37324824392122696, + "grad_max_sv": 0.24798878654837608, + "grad_min_sv": 3.5933988673519934e-08, + "grad_condition": 6928104.161500673, + "lr": 0.0002730047501302267, + "time_sec": 15.306128978729248 + }, + { + "epoch": 66, + "train_loss": 0.11005497314453125, + "train_acc": 0.9604, + "test_loss": 0.5454881217956543, + "test_acc": 0.8593, + "lyapunov": null, + "grad_norm": 0.3740796827280413, + "grad_max_sv": 0.25094335451722144, + "grad_min_sv": 3.760543059172505e-08, + "grad_condition": 6680130.259128613, + "lr": 0.00025912316294914234, + "time_sec": 15.311371803283691 + }, + { + "epoch": 67, + "train_loss": 0.1054667473077774, + "train_acc": 0.96206, + "test_loss": 0.5242725006103516, + "test_acc": 0.8654, + "lyapunov": null, + "grad_norm": 0.368892738378212, + "grad_max_sv": 0.25266984924674035, + "grad_min_sv": 3.633599621188921e-08, + "grad_condition": 7013352.02049877, + "lr": 0.0002454792921248144, + "time_sec": 15.30515193939209 + }, + { + "epoch": 68, + "train_loss": 0.10004293047904968, + "train_acc": 0.96412, + "test_loss": 0.5743433611869811, + "test_acc": 0.8538, + "lyapunov": null, + "grad_norm": 0.3572601369548122, + "grad_max_sv": 0.24928448162972927, + "grad_min_sv": 3.5534662101710524e-08, + "grad_condition": 7054160.907809177, + "lr": 0.00023208660251050164, + "time_sec": 15.31411099433899 + }, + { + "epoch": 69, + "train_loss": 0.09898206293821335, + "train_acc": 0.96434, + "test_loss": 0.5453432657718659, + "test_acc": 0.8647, + "lyapunov": null, + "grad_norm": 0.3575462219401736, + "grad_max_sv": 0.22338325902819633, + "grad_min_sv": 3.5619033011968784e-08, + "grad_condition": 6388845.433191194, + "lr": 0.00021895831107393473, + "time_sec": 15.320244789123535 + }, + { + "epoch": 70, + "train_loss": 0.09576731202960015, + "train_acc": 0.96662, + "test_loss": 0.5289871492862701, + "test_acc": 0.8673, + "lyapunov": null, + "grad_norm": 0.3475548635629844, + "grad_max_sv": 0.22887863107025624, + "grad_min_sv": 3.558577605922153e-08, + "grad_condition": 6520932.801253774, + "lr": 0.00020610737385376356, + "time_sec": 15.312981367111206 + }, + { + "epoch": 71, + "train_loss": 0.09435438349246979, + "train_acc": 0.96552, + "test_loss": 0.5673801244735718, + "test_acc": 0.8597, + "lyapunov": null, + "grad_norm": 0.35002047617094667, + "grad_max_sv": 0.24012817665934563, + "grad_min_sv": 3.424292120968175e-08, + "grad_condition": 7037803.21914607, + "lr": 0.00019354647317351177, + "time_sec": 15.323097705841064 + }, + { + "epoch": 72, + "train_loss": 0.0899286351108551, + "train_acc": 0.96766, + "test_loss": 0.5408580667495727, + "test_acc": 0.8662, + "lyapunov": null, + "grad_norm": 0.34100528699001653, + "grad_max_sv": 0.22443376183509828, + "grad_min_sv": 3.460758826179244e-08, + "grad_condition": 6548190.204110672, + "lr": 0.0001812880051256552, + "time_sec": 15.303936243057251 + }, + { + "epoch": 73, + "train_loss": 0.08644640971183777, + "train_acc": 0.9696, + "test_loss": 0.5231532414436341, + "test_acc": 0.8687, + "lyapunov": null, + "grad_norm": 0.3297853844853395, + "grad_max_sv": 0.23831307105720043, + "grad_min_sv": 3.648763895469642e-08, + "grad_condition": 6564265.399345921, + "lr": 0.00016934406733817422, + "time_sec": 15.323826313018799 + }, + { + "epoch": 74, + "train_loss": 0.08675267961740493, + "train_acc": 0.96966, + "test_loss": 0.531370454120636, + "test_acc": 0.8724, + "lyapunov": null, + "grad_norm": 0.33474921077291964, + "grad_max_sv": 0.23228033129125833, + "grad_min_sv": 3.54595965035287e-08, + "grad_condition": 6646670.669053013, + "lr": 0.0001577264470356557, + "time_sec": 15.305448532104492 + }, + { + "epoch": 75, + "train_loss": 0.08520255417346954, + "train_acc": 0.96946, + "test_loss": 0.5489996848106384, + "test_acc": 0.8629, + "lyapunov": null, + "grad_norm": 0.333062577424503, + "grad_max_sv": 0.23861498832702638, + "grad_min_sv": 3.416034828340742e-08, + "grad_condition": 7057996.098654354, + "lr": 0.00014644660940672634, + "time_sec": 15.307157516479492 + }, + { + "epoch": 76, + "train_loss": 0.08347911696434021, + "train_acc": 0.97006, + "test_loss": 0.5250146618843079, + "test_acc": 0.8686, + "lyapunov": null, + "grad_norm": 0.3315871550000043, + "grad_max_sv": 0.23978985324501992, + "grad_min_sv": 3.5313697566152766e-08, + "grad_condition": 6836692.7541990755, + "lr": 0.0001355156862892944, + "time_sec": 15.2927827835083 + }, + { + "epoch": 77, + "train_loss": 0.08182602140903474, + "train_acc": 0.97104, + "test_loss": 0.5350998015880585, + "test_acc": 0.8704, + "lyapunov": null, + "grad_norm": 0.3273538350101595, + "grad_max_sv": 0.23843283373862506, + "grad_min_sv": 3.504422023681286e-08, + "grad_condition": 6836027.998268524, + "lr": 0.00012494446518477025, + "time_sec": 15.317047834396362 + }, + { + "epoch": 78, + "train_loss": 0.07884973392605782, + "train_acc": 0.9722, + "test_loss": 0.543610359621048, + "test_acc": 0.869, + "lyapunov": null, + "grad_norm": 0.318085721614815, + "grad_max_sv": 0.2306290850043297, + "grad_min_sv": 3.51138401910589e-08, + "grad_condition": 6598865.01839647, + "lr": 0.00011474337861210548, + "time_sec": 15.346408605575562 + }, + { + "epoch": 79, + "train_loss": 0.07515444636344909, + "train_acc": 0.97302, + "test_loss": 0.5453424057006836, + "test_acc": 0.8685, + "lyapunov": null, + "grad_norm": 0.30764732453726595, + "grad_max_sv": 0.23328058049082756, + "grad_min_sv": 3.4018917194345025e-08, + "grad_condition": 6898312.859708968, + "lr": 0.00010492249381215483, + "time_sec": 15.312849998474121 + }, + { + "epoch": 80, + "train_loss": 0.07553981874942779, + "train_acc": 0.97342, + "test_loss": 0.5447598055839539, + "test_acc": 0.8687, + "lyapunov": null, + "grad_norm": 0.3126827627293077, + "grad_max_sv": 0.22440926413983106, + "grad_min_sv": 3.5051727831358904e-08, + "grad_condition": 6508990.801328001, + "lr": 9.549150281252637e-05, + "time_sec": 15.31579327583313 + }, + { + "epoch": 81, + "train_loss": 0.0691981615459919, + "train_acc": 0.9767, + "test_loss": 0.6010801038742065, + "test_acc": 0.8592, + "lyapunov": null, + "grad_norm": 0.2964655372784287, + "grad_max_sv": 0.20926067158579825, + "grad_min_sv": 3.334633209561844e-08, + "grad_condition": 6336645.734981732, + "lr": 8.645971286271918e-05, + "time_sec": 15.311565399169922 + }, + { + "epoch": 82, + "train_loss": 0.07134237255096436, + "train_acc": 0.97564, + "test_loss": 0.5511228674888611, + "test_acc": 0.8685, + "lyapunov": null, + "grad_norm": 0.3035210287863858, + "grad_max_sv": 0.2166539143770933, + "grad_min_sv": 3.444789098416834e-08, + "grad_condition": 6316501.5285459785, + "lr": 7.78360372489926e-05, + "time_sec": 15.321164846420288 + }, + { + "epoch": 83, + "train_loss": 0.06894262619018554, + "train_acc": 0.97574, + "test_loss": 0.5341768414020538, + "test_acc": 0.8666, + "lyapunov": null, + "grad_norm": 0.3006016750160245, + "grad_max_sv": 0.214569428935647, + "grad_min_sv": 3.390297984573465e-08, + "grad_condition": 6347736.579489769, + "lr": 6.962898649802815e-05, + "time_sec": 15.31421685218811 + }, + { + "epoch": 84, + "train_loss": 0.06843596329629421, + "train_acc": 0.97558, + "test_loss": 0.5208944204807282, + "test_acc": 0.8703, + "lyapunov": null, + "grad_norm": 0.2931609715468412, + "grad_max_sv": 0.2041362512856722, + "grad_min_sv": 3.608063616766799e-08, + "grad_condition": 5852493.960090882, + "lr": 6.184665997806824e-05, + "time_sec": 15.313952445983887 + }, + { + "epoch": 85, + "train_loss": 0.06798111920118331, + "train_acc": 0.97708, + "test_loss": 0.5408778586387635, + "test_acc": 0.869, + "lyapunov": null, + "grad_norm": 0.2949462881166867, + "grad_max_sv": 0.2191694311797619, + "grad_min_sv": 3.3161099466383345e-08, + "grad_condition": 6683084.915046187, + "lr": 5.449673790581613e-05, + "time_sec": 15.323522567749023 + }, + { + "epoch": 86, + "train_loss": 0.06374187029123306, + "train_acc": 0.97854, + "test_loss": 0.534241654920578, + "test_acc": 0.8701, + "lyapunov": null, + "grad_norm": 0.28381214745100436, + "grad_max_sv": 0.21770549267530442, + "grad_min_sv": 3.4639007706616096e-08, + "grad_condition": 6392279.068014438, + "lr": 4.758647376699034e-05, + "time_sec": 15.312573432922363 + }, + { + "epoch": 87, + "train_loss": 0.06471459998726845, + "train_acc": 0.97748, + "test_loss": 0.5297845101356506, + "test_acc": 0.8726, + "lyapunov": null, + "grad_norm": 0.28897487313019665, + "grad_max_sv": 0.19332378804683686, + "grad_min_sv": 3.343392815935431e-08, + "grad_condition": 5824270.640002059, + "lr": 4.112268715800956e-05, + "time_sec": 15.310936450958252 + }, + { + "epoch": 88, + "train_loss": 0.06347171569228173, + "train_acc": 0.97814, + "test_loss": 0.5321846860408783, + "test_acc": 0.8722, + "lyapunov": null, + "grad_norm": 0.2861217885894181, + "grad_max_sv": 0.18890463691204787, + "grad_min_sv": 3.443075908826643e-08, + "grad_condition": 5578610.167209303, + "lr": 3.511175705587434e-05, + "time_sec": 15.30883502960205 + }, + { + "epoch": 89, + "train_loss": 0.06456126765966415, + "train_acc": 0.97732, + "test_loss": 0.5306058297157288, + "test_acc": 0.8724, + "lyapunov": null, + "grad_norm": 0.2911671580013793, + "grad_max_sv": 0.20169610902667046, + "grad_min_sv": 3.3340199756537456e-08, + "grad_condition": 6113921.310843622, + "lr": 2.9559615522887284e-05, + "time_sec": 15.325217247009277 + }, + { + "epoch": 90, + "train_loss": 0.05981739419221878, + "train_acc": 0.97936, + "test_loss": 0.5510406871795654, + "test_acc": 0.8698, + "lyapunov": null, + "grad_norm": 0.27406962038993515, + "grad_max_sv": 0.20393476765602828, + "grad_min_sv": 3.436182409721766e-08, + "grad_condition": 6006804.61096659, + "lr": 2.447174185242324e-05, + "time_sec": 15.308394432067871 + }, + { + "epoch": 91, + "train_loss": 0.05843851445674896, + "train_acc": 0.97988, + "test_loss": 0.5369569517612457, + "test_acc": 0.8726, + "lyapunov": null, + "grad_norm": 0.270215680703968, + "grad_max_sv": 0.19462423361837863, + "grad_min_sv": 3.2800926286213895e-08, + "grad_condition": 5976870.852957519, + "lr": 1.9853157161528526e-05, + "time_sec": 15.312544584274292 + }, + { + "epoch": 92, + "train_loss": 0.06141342503786087, + "train_acc": 0.9789, + "test_loss": 0.5492124430656433, + "test_acc": 0.8715, + "lyapunov": null, + "grad_norm": 0.28355491226552393, + "grad_max_sv": 0.20141606461256742, + "grad_min_sv": 3.389024190170176e-08, + "grad_condition": 6025484.075561702, + "lr": 1.570841943568452e-05, + "time_sec": 15.318751096725464 + }, + { + "epoch": 93, + "train_loss": 0.06185958398580551, + "train_acc": 0.9791, + "test_loss": 0.5353557282447815, + "test_acc": 0.8734, + "lyapunov": null, + "grad_norm": 0.28019086696986784, + "grad_max_sv": 0.20358563121408224, + "grad_min_sv": 3.4872499954374805e-08, + "grad_condition": 5972181.870711091, + "lr": 1.204161903062634e-05, + "time_sec": 15.310726404190063 + }, + { + "epoch": 94, + "train_loss": 0.061077375268936154, + "train_acc": 0.97862, + "test_loss": 0.5403136486530304, + "test_acc": 0.8726, + "lyapunov": null, + "grad_norm": 0.27793458972654056, + "grad_max_sv": 0.21468139700591565, + "grad_min_sv": 3.314470546911252e-08, + "grad_condition": 6531953.716980138, + "lr": 8.85637463565564e-06, + "time_sec": 15.322482585906982 + }, + { + "epoch": 95, + "train_loss": 0.059067166829109195, + "train_acc": 0.9801, + "test_loss": 0.5499792334079743, + "test_acc": 0.8706, + "lyapunov": null, + "grad_norm": 0.2726950869177449, + "grad_max_sv": 0.1847312103956938, + "grad_min_sv": 3.442832863242984e-08, + "grad_condition": 5484378.490748374, + "lr": 6.155829702431171e-06, + "time_sec": 15.331462860107422 + }, + { + "epoch": 96, + "train_loss": 0.058869197854995725, + "train_acc": 0.97992, + "test_loss": 0.5609679688453675, + "test_acc": 0.8699, + "lyapunov": null, + "grad_norm": 0.2733600212103379, + "grad_max_sv": 0.203422649204731, + "grad_min_sv": 3.4962690476092464e-08, + "grad_condition": 5877045.15462194, + "lr": 3.942649342761118e-06, + "time_sec": 15.318592071533203 + }, + { + "epoch": 97, + "train_loss": 0.05934914319038391, + "train_acc": 0.97972, + "test_loss": 0.5556031215667725, + "test_acc": 0.8687, + "lyapunov": null, + "grad_norm": 0.2765716324142509, + "grad_max_sv": 0.1996933190152049, + "grad_min_sv": 3.3284164402402895e-08, + "grad_condition": 6129925.740326188, + "lr": 2.2190176984600023e-06, + "time_sec": 15.329679727554321 + }, + { + "epoch": 98, + "train_loss": 0.05874215810537338, + "train_acc": 0.97992, + "test_loss": 0.5451333051681518, + "test_acc": 0.8712, + "lyapunov": null, + "grad_norm": 0.2696205462857481, + "grad_max_sv": 0.19026922769844531, + "grad_min_sv": 3.324827377859663e-08, + "grad_condition": 5756655.141047328, + "lr": 9.866357858642206e-07, + "time_sec": 15.31182599067688 + }, + { + "epoch": 99, + "train_loss": 0.059339061715602874, + "train_acc": 0.98046, + "test_loss": 0.5511723966598511, + "test_acc": 0.8694, + "lyapunov": null, + "grad_norm": 0.2722387278016211, + "grad_max_sv": 0.17949199080467224, + "grad_min_sv": 3.178271090753526e-08, + "grad_condition": 5671386.367227938, + "lr": 2.467198171342e-07, + "time_sec": 15.313301801681519 + }, + { + "epoch": 100, + "train_loss": 0.05937783687353134, + "train_acc": 0.97908, + "test_loss": 0.5341217585086823, + "test_acc": 0.8723, + "lyapunov": null, + "grad_norm": 0.275408042809645, + "grad_max_sv": 0.19940215721726418, + "grad_min_sv": 3.299201711826072e-08, + "grad_condition": 6121670.713258359, + "lr": 0.0, + "time_sec": 15.337401151657104 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 2.1551968896484377, + "train_acc": 0.2953, + "test_loss": 1.8477057243347168, + "test_acc": 0.3437, + "lyapunov": null, + "grad_norm": 8.144943624656428, + "grad_max_sv": 7.675079941749573, + "grad_min_sv": 2.827612160416493e-07, + "grad_condition": 28317355.270070046, + "lr": 0.0009997532801828658, + "time_sec": 32.46485447883606 + }, + { + "epoch": 2, + "train_loss": 1.6082625040054321, + "train_acc": 0.42284, + "test_loss": 1.6673745800018311, + "test_acc": 0.406, + "lyapunov": null, + "grad_norm": 6.065037474589551, + "grad_max_sv": 5.5711340546607975, + "grad_min_sv": 2.234880795981553e-07, + "grad_condition": 25327173.99046154, + "lr": 0.0009990133642141358, + "time_sec": 32.39758110046387 + }, + { + "epoch": 3, + "train_loss": 1.4377277154159547, + "train_acc": 0.48488, + "test_loss": 1.5402760635375976, + "test_acc": 0.4555, + "lyapunov": null, + "grad_norm": 5.494687491087257, + "grad_max_sv": 4.691517299413681, + "grad_min_sv": 1.9618108950680835e-07, + "grad_condition": 24150344.903272796, + "lr": 0.00099778098230154, + "time_sec": 32.400826930999756 + }, + { + "epoch": 4, + "train_loss": 1.2879639573669435, + "train_acc": 0.53716, + "test_loss": 1.8371749683380127, + "test_acc": 0.4098, + "lyapunov": null, + "grad_norm": 4.741620609793776, + "grad_max_sv": 4.525534170866012, + "grad_min_sv": 1.8297150106150184e-07, + "grad_condition": 24870782.059164062, + "lr": 0.000996057350657239, + "time_sec": 32.39713406562805 + }, + { + "epoch": 5, + "train_loss": 1.196011114768982, + "train_acc": 0.5717, + "test_loss": 1.1917746976852417, + "test_acc": 0.5662, + "lyapunov": null, + "grad_norm": 4.225084445671327, + "grad_max_sv": 3.8811924695968627, + "grad_min_sv": 1.7304786759098079e-07, + "grad_condition": 22788363.03168846, + "lr": 0.0009938441702975688, + "time_sec": 32.39927625656128 + }, + { + "epoch": 6, + "train_loss": 1.1017011584854126, + "train_acc": 0.60624, + "test_loss": 1.2156044723510742, + "test_acc": 0.5524, + "lyapunov": null, + "grad_norm": 3.8500733224578765, + "grad_max_sv": 3.3867243230342865, + "grad_min_sv": 1.5910630946081028e-07, + "grad_condition": 21517993.207089722, + "lr": 0.0009911436253643444, + "time_sec": 32.41104435920715 + }, + { + "epoch": 7, + "train_loss": 1.019956372566223, + "train_acc": 0.63884, + "test_loss": 1.0341911317825316, + "test_acc": 0.6312, + "lyapunov": null, + "grad_norm": 3.4050623209558424, + "grad_max_sv": 2.8642074435949327, + "grad_min_sv": 1.3970929391149411e-07, + "grad_condition": 20503012.26948414, + "lr": 0.0009879583809693736, + "time_sec": 32.39900183677673 + }, + { + "epoch": 8, + "train_loss": 0.952932172832489, + "train_acc": 0.66154, + "test_loss": 0.9561027820587158, + "test_acc": 0.6654, + "lyapunov": null, + "grad_norm": 3.069081296040065, + "grad_max_sv": 2.5316490083932877, + "grad_min_sv": 1.2806189264580325e-07, + "grad_condition": 19934874.23822563, + "lr": 0.0009842915805643154, + "time_sec": 32.39242911338806 + }, + { + "epoch": 9, + "train_loss": 0.8849921081352234, + "train_acc": 0.68628, + "test_loss": 1.0301121936798097, + "test_acc": 0.6342, + "lyapunov": null, + "grad_norm": 2.63645918277651, + "grad_max_sv": 2.232751601934433, + "grad_min_sv": 1.2227004724252312e-07, + "grad_condition": 18401740.489395566, + "lr": 0.0009801468428384714, + "time_sec": 32.409496545791626 + }, + { + "epoch": 10, + "train_loss": 0.8236279186630249, + "train_acc": 0.70854, + "test_loss": 0.8807288621902466, + "test_acc": 0.682, + "lyapunov": null, + "grad_norm": 2.300239690915013, + "grad_max_sv": 1.9658639460802079, + "grad_min_sv": 1.1437598530505966e-07, + "grad_condition": 17605252.06510754, + "lr": 0.0009755282581475767, + "time_sec": 32.40023136138916 + }, + { + "epoch": 11, + "train_loss": 0.788265288658142, + "train_acc": 0.72186, + "test_loss": 0.8550062474250794, + "test_acc": 0.6904, + "lyapunov": null, + "grad_norm": 2.12020034951075, + "grad_max_sv": 1.6186737358570098, + "grad_min_sv": 1.0332133957291489e-07, + "grad_condition": 15780748.729030486, + "lr": 0.0009704403844771127, + "time_sec": 32.40667533874512 + }, + { + "epoch": 12, + "train_loss": 0.7433690148735046, + "train_acc": 0.73772, + "test_loss": 0.8008458862304687, + "test_acc": 0.7171, + "lyapunov": null, + "grad_norm": 1.8897751819834427, + "grad_max_sv": 1.448184822499752, + "grad_min_sv": 9.324852872083511e-08, + "grad_condition": 15545592.26156075, + "lr": 0.0009648882429441257, + "time_sec": 32.4004065990448 + }, + { + "epoch": 13, + "train_loss": 0.7159804575920105, + "train_acc": 0.74844, + "test_loss": 0.8449424732208252, + "test_acc": 0.7107, + "lyapunov": null, + "grad_norm": 1.7162684736286458, + "grad_max_sv": 1.387939277291298, + "grad_min_sv": 9.02613965791943e-08, + "grad_condition": 15516859.545498159, + "lr": 0.0009588773128419905, + "time_sec": 32.39161419868469 + }, + { + "epoch": 14, + "train_loss": 0.6710689739608765, + "train_acc": 0.7652, + "test_loss": 0.8030969514846802, + "test_acc": 0.7199, + "lyapunov": null, + "grad_norm": 1.5415310022642745, + "grad_max_sv": 1.124143162369728, + "grad_min_sv": 7.788519358342683e-08, + "grad_condition": 14586378.513744438, + "lr": 0.0009524135262330098, + "time_sec": 32.40552067756653 + }, + { + "epoch": 15, + "train_loss": 0.6438176040267944, + "train_acc": 0.77396, + "test_loss": 0.7497868657112121, + "test_acc": 0.7401, + "lyapunov": null, + "grad_norm": 1.4186644873786285, + "grad_max_sv": 1.0314671725034714, + "grad_min_sv": 7.5272734179066e-08, + "grad_condition": 13653093.352212925, + "lr": 0.0009455032620941839, + "time_sec": 32.40474534034729 + }, + { + "epoch": 16, + "train_loss": 0.615869576702118, + "train_acc": 0.7829, + "test_loss": 0.7672984195709228, + "test_acc": 0.7337, + "lyapunov": null, + "grad_norm": 1.2847059491767132, + "grad_max_sv": 0.8981582961976529, + "grad_min_sv": 7.069710665774664e-08, + "grad_condition": 12774971.99569363, + "lr": 0.0009381533400219318, + "time_sec": 32.411378145217896 + }, + { + "epoch": 17, + "train_loss": 0.5916317593765259, + "train_acc": 0.79332, + "test_loss": 0.6773865149497986, + "test_acc": 0.7673, + "lyapunov": null, + "grad_norm": 1.1905850089737686, + "grad_max_sv": 0.8305475980043411, + "grad_min_sv": 6.581527465243652e-08, + "grad_condition": 12649477.259974267, + "lr": 0.0009303710135019719, + "time_sec": 32.40375375747681 + }, + { + "epoch": 18, + "train_loss": 0.5710988390541076, + "train_acc": 0.80148, + "test_loss": 0.6730817820549011, + "test_acc": 0.7658, + "lyapunov": null, + "grad_norm": 1.1184745092261044, + "grad_max_sv": 0.8092691361904144, + "grad_min_sv": 6.20087442726458e-08, + "grad_condition": 13237272.581055809, + "lr": 0.0009221639627510076, + "time_sec": 32.403624534606934 + }, + { + "epoch": 19, + "train_loss": 0.5524461611747742, + "train_acc": 0.80704, + "test_loss": 0.7162760413169861, + "test_acc": 0.7602, + "lyapunov": null, + "grad_norm": 1.023562615452227, + "grad_max_sv": 0.6794823326170445, + "grad_min_sv": 5.88299432280337e-08, + "grad_condition": 11704217.317878243, + "lr": 0.000913540287137281, + "time_sec": 32.39382600784302 + }, + { + "epoch": 20, + "train_loss": 0.5298428584098815, + "train_acc": 0.81452, + "test_loss": 0.7450216589927673, + "test_acc": 0.752, + "lyapunov": null, + "grad_norm": 0.9359144343942514, + "grad_max_sv": 0.5905756287276744, + "grad_min_sv": 5.571528873815623e-08, + "grad_condition": 10693233.182217773, + "lr": 0.0009045084971874739, + "time_sec": 32.40094780921936 + }, + { + "epoch": 21, + "train_loss": 0.5077325123977661, + "train_acc": 0.82174, + "test_loss": 0.63943037815094, + "test_acc": 0.7812, + "lyapunov": null, + "grad_norm": 0.8805285251076611, + "grad_max_sv": 0.615053903311491, + "grad_min_sv": 5.4429192175575734e-08, + "grad_condition": 11327012.575821584, + "lr": 0.0008950775061878452, + "time_sec": 32.38740086555481 + }, + { + "epoch": 22, + "train_loss": 0.4933246819114685, + "train_acc": 0.8259, + "test_loss": 0.718407027053833, + "test_acc": 0.7614, + "lyapunov": null, + "grad_norm": 0.8303617086611039, + "grad_max_sv": 0.5229416653513909, + "grad_min_sv": 5.0371477122723717e-08, + "grad_condition": 10417728.60900723, + "lr": 0.0008852566213878947, + "time_sec": 32.404406785964966 + }, + { + "epoch": 23, + "train_loss": 0.47660592782020567, + "train_acc": 0.83498, + "test_loss": 0.6119730060577393, + "test_acc": 0.7951, + "lyapunov": null, + "grad_norm": 0.7772569962051041, + "grad_max_sv": 0.5228113703429699, + "grad_min_sv": 4.883190189985953e-08, + "grad_condition": 10840281.592058718, + "lr": 0.0008750555348152298, + "time_sec": 32.41756844520569 + }, + { + "epoch": 24, + "train_loss": 0.4621484722900391, + "train_acc": 0.8354, + "test_loss": 0.6255874982833862, + "test_acc": 0.7921, + "lyapunov": null, + "grad_norm": 0.7435129116165293, + "grad_max_sv": 0.5028938911855221, + "grad_min_sv": 4.940657198915232e-08, + "grad_condition": 10262672.7433966, + "lr": 0.0008644843137107057, + "time_sec": 32.40160775184631 + }, + { + "epoch": 25, + "train_loss": 0.44543547362804414, + "train_acc": 0.84322, + "test_loss": 0.6244046552658081, + "test_acc": 0.8003, + "lyapunov": null, + "grad_norm": 0.7057766135770664, + "grad_max_sv": 0.45453565418720243, + "grad_min_sv": 4.47153126970079e-08, + "grad_condition": 10235918.99223967, + "lr": 0.0008535533905932737, + "time_sec": 32.397634983062744 + }, + { + "epoch": 26, + "train_loss": 0.4291659313964844, + "train_acc": 0.85028, + "test_loss": 0.586253802204132, + "test_acc": 0.8053, + "lyapunov": null, + "grad_norm": 0.6653011352683553, + "grad_max_sv": 0.40432176999747754, + "grad_min_sv": 4.4079006933372964e-08, + "grad_condition": 9263382.4971398, + "lr": 0.0008422735529643444, + "time_sec": 32.408364057540894 + }, + { + "epoch": 27, + "train_loss": 0.41755434021949767, + "train_acc": 0.8537, + "test_loss": 0.6190900807380676, + "test_acc": 0.8031, + "lyapunov": null, + "grad_norm": 0.634844213604884, + "grad_max_sv": 0.38489293307065964, + "grad_min_sv": 4.278397165435877e-08, + "grad_condition": 9083713.307072137, + "lr": 0.0008306559326618259, + "time_sec": 32.3781955242157 + }, + { + "epoch": 28, + "train_loss": 0.409987173576355, + "train_acc": 0.85588, + "test_loss": 0.6381987627029418, + "test_acc": 0.7967, + "lyapunov": null, + "grad_norm": 0.6208575070285024, + "grad_max_sv": 0.3849256232380867, + "grad_min_sv": 4.156698754087529e-08, + "grad_condition": 9343591.955088045, + "lr": 0.0008187119948743449, + "time_sec": 32.424397468566895 + }, + { + "epoch": 29, + "train_loss": 0.39254301443099976, + "train_acc": 0.86148, + "test_loss": 0.6114391220092773, + "test_acc": 0.8072, + "lyapunov": null, + "grad_norm": 0.5930731028782803, + "grad_max_sv": 0.35281661339104176, + "grad_min_sv": 3.97135552887562e-08, + "grad_condition": 8878121.049382607, + "lr": 0.0008064535268264883, + "time_sec": 32.40766763687134 + }, + { + "epoch": 30, + "train_loss": 0.3785347310256958, + "train_acc": 0.86726, + "test_loss": 0.6049399808883666, + "test_acc": 0.811, + "lyapunov": null, + "grad_norm": 0.5794796026042499, + "grad_max_sv": 0.36831745132803917, + "grad_min_sv": 4.032110121343635e-08, + "grad_condition": 9212028.38827365, + "lr": 0.0007938926261462367, + "time_sec": 32.40119290351868 + }, + { + "epoch": 31, + "train_loss": 0.3689020803642273, + "train_acc": 0.87034, + "test_loss": 0.6224831011772156, + "test_acc": 0.8103, + "lyapunov": null, + "grad_norm": 0.5518777770693967, + "grad_max_sv": 0.34497435614466665, + "grad_min_sv": 3.993250263789605e-08, + "grad_condition": 8691890.072923485, + "lr": 0.0007810416889260654, + "time_sec": 32.42319178581238 + }, + { + "epoch": 32, + "train_loss": 0.3600490350532532, + "train_acc": 0.87378, + "test_loss": 0.6563146770000458, + "test_acc": 0.7989, + "lyapunov": null, + "grad_norm": 0.5344416918727563, + "grad_max_sv": 0.3161147892475128, + "grad_min_sv": 3.79914633530376e-08, + "grad_condition": 8391808.948301231, + "lr": 0.0007679133974894983, + "time_sec": 32.40037226676941 + }, + { + "epoch": 33, + "train_loss": 0.3552369830417633, + "train_acc": 0.876, + "test_loss": 0.5918597935676575, + "test_acc": 0.8191, + "lyapunov": null, + "grad_norm": 0.5223477954823382, + "grad_max_sv": 0.32091905549168587, + "grad_min_sv": 3.692389771714488e-08, + "grad_condition": 8735655.499988783, + "lr": 0.0007545207078751857, + "time_sec": 32.39385366439819 + }, + { + "epoch": 34, + "train_loss": 0.3357627202987671, + "train_acc": 0.88192, + "test_loss": 0.6601162696361542, + "test_acc": 0.8074, + "lyapunov": null, + "grad_norm": 0.5010170887656177, + "grad_max_sv": 0.3139246258884668, + "grad_min_sv": 3.658822085306213e-08, + "grad_condition": 8606732.681616401, + "lr": 0.0007408768370508577, + "time_sec": 32.40888476371765 + }, + { + "epoch": 35, + "train_loss": 0.32540871870040894, + "train_acc": 0.88428, + "test_loss": 0.6114396753549576, + "test_acc": 0.8112, + "lyapunov": null, + "grad_norm": 0.4852002465463357, + "grad_max_sv": 0.3033136323094368, + "grad_min_sv": 3.599271058973841e-08, + "grad_condition": 8499862.031601336, + "lr": 0.0007269952498697734, + "time_sec": 32.40857720375061 + }, + { + "epoch": 36, + "train_loss": 0.32421252524375915, + "train_acc": 0.8847, + "test_loss": 0.6881836595535278, + "test_acc": 0.8116, + "lyapunov": null, + "grad_norm": 0.47585625371919826, + "grad_max_sv": 0.28932417593896387, + "grad_min_sv": 3.663087517757902e-08, + "grad_condition": 7933220.2527872, + "lr": 0.0007128896457825364, + "time_sec": 32.39529776573181 + }, + { + "epoch": 37, + "train_loss": 0.3108924944496155, + "train_acc": 0.88942, + "test_loss": 0.7008573976516723, + "test_acc": 0.8098, + "lyapunov": null, + "grad_norm": 0.46276747011208014, + "grad_max_sv": 0.2795715734362602, + "grad_min_sv": 3.448033547570617e-08, + "grad_condition": 8262563.079640454, + "lr": 0.0006985739453173903, + "time_sec": 32.38434648513794 + }, + { + "epoch": 38, + "train_loss": 0.31133034090042117, + "train_acc": 0.88992, + "test_loss": 0.6698009629249573, + "test_acc": 0.81, + "lyapunov": null, + "grad_norm": 0.4586602799362298, + "grad_max_sv": 0.2844005227088928, + "grad_min_sv": 3.324500559287458e-08, + "grad_condition": 8714467.747357922, + "lr": 0.0006840622763423391, + "time_sec": 32.396021366119385 + }, + { + "epoch": 39, + "train_loss": 0.29518098635673523, + "train_acc": 0.89552, + "test_loss": 0.7677701180458069, + "test_acc": 0.7991, + "lyapunov": null, + "grad_norm": 0.43830085967668675, + "grad_max_sv": 0.2725641973316669, + "grad_min_sv": 3.3406064270380397e-08, + "grad_condition": 8255466.038533419, + "lr": 0.0006693689601226458, + "time_sec": 32.40195083618164 + }, + { + "epoch": 40, + "train_loss": 0.2831247230243683, + "train_acc": 0.89996, + "test_loss": 0.6842746494293213, + "test_acc": 0.8148, + "lyapunov": null, + "grad_norm": 0.4331819538283316, + "grad_max_sv": 0.26449211575090886, + "grad_min_sv": 3.399684476157461e-08, + "grad_condition": 7879060.46068686, + "lr": 0.0006545084971874737, + "time_sec": 32.418256521224976 + }, + { + "epoch": 41, + "train_loss": 0.27670828733444214, + "train_acc": 0.90256, + "test_loss": 0.701638517665863, + "test_acc": 0.8105, + "lyapunov": null, + "grad_norm": 0.42402034759846713, + "grad_max_sv": 0.26597036607563496, + "grad_min_sv": 3.2260157212249396e-08, + "grad_condition": 8290157.649110466, + "lr": 0.0006394955530196147, + "time_sec": 32.40391206741333 + }, + { + "epoch": 42, + "train_loss": 0.26722780378341676, + "train_acc": 0.90478, + "test_loss": 0.676421770954132, + "test_acc": 0.8152, + "lyapunov": null, + "grad_norm": 0.41593559749987674, + "grad_max_sv": 0.26356035731732846, + "grad_min_sv": 3.2800773563934625e-08, + "grad_condition": 8080555.103613043, + "lr": 0.0006243449435824273, + "time_sec": 32.413851737976074 + }, + { + "epoch": 43, + "train_loss": 0.2611290577888489, + "train_acc": 0.9069, + "test_loss": 0.7091101724147797, + "test_acc": 0.8165, + "lyapunov": null, + "grad_norm": 0.40890139043798995, + "grad_max_sv": 0.2530216708779335, + "grad_min_sv": 3.0997858102566053e-08, + "grad_condition": 8224218.543131987, + "lr": 0.0006090716206982714, + "time_sec": 32.60969662666321 + }, + { + "epoch": 44, + "train_loss": 0.2530948238658905, + "train_acc": 0.90982, + "test_loss": 0.6961516171455383, + "test_acc": 0.8214, + "lyapunov": null, + "grad_norm": 0.39919304872434885, + "grad_max_sv": 0.24201009832322598, + "grad_min_sv": 3.264100985056473e-08, + "grad_condition": 7496864.741894746, + "lr": 0.0005936906572928625, + "time_sec": 32.40188717842102 + }, + { + "epoch": 45, + "train_loss": 0.23889887328147888, + "train_acc": 0.91386, + "test_loss": 0.7265622617721558, + "test_acc": 0.8196, + "lyapunov": null, + "grad_norm": 0.39216552760863915, + "grad_max_sv": 0.25172842368483545, + "grad_min_sv": 3.196390450099784e-08, + "grad_condition": 7939664.340514863, + "lr": 0.0005782172325201156, + "time_sec": 32.40084266662598 + }, + { + "epoch": 46, + "train_loss": 0.23805784145355224, + "train_acc": 0.91674, + "test_loss": 0.6975640031337738, + "test_acc": 0.8226, + "lyapunov": null, + "grad_norm": 0.3825430754006707, + "grad_max_sv": 0.23831223957240583, + "grad_min_sv": 2.971923072081495e-08, + "grad_condition": 8085204.090791678, + "lr": 0.0005626666167821523, + "time_sec": 32.42257380485535 + }, + { + "epoch": 47, + "train_loss": 0.23282361968994142, + "train_acc": 0.91824, + "test_loss": 0.6992193672657013, + "test_acc": 0.8311, + "lyapunov": null, + "grad_norm": 0.3814486121413188, + "grad_max_sv": 0.23424655832350255, + "grad_min_sv": 3.104032040290861e-08, + "grad_condition": 7643726.892298067, + "lr": 0.0005470541566592572, + "time_sec": 32.40861511230469 + }, + { + "epoch": 48, + "train_loss": 0.22799833922863005, + "train_acc": 0.91886, + "test_loss": 0.6951349193096161, + "test_acc": 0.8282, + "lyapunov": null, + "grad_norm": 0.38166215011498245, + "grad_max_sv": 0.24571430422365664, + "grad_min_sv": 3.0606541878697156e-08, + "grad_condition": 8099711.568480073, + "lr": 0.0005313952597646569, + "time_sec": 32.382601499557495 + }, + { + "epoch": 49, + "train_loss": 0.21888560410499572, + "train_acc": 0.92208, + "test_loss": 0.6775056694984436, + "test_acc": 0.8377, + "lyapunov": null, + "grad_norm": 0.3681781600012364, + "grad_max_sv": 0.22858488224446774, + "grad_min_sv": 3.0608208811955254e-08, + "grad_condition": 7499521.525014189, + "lr": 0.0005157053795390643, + "time_sec": 32.38293170928955 + }, + { + "epoch": 50, + "train_loss": 0.2106206985092163, + "train_acc": 0.9252, + "test_loss": 0.6563802011966705, + "test_acc": 0.8396, + "lyapunov": null, + "grad_norm": 0.36053809946906845, + "grad_max_sv": 0.2215539276599884, + "grad_min_sv": 2.9670953960447833e-08, + "grad_condition": 7567975.97315415, + "lr": 0.0005000000000000002, + "time_sec": 32.3891761302948 + }, + { + "epoch": 51, + "train_loss": 0.19901366895198822, + "train_acc": 0.92832, + "test_loss": 0.6814763808727264, + "test_acc": 0.837, + "lyapunov": null, + "grad_norm": 0.3509310663538234, + "grad_max_sv": 0.21552756875753404, + "grad_min_sv": 3.0066001732720335e-08, + "grad_condition": 7264544.488552595, + "lr": 0.00048429462046093607, + "time_sec": 32.41236758232117 + }, + { + "epoch": 52, + "train_loss": 0.19969978581905365, + "train_acc": 0.9285, + "test_loss": 0.6935202028274536, + "test_acc": 0.8339, + "lyapunov": null, + "grad_norm": 0.3520257382758021, + "grad_max_sv": 0.22391790114343166, + "grad_min_sv": 3.0129751982244104e-08, + "grad_condition": 7509087.830538243, + "lr": 0.0004686047402353435, + "time_sec": 32.39413237571716 + }, + { + "epoch": 53, + "train_loss": 0.19100741683721542, + "train_acc": 0.93138, + "test_loss": 0.686068691778183, + "test_acc": 0.8361, + "lyapunov": null, + "grad_norm": 0.3426294963785598, + "grad_max_sv": 0.22632624246180058, + "grad_min_sv": 2.9659243594437613e-08, + "grad_condition": 7652635.339128266, + "lr": 0.000452945843340743, + "time_sec": 32.40613842010498 + }, + { + "epoch": 54, + "train_loss": 0.18032077651500703, + "train_acc": 0.9362, + "test_loss": 0.7067575240373611, + "test_acc": 0.8336, + "lyapunov": null, + "grad_norm": 0.3322012382733825, + "grad_max_sv": 0.20586859565228224, + "grad_min_sv": 2.850985989510946e-08, + "grad_condition": 7314687.938871255, + "lr": 0.00043733338321784806, + "time_sec": 32.4026734828949 + }, + { + "epoch": 55, + "train_loss": 0.17773653375148774, + "train_acc": 0.93586, + "test_loss": 0.7423279015541077, + "test_acc": 0.8264, + "lyapunov": null, + "grad_norm": 0.3304441924446054, + "grad_max_sv": 0.21223607212305068, + "grad_min_sv": 2.8433270138350508e-08, + "grad_condition": 7539548.749518724, + "lr": 0.0004217827674798847, + "time_sec": 32.404977560043335 + }, + { + "epoch": 56, + "train_loss": 0.17266820957183837, + "train_acc": 0.93834, + "test_loss": 0.7072871742248535, + "test_acc": 0.8362, + "lyapunov": null, + "grad_norm": 0.3213443005744008, + "grad_max_sv": 0.20142054706811904, + "grad_min_sv": 2.726542889242012e-08, + "grad_condition": 7440941.08660387, + "lr": 0.00040630934270713783, + "time_sec": 32.39922308921814 + }, + { + "epoch": 57, + "train_loss": 0.16320502066612244, + "train_acc": 0.9411, + "test_loss": 0.7605734568834305, + "test_acc": 0.8318, + "lyapunov": null, + "grad_norm": 0.31657510227372176, + "grad_max_sv": 0.20284682027995588, + "grad_min_sv": 2.7356661469468692e-08, + "grad_condition": 7474082.923928386, + "lr": 0.000390928379301729, + "time_sec": 32.39910292625427 + }, + { + "epoch": 58, + "train_loss": 0.15670019901275634, + "train_acc": 0.94476, + "test_loss": 0.784366103553772, + "test_acc": 0.8311, + "lyapunov": null, + "grad_norm": 0.30805235096734923, + "grad_max_sv": 0.20260103438049554, + "grad_min_sv": 2.8483807401613605e-08, + "grad_condition": 7164125.0338090565, + "lr": 0.0003756550564175727, + "time_sec": 32.38076663017273 + }, + { + "epoch": 59, + "train_loss": 0.1490273987340927, + "train_acc": 0.94576, + "test_loss": 0.7455846133232117, + "test_acc": 0.8376, + "lyapunov": null, + "grad_norm": 0.303406267580447, + "grad_max_sv": 0.19556450732052327, + "grad_min_sv": 2.8112297023596967e-08, + "grad_condition": 7040746.144049543, + "lr": 0.00036050444698038553, + "time_sec": 32.39811587333679 + }, + { + "epoch": 60, + "train_loss": 0.14525161782741547, + "train_acc": 0.94758, + "test_loss": 0.7790617815971375, + "test_acc": 0.8344, + "lyapunov": null, + "grad_norm": 0.30155039989577326, + "grad_max_sv": 0.19981648530811072, + "grad_min_sv": 2.756223151934023e-08, + "grad_condition": 7325326.926472412, + "lr": 0.00034549150281252655, + "time_sec": 32.389100313186646 + }, + { + "epoch": 61, + "train_loss": 0.1412713815355301, + "train_acc": 0.94936, + "test_loss": 0.7642439495563507, + "test_acc": 0.836, + "lyapunov": null, + "grad_norm": 0.29749874721325253, + "grad_max_sv": 0.19452713318169118, + "grad_min_sv": 2.9010603075363407e-08, + "grad_condition": 6769308.704484415, + "lr": 0.0003306310398773544, + "time_sec": 32.38328981399536 + }, + { + "epoch": 62, + "train_loss": 0.1323081604719162, + "train_acc": 0.95234, + "test_loss": 0.7581991817474365, + "test_acc": 0.8398, + "lyapunov": null, + "grad_norm": 0.29116698502726973, + "grad_max_sv": 0.18757329024374486, + "grad_min_sv": 2.7799571622466603e-08, + "grad_condition": 6802391.979822846, + "lr": 0.00031593772365766127, + "time_sec": 32.38175868988037 + }, + { + "epoch": 63, + "train_loss": 0.12890920341968537, + "train_acc": 0.95402, + "test_loss": 0.7480168062210083, + "test_acc": 0.8421, + "lyapunov": null, + "grad_norm": 0.286611612578029, + "grad_max_sv": 0.1843133084475994, + "grad_min_sv": 2.6867626612414597e-08, + "grad_condition": 6929516.973504146, + "lr": 0.0003014260546826097, + "time_sec": 32.42565321922302 + }, + { + "epoch": 64, + "train_loss": 0.1265330140542984, + "train_acc": 0.9554, + "test_loss": 0.8281557668209076, + "test_acc": 0.8301, + "lyapunov": null, + "grad_norm": 0.2827852267700905, + "grad_max_sv": 0.18494715746492146, + "grad_min_sv": 2.7603675123444305e-08, + "grad_condition": 6836444.701068824, + "lr": 0.0002871103542174637, + "time_sec": 32.41487503051758 + }, + { + "epoch": 65, + "train_loss": 0.1179364563369751, + "train_acc": 0.95766, + "test_loss": 0.8201508460521698, + "test_acc": 0.8301, + "lyapunov": null, + "grad_norm": 0.27559434018913526, + "grad_max_sv": 0.1801072470843792, + "grad_min_sv": 2.659138749194767e-08, + "grad_condition": 6847688.983849314, + "lr": 0.0002730047501302267, + "time_sec": 32.39773344993591 + }, + { + "epoch": 66, + "train_loss": 0.11676965503931046, + "train_acc": 0.9583, + "test_loss": 0.8626040154457092, + "test_acc": 0.8299, + "lyapunov": null, + "grad_norm": 0.2739785879338369, + "grad_max_sv": 0.181886912509799, + "grad_min_sv": 2.726705781164185e-08, + "grad_condition": 6765344.039900659, + "lr": 0.00025912316294914234, + "time_sec": 32.3981568813324 + }, + { + "epoch": 67, + "train_loss": 0.1134087336063385, + "train_acc": 0.95968, + "test_loss": 0.8600147367477416, + "test_acc": 0.8307, + "lyapunov": null, + "grad_norm": 0.27359780558028896, + "grad_max_sv": 0.17809443082660437, + "grad_min_sv": 2.617720586961525e-08, + "grad_condition": 6850097.709154141, + "lr": 0.0002454792921248144, + "time_sec": 32.39709424972534 + }, + { + "epoch": 68, + "train_loss": 0.10615333132266998, + "train_acc": 0.96164, + "test_loss": 0.7972221804141998, + "test_acc": 0.8376, + "lyapunov": null, + "grad_norm": 0.2659183144921437, + "grad_max_sv": 0.18308131918311119, + "grad_min_sv": 2.689645892672843e-08, + "grad_condition": 6797772.602815667, + "lr": 0.00023208660251050164, + "time_sec": 32.41845703125 + }, + { + "epoch": 69, + "train_loss": 0.10183365075588226, + "train_acc": 0.9635, + "test_loss": 0.826421448802948, + "test_acc": 0.8419, + "lyapunov": null, + "grad_norm": 0.25781252098700996, + "grad_max_sv": 0.16897555273026227, + "grad_min_sv": 2.6931133589869206e-08, + "grad_condition": 6306456.524677806, + "lr": 0.00021895831107393473, + "time_sec": 32.397175788879395 + }, + { + "epoch": 70, + "train_loss": 0.10107698081731796, + "train_acc": 0.96376, + "test_loss": 0.8561173896312714, + "test_acc": 0.831, + "lyapunov": null, + "grad_norm": 0.25760306881898437, + "grad_max_sv": 0.17646125555038453, + "grad_min_sv": 2.669760297280277e-08, + "grad_condition": 6679362.317952393, + "lr": 0.00020610737385376356, + "time_sec": 32.403748512268066 + }, + { + "epoch": 71, + "train_loss": 0.09157823500394821, + "train_acc": 0.9672, + "test_loss": 0.819078180027008, + "test_acc": 0.8435, + "lyapunov": null, + "grad_norm": 0.24819829552233322, + "grad_max_sv": 0.1644124612212181, + "grad_min_sv": 2.60399903861952e-08, + "grad_condition": 6357922.646001594, + "lr": 0.00019354647317351177, + "time_sec": 32.40361571311951 + }, + { + "epoch": 72, + "train_loss": 0.09161295493125915, + "train_acc": 0.9674, + "test_loss": 0.8579238404273987, + "test_acc": 0.8382, + "lyapunov": null, + "grad_norm": 0.2471838058669454, + "grad_max_sv": 0.18323104958981276, + "grad_min_sv": 2.6274890752020497e-08, + "grad_condition": 7043842.298456557, + "lr": 0.0001812880051256552, + "time_sec": 32.40220522880554 + }, + { + "epoch": 73, + "train_loss": 0.08914089821338654, + "train_acc": 0.9689, + "test_loss": 0.822793147277832, + "test_acc": 0.8428, + "lyapunov": null, + "grad_norm": 0.24800643716145856, + "grad_max_sv": 0.17686894070357084, + "grad_min_sv": 2.5135920411756273e-08, + "grad_condition": 7047438.025677231, + "lr": 0.00016934406733817422, + "time_sec": 32.38602375984192 + }, + { + "epoch": 74, + "train_loss": 0.08674161068916321, + "train_acc": 0.96972, + "test_loss": 0.9136243630409241, + "test_acc": 0.832, + "lyapunov": null, + "grad_norm": 0.24475644922641637, + "grad_max_sv": 0.1730644192546606, + "grad_min_sv": 2.701796373294485e-08, + "grad_condition": 6442891.2485314775, + "lr": 0.0001577264470356557, + "time_sec": 32.388394594192505 + }, + { + "epoch": 75, + "train_loss": 0.08695965735673905, + "train_acc": 0.96928, + "test_loss": 0.8845508131980896, + "test_acc": 0.8384, + "lyapunov": null, + "grad_norm": 0.2459968799202821, + "grad_max_sv": 0.17426501363515853, + "grad_min_sv": 2.6569961386613273e-08, + "grad_condition": 6640201.158479671, + "lr": 0.00014644660940672634, + "time_sec": 32.41233015060425 + }, + { + "epoch": 76, + "train_loss": 0.08056579726457595, + "train_acc": 0.97162, + "test_loss": 0.8616433102607727, + "test_acc": 0.843, + "lyapunov": null, + "grad_norm": 0.2370989720124241, + "grad_max_sv": 0.17729146480560304, + "grad_min_sv": 2.568868753272113e-08, + "grad_condition": 6934864.636315972, + "lr": 0.0001355156862892944, + "time_sec": 32.40184926986694 + }, + { + "epoch": 77, + "train_loss": 0.0778916252565384, + "train_acc": 0.97266, + "test_loss": 0.8366258358001709, + "test_acc": 0.846, + "lyapunov": null, + "grad_norm": 0.2285631358810043, + "grad_max_sv": 0.15610157009214162, + "grad_min_sv": 2.4703725332031468e-08, + "grad_condition": 6441768.40822393, + "lr": 0.00012494446518477025, + "time_sec": 32.39042067527771 + }, + { + "epoch": 78, + "train_loss": 0.07181410483896733, + "train_acc": 0.97442, + "test_loss": 0.8555541298389435, + "test_acc": 0.8426, + "lyapunov": null, + "grad_norm": 0.21751467049933892, + "grad_max_sv": 0.15433428399264812, + "grad_min_sv": 2.665557081726888e-08, + "grad_condition": 5918219.605492928, + "lr": 0.00011474337861210548, + "time_sec": 32.394978523254395 + }, + { + "epoch": 79, + "train_loss": 0.07194108392477036, + "train_acc": 0.9751, + "test_loss": 0.8495045845985413, + "test_acc": 0.8448, + "lyapunov": null, + "grad_norm": 0.22114745807083974, + "grad_max_sv": 0.1569668130017817, + "grad_min_sv": 2.5639288958601015e-08, + "grad_condition": 6206249.934502038, + "lr": 0.00010492249381215483, + "time_sec": 32.40589165687561 + }, + { + "epoch": 80, + "train_loss": 0.07222781093478203, + "train_acc": 0.97412, + "test_loss": 0.8713514517307281, + "test_acc": 0.8394, + "lyapunov": null, + "grad_norm": 0.22263796587188234, + "grad_max_sv": 0.14711420265957714, + "grad_min_sv": 2.5633022726623266e-08, + "grad_condition": 5761666.097039051, + "lr": 9.549150281252637e-05, + "time_sec": 32.37701368331909 + }, + { + "epoch": 81, + "train_loss": 0.06728733582258224, + "train_acc": 0.97644, + "test_loss": 0.8841948908805847, + "test_acc": 0.8471, + "lyapunov": null, + "grad_norm": 0.2167084382178911, + "grad_max_sv": 0.150007457844913, + "grad_min_sv": 2.4493604877662278e-08, + "grad_condition": 6166534.410663934, + "lr": 8.645971286271918e-05, + "time_sec": 32.398573875427246 + }, + { + "epoch": 82, + "train_loss": 0.06532315739750862, + "train_acc": 0.97664, + "test_loss": 0.8479381636619567, + "test_acc": 0.8476, + "lyapunov": null, + "grad_norm": 0.21360344563146125, + "grad_max_sv": 0.14955835351720453, + "grad_min_sv": 2.5209754284105657e-08, + "grad_condition": 5995150.4945804905, + "lr": 7.78360372489926e-05, + "time_sec": 32.39670705795288 + }, + { + "epoch": 83, + "train_loss": 0.06434115768909454, + "train_acc": 0.97796, + "test_loss": 0.8688706632614136, + "test_acc": 0.8462, + "lyapunov": null, + "grad_norm": 0.208142142739157, + "grad_max_sv": 0.14977061534300445, + "grad_min_sv": 2.4894345518333694e-08, + "grad_condition": 6089831.719725271, + "lr": 6.962898649802815e-05, + "time_sec": 32.399760007858276 + }, + { + "epoch": 84, + "train_loss": 0.06394571399211883, + "train_acc": 0.9776, + "test_loss": 0.8629561246871948, + "test_acc": 0.8473, + "lyapunov": null, + "grad_norm": 0.2090274768795119, + "grad_max_sv": 0.1535501467064023, + "grad_min_sv": 2.6076664383367643e-08, + "grad_condition": 5914212.49570628, + "lr": 6.184665997806824e-05, + "time_sec": 32.38430905342102 + }, + { + "epoch": 85, + "train_loss": 0.062020836523771286, + "train_acc": 0.97872, + "test_loss": 0.875181820678711, + "test_acc": 0.8453, + "lyapunov": null, + "grad_norm": 0.2063308108071089, + "grad_max_sv": 0.14753851415589453, + "grad_min_sv": 2.432188375145472e-08, + "grad_condition": 6144261.18306755, + "lr": 5.449673790581613e-05, + "time_sec": 32.41748404502869 + }, + { + "epoch": 86, + "train_loss": 0.06044566638708115, + "train_acc": 0.9789, + "test_loss": 0.872238347530365, + "test_acc": 0.8476, + "lyapunov": null, + "grad_norm": 0.20133211072179052, + "grad_max_sv": 0.148629211448133, + "grad_min_sv": 2.4942497534041762e-08, + "grad_condition": 6060679.3216307415, + "lr": 4.758647376699034e-05, + "time_sec": 32.391072273254395 + }, + { + "epoch": 87, + "train_loss": 0.061503240056037904, + "train_acc": 0.97832, + "test_loss": 0.8733239276885987, + "test_acc": 0.8431, + "lyapunov": null, + "grad_norm": 0.2056722075536268, + "grad_max_sv": 0.14386752797290683, + "grad_min_sv": 2.4274280185920816e-08, + "grad_condition": 5915342.2569472315, + "lr": 4.112268715800956e-05, + "time_sec": 32.393316984176636 + }, + { + "epoch": 88, + "train_loss": 0.057686230409145355, + "train_acc": 0.98028, + "test_loss": 0.9238866704940796, + "test_acc": 0.8441, + "lyapunov": null, + "grad_norm": 0.19849445098013146, + "grad_max_sv": 0.14159611044451595, + "grad_min_sv": 2.40493778669304e-08, + "grad_condition": 5894624.093493214, + "lr": 3.511175705587434e-05, + "time_sec": 32.38528490066528 + }, + { + "epoch": 89, + "train_loss": 0.05870611476659775, + "train_acc": 0.9798, + "test_loss": 0.8742481526374817, + "test_acc": 0.8481, + "lyapunov": null, + "grad_norm": 0.20012200731407057, + "grad_max_sv": 0.15360670480877162, + "grad_min_sv": 2.5219260857411995e-08, + "grad_condition": 6191506.157967448, + "lr": 2.9559615522887284e-05, + "time_sec": 32.393001079559326 + }, + { + "epoch": 90, + "train_loss": 0.05783582457482815, + "train_acc": 0.9801, + "test_loss": 0.8813467388153076, + "test_acc": 0.8475, + "lyapunov": null, + "grad_norm": 0.19996222144489287, + "grad_max_sv": 0.1403856192715466, + "grad_min_sv": 2.448204212690541e-08, + "grad_condition": 5742298.053374326, + "lr": 2.447174185242324e-05, + "time_sec": 32.38493609428406 + }, + { + "epoch": 91, + "train_loss": 0.05505133232176304, + "train_acc": 0.9811, + "test_loss": 0.8983916495323181, + "test_acc": 0.8462, + "lyapunov": null, + "grad_norm": 0.1922888220223182, + "grad_max_sv": 0.13430234417319298, + "grad_min_sv": 2.4953015476114616e-08, + "grad_condition": 5451203.641164561, + "lr": 1.9853157161528526e-05, + "time_sec": 32.399288177490234 + }, + { + "epoch": 92, + "train_loss": 0.05489971268892288, + "train_acc": 0.98124, + "test_loss": 0.8997103338241577, + "test_acc": 0.843, + "lyapunov": null, + "grad_norm": 0.1914882132186981, + "grad_max_sv": 0.13863548981025814, + "grad_min_sv": 2.579038138605938e-08, + "grad_condition": 5398596.905280545, + "lr": 1.570841943568452e-05, + "time_sec": 32.40613651275635 + }, + { + "epoch": 93, + "train_loss": 0.05393671277284622, + "train_acc": 0.9816, + "test_loss": 0.8570820412635803, + "test_acc": 0.847, + "lyapunov": null, + "grad_norm": 0.19247907609747256, + "grad_max_sv": 0.14507245384156703, + "grad_min_sv": 2.4785522878545406e-08, + "grad_condition": 5879853.769356969, + "lr": 1.204161903062634e-05, + "time_sec": 32.38154458999634 + }, + { + "epoch": 94, + "train_loss": 0.05565428542852402, + "train_acc": 0.98092, + "test_loss": 0.8699159992218017, + "test_acc": 0.8494, + "lyapunov": null, + "grad_norm": 0.1950428660443827, + "grad_max_sv": 0.15786617370322348, + "grad_min_sv": 2.5128920544403855e-08, + "grad_condition": 6342900.039114647, + "lr": 8.85637463565564e-06, + "time_sec": 32.408872842788696 + }, + { + "epoch": 95, + "train_loss": 0.0554716275537014, + "train_acc": 0.98074, + "test_loss": 0.8724354814529419, + "test_acc": 0.848, + "lyapunov": null, + "grad_norm": 0.1953551453056335, + "grad_max_sv": 0.14595830552279948, + "grad_min_sv": 2.4523609010174142e-08, + "grad_condition": 6097998.471070435, + "lr": 6.155829702431171e-06, + "time_sec": 32.37954640388489 + }, + { + "epoch": 96, + "train_loss": 0.055670329051017764, + "train_acc": 0.98156, + "test_loss": 0.8982214247703553, + "test_acc": 0.8452, + "lyapunov": null, + "grad_norm": 0.19496196662820392, + "grad_max_sv": 0.1501585453748703, + "grad_min_sv": 2.5934764646962095e-08, + "grad_condition": 5869735.378663734, + "lr": 3.942649342761118e-06, + "time_sec": 32.4021053314209 + }, + { + "epoch": 97, + "train_loss": 0.05344248455762863, + "train_acc": 0.9813, + "test_loss": 0.9114454601287841, + "test_acc": 0.8468, + "lyapunov": null, + "grad_norm": 0.19018664442063118, + "grad_max_sv": 0.14032225906848908, + "grad_min_sv": 2.502056415387699e-08, + "grad_condition": 5745975.090099884, + "lr": 2.2190176984600023e-06, + "time_sec": 32.38188123703003 + }, + { + "epoch": 98, + "train_loss": 0.053135186285972594, + "train_acc": 0.9819, + "test_loss": 0.869631242275238, + "test_acc": 0.8508, + "lyapunov": null, + "grad_norm": 0.18824134211058935, + "grad_max_sv": 0.13075507152825594, + "grad_min_sv": 2.4252965857840536e-08, + "grad_condition": 5397614.905736231, + "lr": 9.866357858642206e-07, + "time_sec": 32.386441230773926 + }, + { + "epoch": 99, + "train_loss": 0.05097491117954254, + "train_acc": 0.983, + "test_loss": 0.8943203839302063, + "test_acc": 0.8483, + "lyapunov": null, + "grad_norm": 0.18445756568932634, + "grad_max_sv": 0.13804081929847598, + "grad_min_sv": 2.4356519201518267e-08, + "grad_condition": 5702871.134726013, + "lr": 2.467198171342e-07, + "time_sec": 32.405375480651855 + }, + { + "epoch": 100, + "train_loss": 0.05390245022058487, + "train_acc": 0.9809, + "test_loss": 0.871891166973114, + "test_acc": 0.8498, + "lyapunov": null, + "grad_norm": 0.1935152752615153, + "grad_max_sv": 0.14720266554504632, + "grad_min_sv": 2.436729609200938e-08, + "grad_condition": 6104513.732861901, + "lr": 0.0, + "time_sec": 32.40170097351074 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 2.4167917232513427, + "train_acc": 0.21668, + "test_loss": 2.5600556365966796, + "test_acc": 0.1426, + "lyapunov": null, + "grad_norm": 8.183371300480916, + "grad_max_sv": 7.386911773681641, + "grad_min_sv": 2.415331181282454e-07, + "grad_condition": 30373000.643941343, + "lr": 0.0009997532801828658, + "time_sec": 49.45663261413574 + }, + { + "epoch": 2, + "train_loss": 1.9079357604217528, + "train_acc": 0.31534, + "test_loss": 2.481009757232666, + "test_acc": 0.1736, + "lyapunov": null, + "grad_norm": 6.225007320887903, + "grad_max_sv": 6.023341983556747, + "grad_min_sv": 2.0562342122332212e-07, + "grad_condition": 29136429.527644336, + "lr": 0.0009990133642141358, + "time_sec": 49.483285427093506 + }, + { + "epoch": 3, + "train_loss": 1.7475298168945312, + "train_acc": 0.36588, + "test_loss": 2.8285199867248534, + "test_acc": 0.131, + "lyapunov": null, + "grad_norm": 5.1420950067433004, + "grad_max_sv": 4.660892617702484, + "grad_min_sv": 1.8032060928874215e-07, + "grad_condition": 26358047.987367053, + "lr": 0.00099778098230154, + "time_sec": 49.57265663146973 + }, + { + "epoch": 4, + "train_loss": 1.648739521408081, + "train_acc": 0.40166, + "test_loss": 2.3356450172424315, + "test_acc": 0.1751, + "lyapunov": null, + "grad_norm": 4.371713821921025, + "grad_max_sv": 3.9185040295124054, + "grad_min_sv": 1.6463919898512814e-07, + "grad_condition": 23923294.770848013, + "lr": 0.000996057350657239, + "time_sec": 49.45625138282776 + }, + { + "epoch": 5, + "train_loss": 1.5810089331436157, + "train_acc": 0.4251, + "test_loss": 2.673109909439087, + "test_acc": 0.1544, + "lyapunov": null, + "grad_norm": 3.4555186506953595, + "grad_max_sv": 2.900471958518028, + "grad_min_sv": 1.4436529607309013e-07, + "grad_condition": 20173199.710391533, + "lr": 0.0009938441702975688, + "time_sec": 49.46467709541321 + }, + { + "epoch": 6, + "train_loss": 1.5207538050079346, + "train_acc": 0.44858, + "test_loss": 2.5345509658813477, + "test_acc": 0.1699, + "lyapunov": null, + "grad_norm": 2.64949967993879, + "grad_max_sv": 2.2037453174591066, + "grad_min_sv": 1.0903019624919352e-07, + "grad_condition": 20443245.381738927, + "lr": 0.0009911436253643444, + "time_sec": 49.46764326095581 + }, + { + "epoch": 7, + "train_loss": 1.4697360105133057, + "train_acc": 0.46474, + "test_loss": 2.8721789810180662, + "test_acc": 0.1272, + "lyapunov": null, + "grad_norm": 2.07791741270765, + "grad_max_sv": 1.6007355004549026, + "grad_min_sv": 8.760053766820875e-08, + "grad_condition": 18373378.661422264, + "lr": 0.0009879583809693736, + "time_sec": 49.47743082046509 + }, + { + "epoch": 8, + "train_loss": 1.4266535543823242, + "train_acc": 0.48382, + "test_loss": 3.240042792892456, + "test_acc": 0.1388, + "lyapunov": null, + "grad_norm": 1.6671990756280735, + "grad_max_sv": 1.2928156778216362, + "grad_min_sv": 7.22438866951336e-08, + "grad_condition": 18264606.350417227, + "lr": 0.0009842915805643154, + "time_sec": 49.462923526763916 + }, + { + "epoch": 9, + "train_loss": 1.394312504272461, + "train_acc": 0.49708, + "test_loss": 2.92084864654541, + "test_acc": 0.1515, + "lyapunov": null, + "grad_norm": 1.4501900520177538, + "grad_max_sv": 1.0461901366710662, + "grad_min_sv": 6.580800739897086e-08, + "grad_condition": 16086880.216684576, + "lr": 0.0009801468428384714, + "time_sec": 49.47783327102661 + }, + { + "epoch": 10, + "train_loss": 1.3646438373184204, + "train_acc": 0.50782, + "test_loss": 2.4641769153594972, + "test_acc": 0.2432, + "lyapunov": null, + "grad_norm": 1.291271889799819, + "grad_max_sv": 0.9352933883666992, + "grad_min_sv": 6.025941292620019e-08, + "grad_condition": 15737334.845315147, + "lr": 0.0009755282581475767, + "time_sec": 49.47376465797424 + }, + { + "epoch": 11, + "train_loss": 1.3376501561355592, + "train_acc": 0.51558, + "test_loss": 2.9219178497314453, + "test_acc": 0.2438, + "lyapunov": null, + "grad_norm": 1.1555098680383777, + "grad_max_sv": 0.7429820895195007, + "grad_min_sv": 5.2901568192709195e-08, + "grad_condition": 14266011.744750757, + "lr": 0.0009704403844771127, + "time_sec": 49.47013974189758 + }, + { + "epoch": 12, + "train_loss": 1.3112868671417237, + "train_acc": 0.5284, + "test_loss": 2.74031083946228, + "test_acc": 0.2031, + "lyapunov": null, + "grad_norm": 1.0738955371821308, + "grad_max_sv": 0.748549421876669, + "grad_min_sv": 4.978303538294426e-08, + "grad_condition": 15210211.076616298, + "lr": 0.0009648882429441257, + "time_sec": 49.46808075904846 + }, + { + "epoch": 13, + "train_loss": 1.287481568031311, + "train_acc": 0.53728, + "test_loss": 3.040859108734131, + "test_acc": 0.1924, + "lyapunov": null, + "grad_norm": 0.9771624206683323, + "grad_max_sv": 0.64529999345541, + "grad_min_sv": 4.393245678357971e-08, + "grad_condition": 14761475.748675447, + "lr": 0.0009588773128419905, + "time_sec": 49.47308921813965 + }, + { + "epoch": 14, + "train_loss": 1.2648405401992797, + "train_acc": 0.54502, + "test_loss": 2.792311123275757, + "test_acc": 0.1915, + "lyapunov": null, + "grad_norm": 0.9467244901324925, + "grad_max_sv": 0.6184789575636387, + "grad_min_sv": 4.4816473465658643e-08, + "grad_condition": 14165375.345471447, + "lr": 0.0009524135262330098, + "time_sec": 49.483009815216064 + }, + { + "epoch": 15, + "train_loss": 1.241471286087036, + "train_acc": 0.55048, + "test_loss": 2.3441864311218263, + "test_acc": 0.2456, + "lyapunov": null, + "grad_norm": 0.8759338877958681, + "grad_max_sv": 0.5726857863366603, + "grad_min_sv": 3.894658555658736e-08, + "grad_condition": 14972228.263231587, + "lr": 0.0009455032620941839, + "time_sec": 49.48427653312683 + }, + { + "epoch": 16, + "train_loss": 1.2250818849945069, + "train_acc": 0.55916, + "test_loss": 2.4376744468688964, + "test_acc": 0.2811, + "lyapunov": null, + "grad_norm": 0.8280125995789305, + "grad_max_sv": 0.5269983820617199, + "grad_min_sv": 3.957679450827811e-08, + "grad_condition": 13458638.5630938, + "lr": 0.0009381533400219318, + "time_sec": 49.491514921188354 + }, + { + "epoch": 17, + "train_loss": 1.2011407931518554, + "train_acc": 0.5681, + "test_loss": 3.077988208389282, + "test_acc": 0.2372, + "lyapunov": null, + "grad_norm": 0.7903623783049802, + "grad_max_sv": 0.5003585621714592, + "grad_min_sv": 3.7936934749183135e-08, + "grad_condition": 13344237.683557762, + "lr": 0.0009303710135019719, + "time_sec": 49.4895544052124 + }, + { + "epoch": 18, + "train_loss": 1.1899376231193541, + "train_acc": 0.57472, + "test_loss": 2.3918450389862063, + "test_acc": 0.2518, + "lyapunov": null, + "grad_norm": 0.7718039520215193, + "grad_max_sv": 0.47414265275001527, + "grad_min_sv": 3.554989529419572e-08, + "grad_condition": 13438942.364842063, + "lr": 0.0009221639627510076, + "time_sec": 49.456658124923706 + }, + { + "epoch": 19, + "train_loss": 1.168603648300171, + "train_acc": 0.57972, + "test_loss": 2.283582151031494, + "test_acc": 0.2237, + "lyapunov": null, + "grad_norm": 0.7146309518059523, + "grad_max_sv": 0.4340610824525356, + "grad_min_sv": 3.228430212054434e-08, + "grad_condition": 13543039.003440287, + "lr": 0.000913540287137281, + "time_sec": 49.45988321304321 + }, + { + "epoch": 20, + "train_loss": 1.151336190109253, + "train_acc": 0.58574, + "test_loss": 2.2708426193237305, + "test_acc": 0.2755, + "lyapunov": null, + "grad_norm": 0.6983120785552407, + "grad_max_sv": 0.4454373300075531, + "grad_min_sv": 3.350230577403579e-08, + "grad_condition": 13641891.236675229, + "lr": 0.0009045084971874739, + "time_sec": 49.4855215549469 + }, + { + "epoch": 21, + "train_loss": 1.1312933298873902, + "train_acc": 0.5941, + "test_loss": 2.002239217376709, + "test_acc": 0.3398, + "lyapunov": null, + "grad_norm": 0.6668029786621408, + "grad_max_sv": 0.4022377036511898, + "grad_min_sv": 3.0301077691419207e-08, + "grad_condition": 13290330.075167935, + "lr": 0.0008950775061878452, + "time_sec": 49.5133171081543 + }, + { + "epoch": 22, + "train_loss": 1.1186233515167237, + "train_acc": 0.59978, + "test_loss": 3.6749740661621093, + "test_acc": 0.2938, + "lyapunov": null, + "grad_norm": 0.6355160393463501, + "grad_max_sv": 0.3662328697741032, + "grad_min_sv": 2.919807395862506e-08, + "grad_condition": 12676455.229119861, + "lr": 0.0008852566213878947, + "time_sec": 49.47933578491211 + }, + { + "epoch": 23, + "train_loss": 1.0992162245941162, + "train_acc": 0.60538, + "test_loss": 2.2956289947509765, + "test_acc": 0.3419, + "lyapunov": null, + "grad_norm": 0.6289434264719856, + "grad_max_sv": 0.3852032497525215, + "grad_min_sv": 2.838916279834791e-08, + "grad_condition": 13726993.354284357, + "lr": 0.0008750555348152298, + "time_sec": 49.46930289268494 + }, + { + "epoch": 24, + "train_loss": 1.09261875541687, + "train_acc": 0.6078, + "test_loss": 2.194385333251953, + "test_acc": 0.3862, + "lyapunov": null, + "grad_norm": 0.6127565268862699, + "grad_max_sv": 0.3749225478619337, + "grad_min_sv": 2.902605293897409e-08, + "grad_condition": 12941629.392305708, + "lr": 0.0008644843137107057, + "time_sec": 49.45948123931885 + }, + { + "epoch": 25, + "train_loss": 1.0722477124023437, + "train_acc": 0.61656, + "test_loss": 2.4663957664489744, + "test_acc": 0.3925, + "lyapunov": null, + "grad_norm": 0.5897825535844798, + "grad_max_sv": 0.371936571970582, + "grad_min_sv": 2.8421365216857452e-08, + "grad_condition": 13252758.329758141, + "lr": 0.0008535533905932737, + "time_sec": 49.479785442352295 + }, + { + "epoch": 26, + "train_loss": 1.0658014038848878, + "train_acc": 0.62154, + "test_loss": 2.2172969047546385, + "test_acc": 0.3602, + "lyapunov": null, + "grad_norm": 0.5970948959400837, + "grad_max_sv": 0.3504005130380392, + "grad_min_sv": 2.822866052021311e-08, + "grad_condition": 12516728.270259932, + "lr": 0.0008422735529643444, + "time_sec": 49.46492099761963 + }, + { + "epoch": 27, + "train_loss": 1.04928136428833, + "train_acc": 0.62394, + "test_loss": 2.3098046798706053, + "test_acc": 0.3753, + "lyapunov": null, + "grad_norm": 0.5799982623396496, + "grad_max_sv": 0.3511035542935133, + "grad_min_sv": 2.871881275012811e-08, + "grad_condition": 12420577.990074852, + "lr": 0.0008306559326618259, + "time_sec": 49.463754177093506 + }, + { + "epoch": 28, + "train_loss": 1.033934779319763, + "train_acc": 0.6312, + "test_loss": 2.5853637130737304, + "test_acc": 0.3827, + "lyapunov": null, + "grad_norm": 0.5626766992798455, + "grad_max_sv": 0.3680811390280724, + "grad_min_sv": 2.860611223454157e-08, + "grad_condition": 13030738.458713688, + "lr": 0.0008187119948743449, + "time_sec": 49.46650528907776 + }, + { + "epoch": 29, + "train_loss": 1.0245469808578491, + "train_acc": 0.63318, + "test_loss": 2.421029793548584, + "test_acc": 0.3777, + "lyapunov": null, + "grad_norm": 0.540434209171599, + "grad_max_sv": 0.33249553516507147, + "grad_min_sv": 2.5725369168227985e-08, + "grad_condition": 13074923.559065297, + "lr": 0.0008064535268264883, + "time_sec": 49.46920871734619 + }, + { + "epoch": 30, + "train_loss": 1.0157002903938293, + "train_acc": 0.63876, + "test_loss": 2.5748968841552733, + "test_acc": 0.353, + "lyapunov": null, + "grad_norm": 0.5335667641481916, + "grad_max_sv": 0.31497838646173476, + "grad_min_sv": 2.4617009453109516e-08, + "grad_condition": 12878002.467485525, + "lr": 0.0007938926261462367, + "time_sec": 49.47658443450928 + }, + { + "epoch": 31, + "train_loss": 1.0092763556671143, + "train_acc": 0.64072, + "test_loss": 2.575096744155884, + "test_acc": 0.3689, + "lyapunov": null, + "grad_norm": 0.5319602288309537, + "grad_max_sv": 0.33714523129165175, + "grad_min_sv": 2.6278444886784767e-08, + "grad_condition": 12997099.648816537, + "lr": 0.0007810416889260654, + "time_sec": 49.48014044761658 + }, + { + "epoch": 32, + "train_loss": 0.9945861617660523, + "train_acc": 0.64606, + "test_loss": 2.18585274848938, + "test_acc": 0.3591, + "lyapunov": null, + "grad_norm": 0.5207883539385971, + "grad_max_sv": 0.30190461575984956, + "grad_min_sv": 2.498473832268644e-08, + "grad_condition": 12302495.137337226, + "lr": 0.0007679133974894983, + "time_sec": 49.48141527175903 + }, + { + "epoch": 33, + "train_loss": 0.9839789762878418, + "train_acc": 0.65072, + "test_loss": 2.067453681182861, + "test_acc": 0.4015, + "lyapunov": null, + "grad_norm": 0.5202120303096632, + "grad_max_sv": 0.3107115812599659, + "grad_min_sv": 2.559975968985384e-08, + "grad_condition": 12183076.283694824, + "lr": 0.0007545207078751857, + "time_sec": 49.50013208389282 + }, + { + "epoch": 34, + "train_loss": 0.9741807369995117, + "train_acc": 0.6534, + "test_loss": 2.3987243717193603, + "test_acc": 0.3907, + "lyapunov": null, + "grad_norm": 0.5156705695841731, + "grad_max_sv": 0.3042212676256895, + "grad_min_sv": 2.4721938141070156e-08, + "grad_condition": 12439098.422273466, + "lr": 0.0007408768370508577, + "time_sec": 49.4883246421814 + }, + { + "epoch": 35, + "train_loss": 0.960876017742157, + "train_acc": 0.6604, + "test_loss": 2.952223745727539, + "test_acc": 0.3772, + "lyapunov": null, + "grad_norm": 0.49534065997567395, + "grad_max_sv": 0.3189103938639164, + "grad_min_sv": 2.6160001853625657e-08, + "grad_condition": 12245579.759729771, + "lr": 0.0007269952498697734, + "time_sec": 49.49185800552368 + }, + { + "epoch": 36, + "train_loss": 0.9563328867340087, + "train_acc": 0.66094, + "test_loss": 2.5444390853881838, + "test_acc": 0.3748, + "lyapunov": null, + "grad_norm": 0.5015211388674911, + "grad_max_sv": 0.301097634062171, + "grad_min_sv": 2.4840815004978368e-08, + "grad_condition": 12193384.34751702, + "lr": 0.0007128896457825364, + "time_sec": 49.473448038101196 + }, + { + "epoch": 37, + "train_loss": 0.9456947842597961, + "train_acc": 0.66318, + "test_loss": 2.8305119338989257, + "test_acc": 0.3608, + "lyapunov": null, + "grad_norm": 0.5027801927119517, + "grad_max_sv": 0.3191258400678635, + "grad_min_sv": 2.5498967737291876e-08, + "grad_condition": 12721385.179239903, + "lr": 0.0006985739453173903, + "time_sec": 49.47532916069031 + }, + { + "epoch": 38, + "train_loss": 0.9344060453033447, + "train_acc": 0.66828, + "test_loss": 2.3942235221862793, + "test_acc": 0.3846, + "lyapunov": null, + "grad_norm": 0.4893981754322751, + "grad_max_sv": 0.27843328677117823, + "grad_min_sv": 2.3813316207821345e-08, + "grad_condition": 11809731.27063098, + "lr": 0.0006840622763423391, + "time_sec": 49.466092109680176 + }, + { + "epoch": 39, + "train_loss": 0.9299031619262695, + "train_acc": 0.6701, + "test_loss": 2.5896951622009277, + "test_acc": 0.3377, + "lyapunov": null, + "grad_norm": 0.4877056898105668, + "grad_max_sv": 0.2895252756774426, + "grad_min_sv": 2.313919011953658e-08, + "grad_condition": 12624897.370656734, + "lr": 0.0006693689601226458, + "time_sec": 49.47689652442932 + }, + { + "epoch": 40, + "train_loss": 0.9202397887802124, + "train_acc": 0.67222, + "test_loss": 2.3479004539489745, + "test_acc": 0.3652, + "lyapunov": null, + "grad_norm": 0.48378803227864736, + "grad_max_sv": 0.2827453903853893, + "grad_min_sv": 2.3820017647224744e-08, + "grad_condition": 11971929.846932925, + "lr": 0.0006545084971874737, + "time_sec": 49.48384690284729 + }, + { + "epoch": 41, + "train_loss": 0.9035198735237122, + "train_acc": 0.67674, + "test_loss": 2.4544072883605956, + "test_acc": 0.4098, + "lyapunov": null, + "grad_norm": 0.48414477684461676, + "grad_max_sv": 0.2927399341017008, + "grad_min_sv": 2.5373001699691144e-08, + "grad_condition": 11722800.874950778, + "lr": 0.0006394955530196147, + "time_sec": 49.49253749847412 + }, + { + "epoch": 42, + "train_loss": 0.8996260007095337, + "train_acc": 0.67922, + "test_loss": 2.7968482540130615, + "test_acc": 0.3717, + "lyapunov": null, + "grad_norm": 0.47529519443329865, + "grad_max_sv": 0.2862662900239229, + "grad_min_sv": 2.4432264433826845e-08, + "grad_condition": 11830651.602965241, + "lr": 0.0006243449435824273, + "time_sec": 49.472256898880005 + }, + { + "epoch": 43, + "train_loss": 0.8935702981376648, + "train_acc": 0.68226, + "test_loss": 2.7968372314453127, + "test_acc": 0.3814, + "lyapunov": null, + "grad_norm": 0.47246322948696845, + "grad_max_sv": 0.2997207723557949, + "grad_min_sv": 2.4396437803275717e-08, + "grad_condition": 12442839.021676019, + "lr": 0.0006090716206982714, + "time_sec": 49.47343039512634 + }, + { + "epoch": 44, + "train_loss": 0.8839340761566162, + "train_acc": 0.68406, + "test_loss": 2.1332605548858643, + "test_acc": 0.4518, + "lyapunov": null, + "grad_norm": 0.4773353798688752, + "grad_max_sv": 0.287653349712491, + "grad_min_sv": 2.485683419095608e-08, + "grad_condition": 11744954.507169517, + "lr": 0.0005936906572928625, + "time_sec": 49.483134508132935 + }, + { + "epoch": 45, + "train_loss": 0.8809750416755676, + "train_acc": 0.6871, + "test_loss": 2.3744767669677733, + "test_acc": 0.4104, + "lyapunov": null, + "grad_norm": 0.47171575077424854, + "grad_max_sv": 0.2800353281199932, + "grad_min_sv": 2.4150169553038835e-08, + "grad_condition": 11697732.41688976, + "lr": 0.0005782172325201156, + "time_sec": 49.47827482223511 + }, + { + "epoch": 46, + "train_loss": 0.8651049407958984, + "train_acc": 0.69358, + "test_loss": 2.6672937103271486, + "test_acc": 0.4106, + "lyapunov": null, + "grad_norm": 0.46225804490680006, + "grad_max_sv": 0.2764727082103491, + "grad_min_sv": 2.4165243095453092e-08, + "grad_condition": 11539194.901861329, + "lr": 0.0005626666167821523, + "time_sec": 49.482288122177124 + }, + { + "epoch": 47, + "train_loss": 0.855909815826416, + "train_acc": 0.6953, + "test_loss": 2.1082290111541746, + "test_acc": 0.4302, + "lyapunov": null, + "grad_norm": 0.46665587567927413, + "grad_max_sv": 0.2777487523853779, + "grad_min_sv": 2.3157732442768975e-08, + "grad_condition": 12021773.98709596, + "lr": 0.0005470541566592572, + "time_sec": 49.48243308067322 + }, + { + "epoch": 48, + "train_loss": 0.8559737893295288, + "train_acc": 0.69554, + "test_loss": 2.6735187637329103, + "test_acc": 0.3758, + "lyapunov": null, + "grad_norm": 0.4613852081362787, + "grad_max_sv": 0.2753657314926386, + "grad_min_sv": 2.358262860546745e-08, + "grad_condition": 11826265.97781797, + "lr": 0.0005313952597646569, + "time_sec": 49.471890687942505 + }, + { + "epoch": 49, + "train_loss": 0.8440363460159301, + "train_acc": 0.69974, + "test_loss": 2.318854873275757, + "test_acc": 0.4239, + "lyapunov": null, + "grad_norm": 0.46468634824792515, + "grad_max_sv": 0.2798832211643457, + "grad_min_sv": 2.5059412145367333e-08, + "grad_condition": 11328180.182026755, + "lr": 0.0005157053795390643, + "time_sec": 49.46786379814148 + }, + { + "epoch": 50, + "train_loss": 0.8407046744155884, + "train_acc": 0.69938, + "test_loss": 2.2581016651153565, + "test_acc": 0.4586, + "lyapunov": null, + "grad_norm": 0.4552999687027473, + "grad_max_sv": 0.27262482419610023, + "grad_min_sv": 2.3505009449920066e-08, + "grad_condition": 11655869.156098623, + "lr": 0.0005000000000000002, + "time_sec": 49.46631741523743 + }, + { + "epoch": 51, + "train_loss": 0.8328268578910828, + "train_acc": 0.70616, + "test_loss": 2.021052066421509, + "test_acc": 0.4663, + "lyapunov": null, + "grad_norm": 0.45398371093616957, + "grad_max_sv": 0.2551860522478819, + "grad_min_sv": 2.261276339510232e-08, + "grad_condition": 11423398.903523896, + "lr": 0.00048429462046093607, + "time_sec": 49.49492907524109 + }, + { + "epoch": 52, + "train_loss": 0.8242957615280151, + "train_acc": 0.70608, + "test_loss": 2.4299042922973633, + "test_acc": 0.4339, + "lyapunov": null, + "grad_norm": 0.4518491350882313, + "grad_max_sv": 0.2677639227360487, + "grad_min_sv": 2.340493003849531e-08, + "grad_condition": 11498272.982724927, + "lr": 0.0004686047402353435, + "time_sec": 49.47549295425415 + }, + { + "epoch": 53, + "train_loss": 0.8202688133239746, + "train_acc": 0.70788, + "test_loss": 2.0557694828033446, + "test_acc": 0.4729, + "lyapunov": null, + "grad_norm": 0.45155452834894444, + "grad_max_sv": 0.2765634849667549, + "grad_min_sv": 2.294847063488703e-08, + "grad_condition": 12152279.677541133, + "lr": 0.000452945843340743, + "time_sec": 49.47136735916138 + }, + { + "epoch": 54, + "train_loss": 0.8075869009590149, + "train_acc": 0.71144, + "test_loss": 2.2601095848083497, + "test_acc": 0.469, + "lyapunov": null, + "grad_norm": 0.44703257607115265, + "grad_max_sv": 0.28669003024697304, + "grad_min_sv": 2.3961542838790707e-08, + "grad_condition": 11972426.895574057, + "lr": 0.00043733338321784806, + "time_sec": 49.472840785980225 + }, + { + "epoch": 55, + "train_loss": 0.8038845987319946, + "train_acc": 0.71234, + "test_loss": 1.9625594703674316, + "test_acc": 0.4966, + "lyapunov": null, + "grad_norm": 0.45158056349279113, + "grad_max_sv": 0.2616859499365091, + "grad_min_sv": 2.319859899735377e-08, + "grad_condition": 11323136.132990547, + "lr": 0.0004217827674798847, + "time_sec": 49.475728034973145 + }, + { + "epoch": 56, + "train_loss": 0.7961191424942017, + "train_acc": 0.71566, + "test_loss": 2.24710135345459, + "test_acc": 0.4678, + "lyapunov": null, + "grad_norm": 0.45114634744336685, + "grad_max_sv": 0.27140378654003144, + "grad_min_sv": 2.345107636969601e-08, + "grad_condition": 11702309.047382332, + "lr": 0.00040630934270713783, + "time_sec": 49.46745586395264 + }, + { + "epoch": 57, + "train_loss": 0.7886269653129577, + "train_acc": 0.71928, + "test_loss": 2.332701706314087, + "test_acc": 0.4392, + "lyapunov": null, + "grad_norm": 0.44691251964783024, + "grad_max_sv": 0.2512993272393942, + "grad_min_sv": 2.3577591501400263e-08, + "grad_condition": 10797942.504272973, + "lr": 0.000390928379301729, + "time_sec": 49.487914085388184 + }, + { + "epoch": 58, + "train_loss": 0.7809809253120422, + "train_acc": 0.72054, + "test_loss": 2.163261636352539, + "test_acc": 0.4825, + "lyapunov": null, + "grad_norm": 0.44707505885973187, + "grad_max_sv": 0.27487311884760857, + "grad_min_sv": 2.305816853009901e-08, + "grad_condition": 11921937.091947556, + "lr": 0.0003756550564175727, + "time_sec": 49.477548360824585 + }, + { + "epoch": 59, + "train_loss": 0.7728579918098449, + "train_acc": 0.72464, + "test_loss": 2.4211140827178954, + "test_acc": 0.4792, + "lyapunov": null, + "grad_norm": 0.442207932790873, + "grad_max_sv": 0.2551064256578684, + "grad_min_sv": 2.3925818348757842e-08, + "grad_condition": 10733599.660670992, + "lr": 0.00036050444698038553, + "time_sec": 49.47178077697754 + }, + { + "epoch": 60, + "train_loss": 0.7646781494522095, + "train_acc": 0.72672, + "test_loss": 2.02176361579895, + "test_acc": 0.4897, + "lyapunov": null, + "grad_norm": 0.4430698668925349, + "grad_max_sv": 0.26053123250603677, + "grad_min_sv": 2.3670396620545377e-08, + "grad_condition": 11170288.922506649, + "lr": 0.00034549150281252655, + "time_sec": 49.46177387237549 + }, + { + "epoch": 61, + "train_loss": 0.7588282846641541, + "train_acc": 0.7286, + "test_loss": 2.670531511688232, + "test_acc": 0.4198, + "lyapunov": null, + "grad_norm": 0.43898999083578233, + "grad_max_sv": 0.26667738817632197, + "grad_min_sv": 2.325178121154181e-08, + "grad_condition": 11623927.174902633, + "lr": 0.0003306310398773544, + "time_sec": 49.49580407142639 + }, + { + "epoch": 62, + "train_loss": 0.7492313718986511, + "train_acc": 0.73298, + "test_loss": 2.4778705802917482, + "test_acc": 0.449, + "lyapunov": null, + "grad_norm": 0.4417738790617677, + "grad_max_sv": 0.2574993997812271, + "grad_min_sv": 2.3859390374525445e-08, + "grad_condition": 10899105.692467105, + "lr": 0.00031593772365766127, + "time_sec": 49.486817836761475 + }, + { + "epoch": 63, + "train_loss": 0.7480638890266419, + "train_acc": 0.73324, + "test_loss": 2.1940598976135255, + "test_acc": 0.4734, + "lyapunov": null, + "grad_norm": 0.4366591281226868, + "grad_max_sv": 0.2512634038925171, + "grad_min_sv": 2.326989370082799e-08, + "grad_condition": 10851343.919251464, + "lr": 0.0003014260546826097, + "time_sec": 49.494584798812866 + }, + { + "epoch": 64, + "train_loss": 0.7451907014846801, + "train_acc": 0.73538, + "test_loss": 2.3143032501220704, + "test_acc": 0.4762, + "lyapunov": null, + "grad_norm": 0.4362314837898005, + "grad_max_sv": 0.2649652697145939, + "grad_min_sv": 2.3657484859995748e-08, + "grad_condition": 11323682.220760768, + "lr": 0.0002871103542174637, + "time_sec": 49.46461892127991 + }, + { + "epoch": 65, + "train_loss": 0.7316487748908996, + "train_acc": 0.73868, + "test_loss": 2.132633139801025, + "test_acc": 0.4893, + "lyapunov": null, + "grad_norm": 0.43117564557331234, + "grad_max_sv": 0.2554838340729475, + "grad_min_sv": 2.3040169683241628e-08, + "grad_condition": 11170455.423079647, + "lr": 0.0002730047501302267, + "time_sec": 49.4881227016449 + }, + { + "epoch": 66, + "train_loss": 0.7290266520881653, + "train_acc": 0.7408, + "test_loss": 2.396712022781372, + "test_acc": 0.4793, + "lyapunov": null, + "grad_norm": 0.43225303341958693, + "grad_max_sv": 0.2486136831343174, + "grad_min_sv": 2.2949348021938932e-08, + "grad_condition": 10962824.963370848, + "lr": 0.00025912316294914234, + "time_sec": 49.47016882896423 + }, + { + "epoch": 67, + "train_loss": 0.7191537443733216, + "train_acc": 0.74308, + "test_loss": 2.1576420639038085, + "test_acc": 0.4941, + "lyapunov": null, + "grad_norm": 0.42657147393758854, + "grad_max_sv": 0.2438450776040554, + "grad_min_sv": 2.3898531642529975e-08, + "grad_condition": 10287595.631951943, + "lr": 0.0002454792921248144, + "time_sec": 49.49215388298035 + }, + { + "epoch": 68, + "train_loss": 0.7169496524429322, + "train_acc": 0.74418, + "test_loss": 2.4695981254577637, + "test_acc": 0.4807, + "lyapunov": null, + "grad_norm": 0.4234097941028663, + "grad_max_sv": 0.24577417597174644, + "grad_min_sv": 2.2813544342525915e-08, + "grad_condition": 10779009.57251847, + "lr": 0.00023208660251050164, + "time_sec": 49.531681299209595 + }, + { + "epoch": 69, + "train_loss": 0.7072784723091126, + "train_acc": 0.74744, + "test_loss": 2.27939485244751, + "test_acc": 0.4853, + "lyapunov": null, + "grad_norm": 0.4251678846869415, + "grad_max_sv": 0.241105442866683, + "grad_min_sv": 2.3618906030975496e-08, + "grad_condition": 10243169.91188918, + "lr": 0.00021895831107393473, + "time_sec": 49.46745848655701 + }, + { + "epoch": 70, + "train_loss": 0.7093459980392456, + "train_acc": 0.74668, + "test_loss": 2.2168941738128662, + "test_acc": 0.4993, + "lyapunov": null, + "grad_norm": 0.4187232599688298, + "grad_max_sv": 0.2437821462750435, + "grad_min_sv": 2.330924906424059e-08, + "grad_condition": 10529543.438680641, + "lr": 0.00020610737385376356, + "time_sec": 49.46611166000366 + }, + { + "epoch": 71, + "train_loss": 0.7046173419761658, + "train_acc": 0.74866, + "test_loss": 2.6486716678619384, + "test_acc": 0.4604, + "lyapunov": null, + "grad_norm": 0.43152156311922873, + "grad_max_sv": 0.26821285113692284, + "grad_min_sv": 2.3308388552578663e-08, + "grad_condition": 11585490.938807528, + "lr": 0.00019354647317351177, + "time_sec": 49.484049558639526 + }, + { + "epoch": 72, + "train_loss": 0.6916852585601807, + "train_acc": 0.75164, + "test_loss": 2.4044878028869627, + "test_acc": 0.4868, + "lyapunov": null, + "grad_norm": 0.42974614402520106, + "grad_max_sv": 0.2577272642403841, + "grad_min_sv": 2.3734259935181968e-08, + "grad_condition": 10929944.700492647, + "lr": 0.0001812880051256552, + "time_sec": 49.47321033477783 + }, + { + "epoch": 73, + "train_loss": 0.6914860160255432, + "train_acc": 0.75462, + "test_loss": 2.459467795562744, + "test_acc": 0.4755, + "lyapunov": null, + "grad_norm": 0.4235499199054343, + "grad_max_sv": 0.2499073389917612, + "grad_min_sv": 2.312090292555524e-08, + "grad_condition": 10928192.758700397, + "lr": 0.00016934406733817422, + "time_sec": 49.47536325454712 + }, + { + "epoch": 74, + "train_loss": 0.6900841831016541, + "train_acc": 0.75346, + "test_loss": 2.529036985015869, + "test_acc": 0.4694, + "lyapunov": null, + "grad_norm": 0.4200493463432216, + "grad_max_sv": 0.24829606115818023, + "grad_min_sv": 2.3347005217999595e-08, + "grad_condition": 10777473.575533265, + "lr": 0.0001577264470356557, + "time_sec": 49.47671389579773 + }, + { + "epoch": 75, + "train_loss": 0.6844219914627075, + "train_acc": 0.75664, + "test_loss": 2.7192491188049317, + "test_acc": 0.4659, + "lyapunov": null, + "grad_norm": 0.41891725324120427, + "grad_max_sv": 0.2549721471965313, + "grad_min_sv": 2.308645701276646e-08, + "grad_condition": 11178421.697050892, + "lr": 0.00014644660940672634, + "time_sec": 49.475868701934814 + }, + { + "epoch": 76, + "train_loss": 0.6757127567672729, + "train_acc": 0.76002, + "test_loss": 2.228153326416016, + "test_acc": 0.4719, + "lyapunov": null, + "grad_norm": 0.41518783756559813, + "grad_max_sv": 0.24106829576194286, + "grad_min_sv": 2.3467413079458765e-08, + "grad_condition": 10331945.898118276, + "lr": 0.0001355156862892944, + "time_sec": 49.47853899002075 + }, + { + "epoch": 77, + "train_loss": 0.6663033656692505, + "train_acc": 0.7606, + "test_loss": 2.5164624114990235, + "test_acc": 0.4627, + "lyapunov": null, + "grad_norm": 0.41866630242016806, + "grad_max_sv": 0.2701979674398899, + "grad_min_sv": 2.4135091125643272e-08, + "grad_condition": 11260755.273271866, + "lr": 0.00012494446518477025, + "time_sec": 49.47706151008606 + }, + { + "epoch": 78, + "train_loss": 0.6645314185142517, + "train_acc": 0.76252, + "test_loss": 2.8226414447784425, + "test_acc": 0.4614, + "lyapunov": null, + "grad_norm": 0.4173542916715373, + "grad_max_sv": 0.2490392465144396, + "grad_min_sv": 2.3206901200722994e-08, + "grad_condition": 10823280.058633823, + "lr": 0.00011474337861210548, + "time_sec": 49.483954191207886 + }, + { + "epoch": 79, + "train_loss": 0.6665540114593506, + "train_acc": 0.76016, + "test_loss": 2.2122913623809812, + "test_acc": 0.4819, + "lyapunov": null, + "grad_norm": 0.4188547510844498, + "grad_max_sv": 0.25715495869517324, + "grad_min_sv": 2.4195212988686877e-08, + "grad_condition": 10755821.867443344, + "lr": 0.00010492249381215483, + "time_sec": 49.46640372276306 + }, + { + "epoch": 80, + "train_loss": 0.6579594387054444, + "train_acc": 0.76406, + "test_loss": 2.328022619628906, + "test_acc": 0.4922, + "lyapunov": null, + "grad_norm": 0.41446019268915407, + "grad_max_sv": 0.2467421844601631, + "grad_min_sv": 2.3609747978881047e-08, + "grad_condition": 10542743.78062649, + "lr": 9.549150281252637e-05, + "time_sec": 49.47466158866882 + }, + { + "epoch": 81, + "train_loss": 0.6575078699111938, + "train_acc": 0.76504, + "test_loss": 2.435921426773071, + "test_acc": 0.4706, + "lyapunov": null, + "grad_norm": 0.41722587257024396, + "grad_max_sv": 0.2460654556751251, + "grad_min_sv": 2.2818005085412097e-08, + "grad_condition": 10871762.933690486, + "lr": 8.645971286271918e-05, + "time_sec": 49.48575758934021 + }, + { + "epoch": 82, + "train_loss": 0.6540266362380981, + "train_acc": 0.7668, + "test_loss": 2.420010438537598, + "test_acc": 0.4873, + "lyapunov": null, + "grad_norm": 0.4134489054266664, + "grad_max_sv": 0.24872095324099064, + "grad_min_sv": 2.4063159953513492e-08, + "grad_condition": 10418409.724400165, + "lr": 7.78360372489926e-05, + "time_sec": 49.4517502784729 + }, + { + "epoch": 83, + "train_loss": 0.6572029878616333, + "train_acc": 0.76728, + "test_loss": 2.509574550628662, + "test_acc": 0.4741, + "lyapunov": null, + "grad_norm": 0.40888921626022273, + "grad_max_sv": 0.24261515885591506, + "grad_min_sv": 2.325806733871616e-08, + "grad_condition": 10519103.211694924, + "lr": 6.962898649802815e-05, + "time_sec": 49.47699522972107 + }, + { + "epoch": 84, + "train_loss": 0.648239343738556, + "train_acc": 0.76774, + "test_loss": 2.2645148223876954, + "test_acc": 0.485, + "lyapunov": null, + "grad_norm": 0.4120785615672335, + "grad_max_sv": 0.24379208087921142, + "grad_min_sv": 2.272370744904606e-08, + "grad_condition": 10771039.526767144, + "lr": 6.184665997806824e-05, + "time_sec": 49.461183071136475 + }, + { + "epoch": 85, + "train_loss": 0.6412541982460022, + "train_acc": 0.77106, + "test_loss": 2.5437144912719725, + "test_acc": 0.4865, + "lyapunov": null, + "grad_norm": 0.41805406865324773, + "grad_max_sv": 0.2572408441454172, + "grad_min_sv": 2.2814066324983172e-08, + "grad_condition": 11337861.01159941, + "lr": 5.449673790581613e-05, + "time_sec": 49.47793769836426 + }, + { + "epoch": 86, + "train_loss": 0.6463544520187378, + "train_acc": 0.76662, + "test_loss": 2.9264222496032715, + "test_acc": 0.4471, + "lyapunov": null, + "grad_norm": 0.4118969055764605, + "grad_max_sv": 0.2387235414236784, + "grad_min_sv": 2.2642364694291928e-08, + "grad_condition": 10550361.803450387, + "lr": 4.758647376699034e-05, + "time_sec": 49.4726197719574 + }, + { + "epoch": 87, + "train_loss": 0.6428634425735473, + "train_acc": 0.7704, + "test_loss": 2.5568968086242676, + "test_acc": 0.4759, + "lyapunov": null, + "grad_norm": 0.415046593792845, + "grad_max_sv": 0.2535580638796091, + "grad_min_sv": 2.363120126247509e-08, + "grad_condition": 10837761.433894884, + "lr": 4.112268715800956e-05, + "time_sec": 49.48099684715271 + }, + { + "epoch": 88, + "train_loss": 0.6407405834579468, + "train_acc": 0.77184, + "test_loss": 2.4600058319091795, + "test_acc": 0.475, + "lyapunov": null, + "grad_norm": 0.4135582126787873, + "grad_max_sv": 0.25508003048598765, + "grad_min_sv": 2.376858407870941e-08, + "grad_condition": 10837781.081215866, + "lr": 3.511175705587434e-05, + "time_sec": 49.47017812728882 + }, + { + "epoch": 89, + "train_loss": 0.6344939192008973, + "train_acc": 0.77288, + "test_loss": 2.4250204902648926, + "test_acc": 0.4787, + "lyapunov": null, + "grad_norm": 0.4160361292383021, + "grad_max_sv": 0.25198650658130645, + "grad_min_sv": 2.3671872506625392e-08, + "grad_condition": 10764847.245073054, + "lr": 2.9559615522887284e-05, + "time_sec": 49.48287224769592 + }, + { + "epoch": 90, + "train_loss": 0.6344009274482727, + "train_acc": 0.77354, + "test_loss": 2.7001010314941407, + "test_acc": 0.4623, + "lyapunov": null, + "grad_norm": 0.4089648902673904, + "grad_max_sv": 0.24975020438432693, + "grad_min_sv": 2.2971467306120984e-08, + "grad_condition": 10990208.207150657, + "lr": 2.447174185242324e-05, + "time_sec": 49.50636339187622 + }, + { + "epoch": 91, + "train_loss": 0.6388888354110718, + "train_acc": 0.77322, + "test_loss": 2.4007692584991456, + "test_acc": 0.482, + "lyapunov": null, + "grad_norm": 0.41394740295503574, + "grad_max_sv": 0.24785541072487832, + "grad_min_sv": 2.4093225903243366e-08, + "grad_condition": 10380601.978368312, + "lr": 1.9853157161528526e-05, + "time_sec": 49.47446608543396 + }, + { + "epoch": 92, + "train_loss": 0.6364776765632629, + "train_acc": 0.7745, + "test_loss": 2.399016780090332, + "test_acc": 0.4893, + "lyapunov": null, + "grad_norm": 0.4144776850028884, + "grad_max_sv": 0.23398316986858844, + "grad_min_sv": 2.3364770829203963e-08, + "grad_condition": 10152213.637178902, + "lr": 1.570841943568452e-05, + "time_sec": 49.4903450012207 + }, + { + "epoch": 93, + "train_loss": 0.6323039393615723, + "train_acc": 0.7761, + "test_loss": 2.5661166526794434, + "test_acc": 0.4799, + "lyapunov": null, + "grad_norm": 0.4148058440423859, + "grad_max_sv": 0.25038140527904035, + "grad_min_sv": 2.3675201843431638e-08, + "grad_condition": 10621575.74650034, + "lr": 1.204161903062634e-05, + "time_sec": 49.47283339500427 + }, + { + "epoch": 94, + "train_loss": 0.6312036778831482, + "train_acc": 0.77456, + "test_loss": 2.4954245025634765, + "test_acc": 0.4884, + "lyapunov": null, + "grad_norm": 0.41190158928123094, + "grad_max_sv": 0.23922828286886216, + "grad_min_sv": 2.3207600818864195e-08, + "grad_condition": 10426944.434691576, + "lr": 8.85637463565564e-06, + "time_sec": 49.4705286026001 + }, + { + "epoch": 95, + "train_loss": 0.631898609752655, + "train_acc": 0.77374, + "test_loss": 2.496735878753662, + "test_acc": 0.484, + "lyapunov": null, + "grad_norm": 0.4118919272482802, + "grad_max_sv": 0.2545221421867609, + "grad_min_sv": 2.265429692727139e-08, + "grad_condition": 11229071.176658351, + "lr": 6.155829702431171e-06, + "time_sec": 49.45284724235535 + }, + { + "epoch": 96, + "train_loss": 0.6379076655197143, + "train_acc": 0.77178, + "test_loss": 2.6363272483825684, + "test_acc": 0.476, + "lyapunov": null, + "grad_norm": 0.4109637736779776, + "grad_max_sv": 0.23244931511580944, + "grad_min_sv": 2.2822463163763017e-08, + "grad_condition": 10301145.344649881, + "lr": 3.942649342761118e-06, + "time_sec": 49.47940802574158 + }, + { + "epoch": 97, + "train_loss": 0.6325872544288635, + "train_acc": 0.77334, + "test_loss": 2.7118479751586912, + "test_acc": 0.4606, + "lyapunov": null, + "grad_norm": 0.4111072193471729, + "grad_max_sv": 0.23797121047973632, + "grad_min_sv": 2.2607291239040707e-08, + "grad_condition": 10688228.14219837, + "lr": 2.2190176984600023e-06, + "time_sec": 49.482439041137695 + }, + { + "epoch": 98, + "train_loss": 0.6342727423286438, + "train_acc": 0.77484, + "test_loss": 2.50120391998291, + "test_acc": 0.4868, + "lyapunov": null, + "grad_norm": 0.4137394255148928, + "grad_max_sv": 0.24089130759239197, + "grad_min_sv": 2.424639040654597e-08, + "grad_condition": 10056603.153747398, + "lr": 9.866357858642206e-07, + "time_sec": 49.48271298408508 + }, + { + "epoch": 99, + "train_loss": 0.628259766407013, + "train_acc": 0.77486, + "test_loss": 2.447319179916382, + "test_acc": 0.4885, + "lyapunov": null, + "grad_norm": 0.4076037809536703, + "grad_max_sv": 0.25056461431086063, + "grad_min_sv": 2.3701171647516616e-08, + "grad_condition": 10626762.207877642, + "lr": 2.467198171342e-07, + "time_sec": 49.45984363555908 + }, + { + "epoch": 100, + "train_loss": 0.6313758395767212, + "train_acc": 0.77534, + "test_loss": 2.4442952224731447, + "test_acc": 0.4905, + "lyapunov": null, + "grad_norm": 0.40858498927976306, + "grad_max_sv": 0.23060753419995308, + "grad_min_sv": 2.2785150743942496e-08, + "grad_condition": 10116355.973472353, + "lr": 0.0, + "time_sec": 49.46379518508911 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 2.717775194091797, + "train_acc": 0.12228, + "test_loss": 3.3459623817443847, + "test_acc": 0.1, + "lyapunov": null, + "grad_norm": 7.716699984005914, + "grad_max_sv": 7.287460565567017, + "grad_min_sv": 2.5165389772041635e-07, + "grad_condition": 29456429.211788226, + "lr": 0.0009997532801828658, + "time_sec": 66.53277444839478 + }, + { + "epoch": 2, + "train_loss": 2.2721379792785643, + "train_acc": 0.17654, + "test_loss": 4.04989028930664, + "test_acc": 0.1003, + "lyapunov": null, + "grad_norm": 6.63637414556116, + "grad_max_sv": 6.237935948371887, + "grad_min_sv": 2.2601446723058415e-07, + "grad_condition": 28188789.96425259, + "lr": 0.0009990133642141358, + "time_sec": 66.55316853523254 + }, + { + "epoch": 3, + "train_loss": 2.137921618881226, + "train_acc": 0.2105, + "test_loss": 5.869428012084961, + "test_acc": 0.1011, + "lyapunov": null, + "grad_norm": 5.7520031644476814, + "grad_max_sv": 5.452845233678818, + "grad_min_sv": 1.9201941405810886e-07, + "grad_condition": 28919609.465649594, + "lr": 0.00099778098230154, + "time_sec": 66.56071186065674 + }, + { + "epoch": 4, + "train_loss": 2.0486733519744873, + "train_acc": 0.23394, + "test_loss": 5.161107911682129, + "test_acc": 0.1097, + "lyapunov": null, + "grad_norm": 4.91519980042541, + "grad_max_sv": 4.5814680576324465, + "grad_min_sv": 1.6788343710771868e-07, + "grad_condition": 27707547.33712595, + "lr": 0.000996057350657239, + "time_sec": 66.55148816108704 + }, + { + "epoch": 5, + "train_loss": 1.9897926804351806, + "train_acc": 0.25822, + "test_loss": 4.115356592559815, + "test_acc": 0.1203, + "lyapunov": null, + "grad_norm": 4.476936137063571, + "grad_max_sv": 4.264879077672958, + "grad_min_sv": 1.6287330311115512e-07, + "grad_condition": 27434565.90350554, + "lr": 0.0009938441702975688, + "time_sec": 66.53483939170837 + }, + { + "epoch": 6, + "train_loss": 1.950422788543701, + "train_acc": 0.26598, + "test_loss": 6.161662875366211, + "test_acc": 0.1038, + "lyapunov": null, + "grad_norm": 4.078084494569751, + "grad_max_sv": 3.8316186487674715, + "grad_min_sv": 1.5860823996405315e-07, + "grad_condition": 24946451.178036533, + "lr": 0.0009911436253643444, + "time_sec": 66.544926404953 + }, + { + "epoch": 7, + "train_loss": 1.9193549822998046, + "train_acc": 0.28804, + "test_loss": 6.333303915405273, + "test_acc": 0.1006, + "lyapunov": null, + "grad_norm": 3.9544625089709906, + "grad_max_sv": 3.660486602783203, + "grad_min_sv": 1.3159545346752567e-07, + "grad_condition": 27858533.203216422, + "lr": 0.0009879583809693736, + "time_sec": 66.54343152046204 + }, + { + "epoch": 8, + "train_loss": 1.8974505254364014, + "train_acc": 0.29166, + "test_loss": 6.595959260559082, + "test_acc": 0.1052, + "lyapunov": null, + "grad_norm": 3.7716319720252063, + "grad_max_sv": 3.4488155782222747, + "grad_min_sv": 1.3156188991558792e-07, + "grad_condition": 26979104.149509914, + "lr": 0.0009842915805643154, + "time_sec": 66.53689360618591 + }, + { + "epoch": 9, + "train_loss": 1.8757565868377686, + "train_acc": 0.2988, + "test_loss": 8.294800563049316, + "test_acc": 0.1001, + "lyapunov": null, + "grad_norm": 3.606736816077247, + "grad_max_sv": 3.276396805047989, + "grad_min_sv": 1.2148574111137122e-07, + "grad_condition": 27354129.68622259, + "lr": 0.0009801468428384714, + "time_sec": 66.53859829902649 + }, + { + "epoch": 10, + "train_loss": 1.853810763168335, + "train_acc": 0.30818, + "test_loss": 7.528170121765137, + "test_acc": 0.1002, + "lyapunov": null, + "grad_norm": 3.590286745766664, + "grad_max_sv": 3.3836376488208773, + "grad_min_sv": 1.2300289498057282e-07, + "grad_condition": 28478996.179412544, + "lr": 0.0009755282581475767, + "time_sec": 66.54752492904663 + }, + { + "epoch": 11, + "train_loss": 1.8360865605926513, + "train_acc": 0.31554, + "test_loss": 8.300324632263184, + "test_acc": 0.1004, + "lyapunov": null, + "grad_norm": 3.4184867147228633, + "grad_max_sv": 3.2137346804141997, + "grad_min_sv": 1.2349632871888616e-07, + "grad_condition": 27052165.93028751, + "lr": 0.0009704403844771127, + "time_sec": 66.54567265510559 + }, + { + "epoch": 12, + "train_loss": 1.822631957397461, + "train_acc": 0.32436, + "test_loss": 7.752643719482422, + "test_acc": 0.1021, + "lyapunov": null, + "grad_norm": 3.4268104192911824, + "grad_max_sv": 3.0984551936388014, + "grad_min_sv": 1.1916837276970682e-07, + "grad_condition": 26678795.929163624, + "lr": 0.0009648882429441257, + "time_sec": 66.54143714904785 + }, + { + "epoch": 13, + "train_loss": 1.8042937320327759, + "train_acc": 0.33052, + "test_loss": 6.320642838287354, + "test_acc": 0.1016, + "lyapunov": null, + "grad_norm": 3.26500321242579, + "grad_max_sv": 3.034997683763504, + "grad_min_sv": 1.1198519924704443e-07, + "grad_condition": 27516714.34616376, + "lr": 0.0009588773128419905, + "time_sec": 66.54663801193237 + }, + { + "epoch": 14, + "train_loss": 1.7935633684539796, + "train_acc": 0.33378, + "test_loss": 8.591533955383301, + "test_acc": 0.1001, + "lyapunov": null, + "grad_norm": 3.205935962438017, + "grad_max_sv": 2.9335897117853165, + "grad_min_sv": 1.0952790088225584e-07, + "grad_condition": 27285541.83012454, + "lr": 0.0009524135262330098, + "time_sec": 66.54473447799683 + }, + { + "epoch": 15, + "train_loss": 1.7773359481811524, + "train_acc": 0.34102, + "test_loss": 9.823327029418945, + "test_acc": 0.1, + "lyapunov": null, + "grad_norm": 3.107803718888726, + "grad_max_sv": 2.8818213611841204, + "grad_min_sv": 1.1047076302617142e-07, + "grad_condition": 26466849.950957365, + "lr": 0.0009455032620941839, + "time_sec": 66.54632878303528 + }, + { + "epoch": 16, + "train_loss": 1.7638415741348266, + "train_acc": 0.3494, + "test_loss": 10.98111782836914, + "test_acc": 0.1, + "lyapunov": null, + "grad_norm": 2.991047436873543, + "grad_max_sv": 2.6788798362016677, + "grad_min_sv": 9.756340197952796e-08, + "grad_condition": 27546377.57163794, + "lr": 0.0009381533400219318, + "time_sec": 66.5387659072876 + }, + { + "epoch": 17, + "train_loss": 1.7545028717422486, + "train_acc": 0.3524, + "test_loss": 8.496100090026856, + "test_acc": 0.1005, + "lyapunov": null, + "grad_norm": 2.9405206102474817, + "grad_max_sv": 2.7797821670770646, + "grad_min_sv": 1.0545847413112597e-07, + "grad_condition": 26402272.837948732, + "lr": 0.0009303710135019719, + "time_sec": 66.53228521347046 + }, + { + "epoch": 18, + "train_loss": 1.7399513541412353, + "train_acc": 0.35946, + "test_loss": 9.442770735168457, + "test_acc": 0.1002, + "lyapunov": null, + "grad_norm": 2.876673477887061, + "grad_max_sv": 2.652202320098877, + "grad_min_sv": 1.0433013795108081e-07, + "grad_condition": 26098642.755907767, + "lr": 0.0009221639627510076, + "time_sec": 66.52799201011658 + }, + { + "epoch": 19, + "train_loss": 1.7275141513061523, + "train_acc": 0.36564, + "test_loss": 8.60740804901123, + "test_acc": 0.1, + "lyapunov": null, + "grad_norm": 2.820914668477109, + "grad_max_sv": 2.8074967473745347, + "grad_min_sv": 1.0515814725664541e-07, + "grad_condition": 27554948.172257036, + "lr": 0.000913540287137281, + "time_sec": 66.53072094917297 + }, + { + "epoch": 20, + "train_loss": 1.7184981283187866, + "train_acc": 0.36706, + "test_loss": 5.74347527923584, + "test_acc": 0.1074, + "lyapunov": null, + "grad_norm": 2.755999508826315, + "grad_max_sv": 2.4683564633131025, + "grad_min_sv": 9.147877104709323e-08, + "grad_condition": 27108387.83832861, + "lr": 0.0009045084971874739, + "time_sec": 66.53930997848511 + }, + { + "epoch": 21, + "train_loss": 1.7127495180892944, + "train_acc": 0.36988, + "test_loss": 5.374083380126953, + "test_acc": 0.1038, + "lyapunov": null, + "grad_norm": 2.7076782774581156, + "grad_max_sv": 2.415825995802879, + "grad_min_sv": 9.989069553739682e-08, + "grad_condition": 24996642.26521779, + "lr": 0.0008950775061878452, + "time_sec": 66.5274007320404 + }, + { + "epoch": 22, + "train_loss": 1.7080568863677978, + "train_acc": 0.37366, + "test_loss": 5.8365667526245115, + "test_acc": 0.1074, + "lyapunov": null, + "grad_norm": 2.777540200252398, + "grad_max_sv": 2.682383918762207, + "grad_min_sv": 1.0115953053002613e-07, + "grad_condition": 27062321.26943115, + "lr": 0.0008852566213878947, + "time_sec": 66.52736306190491 + }, + { + "epoch": 23, + "train_loss": 1.6937433179473877, + "train_acc": 0.378, + "test_loss": 5.908844201660156, + "test_acc": 0.102, + "lyapunov": null, + "grad_norm": 2.5943120813718052, + "grad_max_sv": 2.4230685472488402, + "grad_min_sv": 9.802377860523848e-08, + "grad_condition": 25663315.966033876, + "lr": 0.0008750555348152298, + "time_sec": 66.55514574050903 + }, + { + "epoch": 24, + "train_loss": 1.685849613647461, + "train_acc": 0.38486, + "test_loss": 6.484691570281982, + "test_acc": 0.1015, + "lyapunov": null, + "grad_norm": 2.470392685402757, + "grad_max_sv": 2.3409340023994445, + "grad_min_sv": 9.386610759776204e-08, + "grad_condition": 25307930.60423732, + "lr": 0.0008644843137107057, + "time_sec": 66.55581784248352 + }, + { + "epoch": 25, + "train_loss": 1.6830421477890014, + "train_acc": 0.38556, + "test_loss": 7.468188558959961, + "test_acc": 0.1022, + "lyapunov": null, + "grad_norm": 2.548563020510745, + "grad_max_sv": 2.1459918454289437, + "grad_min_sv": 8.803468158902205e-08, + "grad_condition": 24944715.33907653, + "lr": 0.0008535533905932737, + "time_sec": 66.53887248039246 + }, + { + "epoch": 26, + "train_loss": 1.6700520505523682, + "train_acc": 0.38856, + "test_loss": 7.895222584533691, + "test_acc": 0.1009, + "lyapunov": null, + "grad_norm": 2.5359070370837204, + "grad_max_sv": 2.4539994060993195, + "grad_min_sv": 9.640742533179037e-08, + "grad_condition": 26335532.748314124, + "lr": 0.0008422735529643444, + "time_sec": 66.54404091835022 + }, + { + "epoch": 27, + "train_loss": 1.6605180406951905, + "train_acc": 0.39334, + "test_loss": 6.994429248046875, + "test_acc": 0.101, + "lyapunov": null, + "grad_norm": 2.4258405770471474, + "grad_max_sv": 2.320448189973831, + "grad_min_sv": 9.107987271050888e-08, + "grad_condition": 26102152.790860306, + "lr": 0.0008306559326618259, + "time_sec": 66.53805947303772 + }, + { + "epoch": 28, + "train_loss": 1.6567610062408447, + "train_acc": 0.395, + "test_loss": 6.368250694274902, + "test_acc": 0.1099, + "lyapunov": null, + "grad_norm": 2.4482138479454654, + "grad_max_sv": 2.1421856224536895, + "grad_min_sv": 8.29846632299791e-08, + "grad_condition": 25968573.760956615, + "lr": 0.0008187119948743449, + "time_sec": 66.56613659858704 + }, + { + "epoch": 29, + "train_loss": 1.643007601623535, + "train_acc": 0.39978, + "test_loss": 5.360125735473633, + "test_acc": 0.1039, + "lyapunov": null, + "grad_norm": 2.4260201472737237, + "grad_max_sv": 2.2909662395715715, + "grad_min_sv": 9.427450295973471e-08, + "grad_condition": 24999199.08130427, + "lr": 0.0008064535268264883, + "time_sec": 66.5019998550415 + }, + { + "epoch": 30, + "train_loss": 1.6426652933120727, + "train_acc": 0.40242, + "test_loss": 5.846046133422852, + "test_acc": 0.1054, + "lyapunov": null, + "grad_norm": 2.4104230560175877, + "grad_max_sv": 2.2003868728876115, + "grad_min_sv": 8.557402386699664e-08, + "grad_condition": 26105024.01238749, + "lr": 0.0007938926261462367, + "time_sec": 66.54244065284729 + }, + { + "epoch": 31, + "train_loss": 1.6377650901031495, + "train_acc": 0.4032, + "test_loss": 5.6720462432861325, + "test_acc": 0.1037, + "lyapunov": null, + "grad_norm": 2.3941082742204367, + "grad_max_sv": 2.1774697691202163, + "grad_min_sv": 8.963231525882521e-08, + "grad_condition": 24809583.231536172, + "lr": 0.0007810416889260654, + "time_sec": 66.54210758209229 + }, + { + "epoch": 32, + "train_loss": 1.6306892547607421, + "train_acc": 0.40602, + "test_loss": 6.530587504577637, + "test_acc": 0.1021, + "lyapunov": null, + "grad_norm": 2.310788163521601, + "grad_max_sv": 2.3168098986148835, + "grad_min_sv": 8.591319300421674e-08, + "grad_condition": 27429040.418645225, + "lr": 0.0007679133974894983, + "time_sec": 66.54988598823547 + }, + { + "epoch": 33, + "train_loss": 1.616210421142578, + "train_acc": 0.41068, + "test_loss": 6.481897874450683, + "test_acc": 0.1047, + "lyapunov": null, + "grad_norm": 2.280822445658443, + "grad_max_sv": 2.0465356022119523, + "grad_min_sv": 8.811248948248363e-08, + "grad_condition": 23945215.471904326, + "lr": 0.0007545207078751857, + "time_sec": 66.54384207725525 + }, + { + "epoch": 34, + "train_loss": 1.6103173712921142, + "train_acc": 0.4129, + "test_loss": 7.558738642883301, + "test_acc": 0.1004, + "lyapunov": null, + "grad_norm": 2.268328370380239, + "grad_max_sv": 1.9925297170877456, + "grad_min_sv": 8.015654646698067e-08, + "grad_condition": 25172747.9746131, + "lr": 0.0007408768370508577, + "time_sec": 66.53899669647217 + }, + { + "epoch": 35, + "train_loss": 1.6033166294860839, + "train_acc": 0.41878, + "test_loss": 7.87334995880127, + "test_acc": 0.1014, + "lyapunov": null, + "grad_norm": 2.1857354046879727, + "grad_max_sv": 1.9975714191794396, + "grad_min_sv": 7.650004620884943e-08, + "grad_condition": 26089987.057969414, + "lr": 0.0007269952498697734, + "time_sec": 66.5277693271637 + }, + { + "epoch": 36, + "train_loss": 1.6046894992446898, + "train_acc": 0.41892, + "test_loss": 8.474886727905274, + "test_acc": 0.1054, + "lyapunov": null, + "grad_norm": 2.192178860403557, + "grad_max_sv": 2.002661418914795, + "grad_min_sv": 8.41961090181087e-08, + "grad_condition": 24123592.75292515, + "lr": 0.0007128896457825364, + "time_sec": 66.54011392593384 + }, + { + "epoch": 37, + "train_loss": 1.5938314058685303, + "train_acc": 0.42164, + "test_loss": 7.729584867858887, + "test_acc": 0.1023, + "lyapunov": null, + "grad_norm": 2.181177891654343, + "grad_max_sv": 2.0365157604217528, + "grad_min_sv": 8.0202053975853e-08, + "grad_condition": 26197254.249608647, + "lr": 0.0006985739453173903, + "time_sec": 66.53632307052612 + }, + { + "epoch": 38, + "train_loss": 1.5886405113220214, + "train_acc": 0.42264, + "test_loss": 5.7885481513977055, + "test_acc": 0.1062, + "lyapunov": null, + "grad_norm": 2.138587269147521, + "grad_max_sv": 1.933423602581024, + "grad_min_sv": 7.520017115680844e-08, + "grad_condition": 25928003.19539905, + "lr": 0.0006840622763423391, + "time_sec": 66.54145908355713 + }, + { + "epoch": 39, + "train_loss": 1.5804911177825929, + "train_acc": 0.42612, + "test_loss": 6.7240009689331055, + "test_acc": 0.106, + "lyapunov": null, + "grad_norm": 2.146582724428281, + "grad_max_sv": 1.8961839854717255, + "grad_min_sv": 7.674624242781647e-08, + "grad_condition": 24938086.191727363, + "lr": 0.0006693689601226458, + "time_sec": 66.54460453987122 + }, + { + "epoch": 40, + "train_loss": 1.5785979819488525, + "train_acc": 0.42734, + "test_loss": 6.793812344360352, + "test_acc": 0.1033, + "lyapunov": null, + "grad_norm": 2.0524354853565967, + "grad_max_sv": 1.9275713503360747, + "grad_min_sv": 7.654831097880788e-08, + "grad_condition": 25599705.595900334, + "lr": 0.0006545084971874737, + "time_sec": 66.78280329704285 + }, + { + "epoch": 41, + "train_loss": 1.5828138892364503, + "train_acc": 0.42612, + "test_loss": 6.44511951751709, + "test_acc": 0.1052, + "lyapunov": null, + "grad_norm": 2.1085813246105163, + "grad_max_sv": 1.9095334649085998, + "grad_min_sv": 7.941251247700621e-08, + "grad_condition": 24686632.04929278, + "lr": 0.0006394955530196147, + "time_sec": 66.53900074958801 + }, + { + "epoch": 42, + "train_loss": 1.5717257321548461, + "train_acc": 0.42996, + "test_loss": 8.174863388061523, + "test_acc": 0.1011, + "lyapunov": null, + "grad_norm": 2.0568855518830627, + "grad_max_sv": 1.8603438019752503, + "grad_min_sv": 8.168111662598676e-08, + "grad_condition": 23782864.12280636, + "lr": 0.0006243449435824273, + "time_sec": 66.54205513000488 + }, + { + "epoch": 43, + "train_loss": 1.562401286239624, + "train_acc": 0.43392, + "test_loss": 7.7131751495361325, + "test_acc": 0.1014, + "lyapunov": null, + "grad_norm": 2.0119184672620642, + "grad_max_sv": 1.8657386392354964, + "grad_min_sv": 7.582975278808135e-08, + "grad_condition": 24942971.18450144, + "lr": 0.0006090716206982714, + "time_sec": 66.53042316436768 + }, + { + "epoch": 44, + "train_loss": 1.5541102393341064, + "train_acc": 0.43712, + "test_loss": 8.247987678527831, + "test_acc": 0.1011, + "lyapunov": null, + "grad_norm": 1.9482695609274137, + "grad_max_sv": 1.6971077546477318, + "grad_min_sv": 7.249982623136474e-08, + "grad_condition": 23783887.230844818, + "lr": 0.0005936906572928625, + "time_sec": 66.5365047454834 + }, + { + "epoch": 45, + "train_loss": 1.551253000793457, + "train_acc": 0.43906, + "test_loss": 7.164133547973633, + "test_acc": 0.1021, + "lyapunov": null, + "grad_norm": 1.9478309625288126, + "grad_max_sv": 1.7972041130065919, + "grad_min_sv": 7.798710131012853e-08, + "grad_condition": 23697966.26066207, + "lr": 0.0005782172325201156, + "time_sec": 66.54136061668396 + }, + { + "epoch": 46, + "train_loss": 1.541000611190796, + "train_acc": 0.44134, + "test_loss": 6.376314013671875, + "test_acc": 0.1045, + "lyapunov": null, + "grad_norm": 1.8630241109997108, + "grad_max_sv": 1.6913443714380265, + "grad_min_sv": 7.214549819778427e-08, + "grad_condition": 23808757.926116575, + "lr": 0.0005626666167821523, + "time_sec": 66.55902171134949 + }, + { + "epoch": 47, + "train_loss": 1.5372591391754151, + "train_acc": 0.44398, + "test_loss": 6.5030721710205075, + "test_acc": 0.1069, + "lyapunov": null, + "grad_norm": 1.9024590490680153, + "grad_max_sv": 1.814224436879158, + "grad_min_sv": 7.368249033135044e-08, + "grad_condition": 25117471.09981022, + "lr": 0.0005470541566592572, + "time_sec": 66.52199673652649 + }, + { + "epoch": 48, + "train_loss": 1.5375283456802369, + "train_acc": 0.44544, + "test_loss": 7.119714102935791, + "test_acc": 0.1016, + "lyapunov": null, + "grad_norm": 1.8585907694205182, + "grad_max_sv": 1.7394830703735351, + "grad_min_sv": 7.501465217885084e-08, + "grad_condition": 23906344.012628905, + "lr": 0.0005313952597646569, + "time_sec": 66.54580640792847 + }, + { + "epoch": 49, + "train_loss": 1.5338307555770874, + "train_acc": 0.4442, + "test_loss": 5.397337831115722, + "test_acc": 0.1059, + "lyapunov": null, + "grad_norm": 1.7902731589528738, + "grad_max_sv": 1.6494132414460183, + "grad_min_sv": 6.831805556828386e-08, + "grad_condition": 24615282.56582328, + "lr": 0.0005157053795390643, + "time_sec": 66.53534126281738 + }, + { + "epoch": 50, + "train_loss": 1.5284276412963866, + "train_acc": 0.44778, + "test_loss": 5.524033654785156, + "test_acc": 0.1078, + "lyapunov": null, + "grad_norm": 1.7713612838130008, + "grad_max_sv": 1.5726667106151582, + "grad_min_sv": 6.907176626214096e-08, + "grad_condition": 22960902.516891498, + "lr": 0.0005000000000000002, + "time_sec": 66.5325882434845 + }, + { + "epoch": 51, + "train_loss": 1.5330605014801026, + "train_acc": 0.44666, + "test_loss": 6.847183532714844, + "test_acc": 0.1031, + "lyapunov": null, + "grad_norm": 1.7792073911302086, + "grad_max_sv": 1.6382696747779846, + "grad_min_sv": 6.6116589625409e-08, + "grad_condition": 24861349.651776347, + "lr": 0.00048429462046093607, + "time_sec": 66.53938388824463 + }, + { + "epoch": 52, + "train_loss": 1.515211699180603, + "train_acc": 0.45132, + "test_loss": 6.849605633544922, + "test_acc": 0.1046, + "lyapunov": null, + "grad_norm": 1.7110848232260776, + "grad_max_sv": 1.4070507645606996, + "grad_min_sv": 6.268320333902011e-08, + "grad_condition": 22502851.341604523, + "lr": 0.0004686047402353435, + "time_sec": 66.54575228691101 + }, + { + "epoch": 53, + "train_loss": 1.511851570777893, + "train_acc": 0.44984, + "test_loss": 6.742161424255371, + "test_acc": 0.1035, + "lyapunov": null, + "grad_norm": 1.6990701953393579, + "grad_max_sv": 1.5247679650783539, + "grad_min_sv": 6.360552236017725e-08, + "grad_condition": 24187524.31056104, + "lr": 0.000452945843340743, + "time_sec": 66.55630564689636 + }, + { + "epoch": 54, + "train_loss": 1.5134658539581298, + "train_acc": 0.45194, + "test_loss": 6.076722029113769, + "test_acc": 0.1055, + "lyapunov": null, + "grad_norm": 1.67595650149666, + "grad_max_sv": 1.521102523803711, + "grad_min_sv": 6.705203148271721e-08, + "grad_condition": 23102185.373464666, + "lr": 0.00043733338321784806, + "time_sec": 66.54796624183655 + }, + { + "epoch": 55, + "train_loss": 1.5127635479736328, + "train_acc": 0.45416, + "test_loss": 6.099140180969238, + "test_acc": 0.1054, + "lyapunov": null, + "grad_norm": 1.669713615396416, + "grad_max_sv": 1.4162977203726768, + "grad_min_sv": 5.9198181379116475e-08, + "grad_condition": 24265418.333155036, + "lr": 0.0004217827674798847, + "time_sec": 66.56652212142944 + }, + { + "epoch": 56, + "train_loss": 1.5037149493789672, + "train_acc": 0.45674, + "test_loss": 5.881203063964843, + "test_acc": 0.106, + "lyapunov": null, + "grad_norm": 1.6488336383475701, + "grad_max_sv": 1.5071144998073578, + "grad_min_sv": 6.376719170475554e-08, + "grad_condition": 23818554.434521496, + "lr": 0.00040630934270713783, + "time_sec": 66.53574323654175 + }, + { + "epoch": 57, + "train_loss": 1.504850189590454, + "train_acc": 0.459, + "test_loss": 5.68402534790039, + "test_acc": 0.1076, + "lyapunov": null, + "grad_norm": 1.6129911107480968, + "grad_max_sv": 1.4527282550930978, + "grad_min_sv": 6.286840470437483e-08, + "grad_condition": 23483060.334747117, + "lr": 0.000390928379301729, + "time_sec": 66.54559707641602 + }, + { + "epoch": 58, + "train_loss": 1.4977053466033936, + "train_acc": 0.45916, + "test_loss": 5.9823997062683105, + "test_acc": 0.1071, + "lyapunov": null, + "grad_norm": 1.6061924832487942, + "grad_max_sv": 1.3888853162527084, + "grad_min_sv": 6.253125484079192e-08, + "grad_condition": 22608679.418678027, + "lr": 0.0003756550564175727, + "time_sec": 66.55387783050537 + }, + { + "epoch": 59, + "train_loss": 1.4972542272949219, + "train_acc": 0.45872, + "test_loss": 5.0882811370849605, + "test_acc": 0.1151, + "lyapunov": null, + "grad_norm": 1.5591682163016796, + "grad_max_sv": 1.3346713334321976, + "grad_min_sv": 5.8280132453347735e-08, + "grad_condition": 23069467.539254077, + "lr": 0.00036050444698038553, + "time_sec": 66.54211473464966 + }, + { + "epoch": 60, + "train_loss": 1.4907029873657227, + "train_acc": 0.46126, + "test_loss": 7.020564842224121, + "test_acc": 0.1048, + "lyapunov": null, + "grad_norm": 1.5345406038505094, + "grad_max_sv": 1.4284722179174423, + "grad_min_sv": 6.001468877414595e-08, + "grad_condition": 24162295.485593982, + "lr": 0.00034549150281252655, + "time_sec": 66.55491805076599 + }, + { + "epoch": 61, + "train_loss": 1.4877613472366333, + "train_acc": 0.4653, + "test_loss": 4.854167632293701, + "test_acc": 0.1114, + "lyapunov": null, + "grad_norm": 1.5324361061772793, + "grad_max_sv": 1.325933101773262, + "grad_min_sv": 5.964644183009682e-08, + "grad_condition": 22280923.908054985, + "lr": 0.0003306310398773544, + "time_sec": 66.54050326347351 + }, + { + "epoch": 62, + "train_loss": 1.4875999914550782, + "train_acc": 0.4609, + "test_loss": 6.024991397094727, + "test_acc": 0.1045, + "lyapunov": null, + "grad_norm": 1.5157035873578593, + "grad_max_sv": 1.2820105284452439, + "grad_min_sv": 5.6854590901878056e-08, + "grad_condition": 22744392.831777684, + "lr": 0.00031593772365766127, + "time_sec": 66.56322026252747 + }, + { + "epoch": 63, + "train_loss": 1.4804442275238037, + "train_acc": 0.46586, + "test_loss": 6.877338618469238, + "test_acc": 0.1028, + "lyapunov": null, + "grad_norm": 1.5037529747226948, + "grad_max_sv": 1.3301736950874328, + "grad_min_sv": 6.064568385255597e-08, + "grad_condition": 22458783.805724658, + "lr": 0.0003014260546826097, + "time_sec": 66.55420660972595 + }, + { + "epoch": 64, + "train_loss": 1.4785625118637085, + "train_acc": 0.4676, + "test_loss": 5.8289501716613765, + "test_acc": 0.1058, + "lyapunov": null, + "grad_norm": 1.4955609555476688, + "grad_max_sv": 1.2231090664863586, + "grad_min_sv": 5.909942020210224e-08, + "grad_condition": 21200746.17398096, + "lr": 0.0002871103542174637, + "time_sec": 66.55184054374695 + }, + { + "epoch": 65, + "train_loss": 1.474054185218811, + "train_acc": 0.4692, + "test_loss": 6.821263113403321, + "test_acc": 0.1053, + "lyapunov": null, + "grad_norm": 1.4816881050330082, + "grad_max_sv": 1.304422627389431, + "grad_min_sv": 6.126439071607592e-08, + "grad_condition": 22262717.79019341, + "lr": 0.0002730047501302267, + "time_sec": 66.54631876945496 + }, + { + "epoch": 66, + "train_loss": 1.468451905593872, + "train_acc": 0.46872, + "test_loss": 6.21660086593628, + "test_acc": 0.1049, + "lyapunov": null, + "grad_norm": 1.4471343716270808, + "grad_max_sv": 1.2118137910962106, + "grad_min_sv": 5.677175121121536e-08, + "grad_condition": 21833909.31574912, + "lr": 0.00025912316294914234, + "time_sec": 66.54650139808655 + }, + { + "epoch": 67, + "train_loss": 1.473218607635498, + "train_acc": 0.46886, + "test_loss": 5.585741909790039, + "test_acc": 0.1093, + "lyapunov": null, + "grad_norm": 1.4454249735567377, + "grad_max_sv": 1.344612455368042, + "grad_min_sv": 5.805593232821593e-08, + "grad_condition": 23703781.24599778, + "lr": 0.0002454792921248144, + "time_sec": 66.54963803291321 + }, + { + "epoch": 68, + "train_loss": 1.464357560043335, + "train_acc": 0.47134, + "test_loss": 6.43534487915039, + "test_acc": 0.1036, + "lyapunov": null, + "grad_norm": 1.4158825945249984, + "grad_max_sv": 1.216756673157215, + "grad_min_sv": 5.594884520121468e-08, + "grad_condition": 22117575.184218023, + "lr": 0.00023208660251050164, + "time_sec": 66.53380155563354 + }, + { + "epoch": 69, + "train_loss": 1.4605754261016846, + "train_acc": 0.47354, + "test_loss": 6.361464812469483, + "test_acc": 0.1041, + "lyapunov": null, + "grad_norm": 1.4102858398212452, + "grad_max_sv": 1.2650031745433807, + "grad_min_sv": 5.616340708058942e-08, + "grad_condition": 22755240.415779583, + "lr": 0.00021895831107393473, + "time_sec": 66.55379509925842 + }, + { + "epoch": 70, + "train_loss": 1.4566728033065797, + "train_acc": 0.4732, + "test_loss": 7.030058961486817, + "test_acc": 0.1052, + "lyapunov": null, + "grad_norm": 1.4004542368068666, + "grad_max_sv": 1.1733321487903594, + "grad_min_sv": 5.324388059335661e-08, + "grad_condition": 22428640.626706712, + "lr": 0.00020610737385376356, + "time_sec": 66.53196001052856 + }, + { + "epoch": 71, + "train_loss": 1.4595127109909058, + "train_acc": 0.4747, + "test_loss": 6.251192915344238, + "test_acc": 0.1055, + "lyapunov": null, + "grad_norm": 1.4007518176750748, + "grad_max_sv": 1.2036359310150146, + "grad_min_sv": 5.3584219283919765e-08, + "grad_condition": 22661079.860923886, + "lr": 0.00019354647317351177, + "time_sec": 66.53831934928894 + }, + { + "epoch": 72, + "train_loss": 1.4561804718780518, + "train_acc": 0.47592, + "test_loss": 6.078685757446289, + "test_acc": 0.1053, + "lyapunov": null, + "grad_norm": 1.3882159701453969, + "grad_max_sv": 1.1710434511303902, + "grad_min_sv": 5.193670311598453e-08, + "grad_condition": 22617697.621583022, + "lr": 0.0001812880051256552, + "time_sec": 66.53273725509644 + }, + { + "epoch": 73, + "train_loss": 1.456334539833069, + "train_acc": 0.47646, + "test_loss": 6.318551240539551, + "test_acc": 0.1053, + "lyapunov": null, + "grad_norm": 1.3893052276682352, + "grad_max_sv": 1.262186436355114, + "grad_min_sv": 5.998066114898392e-08, + "grad_condition": 21695066.67305842, + "lr": 0.00016934406733817422, + "time_sec": 66.53349781036377 + }, + { + "epoch": 74, + "train_loss": 1.450936794128418, + "train_acc": 0.48046, + "test_loss": 5.979817550659179, + "test_acc": 0.105, + "lyapunov": null, + "grad_norm": 1.3659009379358413, + "grad_max_sv": 1.2089540883898735, + "grad_min_sv": 5.6734091380405974e-08, + "grad_condition": 21453559.245642237, + "lr": 0.0001577264470356557, + "time_sec": 66.5519745349884 + }, + { + "epoch": 75, + "train_loss": 1.4469789163970947, + "train_acc": 0.47906, + "test_loss": 6.295627461242676, + "test_acc": 0.1067, + "lyapunov": null, + "grad_norm": 1.3551347445295552, + "grad_max_sv": 1.1976817324757576, + "grad_min_sv": 5.458875831365617e-08, + "grad_condition": 22252931.086762276, + "lr": 0.00014644660940672634, + "time_sec": 66.55559992790222 + }, + { + "epoch": 76, + "train_loss": 1.4463843099212645, + "train_acc": 0.47934, + "test_loss": 6.197264282226563, + "test_acc": 0.1079, + "lyapunov": null, + "grad_norm": 1.3380208446863917, + "grad_max_sv": 1.2127704448997974, + "grad_min_sv": 5.3017609769057116e-08, + "grad_condition": 23070185.252038278, + "lr": 0.0001355156862892944, + "time_sec": 66.54188418388367 + }, + { + "epoch": 77, + "train_loss": 1.4422340731430054, + "train_acc": 0.47956, + "test_loss": 6.095625473022461, + "test_acc": 0.1068, + "lyapunov": null, + "grad_norm": 1.319834743092097, + "grad_max_sv": 1.0997839123010635, + "grad_min_sv": 5.253857917608684e-08, + "grad_condition": 21034235.602306478, + "lr": 0.00012494446518477025, + "time_sec": 66.54432153701782 + }, + { + "epoch": 78, + "train_loss": 1.4469564128875732, + "train_acc": 0.48036, + "test_loss": 5.388970955657959, + "test_acc": 0.11, + "lyapunov": null, + "grad_norm": 1.3475784983368762, + "grad_max_sv": 1.2046680554747582, + "grad_min_sv": 5.585839417676652e-08, + "grad_condition": 21905924.79288598, + "lr": 0.00011474337861210548, + "time_sec": 66.53302836418152 + }, + { + "epoch": 79, + "train_loss": 1.4366684397125244, + "train_acc": 0.4798, + "test_loss": 6.206115145874024, + "test_acc": 0.1069, + "lyapunov": null, + "grad_norm": 1.3130109628098805, + "grad_max_sv": 1.1744658067822455, + "grad_min_sv": 5.508810989596213e-08, + "grad_condition": 21715398.426144313, + "lr": 0.00010492249381215483, + "time_sec": 66.53135848045349 + }, + { + "epoch": 80, + "train_loss": 1.4392537023544312, + "train_acc": 0.48228, + "test_loss": 6.179986186218262, + "test_acc": 0.1064, + "lyapunov": null, + "grad_norm": 1.3256940413341314, + "grad_max_sv": 1.1846244156360626, + "grad_min_sv": 5.3839901603680576e-08, + "grad_condition": 22125564.09370377, + "lr": 9.549150281252637e-05, + "time_sec": 66.5379912853241 + }, + { + "epoch": 81, + "train_loss": 1.4338660355377197, + "train_acc": 0.48616, + "test_loss": 6.177688023376465, + "test_acc": 0.1068, + "lyapunov": null, + "grad_norm": 1.331304941867422, + "grad_max_sv": 1.2059139341115952, + "grad_min_sv": 5.419374078385886e-08, + "grad_condition": 22342309.054380674, + "lr": 8.645971286271918e-05, + "time_sec": 66.5526373386383 + }, + { + "epoch": 82, + "train_loss": 1.4322706761550903, + "train_acc": 0.48346, + "test_loss": 6.39905592956543, + "test_acc": 0.1049, + "lyapunov": null, + "grad_norm": 1.3160308800060254, + "grad_max_sv": 1.1150345966219901, + "grad_min_sv": 5.504024436220334e-08, + "grad_condition": 20495998.096470684, + "lr": 7.78360372489926e-05, + "time_sec": 66.53385639190674 + }, + { + "epoch": 83, + "train_loss": 1.4299918703460692, + "train_acc": 0.48306, + "test_loss": 6.442905668640137, + "test_acc": 0.1051, + "lyapunov": null, + "grad_norm": 1.3113912638515688, + "grad_max_sv": 1.0838071212172509, + "grad_min_sv": 5.43203230840561e-08, + "grad_condition": 20241235.03989599, + "lr": 6.962898649802815e-05, + "time_sec": 66.52077317237854 + }, + { + "epoch": 84, + "train_loss": 1.4280065909194946, + "train_acc": 0.4822, + "test_loss": 6.0934767837524415, + "test_acc": 0.1077, + "lyapunov": null, + "grad_norm": 1.3219999598887227, + "grad_max_sv": 1.1636987075209617, + "grad_min_sv": 5.4432569296380964e-08, + "grad_condition": 21698960.666762732, + "lr": 6.184665997806824e-05, + "time_sec": 66.54324150085449 + }, + { + "epoch": 85, + "train_loss": 1.426846856918335, + "train_acc": 0.4865, + "test_loss": 5.9188161468505855, + "test_acc": 0.107, + "lyapunov": null, + "grad_norm": 1.2965845421535789, + "grad_max_sv": 1.1792906790971756, + "grad_min_sv": 5.5100021434384416e-08, + "grad_condition": 21690369.73733188, + "lr": 5.449673790581613e-05, + "time_sec": 66.53187370300293 + }, + { + "epoch": 86, + "train_loss": 1.4228094031524658, + "train_acc": 0.48556, + "test_loss": 6.137683601379394, + "test_acc": 0.108, + "lyapunov": null, + "grad_norm": 1.292831856620217, + "grad_max_sv": 1.0124387323856354, + "grad_min_sv": 5.2233392278111523e-08, + "grad_condition": 19602805.79996558, + "lr": 4.758647376699034e-05, + "time_sec": 66.53067183494568 + }, + { + "epoch": 87, + "train_loss": 1.429165520362854, + "train_acc": 0.48332, + "test_loss": 5.927753118133545, + "test_acc": 0.1088, + "lyapunov": null, + "grad_norm": 1.3101745862822605, + "grad_max_sv": 1.1612930461764335, + "grad_min_sv": 5.276717347513227e-08, + "grad_condition": 22472879.957919728, + "lr": 4.112268715800956e-05, + "time_sec": 66.53908562660217 + }, + { + "epoch": 88, + "train_loss": 1.4288117279052734, + "train_acc": 0.48666, + "test_loss": 6.013241593933105, + "test_acc": 0.1075, + "lyapunov": null, + "grad_norm": 1.3007188330408852, + "grad_max_sv": 1.139727284014225, + "grad_min_sv": 5.308784185587001e-08, + "grad_condition": 21649216.459450316, + "lr": 3.511175705587434e-05, + "time_sec": 66.52465963363647 + }, + { + "epoch": 89, + "train_loss": 1.4234879583358764, + "train_acc": 0.48672, + "test_loss": 5.440691387176513, + "test_acc": 0.1132, + "lyapunov": null, + "grad_norm": 1.286797693166196, + "grad_max_sv": 1.1378898680210114, + "grad_min_sv": 5.206395803369901e-08, + "grad_condition": 22299317.66856014, + "lr": 2.9559615522887284e-05, + "time_sec": 66.52217221260071 + }, + { + "epoch": 90, + "train_loss": 1.4255534106445313, + "train_acc": 0.4873, + "test_loss": 5.6889183303833, + "test_acc": 0.1089, + "lyapunov": null, + "grad_norm": 1.2907871997501676, + "grad_max_sv": 1.1832163825631141, + "grad_min_sv": 5.3787662057658284e-08, + "grad_condition": 22287194.786688134, + "lr": 2.447174185242324e-05, + "time_sec": 66.53036832809448 + }, + { + "epoch": 91, + "train_loss": 1.4252548498916626, + "train_acc": 0.48792, + "test_loss": 6.261311422729492, + "test_acc": 0.1064, + "lyapunov": null, + "grad_norm": 1.3031797280361905, + "grad_max_sv": 1.1937354177236557, + "grad_min_sv": 5.396164546311866e-08, + "grad_condition": 22285756.773222417, + "lr": 1.9853157161528526e-05, + "time_sec": 66.53405451774597 + }, + { + "epoch": 92, + "train_loss": 1.4257716689300537, + "train_acc": 0.48484, + "test_loss": 5.9496440505981445, + "test_acc": 0.1083, + "lyapunov": null, + "grad_norm": 1.2963951565864091, + "grad_max_sv": 1.1119507551193237, + "grad_min_sv": 5.530857025703995e-08, + "grad_condition": 20517700.461063318, + "lr": 1.570841943568452e-05, + "time_sec": 66.55413794517517 + }, + { + "epoch": 93, + "train_loss": 1.4217627249526978, + "train_acc": 0.48994, + "test_loss": 5.984926200866699, + "test_acc": 0.1075, + "lyapunov": null, + "grad_norm": 1.264014206865248, + "grad_max_sv": 1.0518594324588775, + "grad_min_sv": 4.926823864437324e-08, + "grad_condition": 21435816.94874554, + "lr": 1.204161903062634e-05, + "time_sec": 66.52945113182068 + }, + { + "epoch": 94, + "train_loss": 1.4220651029205322, + "train_acc": 0.48712, + "test_loss": 5.9274788650512695, + "test_acc": 0.107, + "lyapunov": null, + "grad_norm": 1.2852744864782746, + "grad_max_sv": 1.194958347082138, + "grad_min_sv": 5.49836086882749e-08, + "grad_condition": 21876849.948771022, + "lr": 8.85637463565564e-06, + "time_sec": 66.53060245513916 + }, + { + "epoch": 95, + "train_loss": 1.4127644922637939, + "train_acc": 0.4891, + "test_loss": 6.033211676025391, + "test_acc": 0.1068, + "lyapunov": null, + "grad_norm": 1.2852733904252112, + "grad_max_sv": 1.1103495568037034, + "grad_min_sv": 5.0794950290367066e-08, + "grad_condition": 21903481.59645809, + "lr": 6.155829702431171e-06, + "time_sec": 66.54151201248169 + }, + { + "epoch": 96, + "train_loss": 1.42291917427063, + "train_acc": 0.48754, + "test_loss": 5.946468173217774, + "test_acc": 0.1078, + "lyapunov": null, + "grad_norm": 1.296502082808029, + "grad_max_sv": 1.1921778261661529, + "grad_min_sv": 5.59618015927299e-08, + "grad_condition": 21704630.944007598, + "lr": 3.942649342761118e-06, + "time_sec": 66.53685402870178 + }, + { + "epoch": 97, + "train_loss": 1.4221784051132202, + "train_acc": 0.48922, + "test_loss": 5.77611974029541, + "test_acc": 0.1107, + "lyapunov": null, + "grad_norm": 1.283101201721102, + "grad_max_sv": 1.1582708179950714, + "grad_min_sv": 5.3498822172315384e-08, + "grad_condition": 21893400.606446274, + "lr": 2.2190176984600023e-06, + "time_sec": 66.51551508903503 + }, + { + "epoch": 98, + "train_loss": 1.4199727509307862, + "train_acc": 0.48888, + "test_loss": 5.947603340148926, + "test_acc": 0.1072, + "lyapunov": null, + "grad_norm": 1.2852084329880165, + "grad_max_sv": 1.12471182346344, + "grad_min_sv": 5.5720254987789984e-08, + "grad_condition": 20744598.237500653, + "lr": 9.866357858642206e-07, + "time_sec": 66.54128313064575 + }, + { + "epoch": 99, + "train_loss": 1.4189085994720458, + "train_acc": 0.49036, + "test_loss": 6.019410075378418, + "test_acc": 0.1088, + "lyapunov": null, + "grad_norm": 1.2671570273045278, + "grad_max_sv": 1.044458197057247, + "grad_min_sv": 5.2453829901821794e-08, + "grad_condition": 20122144.845569003, + "lr": 2.467198171342e-07, + "time_sec": 66.5876886844635 + }, + { + "epoch": 100, + "train_loss": 1.4237549599456787, + "train_acc": 0.48696, + "test_loss": 6.123869666290283, + "test_acc": 0.1056, + "lyapunov": null, + "grad_norm": 1.2842958901976373, + "grad_max_sv": 1.0893320694565773, + "grad_min_sv": 5.240736280498481e-08, + "grad_condition": 20983923.24178537, + "lr": 0.0, + "time_sec": 66.52526140213013 + } + ] + }, + "lyapunov": { + "4": [ + { + "epoch": 1, + "train_loss": 5.9559499659729, + "train_acc": 0.1816, + "test_loss": 2.127836145401001, + "test_acc": 0.2458, + "lyapunov": 3.1805403927707916, + "grad_norm": 7.669457973262479, + "grad_max_sv": 5.918661725521088, + "grad_min_sv": 2.931642846704108e-07, + "grad_condition": 20422744.62807854, + "lr": 0.0009997532801828658, + "time_sec": 38.74378061294556 + }, + { + "epoch": 2, + "train_loss": 4.402947195281983, + "train_acc": 0.19622, + "test_loss": 2.0710217851638792, + "test_acc": 0.2599, + "lyapunov": 2.5604425824206807, + "grad_norm": 5.322089969338386, + "grad_max_sv": 4.252373713254928, + "grad_min_sv": 1.9552239614029076e-07, + "grad_condition": 22174922.12126705, + "lr": 0.0009990133642141358, + "time_sec": 38.64048624038696 + }, + { + "epoch": 3, + "train_loss": 4.045168105316162, + "train_acc": 0.22284, + "test_loss": 2.047537351036072, + "test_acc": 0.275, + "lyapunov": 2.4094676093372236, + "grad_norm": 3.329135536451279, + "grad_max_sv": 2.700692330300808, + "grad_min_sv": 1.3114565362570828e-07, + "grad_condition": 21120674.055912692, + "lr": 0.00099778098230154, + "time_sec": 38.632225036621094 + }, + { + "epoch": 4, + "train_loss": 3.8760036846923827, + "train_acc": 0.23552, + "test_loss": 2.0494147090911867, + "test_acc": 0.2624, + "lyapunov": 2.323524356803016, + "grad_norm": 1.6169046791962502, + "grad_max_sv": 1.2880224913358689, + "grad_min_sv": 5.374016822656813e-08, + "grad_condition": 24107383.024291664, + "lr": 0.000996057350657239, + "time_sec": 38.643821477890015 + }, + { + "epoch": 5, + "train_loss": 3.7066750312805175, + "train_acc": 0.23364, + "test_loss": 2.073809361457825, + "test_acc": 0.2559, + "lyapunov": 2.2068090539454195, + "grad_norm": 0.6888041501699484, + "grad_max_sv": 0.4505885936319828, + "grad_min_sv": 2.5095627176341396e-08, + "grad_condition": 18224356.70160868, + "lr": 0.0009938441702975688, + "time_sec": 38.63996958732605 + }, + { + "epoch": 6, + "train_loss": 3.5870462338256837, + "train_acc": 0.22278, + "test_loss": 2.0948594261169435, + "test_acc": 0.2419, + "lyapunov": 2.1068829035819947, + "grad_norm": 0.4525297557038159, + "grad_max_sv": 0.2912705983966589, + "grad_min_sv": 1.4355599531334918e-08, + "grad_condition": 20443883.38963156, + "lr": 0.0009911436253643444, + "time_sec": 38.64875626564026 + }, + { + "epoch": 7, + "train_loss": 3.516497625274658, + "train_acc": 0.20518, + "test_loss": 2.122341016769409, + "test_acc": 0.2149, + "lyapunov": 2.031583094535886, + "grad_norm": 0.4192338818357315, + "grad_max_sv": 0.2666142761707306, + "grad_min_sv": 1.244383397436266e-08, + "grad_condition": 21524577.239365414, + "lr": 0.0009879583809693736, + "time_sec": 38.65327429771423 + }, + { + "epoch": 8, + "train_loss": 3.500787953567505, + "train_acc": 0.15934, + "test_loss": 2.30495919342041, + "test_acc": 0.1, + "lyapunov": 1.9705595735393826, + "grad_norm": 0.364806685633591, + "grad_max_sv": 0.19433156847953797, + "grad_min_sv": 7.78323775238877e-09, + "grad_condition": 1400511997.1550007, + "lr": 0.0009842915805643154, + "time_sec": 38.633607625961304 + }, + { + "epoch": 9, + "train_loss": 3.5612770445251463, + "train_acc": 0.0995, + "test_loss": 2.309052435684204, + "test_acc": 0.1, + "lyapunov": 1.9462372851188836, + "grad_norm": 0.1961322565486487, + "grad_max_sv": 0.08832639907486736, + "grad_min_sv": 7.733921171735724e-10, + "grad_condition": 10141008570.944132, + "lr": 0.0009801468428384714, + "time_sec": 38.646180152893066 + }, + { + "epoch": 10, + "train_loss": 3.538458889770508, + "train_acc": 0.09824, + "test_loss": 2.3040579429626464, + "test_acc": 0.1, + "lyapunov": 1.9283022353106447, + "grad_norm": 0.21318046705690488, + "grad_max_sv": 0.0782687779981643, + "grad_min_sv": 8.435315090236436e-10, + "grad_condition": 12098584585.465805, + "lr": 0.0009755282581475767, + "time_sec": 38.63904404640198 + }, + { + "epoch": 11, + "train_loss": 3.529650466461182, + "train_acc": 0.10062, + "test_loss": 2.302797904205322, + "test_acc": 0.1, + "lyapunov": 1.9214661554302401, + "grad_norm": 0.14436104663435, + "grad_max_sv": 0.07406298876740039, + "grad_min_sv": 1.8938792208460978e-10, + "grad_condition": 16582547419.599035, + "lr": 0.0009704403844771127, + "time_sec": 38.65141201019287 + }, + { + "epoch": 12, + "train_loss": 3.527643050994873, + "train_acc": 0.09804, + "test_loss": 2.3026904548645017, + "test_acc": 0.1, + "lyapunov": 1.9200294935489859, + "grad_norm": 0.13153432020985192, + "grad_max_sv": 0.05873946417123079, + "grad_min_sv": 2.2213949011783955e-10, + "grad_condition": 29679782911.168915, + "lr": 0.0009648882429441257, + "time_sec": 38.637062311172485 + }, + { + "epoch": 13, + "train_loss": 3.525748397216797, + "train_acc": 0.09986, + "test_loss": 2.3026839447021485, + "test_acc": 0.1, + "lyapunov": 1.9183377143367173, + "grad_norm": 0.1253530383790545, + "grad_max_sv": 0.054947068355977534, + "grad_min_sv": 2.484597018350735e-10, + "grad_condition": 32728296691.529114, + "lr": 0.0009588773128419905, + "time_sec": 38.639862060546875 + }, + { + "epoch": 14, + "train_loss": 3.5267535670471193, + "train_acc": 0.09928, + "test_loss": 2.303218070602417, + "test_acc": 0.1, + "lyapunov": 1.9196420743337372, + "grad_norm": 0.1092532269273596, + "grad_max_sv": 0.04395028324797749, + "grad_min_sv": 9.613613581557888e-11, + "grad_condition": 21168413985.92494, + "lr": 0.0009524135262330098, + "time_sec": 38.639400243759155 + }, + { + "epoch": 15, + "train_loss": 3.5285498448181154, + "train_acc": 0.0982, + "test_loss": 2.3035209484100343, + "test_acc": 0.1, + "lyapunov": 1.920996154055876, + "grad_norm": 0.10604045531455125, + "grad_max_sv": 0.030423881998285652, + "grad_min_sv": 8.947113291620313e-11, + "grad_condition": 14692894250.958597, + "lr": 0.0009455032620941839, + "time_sec": 38.645652770996094 + }, + { + "epoch": 16, + "train_loss": 3.5281584407806394, + "train_acc": 0.09964, + "test_loss": 2.3028687210083008, + "test_acc": 0.1, + "lyapunov": 1.9207957717768676, + "grad_norm": 0.09543807455983376, + "grad_max_sv": 0.006560872681438923, + "grad_min_sv": 4.056405124991419e-12, + "grad_condition": 3706750979.9989243, + "lr": 0.0009381533400219318, + "time_sec": 38.63558006286621 + }, + { + "epoch": 17, + "train_loss": 3.5265050379943848, + "train_acc": 0.09798, + "test_loss": 2.302896424102783, + "test_acc": 0.1, + "lyapunov": 1.9195188765635576, + "grad_norm": 0.09404328433417611, + "grad_max_sv": 0.005626836745068431, + "grad_min_sv": 8.896868440940896e-13, + "grad_condition": 3600570896.7918577, + "lr": 0.0009303710135019719, + "time_sec": 38.63581418991089 + }, + { + "epoch": 18, + "train_loss": 3.5274914381408693, + "train_acc": 0.09708, + "test_loss": 2.3026503776550293, + "test_acc": 0.1, + "lyapunov": 1.9202668194270804, + "grad_norm": 0.09620880376142034, + "grad_max_sv": 0.003721812926232815, + "grad_min_sv": 3.080583531323011e-13, + "grad_condition": 2605476049.955305, + "lr": 0.0009221639627510076, + "time_sec": 38.637654304504395 + }, + { + "epoch": 19, + "train_loss": 3.5240187657165527, + "train_acc": 0.09788, + "test_loss": 2.3026472286224364, + "test_acc": 0.1, + "lyapunov": 1.917564369833378, + "grad_norm": 0.08696272623748423, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000913540287137281, + "time_sec": 38.64585041999817 + }, + { + "epoch": 20, + "train_loss": 3.526093559265137, + "train_acc": 0.09698, + "test_loss": 2.302675205993652, + "test_acc": 0.1, + "lyapunov": 1.9192343212454521, + "grad_norm": 0.08759130668154863, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009045084971874739, + "time_sec": 38.63778305053711 + }, + { + "epoch": 21, + "train_loss": 3.5268382842254637, + "train_acc": 0.0963, + "test_loss": 2.302619518661499, + "test_acc": 0.1, + "lyapunov": 1.9198827185594212, + "grad_norm": 0.09131899089817433, + "grad_max_sv": 0.0007137967739254236, + "grad_min_sv": 1.2143662959650498e-34, + "grad_condition": 713796773.9254236, + "lr": 0.0008950775061878452, + "time_sec": 38.63694953918457 + }, + { + "epoch": 22, + "train_loss": 3.5266487127685546, + "train_acc": 0.09736, + "test_loss": 2.302595558166504, + "test_acc": 0.1, + "lyapunov": 1.919754564914557, + "grad_norm": 0.08451797479839518, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008852566213878947, + "time_sec": 38.62629771232605 + }, + { + "epoch": 23, + "train_loss": 3.526773832244873, + "train_acc": 0.09764, + "test_loss": 2.3026504470825193, + "test_acc": 0.1, + "lyapunov": 1.919811970132696, + "grad_norm": 0.0880141883169143, + "grad_max_sv": 0.003215626534074545, + "grad_min_sv": 6.757893669575438e-13, + "grad_condition": 421691349.6171393, + "lr": 0.0008750555348152298, + "time_sec": 38.627503395080566 + }, + { + "epoch": 24, + "train_loss": 3.5253559977722166, + "train_acc": 0.09686, + "test_loss": 2.302592763519287, + "test_acc": 0.1, + "lyapunov": 1.9186803285423142, + "grad_norm": 0.08625519727104183, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008644843137107057, + "time_sec": 38.62110924720764 + }, + { + "epoch": 25, + "train_loss": 3.5271505029296875, + "train_acc": 0.09882, + "test_loss": 2.3026457008361816, + "test_acc": 0.1, + "lyapunov": 1.9201455759575299, + "grad_norm": 0.08664315655618471, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008535533905932737, + "time_sec": 38.663304567337036 + }, + { + "epoch": 26, + "train_loss": 3.52567841835022, + "train_acc": 0.09848, + "test_loss": 2.302622730255127, + "test_acc": 0.1, + "lyapunov": 1.918919243775975, + "grad_norm": 0.08931714213407926, + "grad_max_sv": 0.0026560820173472167, + "grad_min_sv": 7.80326428931121e-27, + "grad_condition": 2656082017.346831, + "lr": 0.0008422735529643444, + "time_sec": 38.642497539520264 + }, + { + "epoch": 27, + "train_loss": 3.5247526208496094, + "train_acc": 0.09662, + "test_loss": 2.3026296226501466, + "test_acc": 0.1, + "lyapunov": 1.9182322189935943, + "grad_norm": 0.08339910325165188, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008306559326618259, + "time_sec": 38.63079476356506 + }, + { + "epoch": 28, + "train_loss": 3.5269400009155274, + "train_acc": 0.09728, + "test_loss": 2.3025920150756836, + "test_acc": 0.1, + "lyapunov": 1.9199587207316133, + "grad_norm": 0.08394537087665149, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743449, + "time_sec": 38.61244583129883 + }, + { + "epoch": 29, + "train_loss": 3.5242063328552247, + "train_acc": 0.09546, + "test_loss": 2.3025877166748048, + "test_acc": 0.1, + "lyapunov": 1.9176992738948149, + "grad_norm": 0.08393484553605075, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008064535268264883, + "time_sec": 38.62086057662964 + }, + { + "epoch": 30, + "train_loss": 3.524652021865845, + "train_acc": 0.09846, + "test_loss": 2.3025890396118163, + "test_acc": 0.1, + "lyapunov": 1.9180299269268886, + "grad_norm": 0.08604739858068552, + "grad_max_sv": 0.0037235306110233067, + "grad_min_sv": 2.2816656604449788e-14, + "grad_condition": 2522915018.0120707, + "lr": 0.0007938926261462367, + "time_sec": 38.63639521598816 + }, + { + "epoch": 31, + "train_loss": 3.5269307495117186, + "train_acc": 0.09852, + "test_loss": 2.302594734954834, + "test_acc": 0.1, + "lyapunov": 1.9199556487295635, + "grad_norm": 0.08308332919661195, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007810416889260654, + "time_sec": 38.632620334625244 + }, + { + "epoch": 32, + "train_loss": 3.526603982696533, + "train_acc": 0.0987, + "test_loss": 2.3026425048828125, + "test_acc": 0.1, + "lyapunov": 1.9197655053394835, + "grad_norm": 0.08373608851321027, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894983, + "time_sec": 38.6338005065918 + }, + { + "epoch": 33, + "train_loss": 3.5402134245300294, + "train_acc": 0.09648, + "test_loss": 2.3025889293670656, + "test_acc": 0.1, + "lyapunov": 1.926927990010937, + "grad_norm": 0.09981834537565924, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007545207078751857, + "time_sec": 38.6455602645874 + }, + { + "epoch": 34, + "train_loss": 3.5265413635253906, + "train_acc": 0.09788, + "test_loss": 2.302589825439453, + "test_acc": 0.1, + "lyapunov": 1.9196307095115448, + "grad_norm": 0.08459800727870437, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007408768370508577, + "time_sec": 38.652732133865356 + }, + { + "epoch": 35, + "train_loss": 3.526457656402588, + "train_acc": 0.09848, + "test_loss": 2.3025897277832033, + "test_acc": 0.1, + "lyapunov": 1.91963635930015, + "grad_norm": 0.08392830107993868, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007269952498697734, + "time_sec": 38.618977308273315 + }, + { + "epoch": 36, + "train_loss": 3.5264506495666503, + "train_acc": 0.09836, + "test_loss": 2.302591544342041, + "test_acc": 0.1, + "lyapunov": 1.919547389840226, + "grad_norm": 0.0844841992615646, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825364, + "time_sec": 38.635788917541504 + }, + { + "epoch": 37, + "train_loss": 3.525513755493164, + "train_acc": 0.09824, + "test_loss": 2.302587795257568, + "test_acc": 0.1, + "lyapunov": 1.9188998626626057, + "grad_norm": 0.08511865281250128, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006985739453173903, + "time_sec": 38.63599181175232 + }, + { + "epoch": 38, + "train_loss": 3.5258794207763673, + "train_acc": 0.09634, + "test_loss": 2.302587114715576, + "test_acc": 0.1, + "lyapunov": 1.9190363072983139, + "grad_norm": 0.08976844520779069, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423391, + "time_sec": 38.631999015808105 + }, + { + "epoch": 39, + "train_loss": 3.526812607116699, + "train_acc": 0.09782, + "test_loss": 2.3025868911743164, + "test_acc": 0.1, + "lyapunov": 1.9198928242144377, + "grad_norm": 0.08338895706252505, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006693689601226458, + "time_sec": 38.62815856933594 + }, + { + "epoch": 40, + "train_loss": 3.5299447924041747, + "train_acc": 0.09834, + "test_loss": 2.302587143325806, + "test_acc": 0.1, + "lyapunov": 1.9223552085554507, + "grad_norm": 0.09522270183573409, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874737, + "time_sec": 38.62764048576355 + }, + { + "epoch": 41, + "train_loss": 3.529573831253052, + "train_acc": 0.0978, + "test_loss": 2.3025870990753172, + "test_acc": 0.1, + "lyapunov": 1.922197810829143, + "grad_norm": 0.08338290015497958, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006394955530196147, + "time_sec": 38.63026428222656 + }, + { + "epoch": 42, + "train_loss": 3.5254642880249025, + "train_acc": 0.09878, + "test_loss": 2.302588144683838, + "test_acc": 0.1, + "lyapunov": 1.9188408784549256, + "grad_norm": 0.08333708848875665, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824273, + "time_sec": 38.63510298728943 + }, + { + "epoch": 43, + "train_loss": 3.527522850036621, + "train_acc": 0.09724, + "test_loss": 2.302586852264404, + "test_acc": 0.1, + "lyapunov": 1.920439124717127, + "grad_norm": 0.08392990999765709, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006090716206982714, + "time_sec": 38.61439347267151 + }, + { + "epoch": 44, + "train_loss": 3.5268155879211425, + "train_acc": 0.09854, + "test_loss": 2.302588026046753, + "test_acc": 0.1, + "lyapunov": 1.919859874583876, + "grad_norm": 0.08808142140863674, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005936906572928625, + "time_sec": 38.63164472579956 + }, + { + "epoch": 45, + "train_loss": 3.528644903793335, + "train_acc": 0.09726, + "test_loss": 2.302586632156372, + "test_acc": 0.1, + "lyapunov": 1.9213885017063306, + "grad_norm": 0.08163685266757659, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005782172325201156, + "time_sec": 38.63089060783386 + }, + { + "epoch": 46, + "train_loss": 3.5269173733520507, + "train_acc": 0.09548, + "test_loss": 2.302586455535889, + "test_acc": 0.1, + "lyapunov": 1.9199798500446408, + "grad_norm": 0.08000528496736534, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821523, + "time_sec": 38.636719703674316 + }, + { + "epoch": 47, + "train_loss": 3.525616721343994, + "train_acc": 0.0969, + "test_loss": 2.3025855419158936, + "test_acc": 0.1, + "lyapunov": 1.918914921753242, + "grad_norm": 0.0847797082901155, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005470541566592572, + "time_sec": 38.63527321815491 + }, + { + "epoch": 48, + "train_loss": 3.527122305908203, + "train_acc": 0.09908, + "test_loss": 2.302587979507446, + "test_acc": 0.1, + "lyapunov": 1.9201535523090216, + "grad_norm": 0.08334551671941194, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646569, + "time_sec": 38.6254460811615 + }, + { + "epoch": 49, + "train_loss": 3.529289007568359, + "train_acc": 0.09836, + "test_loss": 2.3025873039245606, + "test_acc": 0.1, + "lyapunov": 1.9219778029205243, + "grad_norm": 0.08239563380139257, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005157053795390643, + "time_sec": 38.63705110549927 + }, + { + "epoch": 50, + "train_loss": 3.5303411560821534, + "train_acc": 0.0977, + "test_loss": 2.3025870582580565, + "test_acc": 0.1, + "lyapunov": 1.9227478766380368, + "grad_norm": 0.08162963599167514, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005000000000000002, + "time_sec": 38.626914262771606 + }, + { + "epoch": 51, + "train_loss": 3.5286489057922363, + "train_acc": 0.09604, + "test_loss": 2.302586822128296, + "test_acc": 0.1, + "lyapunov": 1.9214349052180415, + "grad_norm": 0.08139452605749796, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00048429462046093607, + "time_sec": 38.64423418045044 + }, + { + "epoch": 52, + "train_loss": 3.525787140045166, + "train_acc": 0.09778, + "test_loss": 2.3025859855651856, + "test_acc": 0.1, + "lyapunov": 1.9190660763884444, + "grad_norm": 0.08146521230474718, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004686047402353435, + "time_sec": 38.6294162273407 + }, + { + "epoch": 53, + "train_loss": 3.5288507063293455, + "train_acc": 0.09546, + "test_loss": 2.3025855419158936, + "test_acc": 0.1, + "lyapunov": 1.9215699824530754, + "grad_norm": 0.08218605919682316, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000452945843340743, + "time_sec": 38.62653970718384 + }, + { + "epoch": 54, + "train_loss": 3.5271841695404054, + "train_acc": 0.09872, + "test_loss": 2.3025858070373535, + "test_acc": 0.1, + "lyapunov": 1.9201822860161666, + "grad_norm": 0.08216715344839949, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784806, + "time_sec": 38.638410806655884 + }, + { + "epoch": 55, + "train_loss": 3.526853522644043, + "train_acc": 0.09744, + "test_loss": 2.3025860900878907, + "test_acc": 0.1, + "lyapunov": 1.919959136897036, + "grad_norm": 0.0817176354250303, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004217827674798847, + "time_sec": 38.630091190338135 + }, + { + "epoch": 56, + "train_loss": 3.5288575717926025, + "train_acc": 0.09954, + "test_loss": 2.302586184310913, + "test_acc": 0.1, + "lyapunov": 1.921623296444983, + "grad_norm": 0.08257148205256129, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00040630934270713783, + "time_sec": 38.64346218109131 + }, + { + "epoch": 57, + "train_loss": 3.5272767601776125, + "train_acc": 0.09642, + "test_loss": 2.302586555480957, + "test_acc": 0.1, + "lyapunov": 1.9202661358791848, + "grad_norm": 0.08293348649238423, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000390928379301729, + "time_sec": 38.64233660697937 + }, + { + "epoch": 58, + "train_loss": 3.526464948577881, + "train_acc": 0.09672, + "test_loss": 2.3025856628417967, + "test_acc": 0.1, + "lyapunov": 1.9196561523105786, + "grad_norm": 0.08164186959675705, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003756550564175727, + "time_sec": 38.63249588012695 + }, + { + "epoch": 59, + "train_loss": 3.5295531370544433, + "train_acc": 0.09774, + "test_loss": 2.302585400390625, + "test_acc": 0.1, + "lyapunov": 1.9221740268990206, + "grad_norm": 0.08246273738852085, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036050444698038553, + "time_sec": 38.646018266677856 + }, + { + "epoch": 60, + "train_loss": 3.5271629650115965, + "train_acc": 0.0971, + "test_loss": 2.3025858444213867, + "test_acc": 0.1, + "lyapunov": 1.9201987954356787, + "grad_norm": 0.08208001883222767, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00034549150281252655, + "time_sec": 38.6309814453125 + }, + { + "epoch": 61, + "train_loss": 3.5265548262023927, + "train_acc": 0.0977, + "test_loss": 2.302585780715942, + "test_acc": 0.1, + "lyapunov": 1.9197500297785415, + "grad_norm": 0.08189736323511718, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003306310398773544, + "time_sec": 38.638221740722656 + }, + { + "epoch": 62, + "train_loss": 3.52600441986084, + "train_acc": 0.09678, + "test_loss": 2.302585761642456, + "test_acc": 0.1, + "lyapunov": 1.9192463177854142, + "grad_norm": 0.08137598978711448, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766127, + "time_sec": 38.63043713569641 + }, + { + "epoch": 63, + "train_loss": 3.5271013943481444, + "train_acc": 0.09814, + "test_loss": 2.302585670852661, + "test_acc": 0.1, + "lyapunov": 1.920157666096602, + "grad_norm": 0.0823619758981674, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003014260546826097, + "time_sec": 38.63147497177124 + }, + { + "epoch": 64, + "train_loss": 3.526780191192627, + "train_acc": 0.09852, + "test_loss": 2.302585818862915, + "test_acc": 0.1, + "lyapunov": 1.919904801546765, + "grad_norm": 0.08022492391600272, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002871103542174637, + "time_sec": 38.62516927719116 + }, + { + "epoch": 65, + "train_loss": 3.5343781797790528, + "train_acc": 0.09912, + "test_loss": 2.3025853904724123, + "test_acc": 0.1, + "lyapunov": 1.9257748550771143, + "grad_norm": 0.10073329729823817, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002730047501302267, + "time_sec": 38.634148836135864 + }, + { + "epoch": 66, + "train_loss": 3.5349793888092043, + "train_acc": 0.09842, + "test_loss": 2.3025853446960447, + "test_acc": 0.1, + "lyapunov": 1.9264679845336758, + "grad_norm": 0.11920770311136344, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00025912316294914234, + "time_sec": 38.61845135688782 + }, + { + "epoch": 67, + "train_loss": 3.526273007965088, + "train_acc": 0.09544, + "test_loss": 2.3025852378845215, + "test_acc": 0.1, + "lyapunov": 1.9194827823687697, + "grad_norm": 0.08304121043671493, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002454792921248144, + "time_sec": 38.626497983932495 + }, + { + "epoch": 68, + "train_loss": 3.5271414315795897, + "train_acc": 0.0966, + "test_loss": 2.3025850952148437, + "test_acc": 0.1, + "lyapunov": 1.9202514917344389, + "grad_norm": 0.08574615477087318, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00023208660251050164, + "time_sec": 38.627126693725586 + }, + { + "epoch": 69, + "train_loss": 3.529951874008179, + "train_acc": 0.0986, + "test_loss": 2.30258518447876, + "test_acc": 0.1, + "lyapunov": 1.9225430412365652, + "grad_norm": 0.08082947961897828, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00021895831107393473, + "time_sec": 38.630186319351196 + }, + { + "epoch": 70, + "train_loss": 3.526535584869385, + "train_acc": 0.09668, + "test_loss": 2.3025852592468263, + "test_acc": 0.1, + "lyapunov": 1.919725867183617, + "grad_norm": 0.08274796493939703, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376356, + "time_sec": 38.6431679725647 + }, + { + "epoch": 71, + "train_loss": 3.5277945655822753, + "train_acc": 0.09836, + "test_loss": 2.3025853775024414, + "test_acc": 0.1, + "lyapunov": 1.920768865843868, + "grad_norm": 0.08235441909099428, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019354647317351177, + "time_sec": 38.63748812675476 + }, + { + "epoch": 72, + "train_loss": 3.5274662791442872, + "train_acc": 0.0948, + "test_loss": 2.3025851234436034, + "test_acc": 0.1, + "lyapunov": 1.9204377185963, + "grad_norm": 0.08364637794680509, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001812880051256552, + "time_sec": 38.6381402015686 + }, + { + "epoch": 73, + "train_loss": 3.526118115386963, + "train_acc": 0.09886, + "test_loss": 2.302585259628296, + "test_acc": 0.1, + "lyapunov": 1.9193554836160995, + "grad_norm": 0.0826562338509352, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016934406733817422, + "time_sec": 38.65567326545715 + }, + { + "epoch": 74, + "train_loss": 3.527300643615723, + "train_acc": 0.09764, + "test_loss": 2.302585151672363, + "test_acc": 0.1, + "lyapunov": 1.9203089323190168, + "grad_norm": 0.08128595818241462, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001577264470356557, + "time_sec": 38.65558409690857 + }, + { + "epoch": 75, + "train_loss": 3.52685251663208, + "train_acc": 0.09664, + "test_loss": 2.3025852661132813, + "test_acc": 0.1, + "lyapunov": 1.9200191327068201, + "grad_norm": 0.08404244166329763, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014644660940672634, + "time_sec": 38.63766312599182 + }, + { + "epoch": 76, + "train_loss": 3.5262623787689207, + "train_acc": 0.09722, + "test_loss": 2.3025850158691408, + "test_acc": 0.1, + "lyapunov": 1.919482776271108, + "grad_norm": 0.08232879952859255, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001355156862892944, + "time_sec": 38.633180379867554 + }, + { + "epoch": 77, + "train_loss": 3.528319863128662, + "train_acc": 0.09596, + "test_loss": 2.3025850936889647, + "test_acc": 0.1, + "lyapunov": 1.9211895322555776, + "grad_norm": 0.08358594679641423, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012494446518477025, + "time_sec": 38.6444034576416 + }, + { + "epoch": 78, + "train_loss": 3.526455977935791, + "train_acc": 0.09646, + "test_loss": 2.3025851753234865, + "test_acc": 0.1, + "lyapunov": 1.919646045740913, + "grad_norm": 0.0800944099425941, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210548, + "time_sec": 38.63438820838928 + }, + { + "epoch": 79, + "train_loss": 3.528594108276367, + "train_acc": 0.09844, + "test_loss": 2.302585315704346, + "test_acc": 0.1, + "lyapunov": 1.9213674385529345, + "grad_norm": 0.0823521435571041, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010492249381215483, + "time_sec": 38.63344979286194 + }, + { + "epoch": 80, + "train_loss": 3.5273741276550292, + "train_acc": 0.09784, + "test_loss": 2.3025850051879884, + "test_acc": 0.1, + "lyapunov": 1.9203915013681592, + "grad_norm": 0.0830759912493753, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252637e-05, + "time_sec": 38.62626814842224 + }, + { + "epoch": 81, + "train_loss": 3.5291355400848388, + "train_acc": 0.09736, + "test_loss": 2.3025851634979246, + "test_acc": 0.1, + "lyapunov": 1.921823484818344, + "grad_norm": 0.08275874029214267, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.645971286271918e-05, + "time_sec": 38.62844204902649 + }, + { + "epoch": 82, + "train_loss": 3.525912507019043, + "train_acc": 0.09748, + "test_loss": 2.3025852321624756, + "test_acc": 0.1, + "lyapunov": 1.91920463874212, + "grad_norm": 0.08153852660653182, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.78360372489926e-05, + "time_sec": 38.653265714645386 + }, + { + "epoch": 83, + "train_loss": 3.5292207734680177, + "train_acc": 0.0958, + "test_loss": 2.3025851135253905, + "test_acc": 0.1, + "lyapunov": 1.9219502158786939, + "grad_norm": 0.08350888633092267, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.962898649802815e-05, + "time_sec": 38.634111642837524 + }, + { + "epoch": 84, + "train_loss": 3.5284012381744385, + "train_acc": 0.09624, + "test_loss": 2.30258512878418, + "test_acc": 0.1, + "lyapunov": 1.9212511674217556, + "grad_norm": 0.08116909186786311, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806824e-05, + "time_sec": 38.64353036880493 + }, + { + "epoch": 85, + "train_loss": 3.5251765769195558, + "train_acc": 0.09792, + "test_loss": 2.30258514251709, + "test_acc": 0.1, + "lyapunov": 1.918617296401802, + "grad_norm": 0.07954191314548852, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.449673790581613e-05, + "time_sec": 38.62560677528381 + }, + { + "epoch": 86, + "train_loss": 3.5287663554382322, + "train_acc": 0.09838, + "test_loss": 2.302585173034668, + "test_acc": 0.1, + "lyapunov": 1.9215295982482794, + "grad_norm": 0.08355699198177892, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.758647376699034e-05, + "time_sec": 38.65434241294861 + }, + { + "epoch": 87, + "train_loss": 3.5260034490966796, + "train_acc": 0.09604, + "test_loss": 2.3025851554870607, + "test_acc": 0.1, + "lyapunov": 1.9192945807791122, + "grad_norm": 0.08149215014053633, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.112268715800956e-05, + "time_sec": 38.63465094566345 + }, + { + "epoch": 88, + "train_loss": 3.5243265664672854, + "train_acc": 0.09828, + "test_loss": 2.302585033416748, + "test_acc": 0.1, + "lyapunov": 1.9179029281791824, + "grad_norm": 0.08154521467921626, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.511175705587434e-05, + "time_sec": 38.6289963722229 + }, + { + "epoch": 89, + "train_loss": 3.5287904942321777, + "train_acc": 0.09666, + "test_loss": 2.302585191345215, + "test_acc": 0.1, + "lyapunov": 1.9215726117648737, + "grad_norm": 0.084132595254172, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.9559615522887284e-05, + "time_sec": 38.642388105392456 + }, + { + "epoch": 90, + "train_loss": 3.526969603881836, + "train_acc": 0.09754, + "test_loss": 2.302585014343262, + "test_acc": 0.1, + "lyapunov": 1.920039845549542, + "grad_norm": 0.0821271686806539, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.447174185242324e-05, + "time_sec": 38.63814377784729 + }, + { + "epoch": 91, + "train_loss": 3.527617153930664, + "train_acc": 0.09638, + "test_loss": 2.302585041809082, + "test_acc": 0.1, + "lyapunov": 1.9205815706716474, + "grad_norm": 0.08312510555513332, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.9853157161528526e-05, + "time_sec": 38.61940360069275 + }, + { + "epoch": 92, + "train_loss": 3.5268433947753905, + "train_acc": 0.09684, + "test_loss": 2.3025852138519287, + "test_acc": 0.1, + "lyapunov": 1.9199492108181615, + "grad_norm": 0.0823876986166593, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568452e-05, + "time_sec": 38.627458810806274 + }, + { + "epoch": 93, + "train_loss": 3.53038783744812, + "train_acc": 0.0982, + "test_loss": 2.3025850196838378, + "test_acc": 0.1, + "lyapunov": 1.9228984605320885, + "grad_norm": 0.08263085862758328, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.204161903062634e-05, + "time_sec": 38.63483691215515 + }, + { + "epoch": 94, + "train_loss": 3.5289703980255127, + "train_acc": 0.09816, + "test_loss": 2.3025850566864015, + "test_acc": 0.1, + "lyapunov": 1.9216854218631754, + "grad_norm": 0.08327210271669083, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.85637463565564e-06, + "time_sec": 38.63469362258911 + }, + { + "epoch": 95, + "train_loss": 3.5277647956848144, + "train_acc": 0.0995, + "test_loss": 2.3025852081298828, + "test_acc": 0.1, + "lyapunov": 1.9207559202028357, + "grad_norm": 0.08352486265414892, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.155829702431171e-06, + "time_sec": 38.64616012573242 + }, + { + "epoch": 96, + "train_loss": 3.526619141845703, + "train_acc": 0.09938, + "test_loss": 2.3025851345062254, + "test_acc": 0.1, + "lyapunov": 1.9198539360709812, + "grad_norm": 0.08098182122024891, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761118e-06, + "time_sec": 38.62220072746277 + }, + { + "epoch": 97, + "train_loss": 3.5280892516326903, + "train_acc": 0.1, + "test_loss": 2.3025852352142335, + "test_acc": 0.1, + "lyapunov": 1.921060741100165, + "grad_norm": 0.08211810367594433, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.2190176984600023e-06, + "time_sec": 38.645119190216064 + }, + { + "epoch": 98, + "train_loss": 3.5287079336547853, + "train_acc": 0.1, + "test_loss": 2.3025850273132322, + "test_acc": 0.1, + "lyapunov": 1.9215380800959398, + "grad_norm": 0.08325515946558669, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642206e-07, + "time_sec": 38.63027763366699 + }, + { + "epoch": 99, + "train_loss": 3.5253015606689453, + "train_acc": 0.1, + "test_loss": 2.30258511428833, + "test_acc": 0.1, + "lyapunov": 1.9187132022569857, + "grad_norm": 0.08193671483030009, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.467198171342e-07, + "time_sec": 38.63921046257019 + }, + { + "epoch": 100, + "train_loss": 3.5272140621948243, + "train_acc": 0.1, + "test_loss": 2.302585135269165, + "test_acc": 0.1, + "lyapunov": 1.9202767503840843, + "grad_norm": 0.08222655054617872, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 38.6323139667511 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 8.479881681365967, + "train_acc": 0.15672, + "test_loss": 2.162619204711914, + "test_acc": 0.2125, + "lyapunov": 4.108346384199684, + "grad_norm": 7.697098833505723, + "grad_max_sv": 6.178906440734863, + "grad_min_sv": 2.761631513692464e-07, + "grad_condition": 23140136.221944965, + "lr": 0.0009997532801828658, + "time_sec": 81.47396469116211 + }, + { + "epoch": 2, + "train_loss": 5.665244631958008, + "train_acc": 0.18, + "test_loss": 2.1842808677673338, + "test_acc": 0.1923, + "lyapunov": 3.230283256686862, + "grad_norm": 5.392009012742897, + "grad_max_sv": 4.110089653730393, + "grad_min_sv": 1.9321651976156317e-07, + "grad_condition": 21420475.323837068, + "lr": 0.0009990133642141358, + "time_sec": 81.45991396903992 + }, + { + "epoch": 3, + "train_loss": 5.333162035522461, + "train_acc": 0.1952, + "test_loss": 2.225303956604004, + "test_acc": 0.167, + "lyapunov": 3.1082111679379594, + "grad_norm": 3.851771920219555, + "grad_max_sv": 3.176962560415268, + "grad_min_sv": 1.3438213457561688e-07, + "grad_condition": 23879291.498504233, + "lr": 0.00099778098230154, + "time_sec": 81.46788787841797 + }, + { + "epoch": 4, + "train_loss": 5.171234805908203, + "train_acc": 0.20002, + "test_loss": 2.235258939361572, + "test_acc": 0.159, + "lyapunov": 3.0473744570446746, + "grad_norm": 2.481126294013876, + "grad_max_sv": 2.0792742133140565, + "grad_min_sv": 8.9392968050106e-08, + "grad_condition": 24637829.84704242, + "lr": 0.000996057350657239, + "time_sec": 81.47967004776001 + }, + { + "epoch": 5, + "train_loss": 5.166805406799316, + "train_acc": 0.19452, + "test_loss": 2.237046794128418, + "test_acc": 0.1327, + "lyapunov": 3.0511742223559133, + "grad_norm": 1.3615579983642885, + "grad_max_sv": 1.0548206314444541, + "grad_min_sv": 4.5490313116403056e-08, + "grad_condition": 23987300.59429905, + "lr": 0.0009938441702975688, + "time_sec": 81.459157705307 + }, + { + "epoch": 6, + "train_loss": 4.8697237976074215, + "train_acc": 0.1737, + "test_loss": 2.2830872146606445, + "test_acc": 0.1253, + "lyapunov": 2.8754516471072535, + "grad_norm": 0.6903867745940513, + "grad_max_sv": 0.41943032629787924, + "grad_min_sv": 1.919375629544362e-08, + "grad_condition": 22192013.87340497, + "lr": 0.0009911436253643444, + "time_sec": 81.48192954063416 + }, + { + "epoch": 7, + "train_loss": 4.493588522949219, + "train_acc": 0.15938, + "test_loss": 2.3302653469085692, + "test_acc": 0.1, + "lyapunov": 2.653091859939458, + "grad_norm": 0.7557218960403191, + "grad_max_sv": 0.26077940948307515, + "grad_min_sv": 1.0986899512399616e-08, + "grad_condition": 25117189.859535195, + "lr": 0.0009879583809693736, + "time_sec": 81.4841628074646 + }, + { + "epoch": 8, + "train_loss": 4.350341845397949, + "train_acc": 0.15252, + "test_loss": 2.3086660652160647, + "test_acc": 0.1, + "lyapunov": 2.5555299291830234, + "grad_norm": 0.6250628446482196, + "grad_max_sv": 0.20942260958254338, + "grad_min_sv": 7.251302003297155e-09, + "grad_condition": 30522570.970140863, + "lr": 0.0009842915805643154, + "time_sec": 81.46237683296204 + }, + { + "epoch": 9, + "train_loss": 4.145118522186279, + "train_acc": 0.13274, + "test_loss": 2.315164138031006, + "test_acc": 0.1, + "lyapunov": 2.40533269762688, + "grad_norm": 0.6205908073118289, + "grad_max_sv": 0.14447018823120744, + "grad_min_sv": 4.4057232563565755e-09, + "grad_condition": 34238562.93985257, + "lr": 0.0009801468428384714, + "time_sec": 81.4730293750763 + }, + { + "epoch": 10, + "train_loss": 4.078840268859863, + "train_acc": 0.1284, + "test_loss": 2.3138900623321534, + "test_acc": 0.1, + "lyapunov": 2.363016066343888, + "grad_norm": 0.7930843872612708, + "grad_max_sv": 0.10398251404985785, + "grad_min_sv": 3.7019540950061767e-09, + "grad_condition": 60913515.913623154, + "lr": 0.0009755282581475767, + "time_sec": 81.45200657844543 + }, + { + "epoch": 11, + "train_loss": 4.092224692230225, + "train_acc": 0.1466, + "test_loss": 2.312975662994385, + "test_acc": 0.1, + "lyapunov": 2.3754844513085795, + "grad_norm": 1.1984655112922225, + "grad_max_sv": 0.17450910471379757, + "grad_min_sv": 5.5799074860640734e-09, + "grad_condition": 13168082812.37189, + "lr": 0.0009704403844771127, + "time_sec": 81.45421433448792 + }, + { + "epoch": 12, + "train_loss": 4.142614550323486, + "train_acc": 0.10048, + "test_loss": 2.3073625778198243, + "test_acc": 0.1, + "lyapunov": 2.36521298623146, + "grad_norm": 0.8201455961321854, + "grad_max_sv": 0.06452706009149552, + "grad_min_sv": 1.4042129118228878e-12, + "grad_condition": 50885083514.90724, + "lr": 0.0009648882429441257, + "time_sec": 81.46072387695312 + }, + { + "epoch": 13, + "train_loss": 3.979385091934204, + "train_acc": 0.10066, + "test_loss": 2.3081630187988282, + "test_acc": 0.1, + "lyapunov": 2.26381984696059, + "grad_norm": 0.16210184952823345, + "grad_max_sv": 0.04905642978847027, + "grad_min_sv": 2.7241308859756593e-12, + "grad_condition": 39268609789.13625, + "lr": 0.0009588773128419905, + "time_sec": 81.4600670337677 + }, + { + "epoch": 14, + "train_loss": 4.013840252990723, + "train_acc": 0.09774, + "test_loss": 2.3071225547790526, + "test_acc": 0.1, + "lyapunov": 2.2779995590219717, + "grad_norm": 0.2350799590612887, + "grad_max_sv": 0.03584399004466832, + "grad_min_sv": 2.4371194341884142e-11, + "grad_condition": 24256890299.017464, + "lr": 0.0009524135262330098, + "time_sec": 81.45963406562805 + }, + { + "epoch": 15, + "train_loss": 3.9913157040405274, + "train_acc": 0.09784, + "test_loss": 2.319146055984497, + "test_acc": 0.1, + "lyapunov": 2.268958825894329, + "grad_norm": 0.15763925383129676, + "grad_max_sv": 0.009183965646661818, + "grad_min_sv": 1.97946225383161e-12, + "grad_condition": 8163098832.376617, + "lr": 0.0009455032620941839, + "time_sec": 81.44594478607178 + }, + { + "epoch": 16, + "train_loss": 3.9718331854248046, + "train_acc": 0.0996, + "test_loss": 2.3092525833129884, + "test_acc": 0.1, + "lyapunov": 2.2586230457286396, + "grad_norm": 0.11766352456542575, + "grad_max_sv": 0.006989215174689889, + "grad_min_sv": 2.4024430389645366e-14, + "grad_condition": 6504081924.260536, + "lr": 0.0009381533400219318, + "time_sec": 81.44390797615051 + }, + { + "epoch": 17, + "train_loss": 3.9787883277130125, + "train_acc": 0.09702, + "test_loss": 2.3043574817657473, + "test_acc": 0.1, + "lyapunov": 2.2631307922665727, + "grad_norm": 0.1527010207412437, + "grad_max_sv": 0.009803948854096235, + "grad_min_sv": 1.4435005241224427e-33, + "grad_condition": 9803948854.096233, + "lr": 0.0009303710135019719, + "time_sec": 81.43403100967407 + }, + { + "epoch": 18, + "train_loss": 3.9913615090942383, + "train_acc": 0.09744, + "test_loss": 2.3033508323669434, + "test_acc": 0.1, + "lyapunov": 2.269262256524752, + "grad_norm": 0.11184179273021279, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009221639627510076, + "time_sec": 81.42399740219116 + }, + { + "epoch": 19, + "train_loss": 3.9763801429748535, + "train_acc": 0.0977, + "test_loss": 2.3026752422332764, + "test_acc": 0.1, + "lyapunov": 2.2619051079615913, + "grad_norm": 0.11713248666386221, + "grad_max_sv": 0.000484072370454669, + "grad_min_sv": 0.0, + "grad_condition": 484072370.454669, + "lr": 0.000913540287137281, + "time_sec": 81.4525249004364 + }, + { + "epoch": 20, + "train_loss": 3.976750040283203, + "train_acc": 0.09734, + "test_loss": 2.302591667175293, + "test_acc": 0.1, + "lyapunov": 2.262148560770332, + "grad_norm": 0.11345857984491753, + "grad_max_sv": 0.004815328773111105, + "grad_min_sv": 7.298523316195025e-36, + "grad_condition": 4815328773.111105, + "lr": 0.0009045084971874739, + "time_sec": 81.51628756523132 + }, + { + "epoch": 21, + "train_loss": 3.980269993438721, + "train_acc": 0.09802, + "test_loss": 2.302587752532959, + "test_acc": 0.1, + "lyapunov": 2.264334798164075, + "grad_norm": 0.13684662833237576, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008950775061878452, + "time_sec": 81.45560097694397 + }, + { + "epoch": 22, + "train_loss": 3.9804648877716065, + "train_acc": 0.0979, + "test_loss": 2.302587752532959, + "test_acc": 0.1, + "lyapunov": 2.2635294013011182, + "grad_norm": 0.13344079799844585, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008852566213878947, + "time_sec": 81.44366526603699 + }, + { + "epoch": 23, + "train_loss": 3.9813251597595216, + "train_acc": 0.09872, + "test_loss": 2.302596923828125, + "test_acc": 0.1, + "lyapunov": 2.264318755825462, + "grad_norm": 0.11240815342914404, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008750555348152298, + "time_sec": 81.4700722694397 + }, + { + "epoch": 24, + "train_loss": 3.9829969465637207, + "train_acc": 0.09762, + "test_loss": 2.302590003967285, + "test_acc": 0.1, + "lyapunov": 2.2655306484388267, + "grad_norm": 0.13657445352154945, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008644843137107057, + "time_sec": 81.44092345237732 + }, + { + "epoch": 25, + "train_loss": 3.9867445934295653, + "train_acc": 0.09768, + "test_loss": 2.3025884731292723, + "test_acc": 0.1, + "lyapunov": 2.2683042187215117, + "grad_norm": 0.13504220620651136, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008535533905932737, + "time_sec": 81.44885325431824 + }, + { + "epoch": 26, + "train_loss": 4.011947896575927, + "train_acc": 0.09772, + "test_loss": 2.302588147735596, + "test_acc": 0.1, + "lyapunov": 2.2796514083052535, + "grad_norm": 0.16320303411181733, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008422735529643444, + "time_sec": 81.45354628562927 + }, + { + "epoch": 27, + "train_loss": 3.9786824931335447, + "train_acc": 0.09896, + "test_loss": 2.302594832611084, + "test_acc": 0.1, + "lyapunov": 2.26323458300832, + "grad_norm": 0.10988564477689002, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008306559326618259, + "time_sec": 81.44628882408142 + }, + { + "epoch": 28, + "train_loss": 3.977536257247925, + "train_acc": 0.098, + "test_loss": 2.302598391723633, + "test_acc": 0.1, + "lyapunov": 2.262441022926584, + "grad_norm": 0.12595116922261335, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743449, + "time_sec": 81.4543764591217 + }, + { + "epoch": 29, + "train_loss": 3.976567816162109, + "train_acc": 0.09876, + "test_loss": 2.302590633010864, + "test_acc": 0.1, + "lyapunov": 2.2617232262935785, + "grad_norm": 0.11663224483129596, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008064535268264883, + "time_sec": 81.45405316352844 + }, + { + "epoch": 30, + "train_loss": 3.98611599609375, + "train_acc": 0.09902, + "test_loss": 2.302588882827759, + "test_acc": 0.1, + "lyapunov": 2.268034580723404, + "grad_norm": 0.12156603788402341, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007938926261462367, + "time_sec": 81.43305087089539 + }, + { + "epoch": 31, + "train_loss": 3.973400810546875, + "train_acc": 0.09778, + "test_loss": 2.3025912315368653, + "test_acc": 0.1, + "lyapunov": 2.259550383633665, + "grad_norm": 0.11416147448139306, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007810416889260654, + "time_sec": 81.45837593078613 + }, + { + "epoch": 32, + "train_loss": 3.988133301086426, + "train_acc": 0.0974, + "test_loss": 2.3025894966125486, + "test_acc": 0.1, + "lyapunov": 2.2669999562870817, + "grad_norm": 0.11056723038790034, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894983, + "time_sec": 81.44456076622009 + }, + { + "epoch": 33, + "train_loss": 4.005648225860596, + "train_acc": 0.09582, + "test_loss": 2.302590217590332, + "test_acc": 0.1, + "lyapunov": 2.2759649180390342, + "grad_norm": 0.15627582965327647, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007545207078751857, + "time_sec": 81.45507860183716 + }, + { + "epoch": 34, + "train_loss": 3.979487621154785, + "train_acc": 0.09842, + "test_loss": 2.3025886589050293, + "test_acc": 0.1, + "lyapunov": 2.2636950528225324, + "grad_norm": 0.11766964677730013, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007408768370508577, + "time_sec": 81.40873432159424 + }, + { + "epoch": 35, + "train_loss": 3.9761420146942137, + "train_acc": 0.09734, + "test_loss": 2.3025886192321776, + "test_acc": 0.1, + "lyapunov": 2.2615554509565348, + "grad_norm": 0.13516175590778773, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007269952498697734, + "time_sec": 81.41994976997375 + }, + { + "epoch": 36, + "train_loss": 3.982365760269165, + "train_acc": 0.09772, + "test_loss": 2.302588511276245, + "test_acc": 0.1, + "lyapunov": 2.2654811189607584, + "grad_norm": 0.11681074828605718, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825364, + "time_sec": 81.44073605537415 + }, + { + "epoch": 37, + "train_loss": 4.0145159342956545, + "train_acc": 0.09844, + "test_loss": 2.3025877605438234, + "test_acc": 0.1, + "lyapunov": 2.279959214617834, + "grad_norm": 0.16927419652036743, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006985739453173903, + "time_sec": 81.44942951202393 + }, + { + "epoch": 38, + "train_loss": 3.9834751657104492, + "train_acc": 0.0988, + "test_loss": 2.3025879089355468, + "test_acc": 0.1, + "lyapunov": 2.26584634939423, + "grad_norm": 0.14984272020285577, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423391, + "time_sec": 81.45499515533447 + }, + { + "epoch": 39, + "train_loss": 4.02413849609375, + "train_acc": 0.09734, + "test_loss": 2.30258787689209, + "test_acc": 0.1, + "lyapunov": 2.286009701316619, + "grad_norm": 0.22145868959770007, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006693689601226458, + "time_sec": 81.45317363739014 + }, + { + "epoch": 40, + "train_loss": 3.9736411520385744, + "train_acc": 0.09894, + "test_loss": 2.3025887702941894, + "test_acc": 0.1, + "lyapunov": 2.259992800710146, + "grad_norm": 0.08893647577966153, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874737, + "time_sec": 81.45592546463013 + }, + { + "epoch": 41, + "train_loss": 3.976674521484375, + "train_acc": 0.09844, + "test_loss": 2.302586205673218, + "test_acc": 0.1, + "lyapunov": 2.262093958647355, + "grad_norm": 0.09526075366227103, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006394955530196147, + "time_sec": 81.4629635810852 + }, + { + "epoch": 42, + "train_loss": 3.9767224240112307, + "train_acc": 0.09934, + "test_loss": 2.3025863662719726, + "test_acc": 0.1, + "lyapunov": 2.2621575853098994, + "grad_norm": 0.0889728077319319, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824273, + "time_sec": 81.4452486038208 + }, + { + "epoch": 43, + "train_loss": 3.9843084770202637, + "train_acc": 0.0983, + "test_loss": 2.302587857055664, + "test_acc": 0.1, + "lyapunov": 2.266823678980093, + "grad_norm": 0.14286833201945623, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006090716206982714, + "time_sec": 81.46053290367126 + }, + { + "epoch": 44, + "train_loss": 3.978666923828125, + "train_acc": 0.09862, + "test_loss": 2.302588472366333, + "test_acc": 0.1, + "lyapunov": 2.262758489764865, + "grad_norm": 0.10285858309556797, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005936906572928625, + "time_sec": 81.4441590309143 + }, + { + "epoch": 45, + "train_loss": 3.984368924102783, + "train_acc": 0.09714, + "test_loss": 2.3025872661590574, + "test_acc": 0.1, + "lyapunov": 2.2663481009890662, + "grad_norm": 0.11152947980914625, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005782172325201156, + "time_sec": 81.43797850608826 + }, + { + "epoch": 46, + "train_loss": 3.9835290453338623, + "train_acc": 0.09794, + "test_loss": 2.302588889694214, + "test_acc": 0.1, + "lyapunov": 2.2661942069792684, + "grad_norm": 0.12155880302110986, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821523, + "time_sec": 81.4439845085144 + }, + { + "epoch": 47, + "train_loss": 3.976571675872803, + "train_acc": 0.09746, + "test_loss": 2.302587047958374, + "test_acc": 0.1, + "lyapunov": 2.262034943646482, + "grad_norm": 0.09434388559512244, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005470541566592572, + "time_sec": 81.44648504257202 + }, + { + "epoch": 48, + "train_loss": 3.978961787414551, + "train_acc": 0.09674, + "test_loss": 2.302586452484131, + "test_acc": 0.1, + "lyapunov": 2.2636160929794507, + "grad_norm": 0.09388300184277713, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646569, + "time_sec": 81.50625872612 + }, + { + "epoch": 49, + "train_loss": 3.9766515798950195, + "train_acc": 0.09856, + "test_loss": 2.302586361694336, + "test_acc": 0.1, + "lyapunov": 2.2621047679725512, + "grad_norm": 0.08611192583269686, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005157053795390643, + "time_sec": 81.42919588088989 + }, + { + "epoch": 50, + "train_loss": 3.9754750718688965, + "train_acc": 0.09614, + "test_loss": 2.302587022018433, + "test_acc": 0.1, + "lyapunov": 2.261166003049182, + "grad_norm": 0.09585057441328976, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005000000000000002, + "time_sec": 81.43738746643066 + }, + { + "epoch": 51, + "train_loss": 3.9752406224823, + "train_acc": 0.09726, + "test_loss": 2.302586801147461, + "test_acc": 0.1, + "lyapunov": 2.2611102423704494, + "grad_norm": 0.09095072097377155, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00048429462046093607, + "time_sec": 81.45784163475037 + }, + { + "epoch": 52, + "train_loss": 3.98188600982666, + "train_acc": 0.0951, + "test_loss": 2.302586806488037, + "test_acc": 0.1, + "lyapunov": 2.265076126893768, + "grad_norm": 0.1123738428492386, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004686047402353435, + "time_sec": 81.47153091430664 + }, + { + "epoch": 53, + "train_loss": 3.980596968536377, + "train_acc": 0.0976, + "test_loss": 2.3025859146118166, + "test_acc": 0.1, + "lyapunov": 2.2645553932775315, + "grad_norm": 0.1076773200596488, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000452945843340743, + "time_sec": 81.44375872612 + }, + { + "epoch": 54, + "train_loss": 3.9776349996948244, + "train_acc": 0.09706, + "test_loss": 2.3025868438720702, + "test_acc": 0.1, + "lyapunov": 2.2628720568878875, + "grad_norm": 0.08828239082049001, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784806, + "time_sec": 81.42411518096924 + }, + { + "epoch": 55, + "train_loss": 3.9808822979736327, + "train_acc": 0.09588, + "test_loss": 2.302585488128662, + "test_acc": 0.1, + "lyapunov": 2.2643827629821076, + "grad_norm": 0.11262628002715089, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004217827674798847, + "time_sec": 81.4528546333313 + }, + { + "epoch": 56, + "train_loss": 3.974801806488037, + "train_acc": 0.09592, + "test_loss": 2.3025861625671387, + "test_acc": 0.1, + "lyapunov": 2.2608287944208327, + "grad_norm": 0.09195483599034024, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00040630934270713783, + "time_sec": 81.44676446914673 + }, + { + "epoch": 57, + "train_loss": 3.976495365371704, + "train_acc": 0.09736, + "test_loss": 2.3025858879089354, + "test_acc": 0.1, + "lyapunov": 2.262001718096721, + "grad_norm": 0.08361845913085657, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000390928379301729, + "time_sec": 81.45348882675171 + }, + { + "epoch": 58, + "train_loss": 3.980894155731201, + "train_acc": 0.09842, + "test_loss": 2.3025855281829832, + "test_acc": 0.1, + "lyapunov": 2.2647068646862683, + "grad_norm": 0.11991605921354555, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003756550564175727, + "time_sec": 81.47408199310303 + }, + { + "epoch": 59, + "train_loss": 3.994586195449829, + "train_acc": 0.0973, + "test_loss": 2.3025854663848877, + "test_acc": 0.1, + "lyapunov": 2.27294464672313, + "grad_norm": 0.18222829815312913, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036050444698038553, + "time_sec": 81.44711089134216 + }, + { + "epoch": 60, + "train_loss": 3.9781198291015625, + "train_acc": 0.09658, + "test_loss": 2.3025856033325196, + "test_acc": 0.1, + "lyapunov": 2.263154449365328, + "grad_norm": 0.08448254246697348, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00034549150281252655, + "time_sec": 81.44161295890808 + }, + { + "epoch": 61, + "train_loss": 4.02450031616211, + "train_acc": 0.0976, + "test_loss": 2.302585502624512, + "test_acc": 0.1, + "lyapunov": 2.286170544831649, + "grad_norm": 0.23432897685131301, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003306310398773544, + "time_sec": 81.45745611190796 + }, + { + "epoch": 62, + "train_loss": 3.988269701385498, + "train_acc": 0.09688, + "test_loss": 2.3025854175567626, + "test_acc": 0.1, + "lyapunov": 2.267505117084669, + "grad_norm": 0.10764931064603923, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766127, + "time_sec": 81.45787954330444 + }, + { + "epoch": 63, + "train_loss": 3.9736854934692385, + "train_acc": 0.09646, + "test_loss": 2.3025857013702393, + "test_acc": 0.1, + "lyapunov": 2.2600014398774833, + "grad_norm": 0.08382317206831051, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003014260546826097, + "time_sec": 81.44196057319641 + }, + { + "epoch": 64, + "train_loss": 3.9797292990875244, + "train_acc": 0.0969, + "test_loss": 2.3025853332519532, + "test_acc": 0.1, + "lyapunov": 2.264177340680681, + "grad_norm": 0.11933485737211565, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002871103542174637, + "time_sec": 81.45828652381897 + }, + { + "epoch": 65, + "train_loss": 3.9763733405303956, + "train_acc": 0.097, + "test_loss": 2.3025854026794432, + "test_acc": 0.1, + "lyapunov": 2.2618614468733065, + "grad_norm": 0.08601466707594763, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002730047501302267, + "time_sec": 81.44515085220337 + }, + { + "epoch": 66, + "train_loss": 4.001672252197266, + "train_acc": 0.09836, + "test_loss": 2.302585359954834, + "test_acc": 0.1, + "lyapunov": 2.276178054492492, + "grad_norm": 0.19097066416551475, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00025912316294914234, + "time_sec": 81.44997453689575 + }, + { + "epoch": 67, + "train_loss": 3.983064818649292, + "train_acc": 0.09848, + "test_loss": 2.302585221862793, + "test_acc": 0.1, + "lyapunov": 2.2660030678410052, + "grad_norm": 0.11726894505680324, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002454792921248144, + "time_sec": 81.45755219459534 + }, + { + "epoch": 68, + "train_loss": 3.9874353774261473, + "train_acc": 0.09726, + "test_loss": 2.302585542297363, + "test_acc": 0.1, + "lyapunov": 2.26753244497587, + "grad_norm": 0.1096052061821724, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00023208660251050164, + "time_sec": 81.45092463493347 + }, + { + "epoch": 69, + "train_loss": 3.984990802612305, + "train_acc": 0.09842, + "test_loss": 2.3025853466033936, + "test_acc": 0.1, + "lyapunov": 2.2674437922894803, + "grad_norm": 0.08538883278176537, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00021895831107393473, + "time_sec": 81.44036960601807 + }, + { + "epoch": 70, + "train_loss": 3.9768560768127443, + "train_acc": 0.09864, + "test_loss": 2.3025853176116944, + "test_acc": 0.1, + "lyapunov": 2.262266612113894, + "grad_norm": 0.0826759570118499, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376356, + "time_sec": 81.44237995147705 + }, + { + "epoch": 71, + "train_loss": 3.97729412109375, + "train_acc": 0.09838, + "test_loss": 2.3025852783203127, + "test_acc": 0.1, + "lyapunov": 2.262566337195199, + "grad_norm": 0.08149339121565821, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019354647317351177, + "time_sec": 81.46553111076355 + }, + { + "epoch": 72, + "train_loss": 3.999013508300781, + "train_acc": 0.09792, + "test_loss": 2.3025853332519532, + "test_acc": 0.1, + "lyapunov": 2.2738718602358534, + "grad_norm": 0.15690481475260892, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001812880051256552, + "time_sec": 81.440505027771 + }, + { + "epoch": 73, + "train_loss": 3.9769914697265625, + "train_acc": 0.09758, + "test_loss": 2.302585132598877, + "test_acc": 0.1, + "lyapunov": 2.262345004264656, + "grad_norm": 0.08468511131490652, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016934406733817422, + "time_sec": 81.45508050918579 + }, + { + "epoch": 74, + "train_loss": 3.9735559133148195, + "train_acc": 0.09684, + "test_loss": 2.302585078430176, + "test_acc": 0.1, + "lyapunov": 2.2599204360981426, + "grad_norm": 0.08407853053475459, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001577264470356557, + "time_sec": 81.43686723709106 + }, + { + "epoch": 75, + "train_loss": 3.975616183166504, + "train_acc": 0.09758, + "test_loss": 2.302585101699829, + "test_acc": 0.1, + "lyapunov": 2.2613788644980897, + "grad_norm": 0.08410718060667108, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014644660940672634, + "time_sec": 81.46202492713928 + }, + { + "epoch": 76, + "train_loss": 3.9777969396972654, + "train_acc": 0.09642, + "test_loss": 2.302585230255127, + "test_acc": 0.1, + "lyapunov": 2.262849387000589, + "grad_norm": 0.08412741392957411, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001355156862892944, + "time_sec": 81.69426202774048 + }, + { + "epoch": 77, + "train_loss": 3.997583436126709, + "train_acc": 0.09804, + "test_loss": 2.3025851612091066, + "test_acc": 0.1, + "lyapunov": 2.272977476534636, + "grad_norm": 0.19693507091470583, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012494446518477025, + "time_sec": 81.47962164878845 + }, + { + "epoch": 78, + "train_loss": 3.981567749633789, + "train_acc": 0.0972, + "test_loss": 2.302585176086426, + "test_acc": 0.1, + "lyapunov": 2.2653762513719253, + "grad_norm": 0.08819478927352292, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210548, + "time_sec": 81.44144415855408 + }, + { + "epoch": 79, + "train_loss": 3.979712967529297, + "train_acc": 0.09928, + "test_loss": 2.3025852310180666, + "test_acc": 0.1, + "lyapunov": 2.2640710157506607, + "grad_norm": 0.10900387268878003, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010492249381215483, + "time_sec": 81.44691228866577 + }, + { + "epoch": 80, + "train_loss": 3.9752784634399414, + "train_acc": 0.09612, + "test_loss": 2.3025851806640625, + "test_acc": 0.1, + "lyapunov": 2.2611999310495907, + "grad_norm": 0.08485114515050625, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252637e-05, + "time_sec": 81.44573497772217 + }, + { + "epoch": 81, + "train_loss": 3.973998136444092, + "train_acc": 0.09674, + "test_loss": 2.302585205078125, + "test_acc": 0.1, + "lyapunov": 2.2602438634009006, + "grad_norm": 0.08193297107495977, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.645971286271918e-05, + "time_sec": 81.44051194190979 + }, + { + "epoch": 82, + "train_loss": 3.9795581608581543, + "train_acc": 0.0974, + "test_loss": 2.3025851707458496, + "test_acc": 0.1, + "lyapunov": 2.2642151602088947, + "grad_norm": 0.08382214616673372, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.78360372489926e-05, + "time_sec": 81.44579362869263 + }, + { + "epoch": 83, + "train_loss": 3.97544639793396, + "train_acc": 0.0975, + "test_loss": 2.3025851676940916, + "test_acc": 0.1, + "lyapunov": 2.261258240550985, + "grad_norm": 0.0830598190151241, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.962898649802815e-05, + "time_sec": 81.46574568748474 + }, + { + "epoch": 84, + "train_loss": 3.9764262825775147, + "train_acc": 0.09818, + "test_loss": 2.302585060119629, + "test_acc": 0.1, + "lyapunov": 2.2619712322264376, + "grad_norm": 0.08369246247456191, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806824e-05, + "time_sec": 81.45664143562317 + }, + { + "epoch": 85, + "train_loss": 3.9776910205078124, + "train_acc": 0.0955, + "test_loss": 2.3025851593017577, + "test_acc": 0.1, + "lyapunov": 2.2629058550080985, + "grad_norm": 0.08247891269837844, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.449673790581613e-05, + "time_sec": 81.461270570755 + }, + { + "epoch": 86, + "train_loss": 3.9771215029907228, + "train_acc": 0.09536, + "test_loss": 2.3025850746154783, + "test_acc": 0.1, + "lyapunov": 2.2625219870711226, + "grad_norm": 0.08304329059000737, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.758647376699034e-05, + "time_sec": 81.45261931419373 + }, + { + "epoch": 87, + "train_loss": 3.9780111279296877, + "train_acc": 0.09718, + "test_loss": 2.3025850124359133, + "test_acc": 0.1, + "lyapunov": 2.263096221572603, + "grad_norm": 0.08168556680409891, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.112268715800956e-05, + "time_sec": 81.47083902359009 + }, + { + "epoch": 88, + "train_loss": 3.975586996154785, + "train_acc": 0.09506, + "test_loss": 2.3025851093292236, + "test_acc": 0.1, + "lyapunov": 2.261420638360026, + "grad_norm": 0.08585199329222436, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.511175705587434e-05, + "time_sec": 81.46594524383545 + }, + { + "epoch": 89, + "train_loss": 3.9770257449340822, + "train_acc": 0.0982, + "test_loss": 2.3025851146698, + "test_acc": 0.1, + "lyapunov": 2.262422331153889, + "grad_norm": 0.08469063518506169, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.9559615522887284e-05, + "time_sec": 81.46577405929565 + }, + { + "epoch": 90, + "train_loss": 3.973931856689453, + "train_acc": 0.09746, + "test_loss": 2.3025850677490234, + "test_acc": 0.1, + "lyapunov": 2.2602365346210997, + "grad_norm": 0.08267580569635262, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.447174185242324e-05, + "time_sec": 81.45771622657776 + }, + { + "epoch": 91, + "train_loss": 3.9777387670898436, + "train_acc": 0.09732, + "test_loss": 2.3025851654052736, + "test_acc": 0.1, + "lyapunov": 2.262757078765908, + "grad_norm": 0.10473963211370652, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.9853157161528526e-05, + "time_sec": 81.46830105781555 + }, + { + "epoch": 92, + "train_loss": 3.973895709075928, + "train_acc": 0.09754, + "test_loss": 2.302585176086426, + "test_acc": 0.1, + "lyapunov": 2.2601819568887698, + "grad_norm": 0.08524438116449506, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568452e-05, + "time_sec": 81.45872473716736 + }, + { + "epoch": 93, + "train_loss": 3.975780742340088, + "train_acc": 0.09832, + "test_loss": 2.302585258483887, + "test_acc": 0.1, + "lyapunov": 2.261494060916364, + "grad_norm": 0.08296746372602809, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.204161903062634e-05, + "time_sec": 81.44344329833984 + }, + { + "epoch": 94, + "train_loss": 3.9749393853759765, + "train_acc": 0.099, + "test_loss": 2.3025851181030275, + "test_acc": 0.1, + "lyapunov": 2.2609141049787516, + "grad_norm": 0.081703214219651, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.85637463565564e-06, + "time_sec": 81.47197723388672 + }, + { + "epoch": 95, + "train_loss": 3.977360173110962, + "train_acc": 0.09844, + "test_loss": 2.3025852035522463, + "test_acc": 0.1, + "lyapunov": 2.2626446403200973, + "grad_norm": 0.08370580659845218, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.155829702431171e-06, + "time_sec": 81.4649875164032 + }, + { + "epoch": 96, + "train_loss": 3.9748195641326904, + "train_acc": 0.09918, + "test_loss": 2.3025851348876953, + "test_acc": 0.1, + "lyapunov": 2.2608655974688125, + "grad_norm": 0.08506351899121649, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761118e-06, + "time_sec": 81.45548796653748 + }, + { + "epoch": 97, + "train_loss": 3.977184408874512, + "train_acc": 0.09888, + "test_loss": 2.3025851238250734, + "test_acc": 0.1, + "lyapunov": 2.262512852163876, + "grad_norm": 0.08383579924614167, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.2190176984600023e-06, + "time_sec": 81.4503653049469 + }, + { + "epoch": 98, + "train_loss": 3.979651080627441, + "train_acc": 0.1, + "test_loss": 2.3025852249145506, + "test_acc": 0.1, + "lyapunov": 2.264271725778994, + "grad_norm": 0.08181479722385572, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642206e-07, + "time_sec": 81.46501636505127 + }, + { + "epoch": 99, + "train_loss": 3.9744724880981446, + "train_acc": 0.1, + "test_loss": 2.302585131072998, + "test_acc": 0.1, + "lyapunov": 2.260578519547992, + "grad_norm": 0.08286890329554125, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.467198171342e-07, + "time_sec": 81.44538688659668 + }, + { + "epoch": 100, + "train_loss": 3.9755064764404295, + "train_acc": 0.1, + "test_loss": 2.302585161590576, + "test_acc": 0.1, + "lyapunov": 2.2613274374276475, + "grad_norm": 0.08253103448725845, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 81.44115138053894 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 11.514268187866211, + "train_acc": 0.12322, + "test_loss": 2.335220721435547, + "test_acc": 0.1082, + "lyapunov": 5.094494405609872, + "grad_norm": 6.68472372840091, + "grad_max_sv": 5.768041110038757, + "grad_min_sv": 2.425695402763495e-07, + "grad_condition": 23767971.115653183, + "lr": 0.0009997532801828658, + "time_sec": 124.28109288215637 + }, + { + "epoch": 2, + "train_loss": 6.767582432556153, + "train_acc": 0.13338, + "test_loss": 2.3135711360931395, + "test_acc": 0.1058, + "lyapunov": 3.703414491375389, + "grad_norm": 4.437490608687784, + "grad_max_sv": 3.688317948579788, + "grad_min_sv": 1.6068337682639822e-07, + "grad_condition": 23679624.47851156, + "lr": 0.0009990133642141358, + "time_sec": 124.28083038330078 + }, + { + "epoch": 3, + "train_loss": 6.359151521911621, + "train_acc": 0.1371, + "test_loss": 2.3046204761505127, + "test_acc": 0.1017, + "lyapunov": 3.53740519087028, + "grad_norm": 3.3992685611612004, + "grad_max_sv": 3.1906665176153184, + "grad_min_sv": 1.0806052515022202e-07, + "grad_condition": 30020073.39935509, + "lr": 0.00099778098230154, + "time_sec": 124.26130867004395 + }, + { + "epoch": 4, + "train_loss": 5.680015151367187, + "train_acc": 0.12346, + "test_loss": 2.4307143615722655, + "test_acc": 0.0946, + "lyapunov": 3.2194143725783015, + "grad_norm": 3.6284679983008856, + "grad_max_sv": 2.3083297662011844, + "grad_min_sv": 7.267783242878633e-08, + "grad_condition": 28802302.157710887, + "lr": 0.000996057350657239, + "time_sec": 124.2893226146698 + }, + { + "epoch": 5, + "train_loss": 5.515282614440918, + "train_acc": 0.11878, + "test_loss": 2.3333636627197265, + "test_acc": 0.0806, + "lyapunov": 3.1298821100493526, + "grad_norm": 2.1440857096164527, + "grad_max_sv": 1.8293321043252946, + "grad_min_sv": 6.11613814704981e-08, + "grad_condition": 30298382.919277746, + "lr": 0.0009938441702975688, + "time_sec": 124.24556708335876 + }, + { + "epoch": 6, + "train_loss": 4.830215334472657, + "train_acc": 0.10662, + "test_loss": 2.3030837219238283, + "test_acc": 0.1, + "lyapunov": 2.7727705700623106, + "grad_norm": 2.350059460657985, + "grad_max_sv": 1.5110829517245292, + "grad_min_sv": 2.7742502849842366e-08, + "grad_condition": 415971679.7996719, + "lr": 0.0009911436253643444, + "time_sec": 124.2670316696167 + }, + { + "epoch": 7, + "train_loss": 5.0002188845825195, + "train_acc": 0.1014, + "test_loss": 2.306517247772217, + "test_acc": 0.1, + "lyapunov": 2.8697540314910968, + "grad_norm": 4.791639177202153, + "grad_max_sv": 0.7900435705131315, + "grad_min_sv": 1.012708673176853e-08, + "grad_condition": 1185811132.9619708, + "lr": 0.0009879583809693736, + "time_sec": 124.2431480884552 + }, + { + "epoch": 8, + "train_loss": 5.872336234741211, + "train_acc": 0.10816, + "test_loss": 2.3033512046813964, + "test_acc": 0.1, + "lyapunov": 3.2996887185079666, + "grad_norm": 4.562165296743471, + "grad_max_sv": 0.4824362076822354, + "grad_min_sv": 1.352856967967285e-08, + "grad_condition": 33563973.110157445, + "lr": 0.0009842915805643154, + "time_sec": 124.24206638336182 + }, + { + "epoch": 9, + "train_loss": 5.207491922912598, + "train_acc": 0.1015, + "test_loss": 2.302657497024536, + "test_acc": 0.1, + "lyapunov": 2.982921624732444, + "grad_norm": 1.2857988530859297, + "grad_max_sv": 0.4782970450818539, + "grad_min_sv": 6.14909029240993e-09, + "grad_condition": 17001336844.82257, + "lr": 0.0009801468428384714, + "time_sec": 124.2599868774414 + }, + { + "epoch": 10, + "train_loss": 5.278977078552246, + "train_acc": 0.11042, + "test_loss": 2.303682248687744, + "test_acc": 0.1, + "lyapunov": 3.0210835842220374, + "grad_norm": 2.219210747930246, + "grad_max_sv": 0.26804067082703115, + "grad_min_sv": 5.793725242549423e-09, + "grad_condition": 7080161076.764597, + "lr": 0.0009755282581475767, + "time_sec": 124.2449324131012 + }, + { + "epoch": 11, + "train_loss": 4.803467753601074, + "train_acc": 0.1012, + "test_loss": 4.169252464294433, + "test_acc": 0.1, + "lyapunov": 2.77325821654571, + "grad_norm": 2.127622649938152, + "grad_max_sv": 0.1682983461767435, + "grad_min_sv": 5.603680153853458e-10, + "grad_condition": 68373983123.414894, + "lr": 0.0009704403844771127, + "time_sec": 124.30126142501831 + }, + { + "epoch": 12, + "train_loss": 4.544517149658203, + "train_acc": 0.09926, + "test_loss": 4.290980886840821, + "test_acc": 0.1, + "lyapunov": 2.62944141068422, + "grad_norm": 1.638854096476257, + "grad_max_sv": 0.07512564162607305, + "grad_min_sv": 2.6490731026315825e-12, + "grad_condition": 54196459261.33328, + "lr": 0.0009648882429441257, + "time_sec": 124.24927043914795 + }, + { + "epoch": 13, + "train_loss": 4.369602390441894, + "train_acc": 0.09752, + "test_loss": 4.109600519561767, + "test_acc": 0.1, + "lyapunov": 2.5177556279370243, + "grad_norm": 2.133122078616872, + "grad_max_sv": 0.09587469333782792, + "grad_min_sv": 2.093604774056981e-12, + "grad_condition": 86094204980.57991, + "lr": 0.0009588773128419905, + "time_sec": 124.26178216934204 + }, + { + "epoch": 14, + "train_loss": 4.34119681640625, + "train_acc": 0.09926, + "test_loss": 4.199708403778076, + "test_acc": 0.1, + "lyapunov": 2.495693293373908, + "grad_norm": 2.708849611541162, + "grad_max_sv": 0.09101940747350454, + "grad_min_sv": 8.368649587364072e-14, + "grad_condition": 87173383288.77208, + "lr": 0.0009524135262330098, + "time_sec": 124.24493861198425 + }, + { + "epoch": 15, + "train_loss": 5.13457500289917, + "train_acc": 0.10424, + "test_loss": 2.308458815765381, + "test_acc": 0.1, + "lyapunov": 2.9219820334783297, + "grad_norm": 3.354402938679459, + "grad_max_sv": 0.09543408825993538, + "grad_min_sv": 1.3719995468877692e-10, + "grad_condition": 59504120268.59434, + "lr": 0.0009455032620941839, + "time_sec": 124.29389190673828 + }, + { + "epoch": 16, + "train_loss": 5.3248897048950194, + "train_acc": 0.10296, + "test_loss": 2.302912854766846, + "test_acc": 0.1, + "lyapunov": 2.9764596306149613, + "grad_norm": 0.6322085012676749, + "grad_max_sv": 0.053145987424068154, + "grad_min_sv": 3.2089368939156336e-11, + "grad_condition": 21592510035.150898, + "lr": 0.0009381533400219318, + "time_sec": 124.22647547721863 + }, + { + "epoch": 17, + "train_loss": 4.330915478057861, + "train_acc": 0.09936, + "test_loss": 2.3026626167297364, + "test_acc": 0.1, + "lyapunov": 2.493599863613353, + "grad_norm": 0.20813626461361764, + "grad_max_sv": 0.0220638582482934, + "grad_min_sv": 5.079951297939575e-13, + "grad_condition": 7528215997.404785, + "lr": 0.0009303710135019719, + "time_sec": 124.25075626373291 + }, + { + "epoch": 18, + "train_loss": 4.329695655975342, + "train_acc": 0.09802, + "test_loss": 2.3026026527404784, + "test_acc": 0.1, + "lyapunov": 2.4943465003577034, + "grad_norm": 0.28764831256555634, + "grad_max_sv": 0.00430559329688549, + "grad_min_sv": 1.0630859058082507e-17, + "grad_condition": 4303763188.890272, + "lr": 0.0009221639627510076, + "time_sec": 124.26908159255981 + }, + { + "epoch": 19, + "train_loss": 4.449291636352539, + "train_acc": 0.09546, + "test_loss": 2.3025916465759275, + "test_acc": 0.1, + "lyapunov": 2.5493475122524956, + "grad_norm": 0.286977076303005, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000913540287137281, + "time_sec": 124.22392654418945 + }, + { + "epoch": 20, + "train_loss": 4.275282980957031, + "train_acc": 0.09758, + "test_loss": 2.3025943778991698, + "test_acc": 0.1, + "lyapunov": 2.4641005602639043, + "grad_norm": 0.11226214403634883, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009045084971874739, + "time_sec": 124.30651044845581 + }, + { + "epoch": 21, + "train_loss": 4.299091949005127, + "train_acc": 0.09792, + "test_loss": 2.30259245262146, + "test_acc": 0.1, + "lyapunov": 2.477661563917194, + "grad_norm": 0.12888554972749486, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008950775061878452, + "time_sec": 124.23446798324585 + }, + { + "epoch": 22, + "train_loss": 4.315002240905762, + "train_acc": 0.0975, + "test_loss": 2.3025940551757813, + "test_acc": 0.1, + "lyapunov": 2.4848342008907776, + "grad_norm": 0.13926908971905202, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008852566213878947, + "time_sec": 124.30266809463501 + }, + { + "epoch": 23, + "train_loss": 4.362473590087891, + "train_acc": 0.09968, + "test_loss": 2.3025879684448243, + "test_acc": 0.1, + "lyapunov": 2.508172784619929, + "grad_norm": 0.25147158848993745, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008750555348152298, + "time_sec": 124.24051856994629 + }, + { + "epoch": 24, + "train_loss": 4.361022654266358, + "train_acc": 0.09674, + "test_loss": 2.3025897010803225, + "test_acc": 0.1, + "lyapunov": 2.5060998808087596, + "grad_norm": 0.25289701667178555, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008644843137107057, + "time_sec": 124.22614932060242 + }, + { + "epoch": 25, + "train_loss": 4.292231715545654, + "train_acc": 0.098, + "test_loss": 2.3025892387390137, + "test_acc": 0.1, + "lyapunov": 2.4726591543163483, + "grad_norm": 0.15846202884892668, + "grad_max_sv": 0.007139207795262337, + "grad_min_sv": 1.1884213096035809e-14, + "grad_condition": 5768863374.104107, + "lr": 0.0008535533905932737, + "time_sec": 124.29175138473511 + }, + { + "epoch": 26, + "train_loss": 4.278334856414795, + "train_acc": 0.09952, + "test_loss": 2.302597050857544, + "test_acc": 0.1, + "lyapunov": 2.46608062229498, + "grad_norm": 0.09871518957397614, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008422735529643444, + "time_sec": 124.22811436653137 + }, + { + "epoch": 27, + "train_loss": 4.279530144348144, + "train_acc": 0.09882, + "test_loss": 2.3025887565612795, + "test_acc": 0.1, + "lyapunov": 2.466456468757766, + "grad_norm": 0.09728576577451334, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008306559326618259, + "time_sec": 124.25813937187195 + }, + { + "epoch": 28, + "train_loss": 4.276873157348633, + "train_acc": 0.0965, + "test_loss": 2.302586852264404, + "test_acc": 0.1, + "lyapunov": 2.4651820092554897, + "grad_norm": 0.09336828927700111, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743449, + "time_sec": 124.22499465942383 + }, + { + "epoch": 29, + "train_loss": 4.274294167022705, + "train_acc": 0.09674, + "test_loss": 2.302587184906006, + "test_acc": 0.1, + "lyapunov": 2.4635079608244053, + "grad_norm": 0.08132883703681491, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008064535268264883, + "time_sec": 124.26223015785217 + }, + { + "epoch": 30, + "train_loss": 4.3161706869506835, + "train_acc": 0.09742, + "test_loss": 2.302589612197876, + "test_acc": 0.1, + "lyapunov": 2.4838878163291365, + "grad_norm": 0.1244076499240839, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007938926261462367, + "time_sec": 124.22068643569946 + }, + { + "epoch": 31, + "train_loss": 4.2865172996520995, + "train_acc": 0.09864, + "test_loss": 2.3025933723449707, + "test_acc": 0.1, + "lyapunov": 2.4704265179841416, + "grad_norm": 0.11325710428703713, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007810416889260654, + "time_sec": 124.27307343482971 + }, + { + "epoch": 32, + "train_loss": 4.276113499755859, + "train_acc": 0.09876, + "test_loss": 2.302595587158203, + "test_acc": 0.1, + "lyapunov": 2.464605447276474, + "grad_norm": 0.11188150655123451, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894983, + "time_sec": 124.21617436408997 + }, + { + "epoch": 33, + "train_loss": 4.390245020904541, + "train_acc": 0.09734, + "test_loss": 2.302589817047119, + "test_acc": 0.1, + "lyapunov": 2.5185477038478608, + "grad_norm": 0.2703519117597579, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007545207078751857, + "time_sec": 124.22293186187744 + }, + { + "epoch": 34, + "train_loss": 4.350401836242676, + "train_acc": 0.09758, + "test_loss": 2.302588123321533, + "test_acc": 0.1, + "lyapunov": 2.4999206596628176, + "grad_norm": 0.21853702579717843, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007408768370508577, + "time_sec": 124.26609373092651 + }, + { + "epoch": 35, + "train_loss": 4.305715147399902, + "train_acc": 0.09856, + "test_loss": 2.302589534378052, + "test_acc": 0.1, + "lyapunov": 2.4810556158080432, + "grad_norm": 0.17605927419881373, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007269952498697734, + "time_sec": 124.22794723510742 + }, + { + "epoch": 36, + "train_loss": 4.305906265258789, + "train_acc": 0.09718, + "test_loss": 2.302591007232666, + "test_acc": 0.1, + "lyapunov": 2.477643119709571, + "grad_norm": 0.1236420897514881, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825364, + "time_sec": 124.26314496994019 + }, + { + "epoch": 37, + "train_loss": 4.27584158996582, + "train_acc": 0.0968, + "test_loss": 2.302587622451782, + "test_acc": 0.1, + "lyapunov": 2.464479011038075, + "grad_norm": 0.09532844351778941, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006985739453173903, + "time_sec": 124.25255799293518 + }, + { + "epoch": 38, + "train_loss": 4.283268468475342, + "train_acc": 0.097, + "test_loss": 2.302587129211426, + "test_acc": 0.1, + "lyapunov": 2.4685643030249556, + "grad_norm": 0.12053745808537034, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423391, + "time_sec": 124.26603984832764 + }, + { + "epoch": 39, + "train_loss": 4.340071802978516, + "train_acc": 0.09756, + "test_loss": 2.302587187576294, + "test_acc": 0.1, + "lyapunov": 2.496372491807279, + "grad_norm": 0.2265015040889252, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006693689601226458, + "time_sec": 124.26093554496765 + }, + { + "epoch": 40, + "train_loss": 4.285524172973632, + "train_acc": 0.0976, + "test_loss": 2.302589253234863, + "test_acc": 0.1, + "lyapunov": 2.4703913722806576, + "grad_norm": 0.12837922155849044, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874737, + "time_sec": 124.23279547691345 + }, + { + "epoch": 41, + "train_loss": 4.353975823822021, + "train_acc": 0.0984, + "test_loss": 2.3025891468048094, + "test_acc": 0.1, + "lyapunov": 2.502122705854723, + "grad_norm": 0.31834434179235455, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006394955530196147, + "time_sec": 124.27406620979309 + }, + { + "epoch": 42, + "train_loss": 4.285235863494873, + "train_acc": 0.0975, + "test_loss": 2.3025873653411866, + "test_acc": 0.1, + "lyapunov": 2.4699011251444705, + "grad_norm": 0.16460675806479913, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824273, + "time_sec": 124.23745155334473 + }, + { + "epoch": 43, + "train_loss": 4.273813045043945, + "train_acc": 0.09694, + "test_loss": 2.3025889190673827, + "test_acc": 0.1, + "lyapunov": 2.463189967148139, + "grad_norm": 0.09609475828794435, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006090716206982714, + "time_sec": 124.27437806129456 + }, + { + "epoch": 44, + "train_loss": 4.297922962646484, + "train_acc": 0.09686, + "test_loss": 2.3025868633270266, + "test_acc": 0.1, + "lyapunov": 2.474009756541923, + "grad_norm": 0.14502465560049782, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005936906572928625, + "time_sec": 124.22268414497375 + }, + { + "epoch": 45, + "train_loss": 4.279574555053711, + "train_acc": 0.09652, + "test_loss": 2.3025878047943116, + "test_acc": 0.1, + "lyapunov": 2.4667322599064665, + "grad_norm": 0.12003136414158579, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005782172325201156, + "time_sec": 124.28323554992676 + }, + { + "epoch": 46, + "train_loss": 4.273971158905029, + "train_acc": 0.0966, + "test_loss": 2.302587424468994, + "test_acc": 0.1, + "lyapunov": 2.463305209908644, + "grad_norm": 0.09172584937965118, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821523, + "time_sec": 124.20362710952759 + }, + { + "epoch": 47, + "train_loss": 4.313593041381836, + "train_acc": 0.09574, + "test_loss": 2.302586856460571, + "test_acc": 0.1, + "lyapunov": 2.4801262095761114, + "grad_norm": 0.15167690922053198, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005470541566592572, + "time_sec": 124.29144883155823 + }, + { + "epoch": 48, + "train_loss": 4.295382699737549, + "train_acc": 0.09748, + "test_loss": 2.302586772155762, + "test_acc": 0.1, + "lyapunov": 2.4740971671345897, + "grad_norm": 0.10879569327624422, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646569, + "time_sec": 124.23017454147339 + }, + { + "epoch": 49, + "train_loss": 4.2751529647827144, + "train_acc": 0.09936, + "test_loss": 2.3025859580993653, + "test_acc": 0.1, + "lyapunov": 2.4640432062661253, + "grad_norm": 0.10568439425734225, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005157053795390643, + "time_sec": 124.25622701644897 + }, + { + "epoch": 50, + "train_loss": 4.273743729553223, + "train_acc": 0.0957, + "test_loss": 2.3025863090515135, + "test_acc": 0.1, + "lyapunov": 2.4630955387564266, + "grad_norm": 0.11615112587060138, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005000000000000002, + "time_sec": 124.27268052101135 + }, + { + "epoch": 51, + "train_loss": 4.280425806427002, + "train_acc": 0.09628, + "test_loss": 2.302586248397827, + "test_acc": 0.1, + "lyapunov": 2.466461474938161, + "grad_norm": 0.10654878565362114, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00048429462046093607, + "time_sec": 124.24109268188477 + }, + { + "epoch": 52, + "train_loss": 4.279801727294922, + "train_acc": 0.09702, + "test_loss": 2.3025866828918455, + "test_acc": 0.1, + "lyapunov": 2.4669952484043054, + "grad_norm": 0.130514829251149, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004686047402353435, + "time_sec": 124.26980781555176 + }, + { + "epoch": 53, + "train_loss": 4.315970222320557, + "train_acc": 0.09704, + "test_loss": 2.3025870681762695, + "test_acc": 0.1, + "lyapunov": 2.484521316445392, + "grad_norm": 0.1939414239261272, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000452945843340743, + "time_sec": 124.22718167304993 + }, + { + "epoch": 54, + "train_loss": 4.311761430969239, + "train_acc": 0.09862, + "test_loss": 2.3025857872009277, + "test_acc": 0.1, + "lyapunov": 2.482763496506245, + "grad_norm": 0.18263667447361673, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784806, + "time_sec": 124.2686333656311 + }, + { + "epoch": 55, + "train_loss": 4.277025068054199, + "train_acc": 0.09778, + "test_loss": 2.3025857639312743, + "test_acc": 0.1, + "lyapunov": 2.465040735576464, + "grad_norm": 0.09424723224869033, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004217827674798847, + "time_sec": 124.23272252082825 + }, + { + "epoch": 56, + "train_loss": 4.308205063934326, + "train_acc": 0.0989, + "test_loss": 2.3025861671447756, + "test_acc": 0.1, + "lyapunov": 2.4804823679082535, + "grad_norm": 0.20788469844558666, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00040630934270713783, + "time_sec": 124.45265817642212 + }, + { + "epoch": 57, + "train_loss": 4.282971714477539, + "train_acc": 0.09876, + "test_loss": 2.3025856742858886, + "test_acc": 0.1, + "lyapunov": 2.4687917086169544, + "grad_norm": 0.1374470775631024, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000390928379301729, + "time_sec": 124.2466242313385 + }, + { + "epoch": 58, + "train_loss": 4.311033409729004, + "train_acc": 0.09662, + "test_loss": 2.302585438156128, + "test_acc": 0.1, + "lyapunov": 2.4805221582007837, + "grad_norm": 0.15017627742331574, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003756550564175727, + "time_sec": 124.22827982902527 + }, + { + "epoch": 59, + "train_loss": 4.29637522354126, + "train_acc": 0.09756, + "test_loss": 2.302585637664795, + "test_acc": 0.1, + "lyapunov": 2.4749210880845403, + "grad_norm": 0.1570135955415664, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036050444698038553, + "time_sec": 124.30038142204285 + }, + { + "epoch": 60, + "train_loss": 4.307900915527344, + "train_acc": 0.09804, + "test_loss": 2.302586008834839, + "test_acc": 0.1, + "lyapunov": 2.4804043434465024, + "grad_norm": 0.21537262268091628, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00034549150281252655, + "time_sec": 124.21648406982422 + }, + { + "epoch": 61, + "train_loss": 4.294828899230957, + "train_acc": 0.09696, + "test_loss": 2.302585659408569, + "test_acc": 0.1, + "lyapunov": 2.474180576441538, + "grad_norm": 0.15175328138376964, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003306310398773544, + "time_sec": 124.26800394058228 + }, + { + "epoch": 62, + "train_loss": 4.27745719039917, + "train_acc": 0.09794, + "test_loss": 2.302585639190674, + "test_acc": 0.1, + "lyapunov": 2.465500669406198, + "grad_norm": 0.10570315629890674, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766127, + "time_sec": 124.23925018310547 + }, + { + "epoch": 63, + "train_loss": 4.2727640603637695, + "train_acc": 0.09586, + "test_loss": 2.3025855934143067, + "test_acc": 0.1, + "lyapunov": 2.4626387360760624, + "grad_norm": 0.0890330369346984, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003014260546826097, + "time_sec": 124.27016854286194 + }, + { + "epoch": 64, + "train_loss": 4.272457419738769, + "train_acc": 0.09604, + "test_loss": 2.3025855697631834, + "test_acc": 0.1, + "lyapunov": 2.4623735072972526, + "grad_norm": 0.0847950891199477, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002871103542174637, + "time_sec": 124.20920252799988 + }, + { + "epoch": 65, + "train_loss": 4.273480668334961, + "train_acc": 0.09808, + "test_loss": 2.302585276031494, + "test_acc": 0.1, + "lyapunov": 2.4630366255865073, + "grad_norm": 0.08372012214032937, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002730047501302267, + "time_sec": 124.22656655311584 + }, + { + "epoch": 66, + "train_loss": 4.307428127746582, + "train_acc": 0.09712, + "test_loss": 2.302585486602783, + "test_acc": 0.1, + "lyapunov": 2.4764473944368874, + "grad_norm": 0.12238051774317063, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00025912316294914234, + "time_sec": 124.28961944580078 + }, + { + "epoch": 67, + "train_loss": 4.310281341094971, + "train_acc": 0.09792, + "test_loss": 2.3025853305816653, + "test_acc": 0.1, + "lyapunov": 2.480989251295319, + "grad_norm": 0.27019424894200594, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002454792921248144, + "time_sec": 124.25288558006287 + }, + { + "epoch": 68, + "train_loss": 4.282535659484863, + "train_acc": 0.09756, + "test_loss": 2.3025853900909423, + "test_acc": 0.1, + "lyapunov": 2.4676397261412246, + "grad_norm": 0.1281762106524609, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00023208660251050164, + "time_sec": 124.26717019081116 + }, + { + "epoch": 69, + "train_loss": 4.276787458190918, + "train_acc": 0.09688, + "test_loss": 2.3025852905273436, + "test_acc": 0.1, + "lyapunov": 2.4651669858361753, + "grad_norm": 0.08124252440804115, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00021895831107393473, + "time_sec": 124.23096060752869 + }, + { + "epoch": 70, + "train_loss": 4.28195741897583, + "train_acc": 0.09668, + "test_loss": 2.302585355377197, + "test_acc": 0.1, + "lyapunov": 2.468135183729479, + "grad_norm": 0.11112746909721634, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376356, + "time_sec": 124.27119207382202 + }, + { + "epoch": 71, + "train_loss": 4.284729679412842, + "train_acc": 0.09706, + "test_loss": 2.302585294342041, + "test_acc": 0.1, + "lyapunov": 2.469655635716665, + "grad_norm": 0.12307199730963861, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019354647317351177, + "time_sec": 124.23093914985657 + }, + { + "epoch": 72, + "train_loss": 4.276600415039063, + "train_acc": 0.09806, + "test_loss": 2.3025852252960206, + "test_acc": 0.1, + "lyapunov": 2.464849721440269, + "grad_norm": 0.12908363321506647, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001812880051256552, + "time_sec": 124.25842094421387 + }, + { + "epoch": 73, + "train_loss": 4.3069706353759765, + "train_acc": 0.09654, + "test_loss": 2.3025852447509765, + "test_acc": 0.1, + "lyapunov": 2.479751230810609, + "grad_norm": 0.183601868909449, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016934406733817422, + "time_sec": 124.21842932701111 + }, + { + "epoch": 74, + "train_loss": 4.287112475280762, + "train_acc": 0.09722, + "test_loss": 2.302585179901123, + "test_acc": 0.1, + "lyapunov": 2.4702408582048343, + "grad_norm": 0.1331148526919891, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001577264470356557, + "time_sec": 124.22039604187012 + }, + { + "epoch": 75, + "train_loss": 4.271034491882324, + "train_acc": 0.09664, + "test_loss": 2.3025851165771485, + "test_acc": 0.1, + "lyapunov": 2.461448823704439, + "grad_norm": 0.08255701875769623, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014644660940672634, + "time_sec": 124.30420184135437 + }, + { + "epoch": 76, + "train_loss": 4.272865072021484, + "train_acc": 0.09542, + "test_loss": 2.302585235977173, + "test_acc": 0.1, + "lyapunov": 2.462638800101512, + "grad_norm": 0.08790859271963604, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001355156862892944, + "time_sec": 124.23553800582886 + }, + { + "epoch": 77, + "train_loss": 4.271533363189698, + "train_acc": 0.09712, + "test_loss": 2.3025852149963377, + "test_acc": 0.1, + "lyapunov": 2.4617462914313197, + "grad_norm": 0.08471091537010327, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012494446518477025, + "time_sec": 124.25954508781433 + }, + { + "epoch": 78, + "train_loss": 4.290692696685791, + "train_acc": 0.09754, + "test_loss": 2.302585163116455, + "test_acc": 0.1, + "lyapunov": 2.470475591357102, + "grad_norm": 0.10652401748252295, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210548, + "time_sec": 124.22494149208069 + }, + { + "epoch": 79, + "train_loss": 4.274790961608887, + "train_acc": 0.09758, + "test_loss": 2.302585228347778, + "test_acc": 0.1, + "lyapunov": 2.4638520756645885, + "grad_norm": 0.08078835262733591, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010492249381215483, + "time_sec": 124.29019331932068 + }, + { + "epoch": 80, + "train_loss": 4.272836723175049, + "train_acc": 0.09616, + "test_loss": 2.3025851444244383, + "test_acc": 0.1, + "lyapunov": 2.462624883407827, + "grad_norm": 0.08161990901444113, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252637e-05, + "time_sec": 124.22851657867432 + }, + { + "epoch": 81, + "train_loss": 4.39987655090332, + "train_acc": 0.0985, + "test_loss": 2.302585282897949, + "test_acc": 0.1, + "lyapunov": 2.5367127757548067, + "grad_norm": 0.6635822194594717, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.645971286271918e-05, + "time_sec": 124.23617506027222 + }, + { + "epoch": 82, + "train_loss": 4.297471022949218, + "train_acc": 0.0953, + "test_loss": 2.3025852149963377, + "test_acc": 0.1, + "lyapunov": 2.475090144540343, + "grad_norm": 0.729945935366233, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.78360372489926e-05, + "time_sec": 124.25805640220642 + }, + { + "epoch": 83, + "train_loss": 4.269278663024902, + "train_acc": 0.09916, + "test_loss": 2.3025850776672363, + "test_acc": 0.1, + "lyapunov": 2.4603407303695484, + "grad_norm": 0.09631779246548546, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.962898649802815e-05, + "time_sec": 124.23541116714478 + }, + { + "epoch": 84, + "train_loss": 4.2767918655395505, + "train_acc": 0.09902, + "test_loss": 2.3025851837158204, + "test_acc": 0.1, + "lyapunov": 2.464642455815659, + "grad_norm": 0.15914456443799777, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806824e-05, + "time_sec": 124.2600998878479 + }, + { + "epoch": 85, + "train_loss": 4.275007407989502, + "train_acc": 0.09774, + "test_loss": 2.302585231781006, + "test_acc": 0.1, + "lyapunov": 2.4639958829221213, + "grad_norm": 0.08948000358835351, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.449673790581613e-05, + "time_sec": 124.19096970558167 + }, + { + "epoch": 86, + "train_loss": 4.282883452606201, + "train_acc": 0.0984, + "test_loss": 2.3025849563598633, + "test_acc": 0.1, + "lyapunov": 2.46685717294893, + "grad_norm": 0.20955582940776452, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.758647376699034e-05, + "time_sec": 124.28308463096619 + }, + { + "epoch": 87, + "train_loss": 4.273255398712158, + "train_acc": 0.09732, + "test_loss": 2.3025850818634033, + "test_acc": 0.1, + "lyapunov": 2.4628877334887416, + "grad_norm": 0.08251896757547691, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.112268715800956e-05, + "time_sec": 124.24707794189453 + }, + { + "epoch": 88, + "train_loss": 4.27318275390625, + "train_acc": 0.09818, + "test_loss": 2.3025852210998536, + "test_acc": 0.1, + "lyapunov": 2.462852593273153, + "grad_norm": 0.08488796189115587, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.511175705587434e-05, + "time_sec": 124.27159857749939 + }, + { + "epoch": 89, + "train_loss": 4.274446720886231, + "train_acc": 0.0964, + "test_loss": 2.3025852279663086, + "test_acc": 0.1, + "lyapunov": 2.463662301792818, + "grad_norm": 0.08254333748035417, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.9559615522887284e-05, + "time_sec": 124.20991706848145 + }, + { + "epoch": 90, + "train_loss": 4.282081894989013, + "train_acc": 0.09898, + "test_loss": 2.302585124206543, + "test_acc": 0.1, + "lyapunov": 2.4669584868204257, + "grad_norm": 0.11057422059552115, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.447174185242324e-05, + "time_sec": 124.23175573348999 + }, + { + "epoch": 91, + "train_loss": 4.270762037200928, + "train_acc": 0.09742, + "test_loss": 2.302585070037842, + "test_acc": 0.1, + "lyapunov": 2.4613021468872303, + "grad_norm": 0.08094752788352252, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.9853157161528526e-05, + "time_sec": 124.28751397132874 + }, + { + "epoch": 92, + "train_loss": 4.2731778295898435, + "train_acc": 0.0967, + "test_loss": 2.3025849838256836, + "test_acc": 0.1, + "lyapunov": 2.4628693057448054, + "grad_norm": 0.08218150011851272, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568452e-05, + "time_sec": 124.20022916793823 + }, + { + "epoch": 93, + "train_loss": 4.271317660827637, + "train_acc": 0.09598, + "test_loss": 2.302585059738159, + "test_acc": 0.1, + "lyapunov": 2.461685863602192, + "grad_norm": 0.09351987385512874, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.204161903062634e-05, + "time_sec": 124.32517552375793 + }, + { + "epoch": 94, + "train_loss": 4.271005298614502, + "train_acc": 0.09678, + "test_loss": 2.3025850238800047, + "test_acc": 0.1, + "lyapunov": 2.461446201100069, + "grad_norm": 0.08051510852574385, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.85637463565564e-06, + "time_sec": 124.25493431091309 + }, + { + "epoch": 95, + "train_loss": 4.272550579528809, + "train_acc": 0.0975, + "test_loss": 2.302585118865967, + "test_acc": 0.1, + "lyapunov": 2.462437502258574, + "grad_norm": 0.08133134154526532, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.155829702431171e-06, + "time_sec": 124.2907202243805 + }, + { + "epoch": 96, + "train_loss": 4.27599407836914, + "train_acc": 0.09808, + "test_loss": 2.302585164642334, + "test_acc": 0.1, + "lyapunov": 2.464714573472357, + "grad_norm": 0.08129994421530186, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761118e-06, + "time_sec": 124.2441520690918 + }, + { + "epoch": 97, + "train_loss": 4.27250137512207, + "train_acc": 0.1, + "test_loss": 2.3025850723266603, + "test_acc": 0.1, + "lyapunov": 2.462406137105449, + "grad_norm": 0.08085760651650271, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.2190176984600023e-06, + "time_sec": 124.25383496284485 + }, + { + "epoch": 98, + "train_loss": 4.272909243469238, + "train_acc": 0.1, + "test_loss": 2.30258510017395, + "test_acc": 0.1, + "lyapunov": 2.462700468195064, + "grad_norm": 0.08430371763203995, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642206e-07, + "time_sec": 124.2897834777832 + }, + { + "epoch": 99, + "train_loss": 4.27265819152832, + "train_acc": 0.1, + "test_loss": 2.302585132598877, + "test_acc": 0.1, + "lyapunov": 2.462563226290066, + "grad_norm": 0.08009730488173318, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.467198171342e-07, + "time_sec": 124.25932240486145 + }, + { + "epoch": 100, + "train_loss": 4.272679078521729, + "train_acc": 0.1, + "test_loss": 2.302585071182251, + "test_acc": 0.1, + "lyapunov": 2.462542835708774, + "grad_norm": 0.08019670403901732, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 124.30135154724121 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 11.842812671203614, + "train_acc": 0.14506, + "test_loss": 2.34111376953125, + "test_acc": 0.1088, + "lyapunov": 5.111980842507404, + "grad_norm": 6.803328171635302, + "grad_max_sv": 5.664273583889008, + "grad_min_sv": 2.45656453401466e-07, + "grad_condition": 23556170.622745253, + "lr": 0.0009997532801828658, + "time_sec": 167.03577542304993 + }, + { + "epoch": 2, + "train_loss": 6.864391835327148, + "train_acc": 0.1532, + "test_loss": 2.3584522315979, + "test_acc": 0.1126, + "lyapunov": 3.7626322760911246, + "grad_norm": 5.449127371208671, + "grad_max_sv": 4.509619396924973, + "grad_min_sv": 1.816841066926145e-07, + "grad_condition": 25473679.781934455, + "lr": 0.0009990133642141358, + "time_sec": 167.0620617866516 + }, + { + "epoch": 3, + "train_loss": 6.632632642822266, + "train_acc": 0.16122, + "test_loss": 2.358525146102905, + "test_acc": 0.1, + "lyapunov": 3.702555048496217, + "grad_norm": 3.996691628576675, + "grad_max_sv": 3.4047091096639632, + "grad_min_sv": 1.1248512699069124e-07, + "grad_condition": 30963953.097301744, + "lr": 0.00099778098230154, + "time_sec": 167.01362991333008 + }, + { + "epoch": 4, + "train_loss": 6.508619455108643, + "train_acc": 0.15906, + "test_loss": 2.3301877449035646, + "test_acc": 0.1, + "lyapunov": 3.647035371312095, + "grad_norm": 3.2655343849407332, + "grad_max_sv": 3.0296140223741532, + "grad_min_sv": 9.594998209294659e-08, + "grad_condition": 32002571.000903092, + "lr": 0.000996057350657239, + "time_sec": 166.97752714157104 + }, + { + "epoch": 5, + "train_loss": 5.912459800109863, + "train_acc": 0.13794, + "test_loss": 2.3143163734436034, + "test_acc": 0.1, + "lyapunov": 3.364570482917454, + "grad_norm": 2.882730301769821, + "grad_max_sv": 2.836460363864899, + "grad_min_sv": 8.620691849259288e-08, + "grad_condition": 34084982.42197102, + "lr": 0.0009938441702975688, + "time_sec": 167.01780152320862 + }, + { + "epoch": 6, + "train_loss": 5.365990347290039, + "train_acc": 0.12352, + "test_loss": 2.307030549240112, + "test_acc": 0.1, + "lyapunov": 3.0800778951181473, + "grad_norm": 2.6661229845796357, + "grad_max_sv": 1.9664998756031884, + "grad_min_sv": 4.7012965353151585e-08, + "grad_condition": 714227055.0495954, + "lr": 0.0009911436253643444, + "time_sec": 166.95626974105835 + }, + { + "epoch": 7, + "train_loss": 5.098499784545899, + "train_acc": 0.11974, + "test_loss": 2.306401748275757, + "test_acc": 0.1, + "lyapunov": 2.9394846096672973, + "grad_norm": 2.0425554711132987, + "grad_max_sv": 1.3562358289975485, + "grad_min_sv": 3.416944161021407e-08, + "grad_condition": 430074872.43269414, + "lr": 0.0009879583809693736, + "time_sec": 167.02987694740295 + }, + { + "epoch": 8, + "train_loss": 4.836283032226563, + "train_acc": 0.1193, + "test_loss": 2.3056865058898928, + "test_acc": 0.1, + "lyapunov": 2.8134650903589584, + "grad_norm": 1.9015682902174655, + "grad_max_sv": 1.3965314358472825, + "grad_min_sv": 2.998794566512128e-08, + "grad_condition": 984527791.9432541, + "lr": 0.0009842915805643154, + "time_sec": 166.99379587173462 + }, + { + "epoch": 9, + "train_loss": 4.799866871795654, + "train_acc": 0.11898, + "test_loss": 2.3078849700927733, + "test_acc": 0.1, + "lyapunov": 2.7906805755537185, + "grad_norm": 1.830247256824178, + "grad_max_sv": 1.0446476072072983, + "grad_min_sv": 2.2101311034875437e-08, + "grad_condition": 6442199712.909399, + "lr": 0.0009801468428384714, + "time_sec": 167.04091095924377 + }, + { + "epoch": 10, + "train_loss": 4.8418486264038085, + "train_acc": 0.1198, + "test_loss": 2.306636996841431, + "test_acc": 0.1, + "lyapunov": 2.8099952402627073, + "grad_norm": 2.137959073318514, + "grad_max_sv": 0.7742668629978022, + "grad_min_sv": 1.0732185378244782e-08, + "grad_condition": 12825727231.027037, + "lr": 0.0009755282581475767, + "time_sec": 167.01724100112915 + }, + { + "epoch": 11, + "train_loss": 4.899544752502441, + "train_acc": 0.11034, + "test_loss": 2.303115463256836, + "test_acc": 0.1, + "lyapunov": 2.8371418083415314, + "grad_norm": 1.6003418244695304, + "grad_max_sv": 0.6158522295280715, + "grad_min_sv": 3.796369944507449e-09, + "grad_condition": 6480545635.210354, + "lr": 0.0009704403844771127, + "time_sec": 167.04382944107056 + }, + { + "epoch": 12, + "train_loss": 4.951635014648438, + "train_acc": 0.10792, + "test_loss": 2.3031677284240724, + "test_acc": 0.1, + "lyapunov": 2.866735147393268, + "grad_norm": 2.666838044816494, + "grad_max_sv": 0.5319730836898089, + "grad_min_sv": 3.372458990007535e-10, + "grad_condition": 39511669967.92405, + "lr": 0.0009648882429441257, + "time_sec": 166.9957308769226 + }, + { + "epoch": 13, + "train_loss": 6.152256243286133, + "train_acc": 0.10692, + "test_loss": 2.303246379852295, + "test_acc": 0.1, + "lyapunov": 3.4366153896312275, + "grad_norm": 6.342546880123247, + "grad_max_sv": 0.2403870326364995, + "grad_min_sv": 2.6050612198124816e-10, + "grad_condition": 34925794452.094666, + "lr": 0.0009588773128419905, + "time_sec": 167.01189947128296 + }, + { + "epoch": 14, + "train_loss": 6.052201841888428, + "train_acc": 0.10886, + "test_loss": 2.3029991958618163, + "test_acc": 0.1, + "lyapunov": 3.407372230154169, + "grad_norm": 3.751884478526656, + "grad_max_sv": 0.3085380573000293, + "grad_min_sv": 1.7481779514657177e-10, + "grad_condition": 69456467004.02864, + "lr": 0.0009524135262330098, + "time_sec": 166.99195837974548 + }, + { + "epoch": 15, + "train_loss": 6.174399379577637, + "train_acc": 0.10784, + "test_loss": 2.3030965816497804, + "test_acc": 0.1, + "lyapunov": 3.468341021891445, + "grad_norm": 2.2149403643105514, + "grad_max_sv": 0.2665206765946223, + "grad_min_sv": 7.174466620587407e-11, + "grad_condition": 25279718153.525455, + "lr": 0.0009455032620941839, + "time_sec": 167.02302026748657 + }, + { + "epoch": 16, + "train_loss": 5.8687522245788575, + "train_acc": 0.10852, + "test_loss": 2.302928673553467, + "test_acc": 0.1, + "lyapunov": 3.3205134075925784, + "grad_norm": 2.1727798236859517, + "grad_max_sv": 0.1694878804436172, + "grad_min_sv": 5.284483110394732e-11, + "grad_condition": 29825093550.928566, + "lr": 0.0009381533400219318, + "time_sec": 166.98851919174194 + }, + { + "epoch": 17, + "train_loss": 5.00506268585205, + "train_acc": 0.10292, + "test_loss": 2.3029050621032714, + "test_acc": 0.1, + "lyapunov": 2.8923883834458373, + "grad_norm": 1.1450970364565718, + "grad_max_sv": 0.12666865187754867, + "grad_min_sv": 2.4102328364569327e-11, + "grad_condition": 25147403549.501667, + "lr": 0.0009303710135019719, + "time_sec": 167.02036666870117 + }, + { + "epoch": 18, + "train_loss": 4.855449399719238, + "train_acc": 0.104, + "test_loss": 2.3028139762878417, + "test_acc": 0.1, + "lyapunov": 2.8120573298705507, + "grad_norm": 0.7305556308720836, + "grad_max_sv": 0.09714378891512751, + "grad_min_sv": 8.150729035001414e-12, + "grad_condition": 58264297783.12268, + "lr": 0.0009221639627510076, + "time_sec": 167.08689284324646 + }, + { + "epoch": 19, + "train_loss": 4.96336449584961, + "train_acc": 0.1041, + "test_loss": 2.3027950325012205, + "test_acc": 0.1, + "lyapunov": 2.8725837020922804, + "grad_norm": 1.182474133176391, + "grad_max_sv": 0.07083241189830006, + "grad_min_sv": 7.22405413796021e-12, + "grad_condition": 38280733847.458176, + "lr": 0.000913540287137281, + "time_sec": 167.00970244407654 + }, + { + "epoch": 20, + "train_loss": 4.743826732025147, + "train_acc": 0.10382, + "test_loss": 2.3027557773590086, + "test_acc": 0.1, + "lyapunov": 2.7483980515423942, + "grad_norm": 0.6554501104680703, + "grad_max_sv": 0.05732933725230396, + "grad_min_sv": 5.653544739145854e-12, + "grad_condition": 35503198727.48572, + "lr": 0.0009045084971874739, + "time_sec": 167.09380722045898 + }, + { + "epoch": 21, + "train_loss": 4.678205784606933, + "train_acc": 0.10294, + "test_loss": 3.7050921539306643, + "test_acc": 0.1, + "lyapunov": 2.712228787219738, + "grad_norm": 0.9024618566776086, + "grad_max_sv": 0.03976228955434635, + "grad_min_sv": 5.291108131013551e-11, + "grad_condition": 16349739158.901342, + "lr": 0.0008950775061878452, + "time_sec": 167.0224826335907 + }, + { + "epoch": 22, + "train_loss": 4.63441824432373, + "train_acc": 0.09868, + "test_loss": 2.678515822601318, + "test_acc": 0.1, + "lyapunov": 2.6848394797586113, + "grad_norm": 0.9464113383195869, + "grad_max_sv": 0.03219134085811674, + "grad_min_sv": 3.575371656772674e-11, + "grad_condition": 22552839587.69338, + "lr": 0.0008852566213878947, + "time_sec": 167.0608777999878 + }, + { + "epoch": 23, + "train_loss": 4.728675323486328, + "train_acc": 0.09932, + "test_loss": 3.68248123626709, + "test_acc": 0.1, + "lyapunov": 2.732565569450788, + "grad_norm": 1.1845032429393016, + "grad_max_sv": 0.009998515527695418, + "grad_min_sv": 1.095997224005267e-20, + "grad_condition": 9998514820.705112, + "lr": 0.0008750555348152298, + "time_sec": 167.0682075023651 + }, + { + "epoch": 24, + "train_loss": 4.65850959197998, + "train_acc": 0.09912, + "test_loss": 3.6423350326538086, + "test_acc": 0.1, + "lyapunov": 2.6980338791752105, + "grad_norm": 1.5417542431510867, + "grad_max_sv": 0.008353105513378978, + "grad_min_sv": 1.9907194983962853e-18, + "grad_condition": 8352993676.098096, + "lr": 0.0008644843137107057, + "time_sec": 167.08017802238464 + }, + { + "epoch": 25, + "train_loss": 4.584089448547363, + "train_acc": 0.09784, + "test_loss": 2.3033696189880373, + "test_acc": 0.1, + "lyapunov": 2.653346909891309, + "grad_norm": 0.9625814425500707, + "grad_max_sv": 0.0027962074615061282, + "grad_min_sv": 1.8178542286825737e-15, + "grad_condition": 2726213455.6624613, + "lr": 0.0008535533905932737, + "time_sec": 167.05963444709778 + }, + { + "epoch": 26, + "train_loss": 4.562473741149902, + "train_acc": 0.0972, + "test_loss": 2.5531665412902833, + "test_acc": 0.1, + "lyapunov": 2.6440261763989774, + "grad_norm": 1.0966601277478685, + "grad_max_sv": 0.0009299686178565025, + "grad_min_sv": 7.864982908802376e-35, + "grad_condition": 929968617.8565025, + "lr": 0.0008422735529643444, + "time_sec": 167.0820574760437 + }, + { + "epoch": 27, + "train_loss": 4.557928927612305, + "train_acc": 0.10072, + "test_loss": 2.3032149608612063, + "test_acc": 0.1, + "lyapunov": 2.640467453490743, + "grad_norm": 1.5990578945087282, + "grad_max_sv": 0.001147926412522793, + "grad_min_sv": 2.0663573730241894e-15, + "grad_condition": 1060288974.8907245, + "lr": 0.0008306559326618259, + "time_sec": 167.0413818359375 + }, + { + "epoch": 28, + "train_loss": 4.533458753051757, + "train_acc": 0.09686, + "test_loss": 2.303218946838379, + "test_acc": 0.1, + "lyapunov": 2.6252909279845253, + "grad_norm": 0.6753306901464893, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743449, + "time_sec": 167.0830535888672 + }, + { + "epoch": 29, + "train_loss": 4.496531313171387, + "train_acc": 0.09852, + "test_loss": 2.3032687267303467, + "test_acc": 0.1, + "lyapunov": 2.6040675938891633, + "grad_norm": 0.18386399798172356, + "grad_max_sv": 0.00110331317409873, + "grad_min_sv": 7.969612926285099e-35, + "grad_condition": 1103313174.09873, + "lr": 0.0008064535268264883, + "time_sec": 167.04623770713806 + }, + { + "epoch": 30, + "train_loss": 4.504303005065918, + "train_acc": 0.0976, + "test_loss": 2.303500841522217, + "test_acc": 0.1, + "lyapunov": 2.6081804003556974, + "grad_norm": 0.15236154258308318, + "grad_max_sv": 0.0028056097216904163, + "grad_min_sv": 0.0, + "grad_condition": 2805609721.6904163, + "lr": 0.0007938926261462367, + "time_sec": 167.02854776382446 + }, + { + "epoch": 31, + "train_loss": 4.50321345703125, + "train_acc": 0.09666, + "test_loss": 2.3035490158081053, + "test_acc": 0.1, + "lyapunov": 2.607592426602493, + "grad_norm": 0.10039091720588617, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007810416889260654, + "time_sec": 167.07999300956726 + }, + { + "epoch": 32, + "train_loss": 4.501663753662109, + "train_acc": 0.09806, + "test_loss": 2.3034838943481444, + "test_acc": 0.1, + "lyapunov": 2.607143198437703, + "grad_norm": 0.1048906506411198, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894983, + "time_sec": 167.00407528877258 + }, + { + "epoch": 33, + "train_loss": 4.5019655114746095, + "train_acc": 0.09498, + "test_loss": 2.30348473739624, + "test_acc": 0.1, + "lyapunov": 2.607365154549289, + "grad_norm": 0.09466991605122166, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007545207078751857, + "time_sec": 167.04430413246155 + }, + { + "epoch": 34, + "train_loss": 4.4972885162353515, + "train_acc": 0.09806, + "test_loss": 2.3035587966918945, + "test_acc": 0.1, + "lyapunov": 2.6045894854513887, + "grad_norm": 0.094802640603578, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007408768370508577, + "time_sec": 167.01064467430115 + }, + { + "epoch": 35, + "train_loss": 4.496900313110352, + "train_acc": 0.09916, + "test_loss": 2.3035878532409666, + "test_acc": 0.1, + "lyapunov": 2.6043496991667294, + "grad_norm": 0.08505627865784493, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007269952498697734, + "time_sec": 167.04931592941284 + }, + { + "epoch": 36, + "train_loss": 4.498045174407959, + "train_acc": 0.09896, + "test_loss": 2.303556993865967, + "test_acc": 0.1, + "lyapunov": 2.6051284626621722, + "grad_norm": 0.08865673943824036, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825364, + "time_sec": 166.99707579612732 + }, + { + "epoch": 37, + "train_loss": 4.494941578521728, + "train_acc": 0.09764, + "test_loss": 2.3035079292297365, + "test_acc": 0.1, + "lyapunov": 2.6031092463247, + "grad_norm": 0.09732931123675816, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006985739453173903, + "time_sec": 167.02038192749023 + }, + { + "epoch": 38, + "train_loss": 4.496269936523437, + "train_acc": 0.09764, + "test_loss": 2.3035408573150633, + "test_acc": 0.1, + "lyapunov": 2.604000445217123, + "grad_norm": 0.08852073271727623, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423391, + "time_sec": 167.02108144760132 + }, + { + "epoch": 39, + "train_loss": 4.493522086791992, + "train_acc": 0.09734, + "test_loss": 2.303493659210205, + "test_acc": 0.1, + "lyapunov": 2.6023181265272446, + "grad_norm": 0.08748337786673831, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006693689601226458, + "time_sec": 167.05211973190308 + }, + { + "epoch": 40, + "train_loss": 4.498229814758301, + "train_acc": 0.09844, + "test_loss": 2.3034747520446777, + "test_acc": 0.1, + "lyapunov": 2.6050954608966017, + "grad_norm": 0.10483613599174303, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874737, + "time_sec": 167.01571893692017 + }, + { + "epoch": 41, + "train_loss": 4.498432325286865, + "train_acc": 0.09692, + "test_loss": 2.3034770004272462, + "test_acc": 0.1, + "lyapunov": 2.6052994520767876, + "grad_norm": 0.09650951998583779, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006394955530196147, + "time_sec": 167.06526255607605 + }, + { + "epoch": 42, + "train_loss": 4.496120017395019, + "train_acc": 0.09806, + "test_loss": 2.303461635971069, + "test_acc": 0.1, + "lyapunov": 2.6038818706941727, + "grad_norm": 0.08793824539769711, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824273, + "time_sec": 167.0240659713745 + }, + { + "epoch": 43, + "train_loss": 4.50342136932373, + "train_acc": 0.0968, + "test_loss": 3.123962462234497, + "test_acc": 0.1, + "lyapunov": 2.6082677432643178, + "grad_norm": 0.10763460634241757, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006090716206982714, + "time_sec": 167.04283785820007 + }, + { + "epoch": 44, + "train_loss": 4.497545390930176, + "train_acc": 0.0993, + "test_loss": 2.30349365196228, + "test_acc": 0.1, + "lyapunov": 2.6048193215714086, + "grad_norm": 0.0914051250208073, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005936906572928625, + "time_sec": 167.00522899627686 + }, + { + "epoch": 45, + "train_loss": 4.497059263458252, + "train_acc": 0.0983, + "test_loss": 2.303560007476807, + "test_acc": 0.1, + "lyapunov": 2.604434971919145, + "grad_norm": 0.09665268401606698, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005782172325201156, + "time_sec": 166.98798084259033 + }, + { + "epoch": 46, + "train_loss": 4.496945586547851, + "train_acc": 0.09766, + "test_loss": 2.303540351486206, + "test_acc": 0.1, + "lyapunov": 2.6044252626121502, + "grad_norm": 0.08182959271154387, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821523, + "time_sec": 167.05580401420593 + }, + { + "epoch": 47, + "train_loss": 4.5494916119384765, + "train_acc": 0.0975, + "test_loss": 2.3035491088867186, + "test_acc": 0.1, + "lyapunov": 2.6250632187289655, + "grad_norm": 0.16118104591565238, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005470541566592572, + "time_sec": 167.02027297019958 + }, + { + "epoch": 48, + "train_loss": 4.527786728515625, + "train_acc": 0.09808, + "test_loss": 2.303548764038086, + "test_acc": 0.1, + "lyapunov": 2.6161820851933317, + "grad_norm": 0.1522047852768872, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646569, + "time_sec": 167.08899068832397 + }, + { + "epoch": 49, + "train_loss": 4.49808083328247, + "train_acc": 0.0977, + "test_loss": 2.3034967575073244, + "test_acc": 0.1, + "lyapunov": 2.6051423244769008, + "grad_norm": 0.09227111356756569, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005157053795390643, + "time_sec": 167.04247641563416 + }, + { + "epoch": 50, + "train_loss": 4.506656402282715, + "train_acc": 0.09788, + "test_loss": 2.3035506187438965, + "test_acc": 0.1, + "lyapunov": 2.6092079515042514, + "grad_norm": 0.0989012749171036, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005000000000000002, + "time_sec": 167.06817507743835 + }, + { + "epoch": 51, + "train_loss": 4.518285944213867, + "train_acc": 0.09874, + "test_loss": 2.303562999343872, + "test_acc": 0.1, + "lyapunov": 2.6132117506793087, + "grad_norm": 0.14702247022618603, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00048429462046093607, + "time_sec": 167.00237131118774 + }, + { + "epoch": 52, + "train_loss": 4.510767389526367, + "train_acc": 0.0985, + "test_loss": 2.303548727416992, + "test_acc": 0.1, + "lyapunov": 2.611425805884554, + "grad_norm": 0.12770796891288963, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004686047402353435, + "time_sec": 167.03129529953003 + }, + { + "epoch": 53, + "train_loss": 4.524528532714844, + "train_acc": 0.09758, + "test_loss": 2.3034987804412843, + "test_acc": 0.1, + "lyapunov": 2.6168906950889648, + "grad_norm": 0.16221922023587404, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000452945843340743, + "time_sec": 167.0302333831787 + }, + { + "epoch": 54, + "train_loss": 4.514558558197021, + "train_acc": 0.09898, + "test_loss": 2.3035224128723146, + "test_acc": 0.1, + "lyapunov": 2.6116219816915214, + "grad_norm": 0.11874932612009399, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784806, + "time_sec": 167.03262758255005 + }, + { + "epoch": 55, + "train_loss": 4.500117692108154, + "train_acc": 0.0969, + "test_loss": 2.303501333999634, + "test_acc": 0.1, + "lyapunov": 2.6062854854652033, + "grad_norm": 0.10674428233360923, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004217827674798847, + "time_sec": 166.98121881484985 + }, + { + "epoch": 56, + "train_loss": 4.51960044921875, + "train_acc": 0.09628, + "test_loss": 2.30349303855896, + "test_acc": 0.1, + "lyapunov": 2.616247482616883, + "grad_norm": 0.14277503967283073, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00040630934270713783, + "time_sec": 167.03360319137573 + }, + { + "epoch": 57, + "train_loss": 4.538308909759522, + "train_acc": 0.0975, + "test_loss": 2.303505461502075, + "test_acc": 0.1, + "lyapunov": 2.624653117431094, + "grad_norm": 0.17354441507562746, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000390928379301729, + "time_sec": 167.00332236289978 + }, + { + "epoch": 58, + "train_loss": 4.5402243867492675, + "train_acc": 0.09768, + "test_loss": 2.3034944499969483, + "test_acc": 0.1, + "lyapunov": 2.6235652969926213, + "grad_norm": 0.18590049129605235, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003756550564175727, + "time_sec": 166.94713830947876 + }, + { + "epoch": 59, + "train_loss": 4.497288510131836, + "train_acc": 0.09656, + "test_loss": 2.303503835296631, + "test_acc": 0.1, + "lyapunov": 2.60465430237753, + "grad_norm": 0.08925667815477244, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036050444698038553, + "time_sec": 166.97111773490906 + }, + { + "epoch": 60, + "train_loss": 4.520837378082275, + "train_acc": 0.09746, + "test_loss": 2.3035025501251223, + "test_acc": 0.1, + "lyapunov": 2.6177086183787, + "grad_norm": 0.14390327015753798, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00034549150281252655, + "time_sec": 166.95851969718933 + }, + { + "epoch": 61, + "train_loss": 4.503204351348877, + "train_acc": 0.09616, + "test_loss": 2.3035063259124757, + "test_acc": 0.1, + "lyapunov": 2.6079881752238556, + "grad_norm": 0.11060100204296372, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003306310398773544, + "time_sec": 167.04684805870056 + }, + { + "epoch": 62, + "train_loss": 4.529549421844482, + "train_acc": 0.0966, + "test_loss": 2.303504373550415, + "test_acc": 0.1, + "lyapunov": 2.620155497889994, + "grad_norm": 0.25260476730678916, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766127, + "time_sec": 166.9670557975769 + }, + { + "epoch": 63, + "train_loss": 4.504642747955322, + "train_acc": 0.09824, + "test_loss": 2.302585437011719, + "test_acc": 0.1, + "lyapunov": 2.6090027182303426, + "grad_norm": 0.14482467729355822, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003014260546826097, + "time_sec": 167.07136464118958 + }, + { + "epoch": 64, + "train_loss": 4.5207818331909175, + "train_acc": 0.09658, + "test_loss": 2.302585619735718, + "test_acc": 0.1, + "lyapunov": 2.6153993130949758, + "grad_norm": 0.14340140289375716, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002871103542174637, + "time_sec": 167.0296709537506 + }, + { + "epoch": 65, + "train_loss": 4.514579942321777, + "train_acc": 0.09692, + "test_loss": 2.302585908126831, + "test_acc": 0.1, + "lyapunov": 2.612202508370285, + "grad_norm": 0.11615853114383813, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002730047501302267, + "time_sec": 167.06110525131226 + }, + { + "epoch": 66, + "train_loss": 4.539550397949219, + "train_acc": 0.09668, + "test_loss": 2.3025857189178467, + "test_acc": 0.1, + "lyapunov": 2.6239442215551194, + "grad_norm": 0.24377422344866448, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00025912316294914234, + "time_sec": 166.96833562850952 + }, + { + "epoch": 67, + "train_loss": 4.520765433959961, + "train_acc": 0.09678, + "test_loss": 2.3025856506347657, + "test_acc": 0.1, + "lyapunov": 2.6144380130426352, + "grad_norm": 0.17143215114502838, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002454792921248144, + "time_sec": 167.06375288963318 + }, + { + "epoch": 68, + "train_loss": 4.501224665222168, + "train_acc": 0.09848, + "test_loss": 2.3025851860046385, + "test_acc": 0.1, + "lyapunov": 2.606965447935607, + "grad_norm": 0.22167025880962787, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00023208660251050164, + "time_sec": 166.97689723968506 + }, + { + "epoch": 69, + "train_loss": 4.516330520629883, + "train_acc": 0.09716, + "test_loss": 2.3025853271484373, + "test_acc": 0.1, + "lyapunov": 2.6127135893877815, + "grad_norm": 0.1178159153430125, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00021895831107393473, + "time_sec": 167.03971099853516 + }, + { + "epoch": 70, + "train_loss": 4.518335289764404, + "train_acc": 0.09628, + "test_loss": 2.3025851623535156, + "test_acc": 0.1, + "lyapunov": 2.614670734576252, + "grad_norm": 0.19910468609269888, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376356, + "time_sec": 167.01087379455566 + }, + { + "epoch": 71, + "train_loss": 4.506198991699219, + "train_acc": 0.0961, + "test_loss": 2.3025853843688964, + "test_acc": 0.1, + "lyapunov": 2.6081283720557953, + "grad_norm": 0.09098734124729495, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019354647317351177, + "time_sec": 167.0194799900055 + }, + { + "epoch": 72, + "train_loss": 4.49574895111084, + "train_acc": 0.09856, + "test_loss": 2.3025853591918946, + "test_acc": 0.1, + "lyapunov": 2.603733692632612, + "grad_norm": 0.08176729544229487, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001812880051256552, + "time_sec": 167.05306220054626 + }, + { + "epoch": 73, + "train_loss": 4.497463835449219, + "train_acc": 0.09886, + "test_loss": 2.3025851680755616, + "test_acc": 0.1, + "lyapunov": 2.604736436053615, + "grad_norm": 0.082986396115534, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016934406733817422, + "time_sec": 166.98811650276184 + }, + { + "epoch": 74, + "train_loss": 4.4971358953857425, + "train_acc": 0.09738, + "test_loss": 2.302585493850708, + "test_acc": 0.1, + "lyapunov": 2.6045719363805278, + "grad_norm": 0.08151196821637299, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001577264470356557, + "time_sec": 167.01667833328247 + }, + { + "epoch": 75, + "train_loss": 4.50925322631836, + "train_acc": 0.0967, + "test_loss": 2.302585232925415, + "test_acc": 0.1, + "lyapunov": 2.6094926751178242, + "grad_norm": 0.21190207725464844, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014644660940672634, + "time_sec": 166.97911548614502 + }, + { + "epoch": 76, + "train_loss": 4.496390933227539, + "train_acc": 0.0967, + "test_loss": 2.302585297393799, + "test_acc": 0.1, + "lyapunov": 2.6040706823549002, + "grad_norm": 0.08435313407684436, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001355156862892944, + "time_sec": 167.0480306148529 + }, + { + "epoch": 77, + "train_loss": 4.496095029296875, + "train_acc": 0.0965, + "test_loss": 2.3025853218078614, + "test_acc": 0.1, + "lyapunov": 2.6039189987475306, + "grad_norm": 0.1373346720572696, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012494446518477025, + "time_sec": 166.97820734977722 + }, + { + "epoch": 78, + "train_loss": 4.499068414611816, + "train_acc": 0.096, + "test_loss": 2.3025852237701416, + "test_acc": 0.1, + "lyapunov": 2.605743714305751, + "grad_norm": 0.10939849657650327, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210548, + "time_sec": 166.98934531211853 + }, + { + "epoch": 79, + "train_loss": 4.4964453392028805, + "train_acc": 0.09828, + "test_loss": 2.302585151672363, + "test_acc": 0.1, + "lyapunov": 2.604178778655694, + "grad_norm": 0.08774538011729731, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010492249381215483, + "time_sec": 167.02672863006592 + }, + { + "epoch": 80, + "train_loss": 4.499743932647705, + "train_acc": 0.09862, + "test_loss": 2.302585228347778, + "test_acc": 0.1, + "lyapunov": 2.606093951808217, + "grad_norm": 0.2420142867175763, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252637e-05, + "time_sec": 167.10957646369934 + }, + { + "epoch": 81, + "train_loss": 4.502734872436523, + "train_acc": 0.09578, + "test_loss": 2.302585201263428, + "test_acc": 0.1, + "lyapunov": 2.6076697900776975, + "grad_norm": 0.13251791023485532, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.645971286271918e-05, + "time_sec": 166.9769287109375 + }, + { + "epoch": 82, + "train_loss": 4.494626608581543, + "train_acc": 0.09758, + "test_loss": 2.3025851295471194, + "test_acc": 0.1, + "lyapunov": 2.6029957383489974, + "grad_norm": 0.08170465976084904, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.78360372489926e-05, + "time_sec": 167.00449562072754 + }, + { + "epoch": 83, + "train_loss": 4.495700520019532, + "train_acc": 0.09822, + "test_loss": 2.3025853286743163, + "test_acc": 0.1, + "lyapunov": 2.6036597090913816, + "grad_norm": 0.1210411913955966, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.962898649802815e-05, + "time_sec": 166.96435856819153 + }, + { + "epoch": 84, + "train_loss": 4.49369448425293, + "train_acc": 0.09848, + "test_loss": 2.3025850296020507, + "test_acc": 0.1, + "lyapunov": 2.6024485061235745, + "grad_norm": 0.1169116031555102, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806824e-05, + "time_sec": 166.9589819908142 + }, + { + "epoch": 85, + "train_loss": 4.493269319915772, + "train_acc": 0.09772, + "test_loss": 2.3025851333618164, + "test_acc": 0.1, + "lyapunov": 2.60219204151417, + "grad_norm": 0.08026909865070977, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.449673790581613e-05, + "time_sec": 167.0204620361328 + }, + { + "epoch": 86, + "train_loss": 4.4974218487548825, + "train_acc": 0.09802, + "test_loss": 2.302585245895386, + "test_acc": 0.1, + "lyapunov": 2.604730949987231, + "grad_norm": 0.08689607041758553, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.758647376699034e-05, + "time_sec": 166.964524269104 + }, + { + "epoch": 87, + "train_loss": 4.495326493072509, + "train_acc": 0.0982, + "test_loss": 2.3025850296020507, + "test_acc": 0.1, + "lyapunov": 2.603457776481843, + "grad_norm": 0.09583928752803095, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.112268715800956e-05, + "time_sec": 167.03006196022034 + }, + { + "epoch": 88, + "train_loss": 4.494311538085937, + "train_acc": 0.09762, + "test_loss": 2.3025852684020998, + "test_acc": 0.1, + "lyapunov": 2.602831931980065, + "grad_norm": 0.08201988600112256, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.511175705587434e-05, + "time_sec": 166.98635745048523 + }, + { + "epoch": 89, + "train_loss": 4.497406745605469, + "train_acc": 0.09872, + "test_loss": 2.302585092926025, + "test_acc": 0.1, + "lyapunov": 2.6046652647540394, + "grad_norm": 0.11011286998675665, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.9559615522887284e-05, + "time_sec": 167.0066351890564 + }, + { + "epoch": 90, + "train_loss": 4.495393841552734, + "train_acc": 0.0955, + "test_loss": 2.3025851219177245, + "test_acc": 0.1, + "lyapunov": 2.603500037546963, + "grad_norm": 0.08854801622590937, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.447174185242324e-05, + "time_sec": 166.98117446899414 + }, + { + "epoch": 91, + "train_loss": 4.496799105529785, + "train_acc": 0.09778, + "test_loss": 2.3025851669311526, + "test_acc": 0.1, + "lyapunov": 2.6043886601772455, + "grad_norm": 0.08317548392372451, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.9853157161528526e-05, + "time_sec": 167.05606770515442 + }, + { + "epoch": 92, + "train_loss": 4.501456503753662, + "train_acc": 0.09732, + "test_loss": 2.302585040283203, + "test_acc": 0.1, + "lyapunov": 2.6069688260402826, + "grad_norm": 0.09601255447418665, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568452e-05, + "time_sec": 166.95690035820007 + }, + { + "epoch": 93, + "train_loss": 4.4988940646362305, + "train_acc": 0.09822, + "test_loss": 2.302585070037842, + "test_acc": 0.1, + "lyapunov": 2.6056473828337685, + "grad_norm": 0.11345521860163729, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.204161903062634e-05, + "time_sec": 167.01007437705994 + }, + { + "epoch": 94, + "train_loss": 4.500971371002198, + "train_acc": 0.09656, + "test_loss": 2.3025852294921876, + "test_acc": 0.1, + "lyapunov": 2.606662953296281, + "grad_norm": 0.10989679012817173, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.85637463565564e-06, + "time_sec": 166.93790555000305 + }, + { + "epoch": 95, + "train_loss": 4.496245345458984, + "train_acc": 0.09824, + "test_loss": 2.3025850425720216, + "test_acc": 0.1, + "lyapunov": 2.6040014677950185, + "grad_norm": 0.13386825999790872, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.155829702431171e-06, + "time_sec": 166.99875664710999 + }, + { + "epoch": 96, + "train_loss": 4.4964897052001955, + "train_acc": 0.09874, + "test_loss": 2.302585097122192, + "test_acc": 0.1, + "lyapunov": 2.6042159268313356, + "grad_norm": 0.09409731933962433, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761118e-06, + "time_sec": 166.96930813789368 + }, + { + "epoch": 97, + "train_loss": 4.499828433837891, + "train_acc": 0.1, + "test_loss": 2.3025849605560302, + "test_acc": 0.1, + "lyapunov": 2.6062122037648545, + "grad_norm": 0.16887612557601597, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.2190176984600023e-06, + "time_sec": 166.9714593887329 + }, + { + "epoch": 98, + "train_loss": 4.496156484069824, + "train_acc": 0.1, + "test_loss": 2.302585231781006, + "test_acc": 0.1, + "lyapunov": 2.603946977259253, + "grad_norm": 0.08139214809285189, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642206e-07, + "time_sec": 167.0184144973755 + }, + { + "epoch": 99, + "train_loss": 4.497607230377198, + "train_acc": 0.1, + "test_loss": 2.302585125350952, + "test_acc": 0.1, + "lyapunov": 2.6048427774473226, + "grad_norm": 0.08064979301518677, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.467198171342e-07, + "time_sec": 166.95221614837646 + }, + { + "epoch": 100, + "train_loss": 4.493742803955078, + "train_acc": 0.1, + "test_loss": 2.302585009765625, + "test_acc": 0.1, + "lyapunov": 2.602488872035385, + "grad_norm": 0.08215126330977654, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 166.99254083633423 + } + ] + } +}
\ No newline at end of file |
