diff options
| author | YurenHao0426 <blackhao0426@gmail.com> | 2026-01-13 23:49:05 -0600 |
|---|---|---|
| committer | YurenHao0426 <blackhao0426@gmail.com> | 2026-01-13 23:49:05 -0600 |
| commit | cd99d6b874d9d09b3bb87b8485cc787885af71f1 (patch) | |
| tree | 59a233959932ca0e4f12f196275e07fcf443b33f /runs/depth_scaling_hinge/cifar100_20260101-112306/results.json | |
init commit
Diffstat (limited to 'runs/depth_scaling_hinge/cifar100_20260101-112306/results.json')
| -rw-r--r-- | runs/depth_scaling_hinge/cifar100_20260101-112306/results.json | 16822 |
1 files changed, 16822 insertions, 0 deletions
diff --git a/runs/depth_scaling_hinge/cifar100_20260101-112306/results.json b/runs/depth_scaling_hinge/cifar100_20260101-112306/results.json new file mode 100644 index 0000000..97d572e --- /dev/null +++ b/runs/depth_scaling_hinge/cifar100_20260101-112306/results.json @@ -0,0 +1,16822 @@ +{ + "vanilla": { + "4": [ + { + "epoch": 1, + "train_loss": 4.341291038284302, + "train_acc": 0.09568, + "test_loss": 3.5902228660583497, + "test_acc": 0.1719, + "lyapunov": null, + "grad_norm": 6.233568552079335, + "grad_max_sv": 4.7545679092407225, + "grad_min_sv": 1.1250918028338219e-07, + "grad_condition": 47144055.51418194, + "lr": 0.0009998903417374227, + "time_sec": 17.830737352371216 + }, + { + "epoch": 2, + "train_loss": 3.4833403620910643, + "train_acc": 0.1875, + "test_loss": 3.2125896770477294, + "test_acc": 0.2413, + "lyapunov": null, + "grad_norm": 4.2883357141420815, + "grad_max_sv": 3.0223524630069734, + "grad_min_sv": 7.805360168200437e-08, + "grad_condition": 68434745.79111826, + "lr": 0.0009995614150494292, + "time_sec": 15.740124702453613 + }, + { + "epoch": 3, + "train_loss": 3.014097664794922, + "train_acc": 0.26054, + "test_loss": 2.8822019165039063, + "test_acc": 0.2889, + "lyapunov": null, + "grad_norm": 3.3688150071564396, + "grad_max_sv": 2.1886239469051363, + "grad_min_sv": 6.223103937719188e-08, + "grad_condition": 42282037.7115659, + "lr": 0.0009990133642141358, + "time_sec": 15.473703145980835 + }, + { + "epoch": 4, + "train_loss": 2.7143693132019044, + "train_acc": 0.31262, + "test_loss": 2.702446311187744, + "test_acc": 0.3208, + "lyapunov": null, + "grad_norm": 2.8785406038007317, + "grad_max_sv": 1.7646001279354095, + "grad_min_sv": 5.3701336399925025e-08, + "grad_condition": 43554152.39164617, + "lr": 0.0009982464296247522, + "time_sec": 15.499403238296509 + }, + { + "epoch": 5, + "train_loss": 2.5030348071289064, + "train_acc": 0.3554, + "test_loss": 2.763942724990845, + "test_acc": 0.329, + "lyapunov": null, + "grad_norm": 2.5897409787447465, + "grad_max_sv": 1.5612378805875777, + "grad_min_sv": 4.8854244893981046e-08, + "grad_condition": 41333195.00893615, + "lr": 0.0009972609476841367, + "time_sec": 15.488951683044434 + }, + { + "epoch": 6, + "train_loss": 2.3269909496307375, + "train_acc": 0.3938, + "test_loss": 2.4710379989624025, + "test_acc": 0.3761, + "lyapunov": null, + "grad_norm": 2.37414912310322, + "grad_max_sv": 1.3197038874030114, + "grad_min_sv": 4.5427973693196176e-08, + "grad_condition": 185703885.27271265, + "lr": 0.000996057350657239, + "time_sec": 15.497607707977295 + }, + { + "epoch": 7, + "train_loss": 2.1854072467041017, + "train_acc": 0.4216, + "test_loss": 2.951163561248779, + "test_acc": 0.323, + "lyapunov": null, + "grad_norm": 2.2068200870493837, + "grad_max_sv": 1.2339675694704055, + "grad_min_sv": 4.277283941478416e-08, + "grad_condition": 52095598.918328084, + "lr": 0.000994636166481494, + "time_sec": 15.472023725509644 + }, + { + "epoch": 8, + "train_loss": 2.0716393295288085, + "train_acc": 0.44928, + "test_loss": 2.2887711679458618, + "test_acc": 0.4114, + "lyapunov": null, + "grad_norm": 2.076990480510157, + "grad_max_sv": 1.131314830482006, + "grad_min_sv": 3.9886170205560846e-08, + "grad_condition": 41939669.82744624, + "lr": 0.0009929980185352525, + "time_sec": 15.464510440826416 + }, + { + "epoch": 9, + "train_loss": 1.974085814552307, + "train_acc": 0.47136, + "test_loss": 2.672110557174683, + "test_acc": 0.3601, + "lyapunov": null, + "grad_norm": 1.9761816566655848, + "grad_max_sv": 1.0417343363165856, + "grad_min_sv": 3.825020498116061e-08, + "grad_condition": 39964162.48622004, + "lr": 0.0009911436253643444, + "time_sec": 15.494410037994385 + }, + { + "epoch": 10, + "train_loss": 1.8730941659545899, + "train_acc": 0.49054, + "test_loss": 2.5056158615112305, + "test_acc": 0.3813, + "lyapunov": null, + "grad_norm": 1.8634099386367884, + "grad_max_sv": 0.9600013196468353, + "grad_min_sv": 3.579910488604732e-08, + "grad_condition": 34060738.21798731, + "lr": 0.0009890738003669028, + "time_sec": 15.488292455673218 + }, + { + "epoch": 11, + "train_loss": 1.7812603790664674, + "train_acc": 0.51462, + "test_loss": 2.477180172729492, + "test_acc": 0.3997, + "lyapunov": null, + "grad_norm": 1.7790099981650356, + "grad_max_sv": 0.9072641983628273, + "grad_min_sv": 3.4340940041621694e-08, + "grad_condition": 36834828.42576877, + "lr": 0.00098678945143658, + "time_sec": 15.484249591827393 + }, + { + "epoch": 12, + "train_loss": 1.714907325401306, + "train_acc": 0.52888, + "test_loss": 2.226099481582642, + "test_acc": 0.4353, + "lyapunov": null, + "grad_norm": 1.701538564781707, + "grad_max_sv": 0.8431645318865776, + "grad_min_sv": 3.240299342038844e-08, + "grad_condition": 64109426.95331051, + "lr": 0.0009842915805643154, + "time_sec": 15.483522891998291 + }, + { + "epoch": 13, + "train_loss": 1.648736492576599, + "train_acc": 0.5449, + "test_loss": 2.1634216318130495, + "test_acc": 0.4573, + "lyapunov": null, + "grad_norm": 1.6315158856421696, + "grad_max_sv": 0.7919500142335891, + "grad_min_sv": 3.0836463893457736e-08, + "grad_condition": 50314317.689856075, + "lr": 0.000981581283398829, + "time_sec": 15.491243362426758 + }, + { + "epoch": 14, + "train_loss": 1.5916738232421874, + "train_acc": 0.5591, + "test_loss": 2.5368153831481934, + "test_acc": 0.398, + "lyapunov": null, + "grad_norm": 1.579987574958028, + "grad_max_sv": 0.7741283252835274, + "grad_min_sv": 3.031987156898453e-08, + "grad_condition": 33629215.75141786, + "lr": 0.0009786597487660333, + "time_sec": 15.476540565490723 + }, + { + "epoch": 15, + "train_loss": 1.5378693001937866, + "train_acc": 0.57156, + "test_loss": 1.9343770442962647, + "test_acc": 0.4989, + "lyapunov": null, + "grad_norm": 1.5231234313765212, + "grad_max_sv": 0.7179134920239448, + "grad_min_sv": 2.8637837475031792e-08, + "grad_condition": 49527050.380315706, + "lr": 0.0009755282581475766, + "time_sec": 15.486248970031738 + }, + { + "epoch": 16, + "train_loss": 1.478127024307251, + "train_acc": 0.58584, + "test_loss": 1.9563913166046143, + "test_acc": 0.4922, + "lyapunov": null, + "grad_norm": 1.46325785921816, + "grad_max_sv": 0.6841573119163513, + "grad_min_sv": 2.716867457952521e-08, + "grad_condition": 56699539.529558375, + "lr": 0.0009721881851187403, + "time_sec": 15.49137544631958 + }, + { + "epoch": 17, + "train_loss": 1.429626383972168, + "train_acc": 0.59714, + "test_loss": 2.326792067337036, + "test_acc": 0.4336, + "lyapunov": null, + "grad_norm": 1.4242655219863833, + "grad_max_sv": 0.6712241530418396, + "grad_min_sv": 2.6996844360027695e-08, + "grad_condition": 40189659.16617282, + "lr": 0.0009686409947459456, + "time_sec": 15.493090391159058 + }, + { + "epoch": 18, + "train_loss": 1.395352936630249, + "train_acc": 0.6053, + "test_loss": 1.8314157381057738, + "test_acc": 0.5182, + "lyapunov": null, + "grad_norm": 1.3761305598419875, + "grad_max_sv": 0.6385130822658539, + "grad_min_sv": 2.6239096877211932e-08, + "grad_condition": 63284929.054803826, + "lr": 0.0009648882429441254, + "time_sec": 15.477057695388794 + }, + { + "epoch": 19, + "train_loss": 1.340607022781372, + "train_acc": 0.61952, + "test_loss": 1.9038033363342286, + "test_acc": 0.5042, + "lyapunov": null, + "grad_norm": 1.3323384681348491, + "grad_max_sv": 0.613679239153862, + "grad_min_sv": 2.4952525421112828e-08, + "grad_condition": 1048659082.6601179, + "lr": 0.00096093157579425, + "time_sec": 15.483818292617798 + }, + { + "epoch": 20, + "train_loss": 1.2925908715438843, + "train_acc": 0.62856, + "test_loss": 2.031341696929932, + "test_acc": 0.4835, + "lyapunov": null, + "grad_norm": 1.3034876314465462, + "grad_max_sv": 0.5816340684890747, + "grad_min_sv": 2.434145293522816e-08, + "grad_condition": 45204778.74017582, + "lr": 0.0009567727288213001, + "time_sec": 15.512004375457764 + }, + { + "epoch": 21, + "train_loss": 1.278655789756775, + "train_acc": 0.63278, + "test_loss": 1.8846191581726075, + "test_acc": 0.5135, + "lyapunov": null, + "grad_norm": 1.2776040716135673, + "grad_max_sv": 0.5780372425913811, + "grad_min_sv": 2.405527027016241e-08, + "grad_condition": 42159114.019685745, + "lr": 0.0009524135262330095, + "time_sec": 15.499945878982544 + }, + { + "epoch": 22, + "train_loss": 1.2383485181427003, + "train_acc": 0.64622, + "test_loss": 1.8699242074966431, + "test_acc": 0.518, + "lyapunov": null, + "grad_norm": 1.2460313700260512, + "grad_max_sv": 0.5693550139665604, + "grad_min_sv": 2.3625755932697724e-08, + "grad_condition": 247459954.48036852, + "lr": 0.0009478558801197061, + "time_sec": 15.489409923553467 + }, + { + "epoch": 23, + "train_loss": 1.208611516494751, + "train_acc": 0.6519, + "test_loss": 1.8377874282836915, + "test_acc": 0.526, + "lyapunov": null, + "grad_norm": 1.2268147245238885, + "grad_max_sv": 0.5506495118141175, + "grad_min_sv": 2.2982289769879482e-08, + "grad_condition": 91532045.29729453, + "lr": 0.000943101789615607, + "time_sec": 15.503745555877686 + }, + { + "epoch": 24, + "train_loss": 1.1756799732208252, + "train_acc": 0.66142, + "test_loss": 1.8445790365219117, + "test_acc": 0.5321, + "lyapunov": null, + "grad_norm": 1.1995646648047669, + "grad_max_sv": 0.5362823188304902, + "grad_min_sv": 2.227390833997589e-08, + "grad_condition": 39000923.8470154, + "lr": 0.0009381533400219313, + "time_sec": 15.488165855407715 + }, + { + "epoch": 25, + "train_loss": 1.1402707249450683, + "train_acc": 0.67004, + "test_loss": 2.1079253253936767, + "test_acc": 0.4853, + "lyapunov": null, + "grad_norm": 1.1685820076008453, + "grad_max_sv": 0.500711290538311, + "grad_min_sv": 2.1209413056388903e-08, + "grad_condition": 37717541.68981, + "lr": 0.0009330127018922189, + "time_sec": 15.519190073013306 + }, + { + "epoch": 26, + "train_loss": 1.115832226486206, + "train_acc": 0.67608, + "test_loss": 1.7950333555221558, + "test_acc": 0.5345, + "lyapunov": null, + "grad_norm": 1.1487591162708706, + "grad_max_sv": 0.5033038355410099, + "grad_min_sv": 2.1531226807036675e-08, + "grad_condition": 34912719.99916558, + "lr": 0.000927682130080253, + "time_sec": 15.500119924545288 + }, + { + "epoch": 27, + "train_loss": 1.0897642765426636, + "train_acc": 0.68058, + "test_loss": 1.9983017498016358, + "test_acc": 0.5014, + "lyapunov": null, + "grad_norm": 1.1397755659416107, + "grad_max_sv": 0.5070834219455719, + "grad_min_sv": 2.094801768229293e-08, + "grad_condition": 112680773.02319674, + "lr": 0.0009221639627510072, + "time_sec": 15.487388610839844 + }, + { + "epoch": 28, + "train_loss": 1.0600782299995422, + "train_acc": 0.6873, + "test_loss": 1.7331308700561523, + "test_acc": 0.552, + "lyapunov": null, + "grad_norm": 1.1194293581413437, + "grad_max_sv": 0.49243925511837006, + "grad_min_sv": 2.061250336264555e-08, + "grad_condition": 2391098394.247443, + "lr": 0.0009164606203550494, + "time_sec": 15.49947738647461 + }, + { + "epoch": 29, + "train_loss": 1.0288162441635131, + "train_acc": 0.6958, + "test_loss": 1.7574676347732543, + "test_acc": 0.5469, + "lyapunov": null, + "grad_norm": 1.0981602434296158, + "grad_max_sv": 0.4940373159945011, + "grad_min_sv": 2.0519680072120238e-08, + "grad_condition": 152798003.85014075, + "lr": 0.0009105746045668516, + "time_sec": 15.519279956817627 + }, + { + "epoch": 30, + "train_loss": 1.0005281573104858, + "train_acc": 0.70474, + "test_loss": 1.7724915187835693, + "test_acc": 0.5535, + "lyapunov": null, + "grad_norm": 1.0821209053569316, + "grad_max_sv": 0.4882327690720558, + "grad_min_sv": 2.040895886699923e-08, + "grad_condition": 106754784.91270833, + "lr": 0.0009045084971874733, + "time_sec": 15.495746612548828 + }, + { + "epoch": 31, + "train_loss": 0.9887743633651733, + "train_acc": 0.70736, + "test_loss": 1.803389212989807, + "test_acc": 0.5421, + "lyapunov": null, + "grad_norm": 1.0717360299018484, + "grad_max_sv": 0.4644377827644348, + "grad_min_sv": 1.9709001528034342e-08, + "grad_condition": 35783294.580241755, + "lr": 0.0008982649590120977, + "time_sec": 15.506318807601929 + }, + { + "epoch": 32, + "train_loss": 0.9635560890579223, + "train_acc": 0.71462, + "test_loss": 1.7782361072540283, + "test_acc": 0.5515, + "lyapunov": null, + "grad_norm": 1.0547768746381694, + "grad_max_sv": 0.47287538424134257, + "grad_min_sv": 1.9473239257217223e-08, + "grad_condition": 36442794.53940544, + "lr": 0.0008918467286629196, + "time_sec": 15.525408744812012 + }, + { + "epoch": 33, + "train_loss": 0.9454534896087646, + "train_acc": 0.71586, + "test_loss": 1.8413972650527954, + "test_acc": 0.5387, + "lyapunov": null, + "grad_norm": 1.0457002240106366, + "grad_max_sv": 0.4636484496295452, + "grad_min_sv": 1.9625483711760426e-08, + "grad_condition": 124503449.94674742, + "lr": 0.0008852566213878943, + "time_sec": 15.658098459243774 + }, + { + "epoch": 34, + "train_loss": 0.926147558670044, + "train_acc": 0.72194, + "test_loss": 1.8227524955749512, + "test_acc": 0.5492, + "lyapunov": null, + "grad_norm": 1.030398616328217, + "grad_max_sv": 0.44984652400016784, + "grad_min_sv": 1.8758673522856208e-08, + "grad_condition": 63054578.90943961, + "lr": 0.000878497527825878, + "time_sec": 15.51594591140747 + }, + { + "epoch": 35, + "train_loss": 0.8910220455551148, + "train_acc": 0.7339, + "test_loss": 1.7336375022888184, + "test_acc": 0.5649, + "lyapunov": null, + "grad_norm": 1.0076609346644876, + "grad_max_sv": 0.44372819289565085, + "grad_min_sv": 1.8551427522633945e-08, + "grad_condition": 50611185.75714277, + "lr": 0.000871572412738697, + "time_sec": 15.497729539871216 + }, + { + "epoch": 36, + "train_loss": 0.8785494363021851, + "train_acc": 0.73456, + "test_loss": 1.7843629848480225, + "test_acc": 0.5581, + "lyapunov": null, + "grad_norm": 0.9989169914835021, + "grad_max_sv": 0.4366959437727928, + "grad_min_sv": 1.8408271952943812e-08, + "grad_condition": 85310005.79090494, + "lr": 0.0008644843137107055, + "time_sec": 15.490435123443604 + }, + { + "epoch": 37, + "train_loss": 0.856938405303955, + "train_acc": 0.74212, + "test_loss": 1.78583115940094, + "test_acc": 0.5595, + "lyapunov": null, + "grad_norm": 0.9837943590828618, + "grad_max_sv": 0.42913608700037004, + "grad_min_sv": 1.799877897834534e-08, + "grad_condition": 44955472.82427679, + "lr": 0.0008572363398164014, + "time_sec": 15.537626266479492 + }, + { + "epoch": 38, + "train_loss": 0.8304045977973938, + "train_acc": 0.74954, + "test_loss": 1.9540308137893676, + "test_acc": 0.5338, + "lyapunov": null, + "grad_norm": 0.9705660429353747, + "grad_max_sv": 0.41689482182264326, + "grad_min_sv": 1.7790258101044177e-08, + "grad_condition": 85624723.50661872, + "lr": 0.0008498316702566826, + "time_sec": 15.500178813934326 + }, + { + "epoch": 39, + "train_loss": 0.820258391494751, + "train_acc": 0.74884, + "test_loss": 1.8685070798873902, + "test_acc": 0.5491, + "lyapunov": null, + "grad_norm": 0.9650066613971798, + "grad_max_sv": 0.42203645706176757, + "grad_min_sv": 1.7701675934789218e-08, + "grad_condition": 38471919.31748825, + "lr": 0.0008422735529643442, + "time_sec": 15.50774359703064 + }, + { + "epoch": 40, + "train_loss": 0.8059215658950806, + "train_acc": 0.75368, + "test_loss": 1.7993948059082032, + "test_acc": 0.5644, + "lyapunov": null, + "grad_norm": 0.9599648842149144, + "grad_max_sv": 0.42296523600816727, + "grad_min_sv": 1.7450433907606477e-08, + "grad_condition": 48602019.20439266, + "lr": 0.0008345653031794289, + "time_sec": 15.5121328830719 + }, + { + "epoch": 41, + "train_loss": 0.7813009564971923, + "train_acc": 0.76052, + "test_loss": 1.8404800394058227, + "test_acc": 0.5604, + "lyapunov": null, + "grad_norm": 0.9418789892686961, + "grad_max_sv": 0.40448441356420517, + "grad_min_sv": 1.731778200703138e-08, + "grad_condition": 98318164.88521431, + "lr": 0.0008267103019950526, + "time_sec": 15.492136240005493 + }, + { + "epoch": 42, + "train_loss": 0.7671393407821655, + "train_acc": 0.76604, + "test_loss": 1.793884058380127, + "test_acc": 0.5618, + "lyapunov": null, + "grad_norm": 0.9315468648605028, + "grad_max_sv": 0.38932052329182626, + "grad_min_sv": 1.6337376871483622e-08, + "grad_condition": 62943904.80942075, + "lr": 0.0008187119948743447, + "time_sec": 15.521047592163086 + }, + { + "epoch": 43, + "train_loss": 0.7535210326766968, + "train_acc": 0.76782, + "test_loss": 1.7884279314041138, + "test_acc": 0.5658, + "lyapunov": null, + "grad_norm": 0.9214199202766519, + "grad_max_sv": 0.39339111372828484, + "grad_min_sv": 1.6136958740434192e-08, + "grad_condition": 115362103.47666125, + "lr": 0.000810573890139155, + "time_sec": 15.505242109298706 + }, + { + "epoch": 44, + "train_loss": 0.7410284707832336, + "train_acc": 0.77312, + "test_loss": 1.7518087032318115, + "test_acc": 0.575, + "lyapunov": null, + "grad_norm": 0.9135862495102605, + "grad_max_sv": 0.4029770277440548, + "grad_min_sv": 1.6805088312935034e-08, + "grad_condition": 94769472.27955042, + "lr": 0.0008022995574311873, + "time_sec": 15.517944812774658 + }, + { + "epoch": 45, + "train_loss": 0.7176916319656372, + "train_acc": 0.77704, + "test_loss": 2.0678364603042603, + "test_acc": 0.5371, + "lyapunov": null, + "grad_norm": 0.9046856584920682, + "grad_max_sv": 0.3983215056359768, + "grad_min_sv": 1.613215366361165e-08, + "grad_condition": 71122656.74298272, + "lr": 0.0007938926261462363, + "time_sec": 15.508166313171387 + }, + { + "epoch": 46, + "train_loss": 0.7069017255210877, + "train_acc": 0.7811, + "test_loss": 1.7433353471755981, + "test_acc": 0.5852, + "lyapunov": null, + "grad_norm": 0.8978206260313095, + "grad_max_sv": 0.3794424146413803, + "grad_min_sv": 1.602237248293781e-08, + "grad_condition": 54736720.76954285, + "lr": 0.0007853567838422158, + "time_sec": 15.502079725265503 + }, + { + "epoch": 47, + "train_loss": 0.6877984882736206, + "train_acc": 0.7887, + "test_loss": 1.818675978088379, + "test_acc": 0.571, + "lyapunov": null, + "grad_norm": 0.8819975234594025, + "grad_max_sv": 0.3825521655380726, + "grad_min_sv": 1.5721361913863253e-08, + "grad_condition": 205362522.60160935, + "lr": 0.0007766957746216719, + "time_sec": 15.509292840957642 + }, + { + "epoch": 48, + "train_loss": 0.6792054767608643, + "train_acc": 0.78942, + "test_loss": 1.8216966215133668, + "test_acc": 0.5718, + "lyapunov": null, + "grad_norm": 0.8744607628160516, + "grad_max_sv": 0.3726635776460171, + "grad_min_sv": 1.5723771835604582e-08, + "grad_condition": 93081917.25808936, + "lr": 0.0007679133974894982, + "time_sec": 15.525796890258789 + }, + { + "epoch": 49, + "train_loss": 0.6626561027145386, + "train_acc": 0.79284, + "test_loss": 1.772965872001648, + "test_acc": 0.5863, + "lyapunov": null, + "grad_norm": 0.8660062343667397, + "grad_max_sv": 0.3925539918243885, + "grad_min_sv": 1.5532864388332138e-08, + "grad_condition": 566473525.6824175, + "lr": 0.000759013504686565, + "time_sec": 15.50195598602295 + }, + { + "epoch": 50, + "train_loss": 0.6532552631759644, + "train_acc": 0.79666, + "test_loss": 1.8317417165756225, + "test_acc": 0.5724, + "lyapunov": null, + "grad_norm": 0.860130500782199, + "grad_max_sv": 0.3667507700622082, + "grad_min_sv": 1.5443047825941526e-08, + "grad_condition": 91486044.66793105, + "lr": 0.0007499999999999998, + "time_sec": 15.508357286453247 + }, + { + "epoch": 51, + "train_loss": 0.6380054843711853, + "train_acc": 0.80084, + "test_loss": 1.8737646755218507, + "test_acc": 0.5686, + "lyapunov": null, + "grad_norm": 0.8524936007576276, + "grad_max_sv": 0.3761135272681713, + "grad_min_sv": 1.5451151683110177e-08, + "grad_condition": 34353598.33829906, + "lr": 0.0007408768370508575, + "time_sec": 15.523806810379028 + }, + { + "epoch": 52, + "train_loss": 0.6237339858055114, + "train_acc": 0.80636, + "test_loss": 1.761890636062622, + "test_acc": 0.5872, + "lyapunov": null, + "grad_norm": 0.8410504283608066, + "grad_max_sv": 0.358472990244627, + "grad_min_sv": 1.503268568618654e-08, + "grad_condition": 136795884.7400892, + "lr": 0.0007316480175599307, + "time_sec": 15.495483636856079 + }, + { + "epoch": 53, + "train_loss": 0.6058457711982727, + "train_acc": 0.80932, + "test_loss": 1.9825311820983886, + "test_acc": 0.5638, + "lyapunov": null, + "grad_norm": 0.8335328667900934, + "grad_max_sv": 0.36334397196769713, + "grad_min_sv": 1.5307615661760283e-08, + "grad_condition": 250366089.5715099, + "lr": 0.0007223175895924635, + "time_sec": 15.514543771743774 + }, + { + "epoch": 54, + "train_loss": 0.6004596606063842, + "train_acc": 0.81078, + "test_loss": 1.8254186273574828, + "test_acc": 0.5794, + "lyapunov": null, + "grad_norm": 0.8274523113635032, + "grad_max_sv": 0.36342041566967964, + "grad_min_sv": 1.4868843903077106e-08, + "grad_condition": 300576728.02848065, + "lr": 0.0007128896457825361, + "time_sec": 15.540250062942505 + }, + { + "epoch": 55, + "train_loss": 0.5861557857704163, + "train_acc": 0.8164, + "test_loss": 1.824499238014221, + "test_acc": 0.583, + "lyapunov": null, + "grad_norm": 0.8198101267614993, + "grad_max_sv": 0.357354723662138, + "grad_min_sv": 1.4506401982417039e-08, + "grad_condition": 35029629.47074116, + "lr": 0.0007033683215378998, + "time_sec": 15.531729459762573 + }, + { + "epoch": 56, + "train_loss": 0.5844129343986512, + "train_acc": 0.81744, + "test_loss": 1.9169658557891847, + "test_acc": 0.5711, + "lyapunov": null, + "grad_norm": 0.8204173814530821, + "grad_max_sv": 0.35366991981863977, + "grad_min_sv": 1.4835723899028764e-08, + "grad_condition": 72623356.9140754, + "lr": 0.0006937577932260512, + "time_sec": 15.517155647277832 + }, + { + "epoch": 57, + "train_loss": 0.567106929988861, + "train_acc": 0.82118, + "test_loss": 1.872194965362549, + "test_acc": 0.5783, + "lyapunov": null, + "grad_norm": 0.8144173645411016, + "grad_max_sv": 0.3568101763725281, + "grad_min_sv": 1.459230552047601e-08, + "grad_condition": 479856948.8028302, + "lr": 0.0006840622763423388, + "time_sec": 15.499967098236084 + }, + { + "epoch": 58, + "train_loss": 0.5492036812782287, + "train_acc": 0.82718, + "test_loss": 1.9435380107879638, + "test_acc": 0.5717, + "lyapunov": null, + "grad_norm": 0.8017437900627353, + "grad_max_sv": 0.35105792358517646, + "grad_min_sv": 1.4126277701753675e-08, + "grad_condition": 43594921.05141826, + "lr": 0.0006742860236609073, + "time_sec": 15.517162084579468 + }, + { + "epoch": 59, + "train_loss": 0.5499647881126404, + "train_acc": 0.82578, + "test_loss": 1.9104221244812012, + "test_acc": 0.5719, + "lyapunov": null, + "grad_norm": 0.8008754176084809, + "grad_max_sv": 0.35147457346320155, + "grad_min_sv": 1.4486321607987823e-08, + "grad_condition": 183104197.19597444, + "lr": 0.0006644333233692913, + "time_sec": 15.51251220703125 + }, + { + "epoch": 60, + "train_loss": 0.534982263879776, + "train_acc": 0.83032, + "test_loss": 1.8654183416366577, + "test_acc": 0.5849, + "lyapunov": null, + "grad_norm": 0.7872093874708191, + "grad_max_sv": 0.3456037163734436, + "grad_min_sv": 1.4336570289236833e-08, + "grad_condition": 4249914917.2238555, + "lr": 0.0006545084971874734, + "time_sec": 15.505401134490967 + }, + { + "epoch": 61, + "train_loss": 0.5249415069770813, + "train_acc": 0.83296, + "test_loss": 1.8301967880249024, + "test_acc": 0.5899, + "lyapunov": null, + "grad_norm": 0.7823659308548245, + "grad_max_sv": 0.3372106350958347, + "grad_min_sv": 1.3865955505228816e-08, + "grad_condition": 252598095.01328754, + "lr": 0.0006445158984722354, + "time_sec": 15.503329277038574 + }, + { + "epoch": 62, + "train_loss": 0.510102439250946, + "train_acc": 0.8393, + "test_loss": 1.866330424118042, + "test_acc": 0.5875, + "lyapunov": null, + "grad_norm": 0.7690765731453699, + "grad_max_sv": 0.3254604462534189, + "grad_min_sv": 1.3302552516816778e-08, + "grad_condition": 201820413.1939206, + "lr": 0.0006344599103076324, + "time_sec": 15.51197862625122 + }, + { + "epoch": 63, + "train_loss": 0.5105279865837097, + "train_acc": 0.83724, + "test_loss": 1.901947551727295, + "test_acc": 0.5827, + "lyapunov": null, + "grad_norm": 0.7774036231362129, + "grad_max_sv": 0.3391082786023617, + "grad_min_sv": 1.3618166180666413e-08, + "grad_condition": 142624827.53962922, + "lr": 0.0006243449435824269, + "time_sec": 15.512575387954712 + }, + { + "epoch": 64, + "train_loss": 0.4943154125213623, + "train_acc": 0.84368, + "test_loss": 1.8720532272338868, + "test_acc": 0.5871, + "lyapunov": null, + "grad_norm": 0.7622106739600653, + "grad_max_sv": 0.3370689533650875, + "grad_min_sv": 1.3509893057039868e-08, + "grad_condition": 110330065.15549783, + "lr": 0.0006141754350553275, + "time_sec": 15.502142667770386 + }, + { + "epoch": 65, + "train_loss": 0.47654122495651247, + "train_acc": 0.84812, + "test_loss": 1.905906325340271, + "test_acc": 0.5836, + "lyapunov": null, + "grad_norm": 0.7485726591566199, + "grad_max_sv": 0.3178395930677652, + "grad_min_sv": 1.3372613298992531e-08, + "grad_condition": 61795906.83332411, + "lr": 0.0006039558454088793, + "time_sec": 15.515769243240356 + }, + { + "epoch": 66, + "train_loss": 0.4698985565757752, + "train_acc": 0.85062, + "test_loss": 1.9764730356216431, + "test_acc": 0.5772, + "lyapunov": null, + "grad_norm": 0.742030695327052, + "grad_max_sv": 0.32952211387455466, + "grad_min_sv": 1.321727686021503e-08, + "grad_condition": 4546159923.454214, + "lr": 0.000593690657292862, + "time_sec": 15.48769211769104 + }, + { + "epoch": 67, + "train_loss": 0.4604379980945587, + "train_acc": 0.8524, + "test_loss": 1.796267902946472, + "test_acc": 0.6041, + "lyapunov": null, + "grad_norm": 0.740514981620189, + "grad_max_sv": 0.33283664137125013, + "grad_min_sv": 1.3323875688170395e-08, + "grad_condition": 50110355.592218384, + "lr": 0.0005833843733580507, + "time_sec": 15.512935638427734 + }, + { + "epoch": 68, + "train_loss": 0.44513163749694823, + "train_acc": 0.85782, + "test_loss": 1.882637822341919, + "test_acc": 0.5923, + "lyapunov": null, + "grad_norm": 0.728632370248676, + "grad_max_sv": 0.3257355663925409, + "grad_min_sv": 1.2869882924648746e-08, + "grad_condition": 63884816.41740811, + "lr": 0.0005730415142812054, + "time_sec": 15.52915072441101 + }, + { + "epoch": 69, + "train_loss": 0.4467424920272827, + "train_acc": 0.85622, + "test_loss": 1.8523083587646485, + "test_acc": 0.5958, + "lyapunov": null, + "grad_norm": 0.7288387711248852, + "grad_max_sv": 0.322311682254076, + "grad_min_sv": 1.291249293496055e-08, + "grad_condition": 179204657.50522354, + "lr": 0.0005626666167821517, + "time_sec": 15.511183738708496 + }, + { + "epoch": 70, + "train_loss": 0.4350817290687561, + "train_acc": 0.86062, + "test_loss": 1.9277977352142335, + "test_acc": 0.5905, + "lyapunov": null, + "grad_norm": 0.7211268163108158, + "grad_max_sv": 0.3169262710958719, + "grad_min_sv": 1.2573862395379165e-08, + "grad_condition": 248234270.03092772, + "lr": 0.0005522642316338265, + "time_sec": 15.514695167541504 + }, + { + "epoch": 71, + "train_loss": 0.43583440225601194, + "train_acc": 0.86066, + "test_loss": 1.940795637512207, + "test_acc": 0.59, + "lyapunov": null, + "grad_norm": 0.7218256453060395, + "grad_max_sv": 0.3179506029933691, + "grad_min_sv": 1.2854640636141001e-08, + "grad_condition": 159315542.25023228, + "lr": 0.0005418389216661573, + "time_sec": 15.515326499938965 + }, + { + "epoch": 72, + "train_loss": 0.414209595451355, + "train_acc": 0.86682, + "test_loss": 1.9192114906311035, + "test_acc": 0.5871, + "lyapunov": null, + "grad_norm": 0.7026800304062572, + "grad_max_sv": 0.3194992933422327, + "grad_min_sv": 1.2563614283167892e-08, + "grad_condition": 438466879.2604634, + "lr": 0.0005313952597646563, + "time_sec": 15.508101224899292 + }, + { + "epoch": 73, + "train_loss": 0.41810142745018003, + "train_acc": 0.86568, + "test_loss": 1.9427220703125, + "test_acc": 0.5871, + "lyapunov": null, + "grad_norm": 0.7107104457797438, + "grad_max_sv": 0.3116331197321415, + "grad_min_sv": 1.2560458482156755e-08, + "grad_condition": 218040038.56003165, + "lr": 0.0005209378268645994, + "time_sec": 15.528023719787598 + }, + { + "epoch": 74, + "train_loss": 0.4033842642211914, + "train_acc": 0.87, + "test_loss": 1.9472733200073242, + "test_acc": 0.5874, + "lyapunov": null, + "grad_norm": 0.6981925142164059, + "grad_max_sv": 0.3173716105520725, + "grad_min_sv": 1.260878115683789e-08, + "grad_condition": 120156618.97368078, + "lr": 0.0005104712099416781, + "time_sec": 15.506508111953735 + }, + { + "epoch": 75, + "train_loss": 0.39077227040290835, + "train_acc": 0.87468, + "test_loss": 1.857486226272583, + "test_acc": 0.598, + "lyapunov": null, + "grad_norm": 0.6856338799556791, + "grad_max_sv": 0.30381867848336697, + "grad_min_sv": 1.2063926282295315e-08, + "grad_condition": 414020461.3005485, + "lr": 0.0004999999999999996, + "time_sec": 15.522391557693481 + }, + { + "epoch": 76, + "train_loss": 0.3836136112689972, + "train_acc": 0.8757, + "test_loss": 1.9512550479888917, + "test_acc": 0.587, + "lyapunov": null, + "grad_norm": 0.6870816068446682, + "grad_max_sv": 0.3084618851542473, + "grad_min_sv": 1.2161173516388873e-08, + "grad_condition": 299698503.7116597, + "lr": 0.0004895287900583212, + "time_sec": 15.51857614517212 + }, + { + "epoch": 77, + "train_loss": 0.38193485226631163, + "train_acc": 0.87626, + "test_loss": 1.8681373037338256, + "test_acc": 0.5993, + "lyapunov": null, + "grad_norm": 0.6828844071671899, + "grad_max_sv": 0.30646760389208794, + "grad_min_sv": 1.2204253475693593e-08, + "grad_condition": 272459180.1924466, + "lr": 0.0004790621731353997, + "time_sec": 15.519853591918945 + }, + { + "epoch": 78, + "train_loss": 0.37069116824150083, + "train_acc": 0.88084, + "test_loss": 1.875751858139038, + "test_acc": 0.6043, + "lyapunov": null, + "grad_norm": 0.6706724909872018, + "grad_max_sv": 0.30184795036911966, + "grad_min_sv": 1.1925269455606569e-08, + "grad_condition": 303963866.0557478, + "lr": 0.000468604740235343, + "time_sec": 15.520630836486816 + }, + { + "epoch": 79, + "train_loss": 0.3643507383155823, + "train_acc": 0.88364, + "test_loss": 1.9180334386825562, + "test_acc": 0.5942, + "lyapunov": null, + "grad_norm": 0.6691117052818351, + "grad_max_sv": 0.2972587738186121, + "grad_min_sv": 1.1847118905870552e-08, + "grad_condition": 4229198196.1638947, + "lr": 0.00045816107833384175, + "time_sec": 15.53023386001587 + }, + { + "epoch": 80, + "train_loss": 0.3633389077377319, + "train_acc": 0.88294, + "test_loss": 1.8658218830108642, + "test_acc": 0.6003, + "lyapunov": null, + "grad_norm": 0.6700579474761854, + "grad_max_sv": 0.2936097148805857, + "grad_min_sv": 1.1731030144946502e-08, + "grad_condition": 196324429.7051069, + "lr": 0.0004477357683661729, + "time_sec": 15.50595474243164 + }, + { + "epoch": 81, + "train_loss": 0.35195467962265015, + "train_acc": 0.88632, + "test_loss": 1.9072984680175782, + "test_acc": 0.5985, + "lyapunov": null, + "grad_norm": 0.6558349942319918, + "grad_max_sv": 0.2942222774028778, + "grad_min_sv": 1.1174211227583247e-08, + "grad_condition": 686453916.7723808, + "lr": 0.00043733338321784746, + "time_sec": 15.547033786773682 + }, + { + "epoch": 82, + "train_loss": 0.34602870296001437, + "train_acc": 0.88766, + "test_loss": 1.9684966739654541, + "test_acc": 0.5914, + "lyapunov": null, + "grad_norm": 0.6555903608944951, + "grad_max_sv": 0.29228324331343175, + "grad_min_sv": 1.1487677028338903e-08, + "grad_condition": 383534563.2338952, + "lr": 0.0004269584857187939, + "time_sec": 15.51542615890503 + }, + { + "epoch": 83, + "train_loss": 0.3428422933292389, + "train_acc": 0.89108, + "test_loss": 1.9337468532562256, + "test_acc": 0.5993, + "lyapunov": null, + "grad_norm": 0.6492331544938933, + "grad_max_sv": 0.28135959543287753, + "grad_min_sv": 1.1496448484339673e-08, + "grad_condition": 414922787.7095521, + "lr": 0.0004166156266419484, + "time_sec": 15.53177547454834 + }, + { + "epoch": 84, + "train_loss": 0.328343852148056, + "train_acc": 0.89454, + "test_loss": 1.9273885646820068, + "test_acc": 0.6009, + "lyapunov": null, + "grad_norm": 0.6390681347680143, + "grad_max_sv": 0.28590504080057144, + "grad_min_sv": 1.1241013130221244e-08, + "grad_condition": 433920435.0763866, + "lr": 0.0004063093427071373, + "time_sec": 15.530908346176147 + }, + { + "epoch": 85, + "train_loss": 0.3230694122695923, + "train_acc": 0.89496, + "test_loss": 1.9058713027954102, + "test_acc": 0.5998, + "lyapunov": null, + "grad_norm": 0.6383613950635205, + "grad_max_sv": 0.2902642168104649, + "grad_min_sv": 1.141585580797036e-08, + "grad_condition": 604353313.9340062, + "lr": 0.0003960441545911199, + "time_sec": 15.515930414199829 + }, + { + "epoch": 86, + "train_loss": 0.31695827428817747, + "train_acc": 0.8967, + "test_loss": 1.9341052951812745, + "test_acc": 0.5998, + "lyapunov": null, + "grad_norm": 0.6323196704290217, + "grad_max_sv": 0.30049107149243354, + "grad_min_sv": 1.1364172216449253e-08, + "grad_condition": 253780845.1911161, + "lr": 0.0003858245649446718, + "time_sec": 15.52891731262207 + }, + { + "epoch": 87, + "train_loss": 0.310550309715271, + "train_acc": 0.8979, + "test_loss": 1.9645798837661743, + "test_acc": 0.5972, + "lyapunov": null, + "grad_norm": 0.6290293549615046, + "grad_max_sv": 0.28168079666793344, + "grad_min_sv": 1.1139878612566237e-08, + "grad_condition": 3174828807.3372684, + "lr": 0.00037565505641757235, + "time_sec": 15.527303218841553 + }, + { + "epoch": 88, + "train_loss": 0.30801844054222105, + "train_acc": 0.89982, + "test_loss": 1.9113462907791137, + "test_acc": 0.6061, + "lyapunov": null, + "grad_norm": 0.6261342549488306, + "grad_max_sv": 0.2938710656017065, + "grad_min_sv": 1.1276199778260943e-08, + "grad_condition": 166623199.75638226, + "lr": 0.00036554008969236695, + "time_sec": 15.515942573547363 + }, + { + "epoch": 89, + "train_loss": 0.3031072138786316, + "train_acc": 0.90226, + "test_loss": 1.932079137611389, + "test_acc": 0.6084, + "lyapunov": null, + "grad_norm": 0.6209363139222046, + "grad_max_sv": 0.2818705204874277, + "grad_min_sv": 1.0986600190287382e-08, + "grad_condition": 235648712.41506353, + "lr": 0.0003554841015277638, + "time_sec": 15.523046731948853 + }, + { + "epoch": 90, + "train_loss": 0.295468587474823, + "train_acc": 0.90442, + "test_loss": 1.9561836023330688, + "test_acc": 0.6029, + "lyapunov": null, + "grad_norm": 0.6134434549386554, + "grad_max_sv": 0.28373970463871956, + "grad_min_sv": 1.1000367631294056e-08, + "grad_condition": 371761681.0452756, + "lr": 0.000345491502812526, + "time_sec": 15.52297592163086 + }, + { + "epoch": 91, + "train_loss": 0.29119554637908934, + "train_acc": 0.90446, + "test_loss": 1.993441968536377, + "test_acc": 0.6049, + "lyapunov": null, + "grad_norm": 0.6105333020567495, + "grad_max_sv": 0.27541381642222407, + "grad_min_sv": 1.0823096196089371e-08, + "grad_condition": 473734139.3827542, + "lr": 0.0003355666766307081, + "time_sec": 15.514235258102417 + }, + { + "epoch": 92, + "train_loss": 0.28460477176189425, + "train_acc": 0.90876, + "test_loss": 1.9682166564941406, + "test_acc": 0.6057, + "lyapunov": null, + "grad_norm": 0.5988483508766865, + "grad_max_sv": 0.27126791067421435, + "grad_min_sv": 1.0722518893266364e-08, + "grad_condition": 97668951.32032181, + "lr": 0.00032571397633909225, + "time_sec": 15.52116084098816 + }, + { + "epoch": 93, + "train_loss": 0.2825835990524292, + "train_acc": 0.90854, + "test_loss": 1.9348359714508057, + "test_acc": 0.6041, + "lyapunov": null, + "grad_norm": 0.6011972747002627, + "grad_max_sv": 0.2796713523566723, + "grad_min_sv": 1.0827668426964532e-08, + "grad_condition": 881127416.7703698, + "lr": 0.00031593772365766094, + "time_sec": 15.528529644012451 + }, + { + "epoch": 94, + "train_loss": 0.2801620689296722, + "train_acc": 0.9097, + "test_loss": 1.980628232383728, + "test_acc": 0.6055, + "lyapunov": null, + "grad_norm": 0.5993074321032092, + "grad_max_sv": 0.2800555154681206, + "grad_min_sv": 1.0468388221378244e-08, + "grad_condition": 140732695.72303194, + "lr": 0.0003062422067739483, + "time_sec": 15.532250165939331 + }, + { + "epoch": 95, + "train_loss": 0.26648273178100584, + "train_acc": 0.9142, + "test_loss": 2.0015383081436156, + "test_acc": 0.6016, + "lyapunov": null, + "grad_norm": 0.5881453904576209, + "grad_max_sv": 0.27579851634800434, + "grad_min_sv": 1.0274321395227492e-08, + "grad_condition": 201871276.47904783, + "lr": 0.00029663167846209965, + "time_sec": 15.681024551391602 + }, + { + "epoch": 96, + "train_loss": 0.26776352972984313, + "train_acc": 0.91448, + "test_loss": 2.0207461967468263, + "test_acc": 0.6012, + "lyapunov": null, + "grad_norm": 0.5860462649686203, + "grad_max_sv": 0.2698933105915785, + "grad_min_sv": 1.0329826621857664e-08, + "grad_condition": 76135409.2144176, + "lr": 0.00028711035421746345, + "time_sec": 15.536462545394897 + }, + { + "epoch": 97, + "train_loss": 0.25857464953899384, + "train_acc": 0.91696, + "test_loss": 1.9442026258468628, + "test_acc": 0.6066, + "lyapunov": null, + "grad_norm": 0.579918050497587, + "grad_max_sv": 0.28092321269214154, + "grad_min_sv": 1.0451780512853865e-08, + "grad_condition": 432604154.8635365, + "lr": 0.00027768241040753615, + "time_sec": 15.520632982254028 + }, + { + "epoch": 98, + "train_loss": 0.2567158591556549, + "train_acc": 0.91576, + "test_loss": 1.952080411529541, + "test_acc": 0.6097, + "lyapunov": null, + "grad_norm": 0.5815827800021661, + "grad_max_sv": 0.26784452944993975, + "grad_min_sv": 9.97831211164979e-09, + "grad_condition": 91061008.30272922, + "lr": 0.00026835198244006903, + "time_sec": 15.535520553588867 + }, + { + "epoch": 99, + "train_loss": 0.24892670249938964, + "train_acc": 0.9202, + "test_loss": 2.033794689941406, + "test_acc": 0.6019, + "lyapunov": null, + "grad_norm": 0.5696851893969495, + "grad_max_sv": 0.2726339440792799, + "grad_min_sv": 9.946045926049683e-09, + "grad_condition": 1696689541.1727843, + "lr": 0.0002591231629491421, + "time_sec": 15.538635969161987 + }, + { + "epoch": 100, + "train_loss": 0.24926711993694306, + "train_acc": 0.91978, + "test_loss": 1.9742811960220337, + "test_acc": 0.6068, + "lyapunov": null, + "grad_norm": 0.5702583833389835, + "grad_max_sv": 0.26799715869128704, + "grad_min_sv": 9.895174417351438e-09, + "grad_condition": 297572156.6297859, + "lr": 0.0002499999999999997, + "time_sec": 15.536820650100708 + }, + { + "epoch": 101, + "train_loss": 0.2401547999382019, + "train_acc": 0.92344, + "test_loss": 1.99689197101593, + "test_acc": 0.6077, + "lyapunov": null, + "grad_norm": 0.5610283078331603, + "grad_max_sv": 0.2691540464758873, + "grad_min_sv": 9.99432525588921e-09, + "grad_condition": 545457041.2762839, + "lr": 0.00024098649531343477, + "time_sec": 15.541125774383545 + }, + { + "epoch": 102, + "train_loss": 0.2366540629529953, + "train_acc": 0.92332, + "test_loss": 1.9686679859161378, + "test_acc": 0.6043, + "lyapunov": null, + "grad_norm": 0.5596319863447712, + "grad_max_sv": 0.2598999205976725, + "grad_min_sv": 9.748093400801378e-09, + "grad_condition": 280631646.0385326, + "lr": 0.0002320866025105016, + "time_sec": 15.642221689224243 + }, + { + "epoch": 103, + "train_loss": 0.23095350846290588, + "train_acc": 0.92478, + "test_loss": 1.9796740842819214, + "test_acc": 0.6086, + "lyapunov": null, + "grad_norm": 0.5527105531261713, + "grad_max_sv": 0.2648670017719269, + "grad_min_sv": 1.0250657645751934e-08, + "grad_condition": 501602567.1069907, + "lr": 0.0002233042253783278, + "time_sec": 15.533202886581421 + }, + { + "epoch": 104, + "train_loss": 0.23427851341247558, + "train_acc": 0.92466, + "test_loss": 1.9721594404220582, + "test_acc": 0.6107, + "lyapunov": null, + "grad_norm": 0.5589041472139786, + "grad_max_sv": 0.25932734124362466, + "grad_min_sv": 9.605904077877003e-09, + "grad_condition": 1031803946.0677515, + "lr": 0.000214643216157784, + "time_sec": 15.51241683959961 + }, + { + "epoch": 105, + "train_loss": 0.219517624874115, + "train_acc": 0.9293, + "test_loss": 2.0007881326675414, + "test_acc": 0.6035, + "lyapunov": null, + "grad_norm": 0.5422594048752922, + "grad_max_sv": 0.2685978960245848, + "grad_min_sv": 9.883629456617499e-09, + "grad_condition": 224740616.11832863, + "lr": 0.00020610737385376332, + "time_sec": 15.537052392959595 + }, + { + "epoch": 106, + "train_loss": 0.2232757794523239, + "train_acc": 0.92674, + "test_loss": 2.0058324546813964, + "test_acc": 0.6093, + "lyapunov": null, + "grad_norm": 0.5472900635805251, + "grad_max_sv": 0.2613681871443987, + "grad_min_sv": 9.819886173656478e-09, + "grad_condition": 176319742.57465333, + "lr": 0.00019770044256881242, + "time_sec": 15.542799949645996 + }, + { + "epoch": 107, + "train_loss": 0.21997562067031862, + "train_acc": 0.92926, + "test_loss": 1.989624990081787, + "test_acc": 0.6099, + "lyapunov": null, + "grad_norm": 0.5414473725256549, + "grad_max_sv": 0.2557095166295767, + "grad_min_sv": 9.448845216301038e-09, + "grad_condition": 1407753979.8512912, + "lr": 0.0001894261098608447, + "time_sec": 15.52652359008789 + }, + { + "epoch": 108, + "train_loss": 0.2132127531719208, + "train_acc": 0.93122, + "test_loss": 2.043244864463806, + "test_acc": 0.6013, + "lyapunov": null, + "grad_norm": 0.5380471333664735, + "grad_max_sv": 0.255327982082963, + "grad_min_sv": 9.992253989770521e-09, + "grad_condition": 429655462.4469593, + "lr": 0.000181288005125655, + "time_sec": 15.52126145362854 + }, + { + "epoch": 109, + "train_loss": 0.21187591857910157, + "train_acc": 0.93122, + "test_loss": 1.9954864723205565, + "test_acc": 0.6098, + "lyapunov": null, + "grad_norm": 0.5380204381544875, + "grad_max_sv": 0.26441522017121316, + "grad_min_sv": 9.557367238854226e-09, + "grad_condition": 237566723.1979712, + "lr": 0.0001732896980049473, + "time_sec": 15.548521995544434 + }, + { + "epoch": 110, + "train_loss": 0.20928363649368287, + "train_acc": 0.9326, + "test_loss": 1.9480315828323365, + "test_acc": 0.6146, + "lyapunov": null, + "grad_norm": 0.5298971206452113, + "grad_max_sv": 0.26398450396955014, + "grad_min_sv": 9.874217052428108e-09, + "grad_condition": 197519783.8891028, + "lr": 0.00016543469682057076, + "time_sec": 15.51990032196045 + }, + { + "epoch": 111, + "train_loss": 0.20472501375198365, + "train_acc": 0.93442, + "test_loss": 1.9880135498046876, + "test_acc": 0.6114, + "lyapunov": null, + "grad_norm": 0.5226715722616327, + "grad_max_sv": 0.25575212091207505, + "grad_min_sv": 9.559482279462156e-09, + "grad_condition": 213563040.67873913, + "lr": 0.00015772644703565552, + "time_sec": 15.518001079559326 + }, + { + "epoch": 112, + "train_loss": 0.20579987778663636, + "train_acc": 0.93296, + "test_loss": 2.016691120529175, + "test_acc": 0.6117, + "lyapunov": null, + "grad_norm": 0.5297683532569843, + "grad_max_sv": 0.25805489346385, + "grad_min_sv": 9.560597037899625e-09, + "grad_condition": 1064723629.28162, + "lr": 0.00015016832974331713, + "time_sec": 15.522767305374146 + }, + { + "epoch": 113, + "train_loss": 0.20068273310422896, + "train_acc": 0.93668, + "test_loss": 2.0594107456207276, + "test_acc": 0.6086, + "lyapunov": null, + "grad_norm": 0.5184460551642818, + "grad_max_sv": 0.24561816416680812, + "grad_min_sv": 9.581332657826458e-09, + "grad_condition": 364510178.3461688, + "lr": 0.00014276366018359834, + "time_sec": 15.533010005950928 + }, + { + "epoch": 114, + "train_loss": 0.19722092057228088, + "train_acc": 0.93788, + "test_loss": 2.008504161453247, + "test_acc": 0.6083, + "lyapunov": null, + "grad_norm": 0.5143544627139274, + "grad_max_sv": 0.26034388653934004, + "grad_min_sv": 9.650303647423114e-09, + "grad_condition": 3361687889.542286, + "lr": 0.00013551568628929425, + "time_sec": 15.531035661697388 + }, + { + "epoch": 115, + "train_loss": 0.19389657697677612, + "train_acc": 0.93868, + "test_loss": 2.0233098300933836, + "test_acc": 0.6117, + "lyapunov": null, + "grad_norm": 0.5104261903820102, + "grad_max_sv": 0.24447884745895862, + "grad_min_sv": 9.077133606870055e-09, + "grad_condition": 461064774.41410434, + "lr": 0.00012842758726130276, + "time_sec": 15.524327993392944 + }, + { + "epoch": 116, + "train_loss": 0.19362226080417633, + "train_acc": 0.93796, + "test_loss": 2.053111413192749, + "test_acc": 0.6054, + "lyapunov": null, + "grad_norm": 0.5131743880915615, + "grad_max_sv": 0.2492377854883671, + "grad_min_sv": 9.515753446841246e-09, + "grad_condition": 206396866.4016946, + "lr": 0.0001215024721741218, + "time_sec": 15.513204574584961 + }, + { + "epoch": 117, + "train_loss": 0.18898310523986817, + "train_acc": 0.93976, + "test_loss": 2.015893176269531, + "test_acc": 0.6127, + "lyapunov": null, + "grad_norm": 0.5048514988009624, + "grad_max_sv": 0.23975766226649284, + "grad_min_sv": 9.193109389200611e-09, + "grad_condition": 1880002960.4112122, + "lr": 0.00011474337861210538, + "time_sec": 15.531865119934082 + }, + { + "epoch": 118, + "train_loss": 0.18859933629989625, + "train_acc": 0.93992, + "test_loss": 2.0275477882385253, + "test_acc": 0.613, + "lyapunov": null, + "grad_norm": 0.5070579132326548, + "grad_max_sv": 0.2569826778024435, + "grad_min_sv": 9.573198521970264e-09, + "grad_condition": 946919734.9405922, + "lr": 0.00010815327133708009, + "time_sec": 15.528860330581665 + }, + { + "epoch": 119, + "train_loss": 0.18436414319992064, + "train_acc": 0.9409, + "test_loss": 2.035816400527954, + "test_acc": 0.6094, + "lyapunov": null, + "grad_norm": 0.49869022882133546, + "grad_max_sv": 0.24773051403462887, + "grad_min_sv": 9.154285843075704e-09, + "grad_condition": 330957531.4847302, + "lr": 0.00010173504098790182, + "time_sec": 15.546629190444946 + }, + { + "epoch": 120, + "train_loss": 0.18639450643777847, + "train_acc": 0.94082, + "test_loss": 2.0497810037612916, + "test_acc": 0.6101, + "lyapunov": null, + "grad_norm": 0.5054264593475204, + "grad_max_sv": 0.24650247804820538, + "grad_min_sv": 9.350194245597021e-09, + "grad_condition": 546741093.3651453, + "lr": 9.549150281252629e-05, + "time_sec": 15.52673053741455 + }, + { + "epoch": 121, + "train_loss": 0.18135397327423095, + "train_acc": 0.94364, + "test_loss": 2.0228085262298583, + "test_acc": 0.6112, + "lyapunov": null, + "grad_norm": 0.49196950746055856, + "grad_max_sv": 0.25292878448963163, + "grad_min_sv": 9.245442955446368e-09, + "grad_condition": 345415022.7201654, + "lr": 8.942539543314794e-05, + "time_sec": 15.530716180801392 + }, + { + "epoch": 122, + "train_loss": 0.17821871382713317, + "train_acc": 0.94288, + "test_loss": 2.015850890350342, + "test_acc": 0.6127, + "lyapunov": null, + "grad_norm": 0.4943397097989714, + "grad_max_sv": 0.2537323322147131, + "grad_min_sv": 9.237968556525395e-09, + "grad_condition": 263035591.43015513, + "lr": 8.353937964495024e-05, + "time_sec": 15.536164045333862 + }, + { + "epoch": 123, + "train_loss": 0.17632093348026276, + "train_acc": 0.9444, + "test_loss": 2.029286048698425, + "test_acc": 0.6089, + "lyapunov": null, + "grad_norm": 0.48806288568095135, + "grad_max_sv": 0.2458991575986147, + "grad_min_sv": 9.06146269260763e-09, + "grad_condition": 386283353.8532323, + "lr": 7.783603724899243e-05, + "time_sec": 15.518115997314453 + }, + { + "epoch": 124, + "train_loss": 0.1732941804933548, + "train_acc": 0.94456, + "test_loss": 2.099158185958862, + "test_acc": 0.6025, + "lyapunov": null, + "grad_norm": 0.4868912892942884, + "grad_max_sv": 0.24448585212230683, + "grad_min_sv": 8.980524343182167e-09, + "grad_condition": 336891094.31355625, + "lr": 7.231786991974666e-05, + "time_sec": 15.542467832565308 + }, + { + "epoch": 125, + "train_loss": 0.17837541491031647, + "train_acc": 0.94274, + "test_loss": 2.0764820568084716, + "test_acc": 0.61, + "lyapunov": null, + "grad_norm": 0.4948203710715524, + "grad_max_sv": 0.24412455931305885, + "grad_min_sv": 9.184420232503931e-09, + "grad_condition": 716346437.4859622, + "lr": 6.698729810778072e-05, + "time_sec": 15.55189299583435 + }, + { + "epoch": 126, + "train_loss": 0.1735024337530136, + "train_acc": 0.94474, + "test_loss": 2.0553098888397217, + "test_acc": 0.6111, + "lyapunov": null, + "grad_norm": 0.4854349633437902, + "grad_max_sv": 0.2419682189822197, + "grad_min_sv": 8.905077519393705e-09, + "grad_condition": 839365296.5454277, + "lr": 6.184665997806817e-05, + "time_sec": 15.54058313369751 + }, + { + "epoch": 127, + "train_loss": 0.1715146116065979, + "train_acc": 0.94478, + "test_loss": 2.0106375900268554, + "test_acc": 0.6128, + "lyapunov": null, + "grad_norm": 0.4816957588601112, + "grad_max_sv": 0.23674072176218033, + "grad_min_sv": 8.675588131831085e-09, + "grad_condition": 478973714.0473558, + "lr": 5.6898210384392595e-05, + "time_sec": 15.529821157455444 + }, + { + "epoch": 128, + "train_loss": 0.1660640141773224, + "train_acc": 0.9478, + "test_loss": 2.0750678112030028, + "test_acc": 0.6111, + "lyapunov": null, + "grad_norm": 0.4757528664416431, + "grad_max_sv": 0.244390731677413, + "grad_min_sv": 8.79119548703039e-09, + "grad_condition": 457083152.2974655, + "lr": 5.214411988029363e-05, + "time_sec": 15.54984712600708 + }, + { + "epoch": 129, + "train_loss": 0.1666716690993309, + "train_acc": 0.94686, + "test_loss": 2.0469725986480714, + "test_acc": 0.6123, + "lyapunov": null, + "grad_norm": 0.478310500713372, + "grad_max_sv": 0.23569908998906614, + "grad_min_sv": 8.542899999821468e-09, + "grad_condition": 598853903.3316209, + "lr": 4.7586473766990294e-05, + "time_sec": 15.545772552490234 + }, + { + "epoch": 130, + "train_loss": 0.16598962943553924, + "train_acc": 0.94712, + "test_loss": 1.9995166748046875, + "test_acc": 0.6146, + "lyapunov": null, + "grad_norm": 0.4758526221040286, + "grad_max_sv": 0.23986518271267415, + "grad_min_sv": 8.749124542689266e-09, + "grad_condition": 608746268.1362782, + "lr": 4.32272711786996e-05, + "time_sec": 15.54599404335022 + }, + { + "epoch": 131, + "train_loss": 0.16668007793426515, + "train_acc": 0.9479, + "test_loss": 2.0491572677612306, + "test_acc": 0.6109, + "lyapunov": null, + "grad_norm": 0.4755344205180913, + "grad_max_sv": 0.23323244228959084, + "grad_min_sv": 8.472622621633757e-09, + "grad_condition": 233979199.2625857, + "lr": 3.906842420574966e-05, + "time_sec": 15.524599552154541 + }, + { + "epoch": 132, + "train_loss": 0.16224975943565367, + "train_acc": 0.94862, + "test_loss": 2.0500082311630248, + "test_acc": 0.6134, + "lyapunov": null, + "grad_norm": 0.46871867660355254, + "grad_max_sv": 0.2372895274311304, + "grad_min_sv": 8.64411044331978e-09, + "grad_condition": 287263322.167899, + "lr": 3.5111757055874305e-05, + "time_sec": 15.527011156082153 + }, + { + "epoch": 133, + "train_loss": 0.16492341012477874, + "train_acc": 0.94736, + "test_loss": 2.0346584928512574, + "test_acc": 0.6142, + "lyapunov": null, + "grad_norm": 0.47534738241769, + "grad_max_sv": 0.24461643844842912, + "grad_min_sv": 9.178972258834517e-09, + "grad_condition": 500309812.0406585, + "lr": 3.1359005254054254e-05, + "time_sec": 15.547746658325195 + }, + { + "epoch": 134, + "train_loss": 0.16421831488609315, + "train_acc": 0.94756, + "test_loss": 2.0132702159881593, + "test_acc": 0.6162, + "lyapunov": null, + "grad_norm": 0.4772419829809968, + "grad_max_sv": 0.23413821049034594, + "grad_min_sv": 9.002530253383878e-09, + "grad_condition": 363205059.0549506, + "lr": 2.7811814881259484e-05, + "time_sec": 15.531517505645752 + }, + { + "epoch": 135, + "train_loss": 0.16381137976646423, + "train_acc": 0.94842, + "test_loss": 2.0648642013549803, + "test_acc": 0.6083, + "lyapunov": null, + "grad_norm": 0.4736658227067323, + "grad_max_sv": 0.23049395270645617, + "grad_min_sv": 8.56864400186879e-09, + "grad_condition": 1442465508.733611, + "lr": 2.4471741852423218e-05, + "time_sec": 15.541293859481812 + }, + { + "epoch": 136, + "train_loss": 0.16108462400436402, + "train_acc": 0.94976, + "test_loss": 2.0012967403411865, + "test_acc": 0.6119, + "lyapunov": null, + "grad_norm": 0.465643715209168, + "grad_max_sv": 0.23518772274255753, + "grad_min_sv": 8.637825488558292e-09, + "grad_condition": 243388926.8874995, + "lr": 2.1340251233966362e-05, + "time_sec": 15.512713193893433 + }, + { + "epoch": 137, + "train_loss": 0.1584918847179413, + "train_acc": 0.94912, + "test_loss": 2.050839980697632, + "test_acc": 0.6104, + "lyapunov": null, + "grad_norm": 0.46730923038258504, + "grad_max_sv": 0.23510748259723185, + "grad_min_sv": 8.813612497248977e-09, + "grad_condition": 1210234116.5017686, + "lr": 1.8418716601170932e-05, + "time_sec": 15.537960052490234 + }, + { + "epoch": 138, + "train_loss": 0.15678886548519136, + "train_acc": 0.9508, + "test_loss": 2.0579080810546877, + "test_acc": 0.6137, + "lyapunov": null, + "grad_norm": 0.46202513180941285, + "grad_max_sv": 0.22975999489426613, + "grad_min_sv": 8.437959897781514e-09, + "grad_condition": 1365594635.574403, + "lr": 1.570841943568445e-05, + "time_sec": 15.53256607055664 + }, + { + "epoch": 139, + "train_loss": 0.15868934306621552, + "train_acc": 0.95058, + "test_loss": 2.0891008211135866, + "test_acc": 0.607, + "lyapunov": null, + "grad_norm": 0.46370376954923076, + "grad_max_sv": 0.239790453761816, + "grad_min_sv": 8.653809858939418e-09, + "grad_condition": 751331866.6462338, + "lr": 1.3210548563419845e-05, + "time_sec": 15.542593002319336 + }, + { + "epoch": 140, + "train_loss": 0.16018940447807312, + "train_acc": 0.94944, + "test_loss": 2.0365436012268066, + "test_acc": 0.6134, + "lyapunov": null, + "grad_norm": 0.46850944550951273, + "grad_max_sv": 0.24336591213941575, + "grad_min_sv": 8.69392097297767e-09, + "grad_condition": 6372417042.7504635, + "lr": 1.0926199633097203e-05, + "time_sec": 15.530508279800415 + }, + { + "epoch": 141, + "train_loss": 0.1577048332262039, + "train_acc": 0.95192, + "test_loss": 2.048553763961792, + "test_acc": 0.6177, + "lyapunov": null, + "grad_norm": 0.46173934960898333, + "grad_max_sv": 0.2323433578014374, + "grad_min_sv": 8.582540832018093e-09, + "grad_condition": 374128300.47680604, + "lr": 8.856374635655688e-06, + "time_sec": 15.53349781036377 + }, + { + "epoch": 142, + "train_loss": 0.15599479459762572, + "train_acc": 0.95136, + "test_loss": 2.0303194038391115, + "test_acc": 0.6141, + "lyapunov": null, + "grad_norm": 0.46112847461678763, + "grad_max_sv": 0.23407747074961663, + "grad_min_sv": 8.815537186779992e-09, + "grad_condition": 888764932.2294099, + "lr": 7.001981464747503e-06, + "time_sec": 15.521865129470825 + }, + { + "epoch": 143, + "train_loss": 0.1572772634601593, + "train_acc": 0.95076, + "test_loss": 2.015152719116211, + "test_acc": 0.6117, + "lyapunov": null, + "grad_norm": 0.46482832090967446, + "grad_max_sv": 0.23328317552804947, + "grad_min_sv": 8.496040210356943e-09, + "grad_condition": 794958780.6842709, + "lr": 5.3638335185058295e-06, + "time_sec": 15.530633926391602 + }, + { + "epoch": 144, + "train_loss": 0.1607058820438385, + "train_acc": 0.94982, + "test_loss": 2.028663912010193, + "test_acc": 0.6144, + "lyapunov": null, + "grad_norm": 0.46757658167064325, + "grad_max_sv": 0.23105027191340924, + "grad_min_sv": 8.55830176145836e-09, + "grad_condition": 1653881177.8200665, + "lr": 3.942649342761114e-06, + "time_sec": 15.53608751296997 + }, + { + "epoch": 145, + "train_loss": 0.1565204811191559, + "train_acc": 0.95166, + "test_loss": 2.0279767280578613, + "test_acc": 0.6155, + "lyapunov": null, + "grad_norm": 0.4638655873772094, + "grad_max_sv": 0.23327881954610347, + "grad_min_sv": 8.597103550930796e-09, + "grad_condition": 316875488.0827421, + "lr": 2.7390523158633524e-06, + "time_sec": 15.526829719543457 + }, + { + "epoch": 146, + "train_loss": 0.15728166580677033, + "train_acc": 0.95086, + "test_loss": 1.9891761138916015, + "test_acc": 0.6145, + "lyapunov": null, + "grad_norm": 0.46488895344189896, + "grad_max_sv": 0.24002570435404777, + "grad_min_sv": 8.740120454957777e-09, + "grad_condition": 455470499.4939662, + "lr": 1.7535703752478133e-06, + "time_sec": 15.529450178146362 + }, + { + "epoch": 147, + "train_loss": 0.15490476808547973, + "train_acc": 0.95148, + "test_loss": 2.058331818771362, + "test_acc": 0.61, + "lyapunov": null, + "grad_norm": 0.46221701830974254, + "grad_max_sv": 0.2296001013368368, + "grad_min_sv": 8.541372666505225e-09, + "grad_condition": 659563768.7689784, + "lr": 9.866357858642196e-07, + "time_sec": 15.537895441055298 + }, + { + "epoch": 148, + "train_loss": 0.15796600056648255, + "train_acc": 0.94986, + "test_loss": 2.0414266393661498, + "test_acc": 0.6093, + "lyapunov": null, + "grad_norm": 0.46494816666423244, + "grad_max_sv": 0.2453433360904455, + "grad_min_sv": 8.874223652883401e-09, + "grad_condition": 791324939.5663835, + "lr": 4.38584950570808e-07, + "time_sec": 15.552018165588379 + }, + { + "epoch": 149, + "train_loss": 0.1572165874862671, + "train_acc": 0.9503, + "test_loss": 2.0304482383728026, + "test_acc": 0.6163, + "lyapunov": null, + "grad_norm": 0.46454324009038384, + "grad_max_sv": 0.23642796650528908, + "grad_min_sv": 8.51550397435591e-09, + "grad_condition": 463955776.24121666, + "lr": 1.096582625772501e-07, + "time_sec": 15.526931762695312 + }, + { + "epoch": 150, + "train_loss": 0.15873465202331544, + "train_acc": 0.94998, + "test_loss": 2.0263592735290525, + "test_acc": 0.6123, + "lyapunov": null, + "grad_norm": 0.46823921364683874, + "grad_max_sv": 0.24224489107728003, + "grad_min_sv": 8.409305788867338e-09, + "grad_condition": 491457160.41681844, + "lr": 0.0, + "time_sec": 15.518765687942505 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 4.593809753570556, + "train_acc": 0.06056, + "test_loss": 4.250240661239624, + "test_acc": 0.0724, + "lyapunov": null, + "grad_norm": 6.28680857536701, + "grad_max_sv": 5.32494820356369, + "grad_min_sv": 1.0926536573307998e-07, + "grad_condition": 75430538.96608621, + "lr": 0.0009998903417374227, + "time_sec": 32.64524722099304 + }, + { + "epoch": 2, + "train_loss": 3.8781360272216796, + "train_acc": 0.12202, + "test_loss": 3.828091265106201, + "test_acc": 0.1187, + "lyapunov": null, + "grad_norm": 4.685766976401904, + "grad_max_sv": 3.971551901102066, + "grad_min_sv": 8.512232171353773e-08, + "grad_condition": 73925683.02884856, + "lr": 0.0009995614150494292, + "time_sec": 32.55369710922241 + }, + { + "epoch": 3, + "train_loss": 3.5183256304931643, + "train_acc": 0.16986, + "test_loss": 3.603372495651245, + "test_acc": 0.1458, + "lyapunov": null, + "grad_norm": 3.857816495796443, + "grad_max_sv": 3.131850999593735, + "grad_min_sv": 7.069926738628718e-08, + "grad_condition": 597358447.7631978, + "lr": 0.0009990133642141358, + "time_sec": 32.61470580101013 + }, + { + "epoch": 4, + "train_loss": 3.2580047064208983, + "train_acc": 0.21016, + "test_loss": 3.3982357917785646, + "test_acc": 0.1898, + "lyapunov": null, + "grad_norm": 3.25322967284326, + "grad_max_sv": 2.4588119089603424, + "grad_min_sv": 6.045808895738247e-08, + "grad_condition": 47197928.09495263, + "lr": 0.0009982464296247522, + "time_sec": 32.569292306900024 + }, + { + "epoch": 5, + "train_loss": 3.0406500122070312, + "train_acc": 0.24896, + "test_loss": 3.1738818031311036, + "test_acc": 0.2326, + "lyapunov": null, + "grad_norm": 2.772030407825626, + "grad_max_sv": 1.9638817846775054, + "grad_min_sv": 5.119714804324715e-08, + "grad_condition": 73515114.69409783, + "lr": 0.0009972609476841367, + "time_sec": 32.59326457977295 + }, + { + "epoch": 6, + "train_loss": 2.8603873377227784, + "train_acc": 0.28122, + "test_loss": 3.040658945083618, + "test_acc": 0.2441, + "lyapunov": null, + "grad_norm": 2.406511937670546, + "grad_max_sv": 1.6028138607740403, + "grad_min_sv": 4.437380299870952e-08, + "grad_condition": 42435152.16608156, + "lr": 0.000996057350657239, + "time_sec": 32.59000778198242 + }, + { + "epoch": 7, + "train_loss": 2.696464497909546, + "train_acc": 0.3124, + "test_loss": 2.7883455558776857, + "test_acc": 0.3055, + "lyapunov": null, + "grad_norm": 2.1276389781637293, + "grad_max_sv": 1.321936309337616, + "grad_min_sv": 3.9740869406390546e-08, + "grad_condition": 38077617.12004892, + "lr": 0.000994636166481494, + "time_sec": 32.58612537384033 + }, + { + "epoch": 8, + "train_loss": 2.5476934342956543, + "train_acc": 0.34226, + "test_loss": 2.7284567352294924, + "test_acc": 0.3201, + "lyapunov": null, + "grad_norm": 1.9443800586445228, + "grad_max_sv": 1.1562949120998383, + "grad_min_sv": 3.6514397544484825e-08, + "grad_condition": 50793777.88100208, + "lr": 0.0009929980185352525, + "time_sec": 32.609519958496094 + }, + { + "epoch": 9, + "train_loss": 2.420484928741455, + "train_acc": 0.37, + "test_loss": 2.5651690574645998, + "test_acc": 0.3474, + "lyapunov": null, + "grad_norm": 1.7908327823271384, + "grad_max_sv": 0.9936118766665458, + "grad_min_sv": 3.386289501583484e-08, + "grad_condition": 38337683.052389994, + "lr": 0.0009911436253643444, + "time_sec": 32.608171224594116 + }, + { + "epoch": 10, + "train_loss": 2.3262426779937746, + "train_acc": 0.38734, + "test_loss": 2.4693000373840333, + "test_acc": 0.3722, + "lyapunov": null, + "grad_norm": 1.6585340858173223, + "grad_max_sv": 0.8407874166965484, + "grad_min_sv": 3.068910873760267e-08, + "grad_condition": 34328942.84679211, + "lr": 0.0009890738003669028, + "time_sec": 32.64034914970398 + }, + { + "epoch": 11, + "train_loss": 2.2108732919311525, + "train_acc": 0.41382, + "test_loss": 2.465538624572754, + "test_acc": 0.3705, + "lyapunov": null, + "grad_norm": 1.5729603360376456, + "grad_max_sv": 0.778350618481636, + "grad_min_sv": 2.959336372621024e-08, + "grad_condition": 73499461.7080038, + "lr": 0.00098678945143658, + "time_sec": 32.57490301132202 + }, + { + "epoch": 12, + "train_loss": 2.1315050006103515, + "train_acc": 0.4307, + "test_loss": 2.3204302642822268, + "test_acc": 0.3954, + "lyapunov": null, + "grad_norm": 1.5011321305083667, + "grad_max_sv": 0.699262747168541, + "grad_min_sv": 2.8460571517563427e-08, + "grad_condition": 48774252.99057761, + "lr": 0.0009842915805643154, + "time_sec": 32.6048150062561 + }, + { + "epoch": 13, + "train_loss": 2.0442165532684324, + "train_acc": 0.44988, + "test_loss": 2.376241368865967, + "test_acc": 0.3938, + "lyapunov": null, + "grad_norm": 1.4288710226212364, + "grad_max_sv": 0.651852785050869, + "grad_min_sv": 2.6736829209427978e-08, + "grad_condition": 911183246.0701777, + "lr": 0.000981581283398829, + "time_sec": 32.5588493347168 + }, + { + "epoch": 14, + "train_loss": 1.9779467534637452, + "train_acc": 0.46564, + "test_loss": 2.3095103010177613, + "test_acc": 0.3997, + "lyapunov": null, + "grad_norm": 1.3745196502469326, + "grad_max_sv": 0.6157992795109749, + "grad_min_sv": 2.619163226788568e-08, + "grad_condition": 133496832.32967322, + "lr": 0.0009786597487660333, + "time_sec": 32.544082164764404 + }, + { + "epoch": 15, + "train_loss": 1.9085535586547853, + "train_acc": 0.48116, + "test_loss": 2.277028215789795, + "test_acc": 0.4192, + "lyapunov": null, + "grad_norm": 1.3371637415095632, + "grad_max_sv": 0.6050588846206665, + "grad_min_sv": 2.4948501375562925e-08, + "grad_condition": 111100134.80615222, + "lr": 0.0009755282581475766, + "time_sec": 32.55138826370239 + }, + { + "epoch": 16, + "train_loss": 1.8528347210693359, + "train_acc": 0.49492, + "test_loss": 2.1695428279876707, + "test_acc": 0.4331, + "lyapunov": null, + "grad_norm": 1.2814778531944382, + "grad_max_sv": 0.5591228373348713, + "grad_min_sv": 2.4496722306199815e-08, + "grad_condition": 25867184.37629143, + "lr": 0.0009721881851187403, + "time_sec": 32.59131908416748 + }, + { + "epoch": 17, + "train_loss": 1.7864885725402833, + "train_acc": 0.5083, + "test_loss": 2.2167986530303954, + "test_acc": 0.428, + "lyapunov": null, + "grad_norm": 1.2365928586283268, + "grad_max_sv": 0.5188852399587631, + "grad_min_sv": 2.3400686853525254e-08, + "grad_condition": 39202676.90349869, + "lr": 0.0009686409947459456, + "time_sec": 32.55093550682068 + }, + { + "epoch": 18, + "train_loss": 1.7305231869888307, + "train_acc": 0.52088, + "test_loss": 2.1779684148788454, + "test_acc": 0.4405, + "lyapunov": null, + "grad_norm": 1.2047689336699439, + "grad_max_sv": 0.5065509222447873, + "grad_min_sv": 2.279239488256479e-08, + "grad_condition": 28341315.825680755, + "lr": 0.0009648882429441254, + "time_sec": 32.556524991989136 + }, + { + "epoch": 19, + "train_loss": 1.6774425074768067, + "train_acc": 0.53444, + "test_loss": 2.22588055267334, + "test_acc": 0.4357, + "lyapunov": null, + "grad_norm": 1.1702937955790653, + "grad_max_sv": 0.4866269282996655, + "grad_min_sv": 2.1823409551702255e-08, + "grad_condition": 34695081.35711311, + "lr": 0.00096093157579425, + "time_sec": 32.57441163063049 + }, + { + "epoch": 20, + "train_loss": 1.6186258012771606, + "train_acc": 0.54752, + "test_loss": 2.1861088802337645, + "test_acc": 0.4422, + "lyapunov": null, + "grad_norm": 1.1434442793867807, + "grad_max_sv": 0.4658520080149174, + "grad_min_sv": 2.124641216849632e-08, + "grad_condition": 35023634.55777504, + "lr": 0.0009567727288213001, + "time_sec": 32.563255071640015 + }, + { + "epoch": 21, + "train_loss": 1.5804412273406983, + "train_acc": 0.5552, + "test_loss": 2.116827065849304, + "test_acc": 0.4608, + "lyapunov": null, + "grad_norm": 1.1174809929853884, + "grad_max_sv": 0.4587864212691784, + "grad_min_sv": 2.115127252788618e-08, + "grad_condition": 25409623.926622026, + "lr": 0.0009524135262330095, + "time_sec": 32.548664808273315 + }, + { + "epoch": 22, + "train_loss": 1.5373576833343505, + "train_acc": 0.56826, + "test_loss": 2.188752991104126, + "test_acc": 0.4488, + "lyapunov": null, + "grad_norm": 1.0855473101193578, + "grad_max_sv": 0.43056059926748275, + "grad_min_sv": 2.025934667526652e-08, + "grad_condition": 28615900.007624805, + "lr": 0.0009478558801197061, + "time_sec": 32.611814737319946 + }, + { + "epoch": 23, + "train_loss": 1.506667826461792, + "train_acc": 0.57494, + "test_loss": 2.174818174743652, + "test_acc": 0.4577, + "lyapunov": null, + "grad_norm": 1.0696030802642686, + "grad_max_sv": 0.43318344950675963, + "grad_min_sv": 2.0166759195916484e-08, + "grad_condition": 43974441.149682686, + "lr": 0.000943101789615607, + "time_sec": 32.57555532455444 + }, + { + "epoch": 24, + "train_loss": 1.47097098236084, + "train_acc": 0.5857, + "test_loss": 2.0404002576828004, + "test_acc": 0.4847, + "lyapunov": null, + "grad_norm": 1.0479522200281932, + "grad_max_sv": 0.4198159731924534, + "grad_min_sv": 1.9698220292407863e-08, + "grad_condition": 45870756.831042506, + "lr": 0.0009381533400219313, + "time_sec": 32.5772430896759 + }, + { + "epoch": 25, + "train_loss": 1.4312325327301025, + "train_acc": 0.59378, + "test_loss": 2.106845015716553, + "test_acc": 0.4767, + "lyapunov": null, + "grad_norm": 1.0240308878342053, + "grad_max_sv": 0.41350489780306815, + "grad_min_sv": 1.9328133177981543e-08, + "grad_condition": 69115062.26987141, + "lr": 0.0009330127018922189, + "time_sec": 32.557268142700195 + }, + { + "epoch": 26, + "train_loss": 1.3932979926300049, + "train_acc": 0.60466, + "test_loss": 2.0442503452301026, + "test_acc": 0.4874, + "lyapunov": null, + "grad_norm": 1.0080444681764495, + "grad_max_sv": 0.39995783641934396, + "grad_min_sv": 1.8682676014569743e-08, + "grad_condition": 33480939.457173, + "lr": 0.000927682130080253, + "time_sec": 32.54329538345337 + }, + { + "epoch": 27, + "train_loss": 1.3626447483444213, + "train_acc": 0.61088, + "test_loss": 2.1529213762283326, + "test_acc": 0.4772, + "lyapunov": null, + "grad_norm": 0.9916083960305544, + "grad_max_sv": 0.38913136497139933, + "grad_min_sv": 1.803411719611403e-08, + "grad_condition": 125553964.7328368, + "lr": 0.0009221639627510072, + "time_sec": 32.55648422241211 + }, + { + "epoch": 28, + "train_loss": 1.332198992652893, + "train_acc": 0.6166, + "test_loss": 2.2807082765579225, + "test_acc": 0.4558, + "lyapunov": null, + "grad_norm": 0.9771496174881384, + "grad_max_sv": 0.39622113704681394, + "grad_min_sv": 1.8371455795529455e-08, + "grad_condition": 25402444.150790665, + "lr": 0.0009164606203550494, + "time_sec": 32.56743788719177 + }, + { + "epoch": 29, + "train_loss": 1.3056928281402589, + "train_acc": 0.62548, + "test_loss": 2.3650270275115965, + "test_acc": 0.4494, + "lyapunov": null, + "grad_norm": 0.9678089971160496, + "grad_max_sv": 0.3883704259991646, + "grad_min_sv": 1.808786349449809e-08, + "grad_condition": 34866235.35928585, + "lr": 0.0009105746045668516, + "time_sec": 32.53697896003723 + }, + { + "epoch": 30, + "train_loss": 1.2669909148025513, + "train_acc": 0.63598, + "test_loss": 2.194760869216919, + "test_acc": 0.4794, + "lyapunov": null, + "grad_norm": 0.9467141888064133, + "grad_max_sv": 0.3744235411286354, + "grad_min_sv": 1.7651215561236e-08, + "grad_condition": 139376880.96042347, + "lr": 0.0009045084971874733, + "time_sec": 32.55838894844055 + }, + { + "epoch": 31, + "train_loss": 1.2365936059951783, + "train_acc": 0.64152, + "test_loss": 2.251469213104248, + "test_acc": 0.4728, + "lyapunov": null, + "grad_norm": 0.9363746920375892, + "grad_max_sv": 0.3752880610525608, + "grad_min_sv": 1.7496447651810243e-08, + "grad_condition": 33435292.843927078, + "lr": 0.0008982649590120977, + "time_sec": 32.56987476348877 + }, + { + "epoch": 32, + "train_loss": 1.2132414292144775, + "train_acc": 0.6457, + "test_loss": 2.155212931251526, + "test_acc": 0.4953, + "lyapunov": null, + "grad_norm": 0.9198517753600641, + "grad_max_sv": 0.3622582726180553, + "grad_min_sv": 1.7169938390428767e-08, + "grad_condition": 301357597.1554047, + "lr": 0.0008918467286629196, + "time_sec": 32.644938468933105 + }, + { + "epoch": 33, + "train_loss": 1.184193948135376, + "train_acc": 0.654, + "test_loss": 2.2338722274780274, + "test_acc": 0.4833, + "lyapunov": null, + "grad_norm": 0.9078833042188178, + "grad_max_sv": 0.3615180656313896, + "grad_min_sv": 1.6779444181325154e-08, + "grad_condition": 31157779.01941774, + "lr": 0.0008852566213878943, + "time_sec": 32.592013359069824 + }, + { + "epoch": 34, + "train_loss": 1.1604648839569092, + "train_acc": 0.6605, + "test_loss": 2.144485057640076, + "test_acc": 0.4963, + "lyapunov": null, + "grad_norm": 0.8972811549201535, + "grad_max_sv": 0.34557069540023805, + "grad_min_sv": 1.606287251786076e-08, + "grad_condition": 75723670.78622702, + "lr": 0.000878497527825878, + "time_sec": 32.58034062385559 + }, + { + "epoch": 35, + "train_loss": 1.1375362993240357, + "train_acc": 0.66418, + "test_loss": 2.181222864341736, + "test_acc": 0.4898, + "lyapunov": null, + "grad_norm": 0.8889790406396809, + "grad_max_sv": 0.35035020038485526, + "grad_min_sv": 1.6642615324746756e-08, + "grad_condition": 30786547.22695731, + "lr": 0.000871572412738697, + "time_sec": 32.54904317855835 + }, + { + "epoch": 36, + "train_loss": 1.1133264205932618, + "train_acc": 0.67238, + "test_loss": 2.1131927043914795, + "test_acc": 0.5058, + "lyapunov": null, + "grad_norm": 0.8832491549304202, + "grad_max_sv": 0.34634757712483405, + "grad_min_sv": 1.6018088946911922e-08, + "grad_condition": 49284260.37621014, + "lr": 0.0008644843137107055, + "time_sec": 32.58738970756531 + }, + { + "epoch": 37, + "train_loss": 1.0785640783309935, + "train_acc": 0.67878, + "test_loss": 2.2109802129745484, + "test_acc": 0.4946, + "lyapunov": null, + "grad_norm": 0.8741999013148335, + "grad_max_sv": 0.3421505123376846, + "grad_min_sv": 1.5883508850886296e-08, + "grad_condition": 147125609.85023776, + "lr": 0.0008572363398164014, + "time_sec": 32.6028311252594 + }, + { + "epoch": 38, + "train_loss": 1.0444296839141847, + "train_acc": 0.68996, + "test_loss": 2.2259356287002565, + "test_acc": 0.4923, + "lyapunov": null, + "grad_norm": 0.8523318198837474, + "grad_max_sv": 0.33938159644603727, + "grad_min_sv": 1.5807346684382218e-08, + "grad_condition": 34226370.63225422, + "lr": 0.0008498316702566826, + "time_sec": 32.560999393463135 + }, + { + "epoch": 39, + "train_loss": 1.023456362953186, + "train_acc": 0.69698, + "test_loss": 2.1364882369995115, + "test_acc": 0.5049, + "lyapunov": null, + "grad_norm": 0.8498222777562341, + "grad_max_sv": 0.3415807694196701, + "grad_min_sv": 1.5869645431099144e-08, + "grad_condition": 27853151.39901676, + "lr": 0.0008422735529643442, + "time_sec": 32.56105279922485 + }, + { + "epoch": 40, + "train_loss": 1.0050300610351564, + "train_acc": 0.7014, + "test_loss": 2.150569340324402, + "test_acc": 0.5071, + "lyapunov": null, + "grad_norm": 0.8356269441634138, + "grad_max_sv": 0.3239683095365763, + "grad_min_sv": 1.5381535548204818e-08, + "grad_condition": 155224453.46718103, + "lr": 0.0008345653031794289, + "time_sec": 32.59518837928772 + }, + { + "epoch": 41, + "train_loss": 0.9930689501571656, + "train_acc": 0.7026, + "test_loss": 2.154064438056946, + "test_acc": 0.5136, + "lyapunov": null, + "grad_norm": 0.8262418740899825, + "grad_max_sv": 0.3324408046901226, + "grad_min_sv": 1.5276669600161607e-08, + "grad_condition": 51863928.79048334, + "lr": 0.0008267103019950526, + "time_sec": 32.57974171638489 + }, + { + "epoch": 42, + "train_loss": 0.957993507232666, + "train_acc": 0.7135, + "test_loss": 2.1310552421569824, + "test_acc": 0.5193, + "lyapunov": null, + "grad_norm": 0.8217377307572092, + "grad_max_sv": 0.31569988913834096, + "grad_min_sv": 1.4821617464605419e-08, + "grad_condition": 57225046.557756186, + "lr": 0.0008187119948743447, + "time_sec": 32.74825191497803 + }, + { + "epoch": 43, + "train_loss": 0.9496447095489502, + "train_acc": 0.71474, + "test_loss": 2.1654404600143433, + "test_acc": 0.5088, + "lyapunov": null, + "grad_norm": 0.8130839223264894, + "grad_max_sv": 0.32253594174981115, + "grad_min_sv": 1.506773582987675e-08, + "grad_condition": 93723846.88549985, + "lr": 0.000810573890139155, + "time_sec": 32.602092027664185 + }, + { + "epoch": 44, + "train_loss": 0.9342586210250855, + "train_acc": 0.71974, + "test_loss": 2.290501368904114, + "test_acc": 0.5013, + "lyapunov": null, + "grad_norm": 0.8096736459411619, + "grad_max_sv": 0.32218324691057204, + "grad_min_sv": 1.5053544679538565e-08, + "grad_condition": 44430049.08800385, + "lr": 0.0008022995574311873, + "time_sec": 32.594489097595215 + }, + { + "epoch": 45, + "train_loss": 0.9010325805664062, + "train_acc": 0.72686, + "test_loss": 2.4134263542175294, + "test_acc": 0.4913, + "lyapunov": null, + "grad_norm": 0.799116269115145, + "grad_max_sv": 0.31640069633722306, + "grad_min_sv": 1.5047001319934415e-08, + "grad_condition": 50608547.42886399, + "lr": 0.0007938926261462363, + "time_sec": 32.557663917541504 + }, + { + "epoch": 46, + "train_loss": 0.8911659923553467, + "train_acc": 0.73008, + "test_loss": 2.2884033529281615, + "test_acc": 0.5057, + "lyapunov": null, + "grad_norm": 0.7934582132141624, + "grad_max_sv": 0.31383398175239563, + "grad_min_sv": 1.4469329700584135e-08, + "grad_condition": 467744144.1725038, + "lr": 0.0007853567838422158, + "time_sec": 32.56327676773071 + }, + { + "epoch": 47, + "train_loss": 0.8638532521438599, + "train_acc": 0.73696, + "test_loss": 2.2446172203063965, + "test_acc": 0.5076, + "lyapunov": null, + "grad_norm": 0.7837979602809746, + "grad_max_sv": 0.31239640712738037, + "grad_min_sv": 1.4274264739655428e-08, + "grad_condition": 50193793.36053495, + "lr": 0.0007766957746216719, + "time_sec": 32.57334923744202 + }, + { + "epoch": 48, + "train_loss": 0.8375042049598694, + "train_acc": 0.74282, + "test_loss": 2.227299571418762, + "test_acc": 0.5202, + "lyapunov": null, + "grad_norm": 0.77427016194081, + "grad_max_sv": 0.31100503690540793, + "grad_min_sv": 1.4236399661915477e-08, + "grad_condition": 50469567.486968085, + "lr": 0.0007679133974894982, + "time_sec": 32.569188356399536 + }, + { + "epoch": 49, + "train_loss": 0.8221629112625122, + "train_acc": 0.74886, + "test_loss": 2.3033808235168456, + "test_acc": 0.5082, + "lyapunov": null, + "grad_norm": 0.7673158740604195, + "grad_max_sv": 0.2993927221745253, + "grad_min_sv": 1.3854600900906066e-08, + "grad_condition": 304920112.4622501, + "lr": 0.000759013504686565, + "time_sec": 32.584622621536255 + }, + { + "epoch": 50, + "train_loss": 0.8111858353424072, + "train_acc": 0.75248, + "test_loss": 2.386407151031494, + "test_acc": 0.5007, + "lyapunov": null, + "grad_norm": 0.7677657118676934, + "grad_max_sv": 0.3098601832985878, + "grad_min_sv": 1.3993020677935397e-08, + "grad_condition": 150857500.73279318, + "lr": 0.0007499999999999998, + "time_sec": 32.59726119041443 + }, + { + "epoch": 51, + "train_loss": 0.8006631660461426, + "train_acc": 0.7542, + "test_loss": 2.322489023399353, + "test_acc": 0.5061, + "lyapunov": null, + "grad_norm": 0.7571398534411352, + "grad_max_sv": 0.3029158480465412, + "grad_min_sv": 1.366701978661438e-08, + "grad_condition": 1198508278.0301957, + "lr": 0.0007408768370508575, + "time_sec": 32.566423654556274 + }, + { + "epoch": 52, + "train_loss": 0.7743014498138427, + "train_acc": 0.7611, + "test_loss": 2.446239744186401, + "test_acc": 0.5001, + "lyapunov": null, + "grad_norm": 0.7494625172701129, + "grad_max_sv": 0.30184583105146884, + "grad_min_sv": 1.3538439711142935e-08, + "grad_condition": 454382825.5364168, + "lr": 0.0007316480175599307, + "time_sec": 32.606823205947876 + }, + { + "epoch": 53, + "train_loss": 0.7602159348106384, + "train_acc": 0.76546, + "test_loss": 2.3079547737121584, + "test_acc": 0.5179, + "lyapunov": null, + "grad_norm": 0.743347450494438, + "grad_max_sv": 0.3061353128403425, + "grad_min_sv": 1.348931551216348e-08, + "grad_condition": 80924083.81225905, + "lr": 0.0007223175895924635, + "time_sec": 32.580427408218384 + }, + { + "epoch": 54, + "train_loss": 0.7339858147239685, + "train_acc": 0.77348, + "test_loss": 2.388110917472839, + "test_acc": 0.5122, + "lyapunov": null, + "grad_norm": 0.7398005246039192, + "grad_max_sv": 0.2995276223868132, + "grad_min_sv": 1.3313009213089532e-08, + "grad_condition": 46213404.23441851, + "lr": 0.0007128896457825361, + "time_sec": 32.57850360870361 + }, + { + "epoch": 55, + "train_loss": 0.7361176003837585, + "train_acc": 0.77096, + "test_loss": 2.3849290475845337, + "test_acc": 0.5096, + "lyapunov": null, + "grad_norm": 0.7355302680365016, + "grad_max_sv": 0.2989551298320293, + "grad_min_sv": 1.3770161400267037e-08, + "grad_condition": 1196071659.3025665, + "lr": 0.0007033683215378998, + "time_sec": 32.57127046585083 + }, + { + "epoch": 56, + "train_loss": 0.7056646187782287, + "train_acc": 0.78266, + "test_loss": 2.5353955261230467, + "test_acc": 0.5094, + "lyapunov": null, + "grad_norm": 0.7263545559812212, + "grad_max_sv": 0.29214551076292994, + "grad_min_sv": 1.2961420287754821e-08, + "grad_condition": 55296196.635770574, + "lr": 0.0006937577932260512, + "time_sec": 32.6073100566864 + }, + { + "epoch": 57, + "train_loss": 0.6901627484321594, + "train_acc": 0.78498, + "test_loss": 2.424652412033081, + "test_acc": 0.515, + "lyapunov": null, + "grad_norm": 0.7255525918000217, + "grad_max_sv": 0.2947526901960373, + "grad_min_sv": 1.3273521161719094e-08, + "grad_condition": 81805484.33683524, + "lr": 0.0006840622763423388, + "time_sec": 32.587172746658325 + }, + { + "epoch": 58, + "train_loss": 0.6748793490219116, + "train_acc": 0.79032, + "test_loss": 2.4186749195098876, + "test_acc": 0.5152, + "lyapunov": null, + "grad_norm": 0.7152761560999475, + "grad_max_sv": 0.2920954205095768, + "grad_min_sv": 1.3006854693124736e-08, + "grad_condition": 92386117.68065517, + "lr": 0.0006742860236609073, + "time_sec": 32.59625577926636 + }, + { + "epoch": 59, + "train_loss": 0.6585909474945069, + "train_acc": 0.79492, + "test_loss": 2.423396731376648, + "test_acc": 0.5147, + "lyapunov": null, + "grad_norm": 0.7000734196662035, + "grad_max_sv": 0.27961262725293634, + "grad_min_sv": 1.2433090768732002e-08, + "grad_condition": 44055598.930747576, + "lr": 0.0006644333233692913, + "time_sec": 32.56940460205078 + }, + { + "epoch": 60, + "train_loss": 0.6509319092178345, + "train_acc": 0.7971, + "test_loss": 2.4439749031066893, + "test_acc": 0.5172, + "lyapunov": null, + "grad_norm": 0.7014808778975755, + "grad_max_sv": 0.279667991027236, + "grad_min_sv": 1.213204634045728e-08, + "grad_condition": 71422713.53211066, + "lr": 0.0006545084971874734, + "time_sec": 32.592474699020386 + }, + { + "epoch": 61, + "train_loss": 0.6274669117927552, + "train_acc": 0.80326, + "test_loss": 2.6459867664337158, + "test_acc": 0.4988, + "lyapunov": null, + "grad_norm": 0.6875040317915668, + "grad_max_sv": 0.2785758938640356, + "grad_min_sv": 1.2619559043233753e-08, + "grad_condition": 171857029.8323717, + "lr": 0.0006445158984722354, + "time_sec": 32.630576610565186 + }, + { + "epoch": 62, + "train_loss": 0.6170748471164703, + "train_acc": 0.80476, + "test_loss": 2.5383020797729494, + "test_acc": 0.507, + "lyapunov": null, + "grad_norm": 0.6898214493116677, + "grad_max_sv": 0.27117876932024954, + "grad_min_sv": 1.216634772142032e-08, + "grad_condition": 368391230.9870256, + "lr": 0.0006344599103076324, + "time_sec": 32.61634922027588 + }, + { + "epoch": 63, + "train_loss": 0.6143111569595336, + "train_acc": 0.80454, + "test_loss": 2.4434647581100464, + "test_acc": 0.5183, + "lyapunov": null, + "grad_norm": 0.6875312632959335, + "grad_max_sv": 0.28126552477478983, + "grad_min_sv": 1.246990521854962e-08, + "grad_condition": 798988222.1191355, + "lr": 0.0006243449435824269, + "time_sec": 32.61603879928589 + }, + { + "epoch": 64, + "train_loss": 0.593730930519104, + "train_acc": 0.81294, + "test_loss": 2.4702172830581666, + "test_acc": 0.5204, + "lyapunov": null, + "grad_norm": 0.6805278132405531, + "grad_max_sv": 0.27184186428785323, + "grad_min_sv": 1.2160773926804362e-08, + "grad_condition": 897317916.9202541, + "lr": 0.0006141754350553275, + "time_sec": 32.62076783180237 + }, + { + "epoch": 65, + "train_loss": 0.5915982696533203, + "train_acc": 0.81346, + "test_loss": 2.5983056301116942, + "test_acc": 0.5091, + "lyapunov": null, + "grad_norm": 0.6786733542651691, + "grad_max_sv": 0.2730319045484066, + "grad_min_sv": 1.195807074368116e-08, + "grad_condition": 100225768.74912949, + "lr": 0.0006039558454088793, + "time_sec": 32.57223296165466 + }, + { + "epoch": 66, + "train_loss": 0.5778841704368591, + "train_acc": 0.8164, + "test_loss": 2.5375493215560914, + "test_acc": 0.5166, + "lyapunov": null, + "grad_norm": 0.6661254148265577, + "grad_max_sv": 0.27218331433832643, + "grad_min_sv": 1.21305288360192e-08, + "grad_condition": 409516154.47474587, + "lr": 0.000593690657292862, + "time_sec": 32.60103678703308 + }, + { + "epoch": 67, + "train_loss": 0.5534152274894715, + "train_acc": 0.82388, + "test_loss": 2.525739343261719, + "test_acc": 0.5172, + "lyapunov": null, + "grad_norm": 0.66286867140097, + "grad_max_sv": 0.27192877791821957, + "grad_min_sv": 1.1918128833138253e-08, + "grad_condition": 43219144.55143875, + "lr": 0.0005833843733580507, + "time_sec": 32.570470571517944 + }, + { + "epoch": 68, + "train_loss": 0.5373673023986817, + "train_acc": 0.82976, + "test_loss": 2.5977006465911865, + "test_acc": 0.517, + "lyapunov": null, + "grad_norm": 0.6509079409235867, + "grad_max_sv": 0.26122898012399676, + "grad_min_sv": 1.1391138144897784e-08, + "grad_condition": 68515123.47894785, + "lr": 0.0005730415142812054, + "time_sec": 32.60091519355774 + }, + { + "epoch": 69, + "train_loss": 0.5234087624740601, + "train_acc": 0.83328, + "test_loss": 2.5398946479797364, + "test_acc": 0.5195, + "lyapunov": null, + "grad_norm": 0.6514320709102108, + "grad_max_sv": 0.2681581676006317, + "grad_min_sv": 1.1655683266427116e-08, + "grad_condition": 706218189.6988381, + "lr": 0.0005626666167821517, + "time_sec": 32.60088515281677 + }, + { + "epoch": 70, + "train_loss": 0.5105544789123535, + "train_acc": 0.83858, + "test_loss": 2.6386670696258543, + "test_acc": 0.5124, + "lyapunov": null, + "grad_norm": 0.6433463540817135, + "grad_max_sv": 0.2647452913224697, + "grad_min_sv": 1.1366260942169416e-08, + "grad_condition": 65156065.92607037, + "lr": 0.0005522642316338265, + "time_sec": 32.64759874343872 + }, + { + "epoch": 71, + "train_loss": 0.5010787317276001, + "train_acc": 0.83912, + "test_loss": 2.6461667497634886, + "test_acc": 0.5113, + "lyapunov": null, + "grad_norm": 0.6437656983932116, + "grad_max_sv": 0.27069182582199575, + "grad_min_sv": 1.1655098845937683e-08, + "grad_condition": 152350561.59014112, + "lr": 0.0005418389216661573, + "time_sec": 32.59350061416626 + }, + { + "epoch": 72, + "train_loss": 0.48393970026969907, + "train_acc": 0.84504, + "test_loss": 2.714662640762329, + "test_acc": 0.5138, + "lyapunov": null, + "grad_norm": 0.6380630437719501, + "grad_max_sv": 0.2641098305583, + "grad_min_sv": 1.1268197760809507e-08, + "grad_condition": 120257137.75772035, + "lr": 0.0005313952597646563, + "time_sec": 32.596872329711914 + }, + { + "epoch": 73, + "train_loss": 0.48754292858123777, + "train_acc": 0.84344, + "test_loss": 2.7237933948516844, + "test_acc": 0.5121, + "lyapunov": null, + "grad_norm": 0.6383299877925953, + "grad_max_sv": 0.26338610500097276, + "grad_min_sv": 1.1300838716199468e-08, + "grad_condition": 111884472.4678097, + "lr": 0.0005209378268645994, + "time_sec": 32.5793662071228 + }, + { + "epoch": 74, + "train_loss": 0.47278374366760256, + "train_acc": 0.84774, + "test_loss": 2.6715963176727295, + "test_acc": 0.5175, + "lyapunov": null, + "grad_norm": 0.6274777670934027, + "grad_max_sv": 0.2674501951783895, + "grad_min_sv": 1.1504576969084777e-08, + "grad_condition": 1355085877.4304867, + "lr": 0.0005104712099416781, + "time_sec": 32.57535362243652 + }, + { + "epoch": 75, + "train_loss": 0.46160235664367677, + "train_acc": 0.8514, + "test_loss": 2.648087367248535, + "test_acc": 0.5256, + "lyapunov": null, + "grad_norm": 0.6267372816019459, + "grad_max_sv": 0.2574677299708128, + "grad_min_sv": 1.0966666171572172e-08, + "grad_condition": 334727656.01781523, + "lr": 0.0004999999999999996, + "time_sec": 32.610466957092285 + }, + { + "epoch": 76, + "train_loss": 0.4535921633911133, + "train_acc": 0.85614, + "test_loss": 2.6602814262390138, + "test_acc": 0.523, + "lyapunov": null, + "grad_norm": 0.6107123792245788, + "grad_max_sv": 0.2529071237891912, + "grad_min_sv": 1.1059093659587793e-08, + "grad_condition": 120836694.63569286, + "lr": 0.0004895287900583212, + "time_sec": 32.60012149810791 + }, + { + "epoch": 77, + "train_loss": 0.4353150751876831, + "train_acc": 0.85868, + "test_loss": 2.704223956680298, + "test_acc": 0.515, + "lyapunov": null, + "grad_norm": 0.6089035015325723, + "grad_max_sv": 0.26519037671387197, + "grad_min_sv": 1.1131827913862629e-08, + "grad_condition": 731888345.2288473, + "lr": 0.0004790621731353997, + "time_sec": 32.5684015750885 + }, + { + "epoch": 78, + "train_loss": 0.4266960339736938, + "train_acc": 0.86162, + "test_loss": 2.621325074005127, + "test_acc": 0.5293, + "lyapunov": null, + "grad_norm": 0.6005077005692222, + "grad_max_sv": 0.24986533373594283, + "grad_min_sv": 1.066437155744851e-08, + "grad_condition": 323621690.1204275, + "lr": 0.000468604740235343, + "time_sec": 32.593501567840576 + }, + { + "epoch": 79, + "train_loss": 0.40983675064086916, + "train_acc": 0.86828, + "test_loss": 2.654561376953125, + "test_acc": 0.5278, + "lyapunov": null, + "grad_norm": 0.5926958478419567, + "grad_max_sv": 0.253178546205163, + "grad_min_sv": 1.0804884827174745e-08, + "grad_condition": 432601908.1535362, + "lr": 0.00045816107833384175, + "time_sec": 32.603999376297 + }, + { + "epoch": 80, + "train_loss": 0.4048340177345276, + "train_acc": 0.86952, + "test_loss": 2.7457454587936403, + "test_acc": 0.5169, + "lyapunov": null, + "grad_norm": 0.5908548576457587, + "grad_max_sv": 0.25038131698966026, + "grad_min_sv": 1.0512154793168581e-08, + "grad_condition": 130905588.43349023, + "lr": 0.0004477357683661729, + "time_sec": 32.603445053100586 + }, + { + "epoch": 81, + "train_loss": 0.3956010137653351, + "train_acc": 0.87362, + "test_loss": 2.6873944789886473, + "test_acc": 0.5209, + "lyapunov": null, + "grad_norm": 0.584388729391549, + "grad_max_sv": 0.24884492233395578, + "grad_min_sv": 1.0513768951801727e-08, + "grad_condition": 247213360.42633313, + "lr": 0.00043733338321784746, + "time_sec": 32.59891176223755 + }, + { + "epoch": 82, + "train_loss": 0.39998871772766115, + "train_acc": 0.87126, + "test_loss": 2.7860556625366213, + "test_acc": 0.5159, + "lyapunov": null, + "grad_norm": 0.5914248649657466, + "grad_max_sv": 0.2658348709344864, + "grad_min_sv": 1.082797196690511e-08, + "grad_condition": 1133342480.7967758, + "lr": 0.0004269584857187939, + "time_sec": 32.59586429595947 + }, + { + "epoch": 83, + "train_loss": 0.3816492418861389, + "train_acc": 0.877, + "test_loss": 2.7754603567123413, + "test_acc": 0.5172, + "lyapunov": null, + "grad_norm": 0.5821106701045357, + "grad_max_sv": 0.2504717506468296, + "grad_min_sv": 1.0313228220211468e-08, + "grad_condition": 79983143.9616401, + "lr": 0.0004166156266419484, + "time_sec": 32.61333727836609 + }, + { + "epoch": 84, + "train_loss": 0.3718857811355591, + "train_acc": 0.88052, + "test_loss": 2.711159196472168, + "test_acc": 0.5308, + "lyapunov": null, + "grad_norm": 0.5753178111464781, + "grad_max_sv": 0.24524039030075073, + "grad_min_sv": 1.0231703595139919e-08, + "grad_condition": 185067792.66451305, + "lr": 0.0004063093427071373, + "time_sec": 32.58551812171936 + }, + { + "epoch": 85, + "train_loss": 0.3627623717498779, + "train_acc": 0.8827, + "test_loss": 2.7379925659179687, + "test_acc": 0.5259, + "lyapunov": null, + "grad_norm": 0.5629491927418928, + "grad_max_sv": 0.24136969707906247, + "grad_min_sv": 9.91763398714568e-09, + "grad_condition": 152636209.94255581, + "lr": 0.0003960441545911199, + "time_sec": 32.603590965270996 + }, + { + "epoch": 86, + "train_loss": 0.346252275390625, + "train_acc": 0.88882, + "test_loss": 2.766578482246399, + "test_acc": 0.5312, + "lyapunov": null, + "grad_norm": 0.5515259268132012, + "grad_max_sv": 0.24355790987610818, + "grad_min_sv": 1.0009752546454032e-08, + "grad_condition": 97406517.6245994, + "lr": 0.0003858245649446718, + "time_sec": 32.584232807159424 + }, + { + "epoch": 87, + "train_loss": 0.34051946352005, + "train_acc": 0.89098, + "test_loss": 2.779722568702698, + "test_acc": 0.528, + "lyapunov": null, + "grad_norm": 0.5519101007375313, + "grad_max_sv": 0.24400133974850177, + "grad_min_sv": 9.877336406855648e-09, + "grad_condition": 712710697.5623571, + "lr": 0.00037565505641757235, + "time_sec": 32.6142373085022 + }, + { + "epoch": 88, + "train_loss": 0.33136254326820375, + "train_acc": 0.89032, + "test_loss": 2.719365368270874, + "test_acc": 0.535, + "lyapunov": null, + "grad_norm": 0.5511773242388698, + "grad_max_sv": 0.23767127953469752, + "grad_min_sv": 9.902577505389865e-09, + "grad_condition": 127351733.7757211, + "lr": 0.00036554008969236695, + "time_sec": 32.62907528877258 + }, + { + "epoch": 89, + "train_loss": 0.32775797492980957, + "train_acc": 0.89324, + "test_loss": 2.790045444488525, + "test_acc": 0.5299, + "lyapunov": null, + "grad_norm": 0.5479128041042186, + "grad_max_sv": 0.2417389802634716, + "grad_min_sv": 9.801050153543031e-09, + "grad_condition": 342834303.4129317, + "lr": 0.0003554841015277638, + "time_sec": 32.58039617538452 + }, + { + "epoch": 90, + "train_loss": 0.32945220873832703, + "train_acc": 0.8918, + "test_loss": 2.922000147628784, + "test_acc": 0.5182, + "lyapunov": null, + "grad_norm": 0.5550461625192047, + "grad_max_sv": 0.24011647067964076, + "grad_min_sv": 9.800379771726567e-09, + "grad_condition": 1256581334.5865822, + "lr": 0.000345491502812526, + "time_sec": 32.59003448486328 + }, + { + "epoch": 91, + "train_loss": 0.3192555838537216, + "train_acc": 0.89716, + "test_loss": 2.8951302070617677, + "test_acc": 0.5263, + "lyapunov": null, + "grad_norm": 0.5399705873184968, + "grad_max_sv": 0.2398311447352171, + "grad_min_sv": 9.757036307719846e-09, + "grad_condition": 127427759.95651396, + "lr": 0.0003355666766307081, + "time_sec": 32.6045126914978 + }, + { + "epoch": 92, + "train_loss": 0.3078860513591766, + "train_acc": 0.90134, + "test_loss": 2.8668867027282716, + "test_acc": 0.5242, + "lyapunov": null, + "grad_norm": 0.529771320174461, + "grad_max_sv": 0.24304427802562714, + "grad_min_sv": 9.90028982024438e-09, + "grad_condition": 134692222.21263316, + "lr": 0.00032571397633909225, + "time_sec": 32.59454321861267 + }, + { + "epoch": 93, + "train_loss": 0.2954711162376404, + "train_acc": 0.90374, + "test_loss": 2.8291058578491213, + "test_acc": 0.5338, + "lyapunov": null, + "grad_norm": 0.5270179348539408, + "grad_max_sv": 0.23493569679558277, + "grad_min_sv": 9.681322873239529e-09, + "grad_condition": 154310830.71851045, + "lr": 0.00031593772365766094, + "time_sec": 32.637152433395386 + }, + { + "epoch": 94, + "train_loss": 0.29190866079330446, + "train_acc": 0.90516, + "test_loss": 2.8675409421920777, + "test_acc": 0.5267, + "lyapunov": null, + "grad_norm": 0.5236741934845208, + "grad_max_sv": 0.23337335288524627, + "grad_min_sv": 9.406507730548574e-09, + "grad_condition": 172022555.775852, + "lr": 0.0003062422067739483, + "time_sec": 32.615885496139526 + }, + { + "epoch": 95, + "train_loss": 0.2843532346916199, + "train_acc": 0.90826, + "test_loss": 2.9124584104537963, + "test_acc": 0.5294, + "lyapunov": null, + "grad_norm": 0.5141183140073359, + "grad_max_sv": 0.22986465878784657, + "grad_min_sv": 9.210905181113172e-09, + "grad_condition": 336375534.72882974, + "lr": 0.00029663167846209965, + "time_sec": 32.62099742889404 + }, + { + "epoch": 96, + "train_loss": 0.28095845563411714, + "train_acc": 0.90888, + "test_loss": 2.9585642152786256, + "test_acc": 0.5188, + "lyapunov": null, + "grad_norm": 0.5209337851609864, + "grad_max_sv": 0.24165461957454681, + "grad_min_sv": 9.822391551029056e-09, + "grad_condition": 3734850942.353486, + "lr": 0.00028711035421746345, + "time_sec": 32.606362104415894 + }, + { + "epoch": 97, + "train_loss": 0.270245605134964, + "train_acc": 0.91376, + "test_loss": 2.8790921213150025, + "test_acc": 0.535, + "lyapunov": null, + "grad_norm": 0.5018050404070028, + "grad_max_sv": 0.2287111472338438, + "grad_min_sv": 9.100506417479732e-09, + "grad_condition": 1286046088.0897596, + "lr": 0.00027768241040753615, + "time_sec": 32.605376958847046 + }, + { + "epoch": 98, + "train_loss": 0.26737561470508575, + "train_acc": 0.91348, + "test_loss": 2.9673530891418456, + "test_acc": 0.52, + "lyapunov": null, + "grad_norm": 0.5026625596288345, + "grad_max_sv": 0.22773091793060302, + "grad_min_sv": 9.130605362089221e-09, + "grad_condition": 2561536325.8505445, + "lr": 0.00026835198244006903, + "time_sec": 32.61582803726196 + }, + { + "epoch": 99, + "train_loss": 0.25649453671455386, + "train_acc": 0.91706, + "test_loss": 2.960128957557678, + "test_acc": 0.5285, + "lyapunov": null, + "grad_norm": 0.4959587348752051, + "grad_max_sv": 0.22662512063980103, + "grad_min_sv": 9.021708526762983e-09, + "grad_condition": 2170055259.576285, + "lr": 0.0002591231629491421, + "time_sec": 32.59518361091614 + }, + { + "epoch": 100, + "train_loss": 0.25298852029800417, + "train_acc": 0.91614, + "test_loss": 2.999088920211792, + "test_acc": 0.5213, + "lyapunov": null, + "grad_norm": 0.49694281512357663, + "grad_max_sv": 0.2285677995532751, + "grad_min_sv": 9.117687981181898e-09, + "grad_condition": 153385408.53154242, + "lr": 0.0002499999999999997, + "time_sec": 32.60006618499756 + }, + { + "epoch": 101, + "train_loss": 0.24837311635971068, + "train_acc": 0.92042, + "test_loss": 2.9769588521957395, + "test_acc": 0.527, + "lyapunov": null, + "grad_norm": 0.49156384156747235, + "grad_max_sv": 0.23404922261834143, + "grad_min_sv": 9.245040229915492e-09, + "grad_condition": 730777146.0902932, + "lr": 0.00024098649531343477, + "time_sec": 32.58926057815552 + }, + { + "epoch": 102, + "train_loss": 0.24679850215435029, + "train_acc": 0.91974, + "test_loss": 2.983294668197632, + "test_acc": 0.5239, + "lyapunov": null, + "grad_norm": 0.4891194067973055, + "grad_max_sv": 0.22282884679734707, + "grad_min_sv": 8.780173748647313e-09, + "grad_condition": 157121553.36478597, + "lr": 0.0002320866025105016, + "time_sec": 32.61522173881531 + }, + { + "epoch": 103, + "train_loss": 0.235624645652771, + "train_acc": 0.9236, + "test_loss": 2.97529112701416, + "test_acc": 0.5278, + "lyapunov": null, + "grad_norm": 0.47526538494931814, + "grad_max_sv": 0.2206702034920454, + "grad_min_sv": 8.61680920262453e-09, + "grad_condition": 145823760.67239988, + "lr": 0.0002233042253783278, + "time_sec": 32.67024850845337 + }, + { + "epoch": 104, + "train_loss": 0.23265846648216248, + "train_acc": 0.92502, + "test_loss": 2.9763864707946777, + "test_acc": 0.5263, + "lyapunov": null, + "grad_norm": 0.47725567627138915, + "grad_max_sv": 0.22133470103144645, + "grad_min_sv": 8.68051782312168e-09, + "grad_condition": 267574471.67175755, + "lr": 0.000214643216157784, + "time_sec": 32.611361265182495 + }, + { + "epoch": 105, + "train_loss": 0.22897292974472047, + "train_acc": 0.92568, + "test_loss": 3.0474896495819093, + "test_acc": 0.5212, + "lyapunov": null, + "grad_norm": 0.4764754544051647, + "grad_max_sv": 0.22653804197907448, + "grad_min_sv": 8.760947359104918e-09, + "grad_condition": 3219418687.447474, + "lr": 0.00020610737385376332, + "time_sec": 32.5970995426178 + }, + { + "epoch": 106, + "train_loss": 0.22509269979476929, + "train_acc": 0.9271, + "test_loss": 2.9895481927871703, + "test_acc": 0.5276, + "lyapunov": null, + "grad_norm": 0.47179914735427825, + "grad_max_sv": 0.22902226410806178, + "grad_min_sv": 8.651995134743851e-09, + "grad_condition": 188321170.63109916, + "lr": 0.00019770044256881242, + "time_sec": 32.61952805519104 + }, + { + "epoch": 107, + "train_loss": 0.22124877912521362, + "train_acc": 0.92918, + "test_loss": 2.9869052186965943, + "test_acc": 0.5261, + "lyapunov": null, + "grad_norm": 0.4676814721095271, + "grad_max_sv": 0.23612426966428757, + "grad_min_sv": 8.830977354858538e-09, + "grad_condition": 1324097462.1438193, + "lr": 0.0001894261098608447, + "time_sec": 32.63655757904053 + }, + { + "epoch": 108, + "train_loss": 0.2119530977487564, + "train_acc": 0.93214, + "test_loss": 2.957085295295715, + "test_acc": 0.5283, + "lyapunov": null, + "grad_norm": 0.4597233192330978, + "grad_max_sv": 0.21893165111541749, + "grad_min_sv": 8.44588889763187e-09, + "grad_condition": 325299909.8181821, + "lr": 0.000181288005125655, + "time_sec": 32.6324462890625 + }, + { + "epoch": 109, + "train_loss": 0.2096145883345604, + "train_acc": 0.93168, + "test_loss": 3.0633232662200927, + "test_acc": 0.5232, + "lyapunov": null, + "grad_norm": 0.46012619309211217, + "grad_max_sv": 0.21432300768792628, + "grad_min_sv": 8.437937682305527e-09, + "grad_condition": 912797689.183795, + "lr": 0.0001732896980049473, + "time_sec": 32.59154772758484 + }, + { + "epoch": 110, + "train_loss": 0.20650233900070192, + "train_acc": 0.9334, + "test_loss": 3.0124371912002563, + "test_acc": 0.5288, + "lyapunov": null, + "grad_norm": 0.45267852009677, + "grad_max_sv": 0.2197608083486557, + "grad_min_sv": 8.136439059915762e-09, + "grad_condition": 214553728.36221018, + "lr": 0.00016543469682057076, + "time_sec": 32.58715891838074 + }, + { + "epoch": 111, + "train_loss": 0.202456818523407, + "train_acc": 0.93476, + "test_loss": 2.953989649581909, + "test_acc": 0.5364, + "lyapunov": null, + "grad_norm": 0.44877046173685803, + "grad_max_sv": 0.2101663440465927, + "grad_min_sv": 8.111785431298008e-09, + "grad_condition": 181357744.46055207, + "lr": 0.00015772644703565552, + "time_sec": 32.61166739463806 + }, + { + "epoch": 112, + "train_loss": 0.19417572572231293, + "train_acc": 0.93836, + "test_loss": 3.0636728370666506, + "test_acc": 0.5294, + "lyapunov": null, + "grad_norm": 0.44228389201963325, + "grad_max_sv": 0.2184779081493616, + "grad_min_sv": 8.052494614532204e-09, + "grad_condition": 701685099.8537222, + "lr": 0.00015016832974331713, + "time_sec": 32.61799240112305 + }, + { + "epoch": 113, + "train_loss": 0.1894145729970932, + "train_acc": 0.93984, + "test_loss": 2.981136636924744, + "test_acc": 0.5323, + "lyapunov": null, + "grad_norm": 0.4358812319975278, + "grad_max_sv": 0.20872662551701068, + "grad_min_sv": 7.95152020114211e-09, + "grad_condition": 1423865321.2329361, + "lr": 0.00014276366018359834, + "time_sec": 32.6167311668396 + }, + { + "epoch": 114, + "train_loss": 0.18947952261924744, + "train_acc": 0.9398, + "test_loss": 3.0828820104598997, + "test_acc": 0.5292, + "lyapunov": null, + "grad_norm": 0.43739466792043646, + "grad_max_sv": 0.2058663982897997, + "grad_min_sv": 7.741768523156016e-09, + "grad_condition": 7243536793.4379, + "lr": 0.00013551568628929425, + "time_sec": 32.59801626205444 + }, + { + "epoch": 115, + "train_loss": 0.1862397237443924, + "train_acc": 0.94078, + "test_loss": 2.9763780981063843, + "test_acc": 0.538, + "lyapunov": null, + "grad_norm": 0.43528746000323826, + "grad_max_sv": 0.20504732690751554, + "grad_min_sv": 8.141562394137907e-09, + "grad_condition": 139509610.14712492, + "lr": 0.00012842758726130276, + "time_sec": 32.612173080444336 + }, + { + "epoch": 116, + "train_loss": 0.17998726233482362, + "train_acc": 0.9426, + "test_loss": 3.0221671098709106, + "test_acc": 0.5357, + "lyapunov": null, + "grad_norm": 0.4288718122641706, + "grad_max_sv": 0.2140086382627487, + "grad_min_sv": 7.976556949608644e-09, + "grad_condition": 784872577.917934, + "lr": 0.0001215024721741218, + "time_sec": 32.63769769668579 + }, + { + "epoch": 117, + "train_loss": 0.17653137303352356, + "train_acc": 0.94314, + "test_loss": 3.0061340055465697, + "test_acc": 0.5323, + "lyapunov": null, + "grad_norm": 0.4236151447378006, + "grad_max_sv": 0.20592431761324406, + "grad_min_sv": 7.804582891849515e-09, + "grad_condition": 232091482.5503703, + "lr": 0.00011474337861210538, + "time_sec": 32.63769888877869 + }, + { + "epoch": 118, + "train_loss": 0.18115964114189148, + "train_acc": 0.94264, + "test_loss": 2.9955945150375367, + "test_acc": 0.5394, + "lyapunov": null, + "grad_norm": 0.43031955217275497, + "grad_max_sv": 0.21836008243262767, + "grad_min_sv": 7.966632081498128e-09, + "grad_condition": 338791411.5737727, + "lr": 0.00010815327133708009, + "time_sec": 32.59054613113403 + }, + { + "epoch": 119, + "train_loss": 0.1751684021663666, + "train_acc": 0.94342, + "test_loss": 3.0028031162261963, + "test_acc": 0.5344, + "lyapunov": null, + "grad_norm": 0.4234025902326238, + "grad_max_sv": 0.2052937986329198, + "grad_min_sv": 7.743973756604156e-09, + "grad_condition": 205737178.47096592, + "lr": 0.00010173504098790182, + "time_sec": 32.63575482368469 + }, + { + "epoch": 120, + "train_loss": 0.17288655778884887, + "train_acc": 0.9449, + "test_loss": 3.026424203681946, + "test_acc": 0.5381, + "lyapunov": null, + "grad_norm": 0.41773026543709724, + "grad_max_sv": 0.2095510721206665, + "grad_min_sv": 7.937595827254033e-09, + "grad_condition": 6330317379.225478, + "lr": 9.549150281252629e-05, + "time_sec": 32.587223052978516 + }, + { + "epoch": 121, + "train_loss": 0.17101951307296753, + "train_acc": 0.94462, + "test_loss": 3.165215256309509, + "test_acc": 0.5219, + "lyapunov": null, + "grad_norm": 0.42195608937670603, + "grad_max_sv": 0.20825999304652215, + "grad_min_sv": 7.99512678009099e-09, + "grad_condition": 653203712.6193202, + "lr": 8.942539543314794e-05, + "time_sec": 32.596564531326294 + }, + { + "epoch": 122, + "train_loss": 0.1693978008031845, + "train_acc": 0.94588, + "test_loss": 3.0062981233596804, + "test_acc": 0.5348, + "lyapunov": null, + "grad_norm": 0.41591242620468016, + "grad_max_sv": 0.2059656113386154, + "grad_min_sv": 7.704039686772836e-09, + "grad_condition": 1004445609.8434451, + "lr": 8.353937964495024e-05, + "time_sec": 32.61800956726074 + }, + { + "epoch": 123, + "train_loss": 0.16728713005065918, + "train_acc": 0.94756, + "test_loss": 3.1665957611083986, + "test_acc": 0.5246, + "lyapunov": null, + "grad_norm": 0.41526238625867323, + "grad_max_sv": 0.20129744820296763, + "grad_min_sv": 7.569636380905243e-09, + "grad_condition": 407190475.77847266, + "lr": 7.783603724899243e-05, + "time_sec": 32.61078882217407 + }, + { + "epoch": 124, + "train_loss": 0.1635257438659668, + "train_acc": 0.94798, + "test_loss": 3.1016404109954836, + "test_acc": 0.5367, + "lyapunov": null, + "grad_norm": 0.4079868295136817, + "grad_max_sv": 0.20866212155669928, + "grad_min_sv": 7.864988894011604e-09, + "grad_condition": 294549971.18264663, + "lr": 7.231786991974666e-05, + "time_sec": 32.627676486968994 + }, + { + "epoch": 125, + "train_loss": 0.1641435864830017, + "train_acc": 0.94756, + "test_loss": 3.0870759466171265, + "test_acc": 0.5259, + "lyapunov": null, + "grad_norm": 0.4108898930410538, + "grad_max_sv": 0.21254582721740006, + "grad_min_sv": 7.773244741892532e-09, + "grad_condition": 192549384.92611116, + "lr": 6.698729810778072e-05, + "time_sec": 32.60348701477051 + }, + { + "epoch": 126, + "train_loss": 0.15524960072517396, + "train_acc": 0.95126, + "test_loss": 3.106667465209961, + "test_acc": 0.5253, + "lyapunov": null, + "grad_norm": 0.39708975035952015, + "grad_max_sv": 0.20546648390591143, + "grad_min_sv": 7.524984951411303e-09, + "grad_condition": 594241717.5398318, + "lr": 6.184665997806817e-05, + "time_sec": 32.62395262718201 + }, + { + "epoch": 127, + "train_loss": 0.16405641248226166, + "train_acc": 0.94786, + "test_loss": 3.0382690155029297, + "test_acc": 0.5344, + "lyapunov": null, + "grad_norm": 0.41136197829373494, + "grad_max_sv": 0.20878486707806587, + "grad_min_sv": 7.634084871223142e-09, + "grad_condition": 4480646318.175786, + "lr": 5.6898210384392595e-05, + "time_sec": 32.58641195297241 + }, + { + "epoch": 128, + "train_loss": 0.15556303625106813, + "train_acc": 0.95, + "test_loss": 3.0696772289276124, + "test_acc": 0.5291, + "lyapunov": null, + "grad_norm": 0.399629179039621, + "grad_max_sv": 0.19112058784812688, + "grad_min_sv": 7.558967303998576e-09, + "grad_condition": 130958494.19530413, + "lr": 5.214411988029363e-05, + "time_sec": 32.6273717880249 + }, + { + "epoch": 129, + "train_loss": 0.15622675662994384, + "train_acc": 0.94962, + "test_loss": 3.0737016366958616, + "test_acc": 0.53, + "lyapunov": null, + "grad_norm": 0.4021852855426899, + "grad_max_sv": 0.20368068106472492, + "grad_min_sv": 7.91968607510862e-09, + "grad_condition": 4092034646.124222, + "lr": 4.7586473766990294e-05, + "time_sec": 32.61072516441345 + }, + { + "epoch": 130, + "train_loss": 0.15069342103004454, + "train_acc": 0.95206, + "test_loss": 3.138083388710022, + "test_acc": 0.5303, + "lyapunov": null, + "grad_norm": 0.3967446109539621, + "grad_max_sv": 0.20565238259732724, + "grad_min_sv": 7.903937278850096e-09, + "grad_condition": 403356372.5201774, + "lr": 4.32272711786996e-05, + "time_sec": 32.60817766189575 + }, + { + "epoch": 131, + "train_loss": 0.1475225008201599, + "train_acc": 0.95388, + "test_loss": 3.097823154640198, + "test_acc": 0.5262, + "lyapunov": null, + "grad_norm": 0.3911645556854745, + "grad_max_sv": 0.2029418082907796, + "grad_min_sv": 7.451206509700297e-09, + "grad_condition": 184512637.53159684, + "lr": 3.906842420574966e-05, + "time_sec": 32.620972633361816 + }, + { + "epoch": 132, + "train_loss": 0.14910545247793197, + "train_acc": 0.95376, + "test_loss": 3.1958837438583374, + "test_acc": 0.5255, + "lyapunov": null, + "grad_norm": 0.39312251468793336, + "grad_max_sv": 0.19356854669749737, + "grad_min_sv": 7.3685526407948895e-09, + "grad_condition": 474360013.88184536, + "lr": 3.5111757055874305e-05, + "time_sec": 32.62202000617981 + }, + { + "epoch": 133, + "train_loss": 0.14772581936836243, + "train_acc": 0.95306, + "test_loss": 3.1449778295516966, + "test_acc": 0.528, + "lyapunov": null, + "grad_norm": 0.39083628600782144, + "grad_max_sv": 0.18662805538624525, + "grad_min_sv": 7.411569982176611e-09, + "grad_condition": 590179948.2869803, + "lr": 3.1359005254054254e-05, + "time_sec": 32.62527775764465 + }, + { + "epoch": 134, + "train_loss": 0.1473908689570427, + "train_acc": 0.95432, + "test_loss": 3.060500933647156, + "test_acc": 0.532, + "lyapunov": null, + "grad_norm": 0.39321527574531456, + "grad_max_sv": 0.1960258588194847, + "grad_min_sv": 7.530598097665528e-09, + "grad_condition": 690149093.5169044, + "lr": 2.7811814881259484e-05, + "time_sec": 32.611403942108154 + }, + { + "epoch": 135, + "train_loss": 0.1489419222688675, + "train_acc": 0.95216, + "test_loss": 3.0586274435043337, + "test_acc": 0.5333, + "lyapunov": null, + "grad_norm": 0.3951339678077363, + "grad_max_sv": 0.19855166971683502, + "grad_min_sv": 7.4231230849652885e-09, + "grad_condition": 338026036.5432772, + "lr": 2.4471741852423218e-05, + "time_sec": 32.57758116722107 + }, + { + "epoch": 136, + "train_loss": 0.1439458827161789, + "train_acc": 0.9552, + "test_loss": 3.1572901706695555, + "test_acc": 0.5268, + "lyapunov": null, + "grad_norm": 0.38505775133385556, + "grad_max_sv": 0.20576392244547606, + "grad_min_sv": 7.578524123253968e-09, + "grad_condition": 2346058745.0245013, + "lr": 2.1340251233966362e-05, + "time_sec": 32.60840678215027 + }, + { + "epoch": 137, + "train_loss": 0.14263056889772416, + "train_acc": 0.95558, + "test_loss": 3.0500190071105955, + "test_acc": 0.5343, + "lyapunov": null, + "grad_norm": 0.38315618240250937, + "grad_max_sv": 0.19492608066648245, + "grad_min_sv": 7.437362629664907e-09, + "grad_condition": 445968074.97881687, + "lr": 1.8418716601170932e-05, + "time_sec": 32.5784227848053 + }, + { + "epoch": 138, + "train_loss": 0.14197950773239135, + "train_acc": 0.95516, + "test_loss": 3.054612173843384, + "test_acc": 0.5379, + "lyapunov": null, + "grad_norm": 0.3842449580292686, + "grad_max_sv": 0.20386305153369905, + "grad_min_sv": 7.256548800879062e-09, + "grad_condition": 4009126006.180674, + "lr": 1.570841943568445e-05, + "time_sec": 32.58382248878479 + }, + { + "epoch": 139, + "train_loss": 0.14526520327091216, + "train_acc": 0.95412, + "test_loss": 3.0950862688064573, + "test_acc": 0.5323, + "lyapunov": null, + "grad_norm": 0.38739146310202444, + "grad_max_sv": 0.19300882443785666, + "grad_min_sv": 7.3080626628160495e-09, + "grad_condition": 1317753085.472504, + "lr": 1.3210548563419845e-05, + "time_sec": 32.599539041519165 + }, + { + "epoch": 140, + "train_loss": 0.14277389855384826, + "train_acc": 0.9551, + "test_loss": 3.0536239072799685, + "test_acc": 0.5334, + "lyapunov": null, + "grad_norm": 0.3812502385842012, + "grad_max_sv": 0.2037056451663375, + "grad_min_sv": 7.302020117101499e-09, + "grad_condition": 4685216825.833342, + "lr": 1.0926199633097203e-05, + "time_sec": 32.60143446922302 + }, + { + "epoch": 141, + "train_loss": 0.14106001211643218, + "train_acc": 0.95592, + "test_loss": 3.0723882249832153, + "test_acc": 0.5322, + "lyapunov": null, + "grad_norm": 0.38539484766071236, + "grad_max_sv": 0.19134777113795282, + "grad_min_sv": 7.162904132459666e-09, + "grad_condition": 370718600.83184236, + "lr": 8.856374635655688e-06, + "time_sec": 32.604408740997314 + }, + { + "epoch": 142, + "train_loss": 0.1438280531835556, + "train_acc": 0.95406, + "test_loss": 3.1630526540756225, + "test_acc": 0.526, + "lyapunov": null, + "grad_norm": 0.3885005879930968, + "grad_max_sv": 0.19621171467006207, + "grad_min_sv": 7.508452308209804e-09, + "grad_condition": 440340049.22603464, + "lr": 7.001981464747503e-06, + "time_sec": 32.600708961486816 + }, + { + "epoch": 143, + "train_loss": 0.1418447697210312, + "train_acc": 0.95556, + "test_loss": 3.0879846578598023, + "test_acc": 0.5291, + "lyapunov": null, + "grad_norm": 0.3836324164118778, + "grad_max_sv": 0.188724672421813, + "grad_min_sv": 7.507878820815078e-09, + "grad_condition": 1051208641.6769501, + "lr": 5.3638335185058295e-06, + "time_sec": 32.61192798614502 + }, + { + "epoch": 144, + "train_loss": 0.14410037503242493, + "train_acc": 0.95534, + "test_loss": 3.1234459602355957, + "test_acc": 0.5318, + "lyapunov": null, + "grad_norm": 0.38512540576239257, + "grad_max_sv": 0.20008118823170662, + "grad_min_sv": 7.477710552595152e-09, + "grad_condition": 1216378712.8275027, + "lr": 3.942649342761114e-06, + "time_sec": 32.67555069923401 + }, + { + "epoch": 145, + "train_loss": 0.14076073776245118, + "train_acc": 0.95618, + "test_loss": 3.0669401094436646, + "test_acc": 0.5376, + "lyapunov": null, + "grad_norm": 0.38185175053609804, + "grad_max_sv": 0.19599322322756052, + "grad_min_sv": 7.380410241113189e-09, + "grad_condition": 248121028.65324074, + "lr": 2.7390523158633524e-06, + "time_sec": 32.595621824264526 + }, + { + "epoch": 146, + "train_loss": 0.14235492443561554, + "train_acc": 0.95542, + "test_loss": 3.1099600078582763, + "test_acc": 0.5303, + "lyapunov": null, + "grad_norm": 0.3833756904141184, + "grad_max_sv": 0.19929019846022128, + "grad_min_sv": 7.511771148854818e-09, + "grad_condition": 234726041.20136175, + "lr": 1.7535703752478133e-06, + "time_sec": 32.61228895187378 + }, + { + "epoch": 147, + "train_loss": 0.1437687619996071, + "train_acc": 0.95498, + "test_loss": 3.1555084846496584, + "test_acc": 0.5253, + "lyapunov": null, + "grad_norm": 0.38692842594278615, + "grad_max_sv": 0.19934902153909206, + "grad_min_sv": 7.2967766568429565e-09, + "grad_condition": 2247202882.6063395, + "lr": 9.866357858642196e-07, + "time_sec": 32.581571102142334 + }, + { + "epoch": 148, + "train_loss": 0.13997777037143708, + "train_acc": 0.95636, + "test_loss": 3.126287574195862, + "test_acc": 0.5349, + "lyapunov": null, + "grad_norm": 0.37982964494822274, + "grad_max_sv": 0.19688362777233123, + "grad_min_sv": 7.199474146620671e-09, + "grad_condition": 410986683.7547163, + "lr": 4.38584950570808e-07, + "time_sec": 32.614789724349976 + }, + { + "epoch": 149, + "train_loss": 0.13758307416915894, + "train_acc": 0.9559, + "test_loss": 3.0673478214263916, + "test_acc": 0.5359, + "lyapunov": null, + "grad_norm": 0.37705013515223074, + "grad_max_sv": 0.20387833528220653, + "grad_min_sv": 7.47520324575064e-09, + "grad_condition": 2818005270.75425, + "lr": 1.096582625772501e-07, + "time_sec": 32.597362995147705 + }, + { + "epoch": 150, + "train_loss": 0.13772287871360778, + "train_acc": 0.95614, + "test_loss": 3.273663801765442, + "test_acc": 0.5186, + "lyapunov": null, + "grad_norm": 0.3790080333138129, + "grad_max_sv": 0.2025493886321783, + "grad_min_sv": 7.3542313326689475e-09, + "grad_condition": 1465090879.8372142, + "lr": 0.0, + "time_sec": 32.61164855957031 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 4.866019581298828, + "train_acc": 0.03074, + "test_loss": 4.872710034179687, + "test_acc": 0.0143, + "lyapunov": null, + "grad_norm": 5.904015758743758, + "grad_max_sv": 5.3000179648399355, + "grad_min_sv": 9.986983708909492e-08, + "grad_condition": 75746426.03647776, + "lr": 0.0009998903417374227, + "time_sec": 49.65879511833191 + }, + { + "epoch": 2, + "train_loss": 4.336319505615235, + "train_acc": 0.05884, + "test_loss": 5.078699280548095, + "test_acc": 0.0179, + "lyapunov": null, + "grad_norm": 4.512132309010241, + "grad_max_sv": 3.9969229817390444, + "grad_min_sv": 7.723465306475052e-08, + "grad_condition": 99844248.01218227, + "lr": 0.0009995614150494292, + "time_sec": 49.67804217338562 + }, + { + "epoch": 3, + "train_loss": 4.054194154663086, + "train_acc": 0.08442, + "test_loss": 4.735939234924317, + "test_acc": 0.0289, + "lyapunov": null, + "grad_norm": 3.6216238346079055, + "grad_max_sv": 3.0721623718738558, + "grad_min_sv": 6.332745707271492e-08, + "grad_condition": 68533376.3072471, + "lr": 0.0009990133642141358, + "time_sec": 49.650996685028076 + }, + { + "epoch": 4, + "train_loss": 3.8553889916229247, + "train_acc": 0.11068, + "test_loss": 4.7776531311035155, + "test_acc": 0.04, + "lyapunov": null, + "grad_norm": 3.0027283473808, + "grad_max_sv": 2.4722895294427873, + "grad_min_sv": 5.260577265187028e-08, + "grad_condition": 133218192.19257763, + "lr": 0.0009982464296247522, + "time_sec": 49.62583518028259 + }, + { + "epoch": 5, + "train_loss": 3.6851790403747557, + "train_acc": 0.13608, + "test_loss": 4.847144582366943, + "test_acc": 0.0436, + "lyapunov": null, + "grad_norm": 2.4406262601219466, + "grad_max_sv": 1.8893477827310563, + "grad_min_sv": 4.253873583381917e-08, + "grad_condition": 53203728.717256345, + "lr": 0.0009972609476841367, + "time_sec": 49.64903235435486 + }, + { + "epoch": 6, + "train_loss": 3.557223811721802, + "train_acc": 0.1541, + "test_loss": 4.846635614776611, + "test_acc": 0.0504, + "lyapunov": null, + "grad_norm": 1.9869329520709325, + "grad_max_sv": 1.4254269927740097, + "grad_min_sv": 3.4773817814137684e-08, + "grad_condition": 109287419.58926606, + "lr": 0.000996057350657239, + "time_sec": 49.632389545440674 + }, + { + "epoch": 7, + "train_loss": 3.448442996292114, + "train_acc": 0.17344, + "test_loss": 5.146338744354248, + "test_acc": 0.0432, + "lyapunov": null, + "grad_norm": 1.6934869679578504, + "grad_max_sv": 1.111972664296627, + "grad_min_sv": 3.0129338379758507e-08, + "grad_condition": 49145502.73266151, + "lr": 0.000994636166481494, + "time_sec": 49.63013672828674 + }, + { + "epoch": 8, + "train_loss": 3.3602959382629396, + "train_acc": 0.18858, + "test_loss": 4.997173266601562, + "test_acc": 0.0549, + "lyapunov": null, + "grad_norm": 1.4715658174689026, + "grad_max_sv": 0.8646033376455307, + "grad_min_sv": 2.5999903535689484e-08, + "grad_condition": 38484605.38778691, + "lr": 0.0009929980185352525, + "time_sec": 49.63576054573059 + }, + { + "epoch": 9, + "train_loss": 3.2854549378204347, + "train_acc": 0.20336, + "test_loss": 5.892930588531494, + "test_acc": 0.0446, + "lyapunov": null, + "grad_norm": 1.3451340821865851, + "grad_max_sv": 0.7257503181695938, + "grad_min_sv": 2.3997866654967837e-08, + "grad_condition": 36951868.39671626, + "lr": 0.0009911436253643444, + "time_sec": 49.629499197006226 + }, + { + "epoch": 10, + "train_loss": 3.2246680919647215, + "train_acc": 0.21242, + "test_loss": 5.3121603576660155, + "test_acc": 0.0492, + "lyapunov": null, + "grad_norm": 1.2440111786697226, + "grad_max_sv": 0.6271802522242069, + "grad_min_sv": 2.25186588764803e-08, + "grad_condition": 32332715.425953984, + "lr": 0.0009890738003669028, + "time_sec": 49.677348613739014 + }, + { + "epoch": 11, + "train_loss": 3.1626394175720214, + "train_acc": 0.22606, + "test_loss": 6.13012219543457, + "test_acc": 0.0509, + "lyapunov": null, + "grad_norm": 1.1630276076372463, + "grad_max_sv": 0.5456254407763481, + "grad_min_sv": 2.0650329043969684e-08, + "grad_condition": 43285920.578072175, + "lr": 0.00098678945143658, + "time_sec": 49.63444662094116 + }, + { + "epoch": 12, + "train_loss": 3.105594987640381, + "train_acc": 0.2381, + "test_loss": 6.692684747314453, + "test_acc": 0.0337, + "lyapunov": null, + "grad_norm": 1.0991523249692334, + "grad_max_sv": 0.5055619306862355, + "grad_min_sv": 2.044758472541375e-08, + "grad_condition": 38174879.70426883, + "lr": 0.0009842915805643154, + "time_sec": 49.667534828186035 + }, + { + "epoch": 13, + "train_loss": 3.071034761581421, + "train_acc": 0.24202, + "test_loss": 6.808190565490722, + "test_acc": 0.0313, + "lyapunov": null, + "grad_norm": 1.0461733390262893, + "grad_max_sv": 0.45393969416618346, + "grad_min_sv": 1.9080661878279058e-08, + "grad_condition": 26144165.717305023, + "lr": 0.000981581283398829, + "time_sec": 49.651849031448364 + }, + { + "epoch": 14, + "train_loss": 3.031006901779175, + "train_acc": 0.25136, + "test_loss": 6.8066056442260745, + "test_acc": 0.0421, + "lyapunov": null, + "grad_norm": 1.0001345448432042, + "grad_max_sv": 0.4178654387593269, + "grad_min_sv": 1.817219532629366e-08, + "grad_condition": 26243292.8670463, + "lr": 0.0009786597487660333, + "time_sec": 49.67574381828308 + }, + { + "epoch": 15, + "train_loss": 2.992844039916992, + "train_acc": 0.25788, + "test_loss": 6.2335087615966795, + "test_acc": 0.0415, + "lyapunov": null, + "grad_norm": 0.9709343078677097, + "grad_max_sv": 0.40159890055656433, + "grad_min_sv": 1.7637466787068233e-08, + "grad_condition": 31130355.004485857, + "lr": 0.0009755282581475766, + "time_sec": 49.648940324783325 + }, + { + "epoch": 16, + "train_loss": 2.9533546379089355, + "train_acc": 0.2654, + "test_loss": 6.982061653900146, + "test_acc": 0.0331, + "lyapunov": null, + "grad_norm": 0.9294555695312433, + "grad_max_sv": 0.38935905918478964, + "grad_min_sv": 1.7345642956689833e-08, + "grad_condition": 34633361.17032104, + "lr": 0.0009721881851187403, + "time_sec": 49.62569880485535 + }, + { + "epoch": 17, + "train_loss": 2.9248884143066407, + "train_acc": 0.27134, + "test_loss": 5.847897528839112, + "test_acc": 0.0375, + "lyapunov": null, + "grad_norm": 0.8931744987288306, + "grad_max_sv": 0.3547165349125862, + "grad_min_sv": 1.6551659471827906e-08, + "grad_condition": 78906912.01626787, + "lr": 0.0009686409947459456, + "time_sec": 49.628357887268066 + }, + { + "epoch": 18, + "train_loss": 2.896197442779541, + "train_acc": 0.27548, + "test_loss": 6.654647819519043, + "test_acc": 0.0387, + "lyapunov": null, + "grad_norm": 0.8750290297759321, + "grad_max_sv": 0.3526077255606651, + "grad_min_sv": 1.6023472331015005e-08, + "grad_condition": 266939500.3731903, + "lr": 0.0009648882429441254, + "time_sec": 49.64867830276489 + }, + { + "epoch": 19, + "train_loss": 2.8669221867370607, + "train_acc": 0.28036, + "test_loss": 5.810343419647217, + "test_acc": 0.0502, + "lyapunov": null, + "grad_norm": 0.8587949296642396, + "grad_max_sv": 0.34078171029686927, + "grad_min_sv": 1.6171859118507826e-08, + "grad_condition": 22947806.160383917, + "lr": 0.00096093157579425, + "time_sec": 49.63094878196716 + }, + { + "epoch": 20, + "train_loss": 2.82938760848999, + "train_acc": 0.289, + "test_loss": 5.896671797180176, + "test_acc": 0.0461, + "lyapunov": null, + "grad_norm": 0.839027246743402, + "grad_max_sv": 0.3308767855167389, + "grad_min_sv": 1.570504673531481e-08, + "grad_condition": 24206043.26616613, + "lr": 0.0009567727288213001, + "time_sec": 49.6539568901062 + }, + { + "epoch": 21, + "train_loss": 2.8006727541351317, + "train_acc": 0.2938, + "test_loss": 6.180831294250488, + "test_acc": 0.0398, + "lyapunov": null, + "grad_norm": 0.8110141308366953, + "grad_max_sv": 0.3095390945672989, + "grad_min_sv": 1.4921404802026306e-08, + "grad_condition": 34079256.769043334, + "lr": 0.0009524135262330095, + "time_sec": 49.64039897918701 + }, + { + "epoch": 22, + "train_loss": 2.7774745903778078, + "train_acc": 0.29804, + "test_loss": 6.308743616485596, + "test_acc": 0.045, + "lyapunov": null, + "grad_norm": 0.8004103125902539, + "grad_max_sv": 0.31844869926571845, + "grad_min_sv": 1.5020042806734857e-08, + "grad_condition": 27917630.374082875, + "lr": 0.0009478558801197061, + "time_sec": 49.63332271575928 + }, + { + "epoch": 23, + "train_loss": 2.7524796044921875, + "train_acc": 0.30316, + "test_loss": 5.521375189208984, + "test_acc": 0.0535, + "lyapunov": null, + "grad_norm": 0.7869460876794067, + "grad_max_sv": 0.292531880363822, + "grad_min_sv": 1.448369401080285e-08, + "grad_condition": 35029756.554903194, + "lr": 0.000943101789615607, + "time_sec": 49.63528370857239 + }, + { + "epoch": 24, + "train_loss": 2.7253317372131347, + "train_acc": 0.3104, + "test_loss": 6.1194743759155275, + "test_acc": 0.0494, + "lyapunov": null, + "grad_norm": 0.7678368002286986, + "grad_max_sv": 0.29576918072998526, + "grad_min_sv": 1.4323617783529307e-08, + "grad_condition": 28702466.777186085, + "lr": 0.0009381533400219313, + "time_sec": 49.64074897766113 + }, + { + "epoch": 25, + "train_loss": 2.7074700713348387, + "train_acc": 0.31266, + "test_loss": 6.289851884460449, + "test_acc": 0.0462, + "lyapunov": null, + "grad_norm": 0.7683642905855677, + "grad_max_sv": 0.2851465784013271, + "grad_min_sv": 1.4292519384673242e-08, + "grad_condition": 22761462.806346737, + "lr": 0.0009330127018922189, + "time_sec": 49.631171464920044 + }, + { + "epoch": 26, + "train_loss": 2.686272830505371, + "train_acc": 0.3169, + "test_loss": 6.941660729980469, + "test_acc": 0.0479, + "lyapunov": null, + "grad_norm": 0.755488240958268, + "grad_max_sv": 0.28228237964212893, + "grad_min_sv": 1.4025971441233854e-08, + "grad_condition": 35803882.89457456, + "lr": 0.000927682130080253, + "time_sec": 49.64768934249878 + }, + { + "epoch": 27, + "train_loss": 2.6507435781860353, + "train_acc": 0.32476, + "test_loss": 5.651136081695556, + "test_acc": 0.0552, + "lyapunov": null, + "grad_norm": 0.7510174800021984, + "grad_max_sv": 0.2705878522247076, + "grad_min_sv": 1.3801869563900837e-08, + "grad_condition": 24650339.234644465, + "lr": 0.0009221639627510072, + "time_sec": 49.63985729217529 + }, + { + "epoch": 28, + "train_loss": 2.6402551649475097, + "train_acc": 0.32708, + "test_loss": 6.290144860839844, + "test_acc": 0.042, + "lyapunov": null, + "grad_norm": 0.7327305496870947, + "grad_max_sv": 0.26595143899321555, + "grad_min_sv": 1.3485531080714708e-08, + "grad_condition": 24838092.070290618, + "lr": 0.0009164606203550494, + "time_sec": 49.668391704559326 + }, + { + "epoch": 29, + "train_loss": 2.6250381271362304, + "train_acc": 0.32904, + "test_loss": 5.969137829589844, + "test_acc": 0.0584, + "lyapunov": null, + "grad_norm": 0.7326068006390382, + "grad_max_sv": 0.27750224173069, + "grad_min_sv": 1.3820259439634164e-08, + "grad_condition": 23369103.19183632, + "lr": 0.0009105746045668516, + "time_sec": 49.66312098503113 + }, + { + "epoch": 30, + "train_loss": 2.5943477003479005, + "train_acc": 0.3349, + "test_loss": 5.8657053939819335, + "test_acc": 0.0662, + "lyapunov": null, + "grad_norm": 0.7282576381570287, + "grad_max_sv": 0.267722587287426, + "grad_min_sv": 1.3611432567173232e-08, + "grad_condition": 33832306.890324585, + "lr": 0.0009045084971874733, + "time_sec": 49.635533809661865 + }, + { + "epoch": 31, + "train_loss": 2.5734296069335936, + "train_acc": 0.3377, + "test_loss": 5.947202941894531, + "test_acc": 0.0536, + "lyapunov": null, + "grad_norm": 0.72371197105418, + "grad_max_sv": 0.2766475807875395, + "grad_min_sv": 1.3626912859915353e-08, + "grad_condition": 57961221.39827029, + "lr": 0.0008982649590120977, + "time_sec": 49.64917349815369 + }, + { + "epoch": 32, + "train_loss": 2.564406160736084, + "train_acc": 0.34312, + "test_loss": 5.720430706787109, + "test_acc": 0.0515, + "lyapunov": null, + "grad_norm": 0.7163915374705971, + "grad_max_sv": 0.25801267102360725, + "grad_min_sv": 1.3336803814101295e-08, + "grad_condition": 26182544.879379902, + "lr": 0.0008918467286629196, + "time_sec": 49.67513680458069 + }, + { + "epoch": 33, + "train_loss": 2.5487507371520994, + "train_acc": 0.3468, + "test_loss": 6.23959475479126, + "test_acc": 0.0534, + "lyapunov": null, + "grad_norm": 0.7054942364907418, + "grad_max_sv": 0.24919774606823922, + "grad_min_sv": 1.306408175666407e-08, + "grad_condition": 26801620.75531055, + "lr": 0.0008852566213878943, + "time_sec": 49.64692521095276 + }, + { + "epoch": 34, + "train_loss": 2.5242181804656982, + "train_acc": 0.34942, + "test_loss": 6.2963892974853515, + "test_acc": 0.0553, + "lyapunov": null, + "grad_norm": 0.7016169815154498, + "grad_max_sv": 0.25484145022928717, + "grad_min_sv": 1.3042181151723397e-08, + "grad_condition": 22430709.73115928, + "lr": 0.000878497527825878, + "time_sec": 49.654839754104614 + }, + { + "epoch": 35, + "train_loss": 2.5094819609832766, + "train_acc": 0.35066, + "test_loss": 6.719456141662597, + "test_acc": 0.0546, + "lyapunov": null, + "grad_norm": 0.6984323559876441, + "grad_max_sv": 0.25291088260710237, + "grad_min_sv": 1.3091225495309722e-08, + "grad_condition": 24055952.13732664, + "lr": 0.000871572412738697, + "time_sec": 49.63660550117493 + }, + { + "epoch": 36, + "train_loss": 2.482266076126099, + "train_acc": 0.35974, + "test_loss": 6.552088442993164, + "test_acc": 0.0652, + "lyapunov": null, + "grad_norm": 0.6961085506168149, + "grad_max_sv": 0.25587535500526426, + "grad_min_sv": 1.3084706912414034e-08, + "grad_condition": 29953242.59302296, + "lr": 0.0008644843137107055, + "time_sec": 49.636728286743164 + }, + { + "epoch": 37, + "train_loss": 2.4597298861694337, + "train_acc": 0.36194, + "test_loss": 7.314365348815918, + "test_acc": 0.0495, + "lyapunov": null, + "grad_norm": 0.6914952761349973, + "grad_max_sv": 0.24747973680496216, + "grad_min_sv": 1.3026676748406629e-08, + "grad_condition": 27342755.995011915, + "lr": 0.0008572363398164014, + "time_sec": 49.638224363327026 + }, + { + "epoch": 38, + "train_loss": 2.4654034370422364, + "train_acc": 0.36094, + "test_loss": 6.702982992553711, + "test_acc": 0.0509, + "lyapunov": null, + "grad_norm": 0.6892432022946228, + "grad_max_sv": 0.2394346885383129, + "grad_min_sv": 1.273180681438113e-08, + "grad_condition": 22022203.054304175, + "lr": 0.0008498316702566826, + "time_sec": 49.639644145965576 + }, + { + "epoch": 39, + "train_loss": 2.42667671333313, + "train_acc": 0.36782, + "test_loss": 6.179627616882324, + "test_acc": 0.0407, + "lyapunov": null, + "grad_norm": 0.6855295822993354, + "grad_max_sv": 0.24026529379189016, + "grad_min_sv": 1.2694210569513809e-08, + "grad_condition": 40057775.67721417, + "lr": 0.0008422735529643442, + "time_sec": 49.63581466674805 + }, + { + "epoch": 40, + "train_loss": 2.4109215718841552, + "train_acc": 0.37052, + "test_loss": 6.805292085266113, + "test_acc": 0.0527, + "lyapunov": null, + "grad_norm": 0.6807278981220505, + "grad_max_sv": 0.23731110394001007, + "grad_min_sv": 1.2639894338140056e-08, + "grad_condition": 27610612.2175704, + "lr": 0.0008345653031794289, + "time_sec": 49.64470100402832 + }, + { + "epoch": 41, + "train_loss": 2.394052338409424, + "train_acc": 0.37456, + "test_loss": 6.000495677947998, + "test_acc": 0.0498, + "lyapunov": null, + "grad_norm": 0.684187370269629, + "grad_max_sv": 0.24500937685370444, + "grad_min_sv": 1.290876201071045e-08, + "grad_condition": 57507496.68239377, + "lr": 0.0008267103019950526, + "time_sec": 49.64144778251648 + }, + { + "epoch": 42, + "train_loss": 2.369488366241455, + "train_acc": 0.37932, + "test_loss": 5.813188542175293, + "test_acc": 0.0442, + "lyapunov": null, + "grad_norm": 0.6660607900191566, + "grad_max_sv": 0.23581123538315296, + "grad_min_sv": 1.243826876218268e-08, + "grad_condition": 43225809.82445784, + "lr": 0.0008187119948743447, + "time_sec": 49.65106153488159 + }, + { + "epoch": 43, + "train_loss": 2.349871713409424, + "train_acc": 0.38354, + "test_loss": 6.650400701904297, + "test_acc": 0.054, + "lyapunov": null, + "grad_norm": 0.6728559080292662, + "grad_max_sv": 0.23216901496052741, + "grad_min_sv": 1.2423243067605228e-08, + "grad_condition": 97229672.46407479, + "lr": 0.000810573890139155, + "time_sec": 49.6483952999115 + }, + { + "epoch": 44, + "train_loss": 2.3327147588348387, + "train_acc": 0.38762, + "test_loss": 7.37770638885498, + "test_acc": 0.0556, + "lyapunov": null, + "grad_norm": 0.6708437479650249, + "grad_max_sv": 0.2353798534721136, + "grad_min_sv": 1.2329054610571433e-08, + "grad_condition": 24315327.09270349, + "lr": 0.0008022995574311873, + "time_sec": 49.649359464645386 + }, + { + "epoch": 45, + "train_loss": 2.3379388195037842, + "train_acc": 0.38554, + "test_loss": 7.32100400390625, + "test_acc": 0.0447, + "lyapunov": null, + "grad_norm": 0.6690933212170967, + "grad_max_sv": 0.23992121778428555, + "grad_min_sv": 1.2581548722301328e-08, + "grad_condition": 23582198.377444454, + "lr": 0.0007938926261462363, + "time_sec": 49.65408158302307 + }, + { + "epoch": 46, + "train_loss": 2.3259339227294924, + "train_acc": 0.3881, + "test_loss": 5.903630683898926, + "test_acc": 0.0532, + "lyapunov": null, + "grad_norm": 0.6696674111669629, + "grad_max_sv": 0.24237493835389615, + "grad_min_sv": 1.264802341723395e-08, + "grad_condition": 189995164.68487653, + "lr": 0.0007853567838422158, + "time_sec": 49.62894296646118 + }, + { + "epoch": 47, + "train_loss": 2.3060372606658937, + "train_acc": 0.39222, + "test_loss": 6.722331466674805, + "test_acc": 0.052, + "lyapunov": null, + "grad_norm": 0.6608950831630619, + "grad_max_sv": 0.2247944913804531, + "grad_min_sv": 1.2062996512373236e-08, + "grad_condition": 1083025267.50655, + "lr": 0.0007766957746216719, + "time_sec": 49.62338829040527 + }, + { + "epoch": 48, + "train_loss": 2.283214527587891, + "train_acc": 0.39554, + "test_loss": 6.30029787979126, + "test_acc": 0.058, + "lyapunov": null, + "grad_norm": 0.6607285996206229, + "grad_max_sv": 0.23341836147010325, + "grad_min_sv": 1.2354938326575304e-08, + "grad_condition": 30471435.85248127, + "lr": 0.0007679133974894982, + "time_sec": 49.62940454483032 + }, + { + "epoch": 49, + "train_loss": 2.2607837000274658, + "train_acc": 0.39988, + "test_loss": 5.6582544311523435, + "test_acc": 0.0597, + "lyapunov": null, + "grad_norm": 0.6558663174998175, + "grad_max_sv": 0.22986114919185638, + "grad_min_sv": 1.2380245191512263e-08, + "grad_condition": 37434404.18782197, + "lr": 0.000759013504686565, + "time_sec": 49.63751459121704 + }, + { + "epoch": 50, + "train_loss": 2.245105714797974, + "train_acc": 0.40408, + "test_loss": 6.382824391937256, + "test_acc": 0.0387, + "lyapunov": null, + "grad_norm": 0.6549241097715082, + "grad_max_sv": 0.2248407918959856, + "grad_min_sv": 1.2180415326357163e-08, + "grad_condition": 21126842.856077008, + "lr": 0.0007499999999999998, + "time_sec": 49.62160301208496 + }, + { + "epoch": 51, + "train_loss": 2.235931240615845, + "train_acc": 0.40734, + "test_loss": 5.594304537963867, + "test_acc": 0.0703, + "lyapunov": null, + "grad_norm": 0.6606674978525966, + "grad_max_sv": 0.23265439458191395, + "grad_min_sv": 1.2417693201483005e-08, + "grad_condition": 38123270.60577395, + "lr": 0.0007408768370508575, + "time_sec": 49.63914489746094 + }, + { + "epoch": 52, + "train_loss": 2.220252141571045, + "train_acc": 0.40908, + "test_loss": 5.49668860168457, + "test_acc": 0.0417, + "lyapunov": null, + "grad_norm": 0.6502905279074903, + "grad_max_sv": 0.23435013145208358, + "grad_min_sv": 1.2266832496304891e-08, + "grad_condition": 38310230.157323316, + "lr": 0.0007316480175599307, + "time_sec": 49.623440980911255 + }, + { + "epoch": 53, + "train_loss": 2.20186401260376, + "train_acc": 0.41488, + "test_loss": 6.196598785400391, + "test_acc": 0.052, + "lyapunov": null, + "grad_norm": 0.6529977877477179, + "grad_max_sv": 0.23160336054861547, + "grad_min_sv": 1.213869888216923e-08, + "grad_condition": 32786030.078148127, + "lr": 0.0007223175895924635, + "time_sec": 49.645137548446655 + }, + { + "epoch": 54, + "train_loss": 2.192180712852478, + "train_acc": 0.41462, + "test_loss": 6.966438492584229, + "test_acc": 0.0515, + "lyapunov": null, + "grad_norm": 0.6546718868496101, + "grad_max_sv": 0.23001223765313625, + "grad_min_sv": 1.2304833968412864e-08, + "grad_condition": 26553928.3741663, + "lr": 0.0007128896457825361, + "time_sec": 49.642454862594604 + }, + { + "epoch": 55, + "train_loss": 2.1692851805114746, + "train_acc": 0.42174, + "test_loss": 6.76854267578125, + "test_acc": 0.0514, + "lyapunov": null, + "grad_norm": 0.6573722021244011, + "grad_max_sv": 0.22808259911835194, + "grad_min_sv": 1.2273855956590473e-08, + "grad_condition": 23253160.925169718, + "lr": 0.0007033683215378998, + "time_sec": 49.62129521369934 + }, + { + "epoch": 56, + "train_loss": 2.1607114459228516, + "train_acc": 0.42392, + "test_loss": 6.366939366912842, + "test_acc": 0.0595, + "lyapunov": null, + "grad_norm": 0.6541197760013122, + "grad_max_sv": 0.2261738982051611, + "grad_min_sv": 1.2211666097772245e-08, + "grad_condition": 40339824.5426622, + "lr": 0.0006937577932260512, + "time_sec": 49.614548444747925 + }, + { + "epoch": 57, + "train_loss": 2.1550695499420165, + "train_acc": 0.42292, + "test_loss": 6.088698851013183, + "test_acc": 0.0407, + "lyapunov": null, + "grad_norm": 0.6495499294349419, + "grad_max_sv": 0.22787895202636718, + "grad_min_sv": 1.2191535223027294e-08, + "grad_condition": 46151755.99995027, + "lr": 0.0006840622763423388, + "time_sec": 49.86520218849182 + }, + { + "epoch": 58, + "train_loss": 2.1309228759002687, + "train_acc": 0.4298, + "test_loss": 6.714969717407227, + "test_acc": 0.0476, + "lyapunov": null, + "grad_norm": 0.6501923826294874, + "grad_max_sv": 0.2294207103550434, + "grad_min_sv": 1.2324306024324993e-08, + "grad_condition": 27012371.00660652, + "lr": 0.0006742860236609073, + "time_sec": 49.61659789085388 + }, + { + "epoch": 59, + "train_loss": 2.1276511294555664, + "train_acc": 0.43052, + "test_loss": 7.850105988311768, + "test_acc": 0.0531, + "lyapunov": null, + "grad_norm": 0.6522053097296127, + "grad_max_sv": 0.23177195861935615, + "grad_min_sv": 1.2570549945412068e-08, + "grad_condition": 21066069.902124517, + "lr": 0.0006644333233692913, + "time_sec": 49.61627125740051 + }, + { + "epoch": 60, + "train_loss": 2.108223154907227, + "train_acc": 0.43206, + "test_loss": 6.194909986877441, + "test_acc": 0.0601, + "lyapunov": null, + "grad_norm": 0.6509457366232547, + "grad_max_sv": 0.2232413150370121, + "grad_min_sv": 1.2092985912648402e-08, + "grad_condition": 20482533.369790833, + "lr": 0.0006545084971874734, + "time_sec": 49.638840198516846 + }, + { + "epoch": 61, + "train_loss": 2.0873364936828613, + "train_acc": 0.43732, + "test_loss": 7.149879702758789, + "test_acc": 0.0579, + "lyapunov": null, + "grad_norm": 0.6448496636259025, + "grad_max_sv": 0.2204914376139641, + "grad_min_sv": 1.2118930678428619e-08, + "grad_condition": 22158498.545212857, + "lr": 0.0006445158984722354, + "time_sec": 49.64352631568909 + }, + { + "epoch": 62, + "train_loss": 2.0711798847961425, + "train_acc": 0.4403, + "test_loss": 6.873784851074219, + "test_acc": 0.0519, + "lyapunov": null, + "grad_norm": 0.650740813617645, + "grad_max_sv": 0.23042820766568184, + "grad_min_sv": 1.2226469767173676e-08, + "grad_condition": 22253714.267564178, + "lr": 0.0006344599103076324, + "time_sec": 49.61197328567505 + }, + { + "epoch": 63, + "train_loss": 2.0670838510131837, + "train_acc": 0.44428, + "test_loss": 8.138898289489745, + "test_acc": 0.0465, + "lyapunov": null, + "grad_norm": 0.6500300321497959, + "grad_max_sv": 0.22807052806019784, + "grad_min_sv": 1.2282747885450362e-08, + "grad_condition": 25613801.10650332, + "lr": 0.0006243449435824269, + "time_sec": 49.64067339897156 + }, + { + "epoch": 64, + "train_loss": 2.0602053503417967, + "train_acc": 0.44336, + "test_loss": 6.739065780639648, + "test_acc": 0.0435, + "lyapunov": null, + "grad_norm": 0.6438167751087027, + "grad_max_sv": 0.21950027868151664, + "grad_min_sv": 1.1978744509505424e-08, + "grad_condition": 69086045.79764383, + "lr": 0.0006141754350553275, + "time_sec": 49.63843250274658 + }, + { + "epoch": 65, + "train_loss": 2.0289339319610598, + "train_acc": 0.4504, + "test_loss": 5.612693282318115, + "test_acc": 0.0624, + "lyapunov": null, + "grad_norm": 0.643091891417901, + "grad_max_sv": 0.2296879008412361, + "grad_min_sv": 1.2095985612095573e-08, + "grad_condition": 207267738.03108597, + "lr": 0.0006039558454088793, + "time_sec": 49.621809244155884 + }, + { + "epoch": 66, + "train_loss": 2.017880793533325, + "train_acc": 0.45524, + "test_loss": 5.917317507934571, + "test_acc": 0.0569, + "lyapunov": null, + "grad_norm": 0.6458313703477052, + "grad_max_sv": 0.2203237745910883, + "grad_min_sv": 1.2053612886975263e-08, + "grad_condition": 30573308.01952803, + "lr": 0.000593690657292862, + "time_sec": 49.62665867805481 + }, + { + "epoch": 67, + "train_loss": 2.00664087310791, + "train_acc": 0.45516, + "test_loss": 5.649988233947754, + "test_acc": 0.0551, + "lyapunov": null, + "grad_norm": 0.6469506065081965, + "grad_max_sv": 0.22469568885862828, + "grad_min_sv": 1.2245062176730048e-08, + "grad_condition": 29605005.92733214, + "lr": 0.0005833843733580507, + "time_sec": 49.66580653190613 + }, + { + "epoch": 68, + "train_loss": 1.9934558868789674, + "train_acc": 0.45752, + "test_loss": 6.518855290222168, + "test_acc": 0.0474, + "lyapunov": null, + "grad_norm": 0.6449120600766396, + "grad_max_sv": 0.22343773469328881, + "grad_min_sv": 1.2075202887595893e-08, + "grad_condition": 20470063.13805929, + "lr": 0.0005730415142812054, + "time_sec": 49.649908781051636 + }, + { + "epoch": 69, + "train_loss": 1.9819465933609008, + "train_acc": 0.4615, + "test_loss": 5.741820652770996, + "test_acc": 0.0576, + "lyapunov": null, + "grad_norm": 0.6444073081455958, + "grad_max_sv": 0.2133765324950218, + "grad_min_sv": 1.1591837454538903e-08, + "grad_condition": 7400690970.849569, + "lr": 0.0005626666167821517, + "time_sec": 49.64708852767944 + }, + { + "epoch": 70, + "train_loss": 1.9717326400756836, + "train_acc": 0.4635, + "test_loss": 6.180095139312744, + "test_acc": 0.0538, + "lyapunov": null, + "grad_norm": 0.646339670655307, + "grad_max_sv": 0.22971010841429235, + "grad_min_sv": 1.1938921282844683e-08, + "grad_condition": 42308986.45036293, + "lr": 0.0005522642316338265, + "time_sec": 49.65745282173157 + }, + { + "epoch": 71, + "train_loss": 1.947042868385315, + "train_acc": 0.46858, + "test_loss": 5.758691899871827, + "test_acc": 0.0481, + "lyapunov": null, + "grad_norm": 0.6454285691467331, + "grad_max_sv": 0.21988087929785252, + "grad_min_sv": 1.2038080984128063e-08, + "grad_condition": 54275907.24262571, + "lr": 0.0005418389216661573, + "time_sec": 49.655876874923706 + }, + { + "epoch": 72, + "train_loss": 1.9380216747283936, + "train_acc": 0.47278, + "test_loss": 5.360606885528564, + "test_acc": 0.0499, + "lyapunov": null, + "grad_norm": 0.6445951712238421, + "grad_max_sv": 0.22141558788716792, + "grad_min_sv": 1.2052524836839163e-08, + "grad_condition": 52658770.62947424, + "lr": 0.0005313952597646563, + "time_sec": 49.643407106399536 + }, + { + "epoch": 73, + "train_loss": 1.9315852340698243, + "train_acc": 0.47042, + "test_loss": 5.562986553955078, + "test_acc": 0.0528, + "lyapunov": null, + "grad_norm": 0.6455449182300289, + "grad_max_sv": 0.22759805843234063, + "grad_min_sv": 1.2166670372570909e-08, + "grad_condition": 25263034.87545003, + "lr": 0.0005209378268645994, + "time_sec": 49.65730333328247 + }, + { + "epoch": 74, + "train_loss": 1.9174984769439698, + "train_acc": 0.47274, + "test_loss": 5.779887171173096, + "test_acc": 0.0526, + "lyapunov": null, + "grad_norm": 0.6408982744466406, + "grad_max_sv": 0.223176771402359, + "grad_min_sv": 1.1881650463507754e-08, + "grad_condition": 21609418.938555025, + "lr": 0.0005104712099416781, + "time_sec": 49.63982319831848 + }, + { + "epoch": 75, + "train_loss": 1.9022090718841553, + "train_acc": 0.47956, + "test_loss": 6.74227056427002, + "test_acc": 0.0396, + "lyapunov": null, + "grad_norm": 0.6439391169821848, + "grad_max_sv": 0.22340110316872597, + "grad_min_sv": 1.1930816612437667e-08, + "grad_condition": 22835938.88370643, + "lr": 0.0004999999999999996, + "time_sec": 49.6373016834259 + }, + { + "epoch": 76, + "train_loss": 1.8833642294311523, + "train_acc": 0.48212, + "test_loss": 6.253941902160644, + "test_acc": 0.0401, + "lyapunov": null, + "grad_norm": 0.6458465784916259, + "grad_max_sv": 0.2219920836389065, + "grad_min_sv": 1.1862058124645358e-08, + "grad_condition": 24923864.351812743, + "lr": 0.0004895287900583212, + "time_sec": 49.63244032859802 + }, + { + "epoch": 77, + "train_loss": 1.872097596054077, + "train_acc": 0.4862, + "test_loss": 7.115831829833985, + "test_acc": 0.0455, + "lyapunov": null, + "grad_norm": 0.6389496343286681, + "grad_max_sv": 0.2166093897074461, + "grad_min_sv": 1.1753041695428124e-08, + "grad_condition": 123847363.5090142, + "lr": 0.0004790621731353997, + "time_sec": 49.65565347671509 + }, + { + "epoch": 78, + "train_loss": 1.8647768477630615, + "train_acc": 0.48824, + "test_loss": 6.585789360046387, + "test_acc": 0.0461, + "lyapunov": null, + "grad_norm": 0.6430712356182874, + "grad_max_sv": 0.2195899412035942, + "grad_min_sv": 1.2243656302224696e-08, + "grad_condition": 424951771.80469763, + "lr": 0.000468604740235343, + "time_sec": 49.62981295585632 + }, + { + "epoch": 79, + "train_loss": 1.8419312603759765, + "train_acc": 0.49144, + "test_loss": 6.8796092208862305, + "test_acc": 0.0534, + "lyapunov": null, + "grad_norm": 0.6438732522551095, + "grad_max_sv": 0.223552468046546, + "grad_min_sv": 1.2100811991712716e-08, + "grad_condition": 310767823.54431427, + "lr": 0.00045816107833384175, + "time_sec": 49.63279318809509 + }, + { + "epoch": 80, + "train_loss": 1.8222150116348266, + "train_acc": 0.49938, + "test_loss": 6.9083010223388674, + "test_acc": 0.0574, + "lyapunov": null, + "grad_norm": 0.646876723364354, + "grad_max_sv": 0.22485989183187485, + "grad_min_sv": 1.2241183645900212e-08, + "grad_condition": 28086849.755860113, + "lr": 0.0004477357683661729, + "time_sec": 49.6425895690918 + }, + { + "epoch": 81, + "train_loss": 1.813687347946167, + "train_acc": 0.49976, + "test_loss": 6.90407081451416, + "test_acc": 0.04, + "lyapunov": null, + "grad_norm": 0.642733217341124, + "grad_max_sv": 0.22463089227676392, + "grad_min_sv": 1.2082413675118531e-08, + "grad_condition": 22301589.48218178, + "lr": 0.00043733338321784746, + "time_sec": 49.629480838775635 + }, + { + "epoch": 82, + "train_loss": 1.7951585668945313, + "train_acc": 0.5034, + "test_loss": 7.836273937988281, + "test_acc": 0.0512, + "lyapunov": null, + "grad_norm": 0.6454340294520209, + "grad_max_sv": 0.22539752162992954, + "grad_min_sv": 1.1886250314216417e-08, + "grad_condition": 59544024.862964645, + "lr": 0.0004269584857187939, + "time_sec": 49.61994457244873 + }, + { + "epoch": 83, + "train_loss": 1.7966358541488647, + "train_acc": 0.50272, + "test_loss": 7.222357276916504, + "test_acc": 0.0579, + "lyapunov": null, + "grad_norm": 0.6453223951998842, + "grad_max_sv": 0.22831037007272242, + "grad_min_sv": 1.203974950118869e-08, + "grad_condition": 82894748.52704917, + "lr": 0.0004166156266419484, + "time_sec": 49.673835039138794 + }, + { + "epoch": 84, + "train_loss": 1.7854290616226196, + "train_acc": 0.50408, + "test_loss": 6.414771678161621, + "test_acc": 0.0601, + "lyapunov": null, + "grad_norm": 0.6427673490554981, + "grad_max_sv": 0.2182640478014946, + "grad_min_sv": 1.202259434229802e-08, + "grad_condition": 21861556.418338913, + "lr": 0.0004063093427071373, + "time_sec": 49.64637732505798 + }, + { + "epoch": 85, + "train_loss": 1.7772653774261475, + "train_acc": 0.5111, + "test_loss": 7.505108009338379, + "test_acc": 0.0616, + "lyapunov": null, + "grad_norm": 0.6410246970315546, + "grad_max_sv": 0.2277263168245554, + "grad_min_sv": 1.1847804396586393e-08, + "grad_condition": 36055137.59124441, + "lr": 0.0003960441545911199, + "time_sec": 49.642088174819946 + }, + { + "epoch": 86, + "train_loss": 1.7477331000518799, + "train_acc": 0.5147, + "test_loss": 7.709722770690918, + "test_acc": 0.0449, + "lyapunov": null, + "grad_norm": 0.6439998427728569, + "grad_max_sv": 0.22573819942772388, + "grad_min_sv": 1.2154757376287017e-08, + "grad_condition": 47618357.203088775, + "lr": 0.0003858245649446718, + "time_sec": 49.63089942932129 + }, + { + "epoch": 87, + "train_loss": 1.7338512952423095, + "train_acc": 0.51864, + "test_loss": 7.293183726501465, + "test_acc": 0.0531, + "lyapunov": null, + "grad_norm": 0.6450352139357391, + "grad_max_sv": 0.2251686044037342, + "grad_min_sv": 1.2090907994255495e-08, + "grad_condition": 23129638.107943743, + "lr": 0.00037565505641757235, + "time_sec": 49.62959694862366 + }, + { + "epoch": 88, + "train_loss": 1.7305470868301391, + "train_acc": 0.51752, + "test_loss": 6.886636978912353, + "test_acc": 0.0621, + "lyapunov": null, + "grad_norm": 0.6466229739487265, + "grad_max_sv": 0.2285929098725319, + "grad_min_sv": 1.2207108990238031e-08, + "grad_condition": 639961294.3776948, + "lr": 0.00036554008969236695, + "time_sec": 49.64359998703003 + }, + { + "epoch": 89, + "train_loss": 1.7247330599212647, + "train_acc": 0.52118, + "test_loss": 7.737054846954345, + "test_acc": 0.0492, + "lyapunov": null, + "grad_norm": 0.6431070021674609, + "grad_max_sv": 0.21853713542222977, + "grad_min_sv": 1.1871128499651996e-08, + "grad_condition": 34316573.10990389, + "lr": 0.0003554841015277638, + "time_sec": 49.6319477558136 + }, + { + "epoch": 90, + "train_loss": 1.704887728881836, + "train_acc": 0.52374, + "test_loss": 6.713198412322998, + "test_acc": 0.0556, + "lyapunov": null, + "grad_norm": 0.6451375385492529, + "grad_max_sv": 0.22224950045347214, + "grad_min_sv": 1.2021271361684072e-08, + "grad_condition": 25574543.625141606, + "lr": 0.000345491502812526, + "time_sec": 49.63963174819946 + }, + { + "epoch": 91, + "train_loss": 1.701412860145569, + "train_acc": 0.52644, + "test_loss": 7.295478704833984, + "test_acc": 0.0429, + "lyapunov": null, + "grad_norm": 0.6447266155116032, + "grad_max_sv": 0.23335366621613501, + "grad_min_sv": 1.257304017843186e-08, + "grad_condition": 24036732.36328527, + "lr": 0.0003355666766307081, + "time_sec": 49.665791511535645 + }, + { + "epoch": 92, + "train_loss": 1.6871472067642213, + "train_acc": 0.53048, + "test_loss": 7.389536867523193, + "test_acc": 0.0375, + "lyapunov": null, + "grad_norm": 0.6468836541708367, + "grad_max_sv": 0.2225259728729725, + "grad_min_sv": 1.1890293904331939e-08, + "grad_condition": 29650216.370129876, + "lr": 0.00032571397633909225, + "time_sec": 49.64622926712036 + }, + { + "epoch": 93, + "train_loss": 1.6749127053833008, + "train_acc": 0.53202, + "test_loss": 8.144829412078858, + "test_acc": 0.0401, + "lyapunov": null, + "grad_norm": 0.6416574148081634, + "grad_max_sv": 0.22841569185256957, + "grad_min_sv": 1.2051048693673128e-08, + "grad_condition": 29017060.070413183, + "lr": 0.00031593772365766094, + "time_sec": 49.649181604385376 + }, + { + "epoch": 94, + "train_loss": 1.6659465893936156, + "train_acc": 0.53198, + "test_loss": 7.906325871276856, + "test_acc": 0.0523, + "lyapunov": null, + "grad_norm": 0.6442484947336338, + "grad_max_sv": 0.22283854335546494, + "grad_min_sv": 1.1940718097624981e-08, + "grad_condition": 23900914.940908086, + "lr": 0.0003062422067739483, + "time_sec": 49.64401292800903 + }, + { + "epoch": 95, + "train_loss": 1.6399671975326537, + "train_acc": 0.53952, + "test_loss": 7.157633497619629, + "test_acc": 0.0527, + "lyapunov": null, + "grad_norm": 0.6406645370679923, + "grad_max_sv": 0.22293368987739087, + "grad_min_sv": 1.2085724485771942e-08, + "grad_condition": 56163384.20133088, + "lr": 0.00029663167846209965, + "time_sec": 49.6225950717926 + }, + { + "epoch": 96, + "train_loss": 1.6436440280532838, + "train_acc": 0.5397, + "test_loss": 8.535991598510742, + "test_acc": 0.0515, + "lyapunov": null, + "grad_norm": 0.6492588500387332, + "grad_max_sv": 0.22496760375797747, + "grad_min_sv": 1.180983480297132e-08, + "grad_condition": 106906297.43684229, + "lr": 0.00028711035421746345, + "time_sec": 49.64288353919983 + }, + { + "epoch": 97, + "train_loss": 1.6246039770889282, + "train_acc": 0.54446, + "test_loss": 8.059152350616456, + "test_acc": 0.0505, + "lyapunov": null, + "grad_norm": 0.6473823340688163, + "grad_max_sv": 0.23146028257906437, + "grad_min_sv": 1.2134549565862019e-08, + "grad_condition": 35822540.74264745, + "lr": 0.00027768241040753615, + "time_sec": 49.6298463344574 + }, + { + "epoch": 98, + "train_loss": 1.61877662109375, + "train_acc": 0.54736, + "test_loss": 8.167729595947266, + "test_acc": 0.038, + "lyapunov": null, + "grad_norm": 0.6455041816035443, + "grad_max_sv": 0.22865931317210197, + "grad_min_sv": 1.1919900413936979e-08, + "grad_condition": 28498587.531759303, + "lr": 0.00026835198244006903, + "time_sec": 49.63332438468933 + }, + { + "epoch": 99, + "train_loss": 3.068192625274658, + "train_acc": 0.31474, + "test_loss": 5.048260988616943, + "test_acc": 0.1146, + "lyapunov": null, + "grad_norm": 0.8608040247164788, + "grad_max_sv": 0.3330514427274466, + "grad_min_sv": 1.6094786775555646e-08, + "grad_condition": 28526093.82209841, + "lr": 0.0002591231629491421, + "time_sec": 49.662447690963745 + }, + { + "epoch": 100, + "train_loss": 2.316078476104736, + "train_acc": 0.39026, + "test_loss": 5.392445658874512, + "test_acc": 0.0879, + "lyapunov": null, + "grad_norm": 0.658192665007455, + "grad_max_sv": 0.22761380225419997, + "grad_min_sv": 1.2582580913994557e-08, + "grad_condition": 55399675.47104869, + "lr": 0.0002499999999999997, + "time_sec": 49.64076352119446 + }, + { + "epoch": 101, + "train_loss": 2.1483063832855223, + "train_acc": 0.42276, + "test_loss": 5.986578815460205, + "test_acc": 0.0707, + "lyapunov": null, + "grad_norm": 0.6484922643705857, + "grad_max_sv": 0.22837907671928406, + "grad_min_sv": 1.2391293061075892e-08, + "grad_condition": 23094080.352399424, + "lr": 0.00024098649531343477, + "time_sec": 49.6578733921051 + }, + { + "epoch": 102, + "train_loss": 2.05953384185791, + "train_acc": 0.4427, + "test_loss": 6.080546961212158, + "test_acc": 0.0573, + "lyapunov": null, + "grad_norm": 0.6484188898656511, + "grad_max_sv": 0.22914629317820073, + "grad_min_sv": 1.2451091090104338e-08, + "grad_condition": 62209882.03375574, + "lr": 0.0002320866025105016, + "time_sec": 49.63767695426941 + }, + { + "epoch": 103, + "train_loss": 2.004299710121155, + "train_acc": 0.45614, + "test_loss": 5.895175799560547, + "test_acc": 0.0578, + "lyapunov": null, + "grad_norm": 0.6399422615270736, + "grad_max_sv": 0.23107412382960318, + "grad_min_sv": 1.2409910121746748e-08, + "grad_condition": 22284137.40025208, + "lr": 0.0002233042253783278, + "time_sec": 49.65248942375183 + }, + { + "epoch": 104, + "train_loss": 1.9571235482788085, + "train_acc": 0.46526, + "test_loss": 5.738465850830078, + "test_acc": 0.0523, + "lyapunov": null, + "grad_norm": 0.6391319009023594, + "grad_max_sv": 0.2172716658562422, + "grad_min_sv": 1.1984206682580378e-08, + "grad_condition": 20112915.921763636, + "lr": 0.000214643216157784, + "time_sec": 49.633373975753784 + }, + { + "epoch": 105, + "train_loss": 1.9224023293304444, + "train_acc": 0.47322, + "test_loss": 6.117083155059815, + "test_acc": 0.05, + "lyapunov": null, + "grad_norm": 0.6402482339469217, + "grad_max_sv": 0.21523526906967164, + "grad_min_sv": 1.1972073542948491e-08, + "grad_condition": 36228791.07592559, + "lr": 0.00020610737385376332, + "time_sec": 49.63998031616211 + }, + { + "epoch": 106, + "train_loss": 1.8866684201812745, + "train_acc": 0.4833, + "test_loss": 5.936769345855713, + "test_acc": 0.0439, + "lyapunov": null, + "grad_norm": 0.6419042012012792, + "grad_max_sv": 0.22602429389953613, + "grad_min_sv": 1.2054361504115762e-08, + "grad_condition": 48343281.63861313, + "lr": 0.00019770044256881242, + "time_sec": 49.65153455734253 + }, + { + "epoch": 107, + "train_loss": 1.8594331677246094, + "train_acc": 0.48626, + "test_loss": 6.035185343170166, + "test_acc": 0.046, + "lyapunov": null, + "grad_norm": 0.6436629646723144, + "grad_max_sv": 0.21455634236335755, + "grad_min_sv": 1.1783472720489074e-08, + "grad_condition": 38784276.09698713, + "lr": 0.0001894261098608447, + "time_sec": 49.66721272468567 + }, + { + "epoch": 108, + "train_loss": 1.8262966638946534, + "train_acc": 0.49558, + "test_loss": 6.42567989654541, + "test_acc": 0.0425, + "lyapunov": null, + "grad_norm": 0.6468304513936767, + "grad_max_sv": 0.22701141163706778, + "grad_min_sv": 1.216740327554533e-08, + "grad_condition": 72116525.85188936, + "lr": 0.000181288005125655, + "time_sec": 49.65104866027832 + }, + { + "epoch": 109, + "train_loss": 1.8205863860321045, + "train_acc": 0.49754, + "test_loss": 5.783528507995605, + "test_acc": 0.0367, + "lyapunov": null, + "grad_norm": 0.643976690980956, + "grad_max_sv": 0.21868419870734215, + "grad_min_sv": 1.2079363115313768e-08, + "grad_condition": 20195547.998739578, + "lr": 0.0001732896980049473, + "time_sec": 49.66611671447754 + }, + { + "epoch": 110, + "train_loss": 1.793330860900879, + "train_acc": 0.5022, + "test_loss": 6.1977317413330075, + "test_acc": 0.0425, + "lyapunov": null, + "grad_norm": 0.6468160086891667, + "grad_max_sv": 0.2236340381205082, + "grad_min_sv": 1.1926133475226308e-08, + "grad_condition": 32237535.591110267, + "lr": 0.00016543469682057076, + "time_sec": 49.63362669944763 + }, + { + "epoch": 111, + "train_loss": 1.7825101839828492, + "train_acc": 0.5064, + "test_loss": 6.178716979980469, + "test_acc": 0.0443, + "lyapunov": null, + "grad_norm": 0.6424263059147781, + "grad_max_sv": 0.22070568352937697, + "grad_min_sv": 1.1919835535972866e-08, + "grad_condition": 37842182.06602182, + "lr": 0.00015772644703565552, + "time_sec": 49.65402150154114 + }, + { + "epoch": 112, + "train_loss": 1.7541921194458008, + "train_acc": 0.5103, + "test_loss": 6.0973250106811525, + "test_acc": 0.0475, + "lyapunov": null, + "grad_norm": 0.6481497742539534, + "grad_max_sv": 0.22489695958793163, + "grad_min_sv": 1.2136619546854188e-08, + "grad_condition": 29561688.482165914, + "lr": 0.00015016832974331713, + "time_sec": 49.65926122665405 + }, + { + "epoch": 113, + "train_loss": 1.7488899993515015, + "train_acc": 0.51458, + "test_loss": 5.979724680328369, + "test_acc": 0.0424, + "lyapunov": null, + "grad_norm": 0.6406667137370472, + "grad_max_sv": 0.22864535339176656, + "grad_min_sv": 1.191089982824356e-08, + "grad_condition": 56508420.06490357, + "lr": 0.00014276366018359834, + "time_sec": 49.62884473800659 + }, + { + "epoch": 114, + "train_loss": 1.7389903827667237, + "train_acc": 0.51522, + "test_loss": 5.958202845001221, + "test_acc": 0.0517, + "lyapunov": null, + "grad_norm": 0.6426356824149351, + "grad_max_sv": 0.22491934411227704, + "grad_min_sv": 1.2247705622608906e-08, + "grad_condition": 58131203.41244085, + "lr": 0.00013551568628929425, + "time_sec": 49.62388038635254 + }, + { + "epoch": 115, + "train_loss": 1.7231919304656982, + "train_acc": 0.52138, + "test_loss": 6.056362869262696, + "test_acc": 0.0478, + "lyapunov": null, + "grad_norm": 0.6495040089755264, + "grad_max_sv": 0.22354965060949325, + "grad_min_sv": 1.2017865864966116e-08, + "grad_condition": 28069335.9052594, + "lr": 0.00012842758726130276, + "time_sec": 49.6635365486145 + }, + { + "epoch": 116, + "train_loss": 1.6999663226699828, + "train_acc": 0.52556, + "test_loss": 6.322325106811523, + "test_acc": 0.0459, + "lyapunov": null, + "grad_norm": 0.6439980745634726, + "grad_max_sv": 0.22484406568109988, + "grad_min_sv": 1.2245539982025377e-08, + "grad_condition": 27693634.55346756, + "lr": 0.0001215024721741218, + "time_sec": 49.667264223098755 + }, + { + "epoch": 117, + "train_loss": 1.6914007580566406, + "train_acc": 0.52596, + "test_loss": 6.2398702270507815, + "test_acc": 0.0358, + "lyapunov": null, + "grad_norm": 0.6406992341206976, + "grad_max_sv": 0.22702743746340276, + "grad_min_sv": 1.2027920018309323e-08, + "grad_condition": 25480937.943885125, + "lr": 0.00011474337861210538, + "time_sec": 49.75715970993042 + }, + { + "epoch": 118, + "train_loss": 1.682532057723999, + "train_acc": 0.5269, + "test_loss": 6.022721984863281, + "test_acc": 0.0502, + "lyapunov": null, + "grad_norm": 0.6475614121887046, + "grad_max_sv": 0.22498515360057353, + "grad_min_sv": 1.2050166899382763e-08, + "grad_condition": 76251711.1097268, + "lr": 0.00010815327133708009, + "time_sec": 49.63880777359009 + }, + { + "epoch": 119, + "train_loss": 1.6772437452697755, + "train_acc": 0.53014, + "test_loss": 5.847724533081054, + "test_acc": 0.0456, + "lyapunov": null, + "grad_norm": 0.645505943920055, + "grad_max_sv": 0.22384067326784135, + "grad_min_sv": 1.1783700598622104e-08, + "grad_condition": 22583004.98493171, + "lr": 0.00010173504098790182, + "time_sec": 49.63686180114746 + }, + { + "epoch": 120, + "train_loss": 1.6719491082763671, + "train_acc": 0.53248, + "test_loss": 5.856200427246094, + "test_acc": 0.0427, + "lyapunov": null, + "grad_norm": 0.6466969899308954, + "grad_max_sv": 0.2293648473918438, + "grad_min_sv": 1.2215246461555474e-08, + "grad_condition": 26750165.211627714, + "lr": 9.549150281252629e-05, + "time_sec": 49.633697748184204 + }, + { + "epoch": 121, + "train_loss": 1.6578344228744506, + "train_acc": 0.53442, + "test_loss": 5.862105746459961, + "test_acc": 0.0534, + "lyapunov": null, + "grad_norm": 0.6460809469464214, + "grad_max_sv": 0.2225838266313076, + "grad_min_sv": 1.212055693311509e-08, + "grad_condition": 24676272.501794428, + "lr": 8.942539543314794e-05, + "time_sec": 49.647422790527344 + }, + { + "epoch": 122, + "train_loss": 1.6389700134658813, + "train_acc": 0.54052, + "test_loss": 5.913293504333496, + "test_acc": 0.0439, + "lyapunov": null, + "grad_norm": 0.6468970710870378, + "grad_max_sv": 0.22489394322037698, + "grad_min_sv": 1.1876642090624667e-08, + "grad_condition": 27879869.134462822, + "lr": 8.353937964495024e-05, + "time_sec": 49.6471688747406 + }, + { + "epoch": 123, + "train_loss": 1.6408760947418213, + "train_acc": 0.539, + "test_loss": 5.881608892822266, + "test_acc": 0.0455, + "lyapunov": null, + "grad_norm": 0.6409502867501498, + "grad_max_sv": 0.2229029569774866, + "grad_min_sv": 1.1994366785894606e-08, + "grad_condition": 23946080.329339217, + "lr": 7.783603724899243e-05, + "time_sec": 49.645761013031006 + }, + { + "epoch": 124, + "train_loss": 1.6327575244140624, + "train_acc": 0.54088, + "test_loss": 6.092592315673828, + "test_acc": 0.0442, + "lyapunov": null, + "grad_norm": 0.6388358623443664, + "grad_max_sv": 0.22407596856355666, + "grad_min_sv": 1.1999070549661983e-08, + "grad_condition": 29088864.422511287, + "lr": 7.231786991974666e-05, + "time_sec": 49.63370180130005 + }, + { + "epoch": 125, + "train_loss": 1.626538638381958, + "train_acc": 0.54214, + "test_loss": 6.060646697998047, + "test_acc": 0.0498, + "lyapunov": null, + "grad_norm": 0.649112571277706, + "grad_max_sv": 0.22536444179713727, + "grad_min_sv": 1.2212023835916908e-08, + "grad_condition": 35126636.74446645, + "lr": 6.698729810778072e-05, + "time_sec": 49.61126947402954 + }, + { + "epoch": 126, + "train_loss": 1.6151732135009766, + "train_acc": 0.54378, + "test_loss": 6.19133405456543, + "test_acc": 0.0452, + "lyapunov": null, + "grad_norm": 0.645551187410472, + "grad_max_sv": 0.227165062725544, + "grad_min_sv": 1.194181808161776e-08, + "grad_condition": 24734104.665951073, + "lr": 6.184665997806817e-05, + "time_sec": 49.74283456802368 + }, + { + "epoch": 127, + "train_loss": 1.6116835289764404, + "train_acc": 0.54702, + "test_loss": 6.264876268768311, + "test_acc": 0.0576, + "lyapunov": null, + "grad_norm": 0.6449882086043084, + "grad_max_sv": 0.2281236581504345, + "grad_min_sv": 1.2174795581409992e-08, + "grad_condition": 33327591.078247894, + "lr": 5.6898210384392595e-05, + "time_sec": 49.66547632217407 + }, + { + "epoch": 128, + "train_loss": 1.6025007713317871, + "train_acc": 0.55014, + "test_loss": 6.29011365814209, + "test_acc": 0.0469, + "lyapunov": null, + "grad_norm": 0.6498584112316286, + "grad_max_sv": 0.22942896112799643, + "grad_min_sv": 1.2217025608090431e-08, + "grad_condition": 181633490.37894756, + "lr": 5.214411988029363e-05, + "time_sec": 49.644524574279785 + }, + { + "epoch": 129, + "train_loss": 1.6006367045974732, + "train_acc": 0.55154, + "test_loss": 5.960230406188965, + "test_acc": 0.0484, + "lyapunov": null, + "grad_norm": 0.6474761633146622, + "grad_max_sv": 0.22425766214728354, + "grad_min_sv": 1.2069871824227363e-08, + "grad_condition": 25614798.36847374, + "lr": 4.7586473766990294e-05, + "time_sec": 49.63229012489319 + }, + { + "epoch": 130, + "train_loss": 1.5994749016952514, + "train_acc": 0.54798, + "test_loss": 6.082809280395508, + "test_acc": 0.0462, + "lyapunov": null, + "grad_norm": 0.6436297587317452, + "grad_max_sv": 0.2260743647813797, + "grad_min_sv": 1.197359623186789e-08, + "grad_condition": 47224918.84575805, + "lr": 4.32272711786996e-05, + "time_sec": 49.653711795806885 + }, + { + "epoch": 131, + "train_loss": 1.5907676587677002, + "train_acc": 0.55338, + "test_loss": 6.253540195465088, + "test_acc": 0.0493, + "lyapunov": null, + "grad_norm": 0.6404122118978958, + "grad_max_sv": 0.2243455123156309, + "grad_min_sv": 1.1890854798024541e-08, + "grad_condition": 28094398.171041556, + "lr": 3.906842420574966e-05, + "time_sec": 49.65587568283081 + }, + { + "epoch": 132, + "train_loss": 1.591219468383789, + "train_acc": 0.55168, + "test_loss": 6.408939161682129, + "test_acc": 0.0426, + "lyapunov": null, + "grad_norm": 0.6506622903315123, + "grad_max_sv": 0.23343092501163482, + "grad_min_sv": 1.2356089287846039e-08, + "grad_condition": 31524710.75405284, + "lr": 3.5111757055874305e-05, + "time_sec": 49.64363932609558 + }, + { + "epoch": 133, + "train_loss": 1.5818653707885741, + "train_acc": 0.55544, + "test_loss": 6.288112886047363, + "test_acc": 0.0416, + "lyapunov": null, + "grad_norm": 0.641538436455134, + "grad_max_sv": 0.22353356778621675, + "grad_min_sv": 1.1930217144046074e-08, + "grad_condition": 35984070.824167676, + "lr": 3.1359005254054254e-05, + "time_sec": 49.6272132396698 + }, + { + "epoch": 134, + "train_loss": 1.5757408687973022, + "train_acc": 0.5551, + "test_loss": 6.169788475036621, + "test_acc": 0.0436, + "lyapunov": null, + "grad_norm": 0.6422263506494424, + "grad_max_sv": 0.22716106660664082, + "grad_min_sv": 1.1833126612598166e-08, + "grad_condition": 52859395.957509615, + "lr": 2.7811814881259484e-05, + "time_sec": 49.634817600250244 + }, + { + "epoch": 135, + "train_loss": 1.573296899986267, + "train_acc": 0.5586, + "test_loss": 6.409516627502441, + "test_acc": 0.0398, + "lyapunov": null, + "grad_norm": 0.6422323193959601, + "grad_max_sv": 0.21986942775547505, + "grad_min_sv": 1.1918038018803035e-08, + "grad_condition": 135103466.34543505, + "lr": 2.4471741852423218e-05, + "time_sec": 49.644601583480835 + }, + { + "epoch": 136, + "train_loss": 1.5735322719573974, + "train_acc": 0.55498, + "test_loss": 6.962667681884765, + "test_acc": 0.0438, + "lyapunov": null, + "grad_norm": 0.6425705125331251, + "grad_max_sv": 0.22957376427948475, + "grad_min_sv": 1.2022417819265719e-08, + "grad_condition": 84953424.74808493, + "lr": 2.1340251233966362e-05, + "time_sec": 49.65340971946716 + }, + { + "epoch": 137, + "train_loss": 1.5703629438018798, + "train_acc": 0.55592, + "test_loss": 6.347426979064942, + "test_acc": 0.0416, + "lyapunov": null, + "grad_norm": 0.6470089432203813, + "grad_max_sv": 0.22675703540444375, + "grad_min_sv": 1.1964806787001515e-08, + "grad_condition": 42242032.09383811, + "lr": 1.8418716601170932e-05, + "time_sec": 49.65664100646973 + }, + { + "epoch": 138, + "train_loss": 1.5664401405334472, + "train_acc": 0.55756, + "test_loss": 6.496471109771728, + "test_acc": 0.0445, + "lyapunov": null, + "grad_norm": 0.6430396727274027, + "grad_max_sv": 0.22493685856461526, + "grad_min_sv": 1.2061497275950295e-08, + "grad_condition": 23954534.1998593, + "lr": 1.570841943568445e-05, + "time_sec": 49.642067432403564 + }, + { + "epoch": 139, + "train_loss": 1.5627032785415649, + "train_acc": 0.5605, + "test_loss": 6.283855271148681, + "test_acc": 0.0447, + "lyapunov": null, + "grad_norm": 0.6409841113210015, + "grad_max_sv": 0.2232666589319706, + "grad_min_sv": 1.1962911396386222e-08, + "grad_condition": 259592659.58503166, + "lr": 1.3210548563419845e-05, + "time_sec": 49.632962465286255 + }, + { + "epoch": 140, + "train_loss": 1.5663015616226197, + "train_acc": 0.55768, + "test_loss": 6.220936709594727, + "test_acc": 0.0479, + "lyapunov": null, + "grad_norm": 0.6429008373506699, + "grad_max_sv": 0.22778371684253215, + "grad_min_sv": 1.2041603553170077e-08, + "grad_condition": 67987905.64758533, + "lr": 1.0926199633097203e-05, + "time_sec": 49.615734338760376 + }, + { + "epoch": 141, + "train_loss": 1.5625858126068115, + "train_acc": 0.56096, + "test_loss": 6.526646176147461, + "test_acc": 0.0493, + "lyapunov": null, + "grad_norm": 0.6377897998533895, + "grad_max_sv": 0.2237264908850193, + "grad_min_sv": 1.2073943828072586e-08, + "grad_condition": 21432345.22954327, + "lr": 8.856374635655688e-06, + "time_sec": 49.64499115943909 + }, + { + "epoch": 142, + "train_loss": 1.551087869529724, + "train_acc": 0.56178, + "test_loss": 6.401860023498535, + "test_acc": 0.0441, + "lyapunov": null, + "grad_norm": 0.6415643857015031, + "grad_max_sv": 0.2261370625346899, + "grad_min_sv": 1.2029182526809845e-08, + "grad_condition": 66314375.58164777, + "lr": 7.001981464747503e-06, + "time_sec": 49.65327548980713 + }, + { + "epoch": 143, + "train_loss": 1.5571945658111572, + "train_acc": 0.55928, + "test_loss": 6.133491006469726, + "test_acc": 0.0486, + "lyapunov": null, + "grad_norm": 0.6447257277887289, + "grad_max_sv": 0.22846047319471835, + "grad_min_sv": 1.2135202965418701e-08, + "grad_condition": 37586048.51019514, + "lr": 5.3638335185058295e-06, + "time_sec": 49.65649223327637 + }, + { + "epoch": 144, + "train_loss": 1.5559558386611938, + "train_acc": 0.5614, + "test_loss": 6.064924475097656, + "test_acc": 0.052, + "lyapunov": null, + "grad_norm": 0.6401487690577669, + "grad_max_sv": 0.2242697723209858, + "grad_min_sv": 1.1992281666317605e-08, + "grad_condition": 25437338.27988875, + "lr": 3.942649342761114e-06, + "time_sec": 49.635279178619385 + }, + { + "epoch": 145, + "train_loss": 1.553707954940796, + "train_acc": 0.56286, + "test_loss": 6.5988156112670895, + "test_acc": 0.0458, + "lyapunov": null, + "grad_norm": 0.6407793832198755, + "grad_max_sv": 0.23003120347857475, + "grad_min_sv": 1.1913595625301366e-08, + "grad_condition": 32004871.034651928, + "lr": 2.7390523158633524e-06, + "time_sec": 49.659799575805664 + }, + { + "epoch": 146, + "train_loss": 1.556730777015686, + "train_acc": 0.56224, + "test_loss": 6.555442190551758, + "test_acc": 0.0442, + "lyapunov": null, + "grad_norm": 0.6414928448640214, + "grad_max_sv": 0.22317990958690642, + "grad_min_sv": 1.2069366867430501e-08, + "grad_condition": 382827154.51718956, + "lr": 1.7535703752478133e-06, + "time_sec": 49.64200186729431 + }, + { + "epoch": 147, + "train_loss": 1.5659333599090577, + "train_acc": 0.55716, + "test_loss": 6.271022132873535, + "test_acc": 0.0492, + "lyapunov": null, + "grad_norm": 0.6449744450875666, + "grad_max_sv": 0.22341229021549225, + "grad_min_sv": 1.2069372681833279e-08, + "grad_condition": 29803939.928126138, + "lr": 9.866357858642196e-07, + "time_sec": 49.677895069122314 + }, + { + "epoch": 148, + "train_loss": 1.55233530418396, + "train_acc": 0.5624, + "test_loss": 6.24937745513916, + "test_acc": 0.0474, + "lyapunov": null, + "grad_norm": 0.643448067037432, + "grad_max_sv": 0.22757547162473202, + "grad_min_sv": 1.2111119601643239e-08, + "grad_condition": 33967427.03926191, + "lr": 4.38584950570808e-07, + "time_sec": 49.623542070388794 + }, + { + "epoch": 149, + "train_loss": 1.5480224239730835, + "train_acc": 0.5639, + "test_loss": 6.394064616394043, + "test_acc": 0.0438, + "lyapunov": null, + "grad_norm": 0.642149980505916, + "grad_max_sv": 0.21981638856232166, + "grad_min_sv": 1.1695069362070709e-08, + "grad_condition": 254731993.0398627, + "lr": 1.096582625772501e-07, + "time_sec": 49.63520789146423 + }, + { + "epoch": 150, + "train_loss": 1.5609092629623413, + "train_acc": 0.55828, + "test_loss": 6.494824208068848, + "test_acc": 0.042, + "lyapunov": null, + "grad_norm": 0.645124236315014, + "grad_max_sv": 0.2247354317456484, + "grad_min_sv": 1.2051133440466044e-08, + "grad_condition": 35388252.370039664, + "lr": 0.0, + "time_sec": 49.63965940475464 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 5.089254416656495, + "train_acc": 0.01344, + "test_loss": 4.870831555175781, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 5.582063459208639, + "grad_max_sv": 5.0306542873382565, + "grad_min_sv": 8.441757832766683e-08, + "grad_condition": 74707534.78681344, + "lr": 0.0009998903417374227, + "time_sec": 66.78056359291077 + }, + { + "epoch": 2, + "train_loss": 4.736304296569824, + "train_acc": 0.02172, + "test_loss": 4.92340059890747, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 4.087296772772229, + "grad_max_sv": 3.672157108783722, + "grad_min_sv": 6.109624839933935e-08, + "grad_condition": 230714811.36310124, + "lr": 0.0009995614150494292, + "time_sec": 66.77934241294861 + }, + { + "epoch": 3, + "train_loss": 4.52685978515625, + "train_acc": 0.03204, + "test_loss": 5.045831031799317, + "test_acc": 0.0094, + "lyapunov": null, + "grad_norm": 3.1470044543912175, + "grad_max_sv": 2.6447540044784548, + "grad_min_sv": 4.639755384339139e-08, + "grad_condition": 65625701.84585605, + "lr": 0.0009990133642141358, + "time_sec": 66.76001167297363 + }, + { + "epoch": 4, + "train_loss": 4.371717319641113, + "train_acc": 0.04112, + "test_loss": 4.993129699707032, + "test_acc": 0.0115, + "lyapunov": null, + "grad_norm": 2.5123688948843395, + "grad_max_sv": 2.1027904629707335, + "grad_min_sv": 3.615837387664633e-08, + "grad_condition": 418817692.03399765, + "lr": 0.0009982464296247522, + "time_sec": 66.79424738883972 + }, + { + "epoch": 5, + "train_loss": 4.27407361251831, + "train_acc": 0.0488, + "test_loss": 5.161634465789795, + "test_acc": 0.0119, + "lyapunov": null, + "grad_norm": 1.9573801826064445, + "grad_max_sv": 1.613087645173073, + "grad_min_sv": 2.8529539808364034e-08, + "grad_condition": 62747668.20627429, + "lr": 0.0009972609476841367, + "time_sec": 66.81961727142334 + }, + { + "epoch": 6, + "train_loss": 4.183251854553222, + "train_acc": 0.05812, + "test_loss": 5.447854755401611, + "test_acc": 0.0093, + "lyapunov": null, + "grad_norm": 1.436449079599314, + "grad_max_sv": 1.0459295481443405, + "grad_min_sv": 2.0654144772258576e-08, + "grad_condition": 94732574.16372415, + "lr": 0.000996057350657239, + "time_sec": 66.73661756515503 + }, + { + "epoch": 7, + "train_loss": 4.103355536193848, + "train_acc": 0.06872, + "test_loss": 5.544150679016114, + "test_acc": 0.0124, + "lyapunov": null, + "grad_norm": 1.082624040556548, + "grad_max_sv": 0.678101472556591, + "grad_min_sv": 1.6660088839048904e-08, + "grad_condition": 49338508.46283151, + "lr": 0.000994636166481494, + "time_sec": 66.81501913070679 + }, + { + "epoch": 8, + "train_loss": 4.040529095458984, + "train_acc": 0.07876, + "test_loss": 5.577163777160645, + "test_acc": 0.0172, + "lyapunov": null, + "grad_norm": 0.963869121683512, + "grad_max_sv": 0.5578698106110096, + "grad_min_sv": 1.4817374840991882e-08, + "grad_condition": 46172185.25999212, + "lr": 0.0009929980185352525, + "time_sec": 66.78599071502686 + }, + { + "epoch": 9, + "train_loss": 3.999490645446777, + "train_acc": 0.0856, + "test_loss": 5.472281336975097, + "test_acc": 0.0116, + "lyapunov": null, + "grad_norm": 0.9198022107734598, + "grad_max_sv": 0.5003849364817142, + "grad_min_sv": 1.3862486752946878e-08, + "grad_condition": 137028895.09887612, + "lr": 0.0009911436253643444, + "time_sec": 66.77566862106323 + }, + { + "epoch": 10, + "train_loss": 3.9641557629394533, + "train_acc": 0.09124, + "test_loss": 5.43024553604126, + "test_acc": 0.0112, + "lyapunov": null, + "grad_norm": 0.8539816540258655, + "grad_max_sv": 0.4397390566766262, + "grad_min_sv": 1.3177782898221579e-08, + "grad_condition": 50953468.3517745, + "lr": 0.0009890738003669028, + "time_sec": 66.84108996391296 + }, + { + "epoch": 11, + "train_loss": 3.9142907052612306, + "train_acc": 0.09788, + "test_loss": 5.24972756652832, + "test_acc": 0.0174, + "lyapunov": null, + "grad_norm": 0.8303589651826888, + "grad_max_sv": 0.4246540553867817, + "grad_min_sv": 1.288730961390705e-08, + "grad_condition": 88294678.08247125, + "lr": 0.00098678945143658, + "time_sec": 66.87874603271484 + }, + { + "epoch": 12, + "train_loss": 3.881778168411255, + "train_acc": 0.1037, + "test_loss": 5.765969756317139, + "test_acc": 0.0186, + "lyapunov": null, + "grad_norm": 0.7855031029198277, + "grad_max_sv": 0.3756070680916309, + "grad_min_sv": 1.2611303298881715e-08, + "grad_condition": 36786532.210794725, + "lr": 0.0009842915805643154, + "time_sec": 66.82181406021118 + }, + { + "epoch": 13, + "train_loss": 3.8490214154815674, + "train_acc": 0.1068, + "test_loss": 5.832162282562256, + "test_acc": 0.0138, + "lyapunov": null, + "grad_norm": 0.7681061932199776, + "grad_max_sv": 0.3604050487279892, + "grad_min_sv": 1.2243067453593382e-08, + "grad_condition": 131143000.26933214, + "lr": 0.000981581283398829, + "time_sec": 66.72735929489136 + }, + { + "epoch": 14, + "train_loss": 3.828877674636841, + "train_acc": 0.11234, + "test_loss": 6.293205305480957, + "test_acc": 0.0134, + "lyapunov": null, + "grad_norm": 0.7460407539013362, + "grad_max_sv": 0.34510768875479697, + "grad_min_sv": 1.1813573212726692e-08, + "grad_condition": 49629148.15911349, + "lr": 0.0009786597487660333, + "time_sec": 66.80630326271057 + }, + { + "epoch": 15, + "train_loss": 3.803487832107544, + "train_acc": 0.1159, + "test_loss": 6.4087516273498535, + "test_acc": 0.013, + "lyapunov": null, + "grad_norm": 0.716379034773642, + "grad_max_sv": 0.3261814657598734, + "grad_min_sv": 1.1572917107960378e-08, + "grad_condition": 31644703.4401185, + "lr": 0.0009755282581475766, + "time_sec": 66.77157950401306 + }, + { + "epoch": 16, + "train_loss": 3.7804446031188963, + "train_acc": 0.11974, + "test_loss": 6.637075031280518, + "test_acc": 0.0121, + "lyapunov": null, + "grad_norm": 0.696010315133547, + "grad_max_sv": 0.3137427795678377, + "grad_min_sv": 1.127850834219124e-08, + "grad_condition": 69462833.27053933, + "lr": 0.0009721881851187403, + "time_sec": 66.79616379737854 + }, + { + "epoch": 17, + "train_loss": 3.752294116973877, + "train_acc": 0.12396, + "test_loss": 6.783492227935791, + "test_acc": 0.0146, + "lyapunov": null, + "grad_norm": 0.6728326480937213, + "grad_max_sv": 0.29628029987216, + "grad_min_sv": 1.0862121784666057e-08, + "grad_condition": 67951530.61721244, + "lr": 0.0009686409947459456, + "time_sec": 66.90411448478699 + }, + { + "epoch": 18, + "train_loss": 3.7320939672851563, + "train_acc": 0.12876, + "test_loss": 6.78950693283081, + "test_acc": 0.0166, + "lyapunov": null, + "grad_norm": 0.6616867936990236, + "grad_max_sv": 0.2953863974660635, + "grad_min_sv": 1.095610695379251e-08, + "grad_condition": 136390664.3535565, + "lr": 0.0009648882429441254, + "time_sec": 66.75479531288147 + }, + { + "epoch": 19, + "train_loss": 3.7112531086730955, + "train_acc": 0.13056, + "test_loss": 6.585515812683106, + "test_acc": 0.0163, + "lyapunov": null, + "grad_norm": 0.6494124624609345, + "grad_max_sv": 0.2933062981814146, + "grad_min_sv": 1.0763416760650734e-08, + "grad_condition": 31017442.193528943, + "lr": 0.00096093157579425, + "time_sec": 66.74547505378723 + }, + { + "epoch": 20, + "train_loss": 3.6964602882385256, + "train_acc": 0.13444, + "test_loss": 6.817514788818359, + "test_acc": 0.0125, + "lyapunov": null, + "grad_norm": 0.6419428954986147, + "grad_max_sv": 0.28524503484368324, + "grad_min_sv": 1.07556832606992e-08, + "grad_condition": 29053863.493932776, + "lr": 0.0009567727288213001, + "time_sec": 66.75940012931824 + }, + { + "epoch": 21, + "train_loss": 3.6749328507995607, + "train_acc": 0.13862, + "test_loss": 6.693168528747559, + "test_acc": 0.0132, + "lyapunov": null, + "grad_norm": 0.6273897945446711, + "grad_max_sv": 0.27434321865439415, + "grad_min_sv": 1.0629087081326371e-08, + "grad_condition": 34272866.07000697, + "lr": 0.0009524135262330095, + "time_sec": 66.76537322998047 + }, + { + "epoch": 22, + "train_loss": 3.6651853931427003, + "train_acc": 0.13714, + "test_loss": 7.5128926712036135, + "test_acc": 0.0145, + "lyapunov": null, + "grad_norm": 0.6127571430728127, + "grad_max_sv": 0.2585024815052748, + "grad_min_sv": 9.990007998617045e-09, + "grad_condition": 29464610.145040773, + "lr": 0.0009478558801197061, + "time_sec": 66.88315868377686 + }, + { + "epoch": 23, + "train_loss": 3.6479580931091307, + "train_acc": 0.14048, + "test_loss": 7.259157413482666, + "test_acc": 0.013, + "lyapunov": null, + "grad_norm": 0.6101108448302026, + "grad_max_sv": 0.26707915738224985, + "grad_min_sv": 1.0416663243084657e-08, + "grad_condition": 44782214.320293196, + "lr": 0.000943101789615607, + "time_sec": 66.73595952987671 + }, + { + "epoch": 24, + "train_loss": 3.630135404510498, + "train_acc": 0.14444, + "test_loss": 6.769294599151611, + "test_acc": 0.0187, + "lyapunov": null, + "grad_norm": 0.5973985296812159, + "grad_max_sv": 0.25335801765322685, + "grad_min_sv": 9.992184554080685e-09, + "grad_condition": 42939810.102056004, + "lr": 0.0009381533400219313, + "time_sec": 66.83198976516724 + }, + { + "epoch": 25, + "train_loss": 3.6139439612579345, + "train_acc": 0.14892, + "test_loss": 6.755159613037109, + "test_acc": 0.0168, + "lyapunov": null, + "grad_norm": 0.5830251618606708, + "grad_max_sv": 0.2401360861957073, + "grad_min_sv": 9.682792681542374e-09, + "grad_condition": 104126991.37138663, + "lr": 0.0009330127018922189, + "time_sec": 66.7968385219574 + }, + { + "epoch": 26, + "train_loss": 3.5970758290100098, + "train_acc": 0.14988, + "test_loss": 6.900474179840088, + "test_acc": 0.0154, + "lyapunov": null, + "grad_norm": 0.5787074408614666, + "grad_max_sv": 0.23566974550485612, + "grad_min_sv": 9.719574232958105e-09, + "grad_condition": 38538660.37346102, + "lr": 0.000927682130080253, + "time_sec": 66.79184246063232 + }, + { + "epoch": 27, + "train_loss": 3.5895483708190916, + "train_acc": 0.1518, + "test_loss": 6.669962855529785, + "test_acc": 0.0167, + "lyapunov": null, + "grad_norm": 0.5803094423675084, + "grad_max_sv": 0.2358210153877735, + "grad_min_sv": 9.626696496206621e-09, + "grad_condition": 193890246.2613204, + "lr": 0.0009221639627510072, + "time_sec": 66.7768383026123 + }, + { + "epoch": 28, + "train_loss": 3.5726418092346193, + "train_acc": 0.15258, + "test_loss": 7.085537405395508, + "test_acc": 0.0168, + "lyapunov": null, + "grad_norm": 0.570193330921248, + "grad_max_sv": 0.23036426715552807, + "grad_min_sv": 9.589828041736691e-09, + "grad_condition": 89352936.15952519, + "lr": 0.0009164606203550494, + "time_sec": 66.79721999168396 + }, + { + "epoch": 29, + "train_loss": 3.5572311797332765, + "train_acc": 0.15608, + "test_loss": 6.67531994934082, + "test_acc": 0.0189, + "lyapunov": null, + "grad_norm": 0.5675152442756493, + "grad_max_sv": 0.22562474496662616, + "grad_min_sv": 9.685276963766754e-09, + "grad_condition": 25178417.23491483, + "lr": 0.0009105746045668516, + "time_sec": 66.85751271247864 + }, + { + "epoch": 30, + "train_loss": 3.548038801879883, + "train_acc": 0.15748, + "test_loss": 6.45415048828125, + "test_acc": 0.0219, + "lyapunov": null, + "grad_norm": 0.5621117218085827, + "grad_max_sv": 0.222617195174098, + "grad_min_sv": 9.435066891660959e-09, + "grad_condition": 26340041.97866543, + "lr": 0.0009045084971874733, + "time_sec": 66.79050874710083 + }, + { + "epoch": 31, + "train_loss": 3.5402868547058106, + "train_acc": 0.16092, + "test_loss": 6.451704531860352, + "test_acc": 0.0227, + "lyapunov": null, + "grad_norm": 0.5521957030096883, + "grad_max_sv": 0.22002805732190608, + "grad_min_sv": 9.47574586573907e-09, + "grad_condition": 26149277.514949474, + "lr": 0.0008982649590120977, + "time_sec": 66.78902292251587 + }, + { + "epoch": 32, + "train_loss": 3.5309471380615234, + "train_acc": 0.16198, + "test_loss": 6.8702184638977055, + "test_acc": 0.022, + "lyapunov": null, + "grad_norm": 0.5464579230817538, + "grad_max_sv": 0.21435559950768948, + "grad_min_sv": 9.215979125329344e-09, + "grad_condition": 59638036.88956574, + "lr": 0.0008918467286629196, + "time_sec": 66.78767824172974 + }, + { + "epoch": 33, + "train_loss": 3.5130342961120604, + "train_acc": 0.16284, + "test_loss": 7.181190188598633, + "test_acc": 0.0173, + "lyapunov": null, + "grad_norm": 0.5437244358450883, + "grad_max_sv": 0.22251709625124932, + "grad_min_sv": 9.34404511543363e-09, + "grad_condition": 28699663.06993841, + "lr": 0.0008852566213878943, + "time_sec": 66.71953392028809 + }, + { + "epoch": 34, + "train_loss": 3.51255979675293, + "train_acc": 0.16636, + "test_loss": 7.333110241699218, + "test_acc": 0.0181, + "lyapunov": null, + "grad_norm": 0.5393640775064226, + "grad_max_sv": 0.20921555384993554, + "grad_min_sv": 9.167450806812916e-09, + "grad_condition": 25706901.28825941, + "lr": 0.000878497527825878, + "time_sec": 66.7765941619873 + }, + { + "epoch": 35, + "train_loss": 3.4977930699157715, + "train_acc": 0.16716, + "test_loss": 7.278058241271973, + "test_acc": 0.0212, + "lyapunov": null, + "grad_norm": 0.5438001473750539, + "grad_max_sv": 0.20897603183984756, + "grad_min_sv": 9.184564683795137e-09, + "grad_condition": 34997969.65153339, + "lr": 0.000871572412738697, + "time_sec": 66.78994917869568 + }, + { + "epoch": 36, + "train_loss": 3.4839546405029296, + "train_acc": 0.17056, + "test_loss": 6.461000657653808, + "test_acc": 0.0224, + "lyapunov": null, + "grad_norm": 0.5343462863238121, + "grad_max_sv": 0.20449809469282626, + "grad_min_sv": 9.16483587076744e-09, + "grad_condition": 24381579.447592642, + "lr": 0.0008644843137107055, + "time_sec": 66.78629851341248 + }, + { + "epoch": 37, + "train_loss": 3.473933819503784, + "train_acc": 0.16984, + "test_loss": 6.470654428100586, + "test_acc": 0.0179, + "lyapunov": null, + "grad_norm": 0.5324136173248342, + "grad_max_sv": 0.20008243359625338, + "grad_min_sv": 9.049705299718491e-09, + "grad_condition": 34636922.167240486, + "lr": 0.0008572363398164014, + "time_sec": 66.79992747306824 + }, + { + "epoch": 38, + "train_loss": 3.4661802910614012, + "train_acc": 0.17092, + "test_loss": 6.690065528869629, + "test_acc": 0.0169, + "lyapunov": null, + "grad_norm": 0.5281123151657661, + "grad_max_sv": 0.20084053687751294, + "grad_min_sv": 8.970145487507963e-09, + "grad_condition": 26480283.34014668, + "lr": 0.0008498316702566826, + "time_sec": 66.92348313331604 + }, + { + "epoch": 39, + "train_loss": 3.4540661865997313, + "train_acc": 0.17118, + "test_loss": 6.078438919830322, + "test_acc": 0.0211, + "lyapunov": null, + "grad_norm": 0.5227451103728683, + "grad_max_sv": 0.1980721667408943, + "grad_min_sv": 8.970438091903537e-09, + "grad_condition": 149441951.98208869, + "lr": 0.0008422735529643442, + "time_sec": 66.80566644668579 + }, + { + "epoch": 40, + "train_loss": 3.439123515701294, + "train_acc": 0.17768, + "test_loss": 6.255719974517822, + "test_acc": 0.0246, + "lyapunov": null, + "grad_norm": 0.5238902894663456, + "grad_max_sv": 0.2012732930481434, + "grad_min_sv": 8.989019251171015e-09, + "grad_condition": 26996532.399999082, + "lr": 0.0008345653031794289, + "time_sec": 66.78863906860352 + }, + { + "epoch": 41, + "train_loss": 3.4350976667022706, + "train_acc": 0.17682, + "test_loss": 5.942692041015625, + "test_acc": 0.0275, + "lyapunov": null, + "grad_norm": 0.5230791130306572, + "grad_max_sv": 0.19939371161162853, + "grad_min_sv": 9.040618726557925e-09, + "grad_condition": 35747119.67190552, + "lr": 0.0008267103019950526, + "time_sec": 66.78709435462952 + }, + { + "epoch": 42, + "train_loss": 3.4243579791259764, + "train_acc": 0.17844, + "test_loss": 6.007703511047363, + "test_acc": 0.0262, + "lyapunov": null, + "grad_norm": 0.517545208070228, + "grad_max_sv": 0.1922302544116974, + "grad_min_sv": 8.860449580982976e-09, + "grad_condition": 30602577.279376544, + "lr": 0.0008187119948743447, + "time_sec": 66.81675243377686 + }, + { + "epoch": 43, + "train_loss": 3.41020792137146, + "train_acc": 0.1805, + "test_loss": 6.532727696228028, + "test_acc": 0.0201, + "lyapunov": null, + "grad_norm": 0.5184771014750174, + "grad_max_sv": 0.1960398443043232, + "grad_min_sv": 9.042896009781032e-09, + "grad_condition": 109678067.45442054, + "lr": 0.000810573890139155, + "time_sec": 66.88858389854431 + }, + { + "epoch": 44, + "train_loss": 3.407023912811279, + "train_acc": 0.18096, + "test_loss": 6.134778085327149, + "test_acc": 0.0212, + "lyapunov": null, + "grad_norm": 0.5141850532973719, + "grad_max_sv": 0.18923728726804256, + "grad_min_sv": 9.02819977631475e-09, + "grad_condition": 100774753.52111238, + "lr": 0.0008022995574311873, + "time_sec": 66.80017518997192 + }, + { + "epoch": 45, + "train_loss": 3.395647827911377, + "train_acc": 0.1839, + "test_loss": 6.376823687744141, + "test_acc": 0.0222, + "lyapunov": null, + "grad_norm": 0.5126811791455754, + "grad_max_sv": 0.18771996162831783, + "grad_min_sv": 9.025198291837122e-09, + "grad_condition": 44468339.93349115, + "lr": 0.0007938926261462363, + "time_sec": 66.7608630657196 + }, + { + "epoch": 46, + "train_loss": 3.3928714478302, + "train_acc": 0.18238, + "test_loss": 6.053843517303466, + "test_acc": 0.0242, + "lyapunov": null, + "grad_norm": 0.5084041434605487, + "grad_max_sv": 0.1855287253856659, + "grad_min_sv": 8.774856632975947e-09, + "grad_condition": 31787391.609472472, + "lr": 0.0007853567838422158, + "time_sec": 66.74166297912598 + }, + { + "epoch": 47, + "train_loss": 3.379834383621216, + "train_acc": 0.18724, + "test_loss": 6.8861193962097165, + "test_acc": 0.0191, + "lyapunov": null, + "grad_norm": 0.5060633641106507, + "grad_max_sv": 0.1826419185847044, + "grad_min_sv": 8.790497434824073e-09, + "grad_condition": 34120677.482305124, + "lr": 0.0007766957746216719, + "time_sec": 66.7685010433197 + }, + { + "epoch": 48, + "train_loss": 3.374839401092529, + "train_acc": 0.1861, + "test_loss": 5.864614242553711, + "test_acc": 0.0184, + "lyapunov": null, + "grad_norm": 0.5042105096702133, + "grad_max_sv": 0.18606598749756814, + "grad_min_sv": 8.831608784565237e-09, + "grad_condition": 28878813.551795878, + "lr": 0.0007679133974894982, + "time_sec": 66.80099678039551 + }, + { + "epoch": 49, + "train_loss": 3.3662559477996825, + "train_acc": 0.1887, + "test_loss": 6.230384608459473, + "test_acc": 0.0213, + "lyapunov": null, + "grad_norm": 0.5036215455963197, + "grad_max_sv": 0.19020347222685813, + "grad_min_sv": 8.961205007554373e-09, + "grad_condition": 47201312.24723457, + "lr": 0.000759013504686565, + "time_sec": 66.75482654571533 + }, + { + "epoch": 50, + "train_loss": 3.360496557159424, + "train_acc": 0.18832, + "test_loss": 6.6197496559143065, + "test_acc": 0.0224, + "lyapunov": null, + "grad_norm": 0.5042398036515723, + "grad_max_sv": 0.1836124774068594, + "grad_min_sv": 8.934804758553572e-09, + "grad_condition": 69600275.62778898, + "lr": 0.0007499999999999998, + "time_sec": 66.77506113052368 + }, + { + "epoch": 51, + "train_loss": 3.350079543914795, + "train_acc": 0.1919, + "test_loss": 6.343868575286865, + "test_acc": 0.0242, + "lyapunov": null, + "grad_norm": 0.5043278001350275, + "grad_max_sv": 0.1825037430971861, + "grad_min_sv": 8.887193922446634e-09, + "grad_condition": 30024861.754817694, + "lr": 0.0007408768370508575, + "time_sec": 66.72825312614441 + }, + { + "epoch": 52, + "train_loss": 3.3426339905548095, + "train_acc": 0.1928, + "test_loss": 7.225718658447265, + "test_acc": 0.0199, + "lyapunov": null, + "grad_norm": 0.50252992009141, + "grad_max_sv": 0.17567641101777554, + "grad_min_sv": 8.804220427770064e-09, + "grad_condition": 740966766.3274126, + "lr": 0.0007316480175599307, + "time_sec": 66.72319173812866 + }, + { + "epoch": 53, + "train_loss": 3.3341299864959715, + "train_acc": 0.1933, + "test_loss": 6.803897232055664, + "test_acc": 0.0206, + "lyapunov": null, + "grad_norm": 0.5011496244728447, + "grad_max_sv": 0.17870272882282734, + "grad_min_sv": 8.831609968340536e-09, + "grad_condition": 22412356.279497318, + "lr": 0.0007223175895924635, + "time_sec": 66.7704975605011 + }, + { + "epoch": 54, + "train_loss": 3.3261182179260254, + "train_acc": 0.19572, + "test_loss": 6.764497369384766, + "test_acc": 0.028, + "lyapunov": null, + "grad_norm": 0.4979381618436104, + "grad_max_sv": 0.1770651936531067, + "grad_min_sv": 8.860568483093357e-09, + "grad_condition": 25306461.91969143, + "lr": 0.0007128896457825361, + "time_sec": 66.77421927452087 + }, + { + "epoch": 55, + "train_loss": 3.316899408569336, + "train_acc": 0.196, + "test_loss": 6.540015605163574, + "test_acc": 0.024, + "lyapunov": null, + "grad_norm": 0.4977367964912547, + "grad_max_sv": 0.17745399177074433, + "grad_min_sv": 8.913811780364434e-09, + "grad_condition": 22903051.94229058, + "lr": 0.0007033683215378998, + "time_sec": 66.79190754890442 + }, + { + "epoch": 56, + "train_loss": 3.310275382003784, + "train_acc": 0.19632, + "test_loss": 6.745750244140625, + "test_acc": 0.0197, + "lyapunov": null, + "grad_norm": 0.4988650354422387, + "grad_max_sv": 0.17153157331049443, + "grad_min_sv": 8.749649851869101e-09, + "grad_condition": 22030625.492303018, + "lr": 0.0006937577932260512, + "time_sec": 66.7638955116272 + }, + { + "epoch": 57, + "train_loss": 3.290559967803955, + "train_acc": 0.20002, + "test_loss": 6.366741171264648, + "test_acc": 0.0242, + "lyapunov": null, + "grad_norm": 0.4982910029946987, + "grad_max_sv": 0.17201930955052375, + "grad_min_sv": 8.79568313487053e-09, + "grad_condition": 151885613.93341595, + "lr": 0.0006840622763423388, + "time_sec": 66.78560328483582 + }, + { + "epoch": 58, + "train_loss": 3.2923309088134767, + "train_acc": 0.20166, + "test_loss": 6.417476829528809, + "test_acc": 0.0246, + "lyapunov": null, + "grad_norm": 0.49889716140548146, + "grad_max_sv": 0.17567893117666245, + "grad_min_sv": 8.913143439981397e-09, + "grad_condition": 24256220.95115678, + "lr": 0.0006742860236609073, + "time_sec": 66.843590259552 + }, + { + "epoch": 59, + "train_loss": 3.2908721295928953, + "train_acc": 0.19948, + "test_loss": 6.640488920593262, + "test_acc": 0.0279, + "lyapunov": null, + "grad_norm": 0.49266049285108265, + "grad_max_sv": 0.17507032714784146, + "grad_min_sv": 8.739878155916703e-09, + "grad_condition": 26595294.449066617, + "lr": 0.0006644333233692913, + "time_sec": 66.74992251396179 + }, + { + "epoch": 60, + "train_loss": 3.284796617889404, + "train_acc": 0.2013, + "test_loss": 6.291868576049804, + "test_acc": 0.0273, + "lyapunov": null, + "grad_norm": 0.49223922966029576, + "grad_max_sv": 0.17198019847273827, + "grad_min_sv": 8.672205609183693e-09, + "grad_condition": 22947196.39326378, + "lr": 0.0006545084971874734, + "time_sec": 66.7844717502594 + }, + { + "epoch": 61, + "train_loss": 3.2731484245300293, + "train_acc": 0.20498, + "test_loss": 6.035749476623535, + "test_acc": 0.0304, + "lyapunov": null, + "grad_norm": 0.49100354548098263, + "grad_max_sv": 0.1670747336000204, + "grad_min_sv": 8.751909007925774e-09, + "grad_condition": 38402617.820078045, + "lr": 0.0006445158984722354, + "time_sec": 66.78787755966187 + }, + { + "epoch": 62, + "train_loss": 3.2566023439025877, + "train_acc": 0.20938, + "test_loss": 6.511487716674805, + "test_acc": 0.0285, + "lyapunov": null, + "grad_norm": 0.4914300539125354, + "grad_max_sv": 0.16597167886793612, + "grad_min_sv": 8.786484798073424e-09, + "grad_condition": 21670471.110839043, + "lr": 0.0006344599103076324, + "time_sec": 66.70972204208374 + }, + { + "epoch": 63, + "train_loss": 3.2568167697143555, + "train_acc": 0.20498, + "test_loss": 6.652309313964844, + "test_acc": 0.0253, + "lyapunov": null, + "grad_norm": 0.4918024874902063, + "grad_max_sv": 0.16560027711093425, + "grad_min_sv": 8.785258739235635e-09, + "grad_condition": 71694500.46039832, + "lr": 0.0006243449435824269, + "time_sec": 66.82298398017883 + }, + { + "epoch": 64, + "train_loss": 3.2456203374481203, + "train_acc": 0.20808, + "test_loss": 6.344074755859375, + "test_acc": 0.0255, + "lyapunov": null, + "grad_norm": 0.49095369226258845, + "grad_max_sv": 0.1667012270539999, + "grad_min_sv": 8.78574491491868e-09, + "grad_condition": 23075446.134346228, + "lr": 0.0006141754350553275, + "time_sec": 66.78016519546509 + }, + { + "epoch": 65, + "train_loss": 3.236674240646362, + "train_acc": 0.21152, + "test_loss": 6.2899073806762695, + "test_acc": 0.0224, + "lyapunov": null, + "grad_norm": 0.4921779891011333, + "grad_max_sv": 0.1677238956093788, + "grad_min_sv": 8.828472619626382e-09, + "grad_condition": 22441240.736154817, + "lr": 0.0006039558454088793, + "time_sec": 66.85806608200073 + }, + { + "epoch": 66, + "train_loss": 3.22965085647583, + "train_acc": 0.2126, + "test_loss": 6.429703979492188, + "test_acc": 0.0282, + "lyapunov": null, + "grad_norm": 0.4881811720746172, + "grad_max_sv": 0.164219119399786, + "grad_min_sv": 8.673666965219873e-09, + "grad_condition": 21892913.98496552, + "lr": 0.000593690657292862, + "time_sec": 66.78576803207397 + }, + { + "epoch": 67, + "train_loss": 3.224384484176636, + "train_acc": 0.21134, + "test_loss": 6.922704602050781, + "test_acc": 0.0234, + "lyapunov": null, + "grad_norm": 0.48741557028554877, + "grad_max_sv": 0.16480680033564568, + "grad_min_sv": 8.729063946666394e-09, + "grad_condition": 23200356.121009313, + "lr": 0.0005833843733580507, + "time_sec": 66.77217102050781 + }, + { + "epoch": 68, + "train_loss": 3.2157058325195313, + "train_acc": 0.21262, + "test_loss": 6.7681282539367675, + "test_acc": 0.0231, + "lyapunov": null, + "grad_norm": 0.493681050551615, + "grad_max_sv": 0.16986403651535512, + "grad_min_sv": 8.815265072070754e-09, + "grad_condition": 29441294.083651233, + "lr": 0.0005730415142812054, + "time_sec": 66.77236366271973 + }, + { + "epoch": 69, + "train_loss": 3.210006919326782, + "train_acc": 0.21728, + "test_loss": 6.470967771148682, + "test_acc": 0.0254, + "lyapunov": null, + "grad_norm": 0.4878926422472019, + "grad_max_sv": 0.1638301569968462, + "grad_min_sv": 8.75584678441954e-09, + "grad_condition": 52016652.85495178, + "lr": 0.0005626666167821517, + "time_sec": 66.80931973457336 + }, + { + "epoch": 70, + "train_loss": 3.196190078125, + "train_acc": 0.21792, + "test_loss": 5.951667370605469, + "test_acc": 0.0242, + "lyapunov": null, + "grad_norm": 0.48950735034118803, + "grad_max_sv": 0.16142398156225682, + "grad_min_sv": 8.815271614059927e-09, + "grad_condition": 24483281.259911567, + "lr": 0.0005522642316338265, + "time_sec": 66.77829360961914 + }, + { + "epoch": 71, + "train_loss": 3.2064027897644043, + "train_acc": 0.21506, + "test_loss": 6.750360327148438, + "test_acc": 0.0227, + "lyapunov": null, + "grad_norm": 0.4871695073962276, + "grad_max_sv": 0.16285001635551452, + "grad_min_sv": 8.758729140578848e-09, + "grad_condition": 23565681.777415752, + "lr": 0.0005418389216661573, + "time_sec": 66.78215885162354 + }, + { + "epoch": 72, + "train_loss": 3.1924329637908935, + "train_acc": 0.21822, + "test_loss": 6.714482778167724, + "test_acc": 0.025, + "lyapunov": null, + "grad_norm": 0.48778155896125935, + "grad_max_sv": 0.1631274577230215, + "grad_min_sv": 8.720527765009033e-09, + "grad_condition": 63496326.10433636, + "lr": 0.0005313952597646563, + "time_sec": 66.8333637714386 + }, + { + "epoch": 73, + "train_loss": 3.188364574279785, + "train_acc": 0.2196, + "test_loss": 7.193912121582032, + "test_acc": 0.0213, + "lyapunov": null, + "grad_norm": 0.4880279755205525, + "grad_max_sv": 0.1620686575770378, + "grad_min_sv": 8.740592850886574e-09, + "grad_condition": 27935085.988161374, + "lr": 0.0005209378268645994, + "time_sec": 66.71236157417297 + }, + { + "epoch": 74, + "train_loss": 3.1774999662780763, + "train_acc": 0.22036, + "test_loss": 6.498540209960938, + "test_acc": 0.0266, + "lyapunov": null, + "grad_norm": 0.48663554748850196, + "grad_max_sv": 0.16149300280958415, + "grad_min_sv": 8.688670802628472e-09, + "grad_condition": 102102915.61516626, + "lr": 0.0005104712099416781, + "time_sec": 66.7784776687622 + }, + { + "epoch": 75, + "train_loss": 3.1686367027282714, + "train_acc": 0.22206, + "test_loss": 7.174583370971679, + "test_acc": 0.0209, + "lyapunov": null, + "grad_norm": 0.48682394841302745, + "grad_max_sv": 0.16311258710920812, + "grad_min_sv": 8.786071105382209e-09, + "grad_condition": 24724999.404770423, + "lr": 0.0004999999999999996, + "time_sec": 66.76251482963562 + }, + { + "epoch": 76, + "train_loss": 3.1639041161346437, + "train_acc": 0.225, + "test_loss": 7.478772677612305, + "test_acc": 0.0197, + "lyapunov": null, + "grad_norm": 0.49049069180345295, + "grad_max_sv": 0.16360066644847393, + "grad_min_sv": 8.74060119004927e-09, + "grad_condition": 24496844.849027783, + "lr": 0.0004895287900583212, + "time_sec": 66.72801065444946 + }, + { + "epoch": 77, + "train_loss": 3.154632388381958, + "train_acc": 0.22396, + "test_loss": 6.57794190826416, + "test_acc": 0.0277, + "lyapunov": null, + "grad_norm": 0.4868448729214284, + "grad_max_sv": 0.1649958923459053, + "grad_min_sv": 8.840505302809554e-09, + "grad_condition": 21095789.830121905, + "lr": 0.0004790621731353997, + "time_sec": 66.73516988754272 + }, + { + "epoch": 78, + "train_loss": 3.1528517010498045, + "train_acc": 0.22312, + "test_loss": 7.1080197311401365, + "test_acc": 0.0217, + "lyapunov": null, + "grad_norm": 0.4887319331046421, + "grad_max_sv": 0.1634005270898342, + "grad_min_sv": 8.874131324221323e-09, + "grad_condition": 20245229.779506456, + "lr": 0.000468604740235343, + "time_sec": 66.71177268028259 + }, + { + "epoch": 79, + "train_loss": 3.1432092308807373, + "train_acc": 0.229, + "test_loss": 7.214095246887207, + "test_acc": 0.0247, + "lyapunov": null, + "grad_norm": 0.48838038818221724, + "grad_max_sv": 0.16252909004688262, + "grad_min_sv": 8.819199073806239e-09, + "grad_condition": 26520623.470668785, + "lr": 0.00045816107833384175, + "time_sec": 66.7255470752716 + }, + { + "epoch": 80, + "train_loss": 3.1343304455566408, + "train_acc": 0.22744, + "test_loss": 6.940009968566894, + "test_acc": 0.0255, + "lyapunov": null, + "grad_norm": 0.48846815734372934, + "grad_max_sv": 0.1635790452361107, + "grad_min_sv": 8.798821884981045e-09, + "grad_condition": 21131375.648625843, + "lr": 0.0004477357683661729, + "time_sec": 66.72595143318176 + }, + { + "epoch": 81, + "train_loss": 3.1298222771453856, + "train_acc": 0.22642, + "test_loss": 7.29024638671875, + "test_acc": 0.0259, + "lyapunov": null, + "grad_norm": 0.49086957943567056, + "grad_max_sv": 0.15947132408618928, + "grad_min_sv": 8.788132586923236e-09, + "grad_condition": 28060653.55060955, + "lr": 0.00043733338321784746, + "time_sec": 66.77222657203674 + }, + { + "epoch": 82, + "train_loss": 3.117735626373291, + "train_acc": 0.23038, + "test_loss": 6.9144718528747555, + "test_acc": 0.0275, + "lyapunov": null, + "grad_norm": 0.49138593312101014, + "grad_max_sv": 0.159454994648695, + "grad_min_sv": 8.759537291390742e-09, + "grad_condition": 308046195.23178655, + "lr": 0.0004269584857187939, + "time_sec": 66.75987410545349 + }, + { + "epoch": 83, + "train_loss": 3.1175857275390624, + "train_acc": 0.23194, + "test_loss": 6.706077085876465, + "test_acc": 0.0275, + "lyapunov": null, + "grad_norm": 0.4924089866784705, + "grad_max_sv": 0.16311928667128087, + "grad_min_sv": 8.90124301697326e-09, + "grad_condition": 32153498.186816484, + "lr": 0.0004166156266419484, + "time_sec": 66.74847078323364 + }, + { + "epoch": 84, + "train_loss": 3.1045476649475097, + "train_acc": 0.23228, + "test_loss": 6.154573769378662, + "test_acc": 0.0282, + "lyapunov": null, + "grad_norm": 0.49118329484452294, + "grad_max_sv": 0.16205354779958725, + "grad_min_sv": 8.760578144861864e-09, + "grad_condition": 52646848.44888155, + "lr": 0.0004063093427071373, + "time_sec": 66.74011945724487 + }, + { + "epoch": 85, + "train_loss": 3.1078517518615723, + "train_acc": 0.2344, + "test_loss": 6.530753035736084, + "test_acc": 0.0282, + "lyapunov": null, + "grad_norm": 0.4904367995984335, + "grad_max_sv": 0.161368178576231, + "grad_min_sv": 8.888137861817746e-09, + "grad_condition": 21303276.13293609, + "lr": 0.0003960441545911199, + "time_sec": 66.72609543800354 + }, + { + "epoch": 86, + "train_loss": 3.0952324195861816, + "train_acc": 0.23368, + "test_loss": 6.240639804077149, + "test_acc": 0.0308, + "lyapunov": null, + "grad_norm": 0.49428635963779644, + "grad_max_sv": 0.15839767456054688, + "grad_min_sv": 8.964046511322766e-09, + "grad_condition": 28785588.134401, + "lr": 0.0003858245649446718, + "time_sec": 66.74975419044495 + }, + { + "epoch": 87, + "train_loss": 3.0952587001037597, + "train_acc": 0.23356, + "test_loss": 6.628809076690674, + "test_acc": 0.0322, + "lyapunov": null, + "grad_norm": 0.49144116518393927, + "grad_max_sv": 0.16221071667969228, + "grad_min_sv": 8.962699898917847e-09, + "grad_condition": 20571826.020635325, + "lr": 0.00037565505641757235, + "time_sec": 66.7199854850769 + }, + { + "epoch": 88, + "train_loss": 3.0922299211120605, + "train_acc": 0.2344, + "test_loss": 6.5014627777099605, + "test_acc": 0.0295, + "lyapunov": null, + "grad_norm": 0.49360674992051745, + "grad_max_sv": 0.1644837912172079, + "grad_min_sv": 8.975622673573769e-09, + "grad_condition": 28771115.174499214, + "lr": 0.00036554008969236695, + "time_sec": 66.74195861816406 + }, + { + "epoch": 89, + "train_loss": 3.0761431072235106, + "train_acc": 0.23966, + "test_loss": 7.287914637756348, + "test_acc": 0.0263, + "lyapunov": null, + "grad_norm": 0.4909525286245839, + "grad_max_sv": 0.16159643046557903, + "grad_min_sv": 8.858207814488317e-09, + "grad_condition": 22425426.033500116, + "lr": 0.0003554841015277638, + "time_sec": 66.68954610824585 + }, + { + "epoch": 90, + "train_loss": 3.0747881409454347, + "train_acc": 0.2377, + "test_loss": 7.193168222808838, + "test_acc": 0.0262, + "lyapunov": null, + "grad_norm": 0.4911854264861308, + "grad_max_sv": 0.1574687145650387, + "grad_min_sv": 8.917724771215912e-09, + "grad_condition": 118300212.93482408, + "lr": 0.000345491502812526, + "time_sec": 66.77580857276917 + }, + { + "epoch": 91, + "train_loss": 3.070805363311768, + "train_acc": 0.23994, + "test_loss": 6.052177616882324, + "test_acc": 0.0304, + "lyapunov": null, + "grad_norm": 0.49339922868661756, + "grad_max_sv": 0.1602653257548809, + "grad_min_sv": 8.95202442799392e-09, + "grad_condition": 44017380.37680817, + "lr": 0.0003355666766307081, + "time_sec": 66.69368362426758 + }, + { + "epoch": 92, + "train_loss": 3.0647792414855957, + "train_acc": 0.23982, + "test_loss": 6.179595366668702, + "test_acc": 0.0301, + "lyapunov": null, + "grad_norm": 0.4931917462731246, + "grad_max_sv": 0.1606559857726097, + "grad_min_sv": 9.0662935353647e-09, + "grad_condition": 19908430.164367903, + "lr": 0.00032571397633909225, + "time_sec": 66.70123243331909 + }, + { + "epoch": 93, + "train_loss": 3.0550636367034913, + "train_acc": 0.2422, + "test_loss": 6.34838355255127, + "test_acc": 0.0271, + "lyapunov": null, + "grad_norm": 0.49186583360988956, + "grad_max_sv": 0.1579043295234442, + "grad_min_sv": 8.987567995388801e-09, + "grad_condition": 22006714.29709431, + "lr": 0.00031593772365766094, + "time_sec": 66.71771335601807 + }, + { + "epoch": 94, + "train_loss": 3.043202466583252, + "train_acc": 0.24232, + "test_loss": 6.682511094665528, + "test_acc": 0.0279, + "lyapunov": null, + "grad_norm": 0.4962595942491337, + "grad_max_sv": 0.1622728668153286, + "grad_min_sv": 9.030461697867587e-09, + "grad_condition": 30360701.35233465, + "lr": 0.0003062422067739483, + "time_sec": 66.82941317558289 + }, + { + "epoch": 95, + "train_loss": 3.0412676640319822, + "train_acc": 0.2447, + "test_loss": 6.22475659866333, + "test_acc": 0.0318, + "lyapunov": null, + "grad_norm": 0.4915093368948821, + "grad_max_sv": 0.15892955474555492, + "grad_min_sv": 8.946618996336086e-09, + "grad_condition": 69026491.3661272, + "lr": 0.00029663167846209965, + "time_sec": 66.73191213607788 + }, + { + "epoch": 96, + "train_loss": 3.0352964888000487, + "train_acc": 0.2471, + "test_loss": 6.5577602828979495, + "test_acc": 0.0293, + "lyapunov": null, + "grad_norm": 0.49248702226826524, + "grad_max_sv": 0.1611651573330164, + "grad_min_sv": 8.952907482040472e-09, + "grad_condition": 31830348.776786767, + "lr": 0.00028711035421746345, + "time_sec": 66.75891017913818 + }, + { + "epoch": 97, + "train_loss": 3.029721915130615, + "train_acc": 0.24842, + "test_loss": 6.651570160675049, + "test_acc": 0.0289, + "lyapunov": null, + "grad_norm": 0.4943874310747337, + "grad_max_sv": 0.1606567233800888, + "grad_min_sv": 9.076670715035818e-09, + "grad_condition": 36874515.58106691, + "lr": 0.00027768241040753615, + "time_sec": 66.74775719642639 + }, + { + "epoch": 98, + "train_loss": 3.0293620677948, + "train_acc": 0.24548, + "test_loss": 6.7938948928833005, + "test_acc": 0.0291, + "lyapunov": null, + "grad_norm": 0.4970218817533374, + "grad_max_sv": 0.15979058742523194, + "grad_min_sv": 9.025258917993995e-09, + "grad_condition": 21461503.719760668, + "lr": 0.00026835198244006903, + "time_sec": 66.71226525306702 + }, + { + "epoch": 99, + "train_loss": 3.0232276085662844, + "train_acc": 0.24992, + "test_loss": 6.842255628967285, + "test_acc": 0.0287, + "lyapunov": null, + "grad_norm": 0.4964386837271484, + "grad_max_sv": 0.16297372654080391, + "grad_min_sv": 9.074463314107107e-09, + "grad_condition": 38263953.83433555, + "lr": 0.0002591231629491421, + "time_sec": 66.73949241638184 + }, + { + "epoch": 100, + "train_loss": 3.0220013402557373, + "train_acc": 0.24942, + "test_loss": 7.044534214782715, + "test_acc": 0.0264, + "lyapunov": null, + "grad_norm": 0.4963097153496672, + "grad_max_sv": 0.1608368031680584, + "grad_min_sv": 8.999894975450506e-09, + "grad_condition": 41372527.951466024, + "lr": 0.0002499999999999997, + "time_sec": 66.77927494049072 + }, + { + "epoch": 101, + "train_loss": 3.0203451880645753, + "train_acc": 0.2487, + "test_loss": 6.837228249359131, + "test_acc": 0.0287, + "lyapunov": null, + "grad_norm": 0.49771273059241083, + "grad_max_sv": 0.16355772241950034, + "grad_min_sv": 9.09030489493201e-09, + "grad_condition": 21122520.470805176, + "lr": 0.00024098649531343477, + "time_sec": 66.73630166053772 + }, + { + "epoch": 102, + "train_loss": 3.0023662061309815, + "train_acc": 0.2517, + "test_loss": 7.122745419311523, + "test_acc": 0.0275, + "lyapunov": null, + "grad_norm": 0.4990559135673985, + "grad_max_sv": 0.16072520166635512, + "grad_min_sv": 9.129048311740107e-09, + "grad_condition": 20645009.356589716, + "lr": 0.0002320866025105016, + "time_sec": 66.75698280334473 + }, + { + "epoch": 103, + "train_loss": 2.998011736526489, + "train_acc": 0.25374, + "test_loss": 7.035623414611816, + "test_acc": 0.0277, + "lyapunov": null, + "grad_norm": 0.49574085619625, + "grad_max_sv": 0.15668718423694372, + "grad_min_sv": 9.148743505132951e-09, + "grad_condition": 33626359.10658366, + "lr": 0.0002233042253783278, + "time_sec": 66.75562310218811 + }, + { + "epoch": 104, + "train_loss": 2.997530387496948, + "train_acc": 0.25132, + "test_loss": 6.999302207946777, + "test_acc": 0.0292, + "lyapunov": null, + "grad_norm": 0.5002716771455139, + "grad_max_sv": 0.16238998733460902, + "grad_min_sv": 9.078950441443468e-09, + "grad_condition": 20349177.478017032, + "lr": 0.000214643216157784, + "time_sec": 66.79467344284058 + }, + { + "epoch": 105, + "train_loss": 2.9906964135742187, + "train_acc": 0.25506, + "test_loss": 7.1786759597778325, + "test_acc": 0.0273, + "lyapunov": null, + "grad_norm": 0.4946350333441307, + "grad_max_sv": 0.1600412342697382, + "grad_min_sv": 9.088851333008408e-09, + "grad_condition": 57224884.57519225, + "lr": 0.00020610737385376332, + "time_sec": 66.74862432479858 + }, + { + "epoch": 106, + "train_loss": 2.984202498321533, + "train_acc": 0.25656, + "test_loss": 7.172381106567383, + "test_acc": 0.0269, + "lyapunov": null, + "grad_norm": 0.4982362018645274, + "grad_max_sv": 0.1571014266461134, + "grad_min_sv": 9.054493026183775e-09, + "grad_condition": 22960817.2493112, + "lr": 0.00019770044256881242, + "time_sec": 66.77469301223755 + }, + { + "epoch": 107, + "train_loss": 2.975272487335205, + "train_acc": 0.25552, + "test_loss": 7.0334813690185545, + "test_acc": 0.0316, + "lyapunov": null, + "grad_norm": 0.49588396234922755, + "grad_max_sv": 0.16075790040194987, + "grad_min_sv": 9.117187717289087e-09, + "grad_condition": 22400105.746660806, + "lr": 0.0001894261098608447, + "time_sec": 66.76792025566101 + }, + { + "epoch": 108, + "train_loss": 2.9756462240600587, + "train_acc": 0.25536, + "test_loss": 7.59121438293457, + "test_acc": 0.0288, + "lyapunov": null, + "grad_norm": 0.4971626921836716, + "grad_max_sv": 0.15787492766976358, + "grad_min_sv": 9.170698456424448e-09, + "grad_condition": 2842260093.4746685, + "lr": 0.000181288005125655, + "time_sec": 66.72157907485962 + }, + { + "epoch": 109, + "train_loss": 2.9735143406677245, + "train_acc": 0.25872, + "test_loss": 6.839995979309082, + "test_acc": 0.0305, + "lyapunov": null, + "grad_norm": 0.49760629850795685, + "grad_max_sv": 0.16163251921534538, + "grad_min_sv": 9.179918801505149e-09, + "grad_condition": 26931510.48697853, + "lr": 0.0001732896980049473, + "time_sec": 66.76784825325012 + }, + { + "epoch": 110, + "train_loss": 2.971026375198364, + "train_acc": 0.25932, + "test_loss": 6.99457964477539, + "test_acc": 0.0301, + "lyapunov": null, + "grad_norm": 0.4972222462184193, + "grad_max_sv": 0.1576628390699625, + "grad_min_sv": 9.118256634466082e-09, + "grad_condition": 25805428.695002638, + "lr": 0.00016543469682057076, + "time_sec": 66.7546181678772 + }, + { + "epoch": 111, + "train_loss": 2.961785153198242, + "train_acc": 0.25938, + "test_loss": 7.5968095703125, + "test_acc": 0.0278, + "lyapunov": null, + "grad_norm": 0.499682712724269, + "grad_max_sv": 0.16410896554589272, + "grad_min_sv": 9.131004422013866e-09, + "grad_condition": 21672900.170981936, + "lr": 0.00015772644703565552, + "time_sec": 66.74458265304565 + }, + { + "epoch": 112, + "train_loss": 2.9625577368927, + "train_acc": 0.25878, + "test_loss": 7.764190951538086, + "test_acc": 0.026, + "lyapunov": null, + "grad_norm": 0.498213643225678, + "grad_max_sv": 0.15600935891270637, + "grad_min_sv": 9.151295493614598e-09, + "grad_condition": 20410187.211308915, + "lr": 0.00015016832974331713, + "time_sec": 66.75516033172607 + }, + { + "epoch": 113, + "train_loss": 2.95476414642334, + "train_acc": 0.25912, + "test_loss": 7.14678690032959, + "test_acc": 0.0306, + "lyapunov": null, + "grad_norm": 0.4989192084378189, + "grad_max_sv": 0.16326018050312996, + "grad_min_sv": 9.208972755539447e-09, + "grad_condition": 51946084.62151481, + "lr": 0.00014276366018359834, + "time_sec": 66.8117504119873 + }, + { + "epoch": 114, + "train_loss": 2.959580585861206, + "train_acc": 0.26152, + "test_loss": 7.228822399902343, + "test_acc": 0.0306, + "lyapunov": null, + "grad_norm": 0.4993052937105196, + "grad_max_sv": 0.1597112886607647, + "grad_min_sv": 9.184225070735242e-09, + "grad_condition": 24287456.61544974, + "lr": 0.00013551568628929425, + "time_sec": 66.71526288986206 + }, + { + "epoch": 115, + "train_loss": 2.951429924316406, + "train_acc": 0.2597, + "test_loss": 6.857805014038086, + "test_acc": 0.0311, + "lyapunov": null, + "grad_norm": 0.5001172379881009, + "grad_max_sv": 0.16317447423934936, + "grad_min_sv": 9.167603101656319e-09, + "grad_condition": 19878785.72490542, + "lr": 0.00012842758726130276, + "time_sec": 66.7846131324768 + }, + { + "epoch": 116, + "train_loss": 2.9463225456237794, + "train_acc": 0.26044, + "test_loss": 7.2446568466186525, + "test_acc": 0.0281, + "lyapunov": null, + "grad_norm": 0.4998364506796334, + "grad_max_sv": 0.16249994188547134, + "grad_min_sv": 9.130782213651045e-09, + "grad_condition": 19998723.305069156, + "lr": 0.0001215024721741218, + "time_sec": 66.7700080871582 + }, + { + "epoch": 117, + "train_loss": 2.937184557876587, + "train_acc": 0.26268, + "test_loss": 7.438090939331055, + "test_acc": 0.0265, + "lyapunov": null, + "grad_norm": 0.5024891978806302, + "grad_max_sv": 0.16552512347698212, + "grad_min_sv": 9.170617681214522e-09, + "grad_condition": 40015057.54321941, + "lr": 0.00011474337861210538, + "time_sec": 66.80615854263306 + }, + { + "epoch": 118, + "train_loss": 2.942110910797119, + "train_acc": 0.2621, + "test_loss": 7.324624530029297, + "test_acc": 0.0273, + "lyapunov": null, + "grad_norm": 0.5000364684279365, + "grad_max_sv": 0.16344034522771836, + "grad_min_sv": 9.328158331878279e-09, + "grad_condition": 21122225.248831175, + "lr": 0.00010815327133708009, + "time_sec": 66.78372955322266 + }, + { + "epoch": 119, + "train_loss": 2.93369575592041, + "train_acc": 0.26596, + "test_loss": 8.056785229492187, + "test_acc": 0.0234, + "lyapunov": null, + "grad_norm": 0.5006441450285836, + "grad_max_sv": 0.1595278237015009, + "grad_min_sv": 9.219788181871746e-09, + "grad_condition": 69721984.41132018, + "lr": 0.00010173504098790182, + "time_sec": 66.76624512672424 + }, + { + "epoch": 120, + "train_loss": 2.932797766189575, + "train_acc": 0.26344, + "test_loss": 7.282906192016601, + "test_acc": 0.0275, + "lyapunov": null, + "grad_norm": 0.5037900163559795, + "grad_max_sv": 0.16313258111476897, + "grad_min_sv": 9.198472578075822e-09, + "grad_condition": 21164339.052237906, + "lr": 9.549150281252629e-05, + "time_sec": 66.71441149711609 + }, + { + "epoch": 121, + "train_loss": 2.9284527645874023, + "train_acc": 0.26852, + "test_loss": 7.262115740966797, + "test_acc": 0.0293, + "lyapunov": null, + "grad_norm": 0.5036251360683918, + "grad_max_sv": 0.1591605730354786, + "grad_min_sv": 9.272000557614124e-09, + "grad_condition": 40898149.281216756, + "lr": 8.942539543314794e-05, + "time_sec": 66.74046039581299 + }, + { + "epoch": 122, + "train_loss": 2.936891605682373, + "train_acc": 0.2668, + "test_loss": 7.490768426513672, + "test_acc": 0.0269, + "lyapunov": null, + "grad_norm": 0.5021434540478252, + "grad_max_sv": 0.16143947280943394, + "grad_min_sv": 9.394398098327983e-09, + "grad_condition": 19799976.943244066, + "lr": 8.353937964495024e-05, + "time_sec": 66.81744265556335 + }, + { + "epoch": 123, + "train_loss": 2.9236154601287843, + "train_acc": 0.26716, + "test_loss": 7.120488947296143, + "test_acc": 0.0285, + "lyapunov": null, + "grad_norm": 0.5028382354847799, + "grad_max_sv": 0.15968299470841885, + "grad_min_sv": 9.204075489266384e-09, + "grad_condition": 47939633.576168984, + "lr": 7.783603724899243e-05, + "time_sec": 66.76852679252625 + }, + { + "epoch": 124, + "train_loss": 2.92061264755249, + "train_acc": 0.2666, + "test_loss": 7.461192834472656, + "test_acc": 0.0278, + "lyapunov": null, + "grad_norm": 0.5005688158224261, + "grad_max_sv": 0.1629866801202297, + "grad_min_sv": 9.212228484906105e-09, + "grad_condition": 33814966.96761195, + "lr": 7.231786991974666e-05, + "time_sec": 66.7814073562622 + }, + { + "epoch": 125, + "train_loss": 2.9229219720458985, + "train_acc": 0.26648, + "test_loss": 7.498983331298828, + "test_acc": 0.0285, + "lyapunov": null, + "grad_norm": 0.5030160580327866, + "grad_max_sv": 0.16155149266123772, + "grad_min_sv": 9.212426940741203e-09, + "grad_condition": 19527956.667884845, + "lr": 6.698729810778072e-05, + "time_sec": 66.79239439964294 + }, + { + "epoch": 126, + "train_loss": 2.9202857413482666, + "train_acc": 0.26618, + "test_loss": 7.286036429595947, + "test_acc": 0.0279, + "lyapunov": null, + "grad_norm": 0.5046458563501821, + "grad_max_sv": 0.16270169503986837, + "grad_min_sv": 9.235521156170102e-09, + "grad_condition": 21514883.897712767, + "lr": 6.184665997806817e-05, + "time_sec": 66.79009366035461 + }, + { + "epoch": 127, + "train_loss": 2.9112009690093994, + "train_acc": 0.27148, + "test_loss": 6.8060284591674804, + "test_acc": 0.0299, + "lyapunov": null, + "grad_norm": 0.5048043752309758, + "grad_max_sv": 0.1627126146107912, + "grad_min_sv": 9.337147274801615e-09, + "grad_condition": 20067936.42847693, + "lr": 5.6898210384392595e-05, + "time_sec": 66.7122654914856 + }, + { + "epoch": 128, + "train_loss": 2.915534998703003, + "train_acc": 0.26936, + "test_loss": 7.528692306518555, + "test_acc": 0.027, + "lyapunov": null, + "grad_norm": 0.505141680481134, + "grad_max_sv": 0.15927630066871643, + "grad_min_sv": 9.138972020816815e-09, + "grad_condition": 283653990.6139595, + "lr": 5.214411988029363e-05, + "time_sec": 66.76755571365356 + }, + { + "epoch": 129, + "train_loss": 2.911044763031006, + "train_acc": 0.26856, + "test_loss": 7.442652993774414, + "test_acc": 0.0313, + "lyapunov": null, + "grad_norm": 0.5029480129383956, + "grad_max_sv": 0.16405761763453483, + "grad_min_sv": 9.220356501568604e-09, + "grad_condition": 46047919.55891801, + "lr": 4.7586473766990294e-05, + "time_sec": 66.69603776931763 + }, + { + "epoch": 130, + "train_loss": 2.907666951751709, + "train_acc": 0.26828, + "test_loss": 7.026823535919189, + "test_acc": 0.0288, + "lyapunov": null, + "grad_norm": 0.5025376312973467, + "grad_max_sv": 0.15946717746555805, + "grad_min_sv": 9.221378457352492e-09, + "grad_condition": 33199750.366487652, + "lr": 4.32272711786996e-05, + "time_sec": 66.69535183906555 + }, + { + "epoch": 131, + "train_loss": 2.902869781417847, + "train_acc": 0.26958, + "test_loss": 7.536094513702393, + "test_acc": 0.0292, + "lyapunov": null, + "grad_norm": 0.5050312390729839, + "grad_max_sv": 0.16128032505512238, + "grad_min_sv": 9.28452798905008e-09, + "grad_condition": 135705763.13078815, + "lr": 3.906842420574966e-05, + "time_sec": 66.77000784873962 + }, + { + "epoch": 132, + "train_loss": 2.9037561528778078, + "train_acc": 0.27136, + "test_loss": 7.281431489562988, + "test_acc": 0.0271, + "lyapunov": null, + "grad_norm": 0.5052870516198174, + "grad_max_sv": 0.1615588180720806, + "grad_min_sv": 9.289024057758388e-09, + "grad_condition": 128507811.16031823, + "lr": 3.5111757055874305e-05, + "time_sec": 66.75163435935974 + }, + { + "epoch": 133, + "train_loss": 2.8991165522766114, + "train_acc": 0.27156, + "test_loss": 7.282987453460693, + "test_acc": 0.0274, + "lyapunov": null, + "grad_norm": 0.5034061589294716, + "grad_max_sv": 0.1581054452806711, + "grad_min_sv": 9.274782794554958e-09, + "grad_condition": 19574470.928057812, + "lr": 3.1359005254054254e-05, + "time_sec": 66.75138425827026 + }, + { + "epoch": 134, + "train_loss": 2.9077910748291016, + "train_acc": 0.2711, + "test_loss": 7.448024377441406, + "test_acc": 0.0294, + "lyapunov": null, + "grad_norm": 0.5046423793403062, + "grad_max_sv": 0.1635249551385641, + "grad_min_sv": 9.433638015199363e-09, + "grad_condition": 28668380.335333012, + "lr": 2.7811814881259484e-05, + "time_sec": 66.7329490184784 + }, + { + "epoch": 135, + "train_loss": 2.896955527267456, + "train_acc": 0.27268, + "test_loss": 7.478409793090821, + "test_acc": 0.028, + "lyapunov": null, + "grad_norm": 0.5037173672388571, + "grad_max_sv": 0.1622908242046833, + "grad_min_sv": 9.298784615918709e-09, + "grad_condition": 61773843.27193861, + "lr": 2.4471741852423218e-05, + "time_sec": 66.7459568977356 + }, + { + "epoch": 136, + "train_loss": 2.8964898432922364, + "train_acc": 0.27182, + "test_loss": 7.354159661865235, + "test_acc": 0.028, + "lyapunov": null, + "grad_norm": 0.5028619652958791, + "grad_max_sv": 0.1600797414779663, + "grad_min_sv": 9.074624002236575e-09, + "grad_condition": 22249764.299153708, + "lr": 2.1340251233966362e-05, + "time_sec": 66.75164866447449 + }, + { + "epoch": 137, + "train_loss": 2.895348368530273, + "train_acc": 0.27172, + "test_loss": 7.632054917144775, + "test_acc": 0.0281, + "lyapunov": null, + "grad_norm": 0.5031853951467254, + "grad_max_sv": 0.16463851928710938, + "grad_min_sv": 9.441171729823727e-09, + "grad_condition": 30855600.541313868, + "lr": 1.8418716601170932e-05, + "time_sec": 66.75186562538147 + }, + { + "epoch": 138, + "train_loss": 2.900583278427124, + "train_acc": 0.2717, + "test_loss": 7.199238876342774, + "test_acc": 0.0295, + "lyapunov": null, + "grad_norm": 0.5034869997386973, + "grad_max_sv": 0.16063327342271805, + "grad_min_sv": 9.296063535613186e-09, + "grad_condition": 25145907.489137426, + "lr": 1.570841943568445e-05, + "time_sec": 66.75230479240417 + }, + { + "epoch": 139, + "train_loss": 2.8933637355804445, + "train_acc": 0.27194, + "test_loss": 7.248442086029053, + "test_acc": 0.03, + "lyapunov": null, + "grad_norm": 0.504304603082473, + "grad_max_sv": 0.162884946167469, + "grad_min_sv": 9.367608214128075e-09, + "grad_condition": 19993036.722377926, + "lr": 1.3210548563419845e-05, + "time_sec": 66.7671320438385 + }, + { + "epoch": 140, + "train_loss": 2.894832459564209, + "train_acc": 0.27222, + "test_loss": 7.71000400390625, + "test_acc": 0.0294, + "lyapunov": null, + "grad_norm": 0.5047832470696201, + "grad_max_sv": 0.16155096814036368, + "grad_min_sv": 9.160464450874706e-09, + "grad_condition": 20567241.25641649, + "lr": 1.0926199633097203e-05, + "time_sec": 66.73179697990417 + }, + { + "epoch": 141, + "train_loss": 2.897352989578247, + "train_acc": 0.27064, + "test_loss": 7.4464299194335934, + "test_acc": 0.0313, + "lyapunov": null, + "grad_norm": 0.5061737427703262, + "grad_max_sv": 0.16413113810122013, + "grad_min_sv": 9.289870605763695e-09, + "grad_condition": 51343563.84333199, + "lr": 8.856374635655688e-06, + "time_sec": 66.75452041625977 + }, + { + "epoch": 142, + "train_loss": 2.8876253887939454, + "train_acc": 0.2751, + "test_loss": 7.67550869064331, + "test_acc": 0.0285, + "lyapunov": null, + "grad_norm": 0.50486204633145, + "grad_max_sv": 0.16515321880578995, + "grad_min_sv": 9.218709545733006e-09, + "grad_condition": 25662988.761511788, + "lr": 7.001981464747503e-06, + "time_sec": 66.76586389541626 + }, + { + "epoch": 143, + "train_loss": 2.8951072731781005, + "train_acc": 0.2711, + "test_loss": 7.276433151245117, + "test_acc": 0.0265, + "lyapunov": null, + "grad_norm": 0.5066003424324655, + "grad_max_sv": 0.16512982696294784, + "grad_min_sv": 9.368238332307932e-09, + "grad_condition": 20872282.150921334, + "lr": 5.3638335185058295e-06, + "time_sec": 66.77883982658386 + }, + { + "epoch": 144, + "train_loss": 2.896107662887573, + "train_acc": 0.27174, + "test_loss": 7.442941972351075, + "test_acc": 0.0282, + "lyapunov": null, + "grad_norm": 0.5058752626030726, + "grad_max_sv": 0.1646978858858347, + "grad_min_sv": 9.187450514258621e-09, + "grad_condition": 21323054.46289139, + "lr": 3.942649342761114e-06, + "time_sec": 66.74654960632324 + }, + { + "epoch": 145, + "train_loss": 2.8981069023132324, + "train_acc": 0.27052, + "test_loss": 7.511137809753418, + "test_acc": 0.0286, + "lyapunov": null, + "grad_norm": 0.5043941197302124, + "grad_max_sv": 0.16361674722284078, + "grad_min_sv": 9.248454605793876e-09, + "grad_condition": 124843071.51810357, + "lr": 2.7390523158633524e-06, + "time_sec": 66.71942782402039 + }, + { + "epoch": 146, + "train_loss": 2.897443035583496, + "train_acc": 0.27094, + "test_loss": 7.219273558044433, + "test_acc": 0.0301, + "lyapunov": null, + "grad_norm": 0.5044889597609223, + "grad_max_sv": 0.1617003157734871, + "grad_min_sv": 9.33726697904813e-09, + "grad_condition": 20578970.810026187, + "lr": 1.7535703752478133e-06, + "time_sec": 66.74967193603516 + }, + { + "epoch": 147, + "train_loss": 2.8972148944854736, + "train_acc": 0.27036, + "test_loss": 7.628332612609864, + "test_acc": 0.0279, + "lyapunov": null, + "grad_norm": 0.5052009377242357, + "grad_max_sv": 0.15890285596251488, + "grad_min_sv": 9.382556353555727e-09, + "grad_condition": 91821063.92388035, + "lr": 9.866357858642196e-07, + "time_sec": 66.73621463775635 + }, + { + "epoch": 148, + "train_loss": 2.8898702787017823, + "train_acc": 0.27194, + "test_loss": 7.505082284545899, + "test_acc": 0.0258, + "lyapunov": null, + "grad_norm": 0.5047197831030149, + "grad_max_sv": 0.16516413502395152, + "grad_min_sv": 9.324620061507139e-09, + "grad_condition": 43789169.5949554, + "lr": 4.38584950570808e-07, + "time_sec": 66.76141929626465 + }, + { + "epoch": 149, + "train_loss": 2.9011361352539065, + "train_acc": 0.26824, + "test_loss": 7.6542517242431645, + "test_acc": 0.0271, + "lyapunov": null, + "grad_norm": 0.5054339021083573, + "grad_max_sv": 0.16298294067382812, + "grad_min_sv": 9.178197371562114e-09, + "grad_condition": 21653740.393576562, + "lr": 1.096582625772501e-07, + "time_sec": 66.75421690940857 + }, + { + "epoch": 150, + "train_loss": 2.9011223357391356, + "train_acc": 0.27114, + "test_loss": 7.460437265014648, + "test_acc": 0.029, + "lyapunov": null, + "grad_norm": 0.5059469716903541, + "grad_max_sv": 0.16557817347347736, + "grad_min_sv": 9.153120701372967e-09, + "grad_condition": 361494763.7112081, + "lr": 0.0, + "time_sec": 66.78962397575378 + } + ] + }, + "lyapunov": { + "4": [ + { + "epoch": 1, + "train_loss": 4.580237577819824, + "train_acc": 0.07172, + "test_loss": 4.204835011291504, + "test_acc": 0.0865, + "lyapunov": 2.1020694111314273, + "grad_norm": 5.891421444416132, + "grad_max_sv": 4.6086235523223875, + "grad_min_sv": 1.0778671248878879e-07, + "grad_condition": 54871165.85509853, + "lr": 0.0009998903417374227, + "time_sec": 41.860575914382935 + }, + { + "epoch": 2, + "train_loss": 4.172055626296997, + "train_acc": 0.0921, + "test_loss": 4.402019414520264, + "test_acc": 0.0558, + "lyapunov": 1.6787975471647805, + "grad_norm": 3.9258769364442525, + "grad_max_sv": 2.9158192813396453, + "grad_min_sv": 7.291154454081017e-08, + "grad_condition": 84308361.49485277, + "lr": 0.0009995614150494292, + "time_sec": 41.754839181900024 + }, + { + "epoch": 3, + "train_loss": 4.050799645080566, + "train_acc": 0.10584, + "test_loss": 5.545398815917968, + "test_acc": 0.041, + "lyapunov": 1.5661922080437545, + "grad_norm": 3.128537052862856, + "grad_max_sv": 2.1766103327274324, + "grad_min_sv": 5.8618463349979774e-08, + "grad_condition": 41372858.502355784, + "lr": 0.0009990133642141358, + "time_sec": 41.694422006607056 + }, + { + "epoch": 4, + "train_loss": 3.9627039431762694, + "train_acc": 0.11682, + "test_loss": 6.328290705871582, + "test_acc": 0.0228, + "lyapunov": 1.5445425864070883, + "grad_norm": 2.5082278391489035, + "grad_max_sv": 1.6217471033334732, + "grad_min_sv": 4.5938650922172644e-08, + "grad_condition": 63153156.340209946, + "lr": 0.0009982464296247522, + "time_sec": 41.7418487071991 + }, + { + "epoch": 5, + "train_loss": 3.9077672985839844, + "train_acc": 0.1305, + "test_loss": 6.821084007263184, + "test_acc": 0.0156, + "lyapunov": 1.530182860086641, + "grad_norm": 2.041783975921356, + "grad_max_sv": 1.2541583150625228, + "grad_min_sv": 3.773506419557649e-08, + "grad_condition": 36438804.96965951, + "lr": 0.0009972609476841367, + "time_sec": 41.74874401092529 + }, + { + "epoch": 6, + "train_loss": 3.978193638305664, + "train_acc": 0.1273, + "test_loss": 10.715914828491211, + "test_acc": 0.015, + "lyapunov": 1.5294916736500344, + "grad_norm": 1.884529182522603, + "grad_max_sv": 1.174074074625969, + "grad_min_sv": 3.492432684992774e-08, + "grad_condition": 56687028.60603394, + "lr": 0.000996057350657239, + "time_sec": 41.79358172416687 + }, + { + "epoch": 7, + "train_loss": 4.028493068466187, + "train_acc": 0.12364, + "test_loss": 8.849580982971192, + "test_acc": 0.0108, + "lyapunov": 1.5220741317095354, + "grad_norm": 1.6311583818363289, + "grad_max_sv": 0.9764176219701767, + "grad_min_sv": 2.9745892293764343e-08, + "grad_condition": 38380014.867613696, + "lr": 0.000994636166481494, + "time_sec": 41.74577260017395 + }, + { + "epoch": 8, + "train_loss": 4.104167304382324, + "train_acc": 0.11452, + "test_loss": 9.404642602539063, + "test_acc": 0.0179, + "lyapunov": 1.5335235891439725, + "grad_norm": 1.4435862607793115, + "grad_max_sv": 0.8796723946928978, + "grad_min_sv": 2.6115679115784607e-08, + "grad_condition": 100856221.49209695, + "lr": 0.0009929980185352525, + "time_sec": 41.813751220703125 + }, + { + "epoch": 9, + "train_loss": 4.36510063079834, + "train_acc": 0.08636, + "test_loss": 7.074767668151855, + "test_acc": 0.0144, + "lyapunov": 1.5799841203957872, + "grad_norm": 1.3148798714645298, + "grad_max_sv": 0.7969768509268761, + "grad_min_sv": 2.3226430623246585e-08, + "grad_condition": 42533078.34572536, + "lr": 0.0009911436253643444, + "time_sec": 41.729400634765625 + }, + { + "epoch": 10, + "train_loss": 4.559664976348877, + "train_acc": 0.06118, + "test_loss": 6.018364582824707, + "test_acc": 0.01, + "lyapunov": 1.5615371959593596, + "grad_norm": 1.0712815395536825, + "grad_max_sv": 0.5929864205420017, + "grad_min_sv": 1.803380545450928e-08, + "grad_condition": 45789422.46232475, + "lr": 0.0009890738003669028, + "time_sec": 41.75548052787781 + }, + { + "epoch": 11, + "train_loss": 4.644180833282471, + "train_acc": 0.05202, + "test_loss": 6.277861665344238, + "test_acc": 0.01, + "lyapunov": 1.5085474514900266, + "grad_norm": 0.9280338123504958, + "grad_max_sv": 0.5784458503127098, + "grad_min_sv": 1.5023789502743857e-08, + "grad_condition": 63657686.089994095, + "lr": 0.00098678945143658, + "time_sec": 41.724050760269165 + }, + { + "epoch": 12, + "train_loss": 4.769687054901123, + "train_acc": 0.03436, + "test_loss": 7.280889709472656, + "test_acc": 0.01, + "lyapunov": 1.4389935622129904, + "grad_norm": 0.7003645750231552, + "grad_max_sv": 0.4854817561805248, + "grad_min_sv": 1.030722744932433e-08, + "grad_condition": 53249509.08795764, + "lr": 0.0009842915805643154, + "time_sec": 41.72962784767151 + }, + { + "epoch": 13, + "train_loss": 4.684542055053711, + "train_acc": 0.047, + "test_loss": 6.991418453979493, + "test_acc": 0.0112, + "lyapunov": 1.4236155184333588, + "grad_norm": 0.5991208192017541, + "grad_max_sv": 0.38398267030715943, + "grad_min_sv": 9.323978394926158e-09, + "grad_condition": 49967645.39513852, + "lr": 0.000981581283398829, + "time_sec": 41.743834018707275 + }, + { + "epoch": 14, + "train_loss": 4.875620534667969, + "train_acc": 0.02944, + "test_loss": 7.128801351165771, + "test_acc": 0.01, + "lyapunov": 1.427685697060412, + "grad_norm": 0.5025111739329319, + "grad_max_sv": 0.35512366965413095, + "grad_min_sv": 6.843199759284935e-09, + "grad_condition": 179836296.82542375, + "lr": 0.0009786597487660333, + "time_sec": 41.73904871940613 + }, + { + "epoch": 15, + "train_loss": 4.896511934967041, + "train_acc": 0.0335, + "test_loss": 17.298480625915527, + "test_acc": 0.01, + "lyapunov": 1.4632702230492516, + "grad_norm": 0.6331107294627782, + "grad_max_sv": 0.40708996057510377, + "grad_min_sv": 8.00606376749613e-09, + "grad_condition": 61874764.454221845, + "lr": 0.0009755282581475766, + "time_sec": 41.74419069290161 + }, + { + "epoch": 16, + "train_loss": 4.912100847015381, + "train_acc": 0.03632, + "test_loss": 8.131814362335206, + "test_acc": 0.0173, + "lyapunov": 1.4873096464235154, + "grad_norm": 0.826404597993897, + "grad_max_sv": 0.5076741345226765, + "grad_min_sv": 9.837833857273547e-09, + "grad_condition": 88718975.42972028, + "lr": 0.0009721881851187403, + "time_sec": 41.72049045562744 + }, + { + "epoch": 17, + "train_loss": 5.142030757446289, + "train_acc": 0.01672, + "test_loss": 6.458518544006347, + "test_acc": 0.01, + "lyapunov": 1.4868055615583649, + "grad_norm": 0.685951759542417, + "grad_max_sv": 0.5134769573807716, + "grad_min_sv": 7.799288968823869e-09, + "grad_condition": 85468742.13553956, + "lr": 0.0009686409947459456, + "time_sec": 41.73842525482178 + }, + { + "epoch": 18, + "train_loss": 5.188919100646973, + "train_acc": 0.00968, + "test_loss": 10.075014764404298, + "test_acc": 0.01, + "lyapunov": 1.4449111775059225, + "grad_norm": 0.4332247860431087, + "grad_max_sv": 0.3550705298781395, + "grad_min_sv": 4.337704034504397e-09, + "grad_condition": 117230068.9379596, + "lr": 0.0009648882429441254, + "time_sec": 41.763601779937744 + }, + { + "epoch": 19, + "train_loss": 5.226645467529297, + "train_acc": 0.01012, + "test_loss": 10.154055513000488, + "test_acc": 0.01, + "lyapunov": 1.4546792269362818, + "grad_norm": 0.3237987289049562, + "grad_max_sv": 0.2639503736048937, + "grad_min_sv": 2.060994466181133e-09, + "grad_condition": 14048870017.770252, + "lr": 0.00096093157579425, + "time_sec": 41.76903176307678 + }, + { + "epoch": 20, + "train_loss": 5.22861256149292, + "train_acc": 0.00962, + "test_loss": 9.159314030456542, + "test_acc": 0.01, + "lyapunov": 1.4311617704303674, + "grad_norm": 0.2580272391441697, + "grad_max_sv": 0.2014818772673607, + "grad_min_sv": 4.775887305801581e-11, + "grad_condition": 131599872645.97823, + "lr": 0.0009567727288213001, + "time_sec": 41.77689838409424 + }, + { + "epoch": 21, + "train_loss": 5.2369175091552735, + "train_acc": 0.0091, + "test_loss": 9.329907885742188, + "test_acc": 0.01, + "lyapunov": 1.4427513545736328, + "grad_norm": 0.20829668219493744, + "grad_max_sv": 0.15635721795260907, + "grad_min_sv": 7.96448125755094e-11, + "grad_condition": 123768275801.26958, + "lr": 0.0009524135262330095, + "time_sec": 41.749500036239624 + }, + { + "epoch": 22, + "train_loss": 5.232069122619629, + "train_acc": 0.00928, + "test_loss": 8.256287899780274, + "test_acc": 0.01, + "lyapunov": 1.43826272115683, + "grad_norm": 0.18574459317073533, + "grad_max_sv": 0.13343477975577117, + "grad_min_sv": 3.891468616243542e-11, + "grad_condition": 128132122536.13669, + "lr": 0.0009478558801197061, + "time_sec": 41.73808455467224 + }, + { + "epoch": 23, + "train_loss": 5.223144430541992, + "train_acc": 0.00912, + "test_loss": 8.333074249267579, + "test_acc": 0.01, + "lyapunov": 1.431471188659863, + "grad_norm": 0.15147554959008916, + "grad_max_sv": 0.10204733423888683, + "grad_min_sv": 2.03341283080962e-15, + "grad_condition": 101827814032.01648, + "lr": 0.000943101789615607, + "time_sec": 41.746745347976685 + }, + { + "epoch": 24, + "train_loss": 5.233420145263672, + "train_acc": 0.00942, + "test_loss": 7.730482585906983, + "test_acc": 0.01, + "lyapunov": 1.443052962917806, + "grad_norm": 0.1288834602441298, + "grad_max_sv": 0.07254640674218535, + "grad_min_sv": 1.1788800604957402e-13, + "grad_condition": 69609233199.00801, + "lr": 0.0009381533400219313, + "time_sec": 41.73458123207092 + }, + { + "epoch": 25, + "train_loss": 5.248794226074219, + "train_acc": 0.01224, + "test_loss": 6.550568232727051, + "test_acc": 0.01, + "lyapunov": 1.4743182287191796, + "grad_norm": 0.19543413013737237, + "grad_max_sv": 0.08613794101402164, + "grad_min_sv": 6.309014754681635e-11, + "grad_condition": 60792110328.20559, + "lr": 0.0009330127018922189, + "time_sec": 41.73256278038025 + }, + { + "epoch": 26, + "train_loss": 5.226683191070556, + "train_acc": 0.00892, + "test_loss": 5.647989534759522, + "test_acc": 0.01, + "lyapunov": 1.434842828289627, + "grad_norm": 0.14721341402984697, + "grad_max_sv": 0.09509434262290598, + "grad_min_sv": 1.0618768151186443e-15, + "grad_condition": 94978842737.15823, + "lr": 0.000927682130080253, + "time_sec": 41.72614550590515 + }, + { + "epoch": 27, + "train_loss": 5.229176857604981, + "train_acc": 0.00972, + "test_loss": 5.612284447479248, + "test_acc": 0.01, + "lyapunov": 1.4389631537830128, + "grad_norm": 0.1286875557895635, + "grad_max_sv": 0.07554986858740449, + "grad_min_sv": 1.9029346441684858e-16, + "grad_condition": 75528406184.49973, + "lr": 0.0009221639627510072, + "time_sec": 41.73252606391907 + }, + { + "epoch": 28, + "train_loss": 5.226171473999023, + "train_acc": 0.00934, + "test_loss": 5.924600332641601, + "test_acc": 0.01, + "lyapunov": 1.4371787568797236, + "grad_norm": 0.10743150341998972, + "grad_max_sv": 0.048194893449544904, + "grad_min_sv": 0.0, + "grad_condition": 48194893449.54491, + "lr": 0.0009164606203550494, + "time_sec": 41.72467064857483 + }, + { + "epoch": 29, + "train_loss": 5.230549348297119, + "train_acc": 0.00932, + "test_loss": 5.312363116455078, + "test_acc": 0.01, + "lyapunov": 1.4417800442946842, + "grad_norm": 0.10913623720356962, + "grad_max_sv": 0.050634372420608996, + "grad_min_sv": 0.0, + "grad_condition": 50634372420.60899, + "lr": 0.0009105746045668516, + "time_sec": 41.754605531692505 + }, + { + "epoch": 30, + "train_loss": 5.229708560028076, + "train_acc": 0.0092, + "test_loss": 5.395946918487549, + "test_acc": 0.01, + "lyapunov": 1.441019511588699, + "grad_norm": 0.10497591874908667, + "grad_max_sv": 0.04387410613708198, + "grad_min_sv": 0.0, + "grad_condition": 43874106137.081985, + "lr": 0.0009045084971874733, + "time_sec": 41.71743130683899 + }, + { + "epoch": 31, + "train_loss": 5.2316739025878904, + "train_acc": 0.00982, + "test_loss": 6.248269965362549, + "test_acc": 0.01, + "lyapunov": 1.443965878023211, + "grad_norm": 0.10154022323683165, + "grad_max_sv": 0.03353279777802527, + "grad_min_sv": 0.0, + "grad_condition": 33532797778.02527, + "lr": 0.0008982649590120977, + "time_sec": 41.701202392578125 + }, + { + "epoch": 32, + "train_loss": 5.23400792678833, + "train_acc": 0.00938, + "test_loss": 5.782683653259277, + "test_acc": 0.01, + "lyapunov": 1.446322088046452, + "grad_norm": 0.10537953489915908, + "grad_max_sv": 0.04410789059475064, + "grad_min_sv": 0.0, + "grad_condition": 44107890594.75064, + "lr": 0.0008918467286629196, + "time_sec": 41.70464754104614 + }, + { + "epoch": 33, + "train_loss": 5.232683167877197, + "train_acc": 0.00858, + "test_loss": 5.318116857910156, + "test_acc": 0.01, + "lyapunov": 1.4452067232497818, + "grad_norm": 0.1008655295742077, + "grad_max_sv": 0.03291638647206128, + "grad_min_sv": 0.0, + "grad_condition": 32916386472.06128, + "lr": 0.0008852566213878943, + "time_sec": 41.68885540962219 + }, + { + "epoch": 34, + "train_loss": 5.237297785339355, + "train_acc": 0.00966, + "test_loss": 5.309081327819825, + "test_acc": 0.01, + "lyapunov": 1.450283215783746, + "grad_norm": 0.10345313863412257, + "grad_max_sv": 0.04121980397030711, + "grad_min_sv": 0.0, + "grad_condition": 41219803970.30711, + "lr": 0.000878497527825878, + "time_sec": 41.72196674346924 + }, + { + "epoch": 35, + "train_loss": 5.240170780029297, + "train_acc": 0.00886, + "test_loss": 5.1140812942504885, + "test_acc": 0.01, + "lyapunov": 1.4520895359156383, + "grad_norm": 0.10252991679320593, + "grad_max_sv": 0.038473002053797244, + "grad_min_sv": 0.0, + "grad_condition": 38473002053.79725, + "lr": 0.000871572412738697, + "time_sec": 41.704707622528076 + }, + { + "epoch": 36, + "train_loss": 5.237992069244385, + "train_acc": 0.0091, + "test_loss": 5.254914206695557, + "test_acc": 0.01, + "lyapunov": 1.4511004372326004, + "grad_norm": 0.1034357825731679, + "grad_max_sv": 0.03689436963759363, + "grad_min_sv": 0.0, + "grad_condition": 36894369637.59363, + "lr": 0.0008644843137107055, + "time_sec": 41.68847870826721 + }, + { + "epoch": 37, + "train_loss": 5.24728928100586, + "train_acc": 0.00948, + "test_loss": 5.015587938690185, + "test_acc": 0.01, + "lyapunov": 1.4593792114111468, + "grad_norm": 0.10030700112378006, + "grad_max_sv": 0.027813022676855325, + "grad_min_sv": 0.0, + "grad_condition": 27813022676.855324, + "lr": 0.0008572363398164014, + "time_sec": 41.67623424530029 + }, + { + "epoch": 38, + "train_loss": 5.240536932220459, + "train_acc": 0.0092, + "test_loss": 4.961225141906739, + "test_acc": 0.01, + "lyapunov": 1.454334620319669, + "grad_norm": 0.09505358413147648, + "grad_max_sv": 0.022648979304358365, + "grad_min_sv": 0.0, + "grad_condition": 22648979304.35836, + "lr": 0.0008498316702566826, + "time_sec": 41.65856647491455 + }, + { + "epoch": 39, + "train_loss": 5.24094622467041, + "train_acc": 0.00906, + "test_loss": 4.902838454437256, + "test_acc": 0.01, + "lyapunov": 1.4547367199607517, + "grad_norm": 0.09365021131775912, + "grad_max_sv": 0.02316552624106407, + "grad_min_sv": 0.0, + "grad_condition": 23165526241.06407, + "lr": 0.0008422735529643442, + "time_sec": 41.66074347496033 + }, + { + "epoch": 40, + "train_loss": 5.245578489685059, + "train_acc": 0.00954, + "test_loss": 4.859429032897949, + "test_acc": 0.01, + "lyapunov": 1.4598181689791667, + "grad_norm": 0.10147367716516044, + "grad_max_sv": 0.023039095243439077, + "grad_min_sv": 0.0, + "grad_condition": 23039095243.43908, + "lr": 0.0008345653031794289, + "time_sec": 41.646554708480835 + }, + { + "epoch": 41, + "train_loss": 5.245340968780518, + "train_acc": 0.00972, + "test_loss": 5.133834055328369, + "test_acc": 0.01, + "lyapunov": 1.4597191298404313, + "grad_norm": 0.09983575491941106, + "grad_max_sv": 0.023509565647691487, + "grad_min_sv": 0.0, + "grad_condition": 23509565647.69149, + "lr": 0.0008267103019950526, + "time_sec": 41.67466497421265 + }, + { + "epoch": 42, + "train_loss": 5.243727160949707, + "train_acc": 0.0094, + "test_loss": 5.177202513122559, + "test_acc": 0.01, + "lyapunov": 1.457551447936641, + "grad_norm": 0.10012844556744109, + "grad_max_sv": 0.04022635291330516, + "grad_min_sv": 0.0, + "grad_condition": 40226352913.30516, + "lr": 0.0008187119948743447, + "time_sec": 41.69778633117676 + }, + { + "epoch": 43, + "train_loss": 5.245192972717285, + "train_acc": 0.00916, + "test_loss": 4.837023108673096, + "test_acc": 0.01, + "lyapunov": 1.4592695629505246, + "grad_norm": 0.0977089071025598, + "grad_max_sv": 0.02978864456526935, + "grad_min_sv": 0.0, + "grad_condition": 29788644565.269356, + "lr": 0.000810573890139155, + "time_sec": 41.68951177597046 + }, + { + "epoch": 44, + "train_loss": 5.2786666191101075, + "train_acc": 0.01064, + "test_loss": 5.4122274887084965, + "test_acc": 0.01, + "lyapunov": 1.5007501855835585, + "grad_norm": 0.12265113875538343, + "grad_max_sv": 0.033590356819331646, + "grad_min_sv": 5.169785690831125e-14, + "grad_condition": 31777859057.197426, + "lr": 0.0008022995574311873, + "time_sec": 41.67222714424133 + }, + { + "epoch": 45, + "train_loss": 5.251278916320801, + "train_acc": 0.00912, + "test_loss": 5.717527485656738, + "test_acc": 0.01, + "lyapunov": 1.4666499061047877, + "grad_norm": 0.09464479083441923, + "grad_max_sv": 0.015212097018957139, + "grad_min_sv": 0.0, + "grad_condition": 15212097018.957138, + "lr": 0.0007938926261462363, + "time_sec": 41.66761112213135 + }, + { + "epoch": 46, + "train_loss": 5.248660043487549, + "train_acc": 0.00922, + "test_loss": 5.687412886047364, + "test_acc": 0.01, + "lyapunov": 1.4640466523597309, + "grad_norm": 0.09250900682814509, + "grad_max_sv": 0.00974161345511675, + "grad_min_sv": 0.0, + "grad_condition": 9741613455.116749, + "lr": 0.0007853567838422158, + "time_sec": 41.62896704673767 + }, + { + "epoch": 47, + "train_loss": 5.249529778289795, + "train_acc": 0.00976, + "test_loss": 5.35712462310791, + "test_acc": 0.01, + "lyapunov": 1.4639555450595554, + "grad_norm": 0.09683136939926335, + "grad_max_sv": 0.02266658809967339, + "grad_min_sv": 0.0, + "grad_condition": 22666588099.67339, + "lr": 0.0007766957746216719, + "time_sec": 41.632965326309204 + }, + { + "epoch": 48, + "train_loss": 5.2507288345336915, + "train_acc": 0.00952, + "test_loss": 5.053029971313476, + "test_acc": 0.01, + "lyapunov": 1.46576005692982, + "grad_norm": 0.09407593048273037, + "grad_max_sv": 0.027120837941765785, + "grad_min_sv": 0.0, + "grad_condition": 27120837941.765785, + "lr": 0.0007679133974894982, + "time_sec": 41.65870714187622 + }, + { + "epoch": 49, + "train_loss": 5.249875890960693, + "train_acc": 0.00884, + "test_loss": 5.38174955444336, + "test_acc": 0.01, + "lyapunov": 1.465318091690083, + "grad_norm": 0.09064589183935413, + "grad_max_sv": 0.008867102395743131, + "grad_min_sv": 0.0, + "grad_condition": 8867102395.743132, + "lr": 0.000759013504686565, + "time_sec": 41.735912561416626 + }, + { + "epoch": 50, + "train_loss": 5.250207867889404, + "train_acc": 0.00898, + "test_loss": 5.739707115173339, + "test_acc": 0.01, + "lyapunov": 1.4655792646091004, + "grad_norm": 0.09717189190349201, + "grad_max_sv": 0.021169214555993677, + "grad_min_sv": 0.0, + "grad_condition": 21169214555.993675, + "lr": 0.0007499999999999998, + "time_sec": 41.72933316230774 + }, + { + "epoch": 51, + "train_loss": 5.250648717803955, + "train_acc": 0.00912, + "test_loss": 6.128197521972656, + "test_acc": 0.01, + "lyapunov": 1.4661765546749925, + "grad_norm": 0.09095698035941559, + "grad_max_sv": 0.01055141636170447, + "grad_min_sv": 0.0, + "grad_condition": 10551416361.704468, + "lr": 0.0007408768370508575, + "time_sec": 41.69919180870056 + }, + { + "epoch": 52, + "train_loss": 5.251839170684814, + "train_acc": 0.00908, + "test_loss": 6.067484506225586, + "test_acc": 0.01, + "lyapunov": 1.4675627587091586, + "grad_norm": 0.09067609636620885, + "grad_max_sv": 0.004669012082740664, + "grad_min_sv": 0.0, + "grad_condition": 4669012082.7406645, + "lr": 0.0007316480175599307, + "time_sec": 41.654059171676636 + }, + { + "epoch": 53, + "train_loss": 5.253518835144043, + "train_acc": 0.00896, + "test_loss": 5.7827218193054195, + "test_acc": 0.01, + "lyapunov": 1.4693938874832504, + "grad_norm": 0.09137616955031719, + "grad_max_sv": 0.010091183660551905, + "grad_min_sv": 0.0, + "grad_condition": 10091183660.551905, + "lr": 0.0007223175895924635, + "time_sec": 41.642850160598755 + }, + { + "epoch": 54, + "train_loss": 5.254051934051514, + "train_acc": 0.00872, + "test_loss": 5.591477861022949, + "test_acc": 0.01, + "lyapunov": 1.4702323230026324, + "grad_norm": 0.08996816491022355, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825361, + "time_sec": 41.657779932022095 + }, + { + "epoch": 55, + "train_loss": 5.255190885314941, + "train_acc": 0.00916, + "test_loss": 5.435504406738281, + "test_acc": 0.01, + "lyapunov": 1.4712699441348804, + "grad_norm": 0.09391959822012276, + "grad_max_sv": 0.005470911040902138, + "grad_min_sv": 0.0, + "grad_condition": 5470911040.902138, + "lr": 0.0007033683215378998, + "time_sec": 41.70645236968994 + }, + { + "epoch": 56, + "train_loss": 5.254567480010986, + "train_acc": 0.0092, + "test_loss": 5.745911796569824, + "test_acc": 0.01, + "lyapunov": 1.470891768670143, + "grad_norm": 0.08856701808364516, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006937577932260512, + "time_sec": 41.71012330055237 + }, + { + "epoch": 57, + "train_loss": 5.255953155822754, + "train_acc": 0.00902, + "test_loss": 5.410791555023193, + "test_acc": 0.01, + "lyapunov": 1.4723095774955457, + "grad_norm": 0.0914524874609732, + "grad_max_sv": 0.005876953201368451, + "grad_min_sv": 0.0, + "grad_condition": 5876953201.368451, + "lr": 0.0006840622763423388, + "time_sec": 41.65397572517395 + }, + { + "epoch": 58, + "train_loss": 5.255620794372558, + "train_acc": 0.00814, + "test_loss": 5.248719776153565, + "test_acc": 0.01, + "lyapunov": 1.4720726202211112, + "grad_norm": 0.08957407910190007, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006742860236609073, + "time_sec": 41.596808195114136 + }, + { + "epoch": 59, + "train_loss": 5.256758173370361, + "train_acc": 0.00904, + "test_loss": 5.839924575805664, + "test_acc": 0.01, + "lyapunov": 1.4729903738212098, + "grad_norm": 0.09261814392317223, + "grad_max_sv": 0.016021678689867258, + "grad_min_sv": 0.0, + "grad_condition": 16021678689.867258, + "lr": 0.0006644333233692913, + "time_sec": 41.65124177932739 + }, + { + "epoch": 60, + "train_loss": 5.256810084991455, + "train_acc": 0.00942, + "test_loss": 5.447851982879639, + "test_acc": 0.01, + "lyapunov": 1.4729429684636537, + "grad_norm": 0.09328751710854948, + "grad_max_sv": 0.018184319231659175, + "grad_min_sv": 0.0, + "grad_condition": 18184319231.659172, + "lr": 0.0006545084971874734, + "time_sec": 41.677849769592285 + }, + { + "epoch": 61, + "train_loss": 5.257736980895996, + "train_acc": 0.00956, + "test_loss": 5.214775198364258, + "test_acc": 0.01, + "lyapunov": 1.4742664586552574, + "grad_norm": 0.09141104511491621, + "grad_max_sv": 0.014100066805258393, + "grad_min_sv": 0.0, + "grad_condition": 14100066805.258392, + "lr": 0.0006445158984722354, + "time_sec": 41.65701365470886 + }, + { + "epoch": 62, + "train_loss": 5.257541732788086, + "train_acc": 0.00888, + "test_loss": 5.395826309204102, + "test_acc": 0.01, + "lyapunov": 1.4742513254780294, + "grad_norm": 0.08871521712913655, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006344599103076324, + "time_sec": 41.64438438415527 + }, + { + "epoch": 63, + "train_loss": 5.258026624908447, + "train_acc": 0.00826, + "test_loss": 5.438673513793946, + "test_acc": 0.01, + "lyapunov": 1.474777021066612, + "grad_norm": 0.08974006980177573, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824269, + "time_sec": 41.659621477127075 + }, + { + "epoch": 64, + "train_loss": 5.256656706237793, + "train_acc": 0.00858, + "test_loss": 5.30103558959961, + "test_acc": 0.01, + "lyapunov": 1.4732483726023409, + "grad_norm": 0.08966165557801938, + "grad_max_sv": 0.002812969218939543, + "grad_min_sv": 0.0, + "grad_condition": 2812969218.939543, + "lr": 0.0006141754350553275, + "time_sec": 41.680859327316284 + }, + { + "epoch": 65, + "train_loss": 5.25918576675415, + "train_acc": 0.00894, + "test_loss": 5.125008965301514, + "test_acc": 0.01, + "lyapunov": 1.4760865912108165, + "grad_norm": 0.0887662183827418, + "grad_max_sv": 0.0005635306239128113, + "grad_min_sv": 0.0, + "grad_condition": 563530623.9128113, + "lr": 0.0006039558454088793, + "time_sec": 41.60912251472473 + }, + { + "epoch": 66, + "train_loss": 5.260574841461182, + "train_acc": 0.00874, + "test_loss": 5.454896185302735, + "test_acc": 0.01, + "lyapunov": 1.4776358738579713, + "grad_norm": 0.11531617666338094, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000593690657292862, + "time_sec": 41.6300413608551 + }, + { + "epoch": 67, + "train_loss": 5.259261641082763, + "train_acc": 0.00928, + "test_loss": 5.808028590393066, + "test_acc": 0.01, + "lyapunov": 1.4762413047463692, + "grad_norm": 0.08815522678931535, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005833843733580507, + "time_sec": 41.62497115135193 + }, + { + "epoch": 68, + "train_loss": 5.2594527183532715, + "train_acc": 0.00938, + "test_loss": 5.654487629699707, + "test_acc": 0.01, + "lyapunov": 1.4761893337644885, + "grad_norm": 0.09333979255701338, + "grad_max_sv": 0.014018809190019965, + "grad_min_sv": 0.0, + "grad_condition": 14018809190.019964, + "lr": 0.0005730415142812054, + "time_sec": 41.621119260787964 + }, + { + "epoch": 69, + "train_loss": 5.26328825378418, + "train_acc": 0.00966, + "test_loss": 5.534258514404297, + "test_acc": 0.01, + "lyapunov": 1.4803016765038375, + "grad_norm": 0.10303270455881028, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821517, + "time_sec": 41.61156606674194 + }, + { + "epoch": 70, + "train_loss": 5.261220071105957, + "train_acc": 0.00968, + "test_loss": 5.542517721557617, + "test_acc": 0.01, + "lyapunov": 1.4784168117796368, + "grad_norm": 0.08844874021214537, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005522642316338265, + "time_sec": 41.62671518325806 + }, + { + "epoch": 71, + "train_loss": 5.260938765716553, + "train_acc": 0.00862, + "test_loss": 5.420013078308106, + "test_acc": 0.01, + "lyapunov": 1.4779477622502906, + "grad_norm": 0.0889283460956175, + "grad_max_sv": 0.0034733008593320846, + "grad_min_sv": 0.0, + "grad_condition": 3473300859.3320847, + "lr": 0.0005418389216661573, + "time_sec": 41.62442445755005 + }, + { + "epoch": 72, + "train_loss": 5.260601893157959, + "train_acc": 0.00902, + "test_loss": 5.176327791595459, + "test_acc": 0.01, + "lyapunov": 1.4776618431901078, + "grad_norm": 0.0902718541800826, + "grad_max_sv": 0.012300812685862184, + "grad_min_sv": 0.0, + "grad_condition": 12300812685.862183, + "lr": 0.0005313952597646563, + "time_sec": 41.66868996620178 + }, + { + "epoch": 73, + "train_loss": 5.264250277404785, + "train_acc": 0.00884, + "test_loss": 5.100635796356201, + "test_acc": 0.01, + "lyapunov": 1.4813997955883251, + "grad_norm": 0.0903405536598621, + "grad_max_sv": 0.007483795657753945, + "grad_min_sv": 0.0, + "grad_condition": 7483795657.7539425, + "lr": 0.0005209378268645994, + "time_sec": 41.626320600509644 + }, + { + "epoch": 74, + "train_loss": 5.26120802658081, + "train_acc": 0.0087, + "test_loss": 5.235371070861817, + "test_acc": 0.01, + "lyapunov": 1.4784196508510032, + "grad_norm": 0.0879091159548037, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005104712099416781, + "time_sec": 41.62154483795166 + }, + { + "epoch": 75, + "train_loss": 5.267138383178711, + "train_acc": 0.00858, + "test_loss": 4.973852683258056, + "test_acc": 0.01, + "lyapunov": 1.4819577859185846, + "grad_norm": 0.08881358787274304, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004999999999999996, + "time_sec": 41.638519048690796 + }, + { + "epoch": 76, + "train_loss": 5.2642199221801755, + "train_acc": 0.00822, + "test_loss": 5.071284794616699, + "test_acc": 0.01, + "lyapunov": 1.4816657048661996, + "grad_norm": 0.08882388372557563, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004895287900583212, + "time_sec": 41.619221925735474 + }, + { + "epoch": 77, + "train_loss": 5.273737740020752, + "train_acc": 0.00884, + "test_loss": 4.974697065734864, + "test_acc": 0.01, + "lyapunov": 1.490840724667015, + "grad_norm": 0.08942192638502924, + "grad_max_sv": 0.0068177991081029175, + "grad_min_sv": 0.0, + "grad_condition": 6817799108.102918, + "lr": 0.0004790621731353997, + "time_sec": 41.63776922225952 + }, + { + "epoch": 78, + "train_loss": 5.261278802490234, + "train_acc": 0.00874, + "test_loss": 4.976500602722168, + "test_acc": 0.01, + "lyapunov": 1.4785530381190501, + "grad_norm": 0.0880515343100226, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000468604740235343, + "time_sec": 41.607832193374634 + }, + { + "epoch": 79, + "train_loss": 5.263828933258057, + "train_acc": 0.00816, + "test_loss": 4.9257099716186525, + "test_acc": 0.01, + "lyapunov": 1.4813517496713897, + "grad_norm": 0.08863134124223197, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00045816107833384175, + "time_sec": 41.631874561309814 + }, + { + "epoch": 80, + "train_loss": 5.268178493652344, + "train_acc": 0.00912, + "test_loss": 4.912583598327637, + "test_acc": 0.01, + "lyapunov": 1.4849315034154127, + "grad_norm": 0.08860861584524822, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004477357683661729, + "time_sec": 41.710554122924805 + }, + { + "epoch": 81, + "train_loss": 5.26138502532959, + "train_acc": 0.00922, + "test_loss": 4.878695037841797, + "test_acc": 0.01, + "lyapunov": 1.478672110820975, + "grad_norm": 0.09157782940494599, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784746, + "time_sec": 41.64098763465881 + }, + { + "epoch": 82, + "train_loss": 5.268409018859863, + "train_acc": 0.00922, + "test_loss": 4.908391270446777, + "test_acc": 0.01, + "lyapunov": 1.4861254643296342, + "grad_norm": 0.11020465642062108, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004269584857187939, + "time_sec": 41.60934782028198 + }, + { + "epoch": 83, + "train_loss": 5.265614703063965, + "train_acc": 0.00942, + "test_loss": 4.864893129730224, + "test_acc": 0.01, + "lyapunov": 1.4825067782341061, + "grad_norm": 0.09011764156233357, + "grad_max_sv": 0.002433748124167323, + "grad_min_sv": 0.0, + "grad_condition": 2433748124.167323, + "lr": 0.0004166156266419484, + "time_sec": 41.60301470756531 + }, + { + "epoch": 84, + "train_loss": 5.262646561889649, + "train_acc": 0.0091, + "test_loss": 4.719803262329101, + "test_acc": 0.01, + "lyapunov": 1.4800378392114664, + "grad_norm": 0.08987030714157009, + "grad_max_sv": 0.005705382255837321, + "grad_min_sv": 0.0, + "grad_condition": 5705382255.837321, + "lr": 0.0004063093427071373, + "time_sec": 41.6301634311676 + }, + { + "epoch": 85, + "train_loss": 5.263007119445801, + "train_acc": 0.00892, + "test_loss": 4.765390521240234, + "test_acc": 0.01, + "lyapunov": 1.4803728941456435, + "grad_norm": 0.08908420576392925, + "grad_max_sv": 0.005673544481396675, + "grad_min_sv": 0.0, + "grad_condition": 5673544481.396675, + "lr": 0.0003960441545911199, + "time_sec": 41.6158664226532 + }, + { + "epoch": 86, + "train_loss": 5.261938611297607, + "train_acc": 0.00896, + "test_loss": 4.7486605583190915, + "test_acc": 0.01, + "lyapunov": 1.479363068900145, + "grad_norm": 0.08783615573103698, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003858245649446718, + "time_sec": 41.63826298713684 + }, + { + "epoch": 87, + "train_loss": 5.263675572814941, + "train_acc": 0.00854, + "test_loss": 4.729234335327148, + "test_acc": 0.01, + "lyapunov": 1.481331856354423, + "grad_norm": 0.08839938213840319, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00037565505641757235, + "time_sec": 41.63784456253052 + }, + { + "epoch": 88, + "train_loss": 5.262854153900147, + "train_acc": 0.00876, + "test_loss": 4.702548780822754, + "test_acc": 0.01, + "lyapunov": 1.4803594689235053, + "grad_norm": 0.08793981551347788, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036554008969236695, + "time_sec": 41.71681451797485 + }, + { + "epoch": 89, + "train_loss": 5.2630352787780765, + "train_acc": 0.00878, + "test_loss": 4.71384239654541, + "test_acc": 0.01, + "lyapunov": 1.4806065233162298, + "grad_norm": 0.08814160681144886, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003554841015277638, + "time_sec": 41.7017023563385 + }, + { + "epoch": 90, + "train_loss": 5.262895381469726, + "train_acc": 0.00916, + "test_loss": 4.708866213226318, + "test_acc": 0.01, + "lyapunov": 1.4804326811105089, + "grad_norm": 0.08915485528106772, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000345491502812526, + "time_sec": 41.66344165802002 + }, + { + "epoch": 91, + "train_loss": 5.2640660131835935, + "train_acc": 0.00894, + "test_loss": 4.7449420501708985, + "test_acc": 0.01, + "lyapunov": 1.481703461588496, + "grad_norm": 0.09104557989631236, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003355666766307081, + "time_sec": 41.65228295326233 + }, + { + "epoch": 92, + "train_loss": 5.2634638612365725, + "train_acc": 0.00882, + "test_loss": 4.755833000946045, + "test_acc": 0.01, + "lyapunov": 1.4810923280008614, + "grad_norm": 0.08888836178350999, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00032571397633909225, + "time_sec": 41.6901330947876 + }, + { + "epoch": 93, + "train_loss": 5.264835737762451, + "train_acc": 0.00874, + "test_loss": 4.721351288604736, + "test_acc": 0.01, + "lyapunov": 1.4826934395543754, + "grad_norm": 0.08947356736587055, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766094, + "time_sec": 41.6052131652832 + }, + { + "epoch": 94, + "train_loss": 5.263670272369385, + "train_acc": 0.00868, + "test_loss": 4.785962379455566, + "test_acc": 0.01, + "lyapunov": 1.4813081669380597, + "grad_norm": 0.08849247443481073, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003062422067739483, + "time_sec": 41.60963582992554 + }, + { + "epoch": 95, + "train_loss": 5.2619873828125, + "train_acc": 0.00798, + "test_loss": 4.723102865600586, + "test_acc": 0.01, + "lyapunov": 1.479443594927678, + "grad_norm": 0.08787170616898271, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00029663167846209965, + "time_sec": 41.6090726852417 + }, + { + "epoch": 96, + "train_loss": 5.264093981323242, + "train_acc": 0.00886, + "test_loss": 4.719023175048828, + "test_acc": 0.01, + "lyapunov": 1.4818146923923736, + "grad_norm": 0.08820019238952795, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00028711035421746345, + "time_sec": 41.62479615211487 + }, + { + "epoch": 97, + "train_loss": 5.2660337771606445, + "train_acc": 0.00826, + "test_loss": 4.683718409729004, + "test_acc": 0.01, + "lyapunov": 1.4838567975232058, + "grad_norm": 0.08832542758192675, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00027768241040753615, + "time_sec": 41.61792826652527 + }, + { + "epoch": 98, + "train_loss": 5.264854827270508, + "train_acc": 0.00872, + "test_loss": 4.66099263305664, + "test_acc": 0.01, + "lyapunov": 1.4826005797861788, + "grad_norm": 0.08770768444548716, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00026835198244006903, + "time_sec": 41.65434980392456 + }, + { + "epoch": 99, + "train_loss": 5.26445282623291, + "train_acc": 0.00872, + "test_loss": 4.680420280456543, + "test_acc": 0.01, + "lyapunov": 1.482219386588582, + "grad_norm": 0.08789455257207789, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002591231629491421, + "time_sec": 41.626431465148926 + }, + { + "epoch": 100, + "train_loss": 5.267974179992676, + "train_acc": 0.00926, + "test_loss": 4.719721762084961, + "test_acc": 0.01, + "lyapunov": 1.4858673469489798, + "grad_norm": 0.08804026825834858, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002499999999999997, + "time_sec": 41.61785125732422 + }, + { + "epoch": 101, + "train_loss": 5.265785012969971, + "train_acc": 0.00908, + "test_loss": 4.677582652282715, + "test_acc": 0.01, + "lyapunov": 1.4835739272939579, + "grad_norm": 0.08811206484625347, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00024098649531343477, + "time_sec": 41.61317491531372 + }, + { + "epoch": 102, + "train_loss": 5.262550980682373, + "train_acc": 0.00804, + "test_loss": 4.721813179779053, + "test_acc": 0.01, + "lyapunov": 1.4801046043405752, + "grad_norm": 0.08851673086495025, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002320866025105016, + "time_sec": 41.67564344406128 + }, + { + "epoch": 103, + "train_loss": 5.2642667413330075, + "train_acc": 0.00882, + "test_loss": 4.740510238647461, + "test_acc": 0.01, + "lyapunov": 1.4820212802618666, + "grad_norm": 0.08821117687751044, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002233042253783278, + "time_sec": 41.63251256942749 + }, + { + "epoch": 104, + "train_loss": 5.263534827728272, + "train_acc": 0.0081, + "test_loss": 4.700486143493652, + "test_acc": 0.01, + "lyapunov": 1.4811951995200818, + "grad_norm": 0.08907217589685106, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000214643216157784, + "time_sec": 41.62003540992737 + }, + { + "epoch": 105, + "train_loss": 5.263595247192383, + "train_acc": 0.00866, + "test_loss": 4.685244355773926, + "test_acc": 0.01, + "lyapunov": 1.4812764624500518, + "grad_norm": 0.087999698905291, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376332, + "time_sec": 41.59307098388672 + }, + { + "epoch": 106, + "train_loss": 5.2640459841918945, + "train_acc": 0.00788, + "test_loss": 4.679230912780762, + "test_acc": 0.01, + "lyapunov": 1.481674498914148, + "grad_norm": 0.08791576128060906, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019770044256881242, + "time_sec": 41.62804102897644 + }, + { + "epoch": 107, + "train_loss": 5.264458420715332, + "train_acc": 0.00878, + "test_loss": 4.693680247497559, + "test_acc": 0.01, + "lyapunov": 1.4822333346852257, + "grad_norm": 0.0877864562223225, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001894261098608447, + "time_sec": 41.72821760177612 + }, + { + "epoch": 108, + "train_loss": 5.263148934020996, + "train_acc": 0.0092, + "test_loss": 4.703213790130615, + "test_acc": 0.01, + "lyapunov": 1.480785415300628, + "grad_norm": 0.08786524330498742, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000181288005125655, + "time_sec": 41.68737983703613 + }, + { + "epoch": 109, + "train_loss": 5.264703175201416, + "train_acc": 0.0078, + "test_loss": 4.703215410614014, + "test_acc": 0.01, + "lyapunov": 1.482531173454831, + "grad_norm": 0.0887187166875537, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001732896980049473, + "time_sec": 41.6301372051239 + }, + { + "epoch": 110, + "train_loss": 5.262354034423828, + "train_acc": 0.00878, + "test_loss": 4.673253472900391, + "test_acc": 0.01, + "lyapunov": 1.4798865848794922, + "grad_norm": 0.08823123281084728, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016543469682057076, + "time_sec": 41.61501979827881 + }, + { + "epoch": 111, + "train_loss": 5.261907596282959, + "train_acc": 0.00774, + "test_loss": 4.6810761657714846, + "test_acc": 0.01, + "lyapunov": 1.4794099962010103, + "grad_norm": 0.08847327230851044, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 41.66792058944702 + }, + { + "epoch": 112, + "train_loss": 5.263451714782715, + "train_acc": 0.00876, + "test_loss": 4.675498142242431, + "test_acc": 0.01, + "lyapunov": 1.4811130951127738, + "grad_norm": 0.08821763372055312, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 41.6463463306427 + }, + { + "epoch": 113, + "train_loss": 5.271167716522217, + "train_acc": 0.00842, + "test_loss": 4.685236253356933, + "test_acc": 0.01, + "lyapunov": 1.489286311447163, + "grad_norm": 0.08951867713473023, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 41.74271559715271 + }, + { + "epoch": 114, + "train_loss": 5.271448510589599, + "train_acc": 0.00896, + "test_loss": 4.690647507476807, + "test_acc": 0.01, + "lyapunov": 1.4897843382852463, + "grad_norm": 0.08820177476113898, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00013551568628929425, + "time_sec": 41.668110609054565 + }, + { + "epoch": 115, + "train_loss": 5.2816896908569335, + "train_acc": 0.00868, + "test_loss": 4.690107788085937, + "test_acc": 0.01, + "lyapunov": 1.49836193996927, + "grad_norm": 0.0881224924879974, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 41.65963578224182 + }, + { + "epoch": 116, + "train_loss": 5.265034445343018, + "train_acc": 0.00848, + "test_loss": 4.69013021774292, + "test_acc": 0.01, + "lyapunov": 1.4828510912483002, + "grad_norm": 0.0884889002186026, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 41.68511462211609 + }, + { + "epoch": 117, + "train_loss": 5.26604537612915, + "train_acc": 0.00834, + "test_loss": 4.690117681884765, + "test_acc": 0.01, + "lyapunov": 1.4837996590777736, + "grad_norm": 0.087812082346243, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 41.62825393676758 + }, + { + "epoch": 118, + "train_loss": 5.271575555877686, + "train_acc": 0.00838, + "test_loss": 4.688699510192871, + "test_acc": 0.01, + "lyapunov": 1.4897897758752183, + "grad_norm": 0.08852661249085975, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010815327133708009, + "time_sec": 41.813793897628784 + }, + { + "epoch": 119, + "train_loss": 5.270083126525879, + "train_acc": 0.00882, + "test_loss": 4.678613103485107, + "test_acc": 0.01, + "lyapunov": 1.4881404150477455, + "grad_norm": 0.08809098199633093, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010173504098790182, + "time_sec": 41.60239052772522 + }, + { + "epoch": 120, + "train_loss": 5.2668604069519045, + "train_acc": 0.00916, + "test_loss": 4.668810566711426, + "test_acc": 0.01, + "lyapunov": 1.484404284630895, + "grad_norm": 0.08801465824181619, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 41.67430233955383 + }, + { + "epoch": 121, + "train_loss": 5.270687980041504, + "train_acc": 0.00844, + "test_loss": 4.678598808288574, + "test_acc": 0.01, + "lyapunov": 1.4865265313316793, + "grad_norm": 0.08823636157170499, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 41.651268005371094 + }, + { + "epoch": 122, + "train_loss": 5.262444466705322, + "train_acc": 0.00858, + "test_loss": 4.678612301635742, + "test_acc": 0.01, + "lyapunov": 1.48004513079553, + "grad_norm": 0.09003261469940216, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 41.676185607910156 + }, + { + "epoch": 123, + "train_loss": 5.263941179351806, + "train_acc": 0.0086, + "test_loss": 4.671801266479492, + "test_acc": 0.01, + "lyapunov": 1.4817558716020316, + "grad_norm": 0.09047110449687606, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 41.740845918655396 + }, + { + "epoch": 124, + "train_loss": 5.269082255859375, + "train_acc": 0.00892, + "test_loss": 4.671809730529785, + "test_acc": 0.01, + "lyapunov": 1.4871390643327131, + "grad_norm": 0.08793369061349017, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 41.75574517250061 + }, + { + "epoch": 125, + "train_loss": 5.262843768310547, + "train_acc": 0.00886, + "test_loss": 4.662115892028808, + "test_acc": 0.01, + "lyapunov": 1.4804938851719927, + "grad_norm": 0.08792553586108803, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 41.601502656936646 + }, + { + "epoch": 126, + "train_loss": 5.262783556365966, + "train_acc": 0.0087, + "test_loss": 4.671795330810546, + "test_acc": 0.01, + "lyapunov": 1.4804595739335356, + "grad_norm": 0.08818916489651518, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 41.719630002975464 + }, + { + "epoch": 127, + "train_loss": 5.287085924682617, + "train_acc": 0.00884, + "test_loss": 4.670085035705567, + "test_acc": 0.01, + "lyapunov": 1.5052251651159028, + "grad_norm": 0.09375403073023182, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 41.655165672302246 + }, + { + "epoch": 128, + "train_loss": 5.3060646118164065, + "train_acc": 0.00794, + "test_loss": 4.6709625457763675, + "test_acc": 0.01, + "lyapunov": 1.5216917436750954, + "grad_norm": 0.08857015682665342, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 41.698471546173096 + }, + { + "epoch": 129, + "train_loss": 5.263810299682617, + "train_acc": 0.00862, + "test_loss": 4.679794757080078, + "test_acc": 0.01, + "lyapunov": 1.4815860233648355, + "grad_norm": 0.08793008720913074, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 41.65286087989807 + }, + { + "epoch": 130, + "train_loss": 5.2642881167602535, + "train_acc": 0.00886, + "test_loss": 4.679787918853759, + "test_acc": 0.01, + "lyapunov": 1.4821607542159918, + "grad_norm": 0.08826309404088324, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 41.60878133773804 + }, + { + "epoch": 131, + "train_loss": 5.264142718353272, + "train_acc": 0.00912, + "test_loss": 4.679794540405274, + "test_acc": 0.01, + "lyapunov": 1.4819643613322617, + "grad_norm": 0.0879145106714535, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 41.631954193115234 + }, + { + "epoch": 132, + "train_loss": 5.264426311187744, + "train_acc": 0.00912, + "test_loss": 4.686964068603515, + "test_acc": 0.01, + "lyapunov": 1.4822249098507034, + "grad_norm": 0.08772387144138033, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 41.61648106575012 + }, + { + "epoch": 133, + "train_loss": 5.263279991149902, + "train_acc": 0.00928, + "test_loss": 4.673583326721191, + "test_acc": 0.01, + "lyapunov": 1.481004032332574, + "grad_norm": 0.08756701265820996, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 41.61954092979431 + }, + { + "epoch": 134, + "train_loss": 5.264391135559082, + "train_acc": 0.00916, + "test_loss": 4.673584260559082, + "test_acc": 0.01, + "lyapunov": 1.482238910387239, + "grad_norm": 0.08773099630417767, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 41.636422872543335 + }, + { + "epoch": 135, + "train_loss": 5.264316839904785, + "train_acc": 0.00918, + "test_loss": 4.673586289215088, + "test_acc": 0.01, + "lyapunov": 1.4821837125226969, + "grad_norm": 0.0883951408561693, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 41.637362241744995 + }, + { + "epoch": 136, + "train_loss": 5.263837189178467, + "train_acc": 0.00856, + "test_loss": 4.673583441162109, + "test_acc": 0.01, + "lyapunov": 1.4816227761071052, + "grad_norm": 0.08805256597520511, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 41.648523807525635 + }, + { + "epoch": 137, + "train_loss": 5.263810054168701, + "train_acc": 0.00914, + "test_loss": 4.673584091186523, + "test_acc": 0.01, + "lyapunov": 1.4815898499525417, + "grad_norm": 0.08812282585660734, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 41.73938012123108 + }, + { + "epoch": 138, + "train_loss": 5.2631301567077635, + "train_acc": 0.00882, + "test_loss": 4.673581381225586, + "test_acc": 0.01, + "lyapunov": 1.4808570945354373, + "grad_norm": 0.0884075853889321, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 41.70086741447449 + }, + { + "epoch": 139, + "train_loss": 5.264147056427002, + "train_acc": 0.00966, + "test_loss": 4.673584265136719, + "test_acc": 0.01, + "lyapunov": 1.4819788155348406, + "grad_norm": 0.08781225710160669, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 41.63281536102295 + }, + { + "epoch": 140, + "train_loss": 5.264177637023926, + "train_acc": 0.00946, + "test_loss": 4.673582272338868, + "test_acc": 0.01, + "lyapunov": 1.4820371799151917, + "grad_norm": 0.08778605437009919, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 41.605711221694946 + }, + { + "epoch": 141, + "train_loss": 5.264175823974609, + "train_acc": 0.01, + "test_loss": 4.673583470153808, + "test_acc": 0.01, + "lyapunov": 1.482038261030641, + "grad_norm": 0.08820186315365212, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 41.616660594940186 + }, + { + "epoch": 142, + "train_loss": 5.263000276947022, + "train_acc": 0.01, + "test_loss": 4.67358302154541, + "test_acc": 0.01, + "lyapunov": 1.4806900521373505, + "grad_norm": 0.08785028349994792, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 41.626938819885254 + }, + { + "epoch": 143, + "train_loss": 5.264303789367676, + "train_acc": 0.0093, + "test_loss": 4.673582839202881, + "test_acc": 0.01, + "lyapunov": 1.4821641326255506, + "grad_norm": 0.08832630889985595, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 41.62687826156616 + }, + { + "epoch": 144, + "train_loss": 5.266550144958496, + "train_acc": 0.01, + "test_loss": 4.673582318115234, + "test_acc": 0.01, + "lyapunov": 1.4840948478035305, + "grad_norm": 0.08863982897252927, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 41.63750672340393 + }, + { + "epoch": 145, + "train_loss": 5.2637120777893065, + "train_acc": 0.01, + "test_loss": 4.673582674407959, + "test_acc": 0.01, + "lyapunov": 1.4815035524880489, + "grad_norm": 0.08799138407501185, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 41.61049675941467 + }, + { + "epoch": 146, + "train_loss": 5.263380687713623, + "train_acc": 0.01, + "test_loss": 4.6735828002929685, + "test_acc": 0.01, + "lyapunov": 1.48112582825029, + "grad_norm": 0.08789323778024616, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 41.664053201675415 + }, + { + "epoch": 147, + "train_loss": 5.262870178375244, + "train_acc": 0.01, + "test_loss": 4.67358247756958, + "test_acc": 0.01, + "lyapunov": 1.4805500345766698, + "grad_norm": 0.08785274592155841, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 41.73871088027954 + }, + { + "epoch": 148, + "train_loss": 5.263046730651856, + "train_acc": 0.01, + "test_loss": 4.673582760620117, + "test_acc": 0.01, + "lyapunov": 1.480766166811404, + "grad_norm": 0.08817919214333009, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 41.71699619293213 + }, + { + "epoch": 149, + "train_loss": 5.264003658447265, + "train_acc": 0.01, + "test_loss": 4.673582760620117, + "test_acc": 0.01, + "lyapunov": 1.4818289621406808, + "grad_norm": 0.08840976368023683, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 41.63391995429993 + }, + { + "epoch": 150, + "train_loss": 5.264799559326172, + "train_acc": 0.01, + "test_loss": 4.673582650756836, + "test_acc": 0.01, + "lyapunov": 1.4827044315045448, + "grad_norm": 0.08814260335342491, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 41.604254484176636 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 5.146115896911621, + "train_acc": 0.02178, + "test_loss": 4.658292015838623, + "test_acc": 0.0179, + "lyapunov": 2.2941700692676825, + "grad_norm": 5.7514440172256105, + "grad_max_sv": 4.608755576610565, + "grad_min_sv": 9.931108821970013e-08, + "grad_condition": 54298677.31321855, + "lr": 0.0009998903417374227, + "time_sec": 86.91112756729126 + }, + { + "epoch": 2, + "train_loss": 4.702691088256836, + "train_acc": 0.02976, + "test_loss": 4.6687107803344725, + "test_acc": 0.0173, + "lyapunov": 1.8152018111685049, + "grad_norm": 3.1269645106600352, + "grad_max_sv": 2.3287330240011217, + "grad_min_sv": 5.3721432058395636e-08, + "grad_condition": 52432891.31661774, + "lr": 0.0009995614150494292, + "time_sec": 86.96670389175415 + }, + { + "epoch": 3, + "train_loss": 4.563177616271973, + "train_acc": 0.03108, + "test_loss": 4.458634540557862, + "test_acc": 0.0275, + "lyapunov": 1.659614868481141, + "grad_norm": 1.6241391637016038, + "grad_max_sv": 1.0878711834549903, + "grad_min_sv": 2.6067565292442475e-08, + "grad_condition": 83662403.24623688, + "lr": 0.0009990133642141358, + "time_sec": 86.90370392799377 + }, + { + "epoch": 4, + "train_loss": 4.516682284240723, + "train_acc": 0.03726, + "test_loss": 4.491609892272949, + "test_acc": 0.0226, + "lyapunov": 1.5915839062322437, + "grad_norm": 1.140832409431892, + "grad_max_sv": 0.6813461020588875, + "grad_min_sv": 1.4620473591086398e-08, + "grad_condition": 563097834.1159084, + "lr": 0.0009982464296247522, + "time_sec": 86.99007058143616 + }, + { + "epoch": 5, + "train_loss": 4.5070478215026855, + "train_acc": 0.04338, + "test_loss": 4.482846225738525, + "test_acc": 0.0231, + "lyapunov": 1.5719971531797248, + "grad_norm": 0.9891134281920906, + "grad_max_sv": 0.576826149970293, + "grad_min_sv": 1.4178649894447393e-08, + "grad_condition": 58885947.278740086, + "lr": 0.0009972609476841367, + "time_sec": 86.98556971549988 + }, + { + "epoch": 6, + "train_loss": 4.547509643402099, + "train_acc": 0.0439, + "test_loss": 4.9390108833312985, + "test_acc": 0.0116, + "lyapunov": 1.566867695744995, + "grad_norm": 0.8577969738236341, + "grad_max_sv": 0.45468067899346354, + "grad_min_sv": 1.1785924136642478e-08, + "grad_condition": 51467445.538705364, + "lr": 0.000996057350657239, + "time_sec": 86.93410611152649 + }, + { + "epoch": 7, + "train_loss": 4.532205999908447, + "train_acc": 0.04932, + "test_loss": 4.854185777282715, + "test_acc": 0.0105, + "lyapunov": 1.5658333350325484, + "grad_norm": 0.7813900002362055, + "grad_max_sv": 0.42395056039094925, + "grad_min_sv": 1.0807322919567653e-08, + "grad_condition": 102461132.44291899, + "lr": 0.000994636166481494, + "time_sec": 86.96581149101257 + }, + { + "epoch": 8, + "train_loss": 4.556547904968261, + "train_acc": 0.0504, + "test_loss": 5.202551012420654, + "test_acc": 0.0104, + "lyapunov": 1.5580533120943152, + "grad_norm": 0.7496749300980402, + "grad_max_sv": 0.3704929508268833, + "grad_min_sv": 9.9690008810438e-09, + "grad_condition": 130808798.44108884, + "lr": 0.0009929980185352525, + "time_sec": 86.94089555740356 + }, + { + "epoch": 9, + "train_loss": 4.701766607666015, + "train_acc": 0.03756, + "test_loss": 5.755129487609863, + "test_acc": 0.01, + "lyapunov": 1.5552253073743543, + "grad_norm": 0.6765304040507019, + "grad_max_sv": 0.36201889589428904, + "grad_min_sv": 8.426840739095276e-09, + "grad_condition": 62920470.9578716, + "lr": 0.0009911436253643444, + "time_sec": 86.93878936767578 + }, + { + "epoch": 10, + "train_loss": 4.765756509094238, + "train_acc": 0.03202, + "test_loss": 5.775740480041504, + "test_acc": 0.01, + "lyapunov": 1.5391303578301159, + "grad_norm": 0.7537997383732445, + "grad_max_sv": 0.34123560786247253, + "grad_min_sv": 8.077983985887994e-09, + "grad_condition": 51423310.42648181, + "lr": 0.0009890738003669028, + "time_sec": 86.94973969459534 + }, + { + "epoch": 11, + "train_loss": 4.81721549484253, + "train_acc": 0.0287, + "test_loss": 5.310749195861816, + "test_acc": 0.01, + "lyapunov": 1.5252552425769894, + "grad_norm": 0.6724423278308185, + "grad_max_sv": 0.2991580605506897, + "grad_min_sv": 5.889135633492526e-09, + "grad_condition": 125659233.84784427, + "lr": 0.00098678945143658, + "time_sec": 86.92238068580627 + }, + { + "epoch": 12, + "train_loss": 4.815476130065918, + "train_acc": 0.03228, + "test_loss": 4.919392412567139, + "test_acc": 0.01, + "lyapunov": 1.5252421408358132, + "grad_norm": 0.6745068286502589, + "grad_max_sv": 0.2930708375293761, + "grad_min_sv": 6.114008772872826e-09, + "grad_condition": 71899366.71277946, + "lr": 0.0009842915805643154, + "time_sec": 86.96433067321777 + }, + { + "epoch": 13, + "train_loss": 4.802655950775146, + "train_acc": 0.03752, + "test_loss": 4.738039018249512, + "test_acc": 0.01, + "lyapunov": 1.5223182784321974, + "grad_norm": 0.6997812002840638, + "grad_max_sv": 0.34992206916213037, + "grad_min_sv": 8.056309852566556e-09, + "grad_condition": 47743142.04490039, + "lr": 0.000981581283398829, + "time_sec": 86.93432188034058 + }, + { + "epoch": 14, + "train_loss": 4.879040807647705, + "train_acc": 0.03196, + "test_loss": 4.635845722961426, + "test_acc": 0.01, + "lyapunov": 1.5264948713200173, + "grad_norm": 0.7132128709453732, + "grad_max_sv": 0.37259799614548683, + "grad_min_sv": 7.726031005933498e-09, + "grad_condition": 77087531.09708562, + "lr": 0.0009786597487660333, + "time_sec": 86.92895364761353 + }, + { + "epoch": 15, + "train_loss": 4.93996203048706, + "train_acc": 0.0286, + "test_loss": 4.715687692260742, + "test_acc": 0.01, + "lyapunov": 1.5275609859115327, + "grad_norm": 0.7145493932975088, + "grad_max_sv": 0.3383642140775919, + "grad_min_sv": 6.660084050924553e-09, + "grad_condition": 63568945.70900831, + "lr": 0.0009755282581475766, + "time_sec": 86.93708157539368 + }, + { + "epoch": 16, + "train_loss": 4.951732353668213, + "train_acc": 0.03108, + "test_loss": 4.694218672180176, + "test_acc": 0.01, + "lyapunov": 1.5221876610270546, + "grad_norm": 0.6526072701529334, + "grad_max_sv": 0.29856473468244077, + "grad_min_sv": 5.5810975953029866e-09, + "grad_condition": 3669494078.4381485, + "lr": 0.0009721881851187403, + "time_sec": 86.95431900024414 + }, + { + "epoch": 17, + "train_loss": 5.028552846374511, + "train_acc": 0.02936, + "test_loss": 4.582682956695557, + "test_acc": 0.0148, + "lyapunov": 1.5572718967257253, + "grad_norm": 0.8395071465637489, + "grad_max_sv": 0.2635829897597432, + "grad_min_sv": 4.546329786998837e-09, + "grad_condition": 9308629659.195911, + "lr": 0.0009686409947459456, + "time_sec": 86.94067001342773 + }, + { + "epoch": 18, + "train_loss": 5.080957429504394, + "train_acc": 0.02958, + "test_loss": 4.743882189178467, + "test_acc": 0.01, + "lyapunov": 1.573465526256415, + "grad_norm": 0.7060094795148925, + "grad_max_sv": 0.26090904884040356, + "grad_min_sv": 4.9669986091141484e-09, + "grad_condition": 158829567.68689433, + "lr": 0.0009648882429441254, + "time_sec": 86.93801307678223 + }, + { + "epoch": 19, + "train_loss": 5.163744027404785, + "train_acc": 0.0251, + "test_loss": 5.350689000701904, + "test_acc": 0.01, + "lyapunov": 1.5783103155662945, + "grad_norm": 0.7236371812810315, + "grad_max_sv": 0.32311243638396264, + "grad_min_sv": 4.661415661322624e-09, + "grad_condition": 362163554.1712912, + "lr": 0.00096093157579425, + "time_sec": 86.95386362075806 + }, + { + "epoch": 20, + "train_loss": 5.177699388122559, + "train_acc": 0.02336, + "test_loss": 4.728291717529297, + "test_acc": 0.01, + "lyapunov": 1.5543774262718533, + "grad_norm": 0.6278235228394613, + "grad_max_sv": 0.2316085107624531, + "grad_min_sv": 2.9537814670154304e-09, + "grad_condition": 3474032967.5441117, + "lr": 0.0009567727288213001, + "time_sec": 86.9823546409607 + }, + { + "epoch": 21, + "train_loss": 5.2000909381103515, + "train_acc": 0.02436, + "test_loss": 4.806672692871094, + "test_acc": 0.01, + "lyapunov": 1.5755902729985658, + "grad_norm": 0.766013265906278, + "grad_max_sv": 0.21709984578192235, + "grad_min_sv": 2.2318304187728858e-09, + "grad_condition": 8696284488.710842, + "lr": 0.0009524135262330095, + "time_sec": 86.9815993309021 + }, + { + "epoch": 22, + "train_loss": 5.172516224975586, + "train_acc": 0.02578, + "test_loss": 5.050736184692383, + "test_acc": 0.01, + "lyapunov": 1.5738651392709873, + "grad_norm": 0.8548378900544575, + "grad_max_sv": 0.21818067859858276, + "grad_min_sv": 2.4550293141510983e-09, + "grad_condition": 1446353295.730711, + "lr": 0.0009478558801197061, + "time_sec": 86.96929454803467 + }, + { + "epoch": 23, + "train_loss": 5.301382947845459, + "train_acc": 0.01554, + "test_loss": 5.921122685241699, + "test_acc": 0.01, + "lyapunov": 1.5795374422731912, + "grad_norm": 1.072625133417376, + "grad_max_sv": 0.29671905748546124, + "grad_min_sv": 3.4811909517637897e-09, + "grad_condition": 2268879972.814607, + "lr": 0.000943101789615607, + "time_sec": 87.05305171012878 + }, + { + "epoch": 24, + "train_loss": 5.308596148986816, + "train_acc": 0.01028, + "test_loss": 5.915314376831055, + "test_acc": 0.01, + "lyapunov": 1.5046202849853985, + "grad_norm": 0.4300250072511413, + "grad_max_sv": 0.29422527775168417, + "grad_min_sv": 2.563464584050615e-09, + "grad_condition": 1801474829.549522, + "lr": 0.0009381533400219313, + "time_sec": 86.9294683933258 + }, + { + "epoch": 25, + "train_loss": 5.30389043762207, + "train_acc": 0.01028, + "test_loss": 5.442194981384278, + "test_acc": 0.01, + "lyapunov": 1.5036146476140717, + "grad_norm": 0.369004063413563, + "grad_max_sv": 0.27016645595431327, + "grad_min_sv": 1.563399900968634e-09, + "grad_condition": 26105306242.6268, + "lr": 0.0009330127018922189, + "time_sec": 86.93831205368042 + }, + { + "epoch": 26, + "train_loss": 5.310046338348388, + "train_acc": 0.00962, + "test_loss": 6.1388027900695805, + "test_acc": 0.01, + "lyapunov": 1.5094104654648726, + "grad_norm": 0.3921330241846595, + "grad_max_sv": 0.27323133423924445, + "grad_min_sv": 2.6655278586792953e-09, + "grad_condition": 217735166.8546676, + "lr": 0.000927682130080253, + "time_sec": 87.04652237892151 + }, + { + "epoch": 27, + "train_loss": 5.301853795013428, + "train_acc": 0.01042, + "test_loss": 5.515717539215088, + "test_acc": 0.01, + "lyapunov": 1.508369487569765, + "grad_norm": 0.30565280482621787, + "grad_max_sv": 0.22872439920902252, + "grad_min_sv": 7.688681849029263e-10, + "grad_condition": 46178443525.53847, + "lr": 0.0009221639627510072, + "time_sec": 87.04486989974976 + }, + { + "epoch": 28, + "train_loss": 5.29817862487793, + "train_acc": 0.00972, + "test_loss": 5.770360753631592, + "test_acc": 0.01, + "lyapunov": 1.5080109913940625, + "grad_norm": 0.277614712245464, + "grad_max_sv": 0.196561511605978, + "grad_min_sv": 1.2118332304701748e-12, + "grad_condition": 124861391701.8731, + "lr": 0.0009164606203550494, + "time_sec": 86.97034883499146 + }, + { + "epoch": 29, + "train_loss": 5.299116547241211, + "train_acc": 0.00974, + "test_loss": 6.629917897796631, + "test_acc": 0.01, + "lyapunov": 1.5079803863144896, + "grad_norm": 0.26773989693385675, + "grad_max_sv": 0.19062257409095765, + "grad_min_sv": 1.316391307854978e-12, + "grad_condition": 118514569073.00333, + "lr": 0.0009105746045668516, + "time_sec": 86.9515905380249 + }, + { + "epoch": 30, + "train_loss": 5.301858203277588, + "train_acc": 0.00952, + "test_loss": 7.616147738647461, + "test_acc": 0.01, + "lyapunov": 1.5108254772927754, + "grad_norm": 0.2739642757327739, + "grad_max_sv": 0.2010789501480758, + "grad_min_sv": 3.194205121044685e-10, + "grad_condition": 84817443385.97237, + "lr": 0.0009045084971874733, + "time_sec": 86.96926951408386 + }, + { + "epoch": 31, + "train_loss": 5.299806740875244, + "train_acc": 0.01004, + "test_loss": 7.885091897583008, + "test_acc": 0.01, + "lyapunov": 1.5118325930422225, + "grad_norm": 0.23726371187902562, + "grad_max_sv": 0.1534210465848446, + "grad_min_sv": 3.777587378576868e-12, + "grad_condition": 117298463694.8497, + "lr": 0.0008982649590120977, + "time_sec": 86.93767380714417 + }, + { + "epoch": 32, + "train_loss": 5.294980096740723, + "train_acc": 0.01054, + "test_loss": 7.175394052124023, + "test_acc": 0.01, + "lyapunov": 1.5122702329055122, + "grad_norm": 0.18490861832393377, + "grad_max_sv": 0.09243289618752897, + "grad_min_sv": 7.151144434390166e-15, + "grad_condition": 91554722602.0434, + "lr": 0.0008918467286629196, + "time_sec": 86.92625045776367 + }, + { + "epoch": 33, + "train_loss": 5.302116135559082, + "train_acc": 0.00916, + "test_loss": 6.950838031005859, + "test_acc": 0.01, + "lyapunov": 1.514583631854533, + "grad_norm": 0.22539071559889906, + "grad_max_sv": 0.14949913807213305, + "grad_min_sv": 3.03463898255766e-13, + "grad_condition": 123295125931.77371, + "lr": 0.0008852566213878943, + "time_sec": 86.96885013580322 + }, + { + "epoch": 34, + "train_loss": 5.298243276367187, + "train_acc": 0.00926, + "test_loss": 7.482379321289063, + "test_acc": 0.01, + "lyapunov": 1.514684440839626, + "grad_norm": 0.18381668144055355, + "grad_max_sv": 0.10984101705253124, + "grad_min_sv": 7.163631845931476e-15, + "grad_condition": 109054948912.02344, + "lr": 0.000878497527825878, + "time_sec": 87.12512397766113 + }, + { + "epoch": 35, + "train_loss": 5.308689108428955, + "train_acc": 0.00958, + "test_loss": 7.612553489685059, + "test_acc": 0.01, + "lyapunov": 1.5216995715485204, + "grad_norm": 0.22567054848299975, + "grad_max_sv": 0.1234450839459896, + "grad_min_sv": 5.377204609898583e-14, + "grad_condition": 117334156157.8593, + "lr": 0.000871572412738697, + "time_sec": 86.95104956626892 + }, + { + "epoch": 36, + "train_loss": 5.303922519226075, + "train_acc": 0.00964, + "test_loss": 8.831939950561523, + "test_acc": 0.01, + "lyapunov": 1.5175864534914647, + "grad_norm": 0.2187679660724696, + "grad_max_sv": 0.13990986812859774, + "grad_min_sv": 1.80366368447702e-13, + "grad_condition": 123448577181.446, + "lr": 0.0008644843137107055, + "time_sec": 86.92687749862671 + }, + { + "epoch": 37, + "train_loss": 5.303381102600098, + "train_acc": 0.00916, + "test_loss": 6.551040885925293, + "test_acc": 0.01, + "lyapunov": 1.5200756013850727, + "grad_norm": 0.1798120608859804, + "grad_max_sv": 0.10729131288826466, + "grad_min_sv": 1.364290789538136e-14, + "grad_condition": 105529300010.77225, + "lr": 0.0008572363398164014, + "time_sec": 86.95336151123047 + }, + { + "epoch": 38, + "train_loss": 5.30714798034668, + "train_acc": 0.0094, + "test_loss": 6.027979496765137, + "test_acc": 0.01, + "lyapunov": 1.5257836866866596, + "grad_norm": 0.1909663013844348, + "grad_max_sv": 0.07728723548352719, + "grad_min_sv": 4.265317043954499e-24, + "grad_condition": 77287235483.15219, + "lr": 0.0008498316702566826, + "time_sec": 86.9212384223938 + }, + { + "epoch": 39, + "train_loss": 5.306197135772705, + "train_acc": 0.00974, + "test_loss": 6.997566845703125, + "test_acc": 0.01, + "lyapunov": 1.5238893687572626, + "grad_norm": 0.18383519139729404, + "grad_max_sv": 0.1007891584187746, + "grad_min_sv": 5.3239199179750705e-15, + "grad_condition": 100154494637.09956, + "lr": 0.0008422735529643442, + "time_sec": 86.89629626274109 + }, + { + "epoch": 40, + "train_loss": 5.307650102386474, + "train_acc": 0.00992, + "test_loss": 6.040484946441651, + "test_acc": 0.01, + "lyapunov": 1.5250033597507135, + "grad_norm": 0.18467843309484097, + "grad_max_sv": 0.1127883294597268, + "grad_min_sv": 7.1038360456260524e-15, + "grad_condition": 111935273841.19809, + "lr": 0.0008345653031794289, + "time_sec": 87.02732610702515 + }, + { + "epoch": 41, + "train_loss": 5.307996878356934, + "train_acc": 0.00992, + "test_loss": 5.920440175628662, + "test_acc": 0.01, + "lyapunov": 1.5282226456400683, + "grad_norm": 0.16629297131246892, + "grad_max_sv": 0.07292309552431106, + "grad_min_sv": 1.583549415956451e-17, + "grad_condition": 72921914356.18047, + "lr": 0.0008267103019950526, + "time_sec": 86.94355273246765 + }, + { + "epoch": 42, + "train_loss": 5.311696410522461, + "train_acc": 0.00968, + "test_loss": 6.38518196105957, + "test_acc": 0.01, + "lyapunov": 1.5307711250032001, + "grad_norm": 0.1871179922092424, + "grad_max_sv": 0.08245804710313678, + "grad_min_sv": 6.943719241443141e-16, + "grad_condition": 82389599949.82372, + "lr": 0.0008187119948743447, + "time_sec": 86.93303918838501 + }, + { + "epoch": 43, + "train_loss": 5.307222317810059, + "train_acc": 0.00956, + "test_loss": 6.652195385742187, + "test_acc": 0.01, + "lyapunov": 1.5260984678097698, + "grad_norm": 0.16067559125539438, + "grad_max_sv": 0.09466201290488244, + "grad_min_sv": 4.4300769825600874e-16, + "grad_condition": 94621173553.03905, + "lr": 0.000810573890139155, + "time_sec": 86.90417695045471 + }, + { + "epoch": 44, + "train_loss": 5.308213620300293, + "train_acc": 0.00882, + "test_loss": 6.962696185302734, + "test_acc": 0.01, + "lyapunov": 1.527706109044497, + "grad_norm": 0.1609729738345643, + "grad_max_sv": 0.07951483679935337, + "grad_min_sv": 1.2691498572245332e-19, + "grad_condition": 79514825996.07883, + "lr": 0.0008022995574311873, + "time_sec": 86.90469932556152 + }, + { + "epoch": 45, + "train_loss": 5.313642641601563, + "train_acc": 0.01004, + "test_loss": 6.176641661071777, + "test_acc": 0.01, + "lyapunov": 1.5278308333643258, + "grad_norm": 0.20554701681584006, + "grad_max_sv": 0.1498540248721838, + "grad_min_sv": 2.7361367599211426e-14, + "grad_condition": 145983867269.5576, + "lr": 0.0007938926261462363, + "time_sec": 86.93738555908203 + }, + { + "epoch": 46, + "train_loss": 5.3097161289978025, + "train_acc": 0.00952, + "test_loss": 6.005211575317383, + "test_acc": 0.01, + "lyapunov": 1.5284498929977417, + "grad_norm": 0.17319376275900747, + "grad_max_sv": 0.10527544040232897, + "grad_min_sv": 1.6379736406305529e-15, + "grad_condition": 105101166914.13033, + "lr": 0.0007853567838422158, + "time_sec": 86.95744371414185 + }, + { + "epoch": 47, + "train_loss": 5.311491881408691, + "train_acc": 0.00956, + "test_loss": 5.9810846961975095, + "test_acc": 0.01, + "lyapunov": 1.530076160760182, + "grad_norm": 0.1622416677557275, + "grad_max_sv": 0.09897023066878319, + "grad_min_sv": 1.1070734961814082e-15, + "grad_condition": 98861145932.69461, + "lr": 0.0007766957746216719, + "time_sec": 86.9021110534668 + }, + { + "epoch": 48, + "train_loss": 5.310971976165772, + "train_acc": 0.00894, + "test_loss": 5.884356218719482, + "test_acc": 0.01, + "lyapunov": 1.5301186023160929, + "grad_norm": 0.15478972851501702, + "grad_max_sv": 0.09055562000721692, + "grad_min_sv": 6.095582881917491e-16, + "grad_condition": 90492925874.14865, + "lr": 0.0007679133974894982, + "time_sec": 86.923269033432 + }, + { + "epoch": 49, + "train_loss": 5.313096929931641, + "train_acc": 0.00936, + "test_loss": 5.441997985839844, + "test_acc": 0.01, + "lyapunov": 1.5325667373359662, + "grad_norm": 0.15811997882687892, + "grad_max_sv": 0.09403467867523432, + "grad_min_sv": 2.5362328677092476e-16, + "grad_condition": 94010861805.62488, + "lr": 0.000759013504686565, + "time_sec": 86.9168426990509 + }, + { + "epoch": 50, + "train_loss": 5.311940245513916, + "train_acc": 0.00958, + "test_loss": 5.371611124420166, + "test_acc": 0.01, + "lyapunov": 1.5327015231027628, + "grad_norm": 0.14176864627007332, + "grad_max_sv": 0.07908807899802923, + "grad_min_sv": 2.050192692484369e-32, + "grad_condition": 79088078998.02924, + "lr": 0.0007499999999999998, + "time_sec": 86.92089605331421 + }, + { + "epoch": 51, + "train_loss": 5.310895777282715, + "train_acc": 0.00916, + "test_loss": 5.434047091674804, + "test_acc": 0.01, + "lyapunov": 1.53158952573986, + "grad_norm": 0.1361778166532044, + "grad_max_sv": 0.06832279236987233, + "grad_min_sv": 6.675573383462495e-16, + "grad_condition": 68265680127.16847, + "lr": 0.0007408768370508575, + "time_sec": 86.94595527648926 + }, + { + "epoch": 52, + "train_loss": 5.3132603437805175, + "train_acc": 0.01008, + "test_loss": 6.7278813507080075, + "test_acc": 0.01, + "lyapunov": 1.535024075252016, + "grad_norm": 0.17384705948913357, + "grad_max_sv": 0.04316680300980806, + "grad_min_sv": 0.0, + "grad_condition": 43166803009.80806, + "lr": 0.0007316480175599307, + "time_sec": 86.91442537307739 + }, + { + "epoch": 53, + "train_loss": 5.3123740222167966, + "train_acc": 0.00936, + "test_loss": 6.131865232849121, + "test_acc": 0.01, + "lyapunov": 1.5338834356468962, + "grad_norm": 0.1343518088533916, + "grad_max_sv": 0.04088693740777671, + "grad_min_sv": 0.0, + "grad_condition": 40886937407.77672, + "lr": 0.0007223175895924635, + "time_sec": 86.89388537406921 + }, + { + "epoch": 54, + "train_loss": 5.311756536712647, + "train_acc": 0.00874, + "test_loss": 6.26136455078125, + "test_acc": 0.01, + "lyapunov": 1.534105893900937, + "grad_norm": 0.12044776828887008, + "grad_max_sv": 0.018818416306748985, + "grad_min_sv": 0.0, + "grad_condition": 18818416306.748985, + "lr": 0.0007128896457825361, + "time_sec": 86.86209654808044 + }, + { + "epoch": 55, + "train_loss": 5.314126918182373, + "train_acc": 0.00948, + "test_loss": 6.455938655853272, + "test_acc": 0.01, + "lyapunov": 1.5355246698155123, + "grad_norm": 0.16535062387735305, + "grad_max_sv": 0.048017819551751016, + "grad_min_sv": 0.0, + "grad_condition": 48017819551.75102, + "lr": 0.0007033683215378998, + "time_sec": 86.91218829154968 + }, + { + "epoch": 56, + "train_loss": 5.3133398397827145, + "train_acc": 0.00934, + "test_loss": 6.355834351348877, + "test_acc": 0.01, + "lyapunov": 1.535221906574181, + "grad_norm": 0.14103865757116907, + "grad_max_sv": 0.040325032686814664, + "grad_min_sv": 0.0, + "grad_condition": 40325032686.814674, + "lr": 0.0006937577932260512, + "time_sec": 87.01914978027344 + }, + { + "epoch": 57, + "train_loss": 5.315177789154053, + "train_acc": 0.00906, + "test_loss": 5.778967167663574, + "test_acc": 0.01, + "lyapunov": 1.5374448241480172, + "grad_norm": 0.12626262616875458, + "grad_max_sv": 0.04227766813710332, + "grad_min_sv": 0.0, + "grad_condition": 42277668137.10332, + "lr": 0.0006840622763423388, + "time_sec": 86.90552043914795 + }, + { + "epoch": 58, + "train_loss": 5.314984718017578, + "train_acc": 0.0096, + "test_loss": 5.680106079101562, + "test_acc": 0.01, + "lyapunov": 1.536767850141696, + "grad_norm": 0.13366926148127872, + "grad_max_sv": 0.05202861637808383, + "grad_min_sv": 0.0, + "grad_condition": 52028616378.083824, + "lr": 0.0006742860236609073, + "time_sec": 86.97483849525452 + }, + { + "epoch": 59, + "train_loss": 5.314250464019775, + "train_acc": 0.00922, + "test_loss": 5.60796079864502, + "test_acc": 0.01, + "lyapunov": 1.535877099732304, + "grad_norm": 0.13264295460080205, + "grad_max_sv": 0.053861632384359835, + "grad_min_sv": 0.0, + "grad_condition": 53861632384.35984, + "lr": 0.0006644333233692913, + "time_sec": 86.90899348258972 + }, + { + "epoch": 60, + "train_loss": 5.315608520202637, + "train_acc": 0.00862, + "test_loss": 5.75697197265625, + "test_acc": 0.01, + "lyapunov": 1.5373123942128837, + "grad_norm": 0.13451447891861437, + "grad_max_sv": 0.05724321529269218, + "grad_min_sv": 0.0, + "grad_condition": 57243215292.692184, + "lr": 0.0006545084971874734, + "time_sec": 86.93145775794983 + }, + { + "epoch": 61, + "train_loss": 5.315526120605469, + "train_acc": 0.00966, + "test_loss": 5.641050135803223, + "test_acc": 0.01, + "lyapunov": 1.537875465419896, + "grad_norm": 0.134018980558527, + "grad_max_sv": 0.04659216776490212, + "grad_min_sv": 0.0, + "grad_condition": 46592167764.902115, + "lr": 0.0006445158984722354, + "time_sec": 86.9526846408844 + }, + { + "epoch": 62, + "train_loss": 5.3171287049865725, + "train_acc": 0.0095, + "test_loss": 5.52830389251709, + "test_acc": 0.01, + "lyapunov": 1.5390207541873082, + "grad_norm": 0.13900770761864464, + "grad_max_sv": 0.05631723469123244, + "grad_min_sv": 0.0, + "grad_condition": 56317234691.232445, + "lr": 0.0006344599103076324, + "time_sec": 86.95262598991394 + }, + { + "epoch": 63, + "train_loss": 5.321492596435547, + "train_acc": 0.00884, + "test_loss": 5.732630862426758, + "test_acc": 0.01, + "lyapunov": 1.5413236017422298, + "grad_norm": 0.1533270491872105, + "grad_max_sv": 0.04487980231642723, + "grad_min_sv": 0.0, + "grad_condition": 44879802316.42723, + "lr": 0.0006243449435824269, + "time_sec": 86.93239831924438 + }, + { + "epoch": 64, + "train_loss": 5.315124908752441, + "train_acc": 0.0099, + "test_loss": 5.382702461242676, + "test_acc": 0.01, + "lyapunov": 1.5375381320943613, + "grad_norm": 0.12218366701103515, + "grad_max_sv": 0.032946509402245285, + "grad_min_sv": 0.0, + "grad_condition": 32946509402.24528, + "lr": 0.0006141754350553275, + "time_sec": 86.91653037071228 + }, + { + "epoch": 65, + "train_loss": 5.317460901031494, + "train_acc": 0.00952, + "test_loss": 5.498714874267578, + "test_acc": 0.01, + "lyapunov": 1.5401654679452061, + "grad_norm": 0.11182228456659622, + "grad_max_sv": 0.020332988910377027, + "grad_min_sv": 0.0, + "grad_condition": 20332988910.377026, + "lr": 0.0006039558454088793, + "time_sec": 86.86022281646729 + }, + { + "epoch": 66, + "train_loss": 5.315697211608887, + "train_acc": 0.00964, + "test_loss": 5.722520481872559, + "test_acc": 0.01, + "lyapunov": 1.5384024250537842, + "grad_norm": 0.11947856234602877, + "grad_max_sv": 0.012709397682920098, + "grad_min_sv": 0.0, + "grad_condition": 12709397682.9201, + "lr": 0.000593690657292862, + "time_sec": 86.83588552474976 + }, + { + "epoch": 67, + "train_loss": 5.315312230377197, + "train_acc": 0.00948, + "test_loss": 5.6552305557250975, + "test_acc": 0.01, + "lyapunov": 1.5376315924822521, + "grad_norm": 0.12716375762874924, + "grad_max_sv": 0.026200923277065157, + "grad_min_sv": 0.0, + "grad_condition": 26200923277.06516, + "lr": 0.0005833843733580507, + "time_sec": 86.93734240531921 + }, + { + "epoch": 68, + "train_loss": 5.316413257446289, + "train_acc": 0.00892, + "test_loss": 5.644158979797363, + "test_acc": 0.01, + "lyapunov": 1.5389487700694053, + "grad_norm": 0.11329541475422919, + "grad_max_sv": 0.025692512933164834, + "grad_min_sv": 0.0, + "grad_condition": 25692512933.164837, + "lr": 0.0005730415142812054, + "time_sec": 86.92358016967773 + }, + { + "epoch": 69, + "train_loss": 5.317326981048584, + "train_acc": 0.00962, + "test_loss": 5.646556529998779, + "test_acc": 0.01, + "lyapunov": 1.5400864053565217, + "grad_norm": 0.1245567601020978, + "grad_max_sv": 0.024738446017727254, + "grad_min_sv": 0.0, + "grad_condition": 24738446017.727257, + "lr": 0.0005626666167821517, + "time_sec": 86.86787414550781 + }, + { + "epoch": 70, + "train_loss": 5.317049356994629, + "train_acc": 0.00982, + "test_loss": 5.6787915084838865, + "test_acc": 0.01, + "lyapunov": 1.5397665028072074, + "grad_norm": 0.118076358762286, + "grad_max_sv": 0.03472304726019502, + "grad_min_sv": 0.0, + "grad_condition": 34723047260.195015, + "lr": 0.0005522642316338265, + "time_sec": 86.88831448554993 + }, + { + "epoch": 71, + "train_loss": 5.315880928039551, + "train_acc": 0.00964, + "test_loss": 5.735556723022461, + "test_acc": 0.01, + "lyapunov": 1.5387067657602413, + "grad_norm": 0.11912248112688287, + "grad_max_sv": 0.025617524981498718, + "grad_min_sv": 0.0, + "grad_condition": 25617524981.49872, + "lr": 0.0005418389216661573, + "time_sec": 86.86845374107361 + }, + { + "epoch": 72, + "train_loss": 5.320206904296875, + "train_acc": 0.00958, + "test_loss": 5.694711586761475, + "test_acc": 0.01, + "lyapunov": 1.5424333557753307, + "grad_norm": 0.12792597639508846, + "grad_max_sv": 0.03625847464427352, + "grad_min_sv": 0.0, + "grad_condition": 36258474644.27352, + "lr": 0.0005313952597646563, + "time_sec": 86.87807965278625 + }, + { + "epoch": 73, + "train_loss": 5.318149011688233, + "train_acc": 0.0099, + "test_loss": 5.715859918212891, + "test_acc": 0.01, + "lyapunov": 1.5407461092600128, + "grad_norm": 0.12131920132322771, + "grad_max_sv": 0.04332554340362549, + "grad_min_sv": 0.0, + "grad_condition": 43325543403.62549, + "lr": 0.0005209378268645994, + "time_sec": 86.93414950370789 + }, + { + "epoch": 74, + "train_loss": 5.316737642364502, + "train_acc": 0.0094, + "test_loss": 5.432159627532959, + "test_acc": 0.01, + "lyapunov": 1.5394032800289066, + "grad_norm": 0.11202086425017638, + "grad_max_sv": 0.02820308110676706, + "grad_min_sv": 0.0, + "grad_condition": 28203081106.76706, + "lr": 0.0005104712099416781, + "time_sec": 86.86637806892395 + }, + { + "epoch": 75, + "train_loss": 5.317990305633545, + "train_acc": 0.00994, + "test_loss": 5.894020344543457, + "test_acc": 0.01, + "lyapunov": 1.5408979687849274, + "grad_norm": 0.15447706508859999, + "grad_max_sv": 0.01931341988965869, + "grad_min_sv": 0.0, + "grad_condition": 19313419889.65869, + "lr": 0.0004999999999999996, + "time_sec": 86.85794830322266 + }, + { + "epoch": 76, + "train_loss": 5.329913055419921, + "train_acc": 0.00922, + "test_loss": 5.356306673431397, + "test_acc": 0.01, + "lyapunov": 1.5469030404029904, + "grad_norm": 0.1130858808468486, + "grad_max_sv": 0.020954679837450384, + "grad_min_sv": 0.0, + "grad_condition": 20954679837.450386, + "lr": 0.0004895287900583212, + "time_sec": 86.8532190322876 + }, + { + "epoch": 77, + "train_loss": 5.317062496490479, + "train_acc": 0.01014, + "test_loss": 5.6768914947509765, + "test_acc": 0.01, + "lyapunov": 1.539591530399859, + "grad_norm": 0.11763219922287847, + "grad_max_sv": 0.03681175904348492, + "grad_min_sv": 0.0, + "grad_condition": 36811759043.484924, + "lr": 0.0004790621731353997, + "time_sec": 86.89854335784912 + }, + { + "epoch": 78, + "train_loss": 5.321235802612304, + "train_acc": 0.00956, + "test_loss": 5.498642253875732, + "test_acc": 0.01, + "lyapunov": 1.5433477379781815, + "grad_norm": 0.12257877066992058, + "grad_max_sv": 0.002356324018910527, + "grad_min_sv": 0.0, + "grad_condition": 2356324018.910527, + "lr": 0.000468604740235343, + "time_sec": 86.82986307144165 + }, + { + "epoch": 79, + "train_loss": 5.3170875860595705, + "train_acc": 0.00874, + "test_loss": 5.678500232696533, + "test_acc": 0.01, + "lyapunov": 1.5401862192031976, + "grad_norm": 0.11850283030771655, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00045816107833384175, + "time_sec": 86.84353518486023 + }, + { + "epoch": 80, + "train_loss": 5.319253426513672, + "train_acc": 0.00918, + "test_loss": 5.127548231506347, + "test_acc": 0.01, + "lyapunov": 1.5418513970606773, + "grad_norm": 0.11699107355632338, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004477357683661729, + "time_sec": 86.8760769367218 + }, + { + "epoch": 81, + "train_loss": 5.317456825408936, + "train_acc": 0.00894, + "test_loss": 5.307968811035156, + "test_acc": 0.01, + "lyapunov": 1.5405245113860615, + "grad_norm": 0.1284549935774549, + "grad_max_sv": 0.0083365049213171, + "grad_min_sv": 0.0, + "grad_condition": 8336504921.317101, + "lr": 0.00043733338321784746, + "time_sec": 86.87371492385864 + }, + { + "epoch": 82, + "train_loss": 5.317734858398437, + "train_acc": 0.00954, + "test_loss": 5.0544998031616215, + "test_acc": 0.01, + "lyapunov": 1.5406023172466345, + "grad_norm": 0.120735257297947, + "grad_max_sv": 0.02263884055428207, + "grad_min_sv": 0.0, + "grad_condition": 22638840554.282066, + "lr": 0.0004269584857187939, + "time_sec": 86.92492771148682 + }, + { + "epoch": 83, + "train_loss": 5.32118753692627, + "train_acc": 0.00954, + "test_loss": 5.125200929260254, + "test_acc": 0.01, + "lyapunov": 1.5442977073552357, + "grad_norm": 0.11585054245697951, + "grad_max_sv": 0.004569409461691975, + "grad_min_sv": 0.0, + "grad_condition": 4569409461.691976, + "lr": 0.0004166156266419484, + "time_sec": 86.81740093231201 + }, + { + "epoch": 84, + "train_loss": 5.317668086853027, + "train_acc": 0.00892, + "test_loss": 5.523793495178222, + "test_acc": 0.01, + "lyapunov": 1.5407223094759694, + "grad_norm": 0.10949975143698651, + "grad_max_sv": 0.01457698536105454, + "grad_min_sv": 0.0, + "grad_condition": 14576985361.05454, + "lr": 0.0004063093427071373, + "time_sec": 86.87661004066467 + }, + { + "epoch": 85, + "train_loss": 5.327004724578857, + "train_acc": 0.00984, + "test_loss": 5.3676797477722165, + "test_acc": 0.01, + "lyapunov": 1.54690202819112, + "grad_norm": 0.11567866960588237, + "grad_max_sv": 0.00381420748308301, + "grad_min_sv": 0.0, + "grad_condition": 3814207483.0830092, + "lr": 0.0003960441545911199, + "time_sec": 86.82225131988525 + }, + { + "epoch": 86, + "train_loss": 5.3172469395446775, + "train_acc": 0.00898, + "test_loss": 4.901917692565918, + "test_acc": 0.01, + "lyapunov": 1.5404299381748794, + "grad_norm": 0.11387390679382547, + "grad_max_sv": 0.001853126659989357, + "grad_min_sv": 0.0, + "grad_condition": 1853126659.989357, + "lr": 0.0003858245649446718, + "time_sec": 86.82927370071411 + }, + { + "epoch": 87, + "train_loss": 5.318947126464844, + "train_acc": 0.00926, + "test_loss": 5.208927967834473, + "test_acc": 0.01, + "lyapunov": 1.5421383124788095, + "grad_norm": 0.10919909006363937, + "grad_max_sv": 0.0032654264010488986, + "grad_min_sv": 0.0, + "grad_condition": 3265426401.048898, + "lr": 0.00037565505641757235, + "time_sec": 86.81736421585083 + }, + { + "epoch": 88, + "train_loss": 5.318348231048584, + "train_acc": 0.00918, + "test_loss": 4.997183460998535, + "test_acc": 0.01, + "lyapunov": 1.5415247068990527, + "grad_norm": 0.11341200364232766, + "grad_max_sv": 0.006511487392708659, + "grad_min_sv": 0.0, + "grad_condition": 6511487392.708659, + "lr": 0.00036554008969236695, + "time_sec": 86.82162237167358 + }, + { + "epoch": 89, + "train_loss": 5.318816225433349, + "train_acc": 0.00892, + "test_loss": 5.18877671661377, + "test_acc": 0.01, + "lyapunov": 1.5420374519684736, + "grad_norm": 0.12034783892609052, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003554841015277638, + "time_sec": 86.97105526924133 + }, + { + "epoch": 90, + "train_loss": 5.318523200531006, + "train_acc": 0.00938, + "test_loss": 5.115398947143555, + "test_acc": 0.01, + "lyapunov": 1.5415691600736146, + "grad_norm": 0.14346849260322833, + "grad_max_sv": 0.02495567239820957, + "grad_min_sv": 0.0, + "grad_condition": 24955672398.20957, + "lr": 0.000345491502812526, + "time_sec": 86.88058757781982 + }, + { + "epoch": 91, + "train_loss": 5.318174597930908, + "train_acc": 0.00928, + "test_loss": 5.025017410278321, + "test_acc": 0.01, + "lyapunov": 1.5413767959150817, + "grad_norm": 0.12564666917462933, + "grad_max_sv": 0.0075723147485405205, + "grad_min_sv": 0.0, + "grad_condition": 7572314748.540522, + "lr": 0.0003355666766307081, + "time_sec": 86.85795545578003 + }, + { + "epoch": 92, + "train_loss": 5.318962445831299, + "train_acc": 0.00776, + "test_loss": 4.925245237731934, + "test_acc": 0.01, + "lyapunov": 1.5422863734652623, + "grad_norm": 0.12308146620405915, + "grad_max_sv": 0.0013421432580798865, + "grad_min_sv": 0.0, + "grad_condition": 1342143258.0798864, + "lr": 0.00032571397633909225, + "time_sec": 86.79794430732727 + }, + { + "epoch": 93, + "train_loss": 5.327239834136963, + "train_acc": 0.00902, + "test_loss": 5.076303866577148, + "test_acc": 0.01, + "lyapunov": 1.5474630085098775, + "grad_norm": 0.1277051442186759, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766094, + "time_sec": 86.82232332229614 + }, + { + "epoch": 94, + "train_loss": 5.318930770874023, + "train_acc": 0.00872, + "test_loss": 4.880594007110596, + "test_acc": 0.01, + "lyapunov": 1.5422684445100672, + "grad_norm": 0.13600368147480044, + "grad_max_sv": 0.002521184924989939, + "grad_min_sv": 0.0, + "grad_condition": 2521184924.9899387, + "lr": 0.0003062422067739483, + "time_sec": 86.81427669525146 + }, + { + "epoch": 95, + "train_loss": 5.319566112213135, + "train_acc": 0.00978, + "test_loss": 4.991552732849121, + "test_acc": 0.01, + "lyapunov": 1.5428647238885045, + "grad_norm": 0.12437123327866709, + "grad_max_sv": 0.012525724712759256, + "grad_min_sv": 0.0, + "grad_condition": 12525724712.759256, + "lr": 0.00029663167846209965, + "time_sec": 86.81576943397522 + }, + { + "epoch": 96, + "train_loss": 5.321689688720703, + "train_acc": 0.00864, + "test_loss": 4.8253173141479495, + "test_acc": 0.01, + "lyapunov": 1.5444780929619089, + "grad_norm": 0.12565886868121948, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00028711035421746345, + "time_sec": 86.88868856430054 + }, + { + "epoch": 97, + "train_loss": 5.31878070602417, + "train_acc": 0.00896, + "test_loss": 4.881497433471679, + "test_acc": 0.01, + "lyapunov": 1.5421305144839275, + "grad_norm": 0.11716334018301236, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00027768241040753615, + "time_sec": 86.82862520217896 + }, + { + "epoch": 98, + "train_loss": 5.322988173828125, + "train_acc": 0.00888, + "test_loss": 4.762122218322754, + "test_acc": 0.01, + "lyapunov": 1.545472724663327, + "grad_norm": 0.14401618175686975, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00026835198244006903, + "time_sec": 86.81479406356812 + }, + { + "epoch": 99, + "train_loss": 5.318863394622802, + "train_acc": 0.00886, + "test_loss": 4.714427976989746, + "test_acc": 0.01, + "lyapunov": 1.5421699697099378, + "grad_norm": 0.13101580238155278, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002591231629491421, + "time_sec": 86.82360768318176 + }, + { + "epoch": 100, + "train_loss": 5.32177279083252, + "train_acc": 0.00908, + "test_loss": 4.741457105255127, + "test_acc": 0.01, + "lyapunov": 1.5448724360722106, + "grad_norm": 0.12685940692823117, + "grad_max_sv": 0.0014819118659943342, + "grad_min_sv": 0.0, + "grad_condition": 1481911865.9943342, + "lr": 0.0002499999999999997, + "time_sec": 86.83973097801208 + }, + { + "epoch": 101, + "train_loss": 5.321585564422607, + "train_acc": 0.0095, + "test_loss": 4.660526361846924, + "test_acc": 0.01, + "lyapunov": 1.5446103762482744, + "grad_norm": 0.15017654739054603, + "grad_max_sv": 0.013982362765818834, + "grad_min_sv": 0.0, + "grad_condition": 13982362765.818836, + "lr": 0.00024098649531343477, + "time_sec": 86.89186692237854 + }, + { + "epoch": 102, + "train_loss": 5.318927859802246, + "train_acc": 0.00892, + "test_loss": 4.667855642700196, + "test_acc": 0.01, + "lyapunov": 1.542065743900016, + "grad_norm": 0.14354448313759138, + "grad_max_sv": 0.007601975044235587, + "grad_min_sv": 0.0, + "grad_condition": 7601975044.235586, + "lr": 0.0002320866025105016, + "time_sec": 86.85510921478271 + }, + { + "epoch": 103, + "train_loss": 5.319302808380127, + "train_acc": 0.00854, + "test_loss": 4.7306030563354495, + "test_acc": 0.01, + "lyapunov": 1.5426954067576573, + "grad_norm": 0.1222745390564005, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002233042253783278, + "time_sec": 86.83695554733276 + }, + { + "epoch": 104, + "train_loss": 5.3208301354980465, + "train_acc": 0.00928, + "test_loss": 4.6642813407897945, + "test_acc": 0.01, + "lyapunov": 1.5443277465717873, + "grad_norm": 0.12082325206764133, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000214643216157784, + "time_sec": 86.83465480804443 + }, + { + "epoch": 105, + "train_loss": 5.325607220458984, + "train_acc": 0.00868, + "test_loss": 4.797847722625733, + "test_acc": 0.01, + "lyapunov": 1.547427470421852, + "grad_norm": 0.1467365865583852, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376332, + "time_sec": 86.92287278175354 + }, + { + "epoch": 106, + "train_loss": 5.327985736999512, + "train_acc": 0.00948, + "test_loss": 4.780700933837891, + "test_acc": 0.01, + "lyapunov": 1.5493294055504567, + "grad_norm": 0.13200210447777874, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019770044256881242, + "time_sec": 86.93008136749268 + }, + { + "epoch": 107, + "train_loss": 5.319034835205078, + "train_acc": 0.00946, + "test_loss": 4.834465756225586, + "test_acc": 0.01, + "lyapunov": 1.5422752080366129, + "grad_norm": 0.12777999612030252, + "grad_max_sv": 0.02157975882291794, + "grad_min_sv": 0.0, + "grad_condition": 21579758822.91794, + "lr": 0.0001894261098608447, + "time_sec": 86.82852697372437 + }, + { + "epoch": 108, + "train_loss": 5.321411961364746, + "train_acc": 0.00916, + "test_loss": 4.814922105407715, + "test_acc": 0.01, + "lyapunov": 1.544609341475055, + "grad_norm": 0.13197562787736147, + "grad_max_sv": 0.015251889312639832, + "grad_min_sv": 0.0, + "grad_condition": 15251889312.639832, + "lr": 0.000181288005125655, + "time_sec": 86.85191607475281 + }, + { + "epoch": 109, + "train_loss": 5.322899269256592, + "train_acc": 0.00876, + "test_loss": 4.713241914367676, + "test_acc": 0.01, + "lyapunov": 1.54528974267223, + "grad_norm": 0.12828276594838653, + "grad_max_sv": 0.0006727563217282295, + "grad_min_sv": 0.0, + "grad_condition": 672756321.7282295, + "lr": 0.0001732896980049473, + "time_sec": 86.82081818580627 + }, + { + "epoch": 110, + "train_loss": 5.318816036987305, + "train_acc": 0.0094, + "test_loss": 4.679484854125977, + "test_acc": 0.01, + "lyapunov": 1.5422053230388084, + "grad_norm": 0.12847280658733387, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016543469682057076, + "time_sec": 86.9124755859375 + }, + { + "epoch": 111, + "train_loss": 5.318745676116944, + "train_acc": 0.00848, + "test_loss": 4.795034047698975, + "test_acc": 0.01, + "lyapunov": 1.5421484263656695, + "grad_norm": 0.1278982868324375, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 86.83268451690674 + }, + { + "epoch": 112, + "train_loss": 5.318630710906983, + "train_acc": 0.00898, + "test_loss": 4.784210496520996, + "test_acc": 0.01, + "lyapunov": 1.5420354778504433, + "grad_norm": 0.13247976598300262, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 86.79545545578003 + }, + { + "epoch": 113, + "train_loss": 5.318998959655762, + "train_acc": 0.00884, + "test_loss": 4.768862895202637, + "test_acc": 0.01, + "lyapunov": 1.542412842021269, + "grad_norm": 0.13154644614275643, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 86.8436176776886 + }, + { + "epoch": 114, + "train_loss": 5.3237989538574215, + "train_acc": 0.00958, + "test_loss": 4.739323009490967, + "test_acc": 0.01, + "lyapunov": 1.5463786896537333, + "grad_norm": 0.14268776917647705, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00013551568628929425, + "time_sec": 86.84370040893555 + }, + { + "epoch": 115, + "train_loss": 5.321883607025146, + "train_acc": 0.00924, + "test_loss": 4.724630879211426, + "test_acc": 0.01, + "lyapunov": 1.544751648707768, + "grad_norm": 0.13724738045143065, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 86.83514404296875 + }, + { + "epoch": 116, + "train_loss": 5.317745707855225, + "train_acc": 0.00926, + "test_loss": 4.771264694213867, + "test_acc": 0.01, + "lyapunov": 1.5411124830050846, + "grad_norm": 0.13439912972628948, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 86.83839774131775 + }, + { + "epoch": 117, + "train_loss": 5.318638670196533, + "train_acc": 0.00944, + "test_loss": 4.926259418487549, + "test_acc": 0.01, + "lyapunov": 1.5420454350273933, + "grad_norm": 0.1301899172356262, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 86.81545162200928 + }, + { + "epoch": 118, + "train_loss": 5.317975592346191, + "train_acc": 0.0091, + "test_loss": 4.7584453956604005, + "test_acc": 0.01, + "lyapunov": 1.5413338939856995, + "grad_norm": 0.1306510838756953, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010815327133708009, + "time_sec": 86.84224820137024 + }, + { + "epoch": 119, + "train_loss": 5.317512142944336, + "train_acc": 0.00918, + "test_loss": 4.75227194366455, + "test_acc": 0.01, + "lyapunov": 1.5408342912069062, + "grad_norm": 0.13531431192184493, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010173504098790182, + "time_sec": 86.84121561050415 + }, + { + "epoch": 120, + "train_loss": 5.32096346862793, + "train_acc": 0.00916, + "test_loss": 4.783403231811524, + "test_acc": 0.01, + "lyapunov": 1.5443097962747754, + "grad_norm": 0.1366841922730417, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 86.8264012336731 + }, + { + "epoch": 121, + "train_loss": 5.31987023651123, + "train_acc": 0.009, + "test_loss": 4.769460425567627, + "test_acc": 0.01, + "lyapunov": 1.5431054827502317, + "grad_norm": 0.13796061159903233, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 86.83200931549072 + }, + { + "epoch": 122, + "train_loss": 5.317669274597168, + "train_acc": 0.009, + "test_loss": 4.726600196838379, + "test_acc": 0.01, + "lyapunov": 1.5410202537351252, + "grad_norm": 0.13807476351768067, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 86.85096383094788 + }, + { + "epoch": 123, + "train_loss": 5.31959240447998, + "train_acc": 0.00982, + "test_loss": 4.731892253112793, + "test_acc": 0.01, + "lyapunov": 1.5430450296158071, + "grad_norm": 0.14330032241201268, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 86.8001983165741 + }, + { + "epoch": 124, + "train_loss": 5.317501362304688, + "train_acc": 0.00938, + "test_loss": 4.782514060974121, + "test_acc": 0.01, + "lyapunov": 1.540854393673675, + "grad_norm": 0.14059038369574442, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 86.87392091751099 + }, + { + "epoch": 125, + "train_loss": 5.318027396545411, + "train_acc": 0.0095, + "test_loss": 4.765302996826172, + "test_acc": 0.01, + "lyapunov": 1.5414052317514444, + "grad_norm": 0.1418679045184447, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 86.82495832443237 + }, + { + "epoch": 126, + "train_loss": 5.318346632080078, + "train_acc": 0.0092, + "test_loss": 4.7442352600097655, + "test_acc": 0.01, + "lyapunov": 1.5417146911401578, + "grad_norm": 0.142826590523136, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 86.79729580879211 + }, + { + "epoch": 127, + "train_loss": 5.318922318725586, + "train_acc": 0.00974, + "test_loss": 4.76433516998291, + "test_acc": 0.01, + "lyapunov": 1.542423507136762, + "grad_norm": 0.14495446560643363, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 86.93182754516602 + }, + { + "epoch": 128, + "train_loss": 5.318007217102051, + "train_acc": 0.00962, + "test_loss": 4.764061611938477, + "test_acc": 0.01, + "lyapunov": 1.541390145831096, + "grad_norm": 0.14153652471754832, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 86.8191487789154 + }, + { + "epoch": 129, + "train_loss": 5.318092449340821, + "train_acc": 0.00968, + "test_loss": 4.765155668640137, + "test_acc": 0.01, + "lyapunov": 1.5414884422746156, + "grad_norm": 0.14863798950920318, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 86.92294239997864 + }, + { + "epoch": 130, + "train_loss": 5.318419138793946, + "train_acc": 0.00922, + "test_loss": 4.764954615783691, + "test_acc": 0.01, + "lyapunov": 1.541847081745372, + "grad_norm": 0.14422350481698742, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 86.83364939689636 + }, + { + "epoch": 131, + "train_loss": 5.319330998535157, + "train_acc": 0.00984, + "test_loss": 4.749797338867188, + "test_acc": 0.01, + "lyapunov": 1.5428275848593553, + "grad_norm": 0.1575339118534098, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 86.83805966377258 + }, + { + "epoch": 132, + "train_loss": 5.3225936277771, + "train_acc": 0.00944, + "test_loss": 4.753033805847168, + "test_acc": 0.01, + "lyapunov": 1.5456237704552653, + "grad_norm": 0.1459542484301229, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 86.83223581314087 + }, + { + "epoch": 133, + "train_loss": 5.319478280029297, + "train_acc": 0.00904, + "test_loss": 4.726372310638427, + "test_acc": 0.01, + "lyapunov": 1.5427262319628234, + "grad_norm": 0.15430065761057823, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 86.81233429908752 + }, + { + "epoch": 134, + "train_loss": 5.320157431182861, + "train_acc": 0.00978, + "test_loss": 4.729707991790772, + "test_acc": 0.01, + "lyapunov": 1.5434529592314035, + "grad_norm": 0.14953623206124225, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 86.81813621520996 + }, + { + "epoch": 135, + "train_loss": 5.344091755371093, + "train_acc": 0.00992, + "test_loss": 4.742976405334472, + "test_acc": 0.01, + "lyapunov": 1.5575274945524953, + "grad_norm": 0.17021644451164028, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 86.84416842460632 + }, + { + "epoch": 136, + "train_loss": 5.3179564929199215, + "train_acc": 0.01, + "test_loss": 4.757002459716797, + "test_acc": 0.01, + "lyapunov": 1.541358881289392, + "grad_norm": 0.1455320955701897, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 86.83202290534973 + }, + { + "epoch": 137, + "train_loss": 5.319369739990234, + "train_acc": 0.00978, + "test_loss": 4.748977610015869, + "test_acc": 0.01, + "lyapunov": 1.5428897822299577, + "grad_norm": 0.15104084037444107, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 86.81699085235596 + }, + { + "epoch": 138, + "train_loss": 5.318675216522217, + "train_acc": 0.01, + "test_loss": 4.713645321655274, + "test_acc": 0.01, + "lyapunov": 1.5421365197662198, + "grad_norm": 0.14694031631290994, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 86.8898720741272 + }, + { + "epoch": 139, + "train_loss": 5.318637705383301, + "train_acc": 0.01, + "test_loss": 4.743732140350342, + "test_acc": 0.01, + "lyapunov": 1.5420801776754276, + "grad_norm": 0.15086340410308036, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 86.82428193092346 + }, + { + "epoch": 140, + "train_loss": 5.318365608825683, + "train_acc": 0.01, + "test_loss": 4.738941632843018, + "test_acc": 0.01, + "lyapunov": 1.5417572262951784, + "grad_norm": 0.1451696630670528, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 86.8176257610321 + }, + { + "epoch": 141, + "train_loss": 5.319074583282471, + "train_acc": 0.01, + "test_loss": 4.743734898376465, + "test_acc": 0.01, + "lyapunov": 1.5425543062522282, + "grad_norm": 0.14883420989990226, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 86.81977844238281 + }, + { + "epoch": 142, + "train_loss": 5.321842821502686, + "train_acc": 0.01, + "test_loss": 4.742512757873535, + "test_acc": 0.01, + "lyapunov": 1.5452124737107846, + "grad_norm": 0.14940314161589946, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 86.9058632850647 + }, + { + "epoch": 143, + "train_loss": 5.323013974456787, + "train_acc": 0.01, + "test_loss": 4.7366528335571285, + "test_acc": 0.01, + "lyapunov": 1.5466468251879564, + "grad_norm": 0.48352294330900464, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 86.8274781703949 + }, + { + "epoch": 144, + "train_loss": 5.322230252380371, + "train_acc": 0.01, + "test_loss": 4.734474227905274, + "test_acc": 0.01, + "lyapunov": 1.5454154453619058, + "grad_norm": 0.15060559526776118, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 86.83571076393127 + }, + { + "epoch": 145, + "train_loss": 5.318391214904785, + "train_acc": 0.01, + "test_loss": 4.740697119140625, + "test_acc": 0.01, + "lyapunov": 1.5418205120984245, + "grad_norm": 0.14599666991367263, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 86.83404302597046 + }, + { + "epoch": 146, + "train_loss": 5.3190992230224605, + "train_acc": 0.01, + "test_loss": 4.740016835021972, + "test_acc": 0.01, + "lyapunov": 1.542624485462218, + "grad_norm": 0.15263702906229243, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 86.86582016944885 + }, + { + "epoch": 147, + "train_loss": 5.318638049316406, + "train_acc": 0.01, + "test_loss": 4.740016804504394, + "test_acc": 0.01, + "lyapunov": 1.542047378352231, + "grad_norm": 0.1501107976108878, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 86.7875075340271 + }, + { + "epoch": 148, + "train_loss": 5.318966191101074, + "train_acc": 0.01, + "test_loss": 4.740017098999023, + "test_acc": 0.01, + "lyapunov": 1.5423082866327231, + "grad_norm": 0.1506843352752174, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 86.85878276824951 + }, + { + "epoch": 149, + "train_loss": 5.318281329040527, + "train_acc": 0.01, + "test_loss": 4.740017213439941, + "test_acc": 0.01, + "lyapunov": 1.5417110215672447, + "grad_norm": 0.14832275166563608, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 87.06339812278748 + }, + { + "epoch": 150, + "train_loss": 5.318742103729248, + "train_acc": 0.01, + "test_loss": 4.740017121887207, + "test_acc": 0.01, + "lyapunov": 1.5422426760958894, + "grad_norm": 0.1485832497803494, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 86.82008957862854 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 5.142427458190918, + "train_acc": 0.01732, + "test_loss": 4.915040765380859, + "test_acc": 0.0102, + "lyapunov": 2.4272339856228253, + "grad_norm": 5.192250161678427, + "grad_max_sv": 4.473296946287155, + "grad_min_sv": 8.955331335380733e-08, + "grad_condition": 71327028.89068338, + "lr": 0.0009998903417374227, + "time_sec": 132.13672518730164 + }, + { + "epoch": 2, + "train_loss": 4.874939300842285, + "train_acc": 0.01776, + "test_loss": 4.858658763122558, + "test_acc": 0.0123, + "lyapunov": 1.9352691591243305, + "grad_norm": 3.5048458101816564, + "grad_max_sv": 2.842214399576187, + "grad_min_sv": 5.994522662700064e-08, + "grad_condition": 56014607.037285045, + "lr": 0.0009995614150494292, + "time_sec": 132.1895821094513 + }, + { + "epoch": 3, + "train_loss": 4.780418332366944, + "train_acc": 0.01696, + "test_loss": 5.036572162628174, + "test_acc": 0.013, + "lyapunov": 1.6941773053020468, + "grad_norm": 2.3576536383434044, + "grad_max_sv": 1.8239452183246612, + "grad_min_sv": 3.909134313473395e-08, + "grad_condition": 54665529.32274648, + "lr": 0.0009990133642141358, + "time_sec": 132.14293670654297 + }, + { + "epoch": 4, + "train_loss": 4.74106760559082, + "train_acc": 0.0156, + "test_loss": 4.614977532958984, + "test_acc": 0.01, + "lyapunov": 1.667667641359217, + "grad_norm": 1.2834888351442275, + "grad_max_sv": 0.7230008448474109, + "grad_min_sv": 1.1444949870584092e-08, + "grad_condition": 21641297318.53074, + "lr": 0.0009982464296247522, + "time_sec": 132.18336057662964 + }, + { + "epoch": 5, + "train_loss": 4.765737413482666, + "train_acc": 0.01652, + "test_loss": 5.099783699798584, + "test_acc": 0.01, + "lyapunov": 1.6692155538617497, + "grad_norm": 0.6681729594071041, + "grad_max_sv": 0.4321929462254047, + "grad_min_sv": 8.256420696048775e-10, + "grad_condition": 130856413066.44238, + "lr": 0.0009972609476841367, + "time_sec": 132.0963535308838 + }, + { + "epoch": 6, + "train_loss": 4.802682023925781, + "train_acc": 0.01584, + "test_loss": 4.645143016052246, + "test_acc": 0.01, + "lyapunov": 1.6541148235121041, + "grad_norm": 0.5601084813828376, + "grad_max_sv": 0.3682811915874481, + "grad_min_sv": 4.4830527621445066e-12, + "grad_condition": 122810946704.98007, + "lr": 0.000996057350657239, + "time_sec": 132.08646774291992 + }, + { + "epoch": 7, + "train_loss": 4.861019936065674, + "train_acc": 0.0145, + "test_loss": 5.0593204246521, + "test_acc": 0.012, + "lyapunov": 1.6806474119196158, + "grad_norm": 0.4786920265962189, + "grad_max_sv": 0.36215363070368767, + "grad_min_sv": 5.403665967264682e-10, + "grad_condition": 157595569273.04913, + "lr": 0.000994636166481494, + "time_sec": 132.12457752227783 + }, + { + "epoch": 8, + "train_loss": 4.906115528869629, + "train_acc": 0.01422, + "test_loss": 4.609849331665039, + "test_acc": 0.01, + "lyapunov": 1.6933349569130431, + "grad_norm": 0.5105557123165358, + "grad_max_sv": 0.2962237525731325, + "grad_min_sv": 1.5893412122574907e-12, + "grad_condition": 162936272535.53033, + "lr": 0.0009929980185352525, + "time_sec": 132.0816192626953 + }, + { + "epoch": 9, + "train_loss": 4.948906524505615, + "train_acc": 0.01298, + "test_loss": 4.606528971099854, + "test_acc": 0.01, + "lyapunov": 1.684294082624528, + "grad_norm": 0.4680820303299784, + "grad_max_sv": 0.2727967657148838, + "grad_min_sv": 6.175172652279376e-13, + "grad_condition": 191797793138.9354, + "lr": 0.0009911436253643444, + "time_sec": 132.09475946426392 + }, + { + "epoch": 10, + "train_loss": 5.001812951354981, + "train_acc": 0.01048, + "test_loss": 4.605593468475342, + "test_acc": 0.01, + "lyapunov": 1.6371012395605102, + "grad_norm": 0.4454332910853826, + "grad_max_sv": 0.06080346256494522, + "grad_min_sv": 1.1174912073463375e-13, + "grad_condition": 43714632849.557816, + "lr": 0.0009890738003669028, + "time_sec": 132.12074422836304 + }, + { + "epoch": 11, + "train_loss": 5.020210814056396, + "train_acc": 0.0096, + "test_loss": 6.067085327148438, + "test_acc": 0.01, + "lyapunov": 1.55058368331636, + "grad_norm": 0.43082604131055474, + "grad_max_sv": 0.221556506305933, + "grad_min_sv": 2.881964604461995e-09, + "grad_condition": 154673733.23759162, + "lr": 0.00098678945143658, + "time_sec": 132.08557748794556 + }, + { + "epoch": 12, + "train_loss": 5.050462992553711, + "train_acc": 0.0094, + "test_loss": 4.605482531738281, + "test_acc": 0.01, + "lyapunov": 1.5398570713789568, + "grad_norm": 0.381893916008903, + "grad_max_sv": 0.2668355040252209, + "grad_min_sv": 3.789388436370445e-09, + "grad_condition": 42311880.80663426, + "lr": 0.0009842915805643154, + "time_sec": 132.05907773971558 + }, + { + "epoch": 13, + "train_loss": 5.067867939758301, + "train_acc": 0.00924, + "test_loss": 4.605311224365234, + "test_acc": 0.01, + "lyapunov": 1.539125974830764, + "grad_norm": 0.1537321432498029, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000981581283398829, + "time_sec": 132.1301724910736 + }, + { + "epoch": 14, + "train_loss": 5.122542482299805, + "train_acc": 0.01028, + "test_loss": 6.089662152862549, + "test_acc": 0.01, + "lyapunov": 1.5396406424929723, + "grad_norm": 0.3505932006709459, + "grad_max_sv": 0.24503438249230386, + "grad_min_sv": 3.2204854292020023e-09, + "grad_condition": 175828681.99119335, + "lr": 0.0009786597487660333, + "time_sec": 132.11422061920166 + }, + { + "epoch": 15, + "train_loss": 5.167975009613037, + "train_acc": 0.00938, + "test_loss": 6.145216786956787, + "test_acc": 0.01, + "lyapunov": 1.5421736868446136, + "grad_norm": 0.460038063194906, + "grad_max_sv": 0.37677369341254235, + "grad_min_sv": 5.061586208499058e-09, + "grad_condition": 83937837.74305013, + "lr": 0.0009755282581475766, + "time_sec": 132.15303254127502 + }, + { + "epoch": 16, + "train_loss": 5.185187667541504, + "train_acc": 0.00964, + "test_loss": 4.605292627716064, + "test_acc": 0.01, + "lyapunov": 1.5415043111347482, + "grad_norm": 0.2749549655041811, + "grad_max_sv": 0.13375916928052903, + "grad_min_sv": 1.7694276155388877e-09, + "grad_condition": 28413171.440939356, + "lr": 0.0009721881851187403, + "time_sec": 132.0988028049469 + }, + { + "epoch": 17, + "train_loss": 5.213513888549805, + "train_acc": 0.00944, + "test_loss": 4.605225193786621, + "test_acc": 0.01, + "lyapunov": 1.5439205886153005, + "grad_norm": 0.15107835674594625, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009686409947459456, + "time_sec": 132.06156492233276 + }, + { + "epoch": 18, + "train_loss": 5.259810456237793, + "train_acc": 0.00946, + "test_loss": 6.243620587158203, + "test_acc": 0.01, + "lyapunov": 1.5492180427321998, + "grad_norm": 0.17993668118393238, + "grad_max_sv": 0.02630040645599365, + "grad_min_sv": 2.2052708131825583e-10, + "grad_condition": 25149159.75180607, + "lr": 0.0009648882429441254, + "time_sec": 132.04172444343567 + }, + { + "epoch": 19, + "train_loss": 5.30400526260376, + "train_acc": 0.01008, + "test_loss": 6.052386779022217, + "test_acc": 0.01, + "lyapunov": 1.544384488974081, + "grad_norm": 0.348063373631547, + "grad_max_sv": 0.2475440863519907, + "grad_min_sv": 2.704030184225853e-09, + "grad_condition": 448939719.83669394, + "lr": 0.00096093157579425, + "time_sec": 132.16821956634521 + }, + { + "epoch": 20, + "train_loss": 5.344405227050781, + "train_acc": 0.0094, + "test_loss": 6.0689891357421875, + "test_acc": 0.01, + "lyapunov": 1.549183475087061, + "grad_norm": 0.3941364600912924, + "grad_max_sv": 0.28380888141691685, + "grad_min_sv": 2.9937321677220295e-09, + "grad_condition": 919686281.1330671, + "lr": 0.0009567727288213001, + "time_sec": 132.13486909866333 + }, + { + "epoch": 21, + "train_loss": 5.342385781860352, + "train_acc": 0.00934, + "test_loss": 5.634283610534668, + "test_acc": 0.01, + "lyapunov": 1.5489524468741454, + "grad_norm": 0.35198337312808664, + "grad_max_sv": 0.2675567839294672, + "grad_min_sv": 2.7506563800988593e-09, + "grad_condition": 137616088.9764635, + "lr": 0.0009524135262330095, + "time_sec": 132.15001010894775 + }, + { + "epoch": 22, + "train_loss": 5.340258148040771, + "train_acc": 0.01038, + "test_loss": 6.047631702423096, + "test_acc": 0.01, + "lyapunov": 1.5503142017232792, + "grad_norm": 0.32912217146899386, + "grad_max_sv": 0.23988064490258693, + "grad_min_sv": 2.0088645359163383e-09, + "grad_condition": 325233106.42990357, + "lr": 0.0009478558801197061, + "time_sec": 132.1328146457672 + }, + { + "epoch": 23, + "train_loss": 5.33926953994751, + "train_acc": 0.00924, + "test_loss": 6.389647571563721, + "test_acc": 0.01, + "lyapunov": 1.5511968355349568, + "grad_norm": 0.3034442087369207, + "grad_max_sv": 0.21002153679728508, + "grad_min_sv": 7.416720458496191e-10, + "grad_condition": 49849833895.91653, + "lr": 0.000943101789615607, + "time_sec": 132.11377239227295 + }, + { + "epoch": 24, + "train_loss": 5.342641763763428, + "train_acc": 0.01046, + "test_loss": 6.151307273101807, + "test_acc": 0.01, + "lyapunov": 1.5519740599805436, + "grad_norm": 0.32351011233615656, + "grad_max_sv": 0.24164889194071293, + "grad_min_sv": 1.9842920796070418e-09, + "grad_condition": 216397157.20139033, + "lr": 0.0009381533400219313, + "time_sec": 132.07816553115845 + }, + { + "epoch": 25, + "train_loss": 5.336951184997559, + "train_acc": 0.00994, + "test_loss": 5.9992121322631835, + "test_acc": 0.01, + "lyapunov": 1.5503220811219471, + "grad_norm": 0.2784195734173852, + "grad_max_sv": 0.19388381093740464, + "grad_min_sv": 2.1356596568026515e-10, + "grad_condition": 108561949775.06238, + "lr": 0.0009330127018922189, + "time_sec": 132.10879969596863 + }, + { + "epoch": 26, + "train_loss": 5.336466632537841, + "train_acc": 0.01006, + "test_loss": 5.7221336074829106, + "test_acc": 0.01, + "lyapunov": 1.5520486011529517, + "grad_norm": 0.24825146645127755, + "grad_max_sv": 0.17286810129880906, + "grad_min_sv": 1.0904332706662028e-12, + "grad_condition": 103853917717.00699, + "lr": 0.000927682130080253, + "time_sec": 132.1171510219574 + }, + { + "epoch": 27, + "train_loss": 5.336693968505859, + "train_acc": 0.00944, + "test_loss": 5.829081159210205, + "test_acc": 0.01, + "lyapunov": 1.5536211549168657, + "grad_norm": 0.23362614927382305, + "grad_max_sv": 0.15823216680437327, + "grad_min_sv": 7.62931019239883e-13, + "grad_condition": 111090272986.05489, + "lr": 0.0009221639627510072, + "time_sec": 132.13189697265625 + }, + { + "epoch": 28, + "train_loss": 5.336333346252442, + "train_acc": 0.01034, + "test_loss": 6.183766918945312, + "test_acc": 0.01, + "lyapunov": 1.5548379052325587, + "grad_norm": 0.2252526539391841, + "grad_max_sv": 0.1425440175458789, + "grad_min_sv": 5.001494019507075e-14, + "grad_condition": 136232139639.80547, + "lr": 0.0009164606203550494, + "time_sec": 132.0898892879486 + }, + { + "epoch": 29, + "train_loss": 5.3385375555419925, + "train_acc": 0.01006, + "test_loss": 18.741441845703125, + "test_acc": 0.01, + "lyapunov": 1.559137857478598, + "grad_norm": 0.24309729358940327, + "grad_max_sv": 0.1129613446071744, + "grad_min_sv": 7.652494146034002e-15, + "grad_condition": 112054629681.63525, + "lr": 0.0009105746045668516, + "time_sec": 132.19855189323425 + }, + { + "epoch": 30, + "train_loss": 5.337543925323486, + "train_acc": 0.00958, + "test_loss": 17.780749963378906, + "test_acc": 0.01, + "lyapunov": 1.5578542255684542, + "grad_norm": 0.22390701226492316, + "grad_max_sv": 0.10281856972724199, + "grad_min_sv": 3.3459312089163837e-15, + "grad_condition": 102453292464.96785, + "lr": 0.0009045084971874733, + "time_sec": 132.09549117088318 + }, + { + "epoch": 31, + "train_loss": 5.33479830078125, + "train_acc": 0.00896, + "test_loss": 18.024621951293945, + "test_acc": 0.01, + "lyapunov": 1.5561083588758697, + "grad_norm": 0.2617176836095928, + "grad_max_sv": 0.0911625299602747, + "grad_min_sv": 1.0217219065908696e-15, + "grad_condition": 91065349161.70517, + "lr": 0.0008982649590120977, + "time_sec": 132.07474184036255 + }, + { + "epoch": 32, + "train_loss": 5.336539338684082, + "train_acc": 0.0096, + "test_loss": 18.656125256347657, + "test_acc": 0.01, + "lyapunov": 1.558475110536951, + "grad_norm": 0.2736415217941262, + "grad_max_sv": 0.08601008746773005, + "grad_min_sv": 8.793854624629887e-16, + "grad_condition": 85922955415.14108, + "lr": 0.0008918467286629196, + "time_sec": 132.10801935195923 + }, + { + "epoch": 33, + "train_loss": 5.346367032775879, + "train_acc": 0.00982, + "test_loss": 16.179306204223632, + "test_acc": 0.01, + "lyapunov": 1.5642947364036384, + "grad_norm": 0.26593824832856844, + "grad_max_sv": 0.11054420564323664, + "grad_min_sv": 1.4557409070313929e-10, + "grad_condition": 86957832407.85573, + "lr": 0.0008852566213878943, + "time_sec": 132.09707188606262 + }, + { + "epoch": 34, + "train_loss": 5.366751658630371, + "train_acc": 0.0095, + "test_loss": 14.5320333984375, + "test_acc": 0.01, + "lyapunov": 1.5604360716422196, + "grad_norm": 0.39203529519334207, + "grad_max_sv": 0.3150600105524063, + "grad_min_sv": 3.335271438415291e-09, + "grad_condition": 437335317.70210946, + "lr": 0.000878497527825878, + "time_sec": 132.12472343444824 + }, + { + "epoch": 35, + "train_loss": 5.3540499374389645, + "train_acc": 0.00914, + "test_loss": 14.636802185058594, + "test_acc": 0.01, + "lyapunov": 1.5606954972762281, + "grad_norm": 0.3377550426065231, + "grad_max_sv": 0.2708315536379814, + "grad_min_sv": 2.616331799126792e-09, + "grad_condition": 145659046.06806198, + "lr": 0.000871572412738697, + "time_sec": 132.10315084457397 + }, + { + "epoch": 36, + "train_loss": 5.350296534576416, + "train_acc": 0.00996, + "test_loss": 15.48446300354004, + "test_acc": 0.01, + "lyapunov": 1.5607713335920173, + "grad_norm": 0.29951473550525415, + "grad_max_sv": 0.24341562166810035, + "grad_min_sv": 1.5972995535181583e-09, + "grad_condition": 1815700162.0467975, + "lr": 0.0008644843137107055, + "time_sec": 132.10273575782776 + }, + { + "epoch": 37, + "train_loss": 5.3520866116333, + "train_acc": 0.00968, + "test_loss": 14.972803247070312, + "test_acc": 0.01, + "lyapunov": 1.5632766884611087, + "grad_norm": 0.33571017690288324, + "grad_max_sv": 0.2274009022861719, + "grad_min_sv": 6.642170352888692e-10, + "grad_condition": 43022286203.22009, + "lr": 0.0008572363398164014, + "time_sec": 132.0913314819336 + }, + { + "epoch": 38, + "train_loss": 5.347811700897217, + "train_acc": 0.00978, + "test_loss": 15.4173666015625, + "test_acc": 0.01, + "lyapunov": 1.5653380673864614, + "grad_norm": 0.23644614014625348, + "grad_max_sv": 0.15670949593186378, + "grad_min_sv": 3.485120328424339e-13, + "grad_condition": 126042108666.44785, + "lr": 0.0008498316702566826, + "time_sec": 132.12694144248962 + }, + { + "epoch": 39, + "train_loss": 5.350918925933838, + "train_acc": 0.01, + "test_loss": 7.349865231323242, + "test_acc": 0.01, + "lyapunov": 1.5639865206330634, + "grad_norm": 0.25831036099968246, + "grad_max_sv": 0.18908596560359, + "grad_min_sv": 3.4109730636612205e-10, + "grad_condition": 109021837331.04056, + "lr": 0.0008422735529643442, + "time_sec": 132.15545773506165 + }, + { + "epoch": 40, + "train_loss": 5.350084358825684, + "train_acc": 0.00968, + "test_loss": 6.699221839904785, + "test_acc": 0.01, + "lyapunov": 1.5618754555197323, + "grad_norm": 0.33240423060946156, + "grad_max_sv": 0.16681117806583642, + "grad_min_sv": 8.354353915913262e-10, + "grad_condition": 29639133022.15968, + "lr": 0.0008345653031794289, + "time_sec": 132.0622968673706 + }, + { + "epoch": 41, + "train_loss": 5.348379842224121, + "train_acc": 0.01014, + "test_loss": 12.351808143615722, + "test_acc": 0.01, + "lyapunov": 1.5626876762760875, + "grad_norm": 0.31832555128145307, + "grad_max_sv": 0.20640474413521587, + "grad_min_sv": 8.66528908347317e-13, + "grad_condition": 129815385507.61075, + "lr": 0.0008267103019950526, + "time_sec": 132.2454056739807 + }, + { + "epoch": 42, + "train_loss": 5.34665752532959, + "train_acc": 0.00974, + "test_loss": 14.07037748260498, + "test_acc": 0.01, + "lyapunov": 1.5655529825278864, + "grad_norm": 0.2561124376145529, + "grad_max_sv": 0.10575219443999231, + "grad_min_sv": 1.9916840597483354e-10, + "grad_condition": 82384130296.00456, + "lr": 0.0008187119948743447, + "time_sec": 132.08385848999023 + }, + { + "epoch": 43, + "train_loss": 5.343207415618896, + "train_acc": 0.0099, + "test_loss": 13.306277600097657, + "test_acc": 0.01, + "lyapunov": 1.5653508831472958, + "grad_norm": 0.19924932372474, + "grad_max_sv": 0.096745721437037, + "grad_min_sv": 1.0061398517570142e-15, + "grad_condition": 96651724250.54889, + "lr": 0.000810573890139155, + "time_sec": 132.13167572021484 + }, + { + "epoch": 44, + "train_loss": 5.345402418518066, + "train_acc": 0.00992, + "test_loss": 7.869494395446777, + "test_acc": 0.01, + "lyapunov": 1.5646309980650996, + "grad_norm": 0.21769658517748566, + "grad_max_sv": 0.13879811409860848, + "grad_min_sv": 1.6053037275992228e-14, + "grad_condition": 135561498479.67575, + "lr": 0.0008022995574311873, + "time_sec": 132.21540069580078 + }, + { + "epoch": 45, + "train_loss": 5.346674517059326, + "train_acc": 0.00986, + "test_loss": 11.400154348754883, + "test_acc": 0.01, + "lyapunov": 1.5669585390164114, + "grad_norm": 0.21055278107954878, + "grad_max_sv": 0.12050471100956202, + "grad_min_sv": 1.448653245665297e-14, + "grad_condition": 117784195175.33076, + "lr": 0.0007938926261462363, + "time_sec": 132.13598537445068 + }, + { + "epoch": 46, + "train_loss": 5.350086312103271, + "train_acc": 0.00912, + "test_loss": 11.996928524780273, + "test_acc": 0.01, + "lyapunov": 1.5701792279777624, + "grad_norm": 0.21008620048452556, + "grad_max_sv": 0.08796360064297915, + "grad_min_sv": 3.893309181110675e-16, + "grad_condition": 87925759209.02908, + "lr": 0.0007853567838422158, + "time_sec": 132.10033679008484 + }, + { + "epoch": 47, + "train_loss": 5.342350235290527, + "train_acc": 0.0087, + "test_loss": 10.970650772094727, + "test_acc": 0.01, + "lyapunov": 1.564373235263483, + "grad_norm": 0.1731163774631187, + "grad_max_sv": 0.08237459398806095, + "grad_min_sv": 2.1940905206855015e-16, + "grad_condition": 82355183433.8488, + "lr": 0.0007766957746216719, + "time_sec": 132.1089198589325 + }, + { + "epoch": 48, + "train_loss": 5.34227012512207, + "train_acc": 0.00988, + "test_loss": 11.343988357543946, + "test_acc": 0.01, + "lyapunov": 1.5652936489685723, + "grad_norm": 0.16074333900064897, + "grad_max_sv": 0.07524463571608067, + "grad_min_sv": 4.129742513509048e-34, + "grad_condition": 75244635716.08066, + "lr": 0.0007679133974894982, + "time_sec": 132.16328692436218 + }, + { + "epoch": 49, + "train_loss": 5.344108670349121, + "train_acc": 0.00988, + "test_loss": 11.356095449829102, + "test_acc": 0.01, + "lyapunov": 1.5667558609677092, + "grad_norm": 0.15860129770355044, + "grad_max_sv": 0.07414976768195629, + "grad_min_sv": 2.920054218147879e-21, + "grad_condition": 74149767435.12958, + "lr": 0.000759013504686565, + "time_sec": 132.1159553527832 + }, + { + "epoch": 50, + "train_loss": 5.3415603378295895, + "train_acc": 0.00976, + "test_loss": 11.700657446289062, + "test_acc": 0.01, + "lyapunov": 1.5651936311551067, + "grad_norm": 0.14626453498485173, + "grad_max_sv": 0.05773629667237401, + "grad_min_sv": 7.389830128226318e-40, + "grad_condition": 57736296672.37401, + "lr": 0.0007499999999999998, + "time_sec": 132.10842418670654 + }, + { + "epoch": 51, + "train_loss": 5.345499488220215, + "train_acc": 0.0091, + "test_loss": 7.841943490600586, + "test_acc": 0.01, + "lyapunov": 1.5647823362399245, + "grad_norm": 0.19931882783012003, + "grad_max_sv": 0.13148421347141265, + "grad_min_sv": 1.1399481724407015e-14, + "grad_condition": 129966725437.33623, + "lr": 0.0007408768370508575, + "time_sec": 132.13836026191711 + }, + { + "epoch": 52, + "train_loss": 5.346541320800781, + "train_acc": 0.01036, + "test_loss": 8.251887129211426, + "test_acc": 0.01, + "lyapunov": 1.565840955280587, + "grad_norm": 0.21227656722607438, + "grad_max_sv": 0.14938069488853217, + "grad_min_sv": 2.1186636603898966e-14, + "grad_condition": 146306194841.0702, + "lr": 0.0007316480175599307, + "time_sec": 132.21652913093567 + }, + { + "epoch": 53, + "train_loss": 5.346332246856689, + "train_acc": 0.00998, + "test_loss": 8.80145364074707, + "test_acc": 0.01, + "lyapunov": 1.5666624332023094, + "grad_norm": 0.2018507800384921, + "grad_max_sv": 0.12567667234688998, + "grad_min_sv": 4.6990583254762225e-15, + "grad_condition": 125036911617.91772, + "lr": 0.0007223175895924635, + "time_sec": 132.1492202281952 + }, + { + "epoch": 54, + "train_loss": 5.344240028381348, + "train_acc": 0.0096, + "test_loss": 8.331844716644287, + "test_acc": 0.01, + "lyapunov": 1.5653653464963675, + "grad_norm": 0.1977193203709713, + "grad_max_sv": 0.12096917647868395, + "grad_min_sv": 2.717621440740357e-15, + "grad_condition": 120646434306.70581, + "lr": 0.0007128896457825361, + "time_sec": 132.13583779335022 + }, + { + "epoch": 55, + "train_loss": 5.34588626373291, + "train_acc": 0.00938, + "test_loss": 8.483297344970703, + "test_acc": 0.01, + "lyapunov": 1.5671809872093103, + "grad_norm": 0.17917342896025326, + "grad_max_sv": 0.10660264752805233, + "grad_min_sv": 2.903017749905976e-15, + "grad_condition": 106288369212.58371, + "lr": 0.0007033683215378998, + "time_sec": 132.12570214271545 + }, + { + "epoch": 56, + "train_loss": 5.347936657714844, + "train_acc": 0.00928, + "test_loss": 12.471004583740234, + "test_acc": 0.01, + "lyapunov": 1.5704145821768913, + "grad_norm": 0.1585992442529963, + "grad_max_sv": 0.05894996239803731, + "grad_min_sv": 4.065829085829974e-17, + "grad_condition": 58945476044.698166, + "lr": 0.0006937577932260512, + "time_sec": 132.08077478408813 + }, + { + "epoch": 57, + "train_loss": 5.350657684173584, + "train_acc": 0.00942, + "test_loss": 11.975766296386718, + "test_acc": 0.01, + "lyapunov": 1.572284730803936, + "grad_norm": 0.16329462100720574, + "grad_max_sv": 0.018565936107188465, + "grad_min_sv": 0.0, + "grad_condition": 18565936107.188465, + "lr": 0.0006840622763423388, + "time_sec": 132.12146091461182 + }, + { + "epoch": 58, + "train_loss": 5.342193555297851, + "train_acc": 0.00952, + "test_loss": 12.00783012084961, + "test_acc": 0.01, + "lyapunov": 1.5669191542183956, + "grad_norm": 0.13144150243285688, + "grad_max_sv": 0.014100767159834503, + "grad_min_sv": 0.0, + "grad_condition": 14100767159.834503, + "lr": 0.0006742860236609073, + "time_sec": 132.0214581489563 + }, + { + "epoch": 59, + "train_loss": 5.349671448669434, + "train_acc": 0.0097, + "test_loss": 12.08228343963623, + "test_acc": 0.01, + "lyapunov": 1.5733529234786168, + "grad_norm": 0.15236031303960995, + "grad_max_sv": 0.002432991983368993, + "grad_min_sv": 0.0, + "grad_condition": 2432991983.368993, + "lr": 0.0006644333233692913, + "time_sec": 131.98429799079895 + }, + { + "epoch": 60, + "train_loss": 5.343136109619141, + "train_acc": 0.00986, + "test_loss": 10.815134619140625, + "test_acc": 0.01, + "lyapunov": 1.567219941207515, + "grad_norm": 0.13665097355727693, + "grad_max_sv": 0.03331217863596976, + "grad_min_sv": 4.039363544528912e-19, + "grad_condition": 33312131775.42389, + "lr": 0.0006545084971874734, + "time_sec": 132.03068280220032 + }, + { + "epoch": 61, + "train_loss": 5.344384336853027, + "train_acc": 0.01022, + "test_loss": 11.902839001464844, + "test_acc": 0.01, + "lyapunov": 1.5653783214061767, + "grad_norm": 0.18581223375617745, + "grad_max_sv": 0.11722703091800213, + "grad_min_sv": 1.8473140836599877e-15, + "grad_condition": 117024266905.12569, + "lr": 0.0006445158984722354, + "time_sec": 132.11943864822388 + }, + { + "epoch": 62, + "train_loss": 5.346207113494873, + "train_acc": 0.00964, + "test_loss": 10.298070428466797, + "test_acc": 0.01, + "lyapunov": 1.5678635116123483, + "grad_norm": 0.17212702314261866, + "grad_max_sv": 0.11003287564963102, + "grad_min_sv": 1.1830899390639064e-16, + "grad_condition": 110021246721.88094, + "lr": 0.0006344599103076324, + "time_sec": 132.09185695648193 + }, + { + "epoch": 63, + "train_loss": 5.345449805297852, + "train_acc": 0.00958, + "test_loss": 9.716324475097656, + "test_acc": 0.01, + "lyapunov": 1.5676089863643012, + "grad_norm": 0.15858824070117938, + "grad_max_sv": 0.09742239024490118, + "grad_min_sv": 2.2791221237746455e-16, + "grad_condition": 97400387801.48373, + "lr": 0.0006243449435824269, + "time_sec": 132.09884762763977 + }, + { + "epoch": 64, + "train_loss": 5.347441923828125, + "train_acc": 0.01, + "test_loss": 9.248421519470215, + "test_acc": 0.01, + "lyapunov": 1.5703948257524338, + "grad_norm": 0.14831464239510592, + "grad_max_sv": 0.07895854022353888, + "grad_min_sv": 1.0966957298749494e-34, + "grad_condition": 78958540223.53888, + "lr": 0.0006141754350553275, + "time_sec": 132.1075723171234 + }, + { + "epoch": 65, + "train_loss": 5.3479963973999025, + "train_acc": 0.00918, + "test_loss": 11.96562194519043, + "test_acc": 0.01, + "lyapunov": 1.5711398328966497, + "grad_norm": 0.13907361248234446, + "grad_max_sv": 0.06278349282220005, + "grad_min_sv": 0.0, + "grad_condition": 62783492822.20006, + "lr": 0.0006039558454088793, + "time_sec": 132.1277093887329 + }, + { + "epoch": 66, + "train_loss": 5.343847501678467, + "train_acc": 0.00942, + "test_loss": 10.723486402893066, + "test_acc": 0.01, + "lyapunov": 1.5666573139102868, + "grad_norm": 0.1348401569471477, + "grad_max_sv": 0.07675737962126732, + "grad_min_sv": 0.0, + "grad_condition": 76757379621.2673, + "lr": 0.000593690657292862, + "time_sec": 132.15379786491394 + }, + { + "epoch": 67, + "train_loss": 5.348686145477295, + "train_acc": 0.00928, + "test_loss": 9.169928652954102, + "test_acc": 0.01, + "lyapunov": 1.5714481184854532, + "grad_norm": 0.16082287392865435, + "grad_max_sv": 0.09281166503205895, + "grad_min_sv": 4.119931040700715e-29, + "grad_condition": 92811665032.05894, + "lr": 0.0005833843733580507, + "time_sec": 132.15499711036682 + }, + { + "epoch": 68, + "train_loss": 5.346614480133057, + "train_acc": 0.01036, + "test_loss": 9.111311894226073, + "test_acc": 0.01, + "lyapunov": 1.5694071944717252, + "grad_norm": 0.15530027367743043, + "grad_max_sv": 0.09021252328529954, + "grad_min_sv": 9.645277459794148e-41, + "grad_condition": 90212523285.29953, + "lr": 0.0005730415142812054, + "time_sec": 132.0900914669037 + }, + { + "epoch": 69, + "train_loss": 5.345042231140137, + "train_acc": 0.0094, + "test_loss": 8.921395944213867, + "test_acc": 0.01, + "lyapunov": 1.5690713626954256, + "grad_norm": 0.12882941842915957, + "grad_max_sv": 0.05447775078937411, + "grad_min_sv": 0.0, + "grad_condition": 54477750789.374115, + "lr": 0.0005626666167821517, + "time_sec": 132.08048009872437 + }, + { + "epoch": 70, + "train_loss": 5.35093121887207, + "train_acc": 0.00998, + "test_loss": 9.45476280517578, + "test_acc": 0.01, + "lyapunov": 1.5726936317770683, + "grad_norm": 0.15278112356314727, + "grad_max_sv": 0.05165710533037782, + "grad_min_sv": 0.0, + "grad_condition": 51657105330.377815, + "lr": 0.0005522642316338265, + "time_sec": 132.26694178581238 + }, + { + "epoch": 71, + "train_loss": 5.349324496612549, + "train_acc": 0.0099, + "test_loss": 8.863416375732422, + "test_acc": 0.01, + "lyapunov": 1.572835110642416, + "grad_norm": 0.13044312395716468, + "grad_max_sv": 0.040168187906965615, + "grad_min_sv": 0.0, + "grad_condition": 40168187906.965614, + "lr": 0.0005418389216661573, + "time_sec": 132.09336495399475 + }, + { + "epoch": 72, + "train_loss": 5.344522937774658, + "train_acc": 0.0098, + "test_loss": 8.490674835205079, + "test_acc": 0.01, + "lyapunov": 1.5687179925191739, + "grad_norm": 0.12245301057298638, + "grad_max_sv": 0.05633250158280134, + "grad_min_sv": 0.0, + "grad_condition": 56332501582.801346, + "lr": 0.0005313952597646563, + "time_sec": 132.10885214805603 + }, + { + "epoch": 73, + "train_loss": 5.344547733154297, + "train_acc": 0.0097, + "test_loss": 8.686578596496583, + "test_acc": 0.01, + "lyapunov": 1.5687794383529508, + "grad_norm": 0.11446001541385904, + "grad_max_sv": 0.049419266358017924, + "grad_min_sv": 0.0, + "grad_condition": 49419266358.01792, + "lr": 0.0005209378268645994, + "time_sec": 132.04956126213074 + }, + { + "epoch": 74, + "train_loss": 5.3437795330810545, + "train_acc": 0.0094, + "test_loss": 8.874914520263673, + "test_acc": 0.01, + "lyapunov": 1.5682151988339241, + "grad_norm": 0.1237497118091755, + "grad_max_sv": 0.03953348807990551, + "grad_min_sv": 0.0, + "grad_condition": 39533488079.9055, + "lr": 0.0005104712099416781, + "time_sec": 132.10020518302917 + }, + { + "epoch": 75, + "train_loss": 5.343674107208252, + "train_acc": 0.0092, + "test_loss": 8.772430587768556, + "test_acc": 0.01, + "lyapunov": 1.5683565054403241, + "grad_norm": 0.11349041239477198, + "grad_max_sv": 0.026115051889792084, + "grad_min_sv": 0.0, + "grad_condition": 26115051889.792084, + "lr": 0.0004999999999999996, + "time_sec": 132.01686429977417 + }, + { + "epoch": 76, + "train_loss": 5.342641368255615, + "train_acc": 0.00932, + "test_loss": 8.705339865112304, + "test_acc": 0.01, + "lyapunov": 1.5662559923308585, + "grad_norm": 0.12277695191025612, + "grad_max_sv": 0.0629763058386743, + "grad_min_sv": 0.0, + "grad_condition": 62976305838.67432, + "lr": 0.0004895287900583212, + "time_sec": 132.05883979797363 + }, + { + "epoch": 77, + "train_loss": 5.341884041595459, + "train_acc": 0.00968, + "test_loss": 9.93609327545166, + "test_acc": 0.01, + "lyapunov": 1.566317234502729, + "grad_norm": 0.11484157346336721, + "grad_max_sv": 0.047401683824136856, + "grad_min_sv": 0.0, + "grad_condition": 47401683824.136856, + "lr": 0.0004790621731353997, + "time_sec": 132.05576992034912 + }, + { + "epoch": 78, + "train_loss": 5.343069399871826, + "train_acc": 0.0102, + "test_loss": 8.943976522827148, + "test_acc": 0.01, + "lyapunov": 1.5676431427221469, + "grad_norm": 0.10629466820483455, + "grad_max_sv": 0.034334157966077326, + "grad_min_sv": 0.0, + "grad_condition": 34334157966.077324, + "lr": 0.000468604740235343, + "time_sec": 132.03219604492188 + }, + { + "epoch": 79, + "train_loss": 5.342923241119385, + "train_acc": 0.00894, + "test_loss": 10.30071854095459, + "test_acc": 0.01, + "lyapunov": 1.5677035571364186, + "grad_norm": 0.11729853273385192, + "grad_max_sv": 0.018184055807068944, + "grad_min_sv": 0.0, + "grad_condition": 18184055807.068947, + "lr": 0.00045816107833384175, + "time_sec": 132.0335590839386 + }, + { + "epoch": 80, + "train_loss": 5.342889130249024, + "train_acc": 0.00868, + "test_loss": 9.292682635498046, + "test_acc": 0.01, + "lyapunov": 1.5676629153054085, + "grad_norm": 0.10602422228730526, + "grad_max_sv": 0.022180042415857314, + "grad_min_sv": 0.0, + "grad_condition": 22180042415.857315, + "lr": 0.0004477357683661729, + "time_sec": 132.04535913467407 + }, + { + "epoch": 81, + "train_loss": 5.3435448347473145, + "train_acc": 0.01026, + "test_loss": 10.646222018432617, + "test_acc": 0.01, + "lyapunov": 1.5682694253409306, + "grad_norm": 0.10584507536046345, + "grad_max_sv": 0.036097540194168685, + "grad_min_sv": 0.0, + "grad_condition": 36097540194.168686, + "lr": 0.00043733338321784746, + "time_sec": 132.0792417526245 + }, + { + "epoch": 82, + "train_loss": 5.346409954376221, + "train_acc": 0.00938, + "test_loss": 8.388480964660644, + "test_acc": 0.01, + "lyapunov": 1.5704751517766578, + "grad_norm": 0.1594968968610417, + "grad_max_sv": 0.05689305039122701, + "grad_min_sv": 0.0, + "grad_condition": 56893050391.227005, + "lr": 0.0004269584857187939, + "time_sec": 132.10688591003418 + }, + { + "epoch": 83, + "train_loss": 5.351143104705811, + "train_acc": 0.00934, + "test_loss": 10.536403848266602, + "test_acc": 0.01, + "lyapunov": 1.57418333660916, + "grad_norm": 0.14631187426937112, + "grad_max_sv": 0.043841119017452, + "grad_min_sv": 0.0, + "grad_condition": 43841119017.451996, + "lr": 0.0004166156266419484, + "time_sec": 132.08924984931946 + }, + { + "epoch": 84, + "train_loss": 5.345183093261719, + "train_acc": 0.00942, + "test_loss": 11.133738461303711, + "test_acc": 0.01, + "lyapunov": 1.5697272662311563, + "grad_norm": 0.11663908627078753, + "grad_max_sv": 0.04061344410292804, + "grad_min_sv": 0.0, + "grad_condition": 40613444102.92804, + "lr": 0.0004063093427071373, + "time_sec": 132.13465809822083 + }, + { + "epoch": 85, + "train_loss": 5.346176763000488, + "train_acc": 0.01038, + "test_loss": 11.12772626953125, + "test_acc": 0.01, + "lyapunov": 1.5703431422753102, + "grad_norm": 0.1377494846746287, + "grad_max_sv": 0.026653958344832064, + "grad_min_sv": 0.0, + "grad_condition": 26653958344.83206, + "lr": 0.0003960441545911199, + "time_sec": 132.03662395477295 + }, + { + "epoch": 86, + "train_loss": 5.343412326202393, + "train_acc": 0.00966, + "test_loss": 10.485674588012696, + "test_acc": 0.01, + "lyapunov": 1.568256547383945, + "grad_norm": 0.11507124566756707, + "grad_max_sv": 0.015460054902359844, + "grad_min_sv": 0.0, + "grad_condition": 15460054902.359842, + "lr": 0.0003858245649446718, + "time_sec": 132.30029678344727 + }, + { + "epoch": 87, + "train_loss": 5.343340453948975, + "train_acc": 0.0093, + "test_loss": 10.443886459350585, + "test_acc": 0.01, + "lyapunov": 1.5683554758501175, + "grad_norm": 0.11491345749975401, + "grad_max_sv": 0.01923052747733891, + "grad_min_sv": 0.0, + "grad_condition": 19230527477.33891, + "lr": 0.00037565505641757235, + "time_sec": 132.09554266929626 + }, + { + "epoch": 88, + "train_loss": 5.343219871826172, + "train_acc": 0.00982, + "test_loss": 9.331489477539062, + "test_acc": 0.01, + "lyapunov": 1.5680722632371555, + "grad_norm": 0.10357957499765331, + "grad_max_sv": 0.03583596190437675, + "grad_min_sv": 0.0, + "grad_condition": 35835961904.37675, + "lr": 0.00036554008969236695, + "time_sec": 132.38618564605713 + }, + { + "epoch": 89, + "train_loss": 5.345059629974365, + "train_acc": 0.00942, + "test_loss": 9.705012353515626, + "test_acc": 0.01, + "lyapunov": 1.5701254081848028, + "grad_norm": 0.13335748884903612, + "grad_max_sv": 0.01991720902733505, + "grad_min_sv": 0.0, + "grad_condition": 19917209027.335045, + "lr": 0.0003554841015277638, + "time_sec": 132.10200333595276 + }, + { + "epoch": 90, + "train_loss": 5.346582987670899, + "train_acc": 0.00936, + "test_loss": 9.92761245727539, + "test_acc": 0.01, + "lyapunov": 1.570894326395391, + "grad_norm": 0.12917945353905133, + "grad_max_sv": 0.005056336428970099, + "grad_min_sv": 0.0, + "grad_condition": 5056336428.9700985, + "lr": 0.000345491502812526, + "time_sec": 132.01398086547852 + }, + { + "epoch": 91, + "train_loss": 5.343077623138428, + "train_acc": 0.00948, + "test_loss": 9.892114511108398, + "test_acc": 0.01, + "lyapunov": 1.5679589848384223, + "grad_norm": 0.10089565070900397, + "grad_max_sv": 0.024783097906038165, + "grad_min_sv": 0.0, + "grad_condition": 24783097906.038166, + "lr": 0.0003355666766307081, + "time_sec": 132.0552315711975 + }, + { + "epoch": 92, + "train_loss": 5.344612928619385, + "train_acc": 0.00984, + "test_loss": 9.036325561523437, + "test_acc": 0.01, + "lyapunov": 1.5697500227052537, + "grad_norm": 0.13133583896592352, + "grad_max_sv": 0.017823219764977694, + "grad_min_sv": 0.0, + "grad_condition": 17823219764.977695, + "lr": 0.00032571397633909225, + "time_sec": 132.07679438591003 + }, + { + "epoch": 93, + "train_loss": 5.346883224182129, + "train_acc": 0.0096, + "test_loss": 8.63075946044922, + "test_acc": 0.01, + "lyapunov": 1.5719260608448702, + "grad_norm": 0.09641577817960369, + "grad_max_sv": 0.003358140075579286, + "grad_min_sv": 0.0, + "grad_condition": 3358140075.5792856, + "lr": 0.00031593772365766094, + "time_sec": 132.0291886329651 + }, + { + "epoch": 94, + "train_loss": 5.343683553771973, + "train_acc": 0.00968, + "test_loss": 8.73685708618164, + "test_acc": 0.01, + "lyapunov": 1.5686328389760478, + "grad_norm": 0.09724660681276874, + "grad_max_sv": 0.018295074068009853, + "grad_min_sv": 0.0, + "grad_condition": 18295074068.00985, + "lr": 0.0003062422067739483, + "time_sec": 132.12304759025574 + }, + { + "epoch": 95, + "train_loss": 5.343045575866699, + "train_acc": 0.0086, + "test_loss": 8.563214770507813, + "test_acc": 0.01, + "lyapunov": 1.5680832335406252, + "grad_norm": 0.09663765425859253, + "grad_max_sv": 0.0011947159189730882, + "grad_min_sv": 0.0, + "grad_condition": 1194715918.9730883, + "lr": 0.00029663167846209965, + "time_sec": 132.08247256278992 + }, + { + "epoch": 96, + "train_loss": 5.342066871490479, + "train_acc": 0.00906, + "test_loss": 8.190421600341796, + "test_acc": 0.01, + "lyapunov": 1.5670246782205295, + "grad_norm": 0.10563473423950201, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00028711035421746345, + "time_sec": 132.00989890098572 + }, + { + "epoch": 97, + "train_loss": 5.344517989196778, + "train_acc": 0.00956, + "test_loss": 7.861407074737548, + "test_acc": 0.01, + "lyapunov": 1.5693480187974622, + "grad_norm": 0.11742062064295959, + "grad_max_sv": 0.0026324169710278513, + "grad_min_sv": 0.0, + "grad_condition": 2632416971.027851, + "lr": 0.00027768241040753615, + "time_sec": 132.0594036579132 + }, + { + "epoch": 98, + "train_loss": 5.347235653991699, + "train_acc": 0.0093, + "test_loss": 7.575284122467041, + "test_acc": 0.01, + "lyapunov": 1.571171855682607, + "grad_norm": 0.09980977977399007, + "grad_max_sv": 0.02286601336672902, + "grad_min_sv": 0.0, + "grad_condition": 22866013366.729023, + "lr": 0.00026835198244006903, + "time_sec": 132.04233193397522 + }, + { + "epoch": 99, + "train_loss": 5.343029342498779, + "train_acc": 0.00906, + "test_loss": 7.45513014831543, + "test_acc": 0.01, + "lyapunov": 1.5681262549841801, + "grad_norm": 0.09342461116650493, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002591231629491421, + "time_sec": 131.9914095401764 + }, + { + "epoch": 100, + "train_loss": 5.3494312777709965, + "train_acc": 0.00946, + "test_loss": 7.298580384063721, + "test_acc": 0.01, + "lyapunov": 1.573579462897747, + "grad_norm": 0.11907283705246616, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002499999999999997, + "time_sec": 131.99966597557068 + }, + { + "epoch": 101, + "train_loss": 5.342477266693115, + "train_acc": 0.00948, + "test_loss": 7.23597857055664, + "test_acc": 0.01, + "lyapunov": 1.5675478393159559, + "grad_norm": 0.09720728561760718, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00024098649531343477, + "time_sec": 131.99136352539062 + }, + { + "epoch": 102, + "train_loss": 5.341832947845459, + "train_acc": 0.00952, + "test_loss": 6.885648638916016, + "test_acc": 0.01, + "lyapunov": 1.5668759388691933, + "grad_norm": 0.09041804951245885, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002320866025105016, + "time_sec": 131.99253511428833 + }, + { + "epoch": 103, + "train_loss": 5.342141702270508, + "train_acc": 0.00956, + "test_loss": 7.227639694976807, + "test_acc": 0.01, + "lyapunov": 1.5670329186007799, + "grad_norm": 0.09504910369326992, + "grad_max_sv": 0.02663951087743044, + "grad_min_sv": 0.0, + "grad_condition": 26639510877.43044, + "lr": 0.0002233042253783278, + "time_sec": 132.1089026927948 + }, + { + "epoch": 104, + "train_loss": 5.342686755828858, + "train_acc": 0.00952, + "test_loss": 7.590157605743408, + "test_acc": 0.01, + "lyapunov": 1.5676686721079796, + "grad_norm": 0.09647661834231228, + "grad_max_sv": 0.024380091251805423, + "grad_min_sv": 0.0, + "grad_condition": 24380091251.805428, + "lr": 0.000214643216157784, + "time_sec": 132.06964230537415 + }, + { + "epoch": 105, + "train_loss": 5.344026827392578, + "train_acc": 0.0095, + "test_loss": 7.26397318649292, + "test_acc": 0.01, + "lyapunov": 1.569079797895973, + "grad_norm": 0.09462212649965553, + "grad_max_sv": 0.025716999545693398, + "grad_min_sv": 0.0, + "grad_condition": 25716999545.693398, + "lr": 0.00020610737385376332, + "time_sec": 132.05113744735718 + }, + { + "epoch": 106, + "train_loss": 5.343383273925781, + "train_acc": 0.00984, + "test_loss": 7.472719841003418, + "test_acc": 0.01, + "lyapunov": 1.5685262430049574, + "grad_norm": 0.09652945369879859, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019770044256881242, + "time_sec": 132.04551148414612 + }, + { + "epoch": 107, + "train_loss": 5.343959386138916, + "train_acc": 0.00958, + "test_loss": 7.445523268127442, + "test_acc": 0.01, + "lyapunov": 1.5691688893091342, + "grad_norm": 0.11388204494439719, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001894261098608447, + "time_sec": 132.02328181266785 + }, + { + "epoch": 108, + "train_loss": 5.342418379516602, + "train_acc": 0.00956, + "test_loss": 7.7173920944213865, + "test_acc": 0.01, + "lyapunov": 1.5675345683646629, + "grad_norm": 0.09095832390063928, + "grad_max_sv": 0.0006004700437188149, + "grad_min_sv": 0.0, + "grad_condition": 600470043.7188148, + "lr": 0.000181288005125655, + "time_sec": 132.05611062049866 + }, + { + "epoch": 109, + "train_loss": 5.343011405029297, + "train_acc": 0.00944, + "test_loss": 7.669947085571289, + "test_acc": 0.01, + "lyapunov": 1.5680827374958322, + "grad_norm": 0.09262475373763442, + "grad_max_sv": 0.005615572584792972, + "grad_min_sv": 0.0, + "grad_condition": 5615572584.792972, + "lr": 0.0001732896980049473, + "time_sec": 132.0278182029724 + }, + { + "epoch": 110, + "train_loss": 5.343270805511475, + "train_acc": 0.00902, + "test_loss": 7.524606921386718, + "test_acc": 0.01, + "lyapunov": 1.5684265477578048, + "grad_norm": 0.0929528487372896, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016543469682057076, + "time_sec": 132.01432704925537 + }, + { + "epoch": 111, + "train_loss": 5.3430648620605465, + "train_acc": 0.00908, + "test_loss": 7.709186791992187, + "test_acc": 0.01, + "lyapunov": 1.568246929236995, + "grad_norm": 0.08919578457075998, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 131.99741911888123 + }, + { + "epoch": 112, + "train_loss": 5.343547642822266, + "train_acc": 0.00982, + "test_loss": 7.633082518005371, + "test_acc": 0.01, + "lyapunov": 1.56872364535661, + "grad_norm": 0.09053282340492008, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 131.9864740371704 + }, + { + "epoch": 113, + "train_loss": 5.349385154571533, + "train_acc": 0.00926, + "test_loss": 7.402510799407959, + "test_acc": 0.01, + "lyapunov": 1.573695613295221, + "grad_norm": 0.1331401826658418, + "grad_max_sv": 0.007452957844361663, + "grad_min_sv": 0.0, + "grad_condition": 7452957844.361662, + "lr": 0.00014276366018359834, + "time_sec": 131.9871220588684 + }, + { + "epoch": 114, + "train_loss": 5.3475169880676265, + "train_acc": 0.00952, + "test_loss": 7.718253441619873, + "test_acc": 0.01, + "lyapunov": 1.5723201231578428, + "grad_norm": 0.12289444805074258, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00013551568628929425, + "time_sec": 131.98372554779053 + }, + { + "epoch": 115, + "train_loss": 5.344510088806152, + "train_acc": 0.0094, + "test_loss": 7.667512203216552, + "test_acc": 0.01, + "lyapunov": 1.569762335713867, + "grad_norm": 0.09241242910799227, + "grad_max_sv": 0.008661840902641415, + "grad_min_sv": 0.0, + "grad_condition": 8661840902.641415, + "lr": 0.00012842758726130276, + "time_sec": 132.05068254470825 + }, + { + "epoch": 116, + "train_loss": 5.343971741943359, + "train_acc": 0.00908, + "test_loss": 7.700549072265625, + "test_acc": 0.01, + "lyapunov": 1.5691710436130728, + "grad_norm": 0.10830143197848235, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 132.05018138885498 + }, + { + "epoch": 117, + "train_loss": 5.34632839920044, + "train_acc": 0.00976, + "test_loss": 7.761262622070313, + "test_acc": 0.01, + "lyapunov": 1.5713817326309125, + "grad_norm": 0.11435501476976112, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 131.99043989181519 + }, + { + "epoch": 118, + "train_loss": 5.343400028686523, + "train_acc": 0.0092, + "test_loss": 7.794083961486816, + "test_acc": 0.01, + "lyapunov": 1.5685766228019733, + "grad_norm": 0.08899614535065951, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010815327133708009, + "time_sec": 131.99262475967407 + }, + { + "epoch": 119, + "train_loss": 5.343056818084717, + "train_acc": 0.00994, + "test_loss": 7.639262364196777, + "test_acc": 0.01, + "lyapunov": 1.5682302356680946, + "grad_norm": 0.08977728685492378, + "grad_max_sv": 0.0006828804966062307, + "grad_min_sv": 0.0, + "grad_condition": 682880496.6062307, + "lr": 0.00010173504098790182, + "time_sec": 132.01868438720703 + }, + { + "epoch": 120, + "train_loss": 5.343217134552002, + "train_acc": 0.00976, + "test_loss": 7.660574660491943, + "test_acc": 0.01, + "lyapunov": 1.5684062449828438, + "grad_norm": 0.09249377742678497, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 132.00144267082214 + }, + { + "epoch": 121, + "train_loss": 5.344638092651367, + "train_acc": 0.00922, + "test_loss": 7.663163458251953, + "test_acc": 0.01, + "lyapunov": 1.5699151044001665, + "grad_norm": 0.1218726255205378, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 132.01804733276367 + }, + { + "epoch": 122, + "train_loss": 5.348134873046875, + "train_acc": 0.00886, + "test_loss": 7.884050512695312, + "test_acc": 0.01, + "lyapunov": 1.5724969224246872, + "grad_norm": 0.09050076665656355, + "grad_max_sv": 0.006364198122173548, + "grad_min_sv": 0.0, + "grad_condition": 6364198122.173548, + "lr": 8.353937964495024e-05, + "time_sec": 132.0272445678711 + }, + { + "epoch": 123, + "train_loss": 5.345365750579834, + "train_acc": 0.00954, + "test_loss": 7.118724527740478, + "test_acc": 0.01, + "lyapunov": 1.5703083133453604, + "grad_norm": 0.09069370794057488, + "grad_max_sv": 0.011258925357833505, + "grad_min_sv": 0.0, + "grad_condition": 11258925357.833506, + "lr": 7.783603724899243e-05, + "time_sec": 132.11900568008423 + }, + { + "epoch": 124, + "train_loss": 5.3431124142456055, + "train_acc": 0.01036, + "test_loss": 7.23227484741211, + "test_acc": 0.01, + "lyapunov": 1.568215018952899, + "grad_norm": 0.09217613058420869, + "grad_max_sv": 0.022803956363350152, + "grad_min_sv": 0.0, + "grad_condition": 22803956363.35015, + "lr": 7.231786991974666e-05, + "time_sec": 132.04238414764404 + }, + { + "epoch": 125, + "train_loss": 5.343697594146729, + "train_acc": 0.00968, + "test_loss": 7.098866456604004, + "test_acc": 0.01, + "lyapunov": 1.5689014327495605, + "grad_norm": 0.09081931856189392, + "grad_max_sv": 0.0006075550802052021, + "grad_min_sv": 0.0, + "grad_condition": 607555080.2052021, + "lr": 6.698729810778072e-05, + "time_sec": 132.0574872493744 + }, + { + "epoch": 126, + "train_loss": 5.34278548538208, + "train_acc": 0.00934, + "test_loss": 7.256412179565429, + "test_acc": 0.01, + "lyapunov": 1.5679547353778653, + "grad_norm": 0.09038480638705418, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 132.04981470108032 + }, + { + "epoch": 127, + "train_loss": 5.342774636230469, + "train_acc": 0.0091, + "test_loss": 7.211266984558105, + "test_acc": 0.01, + "lyapunov": 1.567944114470421, + "grad_norm": 0.089217745438497, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 132.0332305431366 + }, + { + "epoch": 128, + "train_loss": 5.343552632446289, + "train_acc": 0.00974, + "test_loss": 7.4164355209350585, + "test_acc": 0.01, + "lyapunov": 1.5687480887488636, + "grad_norm": 0.11327584151012998, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 132.0342137813568 + }, + { + "epoch": 129, + "train_loss": 5.343920302124023, + "train_acc": 0.00956, + "test_loss": 7.272874592590332, + "test_acc": 0.01, + "lyapunov": 1.5691817562903285, + "grad_norm": 0.09015948976899717, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 132.10112881660461 + }, + { + "epoch": 130, + "train_loss": 5.3440144625854495, + "train_acc": 0.01, + "test_loss": 7.378188175964356, + "test_acc": 0.01, + "lyapunov": 1.5693023784081344, + "grad_norm": 0.08928317026508968, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 132.07870721817017 + }, + { + "epoch": 131, + "train_loss": 5.343164742889404, + "train_acc": 0.01, + "test_loss": 7.42498392944336, + "test_acc": 0.01, + "lyapunov": 1.5683802131496731, + "grad_norm": 0.08938231829702648, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 132.035484790802 + }, + { + "epoch": 132, + "train_loss": 5.343568996734619, + "train_acc": 0.01, + "test_loss": 7.3698252609252926, + "test_acc": 0.01, + "lyapunov": 1.5688252653307317, + "grad_norm": 0.08905121975076379, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 132.03120112419128 + }, + { + "epoch": 133, + "train_loss": 5.343650721282959, + "train_acc": 0.01, + "test_loss": 7.399177293395996, + "test_acc": 0.01, + "lyapunov": 1.568874374070131, + "grad_norm": 0.08945297165320838, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 132.04973649978638 + }, + { + "epoch": 134, + "train_loss": 5.344010626678466, + "train_acc": 0.01, + "test_loss": 7.451564918518066, + "test_acc": 0.01, + "lyapunov": 1.569275133750018, + "grad_norm": 0.08901909798719944, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 132.0272672176361 + }, + { + "epoch": 135, + "train_loss": 5.3513097511291505, + "train_acc": 0.01, + "test_loss": 7.494620336914062, + "test_acc": 0.01, + "lyapunov": 1.5749251406515956, + "grad_norm": 0.11347426013089548, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 132.07217669487 + }, + { + "epoch": 136, + "train_loss": 5.344121324768066, + "train_acc": 0.01, + "test_loss": 7.466115431976318, + "test_acc": 0.01, + "lyapunov": 1.5693210134725741, + "grad_norm": 0.13961703652050822, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 132.09098315238953 + }, + { + "epoch": 137, + "train_loss": 5.3435055235290525, + "train_acc": 0.01, + "test_loss": 7.356763949584961, + "test_acc": 0.01, + "lyapunov": 1.5687689787286627, + "grad_norm": 0.08881051948095202, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 132.01117372512817 + }, + { + "epoch": 138, + "train_loss": 5.343292431945801, + "train_acc": 0.01, + "test_loss": 7.423162863159179, + "test_acc": 0.01, + "lyapunov": 1.5685121305763263, + "grad_norm": 0.08882639322875942, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 132.0426745414734 + }, + { + "epoch": 139, + "train_loss": 5.345961066894532, + "train_acc": 0.01, + "test_loss": 7.442799024963379, + "test_acc": 0.01, + "lyapunov": 1.5709345974885593, + "grad_norm": 0.11315656196544904, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 132.11658310890198 + }, + { + "epoch": 140, + "train_loss": 5.343492304992676, + "train_acc": 0.01, + "test_loss": 7.444627010345459, + "test_acc": 0.01, + "lyapunov": 1.5687398992840895, + "grad_norm": 0.08884505400987935, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 132.04373836517334 + }, + { + "epoch": 141, + "train_loss": 5.344924531860352, + "train_acc": 0.01, + "test_loss": 7.465608943176269, + "test_acc": 0.01, + "lyapunov": 1.570182631387735, + "grad_norm": 0.0880861679030681, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 132.03311824798584 + }, + { + "epoch": 142, + "train_loss": 5.343007263793945, + "train_acc": 0.01, + "test_loss": 7.4812581214904785, + "test_acc": 0.01, + "lyapunov": 1.5682257471791923, + "grad_norm": 0.08813951319538865, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 132.02575135231018 + }, + { + "epoch": 143, + "train_loss": 5.343106704711914, + "train_acc": 0.01, + "test_loss": 7.437115397644043, + "test_acc": 0.01, + "lyapunov": 1.5683247204631796, + "grad_norm": 0.10158596989760496, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 132.05020785331726 + }, + { + "epoch": 144, + "train_loss": 5.34294032119751, + "train_acc": 0.01, + "test_loss": 7.48037815246582, + "test_acc": 0.01, + "lyapunov": 1.5681621552733205, + "grad_norm": 0.08833317407426634, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 132.06616115570068 + }, + { + "epoch": 145, + "train_loss": 5.3438012377929685, + "train_acc": 0.01, + "test_loss": 7.496150346374511, + "test_acc": 0.01, + "lyapunov": 1.5690925231065287, + "grad_norm": 0.08791012889132134, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 132.04411220550537 + }, + { + "epoch": 146, + "train_loss": 5.342738318328857, + "train_acc": 0.01, + "test_loss": 7.490428826141358, + "test_acc": 0.01, + "lyapunov": 1.5679414330236137, + "grad_norm": 0.08841039102397012, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 132.08523440361023 + }, + { + "epoch": 147, + "train_loss": 5.3446823258972165, + "train_acc": 0.01, + "test_loss": 7.497726692199707, + "test_acc": 0.01, + "lyapunov": 1.5699935627105597, + "grad_norm": 0.08776043049557726, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 132.03058862686157 + }, + { + "epoch": 148, + "train_loss": 5.343377943572998, + "train_acc": 0.01, + "test_loss": 7.49042504272461, + "test_acc": 0.01, + "lyapunov": 1.5686415504006779, + "grad_norm": 0.08845953592324265, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 132.1206715106964 + }, + { + "epoch": 149, + "train_loss": 5.342948052978516, + "train_acc": 0.01, + "test_loss": 7.490426095581054, + "test_acc": 0.01, + "lyapunov": 1.5681962311420294, + "grad_norm": 0.08842267718527619, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 132.15464973449707 + }, + { + "epoch": 150, + "train_loss": 5.341931441345215, + "train_acc": 0.01, + "test_loss": 7.487130715942383, + "test_acc": 0.01, + "lyapunov": 1.567085372822364, + "grad_norm": 0.0882430826444348, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 132.04750204086304 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 5.159331872253418, + "train_acc": 0.01526, + "test_loss": 4.873309817504883, + "test_acc": 0.0093, + "lyapunov": 2.4743038653717626, + "grad_norm": 5.258705722697472, + "grad_max_sv": 4.479718285799026, + "grad_min_sv": 8.709666913797598e-08, + "grad_condition": 86685976.9902235, + "lr": 0.0009998903417374227, + "time_sec": 177.3543930053711 + }, + { + "epoch": 2, + "train_loss": 4.886084578857422, + "train_acc": 0.01782, + "test_loss": 4.853029528808594, + "test_acc": 0.01, + "lyapunov": 1.9916716545744015, + "grad_norm": 3.460383424161388, + "grad_max_sv": 2.7798140585422515, + "grad_min_sv": 5.706028290974885e-08, + "grad_condition": 56364730.82112197, + "lr": 0.0009995614150494292, + "time_sec": 177.3599088191986 + }, + { + "epoch": 3, + "train_loss": 4.784042566375732, + "train_acc": 0.01776, + "test_loss": 4.790321257781982, + "test_acc": 0.0116, + "lyapunov": 1.7964752174704277, + "grad_norm": 2.38204770499042, + "grad_max_sv": 1.8151098906993866, + "grad_min_sv": 3.787766869461917e-08, + "grad_condition": 87913704.86086728, + "lr": 0.0009990133642141358, + "time_sec": 177.30120587348938 + }, + { + "epoch": 4, + "train_loss": 4.7238768682861325, + "train_acc": 0.017, + "test_loss": 4.624422996520996, + "test_acc": 0.01, + "lyapunov": 1.708475301332791, + "grad_norm": 1.1762359291788405, + "grad_max_sv": 0.7854173953674035, + "grad_min_sv": 9.800736290438679e-09, + "grad_condition": 32224269144.49076, + "lr": 0.0009982464296247522, + "time_sec": 177.37837982177734 + }, + { + "epoch": 5, + "train_loss": 4.755855419616699, + "train_acc": 0.01562, + "test_loss": 4.610174011230469, + "test_acc": 0.01, + "lyapunov": 1.675043061871053, + "grad_norm": 0.7259009952417778, + "grad_max_sv": 0.5301507465541363, + "grad_min_sv": 5.1440461827152224e-11, + "grad_condition": 105915112802.73376, + "lr": 0.0009972609476841367, + "time_sec": 177.381986618042 + }, + { + "epoch": 6, + "train_loss": 4.81643141998291, + "train_acc": 0.01288, + "test_loss": 4.60545783996582, + "test_acc": 0.01, + "lyapunov": 1.6532284676876214, + "grad_norm": 0.4607532772533372, + "grad_max_sv": 0.3609377399086952, + "grad_min_sv": 5.305074951633812e-13, + "grad_condition": 279971546429.15295, + "lr": 0.000996057350657239, + "time_sec": 177.434068441391 + }, + { + "epoch": 7, + "train_loss": 4.86136633392334, + "train_acc": 0.01224, + "test_loss": 5.360651237487793, + "test_acc": 0.01, + "lyapunov": 1.6404305040988776, + "grad_norm": 0.3680696909769052, + "grad_max_sv": 0.316419655829668, + "grad_min_sv": 4.076535490995613e-14, + "grad_condition": 307643620830.443, + "lr": 0.000994636166481494, + "time_sec": 177.2750985622406 + }, + { + "epoch": 8, + "train_loss": 4.912417060089111, + "train_acc": 0.01054, + "test_loss": 9.9219926071167, + "test_acc": 0.01, + "lyapunov": 1.6378350980446468, + "grad_norm": 0.4461762738170382, + "grad_max_sv": 0.26778712812811134, + "grad_min_sv": 1.894336000793759e-10, + "grad_condition": 230695726821.5417, + "lr": 0.0009929980185352525, + "time_sec": 177.29276037216187 + }, + { + "epoch": 9, + "train_loss": 4.968367258911133, + "train_acc": 0.00954, + "test_loss": 7.827674491882324, + "test_acc": 0.01, + "lyapunov": 1.624799670465767, + "grad_norm": 0.5375330781925154, + "grad_max_sv": 0.19412051439285277, + "grad_min_sv": 1.2617160814236554e-09, + "grad_condition": 49059473464.09962, + "lr": 0.0009911436253643444, + "time_sec": 177.24522376060486 + }, + { + "epoch": 10, + "train_loss": 5.062082354125977, + "train_acc": 0.01038, + "test_loss": 5.569893667602539, + "test_acc": 0.01, + "lyapunov": 1.6864765662976238, + "grad_norm": 0.753548419446606, + "grad_max_sv": 0.4160853669047356, + "grad_min_sv": 5.35826894499278e-09, + "grad_condition": 10262508595.882322, + "lr": 0.0009890738003669028, + "time_sec": 177.3631317615509 + }, + { + "epoch": 11, + "train_loss": 5.058011302032471, + "train_acc": 0.00952, + "test_loss": 5.087331884002686, + "test_acc": 0.01, + "lyapunov": 1.6062763267770752, + "grad_norm": 0.6603912459051273, + "grad_max_sv": 0.3468701772391796, + "grad_min_sv": 4.421987463785291e-09, + "grad_condition": 31727265214.824364, + "lr": 0.00098678945143658, + "time_sec": 177.38562989234924 + }, + { + "epoch": 12, + "train_loss": 5.058439118957519, + "train_acc": 0.00978, + "test_loss": 5.082496954345703, + "test_acc": 0.01, + "lyapunov": 1.5697322474111377, + "grad_norm": 0.3523516525308902, + "grad_max_sv": 0.15937897935509682, + "grad_min_sv": 1.873834291129129e-09, + "grad_condition": 2759306059.465498, + "lr": 0.0009842915805643154, + "time_sec": 177.36675763130188 + }, + { + "epoch": 13, + "train_loss": 5.109822076416016, + "train_acc": 0.00966, + "test_loss": 5.692898876953125, + "test_acc": 0.01, + "lyapunov": 1.5695562542551924, + "grad_norm": 0.4593422563560374, + "grad_max_sv": 0.35409238263964654, + "grad_min_sv": 4.71099455383317e-09, + "grad_condition": 127958722.61296721, + "lr": 0.000981581283398829, + "time_sec": 177.44806337356567 + }, + { + "epoch": 14, + "train_loss": 5.165816433410645, + "train_acc": 0.01014, + "test_loss": 7.84957985534668, + "test_acc": 0.01, + "lyapunov": 1.5709327590435058, + "grad_norm": 0.5694077536605798, + "grad_max_sv": 0.4453627858310938, + "grad_min_sv": 5.610913853565864e-09, + "grad_condition": 15313856896.7998, + "lr": 0.0009786597487660333, + "time_sec": 177.33772945404053 + }, + { + "epoch": 15, + "train_loss": 5.173155229797363, + "train_acc": 0.00972, + "test_loss": 5.157973370361328, + "test_acc": 0.01, + "lyapunov": 1.5706551062786365, + "grad_norm": 0.43055135839909847, + "grad_max_sv": 0.21150126457214355, + "grad_min_sv": 1.4762666979190565e-09, + "grad_condition": 47799778820.01504, + "lr": 0.0009755282581475766, + "time_sec": 177.33515882492065 + }, + { + "epoch": 16, + "train_loss": 5.207788455657959, + "train_acc": 0.00962, + "test_loss": 7.759160287475586, + "test_acc": 0.01, + "lyapunov": 1.5720331275554569, + "grad_norm": 0.3894440758556563, + "grad_max_sv": 0.1499915760010481, + "grad_min_sv": 1.4193079274022143e-09, + "grad_condition": 19769526881.522236, + "lr": 0.0009721881851187403, + "time_sec": 177.28159952163696 + }, + { + "epoch": 17, + "train_loss": 5.25385222076416, + "train_acc": 0.00914, + "test_loss": 4.720599290466309, + "test_acc": 0.01, + "lyapunov": 1.579244610293747, + "grad_norm": 0.3647403085884025, + "grad_max_sv": 0.17017204388976098, + "grad_min_sv": 1.3479770702114132e-09, + "grad_condition": 29838909132.92096, + "lr": 0.0009686409947459456, + "time_sec": 177.3482620716095 + }, + { + "epoch": 18, + "train_loss": 5.290630603790283, + "train_acc": 0.00966, + "test_loss": 4.818104879760742, + "test_acc": 0.01, + "lyapunov": 1.572280853300753, + "grad_norm": 0.42846936793954693, + "grad_max_sv": 0.2142110202461481, + "grad_min_sv": 2.2586123961791682e-09, + "grad_condition": 6069325065.621381, + "lr": 0.0009648882429441254, + "time_sec": 177.32465243339539 + }, + { + "epoch": 19, + "train_loss": 5.347908495483399, + "train_acc": 0.00976, + "test_loss": 4.680776121520996, + "test_acc": 0.01, + "lyapunov": 1.575872380715197, + "grad_norm": 0.575049551174443, + "grad_max_sv": 0.43422624468803406, + "grad_min_sv": 4.46815191792408e-09, + "grad_condition": 771924430.9754374, + "lr": 0.00096093157579425, + "time_sec": 177.39169430732727 + }, + { + "epoch": 20, + "train_loss": 5.372361971588135, + "train_acc": 0.0092, + "test_loss": 4.661239500427246, + "test_acc": 0.01, + "lyapunov": 1.5752952742149762, + "grad_norm": 0.48504969680471643, + "grad_max_sv": 0.3245972327888012, + "grad_min_sv": 3.24804563384129e-09, + "grad_condition": 111189476.23947105, + "lr": 0.0009567727288213001, + "time_sec": 177.45550775527954 + }, + { + "epoch": 21, + "train_loss": 5.37029109954834, + "train_acc": 0.00994, + "test_loss": 4.667470470428467, + "test_acc": 0.01, + "lyapunov": 1.5776933690775996, + "grad_norm": 0.5453589213556644, + "grad_max_sv": 0.3167274951934814, + "grad_min_sv": 1.839770059066596e-09, + "grad_condition": 35181903296.3187, + "lr": 0.0009524135262330095, + "time_sec": 177.39379477500916 + }, + { + "epoch": 22, + "train_loss": 5.364489818725586, + "train_acc": 0.01004, + "test_loss": 4.650138076782227, + "test_acc": 0.01, + "lyapunov": 1.5788932602728725, + "grad_norm": 0.41535739480122674, + "grad_max_sv": 0.2576656248420477, + "grad_min_sv": 1.5858205317854233e-12, + "grad_condition": 141035021433.30975, + "lr": 0.0009478558801197061, + "time_sec": 177.35208559036255 + }, + { + "epoch": 23, + "train_loss": 5.354643789978027, + "train_acc": 0.0095, + "test_loss": 4.695660099029541, + "test_acc": 0.01, + "lyapunov": 1.5758325334095284, + "grad_norm": 0.30581042910039435, + "grad_max_sv": 0.09805708080530166, + "grad_min_sv": 6.027597976882962e-11, + "grad_condition": 58654490617.71743, + "lr": 0.000943101789615607, + "time_sec": 177.3221151828766 + }, + { + "epoch": 24, + "train_loss": 5.353882457122802, + "train_acc": 0.00926, + "test_loss": 4.697132012939453, + "test_acc": 0.01, + "lyapunov": 1.578979221756196, + "grad_norm": 0.24237849220724425, + "grad_max_sv": 0.008070914912968874, + "grad_min_sv": 0.0, + "grad_condition": 8070914912.968875, + "lr": 0.0009381533400219313, + "time_sec": 177.2640483379364 + }, + { + "epoch": 25, + "train_loss": 5.351721515655518, + "train_acc": 0.00882, + "test_loss": 4.700634111022949, + "test_acc": 0.01, + "lyapunov": 1.5769606035993533, + "grad_norm": 0.299683664855393, + "grad_max_sv": 0.0009750408120453357, + "grad_min_sv": 0.0, + "grad_condition": 975040812.0453358, + "lr": 0.0009330127018922189, + "time_sec": 177.26898193359375 + }, + { + "epoch": 26, + "train_loss": 5.350724313659668, + "train_acc": 0.00882, + "test_loss": 4.976845028686523, + "test_acc": 0.01, + "lyapunov": 1.5759871856635794, + "grad_norm": 0.25282322824422004, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000927682130080253, + "time_sec": 177.23982048034668 + }, + { + "epoch": 27, + "train_loss": 5.3572762519836425, + "train_acc": 0.00916, + "test_loss": 4.699456916046143, + "test_acc": 0.01, + "lyapunov": 1.5826555691716615, + "grad_norm": 0.3870563147260469, + "grad_max_sv": 0.0008042730391025543, + "grad_min_sv": 0.0, + "grad_condition": 804273039.1025543, + "lr": 0.0009221639627510072, + "time_sec": 177.22700691223145 + }, + { + "epoch": 28, + "train_loss": 5.352617038269043, + "train_acc": 0.0083, + "test_loss": 4.97811413192749, + "test_acc": 0.01, + "lyapunov": 1.5779867312487434, + "grad_norm": 0.23788834158418645, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009164606203550494, + "time_sec": 177.21826004981995 + }, + { + "epoch": 29, + "train_loss": 5.361850127716065, + "train_acc": 0.00882, + "test_loss": 4.701448201751709, + "test_acc": 0.01, + "lyapunov": 1.5833598887524032, + "grad_norm": 0.42995748870040046, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009105746045668516, + "time_sec": 177.21908974647522 + }, + { + "epoch": 30, + "train_loss": 5.358213574829102, + "train_acc": 0.00904, + "test_loss": 5.412950395202636, + "test_acc": 0.01, + "lyapunov": 1.5822858404930291, + "grad_norm": 0.331672095140798, + "grad_max_sv": 0.0007659861817955971, + "grad_min_sv": 0.0, + "grad_condition": 765986181.7955971, + "lr": 0.0009045084971874733, + "time_sec": 177.25155925750732 + }, + { + "epoch": 31, + "train_loss": 5.359104016113282, + "train_acc": 0.00934, + "test_loss": 4.669879191589356, + "test_acc": 0.01, + "lyapunov": 1.5799903305595184, + "grad_norm": 0.2952731697889261, + "grad_max_sv": 0.07996195461601019, + "grad_min_sv": 1.8027052930896337e-13, + "grad_condition": 65774856592.69602, + "lr": 0.0008982649590120977, + "time_sec": 177.35512685775757 + }, + { + "epoch": 32, + "train_loss": 5.376470304718017, + "train_acc": 0.0094, + "test_loss": 5.556229885864258, + "test_acc": 0.01, + "lyapunov": 1.5852845087075782, + "grad_norm": 0.34062130802734397, + "grad_max_sv": 0.1435967419296503, + "grad_min_sv": 4.671640446328522e-10, + "grad_condition": 42736336798.66166, + "lr": 0.0008918467286629196, + "time_sec": 177.3573558330536 + }, + { + "epoch": 33, + "train_loss": 5.354219467468262, + "train_acc": 0.00872, + "test_loss": 5.552221805572509, + "test_acc": 0.01, + "lyapunov": 1.5796612647488295, + "grad_norm": 0.24724638679639113, + "grad_max_sv": 0.012037708284333348, + "grad_min_sv": 0.0, + "grad_condition": 12037708284.333347, + "lr": 0.0008852566213878943, + "time_sec": 177.34085536003113 + }, + { + "epoch": 34, + "train_loss": 5.358693110198975, + "train_acc": 0.00966, + "test_loss": 5.034206434631348, + "test_acc": 0.01, + "lyapunov": 1.5802869622969566, + "grad_norm": 0.26366751089242085, + "grad_max_sv": 0.08639110988005996, + "grad_min_sv": 4.474218043386011e-15, + "grad_condition": 85802279590.28976, + "lr": 0.000878497527825878, + "time_sec": 177.4128155708313 + }, + { + "epoch": 35, + "train_loss": 5.366087015075683, + "train_acc": 0.00934, + "test_loss": 4.936266462707519, + "test_acc": 0.01, + "lyapunov": 1.584944297285641, + "grad_norm": 0.3376396372917839, + "grad_max_sv": 0.1203163092955947, + "grad_min_sv": 2.7491684533434274e-14, + "grad_condition": 116380291473.68535, + "lr": 0.000871572412738697, + "time_sec": 177.40404987335205 + }, + { + "epoch": 36, + "train_loss": 5.361581598358154, + "train_acc": 0.01024, + "test_loss": 4.950734414672851, + "test_acc": 0.01, + "lyapunov": 1.5822551268750749, + "grad_norm": 0.35809443213096964, + "grad_max_sv": 0.13039383399300278, + "grad_min_sv": 9.003150469885764e-15, + "grad_condition": 129198667968.56705, + "lr": 0.0008644843137107055, + "time_sec": 177.38117098808289 + }, + { + "epoch": 37, + "train_loss": 5.367499517974854, + "train_acc": 0.00976, + "test_loss": 5.498499377441406, + "test_acc": 0.01, + "lyapunov": 1.58695989923404, + "grad_norm": 0.3008050326299743, + "grad_max_sv": 0.1228790944442153, + "grad_min_sv": 5.822944316845422e-15, + "grad_condition": 122173960457.34317, + "lr": 0.0008572363398164014, + "time_sec": 177.40381455421448 + }, + { + "epoch": 38, + "train_loss": 5.360039620361328, + "train_acc": 0.0097, + "test_loss": 5.010895380401611, + "test_acc": 0.01, + "lyapunov": 1.5823902507572223, + "grad_norm": 0.28800004102415633, + "grad_max_sv": 0.10303753465414048, + "grad_min_sv": 1.7600771723101566e-15, + "grad_condition": 102819314675.69463, + "lr": 0.0008498316702566826, + "time_sec": 177.36353826522827 + }, + { + "epoch": 39, + "train_loss": 5.361895691375732, + "train_acc": 0.00962, + "test_loss": 5.47797232055664, + "test_acc": 0.01, + "lyapunov": 1.5826790979146348, + "grad_norm": 0.3607282899922051, + "grad_max_sv": 0.1270065199583769, + "grad_min_sv": 5.8177677532204334e-15, + "grad_condition": 126306540301.11067, + "lr": 0.0008422735529643442, + "time_sec": 177.36847496032715 + }, + { + "epoch": 40, + "train_loss": 5.360779151458741, + "train_acc": 0.00974, + "test_loss": 4.913441442871094, + "test_acc": 0.01, + "lyapunov": 1.5841997578320905, + "grad_norm": 0.30144541489536497, + "grad_max_sv": 0.08766317497938872, + "grad_min_sv": 3.1235879522614164e-15, + "grad_condition": 87300355595.9631, + "lr": 0.0008345653031794289, + "time_sec": 177.39417672157288 + }, + { + "epoch": 41, + "train_loss": 5.361253643188476, + "train_acc": 0.00952, + "test_loss": 5.392577352905273, + "test_acc": 0.01, + "lyapunov": 1.584902299334631, + "grad_norm": 0.33710076786895654, + "grad_max_sv": 0.07017813064157963, + "grad_min_sv": 1.8795491026783212e-20, + "grad_condition": 70178128751.4103, + "lr": 0.0008267103019950526, + "time_sec": 177.4070680141449 + }, + { + "epoch": 42, + "train_loss": 5.359663697814941, + "train_acc": 0.00966, + "test_loss": 5.435651000976563, + "test_acc": 0.01, + "lyapunov": 1.583795747793544, + "grad_norm": 0.44265142669444985, + "grad_max_sv": 0.06058515841141343, + "grad_min_sv": 8.532913146218004e-39, + "grad_condition": 60585158411.41343, + "lr": 0.0008187119948743447, + "time_sec": 177.301589012146 + }, + { + "epoch": 43, + "train_loss": 5.361796244659423, + "train_acc": 0.0104, + "test_loss": 5.4946890060424805, + "test_acc": 0.01, + "lyapunov": 1.5847100778613858, + "grad_norm": 0.6384686198807327, + "grad_max_sv": 0.08455213336274028, + "grad_min_sv": 1.854097809152722e-15, + "grad_condition": 84328075575.36731, + "lr": 0.000810573890139155, + "time_sec": 177.35142517089844 + }, + { + "epoch": 44, + "train_loss": 5.364447811279297, + "train_acc": 0.01014, + "test_loss": 5.332209419250488, + "test_acc": 0.01, + "lyapunov": 1.5854847031786008, + "grad_norm": 0.675284019586962, + "grad_max_sv": 0.11337836356833578, + "grad_min_sv": 1.7049374807524963e-14, + "grad_condition": 111308573138.52168, + "lr": 0.0008022995574311873, + "time_sec": 177.3521008491516 + }, + { + "epoch": 45, + "train_loss": 5.360489757080078, + "train_acc": 0.00976, + "test_loss": 5.304935124206543, + "test_acc": 0.01, + "lyapunov": 1.5837746992745363, + "grad_norm": 0.5718003616383085, + "grad_max_sv": 0.08602348966524005, + "grad_min_sv": 3.0378301121606614e-16, + "grad_condition": 85997891115.73683, + "lr": 0.0007938926261462363, + "time_sec": 177.33692407608032 + }, + { + "epoch": 46, + "train_loss": 5.361809297485352, + "train_acc": 0.01014, + "test_loss": 4.89552943725586, + "test_acc": 0.01, + "lyapunov": 1.585215172194459, + "grad_norm": 0.44412809114793517, + "grad_max_sv": 0.0825215914286673, + "grad_min_sv": 1.1713936618830865e-15, + "grad_condition": 82407893767.02434, + "lr": 0.0007853567838422158, + "time_sec": 177.35017251968384 + }, + { + "epoch": 47, + "train_loss": 5.361848121795655, + "train_acc": 0.00954, + "test_loss": 4.982022219848633, + "test_acc": 0.01, + "lyapunov": 1.5858572995876108, + "grad_norm": 0.4284143094057381, + "grad_max_sv": 0.06426824014633895, + "grad_min_sv": 5.420102114032563e-18, + "grad_condition": 64267673459.65764, + "lr": 0.0007766957746216719, + "time_sec": 177.3225803375244 + }, + { + "epoch": 48, + "train_loss": 5.360097906646729, + "train_acc": 0.0101, + "test_loss": 5.039643939208984, + "test_acc": 0.01, + "lyapunov": 1.5852815909763736, + "grad_norm": 0.21919166507419222, + "grad_max_sv": 0.02766723851673305, + "grad_min_sv": 0.0, + "grad_condition": 27667238516.73305, + "lr": 0.0007679133974894982, + "time_sec": 177.3571081161499 + }, + { + "epoch": 49, + "train_loss": 5.361355583496094, + "train_acc": 0.00912, + "test_loss": 4.70521968460083, + "test_acc": 0.01, + "lyapunov": 1.587215112603229, + "grad_norm": 0.31401296813167406, + "grad_max_sv": 0.0012400273233652114, + "grad_min_sv": 0.0, + "grad_condition": 1240027323.3652115, + "lr": 0.000759013504686565, + "time_sec": 177.23792433738708 + }, + { + "epoch": 50, + "train_loss": 5.374890024871826, + "train_acc": 0.00998, + "test_loss": 5.3741009857177735, + "test_acc": 0.01, + "lyapunov": 1.5953726881300396, + "grad_norm": 0.3238754552354357, + "grad_max_sv": 0.04934265548363328, + "grad_min_sv": 2.6824701739898724e-33, + "grad_condition": 49342655483.63328, + "lr": 0.0007499999999999998, + "time_sec": 177.3176691532135 + }, + { + "epoch": 51, + "train_loss": 5.359442653961182, + "train_acc": 0.0091, + "test_loss": 5.708284506988526, + "test_acc": 0.01, + "lyapunov": 1.5848879155600468, + "grad_norm": 0.19742833159549178, + "grad_max_sv": 0.019448843877762557, + "grad_min_sv": 4.3389140032583084e-41, + "grad_condition": 19448843877.762554, + "lr": 0.0007408768370508575, + "time_sec": 177.30614399909973 + }, + { + "epoch": 52, + "train_loss": 5.357807418670654, + "train_acc": 0.00892, + "test_loss": 5.598787411499023, + "test_acc": 0.01, + "lyapunov": 1.5835388462866664, + "grad_norm": 0.22895282871195646, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007316480175599307, + "time_sec": 177.23059678077698 + }, + { + "epoch": 53, + "train_loss": 5.364920553588867, + "train_acc": 0.00838, + "test_loss": 5.555523378753662, + "test_acc": 0.01, + "lyapunov": 1.5897833791840108, + "grad_norm": 0.27349172628604307, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007223175895924635, + "time_sec": 177.23636078834534 + }, + { + "epoch": 54, + "train_loss": 5.360137451934815, + "train_acc": 0.00904, + "test_loss": 5.4607298324584965, + "test_acc": 0.01, + "lyapunov": 1.585875649586358, + "grad_norm": 0.3494380261105508, + "grad_max_sv": 0.009265018161386251, + "grad_min_sv": 0.0, + "grad_condition": 9265018161.386251, + "lr": 0.0007128896457825361, + "time_sec": 177.3195767402649 + }, + { + "epoch": 55, + "train_loss": 5.361894327392578, + "train_acc": 0.01076, + "test_loss": 5.3967264434814455, + "test_acc": 0.01, + "lyapunov": 1.5858059591039673, + "grad_norm": 0.32616838064335635, + "grad_max_sv": 0.06554236207157374, + "grad_min_sv": 3.9627266810538444e-22, + "grad_condition": 65542362038.60982, + "lr": 0.0007033683215378998, + "time_sec": 177.4070463180542 + }, + { + "epoch": 56, + "train_loss": 5.361103507232666, + "train_acc": 0.00966, + "test_loss": 5.396138972473144, + "test_acc": 0.01, + "lyapunov": 1.585260014399848, + "grad_norm": 0.24476233592152788, + "grad_max_sv": 0.053304498083889484, + "grad_min_sv": 8.107207506846484e-17, + "grad_condition": 53297506440.79659, + "lr": 0.0006937577932260512, + "time_sec": 177.3034119606018 + }, + { + "epoch": 57, + "train_loss": 5.3623845806884765, + "train_acc": 0.00962, + "test_loss": 5.060037421417237, + "test_acc": 0.01, + "lyapunov": 1.5866734694946758, + "grad_norm": 0.28857632314696974, + "grad_max_sv": 0.06447782786563039, + "grad_min_sv": 1.9607974133287156e-16, + "grad_condition": 64457267604.59035, + "lr": 0.0006840622763423388, + "time_sec": 177.35450506210327 + }, + { + "epoch": 58, + "train_loss": 5.361771304779053, + "train_acc": 0.01002, + "test_loss": 5.0901702087402345, + "test_acc": 0.01, + "lyapunov": 1.586991887873091, + "grad_norm": 0.23271259978105882, + "grad_max_sv": 0.04189403969794512, + "grad_min_sv": 2.1019476964872255e-46, + "grad_condition": 41894039697.945114, + "lr": 0.0006742860236609073, + "time_sec": 177.32643222808838 + }, + { + "epoch": 59, + "train_loss": 5.360649804382324, + "train_acc": 0.00986, + "test_loss": 5.02971961517334, + "test_acc": 0.01, + "lyapunov": 1.5858081442010983, + "grad_norm": 0.25490660325152764, + "grad_max_sv": 0.04079276975244284, + "grad_min_sv": 0.0, + "grad_condition": 40792769752.44284, + "lr": 0.0006644333233692913, + "time_sec": 177.3179268836975 + }, + { + "epoch": 60, + "train_loss": 5.364020364685058, + "train_acc": 0.00904, + "test_loss": 4.7199004196167, + "test_acc": 0.01, + "lyapunov": 1.5886733891713956, + "grad_norm": 0.22342122942097759, + "grad_max_sv": 0.027459373604506253, + "grad_min_sv": 0.0, + "grad_condition": 27459373604.506256, + "lr": 0.0006545084971874734, + "time_sec": 177.30202984809875 + }, + { + "epoch": 61, + "train_loss": 5.363523327484131, + "train_acc": 0.00934, + "test_loss": 4.7266477081298826, + "test_acc": 0.01, + "lyapunov": 1.5883313112551598, + "grad_norm": 0.20389335925530302, + "grad_max_sv": 0.045495460741221905, + "grad_min_sv": 1.4012984643248171e-46, + "grad_condition": 45495460741.2219, + "lr": 0.0006445158984722354, + "time_sec": 177.32515287399292 + }, + { + "epoch": 62, + "train_loss": 5.367948243408203, + "train_acc": 0.0091, + "test_loss": 4.75396729888916, + "test_acc": 0.01, + "lyapunov": 1.5914591578266504, + "grad_norm": 0.255614489528913, + "grad_max_sv": 0.03248326424509287, + "grad_min_sv": 1.3219893653396629e-33, + "grad_condition": 32483264245.092873, + "lr": 0.0006344599103076324, + "time_sec": 177.34726858139038 + }, + { + "epoch": 63, + "train_loss": 5.360079801940918, + "train_acc": 0.0094, + "test_loss": 5.19269112701416, + "test_acc": 0.01, + "lyapunov": 1.5859909679578699, + "grad_norm": 0.247568680367887, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824269, + "time_sec": 177.2823510169983 + }, + { + "epoch": 64, + "train_loss": 5.359493107910156, + "train_acc": 0.00876, + "test_loss": 5.2250466796875, + "test_acc": 0.01, + "lyapunov": 1.585366655188753, + "grad_norm": 0.2769224967661722, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006141754350553275, + "time_sec": 177.23246479034424 + }, + { + "epoch": 65, + "train_loss": 5.361286865844726, + "train_acc": 0.00938, + "test_loss": 5.298229453277588, + "test_acc": 0.01, + "lyapunov": 1.5870976630988938, + "grad_norm": 0.24716357558635968, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006039558454088793, + "time_sec": 177.274742603302 + }, + { + "epoch": 66, + "train_loss": 5.360220510559082, + "train_acc": 0.00942, + "test_loss": 5.1931522216796875, + "test_acc": 0.01, + "lyapunov": 1.5856442792946115, + "grad_norm": 0.21643181506904438, + "grad_max_sv": 0.028073416696861385, + "grad_min_sv": 0.0, + "grad_condition": 28073416696.86139, + "lr": 0.000593690657292862, + "time_sec": 177.3214614391327 + }, + { + "epoch": 67, + "train_loss": 5.3634411520385745, + "train_acc": 0.01004, + "test_loss": 4.726324760437012, + "test_acc": 0.01, + "lyapunov": 1.5876712076499333, + "grad_norm": 0.19917891606110388, + "grad_max_sv": 0.06480920519679785, + "grad_min_sv": 5.826939700269216e-27, + "grad_condition": 64809205196.797485, + "lr": 0.0005833843733580507, + "time_sec": 177.30631113052368 + }, + { + "epoch": 68, + "train_loss": 5.3627893775939945, + "train_acc": 0.0096, + "test_loss": 4.78324942779541, + "test_acc": 0.01, + "lyapunov": 1.5872700497927263, + "grad_norm": 0.17814025282763096, + "grad_max_sv": 0.05710890954360366, + "grad_min_sv": 1.642725198984103e-39, + "grad_condition": 57108909543.60366, + "lr": 0.0005730415142812054, + "time_sec": 177.28468227386475 + }, + { + "epoch": 69, + "train_loss": 5.36284663772583, + "train_acc": 0.01016, + "test_loss": 4.65924833908081, + "test_acc": 0.01, + "lyapunov": 1.5882405993883566, + "grad_norm": 0.18974647851723686, + "grad_max_sv": 0.03764563817530871, + "grad_min_sv": 0.0, + "grad_condition": 37645638175.3087, + "lr": 0.0005626666167821517, + "time_sec": 177.30268549919128 + }, + { + "epoch": 70, + "train_loss": 5.365585427398682, + "train_acc": 0.00962, + "test_loss": 4.667314112854004, + "test_acc": 0.01, + "lyapunov": 1.58941994451196, + "grad_norm": 0.17127250466631513, + "grad_max_sv": 0.043766821082681415, + "grad_min_sv": 0.0, + "grad_condition": 43766821082.68142, + "lr": 0.0005522642316338265, + "time_sec": 177.31375312805176 + }, + { + "epoch": 71, + "train_loss": 5.360834673461914, + "train_acc": 0.0103, + "test_loss": 4.691217092895508, + "test_acc": 0.01, + "lyapunov": 1.5854695108540529, + "grad_norm": 0.15750040762462056, + "grad_max_sv": 0.05662639001384377, + "grad_min_sv": 0.0, + "grad_condition": 56626390013.84377, + "lr": 0.0005418389216661573, + "time_sec": 177.3107042312622 + }, + { + "epoch": 72, + "train_loss": 5.360965846557617, + "train_acc": 0.01014, + "test_loss": 4.686003870391846, + "test_acc": 0.01, + "lyapunov": 1.586221619945048, + "grad_norm": 0.1761841219237378, + "grad_max_sv": 0.051002619601786134, + "grad_min_sv": 0.0, + "grad_condition": 51002619601.78613, + "lr": 0.0005313952597646563, + "time_sec": 177.28891253471375 + }, + { + "epoch": 73, + "train_loss": 5.365758000946045, + "train_acc": 0.00988, + "test_loss": 4.678875315856933, + "test_acc": 0.01, + "lyapunov": 1.5900602660825491, + "grad_norm": 0.21832467373191636, + "grad_max_sv": 0.06282770875841379, + "grad_min_sv": 0.0, + "grad_condition": 62827708758.413795, + "lr": 0.0005209378268645994, + "time_sec": 177.3162078857422 + }, + { + "epoch": 74, + "train_loss": 5.365496074371338, + "train_acc": 0.0093, + "test_loss": 4.655053031921387, + "test_acc": 0.01, + "lyapunov": 1.589696585979608, + "grad_norm": 0.23086253967925782, + "grad_max_sv": 0.060001683793962, + "grad_min_sv": 0.0, + "grad_condition": 60001683793.962, + "lr": 0.0005104712099416781, + "time_sec": 177.30215072631836 + }, + { + "epoch": 75, + "train_loss": 5.364179220275879, + "train_acc": 0.0099, + "test_loss": 4.638170684051514, + "test_acc": 0.01, + "lyapunov": 1.5883820352651883, + "grad_norm": 0.3049112090346521, + "grad_max_sv": 0.05380613347515464, + "grad_min_sv": 0.0, + "grad_condition": 53806133475.15464, + "lr": 0.0004999999999999996, + "time_sec": 177.36862349510193 + }, + { + "epoch": 76, + "train_loss": 5.359675194854736, + "train_acc": 0.01046, + "test_loss": 4.649093914794922, + "test_acc": 0.01, + "lyapunov": 1.5854026216375248, + "grad_norm": 0.2119481091202284, + "grad_max_sv": 0.03726704930886626, + "grad_min_sv": 0.0, + "grad_condition": 37267049308.86626, + "lr": 0.0004895287900583212, + "time_sec": 177.32284903526306 + }, + { + "epoch": 77, + "train_loss": 5.360474863128662, + "train_acc": 0.00958, + "test_loss": 4.605349244689942, + "test_acc": 0.01, + "lyapunov": 1.5860518323795876, + "grad_norm": 0.20492250658984978, + "grad_max_sv": 0.010520621668547392, + "grad_min_sv": 0.0, + "grad_condition": 10520621668.54739, + "lr": 0.0004790621731353997, + "time_sec": 177.27856492996216 + }, + { + "epoch": 78, + "train_loss": 5.3626285870361325, + "train_acc": 0.0096, + "test_loss": 4.636105052185059, + "test_acc": 0.01, + "lyapunov": 1.5883512807928997, + "grad_norm": 0.16200768770528595, + "grad_max_sv": 0.01769152507185936, + "grad_min_sv": 0.0, + "grad_condition": 17691525071.85936, + "lr": 0.000468604740235343, + "time_sec": 177.26149678230286 + }, + { + "epoch": 79, + "train_loss": 5.361725220947266, + "train_acc": 0.00962, + "test_loss": 4.642175579071045, + "test_acc": 0.01, + "lyapunov": 1.5874589931629504, + "grad_norm": 0.1671711869857159, + "grad_max_sv": 0.027231273613870143, + "grad_min_sv": 0.0, + "grad_condition": 27231273613.870144, + "lr": 0.00045816107833384175, + "time_sec": 177.28059816360474 + }, + { + "epoch": 80, + "train_loss": 5.359847649841309, + "train_acc": 0.00934, + "test_loss": 4.646283575439453, + "test_acc": 0.01, + "lyapunov": 1.5854374237377624, + "grad_norm": 0.15090527056955186, + "grad_max_sv": 0.02150285104289651, + "grad_min_sv": 0.0, + "grad_condition": 21502851042.896507, + "lr": 0.0004477357683661729, + "time_sec": 177.27379083633423 + }, + { + "epoch": 81, + "train_loss": 5.3600718869018555, + "train_acc": 0.01048, + "test_loss": 4.752709213256836, + "test_acc": 0.01, + "lyapunov": 1.585394742238857, + "grad_norm": 0.17187344605967436, + "grad_max_sv": 0.043320519663393495, + "grad_min_sv": 0.0, + "grad_condition": 43320519663.39349, + "lr": 0.00043733338321784746, + "time_sec": 177.62933731079102 + }, + { + "epoch": 82, + "train_loss": 5.362194033813476, + "train_acc": 0.00908, + "test_loss": 4.769781411743164, + "test_acc": 0.01, + "lyapunov": 1.5872593858967656, + "grad_norm": 0.17685474969644083, + "grad_max_sv": 0.043185068760067225, + "grad_min_sv": 0.0, + "grad_condition": 43185068760.06722, + "lr": 0.0004269584857187939, + "time_sec": 177.36878728866577 + }, + { + "epoch": 83, + "train_loss": 5.360512623901367, + "train_acc": 0.00896, + "test_loss": 4.634495629882813, + "test_acc": 0.01, + "lyapunov": 1.585809985999866, + "grad_norm": 0.17569851085947658, + "grad_max_sv": 0.048822146560996774, + "grad_min_sv": 0.0, + "grad_condition": 48822146560.99677, + "lr": 0.0004166156266419484, + "time_sec": 177.35730743408203 + }, + { + "epoch": 84, + "train_loss": 5.360660369110107, + "train_acc": 0.01062, + "test_loss": 4.635055514526367, + "test_acc": 0.01, + "lyapunov": 1.5863755276745848, + "grad_norm": 0.1734959766637803, + "grad_max_sv": 0.03708101906813681, + "grad_min_sv": 0.0, + "grad_condition": 37081019068.13681, + "lr": 0.0004063093427071373, + "time_sec": 177.31386804580688 + }, + { + "epoch": 85, + "train_loss": 5.359581319885254, + "train_acc": 0.00962, + "test_loss": 4.680524919128418, + "test_acc": 0.01, + "lyapunov": 1.585432373349319, + "grad_norm": 0.19633262712151112, + "grad_max_sv": 0.016985992342233656, + "grad_min_sv": 0.0, + "grad_condition": 16985992342.233658, + "lr": 0.0003960441545911199, + "time_sec": 177.29162740707397 + }, + { + "epoch": 86, + "train_loss": 5.364330820922851, + "train_acc": 0.00994, + "test_loss": 4.640988105010987, + "test_acc": 0.01, + "lyapunov": 1.5893402819133475, + "grad_norm": 0.17010660799200755, + "grad_max_sv": 0.005552049493417144, + "grad_min_sv": 0.0, + "grad_condition": 5552049493.417144, + "lr": 0.0003858245649446718, + "time_sec": 177.2697069644928 + }, + { + "epoch": 87, + "train_loss": 5.36001446975708, + "train_acc": 0.0091, + "test_loss": 4.6622309997558595, + "test_acc": 0.01, + "lyapunov": 1.5858566068932223, + "grad_norm": 0.18253684720194474, + "grad_max_sv": 0.009605350159108638, + "grad_min_sv": 0.0, + "grad_condition": 9605350159.108639, + "lr": 0.00037565505641757235, + "time_sec": 177.2729914188385 + }, + { + "epoch": 88, + "train_loss": 5.363334915313721, + "train_acc": 0.00928, + "test_loss": 4.651910215759277, + "test_acc": 0.01, + "lyapunov": 1.5891908779168678, + "grad_norm": 0.25285970261724394, + "grad_max_sv": 0.014622378209605814, + "grad_min_sv": 0.0, + "grad_condition": 14622378209.605814, + "lr": 0.00036554008969236695, + "time_sec": 177.25673460960388 + }, + { + "epoch": 89, + "train_loss": 5.366140861053466, + "train_acc": 0.0098, + "test_loss": 4.632004132843018, + "test_acc": 0.01, + "lyapunov": 1.5918613025904311, + "grad_norm": 0.3793803057886311, + "grad_max_sv": 0.0227991352789104, + "grad_min_sv": 0.0, + "grad_condition": 22799135278.9104, + "lr": 0.0003554841015277638, + "time_sec": 177.28270602226257 + }, + { + "epoch": 90, + "train_loss": 5.358956403503418, + "train_acc": 0.00908, + "test_loss": 4.634336037445069, + "test_acc": 0.01, + "lyapunov": 1.5845078528689607, + "grad_norm": 0.16129836844937653, + "grad_max_sv": 0.030955695733428, + "grad_min_sv": 0.0, + "grad_condition": 30955695733.428, + "lr": 0.000345491502812526, + "time_sec": 177.34664869308472 + }, + { + "epoch": 91, + "train_loss": 5.370377727966309, + "train_acc": 0.01008, + "test_loss": 4.641486628723144, + "test_acc": 0.01, + "lyapunov": 1.5915974838959286, + "grad_norm": 0.23056801493799003, + "grad_max_sv": 0.021973734814673664, + "grad_min_sv": 0.0, + "grad_condition": 21973734814.673664, + "lr": 0.0003355666766307081, + "time_sec": 177.30071926116943 + }, + { + "epoch": 92, + "train_loss": 5.35953079574585, + "train_acc": 0.0104, + "test_loss": 4.654357167816162, + "test_acc": 0.01, + "lyapunov": 1.5854123461886744, + "grad_norm": 0.2133357061554603, + "grad_max_sv": 0.01584432367235422, + "grad_min_sv": 0.0, + "grad_condition": 15844323672.354221, + "lr": 0.00032571397633909225, + "time_sec": 177.30744338035583 + }, + { + "epoch": 93, + "train_loss": 5.359757648162842, + "train_acc": 0.01004, + "test_loss": 4.635669487762451, + "test_acc": 0.01, + "lyapunov": 1.5857275602457774, + "grad_norm": 0.21123088900545153, + "grad_max_sv": 0.022326651168987154, + "grad_min_sv": 0.0, + "grad_condition": 22326651168.98716, + "lr": 0.00031593772365766094, + "time_sec": 177.30698537826538 + }, + { + "epoch": 94, + "train_loss": 5.358649451293945, + "train_acc": 0.00924, + "test_loss": 4.650500559997559, + "test_acc": 0.01, + "lyapunov": 1.584580004367682, + "grad_norm": 0.22156955822269123, + "grad_max_sv": 0.0036812785547226667, + "grad_min_sv": 0.0, + "grad_condition": 3681278554.7226667, + "lr": 0.0003062422067739483, + "time_sec": 177.29391837120056 + }, + { + "epoch": 95, + "train_loss": 5.368402194519043, + "train_acc": 0.0096, + "test_loss": 4.631659384155274, + "test_acc": 0.01, + "lyapunov": 1.5918427952720076, + "grad_norm": 0.19012319147558024, + "grad_max_sv": 0.01328945653513074, + "grad_min_sv": 0.0, + "grad_condition": 13289456535.130741, + "lr": 0.00029663167846209965, + "time_sec": 177.28295135498047 + }, + { + "epoch": 96, + "train_loss": 5.360648808441162, + "train_acc": 0.00988, + "test_loss": 4.642071528625488, + "test_acc": 0.01, + "lyapunov": 1.586560007251437, + "grad_norm": 0.16157307254883244, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00028711035421746345, + "time_sec": 177.2989547252655 + }, + { + "epoch": 97, + "train_loss": 5.358733374786377, + "train_acc": 0.00914, + "test_loss": 4.639485282897949, + "test_acc": 0.01, + "lyapunov": 1.5846895253871713, + "grad_norm": 0.14480973228900776, + "grad_max_sv": 0.00837345547042787, + "grad_min_sv": 0.0, + "grad_condition": 8373455470.427872, + "lr": 0.00027768241040753615, + "time_sec": 177.27525234222412 + }, + { + "epoch": 98, + "train_loss": 5.360293337707519, + "train_acc": 0.0099, + "test_loss": 4.644459535980225, + "test_acc": 0.01, + "lyapunov": 1.5861705498927086, + "grad_norm": 0.18867802153244584, + "grad_max_sv": 0.026158737391233443, + "grad_min_sv": 0.0, + "grad_condition": 26158737391.23344, + "lr": 0.00026835198244006903, + "time_sec": 177.2919957637787 + }, + { + "epoch": 99, + "train_loss": 5.360852672576904, + "train_acc": 0.00976, + "test_loss": 4.641770568847656, + "test_acc": 0.01, + "lyapunov": 1.5866629604793265, + "grad_norm": 0.2490166385107765, + "grad_max_sv": 0.025310791656374933, + "grad_min_sv": 0.0, + "grad_condition": 25310791656.37493, + "lr": 0.0002591231629491421, + "time_sec": 177.28516483306885 + }, + { + "epoch": 100, + "train_loss": 5.359503317260742, + "train_acc": 0.0096, + "test_loss": 4.633657774353027, + "test_acc": 0.01, + "lyapunov": 1.5852865261190079, + "grad_norm": 0.31764569596084014, + "grad_max_sv": 0.03201284250244498, + "grad_min_sv": 0.0, + "grad_condition": 32012842502.444984, + "lr": 0.0002499999999999997, + "time_sec": 177.3286590576172 + }, + { + "epoch": 101, + "train_loss": 5.3610862644958495, + "train_acc": 0.01004, + "test_loss": 4.627243125915528, + "test_acc": 0.01, + "lyapunov": 1.586990461934863, + "grad_norm": 0.3077979208978545, + "grad_max_sv": 0.022488519130274654, + "grad_min_sv": 0.0, + "grad_condition": 22488519130.274654, + "lr": 0.00024098649531343477, + "time_sec": 177.27038407325745 + }, + { + "epoch": 102, + "train_loss": 5.359221751708985, + "train_acc": 0.0099, + "test_loss": 4.6350917106628415, + "test_acc": 0.01, + "lyapunov": 1.5852433824173324, + "grad_norm": 0.17125449319078032, + "grad_max_sv": 0.0006372035015374423, + "grad_min_sv": 0.0, + "grad_condition": 637203501.5374422, + "lr": 0.0002320866025105016, + "time_sec": 177.26434516906738 + }, + { + "epoch": 103, + "train_loss": 5.359845841064453, + "train_acc": 0.00998, + "test_loss": 4.644444650268555, + "test_acc": 0.01, + "lyapunov": 1.5859144453502372, + "grad_norm": 0.15906823668777442, + "grad_max_sv": 0.0012175182346254587, + "grad_min_sv": 0.0, + "grad_condition": 1217518234.6254587, + "lr": 0.0002233042253783278, + "time_sec": 177.29427409172058 + }, + { + "epoch": 104, + "train_loss": 5.359393982086182, + "train_acc": 0.00964, + "test_loss": 4.629140382385254, + "test_acc": 0.01, + "lyapunov": 1.5853588230469648, + "grad_norm": 0.18868988717884208, + "grad_max_sv": 0.007832410791888834, + "grad_min_sv": 0.0, + "grad_condition": 7832410791.888834, + "lr": 0.000214643216157784, + "time_sec": 177.3122420310974 + }, + { + "epoch": 105, + "train_loss": 5.376110725402832, + "train_acc": 0.00958, + "test_loss": 4.641193688201905, + "test_acc": 0.01, + "lyapunov": 1.594091626079491, + "grad_norm": 0.21866401239429448, + "grad_max_sv": 0.01763616520911455, + "grad_min_sv": 0.0, + "grad_condition": 17636165209.11455, + "lr": 0.00020610737385376332, + "time_sec": 177.33545303344727 + }, + { + "epoch": 106, + "train_loss": 5.360543824005127, + "train_acc": 0.00952, + "test_loss": 4.63230926361084, + "test_acc": 0.01, + "lyapunov": 1.586505341407893, + "grad_norm": 0.19148423296709022, + "grad_max_sv": 0.007322627399116754, + "grad_min_sv": 0.0, + "grad_condition": 7322627399.116755, + "lr": 0.00019770044256881242, + "time_sec": 177.29128861427307 + }, + { + "epoch": 107, + "train_loss": 5.359816354370118, + "train_acc": 0.00964, + "test_loss": 4.628876644897461, + "test_acc": 0.01, + "lyapunov": 1.5858964429182165, + "grad_norm": 0.16953893016049196, + "grad_max_sv": 0.005570205627009273, + "grad_min_sv": 0.0, + "grad_condition": 5570205627.009273, + "lr": 0.0001894261098608447, + "time_sec": 177.26312851905823 + }, + { + "epoch": 108, + "train_loss": 5.360526904602051, + "train_acc": 0.009, + "test_loss": 4.630769221496582, + "test_acc": 0.01, + "lyapunov": 1.5865018233618773, + "grad_norm": 0.18006495124030458, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000181288005125655, + "time_sec": 177.246666431427 + }, + { + "epoch": 109, + "train_loss": 5.361382939453125, + "train_acc": 0.0098, + "test_loss": 4.626291159820557, + "test_acc": 0.01, + "lyapunov": 1.586926028856536, + "grad_norm": 0.2328474503629796, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001732896980049473, + "time_sec": 177.25811576843262 + }, + { + "epoch": 110, + "train_loss": 5.358514823455811, + "train_acc": 0.00986, + "test_loss": 4.6495152236938475, + "test_acc": 0.01, + "lyapunov": 1.5844445182844196, + "grad_norm": 0.31612028134160525, + "grad_max_sv": 0.010267550591379404, + "grad_min_sv": 0.0, + "grad_condition": 10267550591.379404, + "lr": 0.00016543469682057076, + "time_sec": 177.28474497795105 + }, + { + "epoch": 111, + "train_loss": 5.366782173309327, + "train_acc": 0.00906, + "test_loss": 4.620611762237549, + "test_acc": 0.01, + "lyapunov": 1.5906709133816497, + "grad_norm": 0.40151776348821855, + "grad_max_sv": 0.010553297400474549, + "grad_min_sv": 0.0, + "grad_condition": 10553297400.474548, + "lr": 0.00015772644703565552, + "time_sec": 177.3135175704956 + }, + { + "epoch": 112, + "train_loss": 5.359567135009765, + "train_acc": 0.00886, + "test_loss": 4.628111135101318, + "test_acc": 0.01, + "lyapunov": 1.5856597996733683, + "grad_norm": 0.3009012541884835, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 177.25540447235107 + }, + { + "epoch": 113, + "train_loss": 5.358919576873779, + "train_acc": 0.00968, + "test_loss": 4.627276501464844, + "test_acc": 0.01, + "lyapunov": 1.5849643582883088, + "grad_norm": 0.3242366139837751, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 177.27025246620178 + }, + { + "epoch": 114, + "train_loss": 5.3586665776062015, + "train_acc": 0.00944, + "test_loss": 4.620662684631347, + "test_acc": 0.01, + "lyapunov": 1.5846976368018733, + "grad_norm": 0.2903374978600601, + "grad_max_sv": 0.004233767790719867, + "grad_min_sv": 0.0, + "grad_condition": 4233767790.7198668, + "lr": 0.00013551568628929425, + "time_sec": 177.26198053359985 + }, + { + "epoch": 115, + "train_loss": 5.3605953396606445, + "train_acc": 0.00902, + "test_loss": 4.621528549194336, + "test_acc": 0.01, + "lyapunov": 1.586485847792662, + "grad_norm": 0.331820693233947, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 177.23981928825378 + }, + { + "epoch": 116, + "train_loss": 5.359012928771973, + "train_acc": 0.00958, + "test_loss": 4.619492964172363, + "test_acc": 0.01, + "lyapunov": 1.585117801376011, + "grad_norm": 0.2797157160809922, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 177.225914478302 + }, + { + "epoch": 117, + "train_loss": 5.359644413146973, + "train_acc": 0.00924, + "test_loss": 4.621938159942627, + "test_acc": 0.01, + "lyapunov": 1.5857579552608987, + "grad_norm": 0.2795622109437437, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 177.22438168525696 + }, + { + "epoch": 118, + "train_loss": 5.359761270446778, + "train_acc": 0.00924, + "test_loss": 4.6217840301513675, + "test_acc": 0.01, + "lyapunov": 1.5858274750087573, + "grad_norm": 0.24852001797471837, + "grad_max_sv": 0.0012709970586001873, + "grad_min_sv": 0.0, + "grad_condition": 1270997058.6001873, + "lr": 0.00010815327133708009, + "time_sec": 177.2276487350464 + }, + { + "epoch": 119, + "train_loss": 5.357662630462647, + "train_acc": 0.0091, + "test_loss": 4.622296886444092, + "test_acc": 0.01, + "lyapunov": 1.5836935113458073, + "grad_norm": 0.24372977816065178, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010173504098790182, + "time_sec": 177.25115942955017 + }, + { + "epoch": 120, + "train_loss": 5.361358259277344, + "train_acc": 0.00944, + "test_loss": 4.622046688079834, + "test_acc": 0.01, + "lyapunov": 1.587042825301285, + "grad_norm": 0.22330891574384296, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 177.27366518974304 + }, + { + "epoch": 121, + "train_loss": 5.35905032409668, + "train_acc": 0.00908, + "test_loss": 4.622121089935303, + "test_acc": 0.01, + "lyapunov": 1.5851479878510966, + "grad_norm": 0.20960225247372524, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 177.23317313194275 + }, + { + "epoch": 122, + "train_loss": 5.361670205078125, + "train_acc": 0.0093, + "test_loss": 4.622285698699951, + "test_acc": 0.01, + "lyapunov": 1.5875935237425978, + "grad_norm": 0.21843560272800885, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 177.2194859981537 + }, + { + "epoch": 123, + "train_loss": 5.360625909729004, + "train_acc": 0.01, + "test_loss": 4.6224393463134765, + "test_acc": 0.01, + "lyapunov": 1.5867376934232005, + "grad_norm": 0.2137074208505857, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 177.2682557106018 + }, + { + "epoch": 124, + "train_loss": 5.358632594451905, + "train_acc": 0.0093, + "test_loss": 4.680952319335938, + "test_acc": 0.01, + "lyapunov": 1.5847194472237316, + "grad_norm": 0.1870926810471898, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 177.23400807380676 + }, + { + "epoch": 125, + "train_loss": 5.360412776184082, + "train_acc": 0.0089, + "test_loss": 4.73941685333252, + "test_acc": 0.01, + "lyapunov": 1.5865021639162926, + "grad_norm": 0.21273250180362335, + "grad_max_sv": 0.0014166037552058696, + "grad_min_sv": 0.0, + "grad_condition": 1416603755.2058697, + "lr": 6.698729810778072e-05, + "time_sec": 177.24382710456848 + }, + { + "epoch": 126, + "train_loss": 5.358947314758301, + "train_acc": 0.0097, + "test_loss": 4.672125242614746, + "test_acc": 0.01, + "lyapunov": 1.584972734646419, + "grad_norm": 0.23341550723215748, + "grad_max_sv": 0.001309919636696577, + "grad_min_sv": 0.0, + "grad_condition": 1309919636.696577, + "lr": 6.184665997806817e-05, + "time_sec": 177.26921725273132 + }, + { + "epoch": 127, + "train_loss": 5.359260606536865, + "train_acc": 0.00982, + "test_loss": 4.664470828247071, + "test_acc": 0.01, + "lyapunov": 1.585314722012376, + "grad_norm": 0.265210981123156, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 177.23559665679932 + }, + { + "epoch": 128, + "train_loss": 5.361228064270019, + "train_acc": 0.0096, + "test_loss": 4.79210078125, + "test_acc": 0.01, + "lyapunov": 1.5868884224416044, + "grad_norm": 0.284706461729636, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 177.23232126235962 + }, + { + "epoch": 129, + "train_loss": 5.358762674407959, + "train_acc": 0.00948, + "test_loss": 4.767799957275391, + "test_acc": 0.01, + "lyapunov": 1.5848681917580802, + "grad_norm": 0.27692568211643537, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 177.2341754436493 + }, + { + "epoch": 130, + "train_loss": 5.360010164489746, + "train_acc": 0.00926, + "test_loss": 4.671016343688965, + "test_acc": 0.01, + "lyapunov": 1.5858237874477417, + "grad_norm": 0.2706962686573412, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 177.24218034744263 + }, + { + "epoch": 131, + "train_loss": 5.3587316012573245, + "train_acc": 0.00928, + "test_loss": 4.748648097229004, + "test_acc": 0.01, + "lyapunov": 1.5848381055895324, + "grad_norm": 0.23937263927645328, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 177.2330150604248 + }, + { + "epoch": 132, + "train_loss": 5.35890893157959, + "train_acc": 0.00964, + "test_loss": 4.8125279388427735, + "test_acc": 0.01, + "lyapunov": 1.5850241647656922, + "grad_norm": 0.2489556767273508, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 177.22991752624512 + }, + { + "epoch": 133, + "train_loss": 5.361185835876465, + "train_acc": 0.00952, + "test_loss": 4.643449569702148, + "test_acc": 0.01, + "lyapunov": 1.5871033570955477, + "grad_norm": 0.31193315187891146, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 177.2139208316803 + }, + { + "epoch": 134, + "train_loss": 5.358732033691406, + "train_acc": 0.00876, + "test_loss": 4.706984965515137, + "test_acc": 0.01, + "lyapunov": 1.5848448145420044, + "grad_norm": 0.25839982964286506, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 177.22592782974243 + }, + { + "epoch": 135, + "train_loss": 5.359151672363281, + "train_acc": 0.00906, + "test_loss": 4.7044763816833495, + "test_acc": 0.01, + "lyapunov": 1.5852836605228122, + "grad_norm": 0.2598696228178214, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 177.2558205127716 + }, + { + "epoch": 136, + "train_loss": 5.359703632965088, + "train_acc": 0.01, + "test_loss": 4.721178560638427, + "test_acc": 0.01, + "lyapunov": 1.5858281173974351, + "grad_norm": 0.26109222250019687, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 177.24931955337524 + }, + { + "epoch": 137, + "train_loss": 5.359647062225342, + "train_acc": 0.00956, + "test_loss": 4.705288150024414, + "test_acc": 0.01, + "lyapunov": 1.585799050453069, + "grad_norm": 0.2430419176031886, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 177.20098423957825 + }, + { + "epoch": 138, + "train_loss": 5.370798114471436, + "train_acc": 0.01, + "test_loss": 4.711322469329834, + "test_acc": 0.01, + "lyapunov": 1.592538814105646, + "grad_norm": 0.23717985848250528, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 177.27925276756287 + }, + { + "epoch": 139, + "train_loss": 5.358164114685058, + "train_acc": 0.0097, + "test_loss": 4.713753561401367, + "test_acc": 0.01, + "lyapunov": 1.5842537294568309, + "grad_norm": 0.21577381809039398, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 177.2640838623047 + }, + { + "epoch": 140, + "train_loss": 5.359127445678711, + "train_acc": 0.00982, + "test_loss": 4.702644599914551, + "test_acc": 0.01, + "lyapunov": 1.5852683206348468, + "grad_norm": 0.22693874606806255, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 177.26845002174377 + }, + { + "epoch": 141, + "train_loss": 5.358451212463379, + "train_acc": 0.01, + "test_loss": 4.709589306640625, + "test_acc": 0.01, + "lyapunov": 1.5845830724062517, + "grad_norm": 0.21686215956311627, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 177.26886224746704 + }, + { + "epoch": 142, + "train_loss": 5.359413949279785, + "train_acc": 0.01, + "test_loss": 4.713582644653321, + "test_acc": 0.01, + "lyapunov": 1.5855683030374825, + "grad_norm": 0.2386062253915984, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 177.24717164039612 + }, + { + "epoch": 143, + "train_loss": 5.380280564575195, + "train_acc": 0.01, + "test_loss": 4.7039310775756835, + "test_acc": 0.01, + "lyapunov": 1.59827317331758, + "grad_norm": 0.281062533044562, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 177.23896765708923 + }, + { + "epoch": 144, + "train_loss": 5.359466158905029, + "train_acc": 0.01, + "test_loss": 4.690676583862305, + "test_acc": 0.01, + "lyapunov": 1.5856200407837968, + "grad_norm": 0.18794718433603225, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 177.22590732574463 + }, + { + "epoch": 145, + "train_loss": 5.358838105926513, + "train_acc": 0.01, + "test_loss": 4.686097943115234, + "test_acc": 0.01, + "lyapunov": 1.5849668324146124, + "grad_norm": 0.18762604455384463, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 177.2236692905426 + }, + { + "epoch": 146, + "train_loss": 5.358961830444336, + "train_acc": 0.01, + "test_loss": 4.6859198120117185, + "test_acc": 0.01, + "lyapunov": 1.5850938287232539, + "grad_norm": 0.20367093372209882, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 177.23711729049683 + }, + { + "epoch": 147, + "train_loss": 5.359495299530029, + "train_acc": 0.01, + "test_loss": 4.686381504821777, + "test_acc": 0.01, + "lyapunov": 1.585582929194126, + "grad_norm": 0.1846519425292254, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 177.23132824897766 + }, + { + "epoch": 148, + "train_loss": 5.358631723632812, + "train_acc": 0.01, + "test_loss": 4.686381640625, + "test_acc": 0.01, + "lyapunov": 1.5847509065857324, + "grad_norm": 0.21479574972052035, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 177.25513577461243 + }, + { + "epoch": 149, + "train_loss": 5.359418527679443, + "train_acc": 0.01, + "test_loss": 4.6863815933227535, + "test_acc": 0.01, + "lyapunov": 1.585573171105836, + "grad_norm": 0.18053721718052793, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 177.26594400405884 + }, + { + "epoch": 150, + "train_loss": 5.358559367828369, + "train_acc": 0.01, + "test_loss": 4.686381562042237, + "test_acc": 0.01, + "lyapunov": 1.584673622075249, + "grad_norm": 0.17806465386525372, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 177.21632599830627 + } + ] + } +}
\ No newline at end of file |
