From cd99d6b874d9d09b3bb87b8485cc787885af71f1 Mon Sep 17 00:00:00 2001 From: YurenHao0426 Date: Tue, 13 Jan 2026 23:49:05 -0600 Subject: init commit --- .../cifar100_20260102-133339/results.json | 16822 +++++++++++++++++++ 1 file changed, 16822 insertions(+) create mode 100644 runs/depth_scaling_target1/cifar100_20260102-133339/results.json (limited to 'runs/depth_scaling_target1/cifar100_20260102-133339/results.json') diff --git a/runs/depth_scaling_target1/cifar100_20260102-133339/results.json b/runs/depth_scaling_target1/cifar100_20260102-133339/results.json new file mode 100644 index 0000000..b51175e --- /dev/null +++ b/runs/depth_scaling_target1/cifar100_20260102-133339/results.json @@ -0,0 +1,16822 @@ +{ + "vanilla": { + "4": [ + { + "epoch": 1, + "train_loss": 4.357881842498779, + "train_acc": 0.09446, + "test_loss": 3.5281315925598142, + "test_acc": 0.1727, + "lyapunov": null, + "grad_norm": 6.340097491169349, + "grad_max_sv": 4.973841696977615, + "grad_min_sv": 1.1637189214486199e-07, + "grad_condition": 49820869.21311478, + "lr": 0.0009998903417374227, + "time_sec": 17.58898615837097 + }, + { + "epoch": 2, + "train_loss": 3.5162495974731445, + "train_acc": 0.18166, + "test_loss": 3.361986777496338, + "test_acc": 0.2212, + "lyapunov": null, + "grad_norm": 4.547965644035686, + "grad_max_sv": 3.3173387169837953, + "grad_min_sv": 8.365211060512578e-08, + "grad_condition": 74579242.00846244, + "lr": 0.0009995614150494292, + "time_sec": 15.70747685432434 + }, + { + "epoch": 3, + "train_loss": 3.049772911834717, + "train_acc": 0.25444, + "test_loss": 2.928312567138672, + "test_acc": 0.2881, + "lyapunov": null, + "grad_norm": 3.571965368749656, + "grad_max_sv": 2.4133509695529938, + "grad_min_sv": 6.657408836430179e-08, + "grad_condition": 49614137.32958214, + "lr": 0.0009990133642141358, + "time_sec": 15.519535303115845 + }, + { + "epoch": 4, + "train_loss": 2.724564817428589, + "train_acc": 0.31436, + "test_loss": 2.6733072105407714, + "test_acc": 0.331, + "lyapunov": null, + "grad_norm": 2.9818986561503382, + "grad_max_sv": 1.8422472059726716, + "grad_min_sv": 5.5166534979056436e-08, + "grad_condition": 46971156.93483184, + "lr": 0.0009982464296247522, + "time_sec": 15.458869457244873 + }, + { + "epoch": 5, + "train_loss": 2.501728704910278, + "train_acc": 0.35702, + "test_loss": 2.674536157989502, + "test_acc": 0.3431, + "lyapunov": null, + "grad_norm": 2.6380344213218527, + "grad_max_sv": 1.605541154742241, + "grad_min_sv": 5.005898049068036e-08, + "grad_condition": 177063609.4994608, + "lr": 0.0009972609476841367, + "time_sec": 15.46523928642273 + }, + { + "epoch": 6, + "train_loss": 2.322341884765625, + "train_acc": 0.39588, + "test_loss": 2.440810569000244, + "test_acc": 0.3786, + "lyapunov": null, + "grad_norm": 2.4046357640712968, + "grad_max_sv": 1.3473579943180085, + "grad_min_sv": 4.569443099143589e-08, + "grad_condition": 315579058.91849506, + "lr": 0.000996057350657239, + "time_sec": 15.45302700996399 + }, + { + "epoch": 7, + "train_loss": 2.1792964128112793, + "train_acc": 0.42468, + "test_loss": 3.6083086921691896, + "test_acc": 0.2555, + "lyapunov": null, + "grad_norm": 2.2401065243050575, + "grad_max_sv": 1.250352716445923, + "grad_min_sv": 4.339612316023311e-08, + "grad_condition": 110140464.91678305, + "lr": 0.000994636166481494, + "time_sec": 15.459157943725586 + }, + { + "epoch": 8, + "train_loss": 2.06442552192688, + "train_acc": 0.4489, + "test_loss": 2.2239890716552733, + "test_acc": 0.4291, + "lyapunov": null, + "grad_norm": 2.1012594692428856, + "grad_max_sv": 1.1558537915349008, + "grad_min_sv": 4.060080087131546e-08, + "grad_condition": 62897451.54566701, + "lr": 0.0009929980185352525, + "time_sec": 15.45511507987976 + }, + { + "epoch": 9, + "train_loss": 1.9475363119125366, + "train_acc": 0.47542, + "test_loss": 2.2026602458953857, + "test_acc": 0.4287, + "lyapunov": null, + "grad_norm": 1.9715615750533326, + "grad_max_sv": 1.032596978545189, + "grad_min_sv": 3.794599175710456e-08, + "grad_condition": 65058485.034411274, + "lr": 0.0009911436253643444, + "time_sec": 15.45013976097107 + }, + { + "epoch": 10, + "train_loss": 1.8557951174163818, + "train_acc": 0.49814, + "test_loss": 2.1774634853363035, + "test_acc": 0.4362, + "lyapunov": null, + "grad_norm": 1.8504614407647018, + "grad_max_sv": 0.9416742533445358, + "grad_min_sv": 3.512936608274231e-08, + "grad_condition": 46677459.72355051, + "lr": 0.0009890738003669028, + "time_sec": 15.440587997436523 + }, + { + "epoch": 11, + "train_loss": 1.763924418334961, + "train_acc": 0.5187, + "test_loss": 2.4288942903518675, + "test_acc": 0.4051, + "lyapunov": null, + "grad_norm": 1.7822208884902826, + "grad_max_sv": 0.9033506259322166, + "grad_min_sv": 3.467363161036019e-08, + "grad_condition": 30024832.372439463, + "lr": 0.00098678945143658, + "time_sec": 15.469273567199707 + }, + { + "epoch": 12, + "train_loss": 1.6992105947494507, + "train_acc": 0.53384, + "test_loss": 2.3932419761657715, + "test_acc": 0.4169, + "lyapunov": null, + "grad_norm": 1.6908902602895592, + "grad_max_sv": 0.8336813643574714, + "grad_min_sv": 3.225944931739555e-08, + "grad_condition": 38720407.501370475, + "lr": 0.0009842915805643154, + "time_sec": 15.462818622589111 + }, + { + "epoch": 13, + "train_loss": 1.6412196295166015, + "train_acc": 0.54614, + "test_loss": 2.303184538459778, + "test_acc": 0.4269, + "lyapunov": null, + "grad_norm": 1.6321649042964204, + "grad_max_sv": 0.7801442697644234, + "grad_min_sv": 3.083002481085728e-08, + "grad_condition": 35858025.435112044, + "lr": 0.000981581283398829, + "time_sec": 15.466039419174194 + }, + { + "epoch": 14, + "train_loss": 1.5800055722045898, + "train_acc": 0.56072, + "test_loss": 2.34448659324646, + "test_acc": 0.4166, + "lyapunov": null, + "grad_norm": 1.5709541615646672, + "grad_max_sv": 0.7645063757896423, + "grad_min_sv": 3.010382080819579e-08, + "grad_condition": 425485709.2107061, + "lr": 0.0009786597487660333, + "time_sec": 15.457959175109863 + }, + { + "epoch": 15, + "train_loss": 1.522832469100952, + "train_acc": 0.5756, + "test_loss": 2.018679809951782, + "test_acc": 0.4728, + "lyapunov": null, + "grad_norm": 1.516521779058338, + "grad_max_sv": 0.7272973746061325, + "grad_min_sv": 2.8604062869697076e-08, + "grad_condition": 94477206.12080687, + "lr": 0.0009755282581475766, + "time_sec": 15.45545220375061 + }, + { + "epoch": 16, + "train_loss": 1.4677007636260986, + "train_acc": 0.58764, + "test_loss": 1.9565035533905029, + "test_acc": 0.4933, + "lyapunov": null, + "grad_norm": 1.453059249026843, + "grad_max_sv": 0.67758848965168, + "grad_min_sv": 2.7189674285665878e-08, + "grad_condition": 55305058.773309946, + "lr": 0.0009721881851187403, + "time_sec": 15.498552322387695 + }, + { + "epoch": 17, + "train_loss": 1.4236618344116212, + "train_acc": 0.59808, + "test_loss": 1.8643951223373414, + "test_acc": 0.5109, + "lyapunov": null, + "grad_norm": 1.4131743339238467, + "grad_max_sv": 0.6649302154779434, + "grad_min_sv": 2.678126555383242e-08, + "grad_condition": 54799789.840084136, + "lr": 0.0009686409947459456, + "time_sec": 15.623136520385742 + }, + { + "epoch": 18, + "train_loss": 1.3931309001159669, + "train_acc": 0.60628, + "test_loss": 1.9086449605941773, + "test_acc": 0.5161, + "lyapunov": null, + "grad_norm": 1.3774038135699718, + "grad_max_sv": 0.6381687998771668, + "grad_min_sv": 2.581961362491114e-08, + "grad_condition": 53150613.95565927, + "lr": 0.0009648882429441254, + "time_sec": 16.356106758117676 + }, + { + "epoch": 19, + "train_loss": 1.332000114517212, + "train_acc": 0.61976, + "test_loss": 1.9447854751586915, + "test_acc": 0.4998, + "lyapunov": null, + "grad_norm": 1.3339422136321473, + "grad_max_sv": 0.6115798369050026, + "grad_min_sv": 2.4986909905738708e-08, + "grad_condition": 76361025.08562623, + "lr": 0.00096093157579425, + "time_sec": 15.486042737960815 + }, + { + "epoch": 20, + "train_loss": 1.2998398171234131, + "train_acc": 0.62884, + "test_loss": 1.9578068918228149, + "test_acc": 0.499, + "lyapunov": null, + "grad_norm": 1.3044281680786607, + "grad_max_sv": 0.5868817433714867, + "grad_min_sv": 2.460346111539738e-08, + "grad_condition": 1416469832.4203677, + "lr": 0.0009567727288213001, + "time_sec": 15.45453691482544 + }, + { + "epoch": 21, + "train_loss": 1.266195481147766, + "train_acc": 0.63696, + "test_loss": 2.05823407535553, + "test_acc": 0.4838, + "lyapunov": null, + "grad_norm": 1.2726472953754493, + "grad_max_sv": 0.5784675382077694, + "grad_min_sv": 2.384093428370315e-08, + "grad_condition": 156182020.27727562, + "lr": 0.0009524135262330095, + "time_sec": 15.506311893463135 + }, + { + "epoch": 22, + "train_loss": 1.2384513986587524, + "train_acc": 0.64552, + "test_loss": 1.9120031692504882, + "test_acc": 0.5172, + "lyapunov": null, + "grad_norm": 1.252497757690001, + "grad_max_sv": 0.5717031776905059, + "grad_min_sv": 2.3619134396912768e-08, + "grad_condition": 67519805.29707912, + "lr": 0.0009478558801197061, + "time_sec": 15.47418475151062 + }, + { + "epoch": 23, + "train_loss": 1.1993658528137208, + "train_acc": 0.65306, + "test_loss": 1.7887667993545533, + "test_acc": 0.5382, + "lyapunov": null, + "grad_norm": 1.2275759420533918, + "grad_max_sv": 0.5570299223065376, + "grad_min_sv": 2.2936629940836784e-08, + "grad_condition": 165671008.87666664, + "lr": 0.000943101789615607, + "time_sec": 15.476239204406738 + }, + { + "epoch": 24, + "train_loss": 1.1695793395996095, + "train_acc": 0.66222, + "test_loss": 1.9164223749160767, + "test_acc": 0.5069, + "lyapunov": null, + "grad_norm": 1.19558806415952, + "grad_max_sv": 0.5234090469777584, + "grad_min_sv": 2.2025900239808215e-08, + "grad_condition": 38525149.552328385, + "lr": 0.0009381533400219313, + "time_sec": 15.470394372940063 + }, + { + "epoch": 25, + "train_loss": 1.1371285773468018, + "train_acc": 0.66864, + "test_loss": 1.9049333578109742, + "test_acc": 0.5198, + "lyapunov": null, + "grad_norm": 1.1691991255738516, + "grad_max_sv": 0.5114153914153576, + "grad_min_sv": 2.1633911190255262e-08, + "grad_condition": 40420362.43580131, + "lr": 0.0009330127018922189, + "time_sec": 15.475921392440796 + }, + { + "epoch": 26, + "train_loss": 1.0984287197875977, + "train_acc": 0.67622, + "test_loss": 1.9236036626815796, + "test_acc": 0.5105, + "lyapunov": null, + "grad_norm": 1.1491919288876447, + "grad_max_sv": 0.5075508892536164, + "grad_min_sv": 2.156528700753002e-08, + "grad_condition": 52800149.44483626, + "lr": 0.000927682130080253, + "time_sec": 15.560164213180542 + }, + { + "epoch": 27, + "train_loss": 1.085814157333374, + "train_acc": 0.68168, + "test_loss": 1.854748671913147, + "test_acc": 0.5303, + "lyapunov": null, + "grad_norm": 1.132642015283084, + "grad_max_sv": 0.5079298578202724, + "grad_min_sv": 2.0747377492413844e-08, + "grad_condition": 40886114.03567152, + "lr": 0.0009221639627510072, + "time_sec": 15.515005350112915 + }, + { + "epoch": 28, + "train_loss": 1.0481378091812135, + "train_acc": 0.6919, + "test_loss": 1.787252332687378, + "test_acc": 0.5447, + "lyapunov": null, + "grad_norm": 1.1084077878736969, + "grad_max_sv": 0.48980700969696045, + "grad_min_sv": 2.03924750370732e-08, + "grad_condition": 144667188.87541157, + "lr": 0.0009164606203550494, + "time_sec": 15.477014064788818 + }, + { + "epoch": 29, + "train_loss": 1.0372727437210083, + "train_acc": 0.6921, + "test_loss": 1.8922377561569215, + "test_acc": 0.5273, + "lyapunov": null, + "grad_norm": 1.0954714543743995, + "grad_max_sv": 0.4976396970450878, + "grad_min_sv": 2.0566780979669463e-08, + "grad_condition": 42633949.37567282, + "lr": 0.0009105746045668516, + "time_sec": 15.492783546447754 + }, + { + "epoch": 30, + "train_loss": 0.9987185321426392, + "train_acc": 0.70062, + "test_loss": 1.8061668651580811, + "test_acc": 0.5499, + "lyapunov": null, + "grad_norm": 1.0825800954246438, + "grad_max_sv": 0.47690314128994943, + "grad_min_sv": 2.0063227677488694e-08, + "grad_condition": 114878509.5913475, + "lr": 0.0009045084971874733, + "time_sec": 15.465651512145996 + }, + { + "epoch": 31, + "train_loss": 0.9715755378532409, + "train_acc": 0.71128, + "test_loss": 2.5642683250427245, + "test_acc": 0.434, + "lyapunov": null, + "grad_norm": 1.0638185111036047, + "grad_max_sv": 0.46563360542058946, + "grad_min_sv": 1.9753409723904936e-08, + "grad_condition": 54475045.10178232, + "lr": 0.0008982649590120977, + "time_sec": 15.514770984649658 + }, + { + "epoch": 32, + "train_loss": 0.9588010568237305, + "train_acc": 0.71496, + "test_loss": 2.0556532321929932, + "test_acc": 0.5074, + "lyapunov": null, + "grad_norm": 1.0445708403852423, + "grad_max_sv": 0.4599720284342766, + "grad_min_sv": 1.917516104857353e-08, + "grad_condition": 71151837.22383483, + "lr": 0.0008918467286629196, + "time_sec": 15.503283977508545 + }, + { + "epoch": 33, + "train_loss": 0.93256760181427, + "train_acc": 0.72162, + "test_loss": 1.751899316596985, + "test_acc": 0.5538, + "lyapunov": null, + "grad_norm": 1.0334590332592064, + "grad_max_sv": 0.4484298422932625, + "grad_min_sv": 1.938236048604214e-08, + "grad_condition": 38422022.12695898, + "lr": 0.0008852566213878943, + "time_sec": 15.474556922912598 + }, + { + "epoch": 34, + "train_loss": 0.9141502959060669, + "train_acc": 0.72538, + "test_loss": 1.8125969528198242, + "test_acc": 0.5461, + "lyapunov": null, + "grad_norm": 1.020200863648912, + "grad_max_sv": 0.44143804982304574, + "grad_min_sv": 1.856398942207127e-08, + "grad_condition": 117935929.65389478, + "lr": 0.000878497527825878, + "time_sec": 15.485417366027832 + }, + { + "epoch": 35, + "train_loss": 0.8939477145385742, + "train_acc": 0.72998, + "test_loss": 1.8124234422683716, + "test_acc": 0.5558, + "lyapunov": null, + "grad_norm": 1.0031609444634824, + "grad_max_sv": 0.4364132799208164, + "grad_min_sv": 1.819760966359496e-08, + "grad_condition": 38733067.30472837, + "lr": 0.000871572412738697, + "time_sec": 15.474757432937622 + }, + { + "epoch": 36, + "train_loss": 0.8783849499893188, + "train_acc": 0.7375, + "test_loss": 2.0318579233169554, + "test_acc": 0.5215, + "lyapunov": null, + "grad_norm": 0.993071712133669, + "grad_max_sv": 0.4357504576444626, + "grad_min_sv": 1.8338578772203463e-08, + "grad_condition": 66584075.59983899, + "lr": 0.0008644843137107055, + "time_sec": 15.47328805923462 + }, + { + "epoch": 37, + "train_loss": 0.8544786010742188, + "train_acc": 0.74252, + "test_loss": 1.7350282289505006, + "test_acc": 0.5703, + "lyapunov": null, + "grad_norm": 0.9779352878833807, + "grad_max_sv": 0.42835590019822123, + "grad_min_sv": 1.7869282904758865e-08, + "grad_condition": 39240168.34852584, + "lr": 0.0008572363398164014, + "time_sec": 15.479693412780762 + }, + { + "epoch": 38, + "train_loss": 0.8369656467819214, + "train_acc": 0.7451, + "test_loss": 1.8668952745437621, + "test_acc": 0.545, + "lyapunov": null, + "grad_norm": 0.9729051326605097, + "grad_max_sv": 0.42709693908691404, + "grad_min_sv": 1.8001504511339085e-08, + "grad_condition": 69145831.04846993, + "lr": 0.0008498316702566826, + "time_sec": 15.467434167861938 + }, + { + "epoch": 39, + "train_loss": 0.8145392098999024, + "train_acc": 0.75306, + "test_loss": 1.8897558479309082, + "test_acc": 0.5503, + "lyapunov": null, + "grad_norm": 0.9541931051989594, + "grad_max_sv": 0.4177068963646889, + "grad_min_sv": 1.733705095180449e-08, + "grad_condition": 47970887.65811751, + "lr": 0.0008422735529643442, + "time_sec": 15.485415935516357 + }, + { + "epoch": 40, + "train_loss": 0.807158277015686, + "train_acc": 0.75318, + "test_loss": 1.9477338481903077, + "test_acc": 0.5448, + "lyapunov": null, + "grad_norm": 0.954786311576214, + "grad_max_sv": 0.4165697038173676, + "grad_min_sv": 1.7467571476748044e-08, + "grad_condition": 71184092.08959822, + "lr": 0.0008345653031794289, + "time_sec": 15.485467195510864 + }, + { + "epoch": 41, + "train_loss": 0.7800393992233277, + "train_acc": 0.76146, + "test_loss": 1.8521117683410644, + "test_acc": 0.558, + "lyapunov": null, + "grad_norm": 0.9354361850547955, + "grad_max_sv": 0.39634769782423973, + "grad_min_sv": 1.7005577766619763e-08, + "grad_condition": 138342469.93119007, + "lr": 0.0008267103019950526, + "time_sec": 15.47174334526062 + }, + { + "epoch": 42, + "train_loss": 0.7673079490661621, + "train_acc": 0.76286, + "test_loss": 1.7608818145751952, + "test_acc": 0.577, + "lyapunov": null, + "grad_norm": 0.9379451954941195, + "grad_max_sv": 0.4147824175655842, + "grad_min_sv": 1.7161911683612197e-08, + "grad_condition": 393263932.238869, + "lr": 0.0008187119948743447, + "time_sec": 15.480841875076294 + }, + { + "epoch": 43, + "train_loss": 0.7557721022987366, + "train_acc": 0.76692, + "test_loss": 1.8332683414459228, + "test_acc": 0.5644, + "lyapunov": null, + "grad_norm": 0.9301101362040648, + "grad_max_sv": 0.40277465879917146, + "grad_min_sv": 1.665620945143914e-08, + "grad_condition": 317094927.94089293, + "lr": 0.000810573890139155, + "time_sec": 15.466366291046143 + }, + { + "epoch": 44, + "train_loss": 0.7345015475463867, + "train_acc": 0.77376, + "test_loss": 2.0360315671920777, + "test_acc": 0.5296, + "lyapunov": null, + "grad_norm": 0.9112815822240762, + "grad_max_sv": 0.39828494787216184, + "grad_min_sv": 1.6604482540208235e-08, + "grad_condition": 1254182168.7542708, + "lr": 0.0008022995574311873, + "time_sec": 15.476161003112793 + }, + { + "epoch": 45, + "train_loss": 0.7160864910125733, + "train_acc": 0.77798, + "test_loss": 2.0404258838653564, + "test_acc": 0.5382, + "lyapunov": null, + "grad_norm": 0.8941597810728247, + "grad_max_sv": 0.397457180917263, + "grad_min_sv": 1.6262863201943478e-08, + "grad_condition": 84531533.80346392, + "lr": 0.0007938926261462363, + "time_sec": 15.475411176681519 + }, + { + "epoch": 46, + "train_loss": 0.6994082283973694, + "train_acc": 0.78516, + "test_loss": 1.8352840042114258, + "test_acc": 0.5715, + "lyapunov": null, + "grad_norm": 0.8836953876364382, + "grad_max_sv": 0.38196621984243395, + "grad_min_sv": 1.585408843512992e-08, + "grad_condition": 76847427.02204503, + "lr": 0.0007853567838422158, + "time_sec": 15.509245872497559 + }, + { + "epoch": 47, + "train_loss": 0.6929370341110229, + "train_acc": 0.786, + "test_loss": 1.7921090829849242, + "test_acc": 0.5714, + "lyapunov": null, + "grad_norm": 0.8861845328251086, + "grad_max_sv": 0.39072656705975534, + "grad_min_sv": 1.5896329046182282e-08, + "grad_condition": 600990537.5108824, + "lr": 0.0007766957746216719, + "time_sec": 15.538230895996094 + }, + { + "epoch": 48, + "train_loss": 0.6808394806671143, + "train_acc": 0.79018, + "test_loss": 1.8164992214202882, + "test_acc": 0.5718, + "lyapunov": null, + "grad_norm": 0.8747589044293621, + "grad_max_sv": 0.3651046365499496, + "grad_min_sv": 1.5464912742416125e-08, + "grad_condition": 108472217.28693132, + "lr": 0.0007679133974894982, + "time_sec": 15.491382360458374 + }, + { + "epoch": 49, + "train_loss": 0.6645313382148743, + "train_acc": 0.79124, + "test_loss": 1.9076677312850951, + "test_acc": 0.5604, + "lyapunov": null, + "grad_norm": 0.8702547527458556, + "grad_max_sv": 0.3733041428029537, + "grad_min_sv": 1.552003626170695e-08, + "grad_condition": 37206285.59276767, + "lr": 0.000759013504686565, + "time_sec": 15.492026090621948 + }, + { + "epoch": 50, + "train_loss": 0.6496543109512329, + "train_acc": 0.79798, + "test_loss": 1.7902040550231935, + "test_acc": 0.577, + "lyapunov": null, + "grad_norm": 0.8583943232969492, + "grad_max_sv": 0.3693894289433956, + "grad_min_sv": 1.526528436018859e-08, + "grad_condition": 167614304.3259273, + "lr": 0.0007499999999999998, + "time_sec": 15.511015892028809 + }, + { + "epoch": 51, + "train_loss": 0.6329201017856598, + "train_acc": 0.8008, + "test_loss": 1.8939409488677978, + "test_acc": 0.5669, + "lyapunov": null, + "grad_norm": 0.8468251234327242, + "grad_max_sv": 0.379767844825983, + "grad_min_sv": 1.5527148693184055e-08, + "grad_condition": 40445680.98758187, + "lr": 0.0007408768370508575, + "time_sec": 15.502861976623535 + }, + { + "epoch": 52, + "train_loss": 0.6156794411849975, + "train_acc": 0.8076, + "test_loss": 1.8557664161682128, + "test_acc": 0.5669, + "lyapunov": null, + "grad_norm": 0.8409556426090318, + "grad_max_sv": 0.3604695089161396, + "grad_min_sv": 1.5232246320523447e-08, + "grad_condition": 154891483.950261, + "lr": 0.0007316480175599307, + "time_sec": 15.50012731552124 + }, + { + "epoch": 53, + "train_loss": 0.6097512643051147, + "train_acc": 0.80932, + "test_loss": 1.9206684701919556, + "test_acc": 0.5625, + "lyapunov": null, + "grad_norm": 0.8343400645564791, + "grad_max_sv": 0.36483332961797715, + "grad_min_sv": 1.4756883175842672e-08, + "grad_condition": 60983068.9144889, + "lr": 0.0007223175895924635, + "time_sec": 15.473671436309814 + }, + { + "epoch": 54, + "train_loss": 0.5996515681266784, + "train_acc": 0.81028, + "test_loss": 1.813775136566162, + "test_acc": 0.5799, + "lyapunov": null, + "grad_norm": 0.8292003009813924, + "grad_max_sv": 0.3576398268342018, + "grad_min_sv": 1.4879297414310821e-08, + "grad_condition": 169462696.72509637, + "lr": 0.0007128896457825361, + "time_sec": 15.514740228652954 + }, + { + "epoch": 55, + "train_loss": 0.583572147731781, + "train_acc": 0.81692, + "test_loss": 2.1540262565612793, + "test_acc": 0.5359, + "lyapunov": null, + "grad_norm": 0.8153888602407285, + "grad_max_sv": 0.35695644542574884, + "grad_min_sv": 1.4523149247103185e-08, + "grad_condition": 121177173.48603642, + "lr": 0.0007033683215378998, + "time_sec": 15.494624614715576 + }, + { + "epoch": 56, + "train_loss": 0.5730211604690552, + "train_acc": 0.81882, + "test_loss": 1.9024797750473021, + "test_acc": 0.5681, + "lyapunov": null, + "grad_norm": 0.8114470689653183, + "grad_max_sv": 0.3512945234775543, + "grad_min_sv": 1.4168293734420634e-08, + "grad_condition": 1195593278.9067845, + "lr": 0.0006937577932260512, + "time_sec": 15.484891176223755 + }, + { + "epoch": 57, + "train_loss": 0.5623767246627808, + "train_acc": 0.82144, + "test_loss": 1.8823775342941285, + "test_acc": 0.5727, + "lyapunov": null, + "grad_norm": 0.8082731215074979, + "grad_max_sv": 0.348369175940752, + "grad_min_sv": 1.429975417729934e-08, + "grad_condition": 63927698.94124661, + "lr": 0.0006840622763423388, + "time_sec": 15.500881433486938 + }, + { + "epoch": 58, + "train_loss": 0.5483553691482544, + "train_acc": 0.82696, + "test_loss": 1.8506002332687377, + "test_acc": 0.5809, + "lyapunov": null, + "grad_norm": 0.7992259508625827, + "grad_max_sv": 0.341405463218689, + "grad_min_sv": 1.3835257317573735e-08, + "grad_condition": 33930048.946812846, + "lr": 0.0006742860236609073, + "time_sec": 15.480631589889526 + }, + { + "epoch": 59, + "train_loss": 0.5366774555110931, + "train_acc": 0.8303, + "test_loss": 1.825086770439148, + "test_acc": 0.5833, + "lyapunov": null, + "grad_norm": 0.7819063927350494, + "grad_max_sv": 0.3418069466948509, + "grad_min_sv": 1.3836575564691103e-08, + "grad_condition": 408216925.10828066, + "lr": 0.0006644333233692913, + "time_sec": 15.500194072723389 + }, + { + "epoch": 60, + "train_loss": 0.5336303442287446, + "train_acc": 0.83014, + "test_loss": 1.8931641094207763, + "test_acc": 0.5815, + "lyapunov": null, + "grad_norm": 0.7872838454858564, + "grad_max_sv": 0.3333701379597187, + "grad_min_sv": 1.3876314406248771e-08, + "grad_condition": 438039568.05699426, + "lr": 0.0006545084971874734, + "time_sec": 15.50975775718689 + }, + { + "epoch": 61, + "train_loss": 0.5172760334014893, + "train_acc": 0.8346, + "test_loss": 1.8987928335189819, + "test_acc": 0.579, + "lyapunov": null, + "grad_norm": 0.7761151334812662, + "grad_max_sv": 0.34407150372862816, + "grad_min_sv": 1.3653881279773738e-08, + "grad_condition": 74302812.53353639, + "lr": 0.0006445158984722354, + "time_sec": 15.496349096298218 + }, + { + "epoch": 62, + "train_loss": 0.5046570606422425, + "train_acc": 0.83994, + "test_loss": 1.8855070373535157, + "test_acc": 0.5827, + "lyapunov": null, + "grad_norm": 0.7637023137146217, + "grad_max_sv": 0.3265983276069164, + "grad_min_sv": 1.3850480627165818e-08, + "grad_condition": 140662163.06722394, + "lr": 0.0006344599103076324, + "time_sec": 15.499541997909546 + }, + { + "epoch": 63, + "train_loss": 0.5043497357273102, + "train_acc": 0.8385, + "test_loss": 1.9895195541381836, + "test_acc": 0.5677, + "lyapunov": null, + "grad_norm": 0.7677478821534836, + "grad_max_sv": 0.33033859431743623, + "grad_min_sv": 1.32192005543319e-08, + "grad_condition": 238327868.213135, + "lr": 0.0006243449435824269, + "time_sec": 15.487115621566772 + }, + { + "epoch": 64, + "train_loss": 0.4833570729255676, + "train_acc": 0.84588, + "test_loss": 1.8681790885925293, + "test_acc": 0.586, + "lyapunov": null, + "grad_norm": 0.751862285796187, + "grad_max_sv": 0.3356017153710127, + "grad_min_sv": 1.374610183761324e-08, + "grad_condition": 301923677.0958418, + "lr": 0.0006141754350553275, + "time_sec": 15.47073483467102 + }, + { + "epoch": 65, + "train_loss": 0.4746548810005188, + "train_acc": 0.85036, + "test_loss": 1.8871611476898194, + "test_acc": 0.5849, + "lyapunov": null, + "grad_norm": 0.7470026047014822, + "grad_max_sv": 0.3292991783469915, + "grad_min_sv": 1.3641982613693537e-08, + "grad_condition": 89497941.46737906, + "lr": 0.0006039558454088793, + "time_sec": 15.498655796051025 + }, + { + "epoch": 66, + "train_loss": 0.4682476936244965, + "train_acc": 0.85176, + "test_loss": 1.9322247032165527, + "test_acc": 0.5781, + "lyapunov": null, + "grad_norm": 0.746205818915284, + "grad_max_sv": 0.324980178847909, + "grad_min_sv": 1.332827236268791e-08, + "grad_condition": 515634785.2347584, + "lr": 0.000593690657292862, + "time_sec": 15.49347710609436 + }, + { + "epoch": 67, + "train_loss": 0.4535627157497406, + "train_acc": 0.85524, + "test_loss": 1.9315398765563965, + "test_acc": 0.5792, + "lyapunov": null, + "grad_norm": 0.7351128594354965, + "grad_max_sv": 0.32144386470317843, + "grad_min_sv": 1.316271100388136e-08, + "grad_condition": 198503645.63195387, + "lr": 0.0005833843733580507, + "time_sec": 15.485307216644287 + }, + { + "epoch": 68, + "train_loss": 0.44375179916381835, + "train_acc": 0.85868, + "test_loss": 1.9626713150024413, + "test_acc": 0.5797, + "lyapunov": null, + "grad_norm": 0.7275082319568421, + "grad_max_sv": 0.31693296767771245, + "grad_min_sv": 1.2464710682147037e-08, + "grad_condition": 448992015.43105906, + "lr": 0.0005730415142812054, + "time_sec": 15.502485990524292 + }, + { + "epoch": 69, + "train_loss": 0.4375394599914551, + "train_acc": 0.8578, + "test_loss": 1.933611646080017, + "test_acc": 0.5841, + "lyapunov": null, + "grad_norm": 0.7285377709438317, + "grad_max_sv": 0.3246665924787521, + "grad_min_sv": 1.2657065806900847e-08, + "grad_condition": 183352263.73309737, + "lr": 0.0005626666167821517, + "time_sec": 15.504365682601929 + }, + { + "epoch": 70, + "train_loss": 0.4293804252910614, + "train_acc": 0.86176, + "test_loss": 1.9648184246063232, + "test_acc": 0.5803, + "lyapunov": null, + "grad_norm": 0.7201252438636403, + "grad_max_sv": 0.32932178787887095, + "grad_min_sv": 1.2632546332082274e-08, + "grad_condition": 152515630.29556593, + "lr": 0.0005522642316338265, + "time_sec": 15.50436282157898 + }, + { + "epoch": 71, + "train_loss": 0.4283500701713562, + "train_acc": 0.86214, + "test_loss": 1.9075251319885254, + "test_acc": 0.5925, + "lyapunov": null, + "grad_norm": 0.7191799969742115, + "grad_max_sv": 0.31320683732628823, + "grad_min_sv": 1.3020388655790583e-08, + "grad_condition": 140157658.32034963, + "lr": 0.0005418389216661573, + "time_sec": 15.498285293579102 + }, + { + "epoch": 72, + "train_loss": 0.41739362247467043, + "train_acc": 0.86518, + "test_loss": 1.9817939153671265, + "test_acc": 0.5787, + "lyapunov": null, + "grad_norm": 0.7089702462612528, + "grad_max_sv": 0.31360611245036124, + "grad_min_sv": 1.2536597712286407e-08, + "grad_condition": 419598262.18900955, + "lr": 0.0005313952597646563, + "time_sec": 15.484673976898193 + }, + { + "epoch": 73, + "train_loss": 0.4100272283267975, + "train_acc": 0.8682, + "test_loss": 1.9430673105239868, + "test_acc": 0.5896, + "lyapunov": null, + "grad_norm": 0.701251782999493, + "grad_max_sv": 0.31041153334081173, + "grad_min_sv": 1.2882357953384466e-08, + "grad_condition": 168668664.161966, + "lr": 0.0005209378268645994, + "time_sec": 15.47413682937622 + }, + { + "epoch": 74, + "train_loss": 0.399578921251297, + "train_acc": 0.87068, + "test_loss": 1.9265120712280273, + "test_acc": 0.5864, + "lyapunov": null, + "grad_norm": 0.6934025786184035, + "grad_max_sv": 0.3066574942320585, + "grad_min_sv": 1.2560646439098433e-08, + "grad_condition": 129867930.4907889, + "lr": 0.0005104712099416781, + "time_sec": 15.502904891967773 + }, + { + "epoch": 75, + "train_loss": 0.38554568584918975, + "train_acc": 0.87558, + "test_loss": 1.9176615629196168, + "test_acc": 0.5925, + "lyapunov": null, + "grad_norm": 0.6895198915282967, + "grad_max_sv": 0.3080108392983675, + "grad_min_sv": 1.229493239038532e-08, + "grad_condition": 1984776951.5641804, + "lr": 0.0004999999999999996, + "time_sec": 15.504841089248657 + }, + { + "epoch": 76, + "train_loss": 0.3888973752117157, + "train_acc": 0.87366, + "test_loss": 1.9323603094100952, + "test_acc": 0.5905, + "lyapunov": null, + "grad_norm": 0.689575361251709, + "grad_max_sv": 0.30503964237868786, + "grad_min_sv": 1.223273589129499e-08, + "grad_condition": 592473189.0734928, + "lr": 0.0004895287900583212, + "time_sec": 15.488545894622803 + }, + { + "epoch": 77, + "train_loss": 0.375536418132782, + "train_acc": 0.87906, + "test_loss": 1.9612086307525636, + "test_acc": 0.5896, + "lyapunov": null, + "grad_norm": 0.6799899173694914, + "grad_max_sv": 0.28870479166507723, + "grad_min_sv": 1.1852196383013713e-08, + "grad_condition": 974539567.6482589, + "lr": 0.0004790621731353997, + "time_sec": 15.496360778808594 + }, + { + "epoch": 78, + "train_loss": 0.3633386760520935, + "train_acc": 0.88388, + "test_loss": 2.0136638622283938, + "test_acc": 0.5813, + "lyapunov": null, + "grad_norm": 0.669468067176516, + "grad_max_sv": 0.2999464552849531, + "grad_min_sv": 1.1967348311804626e-08, + "grad_condition": 336932159.827844, + "lr": 0.000468604740235343, + "time_sec": 15.49899435043335 + }, + { + "epoch": 79, + "train_loss": 0.3648362389755249, + "train_acc": 0.88286, + "test_loss": 1.962812972831726, + "test_acc": 0.5878, + "lyapunov": null, + "grad_norm": 0.6712781124195144, + "grad_max_sv": 0.3077389158308506, + "grad_min_sv": 1.1902174327019233e-08, + "grad_condition": 79151255.2676374, + "lr": 0.00045816107833384175, + "time_sec": 15.50163722038269 + }, + { + "epoch": 80, + "train_loss": 0.3587533256816864, + "train_acc": 0.88438, + "test_loss": 2.031941645812988, + "test_acc": 0.5782, + "lyapunov": null, + "grad_norm": 0.6682785418366496, + "grad_max_sv": 0.3066766869276762, + "grad_min_sv": 1.2061256379237995e-08, + "grad_condition": 166882222.61886424, + "lr": 0.0004477357683661729, + "time_sec": 15.493919610977173 + }, + { + "epoch": 81, + "train_loss": 0.3532279273414612, + "train_acc": 0.88642, + "test_loss": 1.9712375566482543, + "test_acc": 0.5907, + "lyapunov": null, + "grad_norm": 0.6617439515766644, + "grad_max_sv": 0.2908315297216177, + "grad_min_sv": 1.1691992539419882e-08, + "grad_condition": 159733352.26610285, + "lr": 0.00043733338321784746, + "time_sec": 15.49502420425415 + }, + { + "epoch": 82, + "train_loss": 0.337565802192688, + "train_acc": 0.8912, + "test_loss": 2.0504629846572877, + "test_acc": 0.5809, + "lyapunov": null, + "grad_norm": 0.6468139784059553, + "grad_max_sv": 0.29187568798661234, + "grad_min_sv": 1.1621694805114122e-08, + "grad_condition": 4917199791.496119, + "lr": 0.0004269584857187939, + "time_sec": 15.506073236465454 + }, + { + "epoch": 83, + "train_loss": 0.3370664621257782, + "train_acc": 0.8903, + "test_loss": 1.9356835838317872, + "test_acc": 0.5944, + "lyapunov": null, + "grad_norm": 0.6494703611205956, + "grad_max_sv": 0.29382526241242884, + "grad_min_sv": 1.174881616096586e-08, + "grad_condition": 730478169.7287635, + "lr": 0.0004166156266419484, + "time_sec": 15.50250792503357 + }, + { + "epoch": 84, + "train_loss": 0.329011485414505, + "train_acc": 0.8946, + "test_loss": 2.079398715400696, + "test_acc": 0.5797, + "lyapunov": null, + "grad_norm": 0.643698144652478, + "grad_max_sv": 0.29514241628348825, + "grad_min_sv": 1.140666323123582e-08, + "grad_condition": 487746924.1063552, + "lr": 0.0004063093427071373, + "time_sec": 15.505268812179565 + }, + { + "epoch": 85, + "train_loss": 0.3234008149909973, + "train_acc": 0.89458, + "test_loss": 1.9295039024353027, + "test_acc": 0.5972, + "lyapunov": null, + "grad_norm": 0.6406406419682773, + "grad_max_sv": 0.28015601113438604, + "grad_min_sv": 1.1093708248907652e-08, + "grad_condition": 168584514.79069662, + "lr": 0.0003960441545911199, + "time_sec": 15.517300128936768 + }, + { + "epoch": 86, + "train_loss": 0.3155531369972229, + "train_acc": 0.89746, + "test_loss": 1.9418060377120971, + "test_acc": 0.5998, + "lyapunov": null, + "grad_norm": 0.6350703488704397, + "grad_max_sv": 0.29371371641755106, + "grad_min_sv": 1.1439264175315545e-08, + "grad_condition": 137016772.41396585, + "lr": 0.0003858245649446718, + "time_sec": 15.547461986541748 + }, + { + "epoch": 87, + "train_loss": 0.3074404651927948, + "train_acc": 0.90046, + "test_loss": 1.9792525926589966, + "test_acc": 0.5962, + "lyapunov": null, + "grad_norm": 0.6264501533131277, + "grad_max_sv": 0.2842790149152279, + "grad_min_sv": 1.0928390427257691e-08, + "grad_condition": 1305488613.824437, + "lr": 0.00037565505641757235, + "time_sec": 15.51766037940979 + }, + { + "epoch": 88, + "train_loss": 0.30229676830768587, + "train_acc": 0.90176, + "test_loss": 1.976724716567993, + "test_acc": 0.5936, + "lyapunov": null, + "grad_norm": 0.6211883734687677, + "grad_max_sv": 0.2838983990252018, + "grad_min_sv": 1.1175761286449232e-08, + "grad_condition": 333355247.3488082, + "lr": 0.00036554008969236695, + "time_sec": 15.503639221191406 + }, + { + "epoch": 89, + "train_loss": 0.2988234822654724, + "train_acc": 0.90424, + "test_loss": 1.9976719675064087, + "test_acc": 0.5967, + "lyapunov": null, + "grad_norm": 0.6213370027659331, + "grad_max_sv": 0.28663169853389264, + "grad_min_sv": 1.1367645391321956e-08, + "grad_condition": 134336770.77173668, + "lr": 0.0003554841015277638, + "time_sec": 15.497193574905396 + }, + { + "epoch": 90, + "train_loss": 0.29101773542404175, + "train_acc": 0.9066, + "test_loss": 1.9723329444885254, + "test_acc": 0.5984, + "lyapunov": null, + "grad_norm": 0.6117671492586956, + "grad_max_sv": 0.2787142962217331, + "grad_min_sv": 1.082959833688564e-08, + "grad_condition": 693540712.1308935, + "lr": 0.000345491502812526, + "time_sec": 15.504314661026001 + }, + { + "epoch": 91, + "train_loss": 0.29135215978622436, + "train_acc": 0.90466, + "test_loss": 1.9791620111465453, + "test_acc": 0.5971, + "lyapunov": null, + "grad_norm": 0.6144584827027046, + "grad_max_sv": 0.2858317792415619, + "grad_min_sv": 1.112117410219729e-08, + "grad_condition": 533297710.9846781, + "lr": 0.0003355666766307081, + "time_sec": 15.508234977722168 + }, + { + "epoch": 92, + "train_loss": 0.28011693614006045, + "train_acc": 0.90924, + "test_loss": 1.9835497787475587, + "test_acc": 0.5948, + "lyapunov": null, + "grad_norm": 0.6018450358334453, + "grad_max_sv": 0.2840783912688494, + "grad_min_sv": 1.073533659606829e-08, + "grad_condition": 553082386.2675663, + "lr": 0.00032571397633909225, + "time_sec": 15.51693344116211 + }, + { + "epoch": 93, + "train_loss": 0.28014948011398316, + "train_acc": 0.91044, + "test_loss": 1.9525927974700927, + "test_acc": 0.5988, + "lyapunov": null, + "grad_norm": 0.5970591995758349, + "grad_max_sv": 0.27580611146986483, + "grad_min_sv": 1.084302959390368e-08, + "grad_condition": 267617873.38796434, + "lr": 0.00031593772365766094, + "time_sec": 15.507484197616577 + }, + { + "epoch": 94, + "train_loss": 0.2744602131557465, + "train_acc": 0.90992, + "test_loss": 1.9839596082687379, + "test_acc": 0.5989, + "lyapunov": null, + "grad_norm": 0.5927553038661005, + "grad_max_sv": 0.2760546799749136, + "grad_min_sv": 1.0739196502950258e-08, + "grad_condition": 394969307.85135096, + "lr": 0.0003062422067739483, + "time_sec": 15.516487121582031 + }, + { + "epoch": 95, + "train_loss": 0.2686861476325989, + "train_acc": 0.91254, + "test_loss": 1.977996702194214, + "test_acc": 0.605, + "lyapunov": null, + "grad_norm": 0.5892956934064133, + "grad_max_sv": 0.27805082462728026, + "grad_min_sv": 1.052729135583158e-08, + "grad_condition": 344387886.3070652, + "lr": 0.00029663167846209965, + "time_sec": 15.495723962783813 + }, + { + "epoch": 96, + "train_loss": 0.26172939152240754, + "train_acc": 0.91622, + "test_loss": 2.0434574504852296, + "test_acc": 0.5946, + "lyapunov": null, + "grad_norm": 0.5805032172314536, + "grad_max_sv": 0.2648235227912664, + "grad_min_sv": 1.057376605411841e-08, + "grad_condition": 771027815.348639, + "lr": 0.00028711035421746345, + "time_sec": 15.489963293075562 + }, + { + "epoch": 97, + "train_loss": 0.25184455102920533, + "train_acc": 0.91832, + "test_loss": 1.9518341100692749, + "test_acc": 0.6097, + "lyapunov": null, + "grad_norm": 0.5774864526737941, + "grad_max_sv": 0.26801337823271754, + "grad_min_sv": 1.0317103195465332e-08, + "grad_condition": 602185384.328079, + "lr": 0.00027768241040753615, + "time_sec": 15.513015985488892 + }, + { + "epoch": 98, + "train_loss": 0.24914393192768097, + "train_acc": 0.91812, + "test_loss": 1.983034141921997, + "test_acc": 0.6073, + "lyapunov": null, + "grad_norm": 0.573198769045943, + "grad_max_sv": 0.2713981341570616, + "grad_min_sv": 1.03603865028723e-08, + "grad_condition": 87200014.42748493, + "lr": 0.00026835198244006903, + "time_sec": 15.507933616638184 + }, + { + "epoch": 99, + "train_loss": 0.2450516757631302, + "train_acc": 0.9213, + "test_loss": 2.0576653924942017, + "test_acc": 0.5987, + "lyapunov": null, + "grad_norm": 0.565340793701802, + "grad_max_sv": 0.26787664406001566, + "grad_min_sv": 1.0084340480113335e-08, + "grad_condition": 993815528.2154503, + "lr": 0.0002591231629491421, + "time_sec": 15.498576164245605 + }, + { + "epoch": 100, + "train_loss": 0.2435112312412262, + "train_acc": 0.92126, + "test_loss": 1.9808508350372314, + "test_acc": 0.6083, + "lyapunov": null, + "grad_norm": 0.5671331888797334, + "grad_max_sv": 0.2718590907752514, + "grad_min_sv": 1.0603882181613872e-08, + "grad_condition": 515734941.7641746, + "lr": 0.0002499999999999997, + "time_sec": 15.509106874465942 + }, + { + "epoch": 101, + "train_loss": 0.23981757608413695, + "train_acc": 0.92198, + "test_loss": 1.9874406982421875, + "test_acc": 0.6051, + "lyapunov": null, + "grad_norm": 0.5662694992474826, + "grad_max_sv": 0.27430120259523394, + "grad_min_sv": 1.0230437299217631e-08, + "grad_condition": 552718981.9754595, + "lr": 0.00024098649531343477, + "time_sec": 15.50493860244751 + }, + { + "epoch": 102, + "train_loss": 0.23594800971031188, + "train_acc": 0.92386, + "test_loss": 2.0030108623504637, + "test_acc": 0.6045, + "lyapunov": null, + "grad_norm": 0.557765074009711, + "grad_max_sv": 0.25009447410702706, + "grad_min_sv": 9.674274866248132e-09, + "grad_condition": 671563833.1462272, + "lr": 0.0002320866025105016, + "time_sec": 15.537469863891602 + }, + { + "epoch": 103, + "train_loss": 0.22944483037471772, + "train_acc": 0.9257, + "test_loss": 1.997948205947876, + "test_acc": 0.6021, + "lyapunov": null, + "grad_norm": 0.5530501913094669, + "grad_max_sv": 0.25403534434735775, + "grad_min_sv": 9.987440614811493e-09, + "grad_condition": 64606423.56909867, + "lr": 0.0002233042253783278, + "time_sec": 15.524824619293213 + }, + { + "epoch": 104, + "train_loss": 0.2232392775917053, + "train_acc": 0.92808, + "test_loss": 1.916127438735962, + "test_acc": 0.6142, + "lyapunov": null, + "grad_norm": 0.5470142147101442, + "grad_max_sv": 0.2518034357577562, + "grad_min_sv": 9.64682456273784e-09, + "grad_condition": 523753099.18247145, + "lr": 0.000214643216157784, + "time_sec": 15.519572973251343 + }, + { + "epoch": 105, + "train_loss": 0.21899011870384216, + "train_acc": 0.93022, + "test_loss": 1.9813644931793213, + "test_acc": 0.6042, + "lyapunov": null, + "grad_norm": 0.540595572944098, + "grad_max_sv": 0.25836079344153406, + "grad_min_sv": 9.721760932390744e-09, + "grad_condition": 149408798.18128103, + "lr": 0.00020610737385376332, + "time_sec": 15.511976957321167 + }, + { + "epoch": 106, + "train_loss": 0.22239319385528564, + "train_acc": 0.9288, + "test_loss": 2.019803592300415, + "test_acc": 0.6062, + "lyapunov": null, + "grad_norm": 0.5444023817051111, + "grad_max_sv": 0.2558960601687431, + "grad_min_sv": 9.743871165522958e-09, + "grad_condition": 421456811.7162399, + "lr": 0.00019770044256881242, + "time_sec": 15.492303371429443 + }, + { + "epoch": 107, + "train_loss": 0.21911219958305359, + "train_acc": 0.92724, + "test_loss": 1.9594658828735352, + "test_acc": 0.6122, + "lyapunov": null, + "grad_norm": 0.5463060896750315, + "grad_max_sv": 0.25181276090443133, + "grad_min_sv": 9.477817535397808e-09, + "grad_condition": 260599469.65846786, + "lr": 0.0001894261098608447, + "time_sec": 15.511865139007568 + }, + { + "epoch": 108, + "train_loss": 0.2136860816383362, + "train_acc": 0.93128, + "test_loss": 1.9913309350967408, + "test_acc": 0.6093, + "lyapunov": null, + "grad_norm": 0.5352068921664158, + "grad_max_sv": 0.2675321064889431, + "grad_min_sv": 1.0163352071659035e-08, + "grad_condition": 3452227132.4482284, + "lr": 0.000181288005125655, + "time_sec": 15.58255934715271 + }, + { + "epoch": 109, + "train_loss": 0.21131246563911438, + "train_acc": 0.93124, + "test_loss": 1.9869737873077393, + "test_acc": 0.6101, + "lyapunov": null, + "grad_norm": 0.5344952417105377, + "grad_max_sv": 0.2572028797119856, + "grad_min_sv": 9.894322512259829e-09, + "grad_condition": 825239604.2039155, + "lr": 0.0001732896980049473, + "time_sec": 15.527096509933472 + }, + { + "epoch": 110, + "train_loss": 0.20613145572185515, + "train_acc": 0.93496, + "test_loss": 1.9642673852920531, + "test_acc": 0.6083, + "lyapunov": null, + "grad_norm": 0.5266562322432973, + "grad_max_sv": 0.25352666079998015, + "grad_min_sv": 9.363287075498869e-09, + "grad_condition": 505733273.3952273, + "lr": 0.00016543469682057076, + "time_sec": 15.536001443862915 + }, + { + "epoch": 111, + "train_loss": 0.20270503174304963, + "train_acc": 0.93508, + "test_loss": 1.9903694719314575, + "test_acc": 0.608, + "lyapunov": null, + "grad_norm": 0.5210342707384447, + "grad_max_sv": 0.2542009174823761, + "grad_min_sv": 9.446510174006967e-09, + "grad_condition": 286370629.6135062, + "lr": 0.00015772644703565552, + "time_sec": 15.513093948364258 + }, + { + "epoch": 112, + "train_loss": 0.20146147197723388, + "train_acc": 0.93366, + "test_loss": 2.0144760524749756, + "test_acc": 0.6097, + "lyapunov": null, + "grad_norm": 0.5269979725551543, + "grad_max_sv": 0.26795426234602926, + "grad_min_sv": 9.357044586204288e-09, + "grad_condition": 370288038.01884973, + "lr": 0.00015016832974331713, + "time_sec": 15.502255916595459 + }, + { + "epoch": 113, + "train_loss": 0.19924361347198485, + "train_acc": 0.93656, + "test_loss": 2.037332961463928, + "test_acc": 0.6045, + "lyapunov": null, + "grad_norm": 0.5185296845346113, + "grad_max_sv": 0.2515675876289606, + "grad_min_sv": 9.252139900398081e-09, + "grad_condition": 112959773.59806451, + "lr": 0.00014276366018359834, + "time_sec": 15.511096477508545 + }, + { + "epoch": 114, + "train_loss": 0.1925122591304779, + "train_acc": 0.9381, + "test_loss": 2.001781312942505, + "test_acc": 0.6067, + "lyapunov": null, + "grad_norm": 0.512080843138899, + "grad_max_sv": 0.2638113047927618, + "grad_min_sv": 9.222902344467079e-09, + "grad_condition": 702867317.5417335, + "lr": 0.00013551568628929425, + "time_sec": 15.528293132781982 + }, + { + "epoch": 115, + "train_loss": 0.1863429721736908, + "train_acc": 0.94024, + "test_loss": 1.9896372226715089, + "test_acc": 0.6147, + "lyapunov": null, + "grad_norm": 0.5052730414811996, + "grad_max_sv": 0.239008704200387, + "grad_min_sv": 8.86921835820207e-09, + "grad_condition": 1285263365.3241801, + "lr": 0.00012842758726130276, + "time_sec": 15.514945983886719 + }, + { + "epoch": 116, + "train_loss": 0.18872571726799012, + "train_acc": 0.93914, + "test_loss": 2.0415555866241455, + "test_acc": 0.6066, + "lyapunov": null, + "grad_norm": 0.5103345009623144, + "grad_max_sv": 0.24828836917877198, + "grad_min_sv": 9.405215367630503e-09, + "grad_condition": 207294853.39805278, + "lr": 0.0001215024721741218, + "time_sec": 15.541447639465332 + }, + { + "epoch": 117, + "train_loss": 0.18968458090782164, + "train_acc": 0.93852, + "test_loss": 2.043529853057861, + "test_acc": 0.6064, + "lyapunov": null, + "grad_norm": 0.5117797700108315, + "grad_max_sv": 0.25188570134341715, + "grad_min_sv": 9.368504555202357e-09, + "grad_condition": 350583787.5469278, + "lr": 0.00011474337861210538, + "time_sec": 15.519954681396484 + }, + { + "epoch": 118, + "train_loss": 0.18446471235752104, + "train_acc": 0.94032, + "test_loss": 2.0161501600265503, + "test_acc": 0.611, + "lyapunov": null, + "grad_norm": 0.5034586286350297, + "grad_max_sv": 0.24743926264345645, + "grad_min_sv": 9.410030827038682e-09, + "grad_condition": 1867541501.3184059, + "lr": 0.00010815327133708009, + "time_sec": 15.52394437789917 + }, + { + "epoch": 119, + "train_loss": 0.18162137420654298, + "train_acc": 0.94302, + "test_loss": 2.045531623840332, + "test_acc": 0.6089, + "lyapunov": null, + "grad_norm": 0.4988474494797281, + "grad_max_sv": 0.2458579033613205, + "grad_min_sv": 9.119631047809635e-09, + "grad_condition": 646958702.124923, + "lr": 0.00010173504098790182, + "time_sec": 15.515710353851318 + }, + { + "epoch": 120, + "train_loss": 0.17938962819099427, + "train_acc": 0.94308, + "test_loss": 2.0503937309265137, + "test_acc": 0.6077, + "lyapunov": null, + "grad_norm": 0.4989562559637299, + "grad_max_sv": 0.2459786232560873, + "grad_min_sv": 9.11741269214554e-09, + "grad_condition": 412394597.02274954, + "lr": 9.549150281252629e-05, + "time_sec": 15.50988483428955 + }, + { + "epoch": 121, + "train_loss": 0.17874448727607728, + "train_acc": 0.9433, + "test_loss": 1.9961147312164307, + "test_acc": 0.6151, + "lyapunov": null, + "grad_norm": 0.4935280058170082, + "grad_max_sv": 0.24326966032385827, + "grad_min_sv": 9.25761599965963e-09, + "grad_condition": 299984759.10134274, + "lr": 8.942539543314794e-05, + "time_sec": 15.528467416763306 + }, + { + "epoch": 122, + "train_loss": 0.17431395033836364, + "train_acc": 0.94446, + "test_loss": 2.038390445327759, + "test_acc": 0.613, + "lyapunov": null, + "grad_norm": 0.48926666642054484, + "grad_max_sv": 0.23983839638531207, + "grad_min_sv": 8.987133019505365e-09, + "grad_condition": 372068253.35925686, + "lr": 8.353937964495024e-05, + "time_sec": 15.500731706619263 + }, + { + "epoch": 123, + "train_loss": 0.1746806291246414, + "train_acc": 0.94498, + "test_loss": 2.0120771438598632, + "test_acc": 0.6099, + "lyapunov": null, + "grad_norm": 0.48962253985732923, + "grad_max_sv": 0.23851457759737968, + "grad_min_sv": 8.603977001459158e-09, + "grad_condition": 1007854799.2213293, + "lr": 7.783603724899243e-05, + "time_sec": 15.516981840133667 + }, + { + "epoch": 124, + "train_loss": 0.17128678526878358, + "train_acc": 0.94656, + "test_loss": 2.0720390872955323, + "test_acc": 0.6088, + "lyapunov": null, + "grad_norm": 0.4869814196810216, + "grad_max_sv": 0.2417709030210972, + "grad_min_sv": 9.009437708026868e-09, + "grad_condition": 145836314.2500567, + "lr": 7.231786991974666e-05, + "time_sec": 15.496051549911499 + }, + { + "epoch": 125, + "train_loss": 0.17059236883163453, + "train_acc": 0.94604, + "test_loss": 2.0477584241867066, + "test_acc": 0.6122, + "lyapunov": null, + "grad_norm": 0.4843155728593804, + "grad_max_sv": 0.2388555094599724, + "grad_min_sv": 8.632761457245953e-09, + "grad_condition": 270912168.9760497, + "lr": 6.698729810778072e-05, + "time_sec": 15.507468223571777 + }, + { + "epoch": 126, + "train_loss": 0.1733051071071625, + "train_acc": 0.94568, + "test_loss": 2.0736024877548216, + "test_acc": 0.6062, + "lyapunov": null, + "grad_norm": 0.4894754419923655, + "grad_max_sv": 0.2332348022609949, + "grad_min_sv": 8.863469305384064e-09, + "grad_condition": 160444601.063775, + "lr": 6.184665997806817e-05, + "time_sec": 15.507078647613525 + }, + { + "epoch": 127, + "train_loss": 0.16721239070892335, + "train_acc": 0.9461, + "test_loss": 2.0207285331726075, + "test_acc": 0.6115, + "lyapunov": null, + "grad_norm": 0.4795404458508196, + "grad_max_sv": 0.23950408175587654, + "grad_min_sv": 8.801710726718485e-09, + "grad_condition": 1343442143.4331565, + "lr": 5.6898210384392595e-05, + "time_sec": 15.510753154754639 + }, + { + "epoch": 128, + "train_loss": 0.16301859991550446, + "train_acc": 0.94872, + "test_loss": 2.0851793113708497, + "test_acc": 0.6103, + "lyapunov": null, + "grad_norm": 0.4714155804221718, + "grad_max_sv": 0.23401366584002972, + "grad_min_sv": 8.772188082482521e-09, + "grad_condition": 704162454.9287102, + "lr": 5.214411988029363e-05, + "time_sec": 15.514019966125488 + }, + { + "epoch": 129, + "train_loss": 0.16865292779922486, + "train_acc": 0.94554, + "test_loss": 2.0298268291473387, + "test_acc": 0.6124, + "lyapunov": null, + "grad_norm": 0.4834939277959604, + "grad_max_sv": 0.23208196237683296, + "grad_min_sv": 8.83715973165871e-09, + "grad_condition": 657084742.2965086, + "lr": 4.7586473766990294e-05, + "time_sec": 15.501888990402222 + }, + { + "epoch": 130, + "train_loss": 0.16090039955615998, + "train_acc": 0.94934, + "test_loss": 2.003493827056885, + "test_acc": 0.6146, + "lyapunov": null, + "grad_norm": 0.4705215229572171, + "grad_max_sv": 0.23428524732589723, + "grad_min_sv": 8.827295219608623e-09, + "grad_condition": 132321813.8931369, + "lr": 4.32272711786996e-05, + "time_sec": 15.520491600036621 + }, + { + "epoch": 131, + "train_loss": 0.16265953367233277, + "train_acc": 0.94782, + "test_loss": 2.0326833637237547, + "test_acc": 0.6098, + "lyapunov": null, + "grad_norm": 0.4733595950570731, + "grad_max_sv": 0.2481051605194807, + "grad_min_sv": 8.921660872021013e-09, + "grad_condition": 1308927492.8875818, + "lr": 3.906842420574966e-05, + "time_sec": 15.518625020980835 + }, + { + "epoch": 132, + "train_loss": 0.16258932497501374, + "train_acc": 0.94914, + "test_loss": 2.0198348827362063, + "test_acc": 0.6125, + "lyapunov": null, + "grad_norm": 0.4699519678045664, + "grad_max_sv": 0.24516641050577165, + "grad_min_sv": 9.013820106567064e-09, + "grad_condition": 2740149017.6448007, + "lr": 3.5111757055874305e-05, + "time_sec": 15.513976335525513 + }, + { + "epoch": 133, + "train_loss": 0.16045542496204376, + "train_acc": 0.9487, + "test_loss": 2.0480993354797365, + "test_acc": 0.6079, + "lyapunov": null, + "grad_norm": 0.47270172858917925, + "grad_max_sv": 0.24782115481793882, + "grad_min_sv": 8.897941883821703e-09, + "grad_condition": 2462171077.7853346, + "lr": 3.1359005254054254e-05, + "time_sec": 15.518577098846436 + }, + { + "epoch": 134, + "train_loss": 0.1573088404560089, + "train_acc": 0.95036, + "test_loss": 1.996682660484314, + "test_acc": 0.6142, + "lyapunov": null, + "grad_norm": 0.467276051790063, + "grad_max_sv": 0.23228747248649598, + "grad_min_sv": 8.598132571376038e-09, + "grad_condition": 260351989.2850774, + "lr": 2.7811814881259484e-05, + "time_sec": 15.509779214859009 + }, + { + "epoch": 135, + "train_loss": 0.15793343636512755, + "train_acc": 0.94978, + "test_loss": 2.078777936553955, + "test_acc": 0.61, + "lyapunov": null, + "grad_norm": 0.46749496867126566, + "grad_max_sv": 0.23898076675832272, + "grad_min_sv": 8.952387563860784e-09, + "grad_condition": 451518473.6951105, + "lr": 2.4471741852423218e-05, + "time_sec": 15.52340030670166 + }, + { + "epoch": 136, + "train_loss": 0.154298712348938, + "train_acc": 0.9515, + "test_loss": 1.9956215568542481, + "test_acc": 0.6138, + "lyapunov": null, + "grad_norm": 0.4608054622581305, + "grad_max_sv": 0.2408101461827755, + "grad_min_sv": 8.805307293241817e-09, + "grad_condition": 1102254676.5159357, + "lr": 2.1340251233966362e-05, + "time_sec": 15.507319211959839 + }, + { + "epoch": 137, + "train_loss": 0.15331442908525467, + "train_acc": 0.95256, + "test_loss": 2.0495632625579834, + "test_acc": 0.6123, + "lyapunov": null, + "grad_norm": 0.4574770378660416, + "grad_max_sv": 0.23036178909242153, + "grad_min_sv": 8.661849632126891e-09, + "grad_condition": 506789914.31804866, + "lr": 1.8418716601170932e-05, + "time_sec": 15.507285833358765 + }, + { + "epoch": 138, + "train_loss": 0.1548746111679077, + "train_acc": 0.9515, + "test_loss": 2.0342879112243653, + "test_acc": 0.6092, + "lyapunov": null, + "grad_norm": 0.4633719984784024, + "grad_max_sv": 0.23631713092327117, + "grad_min_sv": 8.577337108357351e-09, + "grad_condition": 2670530904.2886295, + "lr": 1.570841943568445e-05, + "time_sec": 15.521555662155151 + }, + { + "epoch": 139, + "train_loss": 0.15485820642471312, + "train_acc": 0.95088, + "test_loss": 2.107874339675903, + "test_acc": 0.604, + "lyapunov": null, + "grad_norm": 0.4629261012072699, + "grad_max_sv": 0.23058986626565456, + "grad_min_sv": 8.546779077175937e-09, + "grad_condition": 89370689.31677079, + "lr": 1.3210548563419845e-05, + "time_sec": 15.533792972564697 + }, + { + "epoch": 140, + "train_loss": 0.15574090136051177, + "train_acc": 0.95052, + "test_loss": 2.0240774383544924, + "test_acc": 0.6098, + "lyapunov": null, + "grad_norm": 0.46494058002876526, + "grad_max_sv": 0.23221574500203132, + "grad_min_sv": 8.638921627709962e-09, + "grad_condition": 80246168.02315111, + "lr": 1.0926199633097203e-05, + "time_sec": 15.512130975723267 + }, + { + "epoch": 141, + "train_loss": 0.1591239344215393, + "train_acc": 0.94958, + "test_loss": 2.024708453178406, + "test_acc": 0.6149, + "lyapunov": null, + "grad_norm": 0.46462826011917274, + "grad_max_sv": 0.23822997957468034, + "grad_min_sv": 8.92720696771363e-09, + "grad_condition": 4042860284.9715805, + "lr": 8.856374635655688e-06, + "time_sec": 15.50205683708191 + }, + { + "epoch": 142, + "train_loss": 0.1531704497528076, + "train_acc": 0.95164, + "test_loss": 2.019575048828125, + "test_acc": 0.6145, + "lyapunov": null, + "grad_norm": 0.45691454501139306, + "grad_max_sv": 0.2273581113666296, + "grad_min_sv": 8.328775530700144e-09, + "grad_condition": 1373651140.614626, + "lr": 7.001981464747503e-06, + "time_sec": 15.521899938583374 + }, + { + "epoch": 143, + "train_loss": 0.15698250900268554, + "train_acc": 0.94968, + "test_loss": 2.0042268390655518, + "test_acc": 0.6097, + "lyapunov": null, + "grad_norm": 0.46686753330324193, + "grad_max_sv": 0.23650417439639568, + "grad_min_sv": 8.831455570535232e-09, + "grad_condition": 482562028.10267067, + "lr": 5.3638335185058295e-06, + "time_sec": 15.537745237350464 + }, + { + "epoch": 144, + "train_loss": 0.15602278783798218, + "train_acc": 0.95138, + "test_loss": 2.042717301368713, + "test_acc": 0.611, + "lyapunov": null, + "grad_norm": 0.46083256086412094, + "grad_max_sv": 0.23666680604219437, + "grad_min_sv": 8.818174148696178e-09, + "grad_condition": 276670204.88561904, + "lr": 3.942649342761114e-06, + "time_sec": 15.521801948547363 + }, + { + "epoch": 145, + "train_loss": 0.15351612282276153, + "train_acc": 0.95176, + "test_loss": 2.0216105178833006, + "test_acc": 0.6124, + "lyapunov": null, + "grad_norm": 0.4578762379981558, + "grad_max_sv": 0.21950803697109222, + "grad_min_sv": 8.404475567989662e-09, + "grad_condition": 6256996699.314726, + "lr": 2.7390523158633524e-06, + "time_sec": 15.50935411453247 + }, + { + "epoch": 146, + "train_loss": 0.15463469685077666, + "train_acc": 0.95138, + "test_loss": 1.9923904767990113, + "test_acc": 0.6146, + "lyapunov": null, + "grad_norm": 0.4604794709370396, + "grad_max_sv": 0.23074053600430489, + "grad_min_sv": 8.697518219221225e-09, + "grad_condition": 857409957.1641747, + "lr": 1.7535703752478133e-06, + "time_sec": 15.525001287460327 + }, + { + "epoch": 147, + "train_loss": 0.15173500085830688, + "train_acc": 0.95292, + "test_loss": 2.0695271726608278, + "test_acc": 0.6111, + "lyapunov": null, + "grad_norm": 0.4579307395851847, + "grad_max_sv": 0.24183545261621475, + "grad_min_sv": 8.57581264745045e-09, + "grad_condition": 811599787.3349051, + "lr": 9.866357858642196e-07, + "time_sec": 15.52645206451416 + }, + { + "epoch": 148, + "train_loss": 0.15419637537956238, + "train_acc": 0.95064, + "test_loss": 2.059994563674927, + "test_acc": 0.6067, + "lyapunov": null, + "grad_norm": 0.4599018124122232, + "grad_max_sv": 0.23474312983453274, + "grad_min_sv": 9.05704030905452e-09, + "grad_condition": 153015326.96145612, + "lr": 4.38584950570808e-07, + "time_sec": 15.522296905517578 + }, + { + "epoch": 149, + "train_loss": 0.15387048045158386, + "train_acc": 0.95202, + "test_loss": 2.021223978805542, + "test_acc": 0.6131, + "lyapunov": null, + "grad_norm": 0.45892673603732886, + "grad_max_sv": 0.23917307555675507, + "grad_min_sv": 8.54765248256041e-09, + "grad_condition": 282516990.135565, + "lr": 1.096582625772501e-07, + "time_sec": 15.493387222290039 + }, + { + "epoch": 150, + "train_loss": 0.14960056081056594, + "train_acc": 0.95382, + "test_loss": 2.009403101348877, + "test_acc": 0.6142, + "lyapunov": null, + "grad_norm": 0.4516160601649041, + "grad_max_sv": 0.23220950104296206, + "grad_min_sv": 8.634985401440986e-09, + "grad_condition": 1119985917.5419166, + "lr": 0.0, + "time_sec": 15.502899169921875 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 4.612606842651367, + "train_acc": 0.05934, + "test_loss": 4.430249005126953, + "test_acc": 0.0547, + "lyapunov": null, + "grad_norm": 6.270141227832012, + "grad_max_sv": 5.356529116630554, + "grad_min_sv": 1.0947098767893904e-07, + "grad_condition": 215195113.11712712, + "lr": 0.0009998903417374227, + "time_sec": 32.60336875915527 + }, + { + "epoch": 2, + "train_loss": 3.9147449421691896, + "train_acc": 0.11836, + "test_loss": 4.028561441802979, + "test_acc": 0.0982, + "lyapunov": null, + "grad_norm": 4.747243571853921, + "grad_max_sv": 4.05106902718544, + "grad_min_sv": 8.568258646965421e-08, + "grad_condition": 545107965.2871394, + "lr": 0.0009995614150494292, + "time_sec": 32.505430459976196 + }, + { + "epoch": 3, + "train_loss": 3.5624093733215334, + "train_acc": 0.16334, + "test_loss": 3.77226120300293, + "test_acc": 0.1374, + "lyapunov": null, + "grad_norm": 3.93250289804397, + "grad_max_sv": 3.243712919950485, + "grad_min_sv": 7.186751209697917e-08, + "grad_condition": 88711185.58982365, + "lr": 0.0009990133642141358, + "time_sec": 32.51404023170471 + }, + { + "epoch": 4, + "train_loss": 3.3006829078674316, + "train_acc": 0.20094, + "test_loss": 3.4272261234283445, + "test_acc": 0.1834, + "lyapunov": null, + "grad_norm": 3.319092979228889, + "grad_max_sv": 2.5326511025428773, + "grad_min_sv": 6.180275069489483e-08, + "grad_condition": 54405947.77847425, + "lr": 0.0009982464296247522, + "time_sec": 32.52905559539795 + }, + { + "epoch": 5, + "train_loss": 3.0730740076446534, + "train_acc": 0.24396, + "test_loss": 3.2210192291259765, + "test_acc": 0.2218, + "lyapunov": null, + "grad_norm": 2.8429187472839956, + "grad_max_sv": 2.069159355759621, + "grad_min_sv": 5.258070004746096e-08, + "grad_condition": 221832198.05063334, + "lr": 0.0009972609476841367, + "time_sec": 32.5269730091095 + }, + { + "epoch": 6, + "train_loss": 2.8943703575897217, + "train_acc": 0.27524, + "test_loss": 3.2233618530273436, + "test_acc": 0.2301, + "lyapunov": null, + "grad_norm": 2.489126623121483, + "grad_max_sv": 1.7037211507558823, + "grad_min_sv": 4.641174645991786e-08, + "grad_condition": 69020973.60049818, + "lr": 0.000996057350657239, + "time_sec": 32.522809982299805 + }, + { + "epoch": 7, + "train_loss": 2.7278697608184816, + "train_acc": 0.30568, + "test_loss": 2.7846542739868165, + "test_acc": 0.3021, + "lyapunov": null, + "grad_norm": 2.2145469317565336, + "grad_max_sv": 1.4053084224462509, + "grad_min_sv": 4.121676469709401e-08, + "grad_condition": 74031008.12531385, + "lr": 0.000994636166481494, + "time_sec": 32.5133273601532 + }, + { + "epoch": 8, + "train_loss": 2.5846466691589356, + "train_acc": 0.33468, + "test_loss": 2.6393014106750488, + "test_acc": 0.3355, + "lyapunov": null, + "grad_norm": 2.001252586211609, + "grad_max_sv": 1.2068818539381028, + "grad_min_sv": 3.724083600525896e-08, + "grad_condition": 111617642.9828302, + "lr": 0.0009929980185352525, + "time_sec": 32.54776215553284 + }, + { + "epoch": 9, + "train_loss": 2.4496477169036863, + "train_acc": 0.36334, + "test_loss": 2.6101227111816407, + "test_acc": 0.338, + "lyapunov": null, + "grad_norm": 1.8212885788905564, + "grad_max_sv": 1.0235964789986611, + "grad_min_sv": 3.432924873258969e-08, + "grad_condition": 33560453.54798009, + "lr": 0.0009911436253643444, + "time_sec": 32.51866698265076 + }, + { + "epoch": 10, + "train_loss": 2.3403686044311525, + "train_acc": 0.38794, + "test_loss": 2.52991734085083, + "test_acc": 0.3506, + "lyapunov": null, + "grad_norm": 1.6843997430422568, + "grad_max_sv": 0.8722436726093292, + "grad_min_sv": 3.162951408564041e-08, + "grad_condition": 41826895.787083015, + "lr": 0.0009890738003669028, + "time_sec": 32.545666456222534 + }, + { + "epoch": 11, + "train_loss": 2.2328610494232177, + "train_acc": 0.4093, + "test_loss": 2.4910150177001955, + "test_acc": 0.3614, + "lyapunov": null, + "grad_norm": 1.602309204488071, + "grad_max_sv": 0.7984312251210213, + "grad_min_sv": 3.0149957178093877e-08, + "grad_condition": 42410766.28650923, + "lr": 0.00098678945143658, + "time_sec": 32.538198471069336 + }, + { + "epoch": 12, + "train_loss": 2.143996323623657, + "train_acc": 0.42864, + "test_loss": 2.4733912868499757, + "test_acc": 0.371, + "lyapunov": null, + "grad_norm": 1.5058778232189263, + "grad_max_sv": 0.7046674489974976, + "grad_min_sv": 2.8541812209514905e-08, + "grad_condition": 89676864.87927453, + "lr": 0.0009842915805643154, + "time_sec": 32.55523920059204 + }, + { + "epoch": 13, + "train_loss": 2.0627913328552245, + "train_acc": 0.44824, + "test_loss": 2.3573100704193117, + "test_acc": 0.3883, + "lyapunov": null, + "grad_norm": 1.4381799734328438, + "grad_max_sv": 0.657113502919674, + "grad_min_sv": 2.6757648968755986e-08, + "grad_condition": 44542952.01193309, + "lr": 0.000981581283398829, + "time_sec": 32.53194808959961 + }, + { + "epoch": 14, + "train_loss": 2.0010124866104126, + "train_acc": 0.45794, + "test_loss": 2.2445085243225096, + "test_acc": 0.4153, + "lyapunov": null, + "grad_norm": 1.3839283952743018, + "grad_max_sv": 0.6215245097875595, + "grad_min_sv": 2.586353823885723e-08, + "grad_condition": 32103062.13610636, + "lr": 0.0009786597487660333, + "time_sec": 32.547112703323364 + }, + { + "epoch": 15, + "train_loss": 1.9416577011489868, + "train_acc": 0.47534, + "test_loss": 2.2182875526428223, + "test_acc": 0.4247, + "lyapunov": null, + "grad_norm": 1.3285678956385127, + "grad_max_sv": 0.5932768613100052, + "grad_min_sv": 2.5034504780308e-08, + "grad_condition": 29217346.01697495, + "lr": 0.0009755282581475766, + "time_sec": 32.527819871902466 + }, + { + "epoch": 16, + "train_loss": 1.873101312637329, + "train_acc": 0.48986, + "test_loss": 2.2290160217285155, + "test_acc": 0.4272, + "lyapunov": null, + "grad_norm": 1.2913331830478172, + "grad_max_sv": 0.5665568478405476, + "grad_min_sv": 2.474239251260002e-08, + "grad_condition": 27395673.607036375, + "lr": 0.0009721881851187403, + "time_sec": 32.52952456474304 + }, + { + "epoch": 17, + "train_loss": 1.8097029363250732, + "train_acc": 0.50292, + "test_loss": 2.2615955074310303, + "test_acc": 0.424, + "lyapunov": null, + "grad_norm": 1.252294761267169, + "grad_max_sv": 0.5210624538362026, + "grad_min_sv": 2.3697808424968936e-08, + "grad_condition": 114051245.48515114, + "lr": 0.0009686409947459456, + "time_sec": 32.54529142379761 + }, + { + "epoch": 18, + "train_loss": 1.747176973838806, + "train_acc": 0.51946, + "test_loss": 2.2190833429336547, + "test_acc": 0.4281, + "lyapunov": null, + "grad_norm": 1.213131360578199, + "grad_max_sv": 0.5172027304768563, + "grad_min_sv": 2.289411261818808e-08, + "grad_condition": 51051175.59109087, + "lr": 0.0009648882429441254, + "time_sec": 32.51650047302246 + }, + { + "epoch": 19, + "train_loss": 1.694791968383789, + "train_acc": 0.5301, + "test_loss": 2.2439287574768065, + "test_acc": 0.4362, + "lyapunov": null, + "grad_norm": 1.1797460355462452, + "grad_max_sv": 0.4871015749871731, + "grad_min_sv": 2.21617759829304e-08, + "grad_condition": 166781679.9487027, + "lr": 0.00096093157579425, + "time_sec": 32.51687932014465 + }, + { + "epoch": 20, + "train_loss": 1.6451108572006226, + "train_acc": 0.54392, + "test_loss": 2.30450572013855, + "test_acc": 0.4271, + "lyapunov": null, + "grad_norm": 1.1471849936044856, + "grad_max_sv": 0.47273003607988356, + "grad_min_sv": 2.1620291118518155e-08, + "grad_condition": 25041556.16833921, + "lr": 0.0009567727288213001, + "time_sec": 32.532697916030884 + }, + { + "epoch": 21, + "train_loss": 1.6014679947662354, + "train_acc": 0.55142, + "test_loss": 2.1664475830078125, + "test_acc": 0.4584, + "lyapunov": null, + "grad_norm": 1.1229957179757897, + "grad_max_sv": 0.4562165729701519, + "grad_min_sv": 2.1112780196341775e-08, + "grad_condition": 26298334.51243094, + "lr": 0.0009524135262330095, + "time_sec": 32.53035640716553 + }, + { + "epoch": 22, + "train_loss": 1.5620909811401367, + "train_acc": 0.5613, + "test_loss": 2.162712843322754, + "test_acc": 0.4535, + "lyapunov": null, + "grad_norm": 1.1030961025754331, + "grad_max_sv": 0.4406334914267063, + "grad_min_sv": 2.045089818741852e-08, + "grad_condition": 43337785.20413343, + "lr": 0.0009478558801197061, + "time_sec": 32.51555895805359 + }, + { + "epoch": 23, + "train_loss": 1.5185724276351928, + "train_acc": 0.56968, + "test_loss": 2.1629050983428955, + "test_acc": 0.4642, + "lyapunov": null, + "grad_norm": 1.0796470270409146, + "grad_max_sv": 0.4365608513355255, + "grad_min_sv": 2.0348640585379775e-08, + "grad_condition": 199103454.04638118, + "lr": 0.000943101789615607, + "time_sec": 32.51700782775879 + }, + { + "epoch": 24, + "train_loss": 1.4762262714385985, + "train_acc": 0.58122, + "test_loss": 2.0623104194641115, + "test_acc": 0.4808, + "lyapunov": null, + "grad_norm": 1.058223580636924, + "grad_max_sv": 0.422040344029665, + "grad_min_sv": 1.999172487554546e-08, + "grad_condition": 26445060.697539486, + "lr": 0.0009381533400219313, + "time_sec": 32.54439735412598 + }, + { + "epoch": 25, + "train_loss": 1.4411011653900145, + "train_acc": 0.58896, + "test_loss": 2.168187129974365, + "test_acc": 0.4692, + "lyapunov": null, + "grad_norm": 1.0360388595339232, + "grad_max_sv": 0.4249138444662094, + "grad_min_sv": 1.99582824841546e-08, + "grad_condition": 246451377.91849524, + "lr": 0.0009330127018922189, + "time_sec": 32.548271894454956 + }, + { + "epoch": 26, + "train_loss": 1.4043142713928223, + "train_acc": 0.59902, + "test_loss": 2.0536590896606444, + "test_acc": 0.4891, + "lyapunov": null, + "grad_norm": 1.0113140938455152, + "grad_max_sv": 0.3988976672291756, + "grad_min_sv": 1.8759028042047988e-08, + "grad_condition": 37432251.439904764, + "lr": 0.000927682130080253, + "time_sec": 32.561890840530396 + }, + { + "epoch": 27, + "train_loss": 1.3714225146484376, + "train_acc": 0.60766, + "test_loss": 2.2935733531951903, + "test_acc": 0.4525, + "lyapunov": null, + "grad_norm": 1.0021764966836944, + "grad_max_sv": 0.3959275037050247, + "grad_min_sv": 1.8507436513881537e-08, + "grad_condition": 44956111.71393384, + "lr": 0.0009221639627510072, + "time_sec": 32.53670048713684 + }, + { + "epoch": 28, + "train_loss": 1.3370341487121582, + "train_acc": 0.61666, + "test_loss": 2.151699178314209, + "test_acc": 0.4715, + "lyapunov": null, + "grad_norm": 0.9794476786709188, + "grad_max_sv": 0.39209934026002885, + "grad_min_sv": 1.867815887374169e-08, + "grad_condition": 35054340.009755686, + "lr": 0.0009164606203550494, + "time_sec": 32.54069757461548 + }, + { + "epoch": 29, + "train_loss": 1.3072684922790527, + "train_acc": 0.62288, + "test_loss": 2.177260079193115, + "test_acc": 0.4723, + "lyapunov": null, + "grad_norm": 0.9630039914022892, + "grad_max_sv": 0.38177175372838973, + "grad_min_sv": 1.8039237006939324e-08, + "grad_condition": 32222597.95523299, + "lr": 0.0009105746045668516, + "time_sec": 32.513834953308105 + }, + { + "epoch": 30, + "train_loss": 1.2830923750686645, + "train_acc": 0.63006, + "test_loss": 2.2779099143981933, + "test_acc": 0.4655, + "lyapunov": null, + "grad_norm": 0.9518974286811641, + "grad_max_sv": 0.38100970312953, + "grad_min_sv": 1.788316939428658e-08, + "grad_condition": 99211564.21329594, + "lr": 0.0009045084971874733, + "time_sec": 32.5218071937561 + }, + { + "epoch": 31, + "train_loss": 1.244770231819153, + "train_acc": 0.6375, + "test_loss": 2.1691842304229736, + "test_acc": 0.4808, + "lyapunov": null, + "grad_norm": 0.9340551179231076, + "grad_max_sv": 0.36914008632302286, + "grad_min_sv": 1.7114106357074555e-08, + "grad_condition": 29377579.043874025, + "lr": 0.0008982649590120977, + "time_sec": 32.50562572479248 + }, + { + "epoch": 32, + "train_loss": 1.2236427535629273, + "train_acc": 0.64292, + "test_loss": 2.128678413200378, + "test_acc": 0.4897, + "lyapunov": null, + "grad_norm": 0.9308816117267062, + "grad_max_sv": 0.3699117600917816, + "grad_min_sv": 1.7350169867480502e-08, + "grad_condition": 29708594.41851766, + "lr": 0.0008918467286629196, + "time_sec": 32.53521537780762 + }, + { + "epoch": 33, + "train_loss": 1.1827713982772827, + "train_acc": 0.65544, + "test_loss": 2.1373632209777833, + "test_acc": 0.5017, + "lyapunov": null, + "grad_norm": 0.9081423627717244, + "grad_max_sv": 0.3551614835858345, + "grad_min_sv": 1.6811319347286718e-08, + "grad_condition": 306006053.9068912, + "lr": 0.0008852566213878943, + "time_sec": 32.57274842262268 + }, + { + "epoch": 34, + "train_loss": 1.1642235271072388, + "train_acc": 0.65892, + "test_loss": 2.1604542951583863, + "test_acc": 0.4885, + "lyapunov": null, + "grad_norm": 0.9090398412926194, + "grad_max_sv": 0.35307114869356154, + "grad_min_sv": 1.6331064042404696e-08, + "grad_condition": 75342806.75988543, + "lr": 0.000878497527825878, + "time_sec": 32.53737998008728 + }, + { + "epoch": 35, + "train_loss": 1.1387675298309325, + "train_acc": 0.6667, + "test_loss": 2.1841554317474365, + "test_acc": 0.4875, + "lyapunov": null, + "grad_norm": 0.8905589789768327, + "grad_max_sv": 0.34435485303401947, + "grad_min_sv": 1.63940996583678e-08, + "grad_condition": 31858813.754447132, + "lr": 0.000871572412738697, + "time_sec": 32.53908848762512 + }, + { + "epoch": 36, + "train_loss": 1.112549288597107, + "train_acc": 0.6711, + "test_loss": 2.1255173376083376, + "test_acc": 0.4972, + "lyapunov": null, + "grad_norm": 0.888003290237527, + "grad_max_sv": 0.3482539109885693, + "grad_min_sv": 1.6459002988994388e-08, + "grad_condition": 106865396.27418132, + "lr": 0.0008644843137107055, + "time_sec": 32.52313590049744 + }, + { + "epoch": 37, + "train_loss": 1.0873542625236512, + "train_acc": 0.6763, + "test_loss": 2.098120114517212, + "test_acc": 0.5037, + "lyapunov": null, + "grad_norm": 0.8726919198419328, + "grad_max_sv": 0.34534994438290595, + "grad_min_sv": 1.612610790874269e-08, + "grad_condition": 39535112.979377694, + "lr": 0.0008572363398164014, + "time_sec": 32.54535698890686 + }, + { + "epoch": 38, + "train_loss": 1.0494415398788453, + "train_acc": 0.6891, + "test_loss": 2.1943147089004515, + "test_acc": 0.4975, + "lyapunov": null, + "grad_norm": 0.867993871250333, + "grad_max_sv": 0.3474706750363111, + "grad_min_sv": 1.6011337518329062e-08, + "grad_condition": 53782583.5534817, + "lr": 0.0008498316702566826, + "time_sec": 32.5124135017395 + }, + { + "epoch": 39, + "train_loss": 1.0355109643936158, + "train_acc": 0.69258, + "test_loss": 2.145528812789917, + "test_acc": 0.5015, + "lyapunov": null, + "grad_norm": 0.8555269464693561, + "grad_max_sv": 0.3424593433737755, + "grad_min_sv": 1.5947514456216004e-08, + "grad_condition": 33880811.6761477, + "lr": 0.0008422735529643442, + "time_sec": 32.515289545059204 + }, + { + "epoch": 40, + "train_loss": 1.0165967633247375, + "train_acc": 0.69846, + "test_loss": 2.175649596786499, + "test_acc": 0.5019, + "lyapunov": null, + "grad_norm": 0.8376771010486573, + "grad_max_sv": 0.3215891238301992, + "grad_min_sv": 1.5263620372837905e-08, + "grad_condition": 85010303.02194887, + "lr": 0.0008345653031794289, + "time_sec": 32.54841685295105 + }, + { + "epoch": 41, + "train_loss": 0.9950240628051757, + "train_acc": 0.70056, + "test_loss": 2.2173702697753908, + "test_acc": 0.5002, + "lyapunov": null, + "grad_norm": 0.8305965994955763, + "grad_max_sv": 0.3256087012588978, + "grad_min_sv": 1.5127571602671642e-08, + "grad_condition": 137474843.23784915, + "lr": 0.0008267103019950526, + "time_sec": 32.57811760902405 + }, + { + "epoch": 42, + "train_loss": 0.9775527880096435, + "train_acc": 0.70474, + "test_loss": 2.1698096994400022, + "test_acc": 0.5034, + "lyapunov": null, + "grad_norm": 0.8275704405899154, + "grad_max_sv": 0.3146204575896263, + "grad_min_sv": 1.4814988586950295e-08, + "grad_condition": 63410761.569527075, + "lr": 0.0008187119948743447, + "time_sec": 32.52773356437683 + }, + { + "epoch": 43, + "train_loss": 0.9515444298553467, + "train_acc": 0.7129, + "test_loss": 2.284324015045166, + "test_acc": 0.4919, + "lyapunov": null, + "grad_norm": 0.8256111526505941, + "grad_max_sv": 0.3248642094433308, + "grad_min_sv": 1.5077374472538542e-08, + "grad_condition": 120729497.4258703, + "lr": 0.000810573890139155, + "time_sec": 32.54343295097351 + }, + { + "epoch": 44, + "train_loss": 0.932089543800354, + "train_acc": 0.71794, + "test_loss": 2.347640796661377, + "test_acc": 0.4952, + "lyapunov": null, + "grad_norm": 0.8221551718061502, + "grad_max_sv": 0.3309069760143757, + "grad_min_sv": 1.531730618592464e-08, + "grad_condition": 43621618.830579884, + "lr": 0.0008022995574311873, + "time_sec": 32.540892362594604 + }, + { + "epoch": 45, + "train_loss": 0.9129991551589965, + "train_acc": 0.72538, + "test_loss": 2.3257674713134766, + "test_acc": 0.4986, + "lyapunov": null, + "grad_norm": 0.7995996108758867, + "grad_max_sv": 0.3120440490543842, + "grad_min_sv": 1.4420761846635487e-08, + "grad_condition": 274280638.56129825, + "lr": 0.0007938926261462363, + "time_sec": 32.56113886833191 + }, + { + "epoch": 46, + "train_loss": 0.8904787008476257, + "train_acc": 0.72998, + "test_loss": 2.3609681858062745, + "test_acc": 0.4974, + "lyapunov": null, + "grad_norm": 0.8006123840154866, + "grad_max_sv": 0.3184788428246975, + "grad_min_sv": 1.479064429370236e-08, + "grad_condition": 82532558.79183207, + "lr": 0.0007853567838422158, + "time_sec": 32.55464220046997 + }, + { + "epoch": 47, + "train_loss": 0.8791391965866089, + "train_acc": 0.73118, + "test_loss": 2.3235943592071533, + "test_acc": 0.5011, + "lyapunov": null, + "grad_norm": 0.7941774318900212, + "grad_max_sv": 0.31571171544492244, + "grad_min_sv": 1.4471256026826751e-08, + "grad_condition": 31975325.9529503, + "lr": 0.0007766957746216719, + "time_sec": 32.531195402145386 + }, + { + "epoch": 48, + "train_loss": 0.8462872068786621, + "train_acc": 0.74152, + "test_loss": 2.2702061416625976, + "test_acc": 0.5127, + "lyapunov": null, + "grad_norm": 0.7790110299262845, + "grad_max_sv": 0.31310132145881653, + "grad_min_sv": 1.4011670552635525e-08, + "grad_condition": 69070584.021189, + "lr": 0.0007679133974894982, + "time_sec": 32.550259828567505 + }, + { + "epoch": 49, + "train_loss": 0.8320243933296204, + "train_acc": 0.74518, + "test_loss": 2.3156275840759277, + "test_acc": 0.5109, + "lyapunov": null, + "grad_norm": 0.7829430590909012, + "grad_max_sv": 0.3146356470882893, + "grad_min_sv": 1.4089187793265428e-08, + "grad_condition": 233080772.68985993, + "lr": 0.000759013504686565, + "time_sec": 32.55922746658325 + }, + { + "epoch": 50, + "train_loss": 0.8245939933776856, + "train_acc": 0.74696, + "test_loss": 2.265205925178528, + "test_acc": 0.5189, + "lyapunov": null, + "grad_norm": 0.7672411895816676, + "grad_max_sv": 0.3079528912901878, + "grad_min_sv": 1.4155918948415697e-08, + "grad_condition": 343933636.95908105, + "lr": 0.0007499999999999998, + "time_sec": 32.53189420700073 + }, + { + "epoch": 51, + "train_loss": 0.7894153217315674, + "train_acc": 0.7565, + "test_loss": 2.3188957998275757, + "test_acc": 0.5074, + "lyapunov": null, + "grad_norm": 0.7639570769617415, + "grad_max_sv": 0.30883320979774, + "grad_min_sv": 1.3941536785438969e-08, + "grad_condition": 58007269.384739935, + "lr": 0.0007408768370508575, + "time_sec": 32.537278175354004 + }, + { + "epoch": 52, + "train_loss": 0.7845482840156556, + "train_acc": 0.75934, + "test_loss": 2.3104104595184327, + "test_acc": 0.5194, + "lyapunov": null, + "grad_norm": 0.758426806815466, + "grad_max_sv": 0.3017439119517803, + "grad_min_sv": 1.3761643591347906e-08, + "grad_condition": 64403689.199135736, + "lr": 0.0007316480175599307, + "time_sec": 32.567556858062744 + }, + { + "epoch": 53, + "train_loss": 0.7678517831802368, + "train_acc": 0.76302, + "test_loss": 2.2519205989837645, + "test_acc": 0.5187, + "lyapunov": null, + "grad_norm": 0.7525741359749043, + "grad_max_sv": 0.3043193075805902, + "grad_min_sv": 1.4057699764414428e-08, + "grad_condition": 603144630.5655534, + "lr": 0.0007223175895924635, + "time_sec": 32.54323744773865 + }, + { + "epoch": 54, + "train_loss": 0.7441292473983765, + "train_acc": 0.77002, + "test_loss": 2.321862815093994, + "test_acc": 0.5195, + "lyapunov": null, + "grad_norm": 0.7385816998340842, + "grad_max_sv": 0.2950198922306299, + "grad_min_sv": 1.3242542280800241e-08, + "grad_condition": 47788499.822593346, + "lr": 0.0007128896457825361, + "time_sec": 32.546525955200195 + }, + { + "epoch": 55, + "train_loss": 0.7237247510147095, + "train_acc": 0.77684, + "test_loss": 2.443076996231079, + "test_acc": 0.5105, + "lyapunov": null, + "grad_norm": 0.7236745133446179, + "grad_max_sv": 0.2926642097532749, + "grad_min_sv": 1.3385297276298502e-08, + "grad_condition": 180910825.71869814, + "lr": 0.0007033683215378998, + "time_sec": 32.5228271484375 + }, + { + "epoch": 56, + "train_loss": 0.714698567867279, + "train_acc": 0.77636, + "test_loss": 2.4090746616363528, + "test_acc": 0.5073, + "lyapunov": null, + "grad_norm": 0.7344734039694485, + "grad_max_sv": 0.2945756554603577, + "grad_min_sv": 1.3372697777163517e-08, + "grad_condition": 191394798.44401574, + "lr": 0.0006937577932260512, + "time_sec": 32.53384256362915 + }, + { + "epoch": 57, + "train_loss": 0.701706619796753, + "train_acc": 0.7817, + "test_loss": 2.4898623809814455, + "test_acc": 0.5061, + "lyapunov": null, + "grad_norm": 0.7242445850699529, + "grad_max_sv": 0.29475805573165414, + "grad_min_sv": 1.3282284945341504e-08, + "grad_condition": 139859409.2511898, + "lr": 0.0006840622763423388, + "time_sec": 32.55175542831421 + }, + { + "epoch": 58, + "train_loss": 0.683065224571228, + "train_acc": 0.78578, + "test_loss": 2.40970786857605, + "test_acc": 0.5161, + "lyapunov": null, + "grad_norm": 0.7133541403038509, + "grad_max_sv": 0.28903776630759237, + "grad_min_sv": 1.2887932776279449e-08, + "grad_condition": 217157653.7481032, + "lr": 0.0006742860236609073, + "time_sec": 32.54868960380554 + }, + { + "epoch": 59, + "train_loss": 0.658868628025055, + "train_acc": 0.79364, + "test_loss": 2.4330540966033936, + "test_acc": 0.512, + "lyapunov": null, + "grad_norm": 0.7071819631685043, + "grad_max_sv": 0.28152512572705746, + "grad_min_sv": 1.2446668359172852e-08, + "grad_condition": 53600070.902513206, + "lr": 0.0006644333233692913, + "time_sec": 32.54175162315369 + }, + { + "epoch": 60, + "train_loss": 0.6470879960250855, + "train_acc": 0.7992, + "test_loss": 2.4595475191116334, + "test_acc": 0.5146, + "lyapunov": null, + "grad_norm": 0.7011871838547499, + "grad_max_sv": 0.2868143357336521, + "grad_min_sv": 1.2911446190672082e-08, + "grad_condition": 55527160.04901831, + "lr": 0.0006545084971874734, + "time_sec": 32.56122612953186 + }, + { + "epoch": 61, + "train_loss": 0.6354982923126221, + "train_acc": 0.8022, + "test_loss": 2.560771873855591, + "test_acc": 0.5081, + "lyapunov": null, + "grad_norm": 0.6984352092808961, + "grad_max_sv": 0.27748913019895555, + "grad_min_sv": 1.239017393675143e-08, + "grad_condition": 1468960068.2366312, + "lr": 0.0006445158984722354, + "time_sec": 32.540645360946655 + }, + { + "epoch": 62, + "train_loss": 0.616827200679779, + "train_acc": 0.80592, + "test_loss": 2.4981941551208497, + "test_acc": 0.5168, + "lyapunov": null, + "grad_norm": 0.693034220707574, + "grad_max_sv": 0.27250286303460597, + "grad_min_sv": 1.2243235950146896e-08, + "grad_condition": 346615785.32809913, + "lr": 0.0006344599103076324, + "time_sec": 32.55153822898865 + }, + { + "epoch": 63, + "train_loss": 0.6024868152618408, + "train_acc": 0.81298, + "test_loss": 2.4579322681427, + "test_acc": 0.5197, + "lyapunov": null, + "grad_norm": 0.6859865381743082, + "grad_max_sv": 0.2814170353114605, + "grad_min_sv": 1.2453174788248922e-08, + "grad_condition": 71845159.85056672, + "lr": 0.0006243449435824269, + "time_sec": 32.56982493400574 + }, + { + "epoch": 64, + "train_loss": 0.5879015256500244, + "train_acc": 0.81586, + "test_loss": 2.537950067138672, + "test_acc": 0.5154, + "lyapunov": null, + "grad_norm": 0.6770827367834238, + "grad_max_sv": 0.2760712094604969, + "grad_min_sv": 1.2060245246827555e-08, + "grad_condition": 242477478.97334537, + "lr": 0.0006141754350553275, + "time_sec": 32.555153369903564 + }, + { + "epoch": 65, + "train_loss": 0.5838800269126893, + "train_acc": 0.8159, + "test_loss": 2.5163471378326414, + "test_acc": 0.5163, + "lyapunov": null, + "grad_norm": 0.6785242818211942, + "grad_max_sv": 0.27877960838377475, + "grad_min_sv": 1.2008392599738293e-08, + "grad_condition": 40446768.53559095, + "lr": 0.0006039558454088793, + "time_sec": 32.543633460998535 + }, + { + "epoch": 66, + "train_loss": 0.577277703781128, + "train_acc": 0.81916, + "test_loss": 2.4027950271606446, + "test_acc": 0.53, + "lyapunov": null, + "grad_norm": 0.6749900226760103, + "grad_max_sv": 0.2747200779616833, + "grad_min_sv": 1.2062701042203639e-08, + "grad_condition": 32367967.36566303, + "lr": 0.000593690657292862, + "time_sec": 32.588738441467285 + }, + { + "epoch": 67, + "train_loss": 0.5638121318435669, + "train_acc": 0.82124, + "test_loss": 2.5093120254516603, + "test_acc": 0.5143, + "lyapunov": null, + "grad_norm": 0.6756248898956171, + "grad_max_sv": 0.2708110649138689, + "grad_min_sv": 1.1944636340091575e-08, + "grad_condition": 75752957.05132133, + "lr": 0.0005833843733580507, + "time_sec": 32.55442571640015 + }, + { + "epoch": 68, + "train_loss": 0.5368257042694092, + "train_acc": 0.82994, + "test_loss": 2.589290417480469, + "test_acc": 0.5118, + "lyapunov": null, + "grad_norm": 0.6598937386660447, + "grad_max_sv": 0.261281393840909, + "grad_min_sv": 1.1725735699075201e-08, + "grad_condition": 169472540.689181, + "lr": 0.0005730415142812054, + "time_sec": 32.52515912055969 + }, + { + "epoch": 69, + "train_loss": 0.5388207937431335, + "train_acc": 0.82916, + "test_loss": 2.563585631942749, + "test_acc": 0.5202, + "lyapunov": null, + "grad_norm": 0.6573002747793157, + "grad_max_sv": 0.2725424364209175, + "grad_min_sv": 1.2047364596375065e-08, + "grad_condition": 444347034.8797019, + "lr": 0.0005626666167821517, + "time_sec": 32.586650133132935 + }, + { + "epoch": 70, + "train_loss": 0.513670022392273, + "train_acc": 0.83646, + "test_loss": 2.5132864803314208, + "test_acc": 0.5236, + "lyapunov": null, + "grad_norm": 0.6431550925781278, + "grad_max_sv": 0.27632256150245665, + "grad_min_sv": 1.1758005316261921e-08, + "grad_condition": 110006576.71894233, + "lr": 0.0005522642316338265, + "time_sec": 32.577406883239746 + }, + { + "epoch": 71, + "train_loss": 0.5131872615623474, + "train_acc": 0.83644, + "test_loss": 2.5521981464385988, + "test_acc": 0.5241, + "lyapunov": null, + "grad_norm": 0.6453851866055248, + "grad_max_sv": 0.2702975060790777, + "grad_min_sv": 1.1546318178521155e-08, + "grad_condition": 1790962873.9237118, + "lr": 0.0005418389216661573, + "time_sec": 32.55422234535217 + }, + { + "epoch": 72, + "train_loss": 0.5012564387702942, + "train_acc": 0.83844, + "test_loss": 2.6108884536743164, + "test_acc": 0.5145, + "lyapunov": null, + "grad_norm": 0.641535680347223, + "grad_max_sv": 0.263116517290473, + "grad_min_sv": 1.133218473052533e-08, + "grad_condition": 97098064.25597176, + "lr": 0.0005313952597646563, + "time_sec": 32.55845665931702 + }, + { + "epoch": 73, + "train_loss": 0.4879260776901245, + "train_acc": 0.84454, + "test_loss": 2.5678638622283936, + "test_acc": 0.5233, + "lyapunov": null, + "grad_norm": 0.6388994964495804, + "grad_max_sv": 0.26682182475924493, + "grad_min_sv": 1.1433825197054715e-08, + "grad_condition": 115135062.42170426, + "lr": 0.0005209378268645994, + "time_sec": 32.551618576049805 + }, + { + "epoch": 74, + "train_loss": 0.47297955097198485, + "train_acc": 0.84948, + "test_loss": 2.5823446689605714, + "test_acc": 0.5234, + "lyapunov": null, + "grad_norm": 0.625079210207, + "grad_max_sv": 0.2719780694693327, + "grad_min_sv": 1.1374299929472944e-08, + "grad_condition": 1819913042.7712326, + "lr": 0.0005104712099416781, + "time_sec": 32.56480145454407 + }, + { + "epoch": 75, + "train_loss": 0.46812099950790403, + "train_acc": 0.85034, + "test_loss": 2.6528441036224364, + "test_acc": 0.5183, + "lyapunov": null, + "grad_norm": 0.6231186463016253, + "grad_max_sv": 0.25995977483689786, + "grad_min_sv": 1.1211473876398311e-08, + "grad_condition": 1535902619.2174218, + "lr": 0.0004999999999999996, + "time_sec": 32.557714223861694 + }, + { + "epoch": 76, + "train_loss": 0.4614518400478363, + "train_acc": 0.85322, + "test_loss": 2.722090990829468, + "test_acc": 0.5123, + "lyapunov": null, + "grad_norm": 0.6189058016152714, + "grad_max_sv": 0.26107010766863825, + "grad_min_sv": 1.121603938145782e-08, + "grad_condition": 156852744.39388055, + "lr": 0.0004895287900583212, + "time_sec": 32.57050681114197 + }, + { + "epoch": 77, + "train_loss": 0.4433125625228882, + "train_acc": 0.85798, + "test_loss": 2.683233337402344, + "test_acc": 0.5176, + "lyapunov": null, + "grad_norm": 0.6092718322680238, + "grad_max_sv": 0.26060184724628926, + "grad_min_sv": 1.0807431153128655e-08, + "grad_condition": 94720998.74768767, + "lr": 0.0004790621731353997, + "time_sec": 32.566901445388794 + }, + { + "epoch": 78, + "train_loss": 0.43715192074775694, + "train_acc": 0.85892, + "test_loss": 2.8140779514312744, + "test_acc": 0.5126, + "lyapunov": null, + "grad_norm": 0.6093756219980636, + "grad_max_sv": 0.25670241452753545, + "grad_min_sv": 1.0911793120807477e-08, + "grad_condition": 96322404.6795116, + "lr": 0.000468604740235343, + "time_sec": 32.57596945762634 + }, + { + "epoch": 79, + "train_loss": 0.4312542087650299, + "train_acc": 0.86156, + "test_loss": 2.688641630935669, + "test_acc": 0.5206, + "lyapunov": null, + "grad_norm": 0.6073166568575497, + "grad_max_sv": 0.25702770203351977, + "grad_min_sv": 1.0958630206232833e-08, + "grad_condition": 250707729.3021683, + "lr": 0.00045816107833384175, + "time_sec": 32.56645917892456 + }, + { + "epoch": 80, + "train_loss": 0.4118970446872711, + "train_acc": 0.86894, + "test_loss": 2.5730819744110107, + "test_acc": 0.5337, + "lyapunov": null, + "grad_norm": 0.5969485138195714, + "grad_max_sv": 0.244117346778512, + "grad_min_sv": 1.0501346974639558e-08, + "grad_condition": 268969770.6987619, + "lr": 0.0004477357683661729, + "time_sec": 32.55648875236511 + }, + { + "epoch": 81, + "train_loss": 0.40473406177520754, + "train_acc": 0.8705, + "test_loss": 2.768511548614502, + "test_acc": 0.5175, + "lyapunov": null, + "grad_norm": 0.5946234097363065, + "grad_max_sv": 0.25840370543301105, + "grad_min_sv": 1.0675248116140834e-08, + "grad_condition": 1433985790.1272235, + "lr": 0.00043733338321784746, + "time_sec": 32.56024956703186 + }, + { + "epoch": 82, + "train_loss": 0.39231891386032103, + "train_acc": 0.87338, + "test_loss": 2.6643074661254884, + "test_acc": 0.5309, + "lyapunov": null, + "grad_norm": 0.5900838298376547, + "grad_max_sv": 0.2576967000961304, + "grad_min_sv": 1.0706646371176284e-08, + "grad_condition": 410914403.2919628, + "lr": 0.0004269584857187939, + "time_sec": 32.52906775474548 + }, + { + "epoch": 83, + "train_loss": 0.38102890924453736, + "train_acc": 0.87712, + "test_loss": 2.746966218185425, + "test_acc": 0.5212, + "lyapunov": null, + "grad_norm": 0.5804702132437124, + "grad_max_sv": 0.24822848811745643, + "grad_min_sv": 1.0360890155157107e-08, + "grad_condition": 348582315.4871143, + "lr": 0.0004166156266419484, + "time_sec": 32.575536489486694 + }, + { + "epoch": 84, + "train_loss": 0.37733193599700926, + "train_acc": 0.87564, + "test_loss": 2.7224476852416992, + "test_acc": 0.5248, + "lyapunov": null, + "grad_norm": 0.5836201032332736, + "grad_max_sv": 0.2583346772938967, + "grad_min_sv": 1.070241965142084e-08, + "grad_condition": 801944412.6941237, + "lr": 0.0004063093427071373, + "time_sec": 32.56175231933594 + }, + { + "epoch": 85, + "train_loss": 0.3640913159942627, + "train_acc": 0.88294, + "test_loss": 2.758930994796753, + "test_acc": 0.527, + "lyapunov": null, + "grad_norm": 0.5660514135717984, + "grad_max_sv": 0.24142069853842257, + "grad_min_sv": 1.0190759017463663e-08, + "grad_condition": 1202285628.3006241, + "lr": 0.0003960441545911199, + "time_sec": 32.5456702709198 + }, + { + "epoch": 86, + "train_loss": 0.3523704248428345, + "train_acc": 0.88546, + "test_loss": 2.687824221420288, + "test_acc": 0.5297, + "lyapunov": null, + "grad_norm": 0.5608649440048047, + "grad_max_sv": 0.2463057145476341, + "grad_min_sv": 1.0161699044372586e-08, + "grad_condition": 82146942.52646025, + "lr": 0.0003858245649446718, + "time_sec": 32.53918766975403 + }, + { + "epoch": 87, + "train_loss": 0.35160433542251585, + "train_acc": 0.8864, + "test_loss": 2.7660649963378905, + "test_acc": 0.5254, + "lyapunov": null, + "grad_norm": 0.5647074650828036, + "grad_max_sv": 0.2515272866934538, + "grad_min_sv": 1.0253057474568505e-08, + "grad_condition": 106198876.53293958, + "lr": 0.00037565505641757235, + "time_sec": 32.57175302505493 + }, + { + "epoch": 88, + "train_loss": 0.34372631204605103, + "train_acc": 0.8903, + "test_loss": 2.7611888675689698, + "test_acc": 0.5293, + "lyapunov": null, + "grad_norm": 0.5539379162644149, + "grad_max_sv": 0.24760488532483577, + "grad_min_sv": 1.0237206365037652e-08, + "grad_condition": 268378740.40175262, + "lr": 0.00036554008969236695, + "time_sec": 32.61865496635437 + }, + { + "epoch": 89, + "train_loss": 0.3349831074714661, + "train_acc": 0.89124, + "test_loss": 2.852033778381348, + "test_acc": 0.5246, + "lyapunov": null, + "grad_norm": 0.5543234221756905, + "grad_max_sv": 0.2524993114173412, + "grad_min_sv": 1.0068119724645358e-08, + "grad_condition": 881390959.6058903, + "lr": 0.0003554841015277638, + "time_sec": 32.56809163093567 + }, + { + "epoch": 90, + "train_loss": 0.3192900574111939, + "train_acc": 0.8978, + "test_loss": 2.8204364456176756, + "test_acc": 0.5277, + "lyapunov": null, + "grad_norm": 0.539170960935015, + "grad_max_sv": 0.23871867544949055, + "grad_min_sv": 9.515663445397448e-09, + "grad_condition": 82474731.67522079, + "lr": 0.000345491502812526, + "time_sec": 32.549994468688965 + }, + { + "epoch": 91, + "train_loss": 0.3178176963233948, + "train_acc": 0.8972, + "test_loss": 2.860647204208374, + "test_acc": 0.527, + "lyapunov": null, + "grad_norm": 0.5335824951523024, + "grad_max_sv": 0.24524600319564344, + "grad_min_sv": 9.955028348364314e-09, + "grad_condition": 189160981.0331933, + "lr": 0.0003355666766307081, + "time_sec": 32.5523841381073 + }, + { + "epoch": 92, + "train_loss": 0.30979349758148195, + "train_acc": 0.90114, + "test_loss": 2.792916820526123, + "test_acc": 0.5334, + "lyapunov": null, + "grad_norm": 0.536022212715003, + "grad_max_sv": 0.2439738731831312, + "grad_min_sv": 9.802463784257254e-09, + "grad_condition": 392308745.7452389, + "lr": 0.00032571397633909225, + "time_sec": 32.534363746643066 + }, + { + "epoch": 93, + "train_loss": 0.29998136956214905, + "train_acc": 0.90294, + "test_loss": 2.8000693214416503, + "test_acc": 0.5371, + "lyapunov": null, + "grad_norm": 0.526141212631399, + "grad_max_sv": 0.2302109245210886, + "grad_min_sv": 9.57197021107109e-09, + "grad_condition": 990380151.1551683, + "lr": 0.00031593772365766094, + "time_sec": 32.5524480342865 + }, + { + "epoch": 94, + "train_loss": 0.2947264695549011, + "train_acc": 0.90426, + "test_loss": 2.8803435722351076, + "test_acc": 0.5269, + "lyapunov": null, + "grad_norm": 0.5244681069551711, + "grad_max_sv": 0.2267349176108837, + "grad_min_sv": 9.39341851901969e-09, + "grad_condition": 350481322.0522052, + "lr": 0.0003062422067739483, + "time_sec": 32.55219221115112 + }, + { + "epoch": 95, + "train_loss": 0.2886659768772125, + "train_acc": 0.90604, + "test_loss": 2.9347433059692385, + "test_acc": 0.5258, + "lyapunov": null, + "grad_norm": 0.5214353080258765, + "grad_max_sv": 0.2345777176320553, + "grad_min_sv": 9.640483901365155e-09, + "grad_condition": 720854220.3900421, + "lr": 0.00029663167846209965, + "time_sec": 32.557831048965454 + }, + { + "epoch": 96, + "train_loss": 0.27894444655418393, + "train_acc": 0.90976, + "test_loss": 2.9434762027740478, + "test_acc": 0.5285, + "lyapunov": null, + "grad_norm": 0.5097107775143732, + "grad_max_sv": 0.2310101106762886, + "grad_min_sv": 9.385787539729386e-09, + "grad_condition": 526341011.33289146, + "lr": 0.00028711035421746345, + "time_sec": 32.542834997177124 + }, + { + "epoch": 97, + "train_loss": 0.27359901790618896, + "train_acc": 0.9111, + "test_loss": 2.8853713760375976, + "test_acc": 0.5255, + "lyapunov": null, + "grad_norm": 0.5155496576192513, + "grad_max_sv": 0.2377286858856678, + "grad_min_sv": 9.5194454921327e-09, + "grad_condition": 3878284949.6481657, + "lr": 0.00027768241040753615, + "time_sec": 32.55704665184021 + }, + { + "epoch": 98, + "train_loss": 0.27738544737815857, + "train_acc": 0.90926, + "test_loss": 2.9445196617126466, + "test_acc": 0.5299, + "lyapunov": null, + "grad_norm": 0.5179989785468311, + "grad_max_sv": 0.22777627930045127, + "grad_min_sv": 9.246968936957659e-09, + "grad_condition": 960537397.7931906, + "lr": 0.00026835198244006903, + "time_sec": 32.64381694793701 + }, + { + "epoch": 99, + "train_loss": 0.26050106247901916, + "train_acc": 0.91634, + "test_loss": 2.9518425941467283, + "test_acc": 0.5252, + "lyapunov": null, + "grad_norm": 0.5021876835039283, + "grad_max_sv": 0.23347571939229966, + "grad_min_sv": 9.252318778490976e-09, + "grad_condition": 358829344.2311903, + "lr": 0.0002591231629491421, + "time_sec": 32.63876390457153 + }, + { + "epoch": 100, + "train_loss": 0.258883156375885, + "train_acc": 0.91784, + "test_loss": 2.9451918140411375, + "test_acc": 0.5271, + "lyapunov": null, + "grad_norm": 0.49558170482534186, + "grad_max_sv": 0.22932566255331038, + "grad_min_sv": 8.960364150656374e-09, + "grad_condition": 133402370.68097286, + "lr": 0.0002499999999999997, + "time_sec": 32.63405442237854 + }, + { + "epoch": 101, + "train_loss": 0.2544194602584839, + "train_acc": 0.9178, + "test_loss": 2.931644026184082, + "test_acc": 0.5324, + "lyapunov": null, + "grad_norm": 0.49432462184183484, + "grad_max_sv": 0.23283861316740512, + "grad_min_sv": 9.245908496593666e-09, + "grad_condition": 394496802.8033221, + "lr": 0.00024098649531343477, + "time_sec": 32.61276388168335 + }, + { + "epoch": 102, + "train_loss": 0.2480203760242462, + "train_acc": 0.92056, + "test_loss": 2.8568203742980955, + "test_acc": 0.5384, + "lyapunov": null, + "grad_norm": 0.49038134461440325, + "grad_max_sv": 0.21357116661965847, + "grad_min_sv": 8.517364178338947e-09, + "grad_condition": 517553648.95562804, + "lr": 0.0002320866025105016, + "time_sec": 32.561208724975586 + }, + { + "epoch": 103, + "train_loss": 0.24091191486358643, + "train_acc": 0.92288, + "test_loss": 2.921445244216919, + "test_acc": 0.539, + "lyapunov": null, + "grad_norm": 0.48403203094337405, + "grad_max_sv": 0.2229804780334234, + "grad_min_sv": 8.76879201030037e-09, + "grad_condition": 395225985.76028645, + "lr": 0.0002233042253783278, + "time_sec": 32.58884024620056 + }, + { + "epoch": 104, + "train_loss": 0.2340097396659851, + "train_acc": 0.92426, + "test_loss": 2.952641244506836, + "test_acc": 0.5359, + "lyapunov": null, + "grad_norm": 0.47933424227822113, + "grad_max_sv": 0.21846036985516548, + "grad_min_sv": 8.535758917998377e-09, + "grad_condition": 633016056.7145557, + "lr": 0.000214643216157784, + "time_sec": 32.56481146812439 + }, + { + "epoch": 105, + "train_loss": 0.2301298531961441, + "train_acc": 0.92618, + "test_loss": 3.0041401138305663, + "test_acc": 0.5291, + "lyapunov": null, + "grad_norm": 0.4740683813989447, + "grad_max_sv": 0.22231761552393436, + "grad_min_sv": 8.433698867145923e-09, + "grad_condition": 3779496448.19964, + "lr": 0.00020610737385376332, + "time_sec": 32.58962845802307 + }, + { + "epoch": 106, + "train_loss": 0.23071280053138732, + "train_acc": 0.92596, + "test_loss": 2.902844191741943, + "test_acc": 0.5388, + "lyapunov": null, + "grad_norm": 0.4741615782059369, + "grad_max_sv": 0.22535606250166892, + "grad_min_sv": 8.869640872113949e-09, + "grad_condition": 162288203.3742172, + "lr": 0.00019770044256881242, + "time_sec": 32.57167601585388 + }, + { + "epoch": 107, + "train_loss": 0.22119897150993348, + "train_acc": 0.92908, + "test_loss": 2.9124989013671874, + "test_acc": 0.5401, + "lyapunov": null, + "grad_norm": 0.4665652562574251, + "grad_max_sv": 0.22006149925291538, + "grad_min_sv": 8.667695651325135e-09, + "grad_condition": 151185833.18543836, + "lr": 0.0001894261098608447, + "time_sec": 32.57570242881775 + }, + { + "epoch": 108, + "train_loss": 0.2127019773054123, + "train_acc": 0.93066, + "test_loss": 2.880406095504761, + "test_acc": 0.5451, + "lyapunov": null, + "grad_norm": 0.4590032433316164, + "grad_max_sv": 0.2255195803940296, + "grad_min_sv": 9.011924857207053e-09, + "grad_condition": 814863477.0120376, + "lr": 0.000181288005125655, + "time_sec": 32.57649230957031 + }, + { + "epoch": 109, + "train_loss": 0.21624571283340455, + "train_acc": 0.9307, + "test_loss": 2.967872815322876, + "test_acc": 0.5365, + "lyapunov": null, + "grad_norm": 0.46217449604521815, + "grad_max_sv": 0.22467305175960064, + "grad_min_sv": 8.434571406850528e-09, + "grad_condition": 269913512.95570815, + "lr": 0.0001732896980049473, + "time_sec": 32.688621520996094 + }, + { + "epoch": 110, + "train_loss": 0.21068411350250243, + "train_acc": 0.93312, + "test_loss": 2.9756517448425295, + "test_acc": 0.5417, + "lyapunov": null, + "grad_norm": 0.4560381046604994, + "grad_max_sv": 0.2259811393916607, + "grad_min_sv": 8.584292448838432e-09, + "grad_condition": 247618387.92470437, + "lr": 0.00016543469682057076, + "time_sec": 32.61171579360962 + }, + { + "epoch": 111, + "train_loss": 0.20692597856521605, + "train_acc": 0.93424, + "test_loss": 2.9772758766174316, + "test_acc": 0.5401, + "lyapunov": null, + "grad_norm": 0.4537336475301346, + "grad_max_sv": 0.22052315585315227, + "grad_min_sv": 8.457724332781163e-09, + "grad_condition": 209643026.63441467, + "lr": 0.00015772644703565552, + "time_sec": 32.74080443382263 + }, + { + "epoch": 112, + "train_loss": 0.19982836018562317, + "train_acc": 0.93464, + "test_loss": 2.9877874111175537, + "test_acc": 0.5374, + "lyapunov": null, + "grad_norm": 0.4502543545130326, + "grad_max_sv": 0.21837349496781827, + "grad_min_sv": 8.382589276531572e-09, + "grad_condition": 190131911.5426251, + "lr": 0.00015016832974331713, + "time_sec": 32.61341071128845 + }, + { + "epoch": 113, + "train_loss": 0.19814088920593262, + "train_acc": 0.93678, + "test_loss": 3.0002061031341554, + "test_acc": 0.5372, + "lyapunov": null, + "grad_norm": 0.4475396172239947, + "grad_max_sv": 0.20673769935965539, + "grad_min_sv": 8.026082756024642e-09, + "grad_condition": 821010169.1913308, + "lr": 0.00014276366018359834, + "time_sec": 32.59360718727112 + }, + { + "epoch": 114, + "train_loss": 0.19049308371543885, + "train_acc": 0.93866, + "test_loss": 3.0283890243530274, + "test_acc": 0.5348, + "lyapunov": null, + "grad_norm": 0.4406442112045554, + "grad_max_sv": 0.21337005980312823, + "grad_min_sv": 8.07762924176763e-09, + "grad_condition": 667248655.8256387, + "lr": 0.00013551568628929425, + "time_sec": 32.58922576904297 + }, + { + "epoch": 115, + "train_loss": 0.18477844835281373, + "train_acc": 0.9408, + "test_loss": 2.979667907714844, + "test_acc": 0.538, + "lyapunov": null, + "grad_norm": 0.4338873325468347, + "grad_max_sv": 0.20222999081015586, + "grad_min_sv": 7.837895723032327e-09, + "grad_condition": 353434541.5259349, + "lr": 0.00012842758726130276, + "time_sec": 32.564921617507935 + }, + { + "epoch": 116, + "train_loss": 0.1859721972846985, + "train_acc": 0.93958, + "test_loss": 3.0662242183685304, + "test_acc": 0.5393, + "lyapunov": null, + "grad_norm": 0.436884545053576, + "grad_max_sv": 0.2168640349060297, + "grad_min_sv": 8.084562923496817e-09, + "grad_condition": 9428488559.560253, + "lr": 0.0001215024721741218, + "time_sec": 32.58519434928894 + }, + { + "epoch": 117, + "train_loss": 0.1802575473511219, + "train_acc": 0.9417, + "test_loss": 2.9826597057342528, + "test_acc": 0.5406, + "lyapunov": null, + "grad_norm": 0.42742032333852065, + "grad_max_sv": 0.2029492624104023, + "grad_min_sv": 7.847825115431771e-09, + "grad_condition": 1633268903.8573327, + "lr": 0.00011474337861210538, + "time_sec": 32.59012532234192 + }, + { + "epoch": 118, + "train_loss": 0.1823931166434288, + "train_acc": 0.94122, + "test_loss": 3.021400856399536, + "test_acc": 0.5422, + "lyapunov": null, + "grad_norm": 0.43215599630315543, + "grad_max_sv": 0.20591359175741672, + "grad_min_sv": 8.091189306514043e-09, + "grad_condition": 1689348599.2248282, + "lr": 0.00010815327133708009, + "time_sec": 32.5699896812439 + }, + { + "epoch": 119, + "train_loss": 0.17618105165958406, + "train_acc": 0.94406, + "test_loss": 3.000937869644165, + "test_acc": 0.5384, + "lyapunov": null, + "grad_norm": 0.4237935060578588, + "grad_max_sv": 0.20426486507058145, + "grad_min_sv": 7.760857991326308e-09, + "grad_condition": 126737655.38842675, + "lr": 0.00010173504098790182, + "time_sec": 32.55027508735657 + }, + { + "epoch": 120, + "train_loss": 0.17707269381523133, + "train_acc": 0.9433, + "test_loss": 3.0262657794952394, + "test_acc": 0.5423, + "lyapunov": null, + "grad_norm": 0.4262563994652449, + "grad_max_sv": 0.20858144126832484, + "grad_min_sv": 7.881152512198563e-09, + "grad_condition": 309539963.7397119, + "lr": 9.549150281252629e-05, + "time_sec": 32.56339383125305 + }, + { + "epoch": 121, + "train_loss": 0.17405739032268525, + "train_acc": 0.94424, + "test_loss": 3.066022943115234, + "test_acc": 0.5357, + "lyapunov": null, + "grad_norm": 0.4209047902648977, + "grad_max_sv": 0.208182505145669, + "grad_min_sv": 7.926291366831817e-09, + "grad_condition": 1481844022.098684, + "lr": 8.942539543314794e-05, + "time_sec": 32.55572319030762 + }, + { + "epoch": 122, + "train_loss": 0.1722756038427353, + "train_acc": 0.94372, + "test_loss": 2.9237624008178713, + "test_acc": 0.5501, + "lyapunov": null, + "grad_norm": 0.42147984672159844, + "grad_max_sv": 0.2044668670743704, + "grad_min_sv": 7.998760296129494e-09, + "grad_condition": 3201646284.8678083, + "lr": 8.353937964495024e-05, + "time_sec": 32.587459087371826 + }, + { + "epoch": 123, + "train_loss": 0.16738181323051451, + "train_acc": 0.9461, + "test_loss": 3.094963736343384, + "test_acc": 0.5344, + "lyapunov": null, + "grad_norm": 0.41903231386737333, + "grad_max_sv": 0.20275984779000283, + "grad_min_sv": 7.716203944308116e-09, + "grad_condition": 621612446.7663743, + "lr": 7.783603724899243e-05, + "time_sec": 32.584996461868286 + }, + { + "epoch": 124, + "train_loss": 0.16972655351161955, + "train_acc": 0.94622, + "test_loss": 3.0508366065979002, + "test_acc": 0.5412, + "lyapunov": null, + "grad_norm": 0.4200695555516322, + "grad_max_sv": 0.2031144231557846, + "grad_min_sv": 7.729263715579261e-09, + "grad_condition": 3217546779.4275866, + "lr": 7.231786991974666e-05, + "time_sec": 32.571866035461426 + }, + { + "epoch": 125, + "train_loss": 0.16630077925682069, + "train_acc": 0.94662, + "test_loss": 3.022613596343994, + "test_acc": 0.5392, + "lyapunov": null, + "grad_norm": 0.41758178037006294, + "grad_max_sv": 0.20861225724220275, + "grad_min_sv": 7.841609751726292e-09, + "grad_condition": 338985297.6185556, + "lr": 6.698729810778072e-05, + "time_sec": 32.5552761554718 + }, + { + "epoch": 126, + "train_loss": 0.15956245457649232, + "train_acc": 0.94972, + "test_loss": 3.0561922130584716, + "test_acc": 0.5398, + "lyapunov": null, + "grad_norm": 0.40878054032118605, + "grad_max_sv": 0.19741955921053886, + "grad_min_sv": 7.37841599316065e-09, + "grad_condition": 303424830.56526506, + "lr": 6.184665997806817e-05, + "time_sec": 32.54996180534363 + }, + { + "epoch": 127, + "train_loss": 0.15993500823020934, + "train_acc": 0.9489, + "test_loss": 3.026379292297363, + "test_acc": 0.5441, + "lyapunov": null, + "grad_norm": 0.40620434130290156, + "grad_max_sv": 0.20242127142846583, + "grad_min_sv": 7.71886330243679e-09, + "grad_condition": 171983926.969037, + "lr": 5.6898210384392595e-05, + "time_sec": 32.630762577056885 + }, + { + "epoch": 128, + "train_loss": 0.15721613983869553, + "train_acc": 0.94976, + "test_loss": 3.0123806335449217, + "test_acc": 0.543, + "lyapunov": null, + "grad_norm": 0.40771760456255063, + "grad_max_sv": 0.19883232600986958, + "grad_min_sv": 7.65689685735399e-09, + "grad_condition": 140452566.13847277, + "lr": 5.214411988029363e-05, + "time_sec": 32.56053280830383 + }, + { + "epoch": 129, + "train_loss": 0.15980393629074097, + "train_acc": 0.9494, + "test_loss": 3.0619752151489257, + "test_acc": 0.5385, + "lyapunov": null, + "grad_norm": 0.40680055079987404, + "grad_max_sv": 0.21151602938771247, + "grad_min_sv": 7.960656847678569e-09, + "grad_condition": 6835345348.5200405, + "lr": 4.7586473766990294e-05, + "time_sec": 32.56260585784912 + }, + { + "epoch": 130, + "train_loss": 0.1551200196647644, + "train_acc": 0.95066, + "test_loss": 3.0138941650390625, + "test_acc": 0.5454, + "lyapunov": null, + "grad_norm": 0.4023235762601659, + "grad_max_sv": 0.19708200730383396, + "grad_min_sv": 7.800858144299192e-09, + "grad_condition": 626827866.159754, + "lr": 4.32272711786996e-05, + "time_sec": 32.59095644950867 + }, + { + "epoch": 131, + "train_loss": 0.15415350935935973, + "train_acc": 0.95194, + "test_loss": 2.9972058124542236, + "test_acc": 0.5443, + "lyapunov": null, + "grad_norm": 0.40269684147235807, + "grad_max_sv": 0.20214904472231865, + "grad_min_sv": 7.632781651861764e-09, + "grad_condition": 3110137965.882431, + "lr": 3.906842420574966e-05, + "time_sec": 32.64683389663696 + }, + { + "epoch": 132, + "train_loss": 0.15071093450546263, + "train_acc": 0.95362, + "test_loss": 3.058548362350464, + "test_acc": 0.5406, + "lyapunov": null, + "grad_norm": 0.3962388158117765, + "grad_max_sv": 0.20194376222789287, + "grad_min_sv": 7.476556948202151e-09, + "grad_condition": 251161532.73020416, + "lr": 3.5111757055874305e-05, + "time_sec": 32.57603096961975 + }, + { + "epoch": 133, + "train_loss": 0.15083105179309844, + "train_acc": 0.95186, + "test_loss": 3.0908397106170655, + "test_acc": 0.5372, + "lyapunov": null, + "grad_norm": 0.396089047457992, + "grad_max_sv": 0.19243778996169567, + "grad_min_sv": 7.3091202180313244e-09, + "grad_condition": 798644628.4177251, + "lr": 3.1359005254054254e-05, + "time_sec": 32.73746132850647 + }, + { + "epoch": 134, + "train_loss": 0.14782890917301178, + "train_acc": 0.95342, + "test_loss": 3.050483916091919, + "test_acc": 0.5423, + "lyapunov": null, + "grad_norm": 0.3935039829273189, + "grad_max_sv": 0.1971876610070467, + "grad_min_sv": 7.67425883595142e-09, + "grad_condition": 2485965444.639862, + "lr": 2.7811814881259484e-05, + "time_sec": 32.72033095359802 + }, + { + "epoch": 135, + "train_loss": 0.1471274660015106, + "train_acc": 0.95372, + "test_loss": 2.9947123558044435, + "test_acc": 0.5426, + "lyapunov": null, + "grad_norm": 0.3920191534951485, + "grad_max_sv": 0.20197632759809495, + "grad_min_sv": 7.500751369148018e-09, + "grad_condition": 520365917.2206461, + "lr": 2.4471741852423218e-05, + "time_sec": 32.67989182472229 + }, + { + "epoch": 136, + "train_loss": 0.1491823548412323, + "train_acc": 0.9526, + "test_loss": 3.0622998500823972, + "test_acc": 0.5417, + "lyapunov": null, + "grad_norm": 0.3958637689339096, + "grad_max_sv": 0.1968228505924344, + "grad_min_sv": 7.479480308540676e-09, + "grad_condition": 707924605.8880411, + "lr": 2.1340251233966362e-05, + "time_sec": 32.66845107078552 + }, + { + "epoch": 137, + "train_loss": 0.1438249187850952, + "train_acc": 0.95456, + "test_loss": 3.0126154830932617, + "test_acc": 0.5438, + "lyapunov": null, + "grad_norm": 0.3880549357238996, + "grad_max_sv": 0.1975066963583231, + "grad_min_sv": 7.686822375862525e-09, + "grad_condition": 958291083.1124929, + "lr": 1.8418716601170932e-05, + "time_sec": 32.62222647666931 + }, + { + "epoch": 138, + "train_loss": 0.14332568585395813, + "train_acc": 0.95562, + "test_loss": 2.970457587814331, + "test_acc": 0.5475, + "lyapunov": null, + "grad_norm": 0.387864370948264, + "grad_max_sv": 0.19698900803923608, + "grad_min_sv": 7.3030646496365096e-09, + "grad_condition": 522257153.2510088, + "lr": 1.570841943568445e-05, + "time_sec": 32.588345527648926 + }, + { + "epoch": 139, + "train_loss": 0.14504710802555085, + "train_acc": 0.95396, + "test_loss": 3.0413112239837647, + "test_acc": 0.5442, + "lyapunov": null, + "grad_norm": 0.39046406821011487, + "grad_max_sv": 0.19658712521195412, + "grad_min_sv": 7.706623579399608e-09, + "grad_condition": 210757363.08798447, + "lr": 1.3210548563419845e-05, + "time_sec": 32.57579827308655 + }, + { + "epoch": 140, + "train_loss": 0.1440677634191513, + "train_acc": 0.9551, + "test_loss": 3.0336122520446778, + "test_acc": 0.5421, + "lyapunov": null, + "grad_norm": 0.3879105148922517, + "grad_max_sv": 0.20634672362357379, + "grad_min_sv": 7.609137083592308e-09, + "grad_condition": 799925132.5815533, + "lr": 1.0926199633097203e-05, + "time_sec": 32.56750822067261 + }, + { + "epoch": 141, + "train_loss": 0.1450736529636383, + "train_acc": 0.9539, + "test_loss": 3.0418475845336914, + "test_acc": 0.542, + "lyapunov": null, + "grad_norm": 0.3893245206754723, + "grad_max_sv": 0.19981114380061626, + "grad_min_sv": 7.533249978951707e-09, + "grad_condition": 1055093430.0963647, + "lr": 8.856374635655688e-06, + "time_sec": 32.5803439617157 + }, + { + "epoch": 142, + "train_loss": 0.14690097001075744, + "train_acc": 0.9539, + "test_loss": 3.085536852264404, + "test_acc": 0.5402, + "lyapunov": null, + "grad_norm": 0.393962854701407, + "grad_max_sv": 0.19642856512218715, + "grad_min_sv": 7.33013154697107e-09, + "grad_condition": 1287238710.5116677, + "lr": 7.001981464747503e-06, + "time_sec": 32.587260246276855 + }, + { + "epoch": 143, + "train_loss": 0.14333253172159194, + "train_acc": 0.95502, + "test_loss": 3.0491490406036377, + "test_acc": 0.5422, + "lyapunov": null, + "grad_norm": 0.38524967986058734, + "grad_max_sv": 0.1963527824729681, + "grad_min_sv": 7.358908829112505e-09, + "grad_condition": 554422862.0300386, + "lr": 5.3638335185058295e-06, + "time_sec": 32.558162450790405 + }, + { + "epoch": 144, + "train_loss": 0.14636923120975495, + "train_acc": 0.95354, + "test_loss": 3.061640990829468, + "test_acc": 0.5427, + "lyapunov": null, + "grad_norm": 0.39405435868542676, + "grad_max_sv": 0.20560368224978448, + "grad_min_sv": 7.55005881126168e-09, + "grad_condition": 511328197.16483086, + "lr": 3.942649342761114e-06, + "time_sec": 32.583282709121704 + }, + { + "epoch": 145, + "train_loss": 0.14265491032361985, + "train_acc": 0.95596, + "test_loss": 3.0034291164398192, + "test_acc": 0.5447, + "lyapunov": null, + "grad_norm": 0.38473538959699044, + "grad_max_sv": 0.20014677122235297, + "grad_min_sv": 7.530181120709092e-09, + "grad_condition": 337796403.57093, + "lr": 2.7390523158633524e-06, + "time_sec": 32.637805223464966 + }, + { + "epoch": 146, + "train_loss": 0.14478088060855865, + "train_acc": 0.95472, + "test_loss": 3.0147633277893067, + "test_acc": 0.5419, + "lyapunov": null, + "grad_norm": 0.3885491395116739, + "grad_max_sv": 0.19666519686579703, + "grad_min_sv": 7.584344775216773e-09, + "grad_condition": 547643565.9603722, + "lr": 1.7535703752478133e-06, + "time_sec": 32.652307748794556 + }, + { + "epoch": 147, + "train_loss": 0.14279501497268676, + "train_acc": 0.9546, + "test_loss": 3.0440410163879394, + "test_acc": 0.541, + "lyapunov": null, + "grad_norm": 0.38669357310585645, + "grad_max_sv": 0.21015651226043702, + "grad_min_sv": 7.688521032247348e-09, + "grad_condition": 469600192.5783922, + "lr": 9.866357858642196e-07, + "time_sec": 32.59567952156067 + }, + { + "epoch": 148, + "train_loss": 0.14565588755607606, + "train_acc": 0.9541, + "test_loss": 3.0802265747070314, + "test_acc": 0.5416, + "lyapunov": null, + "grad_norm": 0.38859455199964604, + "grad_max_sv": 0.19257190506905317, + "grad_min_sv": 7.505198252591092e-09, + "grad_condition": 881395202.1431038, + "lr": 4.38584950570808e-07, + "time_sec": 32.61454796791077 + }, + { + "epoch": 149, + "train_loss": 0.14538168624401093, + "train_acc": 0.9543, + "test_loss": 3.0341483921051027, + "test_acc": 0.5461, + "lyapunov": null, + "grad_norm": 0.3912198061226822, + "grad_max_sv": 0.19850266501307487, + "grad_min_sv": 7.570504590619434e-09, + "grad_condition": 1146760478.7303884, + "lr": 1.096582625772501e-07, + "time_sec": 32.57002377510071 + }, + { + "epoch": 150, + "train_loss": 0.14344769035339355, + "train_acc": 0.95432, + "test_loss": 3.151827312850952, + "test_acc": 0.5351, + "lyapunov": null, + "grad_norm": 0.38700258459733883, + "grad_max_sv": 0.19427692480385303, + "grad_min_sv": 7.459068278141413e-09, + "grad_condition": 795616674.0450132, + "lr": 0.0, + "time_sec": 32.58071160316467 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 4.869130941009521, + "train_acc": 0.0299, + "test_loss": 4.81726124420166, + "test_acc": 0.0158, + "lyapunov": null, + "grad_norm": 5.958599870859213, + "grad_max_sv": 5.32314133644104, + "grad_min_sv": 1.0002176032419818e-07, + "grad_condition": 117638897.02667244, + "lr": 0.0009998903417374227, + "time_sec": 49.630311012268066 + }, + { + "epoch": 2, + "train_loss": 4.33411005065918, + "train_acc": 0.05812, + "test_loss": 4.9022071792602535, + "test_acc": 0.0212, + "lyapunov": null, + "grad_norm": 4.4717426818192445, + "grad_max_sv": 3.9425308763980866, + "grad_min_sv": 7.707211335805653e-08, + "grad_condition": 68733255.35507934, + "lr": 0.0009995614150494292, + "time_sec": 49.65966987609863 + }, + { + "epoch": 3, + "train_loss": 4.058719948577881, + "train_acc": 0.08542, + "test_loss": 4.564939413452149, + "test_acc": 0.0316, + "lyapunov": null, + "grad_norm": 3.6062592227635153, + "grad_max_sv": 3.0093896448612214, + "grad_min_sv": 6.351203426790964e-08, + "grad_condition": 159552980.8120403, + "lr": 0.0009990133642141358, + "time_sec": 49.6358323097229 + }, + { + "epoch": 4, + "train_loss": 3.8575441249084474, + "train_acc": 0.11032, + "test_loss": 4.524412051391602, + "test_acc": 0.0409, + "lyapunov": null, + "grad_norm": 2.92902742157696, + "grad_max_sv": 2.357221654057503, + "grad_min_sv": 5.122935820833785e-08, + "grad_condition": 93072427.1014817, + "lr": 0.0009982464296247522, + "time_sec": 49.63461923599243 + }, + { + "epoch": 5, + "train_loss": 3.6889766606140135, + "train_acc": 0.13372, + "test_loss": 4.625890071105957, + "test_acc": 0.0423, + "lyapunov": null, + "grad_norm": 2.3880731569941602, + "grad_max_sv": 1.768235558271408, + "grad_min_sv": 4.081188793129964e-08, + "grad_condition": 393314864.55004865, + "lr": 0.0009972609476841367, + "time_sec": 49.89368748664856 + }, + { + "epoch": 6, + "train_loss": 3.5618105076599123, + "train_acc": 0.15236, + "test_loss": 4.4743853515625, + "test_acc": 0.0606, + "lyapunov": null, + "grad_norm": 1.9549034892194537, + "grad_max_sv": 1.3601578801870347, + "grad_min_sv": 3.461635420948239e-08, + "grad_condition": 108039525.34253314, + "lr": 0.000996057350657239, + "time_sec": 49.63013410568237 + }, + { + "epoch": 7, + "train_loss": 3.449751102294922, + "train_acc": 0.17348, + "test_loss": 4.566000821304321, + "test_acc": 0.0583, + "lyapunov": null, + "grad_norm": 1.6054375498086935, + "grad_max_sv": 0.970761476457119, + "grad_min_sv": 2.837226934226944e-08, + "grad_condition": 97915375.34094961, + "lr": 0.000994636166481494, + "time_sec": 49.65112805366516 + }, + { + "epoch": 8, + "train_loss": 3.362903434448242, + "train_acc": 0.18704, + "test_loss": 5.157250576019287, + "test_acc": 0.0509, + "lyapunov": null, + "grad_norm": 1.4122949125779343, + "grad_max_sv": 0.7663216680288315, + "grad_min_sv": 2.498295813726896e-08, + "grad_condition": 819581329.8584878, + "lr": 0.0009929980185352525, + "time_sec": 49.64129614830017 + }, + { + "epoch": 9, + "train_loss": 3.2836685932922363, + "train_acc": 0.20434, + "test_loss": 4.776924538803101, + "test_acc": 0.0722, + "lyapunov": null, + "grad_norm": 1.3022948327813888, + "grad_max_sv": 0.6469943135976791, + "grad_min_sv": 2.306396500451058e-08, + "grad_condition": 39951536.65872553, + "lr": 0.0009911436253643444, + "time_sec": 49.625274658203125 + }, + { + "epoch": 10, + "train_loss": 3.2231285871887208, + "train_acc": 0.21402, + "test_loss": 4.61860969619751, + "test_acc": 0.0698, + "lyapunov": null, + "grad_norm": 1.2196486517440839, + "grad_max_sv": 0.5692647032439708, + "grad_min_sv": 2.19049595906462e-08, + "grad_condition": 33845479.69359137, + "lr": 0.0009890738003669028, + "time_sec": 49.660149335861206 + }, + { + "epoch": 11, + "train_loss": 3.1583662706756592, + "train_acc": 0.22336, + "test_loss": 4.968407231903076, + "test_acc": 0.0756, + "lyapunov": null, + "grad_norm": 1.1538157456115983, + "grad_max_sv": 0.5210241436958313, + "grad_min_sv": 2.0956197309580926e-08, + "grad_condition": 525394408.4356891, + "lr": 0.00098678945143658, + "time_sec": 49.65011477470398 + }, + { + "epoch": 12, + "train_loss": 3.109931953125, + "train_acc": 0.23662, + "test_loss": 4.948040252685547, + "test_acc": 0.0649, + "lyapunov": null, + "grad_norm": 1.1104505996303506, + "grad_max_sv": 0.49291609674692155, + "grad_min_sv": 2.0293893665535024e-08, + "grad_condition": 28415855.264934354, + "lr": 0.0009842915805643154, + "time_sec": 49.63184213638306 + }, + { + "epoch": 13, + "train_loss": 3.0547399656677245, + "train_acc": 0.24656, + "test_loss": 4.970808222198486, + "test_acc": 0.071, + "lyapunov": null, + "grad_norm": 1.0601665770785784, + "grad_max_sv": 0.43972166776657107, + "grad_min_sv": 1.913768455791276e-08, + "grad_condition": 43447965.04145826, + "lr": 0.000981581283398829, + "time_sec": 49.61093473434448 + }, + { + "epoch": 14, + "train_loss": 3.017925659484863, + "train_acc": 0.25326, + "test_loss": 4.814505133056641, + "test_acc": 0.0837, + "lyapunov": null, + "grad_norm": 1.014870172987229, + "grad_max_sv": 0.42207302525639534, + "grad_min_sv": 1.853980992200244e-08, + "grad_condition": 39195315.53960514, + "lr": 0.0009786597487660333, + "time_sec": 49.673532009124756 + }, + { + "epoch": 15, + "train_loss": 2.9702432484436034, + "train_acc": 0.2631, + "test_loss": 5.807154141235351, + "test_acc": 0.063, + "lyapunov": null, + "grad_norm": 0.9937971972307359, + "grad_max_sv": 0.4026923879981041, + "grad_min_sv": 1.8250485112059068e-08, + "grad_condition": 40167603.205859475, + "lr": 0.0009755282581475766, + "time_sec": 49.618321657180786 + }, + { + "epoch": 16, + "train_loss": 2.944736771850586, + "train_acc": 0.26722, + "test_loss": 5.26193563079834, + "test_acc": 0.0679, + "lyapunov": null, + "grad_norm": 0.9522428456453783, + "grad_max_sv": 0.38795666843652726, + "grad_min_sv": 1.7932681539711838e-08, + "grad_condition": 23883480.656060785, + "lr": 0.0009721881851187403, + "time_sec": 49.62830376625061 + }, + { + "epoch": 17, + "train_loss": 2.9034721049499512, + "train_acc": 0.27602, + "test_loss": 5.7925373001098635, + "test_acc": 0.064, + "lyapunov": null, + "grad_norm": 0.9254531496563255, + "grad_max_sv": 0.3589652024209499, + "grad_min_sv": 1.6935554087902337e-08, + "grad_condition": 1457602436.4631252, + "lr": 0.0009686409947459456, + "time_sec": 49.61351823806763 + }, + { + "epoch": 18, + "train_loss": 2.8702178131866454, + "train_acc": 0.27916, + "test_loss": 5.747376763916016, + "test_acc": 0.0602, + "lyapunov": null, + "grad_norm": 0.886880691282622, + "grad_max_sv": 0.35455706864595415, + "grad_min_sv": 1.661939068586804e-08, + "grad_condition": 37189913.97942409, + "lr": 0.0009648882429441254, + "time_sec": 49.602774143218994 + }, + { + "epoch": 19, + "train_loss": 2.8457236665344237, + "train_acc": 0.28346, + "test_loss": 5.225064262390137, + "test_acc": 0.0742, + "lyapunov": null, + "grad_norm": 0.8745352102009426, + "grad_max_sv": 0.33497569262981414, + "grad_min_sv": 1.610201680879442e-08, + "grad_condition": 37118382.124889985, + "lr": 0.00096093157579425, + "time_sec": 49.60137701034546 + }, + { + "epoch": 20, + "train_loss": 2.8215041007995607, + "train_acc": 0.28872, + "test_loss": 6.004126496887207, + "test_acc": 0.0566, + "lyapunov": null, + "grad_norm": 0.8595248383665987, + "grad_max_sv": 0.3317968972027302, + "grad_min_sv": 1.6277641995410263e-08, + "grad_condition": 25076117.492004953, + "lr": 0.0009567727288213001, + "time_sec": 49.606021881103516 + }, + { + "epoch": 21, + "train_loss": 2.7879924519348145, + "train_acc": 0.296, + "test_loss": 5.8324502685546875, + "test_acc": 0.0713, + "lyapunov": null, + "grad_norm": 0.8282095227121367, + "grad_max_sv": 0.3175826959311962, + "grad_min_sv": 1.5523823382324054e-08, + "grad_condition": 33473762.080522645, + "lr": 0.0009524135262330095, + "time_sec": 49.607139110565186 + }, + { + "epoch": 22, + "train_loss": 2.758204474105835, + "train_acc": 0.30248, + "test_loss": 6.578706220245361, + "test_acc": 0.0618, + "lyapunov": null, + "grad_norm": 0.8257961231351345, + "grad_max_sv": 0.30810598842799664, + "grad_min_sv": 1.5302382311288555e-08, + "grad_condition": 24529675.495205637, + "lr": 0.0009478558801197061, + "time_sec": 49.624640464782715 + }, + { + "epoch": 23, + "train_loss": 2.738676343231201, + "train_acc": 0.30592, + "test_loss": 5.4664344863891605, + "test_acc": 0.0861, + "lyapunov": null, + "grad_norm": 0.8065233040737523, + "grad_max_sv": 0.30156193524599073, + "grad_min_sv": 1.49054265444204e-08, + "grad_condition": 33421080.710955955, + "lr": 0.000943101789615607, + "time_sec": 49.63160300254822 + }, + { + "epoch": 24, + "train_loss": 2.716878635177612, + "train_acc": 0.31244, + "test_loss": 6.44300007019043, + "test_acc": 0.0749, + "lyapunov": null, + "grad_norm": 0.786905827456602, + "grad_max_sv": 0.30066613033413886, + "grad_min_sv": 1.476351601525927e-08, + "grad_condition": 22958316.6446944, + "lr": 0.0009381533400219313, + "time_sec": 49.617870569229126 + }, + { + "epoch": 25, + "train_loss": 2.694182593231201, + "train_acc": 0.31604, + "test_loss": 5.382769798278809, + "test_acc": 0.0916, + "lyapunov": null, + "grad_norm": 0.7761045602879763, + "grad_max_sv": 0.2905112482607365, + "grad_min_sv": 1.4682144194866353e-08, + "grad_condition": 23004874.738089267, + "lr": 0.0009330127018922189, + "time_sec": 49.63197326660156 + }, + { + "epoch": 26, + "train_loss": 2.665074285736084, + "train_acc": 0.3195, + "test_loss": 6.5514334884643555, + "test_acc": 0.0798, + "lyapunov": null, + "grad_norm": 0.7692786817334373, + "grad_max_sv": 0.28090294301509855, + "grad_min_sv": 1.4502390317805425e-08, + "grad_condition": 76981810.64111714, + "lr": 0.000927682130080253, + "time_sec": 49.62014698982239 + }, + { + "epoch": 27, + "train_loss": 2.6460686820983885, + "train_acc": 0.32446, + "test_loss": 5.83518740234375, + "test_acc": 0.0812, + "lyapunov": null, + "grad_norm": 0.754398795054657, + "grad_max_sv": 0.27323813289403914, + "grad_min_sv": 1.4150497623655057e-08, + "grad_condition": 21603221.75046044, + "lr": 0.0009221639627510072, + "time_sec": 49.62936043739319 + }, + { + "epoch": 28, + "train_loss": 2.6265927952575683, + "train_acc": 0.32812, + "test_loss": 6.598120281982422, + "test_acc": 0.0812, + "lyapunov": null, + "grad_norm": 0.7495858584128283, + "grad_max_sv": 0.2764635566622019, + "grad_min_sv": 1.3928179298794419e-08, + "grad_condition": 26592087.597849313, + "lr": 0.0009164606203550494, + "time_sec": 49.65487575531006 + }, + { + "epoch": 29, + "train_loss": 2.5989754135131835, + "train_acc": 0.33438, + "test_loss": 6.019640913391113, + "test_acc": 0.0853, + "lyapunov": null, + "grad_norm": 0.7328457671272296, + "grad_max_sv": 0.26275444217026234, + "grad_min_sv": 1.3466245638027452e-08, + "grad_condition": 27074823.030799665, + "lr": 0.0009105746045668516, + "time_sec": 49.61575961112976 + }, + { + "epoch": 30, + "train_loss": 2.569355689697266, + "train_acc": 0.3403, + "test_loss": 5.656453500366211, + "test_acc": 0.1069, + "lyapunov": null, + "grad_norm": 0.7285247723431758, + "grad_max_sv": 0.2620399072766304, + "grad_min_sv": 1.3607302561113865e-08, + "grad_condition": 36595154.18813526, + "lr": 0.0009045084971874733, + "time_sec": 49.61033368110657 + }, + { + "epoch": 31, + "train_loss": 2.5531623433685304, + "train_acc": 0.34344, + "test_loss": 5.512335840606689, + "test_acc": 0.1014, + "lyapunov": null, + "grad_norm": 0.7271132291276766, + "grad_max_sv": 0.2741693131625652, + "grad_min_sv": 1.3862067549386126e-08, + "grad_condition": 23784567.90840191, + "lr": 0.0008982649590120977, + "time_sec": 49.62810754776001 + }, + { + "epoch": 32, + "train_loss": 2.540181041793823, + "train_acc": 0.3433, + "test_loss": 6.18716075592041, + "test_acc": 0.0672, + "lyapunov": null, + "grad_norm": 0.7235480377928197, + "grad_max_sv": 0.2649095542728901, + "grad_min_sv": 1.3458577613478795e-08, + "grad_condition": 45957043.50585803, + "lr": 0.0008918467286629196, + "time_sec": 49.6074960231781 + }, + { + "epoch": 33, + "train_loss": 2.5191816319274905, + "train_acc": 0.34908, + "test_loss": 6.582100025939941, + "test_acc": 0.0751, + "lyapunov": null, + "grad_norm": 0.7200938019415711, + "grad_max_sv": 0.25730164162814617, + "grad_min_sv": 1.3406257262649212e-08, + "grad_condition": 31538992.96164729, + "lr": 0.0008852566213878943, + "time_sec": 49.61494970321655 + }, + { + "epoch": 34, + "train_loss": 2.496463624954224, + "train_acc": 0.35388, + "test_loss": 6.577035200500489, + "test_acc": 0.0824, + "lyapunov": null, + "grad_norm": 0.7056443924011199, + "grad_max_sv": 0.2493937097489834, + "grad_min_sv": 1.2909361921803475e-08, + "grad_condition": 45513498.69422473, + "lr": 0.000878497527825878, + "time_sec": 49.61423134803772 + }, + { + "epoch": 35, + "train_loss": 2.476149175262451, + "train_acc": 0.3577, + "test_loss": 6.60574702758789, + "test_acc": 0.0683, + "lyapunov": null, + "grad_norm": 0.7081960767237655, + "grad_max_sv": 0.2570201367139816, + "grad_min_sv": 1.3318109846893745e-08, + "grad_condition": 40942846.386733145, + "lr": 0.000871572412738697, + "time_sec": 49.627204179763794 + }, + { + "epoch": 36, + "train_loss": 2.4584676556396485, + "train_acc": 0.36174, + "test_loss": 6.376377404785156, + "test_acc": 0.1036, + "lyapunov": null, + "grad_norm": 0.7033365437967071, + "grad_max_sv": 0.25586923360824587, + "grad_min_sv": 1.3038588915492699e-08, + "grad_condition": 29808789.927535187, + "lr": 0.0008644843137107055, + "time_sec": 49.658987283706665 + }, + { + "epoch": 37, + "train_loss": 2.437811667022705, + "train_acc": 0.36606, + "test_loss": 5.828952204895019, + "test_acc": 0.1031, + "lyapunov": null, + "grad_norm": 0.6944168249360962, + "grad_max_sv": 0.24849907420575618, + "grad_min_sv": 1.295541044166182e-08, + "grad_condition": 25181358.80101443, + "lr": 0.0008572363398164014, + "time_sec": 49.69488453865051 + }, + { + "epoch": 38, + "train_loss": 2.428686420135498, + "train_acc": 0.36772, + "test_loss": 5.761842573547363, + "test_acc": 0.1089, + "lyapunov": null, + "grad_norm": 0.6926211199497188, + "grad_max_sv": 0.24097422771155835, + "grad_min_sv": 1.2852728982493122e-08, + "grad_condition": 34221857.55107718, + "lr": 0.0008498316702566826, + "time_sec": 49.65219521522522 + }, + { + "epoch": 39, + "train_loss": 2.403228950653076, + "train_acc": 0.37238, + "test_loss": 6.327913746643066, + "test_acc": 0.0717, + "lyapunov": null, + "grad_norm": 0.6898323608739025, + "grad_max_sv": 0.24370794370770454, + "grad_min_sv": 1.2873074178160193e-08, + "grad_condition": 57305083.56976622, + "lr": 0.0008422735529643442, + "time_sec": 49.67387104034424 + }, + { + "epoch": 40, + "train_loss": 2.4002745401000976, + "train_acc": 0.37394, + "test_loss": 6.5177731010437014, + "test_acc": 0.083, + "lyapunov": null, + "grad_norm": 0.6833298006535204, + "grad_max_sv": 0.2354185614734888, + "grad_min_sv": 1.2765965198835438e-08, + "grad_condition": 21504088.72491734, + "lr": 0.0008345653031794289, + "time_sec": 49.617934226989746 + }, + { + "epoch": 41, + "train_loss": 2.375027209320068, + "train_acc": 0.37838, + "test_loss": 5.745588743591308, + "test_acc": 0.0906, + "lyapunov": null, + "grad_norm": 0.6828029580415041, + "grad_max_sv": 0.2435049433261156, + "grad_min_sv": 1.2850220883556252e-08, + "grad_condition": 81583325.51254459, + "lr": 0.0008267103019950526, + "time_sec": 49.618937492370605 + }, + { + "epoch": 42, + "train_loss": 2.3483433491516115, + "train_acc": 0.38482, + "test_loss": 6.884811988830567, + "test_acc": 0.0781, + "lyapunov": null, + "grad_norm": 0.6754176682521642, + "grad_max_sv": 0.23814460188150405, + "grad_min_sv": 1.2720279750355611e-08, + "grad_condition": 59300475.89689113, + "lr": 0.0008187119948743447, + "time_sec": 49.61317276954651 + }, + { + "epoch": 43, + "train_loss": 2.3344376317596436, + "train_acc": 0.38764, + "test_loss": 6.61351337890625, + "test_acc": 0.0969, + "lyapunov": null, + "grad_norm": 0.6769988439891311, + "grad_max_sv": 0.23613341376185418, + "grad_min_sv": 1.2639965266819653e-08, + "grad_condition": 52119429.92492165, + "lr": 0.000810573890139155, + "time_sec": 49.61902713775635 + }, + { + "epoch": 44, + "train_loss": 2.3136163584899903, + "train_acc": 0.39148, + "test_loss": 6.608843360137939, + "test_acc": 0.0931, + "lyapunov": null, + "grad_norm": 0.6707039764412329, + "grad_max_sv": 0.23947011977434157, + "grad_min_sv": 1.2690825271916007e-08, + "grad_condition": 66659408.04853566, + "lr": 0.0008022995574311873, + "time_sec": 49.651583671569824 + }, + { + "epoch": 45, + "train_loss": 2.303262007751465, + "train_acc": 0.3968, + "test_loss": 7.3357599853515625, + "test_acc": 0.0763, + "lyapunov": null, + "grad_norm": 0.6720641219214196, + "grad_max_sv": 0.2344801113009453, + "grad_min_sv": 1.2468999964487804e-08, + "grad_condition": 28252178.039376438, + "lr": 0.0007938926261462363, + "time_sec": 49.6513557434082 + }, + { + "epoch": 46, + "train_loss": 2.294885206298828, + "train_acc": 0.39602, + "test_loss": 7.143599510192871, + "test_acc": 0.0808, + "lyapunov": null, + "grad_norm": 0.6723751960213503, + "grad_max_sv": 0.23659461848437785, + "grad_min_sv": 1.2819257341756262e-08, + "grad_condition": 24273419.96656149, + "lr": 0.0007853567838422158, + "time_sec": 49.67392659187317 + }, + { + "epoch": 47, + "train_loss": 2.2797239797973634, + "train_acc": 0.39734, + "test_loss": 7.214380073547363, + "test_acc": 0.0775, + "lyapunov": null, + "grad_norm": 0.6804834576699708, + "grad_max_sv": 0.23809269666671753, + "grad_min_sv": 1.2608010335757313e-08, + "grad_condition": 25254183.290313803, + "lr": 0.0007766957746216719, + "time_sec": 49.69322681427002 + }, + { + "epoch": 48, + "train_loss": 2.265524502334595, + "train_acc": 0.40104, + "test_loss": 7.091396580505371, + "test_acc": 0.0731, + "lyapunov": null, + "grad_norm": 0.667046368857113, + "grad_max_sv": 0.23234264142811298, + "grad_min_sv": 1.2433218019025638e-08, + "grad_condition": 22653859.281439293, + "lr": 0.0007679133974894982, + "time_sec": 49.65531873703003 + }, + { + "epoch": 49, + "train_loss": 2.2435117234802244, + "train_acc": 0.40428, + "test_loss": 7.294827133178711, + "test_acc": 0.0737, + "lyapunov": null, + "grad_norm": 0.6646443647443216, + "grad_max_sv": 0.23331840261816977, + "grad_min_sv": 1.2566753440634847e-08, + "grad_condition": 29559825.642532967, + "lr": 0.000759013504686565, + "time_sec": 49.66777467727661 + }, + { + "epoch": 50, + "train_loss": 2.2254374363708496, + "train_acc": 0.4097, + "test_loss": 8.604184033203126, + "test_acc": 0.0731, + "lyapunov": null, + "grad_norm": 0.6690954918149841, + "grad_max_sv": 0.22841170839965344, + "grad_min_sv": 1.2475536101397288e-08, + "grad_condition": 21723914.29311887, + "lr": 0.0007499999999999998, + "time_sec": 49.67113780975342 + }, + { + "epoch": 51, + "train_loss": 2.2072127560424804, + "train_acc": 0.41446, + "test_loss": 6.9883695976257325, + "test_acc": 0.0803, + "lyapunov": null, + "grad_norm": 0.6607736738937507, + "grad_max_sv": 0.2331558234989643, + "grad_min_sv": 1.243218040875016e-08, + "grad_condition": 27632939.34803492, + "lr": 0.0007408768370508575, + "time_sec": 49.65227961540222 + }, + { + "epoch": 52, + "train_loss": 2.1981446758270264, + "train_acc": 0.41588, + "test_loss": 8.058159327697753, + "test_acc": 0.0799, + "lyapunov": null, + "grad_norm": 0.6648453996346088, + "grad_max_sv": 0.2446960099041462, + "grad_min_sv": 1.2652686252889733e-08, + "grad_condition": 41197472.85285741, + "lr": 0.0007316480175599307, + "time_sec": 49.61691617965698 + }, + { + "epoch": 53, + "train_loss": 2.174496583709717, + "train_acc": 0.42132, + "test_loss": 7.289675385284424, + "test_acc": 0.0877, + "lyapunov": null, + "grad_norm": 0.6618427859375565, + "grad_max_sv": 0.2312875609844923, + "grad_min_sv": 1.239080896497935e-08, + "grad_condition": 23822848.628154784, + "lr": 0.0007223175895924635, + "time_sec": 49.65499806404114 + }, + { + "epoch": 54, + "train_loss": 2.16634906211853, + "train_acc": 0.42064, + "test_loss": 7.236015202331543, + "test_acc": 0.0958, + "lyapunov": null, + "grad_norm": 0.6619124781918282, + "grad_max_sv": 0.2310062251985073, + "grad_min_sv": 1.2317981715193049e-08, + "grad_condition": 26820300.581125747, + "lr": 0.0007128896457825361, + "time_sec": 49.61980724334717 + }, + { + "epoch": 55, + "train_loss": 2.14550412109375, + "train_acc": 0.4265, + "test_loss": 6.8394420608520505, + "test_acc": 0.0943, + "lyapunov": null, + "grad_norm": 0.6625916025346076, + "grad_max_sv": 0.23202612698078157, + "grad_min_sv": 1.2528317372417775e-08, + "grad_condition": 25612000.25663858, + "lr": 0.0007033683215378998, + "time_sec": 49.674599170684814 + }, + { + "epoch": 56, + "train_loss": 2.1276820320892336, + "train_acc": 0.42994, + "test_loss": 6.964908208465576, + "test_acc": 0.0954, + "lyapunov": null, + "grad_norm": 0.6554659738718382, + "grad_max_sv": 0.2207026917487383, + "grad_min_sv": 1.2088878859062292e-08, + "grad_condition": 21085232.116952278, + "lr": 0.0006937577932260512, + "time_sec": 49.67076587677002 + }, + { + "epoch": 57, + "train_loss": 2.1337597509765627, + "train_acc": 0.42926, + "test_loss": 8.229502785491944, + "test_acc": 0.0862, + "lyapunov": null, + "grad_norm": 0.65752559961672, + "grad_max_sv": 0.2246583230793476, + "grad_min_sv": 1.2207756456758534e-08, + "grad_condition": 64230626.47705172, + "lr": 0.0006840622763423388, + "time_sec": 49.64063334465027 + }, + { + "epoch": 58, + "train_loss": 2.1041818314361573, + "train_acc": 0.43524, + "test_loss": 6.589992712402344, + "test_acc": 0.1085, + "lyapunov": null, + "grad_norm": 0.6598697025296996, + "grad_max_sv": 0.23252296969294547, + "grad_min_sv": 1.2361365446522666e-08, + "grad_condition": 30301917.129872173, + "lr": 0.0006742860236609073, + "time_sec": 49.61933445930481 + }, + { + "epoch": 59, + "train_loss": 2.096152271270752, + "train_acc": 0.4375, + "test_loss": 6.983989217376709, + "test_acc": 0.0982, + "lyapunov": null, + "grad_norm": 0.6560896741871133, + "grad_max_sv": 0.23231945298612117, + "grad_min_sv": 1.251871321050757e-08, + "grad_condition": 22362788.103550732, + "lr": 0.0006644333233692913, + "time_sec": 49.61751055717468 + }, + { + "epoch": 60, + "train_loss": 2.081830069847107, + "train_acc": 0.43602, + "test_loss": 7.386634468841553, + "test_acc": 0.1014, + "lyapunov": null, + "grad_norm": 0.6536599782236483, + "grad_max_sv": 0.22322102561593055, + "grad_min_sv": 1.2262779891525356e-08, + "grad_condition": 23489422.867959693, + "lr": 0.0006545084971874734, + "time_sec": 49.620344161987305 + }, + { + "epoch": 61, + "train_loss": 2.0558355644226074, + "train_acc": 0.44474, + "test_loss": 7.227272665405273, + "test_acc": 0.1013, + "lyapunov": null, + "grad_norm": 0.6572328158390935, + "grad_max_sv": 0.22376591265201567, + "grad_min_sv": 1.238219781984906e-08, + "grad_condition": 31021778.17636667, + "lr": 0.0006445158984722354, + "time_sec": 49.6348340511322 + }, + { + "epoch": 62, + "train_loss": 2.0572922328948975, + "train_acc": 0.44566, + "test_loss": 7.505316355133057, + "test_acc": 0.0927, + "lyapunov": null, + "grad_norm": 0.656923815023976, + "grad_max_sv": 0.23445738479495049, + "grad_min_sv": 1.2478020391688133e-08, + "grad_condition": 262812298.93435702, + "lr": 0.0006344599103076324, + "time_sec": 49.62543535232544 + }, + { + "epoch": 63, + "train_loss": 2.0413633464813232, + "train_acc": 0.44668, + "test_loss": 7.251725723266602, + "test_acc": 0.0991, + "lyapunov": null, + "grad_norm": 0.6568909181034195, + "grad_max_sv": 0.2302928999066353, + "grad_min_sv": 1.2521502933821038e-08, + "grad_condition": 42011077.53000567, + "lr": 0.0006243449435824269, + "time_sec": 49.68104648590088 + }, + { + "epoch": 64, + "train_loss": 2.0206649338531495, + "train_acc": 0.4545, + "test_loss": 7.670287243652344, + "test_acc": 0.0929, + "lyapunov": null, + "grad_norm": 0.6597611249894066, + "grad_max_sv": 0.2243791937828064, + "grad_min_sv": 1.2141039159446754e-08, + "grad_condition": 44929605.00249899, + "lr": 0.0006141754350553275, + "time_sec": 49.63578200340271 + }, + { + "epoch": 65, + "train_loss": 2.005788911895752, + "train_acc": 0.45556, + "test_loss": 8.490129399871826, + "test_acc": 0.0881, + "lyapunov": null, + "grad_norm": 0.6550260718391842, + "grad_max_sv": 0.2345993619412184, + "grad_min_sv": 1.2238496998467907e-08, + "grad_condition": 51372022.47833033, + "lr": 0.0006039558454088793, + "time_sec": 49.70135450363159 + }, + { + "epoch": 66, + "train_loss": 1.9908720332336425, + "train_acc": 0.45934, + "test_loss": 7.83362244720459, + "test_acc": 0.086, + "lyapunov": null, + "grad_norm": 0.6563592700125107, + "grad_max_sv": 0.22401900850236417, + "grad_min_sv": 1.2119369038193772e-08, + "grad_condition": 33434586.35249608, + "lr": 0.000593690657292862, + "time_sec": 49.64280724525452 + }, + { + "epoch": 67, + "train_loss": 1.9691172955703735, + "train_acc": 0.46306, + "test_loss": 7.884465830230713, + "test_acc": 0.0818, + "lyapunov": null, + "grad_norm": 0.6567132328483392, + "grad_max_sv": 0.231986141204834, + "grad_min_sv": 1.2402723173488006e-08, + "grad_condition": 25823647.646229025, + "lr": 0.0005833843733580507, + "time_sec": 49.62420701980591 + }, + { + "epoch": 68, + "train_loss": 1.9622927265167236, + "train_acc": 0.46458, + "test_loss": 8.4931605758667, + "test_acc": 0.0703, + "lyapunov": null, + "grad_norm": 0.6522693664046653, + "grad_max_sv": 0.2248720645904541, + "grad_min_sv": 1.232144753449127e-08, + "grad_condition": 20661085.738957692, + "lr": 0.0005730415142812054, + "time_sec": 49.61964273452759 + }, + { + "epoch": 69, + "train_loss": 1.936687505493164, + "train_acc": 0.47236, + "test_loss": 8.64132734375, + "test_acc": 0.0679, + "lyapunov": null, + "grad_norm": 0.6510309265124044, + "grad_max_sv": 0.21742373295128345, + "grad_min_sv": 1.1974758069681346e-08, + "grad_condition": 304726416.82408583, + "lr": 0.0005626666167821517, + "time_sec": 49.644230365753174 + }, + { + "epoch": 70, + "train_loss": 1.9254214583587645, + "train_acc": 0.47336, + "test_loss": 7.787073600769043, + "test_acc": 0.0873, + "lyapunov": null, + "grad_norm": 0.6550976880903316, + "grad_max_sv": 0.23343021050095558, + "grad_min_sv": 1.22054698495919e-08, + "grad_condition": 998661796.8752277, + "lr": 0.0005522642316338265, + "time_sec": 49.61548924446106 + }, + { + "epoch": 71, + "train_loss": 1.916664266433716, + "train_acc": 0.47384, + "test_loss": 8.817724546051025, + "test_acc": 0.0687, + "lyapunov": null, + "grad_norm": 0.6548099516468633, + "grad_max_sv": 0.21803590469062328, + "grad_min_sv": 1.2030009292202104e-08, + "grad_condition": 43118102.26962634, + "lr": 0.0005418389216661573, + "time_sec": 49.63275456428528 + }, + { + "epoch": 72, + "train_loss": 1.907302893638611, + "train_acc": 0.47762, + "test_loss": 9.211192407989502, + "test_acc": 0.0704, + "lyapunov": null, + "grad_norm": 0.6550135667381578, + "grad_max_sv": 0.22547000497579575, + "grad_min_sv": 1.232130381889629e-08, + "grad_condition": 21984085.02642382, + "lr": 0.0005313952597646563, + "time_sec": 49.6118586063385 + }, + { + "epoch": 73, + "train_loss": 1.877649710121155, + "train_acc": 0.4827, + "test_loss": 9.066388426208496, + "test_acc": 0.0801, + "lyapunov": null, + "grad_norm": 0.6600796471066996, + "grad_max_sv": 0.23919763825833798, + "grad_min_sv": 1.2670018244287374e-08, + "grad_condition": 42742098.34257165, + "lr": 0.0005209378268645994, + "time_sec": 49.67570900917053 + }, + { + "epoch": 74, + "train_loss": 1.8662859315490723, + "train_acc": 0.48722, + "test_loss": 9.122249521636963, + "test_acc": 0.0675, + "lyapunov": null, + "grad_norm": 0.6547425237687021, + "grad_max_sv": 0.22284357100725175, + "grad_min_sv": 1.2111998770603094e-08, + "grad_condition": 21063233.798650313, + "lr": 0.0005104712099416781, + "time_sec": 49.62467122077942 + }, + { + "epoch": 75, + "train_loss": 1.8634462587738037, + "train_acc": 0.48572, + "test_loss": 8.603226243591308, + "test_acc": 0.07, + "lyapunov": null, + "grad_norm": 0.6594891408678691, + "grad_max_sv": 0.2292952246963978, + "grad_min_sv": 1.216953539884269e-08, + "grad_condition": 23304533.995393943, + "lr": 0.0004999999999999996, + "time_sec": 49.6065719127655 + }, + { + "epoch": 76, + "train_loss": 1.8428347550964355, + "train_acc": 0.49222, + "test_loss": 9.348575830841064, + "test_acc": 0.0716, + "lyapunov": null, + "grad_norm": 0.6514940871880716, + "grad_max_sv": 0.2246335681527853, + "grad_min_sv": 1.197331944077784e-08, + "grad_condition": 79775997.36608414, + "lr": 0.0004895287900583212, + "time_sec": 49.633445262908936 + }, + { + "epoch": 77, + "train_loss": 1.8474174691390992, + "train_acc": 0.49038, + "test_loss": 9.063310955810547, + "test_acc": 0.0749, + "lyapunov": null, + "grad_norm": 0.6555213730500407, + "grad_max_sv": 0.22386705875396729, + "grad_min_sv": 1.1975305359845923e-08, + "grad_condition": 30024891.493045498, + "lr": 0.0004790621731353997, + "time_sec": 49.6582727432251 + }, + { + "epoch": 78, + "train_loss": 1.8240000118255615, + "train_acc": 0.496, + "test_loss": 7.937534573364258, + "test_acc": 0.1042, + "lyapunov": null, + "grad_norm": 0.6578278625054611, + "grad_max_sv": 0.22472502514719964, + "grad_min_sv": 1.2227204815307146e-08, + "grad_condition": 24809414.276176114, + "lr": 0.000468604740235343, + "time_sec": 49.60278058052063 + }, + { + "epoch": 79, + "train_loss": 1.7988454669952392, + "train_acc": 0.50146, + "test_loss": 7.830693682098389, + "test_acc": 0.0946, + "lyapunov": null, + "grad_norm": 0.6564839484635767, + "grad_max_sv": 0.23010910004377366, + "grad_min_sv": 1.2367765268861408e-08, + "grad_condition": 34528993.96450578, + "lr": 0.00045816107833384175, + "time_sec": 49.63169765472412 + }, + { + "epoch": 80, + "train_loss": 1.7962154034423827, + "train_acc": 0.50466, + "test_loss": 7.877956019592285, + "test_acc": 0.0834, + "lyapunov": null, + "grad_norm": 0.6560300351960439, + "grad_max_sv": 0.22126091420650482, + "grad_min_sv": 1.2213627020862816e-08, + "grad_condition": 21445784.707883697, + "lr": 0.0004477357683661729, + "time_sec": 49.672850131988525 + }, + { + "epoch": 81, + "train_loss": 1.7689838317871094, + "train_acc": 0.5108, + "test_loss": 8.936191275024415, + "test_acc": 0.073, + "lyapunov": null, + "grad_norm": 0.6546524429638407, + "grad_max_sv": 0.22751210294663907, + "grad_min_sv": 1.2090203325293424e-08, + "grad_condition": 37126500.828596935, + "lr": 0.00043733338321784746, + "time_sec": 49.6825795173645 + }, + { + "epoch": 82, + "train_loss": 1.7687132528686524, + "train_acc": 0.50962, + "test_loss": 8.322722315979004, + "test_acc": 0.0867, + "lyapunov": null, + "grad_norm": 0.657879277273411, + "grad_max_sv": 0.23299325592815875, + "grad_min_sv": 1.2289513051655376e-08, + "grad_condition": 29654551.548070945, + "lr": 0.0004269584857187939, + "time_sec": 49.77833390235901 + }, + { + "epoch": 83, + "train_loss": 1.7514041207885742, + "train_acc": 0.51362, + "test_loss": 7.874627603149414, + "test_acc": 0.095, + "lyapunov": null, + "grad_norm": 0.65464844079956, + "grad_max_sv": 0.22664147801697254, + "grad_min_sv": 1.2152483562510863e-08, + "grad_condition": 25844246.169428695, + "lr": 0.0004166156266419484, + "time_sec": 49.665401220321655 + }, + { + "epoch": 84, + "train_loss": 1.7470465963745117, + "train_acc": 0.5132, + "test_loss": 8.254433164978026, + "test_acc": 0.0915, + "lyapunov": null, + "grad_norm": 0.6562560461399737, + "grad_max_sv": 0.22655668184161187, + "grad_min_sv": 1.2271174511246929e-08, + "grad_condition": 46640276.774946496, + "lr": 0.0004063093427071373, + "time_sec": 49.66734290122986 + }, + { + "epoch": 85, + "train_loss": 1.7298235196685792, + "train_acc": 0.51892, + "test_loss": 8.706323757171631, + "test_acc": 0.0911, + "lyapunov": null, + "grad_norm": 0.6550616576389223, + "grad_max_sv": 0.23714832365512847, + "grad_min_sv": 1.223523634630297e-08, + "grad_condition": 29585164.78334018, + "lr": 0.0003960441545911199, + "time_sec": 49.640406370162964 + }, + { + "epoch": 86, + "train_loss": 1.724207964477539, + "train_acc": 0.51926, + "test_loss": 8.765803309631348, + "test_acc": 0.0835, + "lyapunov": null, + "grad_norm": 0.6508855742051911, + "grad_max_sv": 0.2245300356298685, + "grad_min_sv": 1.2214838868152e-08, + "grad_condition": 20628200.471479602, + "lr": 0.0003858245649446718, + "time_sec": 49.63991856575012 + }, + { + "epoch": 87, + "train_loss": 1.7018416146087647, + "train_acc": 0.52598, + "test_loss": 8.139996655273437, + "test_acc": 0.096, + "lyapunov": null, + "grad_norm": 0.6595894571592862, + "grad_max_sv": 0.2325576465576887, + "grad_min_sv": 1.2264047567420167e-08, + "grad_condition": 62109028.98086828, + "lr": 0.00037565505641757235, + "time_sec": 49.62706279754639 + }, + { + "epoch": 88, + "train_loss": 1.690174805984497, + "train_acc": 0.52992, + "test_loss": 8.284830725860596, + "test_acc": 0.0946, + "lyapunov": null, + "grad_norm": 0.6523549145137596, + "grad_max_sv": 0.22278686761856079, + "grad_min_sv": 1.2230143851127417e-08, + "grad_condition": 41887788.39074431, + "lr": 0.00036554008969236695, + "time_sec": 49.6299991607666 + }, + { + "epoch": 89, + "train_loss": 1.6808083280181885, + "train_acc": 0.5298, + "test_loss": 8.205404133605956, + "test_acc": 0.0955, + "lyapunov": null, + "grad_norm": 0.6525447581270152, + "grad_max_sv": 0.22465928830206394, + "grad_min_sv": 1.2332067528264546e-08, + "grad_condition": 23009318.737796, + "lr": 0.0003554841015277638, + "time_sec": 49.66408705711365 + }, + { + "epoch": 90, + "train_loss": 1.6637053575134277, + "train_acc": 0.5337, + "test_loss": 8.177736569213867, + "test_acc": 0.0899, + "lyapunov": null, + "grad_norm": 0.6537473055068921, + "grad_max_sv": 0.22377123720943928, + "grad_min_sv": 1.2110254177244429e-08, + "grad_condition": 25938015.098525234, + "lr": 0.000345491502812526, + "time_sec": 49.63126850128174 + }, + { + "epoch": 91, + "train_loss": 1.6554726396942139, + "train_acc": 0.5354, + "test_loss": 8.995069329833985, + "test_acc": 0.08, + "lyapunov": null, + "grad_norm": 0.6575477667608048, + "grad_max_sv": 0.23422496095299722, + "grad_min_sv": 1.246219855713382e-08, + "grad_condition": 41932891.920117736, + "lr": 0.0003355666766307081, + "time_sec": 49.63232660293579 + }, + { + "epoch": 92, + "train_loss": 1.6413372038269043, + "train_acc": 0.54098, + "test_loss": 9.550636445617675, + "test_acc": 0.0761, + "lyapunov": null, + "grad_norm": 0.6610051290863374, + "grad_max_sv": 0.23229929022490978, + "grad_min_sv": 1.2352718607028245e-08, + "grad_condition": 41078160.523768075, + "lr": 0.00032571397633909225, + "time_sec": 49.653891801834106 + }, + { + "epoch": 93, + "train_loss": 1.6310989672470093, + "train_acc": 0.54374, + "test_loss": 9.458463846588135, + "test_acc": 0.0736, + "lyapunov": null, + "grad_norm": 0.6572216683080783, + "grad_max_sv": 0.23672427460551262, + "grad_min_sv": 1.2539241084352782e-08, + "grad_condition": 23064462.944409598, + "lr": 0.00031593772365766094, + "time_sec": 49.65013003349304 + }, + { + "epoch": 94, + "train_loss": 1.6185439474868775, + "train_acc": 0.5456, + "test_loss": 9.447592375946044, + "test_acc": 0.0781, + "lyapunov": null, + "grad_norm": 0.6543172085287396, + "grad_max_sv": 0.2255704291164875, + "grad_min_sv": 1.1963030848924361e-08, + "grad_condition": 48501470.614931956, + "lr": 0.0003062422067739483, + "time_sec": 49.68069577217102 + }, + { + "epoch": 95, + "train_loss": 1.6036190982055665, + "train_acc": 0.54806, + "test_loss": 9.521705908203124, + "test_acc": 0.0835, + "lyapunov": null, + "grad_norm": 0.6561083866637782, + "grad_max_sv": 0.23088240325450898, + "grad_min_sv": 1.2247599834314115e-08, + "grad_condition": 26484829.628142, + "lr": 0.00029663167846209965, + "time_sec": 49.62816071510315 + }, + { + "epoch": 96, + "train_loss": 1.6020113516998291, + "train_acc": 0.54904, + "test_loss": 9.115081603240967, + "test_acc": 0.0889, + "lyapunov": null, + "grad_norm": 0.6572025699230744, + "grad_max_sv": 0.22745007649064064, + "grad_min_sv": 1.2209962416132036e-08, + "grad_condition": 32247618.106625605, + "lr": 0.00028711035421746345, + "time_sec": 49.61973428726196 + }, + { + "epoch": 97, + "train_loss": 1.589581788368225, + "train_acc": 0.55386, + "test_loss": 9.091486672973632, + "test_acc": 0.0752, + "lyapunov": null, + "grad_norm": 0.6480214804623958, + "grad_max_sv": 0.22622964382171631, + "grad_min_sv": 1.213211238138001e-08, + "grad_condition": 23427245.234249383, + "lr": 0.00027768241040753615, + "time_sec": 49.67304968833923 + }, + { + "epoch": 98, + "train_loss": 1.5766529482269287, + "train_acc": 0.55484, + "test_loss": 8.739159268188477, + "test_acc": 0.0912, + "lyapunov": null, + "grad_norm": 0.6545216229967632, + "grad_max_sv": 0.22466104663908482, + "grad_min_sv": 1.2034743685634952e-08, + "grad_condition": 37920262.92732872, + "lr": 0.00026835198244006903, + "time_sec": 49.6529438495636 + }, + { + "epoch": 99, + "train_loss": 1.5610430017852783, + "train_acc": 0.55952, + "test_loss": 9.326904290771484, + "test_acc": 0.0857, + "lyapunov": null, + "grad_norm": 0.6510280187361254, + "grad_max_sv": 0.22991822883486748, + "grad_min_sv": 1.2031296814374315e-08, + "grad_condition": 33021222.855397005, + "lr": 0.0002591231629491421, + "time_sec": 49.64146590232849 + }, + { + "epoch": 100, + "train_loss": 1.5503544171142578, + "train_acc": 0.56096, + "test_loss": 8.863075296783448, + "test_acc": 0.0956, + "lyapunov": null, + "grad_norm": 0.6587934740560508, + "grad_max_sv": 0.22904604896903039, + "grad_min_sv": 1.2335589709942807e-08, + "grad_condition": 85131461.34992474, + "lr": 0.0002499999999999997, + "time_sec": 49.6390540599823 + }, + { + "epoch": 101, + "train_loss": 1.5390491861343383, + "train_acc": 0.56416, + "test_loss": 8.707357301330566, + "test_acc": 0.1024, + "lyapunov": null, + "grad_norm": 0.662018499627777, + "grad_max_sv": 0.23979119583964348, + "grad_min_sv": 1.238348213417062e-08, + "grad_condition": 33906848.52058145, + "lr": 0.00024098649531343477, + "time_sec": 49.63421368598938 + }, + { + "epoch": 102, + "train_loss": 1.5312192189788818, + "train_acc": 0.56726, + "test_loss": 9.40553295135498, + "test_acc": 0.0875, + "lyapunov": null, + "grad_norm": 0.6540742670514875, + "grad_max_sv": 0.23145525828003882, + "grad_min_sv": 1.2288377408686824e-08, + "grad_condition": 37958642.13054756, + "lr": 0.0002320866025105016, + "time_sec": 49.65552067756653 + }, + { + "epoch": 103, + "train_loss": 1.5286355770111084, + "train_acc": 0.56548, + "test_loss": 9.07997163925171, + "test_acc": 0.1043, + "lyapunov": null, + "grad_norm": 0.6557756421519878, + "grad_max_sv": 0.24100108593702316, + "grad_min_sv": 1.2461116480344537e-08, + "grad_condition": 25662204.639090188, + "lr": 0.0002233042253783278, + "time_sec": 49.6308536529541 + }, + { + "epoch": 104, + "train_loss": 1.5213085984420776, + "train_acc": 0.56866, + "test_loss": 9.145785698699951, + "test_acc": 0.0859, + "lyapunov": null, + "grad_norm": 0.6504666354250909, + "grad_max_sv": 0.2253209725022316, + "grad_min_sv": 1.1966959748144212e-08, + "grad_condition": 54876833.04192768, + "lr": 0.000214643216157784, + "time_sec": 49.63847613334656 + }, + { + "epoch": 105, + "train_loss": 1.5079352280044556, + "train_acc": 0.5695, + "test_loss": 8.336384162902831, + "test_acc": 0.1061, + "lyapunov": null, + "grad_norm": 0.6571653396229992, + "grad_max_sv": 0.23069135881960393, + "grad_min_sv": 1.2210977743190576e-08, + "grad_condition": 88846977.18417618, + "lr": 0.00020610737385376332, + "time_sec": 49.627315044403076 + }, + { + "epoch": 106, + "train_loss": 1.4935028577423095, + "train_acc": 0.57654, + "test_loss": 9.006987256622315, + "test_acc": 0.0957, + "lyapunov": null, + "grad_norm": 0.651656183779343, + "grad_max_sv": 0.22712415568530558, + "grad_min_sv": 1.2032355989344268e-08, + "grad_condition": 25049163.560516536, + "lr": 0.00019770044256881242, + "time_sec": 49.62053084373474 + }, + { + "epoch": 107, + "train_loss": 1.4878737406158447, + "train_acc": 0.57426, + "test_loss": 10.11307799987793, + "test_acc": 0.075, + "lyapunov": null, + "grad_norm": 0.6524830728325739, + "grad_max_sv": 0.22892994433641434, + "grad_min_sv": 1.2128688251650255e-08, + "grad_condition": 43366733.79550102, + "lr": 0.0001894261098608447, + "time_sec": 49.60416531562805 + }, + { + "epoch": 108, + "train_loss": 1.4871094806671143, + "train_acc": 0.57634, + "test_loss": 9.736641611480714, + "test_acc": 0.0847, + "lyapunov": null, + "grad_norm": 0.6526478556992521, + "grad_max_sv": 0.2283865675330162, + "grad_min_sv": 1.2084086392638583e-08, + "grad_condition": 30684405.14241614, + "lr": 0.000181288005125655, + "time_sec": 49.599942207336426 + }, + { + "epoch": 109, + "train_loss": 1.4713194018936158, + "train_acc": 0.5814, + "test_loss": 9.849570913696288, + "test_acc": 0.0735, + "lyapunov": null, + "grad_norm": 0.6520669107663062, + "grad_max_sv": 0.22863508015871048, + "grad_min_sv": 1.206205209880462e-08, + "grad_condition": 22397938.389471006, + "lr": 0.0001732896980049473, + "time_sec": 49.610928773880005 + }, + { + "epoch": 110, + "train_loss": 1.463755881729126, + "train_acc": 0.58362, + "test_loss": 10.715107778930664, + "test_acc": 0.0741, + "lyapunov": null, + "grad_norm": 0.6526504347541894, + "grad_max_sv": 0.2301381327211857, + "grad_min_sv": 1.2070842162273388e-08, + "grad_condition": 58529848.61276511, + "lr": 0.00016543469682057076, + "time_sec": 49.607982873916626 + }, + { + "epoch": 111, + "train_loss": 1.458272280807495, + "train_acc": 0.58544, + "test_loss": 9.91223872833252, + "test_acc": 0.0829, + "lyapunov": null, + "grad_norm": 0.657140008872575, + "grad_max_sv": 0.23369005173444748, + "grad_min_sv": 1.2170888367274423e-08, + "grad_condition": 42634071.92220701, + "lr": 0.00015772644703565552, + "time_sec": 49.6121985912323 + }, + { + "epoch": 112, + "train_loss": 1.4423779841613769, + "train_acc": 0.58982, + "test_loss": 10.218679902648926, + "test_acc": 0.0785, + "lyapunov": null, + "grad_norm": 0.6570457541981778, + "grad_max_sv": 0.2342597097158432, + "grad_min_sv": 1.2216584609550663e-08, + "grad_condition": 64070619.26224355, + "lr": 0.00015016832974331713, + "time_sec": 49.62796497344971 + }, + { + "epoch": 113, + "train_loss": 1.4301787731170654, + "train_acc": 0.58978, + "test_loss": 9.96994764251709, + "test_acc": 0.0848, + "lyapunov": null, + "grad_norm": 0.6545785705102263, + "grad_max_sv": 0.23776416704058648, + "grad_min_sv": 1.2195284053440059e-08, + "grad_condition": 29429303.691607207, + "lr": 0.00014276366018359834, + "time_sec": 49.63600516319275 + }, + { + "epoch": 114, + "train_loss": 1.431484651260376, + "train_acc": 0.59188, + "test_loss": 9.352456809234619, + "test_acc": 0.0912, + "lyapunov": null, + "grad_norm": 0.6560872782233574, + "grad_max_sv": 0.23789514154195784, + "grad_min_sv": 1.2277434646712493e-08, + "grad_condition": 29643562.652553707, + "lr": 0.00013551568628929425, + "time_sec": 49.64847278594971 + }, + { + "epoch": 115, + "train_loss": 1.4156108039093018, + "train_acc": 0.59466, + "test_loss": 9.393049124145508, + "test_acc": 0.0902, + "lyapunov": null, + "grad_norm": 0.6560202611490502, + "grad_max_sv": 0.23022275194525718, + "grad_min_sv": 1.211471579581902e-08, + "grad_condition": 29752416.717853196, + "lr": 0.00012842758726130276, + "time_sec": 49.646286725997925 + }, + { + "epoch": 116, + "train_loss": 1.419507451171875, + "train_acc": 0.59538, + "test_loss": 9.898611540222168, + "test_acc": 0.0823, + "lyapunov": null, + "grad_norm": 0.6554438751866899, + "grad_max_sv": 0.23169372119009496, + "grad_min_sv": 1.2254989865956301e-08, + "grad_condition": 32739963.172941543, + "lr": 0.0001215024721741218, + "time_sec": 49.66101384162903 + }, + { + "epoch": 117, + "train_loss": 1.4052832598495484, + "train_acc": 0.59742, + "test_loss": 9.80786139831543, + "test_acc": 0.0746, + "lyapunov": null, + "grad_norm": 0.6502624050693765, + "grad_max_sv": 0.23535267189145087, + "grad_min_sv": 1.2210560307313046e-08, + "grad_condition": 34512756.66701891, + "lr": 0.00011474337861210538, + "time_sec": 49.635112285614014 + }, + { + "epoch": 118, + "train_loss": 1.407028383216858, + "train_acc": 0.59456, + "test_loss": 9.323918186950683, + "test_acc": 0.0923, + "lyapunov": null, + "grad_norm": 0.6532731757355527, + "grad_max_sv": 0.23146636895835399, + "grad_min_sv": 1.2073984001492733e-08, + "grad_condition": 27415450.93514964, + "lr": 0.00010815327133708009, + "time_sec": 49.67300295829773 + }, + { + "epoch": 119, + "train_loss": 1.3942961041641235, + "train_acc": 0.60004, + "test_loss": 9.392257122802734, + "test_acc": 0.0923, + "lyapunov": null, + "grad_norm": 0.6512526041128694, + "grad_max_sv": 0.2304602511227131, + "grad_min_sv": 1.196873851000424e-08, + "grad_condition": 27052501.627034713, + "lr": 0.00010173504098790182, + "time_sec": 49.66038250923157 + }, + { + "epoch": 120, + "train_loss": 1.3861536862182617, + "train_acc": 0.60168, + "test_loss": 9.79215132522583, + "test_acc": 0.0883, + "lyapunov": null, + "grad_norm": 0.6546312963164914, + "grad_max_sv": 0.23524674400687218, + "grad_min_sv": 1.2223635334485117e-08, + "grad_condition": 23146281.84709592, + "lr": 9.549150281252629e-05, + "time_sec": 49.64855408668518 + }, + { + "epoch": 121, + "train_loss": 1.382921607093811, + "train_acc": 0.60466, + "test_loss": 9.083266135406495, + "test_acc": 0.1, + "lyapunov": null, + "grad_norm": 0.6533990071886453, + "grad_max_sv": 0.22603939548134805, + "grad_min_sv": 1.2147275964269344e-08, + "grad_condition": 31306417.63450122, + "lr": 8.942539543314794e-05, + "time_sec": 49.62118649482727 + }, + { + "epoch": 122, + "train_loss": 1.3776706603240967, + "train_acc": 0.60552, + "test_loss": 10.107886312866212, + "test_acc": 0.0771, + "lyapunov": null, + "grad_norm": 0.650347981554726, + "grad_max_sv": 0.22755396254360677, + "grad_min_sv": 1.200875722057182e-08, + "grad_condition": 26822439.671770982, + "lr": 8.353937964495024e-05, + "time_sec": 49.625091552734375 + }, + { + "epoch": 123, + "train_loss": 1.3719213924789428, + "train_acc": 0.60596, + "test_loss": 9.897831336212159, + "test_acc": 0.0827, + "lyapunov": null, + "grad_norm": 0.6494680388920978, + "grad_max_sv": 0.23135662637650967, + "grad_min_sv": 1.2129681067896137e-08, + "grad_condition": 24324265.536500372, + "lr": 7.783603724899243e-05, + "time_sec": 49.683146476745605 + }, + { + "epoch": 124, + "train_loss": 1.372097077255249, + "train_acc": 0.60532, + "test_loss": 9.392827641296387, + "test_acc": 0.091, + "lyapunov": null, + "grad_norm": 0.650191030859608, + "grad_max_sv": 0.2314681064337492, + "grad_min_sv": 1.2054343853651339e-08, + "grad_condition": 27641091.69673177, + "lr": 7.231786991974666e-05, + "time_sec": 49.71274280548096 + }, + { + "epoch": 125, + "train_loss": 1.370953790550232, + "train_acc": 0.6058, + "test_loss": 9.41628999938965, + "test_acc": 0.0969, + "lyapunov": null, + "grad_norm": 0.6479408268968022, + "grad_max_sv": 0.22912745289504527, + "grad_min_sv": 1.1926550955165816e-08, + "grad_condition": 38383449.24679903, + "lr": 6.698729810778072e-05, + "time_sec": 49.61937499046326 + }, + { + "epoch": 126, + "train_loss": 1.35777675239563, + "train_acc": 0.61084, + "test_loss": 9.729599977111816, + "test_acc": 0.084, + "lyapunov": null, + "grad_norm": 0.6511889017989357, + "grad_max_sv": 0.23615461364388465, + "grad_min_sv": 1.21181827100747e-08, + "grad_condition": 23269107.95301483, + "lr": 6.184665997806817e-05, + "time_sec": 49.616145610809326 + }, + { + "epoch": 127, + "train_loss": 1.3525141822052003, + "train_acc": 0.60988, + "test_loss": 9.375829245758057, + "test_acc": 0.0908, + "lyapunov": null, + "grad_norm": 0.6536840306066181, + "grad_max_sv": 0.23197561018168927, + "grad_min_sv": 1.2315820041575164e-08, + "grad_condition": 24883789.486126114, + "lr": 5.6898210384392595e-05, + "time_sec": 49.629499435424805 + }, + { + "epoch": 128, + "train_loss": 1.3482640004730224, + "train_acc": 0.61222, + "test_loss": 9.813197325134277, + "test_acc": 0.0856, + "lyapunov": null, + "grad_norm": 0.6514039873738223, + "grad_max_sv": 0.23501852825284003, + "grad_min_sv": 1.2142686500737909e-08, + "grad_condition": 25266297.201565318, + "lr": 5.214411988029363e-05, + "time_sec": 49.605358600616455 + }, + { + "epoch": 129, + "train_loss": 1.3569378799057006, + "train_acc": 0.60816, + "test_loss": 9.541576918029785, + "test_acc": 0.0874, + "lyapunov": null, + "grad_norm": 0.6517316484787671, + "grad_max_sv": 0.23406252562999724, + "grad_min_sv": 1.2258221140926118e-08, + "grad_condition": 29626662.60122323, + "lr": 4.7586473766990294e-05, + "time_sec": 49.625590085983276 + }, + { + "epoch": 130, + "train_loss": 1.3529891060638428, + "train_acc": 0.60898, + "test_loss": 9.487888061523437, + "test_acc": 0.0929, + "lyapunov": null, + "grad_norm": 0.6538198266172623, + "grad_max_sv": 0.23005600720643998, + "grad_min_sv": 1.201972722117417e-08, + "grad_condition": 37209362.20372974, + "lr": 4.32272711786996e-05, + "time_sec": 49.65739893913269 + }, + { + "epoch": 131, + "train_loss": 1.3454697626495362, + "train_acc": 0.61572, + "test_loss": 9.924783717346191, + "test_acc": 0.0811, + "lyapunov": null, + "grad_norm": 0.6551713288471978, + "grad_max_sv": 0.240146154910326, + "grad_min_sv": 1.2333497152738903e-08, + "grad_condition": 66623015.95467502, + "lr": 3.906842420574966e-05, + "time_sec": 49.62453866004944 + }, + { + "epoch": 132, + "train_loss": 1.3360938589859008, + "train_acc": 0.61616, + "test_loss": 9.586818018341065, + "test_acc": 0.0889, + "lyapunov": null, + "grad_norm": 0.6504956714032589, + "grad_max_sv": 0.23334665820002556, + "grad_min_sv": 1.2104059498446728e-08, + "grad_condition": 52369707.49757277, + "lr": 3.5111757055874305e-05, + "time_sec": 49.62921142578125 + }, + { + "epoch": 133, + "train_loss": 1.339883793449402, + "train_acc": 0.61552, + "test_loss": 9.673538793945312, + "test_acc": 0.0929, + "lyapunov": null, + "grad_norm": 0.6476453899351778, + "grad_max_sv": 0.23297516368329524, + "grad_min_sv": 1.2124888488021512e-08, + "grad_condition": 68199072.30592722, + "lr": 3.1359005254054254e-05, + "time_sec": 49.593669414520264 + }, + { + "epoch": 134, + "train_loss": 1.3361684355545045, + "train_acc": 0.61882, + "test_loss": 9.66245351715088, + "test_acc": 0.0778, + "lyapunov": null, + "grad_norm": 0.6491838850685481, + "grad_max_sv": 0.23596667721867562, + "grad_min_sv": 1.1881547391789926e-08, + "grad_condition": 40898877.174065895, + "lr": 2.7811814881259484e-05, + "time_sec": 49.60944747924805 + }, + { + "epoch": 135, + "train_loss": 1.3277960977554322, + "train_acc": 0.61818, + "test_loss": 9.974994463348388, + "test_acc": 0.0794, + "lyapunov": null, + "grad_norm": 0.6475029366208067, + "grad_max_sv": 0.2263253577053547, + "grad_min_sv": 1.206646519577581e-08, + "grad_condition": 59123509.407670066, + "lr": 2.4471741852423218e-05, + "time_sec": 49.63754081726074 + }, + { + "epoch": 136, + "train_loss": 1.3390293844604493, + "train_acc": 0.6147, + "test_loss": 9.827523893737792, + "test_acc": 0.0857, + "lyapunov": null, + "grad_norm": 0.6539959690699623, + "grad_max_sv": 0.2373226772993803, + "grad_min_sv": 1.2036285343408615e-08, + "grad_condition": 24295457.361463245, + "lr": 2.1340251233966362e-05, + "time_sec": 49.649282455444336 + }, + { + "epoch": 137, + "train_loss": 1.320917113571167, + "train_acc": 0.62042, + "test_loss": 10.049297039031982, + "test_acc": 0.0816, + "lyapunov": null, + "grad_norm": 0.6470381085306396, + "grad_max_sv": 0.22178312465548516, + "grad_min_sv": 1.1698476365396004e-08, + "grad_condition": 21323664.731712654, + "lr": 1.8418716601170932e-05, + "time_sec": 49.63605809211731 + }, + { + "epoch": 138, + "train_loss": 1.3167627235412598, + "train_acc": 0.6236, + "test_loss": 9.956857801055909, + "test_acc": 0.0836, + "lyapunov": null, + "grad_norm": 0.6460826791518621, + "grad_max_sv": 0.23469048999249936, + "grad_min_sv": 1.2084183138643886e-08, + "grad_condition": 303408536.5105225, + "lr": 1.570841943568445e-05, + "time_sec": 49.59550142288208 + }, + { + "epoch": 139, + "train_loss": 1.3184237383270263, + "train_acc": 0.6197, + "test_loss": 10.09333883972168, + "test_acc": 0.0839, + "lyapunov": null, + "grad_norm": 0.6477507203630667, + "grad_max_sv": 0.2281213853508234, + "grad_min_sv": 1.203405910962796e-08, + "grad_condition": 39837437.01020629, + "lr": 1.3210548563419845e-05, + "time_sec": 49.6094229221344 + }, + { + "epoch": 140, + "train_loss": 1.3220056551361083, + "train_acc": 0.61976, + "test_loss": 9.424947094726562, + "test_acc": 0.0942, + "lyapunov": null, + "grad_norm": 0.644643549451068, + "grad_max_sv": 0.22695489414036274, + "grad_min_sv": 1.1866805089966182e-08, + "grad_condition": 49710189.62801478, + "lr": 1.0926199633097203e-05, + "time_sec": 49.65405297279358 + }, + { + "epoch": 141, + "train_loss": 1.3249128121566773, + "train_acc": 0.61924, + "test_loss": 10.150922741699219, + "test_acc": 0.0839, + "lyapunov": null, + "grad_norm": 0.6496616529807254, + "grad_max_sv": 0.23303747363388538, + "grad_min_sv": 1.2297343177092301e-08, + "grad_condition": 32251173.502706695, + "lr": 8.856374635655688e-06, + "time_sec": 49.62998151779175 + }, + { + "epoch": 142, + "train_loss": 1.3221977783966063, + "train_acc": 0.61854, + "test_loss": 9.545345922851563, + "test_acc": 0.0896, + "lyapunov": null, + "grad_norm": 0.6498976979178819, + "grad_max_sv": 0.23321284241974355, + "grad_min_sv": 1.2192657036780297e-08, + "grad_condition": 38327958.94438372, + "lr": 7.001981464747503e-06, + "time_sec": 49.62353038787842 + }, + { + "epoch": 143, + "train_loss": 1.3161465112304687, + "train_acc": 0.62108, + "test_loss": 9.518995339202881, + "test_acc": 0.0904, + "lyapunov": null, + "grad_norm": 0.65049671322247, + "grad_max_sv": 0.2355397418141365, + "grad_min_sv": 1.2113919437006793e-08, + "grad_condition": 34055758.838127285, + "lr": 5.3638335185058295e-06, + "time_sec": 49.636550426483154 + }, + { + "epoch": 144, + "train_loss": 1.3199945546722411, + "train_acc": 0.61928, + "test_loss": 9.653044511413574, + "test_acc": 0.0889, + "lyapunov": null, + "grad_norm": 0.6510219033687272, + "grad_max_sv": 0.23736767545342446, + "grad_min_sv": 1.2120116818503668e-08, + "grad_condition": 26653772.592295133, + "lr": 3.942649342761114e-06, + "time_sec": 49.64809012413025 + }, + { + "epoch": 145, + "train_loss": 1.310637080039978, + "train_acc": 0.62316, + "test_loss": 10.082862811279297, + "test_acc": 0.0865, + "lyapunov": null, + "grad_norm": 0.6486131550644274, + "grad_max_sv": 0.23344326205551624, + "grad_min_sv": 1.1724270552321281e-08, + "grad_condition": 226542482.35064834, + "lr": 2.7390523158633524e-06, + "time_sec": 49.61792755126953 + }, + { + "epoch": 146, + "train_loss": 1.3224388639450073, + "train_acc": 0.62, + "test_loss": 10.004590126037598, + "test_acc": 0.083, + "lyapunov": null, + "grad_norm": 0.6514083277071326, + "grad_max_sv": 0.23273181915283203, + "grad_min_sv": 1.1958840047718951e-08, + "grad_condition": 1281589470.9369996, + "lr": 1.7535703752478133e-06, + "time_sec": 49.663915157318115 + }, + { + "epoch": 147, + "train_loss": 1.3165813917160034, + "train_acc": 0.62328, + "test_loss": 9.630343141174317, + "test_acc": 0.0889, + "lyapunov": null, + "grad_norm": 0.6474798234673506, + "grad_max_sv": 0.22821973785758018, + "grad_min_sv": 1.1936759166872312e-08, + "grad_condition": 467313215.8090695, + "lr": 9.866357858642196e-07, + "time_sec": 49.623547077178955 + }, + { + "epoch": 148, + "train_loss": 1.3181095361328126, + "train_acc": 0.61742, + "test_loss": 10.228155642700195, + "test_acc": 0.0788, + "lyapunov": null, + "grad_norm": 0.6510409626330189, + "grad_max_sv": 0.23130737692117692, + "grad_min_sv": 1.1935725464928826e-08, + "grad_condition": 55668871.204657175, + "lr": 4.38584950570808e-07, + "time_sec": 49.621832609176636 + }, + { + "epoch": 149, + "train_loss": 1.31113261013031, + "train_acc": 0.6221, + "test_loss": 9.91230221786499, + "test_acc": 0.0822, + "lyapunov": null, + "grad_norm": 0.6472982694090295, + "grad_max_sv": 0.2277739927172661, + "grad_min_sv": 1.1845563784029788e-08, + "grad_condition": 25904808.412874807, + "lr": 1.096582625772501e-07, + "time_sec": 49.62464380264282 + }, + { + "epoch": 150, + "train_loss": 1.3088498344039916, + "train_acc": 0.62396, + "test_loss": 9.814052784729004, + "test_acc": 0.0858, + "lyapunov": null, + "grad_norm": 0.6471687901699209, + "grad_max_sv": 0.23137033209204674, + "grad_min_sv": 1.2163310093502022e-08, + "grad_condition": 48891964.404683754, + "lr": 0.0, + "time_sec": 49.660566329956055 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 5.089254416656495, + "train_acc": 0.01344, + "test_loss": 4.870831555175781, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 5.582063459208639, + "grad_max_sv": 5.0306542873382565, + "grad_min_sv": 8.441757832766683e-08, + "grad_condition": 74707534.78681344, + "lr": 0.0009998903417374227, + "time_sec": 66.70783400535583 + }, + { + "epoch": 2, + "train_loss": 4.736304296569824, + "train_acc": 0.02172, + "test_loss": 4.92340059890747, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 4.087296772772229, + "grad_max_sv": 3.672157108783722, + "grad_min_sv": 6.109624839933935e-08, + "grad_condition": 230714811.36310124, + "lr": 0.0009995614150494292, + "time_sec": 66.69390416145325 + }, + { + "epoch": 3, + "train_loss": 4.52685978515625, + "train_acc": 0.03204, + "test_loss": 5.045831031799317, + "test_acc": 0.0094, + "lyapunov": null, + "grad_norm": 3.1470044543912175, + "grad_max_sv": 2.6447540044784548, + "grad_min_sv": 4.639755384339139e-08, + "grad_condition": 65625701.84585605, + "lr": 0.0009990133642141358, + "time_sec": 66.70076084136963 + }, + { + "epoch": 4, + "train_loss": 4.371717319641113, + "train_acc": 0.04112, + "test_loss": 4.993129699707032, + "test_acc": 0.0115, + "lyapunov": null, + "grad_norm": 2.5123688948843395, + "grad_max_sv": 2.1027904629707335, + "grad_min_sv": 3.615837387664633e-08, + "grad_condition": 418817692.03399765, + "lr": 0.0009982464296247522, + "time_sec": 66.71976566314697 + }, + { + "epoch": 5, + "train_loss": 4.27407361251831, + "train_acc": 0.0488, + "test_loss": 5.161634465789795, + "test_acc": 0.0119, + "lyapunov": null, + "grad_norm": 1.9573801826064445, + "grad_max_sv": 1.613087645173073, + "grad_min_sv": 2.8529539808364034e-08, + "grad_condition": 62747668.20627429, + "lr": 0.0009972609476841367, + "time_sec": 66.74850869178772 + }, + { + "epoch": 6, + "train_loss": 4.183251854553222, + "train_acc": 0.05812, + "test_loss": 5.447854755401611, + "test_acc": 0.0093, + "lyapunov": null, + "grad_norm": 1.436449079599314, + "grad_max_sv": 1.0459295481443405, + "grad_min_sv": 2.0654144772258576e-08, + "grad_condition": 94732574.16372415, + "lr": 0.000996057350657239, + "time_sec": 66.69263577461243 + }, + { + "epoch": 7, + "train_loss": 4.103355536193848, + "train_acc": 0.06872, + "test_loss": 5.544150679016114, + "test_acc": 0.0124, + "lyapunov": null, + "grad_norm": 1.082624040556548, + "grad_max_sv": 0.678101472556591, + "grad_min_sv": 1.6660088839048904e-08, + "grad_condition": 49338508.46283151, + "lr": 0.000994636166481494, + "time_sec": 66.69370245933533 + }, + { + "epoch": 8, + "train_loss": 4.040529095458984, + "train_acc": 0.07876, + "test_loss": 5.577163777160645, + "test_acc": 0.0172, + "lyapunov": null, + "grad_norm": 0.963869121683512, + "grad_max_sv": 0.5578698106110096, + "grad_min_sv": 1.4817374840991882e-08, + "grad_condition": 46172185.25999212, + "lr": 0.0009929980185352525, + "time_sec": 66.70931386947632 + }, + { + "epoch": 9, + "train_loss": 3.999490645446777, + "train_acc": 0.0856, + "test_loss": 5.472281336975097, + "test_acc": 0.0116, + "lyapunov": null, + "grad_norm": 0.9198022107734598, + "grad_max_sv": 0.5003849364817142, + "grad_min_sv": 1.3862486752946878e-08, + "grad_condition": 137028895.09887612, + "lr": 0.0009911436253643444, + "time_sec": 66.70475840568542 + }, + { + "epoch": 10, + "train_loss": 3.9641557629394533, + "train_acc": 0.09124, + "test_loss": 5.43024553604126, + "test_acc": 0.0112, + "lyapunov": null, + "grad_norm": 0.8539816540258655, + "grad_max_sv": 0.4397390566766262, + "grad_min_sv": 1.3177782898221579e-08, + "grad_condition": 50953468.3517745, + "lr": 0.0009890738003669028, + "time_sec": 66.75189590454102 + }, + { + "epoch": 11, + "train_loss": 3.912582547149658, + "train_acc": 0.09724, + "test_loss": 5.977069612121582, + "test_acc": 0.0115, + "lyapunov": null, + "grad_norm": 0.8304366482521061, + "grad_max_sv": 0.4253105387091637, + "grad_min_sv": 1.2851445623657253e-08, + "grad_condition": 192581837.7575304, + "lr": 0.00098678945143658, + "time_sec": 66.72230935096741 + }, + { + "epoch": 12, + "train_loss": 3.885940095291138, + "train_acc": 0.10388, + "test_loss": 5.707202329254151, + "test_acc": 0.0161, + "lyapunov": null, + "grad_norm": 0.7930567752358824, + "grad_max_sv": 0.3784016497433186, + "grad_min_sv": 1.2496499026196095e-08, + "grad_condition": 121475679.84002523, + "lr": 0.0009842915805643154, + "time_sec": 66.80430769920349 + }, + { + "epoch": 13, + "train_loss": 3.848949595184326, + "train_acc": 0.10982, + "test_loss": 5.604932201385498, + "test_acc": 0.0138, + "lyapunov": null, + "grad_norm": 0.7694655756397059, + "grad_max_sv": 0.36012797653675077, + "grad_min_sv": 1.2309415998654205e-08, + "grad_condition": 96913763.80192877, + "lr": 0.000981581283398829, + "time_sec": 66.77498316764832 + }, + { + "epoch": 14, + "train_loss": 3.822469270477295, + "train_acc": 0.11176, + "test_loss": 5.5594536964416505, + "test_acc": 0.0144, + "lyapunov": null, + "grad_norm": 0.751737952115685, + "grad_max_sv": 0.34815125875175, + "grad_min_sv": 1.1860258068707719e-08, + "grad_condition": 63821387.65591574, + "lr": 0.0009786597487660333, + "time_sec": 66.78450131416321 + }, + { + "epoch": 15, + "train_loss": 3.8008637019348144, + "train_acc": 0.11732, + "test_loss": 5.8510744079589845, + "test_acc": 0.0165, + "lyapunov": null, + "grad_norm": 0.7274896957635634, + "grad_max_sv": 0.3341310672461987, + "grad_min_sv": 1.185839371142805e-08, + "grad_condition": 51068114.03076443, + "lr": 0.0009755282581475766, + "time_sec": 66.75975847244263 + }, + { + "epoch": 16, + "train_loss": 3.7793116706085206, + "train_acc": 0.12078, + "test_loss": 6.094802139282226, + "test_acc": 0.0135, + "lyapunov": null, + "grad_norm": 0.7029997372387793, + "grad_max_sv": 0.31635181941092017, + "grad_min_sv": 1.1313535006052256e-08, + "grad_condition": 34061221.316739336, + "lr": 0.0009721881851187403, + "time_sec": 66.70034837722778 + }, + { + "epoch": 17, + "train_loss": 3.756349168548584, + "train_acc": 0.12318, + "test_loss": 6.524116158294678, + "test_acc": 0.0149, + "lyapunov": null, + "grad_norm": 0.6891476510098721, + "grad_max_sv": 0.30746029056608676, + "grad_min_sv": 1.1205093228272567e-08, + "grad_condition": 55101632.74828547, + "lr": 0.0009686409947459456, + "time_sec": 66.70887970924377 + }, + { + "epoch": 18, + "train_loss": 3.736860103225708, + "train_acc": 0.12666, + "test_loss": 6.334092637634277, + "test_acc": 0.0151, + "lyapunov": null, + "grad_norm": 0.6735913591792417, + "grad_max_sv": 0.3038469754159451, + "grad_min_sv": 1.1184529693109707e-08, + "grad_condition": 266599149.22808576, + "lr": 0.0009648882429441254, + "time_sec": 66.7028694152832 + }, + { + "epoch": 19, + "train_loss": 3.721009854812622, + "train_acc": 0.13104, + "test_loss": 6.503785885620117, + "test_acc": 0.0158, + "lyapunov": null, + "grad_norm": 0.6543898752326373, + "grad_max_sv": 0.2952485930174589, + "grad_min_sv": 1.0702305973386839e-08, + "grad_condition": 36178987.94815246, + "lr": 0.00096093157579425, + "time_sec": 66.91662836074829 + }, + { + "epoch": 20, + "train_loss": 3.6978233711242674, + "train_acc": 0.13484, + "test_loss": 7.133095213317871, + "test_acc": 0.014, + "lyapunov": null, + "grad_norm": 0.6416047326169007, + "grad_max_sv": 0.2835653819143772, + "grad_min_sv": 1.061290202941656e-08, + "grad_condition": 29580333.508830875, + "lr": 0.0009567727288213001, + "time_sec": 66.7187888622284 + }, + { + "epoch": 21, + "train_loss": 3.678186371612549, + "train_acc": 0.13804, + "test_loss": 6.526899772644043, + "test_acc": 0.0165, + "lyapunov": null, + "grad_norm": 0.6346445495636812, + "grad_max_sv": 0.2758004698902369, + "grad_min_sv": 1.0650165743059103e-08, + "grad_condition": 50339413.533409506, + "lr": 0.0009524135262330095, + "time_sec": 66.77347826957703 + }, + { + "epoch": 22, + "train_loss": 3.6615531184387207, + "train_acc": 0.13652, + "test_loss": 7.463528224182129, + "test_acc": 0.0149, + "lyapunov": null, + "grad_norm": 0.6211761686754148, + "grad_max_sv": 0.2590024430304766, + "grad_min_sv": 1.0093259970866963e-08, + "grad_condition": 54350139.527433194, + "lr": 0.0009478558801197061, + "time_sec": 66.74172306060791 + }, + { + "epoch": 23, + "train_loss": 3.646244419708252, + "train_acc": 0.14018, + "test_loss": 7.247557836151123, + "test_acc": 0.0133, + "lyapunov": null, + "grad_norm": 0.6087560504487702, + "grad_max_sv": 0.26471212282776835, + "grad_min_sv": 1.0175153231789525e-08, + "grad_condition": 76037868.51400027, + "lr": 0.000943101789615607, + "time_sec": 66.74379682540894 + }, + { + "epoch": 24, + "train_loss": 3.6286012983703615, + "train_acc": 0.14502, + "test_loss": 7.168135193634034, + "test_acc": 0.0191, + "lyapunov": null, + "grad_norm": 0.5998778506859267, + "grad_max_sv": 0.24980814158916473, + "grad_min_sv": 1.0037150326158706e-08, + "grad_condition": 32920800.60529256, + "lr": 0.0009381533400219313, + "time_sec": 66.68860864639282 + }, + { + "epoch": 25, + "train_loss": 3.6192829264831543, + "train_acc": 0.14634, + "test_loss": 7.535636337280273, + "test_acc": 0.0161, + "lyapunov": null, + "grad_norm": 0.5983012708829252, + "grad_max_sv": 0.2530865453183651, + "grad_min_sv": 9.982956203358206e-09, + "grad_condition": 29219670.862144046, + "lr": 0.0009330127018922189, + "time_sec": 66.75418090820312 + }, + { + "epoch": 26, + "train_loss": 3.6001767744445803, + "train_acc": 0.1487, + "test_loss": 6.850593623352051, + "test_acc": 0.0151, + "lyapunov": null, + "grad_norm": 0.5947140415117098, + "grad_max_sv": 0.24490244090557098, + "grad_min_sv": 9.946103620567249e-09, + "grad_condition": 94915701.68580723, + "lr": 0.000927682130080253, + "time_sec": 66.72897815704346 + }, + { + "epoch": 27, + "train_loss": 3.5885346211242677, + "train_acc": 0.15218, + "test_loss": 7.121657147216797, + "test_acc": 0.0175, + "lyapunov": null, + "grad_norm": 0.5825348653665754, + "grad_max_sv": 0.2360658310353756, + "grad_min_sv": 9.758478072829923e-09, + "grad_condition": 28325624.288454544, + "lr": 0.0009221639627510072, + "time_sec": 66.82140755653381 + }, + { + "epoch": 28, + "train_loss": 3.5699786253356933, + "train_acc": 0.15318, + "test_loss": 7.339261558532715, + "test_acc": 0.0157, + "lyapunov": null, + "grad_norm": 0.5731165313342855, + "grad_max_sv": 0.23213129304349422, + "grad_min_sv": 9.869128861361709e-09, + "grad_condition": 27851276.279406942, + "lr": 0.0009164606203550494, + "time_sec": 66.72496843338013 + }, + { + "epoch": 29, + "train_loss": 3.562197733078003, + "train_acc": 0.15604, + "test_loss": 7.580322309875489, + "test_acc": 0.0165, + "lyapunov": null, + "grad_norm": 0.5656101207986921, + "grad_max_sv": 0.21968504451215268, + "grad_min_sv": 9.579083420918621e-09, + "grad_condition": 25012099.962059125, + "lr": 0.0009105746045668516, + "time_sec": 66.69681811332703 + }, + { + "epoch": 30, + "train_loss": 3.560017660369873, + "train_acc": 0.15662, + "test_loss": 7.44054066619873, + "test_acc": 0.0173, + "lyapunov": null, + "grad_norm": 0.5599580597173339, + "grad_max_sv": 0.2209590796381235, + "grad_min_sv": 9.39374856998021e-09, + "grad_condition": 61658396.11314602, + "lr": 0.0009045084971874733, + "time_sec": 66.69601655006409 + }, + { + "epoch": 31, + "train_loss": 3.5422336725616455, + "train_acc": 0.1599, + "test_loss": 7.076059481048584, + "test_acc": 0.0198, + "lyapunov": null, + "grad_norm": 0.5515859229373342, + "grad_max_sv": 0.21789075396955013, + "grad_min_sv": 9.395337015327687e-09, + "grad_condition": 33141907.468724538, + "lr": 0.0008982649590120977, + "time_sec": 66.75024151802063 + }, + { + "epoch": 32, + "train_loss": 3.529042202835083, + "train_acc": 0.15972, + "test_loss": 7.7532018966674805, + "test_acc": 0.0155, + "lyapunov": null, + "grad_norm": 0.5497951397745081, + "grad_max_sv": 0.20885453820228578, + "grad_min_sv": 9.25596560404085e-09, + "grad_condition": 82473516.26766083, + "lr": 0.0008918467286629196, + "time_sec": 66.80956888198853 + }, + { + "epoch": 33, + "train_loss": 3.51621552734375, + "train_acc": 0.1644, + "test_loss": 6.8358760055542, + "test_acc": 0.0194, + "lyapunov": null, + "grad_norm": 0.5469890700179638, + "grad_max_sv": 0.21847443841397762, + "grad_min_sv": 9.440127946014343e-09, + "grad_condition": 25421324.334352963, + "lr": 0.0008852566213878943, + "time_sec": 66.7693350315094 + }, + { + "epoch": 34, + "train_loss": 3.5162335932922364, + "train_acc": 0.16484, + "test_loss": 6.398185224914551, + "test_acc": 0.0185, + "lyapunov": null, + "grad_norm": 0.5383581492940669, + "grad_max_sv": 0.20689108446240426, + "grad_min_sv": 9.233877815151281e-09, + "grad_condition": 27064375.409329318, + "lr": 0.000878497527825878, + "time_sec": 66.79785513877869 + }, + { + "epoch": 35, + "train_loss": 3.5035785108184814, + "train_acc": 0.16536, + "test_loss": 7.335230517578125, + "test_acc": 0.0195, + "lyapunov": null, + "grad_norm": 0.5402027402758915, + "grad_max_sv": 0.20682688914239405, + "grad_min_sv": 9.348574800394082e-09, + "grad_condition": 28438563.468850803, + "lr": 0.000871572412738697, + "time_sec": 66.81045579910278 + }, + { + "epoch": 36, + "train_loss": 3.493286726074219, + "train_acc": 0.16834, + "test_loss": 6.502911682128906, + "test_acc": 0.0259, + "lyapunov": null, + "grad_norm": 0.5280034242832364, + "grad_max_sv": 0.19797059781849385, + "grad_min_sv": 9.105119513908022e-09, + "grad_condition": 25415325.485806335, + "lr": 0.0008644843137107055, + "time_sec": 66.76097869873047 + }, + { + "epoch": 37, + "train_loss": 3.4780256481933596, + "train_acc": 0.1702, + "test_loss": 7.499637036132812, + "test_acc": 0.0188, + "lyapunov": null, + "grad_norm": 0.5321877448382957, + "grad_max_sv": 0.19945566728711128, + "grad_min_sv": 9.11805770470453e-09, + "grad_condition": 72290792.90222318, + "lr": 0.0008572363398164014, + "time_sec": 66.87902355194092 + }, + { + "epoch": 38, + "train_loss": 3.4674857460021973, + "train_acc": 0.17068, + "test_loss": 6.972921762847901, + "test_acc": 0.0224, + "lyapunov": null, + "grad_norm": 0.5289491654487876, + "grad_max_sv": 0.19467646181583403, + "grad_min_sv": 9.052938640397023e-09, + "grad_condition": 27977910.49401158, + "lr": 0.0008498316702566826, + "time_sec": 66.71038794517517 + }, + { + "epoch": 39, + "train_loss": 3.456567892379761, + "train_acc": 0.1718, + "test_loss": 7.583123879241944, + "test_acc": 0.0204, + "lyapunov": null, + "grad_norm": 0.5257287769620685, + "grad_max_sv": 0.19668871462345122, + "grad_min_sv": 9.095625710942024e-09, + "grad_condition": 27660923.67992892, + "lr": 0.0008422735529643442, + "time_sec": 66.70259189605713 + }, + { + "epoch": 40, + "train_loss": 3.439600283050537, + "train_acc": 0.17702, + "test_loss": 7.07623366394043, + "test_acc": 0.0194, + "lyapunov": null, + "grad_norm": 0.5218212705616453, + "grad_max_sv": 0.19257443137466906, + "grad_min_sv": 8.974160192742886e-09, + "grad_condition": 24645717.0349477, + "lr": 0.0008345653031794289, + "time_sec": 66.69467544555664 + }, + { + "epoch": 41, + "train_loss": 3.441303518218994, + "train_acc": 0.17488, + "test_loss": 7.0255078727722164, + "test_acc": 0.0229, + "lyapunov": null, + "grad_norm": 0.51868028277477, + "grad_max_sv": 0.19331826008856295, + "grad_min_sv": 9.044294972671008e-09, + "grad_condition": 26826321.000719573, + "lr": 0.0008267103019950526, + "time_sec": 66.69299244880676 + }, + { + "epoch": 42, + "train_loss": 3.4292957513427735, + "train_acc": 0.17452, + "test_loss": 7.204381840515136, + "test_acc": 0.0259, + "lyapunov": null, + "grad_norm": 0.5253643254473546, + "grad_max_sv": 0.19751012995839118, + "grad_min_sv": 9.221263796987956e-09, + "grad_condition": 24125885.16929126, + "lr": 0.0008187119948743447, + "time_sec": 66.71035814285278 + }, + { + "epoch": 43, + "train_loss": 3.4281089696502685, + "train_acc": 0.17694, + "test_loss": 7.537664138793946, + "test_acc": 0.0211, + "lyapunov": null, + "grad_norm": 0.5194108534896916, + "grad_max_sv": 0.2011748518794775, + "grad_min_sv": 9.108393971002382e-09, + "grad_condition": 44095500.51692389, + "lr": 0.000810573890139155, + "time_sec": 66.8431122303009 + }, + { + "epoch": 44, + "train_loss": 3.4221175812530515, + "train_acc": 0.1796, + "test_loss": 7.407726572418213, + "test_acc": 0.0196, + "lyapunov": null, + "grad_norm": 0.5178702018876962, + "grad_max_sv": 0.19308201856911184, + "grad_min_sv": 9.019754657058065e-09, + "grad_condition": 26647196.819321267, + "lr": 0.0008022995574311873, + "time_sec": 66.78941011428833 + }, + { + "epoch": 45, + "train_loss": 3.400263899459839, + "train_acc": 0.18424, + "test_loss": 6.749155438232422, + "test_acc": 0.0251, + "lyapunov": null, + "grad_norm": 0.518187566195941, + "grad_max_sv": 0.18997054174542427, + "grad_min_sv": 8.950063522597528e-09, + "grad_condition": 64164305.6683145, + "lr": 0.0007938926261462363, + "time_sec": 66.72000646591187 + }, + { + "epoch": 46, + "train_loss": 3.395167677078247, + "train_acc": 0.18308, + "test_loss": 6.933445383453369, + "test_acc": 0.0219, + "lyapunov": null, + "grad_norm": 0.5105878399725617, + "grad_max_sv": 0.18559869714081287, + "grad_min_sv": 8.806649112215459e-09, + "grad_condition": 120544633.7455566, + "lr": 0.0007853567838422158, + "time_sec": 66.71739363670349 + }, + { + "epoch": 47, + "train_loss": 3.3893753800964355, + "train_acc": 0.18392, + "test_loss": 7.526408071899414, + "test_acc": 0.0222, + "lyapunov": null, + "grad_norm": 0.5062040296706847, + "grad_max_sv": 0.18082244805991649, + "grad_min_sv": 8.976306442587401e-09, + "grad_condition": 29608816.90495221, + "lr": 0.0007766957746216719, + "time_sec": 66.72174620628357 + }, + { + "epoch": 48, + "train_loss": 3.3721413567352294, + "train_acc": 0.18658, + "test_loss": 6.825230180358886, + "test_acc": 0.0242, + "lyapunov": null, + "grad_norm": 0.5095470173179549, + "grad_max_sv": 0.18853078819811345, + "grad_min_sv": 8.948983057366356e-09, + "grad_condition": 26865035.338588893, + "lr": 0.0007679133974894982, + "time_sec": 66.80622148513794 + }, + { + "epoch": 49, + "train_loss": 3.3716752050018313, + "train_acc": 0.18754, + "test_loss": 7.223709740447998, + "test_acc": 0.0303, + "lyapunov": null, + "grad_norm": 0.5066211171288654, + "grad_max_sv": 0.1869507610797882, + "grad_min_sv": 8.992035052668434e-09, + "grad_condition": 23283441.10076283, + "lr": 0.000759013504686565, + "time_sec": 66.81845688819885 + }, + { + "epoch": 50, + "train_loss": 3.3587275280761717, + "train_acc": 0.19086, + "test_loss": 6.7569826782226565, + "test_acc": 0.0243, + "lyapunov": null, + "grad_norm": 0.506317038211902, + "grad_max_sv": 0.18107994161546231, + "grad_min_sv": 8.999141074342299e-09, + "grad_condition": 200538246.60999444, + "lr": 0.0007499999999999998, + "time_sec": 66.70761036872864 + }, + { + "epoch": 51, + "train_loss": 3.3526639527130127, + "train_acc": 0.19188, + "test_loss": 6.670795946502685, + "test_acc": 0.0283, + "lyapunov": null, + "grad_norm": 0.5023637852793532, + "grad_max_sv": 0.1799766130745411, + "grad_min_sv": 9.005793131719453e-09, + "grad_condition": 60303250.12300022, + "lr": 0.0007408768370508575, + "time_sec": 66.8078305721283 + }, + { + "epoch": 52, + "train_loss": 3.3506644287872316, + "train_acc": 0.19068, + "test_loss": 7.382517870330811, + "test_acc": 0.022, + "lyapunov": null, + "grad_norm": 0.49959851459507565, + "grad_max_sv": 0.17121989093720913, + "grad_min_sv": 8.849344752120958e-09, + "grad_condition": 34334249.77637265, + "lr": 0.0007316480175599307, + "time_sec": 66.78811454772949 + }, + { + "epoch": 53, + "train_loss": 3.3417568744659425, + "train_acc": 0.19254, + "test_loss": 8.142177056884766, + "test_acc": 0.0233, + "lyapunov": null, + "grad_norm": 0.4981274188163727, + "grad_max_sv": 0.17399160973727704, + "grad_min_sv": 8.837567241903877e-09, + "grad_condition": 24739202.69426199, + "lr": 0.0007223175895924635, + "time_sec": 66.85724830627441 + }, + { + "epoch": 54, + "train_loss": 3.3355814123535157, + "train_acc": 0.1957, + "test_loss": 6.92948182220459, + "test_acc": 0.0248, + "lyapunov": null, + "grad_norm": 0.49764414817443375, + "grad_max_sv": 0.17371546551585199, + "grad_min_sv": 8.84867411088744e-09, + "grad_condition": 150304225.8365222, + "lr": 0.0007128896457825361, + "time_sec": 66.71973633766174 + }, + { + "epoch": 55, + "train_loss": 3.326216081542969, + "train_acc": 0.19418, + "test_loss": 7.809853678131104, + "test_acc": 0.023, + "lyapunov": null, + "grad_norm": 0.4993878218606792, + "grad_max_sv": 0.17109079472720623, + "grad_min_sv": 8.849828239676505e-09, + "grad_condition": 22057140.335132368, + "lr": 0.0007033683215378998, + "time_sec": 66.97141337394714 + }, + { + "epoch": 56, + "train_loss": 3.319088702545166, + "train_acc": 0.19614, + "test_loss": 7.596286960601807, + "test_acc": 0.0212, + "lyapunov": null, + "grad_norm": 0.49667047439168693, + "grad_max_sv": 0.16795397438108922, + "grad_min_sv": 8.856667624290716e-09, + "grad_condition": 21032117.189596005, + "lr": 0.0006937577932260512, + "time_sec": 66.70526051521301 + }, + { + "epoch": 57, + "train_loss": 3.303804122848511, + "train_acc": 0.19878, + "test_loss": 7.291678775024414, + "test_acc": 0.02, + "lyapunov": null, + "grad_norm": 0.499572780086862, + "grad_max_sv": 0.17316541597247123, + "grad_min_sv": 8.944026716473098e-09, + "grad_condition": 23580602.560242586, + "lr": 0.0006840622763423388, + "time_sec": 66.72219276428223 + }, + { + "epoch": 58, + "train_loss": 3.2961739293670655, + "train_acc": 0.20036, + "test_loss": 7.379423007202148, + "test_acc": 0.0215, + "lyapunov": null, + "grad_norm": 0.49780422530713136, + "grad_max_sv": 0.17306868806481362, + "grad_min_sv": 8.897491003689862e-09, + "grad_condition": 33645085.03834008, + "lr": 0.0006742860236609073, + "time_sec": 66.7072229385376 + }, + { + "epoch": 59, + "train_loss": 3.292852275466919, + "train_acc": 0.20314, + "test_loss": 6.699318830871582, + "test_acc": 0.0262, + "lyapunov": null, + "grad_norm": 0.49686323718116887, + "grad_max_sv": 0.17558623403310775, + "grad_min_sv": 8.761962172476601e-09, + "grad_condition": 38386994.848281495, + "lr": 0.0006644333233692913, + "time_sec": 66.72137403488159 + }, + { + "epoch": 60, + "train_loss": 3.2881739818573, + "train_acc": 0.20208, + "test_loss": 6.617448914337158, + "test_acc": 0.0235, + "lyapunov": null, + "grad_norm": 0.4972800368236651, + "grad_max_sv": 0.17418485544621945, + "grad_min_sv": 8.887109359534406e-09, + "grad_condition": 23772781.473704576, + "lr": 0.0006545084971874734, + "time_sec": 66.76340699195862 + }, + { + "epoch": 61, + "train_loss": 3.2832211613464355, + "train_acc": 0.20396, + "test_loss": 7.8168681640625, + "test_acc": 0.0196, + "lyapunov": null, + "grad_norm": 0.49347264852603, + "grad_max_sv": 0.16998312883079053, + "grad_min_sv": 8.87461152343505e-09, + "grad_condition": 22196538.972435523, + "lr": 0.0006445158984722354, + "time_sec": 66.69128584861755 + }, + { + "epoch": 62, + "train_loss": 3.267657317352295, + "train_acc": 0.20602, + "test_loss": 6.787965573120117, + "test_acc": 0.0226, + "lyapunov": null, + "grad_norm": 0.4942819436191628, + "grad_max_sv": 0.1665095403790474, + "grad_min_sv": 8.805719026172553e-09, + "grad_condition": 21888086.61137065, + "lr": 0.0006344599103076324, + "time_sec": 66.72603845596313 + }, + { + "epoch": 63, + "train_loss": 3.264744351043701, + "train_acc": 0.20522, + "test_loss": 7.947964939117432, + "test_acc": 0.0218, + "lyapunov": null, + "grad_norm": 0.49153660537625127, + "grad_max_sv": 0.16237439326941966, + "grad_min_sv": 8.742884187451505e-09, + "grad_condition": 23911997.384101003, + "lr": 0.0006243449435824269, + "time_sec": 66.6943769454956 + }, + { + "epoch": 64, + "train_loss": 3.2640425563812254, + "train_acc": 0.20452, + "test_loss": 7.12151423034668, + "test_acc": 0.0256, + "lyapunov": null, + "grad_norm": 0.49384434943361655, + "grad_max_sv": 0.168024880066514, + "grad_min_sv": 8.758979427869739e-09, + "grad_condition": 21739668.66096285, + "lr": 0.0006141754350553275, + "time_sec": 66.69389152526855 + }, + { + "epoch": 65, + "train_loss": 3.244006223831177, + "train_acc": 0.21052, + "test_loss": 7.017924461364746, + "test_acc": 0.0234, + "lyapunov": null, + "grad_norm": 0.49421653603545956, + "grad_max_sv": 0.1682070516049862, + "grad_min_sv": 8.867816919666538e-09, + "grad_condition": 33570918.978102654, + "lr": 0.0006039558454088793, + "time_sec": 66.70642900466919 + }, + { + "epoch": 66, + "train_loss": 3.2429666870880127, + "train_acc": 0.2095, + "test_loss": 7.507377795410156, + "test_acc": 0.0247, + "lyapunov": null, + "grad_norm": 0.4920675755358138, + "grad_max_sv": 0.16653703041374684, + "grad_min_sv": 8.782905018545061e-09, + "grad_condition": 33037433.310028076, + "lr": 0.000593690657292862, + "time_sec": 66.69945740699768 + }, + { + "epoch": 67, + "train_loss": 3.235812818222046, + "train_acc": 0.21004, + "test_loss": 8.179235096740722, + "test_acc": 0.0199, + "lyapunov": null, + "grad_norm": 0.49143560072681164, + "grad_max_sv": 0.16453767009079456, + "grad_min_sv": 8.906316832646422e-09, + "grad_condition": 24459655.594651837, + "lr": 0.0005833843733580507, + "time_sec": 66.68722915649414 + }, + { + "epoch": 68, + "train_loss": 3.2230448572540285, + "train_acc": 0.21154, + "test_loss": 7.499305305480957, + "test_acc": 0.0213, + "lyapunov": null, + "grad_norm": 0.49248528868620167, + "grad_max_sv": 0.16838400289416314, + "grad_min_sv": 8.870841536334773e-09, + "grad_condition": 21419108.58487917, + "lr": 0.0005730415142812054, + "time_sec": 66.70680451393127 + }, + { + "epoch": 69, + "train_loss": 3.2205778658294677, + "train_acc": 0.21464, + "test_loss": 7.50203574142456, + "test_acc": 0.0244, + "lyapunov": null, + "grad_norm": 0.4909914070718711, + "grad_max_sv": 0.1646382961422205, + "grad_min_sv": 8.7063952491917e-09, + "grad_condition": 22220196.366961446, + "lr": 0.0005626666167821517, + "time_sec": 66.76639890670776 + }, + { + "epoch": 70, + "train_loss": 3.207180488128662, + "train_acc": 0.21516, + "test_loss": 7.001610806274414, + "test_acc": 0.0258, + "lyapunov": null, + "grad_norm": 0.495424727651562, + "grad_max_sv": 0.16553561352193355, + "grad_min_sv": 8.972080669383819e-09, + "grad_condition": 47422658.54318248, + "lr": 0.0005522642316338265, + "time_sec": 66.70834302902222 + }, + { + "epoch": 71, + "train_loss": 3.2062013800048828, + "train_acc": 0.21612, + "test_loss": 6.927703591156006, + "test_acc": 0.0308, + "lyapunov": null, + "grad_norm": 0.49114896439763267, + "grad_max_sv": 0.16479650065302848, + "grad_min_sv": 8.813466856327778e-09, + "grad_condition": 43207807.33314108, + "lr": 0.0005418389216661573, + "time_sec": 66.71610283851624 + }, + { + "epoch": 72, + "train_loss": 3.1919854682922364, + "train_acc": 0.21694, + "test_loss": 6.498612490844726, + "test_acc": 0.0294, + "lyapunov": null, + "grad_norm": 0.49506236999909303, + "grad_max_sv": 0.16502842903137208, + "grad_min_sv": 8.951233382292757e-09, + "grad_condition": 20833946.329851203, + "lr": 0.0005313952597646563, + "time_sec": 66.70564031600952 + }, + { + "epoch": 73, + "train_loss": 3.19263421005249, + "train_acc": 0.22014, + "test_loss": 7.917480190277099, + "test_acc": 0.0215, + "lyapunov": null, + "grad_norm": 0.4934923943021254, + "grad_max_sv": 0.1658387891948223, + "grad_min_sv": 8.915270069409509e-09, + "grad_condition": 23230788.976801574, + "lr": 0.0005209378268645994, + "time_sec": 66.77329587936401 + }, + { + "epoch": 74, + "train_loss": 3.185640338821411, + "train_acc": 0.21906, + "test_loss": 7.357819847106933, + "test_acc": 0.0252, + "lyapunov": null, + "grad_norm": 0.4911097758269761, + "grad_max_sv": 0.16611208710819483, + "grad_min_sv": 8.851672780169073e-09, + "grad_condition": 58442839.12499788, + "lr": 0.0005104712099416781, + "time_sec": 66.684730052948 + }, + { + "epoch": 75, + "train_loss": 3.1690349718475344, + "train_acc": 0.2239, + "test_loss": 7.2397661224365235, + "test_acc": 0.0256, + "lyapunov": null, + "grad_norm": 0.4906690124125115, + "grad_max_sv": 0.16415953114628792, + "grad_min_sv": 8.816434821090625e-09, + "grad_condition": 20409708.15696338, + "lr": 0.0004999999999999996, + "time_sec": 66.71101260185242 + }, + { + "epoch": 76, + "train_loss": 3.1630740728759767, + "train_acc": 0.2228, + "test_loss": 7.3856810913085935, + "test_acc": 0.0247, + "lyapunov": null, + "grad_norm": 0.4942494495158576, + "grad_max_sv": 0.16416314020752906, + "grad_min_sv": 8.881746908773192e-09, + "grad_condition": 22916920.692442246, + "lr": 0.0004895287900583212, + "time_sec": 66.72276592254639 + }, + { + "epoch": 77, + "train_loss": 3.157883042678833, + "train_acc": 0.2226, + "test_loss": 7.461940403747558, + "test_acc": 0.0279, + "lyapunov": null, + "grad_norm": 0.48944835890506283, + "grad_max_sv": 0.16295542381703854, + "grad_min_sv": 8.790652895884766e-09, + "grad_condition": 25190467.13440006, + "lr": 0.0004790621731353997, + "time_sec": 66.73238253593445 + }, + { + "epoch": 78, + "train_loss": 3.15415998550415, + "train_acc": 0.2232, + "test_loss": 7.546776051330567, + "test_acc": 0.027, + "lyapunov": null, + "grad_norm": 0.48925024138964845, + "grad_max_sv": 0.1628365319222212, + "grad_min_sv": 8.811498453109578e-09, + "grad_condition": 23075857.06663191, + "lr": 0.000468604740235343, + "time_sec": 66.73092246055603 + }, + { + "epoch": 79, + "train_loss": 3.1458859318542483, + "train_acc": 0.22802, + "test_loss": 7.108101511383056, + "test_acc": 0.0285, + "lyapunov": null, + "grad_norm": 0.495366871838511, + "grad_max_sv": 0.1650368317961693, + "grad_min_sv": 9.025954333247154e-09, + "grad_condition": 38457801.29496137, + "lr": 0.00045816107833384175, + "time_sec": 66.74371480941772 + }, + { + "epoch": 80, + "train_loss": 3.140154826583862, + "train_acc": 0.2266, + "test_loss": 7.284811801147461, + "test_acc": 0.0302, + "lyapunov": null, + "grad_norm": 0.4914271153786783, + "grad_max_sv": 0.16505839116871357, + "grad_min_sv": 8.893962011443865e-09, + "grad_condition": 369021517.7075845, + "lr": 0.0004477357683661729, + "time_sec": 66.69183111190796 + }, + { + "epoch": 81, + "train_loss": 3.1333287098693847, + "train_acc": 0.22694, + "test_loss": 7.571458190917968, + "test_acc": 0.0209, + "lyapunov": null, + "grad_norm": 0.494073529942036, + "grad_max_sv": 0.1608546230942011, + "grad_min_sv": 9.091243879932875e-09, + "grad_condition": 20891716.667523753, + "lr": 0.00043733338321784746, + "time_sec": 66.71526265144348 + }, + { + "epoch": 82, + "train_loss": 3.1283695087432863, + "train_acc": 0.23006, + "test_loss": 7.788016625976563, + "test_acc": 0.024, + "lyapunov": null, + "grad_norm": 0.49129892073668435, + "grad_max_sv": 0.16086806021630765, + "grad_min_sv": 8.920912475049448e-09, + "grad_condition": 47898591.96295839, + "lr": 0.0004269584857187939, + "time_sec": 66.69153666496277 + }, + { + "epoch": 83, + "train_loss": 3.130916413574219, + "train_acc": 0.23138, + "test_loss": 7.913901668548584, + "test_acc": 0.0261, + "lyapunov": null, + "grad_norm": 0.48912391484879925, + "grad_max_sv": 0.16135921962559224, + "grad_min_sv": 9.076431696855569e-09, + "grad_condition": 50854672.26653309, + "lr": 0.0004166156266419484, + "time_sec": 66.75194883346558 + }, + { + "epoch": 84, + "train_loss": 3.116759624481201, + "train_acc": 0.22928, + "test_loss": 7.443206707763672, + "test_acc": 0.0267, + "lyapunov": null, + "grad_norm": 0.49216768079497325, + "grad_max_sv": 0.16190627813339234, + "grad_min_sv": 9.013408105995602e-09, + "grad_condition": 22062192.06550083, + "lr": 0.0004063093427071373, + "time_sec": 66.76291751861572 + }, + { + "epoch": 85, + "train_loss": 3.1119228192138673, + "train_acc": 0.23272, + "test_loss": 7.789751325988769, + "test_acc": 0.028, + "lyapunov": null, + "grad_norm": 0.4906237938270759, + "grad_max_sv": 0.16028195321559907, + "grad_min_sv": 8.904607010085108e-09, + "grad_condition": 21362215.652891032, + "lr": 0.0003960441545911199, + "time_sec": 66.72702622413635 + }, + { + "epoch": 86, + "train_loss": 3.095892171173096, + "train_acc": 0.23322, + "test_loss": 7.520130683135986, + "test_acc": 0.0265, + "lyapunov": null, + "grad_norm": 0.49558582555905584, + "grad_max_sv": 0.15913640297949314, + "grad_min_sv": 9.008386794850943e-09, + "grad_condition": 19711267.83894111, + "lr": 0.0003858245649446718, + "time_sec": 66.69949555397034 + }, + { + "epoch": 87, + "train_loss": 3.0982225965118406, + "train_acc": 0.23538, + "test_loss": 7.958539725494385, + "test_acc": 0.0227, + "lyapunov": null, + "grad_norm": 0.4928264723148802, + "grad_max_sv": 0.16157768219709395, + "grad_min_sv": 9.009624502009927e-09, + "grad_condition": 22513594.923468076, + "lr": 0.00037565505641757235, + "time_sec": 66.7021861076355 + }, + { + "epoch": 88, + "train_loss": 3.0881566471099853, + "train_acc": 0.23704, + "test_loss": 7.651519326782227, + "test_acc": 0.0317, + "lyapunov": null, + "grad_norm": 0.4925350840337203, + "grad_max_sv": 0.16133950129151345, + "grad_min_sv": 8.917141037720344e-09, + "grad_condition": 46990788.85548556, + "lr": 0.00036554008969236695, + "time_sec": 66.71680331230164 + }, + { + "epoch": 89, + "train_loss": 3.0752701135253906, + "train_acc": 0.24002, + "test_loss": 8.03997054977417, + "test_acc": 0.0266, + "lyapunov": null, + "grad_norm": 0.49191590245060596, + "grad_max_sv": 0.16232036016881465, + "grad_min_sv": 8.918097575694173e-09, + "grad_condition": 40862815.39075501, + "lr": 0.0003554841015277638, + "time_sec": 66.69313955307007 + }, + { + "epoch": 90, + "train_loss": 3.078908212738037, + "train_acc": 0.24046, + "test_loss": 7.6376062118530275, + "test_acc": 0.0265, + "lyapunov": null, + "grad_norm": 0.4911817237537404, + "grad_max_sv": 0.1551229476928711, + "grad_min_sv": 8.927438248373943e-09, + "grad_condition": 22037340.73214477, + "lr": 0.000345491502812526, + "time_sec": 66.69833588600159 + }, + { + "epoch": 91, + "train_loss": 3.068959038543701, + "train_acc": 0.23882, + "test_loss": 8.130451618957519, + "test_acc": 0.0246, + "lyapunov": null, + "grad_norm": 0.4906750851127587, + "grad_max_sv": 0.15804662480950354, + "grad_min_sv": 8.945024668194357e-09, + "grad_condition": 20238836.161220632, + "lr": 0.0003355666766307081, + "time_sec": 66.82877826690674 + }, + { + "epoch": 92, + "train_loss": 3.0708934452819823, + "train_acc": 0.23938, + "test_loss": 7.4464682083129885, + "test_acc": 0.0273, + "lyapunov": null, + "grad_norm": 0.49334078113347807, + "grad_max_sv": 0.16077993027865886, + "grad_min_sv": 9.145524822347373e-09, + "grad_condition": 187037203.19992697, + "lr": 0.00032571397633909225, + "time_sec": 66.74011158943176 + }, + { + "epoch": 93, + "train_loss": 3.0600284594726563, + "train_acc": 0.24034, + "test_loss": 7.877293493652344, + "test_acc": 0.024, + "lyapunov": null, + "grad_norm": 0.4935640341843895, + "grad_max_sv": 0.1569301776587963, + "grad_min_sv": 9.054515949513675e-09, + "grad_condition": 27829600.056863032, + "lr": 0.00031593772365766094, + "time_sec": 66.81489491462708 + }, + { + "epoch": 94, + "train_loss": 3.051695512161255, + "train_acc": 0.23988, + "test_loss": 7.893620376586914, + "test_acc": 0.026, + "lyapunov": null, + "grad_norm": 0.49337091451194337, + "grad_max_sv": 0.15855305679142476, + "grad_min_sv": 8.944794831905467e-09, + "grad_condition": 38859308.23023894, + "lr": 0.0003062422067739483, + "time_sec": 66.7299313545227 + }, + { + "epoch": 95, + "train_loss": 3.0489727338409423, + "train_acc": 0.2417, + "test_loss": 8.291682899475097, + "test_acc": 0.0277, + "lyapunov": null, + "grad_norm": 0.49538404769918437, + "grad_max_sv": 0.1582469828426838, + "grad_min_sv": 8.944870299315566e-09, + "grad_condition": 46091432.107807726, + "lr": 0.00029663167846209965, + "time_sec": 66.69549345970154 + }, + { + "epoch": 96, + "train_loss": 3.0484196520233153, + "train_acc": 0.243, + "test_loss": 7.872291290283203, + "test_acc": 0.0265, + "lyapunov": null, + "grad_norm": 0.49220383248292715, + "grad_max_sv": 0.15892123989760876, + "grad_min_sv": 9.01737370051503e-09, + "grad_condition": 21302011.98175659, + "lr": 0.00028711035421746345, + "time_sec": 66.71452689170837 + }, + { + "epoch": 97, + "train_loss": 3.037676093826294, + "train_acc": 0.246, + "test_loss": 7.654231861877442, + "test_acc": 0.0293, + "lyapunov": null, + "grad_norm": 0.49508860986225445, + "grad_max_sv": 0.15910031460225582, + "grad_min_sv": 9.107966224752503e-09, + "grad_condition": 219510223.0929153, + "lr": 0.00027768241040753615, + "time_sec": 66.68213939666748 + }, + { + "epoch": 98, + "train_loss": 3.0303984658813476, + "train_acc": 0.2483, + "test_loss": 7.705853749084473, + "test_acc": 0.03, + "lyapunov": null, + "grad_norm": 0.4955532184661232, + "grad_max_sv": 0.1598552517592907, + "grad_min_sv": 9.178445775637201e-09, + "grad_condition": 19678066.130865358, + "lr": 0.00026835198244006903, + "time_sec": 66.72349858283997 + }, + { + "epoch": 99, + "train_loss": 3.0224529089355467, + "train_acc": 0.24928, + "test_loss": 8.284590560913086, + "test_acc": 0.0288, + "lyapunov": null, + "grad_norm": 0.49667728346438245, + "grad_max_sv": 0.16261373981833457, + "grad_min_sv": 9.261911344468631e-09, + "grad_condition": 43957646.17011832, + "lr": 0.0002591231629491421, + "time_sec": 66.71236634254456 + }, + { + "epoch": 100, + "train_loss": 3.026221090545654, + "train_acc": 0.24816, + "test_loss": 8.147641947174073, + "test_acc": 0.0283, + "lyapunov": null, + "grad_norm": 0.4973181888980844, + "grad_max_sv": 0.161344700306654, + "grad_min_sv": 9.093790653835754e-09, + "grad_condition": 22073209.92013366, + "lr": 0.0002499999999999997, + "time_sec": 66.67841935157776 + }, + { + "epoch": 101, + "train_loss": 3.024826983642578, + "train_acc": 0.24746, + "test_loss": 8.172234124755859, + "test_acc": 0.0299, + "lyapunov": null, + "grad_norm": 0.4987508334210676, + "grad_max_sv": 0.1609908178448677, + "grad_min_sv": 9.188273343563313e-09, + "grad_condition": 29575100.287913345, + "lr": 0.00024098649531343477, + "time_sec": 66.66067171096802 + }, + { + "epoch": 102, + "train_loss": 3.00824671585083, + "train_acc": 0.25088, + "test_loss": 8.115251203918458, + "test_acc": 0.0287, + "lyapunov": null, + "grad_norm": 0.49705452560220326, + "grad_max_sv": 0.16128522865474224, + "grad_min_sv": 9.071875566209197e-09, + "grad_condition": 183987800.30718166, + "lr": 0.0002320866025105016, + "time_sec": 66.69079804420471 + }, + { + "epoch": 103, + "train_loss": 3.012382175140381, + "train_acc": 0.2474, + "test_loss": 7.876342864227295, + "test_acc": 0.0358, + "lyapunov": null, + "grad_norm": 0.49759795132738194, + "grad_max_sv": 0.15578284673392773, + "grad_min_sv": 9.15119064692771e-09, + "grad_condition": 20274304.806162156, + "lr": 0.0002233042253783278, + "time_sec": 66.68386912345886 + }, + { + "epoch": 104, + "train_loss": 2.999149740066528, + "train_acc": 0.25194, + "test_loss": 8.156604473876953, + "test_acc": 0.0334, + "lyapunov": null, + "grad_norm": 0.4993865662081535, + "grad_max_sv": 0.16031337156891823, + "grad_min_sv": 9.130539890822575e-09, + "grad_condition": 20692502.69173783, + "lr": 0.000214643216157784, + "time_sec": 66.76614332199097 + }, + { + "epoch": 105, + "train_loss": 2.993046808395386, + "train_acc": 0.25322, + "test_loss": 8.206476106262206, + "test_acc": 0.0313, + "lyapunov": null, + "grad_norm": 0.49628166690763564, + "grad_max_sv": 0.1620720062404871, + "grad_min_sv": 9.0822705509086e-09, + "grad_condition": 31802699.452992357, + "lr": 0.00020610737385376332, + "time_sec": 66.92790508270264 + }, + { + "epoch": 106, + "train_loss": 2.9957507374572754, + "train_acc": 0.25204, + "test_loss": 8.32369485168457, + "test_acc": 0.0313, + "lyapunov": null, + "grad_norm": 0.499844986274271, + "grad_max_sv": 0.15692994557321072, + "grad_min_sv": 9.113036909119687e-09, + "grad_condition": 37954326.83555563, + "lr": 0.00019770044256881242, + "time_sec": 66.69280505180359 + }, + { + "epoch": 107, + "train_loss": 2.986658691177368, + "train_acc": 0.25358, + "test_loss": 8.158060417938232, + "test_acc": 0.0315, + "lyapunov": null, + "grad_norm": 0.5001001823423601, + "grad_max_sv": 0.16076837331056595, + "grad_min_sv": 9.191752022019718e-09, + "grad_condition": 24107799.99388643, + "lr": 0.0001894261098608447, + "time_sec": 66.8065435886383 + }, + { + "epoch": 108, + "train_loss": 2.9821577393341063, + "train_acc": 0.25654, + "test_loss": 8.488254710388183, + "test_acc": 0.0271, + "lyapunov": null, + "grad_norm": 0.502485476242763, + "grad_max_sv": 0.1583723586052656, + "grad_min_sv": 9.112645133618757e-09, + "grad_condition": 75568130.83148949, + "lr": 0.000181288005125655, + "time_sec": 66.69794940948486 + }, + { + "epoch": 109, + "train_loss": 2.9782085455322265, + "train_acc": 0.25542, + "test_loss": 8.012923631286622, + "test_acc": 0.0329, + "lyapunov": null, + "grad_norm": 0.4984903393296528, + "grad_max_sv": 0.15951386988162994, + "grad_min_sv": 9.13156463222542e-09, + "grad_condition": 19541255.215787858, + "lr": 0.0001732896980049473, + "time_sec": 66.75459599494934 + }, + { + "epoch": 110, + "train_loss": 2.977617024688721, + "train_acc": 0.25416, + "test_loss": 7.927994426727295, + "test_acc": 0.0312, + "lyapunov": null, + "grad_norm": 0.5009242415138291, + "grad_max_sv": 0.15868730172514917, + "grad_min_sv": 9.178975504675613e-09, + "grad_condition": 20582427.94600161, + "lr": 0.00016543469682057076, + "time_sec": 66.69332385063171 + }, + { + "epoch": 111, + "train_loss": 2.9753467011260986, + "train_acc": 0.25596, + "test_loss": 8.319595712280274, + "test_acc": 0.0307, + "lyapunov": null, + "grad_norm": 0.5005941372001506, + "grad_max_sv": 0.16290293373167514, + "grad_min_sv": 9.188780414337571e-09, + "grad_condition": 58141904.50898675, + "lr": 0.00015772644703565552, + "time_sec": 66.67908811569214 + }, + { + "epoch": 112, + "train_loss": 2.964190831069946, + "train_acc": 0.2586, + "test_loss": 8.675558572387695, + "test_acc": 0.0264, + "lyapunov": null, + "grad_norm": 0.49904161219237203, + "grad_max_sv": 0.15657965913414956, + "grad_min_sv": 9.138289626658274e-09, + "grad_condition": 176788840.7312159, + "lr": 0.00015016832974331713, + "time_sec": 66.7088508605957 + }, + { + "epoch": 113, + "train_loss": 2.954090965118408, + "train_acc": 0.26176, + "test_loss": 8.300330653381348, + "test_acc": 0.0295, + "lyapunov": null, + "grad_norm": 0.49993834308283913, + "grad_max_sv": 0.16308558471500872, + "grad_min_sv": 9.294466957188163e-09, + "grad_condition": 21663432.51767642, + "lr": 0.00014276366018359834, + "time_sec": 66.69772529602051 + }, + { + "epoch": 114, + "train_loss": 2.963344728240967, + "train_acc": 0.25764, + "test_loss": 8.330418551635741, + "test_acc": 0.0289, + "lyapunov": null, + "grad_norm": 0.5018230989792033, + "grad_max_sv": 0.15932467840611936, + "grad_min_sv": 9.236983548877032e-09, + "grad_condition": 27736134.476570655, + "lr": 0.00013551568628929425, + "time_sec": 66.70325803756714 + }, + { + "epoch": 115, + "train_loss": 2.9565879733276366, + "train_acc": 0.25964, + "test_loss": 7.8575323272705075, + "test_acc": 0.0326, + "lyapunov": null, + "grad_norm": 0.5008809900364136, + "grad_max_sv": 0.1622266974300146, + "grad_min_sv": 9.12305047895412e-09, + "grad_condition": 30845128.19165374, + "lr": 0.00012842758726130276, + "time_sec": 66.68990015983582 + }, + { + "epoch": 116, + "train_loss": 2.9527316310119627, + "train_acc": 0.25978, + "test_loss": 8.399875411987304, + "test_acc": 0.0331, + "lyapunov": null, + "grad_norm": 0.501442711033118, + "grad_max_sv": 0.15974901132285596, + "grad_min_sv": 9.164257287058719e-09, + "grad_condition": 38992915.8072435, + "lr": 0.0001215024721741218, + "time_sec": 66.69366478919983 + }, + { + "epoch": 117, + "train_loss": 2.9503427956390382, + "train_acc": 0.26032, + "test_loss": 7.990305528259277, + "test_acc": 0.0321, + "lyapunov": null, + "grad_norm": 0.503589536410986, + "grad_max_sv": 0.16520196348428726, + "grad_min_sv": 9.264067410072464e-09, + "grad_condition": 83868622.08023986, + "lr": 0.00011474337861210538, + "time_sec": 66.72409868240356 + }, + { + "epoch": 118, + "train_loss": 2.9452951972961428, + "train_acc": 0.26186, + "test_loss": 8.147903689575195, + "test_acc": 0.0314, + "lyapunov": null, + "grad_norm": 0.5033856715448645, + "grad_max_sv": 0.16233305558562278, + "grad_min_sv": 9.248901002012478e-09, + "grad_condition": 25081711.234670334, + "lr": 0.00010815327133708009, + "time_sec": 66.7026617527008 + }, + { + "epoch": 119, + "train_loss": 2.941498958053589, + "train_acc": 0.26368, + "test_loss": 8.610751574707031, + "test_acc": 0.029, + "lyapunov": null, + "grad_norm": 0.5024430434883491, + "grad_max_sv": 0.1590784341096878, + "grad_min_sv": 9.23304959987714e-09, + "grad_condition": 20494387.45624064, + "lr": 0.00010173504098790182, + "time_sec": 66.76532936096191 + }, + { + "epoch": 120, + "train_loss": 2.935255004730225, + "train_acc": 0.26242, + "test_loss": 8.297263900756835, + "test_acc": 0.0331, + "lyapunov": null, + "grad_norm": 0.5040302766957269, + "grad_max_sv": 0.163528535887599, + "grad_min_sv": 9.301190626032075e-09, + "grad_condition": 28694382.488496322, + "lr": 9.549150281252629e-05, + "time_sec": 66.68135213851929 + }, + { + "epoch": 121, + "train_loss": 2.9364529040527345, + "train_acc": 0.26432, + "test_loss": 8.291862780761718, + "test_acc": 0.032, + "lyapunov": null, + "grad_norm": 0.5046029560998396, + "grad_max_sv": 0.15975070968270302, + "grad_min_sv": 9.412849380496801e-09, + "grad_condition": 19587449.45790067, + "lr": 8.942539543314794e-05, + "time_sec": 66.67216777801514 + }, + { + "epoch": 122, + "train_loss": 2.936676673126221, + "train_acc": 0.26518, + "test_loss": 8.499242510986328, + "test_acc": 0.0304, + "lyapunov": null, + "grad_norm": 0.5047649009210087, + "grad_max_sv": 0.16289451010525227, + "grad_min_sv": 9.350050624370998e-09, + "grad_condition": 55505776.29325993, + "lr": 8.353937964495024e-05, + "time_sec": 66.71731305122375 + }, + { + "epoch": 123, + "train_loss": 2.928475122909546, + "train_acc": 0.26562, + "test_loss": 8.177069671630859, + "test_acc": 0.0342, + "lyapunov": null, + "grad_norm": 0.5048999761698001, + "grad_max_sv": 0.15904909931123257, + "grad_min_sv": 9.226389620364817e-09, + "grad_condition": 25050377.05934065, + "lr": 7.783603724899243e-05, + "time_sec": 66.7349808216095 + }, + { + "epoch": 124, + "train_loss": 2.931030046463013, + "train_acc": 0.2641, + "test_loss": 8.353331985473632, + "test_acc": 0.031, + "lyapunov": null, + "grad_norm": 0.5023168097041694, + "grad_max_sv": 0.162389824539423, + "grad_min_sv": 9.286878636938223e-09, + "grad_condition": 23152814.43828611, + "lr": 7.231786991974666e-05, + "time_sec": 66.72571802139282 + }, + { + "epoch": 125, + "train_loss": 2.9270871754455565, + "train_acc": 0.26426, + "test_loss": 8.401993353271484, + "test_acc": 0.0306, + "lyapunov": null, + "grad_norm": 0.5049758798636186, + "grad_max_sv": 0.16142708584666252, + "grad_min_sv": 9.297885433801056e-09, + "grad_condition": 19875141.174937833, + "lr": 6.698729810778072e-05, + "time_sec": 66.69990706443787 + }, + { + "epoch": 126, + "train_loss": 2.930443018951416, + "train_acc": 0.26334, + "test_loss": 8.037101096343994, + "test_acc": 0.0338, + "lyapunov": null, + "grad_norm": 0.5046016651861616, + "grad_max_sv": 0.16035589538514614, + "grad_min_sv": 9.240497411688865e-09, + "grad_condition": 28125977.648946952, + "lr": 6.184665997806817e-05, + "time_sec": 67.14951395988464 + }, + { + "epoch": 127, + "train_loss": 2.920647982254028, + "train_acc": 0.26692, + "test_loss": 8.046730439758301, + "test_acc": 0.0324, + "lyapunov": null, + "grad_norm": 0.5049604973588052, + "grad_max_sv": 0.16098853275179864, + "grad_min_sv": 9.3294794306642e-09, + "grad_condition": 20407197.848863874, + "lr": 5.6898210384392595e-05, + "time_sec": 66.7223470211029 + }, + { + "epoch": 128, + "train_loss": 2.9174925131988525, + "train_acc": 0.2684, + "test_loss": 8.320220652770995, + "test_acc": 0.0303, + "lyapunov": null, + "grad_norm": 0.5053571563299065, + "grad_max_sv": 0.1587530255317688, + "grad_min_sv": 9.217601072697424e-09, + "grad_condition": 27425905.55975602, + "lr": 5.214411988029363e-05, + "time_sec": 66.72726678848267 + }, + { + "epoch": 129, + "train_loss": 2.912207716064453, + "train_acc": 0.26822, + "test_loss": 8.340176411437989, + "test_acc": 0.0329, + "lyapunov": null, + "grad_norm": 0.5070723294876998, + "grad_max_sv": 0.16541431248188018, + "grad_min_sv": 9.451083940459348e-09, + "grad_condition": 20567354.357769065, + "lr": 4.7586473766990294e-05, + "time_sec": 66.71740126609802 + }, + { + "epoch": 130, + "train_loss": 2.9202334938049317, + "train_acc": 0.2674, + "test_loss": 8.199926257324218, + "test_acc": 0.0327, + "lyapunov": null, + "grad_norm": 0.5048916415346303, + "grad_max_sv": 0.15801323913037776, + "grad_min_sv": 9.219233110258073e-09, + "grad_condition": 19376960.764617294, + "lr": 4.32272711786996e-05, + "time_sec": 66.70238876342773 + }, + { + "epoch": 131, + "train_loss": 2.9117065854644775, + "train_acc": 0.27042, + "test_loss": 8.4127576171875, + "test_acc": 0.03, + "lyapunov": null, + "grad_norm": 0.5046808443683461, + "grad_max_sv": 0.15953834764659405, + "grad_min_sv": 9.310256252059723e-09, + "grad_condition": 21439898.88764466, + "lr": 3.906842420574966e-05, + "time_sec": 66.70873999595642 + }, + { + "epoch": 132, + "train_loss": 2.910150853881836, + "train_acc": 0.26928, + "test_loss": 8.432557550048829, + "test_acc": 0.029, + "lyapunov": null, + "grad_norm": 0.5068478509780873, + "grad_max_sv": 0.1597142592072487, + "grad_min_sv": 9.218466880817066e-09, + "grad_condition": 51315275.56326776, + "lr": 3.5111757055874305e-05, + "time_sec": 66.67959189414978 + }, + { + "epoch": 133, + "train_loss": 2.913581671066284, + "train_acc": 0.26686, + "test_loss": 8.2192110748291, + "test_acc": 0.0342, + "lyapunov": null, + "grad_norm": 0.5053193098572983, + "grad_max_sv": 0.15978670455515384, + "grad_min_sv": 9.38243127635019e-09, + "grad_condition": 22892063.67804382, + "lr": 3.1359005254054254e-05, + "time_sec": 66.68708491325378 + }, + { + "epoch": 134, + "train_loss": 2.9081906867980956, + "train_acc": 0.26852, + "test_loss": 8.766140046691895, + "test_acc": 0.0299, + "lyapunov": null, + "grad_norm": 0.5038449350705952, + "grad_max_sv": 0.15981822535395623, + "grad_min_sv": 9.258106009601974e-09, + "grad_condition": 23090442.640830033, + "lr": 2.7811814881259484e-05, + "time_sec": 66.70866632461548 + }, + { + "epoch": 135, + "train_loss": 2.910741279144287, + "train_acc": 0.26908, + "test_loss": 8.568949060058594, + "test_acc": 0.0305, + "lyapunov": null, + "grad_norm": 0.5060252593926529, + "grad_max_sv": 0.16062484085559844, + "grad_min_sv": 9.328420333409859e-09, + "grad_condition": 20022211.16398121, + "lr": 2.4471741852423218e-05, + "time_sec": 66.7052571773529 + }, + { + "epoch": 136, + "train_loss": 2.904768952407837, + "train_acc": 0.26876, + "test_loss": 8.586251429748534, + "test_acc": 0.0286, + "lyapunov": null, + "grad_norm": 0.5057054893343615, + "grad_max_sv": 0.16051347628235818, + "grad_min_sv": 9.250093449542085e-09, + "grad_condition": 19758794.64532106, + "lr": 2.1340251233966362e-05, + "time_sec": 66.70623755455017 + }, + { + "epoch": 137, + "train_loss": 2.899753532714844, + "train_acc": 0.2719, + "test_loss": 8.500251341247559, + "test_acc": 0.0306, + "lyapunov": null, + "grad_norm": 0.504993553912477, + "grad_max_sv": 0.1628888875246048, + "grad_min_sv": 9.47467431733351e-09, + "grad_condition": 23562830.437205564, + "lr": 1.8418716601170932e-05, + "time_sec": 66.70105028152466 + }, + { + "epoch": 138, + "train_loss": 2.903391772613525, + "train_acc": 0.26772, + "test_loss": 8.47085325012207, + "test_acc": 0.0328, + "lyapunov": null, + "grad_norm": 0.5045632679546488, + "grad_max_sv": 0.158877120167017, + "grad_min_sv": 9.315059612546861e-09, + "grad_condition": 21175946.281570215, + "lr": 1.570841943568445e-05, + "time_sec": 66.6920268535614 + }, + { + "epoch": 139, + "train_loss": 2.902729499740601, + "train_acc": 0.27098, + "test_loss": 8.424858071136475, + "test_acc": 0.0315, + "lyapunov": null, + "grad_norm": 0.5057203739338342, + "grad_max_sv": 0.16270199753344058, + "grad_min_sv": 9.42042569042467e-09, + "grad_condition": 3524579699.0758705, + "lr": 1.3210548563419845e-05, + "time_sec": 66.71372246742249 + }, + { + "epoch": 140, + "train_loss": 2.906615010299683, + "train_acc": 0.2691, + "test_loss": 8.602820767211915, + "test_acc": 0.03, + "lyapunov": null, + "grad_norm": 0.5062145592542612, + "grad_max_sv": 0.16128202974796296, + "grad_min_sv": 9.31656084814103e-09, + "grad_condition": 91607684.02825375, + "lr": 1.0926199633097203e-05, + "time_sec": 66.70090675354004 + }, + { + "epoch": 141, + "train_loss": 2.9058460761260987, + "train_acc": 0.26978, + "test_loss": 8.383630235290527, + "test_acc": 0.0304, + "lyapunov": null, + "grad_norm": 0.5058119945694454, + "grad_max_sv": 0.1625796493142843, + "grad_min_sv": 9.312921286919184e-09, + "grad_condition": 20916832.67992229, + "lr": 8.856374635655688e-06, + "time_sec": 66.7032151222229 + }, + { + "epoch": 142, + "train_loss": 2.901709259185791, + "train_acc": 0.27014, + "test_loss": 8.529939315795898, + "test_acc": 0.0279, + "lyapunov": null, + "grad_norm": 0.50529937487535, + "grad_max_sv": 0.16269058287143706, + "grad_min_sv": 9.338738224395903e-09, + "grad_condition": 21214498.9394589, + "lr": 7.001981464747503e-06, + "time_sec": 66.72001433372498 + }, + { + "epoch": 143, + "train_loss": 2.9003410097503664, + "train_acc": 0.26956, + "test_loss": 8.474568194580078, + "test_acc": 0.0308, + "lyapunov": null, + "grad_norm": 0.5059546395273652, + "grad_max_sv": 0.16158490478992463, + "grad_min_sv": 9.306980860990244e-09, + "grad_condition": 26379170.2127072, + "lr": 5.3638335185058295e-06, + "time_sec": 66.71419501304626 + }, + { + "epoch": 144, + "train_loss": 2.900580298156738, + "train_acc": 0.27204, + "test_loss": 8.518251318359376, + "test_acc": 0.0304, + "lyapunov": null, + "grad_norm": 0.5064412723494297, + "grad_max_sv": 0.16376300603151323, + "grad_min_sv": 9.383655452666063e-09, + "grad_condition": 20476900.61761298, + "lr": 3.942649342761114e-06, + "time_sec": 66.69701147079468 + }, + { + "epoch": 145, + "train_loss": 2.9021220780181887, + "train_acc": 0.27056, + "test_loss": 8.362188708496094, + "test_acc": 0.0328, + "lyapunov": null, + "grad_norm": 0.5070330634175128, + "grad_max_sv": 0.1640974970534444, + "grad_min_sv": 9.447458995670566e-09, + "grad_condition": 19525333.626517944, + "lr": 2.7390523158633524e-06, + "time_sec": 67.06064939498901 + }, + { + "epoch": 146, + "train_loss": 2.9056922393035887, + "train_acc": 0.26996, + "test_loss": 8.198326219177247, + "test_acc": 0.0315, + "lyapunov": null, + "grad_norm": 0.5052726916497198, + "grad_max_sv": 0.1608945619314909, + "grad_min_sv": 9.247097532832926e-09, + "grad_condition": 30881517.504121702, + "lr": 1.7535703752478133e-06, + "time_sec": 66.83930277824402 + }, + { + "epoch": 147, + "train_loss": 2.9056436912536623, + "train_acc": 0.27088, + "test_loss": 8.528380426025391, + "test_acc": 0.029, + "lyapunov": null, + "grad_norm": 0.506185959212811, + "grad_max_sv": 0.1588722374290228, + "grad_min_sv": 9.394264763318283e-09, + "grad_condition": 20675797.94461853, + "lr": 9.866357858642196e-07, + "time_sec": 66.72091388702393 + }, + { + "epoch": 148, + "train_loss": 2.8992470669555663, + "train_acc": 0.27248, + "test_loss": 8.531358058166504, + "test_acc": 0.0283, + "lyapunov": null, + "grad_norm": 0.5065504938383886, + "grad_max_sv": 0.16413835100829602, + "grad_min_sv": 9.337682073222442e-09, + "grad_condition": 78330146.63114226, + "lr": 4.38584950570808e-07, + "time_sec": 66.73046231269836 + }, + { + "epoch": 149, + "train_loss": 2.9046918795013426, + "train_acc": 0.26942, + "test_loss": 8.69618356628418, + "test_acc": 0.0302, + "lyapunov": null, + "grad_norm": 0.5057233580127345, + "grad_max_sv": 0.16292193159461021, + "grad_min_sv": 9.351353436048982e-09, + "grad_condition": 19471249.74441474, + "lr": 1.096582625772501e-07, + "time_sec": 66.730135679245 + }, + { + "epoch": 150, + "train_loss": 2.904742412261963, + "train_acc": 0.2691, + "test_loss": 8.56440517730713, + "test_acc": 0.0303, + "lyapunov": null, + "grad_norm": 0.506527150487024, + "grad_max_sv": 0.16403611674904822, + "grad_min_sv": 9.31519477109788e-09, + "grad_condition": 20813101.77306552, + "lr": 0.0, + "time_sec": 66.77998113632202 + } + ] + }, + "lyapunov": { + "4": [ + { + "epoch": 1, + "train_loss": 4.385416869049072, + "train_acc": 0.09238, + "test_loss": 3.76526393661499, + "test_acc": 0.1561, + "lyapunov": 2.248025039882611, + "grad_norm": 6.278186010639677, + "grad_max_sv": 4.849219900369644, + "grad_min_sv": 1.1319616959326595e-07, + "grad_condition": 56141122.1011496, + "lr": 0.0009998903417374227, + "time_sec": 41.7864191532135 + }, + { + "epoch": 2, + "train_loss": 3.6485818179321288, + "train_acc": 0.16322, + "test_loss": 3.3687725090026857, + "test_acc": 0.2122, + "lyapunov": 2.118248250783252, + "grad_norm": 4.443263102278264, + "grad_max_sv": 3.2507266819477083, + "grad_min_sv": 8.233919142064395e-08, + "grad_condition": 322584578.8706892, + "lr": 0.0009995614150494292, + "time_sec": 41.66770076751709 + }, + { + "epoch": 3, + "train_loss": 3.328380308380127, + "train_acc": 0.20764, + "test_loss": 3.374305525970459, + "test_acc": 0.2055, + "lyapunov": 1.9997802164853382, + "grad_norm": 3.3578148542704875, + "grad_max_sv": 2.267174106836319, + "grad_min_sv": 6.252581136179103e-08, + "grad_condition": 45047259.18741469, + "lr": 0.0009990133642141358, + "time_sec": 41.67004632949829 + }, + { + "epoch": 4, + "train_loss": 3.2626986949920656, + "train_acc": 0.2146, + "test_loss": 4.6115389114379886, + "test_acc": 0.0743, + "lyapunov": 1.77669187945783, + "grad_norm": 2.671171954416308, + "grad_max_sv": 1.6475970447063446, + "grad_min_sv": 4.904231385438607e-08, + "grad_condition": 37237118.01849495, + "lr": 0.0009982464296247522, + "time_sec": 41.662524461746216 + }, + { + "epoch": 5, + "train_loss": 3.2418214219665527, + "train_acc": 0.21486, + "test_loss": 6.85950913848877, + "test_acc": 0.0383, + "lyapunov": 1.577696952063714, + "grad_norm": 2.24297056171998, + "grad_max_sv": 1.3573209017515182, + "grad_min_sv": 4.2056884189123346e-08, + "grad_condition": 57071857.62248597, + "lr": 0.0009972609476841367, + "time_sec": 41.65110445022583 + }, + { + "epoch": 6, + "train_loss": 3.1473428995513917, + "train_acc": 0.2334, + "test_loss": 8.817106538391114, + "test_acc": 0.0334, + "lyapunov": 1.522594060739288, + "grad_norm": 2.0255024337601077, + "grad_max_sv": 1.1387103602290154, + "grad_min_sv": 3.8490053089201837e-08, + "grad_condition": 35218561.7694581, + "lr": 0.000996057350657239, + "time_sec": 41.70460891723633 + }, + { + "epoch": 7, + "train_loss": 3.0554499784851075, + "train_acc": 0.25108, + "test_loss": 10.19464548034668, + "test_acc": 0.0214, + "lyapunov": 1.498324869538817, + "grad_norm": 1.8452595544017367, + "grad_max_sv": 0.9877568006515502, + "grad_min_sv": 3.479785576354644e-08, + "grad_condition": 35325972.864356965, + "lr": 0.000994636166481494, + "time_sec": 41.68277025222778 + }, + { + "epoch": 8, + "train_loss": 2.9779827911376953, + "train_acc": 0.26282, + "test_loss": 11.777064636230469, + "test_acc": 0.0217, + "lyapunov": 1.4917038487046577, + "grad_norm": 1.7112589099882383, + "grad_max_sv": 0.9115550458431244, + "grad_min_sv": 3.2246774489541605e-08, + "grad_condition": 35535466.61101306, + "lr": 0.0009929980185352525, + "time_sec": 41.73534274101257 + }, + { + "epoch": 9, + "train_loss": 2.9365650801086427, + "train_acc": 0.27382, + "test_loss": 11.0659416595459, + "test_acc": 0.0285, + "lyapunov": 1.4870752608379745, + "grad_norm": 1.6385351402723778, + "grad_max_sv": 0.8621709123253822, + "grad_min_sv": 3.1201993953844376e-08, + "grad_condition": 65261212.14923034, + "lr": 0.0009911436253643444, + "time_sec": 41.677772760391235 + }, + { + "epoch": 10, + "train_loss": 2.8763271882629393, + "train_acc": 0.28468, + "test_loss": 12.026495361328125, + "test_acc": 0.0238, + "lyapunov": 1.483278246486888, + "grad_norm": 1.529513425384814, + "grad_max_sv": 0.7616375535726547, + "grad_min_sv": 2.9233747178558646e-08, + "grad_condition": 32138717.187251367, + "lr": 0.0009890738003669028, + "time_sec": 41.68400001525879 + }, + { + "epoch": 11, + "train_loss": 2.8316531258392335, + "train_acc": 0.29512, + "test_loss": 13.11057151184082, + "test_acc": 0.0192, + "lyapunov": 1.490352714153202, + "grad_norm": 1.4498581032880438, + "grad_max_sv": 0.7242703467607499, + "grad_min_sv": 2.7478494810107e-08, + "grad_condition": 41454194.81325731, + "lr": 0.00098678945143658, + "time_sec": 41.70621085166931 + }, + { + "epoch": 12, + "train_loss": 2.799339100418091, + "train_acc": 0.29892, + "test_loss": 7.575371592712402, + "test_acc": 0.0262, + "lyapunov": 1.4981255997782168, + "grad_norm": 1.363013693713406, + "grad_max_sv": 0.6757008329033851, + "grad_min_sv": 2.5993861326942257e-08, + "grad_condition": 160871874.0058652, + "lr": 0.0009842915805643154, + "time_sec": 41.677626609802246 + }, + { + "epoch": 13, + "train_loss": 2.7616972874450685, + "train_acc": 0.30544, + "test_loss": 10.457825009155274, + "test_acc": 0.0149, + "lyapunov": 1.5049866004977994, + "grad_norm": 1.3009395680954525, + "grad_max_sv": 0.6281382858753204, + "grad_min_sv": 2.4570545004154454e-08, + "grad_condition": 36433287.73809738, + "lr": 0.000981581283398829, + "time_sec": 41.678059816360474 + }, + { + "epoch": 14, + "train_loss": 2.7419771829223634, + "train_acc": 0.31176, + "test_loss": 6.96602774734497, + "test_acc": 0.0273, + "lyapunov": 1.5126411487989109, + "grad_norm": 1.2428065154077472, + "grad_max_sv": 0.6042070008814335, + "grad_min_sv": 2.367223045363076e-08, + "grad_condition": 28155768.001448244, + "lr": 0.0009786597487660333, + "time_sec": 41.6808295249939 + }, + { + "epoch": 15, + "train_loss": 2.6940654248809817, + "train_acc": 0.32072, + "test_loss": 8.578126625061035, + "test_acc": 0.0227, + "lyapunov": 1.5099453883402794, + "grad_norm": 1.2169506496641136, + "grad_max_sv": 0.5779954038560391, + "grad_min_sv": 2.2935282436783998e-08, + "grad_condition": 268648302.11607826, + "lr": 0.0009755282581475766, + "time_sec": 41.68640756607056 + }, + { + "epoch": 16, + "train_loss": 2.6707639625549318, + "train_acc": 0.32688, + "test_loss": 8.14136336288452, + "test_acc": 0.018, + "lyapunov": 1.5205869574071196, + "grad_norm": 1.180524231835774, + "grad_max_sv": 0.5504504255950451, + "grad_min_sv": 2.2226173457262632e-08, + "grad_condition": 33744566.308580026, + "lr": 0.0009721881851187403, + "time_sec": 41.68173384666443 + }, + { + "epoch": 17, + "train_loss": 2.6515627406311033, + "train_acc": 0.32992, + "test_loss": 8.464934133911132, + "test_acc": 0.017, + "lyapunov": 1.5374923237144489, + "grad_norm": 1.140051503610018, + "grad_max_sv": 0.5274666294455528, + "grad_min_sv": 2.1756941515072015e-08, + "grad_condition": 34749184.683609106, + "lr": 0.0009686409947459456, + "time_sec": 41.707985401153564 + }, + { + "epoch": 18, + "train_loss": 2.6277094244384767, + "train_acc": 0.33546, + "test_loss": 8.285575199890136, + "test_acc": 0.0127, + "lyapunov": 1.5355821253393618, + "grad_norm": 1.117208726103555, + "grad_max_sv": 0.5191602148115635, + "grad_min_sv": 2.1151740331459834e-08, + "grad_condition": 39519340.90094157, + "lr": 0.0009648882429441254, + "time_sec": 41.662739515304565 + }, + { + "epoch": 19, + "train_loss": 2.607321646118164, + "train_acc": 0.34158, + "test_loss": 8.017330313110351, + "test_acc": 0.0171, + "lyapunov": 1.552301183076161, + "grad_norm": 1.0897405882008309, + "grad_max_sv": 0.5023482128977775, + "grad_min_sv": 2.064225344128312e-08, + "grad_condition": 48287017.10977797, + "lr": 0.00096093157579425, + "time_sec": 41.693289041519165 + }, + { + "epoch": 20, + "train_loss": 2.5911361766052248, + "train_acc": 0.34448, + "test_loss": 6.698405216979981, + "test_acc": 0.0142, + "lyapunov": 1.5602374622583999, + "grad_norm": 1.065027082262344, + "grad_max_sv": 0.4803482659161091, + "grad_min_sv": 2.0105638209866328e-08, + "grad_condition": 53496143.92804453, + "lr": 0.0009567727288213001, + "time_sec": 41.69337177276611 + }, + { + "epoch": 21, + "train_loss": 2.581589804840088, + "train_acc": 0.34626, + "test_loss": 6.832892972564697, + "test_acc": 0.01, + "lyapunov": 1.5771442057226626, + "grad_norm": 1.0439470300070743, + "grad_max_sv": 0.4716391734778881, + "grad_min_sv": 1.994593953336121e-08, + "grad_condition": 29150078.74753332, + "lr": 0.0009524135262330095, + "time_sec": 41.680705308914185 + }, + { + "epoch": 22, + "train_loss": 2.5651588928222657, + "train_acc": 0.34914, + "test_loss": 9.158645959472656, + "test_acc": 0.01, + "lyapunov": 1.58292500716646, + "grad_norm": 1.02635920685996, + "grad_max_sv": 0.45573277324438094, + "grad_min_sv": 1.9168616865322673e-08, + "grad_condition": 70923838.75523397, + "lr": 0.0009478558801197061, + "time_sec": 41.669551849365234 + }, + { + "epoch": 23, + "train_loss": 2.5523301736450197, + "train_acc": 0.3523, + "test_loss": 8.809644000244141, + "test_acc": 0.01, + "lyapunov": 1.5998260813295995, + "grad_norm": 1.0017883748688885, + "grad_max_sv": 0.44832063987851145, + "grad_min_sv": 1.9039649867824692e-08, + "grad_condition": 27413330.740021694, + "lr": 0.000943101789615607, + "time_sec": 41.67731857299805 + }, + { + "epoch": 24, + "train_loss": 2.540596002731323, + "train_acc": 0.35496, + "test_loss": 9.603093579101563, + "test_acc": 0.01, + "lyapunov": 1.608014219557233, + "grad_norm": 0.9892621492137654, + "grad_max_sv": 0.4301694191992283, + "grad_min_sv": 1.8367088082393846e-08, + "grad_condition": 81196052.16569169, + "lr": 0.0009381533400219313, + "time_sec": 41.676315784454346 + }, + { + "epoch": 25, + "train_loss": 2.5427046757507323, + "train_acc": 0.35626, + "test_loss": 6.377327036285401, + "test_acc": 0.0121, + "lyapunov": 1.617281358870094, + "grad_norm": 0.9690834006908926, + "grad_max_sv": 0.4215060040354729, + "grad_min_sv": 1.847692875367457e-08, + "grad_condition": 26969157.744863987, + "lr": 0.0009330127018922189, + "time_sec": 41.6710147857666 + }, + { + "epoch": 26, + "train_loss": 2.5659257014465333, + "train_acc": 0.35094, + "test_loss": 7.642009206390381, + "test_acc": 0.01, + "lyapunov": 1.6466610379841016, + "grad_norm": 0.9589858174241993, + "grad_max_sv": 0.4141293965280056, + "grad_min_sv": 1.7795701028403e-08, + "grad_condition": 100155427.75409335, + "lr": 0.000927682130080253, + "time_sec": 41.67351698875427 + }, + { + "epoch": 27, + "train_loss": 2.5872419680023193, + "train_acc": 0.3491, + "test_loss": 6.126792880249023, + "test_acc": 0.01, + "lyapunov": 1.655874063596701, + "grad_norm": 0.9488520314828451, + "grad_max_sv": 0.4167667210102081, + "grad_min_sv": 1.7755209749670265e-08, + "grad_condition": 36482939.06456544, + "lr": 0.0009221639627510072, + "time_sec": 41.6674382686615 + }, + { + "epoch": 28, + "train_loss": 2.6444351440429688, + "train_acc": 0.33624, + "test_loss": 6.9149939208984375, + "test_acc": 0.0101, + "lyapunov": 1.642535175203972, + "grad_norm": 0.9303399228093118, + "grad_max_sv": 0.39700465872883794, + "grad_min_sv": 1.7362861481906577e-08, + "grad_condition": 35927282.240080185, + "lr": 0.0009164606203550494, + "time_sec": 41.694759130477905 + }, + { + "epoch": 29, + "train_loss": 2.5599649453735354, + "train_acc": 0.35268, + "test_loss": 7.456900106048584, + "test_acc": 0.0106, + "lyapunov": 1.640105134690814, + "grad_norm": 0.9138541555575717, + "grad_max_sv": 0.40499070957303046, + "grad_min_sv": 1.741128121124369e-08, + "grad_condition": 28008235.387952596, + "lr": 0.0009105746045668516, + "time_sec": 41.669721841812134 + }, + { + "epoch": 30, + "train_loss": 2.587169426727295, + "train_acc": 0.34752, + "test_loss": 7.112287390899658, + "test_acc": 0.0119, + "lyapunov": 1.679136826254218, + "grad_norm": 0.9055855274318034, + "grad_max_sv": 0.38519148603081704, + "grad_min_sv": 1.6915865576859478e-08, + "grad_condition": 154040606.17291743, + "lr": 0.0009045084971874733, + "time_sec": 41.68705892562866 + }, + { + "epoch": 31, + "train_loss": 2.5624461259460447, + "train_acc": 0.35596, + "test_loss": 7.3813514785766605, + "test_acc": 0.0124, + "lyapunov": 1.6608827205570154, + "grad_norm": 0.887369695582494, + "grad_max_sv": 0.37692187577486036, + "grad_min_sv": 1.6459350740682942e-08, + "grad_condition": 31475690.866420962, + "lr": 0.0008982649590120977, + "time_sec": 41.673012495040894 + }, + { + "epoch": 32, + "train_loss": 2.551432417373657, + "train_acc": 0.35684, + "test_loss": 6.42604938659668, + "test_acc": 0.0121, + "lyapunov": 1.6469347565375325, + "grad_norm": 0.8746022274317357, + "grad_max_sv": 0.3701463647186756, + "grad_min_sv": 1.6476226111922233e-08, + "grad_condition": 52317458.10447326, + "lr": 0.0008918467286629196, + "time_sec": 41.66220784187317 + }, + { + "epoch": 33, + "train_loss": 2.5348674264526365, + "train_acc": 0.35962, + "test_loss": 5.573617294311523, + "test_acc": 0.0241, + "lyapunov": 1.6317134284607284, + "grad_norm": 0.8557656352746138, + "grad_max_sv": 0.3519837222993374, + "grad_min_sv": 1.6144081904645446e-08, + "grad_condition": 26756099.798511714, + "lr": 0.0008852566213878943, + "time_sec": 41.66625261306763 + }, + { + "epoch": 34, + "train_loss": 2.5518150065612795, + "train_acc": 0.3554, + "test_loss": 7.073295845794678, + "test_acc": 0.0148, + "lyapunov": 1.649389718804518, + "grad_norm": 0.8523798964772112, + "grad_max_sv": 0.35057583153247834, + "grad_min_sv": 1.5881563142361442e-08, + "grad_condition": 28695640.9756914, + "lr": 0.000878497527825878, + "time_sec": 41.682754039764404 + }, + { + "epoch": 35, + "train_loss": 2.4595030923461914, + "train_acc": 0.37624, + "test_loss": 6.594732564544678, + "test_acc": 0.0135, + "lyapunov": 1.6497014946949757, + "grad_norm": 0.8413194934076474, + "grad_max_sv": 0.3433509707450867, + "grad_min_sv": 1.5582725373941564e-08, + "grad_condition": 32812761.595985997, + "lr": 0.000871572412738697, + "time_sec": 41.66791009902954 + }, + { + "epoch": 36, + "train_loss": 2.4551396466827393, + "train_acc": 0.37628, + "test_loss": 8.253561260986329, + "test_acc": 0.0118, + "lyapunov": 1.641755030892999, + "grad_norm": 0.843485970719339, + "grad_max_sv": 0.35417381674051285, + "grad_min_sv": 1.5807648856558387e-08, + "grad_condition": 26531326.086508345, + "lr": 0.0008644843137107055, + "time_sec": 41.667187213897705 + }, + { + "epoch": 37, + "train_loss": 2.4310810439300536, + "train_acc": 0.37952, + "test_loss": 6.83057543182373, + "test_acc": 0.0102, + "lyapunov": 1.6440746006758318, + "grad_norm": 0.835329787885881, + "grad_max_sv": 0.34257676601409914, + "grad_min_sv": 1.570942509132589e-08, + "grad_condition": 39002769.53085541, + "lr": 0.0008572363398164014, + "time_sec": 41.83383345603943 + }, + { + "epoch": 38, + "train_loss": 2.3961087857055663, + "train_acc": 0.38468, + "test_loss": 8.535474667358399, + "test_acc": 0.0125, + "lyapunov": 1.6436351958443136, + "grad_norm": 0.8290693986791846, + "grad_max_sv": 0.3357673093676567, + "grad_min_sv": 1.5592837618316757e-08, + "grad_condition": 29777273.236415513, + "lr": 0.0008498316702566826, + "time_sec": 41.67509579658508 + }, + { + "epoch": 39, + "train_loss": 2.418079302215576, + "train_acc": 0.38104, + "test_loss": 8.728886996459961, + "test_acc": 0.0138, + "lyapunov": 1.6392356294500248, + "grad_norm": 0.8215527161857048, + "grad_max_sv": 0.33165409713983535, + "grad_min_sv": 1.5307788804423682e-08, + "grad_condition": 151642365.19854102, + "lr": 0.0008422735529643442, + "time_sec": 41.690041065216064 + }, + { + "epoch": 40, + "train_loss": 2.385871609649658, + "train_acc": 0.38864, + "test_loss": 7.529428874206543, + "test_acc": 0.0132, + "lyapunov": 1.6354777038554706, + "grad_norm": 0.8200733881789374, + "grad_max_sv": 0.3330301932990551, + "grad_min_sv": 1.5384999157985745e-08, + "grad_condition": 37189354.004172444, + "lr": 0.0008345653031794289, + "time_sec": 41.66628098487854 + }, + { + "epoch": 41, + "train_loss": 2.3330577777862547, + "train_acc": 0.40102, + "test_loss": 7.123234498596191, + "test_acc": 0.0249, + "lyapunov": 1.6323570756961012, + "grad_norm": 0.8204860309316497, + "grad_max_sv": 0.3341449283063412, + "grad_min_sv": 1.5524073795208925e-08, + "grad_condition": 51332515.62539954, + "lr": 0.0008267103019950526, + "time_sec": 41.658520460128784 + }, + { + "epoch": 42, + "train_loss": 2.3339556999969484, + "train_acc": 0.39776, + "test_loss": 7.333181537628174, + "test_acc": 0.0185, + "lyapunov": 1.6354230733783655, + "grad_norm": 0.8120092023544444, + "grad_max_sv": 0.32391806691884995, + "grad_min_sv": 1.5330058230483833e-08, + "grad_condition": 63172058.450652756, + "lr": 0.0008187119948743447, + "time_sec": 41.67036032676697 + }, + { + "epoch": 43, + "train_loss": 2.3197922330474854, + "train_acc": 0.40358, + "test_loss": 6.427054233551026, + "test_acc": 0.0136, + "lyapunov": 1.6421251245166943, + "grad_norm": 0.8092554387074351, + "grad_max_sv": 0.330906642973423, + "grad_min_sv": 1.526612713464992e-08, + "grad_condition": 26225823.13057729, + "lr": 0.000810573890139155, + "time_sec": 41.665225982666016 + }, + { + "epoch": 44, + "train_loss": 2.3195025100708007, + "train_acc": 0.4033, + "test_loss": 7.0808923698425295, + "test_acc": 0.0118, + "lyapunov": 1.656124430239353, + "grad_norm": 0.8044803007377996, + "grad_max_sv": 0.31877501383423806, + "grad_min_sv": 1.485775653065069e-08, + "grad_condition": 62435666.9732676, + "lr": 0.0008022995574311873, + "time_sec": 41.6713650226593 + }, + { + "epoch": 45, + "train_loss": 2.2802742100524904, + "train_acc": 0.41386, + "test_loss": 6.140260126495361, + "test_acc": 0.0112, + "lyapunov": 1.640040697649007, + "grad_norm": 0.8004818224905164, + "grad_max_sv": 0.31864383071660995, + "grad_min_sv": 1.4937468863218672e-08, + "grad_condition": 92954234.04941478, + "lr": 0.0007938926261462363, + "time_sec": 41.66809844970703 + }, + { + "epoch": 46, + "train_loss": 2.262954523010254, + "train_acc": 0.414, + "test_loss": 7.2938560546875, + "test_acc": 0.0101, + "lyapunov": 1.637706352316815, + "grad_norm": 0.793081854121529, + "grad_max_sv": 0.31840832754969595, + "grad_min_sv": 1.496939308343048e-08, + "grad_condition": 25865099.124858934, + "lr": 0.0007853567838422158, + "time_sec": 41.66623878479004 + }, + { + "epoch": 47, + "train_loss": 2.267263908538818, + "train_acc": 0.41344, + "test_loss": 6.906099589538575, + "test_acc": 0.012, + "lyapunov": 1.6311360786637992, + "grad_norm": 0.797780329526112, + "grad_max_sv": 0.31469214931130407, + "grad_min_sv": 1.4971078365899616e-08, + "grad_condition": 25611249.79088702, + "lr": 0.0007766957746216719, + "time_sec": 41.708776235580444 + }, + { + "epoch": 48, + "train_loss": 2.2475574452209472, + "train_acc": 0.41852, + "test_loss": 8.073319694519043, + "test_acc": 0.0096, + "lyapunov": 1.6334223103950092, + "grad_norm": 0.7869763323374519, + "grad_max_sv": 0.31651476472616197, + "grad_min_sv": 1.4959556110527573e-08, + "grad_condition": 24572781.086960234, + "lr": 0.0007679133974894982, + "time_sec": 41.682409048080444 + }, + { + "epoch": 49, + "train_loss": 2.2258160152435305, + "train_acc": 0.42326, + "test_loss": 7.22346753692627, + "test_acc": 0.01, + "lyapunov": 1.6582896377119567, + "grad_norm": 0.7915396840627938, + "grad_max_sv": 0.31868951208889484, + "grad_min_sv": 1.4694817633553736e-08, + "grad_condition": 37064015.276476786, + "lr": 0.000759013504686565, + "time_sec": 41.66550970077515 + }, + { + "epoch": 50, + "train_loss": 2.191147954711914, + "train_acc": 0.43136, + "test_loss": 7.067440712738037, + "test_acc": 0.0113, + "lyapunov": 1.6353955543254648, + "grad_norm": 0.7852910579053439, + "grad_max_sv": 0.3114649154245853, + "grad_min_sv": 1.4506057238912461e-08, + "grad_condition": 117782435.52166636, + "lr": 0.0007499999999999998, + "time_sec": 41.676011085510254 + }, + { + "epoch": 51, + "train_loss": 2.1769231742095947, + "train_acc": 0.43202, + "test_loss": 8.091367781066895, + "test_acc": 0.0106, + "lyapunov": 1.6262942616591978, + "grad_norm": 0.7849301566787954, + "grad_max_sv": 0.31383112370967864, + "grad_min_sv": 1.482414189180048e-08, + "grad_condition": 24814087.204268403, + "lr": 0.0007408768370508575, + "time_sec": 41.71332907676697 + }, + { + "epoch": 52, + "train_loss": 2.1791525329589843, + "train_acc": 0.43434, + "test_loss": 6.640031047058105, + "test_acc": 0.0101, + "lyapunov": 1.6475636553581414, + "grad_norm": 0.7748205713957207, + "grad_max_sv": 0.3011137217283249, + "grad_min_sv": 1.4537112300733179e-08, + "grad_condition": 122190974.86962557, + "lr": 0.0007316480175599307, + "time_sec": 41.6874144077301 + }, + { + "epoch": 53, + "train_loss": 2.177708456039429, + "train_acc": 0.43164, + "test_loss": 6.330417361450196, + "test_acc": 0.0124, + "lyapunov": 1.6483547099106146, + "grad_norm": 0.7832189933674929, + "grad_max_sv": 0.3086284928023815, + "grad_min_sv": 1.4681565554952592e-08, + "grad_condition": 39128451.13660244, + "lr": 0.0007223175895924635, + "time_sec": 41.67819046974182 + }, + { + "epoch": 54, + "train_loss": 2.155647780075073, + "train_acc": 0.43836, + "test_loss": 6.180060083007812, + "test_acc": 0.0168, + "lyapunov": 1.6432840284484123, + "grad_norm": 0.7691412493425369, + "grad_max_sv": 0.29928392022848127, + "grad_min_sv": 1.4252177091278462e-08, + "grad_condition": 33900536.02069519, + "lr": 0.0007128896457825361, + "time_sec": 41.750109910964966 + }, + { + "epoch": 55, + "train_loss": 2.1353805670928954, + "train_acc": 0.44186, + "test_loss": 7.257317136383056, + "test_acc": 0.0132, + "lyapunov": 1.6428052202210097, + "grad_norm": 0.7679438794422704, + "grad_max_sv": 0.30230089724063874, + "grad_min_sv": 1.4329349766473153e-08, + "grad_condition": 34802929.64081846, + "lr": 0.0007033683215378998, + "time_sec": 41.669835805892944 + }, + { + "epoch": 56, + "train_loss": 2.128101917114258, + "train_acc": 0.44428, + "test_loss": 7.373139286804199, + "test_acc": 0.0137, + "lyapunov": 1.6414129276714666, + "grad_norm": 0.7718923152736775, + "grad_max_sv": 0.2989685770124197, + "grad_min_sv": 1.451244842631816e-08, + "grad_condition": 26370279.022705477, + "lr": 0.0006937577932260512, + "time_sec": 41.67406344413757 + }, + { + "epoch": 57, + "train_loss": 2.137920976486206, + "train_acc": 0.44384, + "test_loss": 5.424753893280029, + "test_acc": 0.0111, + "lyapunov": 1.6554484230173214, + "grad_norm": 0.773511600768633, + "grad_max_sv": 0.294682040810585, + "grad_min_sv": 1.4318467259077927e-08, + "grad_condition": 26244116.009311978, + "lr": 0.0006840622763423388, + "time_sec": 41.68566060066223 + }, + { + "epoch": 58, + "train_loss": 2.1886442722320556, + "train_acc": 0.43186, + "test_loss": 6.545238864135742, + "test_acc": 0.0159, + "lyapunov": 1.6389995575560938, + "grad_norm": 0.770667566152431, + "grad_max_sv": 0.2981013923883438, + "grad_min_sv": 1.4503179252695065e-08, + "grad_condition": 46106578.838229105, + "lr": 0.0006742860236609073, + "time_sec": 41.69116020202637 + }, + { + "epoch": 59, + "train_loss": 2.1066105070495604, + "train_acc": 0.44986, + "test_loss": 7.391026984405517, + "test_acc": 0.0181, + "lyapunov": 1.6416400030750753, + "grad_norm": 0.7602483384951753, + "grad_max_sv": 0.2911146242171526, + "grad_min_sv": 1.4345006460816933e-08, + "grad_condition": 63690343.21158177, + "lr": 0.0006644333233692913, + "time_sec": 41.654924392700195 + }, + { + "epoch": 60, + "train_loss": 2.0506089850234988, + "train_acc": 0.46106, + "test_loss": 8.025833796691895, + "test_acc": 0.0159, + "lyapunov": 1.621927274157629, + "grad_norm": 0.7629731967669975, + "grad_max_sv": 0.2949394479393959, + "grad_min_sv": 1.4372729567613262e-08, + "grad_condition": 30309204.558091305, + "lr": 0.0006545084971874734, + "time_sec": 41.66482877731323 + }, + { + "epoch": 61, + "train_loss": 2.038806278114319, + "train_acc": 0.46484, + "test_loss": 9.74862598876953, + "test_acc": 0.01, + "lyapunov": 1.6300551010214763, + "grad_norm": 0.7587096227595913, + "grad_max_sv": 0.29696495905518533, + "grad_min_sv": 1.4256705770446243e-08, + "grad_condition": 99834698.98389995, + "lr": 0.0006445158984722354, + "time_sec": 41.67584776878357 + }, + { + "epoch": 62, + "train_loss": 2.065830835571289, + "train_acc": 0.45776, + "test_loss": 8.374367053222656, + "test_acc": 0.0106, + "lyapunov": 1.6421477361713224, + "grad_norm": 0.7635630118818492, + "grad_max_sv": 0.29152632839977743, + "grad_min_sv": 1.4168918681389808e-08, + "grad_condition": 49794193.0235935, + "lr": 0.0006344599103076324, + "time_sec": 41.70599865913391 + }, + { + "epoch": 63, + "train_loss": 2.06199690322876, + "train_acc": 0.45774, + "test_loss": 9.43989691772461, + "test_acc": 0.0143, + "lyapunov": 1.6391434187779341, + "grad_norm": 0.7626912434978755, + "grad_max_sv": 0.3007299728691578, + "grad_min_sv": 1.421240057031259e-08, + "grad_condition": 29364542.182565797, + "lr": 0.0006243449435824269, + "time_sec": 41.69278836250305 + }, + { + "epoch": 64, + "train_loss": 2.0462368117523195, + "train_acc": 0.46278, + "test_loss": 7.563213960266113, + "test_acc": 0.01, + "lyapunov": 1.6542154858484293, + "grad_norm": 0.7636972310186092, + "grad_max_sv": 0.2974775414913893, + "grad_min_sv": 1.4351465202344648e-08, + "grad_condition": 27137193.96425879, + "lr": 0.0006141754350553275, + "time_sec": 41.68390464782715 + }, + { + "epoch": 65, + "train_loss": 2.0235327534866334, + "train_acc": 0.46756, + "test_loss": 6.978350220489502, + "test_acc": 0.0098, + "lyapunov": 1.6490768569204814, + "grad_norm": 0.7584239144021073, + "grad_max_sv": 0.29015346951782706, + "grad_min_sv": 1.4414379233967933e-08, + "grad_condition": 56409329.68513076, + "lr": 0.0006039558454088793, + "time_sec": 41.70132231712341 + }, + { + "epoch": 66, + "train_loss": 2.0327218698120118, + "train_acc": 0.46344, + "test_loss": 6.808298188781738, + "test_acc": 0.016, + "lyapunov": 1.6421981882256316, + "grad_norm": 0.7632841139098454, + "grad_max_sv": 0.2945323955267668, + "grad_min_sv": 1.4372620408403813e-08, + "grad_condition": 79999394.91706361, + "lr": 0.000593690657292862, + "time_sec": 41.77633190155029 + }, + { + "epoch": 67, + "train_loss": 1.9898056484222413, + "train_acc": 0.47598, + "test_loss": 7.061488777160645, + "test_acc": 0.0109, + "lyapunov": 1.647677140467612, + "grad_norm": 0.7591590906188236, + "grad_max_sv": 0.296347975358367, + "grad_min_sv": 1.415571162510787e-08, + "grad_condition": 25155146.125877418, + "lr": 0.0005833843733580507, + "time_sec": 41.705756425857544 + }, + { + "epoch": 68, + "train_loss": 2.0102797174835203, + "train_acc": 0.47046, + "test_loss": 7.231464897918701, + "test_acc": 0.01, + "lyapunov": 1.6583749330257211, + "grad_norm": 0.754101966257317, + "grad_max_sv": 0.28500255234539507, + "grad_min_sv": 1.3903248727298312e-08, + "grad_condition": 29630876.42759655, + "lr": 0.0005730415142812054, + "time_sec": 41.72124171257019 + }, + { + "epoch": 69, + "train_loss": 2.04611669380188, + "train_acc": 0.46162, + "test_loss": 5.946302236938476, + "test_acc": 0.0107, + "lyapunov": 1.6569105533077895, + "grad_norm": 0.7572448125574305, + "grad_max_sv": 0.2827830083668232, + "grad_min_sv": 1.4111277255729471e-08, + "grad_condition": 53632120.18934096, + "lr": 0.0005626666167821517, + "time_sec": 41.66360831260681 + }, + { + "epoch": 70, + "train_loss": 1.9799313236999512, + "train_acc": 0.47786, + "test_loss": 5.791928797912598, + "test_acc": 0.0139, + "lyapunov": 1.659774536976729, + "grad_norm": 0.743881925858891, + "grad_max_sv": 0.2895107101649046, + "grad_min_sv": 1.3961023534458939e-08, + "grad_condition": 29278721.035794042, + "lr": 0.0005522642316338265, + "time_sec": 41.70555853843689 + }, + { + "epoch": 71, + "train_loss": 1.9502769188308715, + "train_acc": 0.48312, + "test_loss": 5.28058690032959, + "test_acc": 0.0122, + "lyapunov": 1.6549167751961047, + "grad_norm": 0.7494747344108936, + "grad_max_sv": 0.2851333416998386, + "grad_min_sv": 1.4076917760575888e-08, + "grad_condition": 331119741.39895195, + "lr": 0.0005418389216661573, + "time_sec": 41.68225932121277 + }, + { + "epoch": 72, + "train_loss": 1.9479334468841554, + "train_acc": 0.48628, + "test_loss": 7.984691355895996, + "test_acc": 0.0103, + "lyapunov": 1.653415890300975, + "grad_norm": 0.7477937354985393, + "grad_max_sv": 0.28984881937503815, + "grad_min_sv": 1.4043280075794196e-08, + "grad_condition": 119153928.06545302, + "lr": 0.0005313952597646563, + "time_sec": 41.65925407409668 + }, + { + "epoch": 73, + "train_loss": 1.967646238708496, + "train_acc": 0.47644, + "test_loss": 6.1665235633850095, + "test_acc": 0.0142, + "lyapunov": 1.65852049915382, + "grad_norm": 0.7579543653963434, + "grad_max_sv": 0.2979495331645012, + "grad_min_sv": 1.4386894665874283e-08, + "grad_condition": 39194921.11896709, + "lr": 0.0005209378268645994, + "time_sec": 41.68930411338806 + }, + { + "epoch": 74, + "train_loss": 1.9287460524368285, + "train_acc": 0.49016, + "test_loss": 6.917835614776611, + "test_acc": 0.011, + "lyapunov": 1.6452750241969858, + "grad_norm": 0.7457505107152974, + "grad_max_sv": 0.2847950000315905, + "grad_min_sv": 1.4118661037509916e-08, + "grad_condition": 24938980.26155622, + "lr": 0.0005104712099416781, + "time_sec": 41.67027688026428 + }, + { + "epoch": 75, + "train_loss": 1.9238459339141847, + "train_acc": 0.48922, + "test_loss": 7.703335245513916, + "test_acc": 0.0102, + "lyapunov": 1.636191079683621, + "grad_norm": 0.7456866026716246, + "grad_max_sv": 0.28741468451917174, + "grad_min_sv": 1.3977797050368501e-08, + "grad_condition": 33299832.87362317, + "lr": 0.0004999999999999996, + "time_sec": 41.668753147125244 + }, + { + "epoch": 76, + "train_loss": 1.9011995269012452, + "train_acc": 0.49452, + "test_loss": 6.336113402557373, + "test_acc": 0.0109, + "lyapunov": 1.6527920217465257, + "grad_norm": 0.7472940737131395, + "grad_max_sv": 0.28794192261993884, + "grad_min_sv": 1.3842809193365114e-08, + "grad_condition": 26648537.366496623, + "lr": 0.0004895287900583212, + "time_sec": 41.664530515670776 + }, + { + "epoch": 77, + "train_loss": 1.9055398291778565, + "train_acc": 0.49198, + "test_loss": 5.844799766540527, + "test_acc": 0.011, + "lyapunov": 1.652166176025215, + "grad_norm": 0.7477207101099883, + "grad_max_sv": 0.29006113260984423, + "grad_min_sv": 1.4085541283348491e-08, + "grad_condition": 24059920.597129285, + "lr": 0.0004790621731353997, + "time_sec": 41.67645764350891 + }, + { + "epoch": 78, + "train_loss": 1.8853045474624635, + "train_acc": 0.49528, + "test_loss": 5.736059879302979, + "test_acc": 0.0109, + "lyapunov": 1.6538786385065454, + "grad_norm": 0.7430364105793885, + "grad_max_sv": 0.2820361901074648, + "grad_min_sv": 1.3740982796224544e-08, + "grad_condition": 1051094146.3111416, + "lr": 0.000468604740235343, + "time_sec": 41.67271661758423 + }, + { + "epoch": 79, + "train_loss": 1.8873431278610229, + "train_acc": 0.49708, + "test_loss": 7.06695590133667, + "test_acc": 0.0098, + "lyapunov": 1.6691140817559285, + "grad_norm": 0.7474584387052425, + "grad_max_sv": 0.2899070601910353, + "grad_min_sv": 1.3942933266980483e-08, + "grad_condition": 53163427.383831725, + "lr": 0.00045816107833384175, + "time_sec": 41.661076068878174 + }, + { + "epoch": 80, + "train_loss": 1.8736388172149658, + "train_acc": 0.49874, + "test_loss": 5.781377349853516, + "test_acc": 0.0131, + "lyapunov": 1.657112023104792, + "grad_norm": 0.7444710747937686, + "grad_max_sv": 0.28176243752241137, + "grad_min_sv": 1.3972709403224648e-08, + "grad_condition": 135132346.79221177, + "lr": 0.0004477357683661729, + "time_sec": 41.64565968513489 + }, + { + "epoch": 81, + "train_loss": 1.8635578856658936, + "train_acc": 0.50138, + "test_loss": 5.580086952209473, + "test_acc": 0.0135, + "lyapunov": 1.653865757195846, + "grad_norm": 0.7426015737094843, + "grad_max_sv": 0.2836704090237617, + "grad_min_sv": 1.4010618162646134e-08, + "grad_condition": 417585965.539017, + "lr": 0.00043733338321784746, + "time_sec": 41.66704249382019 + }, + { + "epoch": 82, + "train_loss": 1.9041340649414062, + "train_acc": 0.49242, + "test_loss": 6.370015201568603, + "test_acc": 0.0105, + "lyapunov": 1.695511110908235, + "grad_norm": 0.7494004766823937, + "grad_max_sv": 0.2831845413893461, + "grad_min_sv": 1.4006210818928722e-08, + "grad_condition": 24462326.60074065, + "lr": 0.0004269584857187939, + "time_sec": 41.662867307662964 + }, + { + "epoch": 83, + "train_loss": 1.854377107772827, + "train_acc": 0.5052, + "test_loss": 5.641559513854981, + "test_acc": 0.0107, + "lyapunov": 1.6620670087502132, + "grad_norm": 0.7432254276366087, + "grad_max_sv": 0.2882852029055357, + "grad_min_sv": 1.3851731775482712e-08, + "grad_condition": 26065103.969512142, + "lr": 0.0004166156266419484, + "time_sec": 41.68649983406067 + }, + { + "epoch": 84, + "train_loss": 1.8346456706237793, + "train_acc": 0.50848, + "test_loss": 6.769210389709473, + "test_acc": 0.0098, + "lyapunov": 1.668327778806467, + "grad_norm": 0.7445172315386438, + "grad_max_sv": 0.2814629077911377, + "grad_min_sv": 1.3836396603461587e-08, + "grad_condition": 24738537.843654584, + "lr": 0.0004063093427071373, + "time_sec": 41.7318229675293 + }, + { + "epoch": 85, + "train_loss": 1.8456001781845093, + "train_acc": 0.50552, + "test_loss": 5.615997741699219, + "test_acc": 0.0104, + "lyapunov": 1.6713733606021424, + "grad_norm": 0.745556048003164, + "grad_max_sv": 0.2879165679216385, + "grad_min_sv": 1.3856432721365275e-08, + "grad_condition": 45763261.566603445, + "lr": 0.0003960441545911199, + "time_sec": 41.671313762664795 + }, + { + "epoch": 86, + "train_loss": 1.8304506510925294, + "train_acc": 0.5126, + "test_loss": 7.119636929321289, + "test_acc": 0.0095, + "lyapunov": 1.6572847131573025, + "grad_norm": 0.742253787791735, + "grad_max_sv": 0.2842376373708248, + "grad_min_sv": 1.3829741059290246e-08, + "grad_condition": 32092921.731909145, + "lr": 0.0003858245649446718, + "time_sec": 41.68160605430603 + }, + { + "epoch": 87, + "train_loss": 1.8023982585525513, + "train_acc": 0.51886, + "test_loss": 5.729539224243164, + "test_acc": 0.0113, + "lyapunov": 1.6674704252911345, + "grad_norm": 0.7383133748182458, + "grad_max_sv": 0.2829333432018757, + "grad_min_sv": 1.3776665358511409e-08, + "grad_condition": 29369631.195804454, + "lr": 0.00037565505641757235, + "time_sec": 41.688772439956665 + }, + { + "epoch": 88, + "train_loss": 1.7957932733535766, + "train_acc": 0.51898, + "test_loss": 6.201405425262451, + "test_acc": 0.0112, + "lyapunov": 1.655544286188872, + "grad_norm": 0.7434211551258653, + "grad_max_sv": 0.2823782742023468, + "grad_min_sv": 1.3752334167282942e-08, + "grad_condition": 31024474.496423542, + "lr": 0.00036554008969236695, + "time_sec": 41.69476914405823 + }, + { + "epoch": 89, + "train_loss": 1.8189633627319335, + "train_acc": 0.51594, + "test_loss": 5.3315957733154296, + "test_acc": 0.0128, + "lyapunov": 1.6864432809907761, + "grad_norm": 0.7442939461149828, + "grad_max_sv": 0.2862010933458805, + "grad_min_sv": 1.3637743116745593e-08, + "grad_condition": 59934587.44977188, + "lr": 0.0003554841015277638, + "time_sec": 41.66425442695618 + }, + { + "epoch": 90, + "train_loss": 1.7849925768280028, + "train_acc": 0.52188, + "test_loss": 5.472545378112793, + "test_acc": 0.0127, + "lyapunov": 1.6630497878164892, + "grad_norm": 0.7379404154374459, + "grad_max_sv": 0.27791005559265614, + "grad_min_sv": 1.3561169532293193e-08, + "grad_condition": 146436762.42535684, + "lr": 0.000345491502812526, + "time_sec": 41.68130135536194 + }, + { + "epoch": 91, + "train_loss": 1.7678911954879761, + "train_acc": 0.52792, + "test_loss": 5.433208572387695, + "test_acc": 0.0111, + "lyapunov": 1.6612660357409426, + "grad_norm": 0.7436136899756786, + "grad_max_sv": 0.28643885627388954, + "grad_min_sv": 1.4077170534636252e-08, + "grad_condition": 141313299.4033515, + "lr": 0.0003355666766307081, + "time_sec": 41.69838857650757 + }, + { + "epoch": 92, + "train_loss": 1.7893417644119263, + "train_acc": 0.52188, + "test_loss": 5.732446333312988, + "test_acc": 0.0132, + "lyapunov": 1.6719880662001003, + "grad_norm": 0.7430166658849362, + "grad_max_sv": 0.2796207364648581, + "grad_min_sv": 1.370609366835307e-08, + "grad_condition": 61381680.96914546, + "lr": 0.00032571397633909225, + "time_sec": 41.662304639816284 + }, + { + "epoch": 93, + "train_loss": 1.793455412979126, + "train_acc": 0.51948, + "test_loss": 7.157857987976074, + "test_acc": 0.0156, + "lyapunov": 1.7097750539365022, + "grad_norm": 0.7503715678180837, + "grad_max_sv": 0.2879045564681292, + "grad_min_sv": 1.3920300624692405e-08, + "grad_condition": 46032234.96350131, + "lr": 0.00031593772365766094, + "time_sec": 41.68742322921753 + }, + { + "epoch": 94, + "train_loss": 1.790754737892151, + "train_acc": 0.51794, + "test_loss": 5.853521730041504, + "test_acc": 0.0183, + "lyapunov": 1.7012710964588253, + "grad_norm": 0.7508761734251582, + "grad_max_sv": 0.2927242830395699, + "grad_min_sv": 1.3959867344037757e-08, + "grad_condition": 30783098.824512742, + "lr": 0.0003062422067739483, + "time_sec": 41.696484327316284 + }, + { + "epoch": 95, + "train_loss": 1.7357876617050172, + "train_acc": 0.53082, + "test_loss": 5.843491268157959, + "test_acc": 0.0169, + "lyapunov": 1.6724172071422763, + "grad_norm": 0.7362974967473044, + "grad_max_sv": 0.28096207305788995, + "grad_min_sv": 1.3731502089206483e-08, + "grad_condition": 72155189.25605753, + "lr": 0.00029663167846209965, + "time_sec": 41.801615715026855 + }, + { + "epoch": 96, + "train_loss": 1.7516635646438599, + "train_acc": 0.529, + "test_loss": 5.930022283935547, + "test_acc": 0.0166, + "lyapunov": 1.6662769326773446, + "grad_norm": 0.7418130914367154, + "grad_max_sv": 0.27851024977862837, + "grad_min_sv": 1.3786014568806238e-08, + "grad_condition": 27146249.501743816, + "lr": 0.00028711035421746345, + "time_sec": 41.690131187438965 + }, + { + "epoch": 97, + "train_loss": 1.725118031539917, + "train_acc": 0.53522, + "test_loss": 7.037702999877929, + "test_acc": 0.0131, + "lyapunov": 1.6579057100178944, + "grad_norm": 0.7402503506761774, + "grad_max_sv": 0.2801696177572012, + "grad_min_sv": 1.3907192450424154e-08, + "grad_condition": 27217829.233857714, + "lr": 0.00027768241040753615, + "time_sec": 41.68803310394287 + }, + { + "epoch": 98, + "train_loss": 1.7803752786254883, + "train_acc": 0.52198, + "test_loss": 5.421708882141114, + "test_acc": 0.0156, + "lyapunov": 1.718612858706423, + "grad_norm": 0.7413849451100987, + "grad_max_sv": 0.2769254602491856, + "grad_min_sv": 1.3933566225636517e-08, + "grad_condition": 207039935.91921127, + "lr": 0.00026835198244006903, + "time_sec": 41.684860706329346 + }, + { + "epoch": 99, + "train_loss": 1.7348972189331056, + "train_acc": 0.53522, + "test_loss": 5.996163872528077, + "test_acc": 0.0138, + "lyapunov": 1.7001579844433328, + "grad_norm": 0.7422689999529027, + "grad_max_sv": 0.284788579121232, + "grad_min_sv": 1.3718373463589284e-08, + "grad_condition": 32133144.908362694, + "lr": 0.0002591231629491421, + "time_sec": 41.687785148620605 + }, + { + "epoch": 100, + "train_loss": 1.715971527557373, + "train_acc": 0.53706, + "test_loss": 5.193750161743164, + "test_acc": 0.0145, + "lyapunov": 1.678100373738867, + "grad_norm": 0.7359745614466124, + "grad_max_sv": 0.2779096748679876, + "grad_min_sv": 1.3629619793897874e-08, + "grad_condition": 45906662.87529864, + "lr": 0.0002499999999999997, + "time_sec": 41.68041801452637 + }, + { + "epoch": 101, + "train_loss": 1.7047844717025757, + "train_acc": 0.54014, + "test_loss": 5.4800733383178715, + "test_acc": 0.0147, + "lyapunov": 1.6837563725078808, + "grad_norm": 0.9365648414768546, + "grad_max_sv": 0.27644540667533873, + "grad_min_sv": 1.338469317047064e-08, + "grad_condition": 58253933.98672454, + "lr": 0.00024098649531343477, + "time_sec": 41.69390559196472 + }, + { + "epoch": 102, + "train_loss": 1.7108585023498535, + "train_acc": 0.53936, + "test_loss": 5.4571699615478515, + "test_acc": 0.0158, + "lyapunov": 1.6604459846720976, + "grad_norm": 0.7870713313934493, + "grad_max_sv": 0.2845739547163248, + "grad_min_sv": 1.3875931419160548e-08, + "grad_condition": 29653372.68228669, + "lr": 0.0002320866025105016, + "time_sec": 41.69141387939453 + }, + { + "epoch": 103, + "train_loss": 1.7227560781860352, + "train_acc": 0.53538, + "test_loss": 6.349255479431152, + "test_acc": 0.0136, + "lyapunov": 1.6870903968811035, + "grad_norm": 0.7434197839636765, + "grad_max_sv": 0.2914551913738251, + "grad_min_sv": 1.3957845548806525e-08, + "grad_condition": 32995362.81324634, + "lr": 0.0002233042253783278, + "time_sec": 41.680914640426636 + }, + { + "epoch": 104, + "train_loss": 1.702695262298584, + "train_acc": 0.53836, + "test_loss": 5.656436128234863, + "test_acc": 0.015, + "lyapunov": 1.6825833451717407, + "grad_norm": 0.7549456718817885, + "grad_max_sv": 0.2799145434051752, + "grad_min_sv": 1.3645678115237203e-08, + "grad_condition": 28379554.63119031, + "lr": 0.000214643216157784, + "time_sec": 41.65440130233765 + }, + { + "epoch": 105, + "train_loss": 1.6862115913772584, + "train_acc": 0.54564, + "test_loss": 5.472533478546143, + "test_acc": 0.0126, + "lyapunov": 1.7024933560120175, + "grad_norm": 1.26630705617649, + "grad_max_sv": 0.279131243750453, + "grad_min_sv": 1.38689274988002e-08, + "grad_condition": 38224107.421842635, + "lr": 0.00020610737385376332, + "time_sec": 41.66117596626282 + }, + { + "epoch": 106, + "train_loss": 1.6867632722473145, + "train_acc": 0.54602, + "test_loss": 5.890195466613769, + "test_acc": 0.0123, + "lyapunov": 1.6856458394423774, + "grad_norm": 0.8947104093954833, + "grad_max_sv": 0.28173881731927397, + "grad_min_sv": 1.3741654582635766e-08, + "grad_condition": 79792220.50526081, + "lr": 0.00019770044256881242, + "time_sec": 41.68054246902466 + }, + { + "epoch": 107, + "train_loss": 1.6547852846908568, + "train_acc": 0.55128, + "test_loss": 5.426952139282227, + "test_acc": 0.0138, + "lyapunov": 1.6635038605736345, + "grad_norm": 0.9461038074599576, + "grad_max_sv": 0.28091032803058624, + "grad_min_sv": 1.3631295835148105e-08, + "grad_condition": 121284689.6114355, + "lr": 0.0001894261098608447, + "time_sec": 41.6701295375824 + }, + { + "epoch": 108, + "train_loss": 1.6798790365219116, + "train_acc": 0.54798, + "test_loss": 6.159035799407959, + "test_acc": 0.0164, + "lyapunov": 1.6929522896056894, + "grad_norm": 0.743883475009877, + "grad_max_sv": 0.28309045545756817, + "grad_min_sv": 1.3724124101055502e-08, + "grad_condition": 39239015.729782544, + "lr": 0.000181288005125655, + "time_sec": 41.696985960006714 + }, + { + "epoch": 109, + "train_loss": 1.696175348777771, + "train_acc": 0.54438, + "test_loss": 5.6951647491455075, + "test_acc": 0.016, + "lyapunov": 1.7148385203402976, + "grad_norm": 0.8437266984263797, + "grad_max_sv": 0.27865533195436, + "grad_min_sv": 1.3687295685738121e-08, + "grad_condition": 84166239.98915759, + "lr": 0.0001732896980049473, + "time_sec": 41.71509552001953 + }, + { + "epoch": 110, + "train_loss": 1.6658023331832885, + "train_acc": 0.55012, + "test_loss": 5.7984600807189945, + "test_acc": 0.0143, + "lyapunov": 1.6841092344440158, + "grad_norm": 0.9121109366716545, + "grad_max_sv": 0.29167514853179455, + "grad_min_sv": 1.3800432944674478e-08, + "grad_condition": 144511278.99640113, + "lr": 0.00016543469682057076, + "time_sec": 41.66339421272278 + }, + { + "epoch": 111, + "train_loss": 1.6395328227615356, + "train_acc": 0.554, + "test_loss": 5.86650054473877, + "test_acc": 0.0152, + "lyapunov": 1.6673833018983417, + "grad_norm": 0.7699631101372096, + "grad_max_sv": 0.28348692767322065, + "grad_min_sv": 1.3636408227601927e-08, + "grad_condition": 55378180.92666749, + "lr": 0.00015772644703565552, + "time_sec": 41.665539026260376 + }, + { + "epoch": 112, + "train_loss": 1.6477852906799317, + "train_acc": 0.55158, + "test_loss": 5.940995491790772, + "test_acc": 0.0112, + "lyapunov": 1.6873568881808034, + "grad_norm": 0.7479570199711284, + "grad_max_sv": 0.28565193973481656, + "grad_min_sv": 1.3545885212663486e-08, + "grad_condition": 4195243968.2445326, + "lr": 0.00015016832974331713, + "time_sec": 41.66239333152771 + }, + { + "epoch": 113, + "train_loss": 1.6797285276412963, + "train_acc": 0.54658, + "test_loss": 5.699360008239746, + "test_acc": 0.0169, + "lyapunov": 1.7014049044655413, + "grad_norm": 0.870968251009497, + "grad_max_sv": 0.29082027412950995, + "grad_min_sv": 1.3837160986462926e-08, + "grad_condition": 38795421.79244965, + "lr": 0.00014276366018359834, + "time_sec": 41.68905782699585 + }, + { + "epoch": 114, + "train_loss": 1.6465518449401855, + "train_acc": 0.55668, + "test_loss": 6.088453164672852, + "test_acc": 0.0164, + "lyapunov": 1.7043657921769124, + "grad_norm": 0.8946839109968647, + "grad_max_sv": 0.2849067386239767, + "grad_min_sv": 1.3802866963286143e-08, + "grad_condition": 25630247.743903965, + "lr": 0.00013551568628929425, + "time_sec": 41.66656756401062 + }, + { + "epoch": 115, + "train_loss": 1.6319327460479736, + "train_acc": 0.55656, + "test_loss": 6.832156317138672, + "test_acc": 0.0153, + "lyapunov": 1.7021731708360754, + "grad_norm": 0.7410352883319467, + "grad_max_sv": 0.28490288034081457, + "grad_min_sv": 1.3852848871828693e-08, + "grad_condition": 105769705.67995845, + "lr": 0.00012842758726130276, + "time_sec": 41.65516543388367 + }, + { + "epoch": 116, + "train_loss": 1.6370894707107544, + "train_acc": 0.55944, + "test_loss": 6.086082221984864, + "test_acc": 0.0152, + "lyapunov": 1.704162275089937, + "grad_norm": 0.7404525214110508, + "grad_max_sv": 0.2851620279252529, + "grad_min_sv": 1.3774486038592437e-08, + "grad_condition": 64341791.17616973, + "lr": 0.0001215024721741218, + "time_sec": 41.70033001899719 + }, + { + "epoch": 117, + "train_loss": 1.6296995531082152, + "train_acc": 0.5565, + "test_loss": 5.999611178588867, + "test_acc": 0.0158, + "lyapunov": 1.6899978895016643, + "grad_norm": 0.7413749466972203, + "grad_max_sv": 0.28470359593629835, + "grad_min_sv": 1.3795419027962108e-08, + "grad_condition": 46293176.84023976, + "lr": 0.00011474337861210538, + "time_sec": 41.66957759857178 + }, + { + "epoch": 118, + "train_loss": 1.6183696263122558, + "train_acc": 0.56042, + "test_loss": 5.902465699768066, + "test_acc": 0.0155, + "lyapunov": 1.6653556753607357, + "grad_norm": 0.752028873574231, + "grad_max_sv": 0.2849472999572754, + "grad_min_sv": 1.3723038618310146e-08, + "grad_condition": 108717082.80762736, + "lr": 0.00010815327133708009, + "time_sec": 41.65808391571045 + }, + { + "epoch": 119, + "train_loss": 1.6181411283111573, + "train_acc": 0.56246, + "test_loss": 5.821061138153076, + "test_acc": 0.0127, + "lyapunov": 1.6990043498061198, + "grad_norm": 0.9212306864426181, + "grad_max_sv": 0.2813797727227211, + "grad_min_sv": 1.3685392258322438e-08, + "grad_condition": 36721469.46741449, + "lr": 0.00010173504098790182, + "time_sec": 41.65668511390686 + }, + { + "epoch": 120, + "train_loss": 1.6332576264572143, + "train_acc": 0.55946, + "test_loss": 5.637864579772949, + "test_acc": 0.0158, + "lyapunov": 1.7040051304165968, + "grad_norm": 0.8758295019344725, + "grad_max_sv": 0.2898151889443398, + "grad_min_sv": 1.4175130585991625e-08, + "grad_condition": 40539456.12140705, + "lr": 9.549150281252629e-05, + "time_sec": 41.7333300113678 + }, + { + "epoch": 121, + "train_loss": 1.6032706314468383, + "train_acc": 0.56424, + "test_loss": 6.044293823242188, + "test_acc": 0.0161, + "lyapunov": 1.687883598420321, + "grad_norm": 0.8855358425086, + "grad_max_sv": 0.28492439053952695, + "grad_min_sv": 1.3791471256685561e-08, + "grad_condition": 26792072.142948806, + "lr": 8.942539543314794e-05, + "time_sec": 41.69478678703308 + }, + { + "epoch": 122, + "train_loss": 1.6067510599517822, + "train_acc": 0.56546, + "test_loss": 6.217616750335694, + "test_acc": 0.0169, + "lyapunov": 1.6955407583500113, + "grad_norm": 1.007631118576203, + "grad_max_sv": 0.2878258924931288, + "grad_min_sv": 1.3879796437188396e-08, + "grad_condition": 33084555.795453023, + "lr": 8.353937964495024e-05, + "time_sec": 41.67023324966431 + }, + { + "epoch": 123, + "train_loss": 1.6053743167114258, + "train_acc": 0.56268, + "test_loss": 6.328966861724854, + "test_acc": 0.0153, + "lyapunov": 1.6795075369612944, + "grad_norm": 0.8699000468731735, + "grad_max_sv": 0.2898880571126938, + "grad_min_sv": 1.3709727229513358e-08, + "grad_condition": 124246234.40071194, + "lr": 7.783603724899243e-05, + "time_sec": 41.660712242126465 + }, + { + "epoch": 124, + "train_loss": 1.6071837269973754, + "train_acc": 0.56286, + "test_loss": 6.1388191246032715, + "test_acc": 0.0167, + "lyapunov": 1.7264370232286965, + "grad_norm": 0.8940529497792777, + "grad_max_sv": 0.28389453068375586, + "grad_min_sv": 1.3959469480351316e-08, + "grad_condition": 24432394.03377783, + "lr": 7.231786991974666e-05, + "time_sec": 41.68312621116638 + }, + { + "epoch": 125, + "train_loss": 1.6100223978042603, + "train_acc": 0.56692, + "test_loss": 5.9885783233642575, + "test_acc": 0.0166, + "lyapunov": 1.7270872559388886, + "grad_norm": 1.0226142905420907, + "grad_max_sv": 0.28528097458183765, + "grad_min_sv": 1.3753909883229553e-08, + "grad_condition": 59401243.51928474, + "lr": 6.698729810778072e-05, + "time_sec": 41.70276618003845 + }, + { + "epoch": 126, + "train_loss": 1.6035814072036743, + "train_acc": 0.56344, + "test_loss": 6.076493969726562, + "test_acc": 0.011, + "lyapunov": 1.6876506253581522, + "grad_norm": 0.9642119889310449, + "grad_max_sv": 0.2870322696864605, + "grad_min_sv": 1.3708104407150756e-08, + "grad_condition": 28048573.443991415, + "lr": 6.184665997806817e-05, + "time_sec": 41.8551926612854 + }, + { + "epoch": 127, + "train_loss": 1.6120177191162108, + "train_acc": 0.56444, + "test_loss": 6.843795123291016, + "test_acc": 0.0159, + "lyapunov": 1.7337111725526697, + "grad_norm": 0.8368578920332793, + "grad_max_sv": 0.28001562878489494, + "grad_min_sv": 1.3889535929734187e-08, + "grad_condition": 62985977.61673013, + "lr": 5.6898210384392595e-05, + "time_sec": 41.68673539161682 + }, + { + "epoch": 128, + "train_loss": 1.6090134407424928, + "train_acc": 0.56466, + "test_loss": 6.320640184783936, + "test_acc": 0.0146, + "lyapunov": 1.7266684904732668, + "grad_norm": 0.7858511448483877, + "grad_max_sv": 0.2850359447300434, + "grad_min_sv": 1.3702059388498444e-08, + "grad_condition": 42801480.40100025, + "lr": 5.214411988029363e-05, + "time_sec": 41.68818187713623 + }, + { + "epoch": 129, + "train_loss": 1.6249183625030517, + "train_acc": 0.56476, + "test_loss": 6.549667198181153, + "test_acc": 0.0162, + "lyapunov": 1.8164921944098704, + "grad_norm": 1.5114520241024798, + "grad_max_sv": 0.2812469657510519, + "grad_min_sv": 1.3925696595862291e-08, + "grad_condition": 57029114.93811275, + "lr": 4.7586473766990294e-05, + "time_sec": 41.79629635810852 + }, + { + "epoch": 130, + "train_loss": 1.5824087297058105, + "train_acc": 0.57044, + "test_loss": 6.021063035583496, + "test_acc": 0.0176, + "lyapunov": 1.70903730880269, + "grad_norm": 0.7379608621319285, + "grad_max_sv": 0.279190668836236, + "grad_min_sv": 1.3621928689200313e-08, + "grad_condition": 32815172.113138717, + "lr": 4.32272711786996e-05, + "time_sec": 41.70122241973877 + }, + { + "epoch": 131, + "train_loss": 1.595119048576355, + "train_acc": 0.56984, + "test_loss": 6.4952160888671875, + "test_acc": 0.0155, + "lyapunov": 1.754641688083444, + "grad_norm": 1.0023213514600722, + "grad_max_sv": 0.2834797468036413, + "grad_min_sv": 1.3511996389131698e-08, + "grad_condition": 68519633.56325917, + "lr": 3.906842420574966e-05, + "time_sec": 41.72273635864258 + }, + { + "epoch": 132, + "train_loss": 1.5923931760787964, + "train_acc": 0.57014, + "test_loss": 6.346144076538086, + "test_acc": 0.0148, + "lyapunov": 1.73292323177123, + "grad_norm": 0.7501780068501551, + "grad_max_sv": 0.28294241838157175, + "grad_min_sv": 1.389686744160748e-08, + "grad_condition": 365347440.4407994, + "lr": 3.5111757055874305e-05, + "time_sec": 41.898685693740845 + }, + { + "epoch": 133, + "train_loss": 1.6026707472991943, + "train_acc": 0.57266, + "test_loss": 6.185466950988769, + "test_acc": 0.0179, + "lyapunov": 1.8438011843834996, + "grad_norm": 0.9394783942730687, + "grad_max_sv": 0.2847215086221695, + "grad_min_sv": 1.390161358527653e-08, + "grad_condition": 34103085.04162355, + "lr": 3.1359005254054254e-05, + "time_sec": 41.84562015533447 + }, + { + "epoch": 134, + "train_loss": 1.6043600881576539, + "train_acc": 0.56972, + "test_loss": 6.54779362411499, + "test_acc": 0.0168, + "lyapunov": 1.8157421551701967, + "grad_norm": 0.9578717543319566, + "grad_max_sv": 0.2788985829800367, + "grad_min_sv": 1.373801071791192e-08, + "grad_condition": 33295442.566805385, + "lr": 2.7811814881259484e-05, + "time_sec": 41.748968839645386 + }, + { + "epoch": 135, + "train_loss": 1.6008320109558105, + "train_acc": 0.56734, + "test_loss": 6.480984884643554, + "test_acc": 0.0164, + "lyapunov": 1.824832089111933, + "grad_norm": 0.7833960844227048, + "grad_max_sv": 0.2834679901599884, + "grad_min_sv": 1.3707274611196584e-08, + "grad_condition": 34742063.3411188, + "lr": 2.4471741852423218e-05, + "time_sec": 41.679542541503906 + }, + { + "epoch": 136, + "train_loss": 1.6033842488479615, + "train_acc": 0.57426, + "test_loss": 6.3071887496948245, + "test_acc": 0.0161, + "lyapunov": 1.8717652309276258, + "grad_norm": 1.1623205937404684, + "grad_max_sv": 0.28173171132802965, + "grad_min_sv": 1.3602863799255793e-08, + "grad_condition": 47504661.60977468, + "lr": 2.1340251233966362e-05, + "time_sec": 41.70148062705994 + }, + { + "epoch": 137, + "train_loss": 1.585039638633728, + "train_acc": 0.57336, + "test_loss": 6.212019223022461, + "test_acc": 0.0167, + "lyapunov": 1.8105511723272025, + "grad_norm": 0.76774524189785, + "grad_max_sv": 0.2841952469199896, + "grad_min_sv": 1.3692064346898514e-08, + "grad_condition": 45911317.56625296, + "lr": 1.8418716601170932e-05, + "time_sec": 41.718605279922485 + }, + { + "epoch": 138, + "train_loss": 1.584446519355774, + "train_acc": 0.57526, + "test_loss": 6.243849922943115, + "test_acc": 0.0165, + "lyapunov": 1.828900443928321, + "grad_norm": 0.7339440588405652, + "grad_max_sv": 0.2821473300457001, + "grad_min_sv": 1.3492376377960413e-08, + "grad_condition": 46486868.242411375, + "lr": 1.570841943568445e-05, + "time_sec": 41.803757667541504 + }, + { + "epoch": 139, + "train_loss": 1.591472290611267, + "train_acc": 0.57168, + "test_loss": 6.332618227386474, + "test_acc": 0.0164, + "lyapunov": 1.8522861116682476, + "grad_norm": 0.7344821119501195, + "grad_max_sv": 0.2718358475714922, + "grad_min_sv": 1.3269187557063412e-08, + "grad_condition": 28030061.559468903, + "lr": 1.3210548563419845e-05, + "time_sec": 41.6920862197876 + }, + { + "epoch": 140, + "train_loss": 1.614663985748291, + "train_acc": 0.57106, + "test_loss": 6.035421504974365, + "test_acc": 0.0166, + "lyapunov": 1.865170035825666, + "grad_norm": 0.7488812688556887, + "grad_max_sv": 0.28298918418586255, + "grad_min_sv": 1.3682502991718692e-08, + "grad_condition": 24201290.710221395, + "lr": 1.0926199633097203e-05, + "time_sec": 41.67938685417175 + }, + { + "epoch": 141, + "train_loss": 1.602144892578125, + "train_acc": 0.57176, + "test_loss": 6.090472431182861, + "test_acc": 0.0168, + "lyapunov": 1.8573481064013508, + "grad_norm": 0.9964350746023342, + "grad_max_sv": 0.28083013482391833, + "grad_min_sv": 1.342545436419651e-08, + "grad_condition": 71076432.31589943, + "lr": 8.856374635655688e-06, + "time_sec": 41.67989158630371 + }, + { + "epoch": 142, + "train_loss": 1.5910524003982545, + "train_acc": 0.574, + "test_loss": 6.0493482467651365, + "test_acc": 0.0167, + "lyapunov": 1.8519471301447095, + "grad_norm": 0.7327372969700953, + "grad_max_sv": 0.28154470436275003, + "grad_min_sv": 1.3814112725940574e-08, + "grad_condition": 40685021.10874365, + "lr": 7.001981464747503e-06, + "time_sec": 41.87545084953308 + }, + { + "epoch": 143, + "train_loss": 1.5878816836166383, + "train_acc": 0.5754, + "test_loss": 6.0228049758911135, + "test_acc": 0.0173, + "lyapunov": 1.835201174096988, + "grad_norm": 0.7329380251080414, + "grad_max_sv": 0.2804208301007748, + "grad_min_sv": 1.3855345770696913e-08, + "grad_condition": 24866442.419618618, + "lr": 5.3638335185058295e-06, + "time_sec": 41.670424938201904 + }, + { + "epoch": 144, + "train_loss": 1.5844879238891603, + "train_acc": 0.57532, + "test_loss": 6.013319036102295, + "test_acc": 0.0167, + "lyapunov": 1.797589682557089, + "grad_norm": 0.7332915407418003, + "grad_max_sv": 0.2873740203678608, + "grad_min_sv": 1.3867528024166797e-08, + "grad_condition": 66782743.82880296, + "lr": 3.942649342761114e-06, + "time_sec": 41.666340827941895 + }, + { + "epoch": 145, + "train_loss": 1.5729130697250366, + "train_acc": 0.57884, + "test_loss": 5.962558745574952, + "test_acc": 0.0174, + "lyapunov": 1.8133810779932515, + "grad_norm": 0.7304773544167381, + "grad_max_sv": 0.2831062778830528, + "grad_min_sv": 1.3597974729551154e-08, + "grad_condition": 27885577.58840422, + "lr": 2.7390523158633524e-06, + "time_sec": 41.66122889518738 + }, + { + "epoch": 146, + "train_loss": 1.5774464596939086, + "train_acc": 0.57336, + "test_loss": 6.056200170898437, + "test_acc": 0.0176, + "lyapunov": 1.8052761911431237, + "grad_norm": 0.7323581109158898, + "grad_max_sv": 0.27999263890087606, + "grad_min_sv": 1.3672255842755998e-08, + "grad_condition": 30955091.121420026, + "lr": 1.7535703752478133e-06, + "time_sec": 41.6817889213562 + }, + { + "epoch": 147, + "train_loss": 1.5797025276184082, + "train_acc": 0.57294, + "test_loss": 6.142494761657715, + "test_acc": 0.0163, + "lyapunov": 1.8119597739880653, + "grad_norm": 0.7326729565983514, + "grad_max_sv": 0.2801577255129814, + "grad_min_sv": 1.3520314751103158e-08, + "grad_condition": 24177790.25879824, + "lr": 9.866357858642196e-07, + "time_sec": 41.667490005493164 + }, + { + "epoch": 148, + "train_loss": 1.5737435025787354, + "train_acc": 0.57896, + "test_loss": 6.0964897369384765, + "test_acc": 0.016, + "lyapunov": 1.8165211808651, + "grad_norm": 0.7295448230456424, + "grad_max_sv": 0.2751427095383406, + "grad_min_sv": 1.348928903022184e-08, + "grad_condition": 24265473.368122566, + "lr": 4.38584950570808e-07, + "time_sec": 41.68909525871277 + }, + { + "epoch": 149, + "train_loss": 1.5774297478485106, + "train_acc": 0.5743, + "test_loss": 6.148982523345947, + "test_acc": 0.0159, + "lyapunov": 1.8202249927593923, + "grad_norm": 0.7313561355684882, + "grad_max_sv": 0.2817809645086527, + "grad_min_sv": 1.3657219487261951e-08, + "grad_condition": 38822037.86584419, + "lr": 1.096582625772501e-07, + "time_sec": 41.70693755149841 + }, + { + "epoch": 150, + "train_loss": 1.5808244900512696, + "train_acc": 0.57584, + "test_loss": 5.973857634735108, + "test_acc": 0.0172, + "lyapunov": 1.8156279499268593, + "grad_norm": 0.7308465286184226, + "grad_max_sv": 0.28174142725765705, + "grad_min_sv": 1.372764353510525e-08, + "grad_condition": 43888249.75048177, + "lr": 0.0, + "time_sec": 41.68298602104187 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 5.021671794891358, + "train_acc": 0.02426, + "test_loss": 4.758953214263916, + "test_acc": 0.0194, + "lyapunov": 2.365524544740272, + "grad_norm": 5.666214881321602, + "grad_max_sv": 4.635834372043609, + "grad_min_sv": 9.740842493444202e-08, + "grad_condition": 345906665.41414034, + "lr": 0.0009998903417374227, + "time_sec": 86.94375228881836 + }, + { + "epoch": 2, + "train_loss": 4.6419046446228025, + "train_acc": 0.03036, + "test_loss": 4.812141468811035, + "test_acc": 0.0141, + "lyapunov": 1.8034114608984164, + "grad_norm": 3.7942354948877397, + "grad_max_sv": 2.932516324520111, + "grad_min_sv": 6.569729187888563e-08, + "grad_condition": 162956558.25651228, + "lr": 0.0009995614150494292, + "time_sec": 86.91073846817017 + }, + { + "epoch": 3, + "train_loss": 4.522548667297364, + "train_acc": 0.03148, + "test_loss": 4.54623723449707, + "test_acc": 0.0238, + "lyapunov": 1.6952560444926972, + "grad_norm": 2.3455501053352146, + "grad_max_sv": 1.7244864150881767, + "grad_min_sv": 4.1950142698997384e-08, + "grad_condition": 6680092616.82326, + "lr": 0.0009990133642141358, + "time_sec": 86.88951110839844 + }, + { + "epoch": 4, + "train_loss": 4.4614645977783205, + "train_acc": 0.0325, + "test_loss": 5.176557122039795, + "test_acc": 0.0101, + "lyapunov": 1.6139005059781282, + "grad_norm": 1.5168077426412896, + "grad_max_sv": 0.9842755444347858, + "grad_min_sv": 2.4031745480719025e-08, + "grad_condition": 11261049173.025684, + "lr": 0.0009982464296247522, + "time_sec": 86.94786024093628 + }, + { + "epoch": 5, + "train_loss": 4.4149443920898435, + "train_acc": 0.03626, + "test_loss": 5.137158406066894, + "test_acc": 0.01, + "lyapunov": 1.6045118917894485, + "grad_norm": 1.2582953215287522, + "grad_max_sv": 0.7553236961364747, + "grad_min_sv": 2.073135719031505e-08, + "grad_condition": 222472203.43764964, + "lr": 0.0009972609476841367, + "time_sec": 86.93599653244019 + }, + { + "epoch": 6, + "train_loss": 4.404399389801025, + "train_acc": 0.03718, + "test_loss": 5.152426997375488, + "test_acc": 0.0145, + "lyapunov": 1.5948826068502557, + "grad_norm": 1.0525562897343101, + "grad_max_sv": 0.5827781304717063, + "grad_min_sv": 1.6368500771208466e-08, + "grad_condition": 975204505.0574242, + "lr": 0.000996057350657239, + "time_sec": 86.89734673500061 + }, + { + "epoch": 7, + "train_loss": 4.373200228271484, + "train_acc": 0.0427, + "test_loss": 5.138384069824219, + "test_acc": 0.01, + "lyapunov": 1.5917642296427656, + "grad_norm": 0.979719698336329, + "grad_max_sv": 0.5500100567936897, + "grad_min_sv": 1.578485221420678e-08, + "grad_condition": 40146995.15588243, + "lr": 0.000994636166481494, + "time_sec": 86.9030191898346 + }, + { + "epoch": 8, + "train_loss": 4.3614981033325195, + "train_acc": 0.04452, + "test_loss": 5.208292040252686, + "test_acc": 0.0158, + "lyapunov": 1.5925918241291095, + "grad_norm": 0.8254065825253598, + "grad_max_sv": 0.43389859050512314, + "grad_min_sv": 1.2995100632032242e-08, + "grad_condition": 93911652.28137563, + "lr": 0.0009929980185352525, + "time_sec": 86.902259349823 + }, + { + "epoch": 9, + "train_loss": 4.359973902893066, + "train_acc": 0.04506, + "test_loss": 4.722157088470459, + "test_acc": 0.018, + "lyapunov": 1.5934884682335817, + "grad_norm": 0.7465758222368373, + "grad_max_sv": 0.3876167729496956, + "grad_min_sv": 1.1805707171921865e-08, + "grad_condition": 96983113.34478703, + "lr": 0.0009911436253643444, + "time_sec": 86.9238531589508 + }, + { + "epoch": 10, + "train_loss": 4.4141249188232425, + "train_acc": 0.03536, + "test_loss": 5.436407916259766, + "test_acc": 0.01, + "lyapunov": 1.5828703861407307, + "grad_norm": 0.6206738544013151, + "grad_max_sv": 0.3251112919300795, + "grad_min_sv": 9.17487998804145e-09, + "grad_condition": 105514243.19237423, + "lr": 0.0009890738003669028, + "time_sec": 86.9449622631073 + }, + { + "epoch": 11, + "train_loss": 4.426171367950439, + "train_acc": 0.0344, + "test_loss": 4.693856712341309, + "test_acc": 0.0236, + "lyapunov": 1.5946678465894422, + "grad_norm": 0.5860438322533541, + "grad_max_sv": 0.2918587654829025, + "grad_min_sv": 6.5412758706696685e-09, + "grad_condition": 5280467761.157875, + "lr": 0.00098678945143658, + "time_sec": 86.91325283050537 + }, + { + "epoch": 12, + "train_loss": 4.3411827925109865, + "train_acc": 0.04538, + "test_loss": 5.247728338623046, + "test_acc": 0.0136, + "lyapunov": 1.5863848153282614, + "grad_norm": 0.5956948826941676, + "grad_max_sv": 0.2928905326873064, + "grad_min_sv": 8.411352403828177e-09, + "grad_condition": 128968920.19480267, + "lr": 0.0009842915805643154, + "time_sec": 86.90281319618225 + }, + { + "epoch": 13, + "train_loss": 4.339786265563965, + "train_acc": 0.04572, + "test_loss": 5.686103868103027, + "test_acc": 0.0125, + "lyapunov": 1.5810096681575336, + "grad_norm": 0.5604669884006932, + "grad_max_sv": 0.2611371923238039, + "grad_min_sv": 8.195694697898936e-09, + "grad_condition": 39688248.11524393, + "lr": 0.000981581283398829, + "time_sec": 86.90422630310059 + }, + { + "epoch": 14, + "train_loss": 4.35356285232544, + "train_acc": 0.04532, + "test_loss": 4.883278243255615, + "test_acc": 0.015, + "lyapunov": 1.579099393866556, + "grad_norm": 0.528427576292652, + "grad_max_sv": 0.2469606887549162, + "grad_min_sv": 7.61194059832604e-09, + "grad_condition": 168282434.76948723, + "lr": 0.0009786597487660333, + "time_sec": 86.88846230506897 + }, + { + "epoch": 15, + "train_loss": 4.3755184262084965, + "train_acc": 0.04264, + "test_loss": 6.138819856262207, + "test_acc": 0.0126, + "lyapunov": 1.6284648536721154, + "grad_norm": 0.5259167846709967, + "grad_max_sv": 0.25808656550943854, + "grad_min_sv": 7.094433302975989e-09, + "grad_condition": 78394577.54559764, + "lr": 0.0009755282581475766, + "time_sec": 86.88808155059814 + }, + { + "epoch": 16, + "train_loss": 4.3449753375244144, + "train_acc": 0.04422, + "test_loss": 4.874321587371826, + "test_acc": 0.0139, + "lyapunov": 1.592136370861317, + "grad_norm": 0.5849477114279426, + "grad_max_sv": 0.2871789067983627, + "grad_min_sv": 7.143974147904957e-09, + "grad_condition": 825777754.2283806, + "lr": 0.0009721881851187403, + "time_sec": 86.88666772842407 + }, + { + "epoch": 17, + "train_loss": 4.326568845520019, + "train_acc": 0.04702, + "test_loss": 4.870712732696533, + "test_acc": 0.0106, + "lyapunov": 1.579986076830598, + "grad_norm": 0.587479722542324, + "grad_max_sv": 0.2732066046446562, + "grad_min_sv": 6.707479306713086e-09, + "grad_condition": 933588154.4592457, + "lr": 0.0009686409947459456, + "time_sec": 86.94699215888977 + }, + { + "epoch": 18, + "train_loss": 4.290269263916016, + "train_acc": 0.04908, + "test_loss": 4.543920527648925, + "test_acc": 0.0184, + "lyapunov": 1.5655539648612138, + "grad_norm": 0.5190972278925252, + "grad_max_sv": 0.27400444857776163, + "grad_min_sv": 7.268163138354766e-09, + "grad_condition": 103768651.90634331, + "lr": 0.0009648882429441254, + "time_sec": 86.91610383987427 + }, + { + "epoch": 19, + "train_loss": 4.277731272888183, + "train_acc": 0.0529, + "test_loss": 4.523501123046875, + "test_acc": 0.0234, + "lyapunov": 1.5601860742129938, + "grad_norm": 0.5064673349074232, + "grad_max_sv": 0.26197145469486716, + "grad_min_sv": 7.129040378514584e-09, + "grad_condition": 89369620.75339693, + "lr": 0.00096093157579425, + "time_sec": 86.9239010810852 + }, + { + "epoch": 20, + "train_loss": 4.283599534912109, + "train_acc": 0.04918, + "test_loss": 4.699870119476318, + "test_acc": 0.01, + "lyapunov": 1.573568820343603, + "grad_norm": 0.4940062913988571, + "grad_max_sv": 0.24619702994823456, + "grad_min_sv": 6.7696058640709375e-09, + "grad_condition": 72620577.46255757, + "lr": 0.0009567727288213001, + "time_sec": 86.96331477165222 + }, + { + "epoch": 21, + "train_loss": 4.293489807434082, + "train_acc": 0.05038, + "test_loss": 4.714311406707764, + "test_acc": 0.0108, + "lyapunov": 1.5708344915638799, + "grad_norm": 0.545017777953754, + "grad_max_sv": 0.2541573029011488, + "grad_min_sv": 6.718018621953981e-09, + "grad_condition": 42979908.88210177, + "lr": 0.0009524135262330095, + "time_sec": 86.91739249229431 + }, + { + "epoch": 22, + "train_loss": 4.2768078778076175, + "train_acc": 0.0541, + "test_loss": 4.779728842163086, + "test_acc": 0.01, + "lyapunov": 1.5667131340412228, + "grad_norm": 0.5092105231068674, + "grad_max_sv": 0.27126444056630133, + "grad_min_sv": 7.1301694416769925e-09, + "grad_condition": 57355277.993238926, + "lr": 0.0009478558801197061, + "time_sec": 86.9019386768341 + }, + { + "epoch": 23, + "train_loss": 4.27697469543457, + "train_acc": 0.05122, + "test_loss": 4.672700902557373, + "test_acc": 0.01, + "lyapunov": 1.5615102702089587, + "grad_norm": 0.4784115114004879, + "grad_max_sv": 0.24027332551777364, + "grad_min_sv": 6.443715307516418e-09, + "grad_condition": 95371819.86060278, + "lr": 0.000943101789615607, + "time_sec": 86.91923117637634 + }, + { + "epoch": 24, + "train_loss": 4.278717909088135, + "train_acc": 0.05186, + "test_loss": 4.900936952209473, + "test_acc": 0.01, + "lyapunov": 1.5694453353467195, + "grad_norm": 0.4949771017584012, + "grad_max_sv": 0.24392427019774915, + "grad_min_sv": 6.253112343201916e-09, + "grad_condition": 49683498.32382451, + "lr": 0.0009381533400219313, + "time_sec": 86.95798850059509 + }, + { + "epoch": 25, + "train_loss": 4.284033089141846, + "train_acc": 0.0516, + "test_loss": 4.647933837890625, + "test_acc": 0.01, + "lyapunov": 1.610082578781011, + "grad_norm": 0.4618580067316832, + "grad_max_sv": 0.21940371356904506, + "grad_min_sv": 5.9646471067820174e-09, + "grad_condition": 44077507.34171269, + "lr": 0.0009330127018922189, + "time_sec": 86.92604160308838 + }, + { + "epoch": 26, + "train_loss": 4.27171460357666, + "train_acc": 0.0513, + "test_loss": 4.689661137390137, + "test_acc": 0.01, + "lyapunov": 1.5887331782704424, + "grad_norm": 0.45567402361835824, + "grad_max_sv": 0.20672011002898216, + "grad_min_sv": 5.767535921075151e-09, + "grad_condition": 44437336.12601619, + "lr": 0.000927682130080253, + "time_sec": 86.91289949417114 + }, + { + "epoch": 27, + "train_loss": 4.287545222320556, + "train_acc": 0.0503, + "test_loss": 4.6759644165039065, + "test_acc": 0.0105, + "lyapunov": 1.6080376479936682, + "grad_norm": 0.4608750254003879, + "grad_max_sv": 0.21028368686675095, + "grad_min_sv": 5.734315782138567e-09, + "grad_condition": 303277586.5403552, + "lr": 0.0009221639627510072, + "time_sec": 86.92653059959412 + }, + { + "epoch": 28, + "train_loss": 4.26929240020752, + "train_acc": 0.05308, + "test_loss": 4.89806633605957, + "test_acc": 0.011, + "lyapunov": 1.6118984780348171, + "grad_norm": 0.43418302492765676, + "grad_max_sv": 0.20326684638857842, + "grad_min_sv": 5.713833948692293e-09, + "grad_condition": 85779552.11325228, + "lr": 0.0009164606203550494, + "time_sec": 86.91330051422119 + }, + { + "epoch": 29, + "train_loss": 4.253239243469238, + "train_acc": 0.05616, + "test_loss": 4.924478411865234, + "test_acc": 0.01, + "lyapunov": 1.6098854767392055, + "grad_norm": 0.4850634248026458, + "grad_max_sv": 0.20474721789360045, + "grad_min_sv": 5.8581581326979866e-09, + "grad_condition": 912075238.28812, + "lr": 0.0009105746045668516, + "time_sec": 86.93636131286621 + }, + { + "epoch": 30, + "train_loss": 4.235443085327148, + "train_acc": 0.0606, + "test_loss": 5.510071346282959, + "test_acc": 0.01, + "lyapunov": 1.571061046532048, + "grad_norm": 0.45361919630223685, + "grad_max_sv": 0.2025857836008072, + "grad_min_sv": 5.868267084763179e-09, + "grad_condition": 42096450.95484826, + "lr": 0.0009045084971874733, + "time_sec": 86.9319851398468 + }, + { + "epoch": 31, + "train_loss": 4.231041951293945, + "train_acc": 0.05988, + "test_loss": 5.147942330932617, + "test_acc": 0.01, + "lyapunov": 1.5691828867968391, + "grad_norm": 0.432720376091447, + "grad_max_sv": 0.19395264871418477, + "grad_min_sv": 6.259870760638719e-09, + "grad_condition": 34343773.40740795, + "lr": 0.0008982649590120977, + "time_sec": 86.94789290428162 + }, + { + "epoch": 32, + "train_loss": 4.2413297773742675, + "train_acc": 0.0587, + "test_loss": 5.009992076873779, + "test_acc": 0.01, + "lyapunov": 1.5915203551807062, + "grad_norm": 0.4122171639918169, + "grad_max_sv": 0.182863287627697, + "grad_min_sv": 5.790357663650308e-09, + "grad_condition": 714325029.1851714, + "lr": 0.0008918467286629196, + "time_sec": 86.911212682724 + }, + { + "epoch": 33, + "train_loss": 4.2658996716308595, + "train_acc": 0.0542, + "test_loss": 5.127438952636719, + "test_acc": 0.0101, + "lyapunov": 1.579336861210406, + "grad_norm": 0.44521811591156923, + "grad_max_sv": 0.19066935162991286, + "grad_min_sv": 5.523765223003352e-09, + "grad_condition": 53898858.78718817, + "lr": 0.0008852566213878943, + "time_sec": 86.91553449630737 + }, + { + "epoch": 34, + "train_loss": 4.242719013824463, + "train_acc": 0.05736, + "test_loss": 5.307705741882324, + "test_acc": 0.01, + "lyapunov": 1.554588299273225, + "grad_norm": 0.40056388572882007, + "grad_max_sv": 0.19328901916742325, + "grad_min_sv": 5.563922629570062e-09, + "grad_condition": 45803958.546867594, + "lr": 0.000878497527825878, + "time_sec": 86.91433024406433 + }, + { + "epoch": 35, + "train_loss": 4.213116936340332, + "train_acc": 0.06228, + "test_loss": 5.048512329101563, + "test_acc": 0.01, + "lyapunov": 1.548424531126876, + "grad_norm": 0.40286521350806986, + "grad_max_sv": 0.18639697767794133, + "grad_min_sv": 5.634928314929288e-09, + "grad_condition": 47861656.46465705, + "lr": 0.000871572412738697, + "time_sec": 86.94499635696411 + }, + { + "epoch": 36, + "train_loss": 4.46321242477417, + "train_acc": 0.02644, + "test_loss": 7.976507986450195, + "test_acc": 0.01, + "lyapunov": 1.5736174876122828, + "grad_norm": 0.3688662413553731, + "grad_max_sv": 0.1843747731298208, + "grad_min_sv": 1.027042620136494e-09, + "grad_condition": 23392046595.39054, + "lr": 0.0008644843137107055, + "time_sec": 86.94508624076843 + }, + { + "epoch": 37, + "train_loss": 4.448079302368164, + "train_acc": 0.02678, + "test_loss": 5.779720497131348, + "test_acc": 0.01, + "lyapunov": 1.5641913728031052, + "grad_norm": 0.3319698693631811, + "grad_max_sv": 0.17876109518110753, + "grad_min_sv": 2.4601973283386735e-10, + "grad_condition": 23401419871.768867, + "lr": 0.0008572363398164014, + "time_sec": 86.95254611968994 + }, + { + "epoch": 38, + "train_loss": 4.4511954998779295, + "train_acc": 0.02752, + "test_loss": 9.1264736038208, + "test_acc": 0.01, + "lyapunov": 1.5642469356127102, + "grad_norm": 0.2986469281617768, + "grad_max_sv": 0.1681674152612686, + "grad_min_sv": 2.3341577206836764e-10, + "grad_condition": 26143404878.86806, + "lr": 0.0008498316702566826, + "time_sec": 87.00612330436707 + }, + { + "epoch": 39, + "train_loss": 4.4328032247924805, + "train_acc": 0.03036, + "test_loss": 10.002013760375977, + "test_acc": 0.01, + "lyapunov": 1.545380079532828, + "grad_norm": 0.31612252817270037, + "grad_max_sv": 0.17967074736952782, + "grad_min_sv": 1.3078811700331324e-09, + "grad_condition": 7630262604.515658, + "lr": 0.0008422735529643442, + "time_sec": 86.96651196479797 + }, + { + "epoch": 40, + "train_loss": 4.410691116485595, + "train_acc": 0.03262, + "test_loss": 10.329160571289062, + "test_acc": 0.01, + "lyapunov": 1.544363977963967, + "grad_norm": 0.3305250196532406, + "grad_max_sv": 0.18044610992074012, + "grad_min_sv": 2.8862289467267156e-09, + "grad_condition": 208503955.3202583, + "lr": 0.0008345653031794289, + "time_sec": 86.93889307975769 + }, + { + "epoch": 41, + "train_loss": 4.40241349319458, + "train_acc": 0.03342, + "test_loss": 7.508806234741211, + "test_acc": 0.01, + "lyapunov": 1.5479626981803523, + "grad_norm": 0.37593581599125797, + "grad_max_sv": 0.17868120335042476, + "grad_min_sv": 2.733827051543125e-09, + "grad_condition": 137280184.1727237, + "lr": 0.0008267103019950526, + "time_sec": 86.95495200157166 + }, + { + "epoch": 42, + "train_loss": 4.370949498138428, + "train_acc": 0.03828, + "test_loss": 6.459606773376465, + "test_acc": 0.01, + "lyapunov": 1.5444700297187357, + "grad_norm": 0.3619230318860018, + "grad_max_sv": 0.16240518875420093, + "grad_min_sv": 3.560387096604445e-09, + "grad_condition": 86248484.21915439, + "lr": 0.0008187119948743447, + "time_sec": 86.94808578491211 + }, + { + "epoch": 43, + "train_loss": 4.395889522705078, + "train_acc": 0.03416, + "test_loss": 7.4897293304443355, + "test_acc": 0.01, + "lyapunov": 1.5568798454216375, + "grad_norm": 0.3066578397068162, + "grad_max_sv": 0.15977313853800296, + "grad_min_sv": 2.1426118134706616e-09, + "grad_condition": 694043179.0150942, + "lr": 0.000810573890139155, + "time_sec": 86.97652959823608 + }, + { + "epoch": 44, + "train_loss": 4.395970639190674, + "train_acc": 0.0331, + "test_loss": 6.251794491577148, + "test_acc": 0.01, + "lyapunov": 1.5505369288842086, + "grad_norm": 0.3558862909608559, + "grad_max_sv": 0.15992271900177002, + "grad_min_sv": 2.2060850382588092e-09, + "grad_condition": 314610426.30490005, + "lr": 0.0008022995574311873, + "time_sec": 86.97155785560608 + }, + { + "epoch": 45, + "train_loss": 4.3631904621887205, + "train_acc": 0.03756, + "test_loss": 5.525508670043945, + "test_acc": 0.01, + "lyapunov": 1.5545306144772892, + "grad_norm": 0.3150905966342124, + "grad_max_sv": 0.15917456932365895, + "grad_min_sv": 2.917880549419688e-09, + "grad_condition": 172334946.43984643, + "lr": 0.0007938926261462363, + "time_sec": 86.95413851737976 + }, + { + "epoch": 46, + "train_loss": 4.385730860290527, + "train_acc": 0.03456, + "test_loss": 5.2734522521972655, + "test_acc": 0.01, + "lyapunov": 1.5768346917598755, + "grad_norm": 0.30280594802628175, + "grad_max_sv": 0.15774821415543555, + "grad_min_sv": 3.0362800302642657e-09, + "grad_condition": 276419213.49352396, + "lr": 0.0007853567838422158, + "time_sec": 86.9428277015686 + }, + { + "epoch": 47, + "train_loss": 4.421937339019776, + "train_acc": 0.03154, + "test_loss": 5.600688215637207, + "test_acc": 0.01, + "lyapunov": 1.5790051977957607, + "grad_norm": 0.33072277785528675, + "grad_max_sv": 0.16996506713330745, + "grad_min_sv": 2.771691926927583e-09, + "grad_condition": 320580453.11077607, + "lr": 0.0007766957746216719, + "time_sec": 86.92568945884705 + }, + { + "epoch": 48, + "train_loss": 4.417486723175049, + "train_acc": 0.0318, + "test_loss": 5.850329084014892, + "test_acc": 0.01, + "lyapunov": 1.5709409283859956, + "grad_norm": 0.3015658481608736, + "grad_max_sv": 0.16958414614200593, + "grad_min_sv": 2.117095306404743e-09, + "grad_condition": 1465805966.8142715, + "lr": 0.0007679133974894982, + "time_sec": 86.98221182823181 + }, + { + "epoch": 49, + "train_loss": 4.413777235107422, + "train_acc": 0.03204, + "test_loss": 5.770690809631348, + "test_acc": 0.01, + "lyapunov": 1.5579876326539022, + "grad_norm": 0.3480252425503119, + "grad_max_sv": 0.16178445334080607, + "grad_min_sv": 2.0201714462289255e-09, + "grad_condition": 2834174702.248597, + "lr": 0.000759013504686565, + "time_sec": 87.00604128837585 + }, + { + "epoch": 50, + "train_loss": 4.4205519735717775, + "train_acc": 0.0298, + "test_loss": 5.984611973571777, + "test_acc": 0.01, + "lyapunov": 1.5497863826239506, + "grad_norm": 0.2905045703519568, + "grad_max_sv": 0.15919520035386087, + "grad_min_sv": 9.888408669417747e-10, + "grad_condition": 5631365913.291557, + "lr": 0.0007499999999999998, + "time_sec": 86.96013498306274 + }, + { + "epoch": 51, + "train_loss": 4.41098743927002, + "train_acc": 0.0325, + "test_loss": 6.533537203979492, + "test_acc": 0.01, + "lyapunov": 1.555987215407974, + "grad_norm": 0.30379457449464103, + "grad_max_sv": 0.16679704934358597, + "grad_min_sv": 2.413719297654146e-09, + "grad_condition": 341047841.4947473, + "lr": 0.0007408768370508575, + "time_sec": 86.97173476219177 + }, + { + "epoch": 52, + "train_loss": 4.390000881347656, + "train_acc": 0.03462, + "test_loss": 5.217885815429687, + "test_acc": 0.01, + "lyapunov": 1.5600232867633594, + "grad_norm": 0.32784156163445544, + "grad_max_sv": 0.15694030448794366, + "grad_min_sv": 2.8198880390462035e-09, + "grad_condition": 111339990.40279654, + "lr": 0.0007316480175599307, + "time_sec": 86.9988853931427 + }, + { + "epoch": 53, + "train_loss": 4.288632299194336, + "train_acc": 0.04882, + "test_loss": 8.274944879150391, + "test_acc": 0.01, + "lyapunov": 1.565576893899142, + "grad_norm": 0.3486314610649234, + "grad_max_sv": 0.1506714668124914, + "grad_min_sv": 3.930395829632172e-09, + "grad_condition": 78544413.37347092, + "lr": 0.0007223175895924635, + "time_sec": 86.96367621421814 + }, + { + "epoch": 54, + "train_loss": 4.362063083496094, + "train_acc": 0.03894, + "test_loss": 5.243001276397705, + "test_acc": 0.01, + "lyapunov": 1.5714266458740624, + "grad_norm": 0.33670855500975183, + "grad_max_sv": 0.1638818845152855, + "grad_min_sv": 3.341216674862535e-09, + "grad_condition": 143330583.52604035, + "lr": 0.0007128896457825361, + "time_sec": 86.96970129013062 + }, + { + "epoch": 55, + "train_loss": 4.3985242970275875, + "train_acc": 0.0349, + "test_loss": 5.079080085754395, + "test_acc": 0.01, + "lyapunov": 1.557041028881317, + "grad_norm": 0.3110407590384958, + "grad_max_sv": 0.13654662668704987, + "grad_min_sv": 3.0798576551929748e-09, + "grad_condition": 90826613.18081078, + "lr": 0.0007033683215378998, + "time_sec": 86.96664762496948 + }, + { + "epoch": 56, + "train_loss": 4.3555380534362795, + "train_acc": 0.03972, + "test_loss": 5.452935369873047, + "test_acc": 0.01, + "lyapunov": 1.560518858987657, + "grad_norm": 0.31258330150396313, + "grad_max_sv": 0.15348581783473492, + "grad_min_sv": 3.6443401876112836e-09, + "grad_condition": 63305882.37131055, + "lr": 0.0006937577932260512, + "time_sec": 87.06724190711975 + }, + { + "epoch": 57, + "train_loss": 4.381474671783447, + "train_acc": 0.03686, + "test_loss": 7.36265283203125, + "test_acc": 0.01, + "lyapunov": 1.5697053960522118, + "grad_norm": 0.3865664941898656, + "grad_max_sv": 0.15512134719174356, + "grad_min_sv": 3.3817354081872146e-09, + "grad_condition": 457011679.7340926, + "lr": 0.0006840622763423388, + "time_sec": 87.06652784347534 + }, + { + "epoch": 58, + "train_loss": 4.403821620025635, + "train_acc": 0.03228, + "test_loss": 8.040378480529785, + "test_acc": 0.01, + "lyapunov": 1.5559333075038002, + "grad_norm": 0.29135723667857816, + "grad_max_sv": 0.16249749660491944, + "grad_min_sv": 2.647806284818144e-09, + "grad_condition": 607788328.9678621, + "lr": 0.0006742860236609073, + "time_sec": 87.00199866294861 + }, + { + "epoch": 59, + "train_loss": 4.402755667114258, + "train_acc": 0.0333, + "test_loss": 8.325734463500977, + "test_acc": 0.01, + "lyapunov": 1.5946810336978845, + "grad_norm": 0.31029489050735465, + "grad_max_sv": 0.15088103022426366, + "grad_min_sv": 2.4962215631335606e-09, + "grad_condition": 846951781.3818216, + "lr": 0.0006644333233692913, + "time_sec": 86.94004797935486 + }, + { + "epoch": 60, + "train_loss": 4.4194785871887206, + "train_acc": 0.02986, + "test_loss": 9.861287240600586, + "test_acc": 0.01, + "lyapunov": 1.5665948046442797, + "grad_norm": 0.2681308492085899, + "grad_max_sv": 0.13850090205669402, + "grad_min_sv": 5.255404293767318e-10, + "grad_condition": 4977286898.088277, + "lr": 0.0006545084971874734, + "time_sec": 86.9956967830658 + }, + { + "epoch": 61, + "train_loss": 4.416754204711914, + "train_acc": 0.03102, + "test_loss": 6.132235699462891, + "test_acc": 0.01, + "lyapunov": 1.5757032172454288, + "grad_norm": 0.30003715480279103, + "grad_max_sv": 0.13602122720330953, + "grad_min_sv": 8.228586455857377e-10, + "grad_condition": 13175326162.721104, + "lr": 0.0006445158984722354, + "time_sec": 86.99738907814026 + }, + { + "epoch": 62, + "train_loss": 4.400070931243897, + "train_acc": 0.03248, + "test_loss": 6.946181610870362, + "test_acc": 0.01, + "lyapunov": 1.5760818457664432, + "grad_norm": 0.2705000538096509, + "grad_max_sv": 0.1345938090234995, + "grad_min_sv": 6.920980580521832e-10, + "grad_condition": 1943244549.4253707, + "lr": 0.0006344599103076324, + "time_sec": 87.10566878318787 + }, + { + "epoch": 63, + "train_loss": 4.397411993865966, + "train_acc": 0.03356, + "test_loss": 6.4025613311767575, + "test_acc": 0.01, + "lyapunov": 1.5691703021373895, + "grad_norm": 0.295770706108135, + "grad_max_sv": 0.13735821805894374, + "grad_min_sv": 6.700764958362821e-10, + "grad_condition": 4282192212.8114214, + "lr": 0.0006243449435824269, + "time_sec": 87.11572027206421 + }, + { + "epoch": 64, + "train_loss": 4.411172714538575, + "train_acc": 0.03268, + "test_loss": 6.260893269348145, + "test_acc": 0.01, + "lyapunov": 1.5818147948940697, + "grad_norm": 0.3079314625857066, + "grad_max_sv": 0.12949498016387223, + "grad_min_sv": 1.4190367893734219e-10, + "grad_condition": 12329273937.565323, + "lr": 0.0006141754350553275, + "time_sec": 86.98852014541626 + }, + { + "epoch": 65, + "train_loss": 4.395129007568359, + "train_acc": 0.03392, + "test_loss": 6.5868188064575195, + "test_acc": 0.01, + "lyapunov": 1.5632798476597232, + "grad_norm": 0.25782867400033804, + "grad_max_sv": 0.12777244430035353, + "grad_min_sv": 2.976579219378644e-10, + "grad_condition": 5942895423.124485, + "lr": 0.0006039558454088793, + "time_sec": 87.11568331718445 + }, + { + "epoch": 66, + "train_loss": 4.406106295013427, + "train_acc": 0.0315, + "test_loss": 6.073413898468018, + "test_acc": 0.01, + "lyapunov": 1.576541522884613, + "grad_norm": 0.30947554951534784, + "grad_max_sv": 0.1285885890945792, + "grad_min_sv": 5.432121253815892e-10, + "grad_condition": 6217167701.43366, + "lr": 0.000593690657292862, + "time_sec": 87.17264008522034 + }, + { + "epoch": 67, + "train_loss": 4.393605449829102, + "train_acc": 0.03414, + "test_loss": 6.305842741394043, + "test_acc": 0.01, + "lyapunov": 1.5533494059082187, + "grad_norm": 0.25961319227506663, + "grad_max_sv": 0.12907455265522003, + "grad_min_sv": 1.6513973369542203e-09, + "grad_condition": 1871563855.9625301, + "lr": 0.0005833843733580507, + "time_sec": 87.04546856880188 + }, + { + "epoch": 68, + "train_loss": 4.397481441650391, + "train_acc": 0.03526, + "test_loss": 9.038330000305177, + "test_acc": 0.01, + "lyapunov": 1.5915909249459386, + "grad_norm": 0.3105737189018771, + "grad_max_sv": 0.1272705690935254, + "grad_min_sv": 1.1124955923331755e-09, + "grad_condition": 6291710890.600344, + "lr": 0.0005730415142812054, + "time_sec": 87.03171014785767 + }, + { + "epoch": 69, + "train_loss": 4.432055924072266, + "train_acc": 0.02954, + "test_loss": 6.220795520019531, + "test_acc": 0.01, + "lyapunov": 1.606788797756595, + "grad_norm": 0.2965672457851634, + "grad_max_sv": 0.11880129799246789, + "grad_min_sv": 5.90287951778381e-11, + "grad_condition": 15582797170.964344, + "lr": 0.0005626666167821517, + "time_sec": 87.01269674301147 + }, + { + "epoch": 70, + "train_loss": 4.433936797943115, + "train_acc": 0.02888, + "test_loss": 6.659252740478515, + "test_acc": 0.01, + "lyapunov": 1.5713767874271363, + "grad_norm": 0.23364690554453782, + "grad_max_sv": 0.11591648273169994, + "grad_min_sv": 1.5320265177461676e-10, + "grad_condition": 17166771390.34465, + "lr": 0.0005522642316338265, + "time_sec": 87.01791882514954 + }, + { + "epoch": 71, + "train_loss": 4.438748676300049, + "train_acc": 0.02874, + "test_loss": 6.609808558654785, + "test_acc": 0.01, + "lyapunov": 1.584676984021121, + "grad_norm": 0.2633441624923964, + "grad_max_sv": 0.11810853406786918, + "grad_min_sv": 1.1007920121830777e-10, + "grad_condition": 12701526680.721195, + "lr": 0.0005418389216661573, + "time_sec": 86.99067282676697 + }, + { + "epoch": 72, + "train_loss": 4.428876764984131, + "train_acc": 0.029, + "test_loss": 7.024348274230957, + "test_acc": 0.01, + "lyapunov": 1.5694371559430875, + "grad_norm": 0.2586705276163511, + "grad_max_sv": 0.11742300663609058, + "grad_min_sv": 4.3393096759821404e-11, + "grad_condition": 17654480120.057854, + "lr": 0.0005313952597646563, + "time_sec": 86.99662733078003 + }, + { + "epoch": 73, + "train_loss": 4.406545689849853, + "train_acc": 0.033, + "test_loss": 5.295959346008301, + "test_acc": 0.01, + "lyapunov": 1.598822437283938, + "grad_norm": 0.48160257702896175, + "grad_max_sv": 0.12682502008974553, + "grad_min_sv": 1.6137241577078923e-09, + "grad_condition": 1098514733.1527858, + "lr": 0.0005209378268645994, + "time_sec": 86.98713731765747 + }, + { + "epoch": 74, + "train_loss": 4.371206529998779, + "train_acc": 0.03752, + "test_loss": 6.3423968727111815, + "test_acc": 0.01, + "lyapunov": 1.5900212995841374, + "grad_norm": 0.2599656462367281, + "grad_max_sv": 0.11894330121576786, + "grad_min_sv": 2.0068056321743966e-09, + "grad_condition": 322985873.66543674, + "lr": 0.0005104712099416781, + "time_sec": 87.01381850242615 + }, + { + "epoch": 75, + "train_loss": 4.4355110260009765, + "train_acc": 0.03008, + "test_loss": 6.5740388412475586, + "test_acc": 0.01, + "lyapunov": 1.5995566000414017, + "grad_norm": 0.46971014639594094, + "grad_max_sv": 0.11837511248886586, + "grad_min_sv": 9.224606550920768e-10, + "grad_condition": 5756377475.535638, + "lr": 0.0004999999999999996, + "time_sec": 86.98455214500427 + }, + { + "epoch": 76, + "train_loss": 4.386026970672607, + "train_acc": 0.03692, + "test_loss": 7.027304895019531, + "test_acc": 0.01, + "lyapunov": 1.5754540259271022, + "grad_norm": 0.26903612071874217, + "grad_max_sv": 0.11812076661735774, + "grad_min_sv": 2.299920467269123e-09, + "grad_condition": 91850509.00722608, + "lr": 0.0004895287900583212, + "time_sec": 86.98026323318481 + }, + { + "epoch": 77, + "train_loss": 4.393477527923584, + "train_acc": 0.03412, + "test_loss": 6.660316326904297, + "test_acc": 0.01, + "lyapunov": 1.5862211976819636, + "grad_norm": 0.3013890397473114, + "grad_max_sv": 0.1351075556129217, + "grad_min_sv": 2.3924681109713588e-09, + "grad_condition": 445706368.4192219, + "lr": 0.0004790621731353997, + "time_sec": 86.97005081176758 + }, + { + "epoch": 78, + "train_loss": 4.546225792083741, + "train_acc": 0.0251, + "test_loss": 5.343878612518311, + "test_acc": 0.01, + "lyapunov": 1.5964782609963966, + "grad_norm": 0.90282337732271, + "grad_max_sv": 0.20608680080622435, + "grad_min_sv": 2.659187132906355e-09, + "grad_condition": 7860910669.836441, + "lr": 0.000468604740235343, + "time_sec": 86.96122479438782 + }, + { + "epoch": 79, + "train_loss": 4.357597355346679, + "train_acc": 0.04282, + "test_loss": 8.47580428466797, + "test_acc": 0.01, + "lyapunov": 1.6247231682853016, + "grad_norm": 0.3014093640980023, + "grad_max_sv": 0.13778700064867735, + "grad_min_sv": 3.3349062959070475e-09, + "grad_condition": 113414547.08337688, + "lr": 0.00045816107833384175, + "time_sec": 86.99122476577759 + }, + { + "epoch": 80, + "train_loss": 4.353704885253906, + "train_acc": 0.04112, + "test_loss": 7.1475914855957035, + "test_acc": 0.01, + "lyapunov": 1.646431783581024, + "grad_norm": 0.2930066807721922, + "grad_max_sv": 0.14062532242387532, + "grad_min_sv": 3.158852413670532e-09, + "grad_condition": 56459529.26701255, + "lr": 0.0004477357683661729, + "time_sec": 86.95756244659424 + }, + { + "epoch": 81, + "train_loss": 4.300996598510742, + "train_acc": 0.0489, + "test_loss": 5.905246903991699, + "test_acc": 0.01, + "lyapunov": 1.5976380972606141, + "grad_norm": 0.3041834155807877, + "grad_max_sv": 0.14135726243257524, + "grad_min_sv": 3.5767058866736924e-09, + "grad_condition": 57327864.423104, + "lr": 0.00043733338321784746, + "time_sec": 86.97077941894531 + }, + { + "epoch": 82, + "train_loss": 4.3091406649780275, + "train_acc": 0.04946, + "test_loss": 7.282952543640136, + "test_acc": 0.01, + "lyapunov": 1.6646705594514033, + "grad_norm": 0.32878525949020004, + "grad_max_sv": 0.1341265318915248, + "grad_min_sv": 3.612622626048001e-09, + "grad_condition": 55658705.11435084, + "lr": 0.0004269584857187939, + "time_sec": 86.95407176017761 + }, + { + "epoch": 83, + "train_loss": 4.3103489337158205, + "train_acc": 0.0477, + "test_loss": 6.477012939453125, + "test_acc": 0.01, + "lyapunov": 1.6391792172361213, + "grad_norm": 0.2962764376330481, + "grad_max_sv": 0.13159138858318328, + "grad_min_sv": 3.4047045499975907e-09, + "grad_condition": 518340281.28618824, + "lr": 0.0004166156266419484, + "time_sec": 86.94712162017822 + }, + { + "epoch": 84, + "train_loss": 4.36897839553833, + "train_acc": 0.03928, + "test_loss": 7.850455484008789, + "test_acc": 0.01, + "lyapunov": 1.6661204986864953, + "grad_norm": 0.28424512363766397, + "grad_max_sv": 0.13404478561133146, + "grad_min_sv": 3.010059496851036e-09, + "grad_condition": 3110503073.168424, + "lr": 0.0004063093427071373, + "time_sec": 86.97210931777954 + }, + { + "epoch": 85, + "train_loss": 4.437010177459717, + "train_acc": 0.03262, + "test_loss": 9.851054901123048, + "test_acc": 0.01, + "lyapunov": 1.8142987602507061, + "grad_norm": 0.2956023765215779, + "grad_max_sv": 0.1340159485116601, + "grad_min_sv": 1.7363556922736066e-09, + "grad_condition": 1531015855.923596, + "lr": 0.0003960441545911199, + "time_sec": 86.96314144134521 + }, + { + "epoch": 86, + "train_loss": 4.416305867919922, + "train_acc": 0.03328, + "test_loss": 8.345118670654298, + "test_acc": 0.01, + "lyapunov": 1.6857655969117304, + "grad_norm": 0.36818360732987215, + "grad_max_sv": 0.1309028506744653, + "grad_min_sv": 1.6532958094842372e-09, + "grad_condition": 3316626722.3164024, + "lr": 0.0003858245649446718, + "time_sec": 86.98166847229004 + }, + { + "epoch": 87, + "train_loss": 4.4015829487609865, + "train_acc": 0.03524, + "test_loss": 12.013820776367188, + "test_acc": 0.01, + "lyapunov": 1.7373071418089026, + "grad_norm": 0.2760253519467448, + "grad_max_sv": 0.1359336195513606, + "grad_min_sv": 2.3007044532528943e-09, + "grad_condition": 346456514.74827063, + "lr": 0.00037565505641757235, + "time_sec": 86.93886590003967 + }, + { + "epoch": 88, + "train_loss": 4.4740436238098145, + "train_acc": 0.0295, + "test_loss": 6.990837461853027, + "test_acc": 0.01, + "lyapunov": 1.6694230228433828, + "grad_norm": 0.43177687387451896, + "grad_max_sv": 0.18005888294428588, + "grad_min_sv": 2.4754363480046505e-09, + "grad_condition": 195635928.7701267, + "lr": 0.00036554008969236695, + "time_sec": 86.95178961753845 + }, + { + "epoch": 89, + "train_loss": 4.411496069488526, + "train_acc": 0.03514, + "test_loss": 11.70218861694336, + "test_acc": 0.01, + "lyapunov": 1.7507646498472795, + "grad_norm": 0.31033816746007103, + "grad_max_sv": 0.14542356096208095, + "grad_min_sv": 2.638068418488876e-09, + "grad_condition": 139957124.11622453, + "lr": 0.0003554841015277638, + "time_sec": 86.93717288970947 + }, + { + "epoch": 90, + "train_loss": 4.404713847961426, + "train_acc": 0.03648, + "test_loss": 9.9756316696167, + "test_acc": 0.01, + "lyapunov": 1.807755483995618, + "grad_norm": 0.35906280668802704, + "grad_max_sv": 0.1372342212125659, + "grad_min_sv": 2.7565777874737076e-09, + "grad_condition": 675780697.8457712, + "lr": 0.000345491502812526, + "time_sec": 86.93306636810303 + }, + { + "epoch": 91, + "train_loss": 4.408483022918701, + "train_acc": 0.0368, + "test_loss": 7.146534729003906, + "test_acc": 0.01, + "lyapunov": 1.801394305570656, + "grad_norm": 0.3109524713855987, + "grad_max_sv": 0.13791952189058065, + "grad_min_sv": 2.771594766713681e-09, + "grad_condition": 92088285.24973363, + "lr": 0.0003355666766307081, + "time_sec": 87.15299654006958 + }, + { + "epoch": 92, + "train_loss": 4.409290451202392, + "train_acc": 0.03586, + "test_loss": 14.403669937133788, + "test_acc": 0.01, + "lyapunov": 1.7155236371642792, + "grad_norm": 0.4463202756830642, + "grad_max_sv": 0.1406608471646905, + "grad_min_sv": 2.481988065313384e-09, + "grad_condition": 2274242135.598548, + "lr": 0.00032571397633909225, + "time_sec": 86.9645299911499 + }, + { + "epoch": 93, + "train_loss": 4.38183258102417, + "train_acc": 0.03594, + "test_loss": 14.732258331298828, + "test_acc": 0.01, + "lyapunov": 1.642303287525616, + "grad_norm": 0.28509807189744846, + "grad_max_sv": 0.14340070001780986, + "grad_min_sv": 2.788214630510509e-09, + "grad_condition": 661394156.996754, + "lr": 0.00031593772365766094, + "time_sec": 86.95910167694092 + }, + { + "epoch": 94, + "train_loss": 4.385672190704346, + "train_acc": 0.03708, + "test_loss": 14.926625048828125, + "test_acc": 0.01, + "lyapunov": 1.6731561519910612, + "grad_norm": 0.3134461909653867, + "grad_max_sv": 0.13709199130535127, + "grad_min_sv": 2.8174823593109245e-09, + "grad_condition": 118734750.50598077, + "lr": 0.0003062422067739483, + "time_sec": 86.92044115066528 + }, + { + "epoch": 95, + "train_loss": 4.3819806816101075, + "train_acc": 0.03738, + "test_loss": 11.074764614868164, + "test_acc": 0.01, + "lyapunov": 1.7133415379487644, + "grad_norm": 0.33153421078042083, + "grad_max_sv": 0.1331325426697731, + "grad_min_sv": 2.8642708720452715e-09, + "grad_condition": 165102808.59407786, + "lr": 0.00029663167846209965, + "time_sec": 86.93906211853027 + }, + { + "epoch": 96, + "train_loss": 4.404074432220459, + "train_acc": 0.03724, + "test_loss": 10.12900542602539, + "test_acc": 0.01, + "lyapunov": 1.7632283039410095, + "grad_norm": 0.3911637522793098, + "grad_max_sv": 0.12627853509038686, + "grad_min_sv": 2.4115265688864905e-09, + "grad_condition": 541677422.6672779, + "lr": 0.00028711035421746345, + "time_sec": 86.93936419487 + }, + { + "epoch": 97, + "train_loss": 4.451261331481934, + "train_acc": 0.0326, + "test_loss": 5.3055485847473145, + "test_acc": 0.01, + "lyapunov": 1.8559754114321736, + "grad_norm": 0.5079628716235006, + "grad_max_sv": 0.12650683380197733, + "grad_min_sv": 1.8654332285903626e-09, + "grad_condition": 10465021306.197956, + "lr": 0.00027768241040753615, + "time_sec": 86.9362096786499 + }, + { + "epoch": 98, + "train_loss": 4.457196118621826, + "train_acc": 0.03388, + "test_loss": 5.874557138061523, + "test_acc": 0.01, + "lyapunov": 1.8899869574305346, + "grad_norm": 0.40869012587460146, + "grad_max_sv": 0.136830860003829, + "grad_min_sv": 2.1947758774298626e-09, + "grad_condition": 2135302003.3466086, + "lr": 0.00026835198244006903, + "time_sec": 86.93851733207703 + }, + { + "epoch": 99, + "train_loss": 4.461137276153565, + "train_acc": 0.03376, + "test_loss": 7.712980445861817, + "test_acc": 0.01, + "lyapunov": 1.9207234422264197, + "grad_norm": 0.44593651641010523, + "grad_max_sv": 0.154570347443223, + "grad_min_sv": 2.743885928125303e-09, + "grad_condition": 11426608589.300367, + "lr": 0.0002591231629491421, + "time_sec": 86.93646287918091 + }, + { + "epoch": 100, + "train_loss": 4.4880205709838865, + "train_acc": 0.0309, + "test_loss": 4.7405736495971675, + "test_acc": 0.01, + "lyapunov": 1.9402269292670442, + "grad_norm": 0.5314169008984867, + "grad_max_sv": 0.17140868678689003, + "grad_min_sv": 2.9702306628132115e-09, + "grad_condition": 68768483.18390863, + "lr": 0.0002499999999999997, + "time_sec": 86.96372699737549 + }, + { + "epoch": 101, + "train_loss": 4.516919324493408, + "train_acc": 0.02856, + "test_loss": 4.631107287597656, + "test_acc": 0.01, + "lyapunov": 1.8684387063736196, + "grad_norm": 0.40457693704891007, + "grad_max_sv": 0.17230616863816978, + "grad_min_sv": 3.0731200580808025e-09, + "grad_condition": 123538009.91902074, + "lr": 0.00024098649531343477, + "time_sec": 86.94155859947205 + }, + { + "epoch": 102, + "train_loss": 4.4609598399353025, + "train_acc": 0.03628, + "test_loss": 4.7487232215881345, + "test_acc": 0.01, + "lyapunov": 1.9666810218635422, + "grad_norm": 1.4354338025926532, + "grad_max_sv": 0.1278171473182738, + "grad_min_sv": 2.1240830764037368e-09, + "grad_condition": 9763663835.33721, + "lr": 0.0002320866025105016, + "time_sec": 86.95742726325989 + }, + { + "epoch": 103, + "train_loss": 4.386784707641602, + "train_acc": 0.04782, + "test_loss": 4.745209142303467, + "test_acc": 0.01, + "lyapunov": 2.016990929918216, + "grad_norm": 0.7337516988127725, + "grad_max_sv": 0.13401773255318403, + "grad_min_sv": 3.1091931931848117e-09, + "grad_condition": 60104344.68401686, + "lr": 0.0002233042253783278, + "time_sec": 86.95129346847534 + }, + { + "epoch": 104, + "train_loss": 4.375011655273438, + "train_acc": 0.04672, + "test_loss": 4.693084164428711, + "test_acc": 0.01, + "lyapunov": 1.9775711432137453, + "grad_norm": 1.0479430580386422, + "grad_max_sv": 0.12959324829280378, + "grad_min_sv": 3.1502246932574305e-09, + "grad_condition": 77237986.61774956, + "lr": 0.000214643216157784, + "time_sec": 86.95826411247253 + }, + { + "epoch": 105, + "train_loss": 4.405172659912109, + "train_acc": 0.04668, + "test_loss": 4.741758982849121, + "test_acc": 0.01, + "lyapunov": 2.0328768131982944, + "grad_norm": 0.4687797625820131, + "grad_max_sv": 0.12328344490379095, + "grad_min_sv": 3.1737769629405777e-09, + "grad_condition": 85772134.99380484, + "lr": 0.00020610737385376332, + "time_sec": 86.93880844116211 + }, + { + "epoch": 106, + "train_loss": 4.356244638671875, + "train_acc": 0.04978, + "test_loss": 4.669058666992187, + "test_acc": 0.01, + "lyapunov": 1.8990197315850221, + "grad_norm": 0.4676609605386515, + "grad_max_sv": 0.13252175226807594, + "grad_min_sv": 3.525467490855805e-09, + "grad_condition": 52596210.13089059, + "lr": 0.00019770044256881242, + "time_sec": 86.96025395393372 + }, + { + "epoch": 107, + "train_loss": 4.388246943969727, + "train_acc": 0.04924, + "test_loss": 4.68506374206543, + "test_acc": 0.01, + "lyapunov": 1.9624325927261197, + "grad_norm": 0.4545225835797128, + "grad_max_sv": 0.13236304577440022, + "grad_min_sv": 3.35203632160358e-09, + "grad_condition": 105742345.63281551, + "lr": 0.0001894261098608447, + "time_sec": 86.91460108757019 + }, + { + "epoch": 108, + "train_loss": 4.3695238963317875, + "train_acc": 0.0483, + "test_loss": 4.651059510803223, + "test_acc": 0.01, + "lyapunov": 1.9490872517876003, + "grad_norm": 0.3584506383494584, + "grad_max_sv": 0.13239602297544478, + "grad_min_sv": 3.544706423871946e-09, + "grad_condition": 66536799.35327874, + "lr": 0.000181288005125655, + "time_sec": 86.93394088745117 + }, + { + "epoch": 109, + "train_loss": 4.394715529022217, + "train_acc": 0.04782, + "test_loss": 4.621646475219727, + "test_acc": 0.01, + "lyapunov": 2.0419393695528854, + "grad_norm": 0.4760680798020925, + "grad_max_sv": 0.12705831751227378, + "grad_min_sv": 3.4668329873532855e-09, + "grad_condition": 42335589.552427046, + "lr": 0.0001732896980049473, + "time_sec": 86.94732666015625 + }, + { + "epoch": 110, + "train_loss": 4.396159273681641, + "train_acc": 0.04692, + "test_loss": 4.635798811340332, + "test_acc": 0.01, + "lyapunov": 1.9756651958236304, + "grad_norm": 0.5216765889891325, + "grad_max_sv": 0.1416484847664833, + "grad_min_sv": 3.2233721108509276e-09, + "grad_condition": 671403726.1537082, + "lr": 0.00016543469682057076, + "time_sec": 86.9427604675293 + }, + { + "epoch": 111, + "train_loss": 4.381094040985108, + "train_acc": 0.04852, + "test_loss": 4.627859112548828, + "test_acc": 0.01, + "lyapunov": 1.9908651262902848, + "grad_norm": 0.45725032205485455, + "grad_max_sv": 0.1261982116382569, + "grad_min_sv": 3.3899231258877062e-09, + "grad_condition": 95101801.02691573, + "lr": 0.00015772644703565552, + "time_sec": 86.96308636665344 + }, + { + "epoch": 112, + "train_loss": 4.365775197753906, + "train_acc": 0.04556, + "test_loss": 4.630611195373535, + "test_acc": 0.01, + "lyapunov": 1.7899589819066666, + "grad_norm": 0.327253288333232, + "grad_max_sv": 0.12595976889133453, + "grad_min_sv": 3.5455886261692714e-09, + "grad_condition": 83078444.71479167, + "lr": 0.00015016832974331713, + "time_sec": 86.92891812324524 + }, + { + "epoch": 113, + "train_loss": 4.326185424499512, + "train_acc": 0.04906, + "test_loss": 4.624507279968261, + "test_acc": 0.01, + "lyapunov": 1.743294736308515, + "grad_norm": 0.30709867178590255, + "grad_max_sv": 0.12423296440392732, + "grad_min_sv": 3.5773004710814434e-09, + "grad_condition": 294726116.3341021, + "lr": 0.00014276366018359834, + "time_sec": 86.93962240219116 + }, + { + "epoch": 114, + "train_loss": 4.36080623336792, + "train_acc": 0.04476, + "test_loss": 4.638040520477295, + "test_acc": 0.01, + "lyapunov": 1.7487388175466787, + "grad_norm": 0.2896504251843997, + "grad_max_sv": 0.12205407582223415, + "grad_min_sv": 3.2766004282210047e-09, + "grad_condition": 256392136.90108904, + "lr": 0.00013551568628929425, + "time_sec": 86.93535208702087 + }, + { + "epoch": 115, + "train_loss": 4.368169149475098, + "train_acc": 0.0457, + "test_loss": 4.695854078674317, + "test_acc": 0.01, + "lyapunov": 1.7834696016653115, + "grad_norm": 0.292592900967331, + "grad_max_sv": 0.11619443818926811, + "grad_min_sv": 3.1756336950887087e-09, + "grad_condition": 1621784198.0725887, + "lr": 0.00012842758726130276, + "time_sec": 86.98673295974731 + }, + { + "epoch": 116, + "train_loss": 4.387150159606934, + "train_acc": 0.04296, + "test_loss": 4.669398309326172, + "test_acc": 0.01, + "lyapunov": 1.90544245035752, + "grad_norm": 0.3736850472793119, + "grad_max_sv": 0.11484571509063243, + "grad_min_sv": 3.1586906028280294e-09, + "grad_condition": 96176772.93288267, + "lr": 0.0001215024721741218, + "time_sec": 86.95901346206665 + }, + { + "epoch": 117, + "train_loss": 4.474187949371338, + "train_acc": 0.04052, + "test_loss": 4.7027623680114745, + "test_acc": 0.01, + "lyapunov": 2.13019656860615, + "grad_norm": 0.4706454049323369, + "grad_max_sv": 0.15399074126034976, + "grad_min_sv": 3.3639367810409104e-09, + "grad_condition": 148375942.6842225, + "lr": 0.00011474337861210538, + "time_sec": 86.95926237106323 + }, + { + "epoch": 118, + "train_loss": 4.414019877319336, + "train_acc": 0.04538, + "test_loss": 4.650316640472412, + "test_acc": 0.01, + "lyapunov": 2.0560264450204953, + "grad_norm": 0.42333097819604315, + "grad_max_sv": 0.11436628978699445, + "grad_min_sv": 3.070071629500382e-09, + "grad_condition": 1871812696.3982494, + "lr": 0.00010815327133708009, + "time_sec": 86.95543646812439 + }, + { + "epoch": 119, + "train_loss": 4.386474652862549, + "train_acc": 0.04654, + "test_loss": 4.6715775375366215, + "test_acc": 0.01, + "lyapunov": 1.969224628889957, + "grad_norm": 0.47947570620147545, + "grad_max_sv": 0.1272017750889063, + "grad_min_sv": 3.3292521794958674e-09, + "grad_condition": 61497599.9453614, + "lr": 0.00010173504098790182, + "time_sec": 86.94949531555176 + }, + { + "epoch": 120, + "train_loss": 4.384591791992188, + "train_acc": 0.04658, + "test_loss": 4.632473320007324, + "test_acc": 0.0077, + "lyapunov": 1.9927328724385527, + "grad_norm": 0.5289661566724388, + "grad_max_sv": 0.1261268701404333, + "grad_min_sv": 3.4284845490395456e-09, + "grad_condition": 48538207.83291945, + "lr": 9.549150281252629e-05, + "time_sec": 86.94581913948059 + }, + { + "epoch": 121, + "train_loss": 4.385587129669189, + "train_acc": 0.04774, + "test_loss": 4.632090152740479, + "test_acc": 0.01, + "lyapunov": 2.0432661521770155, + "grad_norm": 0.4859111606482192, + "grad_max_sv": 0.11864052936434746, + "grad_min_sv": 3.4766741936753665e-09, + "grad_condition": 60808462.870111085, + "lr": 8.942539543314794e-05, + "time_sec": 86.94836401939392 + }, + { + "epoch": 122, + "train_loss": 4.37459453338623, + "train_acc": 0.05042, + "test_loss": 4.624907290649414, + "test_acc": 0.01, + "lyapunov": 2.0131407037110587, + "grad_norm": 0.4855933253122246, + "grad_max_sv": 0.11917878109961748, + "grad_min_sv": 3.5260590100505416e-09, + "grad_condition": 40236226.2868594, + "lr": 8.353937964495024e-05, + "time_sec": 86.96557188034058 + }, + { + "epoch": 123, + "train_loss": 4.384435540771484, + "train_acc": 0.04966, + "test_loss": 4.6222803535461425, + "test_acc": 0.01, + "lyapunov": 2.056239744891291, + "grad_norm": 0.4869249888343625, + "grad_max_sv": 0.13170703500509262, + "grad_min_sv": 3.4749707009465447e-09, + "grad_condition": 81569926.69224386, + "lr": 7.783603724899243e-05, + "time_sec": 86.94557666778564 + }, + { + "epoch": 124, + "train_loss": 4.411828415222168, + "train_acc": 0.04734, + "test_loss": 4.617088554382324, + "test_acc": 0.01, + "lyapunov": 2.088481501850021, + "grad_norm": 0.6074321406428054, + "grad_max_sv": 0.13408620320260525, + "grad_min_sv": 3.669820186798234e-09, + "grad_condition": 89563715.17480934, + "lr": 7.231786991974666e-05, + "time_sec": 86.94801068305969 + }, + { + "epoch": 125, + "train_loss": 4.379881989440918, + "train_acc": 0.04928, + "test_loss": 4.626477690124512, + "test_acc": 0.01, + "lyapunov": 2.0224476098404516, + "grad_norm": 0.5566340932563276, + "grad_max_sv": 0.11598262693732977, + "grad_min_sv": 3.3913336450717977e-09, + "grad_condition": 154440174.8024956, + "lr": 6.698729810778072e-05, + "time_sec": 86.95501017570496 + }, + { + "epoch": 126, + "train_loss": 4.406389302368164, + "train_acc": 0.04668, + "test_loss": 4.62824654006958, + "test_acc": 0.01, + "lyapunov": 2.0166642894525357, + "grad_norm": 0.5564968205221957, + "grad_max_sv": 0.12961208932101725, + "grad_min_sv": 3.404863768707855e-09, + "grad_condition": 46850126.917104796, + "lr": 6.184665997806817e-05, + "time_sec": 86.89860510826111 + }, + { + "epoch": 127, + "train_loss": 4.421845231018066, + "train_acc": 0.04476, + "test_loss": 4.664912997436524, + "test_acc": 0.01, + "lyapunov": 2.0588970028835796, + "grad_norm": 0.54518049391847, + "grad_max_sv": 0.13061115611344576, + "grad_min_sv": 3.511758283128441e-09, + "grad_condition": 220500422.1836423, + "lr": 5.6898210384392595e-05, + "time_sec": 86.902822971344 + }, + { + "epoch": 128, + "train_loss": 4.466351209259034, + "train_acc": 0.04156, + "test_loss": 4.625092854309082, + "test_acc": 0.01, + "lyapunov": 2.054337273168442, + "grad_norm": 0.8009056003184672, + "grad_max_sv": 0.15183761473745108, + "grad_min_sv": 3.3345070037309657e-09, + "grad_condition": 1708739228.5454607, + "lr": 5.214411988029363e-05, + "time_sec": 86.9044144153595 + }, + { + "epoch": 129, + "train_loss": 4.410576982879639, + "train_acc": 0.0476, + "test_loss": 4.881959016418457, + "test_acc": 0.01, + "lyapunov": 2.066727384277012, + "grad_norm": 0.5318034857860106, + "grad_max_sv": 0.13615109845995904, + "grad_min_sv": 3.475596455342761e-09, + "grad_condition": 319815003.9823411, + "lr": 4.7586473766990294e-05, + "time_sec": 86.9201877117157 + }, + { + "epoch": 130, + "train_loss": 4.433161810302734, + "train_acc": 0.04566, + "test_loss": 4.664642805480957, + "test_acc": 0.01, + "lyapunov": 2.0571704889502365, + "grad_norm": 0.6233163181376318, + "grad_max_sv": 0.1495013041421771, + "grad_min_sv": 3.495363523273176e-09, + "grad_condition": 164232362.84179428, + "lr": 4.32272711786996e-05, + "time_sec": 86.9145233631134 + }, + { + "epoch": 131, + "train_loss": 4.559218102874756, + "train_acc": 0.03048, + "test_loss": 6.326250002288818, + "test_acc": 0.01, + "lyapunov": 1.9217658497183525, + "grad_norm": 0.7564931295651885, + "grad_max_sv": 0.2271105471998453, + "grad_min_sv": 3.6081980313296123e-09, + "grad_condition": 117749026.05203581, + "lr": 3.906842420574966e-05, + "time_sec": 86.89276170730591 + }, + { + "epoch": 132, + "train_loss": 4.559870092773438, + "train_acc": 0.03412, + "test_loss": 5.827829841613769, + "test_acc": 0.01, + "lyapunov": 2.123707967950865, + "grad_norm": 0.6846614047113081, + "grad_max_sv": 0.20084010064601898, + "grad_min_sv": 3.3751881069101626e-09, + "grad_condition": 872873152.1371578, + "lr": 3.5111757055874305e-05, + "time_sec": 86.91409301757812 + }, + { + "epoch": 133, + "train_loss": 4.433041811676025, + "train_acc": 0.04474, + "test_loss": 5.367306958007813, + "test_acc": 0.01, + "lyapunov": 2.0676878599254676, + "grad_norm": 0.5862986449277, + "grad_max_sv": 0.14338587652891874, + "grad_min_sv": 3.311574372187598e-09, + "grad_condition": 132479663.36386319, + "lr": 3.1359005254054254e-05, + "time_sec": 86.91529488563538 + }, + { + "epoch": 134, + "train_loss": 4.398417986602783, + "train_acc": 0.04772, + "test_loss": 4.720828105163574, + "test_acc": 0.01, + "lyapunov": 2.0894959808310585, + "grad_norm": 0.5265195386524826, + "grad_max_sv": 0.12358421217650176, + "grad_min_sv": 3.3169084333317666e-09, + "grad_condition": 75397884.58751842, + "lr": 2.7811814881259484e-05, + "time_sec": 86.98745679855347 + }, + { + "epoch": 135, + "train_loss": 4.413595640716553, + "train_acc": 0.04784, + "test_loss": 4.712530905151367, + "test_acc": 0.01, + "lyapunov": 2.1319035063009433, + "grad_norm": 0.5366514710399874, + "grad_max_sv": 0.12893760427832604, + "grad_min_sv": 3.733237558065788e-09, + "grad_condition": 129039558.48728514, + "lr": 2.4471741852423218e-05, + "time_sec": 86.93967342376709 + }, + { + "epoch": 136, + "train_loss": 4.405735962677002, + "train_acc": 0.04902, + "test_loss": 4.652213160705567, + "test_acc": 0.01, + "lyapunov": 2.1043942465501675, + "grad_norm": 0.5842194415437647, + "grad_max_sv": 0.13640696089714766, + "grad_min_sv": 3.6649167473382093e-09, + "grad_condition": 67841494.7867911, + "lr": 2.1340251233966362e-05, + "time_sec": 86.92829084396362 + }, + { + "epoch": 137, + "train_loss": 4.409075500030518, + "train_acc": 0.04824, + "test_loss": 4.6458401512146, + "test_acc": 0.01, + "lyapunov": 2.1048210426364715, + "grad_norm": 0.6189485837537402, + "grad_max_sv": 0.12394427489489317, + "grad_min_sv": 3.56216997565717e-09, + "grad_condition": 43191541.57949173, + "lr": 1.8418716601170932e-05, + "time_sec": 86.98851037025452 + }, + { + "epoch": 138, + "train_loss": 4.394878734741211, + "train_acc": 0.05004, + "test_loss": 4.742844686889648, + "test_acc": 0.01, + "lyapunov": 2.098401205009207, + "grad_norm": 0.5053435905574138, + "grad_max_sv": 0.11973771546036005, + "grad_min_sv": 3.5540812636652985e-09, + "grad_condition": 48597244.2583981, + "lr": 1.570841943568445e-05, + "time_sec": 86.94594693183899 + }, + { + "epoch": 139, + "train_loss": 4.454589398956299, + "train_acc": 0.04486, + "test_loss": 10.641064196777343, + "test_acc": 0.01, + "lyapunov": 2.0825157180771496, + "grad_norm": 0.7130369910143651, + "grad_max_sv": 0.14804725386202336, + "grad_min_sv": 3.4161704021151706e-09, + "grad_condition": 236395663.3257776, + "lr": 1.3210548563419845e-05, + "time_sec": 87.00129246711731 + }, + { + "epoch": 140, + "train_loss": 4.612700431671143, + "train_acc": 0.02562, + "test_loss": 5.085433462524414, + "test_acc": 0.01, + "lyapunov": 2.0142276125490817, + "grad_norm": 0.8209647733278711, + "grad_max_sv": 0.24317651763558387, + "grad_min_sv": 3.4037354469662608e-09, + "grad_condition": 190430418.85185307, + "lr": 1.0926199633097203e-05, + "time_sec": 86.9971239566803 + }, + { + "epoch": 141, + "train_loss": 4.487321048126221, + "train_acc": 0.0448, + "test_loss": 4.666201837921142, + "test_acc": 0.01, + "lyapunov": 2.2915835459823803, + "grad_norm": 0.6559251797263009, + "grad_max_sv": 0.13485133294016122, + "grad_min_sv": 3.4415409784147033e-09, + "grad_condition": 93528260.3989991, + "lr": 8.856374635655688e-06, + "time_sec": 87.03978943824768 + }, + { + "epoch": 142, + "train_loss": 4.471693329467773, + "train_acc": 0.04518, + "test_loss": 10.255754643249512, + "test_acc": 0.01, + "lyapunov": 2.178483701118118, + "grad_norm": 0.8381236929202858, + "grad_max_sv": 0.14980254359543324, + "grad_min_sv": 3.358237557309074e-09, + "grad_condition": 83488767.17166467, + "lr": 7.001981464747503e-06, + "time_sec": 87.01720571517944 + }, + { + "epoch": 143, + "train_loss": 4.446647290802002, + "train_acc": 0.04566, + "test_loss": 4.652296996307373, + "test_acc": 0.01, + "lyapunov": 2.1722125500974143, + "grad_norm": 0.5045885772353321, + "grad_max_sv": 0.11461257673799992, + "grad_min_sv": 3.376102331031916e-09, + "grad_condition": 69534096.19918647, + "lr": 5.3638335185058295e-06, + "time_sec": 86.93180632591248 + }, + { + "epoch": 144, + "train_loss": 4.493613358459473, + "train_acc": 0.04666, + "test_loss": 4.656233798217773, + "test_acc": 0.01, + "lyapunov": 2.1921363026284806, + "grad_norm": 0.5273945169505434, + "grad_max_sv": 0.11423748508095741, + "grad_min_sv": 3.4756384994128094e-09, + "grad_condition": 646405488.9879736, + "lr": 3.942649342761114e-06, + "time_sec": 86.91520476341248 + }, + { + "epoch": 145, + "train_loss": 4.597374949035644, + "train_acc": 0.0423, + "test_loss": 4.678201083374024, + "test_acc": 0.01, + "lyapunov": 2.2713517182318452, + "grad_norm": 0.47075033695967056, + "grad_max_sv": 0.12002073060721159, + "grad_min_sv": 3.703222454382038e-09, + "grad_condition": 39345602.26548739, + "lr": 2.7390523158633524e-06, + "time_sec": 86.92837643623352 + }, + { + "epoch": 146, + "train_loss": 4.794219552612304, + "train_acc": 0.02986, + "test_loss": 4.920618478393554, + "test_acc": 0.01, + "lyapunov": 2.394326541429895, + "grad_norm": 0.5246817663077135, + "grad_max_sv": 0.1241353990510106, + "grad_min_sv": 3.777793512477895e-09, + "grad_condition": 151497093.53789455, + "lr": 1.7535703752478133e-06, + "time_sec": 86.90443754196167 + }, + { + "epoch": 147, + "train_loss": 4.823008825378418, + "train_acc": 0.02802, + "test_loss": 4.705312028503418, + "test_acc": 0.01, + "lyapunov": 2.351406611749888, + "grad_norm": 0.5821396042735293, + "grad_max_sv": 0.13014851678162814, + "grad_min_sv": 4.0446829205776495e-09, + "grad_condition": 251708764.25831342, + "lr": 9.866357858642196e-07, + "time_sec": 86.91423988342285 + }, + { + "epoch": 148, + "train_loss": 4.7621851733398435, + "train_acc": 0.03064, + "test_loss": 4.91432806854248, + "test_acc": 0.01, + "lyapunov": 2.320931021209873, + "grad_norm": 0.3655369703619559, + "grad_max_sv": 0.13613226637244225, + "grad_min_sv": 4.233843499401591e-09, + "grad_condition": 37577954.13970064, + "lr": 4.38584950570808e-07, + "time_sec": 86.91514897346497 + }, + { + "epoch": 149, + "train_loss": 4.751388474884033, + "train_acc": 0.0314, + "test_loss": 4.928393530273437, + "test_acc": 0.01, + "lyapunov": 2.314872954507618, + "grad_norm": 0.34582385046790637, + "grad_max_sv": 0.13010288886725901, + "grad_min_sv": 4.070593409566392e-09, + "grad_condition": 116727132.6636453, + "lr": 1.096582625772501e-07, + "time_sec": 86.9192042350769 + }, + { + "epoch": 150, + "train_loss": 4.749187584838867, + "train_acc": 0.03084, + "test_loss": 4.9377007514953615, + "test_acc": 0.01, + "lyapunov": 2.3339363833522553, + "grad_norm": 0.3438957720875417, + "grad_max_sv": 0.13015102557837963, + "grad_min_sv": 4.109157251269702e-09, + "grad_condition": 44500021.17512281, + "lr": 0.0, + "time_sec": 86.93520998954773 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 5.079536279754639, + "train_acc": 0.01882, + "test_loss": 4.8872514236450195, + "test_acc": 0.01, + "lyapunov": 2.433271625157817, + "grad_norm": 5.340808628002946, + "grad_max_sv": 4.541763198375702, + "grad_min_sv": 9.132611378248612e-08, + "grad_condition": 60829743.69210352, + "lr": 0.0009998903417374227, + "time_sec": 132.14811611175537 + }, + { + "epoch": 2, + "train_loss": 4.774603317108154, + "train_acc": 0.01862, + "test_loss": 4.825307096862793, + "test_acc": 0.0099, + "lyapunov": 1.98436847062367, + "grad_norm": 3.9424334574306945, + "grad_max_sv": 2.8938568502198905, + "grad_min_sv": 5.677021384237202e-08, + "grad_condition": 58708438.134107456, + "lr": 0.0009995614150494292, + "time_sec": 132.15339040756226 + }, + { + "epoch": 3, + "train_loss": 4.663901504821777, + "train_acc": 0.0181, + "test_loss": 4.741232266235351, + "test_acc": 0.0145, + "lyapunov": 1.810482630949191, + "grad_norm": 2.7675521449461615, + "grad_max_sv": 1.8919199114665388, + "grad_min_sv": 3.818708835257034e-08, + "grad_condition": 54723570.14412842, + "lr": 0.0009990133642141358, + "time_sec": 132.11823868751526 + }, + { + "epoch": 4, + "train_loss": 4.583503988037109, + "train_acc": 0.0196, + "test_loss": 4.733808113098145, + "test_acc": 0.0127, + "lyapunov": 1.7725569412226567, + "grad_norm": 1.5853399774616823, + "grad_max_sv": 1.1614753112196923, + "grad_min_sv": 2.5252084090432447e-08, + "grad_condition": 49535418.60263091, + "lr": 0.0009982464296247522, + "time_sec": 132.14728569984436 + }, + { + "epoch": 5, + "train_loss": 4.5524190596008305, + "train_acc": 0.0185, + "test_loss": 4.749317463684082, + "test_acc": 0.0192, + "lyapunov": 1.7379879927086404, + "grad_norm": 0.9357664119583106, + "grad_max_sv": 0.623048696666956, + "grad_min_sv": 9.444938395329703e-09, + "grad_condition": 17454448603.577705, + "lr": 0.0009972609476841367, + "time_sec": 132.12196040153503 + }, + { + "epoch": 6, + "train_loss": 4.5547177754211425, + "train_acc": 0.0182, + "test_loss": 4.739207301330566, + "test_acc": 0.01, + "lyapunov": 1.7158090205448668, + "grad_norm": 0.6464921766494518, + "grad_max_sv": 0.4727002829313278, + "grad_min_sv": 1.4752434742032504e-09, + "grad_condition": 79239316890.38657, + "lr": 0.000996057350657239, + "time_sec": 132.20789337158203 + }, + { + "epoch": 7, + "train_loss": 4.567618137207031, + "train_acc": 0.01618, + "test_loss": 4.935951011657715, + "test_acc": 0.01, + "lyapunov": 1.6808951733362338, + "grad_norm": 0.708796945528179, + "grad_max_sv": 0.49447881430387497, + "grad_min_sv": 6.565144610538648e-12, + "grad_condition": 125853841385.85806, + "lr": 0.000994636166481494, + "time_sec": 132.16308617591858 + }, + { + "epoch": 8, + "train_loss": 4.5752451333618165, + "train_acc": 0.01508, + "test_loss": 4.654486715698242, + "test_acc": 0.01, + "lyapunov": 1.6649316146855464, + "grad_norm": 0.516840314330209, + "grad_max_sv": 0.3999390289187431, + "grad_min_sv": 3.239160638355361e-12, + "grad_condition": 132523175102.69946, + "lr": 0.0009929980185352525, + "time_sec": 132.1433699131012 + }, + { + "epoch": 9, + "train_loss": 4.584617326049805, + "train_acc": 0.01304, + "test_loss": 5.1370941864013675, + "test_acc": 0.01, + "lyapunov": 1.6745121082686403, + "grad_norm": 0.4662376866434158, + "grad_max_sv": 0.40068961679935455, + "grad_min_sv": 1.600815539628815e-12, + "grad_condition": 195211792607.34824, + "lr": 0.0009911436253643444, + "time_sec": 132.11373782157898 + }, + { + "epoch": 10, + "train_loss": 4.584750150451661, + "train_acc": 0.01344, + "test_loss": 5.014252323913574, + "test_acc": 0.01, + "lyapunov": 1.6392524599114342, + "grad_norm": 0.44066573339421267, + "grad_max_sv": 0.36354004368186, + "grad_min_sv": 1.0598376590459934e-12, + "grad_condition": 227681718826.60748, + "lr": 0.0009890738003669028, + "time_sec": 132.10810494422913 + }, + { + "epoch": 11, + "train_loss": 4.5782438153076175, + "train_acc": 0.01444, + "test_loss": 5.320826235198974, + "test_acc": 0.01, + "lyapunov": 1.6105381171111866, + "grad_norm": 0.46476522396770953, + "grad_max_sv": 0.384793009608984, + "grad_min_sv": 2.2384307405079876e-12, + "grad_condition": 181440627603.39355, + "lr": 0.00098678945143658, + "time_sec": 132.21521854400635 + }, + { + "epoch": 12, + "train_loss": 4.58615560546875, + "train_acc": 0.0146, + "test_loss": 6.162300729370117, + "test_acc": 0.01, + "lyapunov": 1.6162703143971047, + "grad_norm": 0.4583379516120641, + "grad_max_sv": 0.35209991298615934, + "grad_min_sv": 2.3950308634256474e-10, + "grad_condition": 199277790232.2622, + "lr": 0.0009842915805643154, + "time_sec": 132.06736636161804 + }, + { + "epoch": 13, + "train_loss": 4.58813276260376, + "train_acc": 0.01408, + "test_loss": 5.858095126342773, + "test_acc": 0.01, + "lyapunov": 1.6260488749769948, + "grad_norm": 0.39204254749475886, + "grad_max_sv": 0.3283296298235655, + "grad_min_sv": 5.234225415161807e-13, + "grad_condition": 249094970429.50763, + "lr": 0.000981581283398829, + "time_sec": 132.05243945121765 + }, + { + "epoch": 14, + "train_loss": 4.583052165374756, + "train_acc": 0.01376, + "test_loss": 5.763050801086425, + "test_acc": 0.0129, + "lyapunov": 1.6144071317389799, + "grad_norm": 0.5077264967403567, + "grad_max_sv": 0.4109547406435013, + "grad_min_sv": 1.3599295635453275e-12, + "grad_condition": 228187641587.3903, + "lr": 0.0009786597487660333, + "time_sec": 132.10575103759766 + }, + { + "epoch": 15, + "train_loss": 4.5714335003662105, + "train_acc": 0.0158, + "test_loss": 5.952970848083496, + "test_acc": 0.0108, + "lyapunov": 1.6084746881519132, + "grad_norm": 0.4822199745251536, + "grad_max_sv": 0.4148616835474968, + "grad_min_sv": 1.325723769366507e-12, + "grad_condition": 228332485622.18976, + "lr": 0.0009755282581475766, + "time_sec": 132.07877397537231 + }, + { + "epoch": 16, + "train_loss": 4.565800028839111, + "train_acc": 0.0173, + "test_loss": 6.017549203491211, + "test_acc": 0.0137, + "lyapunov": 1.6085086640189676, + "grad_norm": 0.47773503355798047, + "grad_max_sv": 0.37624144479632377, + "grad_min_sv": 1.8790570016513782e-12, + "grad_condition": 187345627300.82098, + "lr": 0.0009721881851187403, + "time_sec": 132.12643265724182 + }, + { + "epoch": 17, + "train_loss": 4.561137200317383, + "train_acc": 0.01712, + "test_loss": 5.580053092956543, + "test_acc": 0.0107, + "lyapunov": 1.6103480209779861, + "grad_norm": 0.42330979896069637, + "grad_max_sv": 0.3250656593590975, + "grad_min_sv": 2.3677161192719408e-12, + "grad_condition": 147724357967.11288, + "lr": 0.0009686409947459456, + "time_sec": 132.14898109436035 + }, + { + "epoch": 18, + "train_loss": 4.563034916381836, + "train_acc": 0.0177, + "test_loss": 6.472257780456543, + "test_acc": 0.012, + "lyapunov": 1.60859798714328, + "grad_norm": 0.39753763021030414, + "grad_max_sv": 0.3068309862166643, + "grad_min_sv": 1.984737901050091e-12, + "grad_condition": 141601417281.96045, + "lr": 0.0009648882429441254, + "time_sec": 132.13856673240662 + }, + { + "epoch": 19, + "train_loss": 4.573127483978271, + "train_acc": 0.01616, + "test_loss": 6.564729704284668, + "test_acc": 0.01, + "lyapunov": 1.6016948787147736, + "grad_norm": 0.37413654436559074, + "grad_max_sv": 0.25983951464295385, + "grad_min_sv": 8.805135414126768e-13, + "grad_condition": 167002019939.4643, + "lr": 0.00096093157579425, + "time_sec": 132.11500477790833 + }, + { + "epoch": 20, + "train_loss": 4.56939130859375, + "train_acc": 0.01528, + "test_loss": 5.16709538116455, + "test_acc": 0.01, + "lyapunov": 1.597558982841804, + "grad_norm": 0.39362856256863293, + "grad_max_sv": 0.2981186196208, + "grad_min_sv": 1.14360007788262e-12, + "grad_condition": 172580154761.56354, + "lr": 0.0009567727288213001, + "time_sec": 132.1002917289734 + }, + { + "epoch": 21, + "train_loss": 4.562076300048828, + "train_acc": 0.01692, + "test_loss": 7.266219122314453, + "test_acc": 0.01, + "lyapunov": 1.583339158531345, + "grad_norm": 0.3838804885339558, + "grad_max_sv": 0.2798105400055647, + "grad_min_sv": 7.450625884139858e-13, + "grad_condition": 177009367673.91373, + "lr": 0.0009524135262330095, + "time_sec": 132.13163590431213 + }, + { + "epoch": 22, + "train_loss": 4.559008093414307, + "train_acc": 0.01742, + "test_loss": 8.447665538024902, + "test_acc": 0.01, + "lyapunov": 1.603207119285603, + "grad_norm": 0.34832863438111206, + "grad_max_sv": 0.26395418867468834, + "grad_min_sv": 1.4773422168547318e-12, + "grad_condition": 143366348092.1024, + "lr": 0.0009478558801197061, + "time_sec": 132.09874486923218 + }, + { + "epoch": 23, + "train_loss": 4.567956644134521, + "train_acc": 0.01592, + "test_loss": 6.940740246582031, + "test_acc": 0.01, + "lyapunov": 1.585778128460545, + "grad_norm": 0.3751847661218295, + "grad_max_sv": 0.2457405323628336, + "grad_min_sv": 6.231746074838346e-13, + "grad_condition": 170137728056.1702, + "lr": 0.000943101789615607, + "time_sec": 132.0928874015808 + }, + { + "epoch": 24, + "train_loss": 4.56678815246582, + "train_acc": 0.01628, + "test_loss": 7.364704632568359, + "test_acc": 0.01, + "lyapunov": 1.5802125275287482, + "grad_norm": 0.3399018458628351, + "grad_max_sv": 0.2711117286235094, + "grad_min_sv": 9.27439371401471e-13, + "grad_condition": 170001968568.01523, + "lr": 0.0009381533400219313, + "time_sec": 132.12326908111572 + }, + { + "epoch": 25, + "train_loss": 4.551226531219482, + "train_acc": 0.01722, + "test_loss": 7.127618463134765, + "test_acc": 0.01, + "lyapunov": 1.5777013463437404, + "grad_norm": 0.3789618085380604, + "grad_max_sv": 0.2764745395630598, + "grad_min_sv": 1.510240189536528e-12, + "grad_condition": 150249480387.73657, + "lr": 0.0009330127018922189, + "time_sec": 132.14744663238525 + }, + { + "epoch": 26, + "train_loss": 4.533589083099365, + "train_acc": 0.01782, + "test_loss": 7.280224295043945, + "test_acc": 0.01, + "lyapunov": 1.5766756863850158, + "grad_norm": 0.4098165679041348, + "grad_max_sv": 0.32836851589381694, + "grad_min_sv": 1.6846995700798532e-12, + "grad_condition": 162596172663.19934, + "lr": 0.000927682130080253, + "time_sec": 132.10132360458374 + }, + { + "epoch": 27, + "train_loss": 4.5178348692321775, + "train_acc": 0.01944, + "test_loss": 4.609143519592285, + "test_acc": 0.01, + "lyapunov": 1.5718533059825068, + "grad_norm": 0.4317006812537803, + "grad_max_sv": 0.299236249551177, + "grad_min_sv": 2.0935759289783253e-12, + "grad_condition": 152648919866.78998, + "lr": 0.0009221639627510072, + "time_sec": 132.11033844947815 + }, + { + "epoch": 28, + "train_loss": 4.538441289978027, + "train_acc": 0.01874, + "test_loss": 5.727067053222656, + "test_acc": 0.01, + "lyapunov": 1.5787607407021096, + "grad_norm": 0.4781702015089973, + "grad_max_sv": 0.31850807219743726, + "grad_min_sv": 3.363601657944103e-12, + "grad_condition": 113571776097.28023, + "lr": 0.0009164606203550494, + "time_sec": 132.13339686393738 + }, + { + "epoch": 29, + "train_loss": 4.55489263671875, + "train_acc": 0.01978, + "test_loss": 6.314897917175293, + "test_acc": 0.01, + "lyapunov": 1.6226641564722866, + "grad_norm": 0.39702511856584055, + "grad_max_sv": 0.3101757925003767, + "grad_min_sv": 1.643950862890769e-12, + "grad_condition": 162529843580.92197, + "lr": 0.0009105746045668516, + "time_sec": 132.10528302192688 + }, + { + "epoch": 30, + "train_loss": 4.5577034072875975, + "train_acc": 0.01934, + "test_loss": 5.7611766616821285, + "test_acc": 0.01, + "lyapunov": 1.629781426371211, + "grad_norm": 0.4775298671802556, + "grad_max_sv": 0.3297189258038998, + "grad_min_sv": 3.2226531698260168e-12, + "grad_condition": 123880857814.76614, + "lr": 0.0009045084971874733, + "time_sec": 132.16758227348328 + }, + { + "epoch": 31, + "train_loss": 4.549954524230957, + "train_acc": 0.01922, + "test_loss": 6.9685128242492675, + "test_acc": 0.01, + "lyapunov": 1.6153524620148836, + "grad_norm": 0.39506087923244415, + "grad_max_sv": 0.305246427282691, + "grad_min_sv": 2.963371775308759e-12, + "grad_condition": 116809738976.30655, + "lr": 0.0008982649590120977, + "time_sec": 132.1613085269928 + }, + { + "epoch": 32, + "train_loss": 4.541183842926025, + "train_acc": 0.02124, + "test_loss": 6.829874574279785, + "test_acc": 0.01, + "lyapunov": 1.6133781327006151, + "grad_norm": 0.38947657187455065, + "grad_max_sv": 0.2715518455952406, + "grad_min_sv": 2.244930278252747e-12, + "grad_condition": 123331380509.9804, + "lr": 0.0008918467286629196, + "time_sec": 132.16536712646484 + }, + { + "epoch": 33, + "train_loss": 4.53525604888916, + "train_acc": 0.02098, + "test_loss": 6.518293627166748, + "test_acc": 0.01, + "lyapunov": 1.6150689750071376, + "grad_norm": 0.42014951113026694, + "grad_max_sv": 0.2435957606881857, + "grad_min_sv": 2.048687606811065e-12, + "grad_condition": 116665598250.77344, + "lr": 0.0008852566213878943, + "time_sec": 132.09782457351685 + }, + { + "epoch": 34, + "train_loss": 4.5325355252075195, + "train_acc": 0.01958, + "test_loss": 6.317331722259522, + "test_acc": 0.01, + "lyapunov": 1.5877615957308913, + "grad_norm": 0.3361598121090629, + "grad_max_sv": 0.2522958844900131, + "grad_min_sv": 3.651040784603148e-12, + "grad_condition": 86623505850.41478, + "lr": 0.000878497527825878, + "time_sec": 132.10610961914062 + }, + { + "epoch": 35, + "train_loss": 4.536015074005127, + "train_acc": 0.01868, + "test_loss": 6.3701594413757325, + "test_acc": 0.01, + "lyapunov": 1.5917383560439204, + "grad_norm": 0.34920551391182975, + "grad_max_sv": 0.23412882573902608, + "grad_min_sv": 2.182336791137283e-12, + "grad_condition": 102971407638.13591, + "lr": 0.000871572412738697, + "time_sec": 132.09818148612976 + }, + { + "epoch": 36, + "train_loss": 4.530319141998291, + "train_acc": 0.0189, + "test_loss": 6.076102793121338, + "test_acc": 0.01, + "lyapunov": 1.6073461313686712, + "grad_norm": 0.3121785959415577, + "grad_max_sv": 0.2200178649276495, + "grad_min_sv": 3.2766681152194533e-12, + "grad_condition": 85204262775.15216, + "lr": 0.0008644843137107055, + "time_sec": 132.1121485233307 + }, + { + "epoch": 37, + "train_loss": 4.530366974945069, + "train_acc": 0.02034, + "test_loss": 5.606327301025391, + "test_acc": 0.01, + "lyapunov": 1.6122757229963531, + "grad_norm": 0.3191242103818429, + "grad_max_sv": 0.20528502985835076, + "grad_min_sv": 1.8868968590479396e-12, + "grad_condition": 90563087741.60693, + "lr": 0.0008572363398164014, + "time_sec": 132.1431803703308 + }, + { + "epoch": 38, + "train_loss": 4.531652006530762, + "train_acc": 0.0181, + "test_loss": 6.281176449584961, + "test_acc": 0.01, + "lyapunov": 1.5978836668726732, + "grad_norm": 0.3226311590239451, + "grad_max_sv": 0.18021098636090754, + "grad_min_sv": 1.3471604261713563e-12, + "grad_condition": 97967821962.4504, + "lr": 0.0008498316702566826, + "time_sec": 132.1808111667633 + }, + { + "epoch": 39, + "train_loss": 4.515576623077393, + "train_acc": 0.02002, + "test_loss": 7.3591477447509765, + "test_acc": 0.01, + "lyapunov": 1.595075506688384, + "grad_norm": 0.29392491905513246, + "grad_max_sv": 0.175280692987144, + "grad_min_sv": 1.3060439555812542e-12, + "grad_condition": 99096247746.24886, + "lr": 0.0008422735529643442, + "time_sec": 132.13058257102966 + }, + { + "epoch": 40, + "train_loss": 4.508498954620362, + "train_acc": 0.02058, + "test_loss": 5.166109811401367, + "test_acc": 0.01, + "lyapunov": 1.592364840190429, + "grad_norm": 0.31050287296978984, + "grad_max_sv": 0.18211948983371257, + "grad_min_sv": 2.1916040644331514e-12, + "grad_condition": 89426467797.39761, + "lr": 0.0008345653031794289, + "time_sec": 132.1956102848053 + }, + { + "epoch": 41, + "train_loss": 4.594321117401123, + "train_acc": 0.01546, + "test_loss": 7.777395164489746, + "test_acc": 0.01, + "lyapunov": 1.6293273725168174, + "grad_norm": 1.0042516112855135, + "grad_max_sv": 0.14036097445059567, + "grad_min_sv": 2.5427231651336982e-11, + "grad_condition": 81054501201.00836, + "lr": 0.0008267103019950526, + "time_sec": 132.13326239585876 + }, + { + "epoch": 42, + "train_loss": 4.569071527404785, + "train_acc": 0.01844, + "test_loss": 7.213038313293457, + "test_acc": 0.01, + "lyapunov": 1.6979200718043101, + "grad_norm": 0.26172862173554357, + "grad_max_sv": 0.16976843364536762, + "grad_min_sv": 1.3973847074078634e-12, + "grad_condition": 86625374599.54195, + "lr": 0.0008187119948743447, + "time_sec": 132.11792135238647 + }, + { + "epoch": 43, + "train_loss": 4.558605685272217, + "train_acc": 0.01936, + "test_loss": 7.291248056030273, + "test_acc": 0.01, + "lyapunov": 1.6884295074531184, + "grad_norm": 0.28281726127535384, + "grad_max_sv": 0.16570937782526016, + "grad_min_sv": 1.422441962513273e-12, + "grad_condition": 88001604691.41785, + "lr": 0.000810573890139155, + "time_sec": 132.1009702682495 + }, + { + "epoch": 44, + "train_loss": 4.560630667114258, + "train_acc": 0.01868, + "test_loss": 7.16728485031128, + "test_acc": 0.01, + "lyapunov": 1.686604334875141, + "grad_norm": 0.28505793697030324, + "grad_max_sv": 0.15897216144949197, + "grad_min_sv": 1.4942365308149637e-12, + "grad_condition": 86276532282.80447, + "lr": 0.0008022995574311873, + "time_sec": 132.1154272556305 + }, + { + "epoch": 45, + "train_loss": 4.5725548426818845, + "train_acc": 0.0188, + "test_loss": 7.126261402893066, + "test_acc": 0.01, + "lyapunov": 1.686247174087388, + "grad_norm": 0.235009326711948, + "grad_max_sv": 0.15716111175715924, + "grad_min_sv": 7.169276878089038e-13, + "grad_condition": 108521610164.79031, + "lr": 0.0007938926261462363, + "time_sec": 132.11932492256165 + }, + { + "epoch": 46, + "train_loss": 4.583313959960938, + "train_acc": 0.0172, + "test_loss": 5.289773531341552, + "test_acc": 0.01, + "lyapunov": 1.698270396198458, + "grad_norm": 0.313539150382163, + "grad_max_sv": 0.16240414716303347, + "grad_min_sv": 6.375463347288685e-13, + "grad_condition": 111380569067.90488, + "lr": 0.0007853567838422158, + "time_sec": 132.14860010147095 + }, + { + "epoch": 47, + "train_loss": 4.578197394866943, + "train_acc": 0.01782, + "test_loss": 6.591432273864746, + "test_acc": 0.01, + "lyapunov": 1.6831631639119609, + "grad_norm": 0.2604809257680144, + "grad_max_sv": 0.15823213588446378, + "grad_min_sv": 1.3005127228431431e-12, + "grad_condition": 88272206869.29628, + "lr": 0.0007766957746216719, + "time_sec": 132.12520599365234 + }, + { + "epoch": 48, + "train_loss": 4.578674370269775, + "train_acc": 0.01816, + "test_loss": 5.157715400695801, + "test_acc": 0.01, + "lyapunov": 1.6778625536452778, + "grad_norm": 0.36451993025813884, + "grad_max_sv": 0.16272996473126114, + "grad_min_sv": 2.5139523132342427e-12, + "grad_condition": 93980395518.9741, + "lr": 0.0007679133974894982, + "time_sec": 132.10149908065796 + }, + { + "epoch": 49, + "train_loss": 4.558167927093506, + "train_acc": 0.0207, + "test_loss": 5.5524071670532225, + "test_acc": 0.01, + "lyapunov": 1.654131231710429, + "grad_norm": 0.26398153340032604, + "grad_max_sv": 0.15602914486080408, + "grad_min_sv": 8.142784605144219e-11, + "grad_condition": 49953288517.76509, + "lr": 0.000759013504686565, + "time_sec": 132.14293909072876 + }, + { + "epoch": 50, + "train_loss": 4.556328114318847, + "train_acc": 0.02032, + "test_loss": 5.053372247314453, + "test_acc": 0.01, + "lyapunov": 1.658374283319849, + "grad_norm": 0.24338078400550828, + "grad_max_sv": 0.1512946780771017, + "grad_min_sv": 2.964903017923289e-12, + "grad_condition": 67110635284.64429, + "lr": 0.0007499999999999998, + "time_sec": 132.1664924621582 + }, + { + "epoch": 51, + "train_loss": 4.570141744995118, + "train_acc": 0.01988, + "test_loss": 5.131472052001953, + "test_acc": 0.01, + "lyapunov": 1.6845884472512833, + "grad_norm": 0.2817728093100986, + "grad_max_sv": 0.13915783632546663, + "grad_min_sv": 1.7209330912965342e-12, + "grad_condition": 70074791169.44548, + "lr": 0.0007408768370508575, + "time_sec": 132.25617241859436 + }, + { + "epoch": 52, + "train_loss": 4.574759218902588, + "train_acc": 0.01936, + "test_loss": 5.048821273803711, + "test_acc": 0.01, + "lyapunov": 1.6568556862414037, + "grad_norm": 0.2134662683751272, + "grad_max_sv": 0.13759722150862216, + "grad_min_sv": 1.421003107907492e-12, + "grad_condition": 75951660314.10495, + "lr": 0.0007316480175599307, + "time_sec": 132.24415564537048 + }, + { + "epoch": 53, + "train_loss": 4.578046445617676, + "train_acc": 0.01878, + "test_loss": 5.305573741149902, + "test_acc": 0.01, + "lyapunov": 1.6395436802788463, + "grad_norm": 0.20939237447265202, + "grad_max_sv": 0.13288239240646363, + "grad_min_sv": 8.329158668790625e-13, + "grad_condition": 89438685434.2227, + "lr": 0.0007223175895924635, + "time_sec": 132.20375537872314 + }, + { + "epoch": 54, + "train_loss": 4.581330629272461, + "train_acc": 0.0165, + "test_loss": 5.532207501983643, + "test_acc": 0.01, + "lyapunov": 1.6444858135774618, + "grad_norm": 0.2762560677540659, + "grad_max_sv": 0.12445617569610476, + "grad_min_sv": 3.912145951191304e-12, + "grad_condition": 83557962455.66768, + "lr": 0.0007128896457825361, + "time_sec": 132.15107369422913 + }, + { + "epoch": 55, + "train_loss": 4.581049518737793, + "train_acc": 0.01652, + "test_loss": 5.197387743377686, + "test_acc": 0.01, + "lyapunov": 1.6384336021550172, + "grad_norm": 0.23390564725407778, + "grad_max_sv": 0.1323490994051099, + "grad_min_sv": 6.793781517885129e-13, + "grad_condition": 88731637332.26297, + "lr": 0.0007033683215378998, + "time_sec": 132.17300724983215 + }, + { + "epoch": 56, + "train_loss": 4.584884506378174, + "train_acc": 0.01634, + "test_loss": 6.454191752624512, + "test_acc": 0.01, + "lyapunov": 1.6743981499806084, + "grad_norm": 0.25387218343472684, + "grad_max_sv": 0.13131952080875636, + "grad_min_sv": 5.318952729656952e-13, + "grad_condition": 95324952785.9041, + "lr": 0.0006937577932260512, + "time_sec": 132.16189765930176 + }, + { + "epoch": 57, + "train_loss": 4.586065352630615, + "train_acc": 0.01452, + "test_loss": 6.120808155822754, + "test_acc": 0.01, + "lyapunov": 1.635638156815258, + "grad_norm": 0.19075779973568727, + "grad_max_sv": 0.10836047828197479, + "grad_min_sv": 3.0117655839699465e-13, + "grad_condition": 89022659140.15048, + "lr": 0.0006840622763423388, + "time_sec": 132.1572346687317 + }, + { + "epoch": 58, + "train_loss": 4.587811795196533, + "train_acc": 0.01474, + "test_loss": 5.800351502990723, + "test_acc": 0.01, + "lyapunov": 1.6200943285851832, + "grad_norm": 0.23045480693280587, + "grad_max_sv": 0.10783510617911815, + "grad_min_sv": 1.62684212425452e-13, + "grad_condition": 94564165099.07333, + "lr": 0.0006742860236609073, + "time_sec": 132.15808749198914 + }, + { + "epoch": 59, + "train_loss": 4.591301085662842, + "train_acc": 0.01376, + "test_loss": 5.996090186309814, + "test_acc": 0.01, + "lyapunov": 1.6170085330143609, + "grad_norm": 0.1857451149070646, + "grad_max_sv": 0.10361974723637105, + "grad_min_sv": 1.6122890156067053e-13, + "grad_condition": 91694547176.55017, + "lr": 0.0006644333233692913, + "time_sec": 132.1711368560791 + }, + { + "epoch": 60, + "train_loss": 4.585452033386231, + "train_acc": 0.01522, + "test_loss": 5.83253670501709, + "test_acc": 0.01, + "lyapunov": 1.6162819191622917, + "grad_norm": 0.27013125926112547, + "grad_max_sv": 0.10345460344105958, + "grad_min_sv": 2.5520667445480586e-13, + "grad_condition": 86471116288.19133, + "lr": 0.0006545084971874734, + "time_sec": 132.12959480285645 + }, + { + "epoch": 61, + "train_loss": 4.575745923614502, + "train_acc": 0.01574, + "test_loss": 5.912968054962159, + "test_acc": 0.01, + "lyapunov": 1.6168097483227626, + "grad_norm": 0.19203323317006551, + "grad_max_sv": 0.1045845141634345, + "grad_min_sv": 2.8391874312669906e-13, + "grad_condition": 84748109291.00053, + "lr": 0.0006445158984722354, + "time_sec": 132.1811854839325 + }, + { + "epoch": 62, + "train_loss": 4.581840614318848, + "train_acc": 0.01504, + "test_loss": 5.784942044067383, + "test_acc": 0.01, + "lyapunov": 1.6041824201793622, + "grad_norm": 0.18322487540118004, + "grad_max_sv": 0.11089323591440917, + "grad_min_sv": 2.605932741312656e-13, + "grad_condition": 91338998422.90005, + "lr": 0.0006344599103076324, + "time_sec": 132.1614978313446 + }, + { + "epoch": 63, + "train_loss": 4.60023887878418, + "train_acc": 0.01528, + "test_loss": 5.64439457244873, + "test_acc": 0.01, + "lyapunov": 1.6233063558178484, + "grad_norm": 0.2113660918385516, + "grad_max_sv": 0.10892452355474233, + "grad_min_sv": 2.537344721436935e-13, + "grad_condition": 90408295734.5693, + "lr": 0.0006243449435824269, + "time_sec": 132.14256119728088 + }, + { + "epoch": 64, + "train_loss": 4.589049236907959, + "train_acc": 0.01542, + "test_loss": 5.874572355651855, + "test_acc": 0.01, + "lyapunov": 1.6047841283061621, + "grad_norm": 0.18184052006950477, + "grad_max_sv": 0.10828140377998352, + "grad_min_sv": 2.791036279353835e-13, + "grad_condition": 88102791154.87807, + "lr": 0.0006141754350553275, + "time_sec": 132.15559458732605 + }, + { + "epoch": 65, + "train_loss": 4.5660726802062985, + "train_acc": 0.01638, + "test_loss": 5.8140344772338866, + "test_acc": 0.01, + "lyapunov": 1.5915922386871884, + "grad_norm": 0.19423334716784915, + "grad_max_sv": 0.10693365205079317, + "grad_min_sv": 3.330885965231205e-13, + "grad_condition": 83112992316.30193, + "lr": 0.0006039558454088793, + "time_sec": 132.18004989624023 + }, + { + "epoch": 66, + "train_loss": 4.580396204833985, + "train_acc": 0.01542, + "test_loss": 5.797694694519043, + "test_acc": 0.01, + "lyapunov": 1.5965009342374095, + "grad_norm": 0.2125232867000169, + "grad_max_sv": 0.10570351034402847, + "grad_min_sv": 2.978146282169481e-13, + "grad_condition": 85693424811.33855, + "lr": 0.000593690657292862, + "time_sec": 132.2843222618103 + }, + { + "epoch": 67, + "train_loss": 4.573282337646484, + "train_acc": 0.01564, + "test_loss": 5.954542552185059, + "test_acc": 0.01, + "lyapunov": 1.601048025938556, + "grad_norm": 0.18603658324598782, + "grad_max_sv": 0.10089892633259297, + "grad_min_sv": 3.469332375289147e-13, + "grad_condition": 80778127108.38254, + "lr": 0.0005833843733580507, + "time_sec": 132.31548929214478 + }, + { + "epoch": 68, + "train_loss": 4.571360148773193, + "train_acc": 0.0161, + "test_loss": 5.669797957611084, + "test_acc": 0.01, + "lyapunov": 1.5947835719798837, + "grad_norm": 0.20014910112057685, + "grad_max_sv": 0.105499835498631, + "grad_min_sv": 9.770913933804e-13, + "grad_condition": 66387740803.896385, + "lr": 0.0005730415142812054, + "time_sec": 132.14850521087646 + }, + { + "epoch": 69, + "train_loss": 4.578122979125976, + "train_acc": 0.01662, + "test_loss": 6.221010691070557, + "test_acc": 0.01, + "lyapunov": 1.6033955156955573, + "grad_norm": 0.30693039018142426, + "grad_max_sv": 0.11157863736152648, + "grad_min_sv": 8.756002305516403e-13, + "grad_condition": 80609250127.91284, + "lr": 0.0005626666167821517, + "time_sec": 132.37923741340637 + }, + { + "epoch": 70, + "train_loss": 4.565648191833496, + "train_acc": 0.01792, + "test_loss": 5.099743925476075, + "test_acc": 0.01, + "lyapunov": 1.6167474094864047, + "grad_norm": 0.22355495861014546, + "grad_max_sv": 0.1181858729571104, + "grad_min_sv": 4.5336824184788683e-13, + "grad_condition": 88479511676.05211, + "lr": 0.0005522642316338265, + "time_sec": 132.16482520103455 + }, + { + "epoch": 71, + "train_loss": 4.5823839192199705, + "train_acc": 0.01686, + "test_loss": 5.610829375457763, + "test_acc": 0.01, + "lyapunov": 1.640915547795308, + "grad_norm": 0.21533848262037789, + "grad_max_sv": 0.10482716094702482, + "grad_min_sv": 2.352225111137488e-13, + "grad_condition": 88706026678.10991, + "lr": 0.0005418389216661573, + "time_sec": 132.1553201675415 + }, + { + "epoch": 72, + "train_loss": 4.586939775238037, + "train_acc": 0.01644, + "test_loss": 5.6766823959350585, + "test_acc": 0.01, + "lyapunov": 1.6386277257938824, + "grad_norm": 0.21193209754597628, + "grad_max_sv": 0.09875305313616992, + "grad_min_sv": 3.8445128177488697e-13, + "grad_condition": 80890057907.66025, + "lr": 0.0005313952597646563, + "time_sec": 132.1702263355255 + }, + { + "epoch": 73, + "train_loss": 4.565450923156738, + "train_acc": 0.01786, + "test_loss": 5.090951374053955, + "test_acc": 0.01, + "lyapunov": 1.5904299654924046, + "grad_norm": 0.19354037031175023, + "grad_max_sv": 0.10569104105234146, + "grad_min_sv": 4.874789243593624e-13, + "grad_condition": 80729120343.229, + "lr": 0.0005209378268645994, + "time_sec": 132.16868782043457 + }, + { + "epoch": 74, + "train_loss": 4.5504186448669435, + "train_acc": 0.0181, + "test_loss": 5.612113465881348, + "test_acc": 0.01, + "lyapunov": 1.5932684325806015, + "grad_norm": 0.2020325382395806, + "grad_max_sv": 0.1039424953982234, + "grad_min_sv": 1.1594278629870026e-12, + "grad_condition": 62545889757.239746, + "lr": 0.0005104712099416781, + "time_sec": 132.14726519584656 + }, + { + "epoch": 75, + "train_loss": 4.5482193190002445, + "train_acc": 0.01858, + "test_loss": 6.069068190002441, + "test_acc": 0.01, + "lyapunov": 1.604267351767596, + "grad_norm": 0.2266064763923867, + "grad_max_sv": 0.11460568010807037, + "grad_min_sv": 1.7911878418656585e-12, + "grad_condition": 63236708994.86294, + "lr": 0.0004999999999999996, + "time_sec": 132.14808058738708 + }, + { + "epoch": 76, + "train_loss": 4.547421706695556, + "train_acc": 0.01796, + "test_loss": 5.810434713745117, + "test_acc": 0.01, + "lyapunov": 1.6127760651166483, + "grad_norm": 0.21661099340887846, + "grad_max_sv": 0.11015285402536393, + "grad_min_sv": 1.6610576221168998e-12, + "grad_condition": 56473316901.58356, + "lr": 0.0004895287900583212, + "time_sec": 132.38169169425964 + }, + { + "epoch": 77, + "train_loss": 4.5509974664306645, + "train_acc": 0.02, + "test_loss": 5.662685046386719, + "test_acc": 0.01, + "lyapunov": 1.6085883635084341, + "grad_norm": 0.22829542556288998, + "grad_max_sv": 0.11323911305516958, + "grad_min_sv": 1.2826856675589158e-12, + "grad_condition": 59045967769.00034, + "lr": 0.0004790621731353997, + "time_sec": 132.19757294654846 + }, + { + "epoch": 78, + "train_loss": 4.551352957153321, + "train_acc": 0.01882, + "test_loss": 5.566857955932617, + "test_acc": 0.01, + "lyapunov": 1.6337723820410726, + "grad_norm": 0.25602140985448185, + "grad_max_sv": 0.11203370597213506, + "grad_min_sv": 1.3258904637988123e-12, + "grad_condition": 62071250445.38745, + "lr": 0.000468604740235343, + "time_sec": 132.21045851707458 + }, + { + "epoch": 79, + "train_loss": 4.545634266510009, + "train_acc": 0.01956, + "test_loss": 5.292388404846191, + "test_acc": 0.01, + "lyapunov": 1.633863453365043, + "grad_norm": 0.261991339098316, + "grad_max_sv": 0.11294185262013343, + "grad_min_sv": 2.2926638646691538e-12, + "grad_condition": 57437613489.9528, + "lr": 0.00045816107833384175, + "time_sec": 132.16106390953064 + }, + { + "epoch": 80, + "train_loss": 4.544438370513916, + "train_acc": 0.02008, + "test_loss": 5.594520863342285, + "test_acc": 0.01, + "lyapunov": 1.6360818525714338, + "grad_norm": 0.27680249132769946, + "grad_max_sv": 0.12154058534651994, + "grad_min_sv": 4.6932727855827e-12, + "grad_condition": 38848618049.80592, + "lr": 0.0004477357683661729, + "time_sec": 132.17013382911682 + }, + { + "epoch": 81, + "train_loss": 4.539229464416504, + "train_acc": 0.02094, + "test_loss": 5.203748289489746, + "test_acc": 0.01, + "lyapunov": 1.6401681241476933, + "grad_norm": 0.2346300301923333, + "grad_max_sv": 0.11762278378009797, + "grad_min_sv": 4.245260345659918e-12, + "grad_condition": 45140986862.910706, + "lr": 0.00043733338321784746, + "time_sec": 132.1922423839569 + }, + { + "epoch": 82, + "train_loss": 4.511806388244629, + "train_acc": 0.02256, + "test_loss": 5.1750801635742185, + "test_acc": 0.01, + "lyapunov": 1.6131305651896446, + "grad_norm": 0.21894630317091804, + "grad_max_sv": 0.11400092151015997, + "grad_min_sv": 1.204121461777062e-11, + "grad_condition": 37883001192.43938, + "lr": 0.0004269584857187939, + "time_sec": 132.2294306755066 + }, + { + "epoch": 83, + "train_loss": 4.560598617706299, + "train_acc": 0.01922, + "test_loss": 5.039254272460938, + "test_acc": 0.01, + "lyapunov": 1.6179730105583014, + "grad_norm": 0.6818929560069714, + "grad_max_sv": 0.10932031758129597, + "grad_min_sv": 3.5758800721917905e-11, + "grad_condition": 41961243110.78183, + "lr": 0.0004166156266419484, + "time_sec": 132.16398668289185 + }, + { + "epoch": 84, + "train_loss": 4.538027311553955, + "train_acc": 0.02012, + "test_loss": 5.358105621337891, + "test_acc": 0.01, + "lyapunov": 1.630713469841901, + "grad_norm": 0.23515180969917246, + "grad_max_sv": 0.11126796789467334, + "grad_min_sv": 3.733440409242942e-12, + "grad_condition": 42021389131.16902, + "lr": 0.0004063093427071373, + "time_sec": 132.17217254638672 + }, + { + "epoch": 85, + "train_loss": 4.533066810150147, + "train_acc": 0.02142, + "test_loss": 5.210582428741455, + "test_acc": 0.01, + "lyapunov": 1.6099314771954665, + "grad_norm": 0.23743119261123188, + "grad_max_sv": 0.11509178727865219, + "grad_min_sv": 9.24621530124588e-12, + "grad_condition": 33409415784.932446, + "lr": 0.0003960441545911199, + "time_sec": 132.18297863006592 + }, + { + "epoch": 86, + "train_loss": 4.514812325439453, + "train_acc": 0.02338, + "test_loss": 5.010178847503662, + "test_acc": 0.01, + "lyapunov": 1.5926586319418514, + "grad_norm": 0.2162543490750504, + "grad_max_sv": 0.1109484301880002, + "grad_min_sv": 4.5705949216622454e-10, + "grad_condition": 11504727044.022625, + "lr": 0.0003858245649446718, + "time_sec": 132.147221326828 + }, + { + "epoch": 87, + "train_loss": 4.511024246826172, + "train_acc": 0.022, + "test_loss": 5.345004454040527, + "test_acc": 0.01, + "lyapunov": 1.5887958646735267, + "grad_norm": 0.25657197110027863, + "grad_max_sv": 0.1051843574270606, + "grad_min_sv": 1.705161448824656e-10, + "grad_condition": 25039598073.63558, + "lr": 0.00037565505641757235, + "time_sec": 132.14885830879211 + }, + { + "epoch": 88, + "train_loss": 4.505899262237548, + "train_acc": 0.02334, + "test_loss": 4.936904384613037, + "test_acc": 0.01, + "lyapunov": 1.6046001039197684, + "grad_norm": 0.24194115234056338, + "grad_max_sv": 0.11062774620950222, + "grad_min_sv": 8.66749245303117e-11, + "grad_condition": 18998356971.070953, + "lr": 0.00036554008969236695, + "time_sec": 132.13108325004578 + }, + { + "epoch": 89, + "train_loss": 4.509913777923584, + "train_acc": 0.02288, + "test_loss": 4.863644284057617, + "test_acc": 0.01, + "lyapunov": 1.6005188049867636, + "grad_norm": 0.2399799817677917, + "grad_max_sv": 0.10860499612490457, + "grad_min_sv": 6.798252102655834e-11, + "grad_condition": 18908436070.961212, + "lr": 0.0003554841015277638, + "time_sec": 132.194641828537 + }, + { + "epoch": 90, + "train_loss": 4.537508490905762, + "train_acc": 0.02064, + "test_loss": 5.445182901763916, + "test_acc": 0.01, + "lyapunov": 1.5926521418954405, + "grad_norm": 0.1984924919711564, + "grad_max_sv": 0.1050485922023654, + "grad_min_sv": 7.577653377773176e-12, + "grad_condition": 30774293544.0844, + "lr": 0.000345491502812526, + "time_sec": 132.17840719223022 + }, + { + "epoch": 91, + "train_loss": 4.521757569274902, + "train_acc": 0.02238, + "test_loss": 5.262060061645508, + "test_acc": 0.01, + "lyapunov": 1.5892650910350672, + "grad_norm": 0.2847263318092328, + "grad_max_sv": 0.10287641081959009, + "grad_min_sv": 1.91736922530795e-10, + "grad_condition": 18967974102.564293, + "lr": 0.0003355666766307081, + "time_sec": 132.18149828910828 + }, + { + "epoch": 92, + "train_loss": 4.519360184631347, + "train_acc": 0.02082, + "test_loss": 5.320795262908936, + "test_acc": 0.01, + "lyapunov": 1.5871959750914513, + "grad_norm": 0.2370639034610865, + "grad_max_sv": 0.10874731410294772, + "grad_min_sv": 7.319739596956258e-12, + "grad_condition": 27639015872.358166, + "lr": 0.00032571397633909225, + "time_sec": 132.22724723815918 + }, + { + "epoch": 93, + "train_loss": 4.512343827972412, + "train_acc": 0.022, + "test_loss": 5.345669583129883, + "test_acc": 0.01, + "lyapunov": 1.5883484478191952, + "grad_norm": 0.23157908229447258, + "grad_max_sv": 0.10562088992446661, + "grad_min_sv": 1.2009558277386558e-11, + "grad_condition": 16084905305.476273, + "lr": 0.00031593772365766094, + "time_sec": 132.24062776565552 + }, + { + "epoch": 94, + "train_loss": 4.507626133422852, + "train_acc": 0.02282, + "test_loss": 5.232546983337403, + "test_acc": 0.01, + "lyapunov": 1.582219293355332, + "grad_norm": 0.25414870293495084, + "grad_max_sv": 0.10162105709314347, + "grad_min_sv": 1.5387781568668625e-11, + "grad_condition": 19577209942.564514, + "lr": 0.0003062422067739483, + "time_sec": 132.21938920021057 + }, + { + "epoch": 95, + "train_loss": 4.5046430790710446, + "train_acc": 0.02322, + "test_loss": 5.702656979370118, + "test_acc": 0.01, + "lyapunov": 1.5933423502670834, + "grad_norm": 0.22296672954904517, + "grad_max_sv": 0.10369365382939577, + "grad_min_sv": 1.464815680454453e-11, + "grad_condition": 19604050143.141273, + "lr": 0.00029663167846209965, + "time_sec": 132.21640634536743 + }, + { + "epoch": 96, + "train_loss": 4.50480010559082, + "train_acc": 0.02282, + "test_loss": 5.597961514282226, + "test_acc": 0.01, + "lyapunov": 1.583764209771705, + "grad_norm": 0.25490663774480726, + "grad_max_sv": 0.10260288586723618, + "grad_min_sv": 1.5525958737926244e-11, + "grad_condition": 16728424588.234934, + "lr": 0.00028711035421746345, + "time_sec": 132.1660978794098 + }, + { + "epoch": 97, + "train_loss": 4.469037200622559, + "train_acc": 0.02894, + "test_loss": 5.864905759429932, + "test_acc": 0.01, + "lyapunov": 1.5917478577255288, + "grad_norm": 0.23870917284644627, + "grad_max_sv": 0.12171203531324863, + "grad_min_sv": 1.4733043387116664e-09, + "grad_condition": 1570381038.4230928, + "lr": 0.00027768241040753615, + "time_sec": 132.178719997406 + }, + { + "epoch": 98, + "train_loss": 4.470558769683838, + "train_acc": 0.02786, + "test_loss": 6.108024346923828, + "test_acc": 0.01, + "lyapunov": 1.5934783141021533, + "grad_norm": 0.30827407557184827, + "grad_max_sv": 0.12690354958176614, + "grad_min_sv": 1.3345814640474545e-09, + "grad_condition": 2937579113.826585, + "lr": 0.00026835198244006903, + "time_sec": 132.1512405872345 + }, + { + "epoch": 99, + "train_loss": 4.484580178527832, + "train_acc": 0.02542, + "test_loss": 5.846526190185547, + "test_acc": 0.01, + "lyapunov": 1.5788978844347512, + "grad_norm": 0.221869552528174, + "grad_max_sv": 0.11516296844929456, + "grad_min_sv": 6.437623919727277e-10, + "grad_condition": 3127665808.238943, + "lr": 0.0002591231629491421, + "time_sec": 132.13360047340393 + }, + { + "epoch": 100, + "train_loss": 4.483458242340088, + "train_acc": 0.0259, + "test_loss": 5.841338038635254, + "test_acc": 0.01, + "lyapunov": 1.5934071232900595, + "grad_norm": 0.27882300961773687, + "grad_max_sv": 0.11602762639522553, + "grad_min_sv": 7.004058964700434e-10, + "grad_condition": 3782223950.51213, + "lr": 0.0002499999999999997, + "time_sec": 132.2558717727661 + }, + { + "epoch": 101, + "train_loss": 4.499455378265381, + "train_acc": 0.02344, + "test_loss": 5.443247247314453, + "test_acc": 0.01, + "lyapunov": 1.5859141483941042, + "grad_norm": 0.25072615175177326, + "grad_max_sv": 0.11183246672153473, + "grad_min_sv": 1.6060449399156376e-10, + "grad_condition": 6795488555.526062, + "lr": 0.00024098649531343477, + "time_sec": 132.28790807724 + }, + { + "epoch": 102, + "train_loss": 4.49708987487793, + "train_acc": 0.02284, + "test_loss": 5.607777552032471, + "test_acc": 0.01, + "lyapunov": 1.5908644315226914, + "grad_norm": 0.22348474047746483, + "grad_max_sv": 0.11046325713396073, + "grad_min_sv": 3.8719351463923063e-10, + "grad_condition": 6001916881.77612, + "lr": 0.0002320866025105016, + "time_sec": 132.18588161468506 + }, + { + "epoch": 103, + "train_loss": 4.4955732382202145, + "train_acc": 0.0236, + "test_loss": 5.745177990722656, + "test_acc": 0.01, + "lyapunov": 1.5917734240022157, + "grad_norm": 0.2534263836701249, + "grad_max_sv": 0.110052939504385, + "grad_min_sv": 2.750547882733342e-10, + "grad_condition": 9464587786.428852, + "lr": 0.0002233042253783278, + "time_sec": 132.16262555122375 + }, + { + "epoch": 104, + "train_loss": 4.501874127349853, + "train_acc": 0.02266, + "test_loss": 5.61523842163086, + "test_acc": 0.01, + "lyapunov": 1.58528883255961, + "grad_norm": 0.27420737869929585, + "grad_max_sv": 0.10906471610069275, + "grad_min_sv": 2.0978145145694022e-10, + "grad_condition": 9953736672.96781, + "lr": 0.000214643216157784, + "time_sec": 132.20356059074402 + }, + { + "epoch": 105, + "train_loss": 4.527709134521484, + "train_acc": 0.02124, + "test_loss": 5.809187103271484, + "test_acc": 0.01, + "lyapunov": 1.5925516539522449, + "grad_norm": 0.23170044660415676, + "grad_max_sv": 0.1055134791880846, + "grad_min_sv": 7.825866377728172e-11, + "grad_condition": 26017131256.645947, + "lr": 0.00020610737385376332, + "time_sec": 132.20340204238892 + }, + { + "epoch": 106, + "train_loss": 4.538254840545655, + "train_acc": 0.02052, + "test_loss": 5.702211804962158, + "test_acc": 0.01, + "lyapunov": 1.5994793835198482, + "grad_norm": 0.22739631788820852, + "grad_max_sv": 0.10190589521080255, + "grad_min_sv": 2.392879430639463e-12, + "grad_condition": 41858905566.539444, + "lr": 0.00019770044256881242, + "time_sec": 132.2257125377655 + }, + { + "epoch": 107, + "train_loss": 4.537451904602051, + "train_acc": 0.01914, + "test_loss": 5.932393156433106, + "test_acc": 0.01, + "lyapunov": 1.5854461083326803, + "grad_norm": 0.21156136855576158, + "grad_max_sv": 0.09718370195478201, + "grad_min_sv": 2.1334573155528867e-12, + "grad_condition": 44438773786.1716, + "lr": 0.0001894261098608447, + "time_sec": 132.20696210861206 + }, + { + "epoch": 108, + "train_loss": 4.54288639175415, + "train_acc": 0.01946, + "test_loss": 6.020662310791016, + "test_acc": 0.01, + "lyapunov": 1.5982869247646283, + "grad_norm": 0.22336362248783215, + "grad_max_sv": 0.0942000387236476, + "grad_min_sv": 2.070612785490142e-12, + "grad_condition": 38681493255.63291, + "lr": 0.000181288005125655, + "time_sec": 132.15775275230408 + }, + { + "epoch": 109, + "train_loss": 4.539118989257813, + "train_acc": 0.02004, + "test_loss": 5.875737568664551, + "test_acc": 0.01, + "lyapunov": 1.597143233889509, + "grad_norm": 0.24209283453668126, + "grad_max_sv": 0.09231847468599881, + "grad_min_sv": 2.4290148967334254e-12, + "grad_condition": 41122755985.59834, + "lr": 0.0001732896980049473, + "time_sec": 132.2014491558075 + }, + { + "epoch": 110, + "train_loss": 4.533240603179932, + "train_acc": 0.02078, + "test_loss": 6.020731507873535, + "test_acc": 0.01, + "lyapunov": 1.5895807243064237, + "grad_norm": 0.24031990384630442, + "grad_max_sv": 0.09458559956401587, + "grad_min_sv": 4.9697159162748165e-12, + "grad_condition": 34976084384.10825, + "lr": 0.00016543469682057076, + "time_sec": 132.15150785446167 + }, + { + "epoch": 111, + "train_loss": 4.518356960906982, + "train_acc": 0.02294, + "test_loss": 5.969912101745606, + "test_acc": 0.01, + "lyapunov": 1.604492220122491, + "grad_norm": 0.22602265116800407, + "grad_max_sv": 0.09987993091344834, + "grad_min_sv": 2.419991108871221e-10, + "grad_condition": 19549830485.2588, + "lr": 0.00015772644703565552, + "time_sec": 132.23562288284302 + }, + { + "epoch": 112, + "train_loss": 4.52961797088623, + "train_acc": 0.02194, + "test_loss": 5.610896324157715, + "test_acc": 0.01, + "lyapunov": 1.6014201195953448, + "grad_norm": 0.24431543872984524, + "grad_max_sv": 0.09510019868612289, + "grad_min_sv": 1.6583184662959947e-11, + "grad_condition": 24172749617.446175, + "lr": 0.00015016832974331713, + "time_sec": 132.2202250957489 + }, + { + "epoch": 113, + "train_loss": 4.534737938232422, + "train_acc": 0.02108, + "test_loss": 5.882650997924805, + "test_acc": 0.01, + "lyapunov": 1.6089779333690244, + "grad_norm": 0.2408463440419859, + "grad_max_sv": 0.09545416701585055, + "grad_min_sv": 8.265506817575693e-12, + "grad_condition": 26886346060.009724, + "lr": 0.00014276366018359834, + "time_sec": 132.39671301841736 + }, + { + "epoch": 114, + "train_loss": 4.528099235992432, + "train_acc": 0.0216, + "test_loss": 6.349718654632569, + "test_acc": 0.01, + "lyapunov": 1.6125300259846251, + "grad_norm": 0.24308443287212356, + "grad_max_sv": 0.09617761392146348, + "grad_min_sv": 2.4579975111898598e-11, + "grad_condition": 33881398145.36089, + "lr": 0.00013551568628929425, + "time_sec": 132.3225646018982 + }, + { + "epoch": 115, + "train_loss": 4.519340593109131, + "train_acc": 0.02402, + "test_loss": 6.121589573669434, + "test_acc": 0.01, + "lyapunov": 1.6377504332291195, + "grad_norm": 0.2592364007942639, + "grad_max_sv": 0.09955059625208378, + "grad_min_sv": 9.771481077080514e-11, + "grad_condition": 10355098029.396868, + "lr": 0.00012842758726130276, + "time_sec": 132.17340803146362 + }, + { + "epoch": 116, + "train_loss": 4.532410475921631, + "train_acc": 0.02288, + "test_loss": 6.244934426879883, + "test_acc": 0.01, + "lyapunov": 1.666187497660937, + "grad_norm": 0.31169546460365094, + "grad_max_sv": 0.09843376744538546, + "grad_min_sv": 5.1638096920723736e-11, + "grad_condition": 18012362556.947014, + "lr": 0.0001215024721741218, + "time_sec": 132.24165844917297 + }, + { + "epoch": 117, + "train_loss": 4.535684629211426, + "train_acc": 0.0223, + "test_loss": 6.586191843414307, + "test_acc": 0.01, + "lyapunov": 1.6899945476780767, + "grad_norm": 0.3135195405807995, + "grad_max_sv": 0.10071753729134798, + "grad_min_sv": 7.336645736394951e-11, + "grad_condition": 12673080594.516361, + "lr": 0.00011474337861210538, + "time_sec": 132.23825097084045 + }, + { + "epoch": 118, + "train_loss": 4.546351953430176, + "train_acc": 0.02212, + "test_loss": 6.257575799560547, + "test_acc": 0.01, + "lyapunov": 1.7288513323839974, + "grad_norm": 0.41941424039533404, + "grad_max_sv": 0.09607745744287968, + "grad_min_sv": 7.789500681913805e-11, + "grad_condition": 16545952885.282751, + "lr": 0.00010815327133708009, + "time_sec": 132.21766591072083 + }, + { + "epoch": 119, + "train_loss": 4.531073229370117, + "train_acc": 0.02256, + "test_loss": 6.456183740997314, + "test_acc": 0.01, + "lyapunov": 1.6964583756673672, + "grad_norm": 0.25613400920512375, + "grad_max_sv": 0.09485051818192006, + "grad_min_sv": 4.685287637259971e-11, + "grad_condition": 12061244650.910728, + "lr": 0.00010173504098790182, + "time_sec": 132.30614709854126 + }, + { + "epoch": 120, + "train_loss": 4.541061541137696, + "train_acc": 0.0237, + "test_loss": 6.413670517730713, + "test_acc": 0.01, + "lyapunov": 1.739644906709871, + "grad_norm": 0.3693183435156443, + "grad_max_sv": 0.09833505425194744, + "grad_min_sv": 3.894246489996689e-11, + "grad_condition": 17507367358.884224, + "lr": 9.549150281252629e-05, + "time_sec": 132.18320536613464 + }, + { + "epoch": 121, + "train_loss": 4.5607890040588375, + "train_acc": 0.0232, + "test_loss": 6.3454551567077635, + "test_acc": 0.01, + "lyapunov": 1.8264712491608641, + "grad_norm": 0.8551675055665584, + "grad_max_sv": 0.1001248000189662, + "grad_min_sv": 3.8870165434796247e-10, + "grad_condition": 11774673434.16497, + "lr": 8.942539543314794e-05, + "time_sec": 132.19883823394775 + }, + { + "epoch": 122, + "train_loss": 4.561086259918213, + "train_acc": 0.02154, + "test_loss": 5.992345477294922, + "test_acc": 0.01, + "lyapunov": 1.802467906566532, + "grad_norm": 0.35207234081524835, + "grad_max_sv": 0.09587623235711362, + "grad_min_sv": 3.822705043577684e-10, + "grad_condition": 17845122251.05708, + "lr": 8.353937964495024e-05, + "time_sec": 132.44755220413208 + }, + { + "epoch": 123, + "train_loss": 4.573194706115722, + "train_acc": 0.02058, + "test_loss": 5.8545154296875, + "test_acc": 0.01, + "lyapunov": 1.816409704020566, + "grad_norm": 0.3735027051691648, + "grad_max_sv": 0.09373153795404505, + "grad_min_sv": 2.715693798334913e-11, + "grad_condition": 28875711989.57364, + "lr": 7.783603724899243e-05, + "time_sec": 132.26207613945007 + }, + { + "epoch": 124, + "train_loss": 4.572661248168945, + "train_acc": 0.02148, + "test_loss": 5.896555422973633, + "test_acc": 0.01, + "lyapunov": 1.8480512553163806, + "grad_norm": 0.3134804302549242, + "grad_max_sv": 0.09899624399840831, + "grad_min_sv": 1.2754484528129877e-10, + "grad_condition": 31805856694.423676, + "lr": 7.231786991974666e-05, + "time_sec": 132.45608854293823 + }, + { + "epoch": 125, + "train_loss": 4.580600358886719, + "train_acc": 0.02084, + "test_loss": 5.708856204223633, + "test_acc": 0.01, + "lyapunov": 1.8661305547675209, + "grad_norm": 0.5029799512519317, + "grad_max_sv": 0.10123962573707104, + "grad_min_sv": 1.8373754739270858e-11, + "grad_condition": 32052285848.35261, + "lr": 6.698729810778072e-05, + "time_sec": 132.43874192237854 + }, + { + "epoch": 126, + "train_loss": 4.609690670166016, + "train_acc": 0.01856, + "test_loss": 5.770978012084961, + "test_acc": 0.01, + "lyapunov": 1.9074160238665998, + "grad_norm": 1.9260693563122895, + "grad_max_sv": 0.08174233604597703, + "grad_min_sv": 5.527462332474612e-11, + "grad_condition": 24363510202.6125, + "lr": 6.184665997806817e-05, + "time_sec": 132.24991106987 + }, + { + "epoch": 127, + "train_loss": 4.640943519897461, + "train_acc": 0.01876, + "test_loss": 5.077701470947265, + "test_acc": 0.01, + "lyapunov": 1.9559716467967119, + "grad_norm": 1.0457106969740626, + "grad_max_sv": 0.09646339530616928, + "grad_min_sv": 3.4253201033677874e-10, + "grad_condition": 17416671105.52501, + "lr": 5.6898210384392595e-05, + "time_sec": 132.16351675987244 + }, + { + "epoch": 128, + "train_loss": 4.598363189086914, + "train_acc": 0.02078, + "test_loss": 4.975116259765625, + "test_acc": 0.01, + "lyapunov": 1.8845891751291808, + "grad_norm": 0.8220120863964331, + "grad_max_sv": 0.08199532476752439, + "grad_min_sv": 8.623996275121066e-10, + "grad_condition": 9056773581.269657, + "lr": 5.214411988029363e-05, + "time_sec": 132.3097848892212 + }, + { + "epoch": 129, + "train_loss": 4.541455926513672, + "train_acc": 0.0247, + "test_loss": 5.7549523315429685, + "test_acc": 0.01, + "lyapunov": 1.8803200340636856, + "grad_norm": 0.2569299215166405, + "grad_max_sv": 0.10282012969255447, + "grad_min_sv": 1.0507987653726909e-09, + "grad_condition": 9769165472.089832, + "lr": 4.7586473766990294e-05, + "time_sec": 132.27577376365662 + }, + { + "epoch": 130, + "train_loss": 4.584647702636719, + "train_acc": 0.02022, + "test_loss": 5.332480350494385, + "test_acc": 0.01, + "lyapunov": 1.901323552326778, + "grad_norm": 0.3548472872087693, + "grad_max_sv": 0.1086544806137681, + "grad_min_sv": 9.814503552650124e-11, + "grad_condition": 22478674485.849125, + "lr": 4.32272711786996e-05, + "time_sec": 132.3002369403839 + }, + { + "epoch": 131, + "train_loss": 4.581521871185303, + "train_acc": 0.02126, + "test_loss": 5.6270052955627445, + "test_acc": 0.01, + "lyapunov": 1.9170096432766341, + "grad_norm": 0.21502212949334182, + "grad_max_sv": 0.10107578802853823, + "grad_min_sv": 4.709314182512565e-12, + "grad_condition": 28702045833.35929, + "lr": 3.906842420574966e-05, + "time_sec": 132.58341455459595 + }, + { + "epoch": 132, + "train_loss": 4.603923379821778, + "train_acc": 0.02086, + "test_loss": 5.753756982421875, + "test_acc": 0.01, + "lyapunov": 2.0209065084262274, + "grad_norm": 0.24096511248455096, + "grad_max_sv": 0.09993877708911895, + "grad_min_sv": 7.1246287590231335e-12, + "grad_condition": 29623139032.43003, + "lr": 3.5111757055874305e-05, + "time_sec": 132.31662130355835 + }, + { + "epoch": 133, + "train_loss": 4.622827220458984, + "train_acc": 0.02166, + "test_loss": 5.880264813232422, + "test_acc": 0.01, + "lyapunov": 2.0902158723157993, + "grad_norm": 0.37428368144939567, + "grad_max_sv": 0.09831619988790408, + "grad_min_sv": 4.434330920707163e-12, + "grad_condition": 32791799106.98709, + "lr": 3.1359005254054254e-05, + "time_sec": 132.16932916641235 + }, + { + "epoch": 134, + "train_loss": 4.6172026605224605, + "train_acc": 0.02178, + "test_loss": 5.7553314712524415, + "test_acc": 0.01, + "lyapunov": 2.0609848694423274, + "grad_norm": 1.1257846952613533, + "grad_max_sv": 0.09743457045406104, + "grad_min_sv": 3.0741354169823606e-11, + "grad_condition": 13593193192.516785, + "lr": 2.7811814881259484e-05, + "time_sec": 132.19739365577698 + }, + { + "epoch": 135, + "train_loss": 4.635151025238037, + "train_acc": 0.021, + "test_loss": 5.5024827880859375, + "test_acc": 0.01, + "lyapunov": 1.9769353912309613, + "grad_norm": 2.02772923429031, + "grad_max_sv": 0.07839736734087524, + "grad_min_sv": 3.7352801946025573e-10, + "grad_condition": 6440628915.387049, + "lr": 2.4471741852423218e-05, + "time_sec": 132.1603286266327 + }, + { + "epoch": 136, + "train_loss": 4.68249575958252, + "train_acc": 0.0219, + "test_loss": 5.25179546508789, + "test_acc": 0.01, + "lyapunov": 2.0190668633526854, + "grad_norm": 1.6997169038698898, + "grad_max_sv": 0.08753072819376939, + "grad_min_sv": 1.2251687187667402e-09, + "grad_condition": 432467715.9748623, + "lr": 2.1340251233966362e-05, + "time_sec": 132.14581847190857 + }, + { + "epoch": 137, + "train_loss": 4.631195866546631, + "train_acc": 0.02544, + "test_loss": 5.392911587524414, + "test_acc": 0.01, + "lyapunov": 1.9715384879075657, + "grad_norm": 0.7892430119447663, + "grad_max_sv": 0.10768030200561043, + "grad_min_sv": 1.7614047353271475e-09, + "grad_condition": 109282059.02686039, + "lr": 1.8418716601170932e-05, + "time_sec": 132.1871361732483 + }, + { + "epoch": 138, + "train_loss": 4.587350132141113, + "train_acc": 0.02568, + "test_loss": 5.4693435791015625, + "test_acc": 0.01, + "lyapunov": 1.991891508821941, + "grad_norm": 0.7469521916290953, + "grad_max_sv": 0.11756768673658372, + "grad_min_sv": 1.9356462725657374e-09, + "grad_condition": 1022350892.4888865, + "lr": 1.570841943568445e-05, + "time_sec": 132.11142563819885 + }, + { + "epoch": 139, + "train_loss": 4.577352908630371, + "train_acc": 0.02708, + "test_loss": 5.601054759979248, + "test_acc": 0.01, + "lyapunov": 1.9843372856564534, + "grad_norm": 0.8085739729926078, + "grad_max_sv": 0.12083102430333384, + "grad_min_sv": 1.96632062201673e-09, + "grad_condition": 76824680.74466217, + "lr": 1.3210548563419845e-05, + "time_sec": 132.16676545143127 + }, + { + "epoch": 140, + "train_loss": 4.552192511444092, + "train_acc": 0.02732, + "test_loss": 5.383674153137207, + "test_acc": 0.01, + "lyapunov": 1.9721098985818342, + "grad_norm": 0.6793156974859339, + "grad_max_sv": 0.12086031896079703, + "grad_min_sv": 1.9605524922258888e-09, + "grad_condition": 123266932.04338643, + "lr": 1.0926199633097203e-05, + "time_sec": 132.13540196418762 + }, + { + "epoch": 141, + "train_loss": 4.551412692871094, + "train_acc": 0.02748, + "test_loss": 5.406689046478271, + "test_acc": 0.01, + "lyapunov": 1.9343544891118394, + "grad_norm": 0.6725109238271549, + "grad_max_sv": 0.11751907898869832, + "grad_min_sv": 1.9861858326650564e-09, + "grad_condition": 74216850.21639355, + "lr": 8.856374635655688e-06, + "time_sec": 132.12982821464539 + }, + { + "epoch": 142, + "train_loss": 4.727527248229981, + "train_acc": 0.01824, + "test_loss": 5.770706779479981, + "test_acc": 0.01, + "lyapunov": 2.350969208475879, + "grad_norm": 2.282933232543126, + "grad_max_sv": 0.11755687685454178, + "grad_min_sv": 1.4490837774683643e-09, + "grad_condition": 631119004.4434631, + "lr": 7.001981464747503e-06, + "time_sec": 132.14570784568787 + }, + { + "epoch": 143, + "train_loss": 4.774733398284912, + "train_acc": 0.01748, + "test_loss": 5.42293524093628, + "test_acc": 0.01, + "lyapunov": 2.5337743533541786, + "grad_norm": 3.084857123459247, + "grad_max_sv": 0.08506426704443584, + "grad_min_sv": 1.0878406072247764e-09, + "grad_condition": 95670235.35140035, + "lr": 5.3638335185058295e-06, + "time_sec": 132.17597699165344 + }, + { + "epoch": 144, + "train_loss": 4.801961855010986, + "train_acc": 0.01764, + "test_loss": 5.572767419433593, + "test_acc": 0.01, + "lyapunov": 2.5992656010191153, + "grad_norm": 2.2910220858954014, + "grad_max_sv": 0.14899966653709953, + "grad_min_sv": 2.0148015595278023e-09, + "grad_condition": 176782893.45203692, + "lr": 3.942649342761114e-06, + "time_sec": 132.12091755867004 + }, + { + "epoch": 145, + "train_loss": 4.850462348022461, + "train_acc": 0.02024, + "test_loss": 5.516320917510987, + "test_acc": 0.01, + "lyapunov": 2.7130372066936834, + "grad_norm": 1.0265954725835216, + "grad_max_sv": 0.21464332040486625, + "grad_min_sv": 3.1526066665652634e-09, + "grad_condition": 97161987.48706797, + "lr": 2.7390523158633524e-06, + "time_sec": 132.0690953731537 + }, + { + "epoch": 146, + "train_loss": 4.856118622894287, + "train_acc": 0.02, + "test_loss": 5.461014266967774, + "test_acc": 0.01, + "lyapunov": 2.718469413040239, + "grad_norm": 1.0099887200055417, + "grad_max_sv": 0.15561392254603562, + "grad_min_sv": 2.2754747437366604e-09, + "grad_condition": 1019144627.7729056, + "lr": 1.7535703752478133e-06, + "time_sec": 132.11823773384094 + }, + { + "epoch": 147, + "train_loss": 4.924606959075928, + "train_acc": 0.01686, + "test_loss": 20.649002047729493, + "test_acc": 0.01, + "lyapunov": 2.6374005685986766, + "grad_norm": 3.1423913582004523, + "grad_max_sv": 0.21941849166760222, + "grad_min_sv": 3.0307538921017438e-09, + "grad_condition": 120403007.5867976, + "lr": 9.866357858642196e-07, + "time_sec": 132.07725739479065 + }, + { + "epoch": 148, + "train_loss": 4.767027478179932, + "train_acc": 0.01794, + "test_loss": 5.494908865356446, + "test_acc": 0.01, + "lyapunov": 2.1720430088774934, + "grad_norm": 3.0001678190775194, + "grad_max_sv": 0.06730101421089785, + "grad_min_sv": 5.6080486708198344e-11, + "grad_condition": 32628105419.335045, + "lr": 4.38584950570808e-07, + "time_sec": 132.16628646850586 + }, + { + "epoch": 149, + "train_loss": 4.725253110198975, + "train_acc": 0.01852, + "test_loss": 5.4529930709838865, + "test_acc": 0.01, + "lyapunov": 2.1247258430246805, + "grad_norm": 2.425421227254264, + "grad_max_sv": 0.06302208096294634, + "grad_min_sv": 8.06056723307697e-12, + "grad_condition": 24980400399.38557, + "lr": 1.096582625772501e-07, + "time_sec": 132.17798447608948 + }, + { + "epoch": 150, + "train_loss": 4.724624121398926, + "train_acc": 0.01896, + "test_loss": 5.454324950408935, + "test_acc": 0.01, + "lyapunov": 2.1117066599219045, + "grad_norm": 2.2782652512729027, + "grad_max_sv": 0.06824387344677234, + "grad_min_sv": 1.3984562009526476e-11, + "grad_condition": 35779591216.93815, + "lr": 0.0, + "time_sec": 132.24787974357605 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 5.052905302276612, + "train_acc": 0.01584, + "test_loss": 4.867012271118164, + "test_acc": 0.0108, + "lyapunov": 2.5116785645789808, + "grad_norm": 5.121741212106656, + "grad_max_sv": 4.439184683561325, + "grad_min_sv": 8.58994061270213e-08, + "grad_condition": 81112713.35007669, + "lr": 0.0009998903417374227, + "time_sec": 177.38097023963928 + }, + { + "epoch": 2, + "train_loss": 4.7834703578186035, + "train_acc": 0.0185, + "test_loss": 4.856568830871582, + "test_acc": 0.0105, + "lyapunov": 2.04087689069226, + "grad_norm": 3.485253038009916, + "grad_max_sv": 2.8998831868171693, + "grad_min_sv": 5.773870767437905e-08, + "grad_condition": 487880276.00022805, + "lr": 0.0009995614150494292, + "time_sec": 177.40509605407715 + }, + { + "epoch": 3, + "train_loss": 4.663032297821045, + "train_acc": 0.01814, + "test_loss": 4.829788903808594, + "test_acc": 0.01, + "lyapunov": 1.8697960974310366, + "grad_norm": 2.5433134222817766, + "grad_max_sv": 1.7969021894054094, + "grad_min_sv": 3.7302616086586385e-08, + "grad_condition": 424272904.7057018, + "lr": 0.0009990133642141358, + "time_sec": 177.55998063087463 + }, + { + "epoch": 4, + "train_loss": 4.580566212463379, + "train_acc": 0.01816, + "test_loss": 5.0227375442504885, + "test_acc": 0.01, + "lyapunov": 1.7420489681346336, + "grad_norm": 1.5123120559078784, + "grad_max_sv": 1.0997331857681274, + "grad_min_sv": 2.3435378404546015e-08, + "grad_condition": 50550380.27519056, + "lr": 0.0009982464296247522, + "time_sec": 177.36285305023193 + }, + { + "epoch": 5, + "train_loss": 4.571687319335937, + "train_acc": 0.0169, + "test_loss": 4.605651480102539, + "test_acc": 0.01, + "lyapunov": 1.7220315366144985, + "grad_norm": 1.03184611340308, + "grad_max_sv": 0.7467024937272072, + "grad_min_sv": 9.665682879938559e-09, + "grad_condition": 55185094270.727005, + "lr": 0.0009972609476841367, + "time_sec": 177.37269806861877 + }, + { + "epoch": 6, + "train_loss": 4.555875413513184, + "train_acc": 0.01516, + "test_loss": 4.674408260345459, + "test_acc": 0.01, + "lyapunov": 1.7398752916194593, + "grad_norm": 0.9957876060665515, + "grad_max_sv": 0.5100040049292147, + "grad_min_sv": 2.519896859816943e-10, + "grad_condition": 106528792765.2457, + "lr": 0.000996057350657239, + "time_sec": 177.46758604049683 + }, + { + "epoch": 7, + "train_loss": 4.543562595672608, + "train_acc": 0.01678, + "test_loss": 4.860989706420899, + "test_acc": 0.01, + "lyapunov": 1.7311897963818992, + "grad_norm": 0.6570743063224779, + "grad_max_sv": 0.5500264666974545, + "grad_min_sv": 1.8619091907383225e-09, + "grad_condition": 101307067487.53836, + "lr": 0.000994636166481494, + "time_sec": 177.4092240333557 + }, + { + "epoch": 8, + "train_loss": 4.546422679748535, + "train_acc": 0.01748, + "test_loss": 4.704587471008301, + "test_acc": 0.01, + "lyapunov": 1.7199046867887686, + "grad_norm": 0.6503196899352705, + "grad_max_sv": 0.4841625154018402, + "grad_min_sv": 1.3860141552013199e-09, + "grad_condition": 92427076016.0824, + "lr": 0.0009929980185352525, + "time_sec": 177.34343218803406 + }, + { + "epoch": 9, + "train_loss": 4.555562373046875, + "train_acc": 0.01632, + "test_loss": 4.984462910461426, + "test_acc": 0.01, + "lyapunov": 1.7168824087323435, + "grad_norm": 0.4710924143848028, + "grad_max_sv": 0.3569773003458977, + "grad_min_sv": 2.9924371274558933e-12, + "grad_condition": 163638150611.22946, + "lr": 0.0009911436253643444, + "time_sec": 177.2937033176422 + }, + { + "epoch": 10, + "train_loss": 4.572519063873291, + "train_acc": 0.01446, + "test_loss": 4.622131011962891, + "test_acc": 0.01, + "lyapunov": 1.6881294174267507, + "grad_norm": 0.5058537650400963, + "grad_max_sv": 0.36440472304821014, + "grad_min_sv": 6.516127066976764e-13, + "grad_condition": 259926216911.04242, + "lr": 0.0009890738003669028, + "time_sec": 177.31165838241577 + }, + { + "epoch": 11, + "train_loss": 4.565913163909912, + "train_acc": 0.01558, + "test_loss": 5.445963431549072, + "test_acc": 0.01, + "lyapunov": 1.6539141406183657, + "grad_norm": 0.48047604578041114, + "grad_max_sv": 0.3803807333111763, + "grad_min_sv": 9.42464814059806e-13, + "grad_condition": 226641538861.88174, + "lr": 0.00098678945143658, + "time_sec": 177.28680086135864 + }, + { + "epoch": 12, + "train_loss": 4.585704666290283, + "train_acc": 0.01426, + "test_loss": 5.591514777374267, + "test_acc": 0.01, + "lyapunov": 1.6391262849578467, + "grad_norm": 0.3984247324953335, + "grad_max_sv": 0.32813584208488467, + "grad_min_sv": 9.868289842027034e-13, + "grad_condition": 205156435878.04105, + "lr": 0.0009842915805643154, + "time_sec": 177.34117722511292 + }, + { + "epoch": 13, + "train_loss": 4.604436149597168, + "train_acc": 0.01222, + "test_loss": 4.690793671417237, + "test_acc": 0.01, + "lyapunov": 1.641747108810698, + "grad_norm": 0.3654356558343784, + "grad_max_sv": 0.2650721728801727, + "grad_min_sv": 2.5128712845214346e-14, + "grad_condition": 259015002047.89975, + "lr": 0.000981581283398829, + "time_sec": 177.3893666267395 + }, + { + "epoch": 14, + "train_loss": 4.607583849945068, + "train_acc": 0.01194, + "test_loss": 4.637583544921875, + "test_acc": 0.01, + "lyapunov": 1.647905475953046, + "grad_norm": 0.3152206467371112, + "grad_max_sv": 0.24337820373475552, + "grad_min_sv": 2.2884600952186276e-19, + "grad_condition": 243378149152.73965, + "lr": 0.0009786597487660333, + "time_sec": 177.42928194999695 + }, + { + "epoch": 15, + "train_loss": 4.609895180664062, + "train_acc": 0.01204, + "test_loss": 4.618253812408447, + "test_acc": 0.01, + "lyapunov": 1.631026401239283, + "grad_norm": 0.2910629294744733, + "grad_max_sv": 0.25453653037548063, + "grad_min_sv": 1.096334686408586e-14, + "grad_condition": 251632031244.05, + "lr": 0.0009755282581475766, + "time_sec": 177.26571369171143 + }, + { + "epoch": 16, + "train_loss": 4.620552892456055, + "train_acc": 0.01092, + "test_loss": 4.829088508605957, + "test_acc": 0.01, + "lyapunov": 1.6514442287137747, + "grad_norm": 0.32315656842976964, + "grad_max_sv": 0.2540007773786783, + "grad_min_sv": 2.6148553957350966e-15, + "grad_condition": 253349213677.79898, + "lr": 0.0009721881851187403, + "time_sec": 177.23212313652039 + }, + { + "epoch": 17, + "train_loss": 4.645780512695312, + "train_acc": 0.01148, + "test_loss": 5.213332609558106, + "test_acc": 0.0118, + "lyapunov": 1.7068933586940132, + "grad_norm": 0.4780888546414525, + "grad_max_sv": 0.33272466212511065, + "grad_min_sv": 1.1442340742877327e-13, + "grad_condition": 310520393785.63025, + "lr": 0.0009686409947459456, + "time_sec": 177.3003396987915 + }, + { + "epoch": 18, + "train_loss": 4.643788212127686, + "train_acc": 0.01072, + "test_loss": 4.7405077087402345, + "test_acc": 0.01, + "lyapunov": 1.700578610305591, + "grad_norm": 0.4623759718719876, + "grad_max_sv": 0.36730299033224584, + "grad_min_sv": 3.818205128193156e-15, + "grad_condition": 365867778353.78564, + "lr": 0.0009648882429441254, + "time_sec": 177.37098169326782 + }, + { + "epoch": 19, + "train_loss": 4.6578716897583, + "train_acc": 0.0106, + "test_loss": 5.001485794830322, + "test_acc": 0.01, + "lyapunov": 1.7619636241737229, + "grad_norm": 0.5961977275221398, + "grad_max_sv": 0.3942902203649282, + "grad_min_sv": 2.946577326860146e-13, + "grad_condition": 343308843771.1844, + "lr": 0.00096093157579425, + "time_sec": 177.48300218582153 + }, + { + "epoch": 20, + "train_loss": 4.671879530639648, + "train_acc": 0.00988, + "test_loss": 4.9071829193115235, + "test_acc": 0.01, + "lyapunov": 1.8025801248867492, + "grad_norm": 0.5059310784067265, + "grad_max_sv": 0.3557112220674753, + "grad_min_sv": 1.5333297747627812e-13, + "grad_condition": 328969482461.7643, + "lr": 0.0009567727288213001, + "time_sec": 177.32300353050232 + }, + { + "epoch": 21, + "train_loss": 4.653441105194092, + "train_acc": 0.0101, + "test_loss": 5.037871252441406, + "test_acc": 0.01, + "lyapunov": 1.7085216252700142, + "grad_norm": 0.3698981456336605, + "grad_max_sv": 0.32922359369695187, + "grad_min_sv": 2.0854029706572434e-14, + "grad_condition": 323091955093.61206, + "lr": 0.0009524135262330095, + "time_sec": 177.3196620941162 + }, + { + "epoch": 22, + "train_loss": 4.632678106536865, + "train_acc": 0.01074, + "test_loss": 5.238784426116943, + "test_acc": 0.01, + "lyapunov": 1.6952984226329246, + "grad_norm": 0.4241090659984796, + "grad_max_sv": 0.386181453615427, + "grad_min_sv": 2.802362135740985e-14, + "grad_condition": 377561785396.401, + "lr": 0.0009478558801197061, + "time_sec": 177.29510116577148 + }, + { + "epoch": 23, + "train_loss": 4.638225617523194, + "train_acc": 0.01138, + "test_loss": 5.275448854064941, + "test_acc": 0.01, + "lyapunov": 1.6717191449821454, + "grad_norm": 0.4690453217532838, + "grad_max_sv": 0.36180934831500056, + "grad_min_sv": 7.689419929357006e-14, + "grad_condition": 343504771054.1229, + "lr": 0.000943101789615607, + "time_sec": 177.27985095977783 + }, + { + "epoch": 24, + "train_loss": 4.645476407775879, + "train_acc": 0.01184, + "test_loss": 5.105841419219971, + "test_acc": 0.01, + "lyapunov": 1.6884696520198033, + "grad_norm": 0.46211885946676406, + "grad_max_sv": 0.41755540743470193, + "grad_min_sv": 3.2064806913220934e-13, + "grad_condition": 342942332027.1542, + "lr": 0.0009381533400219313, + "time_sec": 177.25587034225464 + }, + { + "epoch": 25, + "train_loss": 4.6320624351501465, + "train_acc": 0.0119, + "test_loss": 6.030343013000488, + "test_acc": 0.01, + "lyapunov": 1.707195217042323, + "grad_norm": 0.5021589283462617, + "grad_max_sv": 0.39102165041840636, + "grad_min_sv": 5.243264004713223e-13, + "grad_condition": 307511385553.97986, + "lr": 0.0009330127018922189, + "time_sec": 177.37623739242554 + }, + { + "epoch": 26, + "train_loss": 4.612996809234619, + "train_acc": 0.0124, + "test_loss": 4.7069967758178715, + "test_acc": 0.01, + "lyapunov": 1.6614662732004815, + "grad_norm": 0.41182683188165653, + "grad_max_sv": 0.36811394318938256, + "grad_min_sv": 1.8671300799803038e-13, + "grad_condition": 326597103772.6738, + "lr": 0.000927682130080253, + "time_sec": 177.34338855743408 + }, + { + "epoch": 27, + "train_loss": 4.615120216217041, + "train_acc": 0.01294, + "test_loss": 5.169810830688476, + "test_acc": 0.01, + "lyapunov": 1.6869621197585865, + "grad_norm": 0.48352542649856634, + "grad_max_sv": 0.40701944530010226, + "grad_min_sv": 2.212590997783025e-13, + "grad_condition": 351263915868.759, + "lr": 0.0009221639627510072, + "time_sec": 177.37520146369934 + }, + { + "epoch": 28, + "train_loss": 4.618173647613525, + "train_acc": 0.0121, + "test_loss": 4.701211013793945, + "test_acc": 0.01, + "lyapunov": 1.6625224543959283, + "grad_norm": 0.49633059160738635, + "grad_max_sv": 0.42104807291179897, + "grad_min_sv": 8.098768546668247e-14, + "grad_condition": 390777126515.4154, + "lr": 0.0009164606203550494, + "time_sec": 177.30147242546082 + }, + { + "epoch": 29, + "train_loss": 4.620836652526855, + "train_acc": 0.01168, + "test_loss": 5.855577803039551, + "test_acc": 0.01, + "lyapunov": 1.6738867168231388, + "grad_norm": 0.46837018531534874, + "grad_max_sv": 0.41829773411154747, + "grad_min_sv": 6.839261746330108e-14, + "grad_condition": 396621981755.1995, + "lr": 0.0009105746045668516, + "time_sec": 177.59404516220093 + }, + { + "epoch": 30, + "train_loss": 4.620147025604248, + "train_acc": 0.01212, + "test_loss": 5.105264408111572, + "test_acc": 0.0024, + "lyapunov": 1.6637281100158496, + "grad_norm": 0.5269676291306111, + "grad_max_sv": 0.4443404793739319, + "grad_min_sv": 4.246975380253858e-14, + "grad_condition": 429585177175.7853, + "lr": 0.0009045084971874733, + "time_sec": 177.3182647228241 + }, + { + "epoch": 31, + "train_loss": 4.6263528985595705, + "train_acc": 0.01214, + "test_loss": 4.881978817749023, + "test_acc": 0.01, + "lyapunov": 1.679152080774917, + "grad_norm": 0.4813838001178168, + "grad_max_sv": 0.44175935424864293, + "grad_min_sv": 7.640593233486203e-14, + "grad_condition": 412963565609.7972, + "lr": 0.0008982649590120977, + "time_sec": 177.52869391441345 + }, + { + "epoch": 32, + "train_loss": 4.64666208404541, + "train_acc": 0.01024, + "test_loss": 4.607140179443359, + "test_acc": 0.01, + "lyapunov": 1.6733192260308034, + "grad_norm": 0.9644658562133654, + "grad_max_sv": 0.32155169621109964, + "grad_min_sv": 4.501243792038921e-14, + "grad_condition": 307022698703.9159, + "lr": 0.0008918467286629196, + "time_sec": 177.55723929405212 + }, + { + "epoch": 33, + "train_loss": 4.629158392181396, + "train_acc": 0.01256, + "test_loss": 4.610281867980957, + "test_acc": 0.01, + "lyapunov": 1.7062030826383234, + "grad_norm": 0.8603320661340712, + "grad_max_sv": 0.3315905283205211, + "grad_min_sv": 1.30026839163971e-13, + "grad_condition": 311972159847.4972, + "lr": 0.0008852566213878943, + "time_sec": 177.52309370040894 + }, + { + "epoch": 34, + "train_loss": 4.61046769607544, + "train_acc": 0.01252, + "test_loss": 4.61788650970459, + "test_acc": 0.01, + "lyapunov": 1.6976071282116043, + "grad_norm": 0.49261012177272534, + "grad_max_sv": 0.3965699575841427, + "grad_min_sv": 1.5454696301012257e-13, + "grad_condition": 361671513434.2426, + "lr": 0.000878497527825878, + "time_sec": 177.35865092277527 + }, + { + "epoch": 35, + "train_loss": 4.610115225982666, + "train_acc": 0.0133, + "test_loss": 4.610134786224365, + "test_acc": 0.01, + "lyapunov": 1.7059512098731897, + "grad_norm": 0.6359621148942639, + "grad_max_sv": 0.38861413495615127, + "grad_min_sv": 4.932618749060156e-13, + "grad_condition": 303490840826.2363, + "lr": 0.000871572412738697, + "time_sec": 177.262850522995 + }, + { + "epoch": 36, + "train_loss": 4.599939749145507, + "train_acc": 0.01366, + "test_loss": 4.967366139221191, + "test_acc": 0.01, + "lyapunov": 1.6910303544510357, + "grad_norm": 0.48781695526823965, + "grad_max_sv": 0.3771605670452118, + "grad_min_sv": 1.087613697669073e-12, + "grad_condition": 257003832809.76837, + "lr": 0.0008644843137107055, + "time_sec": 177.29217314720154 + }, + { + "epoch": 37, + "train_loss": 4.5619960546875, + "train_acc": 0.01694, + "test_loss": 4.731475791931152, + "test_acc": 0.01, + "lyapunov": 1.6942788399089024, + "grad_norm": 0.5025968244527356, + "grad_max_sv": 0.3710522945970297, + "grad_min_sv": 1.7366462838151458e-12, + "grad_condition": 182613054683.41757, + "lr": 0.0008572363398164014, + "time_sec": 177.32313704490662 + }, + { + "epoch": 38, + "train_loss": 4.565163485412597, + "train_acc": 0.01702, + "test_loss": 4.821879299926758, + "test_acc": 0.01, + "lyapunov": 1.7136198645052703, + "grad_norm": 0.3647367948752072, + "grad_max_sv": 0.2595147430896759, + "grad_min_sv": 8.982830963644869e-13, + "grad_condition": 165264606800.54236, + "lr": 0.0008498316702566826, + "time_sec": 177.30079579353333 + }, + { + "epoch": 39, + "train_loss": 4.564778382873535, + "train_acc": 0.01674, + "test_loss": 4.7682116500854494, + "test_acc": 0.01, + "lyapunov": 1.717852655579062, + "grad_norm": 0.3050778193964112, + "grad_max_sv": 0.23688307516276835, + "grad_min_sv": 7.061831886877416e-13, + "grad_condition": 158702297955.0819, + "lr": 0.0008422735529643442, + "time_sec": 177.48431873321533 + }, + { + "epoch": 40, + "train_loss": 4.5591833352661135, + "train_acc": 0.0181, + "test_loss": 4.824417631530761, + "test_acc": 0.01, + "lyapunov": 1.7331721334506178, + "grad_norm": 0.3159273980899205, + "grad_max_sv": 0.2037038005888462, + "grad_min_sv": 9.425467893049303e-13, + "grad_condition": 137011838971.33943, + "lr": 0.0008345653031794289, + "time_sec": 177.31830286979675 + }, + { + "epoch": 41, + "train_loss": 4.578043832092285, + "train_acc": 0.01756, + "test_loss": 4.636139833068848, + "test_acc": 0.01, + "lyapunov": 1.8264592937801196, + "grad_norm": 0.3694732916545973, + "grad_max_sv": 0.18727784380316734, + "grad_min_sv": 5.982392141838314e-13, + "grad_condition": 126511514412.27226, + "lr": 0.0008267103019950526, + "time_sec": 177.335711479187 + }, + { + "epoch": 42, + "train_loss": 4.673806926269531, + "train_acc": 0.01194, + "test_loss": 4.6080057914733885, + "test_acc": 0.01, + "lyapunov": 1.9006618404632334, + "grad_norm": 1.9332134687963871, + "grad_max_sv": 0.11263461007879413, + "grad_min_sv": 3.077567965127664e-13, + "grad_condition": 84300063979.57101, + "lr": 0.0008187119948743447, + "time_sec": 177.32483506202698 + }, + { + "epoch": 43, + "train_loss": 4.688161468811035, + "train_acc": 0.01068, + "test_loss": 4.629961785125732, + "test_acc": 0.01, + "lyapunov": 1.7131454627532179, + "grad_norm": 0.6010997717026842, + "grad_max_sv": 0.29899735348299145, + "grad_min_sv": 2.479182783007377e-09, + "grad_condition": 66211640983.312706, + "lr": 0.000810573890139155, + "time_sec": 177.3025574684143 + }, + { + "epoch": 44, + "train_loss": 4.646988244628906, + "train_acc": 0.0095, + "test_loss": 4.6228884521484375, + "test_acc": 0.01, + "lyapunov": 1.5909017861041876, + "grad_norm": 0.3503759029299944, + "grad_max_sv": 0.2046256795525551, + "grad_min_sv": 3.5303733441678653e-14, + "grad_condition": 197873606364.90146, + "lr": 0.0008022995574311873, + "time_sec": 177.30037641525269 + }, + { + "epoch": 45, + "train_loss": 4.643654596862793, + "train_acc": 0.00948, + "test_loss": 4.658484869384766, + "test_acc": 0.01, + "lyapunov": 1.5862659612275145, + "grad_norm": 0.2656233273924739, + "grad_max_sv": 0.17473686374723912, + "grad_min_sv": 1.813760877293352e-16, + "grad_condition": 174705104463.56973, + "lr": 0.0007938926261462363, + "time_sec": 177.3814389705658 + }, + { + "epoch": 46, + "train_loss": 4.64409400894165, + "train_acc": 0.0089, + "test_loss": 4.812335470581055, + "test_acc": 0.01, + "lyapunov": 1.590341107619693, + "grad_norm": 0.2648745471846797, + "grad_max_sv": 0.16318325139582157, + "grad_min_sv": 9.479088537998935e-17, + "grad_condition": 163165251374.67862, + "lr": 0.0007853567838422158, + "time_sec": 177.3781590461731 + }, + { + "epoch": 47, + "train_loss": 4.643036758270264, + "train_acc": 0.00928, + "test_loss": 4.609914025878906, + "test_acc": 0.01, + "lyapunov": 1.5894581573393645, + "grad_norm": 0.2691116464860412, + "grad_max_sv": 0.15965580381453037, + "grad_min_sv": 1.0509738482436128e-46, + "grad_condition": 159655803814.53036, + "lr": 0.0007766957746216719, + "time_sec": 177.31791877746582 + }, + { + "epoch": 48, + "train_loss": 4.642327072753906, + "train_acc": 0.00992, + "test_loss": 4.8127995941162105, + "test_acc": 0.01, + "lyapunov": 1.5860872100991057, + "grad_norm": 0.23492399170085265, + "grad_max_sv": 0.1611787799745798, + "grad_min_sv": 6.216856363016735e-39, + "grad_condition": 161178779974.57983, + "lr": 0.0007679133974894982, + "time_sec": 177.36284637451172 + }, + { + "epoch": 49, + "train_loss": 4.642729123077393, + "train_acc": 0.00984, + "test_loss": 4.621463303375244, + "test_acc": 0.01, + "lyapunov": 1.591500211859603, + "grad_norm": 0.21793856766380534, + "grad_max_sv": 0.15185034908354283, + "grad_min_sv": 2.264801692824062e-26, + "grad_condition": 151850349083.53925, + "lr": 0.000759013504686565, + "time_sec": 177.32554411888123 + }, + { + "epoch": 50, + "train_loss": 4.643996462554932, + "train_acc": 0.0102, + "test_loss": 4.609245301818848, + "test_acc": 0.01, + "lyapunov": 1.5983945966681556, + "grad_norm": 0.22457837692293584, + "grad_max_sv": 0.15547131709754466, + "grad_min_sv": 0.0, + "grad_condition": 155471317097.54468, + "lr": 0.0007499999999999998, + "time_sec": 177.34761261940002 + }, + { + "epoch": 51, + "train_loss": 4.6476463407897946, + "train_acc": 0.0094, + "test_loss": 4.637005358123779, + "test_acc": 0.01, + "lyapunov": 1.608639404291997, + "grad_norm": 0.22991701525164646, + "grad_max_sv": 0.14587618354707957, + "grad_min_sv": 3.503246160812043e-47, + "grad_condition": 145876183547.07956, + "lr": 0.0007408768370508575, + "time_sec": 177.40973281860352 + }, + { + "epoch": 52, + "train_loss": 4.643522353057861, + "train_acc": 0.0091, + "test_loss": 4.635898374176025, + "test_acc": 0.01, + "lyapunov": 1.5934445269577338, + "grad_norm": 0.2512821617756961, + "grad_max_sv": 0.11034320006147028, + "grad_min_sv": 4.951726746617114e-32, + "grad_condition": 110343200061.47026, + "lr": 0.0007316480175599307, + "time_sec": 177.36693692207336 + }, + { + "epoch": 53, + "train_loss": 4.652315429840088, + "train_acc": 0.00954, + "test_loss": 4.609224298095703, + "test_acc": 0.01, + "lyapunov": 1.634396403951718, + "grad_norm": 0.5467593180422932, + "grad_max_sv": 0.09123059632256628, + "grad_min_sv": 2.430316909663535e-15, + "grad_condition": 90896353773.23637, + "lr": 0.0007223175895924635, + "time_sec": 177.31507325172424 + }, + { + "epoch": 54, + "train_loss": 4.651325719604492, + "train_acc": 0.00994, + "test_loss": 4.626620025634765, + "test_acc": 0.01, + "lyapunov": 1.611309678048429, + "grad_norm": 0.2940157240002703, + "grad_max_sv": 0.13391106240451336, + "grad_min_sv": 3.421636554179791e-13, + "grad_condition": 110883017208.70781, + "lr": 0.0007128896457825361, + "time_sec": 177.39624953269958 + }, + { + "epoch": 55, + "train_loss": 4.64362153503418, + "train_acc": 0.00934, + "test_loss": 4.62131148147583, + "test_acc": 0.01, + "lyapunov": 1.5918327890088797, + "grad_norm": 0.17460806885429525, + "grad_max_sv": 0.08889081897214055, + "grad_min_sv": 1.944495872420277e-15, + "grad_condition": 88670543660.1524, + "lr": 0.0007033683215378998, + "time_sec": 177.32203340530396 + }, + { + "epoch": 56, + "train_loss": 4.644567786254883, + "train_acc": 0.00952, + "test_loss": 4.62790345993042, + "test_acc": 0.01, + "lyapunov": 1.5998888466974048, + "grad_norm": 0.16766781878427695, + "grad_max_sv": 0.07534359227865935, + "grad_min_sv": 6.543167764955624e-20, + "grad_condition": 75343581885.12659, + "lr": 0.0006937577932260512, + "time_sec": 177.3884792327881 + }, + { + "epoch": 57, + "train_loss": 4.644828259429931, + "train_acc": 0.00976, + "test_loss": 4.606487982940674, + "test_acc": 0.01, + "lyapunov": 1.5974730362977518, + "grad_norm": 0.1793373629191484, + "grad_max_sv": 0.07966042589396238, + "grad_min_sv": 6.23405577303343e-15, + "grad_condition": 78875044427.86894, + "lr": 0.0006840622763423388, + "time_sec": 177.43391919136047 + }, + { + "epoch": 58, + "train_loss": 4.644080760650635, + "train_acc": 0.0091, + "test_loss": 4.625753155517578, + "test_acc": 0.01, + "lyapunov": 1.6024256923314555, + "grad_norm": 0.2678862199559515, + "grad_max_sv": 0.06979989502578973, + "grad_min_sv": 2.271738328433089e-16, + "grad_condition": 69772902566.56038, + "lr": 0.0006742860236609073, + "time_sec": 177.34277653694153 + }, + { + "epoch": 59, + "train_loss": 4.642539700622558, + "train_acc": 0.0104, + "test_loss": 4.606066676330566, + "test_acc": 0.01, + "lyapunov": 1.5953022006832425, + "grad_norm": 0.18186171250969738, + "grad_max_sv": 0.052746226685121654, + "grad_min_sv": 0.0, + "grad_condition": 52746226685.12166, + "lr": 0.0006644333233692913, + "time_sec": 177.2813150882721 + }, + { + "epoch": 60, + "train_loss": 4.643028160400391, + "train_acc": 0.0096, + "test_loss": 4.606985287475586, + "test_acc": 0.01, + "lyapunov": 1.5944073910603438, + "grad_norm": 0.16605928285367347, + "grad_max_sv": 0.04408669015392661, + "grad_min_sv": 0.0, + "grad_condition": 44086690153.926605, + "lr": 0.0006545084971874734, + "time_sec": 177.34340691566467 + }, + { + "epoch": 61, + "train_loss": 4.641566214599609, + "train_acc": 0.00942, + "test_loss": 4.6096303787231445, + "test_acc": 0.01, + "lyapunov": 1.5902936217730002, + "grad_norm": 0.17097577525317767, + "grad_max_sv": 0.048659399058669804, + "grad_min_sv": 0.0, + "grad_condition": 48659399058.6698, + "lr": 0.0006445158984722354, + "time_sec": 177.41231846809387 + }, + { + "epoch": 62, + "train_loss": 4.643437232666016, + "train_acc": 0.00904, + "test_loss": 4.614830825805664, + "test_acc": 0.01, + "lyapunov": 1.597925158717748, + "grad_norm": 0.17398079786227064, + "grad_max_sv": 0.04662688081152737, + "grad_min_sv": 0.0, + "grad_condition": 46626880811.52737, + "lr": 0.0006344599103076324, + "time_sec": 177.41233468055725 + }, + { + "epoch": 63, + "train_loss": 4.64204384475708, + "train_acc": 0.01014, + "test_loss": 4.608532351684571, + "test_acc": 0.01, + "lyapunov": 1.591071292567436, + "grad_norm": 0.18148049003675806, + "grad_max_sv": 0.03887187172658742, + "grad_min_sv": 0.0, + "grad_condition": 38871871726.58742, + "lr": 0.0006243449435824269, + "time_sec": 177.32782816886902 + }, + { + "epoch": 64, + "train_loss": 4.642362080993652, + "train_acc": 0.00976, + "test_loss": 4.605919379425049, + "test_acc": 0.01, + "lyapunov": 1.59339769935364, + "grad_norm": 0.16947785318867856, + "grad_max_sv": 0.04678878029808402, + "grad_min_sv": 0.0, + "grad_condition": 46788780298.08402, + "lr": 0.0006141754350553275, + "time_sec": 177.36176109313965 + }, + { + "epoch": 65, + "train_loss": 4.64135870513916, + "train_acc": 0.0098, + "test_loss": 4.6061177238464355, + "test_acc": 0.01, + "lyapunov": 1.5889410545758884, + "grad_norm": 0.200660646453697, + "grad_max_sv": 0.052430361462756994, + "grad_min_sv": 0.0, + "grad_condition": 52430361462.75699, + "lr": 0.0006039558454088793, + "time_sec": 177.57254838943481 + }, + { + "epoch": 66, + "train_loss": 4.6474862211608885, + "train_acc": 0.00968, + "test_loss": 4.605675552368164, + "test_acc": 0.01, + "lyapunov": 1.6025549606289096, + "grad_norm": 0.24193311739345152, + "grad_max_sv": 0.06446847971528769, + "grad_min_sv": 8.023691354480991e-14, + "grad_condition": 58142616242.219055, + "lr": 0.000593690657292862, + "time_sec": 177.27647042274475 + }, + { + "epoch": 67, + "train_loss": 4.6455588671875, + "train_acc": 0.00932, + "test_loss": 4.608942795562744, + "test_acc": 0.01, + "lyapunov": 1.6029961197577474, + "grad_norm": 0.5642775506276186, + "grad_max_sv": 0.06661056466400624, + "grad_min_sv": 4.989178535200188e-27, + "grad_condition": 66610564664.00575, + "lr": 0.0005833843733580507, + "time_sec": 177.30575489997864 + }, + { + "epoch": 68, + "train_loss": 4.6422839654541015, + "train_acc": 0.00948, + "test_loss": 4.613675955200195, + "test_acc": 0.01, + "lyapunov": 1.5871542494010438, + "grad_norm": 0.40260870408483307, + "grad_max_sv": 0.06906388867646455, + "grad_min_sv": 2.943967978666477e-19, + "grad_condition": 69063862019.90744, + "lr": 0.0005730415142812054, + "time_sec": 177.3839509487152 + }, + { + "epoch": 69, + "train_loss": 4.641787251281738, + "train_acc": 0.0095, + "test_loss": 4.605676875305176, + "test_acc": 0.01, + "lyapunov": 1.5912645625336397, + "grad_norm": 0.34254968614340625, + "grad_max_sv": 0.04287184816785157, + "grad_min_sv": 0.0, + "grad_condition": 42871848167.85156, + "lr": 0.0005626666167821517, + "time_sec": 177.32984590530396 + }, + { + "epoch": 70, + "train_loss": 4.651252772827148, + "train_acc": 0.00948, + "test_loss": 4.605676740264893, + "test_acc": 0.01, + "lyapunov": 1.6005148091889403, + "grad_norm": 0.32314191918702384, + "grad_max_sv": 0.07503386735916137, + "grad_min_sv": 1.515944273746056e-14, + "grad_condition": 72060515877.79199, + "lr": 0.0005522642316338265, + "time_sec": 177.35727500915527 + }, + { + "epoch": 71, + "train_loss": 4.642202633666992, + "train_acc": 0.00952, + "test_loss": 4.60564603805542, + "test_acc": 0.01, + "lyapunov": 1.5934118678807603, + "grad_norm": 0.19098601600212814, + "grad_max_sv": 0.04769439417868852, + "grad_min_sv": 0.0, + "grad_condition": 47694394178.68852, + "lr": 0.0005418389216661573, + "time_sec": 177.31805086135864 + }, + { + "epoch": 72, + "train_loss": 4.643372284545898, + "train_acc": 0.01042, + "test_loss": 4.605551630401611, + "test_acc": 0.01, + "lyapunov": 1.6024812432506201, + "grad_norm": 0.1850692588702891, + "grad_max_sv": 0.029727647779509425, + "grad_min_sv": 0.0, + "grad_condition": 29727647779.509422, + "lr": 0.0005313952597646563, + "time_sec": 177.26796555519104 + }, + { + "epoch": 73, + "train_loss": 4.640834873046875, + "train_acc": 0.01012, + "test_loss": 4.605487160491943, + "test_acc": 0.01, + "lyapunov": 1.5882229832432153, + "grad_norm": 0.18526548732293277, + "grad_max_sv": 0.037329256813973186, + "grad_min_sv": 0.0, + "grad_condition": 37329256813.97318, + "lr": 0.0005209378268645994, + "time_sec": 177.25225377082825 + }, + { + "epoch": 74, + "train_loss": 4.64209197479248, + "train_acc": 0.00906, + "test_loss": 4.605482194519043, + "test_acc": 0.01, + "lyapunov": 1.5956125628307958, + "grad_norm": 0.19272835899448448, + "grad_max_sv": 0.03931440911255777, + "grad_min_sv": 0.0, + "grad_condition": 39314409112.55777, + "lr": 0.0005104712099416781, + "time_sec": 177.2522575855255 + }, + { + "epoch": 75, + "train_loss": 4.646220574035644, + "train_acc": 0.00904, + "test_loss": 4.605418196105957, + "test_acc": 0.01, + "lyapunov": 1.6149345593684166, + "grad_norm": 0.18848455976917208, + "grad_max_sv": 0.03723890888504684, + "grad_min_sv": 0.0, + "grad_condition": 37238908885.04684, + "lr": 0.0004999999999999996, + "time_sec": 177.2818944454193 + }, + { + "epoch": 76, + "train_loss": 4.648384475402832, + "train_acc": 0.00998, + "test_loss": 4.6053966011047365, + "test_acc": 0.01, + "lyapunov": 1.6287647842446251, + "grad_norm": 1.8057917745549752, + "grad_max_sv": 0.029743389310897327, + "grad_min_sv": 3.7199142558296474e-21, + "grad_condition": 29743389301.013134, + "lr": 0.0004895287900583212, + "time_sec": 177.26618552207947 + }, + { + "epoch": 77, + "train_loss": 4.721213637390137, + "train_acc": 0.00964, + "test_loss": 4.6436636322021485, + "test_acc": 0.01, + "lyapunov": 2.058074002985454, + "grad_norm": 3.091860129305993, + "grad_max_sv": 0.054268574403249656, + "grad_min_sv": 8.376052745740116e-34, + "grad_condition": 54268574403.24966, + "lr": 0.0004790621731353997, + "time_sec": 177.27104544639587 + }, + { + "epoch": 78, + "train_loss": 4.721108419342041, + "train_acc": 0.0102, + "test_loss": 4.665742019653321, + "test_acc": 0.01, + "lyapunov": 2.0632075443292215, + "grad_norm": 0.16746757148328467, + "grad_max_sv": 0.05550560392439365, + "grad_min_sv": 2.1720126197034665e-45, + "grad_condition": 55505603924.393654, + "lr": 0.000468604740235343, + "time_sec": 177.2460799217224 + }, + { + "epoch": 79, + "train_loss": 4.748111321258545, + "train_acc": 0.00948, + "test_loss": 4.609986500549317, + "test_acc": 0.01, + "lyapunov": 2.195971542307178, + "grad_norm": 0.24040083874318255, + "grad_max_sv": 0.05709849054073857, + "grad_min_sv": 1.4965270295518628e-39, + "grad_condition": 57098490540.73856, + "lr": 0.00045816107833384175, + "time_sec": 177.27070450782776 + }, + { + "epoch": 80, + "train_loss": 4.7519070631408695, + "train_acc": 0.0117, + "test_loss": 4.627280041503906, + "test_acc": 0.01, + "lyapunov": 2.2188175566056194, + "grad_norm": 0.8805430521303074, + "grad_max_sv": 0.057838325266129684, + "grad_min_sv": 1.5422340573742856e-42, + "grad_condition": 57838325266.129684, + "lr": 0.0004477357683661729, + "time_sec": 177.29695653915405 + }, + { + "epoch": 81, + "train_loss": 4.677329037322998, + "train_acc": 0.00938, + "test_loss": 4.61901457901001, + "test_acc": 0.01, + "lyapunov": 1.7923584527066907, + "grad_norm": 0.8776582765129182, + "grad_max_sv": 0.04953184952028096, + "grad_min_sv": 3.503246160812043e-47, + "grad_condition": 49531849520.28096, + "lr": 0.00043733338321784746, + "time_sec": 177.28252363204956 + }, + { + "epoch": 82, + "train_loss": 4.649648946685791, + "train_acc": 0.00968, + "test_loss": 4.616988354492188, + "test_acc": 0.01, + "lyapunov": 1.636922500627425, + "grad_norm": 1.3865972070708266, + "grad_max_sv": 0.01087386254221201, + "grad_min_sv": 0.0, + "grad_condition": 10873862542.21201, + "lr": 0.0004269584857187939, + "time_sec": 177.24314332008362 + }, + { + "epoch": 83, + "train_loss": 4.642039197845459, + "train_acc": 0.00996, + "test_loss": 4.614689962768555, + "test_acc": 0.01, + "lyapunov": 1.5991996630378391, + "grad_norm": 1.3716621678192378, + "grad_max_sv": 0.018109424225986003, + "grad_min_sv": 0.0, + "grad_condition": 18109424225.986004, + "lr": 0.0004166156266419484, + "time_sec": 177.229647397995 + }, + { + "epoch": 84, + "train_loss": 4.641844508972168, + "train_acc": 0.00878, + "test_loss": 4.617015579223633, + "test_acc": 0.01, + "lyapunov": 1.60060031792087, + "grad_norm": 1.3175623049235154, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004063093427071373, + "time_sec": 177.2538447380066 + }, + { + "epoch": 85, + "train_loss": 4.643175181274414, + "train_acc": 0.0094, + "test_loss": 4.614698597717285, + "test_acc": 0.01, + "lyapunov": 1.6059161156339719, + "grad_norm": 1.2845631564383488, + "grad_max_sv": 0.008081613527610897, + "grad_min_sv": 0.0, + "grad_condition": 8081613527.610898, + "lr": 0.0003960441545911199, + "time_sec": 177.20055627822876 + }, + { + "epoch": 86, + "train_loss": 4.643574464263916, + "train_acc": 0.0098, + "test_loss": 4.614707907104492, + "test_acc": 0.01, + "lyapunov": 1.6075664575752395, + "grad_norm": 1.4187544153998444, + "grad_max_sv": 0.00905034514144063, + "grad_min_sv": 0.0, + "grad_condition": 9050345141.440632, + "lr": 0.0003858245649446718, + "time_sec": 177.21315360069275 + }, + { + "epoch": 87, + "train_loss": 4.694294710845948, + "train_acc": 0.00954, + "test_loss": 4.623233102416992, + "test_acc": 0.01, + "lyapunov": 1.9175829625190677, + "grad_norm": 4.082558395603232, + "grad_max_sv": 0.02438779656608254, + "grad_min_sv": 6.337662028039815e-35, + "grad_condition": 24387796566.082542, + "lr": 0.00037565505641757235, + "time_sec": 177.25639843940735 + }, + { + "epoch": 88, + "train_loss": 4.717588612060547, + "train_acc": 0.01098, + "test_loss": 4.654013455200196, + "test_acc": 0.01, + "lyapunov": 2.087744262822144, + "grad_norm": 0.17835559132091938, + "grad_max_sv": 0.07744973180815577, + "grad_min_sv": 2.3523356446513927e-16, + "grad_condition": 77434631231.10988, + "lr": 0.00036554008969236695, + "time_sec": 177.38599228858948 + }, + { + "epoch": 89, + "train_loss": 4.734110566711426, + "train_acc": 0.0155, + "test_loss": 4.653230757141113, + "test_acc": 0.01, + "lyapunov": 2.1995491454058596, + "grad_norm": 0.13356986466644585, + "grad_max_sv": 0.0670669173821807, + "grad_min_sv": 2.875717693613099e-34, + "grad_condition": 67066917382.18069, + "lr": 0.0003554841015277638, + "time_sec": 177.2775719165802 + }, + { + "epoch": 90, + "train_loss": 4.692502493743897, + "train_acc": 0.01608, + "test_loss": 4.685703827667236, + "test_acc": 0.01, + "lyapunov": 2.1217137315998906, + "grad_norm": 0.18454505411948288, + "grad_max_sv": 0.09909263849258423, + "grad_min_sv": 9.485088852608362e-15, + "grad_condition": 98142092685.66644, + "lr": 0.000345491502812526, + "time_sec": 177.33423161506653 + }, + { + "epoch": 91, + "train_loss": 4.689375361785888, + "train_acc": 0.01532, + "test_loss": 5.054153802490235, + "test_acc": 0.01, + "lyapunov": 2.080054032528187, + "grad_norm": 0.5188803350503319, + "grad_max_sv": 0.1383956030011177, + "grad_min_sv": 3.288818752125065e-14, + "grad_condition": 133990904819.13261, + "lr": 0.0003355666766307081, + "time_sec": 177.33309030532837 + }, + { + "epoch": 92, + "train_loss": 4.63797587173462, + "train_acc": 0.01862, + "test_loss": 4.71228084487915, + "test_acc": 0.01, + "lyapunov": 2.1218495975674876, + "grad_norm": 0.6784268973745995, + "grad_max_sv": 0.1671210890635848, + "grad_min_sv": 7.533849064621124e-14, + "grad_condition": 156896122443.4754, + "lr": 0.00032571397633909225, + "time_sec": 177.35465455055237 + }, + { + "epoch": 93, + "train_loss": 4.629223160095215, + "train_acc": 0.0201, + "test_loss": 4.768279981994629, + "test_acc": 0.01, + "lyapunov": 2.231684987807213, + "grad_norm": 0.2698404719461384, + "grad_max_sv": 0.1522567519918084, + "grad_min_sv": 2.610390891244236e-13, + "grad_condition": 128146800497.54839, + "lr": 0.00031593772365766094, + "time_sec": 177.41608834266663 + }, + { + "epoch": 94, + "train_loss": 4.672454256744385, + "train_acc": 0.0155, + "test_loss": 4.625922811889648, + "test_acc": 0.01, + "lyapunov": 2.0642213479942066, + "grad_norm": 1.2838784932252858, + "grad_max_sv": 0.1068689662408179, + "grad_min_sv": 3.5497216486826963e-13, + "grad_condition": 81702903527.8157, + "lr": 0.0003062422067739483, + "time_sec": 177.35895490646362 + }, + { + "epoch": 95, + "train_loss": 4.682060436248779, + "train_acc": 0.01154, + "test_loss": 5.053488528442383, + "test_acc": 0.01, + "lyapunov": 1.908135286377519, + "grad_norm": 1.423394417746509, + "grad_max_sv": 0.06458842717497518, + "grad_min_sv": 2.2284196585027795e-14, + "grad_condition": 62761299140.91392, + "lr": 0.00029663167846209965, + "time_sec": 177.43999791145325 + }, + { + "epoch": 96, + "train_loss": 4.64783102355957, + "train_acc": 0.0158, + "test_loss": 5.105888792419433, + "test_acc": 0.01, + "lyapunov": 1.9445471297139707, + "grad_norm": 0.21161345330658576, + "grad_max_sv": 0.09921222645789385, + "grad_min_sv": 5.191301724766352e-14, + "grad_condition": 94303871341.31389, + "lr": 0.00028711035421746345, + "time_sec": 177.3871088027954 + }, + { + "epoch": 97, + "train_loss": 4.619986424102783, + "train_acc": 0.01798, + "test_loss": 4.954860754394531, + "test_acc": 0.01, + "lyapunov": 1.9772856226357658, + "grad_norm": 0.22380684108271168, + "grad_max_sv": 0.10661779213696718, + "grad_min_sv": 6.269415747523095e-14, + "grad_condition": 100907105733.10144, + "lr": 0.00027768241040753615, + "time_sec": 177.3668417930603 + }, + { + "epoch": 98, + "train_loss": 4.708672041168213, + "train_acc": 0.01462, + "test_loss": 5.008634625244141, + "test_acc": 0.01, + "lyapunov": 2.0945300257114496, + "grad_norm": 1.4979433862072131, + "grad_max_sv": 0.09214200942307252, + "grad_min_sv": 8.393969521570709e-14, + "grad_condition": 84461106378.82773, + "lr": 0.00026835198244006903, + "time_sec": 177.33356857299805 + }, + { + "epoch": 99, + "train_loss": 4.692991460723877, + "train_acc": 0.01672, + "test_loss": 4.888367279052734, + "test_acc": 0.01, + "lyapunov": 2.20108045184094, + "grad_norm": 0.385891368064135, + "grad_max_sv": 0.11020931415259838, + "grad_min_sv": 4.014219483338492e-13, + "grad_condition": 88357297169.3239, + "lr": 0.0002591231629491421, + "time_sec": 177.36116933822632 + }, + { + "epoch": 100, + "train_loss": 4.679412184295654, + "train_acc": 0.01748, + "test_loss": 4.801361751556397, + "test_acc": 0.01, + "lyapunov": 2.1626759752288196, + "grad_norm": 0.29188655689728976, + "grad_max_sv": 0.10528047941625118, + "grad_min_sv": 7.079886157137732e-13, + "grad_condition": 70271036997.56067, + "lr": 0.0002499999999999997, + "time_sec": 177.36359167099 + }, + { + "epoch": 101, + "train_loss": 4.670090843048095, + "train_acc": 0.01908, + "test_loss": 4.845812666320801, + "test_acc": 0.01, + "lyapunov": 2.191265623282898, + "grad_norm": 0.2721459181488543, + "grad_max_sv": 0.11140938717871904, + "grad_min_sv": 9.673542537562727e-13, + "grad_condition": 69811952897.07645, + "lr": 0.00024098649531343477, + "time_sec": 177.350919008255 + }, + { + "epoch": 102, + "train_loss": 4.7038639653015135, + "train_acc": 0.01622, + "test_loss": 4.827154957580566, + "test_acc": 0.01, + "lyapunov": 2.236257368036548, + "grad_norm": 0.37089976502154626, + "grad_max_sv": 0.10384687632322312, + "grad_min_sv": 6.884885540002143e-13, + "grad_condition": 72812162645.31807, + "lr": 0.0002320866025105016, + "time_sec": 177.35117840766907 + }, + { + "epoch": 103, + "train_loss": 4.815245042877197, + "train_acc": 0.01124, + "test_loss": 4.606607830810547, + "test_acc": 0.01, + "lyapunov": 2.2844167551421144, + "grad_norm": 4.100047695451907, + "grad_max_sv": 0.05260885274793026, + "grad_min_sv": 1.3802032362544088e-13, + "grad_condition": 46932354731.69929, + "lr": 0.0002233042253783278, + "time_sec": 177.36591219902039 + }, + { + "epoch": 104, + "train_loss": 4.874257210388183, + "train_acc": 0.0107, + "test_loss": 4.615321169281006, + "test_acc": 0.01, + "lyapunov": 2.5303738708691217, + "grad_norm": 4.641557506783305, + "grad_max_sv": 0.04989699286900873, + "grad_min_sv": 6.455291206487273e-16, + "grad_condition": 49867710747.47777, + "lr": 0.000214643216157784, + "time_sec": 177.35230231285095 + }, + { + "epoch": 105, + "train_loss": 4.723299936981201, + "train_acc": 0.01176, + "test_loss": 4.638908140563965, + "test_acc": 0.01, + "lyapunov": 2.0839424148544934, + "grad_norm": 1.355378299816155, + "grad_max_sv": 0.07086729909481657, + "grad_min_sv": 3.4057078840793797e-16, + "grad_condition": 70843059990.87044, + "lr": 0.00020610737385376332, + "time_sec": 177.27781128883362 + }, + { + "epoch": 106, + "train_loss": 4.7231269412231445, + "train_acc": 0.01514, + "test_loss": 4.6237520652771, + "test_acc": 0.01, + "lyapunov": 2.1920783269740736, + "grad_norm": 0.23046249442621652, + "grad_max_sv": 0.08427620781585574, + "grad_min_sv": 2.6872672205060264e-14, + "grad_condition": 82259478658.28171, + "lr": 0.00019770044256881242, + "time_sec": 177.32385993003845 + }, + { + "epoch": 107, + "train_loss": 4.718143957061767, + "train_acc": 0.01406, + "test_loss": 6.732960067749024, + "test_acc": 0.01, + "lyapunov": 2.1179436051937017, + "grad_norm": 2.388318428417535, + "grad_max_sv": 0.06378129383232674, + "grad_min_sv": 4.2658139494079437e-14, + "grad_condition": 60789693053.35014, + "lr": 0.0001894261098608447, + "time_sec": 177.3540232181549 + }, + { + "epoch": 108, + "train_loss": 4.714431188049317, + "train_acc": 0.01334, + "test_loss": 4.613714739990234, + "test_acc": 0.01, + "lyapunov": 2.1213468349803133, + "grad_norm": 2.8791461854741613, + "grad_max_sv": 0.07117215000674204, + "grad_min_sv": 1.694507032491845e-13, + "grad_condition": 60059951698.86328, + "lr": 0.000181288005125655, + "time_sec": 177.47124576568604 + }, + { + "epoch": 109, + "train_loss": 4.721813513946533, + "train_acc": 0.01472, + "test_loss": 4.676416804504394, + "test_acc": 0.01, + "lyapunov": 2.25968545111244, + "grad_norm": 2.212408550707043, + "grad_max_sv": 0.07278494546897427, + "grad_min_sv": 3.1126578738112443e-13, + "grad_condition": 57077814227.08296, + "lr": 0.0001732896980049473, + "time_sec": 177.3752965927124 + }, + { + "epoch": 110, + "train_loss": 4.620515478363037, + "train_acc": 0.0199, + "test_loss": 4.849770021820069, + "test_acc": 0.01, + "lyapunov": 2.1241518365757543, + "grad_norm": 0.4180712607860875, + "grad_max_sv": 0.11002402473702984, + "grad_min_sv": 1.172731082199846e-12, + "grad_condition": 61549668598.997536, + "lr": 0.00016543469682057076, + "time_sec": 177.33867812156677 + }, + { + "epoch": 111, + "train_loss": 4.623785068969727, + "train_acc": 0.0175, + "test_loss": 4.637153623199463, + "test_acc": 0.01, + "lyapunov": 2.0509809773901235, + "grad_norm": 0.8463969572958269, + "grad_max_sv": 0.11101528165804334, + "grad_min_sv": 1.87112152381424e-12, + "grad_condition": 53576443216.59273, + "lr": 0.00015772644703565552, + "time_sec": 177.3645510673523 + }, + { + "epoch": 112, + "train_loss": 4.6054680319213865, + "train_acc": 0.01996, + "test_loss": 4.732485404968262, + "test_acc": 0.01, + "lyapunov": 1.9695151327820994, + "grad_norm": 0.286979599544395, + "grad_max_sv": 0.11297413185238839, + "grad_min_sv": 1.5087152961486214e-12, + "grad_condition": 66174816958.725464, + "lr": 0.00015016832974331713, + "time_sec": 177.3794810771942 + }, + { + "epoch": 113, + "train_loss": 4.6047257371520995, + "train_acc": 0.021, + "test_loss": 4.738913871765137, + "test_acc": 0.01, + "lyapunov": 2.0082323267636704, + "grad_norm": 0.34791771509662284, + "grad_max_sv": 0.11338779628276825, + "grad_min_sv": 1.4891821340656678e-12, + "grad_condition": 59376578972.79028, + "lr": 0.00014276366018359834, + "time_sec": 177.3533172607422 + }, + { + "epoch": 114, + "train_loss": 4.588227640686035, + "train_acc": 0.02222, + "test_loss": 4.73422000579834, + "test_acc": 0.01, + "lyapunov": 2.009492777497567, + "grad_norm": 0.35363950275472883, + "grad_max_sv": 0.1159886697307229, + "grad_min_sv": 1.90550844743669e-12, + "grad_condition": 54207670472.89293, + "lr": 0.00013551568628929425, + "time_sec": 177.36692142486572 + }, + { + "epoch": 115, + "train_loss": 4.6900716258239745, + "train_acc": 0.01612, + "test_loss": 4.658303358459473, + "test_acc": 0.01, + "lyapunov": 2.135267421412651, + "grad_norm": 1.3246217912641853, + "grad_max_sv": 0.10598969534124456, + "grad_min_sv": 1.3219100092920473e-12, + "grad_condition": 61126734552.39955, + "lr": 0.00012842758726130276, + "time_sec": 177.3328320980072 + }, + { + "epoch": 116, + "train_loss": 4.786548847961426, + "train_acc": 0.01006, + "test_loss": 4.61871778717041, + "test_acc": 0.01, + "lyapunov": 2.3106003911293986, + "grad_norm": 0.20288682229149946, + "grad_max_sv": 0.07976289726793766, + "grad_min_sv": 9.703750835778777e-14, + "grad_condition": 73480681043.72867, + "lr": 0.0001215024721741218, + "time_sec": 177.3196315765381 + }, + { + "epoch": 117, + "train_loss": 4.737495873718261, + "train_acc": 0.00978, + "test_loss": 5.255185474395752, + "test_acc": 0.01, + "lyapunov": 2.141355973680306, + "grad_norm": 1.2090832667169469, + "grad_max_sv": 0.06462649000441803, + "grad_min_sv": 4.712035785133647e-14, + "grad_condition": 61562797934.37225, + "lr": 0.00011474337861210538, + "time_sec": 177.3440716266632 + }, + { + "epoch": 118, + "train_loss": 4.7640791331481935, + "train_acc": 0.01042, + "test_loss": 4.606605186462402, + "test_acc": 0.01, + "lyapunov": 2.2581872031511856, + "grad_norm": 1.4638342931368784, + "grad_max_sv": 0.06105093636777751, + "grad_min_sv": 3.379161065598181e-14, + "grad_condition": 58851399772.93186, + "lr": 0.00010815327133708009, + "time_sec": 177.32141637802124 + }, + { + "epoch": 119, + "train_loss": 4.764838110656738, + "train_acc": 0.01, + "test_loss": 4.609263079833984, + "test_acc": 0.01, + "lyapunov": 2.2616506915568086, + "grad_norm": 1.5774818313640573, + "grad_max_sv": 0.05949288122285177, + "grad_min_sv": 9.459326270127109e-15, + "grad_condition": 58897801267.18583, + "lr": 0.00010173504098790182, + "time_sec": 177.3150999546051 + }, + { + "epoch": 120, + "train_loss": 4.745092378540039, + "train_acc": 0.00954, + "test_loss": 4.691408560180664, + "test_acc": 0.01, + "lyapunov": 2.1814588677242894, + "grad_norm": 0.9224368099956493, + "grad_max_sv": 0.06503358271721853, + "grad_min_sv": 6.0891251611874775e-15, + "grad_condition": 64617582544.06616, + "lr": 9.549150281252629e-05, + "time_sec": 177.2845914363861 + }, + { + "epoch": 121, + "train_loss": 4.715786669311523, + "train_acc": 0.00966, + "test_loss": 4.7921840202331545, + "test_acc": 0.01, + "lyapunov": 2.0026006262625575, + "grad_norm": 9.006667150025358, + "grad_max_sv": 0.008544169525441167, + "grad_min_sv": 2.554875264407016e-15, + "grad_condition": 8406179861.052277, + "lr": 8.942539543314794e-05, + "time_sec": 177.5404670238495 + }, + { + "epoch": 122, + "train_loss": 4.728659786224365, + "train_acc": 0.01478, + "test_loss": 4.716466751098633, + "test_acc": 0.01, + "lyapunov": 2.2308361682745503, + "grad_norm": 2.3677820237911122, + "grad_max_sv": 0.08329055261057261, + "grad_min_sv": 5.30326773979997e-14, + "grad_condition": 78769851023.79935, + "lr": 8.353937964495024e-05, + "time_sec": 177.3092577457428 + }, + { + "epoch": 123, + "train_loss": 4.741206109161377, + "train_acc": 0.01406, + "test_loss": 4.632773582458496, + "test_acc": 0.01, + "lyapunov": 2.229069578982985, + "grad_norm": 3.8848615316118043, + "grad_max_sv": 0.07590833908627041, + "grad_min_sv": 3.6579889540451006e-14, + "grad_condition": 72297092377.36781, + "lr": 7.783603724899243e-05, + "time_sec": 177.35984468460083 + }, + { + "epoch": 124, + "train_loss": 4.9050667370605465, + "train_acc": 0.0107, + "test_loss": 4.692931840515136, + "test_acc": 0.01, + "lyapunov": 2.5950029045724503, + "grad_norm": 8.40683796480657, + "grad_max_sv": 0.020135342784899812, + "grad_min_sv": 1.1905984424824726e-14, + "grad_condition": 19073293863.494404, + "lr": 7.231786991974666e-05, + "time_sec": 177.38076376914978 + }, + { + "epoch": 125, + "train_loss": 4.918515665893555, + "train_acc": 0.01042, + "test_loss": 4.800165419769287, + "test_acc": 0.01, + "lyapunov": 2.6619165169308556, + "grad_norm": 9.502093865016478, + "grad_max_sv": 0.0075993670089607775, + "grad_min_sv": 1.2921884398822422e-14, + "grad_condition": 6651468556.477142, + "lr": 6.698729810778072e-05, + "time_sec": 177.32155227661133 + }, + { + "epoch": 126, + "train_loss": 4.9456257382202145, + "train_acc": 0.0101, + "test_loss": 4.7986811172485355, + "test_acc": 0.01, + "lyapunov": 2.735420986209684, + "grad_norm": 9.875822964888467, + "grad_max_sv": 2.0739924829859918e-08, + "grad_min_sv": 1.5032395739436103e-20, + "grad_condition": 20739.924347962224, + "lr": 6.184665997806817e-05, + "time_sec": 177.3872947692871 + }, + { + "epoch": 127, + "train_loss": 4.886805105133057, + "train_acc": 0.01126, + "test_loss": 4.686759169006348, + "test_acc": 0.01, + "lyapunov": 2.63063982624532, + "grad_norm": 7.634737807457953, + "grad_max_sv": 0.027599985009449268, + "grad_min_sv": 1.635026756284981e-14, + "grad_condition": 25865594145.297913, + "lr": 5.6898210384392595e-05, + "time_sec": 177.42079973220825 + }, + { + "epoch": 128, + "train_loss": 4.948583959960938, + "train_acc": 0.01006, + "test_loss": 4.721134532165527, + "test_acc": 0.01, + "lyapunov": 2.7480261216078268, + "grad_norm": 9.950271022813126, + "grad_max_sv": 1.1180130898673368e-08, + "grad_min_sv": 9.511312933176111e-21, + "grad_condition": 11180.130536020879, + "lr": 5.214411988029363e-05, + "time_sec": 177.41947960853577 + }, + { + "epoch": 129, + "train_loss": 4.9554425132751465, + "train_acc": 0.0104, + "test_loss": 4.75336584854126, + "test_acc": 0.01, + "lyapunov": 2.751198763127827, + "grad_norm": 9.975110420091031, + "grad_max_sv": 0.0031297963534476316, + "grad_min_sv": 4.913090963459592e-16, + "grad_condition": 3069475100.3614955, + "lr": 4.7586473766990294e-05, + "time_sec": 177.42596411705017 + }, + { + "epoch": 130, + "train_loss": 4.96307178024292, + "train_acc": 0.01048, + "test_loss": 4.728824792480469, + "test_acc": 0.01, + "lyapunov": 2.754974961585706, + "grad_norm": 9.999999996542677, + "grad_max_sv": 6.772306379056181e-09, + "grad_min_sv": 1.446285168596469e-20, + "grad_condition": 6772.306171552807, + "lr": 4.32272711786996e-05, + "time_sec": 177.44565844535828 + }, + { + "epoch": 131, + "train_loss": 4.956811699676513, + "train_acc": 0.0093, + "test_loss": 4.750110374450683, + "test_acc": 0.01, + "lyapunov": 2.7515772535368, + "grad_norm": 10.000000073356507, + "grad_max_sv": 5.959159604055491e-09, + "grad_min_sv": 1.476098261934064e-20, + "grad_condition": 5959.1593520792685, + "lr": 3.906842420574966e-05, + "time_sec": 177.42677664756775 + }, + { + "epoch": 132, + "train_loss": 4.9561549958801265, + "train_acc": 0.01016, + "test_loss": 5.696090490722656, + "test_acc": 0.01, + "lyapunov": 2.7502345179048038, + "grad_norm": 9.999999973626117, + "grad_max_sv": 7.992252583702286e-09, + "grad_min_sv": 2.4784692224406337e-20, + "grad_condition": 7992.2521699460685, + "lr": 3.5111757055874305e-05, + "time_sec": 177.4220016002655 + }, + { + "epoch": 133, + "train_loss": 4.857832619476318, + "train_acc": 0.01246, + "test_loss": 4.677371379089355, + "test_acc": 0.01, + "lyapunov": 2.512646475411437, + "grad_norm": 7.117012627349442, + "grad_max_sv": 0.031855909609874486, + "grad_min_sv": 1.649919424059889e-14, + "grad_condition": 30285643652.368275, + "lr": 3.1359005254054254e-05, + "time_sec": 177.3773238658905 + }, + { + "epoch": 134, + "train_loss": 4.68506044845581, + "train_acc": 0.01548, + "test_loss": 4.609123469543457, + "test_acc": 0.01, + "lyapunov": 2.1184186959815454, + "grad_norm": 1.9204167306730333, + "grad_max_sv": 0.09412179148760884, + "grad_min_sv": 4.6394519786537835e-14, + "grad_condition": 89429686329.23029, + "lr": 2.7811814881259484e-05, + "time_sec": 177.34491610527039 + }, + { + "epoch": 135, + "train_loss": 4.681999072875977, + "train_acc": 0.01576, + "test_loss": 4.83034912109375, + "test_acc": 0.01, + "lyapunov": 2.150207258551322, + "grad_norm": 1.143763847197843, + "grad_max_sv": 0.10519317688898003, + "grad_min_sv": 5.07688327121443e-14, + "grad_condition": 99689376270.31213, + "lr": 2.4471741852423218e-05, + "time_sec": 177.33815479278564 + }, + { + "epoch": 136, + "train_loss": 4.695164921264649, + "train_acc": 0.01672, + "test_loss": 4.654338619232178, + "test_acc": 0.01, + "lyapunov": 2.2090382295496322, + "grad_norm": 1.1474803627472534, + "grad_max_sv": 0.11123525651727122, + "grad_min_sv": 9.495798219714258e-14, + "grad_condition": 102782907554.42734, + "lr": 2.1340251233966362e-05, + "time_sec": 177.36866855621338 + }, + { + "epoch": 137, + "train_loss": 4.692152431335449, + "train_acc": 0.01646, + "test_loss": 4.81933528137207, + "test_acc": 0.01, + "lyapunov": 2.2094227846931007, + "grad_norm": 0.6303897036424283, + "grad_max_sv": 0.11831559501588344, + "grad_min_sv": 8.349289767505628e-14, + "grad_condition": 109746710531.71823, + "lr": 1.8418716601170932e-05, + "time_sec": 177.3661823272705 + }, + { + "epoch": 138, + "train_loss": 4.6894233569335935, + "train_acc": 0.01706, + "test_loss": 4.791972970581055, + "test_acc": 0.01, + "lyapunov": 2.2000036544507116, + "grad_norm": 2.1899555272870477, + "grad_max_sv": 0.09350968728547274, + "grad_min_sv": 4.120797655506886e-14, + "grad_condition": 88843401487.6287, + "lr": 1.570841943568445e-05, + "time_sec": 177.3641233444214 + }, + { + "epoch": 139, + "train_loss": 4.694636091156005, + "train_acc": 0.0159, + "test_loss": 4.829331467437744, + "test_acc": 0.01, + "lyapunov": 2.215796913942108, + "grad_norm": 0.9784986049838148, + "grad_max_sv": 0.12486231978982687, + "grad_min_sv": 1.0247936181848821e-13, + "grad_condition": 113419375367.18208, + "lr": 1.3210548563419845e-05, + "time_sec": 177.35728001594543 + }, + { + "epoch": 140, + "train_loss": 4.694870633392334, + "train_acc": 0.01644, + "test_loss": 4.815142876434326, + "test_acc": 0.01, + "lyapunov": 2.217364390487866, + "grad_norm": 1.2916272628863348, + "grad_max_sv": 0.11291685290662548, + "grad_min_sv": 5.3537487011776554e-14, + "grad_condition": 106360741194.21178, + "lr": 1.0926199633097203e-05, + "time_sec": 177.3576626777649 + }, + { + "epoch": 141, + "train_loss": 4.677861398468018, + "train_acc": 0.0173, + "test_loss": 4.815771765899658, + "test_acc": 0.01, + "lyapunov": 2.1779102489466555, + "grad_norm": 0.8766949577062909, + "grad_max_sv": 0.12149501488558231, + "grad_min_sv": 8.143102612255778e-14, + "grad_condition": 111956733978.91446, + "lr": 8.856374635655688e-06, + "time_sec": 177.35283827781677 + }, + { + "epoch": 142, + "train_loss": 4.686267812042236, + "train_acc": 0.01684, + "test_loss": 4.823100394439697, + "test_acc": 0.01, + "lyapunov": 2.227254505962362, + "grad_norm": 0.5331148714010232, + "grad_max_sv": 0.1205288675238089, + "grad_min_sv": 8.176555294007943e-14, + "grad_condition": 111062530094.41301, + "lr": 7.001981464747503e-06, + "time_sec": 177.35118770599365 + }, + { + "epoch": 143, + "train_loss": 4.692831365509033, + "train_acc": 0.01716, + "test_loss": 4.897853678894043, + "test_acc": 0.01, + "lyapunov": 2.2571963544391913, + "grad_norm": 0.6114897960642978, + "grad_max_sv": 0.12478593328297125, + "grad_min_sv": 8.340670293644858e-14, + "grad_condition": 115479694388.34305, + "lr": 5.3638335185058295e-06, + "time_sec": 177.36120533943176 + }, + { + "epoch": 144, + "train_loss": 4.70658299621582, + "train_acc": 0.0171, + "test_loss": 4.83040984954834, + "test_acc": 0.01, + "lyapunov": 2.287657803586682, + "grad_norm": 0.9510676579378554, + "grad_max_sv": 0.1171010570952277, + "grad_min_sv": 6.361800175176714e-14, + "grad_condition": 109355119446.73831, + "lr": 3.942649342761114e-06, + "time_sec": 177.34865474700928 + }, + { + "epoch": 145, + "train_loss": 4.701995197296142, + "train_acc": 0.0173, + "test_loss": 4.613565782165527, + "test_acc": 0.01, + "lyapunov": 2.264257175233358, + "grad_norm": 0.8111639031310902, + "grad_max_sv": 0.11689584073509067, + "grad_min_sv": 7.425262413111732e-14, + "grad_condition": 108241392397.88205, + "lr": 2.7390523158633524e-06, + "time_sec": 177.34988021850586 + }, + { + "epoch": 146, + "train_loss": 4.698547594909668, + "train_acc": 0.01698, + "test_loss": 4.831944055175781, + "test_acc": 0.01, + "lyapunov": 2.264427444209223, + "grad_norm": 0.7687759810394293, + "grad_max_sv": 0.11922218743320086, + "grad_min_sv": 7.928289197503764e-14, + "grad_condition": 110429208233.33487, + "lr": 1.7535703752478133e-06, + "time_sec": 177.375305891037 + }, + { + "epoch": 147, + "train_loss": 4.703107703094482, + "train_acc": 0.01644, + "test_loss": 4.832024374389649, + "test_acc": 0.01, + "lyapunov": 2.262833438565969, + "grad_norm": 0.8980427547431384, + "grad_max_sv": 0.12822539806609132, + "grad_min_sv": 9.266738943909007e-14, + "grad_condition": 117774825403.93326, + "lr": 9.866357858642196e-07, + "time_sec": 177.37703728675842 + }, + { + "epoch": 148, + "train_loss": 4.694877036437989, + "train_acc": 0.01716, + "test_loss": 4.741145161437989, + "test_acc": 0.01, + "lyapunov": 2.2374743762833385, + "grad_norm": 1.2386113783762993, + "grad_max_sv": 0.13271797422266368, + "grad_min_sv": 9.874739286162734e-14, + "grad_condition": 121226456943.3418, + "lr": 4.38584950570808e-07, + "time_sec": 177.3770706653595 + }, + { + "epoch": 149, + "train_loss": 4.691502552185058, + "train_acc": 0.0184, + "test_loss": 4.9060412048339845, + "test_acc": 0.01, + "lyapunov": 2.2420086558822474, + "grad_norm": 1.0935576324459544, + "grad_max_sv": 0.1251808095059495, + "grad_min_sv": 7.87008918289173e-14, + "grad_condition": 115742557747.01627, + "lr": 1.096582625772501e-07, + "time_sec": 177.38786363601685 + }, + { + "epoch": 150, + "train_loss": 4.682859961853027, + "train_acc": 0.0175, + "test_loss": 4.898887846374512, + "test_acc": 0.01, + "lyapunov": 2.2194432437877216, + "grad_norm": 0.9410314426818256, + "grad_max_sv": 0.12126885750057496, + "grad_min_sv": 7.283089248142724e-14, + "grad_condition": 113197772104.82927, + "lr": 0.0, + "time_sec": 177.3536741733551 + } + ] + } +} \ No newline at end of file -- cgit v1.2.3