From cd99d6b874d9d09b3bb87b8485cc787885af71f1 Mon Sep 17 00:00:00 2001 From: YurenHao0426 Date: Tue, 13 Jan 2026 23:49:05 -0600 Subject: init commit --- .../cifar100_20260102-133933/config.json | 23 + .../cifar100_20260102-133933/results.json | 16822 +++++++++++++++++++ 2 files changed, 16845 insertions(+) create mode 100644 runs/depth_scaling_weak_reg/cifar100_20260102-133933/config.json create mode 100644 runs/depth_scaling_weak_reg/cifar100_20260102-133933/results.json (limited to 'runs/depth_scaling_weak_reg') diff --git a/runs/depth_scaling_weak_reg/cifar100_20260102-133933/config.json b/runs/depth_scaling_weak_reg/cifar100_20260102-133933/config.json new file mode 100644 index 0000000..68e32f4 --- /dev/null +++ b/runs/depth_scaling_weak_reg/cifar100_20260102-133933/config.json @@ -0,0 +1,23 @@ +{ + "dataset": "cifar100", + "depths": [ + 4, + 8, + 12, + 16 + ], + "T": 4, + "epochs": 150, + "batch_size": 128, + "lr": 0.001, + "lambda_reg": 0.01, + "lambda_target": -0.1, + "data_dir": "./data", + "out_dir": "runs/depth_scaling_weak_reg", + "device": "cuda", + "seed": 42, + "no_progress": false, + "reg_type": "squared", + "warmup_epochs": 20, + "stable_init": false +} \ No newline at end of file diff --git a/runs/depth_scaling_weak_reg/cifar100_20260102-133933/results.json b/runs/depth_scaling_weak_reg/cifar100_20260102-133933/results.json new file mode 100644 index 0000000..e4187b3 --- /dev/null +++ b/runs/depth_scaling_weak_reg/cifar100_20260102-133933/results.json @@ -0,0 +1,16822 @@ +{ + "vanilla": { + "4": [ + { + "epoch": 1, + "train_loss": 4.33289975402832, + "train_acc": 0.0996, + "test_loss": 3.709950496673584, + "test_acc": 0.161, + "lyapunov": null, + "grad_norm": 6.2810299448077185, + "grad_max_sv": 4.92810994386673, + "grad_min_sv": 1.1473994767641216e-07, + "grad_condition": 56571499.99764378, + "lr": 0.0009998903417374227, + "time_sec": 17.50081491470337 + }, + { + "epoch": 2, + "train_loss": 3.485806705932617, + "train_acc": 0.18754, + "test_loss": 3.376948810195923, + "test_acc": 0.2251, + "lyapunov": null, + "grad_norm": 4.472632624179186, + "grad_max_sv": 3.2327494621276855, + "grad_min_sv": 8.310527727373173e-08, + "grad_condition": 92291044.07744889, + "lr": 0.0009995614150494292, + "time_sec": 15.760291576385498 + }, + { + "epoch": 3, + "train_loss": 3.0275221601867677, + "train_acc": 0.26082, + "test_loss": 2.7881758056640624, + "test_acc": 0.3042, + "lyapunov": null, + "grad_norm": 3.543386902664438, + "grad_max_sv": 2.3667378187179566, + "grad_min_sv": 6.621326131828198e-08, + "grad_condition": 41824057.350124836, + "lr": 0.0009990133642141358, + "time_sec": 15.514073610305786 + }, + { + "epoch": 4, + "train_loss": 2.7166115661621095, + "train_acc": 0.31484, + "test_loss": 2.8865633476257324, + "test_acc": 0.306, + "lyapunov": null, + "grad_norm": 2.9695578850260107, + "grad_max_sv": 1.8169075399637222, + "grad_min_sv": 5.518442924568046e-08, + "grad_condition": 70749082.65805705, + "lr": 0.0009982464296247522, + "time_sec": 15.510918378829956 + }, + { + "epoch": 5, + "train_loss": 2.494141845779419, + "train_acc": 0.3584, + "test_loss": 2.5619307788848875, + "test_acc": 0.3568, + "lyapunov": null, + "grad_norm": 2.6232237351536, + "grad_max_sv": 1.5905334174633026, + "grad_min_sv": 4.9858857542606216e-08, + "grad_condition": 41263576.62486158, + "lr": 0.0009972609476841367, + "time_sec": 15.509635925292969 + }, + { + "epoch": 6, + "train_loss": 2.320282641906738, + "train_acc": 0.3967, + "test_loss": 2.443246061706543, + "test_acc": 0.3819, + "lyapunov": null, + "grad_norm": 2.4166519099880834, + "grad_max_sv": 1.350677639245987, + "grad_min_sv": 4.6017904989370526e-08, + "grad_condition": 199449118.7803008, + "lr": 0.000996057350657239, + "time_sec": 15.4894278049469 + }, + { + "epoch": 7, + "train_loss": 2.1808267082214354, + "train_acc": 0.4256, + "test_loss": 3.2315720008850097, + "test_acc": 0.2771, + "lyapunov": null, + "grad_norm": 2.2480641483115495, + "grad_max_sv": 1.2442059576511384, + "grad_min_sv": 4.327689683836233e-08, + "grad_condition": 140166953.30948788, + "lr": 0.000994636166481494, + "time_sec": 15.505986452102661 + }, + { + "epoch": 8, + "train_loss": 2.0691979400634763, + "train_acc": 0.44868, + "test_loss": 3.139005694770813, + "test_acc": 0.2922, + "lyapunov": null, + "grad_norm": 2.097068048120337, + "grad_max_sv": 1.1334303438663482, + "grad_min_sv": 4.030898569928887e-08, + "grad_condition": 47058431.20376512, + "lr": 0.0009929980185352525, + "time_sec": 15.508616924285889 + }, + { + "epoch": 9, + "train_loss": 1.9553286380004882, + "train_acc": 0.47388, + "test_loss": 3.06018212890625, + "test_acc": 0.2879, + "lyapunov": null, + "grad_norm": 1.9713724036682645, + "grad_max_sv": 1.038258707523346, + "grad_min_sv": 3.804477004820672e-08, + "grad_condition": 77979087.0502029, + "lr": 0.0009911436253643444, + "time_sec": 15.48607587814331 + }, + { + "epoch": 10, + "train_loss": 1.8515163943099975, + "train_acc": 0.49774, + "test_loss": 2.287493668937683, + "test_acc": 0.4192, + "lyapunov": null, + "grad_norm": 1.8543819342692063, + "grad_max_sv": 0.9413492172956467, + "grad_min_sv": 3.5232182887812157e-08, + "grad_condition": 36736583.24879627, + "lr": 0.0009890738003669028, + "time_sec": 15.491151571273804 + }, + { + "epoch": 11, + "train_loss": 1.7691326560211182, + "train_acc": 0.51778, + "test_loss": 2.5470476570129397, + "test_acc": 0.3842, + "lyapunov": null, + "grad_norm": 1.768792816734991, + "grad_max_sv": 0.8943161860108375, + "grad_min_sv": 3.4390645303750134e-08, + "grad_condition": 45963677.14752157, + "lr": 0.00098678945143658, + "time_sec": 15.483253002166748 + }, + { + "epoch": 12, + "train_loss": 1.7075069317245484, + "train_acc": 0.53152, + "test_loss": 2.238752745628357, + "test_acc": 0.4335, + "lyapunov": null, + "grad_norm": 1.7084576219376304, + "grad_max_sv": 0.8465132102370262, + "grad_min_sv": 3.267220019254058e-08, + "grad_condition": 51222076.76950155, + "lr": 0.0009842915805643154, + "time_sec": 15.505992412567139 + }, + { + "epoch": 13, + "train_loss": 1.6453962017059327, + "train_acc": 0.54646, + "test_loss": 2.2896381731033326, + "test_acc": 0.4371, + "lyapunov": null, + "grad_norm": 1.629227704057604, + "grad_max_sv": 0.7849430561065673, + "grad_min_sv": 3.048308783726306e-08, + "grad_condition": 49261336.09204699, + "lr": 0.000981581283398829, + "time_sec": 15.521925926208496 + }, + { + "epoch": 14, + "train_loss": 1.583652059249878, + "train_acc": 0.559, + "test_loss": 2.231475386047363, + "test_acc": 0.4447, + "lyapunov": null, + "grad_norm": 1.5707542622000317, + "grad_max_sv": 0.7640527755022049, + "grad_min_sv": 2.978501200262551e-08, + "grad_condition": 62214276.83025722, + "lr": 0.0009786597487660333, + "time_sec": 15.50330901145935 + }, + { + "epoch": 15, + "train_loss": 1.5233635874176026, + "train_acc": 0.57468, + "test_loss": 2.3873890338897703, + "test_acc": 0.4225, + "lyapunov": null, + "grad_norm": 1.5152337058048917, + "grad_max_sv": 0.7098304882645607, + "grad_min_sv": 2.8289248441004666e-08, + "grad_condition": 37683711.46213076, + "lr": 0.0009755282581475766, + "time_sec": 15.519577026367188 + }, + { + "epoch": 16, + "train_loss": 1.4734115508651733, + "train_acc": 0.58734, + "test_loss": 2.1620190448760988, + "test_acc": 0.4513, + "lyapunov": null, + "grad_norm": 1.4620144380830962, + "grad_max_sv": 0.6853510558605194, + "grad_min_sv": 2.7198121724594793e-08, + "grad_condition": 137021461.41215044, + "lr": 0.0009721881851187403, + "time_sec": 15.513172388076782 + }, + { + "epoch": 17, + "train_loss": 1.431630831222534, + "train_acc": 0.59564, + "test_loss": 1.9172396266937255, + "test_acc": 0.5024, + "lyapunov": null, + "grad_norm": 1.4276998910319496, + "grad_max_sv": 0.6633460417389869, + "grad_min_sv": 2.6781568132627776e-08, + "grad_condition": 41230574.51697217, + "lr": 0.0009686409947459456, + "time_sec": 15.516494750976562 + }, + { + "epoch": 18, + "train_loss": 1.3981995740127564, + "train_acc": 0.60392, + "test_loss": 2.1783405241012574, + "test_acc": 0.4624, + "lyapunov": null, + "grad_norm": 1.3826851562537303, + "grad_max_sv": 0.642112186551094, + "grad_min_sv": 2.605378342582232e-08, + "grad_condition": 70245110.5573006, + "lr": 0.0009648882429441254, + "time_sec": 15.527103185653687 + }, + { + "epoch": 19, + "train_loss": 1.3383694774627686, + "train_acc": 0.61906, + "test_loss": 2.2048003927230835, + "test_acc": 0.4565, + "lyapunov": null, + "grad_norm": 1.3417355395808768, + "grad_max_sv": 0.6297966443002224, + "grad_min_sv": 2.567137112885476e-08, + "grad_condition": 39411867.34818512, + "lr": 0.00096093157579425, + "time_sec": 15.498464107513428 + }, + { + "epoch": 20, + "train_loss": 1.2989597080612183, + "train_acc": 0.62828, + "test_loss": 2.1187970054626466, + "test_acc": 0.4759, + "lyapunov": null, + "grad_norm": 1.310174265483923, + "grad_max_sv": 0.5846366092562676, + "grad_min_sv": 2.433472365281908e-08, + "grad_condition": 41729077.3118221, + "lr": 0.0009567727288213001, + "time_sec": 15.521925449371338 + }, + { + "epoch": 21, + "train_loss": 1.2696203424072265, + "train_acc": 0.63738, + "test_loss": 2.017310855102539, + "test_acc": 0.498, + "lyapunov": null, + "grad_norm": 1.2788912160386405, + "grad_max_sv": 0.5787257492542267, + "grad_min_sv": 2.3941703536367598e-08, + "grad_condition": 35819914.448526636, + "lr": 0.0009524135262330095, + "time_sec": 15.542917966842651 + }, + { + "epoch": 22, + "train_loss": 1.2354631609344482, + "train_acc": 0.64396, + "test_loss": 2.263232828140259, + "test_acc": 0.4598, + "lyapunov": null, + "grad_norm": 1.2570154376068237, + "grad_max_sv": 0.5728676535189152, + "grad_min_sv": 2.366019752966797e-08, + "grad_condition": 131457468.84297612, + "lr": 0.0009478558801197061, + "time_sec": 15.517506837844849 + }, + { + "epoch": 23, + "train_loss": 1.1960591842269896, + "train_acc": 0.65442, + "test_loss": 1.7755502307891846, + "test_acc": 0.5416, + "lyapunov": null, + "grad_norm": 1.224198984956637, + "grad_max_sv": 0.5530765049159527, + "grad_min_sv": 2.2842870851802477e-08, + "grad_condition": 77533795.14185917, + "lr": 0.000943101789615607, + "time_sec": 15.505609512329102 + }, + { + "epoch": 24, + "train_loss": 1.1622001237487793, + "train_acc": 0.66348, + "test_loss": 1.9274122953414916, + "test_acc": 0.5097, + "lyapunov": null, + "grad_norm": 1.200614940809103, + "grad_max_sv": 0.5359078221023083, + "grad_min_sv": 2.2578253261462676e-08, + "grad_condition": 35876257.64226432, + "lr": 0.0009381533400219313, + "time_sec": 15.532605648040771 + }, + { + "epoch": 25, + "train_loss": 1.1352633666992187, + "train_acc": 0.66762, + "test_loss": 1.875099267578125, + "test_acc": 0.5225, + "lyapunov": null, + "grad_norm": 1.1758911900864482, + "grad_max_sv": 0.52755291685462, + "grad_min_sv": 2.204597005367459e-08, + "grad_condition": 49952571.97210871, + "lr": 0.0009330127018922189, + "time_sec": 15.546083450317383 + }, + { + "epoch": 26, + "train_loss": 1.1007922913360595, + "train_acc": 0.67576, + "test_loss": 1.9364961219787598, + "test_acc": 0.5179, + "lyapunov": null, + "grad_norm": 1.1568297424160785, + "grad_max_sv": 0.509132108092308, + "grad_min_sv": 2.1692141624618522e-08, + "grad_condition": 31942028.007370222, + "lr": 0.000927682130080253, + "time_sec": 15.529866456985474 + }, + { + "epoch": 27, + "train_loss": 1.0767492464828492, + "train_acc": 0.68284, + "test_loss": 1.8350654315948487, + "test_acc": 0.5356, + "lyapunov": null, + "grad_norm": 1.1437020183690754, + "grad_max_sv": 0.5028271451592445, + "grad_min_sv": 2.0899893600143103e-08, + "grad_condition": 110961134.04101834, + "lr": 0.0009221639627510072, + "time_sec": 15.512263774871826 + }, + { + "epoch": 28, + "train_loss": 1.046666657180786, + "train_acc": 0.69276, + "test_loss": 1.7424863245010376, + "test_acc": 0.555, + "lyapunov": null, + "grad_norm": 1.1208714755249298, + "grad_max_sv": 0.4959542900323868, + "grad_min_sv": 2.0676914266187786e-08, + "grad_condition": 101016033.05430314, + "lr": 0.0009164606203550494, + "time_sec": 15.524545192718506 + }, + { + "epoch": 29, + "train_loss": 1.0245877030944823, + "train_acc": 0.69756, + "test_loss": 1.8015550178527833, + "test_acc": 0.5461, + "lyapunov": null, + "grad_norm": 1.0975980976876525, + "grad_max_sv": 0.5063327789306641, + "grad_min_sv": 2.0803712974526434e-08, + "grad_condition": 39600116.138457105, + "lr": 0.0009105746045668516, + "time_sec": 15.59637975692749 + }, + { + "epoch": 30, + "train_loss": 0.9965687858200073, + "train_acc": 0.70398, + "test_loss": 1.8630317890167236, + "test_acc": 0.5361, + "lyapunov": null, + "grad_norm": 1.085671076034073, + "grad_max_sv": 0.48614486977458, + "grad_min_sv": 2.0165644172565055e-08, + "grad_condition": 49392575.5692039, + "lr": 0.0009045084971874733, + "time_sec": 15.563995122909546 + }, + { + "epoch": 31, + "train_loss": 0.9731001928901672, + "train_acc": 0.71184, + "test_loss": 1.8755411792755128, + "test_acc": 0.5353, + "lyapunov": null, + "grad_norm": 1.0679123024514685, + "grad_max_sv": 0.4686537399888039, + "grad_min_sv": 1.968864739628623e-08, + "grad_condition": 240929504.49198055, + "lr": 0.0008982649590120977, + "time_sec": 15.52276349067688 + }, + { + "epoch": 32, + "train_loss": 0.9574742518615723, + "train_acc": 0.71522, + "test_loss": 1.966079172515869, + "test_acc": 0.5257, + "lyapunov": null, + "grad_norm": 1.0549795383573466, + "grad_max_sv": 0.46632925793528557, + "grad_min_sv": 1.951352061593456e-08, + "grad_condition": 295342313.37488973, + "lr": 0.0008918467286629196, + "time_sec": 15.520017385482788 + }, + { + "epoch": 33, + "train_loss": 0.9316390480804443, + "train_acc": 0.721, + "test_loss": 1.8315558645248413, + "test_acc": 0.5401, + "lyapunov": null, + "grad_norm": 1.034011012270133, + "grad_max_sv": 0.4538381576538086, + "grad_min_sv": 1.9127925688505742e-08, + "grad_condition": 62099518.07834904, + "lr": 0.0008852566213878943, + "time_sec": 15.512933492660522 + }, + { + "epoch": 34, + "train_loss": 0.9120938426017762, + "train_acc": 0.7261, + "test_loss": 1.7715516666412354, + "test_acc": 0.56, + "lyapunov": null, + "grad_norm": 1.018012226306812, + "grad_max_sv": 0.4342078812420368, + "grad_min_sv": 1.863907480720295e-08, + "grad_condition": 55521122.14975482, + "lr": 0.000878497527825878, + "time_sec": 15.513373374938965 + }, + { + "epoch": 35, + "train_loss": 0.8977002004814147, + "train_acc": 0.7291, + "test_loss": 1.8452600439071656, + "test_acc": 0.5518, + "lyapunov": null, + "grad_norm": 1.0178881474508787, + "grad_max_sv": 0.44193900674581527, + "grad_min_sv": 1.8550129185501697e-08, + "grad_condition": 93431923.09371561, + "lr": 0.000871572412738697, + "time_sec": 15.527926445007324 + }, + { + "epoch": 36, + "train_loss": 0.8736581074142457, + "train_acc": 0.73646, + "test_loss": 2.0875708852767945, + "test_acc": 0.5136, + "lyapunov": null, + "grad_norm": 0.9933147429061643, + "grad_max_sv": 0.4358292184770107, + "grad_min_sv": 1.7923193362801016e-08, + "grad_condition": 41313615.5111606, + "lr": 0.0008644843137107055, + "time_sec": 15.528854131698608 + }, + { + "epoch": 37, + "train_loss": 0.8518191300582886, + "train_acc": 0.74148, + "test_loss": 1.8187555240631104, + "test_acc": 0.5565, + "lyapunov": null, + "grad_norm": 0.9863366017587146, + "grad_max_sv": 0.4345082275569439, + "grad_min_sv": 1.8289939288096414e-08, + "grad_condition": 37135379.43907313, + "lr": 0.0008572363398164014, + "time_sec": 15.514251232147217 + }, + { + "epoch": 38, + "train_loss": 0.8278528201293945, + "train_acc": 0.74744, + "test_loss": 1.8957544691085815, + "test_acc": 0.5479, + "lyapunov": null, + "grad_norm": 0.9718366328703895, + "grad_max_sv": 0.4258884690701962, + "grad_min_sv": 1.7940690534568037e-08, + "grad_condition": 38161268.62452008, + "lr": 0.0008498316702566826, + "time_sec": 15.506083726882935 + }, + { + "epoch": 39, + "train_loss": 0.798656528968811, + "train_acc": 0.75718, + "test_loss": 1.9370916620254517, + "test_acc": 0.5443, + "lyapunov": null, + "grad_norm": 0.9514934716586184, + "grad_max_sv": 0.40630103424191477, + "grad_min_sv": 1.7226211236620602e-08, + "grad_condition": 63755454.2160631, + "lr": 0.0008422735529643442, + "time_sec": 15.525374412536621 + }, + { + "epoch": 40, + "train_loss": 0.7949527891349792, + "train_acc": 0.75612, + "test_loss": 1.9300818992614746, + "test_acc": 0.5444, + "lyapunov": null, + "grad_norm": 0.9518849566802269, + "grad_max_sv": 0.41264484599232676, + "grad_min_sv": 1.7320033419976345e-08, + "grad_condition": 71258340.68307252, + "lr": 0.0008345653031794289, + "time_sec": 15.514223098754883 + }, + { + "epoch": 41, + "train_loss": 0.7800736420440674, + "train_acc": 0.76092, + "test_loss": 2.1826710233688353, + "test_acc": 0.5121, + "lyapunov": null, + "grad_norm": 0.9421685148359034, + "grad_max_sv": 0.40409224331378935, + "grad_min_sv": 1.691150508667874e-08, + "grad_condition": 345654413.3917384, + "lr": 0.0008267103019950526, + "time_sec": 15.510631322860718 + }, + { + "epoch": 42, + "train_loss": 0.7606543594741821, + "train_acc": 0.76552, + "test_loss": 1.7444187334060668, + "test_acc": 0.5761, + "lyapunov": null, + "grad_norm": 0.9302180534057477, + "grad_max_sv": 0.4034069195389748, + "grad_min_sv": 1.674752794118828e-08, + "grad_condition": 187498474.59295964, + "lr": 0.0008187119948743447, + "time_sec": 15.507594585418701 + }, + { + "epoch": 43, + "train_loss": 0.7451812291145324, + "train_acc": 0.76968, + "test_loss": 1.820609942626953, + "test_acc": 0.5634, + "lyapunov": null, + "grad_norm": 0.9187888919616172, + "grad_max_sv": 0.394838485121727, + "grad_min_sv": 1.6672148600571644e-08, + "grad_condition": 56769710.51124905, + "lr": 0.000810573890139155, + "time_sec": 15.512874603271484 + }, + { + "epoch": 44, + "train_loss": 0.7292991390800476, + "train_acc": 0.77396, + "test_loss": 1.8102552856445313, + "test_acc": 0.5634, + "lyapunov": null, + "grad_norm": 0.9089946204958224, + "grad_max_sv": 0.39304503202438357, + "grad_min_sv": 1.6251661138361184e-08, + "grad_condition": 193447433.86841393, + "lr": 0.0008022995574311873, + "time_sec": 15.537316083908081 + }, + { + "epoch": 45, + "train_loss": 0.7157383707046509, + "train_acc": 0.77738, + "test_loss": 1.8844748260498048, + "test_acc": 0.5593, + "lyapunov": null, + "grad_norm": 0.8994653204683742, + "grad_max_sv": 0.3988529540598392, + "grad_min_sv": 1.6325957580970442e-08, + "grad_condition": 54473409.952947155, + "lr": 0.0007938926261462363, + "time_sec": 15.51323914527893 + }, + { + "epoch": 46, + "train_loss": 0.6963709331703186, + "train_acc": 0.78558, + "test_loss": 1.8685519542694091, + "test_acc": 0.563, + "lyapunov": null, + "grad_norm": 0.8836539374270754, + "grad_max_sv": 0.38309651911258696, + "grad_min_sv": 1.622744421926614e-08, + "grad_condition": 3231715814.638464, + "lr": 0.0007853567838422158, + "time_sec": 15.551738262176514 + }, + { + "epoch": 47, + "train_loss": 0.6900019631767272, + "train_acc": 0.78668, + "test_loss": 1.811813512802124, + "test_acc": 0.5763, + "lyapunov": null, + "grad_norm": 0.8854563355184056, + "grad_max_sv": 0.37948372438549993, + "grad_min_sv": 1.591407078824214e-08, + "grad_condition": 86097943.52094127, + "lr": 0.0007766957746216719, + "time_sec": 15.52332854270935 + }, + { + "epoch": 48, + "train_loss": 0.6717638036727905, + "train_acc": 0.7908, + "test_loss": 1.9893609804153443, + "test_acc": 0.5507, + "lyapunov": null, + "grad_norm": 0.8721188285130878, + "grad_max_sv": 0.3669671848416328, + "grad_min_sv": 1.5458188379704507e-08, + "grad_condition": 720626524.2072407, + "lr": 0.0007679133974894982, + "time_sec": 15.529719114303589 + }, + { + "epoch": 49, + "train_loss": 0.652132972278595, + "train_acc": 0.79636, + "test_loss": 1.871591491317749, + "test_acc": 0.5706, + "lyapunov": null, + "grad_norm": 0.8610127100132879, + "grad_max_sv": 0.3813806749880314, + "grad_min_sv": 1.5637395279349818e-08, + "grad_condition": 67273400.43069258, + "lr": 0.000759013504686565, + "time_sec": 15.516782522201538 + }, + { + "epoch": 50, + "train_loss": 0.6417575373268127, + "train_acc": 0.7999, + "test_loss": 1.8759121324539185, + "test_acc": 0.5687, + "lyapunov": null, + "grad_norm": 0.8591044618003006, + "grad_max_sv": 0.38072986006736753, + "grad_min_sv": 1.565713501627819e-08, + "grad_condition": 55185790.37378442, + "lr": 0.0007499999999999998, + "time_sec": 15.543827533721924 + }, + { + "epoch": 51, + "train_loss": 0.6307680229568482, + "train_acc": 0.79994, + "test_loss": 1.9557111139297485, + "test_acc": 0.5642, + "lyapunov": null, + "grad_norm": 0.8496261914652145, + "grad_max_sv": 0.38124899938702583, + "grad_min_sv": 1.580709338699915e-08, + "grad_condition": 67955800.0382034, + "lr": 0.0007408768370508575, + "time_sec": 15.528074502944946 + }, + { + "epoch": 52, + "train_loss": 0.6069645390129089, + "train_acc": 0.8104, + "test_loss": 1.8226323192596436, + "test_acc": 0.5778, + "lyapunov": null, + "grad_norm": 0.8325663719029547, + "grad_max_sv": 0.3573085680603981, + "grad_min_sv": 1.4999965303533202e-08, + "grad_condition": 117426728.55119577, + "lr": 0.0007316480175599307, + "time_sec": 15.539650917053223 + }, + { + "epoch": 53, + "train_loss": 0.5986839054489136, + "train_acc": 0.81126, + "test_loss": 1.9225407358169555, + "test_acc": 0.5703, + "lyapunov": null, + "grad_norm": 0.8295876660526361, + "grad_max_sv": 0.3688795052468777, + "grad_min_sv": 1.5020806476331165e-08, + "grad_condition": 743822598.6922982, + "lr": 0.0007223175895924635, + "time_sec": 15.524444103240967 + }, + { + "epoch": 54, + "train_loss": 0.5895059976959228, + "train_acc": 0.81418, + "test_loss": 1.8881375560760498, + "test_acc": 0.5708, + "lyapunov": null, + "grad_norm": 0.818745610011949, + "grad_max_sv": 0.3618172124028206, + "grad_min_sv": 1.4792169821236518e-08, + "grad_condition": 311609952.49503106, + "lr": 0.0007128896457825361, + "time_sec": 15.522985935211182 + }, + { + "epoch": 55, + "train_loss": 0.5790713099765777, + "train_acc": 0.81868, + "test_loss": 1.851567367553711, + "test_acc": 0.5823, + "lyapunov": null, + "grad_norm": 0.8187745614092103, + "grad_max_sv": 0.3530171699821949, + "grad_min_sv": 1.452992542064907e-08, + "grad_condition": 155586172.7557343, + "lr": 0.0007033683215378998, + "time_sec": 15.516283750534058 + }, + { + "epoch": 56, + "train_loss": 0.5677402771568298, + "train_acc": 0.822, + "test_loss": 1.8971572834014891, + "test_acc": 0.5741, + "lyapunov": null, + "grad_norm": 0.8109973851194381, + "grad_max_sv": 0.35008599534630774, + "grad_min_sv": 1.4616400946347585e-08, + "grad_condition": 122954701.90391079, + "lr": 0.0006937577932260512, + "time_sec": 15.534748792648315 + }, + { + "epoch": 57, + "train_loss": 0.5641013541221619, + "train_acc": 0.82468, + "test_loss": 1.8544835914611817, + "test_acc": 0.5803, + "lyapunov": null, + "grad_norm": 0.8033724572915313, + "grad_max_sv": 0.344899994507432, + "grad_min_sv": 1.4224262010636459e-08, + "grad_condition": 1377225234.7418208, + "lr": 0.0006840622763423388, + "time_sec": 15.513275384902954 + }, + { + "epoch": 58, + "train_loss": 0.5405077212142945, + "train_acc": 0.83038, + "test_loss": 1.970599070739746, + "test_acc": 0.564, + "lyapunov": null, + "grad_norm": 0.7927873462878091, + "grad_max_sv": 0.3396155469119549, + "grad_min_sv": 1.3780443174418732e-08, + "grad_condition": 182519018.73843473, + "lr": 0.0006742860236609073, + "time_sec": 15.554621934890747 + }, + { + "epoch": 59, + "train_loss": 0.5328652268409729, + "train_acc": 0.83082, + "test_loss": 1.8392395721435546, + "test_acc": 0.5876, + "lyapunov": null, + "grad_norm": 0.7894763440743573, + "grad_max_sv": 0.3522858999669552, + "grad_min_sv": 1.4281633905349755e-08, + "grad_condition": 109810093.02889256, + "lr": 0.0006644333233692913, + "time_sec": 15.517175674438477 + }, + { + "epoch": 60, + "train_loss": 0.5278578138160706, + "train_acc": 0.83336, + "test_loss": 2.0256912494659423, + "test_acc": 0.5601, + "lyapunov": null, + "grad_norm": 0.7805932399493629, + "grad_max_sv": 0.33713038042187693, + "grad_min_sv": 1.3718366050075038e-08, + "grad_condition": 215530844.85079318, + "lr": 0.0006545084971874734, + "time_sec": 15.505738019943237 + }, + { + "epoch": 61, + "train_loss": 0.5176565620994568, + "train_acc": 0.83556, + "test_loss": 1.9843173877716065, + "test_acc": 0.5662, + "lyapunov": null, + "grad_norm": 0.7781213617860828, + "grad_max_sv": 0.34235822334885596, + "grad_min_sv": 1.3829460821304651e-08, + "grad_condition": 166938522.97901836, + "lr": 0.0006445158984722354, + "time_sec": 15.510056972503662 + }, + { + "epoch": 62, + "train_loss": 0.5051395326137543, + "train_acc": 0.83992, + "test_loss": 1.8313960775375366, + "test_acc": 0.5831, + "lyapunov": null, + "grad_norm": 0.7649243890515134, + "grad_max_sv": 0.3260902684181929, + "grad_min_sv": 1.3774559579418644e-08, + "grad_condition": 82478486.92255004, + "lr": 0.0006344599103076324, + "time_sec": 15.541491270065308 + }, + { + "epoch": 63, + "train_loss": 0.49586085123062135, + "train_acc": 0.84164, + "test_loss": 1.9260399576187133, + "test_acc": 0.5748, + "lyapunov": null, + "grad_norm": 0.7652357534403171, + "grad_max_sv": 0.34158613085746764, + "grad_min_sv": 1.3498082356271784e-08, + "grad_condition": 263543331.4884905, + "lr": 0.0006243449435824269, + "time_sec": 15.52653431892395 + }, + { + "epoch": 64, + "train_loss": 0.4807168690109253, + "train_acc": 0.84668, + "test_loss": 1.8585652179718017, + "test_acc": 0.5873, + "lyapunov": null, + "grad_norm": 0.7513551904434514, + "grad_max_sv": 0.3280766326934099, + "grad_min_sv": 1.3634163315012771e-08, + "grad_condition": 57055577.557981655, + "lr": 0.0006141754350553275, + "time_sec": 15.526658535003662 + }, + { + "epoch": 65, + "train_loss": 0.47260116580963135, + "train_acc": 0.84834, + "test_loss": 1.9012826635360718, + "test_acc": 0.5776, + "lyapunov": null, + "grad_norm": 0.7483579760337495, + "grad_max_sv": 0.32314833588898184, + "grad_min_sv": 1.3236332240852689e-08, + "grad_condition": 301375478.05543464, + "lr": 0.0006039558454088793, + "time_sec": 15.532294988632202 + }, + { + "epoch": 66, + "train_loss": 0.46123015544891355, + "train_acc": 0.85242, + "test_loss": 1.9859778638839722, + "test_acc": 0.5735, + "lyapunov": null, + "grad_norm": 0.7421019055709072, + "grad_max_sv": 0.3263105019927025, + "grad_min_sv": 1.3596849376355108e-08, + "grad_condition": 313983387.1066474, + "lr": 0.000593690657292862, + "time_sec": 15.5251145362854 + }, + { + "epoch": 67, + "train_loss": 0.4601145356178284, + "train_acc": 0.85254, + "test_loss": 1.8722857538223268, + "test_acc": 0.5841, + "lyapunov": null, + "grad_norm": 0.7408779549862098, + "grad_max_sv": 0.3230173833668232, + "grad_min_sv": 1.340270877701194e-08, + "grad_condition": 254415771.74014935, + "lr": 0.0005833843733580507, + "time_sec": 15.547546625137329 + }, + { + "epoch": 68, + "train_loss": 0.4442843551063538, + "train_acc": 0.85846, + "test_loss": 1.9014101182937622, + "test_acc": 0.5901, + "lyapunov": null, + "grad_norm": 0.726390105657036, + "grad_max_sv": 0.31147900260984895, + "grad_min_sv": 1.2510136173510267e-08, + "grad_condition": 74933256.04093306, + "lr": 0.0005730415142812054, + "time_sec": 15.552660703659058 + }, + { + "epoch": 69, + "train_loss": 0.43935043266296386, + "train_acc": 0.85762, + "test_loss": 1.8650325706481934, + "test_acc": 0.597, + "lyapunov": null, + "grad_norm": 0.7246554453569696, + "grad_max_sv": 0.31471570432186124, + "grad_min_sv": 1.2821802319006037e-08, + "grad_condition": 380382985.75691664, + "lr": 0.0005626666167821517, + "time_sec": 15.537629127502441 + }, + { + "epoch": 70, + "train_loss": 0.4237213344478607, + "train_acc": 0.86326, + "test_loss": 1.9569523294448852, + "test_acc": 0.5852, + "lyapunov": null, + "grad_norm": 0.7192339976242655, + "grad_max_sv": 0.31687899492681026, + "grad_min_sv": 1.2885098506741632e-08, + "grad_condition": 170905682.3340375, + "lr": 0.0005522642316338265, + "time_sec": 15.540661811828613 + }, + { + "epoch": 71, + "train_loss": 0.4210721292114258, + "train_acc": 0.86542, + "test_loss": 1.8978070093154906, + "test_acc": 0.5901, + "lyapunov": null, + "grad_norm": 0.7126602595414533, + "grad_max_sv": 0.31185401007533076, + "grad_min_sv": 1.2703713765660484e-08, + "grad_condition": 109451591.5178098, + "lr": 0.0005418389216661573, + "time_sec": 15.52872371673584 + }, + { + "epoch": 72, + "train_loss": 0.4073511661529541, + "train_acc": 0.86814, + "test_loss": 1.9296504669189454, + "test_acc": 0.5799, + "lyapunov": null, + "grad_norm": 0.7043070251395208, + "grad_max_sv": 0.3181886296719313, + "grad_min_sv": 1.293510755832894e-08, + "grad_condition": 114381253.05033526, + "lr": 0.0005313952597646563, + "time_sec": 15.533472299575806 + }, + { + "epoch": 73, + "train_loss": 0.402773690700531, + "train_acc": 0.8694, + "test_loss": 1.9097788103103637, + "test_acc": 0.5862, + "lyapunov": null, + "grad_norm": 0.6990408270244555, + "grad_max_sv": 0.3128418132662773, + "grad_min_sv": 1.2784014379778677e-08, + "grad_condition": 285713754.94993323, + "lr": 0.0005209378268645994, + "time_sec": 15.534166812896729 + }, + { + "epoch": 74, + "train_loss": 0.3923648566055298, + "train_acc": 0.87324, + "test_loss": 2.03479278717041, + "test_acc": 0.5731, + "lyapunov": null, + "grad_norm": 0.6947288015374449, + "grad_max_sv": 0.30756589137017726, + "grad_min_sv": 1.2547299702361792e-08, + "grad_condition": 96096022.64687933, + "lr": 0.0005104712099416781, + "time_sec": 15.532297134399414 + }, + { + "epoch": 75, + "train_loss": 0.3855631015777588, + "train_acc": 0.87418, + "test_loss": 1.9891023809432984, + "test_acc": 0.5829, + "lyapunov": null, + "grad_norm": 0.6909138607463989, + "grad_max_sv": 0.3085081819444895, + "grad_min_sv": 1.2179017949351389e-08, + "grad_condition": 181155822.36130485, + "lr": 0.0004999999999999996, + "time_sec": 15.53008222579956 + }, + { + "epoch": 76, + "train_loss": 0.38342618799209593, + "train_acc": 0.87512, + "test_loss": 1.9072554616928101, + "test_acc": 0.5857, + "lyapunov": null, + "grad_norm": 0.6904521379873841, + "grad_max_sv": 0.2994091097265482, + "grad_min_sv": 1.2141872210783e-08, + "grad_condition": 376685212.82283676, + "lr": 0.0004895287900583212, + "time_sec": 15.53481936454773 + }, + { + "epoch": 77, + "train_loss": 0.3725630757713318, + "train_acc": 0.879, + "test_loss": 1.9034398189544677, + "test_acc": 0.5909, + "lyapunov": null, + "grad_norm": 0.6822282432684434, + "grad_max_sv": 0.30867698080837724, + "grad_min_sv": 1.2084137563164733e-08, + "grad_condition": 124507553.7311234, + "lr": 0.0004790621731353997, + "time_sec": 15.53526520729065 + }, + { + "epoch": 78, + "train_loss": 0.36642052476882936, + "train_acc": 0.88036, + "test_loss": 2.005714999771118, + "test_acc": 0.5791, + "lyapunov": null, + "grad_norm": 0.6791157792781891, + "grad_max_sv": 0.3038751546293497, + "grad_min_sv": 1.207316775980044e-08, + "grad_condition": 349442982.68712926, + "lr": 0.000468604740235343, + "time_sec": 15.530872821807861 + }, + { + "epoch": 79, + "train_loss": 0.3598951160621643, + "train_acc": 0.88272, + "test_loss": 1.9046739515304565, + "test_acc": 0.5988, + "lyapunov": null, + "grad_norm": 0.6729333436216095, + "grad_max_sv": 0.2982245538383722, + "grad_min_sv": 1.1723929679136568e-08, + "grad_condition": 1205163983.0705116, + "lr": 0.00045816107833384175, + "time_sec": 15.522129774093628 + }, + { + "epoch": 80, + "train_loss": 0.3540581908321381, + "train_acc": 0.88478, + "test_loss": 1.9243260189056397, + "test_acc": 0.5951, + "lyapunov": null, + "grad_norm": 0.6669931804639248, + "grad_max_sv": 0.3037246517837048, + "grad_min_sv": 1.2220161819086195e-08, + "grad_condition": 223413264.33208403, + "lr": 0.0004477357683661729, + "time_sec": 15.549994230270386 + }, + { + "epoch": 81, + "train_loss": 0.34355100545883177, + "train_acc": 0.88742, + "test_loss": 1.9262817459106445, + "test_acc": 0.5958, + "lyapunov": null, + "grad_norm": 0.6569466554473731, + "grad_max_sv": 0.29243352748453616, + "grad_min_sv": 1.170117877253088e-08, + "grad_condition": 464973323.75393283, + "lr": 0.00043733338321784746, + "time_sec": 15.547070503234863 + }, + { + "epoch": 82, + "train_loss": 0.34255793330192563, + "train_acc": 0.88874, + "test_loss": 1.9720558526992797, + "test_acc": 0.5872, + "lyapunov": null, + "grad_norm": 0.6552470780369282, + "grad_max_sv": 0.2913744479417801, + "grad_min_sv": 1.1602940852128291e-08, + "grad_condition": 379547195.8692357, + "lr": 0.0004269584857187939, + "time_sec": 15.539148807525635 + }, + { + "epoch": 83, + "train_loss": 0.33223292098999024, + "train_acc": 0.89188, + "test_loss": 2.019339463806152, + "test_acc": 0.585, + "lyapunov": null, + "grad_norm": 0.6482255503134596, + "grad_max_sv": 0.29046328365802765, + "grad_min_sv": 1.167401027790671e-08, + "grad_condition": 268408260.80112848, + "lr": 0.0004166156266419484, + "time_sec": 15.544889688491821 + }, + { + "epoch": 84, + "train_loss": 0.32708690958976744, + "train_acc": 0.89336, + "test_loss": 1.9602216457366943, + "test_acc": 0.5938, + "lyapunov": null, + "grad_norm": 0.6433934813074033, + "grad_max_sv": 0.2879111871123314, + "grad_min_sv": 1.1351589188253464e-08, + "grad_condition": 188243954.40924165, + "lr": 0.0004063093427071373, + "time_sec": 15.550781965255737 + }, + { + "epoch": 85, + "train_loss": 0.31329795719623565, + "train_acc": 0.8972, + "test_loss": 1.991354573059082, + "test_acc": 0.5942, + "lyapunov": null, + "grad_norm": 0.6339396843798872, + "grad_max_sv": 0.28407732769846916, + "grad_min_sv": 1.1356117259747612e-08, + "grad_condition": 64588865.71423088, + "lr": 0.0003960441545911199, + "time_sec": 15.540690422058105 + }, + { + "epoch": 86, + "train_loss": 0.31019552572250364, + "train_acc": 0.89866, + "test_loss": 1.9719594646453857, + "test_acc": 0.5916, + "lyapunov": null, + "grad_norm": 0.6314602087474198, + "grad_max_sv": 0.2975065462291241, + "grad_min_sv": 1.1250381844012114e-08, + "grad_condition": 267735889.39588803, + "lr": 0.0003858245649446718, + "time_sec": 15.549985647201538 + }, + { + "epoch": 87, + "train_loss": 0.30400290882587433, + "train_acc": 0.90182, + "test_loss": 1.942669277191162, + "test_acc": 0.5984, + "lyapunov": null, + "grad_norm": 0.6234369716199227, + "grad_max_sv": 0.2763492401689291, + "grad_min_sv": 1.0957708114665777e-08, + "grad_condition": 5505096156.702031, + "lr": 0.00037565505641757235, + "time_sec": 15.53608751296997 + }, + { + "epoch": 88, + "train_loss": 0.3001856433391571, + "train_acc": 0.90274, + "test_loss": 2.014521084976196, + "test_acc": 0.5937, + "lyapunov": null, + "grad_norm": 0.6239192041834897, + "grad_max_sv": 0.28164005614817145, + "grad_min_sv": 1.1160251596519303e-08, + "grad_condition": 533470961.33396375, + "lr": 0.00036554008969236695, + "time_sec": 15.56088900566101 + }, + { + "epoch": 89, + "train_loss": 0.30338367694854734, + "train_acc": 0.90064, + "test_loss": 1.979864009284973, + "test_acc": 0.6017, + "lyapunov": null, + "grad_norm": 0.6299076254668111, + "grad_max_sv": 0.2958707671612501, + "grad_min_sv": 1.13771603407406e-08, + "grad_condition": 134758675.13849258, + "lr": 0.0003554841015277638, + "time_sec": 15.550455093383789 + }, + { + "epoch": 90, + "train_loss": 0.2935330862474442, + "train_acc": 0.90366, + "test_loss": 1.9741040142059325, + "test_acc": 0.6007, + "lyapunov": null, + "grad_norm": 0.6206987643782347, + "grad_max_sv": 0.2804367758333683, + "grad_min_sv": 1.0834553977861344e-08, + "grad_condition": 214777124.87099543, + "lr": 0.000345491502812526, + "time_sec": 15.536914110183716 + }, + { + "epoch": 91, + "train_loss": 0.2862379360961914, + "train_acc": 0.90742, + "test_loss": 1.9401994998931884, + "test_acc": 0.6104, + "lyapunov": null, + "grad_norm": 0.6086508393860313, + "grad_max_sv": 0.2811594821512699, + "grad_min_sv": 1.092561629813249e-08, + "grad_condition": 271875410.4752922, + "lr": 0.0003355666766307081, + "time_sec": 15.532741785049438 + }, + { + "epoch": 92, + "train_loss": 0.2794467659568787, + "train_acc": 0.909, + "test_loss": 1.9841965021133423, + "test_acc": 0.5991, + "lyapunov": null, + "grad_norm": 0.6027972331709979, + "grad_max_sv": 0.28370837941765786, + "grad_min_sv": 1.0951137730322303e-08, + "grad_condition": 527178528.5349765, + "lr": 0.00032571397633909225, + "time_sec": 15.541855573654175 + }, + { + "epoch": 93, + "train_loss": 0.27913901576042177, + "train_acc": 0.90928, + "test_loss": 2.0108478397369383, + "test_acc": 0.5974, + "lyapunov": null, + "grad_norm": 0.6045146611097038, + "grad_max_sv": 0.27212534099817276, + "grad_min_sv": 1.0377901878133589e-08, + "grad_condition": 208529865.9529999, + "lr": 0.00031593772365766094, + "time_sec": 15.550946950912476 + }, + { + "epoch": 94, + "train_loss": 0.2697591744232178, + "train_acc": 0.91192, + "test_loss": 1.9851827640533448, + "test_acc": 0.6061, + "lyapunov": null, + "grad_norm": 0.5934923958008231, + "grad_max_sv": 0.28020478039979935, + "grad_min_sv": 1.0768861019735086e-08, + "grad_condition": 559075477.9879827, + "lr": 0.0003062422067739483, + "time_sec": 15.537599802017212 + }, + { + "epoch": 95, + "train_loss": 0.26339089239120483, + "train_acc": 0.91464, + "test_loss": 2.0132868352890014, + "test_acc": 0.605, + "lyapunov": null, + "grad_norm": 0.5878826586259216, + "grad_max_sv": 0.2773489121347666, + "grad_min_sv": 1.0672221813050332e-08, + "grad_condition": 469515095.8970634, + "lr": 0.00029663167846209965, + "time_sec": 15.53743839263916 + }, + { + "epoch": 96, + "train_loss": 0.2638236730861664, + "train_acc": 0.914, + "test_loss": 2.116576941871643, + "test_acc": 0.588, + "lyapunov": null, + "grad_norm": 0.5876599339339599, + "grad_max_sv": 0.2637676265090704, + "grad_min_sv": 1.0212088024752312e-08, + "grad_condition": 1850515172.2076042, + "lr": 0.00028711035421746345, + "time_sec": 15.549452781677246 + }, + { + "epoch": 97, + "train_loss": 0.2536590715312958, + "train_acc": 0.91706, + "test_loss": 1.9441264961242677, + "test_acc": 0.6106, + "lyapunov": null, + "grad_norm": 0.5801862895467766, + "grad_max_sv": 0.25957776233553886, + "grad_min_sv": 9.974970699780373e-09, + "grad_condition": 248670450.2290464, + "lr": 0.00027768241040753615, + "time_sec": 15.566162586212158 + }, + { + "epoch": 98, + "train_loss": 0.2510867093276978, + "train_acc": 0.91934, + "test_loss": 1.9544865245819092, + "test_acc": 0.6095, + "lyapunov": null, + "grad_norm": 0.5734772931002381, + "grad_max_sv": 0.2618825018405914, + "grad_min_sv": 1.0204099554038393e-08, + "grad_condition": 154473221.86993745, + "lr": 0.00026835198244006903, + "time_sec": 15.556537866592407 + }, + { + "epoch": 99, + "train_loss": 0.2408148485183716, + "train_acc": 0.92144, + "test_loss": 2.0714619358062745, + "test_acc": 0.6001, + "lyapunov": null, + "grad_norm": 0.5671726549187834, + "grad_max_sv": 0.2644516408443451, + "grad_min_sv": 1.0195976151089816e-08, + "grad_condition": 965788263.4202464, + "lr": 0.0002591231629491421, + "time_sec": 15.544485092163086 + }, + { + "epoch": 100, + "train_loss": 0.2370221872997284, + "train_acc": 0.92336, + "test_loss": 1.9870514595031739, + "test_acc": 0.5993, + "lyapunov": null, + "grad_norm": 0.5626687820046147, + "grad_max_sv": 0.2684344034641981, + "grad_min_sv": 1.0188884960694519e-08, + "grad_condition": 610815770.0447185, + "lr": 0.0002499999999999997, + "time_sec": 15.558927297592163 + }, + { + "epoch": 101, + "train_loss": 0.23374522658348085, + "train_acc": 0.92286, + "test_loss": 2.04856148109436, + "test_acc": 0.6012, + "lyapunov": null, + "grad_norm": 0.5627280147031988, + "grad_max_sv": 0.2735305614769459, + "grad_min_sv": 9.946851818598556e-09, + "grad_condition": 75149496.54857874, + "lr": 0.00024098649531343477, + "time_sec": 15.551362752914429 + }, + { + "epoch": 102, + "train_loss": 0.23789083916664125, + "train_acc": 0.9232, + "test_loss": 2.077917391014099, + "test_acc": 0.5911, + "lyapunov": null, + "grad_norm": 0.5654678978420247, + "grad_max_sv": 0.268671840056777, + "grad_min_sv": 1.0081382883705969e-08, + "grad_condition": 760769280.8309836, + "lr": 0.0002320866025105016, + "time_sec": 15.548651456832886 + }, + { + "epoch": 103, + "train_loss": 0.23046596057415009, + "train_acc": 0.9256, + "test_loss": 2.0280915761947633, + "test_acc": 0.6086, + "lyapunov": null, + "grad_norm": 0.5555946067131698, + "grad_max_sv": 0.26063189692795274, + "grad_min_sv": 9.972913740403238e-09, + "grad_condition": 800339375.9782455, + "lr": 0.0002233042253783278, + "time_sec": 15.55325436592102 + }, + { + "epoch": 104, + "train_loss": 0.22575416645526886, + "train_acc": 0.92736, + "test_loss": 1.991520732498169, + "test_acc": 0.6106, + "lyapunov": null, + "grad_norm": 0.5502200269097622, + "grad_max_sv": 0.2645552083849907, + "grad_min_sv": 9.78625991994355e-09, + "grad_condition": 782453911.4088255, + "lr": 0.000214643216157784, + "time_sec": 15.555955410003662 + }, + { + "epoch": 105, + "train_loss": 0.21851825959682464, + "train_acc": 0.93044, + "test_loss": 2.0155545722961428, + "test_acc": 0.6061, + "lyapunov": null, + "grad_norm": 0.5402375136024744, + "grad_max_sv": 0.24004080072045325, + "grad_min_sv": 9.457498292795847e-09, + "grad_condition": 1962228069.4928844, + "lr": 0.00020610737385376332, + "time_sec": 15.539866924285889 + }, + { + "epoch": 106, + "train_loss": 0.21933655521392822, + "train_acc": 0.9294, + "test_loss": 1.9992694971084595, + "test_acc": 0.6088, + "lyapunov": null, + "grad_norm": 0.5407905761670532, + "grad_max_sv": 0.2569248087704182, + "grad_min_sv": 9.955755829070199e-09, + "grad_condition": 488709715.88661134, + "lr": 0.00019770044256881242, + "time_sec": 15.556296348571777 + }, + { + "epoch": 107, + "train_loss": 0.21396025347709655, + "train_acc": 0.93126, + "test_loss": 1.9869402378082275, + "test_acc": 0.6133, + "lyapunov": null, + "grad_norm": 0.5348948965534774, + "grad_max_sv": 0.2521795704960823, + "grad_min_sv": 9.633937683630606e-09, + "grad_condition": 369579410.89431655, + "lr": 0.0001894261098608447, + "time_sec": 15.540535688400269 + }, + { + "epoch": 108, + "train_loss": 0.21082828907966614, + "train_acc": 0.93162, + "test_loss": 1.9967963357925416, + "test_acc": 0.6085, + "lyapunov": null, + "grad_norm": 0.5340121730088487, + "grad_max_sv": 0.26667983680963514, + "grad_min_sv": 1.0154884861647561e-08, + "grad_condition": 142198444.83812565, + "lr": 0.000181288005125655, + "time_sec": 15.588162899017334 + }, + { + "epoch": 109, + "train_loss": 0.20589717533111573, + "train_acc": 0.93354, + "test_loss": 1.997142894744873, + "test_acc": 0.6074, + "lyapunov": null, + "grad_norm": 0.531812789994753, + "grad_max_sv": 0.2566185683012009, + "grad_min_sv": 9.651047487091794e-09, + "grad_condition": 371853099.6491888, + "lr": 0.0001732896980049473, + "time_sec": 15.551778316497803 + }, + { + "epoch": 110, + "train_loss": 0.20528564952850342, + "train_acc": 0.93468, + "test_loss": 1.9464295757293701, + "test_acc": 0.6128, + "lyapunov": null, + "grad_norm": 0.5263915646231926, + "grad_max_sv": 0.26407470293343066, + "grad_min_sv": 9.794896905736998e-09, + "grad_condition": 2887517153.125839, + "lr": 0.00016543469682057076, + "time_sec": 15.528143405914307 + }, + { + "epoch": 111, + "train_loss": 0.19939620697975158, + "train_acc": 0.93512, + "test_loss": 2.0247394777297973, + "test_acc": 0.6088, + "lyapunov": null, + "grad_norm": 0.5199006680221581, + "grad_max_sv": 0.25051676370203496, + "grad_min_sv": 9.47750784957048e-09, + "grad_condition": 633146043.8326647, + "lr": 0.00015772644703565552, + "time_sec": 15.546777248382568 + }, + { + "epoch": 112, + "train_loss": 0.19768739170074462, + "train_acc": 0.93558, + "test_loss": 2.0370516593933106, + "test_acc": 0.6068, + "lyapunov": null, + "grad_norm": 0.5201803443080029, + "grad_max_sv": 0.24434743784368038, + "grad_min_sv": 9.287056545494165e-09, + "grad_condition": 110967293.52368338, + "lr": 0.00015016832974331713, + "time_sec": 15.55789828300476 + }, + { + "epoch": 113, + "train_loss": 0.19503466765403749, + "train_acc": 0.93582, + "test_loss": 2.0127569778442385, + "test_acc": 0.6108, + "lyapunov": null, + "grad_norm": 0.5185105554457012, + "grad_max_sv": 0.25643752217292787, + "grad_min_sv": 9.366854652635356e-09, + "grad_condition": 1367545407.0462277, + "lr": 0.00014276366018359834, + "time_sec": 15.548904418945312 + }, + { + "epoch": 114, + "train_loss": 0.19106607246875762, + "train_acc": 0.93774, + "test_loss": 2.0063432996749877, + "test_acc": 0.6062, + "lyapunov": null, + "grad_norm": 0.5144662331475203, + "grad_max_sv": 0.252225586026907, + "grad_min_sv": 9.432733346151356e-09, + "grad_condition": 93492891.55482593, + "lr": 0.00013551568628929425, + "time_sec": 15.545198440551758 + }, + { + "epoch": 115, + "train_loss": 0.1892847189235687, + "train_acc": 0.93952, + "test_loss": 1.9861349111557007, + "test_acc": 0.6132, + "lyapunov": null, + "grad_norm": 0.5113690167861914, + "grad_max_sv": 0.24835538007318975, + "grad_min_sv": 9.181027646031764e-09, + "grad_condition": 397291225.7944182, + "lr": 0.00012842758726130276, + "time_sec": 15.535498142242432 + }, + { + "epoch": 116, + "train_loss": 0.1890865376853943, + "train_acc": 0.93908, + "test_loss": 2.0632496139526366, + "test_acc": 0.6051, + "lyapunov": null, + "grad_norm": 0.5106134953187779, + "grad_max_sv": 0.25654816515743734, + "grad_min_sv": 9.516519037361913e-09, + "grad_condition": 599031804.2047107, + "lr": 0.0001215024721741218, + "time_sec": 15.540488958358765 + }, + { + "epoch": 117, + "train_loss": 0.1820236085987091, + "train_acc": 0.9423, + "test_loss": 2.0187086570739745, + "test_acc": 0.6079, + "lyapunov": null, + "grad_norm": 0.5019942855204272, + "grad_max_sv": 0.24775034934282303, + "grad_min_sv": 9.149960274288e-09, + "grad_condition": 1319010860.9552953, + "lr": 0.00011474337861210538, + "time_sec": 15.56420636177063 + }, + { + "epoch": 118, + "train_loss": 0.18246942345619202, + "train_acc": 0.942, + "test_loss": 2.050747388458252, + "test_acc": 0.6086, + "lyapunov": null, + "grad_norm": 0.5013646247138603, + "grad_max_sv": 0.25135475769639015, + "grad_min_sv": 9.33531562634024e-09, + "grad_condition": 323765358.2689257, + "lr": 0.00010815327133708009, + "time_sec": 15.536325931549072 + }, + { + "epoch": 119, + "train_loss": 0.1821983718967438, + "train_acc": 0.94258, + "test_loss": 2.047995585823059, + "test_acc": 0.6057, + "lyapunov": null, + "grad_norm": 0.5011920926334492, + "grad_max_sv": 0.24903758093714715, + "grad_min_sv": 9.00506958363169e-09, + "grad_condition": 369047774.2258805, + "lr": 0.00010173504098790182, + "time_sec": 15.548452854156494 + }, + { + "epoch": 120, + "train_loss": 0.17862510696411132, + "train_acc": 0.94496, + "test_loss": 2.066082696914673, + "test_acc": 0.6064, + "lyapunov": null, + "grad_norm": 0.4919439871423072, + "grad_max_sv": 0.24307375513017176, + "grad_min_sv": 8.880053682772159e-09, + "grad_condition": 4482965048.089623, + "lr": 9.549150281252629e-05, + "time_sec": 15.545986890792847 + }, + { + "epoch": 121, + "train_loss": 0.17715791575431825, + "train_acc": 0.9433, + "test_loss": 2.0107405862808228, + "test_acc": 0.6146, + "lyapunov": null, + "grad_norm": 0.4938358036401035, + "grad_max_sv": 0.24697510711848736, + "grad_min_sv": 9.213949292647198e-09, + "grad_condition": 345420741.19239944, + "lr": 8.942539543314794e-05, + "time_sec": 15.568331956863403 + }, + { + "epoch": 122, + "train_loss": 0.16989687209129334, + "train_acc": 0.94618, + "test_loss": 2.044198879814148, + "test_acc": 0.611, + "lyapunov": null, + "grad_norm": 0.4832835136645179, + "grad_max_sv": 0.2455986063927412, + "grad_min_sv": 9.204115481711503e-09, + "grad_condition": 367602073.55865693, + "lr": 8.353937964495024e-05, + "time_sec": 15.56007719039917 + }, + { + "epoch": 123, + "train_loss": 0.1723685458612442, + "train_acc": 0.9443, + "test_loss": 2.012871974563599, + "test_acc": 0.6145, + "lyapunov": null, + "grad_norm": 0.4888221870883898, + "grad_max_sv": 0.23854922354221345, + "grad_min_sv": 8.63350490934488e-09, + "grad_condition": 5808463452.940133, + "lr": 7.783603724899243e-05, + "time_sec": 15.557473182678223 + }, + { + "epoch": 124, + "train_loss": 0.16869316206455232, + "train_acc": 0.9467, + "test_loss": 2.067115762138367, + "test_acc": 0.6115, + "lyapunov": null, + "grad_norm": 0.48269660774706274, + "grad_max_sv": 0.24038059040904045, + "grad_min_sv": 8.786777593874049e-09, + "grad_condition": 908637161.7032757, + "lr": 7.231786991974666e-05, + "time_sec": 15.582384824752808 + }, + { + "epoch": 125, + "train_loss": 0.17133760773181916, + "train_acc": 0.94556, + "test_loss": 2.04983889465332, + "test_acc": 0.612, + "lyapunov": null, + "grad_norm": 0.4873195931263442, + "grad_max_sv": 0.24550650343298913, + "grad_min_sv": 9.158816541098405e-09, + "grad_condition": 2506136246.983276, + "lr": 6.698729810778072e-05, + "time_sec": 15.538672924041748 + }, + { + "epoch": 126, + "train_loss": 0.16753606813669206, + "train_acc": 0.94616, + "test_loss": 2.041084182357788, + "test_acc": 0.6124, + "lyapunov": null, + "grad_norm": 0.47963342880713666, + "grad_max_sv": 0.23605941832065583, + "grad_min_sv": 8.880202983542473e-09, + "grad_condition": 259590659.92757973, + "lr": 6.184665997806817e-05, + "time_sec": 15.555017948150635 + }, + { + "epoch": 127, + "train_loss": 0.16307862406730653, + "train_acc": 0.94852, + "test_loss": 2.0575376665115357, + "test_acc": 0.6101, + "lyapunov": null, + "grad_norm": 0.47745975112622574, + "grad_max_sv": 0.2415751673281193, + "grad_min_sv": 8.65501490613426e-09, + "grad_condition": 906844857.6290891, + "lr": 5.6898210384392595e-05, + "time_sec": 15.544172286987305 + }, + { + "epoch": 128, + "train_loss": 0.1647679444026947, + "train_acc": 0.9478, + "test_loss": 2.083808217048645, + "test_acc": 0.6112, + "lyapunov": null, + "grad_norm": 0.4772307176298673, + "grad_max_sv": 0.24646385088562967, + "grad_min_sv": 9.007787716056557e-09, + "grad_condition": 952403487.2306192, + "lr": 5.214411988029363e-05, + "time_sec": 15.569987058639526 + }, + { + "epoch": 129, + "train_loss": 0.16221783504486084, + "train_acc": 0.9489, + "test_loss": 2.037674939918518, + "test_acc": 0.6141, + "lyapunov": null, + "grad_norm": 0.47719707993092136, + "grad_max_sv": 0.24447002522647382, + "grad_min_sv": 8.718893083382862e-09, + "grad_condition": 576774993.0051876, + "lr": 4.7586473766990294e-05, + "time_sec": 15.550950765609741 + }, + { + "epoch": 130, + "train_loss": 0.1623430322790146, + "train_acc": 0.94826, + "test_loss": 2.0267721549987794, + "test_acc": 0.612, + "lyapunov": null, + "grad_norm": 0.4758398131142258, + "grad_max_sv": 0.24824610278010367, + "grad_min_sv": 9.009834131589248e-09, + "grad_condition": 284470826.5323583, + "lr": 4.32272711786996e-05, + "time_sec": 15.55129861831665 + }, + { + "epoch": 131, + "train_loss": 0.15758139282703398, + "train_acc": 0.95048, + "test_loss": 2.059408118247986, + "test_acc": 0.6128, + "lyapunov": null, + "grad_norm": 0.4662610158212716, + "grad_max_sv": 0.24175717495381832, + "grad_min_sv": 8.851933427532142e-09, + "grad_condition": 643199875.2224789, + "lr": 3.906842420574966e-05, + "time_sec": 15.541762351989746 + }, + { + "epoch": 132, + "train_loss": 0.1609997308921814, + "train_acc": 0.95002, + "test_loss": 2.045307534980774, + "test_acc": 0.6147, + "lyapunov": null, + "grad_norm": 0.4725451311353625, + "grad_max_sv": 0.24064127989113332, + "grad_min_sv": 8.780672330747398e-09, + "grad_condition": 476655844.989127, + "lr": 3.5111757055874305e-05, + "time_sec": 15.541023969650269 + }, + { + "epoch": 133, + "train_loss": 0.1624057853126526, + "train_acc": 0.9483, + "test_loss": 2.0316320575714113, + "test_acc": 0.6138, + "lyapunov": null, + "grad_norm": 0.47661507996640506, + "grad_max_sv": 0.23734962083399297, + "grad_min_sv": 8.76026350001306e-09, + "grad_condition": 2222364938.5971713, + "lr": 3.1359005254054254e-05, + "time_sec": 15.546375274658203 + }, + { + "epoch": 134, + "train_loss": 0.15793843518733977, + "train_acc": 0.95012, + "test_loss": 2.009011124992371, + "test_acc": 0.6152, + "lyapunov": null, + "grad_norm": 0.4705522562479762, + "grad_max_sv": 0.2360381469130516, + "grad_min_sv": 8.697313022294068e-09, + "grad_condition": 644188463.3118798, + "lr": 2.7811814881259484e-05, + "time_sec": 15.535383224487305 + }, + { + "epoch": 135, + "train_loss": 0.1600447882938385, + "train_acc": 0.94882, + "test_loss": 2.0992555170059206, + "test_acc": 0.6116, + "lyapunov": null, + "grad_norm": 0.4740303567864555, + "grad_max_sv": 0.24014706909656525, + "grad_min_sv": 8.802092827005225e-09, + "grad_condition": 608133158.8685883, + "lr": 2.4471741852423218e-05, + "time_sec": 15.567442417144775 + }, + { + "epoch": 136, + "train_loss": 0.15536398038864135, + "train_acc": 0.95102, + "test_loss": 2.0009073398590087, + "test_acc": 0.6133, + "lyapunov": null, + "grad_norm": 0.4650573516543509, + "grad_max_sv": 0.2419031746685505, + "grad_min_sv": 8.691076524734372e-09, + "grad_condition": 1297451669.4427776, + "lr": 2.1340251233966362e-05, + "time_sec": 15.541702508926392 + }, + { + "epoch": 137, + "train_loss": 0.15388678150177001, + "train_acc": 0.95152, + "test_loss": 2.0588031789779664, + "test_acc": 0.6133, + "lyapunov": null, + "grad_norm": 0.4625524612009038, + "grad_max_sv": 0.23246029894798995, + "grad_min_sv": 8.55227140121942e-09, + "grad_condition": 558781802.1816812, + "lr": 1.8418716601170932e-05, + "time_sec": 15.551306247711182 + }, + { + "epoch": 138, + "train_loss": 0.15315138070583342, + "train_acc": 0.95186, + "test_loss": 2.081510241127014, + "test_acc": 0.6097, + "lyapunov": null, + "grad_norm": 0.4628330778697609, + "grad_max_sv": 0.2313590131700039, + "grad_min_sv": 8.49984760574983e-09, + "grad_condition": 496139239.8313856, + "lr": 1.570841943568445e-05, + "time_sec": 15.549960374832153 + }, + { + "epoch": 139, + "train_loss": 0.1517414856362343, + "train_acc": 0.95122, + "test_loss": 2.1018941421508788, + "test_acc": 0.6069, + "lyapunov": null, + "grad_norm": 0.45954699142087607, + "grad_max_sv": 0.22898922748863698, + "grad_min_sv": 8.333344929736807e-09, + "grad_condition": 238482611.7054514, + "lr": 1.3210548563419845e-05, + "time_sec": 15.544589757919312 + }, + { + "epoch": 140, + "train_loss": 0.1531998627448082, + "train_acc": 0.95216, + "test_loss": 2.029728894042969, + "test_acc": 0.6155, + "lyapunov": null, + "grad_norm": 0.4574810737914109, + "grad_max_sv": 0.22382316328585147, + "grad_min_sv": 8.472814887390025e-09, + "grad_condition": 1000717243.145359, + "lr": 1.0926199633097203e-05, + "time_sec": 15.54127812385559 + }, + { + "epoch": 141, + "train_loss": 0.15507912192344667, + "train_acc": 0.95104, + "test_loss": 2.011727011489868, + "test_acc": 0.6168, + "lyapunov": null, + "grad_norm": 0.4664603521539474, + "grad_max_sv": 0.23848050832748413, + "grad_min_sv": 8.786545021297401e-09, + "grad_condition": 732680612.277679, + "lr": 8.856374635655688e-06, + "time_sec": 15.545313358306885 + }, + { + "epoch": 142, + "train_loss": 0.14621373735427856, + "train_acc": 0.9549, + "test_loss": 2.0063492603302002, + "test_acc": 0.6154, + "lyapunov": null, + "grad_norm": 0.4513118926325404, + "grad_max_sv": 0.22816910743713378, + "grad_min_sv": 8.362062203174508e-09, + "grad_condition": 331969469.2276871, + "lr": 7.001981464747503e-06, + "time_sec": 15.560540199279785 + }, + { + "epoch": 143, + "train_loss": 0.15461997192382812, + "train_acc": 0.95162, + "test_loss": 2.0485921478271485, + "test_acc": 0.6157, + "lyapunov": null, + "grad_norm": 0.4617048546189355, + "grad_max_sv": 0.2284447643905878, + "grad_min_sv": 8.47374921810612e-09, + "grad_condition": 135172237.34044403, + "lr": 5.3638335185058295e-06, + "time_sec": 15.543501138687134 + }, + { + "epoch": 144, + "train_loss": 0.15076595012664795, + "train_acc": 0.95258, + "test_loss": 2.0360546085357667, + "test_acc": 0.6157, + "lyapunov": null, + "grad_norm": 0.45674363291414855, + "grad_max_sv": 0.24305424690246583, + "grad_min_sv": 8.728739433463626e-09, + "grad_condition": 1124480354.7926626, + "lr": 3.942649342761114e-06, + "time_sec": 15.542458057403564 + }, + { + "epoch": 145, + "train_loss": 0.15159784895181655, + "train_acc": 0.9528, + "test_loss": 2.0412604253768922, + "test_acc": 0.6145, + "lyapunov": null, + "grad_norm": 0.4594436764027667, + "grad_max_sv": 0.23490218743681907, + "grad_min_sv": 8.654648834876751e-09, + "grad_condition": 723824947.9780848, + "lr": 2.7390523158633524e-06, + "time_sec": 15.557586431503296 + }, + { + "epoch": 146, + "train_loss": 0.14902694682121276, + "train_acc": 0.95336, + "test_loss": 2.0020324548721313, + "test_acc": 0.6179, + "lyapunov": null, + "grad_norm": 0.4560431994507587, + "grad_max_sv": 0.23076346889138222, + "grad_min_sv": 8.323158351257205e-09, + "grad_condition": 1469772291.140429, + "lr": 1.7535703752478133e-06, + "time_sec": 15.585474014282227 + }, + { + "epoch": 147, + "train_loss": 0.15434911180973052, + "train_acc": 0.95198, + "test_loss": 2.0673148109436035, + "test_acc": 0.61, + "lyapunov": null, + "grad_norm": 0.46368415666342994, + "grad_max_sv": 0.2282502643764019, + "grad_min_sv": 8.658979086919108e-09, + "grad_condition": 285812014.7645295, + "lr": 9.866357858642196e-07, + "time_sec": 15.550001859664917 + }, + { + "epoch": 148, + "train_loss": 0.15094998855590822, + "train_acc": 0.95184, + "test_loss": 2.0560613121032714, + "test_acc": 0.6104, + "lyapunov": null, + "grad_norm": 0.45852974392342616, + "grad_max_sv": 0.2286764368414879, + "grad_min_sv": 8.554375543280744e-09, + "grad_condition": 2915751413.0661488, + "lr": 4.38584950570808e-07, + "time_sec": 15.554803848266602 + }, + { + "epoch": 149, + "train_loss": 0.15165723780632018, + "train_acc": 0.9523, + "test_loss": 2.015529384994507, + "test_acc": 0.6157, + "lyapunov": null, + "grad_norm": 0.46002009289404105, + "grad_max_sv": 0.22944259103387593, + "grad_min_sv": 8.688443671012007e-09, + "grad_condition": 1114534732.0327039, + "lr": 1.096582625772501e-07, + "time_sec": 15.552348375320435 + }, + { + "epoch": 150, + "train_loss": 0.15093138063430786, + "train_acc": 0.95178, + "test_loss": 2.0286103109359743, + "test_acc": 0.6155, + "lyapunov": null, + "grad_norm": 0.459240762365123, + "grad_max_sv": 0.23097772970795633, + "grad_min_sv": 8.62825303557177e-09, + "grad_condition": 215912666.61667585, + "lr": 0.0, + "time_sec": 15.52827525138855 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 4.632121693878174, + "train_acc": 0.05938, + "test_loss": 4.3297391143798825, + "test_acc": 0.0664, + "lyapunov": null, + "grad_norm": 6.328457015016986, + "grad_max_sv": 5.408737313747406, + "grad_min_sv": 1.0897963745037931e-07, + "grad_condition": 168531087.74149805, + "lr": 0.0009998903417374227, + "time_sec": 32.6737802028656 + }, + { + "epoch": 2, + "train_loss": 3.9319187049865723, + "train_acc": 0.1152, + "test_loss": 4.050583203125, + "test_acc": 0.0937, + "lyapunov": null, + "grad_norm": 4.867346581955153, + "grad_max_sv": 4.17314025759697, + "grad_min_sv": 8.790160169747096e-08, + "grad_condition": 71966498.42246147, + "lr": 0.0009995614150494292, + "time_sec": 32.59041929244995 + }, + { + "epoch": 3, + "train_loss": 3.572258767166138, + "train_acc": 0.16268, + "test_loss": 3.745136415863037, + "test_acc": 0.1249, + "lyapunov": null, + "grad_norm": 4.057272969878525, + "grad_max_sv": 3.325912243127823, + "grad_min_sv": 7.355040792383916e-08, + "grad_condition": 251958754.94074526, + "lr": 0.0009990133642141358, + "time_sec": 32.60651421546936 + }, + { + "epoch": 4, + "train_loss": 3.317695609741211, + "train_acc": 0.2021, + "test_loss": 3.4792282402038572, + "test_acc": 0.1798, + "lyapunov": null, + "grad_norm": 3.452052815802292, + "grad_max_sv": 2.6816291749477386, + "grad_min_sv": 6.40003586127591e-08, + "grad_condition": 48043084.69643873, + "lr": 0.0009982464296247522, + "time_sec": 32.610963582992554 + }, + { + "epoch": 5, + "train_loss": 3.092158460845947, + "train_acc": 0.24132, + "test_loss": 3.2143890380859377, + "test_acc": 0.222, + "lyapunov": null, + "grad_norm": 2.9524390406908076, + "grad_max_sv": 2.168670669198036, + "grad_min_sv": 5.5379370200725475e-08, + "grad_condition": 43696217.43236198, + "lr": 0.0009972609476841367, + "time_sec": 32.5818829536438 + }, + { + "epoch": 6, + "train_loss": 2.9058062841796874, + "train_acc": 0.27294, + "test_loss": 3.2074112480163572, + "test_acc": 0.2194, + "lyapunov": null, + "grad_norm": 2.57958278800403, + "grad_max_sv": 1.780178052186966, + "grad_min_sv": 4.7776146384903574e-08, + "grad_condition": 1848525002.9149213, + "lr": 0.000996057350657239, + "time_sec": 32.6005117893219 + }, + { + "epoch": 7, + "train_loss": 2.7440347719573976, + "train_acc": 0.30466, + "test_loss": 2.9435305278778077, + "test_acc": 0.2714, + "lyapunov": null, + "grad_norm": 2.277468502288279, + "grad_max_sv": 1.4704686373472213, + "grad_min_sv": 4.214769255828088e-08, + "grad_condition": 87867836.19293296, + "lr": 0.000994636166481494, + "time_sec": 32.58062410354614 + }, + { + "epoch": 8, + "train_loss": 2.5896647484588624, + "train_acc": 0.33356, + "test_loss": 2.948492342376709, + "test_acc": 0.2784, + "lyapunov": null, + "grad_norm": 2.080738094824845, + "grad_max_sv": 1.2972008675336837, + "grad_min_sv": 3.925207184285462e-08, + "grad_condition": 57024186.09067024, + "lr": 0.0009929980185352525, + "time_sec": 32.58458232879639 + }, + { + "epoch": 9, + "train_loss": 2.459988908996582, + "train_acc": 0.35858, + "test_loss": 2.692073212814331, + "test_acc": 0.3191, + "lyapunov": null, + "grad_norm": 1.8931611467668827, + "grad_max_sv": 1.0899816483259201, + "grad_min_sv": 3.568325461777988e-08, + "grad_condition": 41689265.343041986, + "lr": 0.0009911436253643444, + "time_sec": 32.631547927856445 + }, + { + "epoch": 10, + "train_loss": 2.3509777881622314, + "train_acc": 0.38242, + "test_loss": 2.63925862197876, + "test_acc": 0.3376, + "lyapunov": null, + "grad_norm": 1.7454969754890177, + "grad_max_sv": 0.9403600230813026, + "grad_min_sv": 3.235623415795419e-08, + "grad_condition": 166681162.0522917, + "lr": 0.0009890738003669028, + "time_sec": 32.5898699760437 + }, + { + "epoch": 11, + "train_loss": 2.240717023162842, + "train_acc": 0.40634, + "test_loss": 2.586192742919922, + "test_acc": 0.3468, + "lyapunov": null, + "grad_norm": 1.6356772403864936, + "grad_max_sv": 0.8401816442608834, + "grad_min_sv": 3.0695412359116324e-08, + "grad_condition": 46339599.574546196, + "lr": 0.00098678945143658, + "time_sec": 32.60019516944885 + }, + { + "epoch": 12, + "train_loss": 2.150723339614868, + "train_acc": 0.42764, + "test_loss": 2.5081653465270994, + "test_acc": 0.3604, + "lyapunov": null, + "grad_norm": 1.539862593793604, + "grad_max_sv": 0.7298938989639282, + "grad_min_sv": 2.8854253044871547e-08, + "grad_condition": 118561305.59874734, + "lr": 0.0009842915805643154, + "time_sec": 32.5900239944458 + }, + { + "epoch": 13, + "train_loss": 2.077368303375244, + "train_acc": 0.44568, + "test_loss": 2.568132899475098, + "test_acc": 0.3585, + "lyapunov": null, + "grad_norm": 1.4723672761634128, + "grad_max_sv": 0.6842682436108589, + "grad_min_sv": 2.7446241608608535e-08, + "grad_condition": 64908883.256854534, + "lr": 0.000981581283398829, + "time_sec": 32.59382939338684 + }, + { + "epoch": 14, + "train_loss": 2.0015520175552366, + "train_acc": 0.45878, + "test_loss": 2.359411000823975, + "test_acc": 0.3979, + "lyapunov": null, + "grad_norm": 1.4099515750601779, + "grad_max_sv": 0.6421961732208729, + "grad_min_sv": 2.6565446014509274e-08, + "grad_condition": 71627981.91741171, + "lr": 0.0009786597487660333, + "time_sec": 32.5654022693634 + }, + { + "epoch": 15, + "train_loss": 1.92437475730896, + "train_acc": 0.47772, + "test_loss": 2.472025180053711, + "test_acc": 0.3906, + "lyapunov": null, + "grad_norm": 1.3459519071373947, + "grad_max_sv": 0.6087979272007942, + "grad_min_sv": 2.560336604950919e-08, + "grad_condition": 34509883.57703115, + "lr": 0.0009755282581475766, + "time_sec": 32.58217000961304 + }, + { + "epoch": 16, + "train_loss": 1.8615227836608887, + "train_acc": 0.49226, + "test_loss": 2.307891809463501, + "test_acc": 0.4094, + "lyapunov": null, + "grad_norm": 1.2973867545451028, + "grad_max_sv": 0.5710282117128372, + "grad_min_sv": 2.453752707409773e-08, + "grad_condition": 36574514.71659913, + "lr": 0.0009721881851187403, + "time_sec": 32.596822023391724 + }, + { + "epoch": 17, + "train_loss": 1.802868537979126, + "train_acc": 0.50886, + "test_loss": 2.2938802921295167, + "test_acc": 0.4221, + "lyapunov": null, + "grad_norm": 1.2452273376049152, + "grad_max_sv": 0.5199026010930539, + "grad_min_sv": 2.340585743814544e-08, + "grad_condition": 342878125.6004232, + "lr": 0.0009686409947459456, + "time_sec": 32.60429286956787 + }, + { + "epoch": 18, + "train_loss": 1.7442895928955078, + "train_acc": 0.51714, + "test_loss": 2.236089334487915, + "test_acc": 0.4271, + "lyapunov": null, + "grad_norm": 1.2180663030761465, + "grad_max_sv": 0.5071025155484676, + "grad_min_sv": 2.2677409150517748e-08, + "grad_condition": 28124440.44399274, + "lr": 0.0009648882429441254, + "time_sec": 32.602014780044556 + }, + { + "epoch": 19, + "train_loss": 1.6970758875274659, + "train_acc": 0.5288, + "test_loss": 2.269014080619812, + "test_acc": 0.4297, + "lyapunov": null, + "grad_norm": 1.1807714582797586, + "grad_max_sv": 0.48886668086051943, + "grad_min_sv": 2.2144371079890757e-08, + "grad_condition": 106195313.77170546, + "lr": 0.00096093157579425, + "time_sec": 32.598830699920654 + }, + { + "epoch": 20, + "train_loss": 1.6365631005477905, + "train_acc": 0.54472, + "test_loss": 2.207360274887085, + "test_acc": 0.436, + "lyapunov": null, + "grad_norm": 1.1615499746942015, + "grad_max_sv": 0.4807134747505188, + "grad_min_sv": 2.17387078838005e-08, + "grad_condition": 30534006.683917098, + "lr": 0.0009567727288213001, + "time_sec": 32.62669658660889 + }, + { + "epoch": 21, + "train_loss": 1.5996088504409791, + "train_acc": 0.5518, + "test_loss": 2.162942098236084, + "test_acc": 0.4467, + "lyapunov": null, + "grad_norm": 1.1385398419975716, + "grad_max_sv": 0.4639912240207195, + "grad_min_sv": 2.164455609743321e-08, + "grad_condition": 34733858.620799676, + "lr": 0.0009524135262330095, + "time_sec": 32.57893466949463 + }, + { + "epoch": 22, + "train_loss": 1.5533830882263184, + "train_acc": 0.56456, + "test_loss": 2.069672204208374, + "test_acc": 0.4682, + "lyapunov": null, + "grad_norm": 1.105827614828544, + "grad_max_sv": 0.4397671535611153, + "grad_min_sv": 2.0469476113421648e-08, + "grad_condition": 59293957.641380526, + "lr": 0.0009478558801197061, + "time_sec": 32.592012882232666 + }, + { + "epoch": 23, + "train_loss": 1.5176535759735108, + "train_acc": 0.57006, + "test_loss": 2.0970192640304566, + "test_acc": 0.4684, + "lyapunov": null, + "grad_norm": 1.086052388682902, + "grad_max_sv": 0.43858923241496084, + "grad_min_sv": 2.046667464117302e-08, + "grad_condition": 35773676.26880551, + "lr": 0.000943101789615607, + "time_sec": 32.5931761264801 + }, + { + "epoch": 24, + "train_loss": 1.477093031578064, + "train_acc": 0.58008, + "test_loss": 2.188412786483765, + "test_acc": 0.4477, + "lyapunov": null, + "grad_norm": 1.0622037979632382, + "grad_max_sv": 0.4300272732973099, + "grad_min_sv": 1.9922828573210387e-08, + "grad_condition": 698939447.7433442, + "lr": 0.0009381533400219313, + "time_sec": 32.60242199897766 + }, + { + "epoch": 25, + "train_loss": 1.4371894707489015, + "train_acc": 0.59004, + "test_loss": 2.122577444076538, + "test_acc": 0.4692, + "lyapunov": null, + "grad_norm": 1.04397117940108, + "grad_max_sv": 0.4235057145357132, + "grad_min_sv": 1.9742879536072122e-08, + "grad_condition": 93042430.3451734, + "lr": 0.0009330127018922189, + "time_sec": 32.598466634750366 + }, + { + "epoch": 26, + "train_loss": 1.3991303316879273, + "train_acc": 0.60234, + "test_loss": 2.1244462642669677, + "test_acc": 0.4699, + "lyapunov": null, + "grad_norm": 1.0210898725417539, + "grad_max_sv": 0.40390279740095136, + "grad_min_sv": 1.8844751671631688e-08, + "grad_condition": 47754997.0376553, + "lr": 0.000927682130080253, + "time_sec": 32.592235803604126 + }, + { + "epoch": 27, + "train_loss": 1.364674404411316, + "train_acc": 0.60842, + "test_loss": 2.0718156879425047, + "test_acc": 0.4869, + "lyapunov": null, + "grad_norm": 1.0037772283209996, + "grad_max_sv": 0.3884199522435665, + "grad_min_sv": 1.8489455115566767e-08, + "grad_condition": 43105120.31376915, + "lr": 0.0009221639627510072, + "time_sec": 32.572012186050415 + }, + { + "epoch": 28, + "train_loss": 1.3162348063278198, + "train_acc": 0.61978, + "test_loss": 2.1498897790908815, + "test_acc": 0.4713, + "lyapunov": null, + "grad_norm": 0.9854083051437647, + "grad_max_sv": 0.3941055417060852, + "grad_min_sv": 1.821508043287068e-08, + "grad_condition": 30019049.587522883, + "lr": 0.0009164606203550494, + "time_sec": 32.61202049255371 + }, + { + "epoch": 29, + "train_loss": 1.297664141960144, + "train_acc": 0.62526, + "test_loss": 2.3637782512664796, + "test_acc": 0.4422, + "lyapunov": null, + "grad_norm": 0.9700497222817057, + "grad_max_sv": 0.3905577354133129, + "grad_min_sv": 1.821864164487305e-08, + "grad_condition": 629447610.4912466, + "lr": 0.0009105746045668516, + "time_sec": 32.58795166015625 + }, + { + "epoch": 30, + "train_loss": 1.2600679531478882, + "train_acc": 0.63614, + "test_loss": 2.236318463897705, + "test_acc": 0.4642, + "lyapunov": null, + "grad_norm": 0.9648418713428535, + "grad_max_sv": 0.3880395792424679, + "grad_min_sv": 1.79835488431368e-08, + "grad_condition": 33437877.521342166, + "lr": 0.0009045084971874733, + "time_sec": 32.592060804367065 + }, + { + "epoch": 31, + "train_loss": 1.2364020344924926, + "train_acc": 0.6392, + "test_loss": 2.154664192008972, + "test_acc": 0.4837, + "lyapunov": null, + "grad_norm": 0.9476087844284748, + "grad_max_sv": 0.37929297238588333, + "grad_min_sv": 1.7732854504237672e-08, + "grad_condition": 30046805.177095603, + "lr": 0.0008982649590120977, + "time_sec": 32.59076547622681 + }, + { + "epoch": 32, + "train_loss": 1.2136566867446898, + "train_acc": 0.64694, + "test_loss": 2.199513331604004, + "test_acc": 0.4778, + "lyapunov": null, + "grad_norm": 0.9338298401569052, + "grad_max_sv": 0.37298540845513345, + "grad_min_sv": 1.7272915649006737e-08, + "grad_condition": 120572832.59615937, + "lr": 0.0008918467286629196, + "time_sec": 32.57135725021362 + }, + { + "epoch": 33, + "train_loss": 1.1726405830383302, + "train_acc": 0.65704, + "test_loss": 2.218723740005493, + "test_acc": 0.4793, + "lyapunov": null, + "grad_norm": 0.9186289446612895, + "grad_max_sv": 0.36610164269804957, + "grad_min_sv": 1.691525762653745e-08, + "grad_condition": 39660914.14999861, + "lr": 0.0008852566213878943, + "time_sec": 32.601572036743164 + }, + { + "epoch": 34, + "train_loss": 1.154909267578125, + "train_acc": 0.66198, + "test_loss": 2.138614348602295, + "test_acc": 0.4903, + "lyapunov": null, + "grad_norm": 0.9096977178269975, + "grad_max_sv": 0.35240189358592033, + "grad_min_sv": 1.6346752562679256e-08, + "grad_condition": 28792957.326603055, + "lr": 0.000878497527825878, + "time_sec": 32.60771727561951 + }, + { + "epoch": 35, + "train_loss": 1.1216133372497559, + "train_acc": 0.67002, + "test_loss": 2.213481376647949, + "test_acc": 0.4852, + "lyapunov": null, + "grad_norm": 0.8992657150515471, + "grad_max_sv": 0.35492446199059485, + "grad_min_sv": 1.6565864218234803e-08, + "grad_condition": 393144492.32520485, + "lr": 0.000871572412738697, + "time_sec": 32.58352470397949 + }, + { + "epoch": 36, + "train_loss": 1.0938994792556762, + "train_acc": 0.6756, + "test_loss": 2.1187156969070435, + "test_acc": 0.4974, + "lyapunov": null, + "grad_norm": 0.8902191223787412, + "grad_max_sv": 0.350722486525774, + "grad_min_sv": 1.6364247077023385e-08, + "grad_condition": 126613263.38187504, + "lr": 0.0008644843137107055, + "time_sec": 32.59000611305237 + }, + { + "epoch": 37, + "train_loss": 1.0754410801696777, + "train_acc": 0.6814, + "test_loss": 2.217418428230286, + "test_acc": 0.4887, + "lyapunov": null, + "grad_norm": 0.8719795019891965, + "grad_max_sv": 0.3433336988091469, + "grad_min_sv": 1.592541527747904e-08, + "grad_condition": 45545796.735647485, + "lr": 0.0008572363398164014, + "time_sec": 32.60146522521973 + }, + { + "epoch": 38, + "train_loss": 1.0556351538848876, + "train_acc": 0.68502, + "test_loss": 2.1800481369018554, + "test_acc": 0.4913, + "lyapunov": null, + "grad_norm": 0.8630956493497981, + "grad_max_sv": 0.3439564138650894, + "grad_min_sv": 1.570069879108793e-08, + "grad_condition": 28425423.95662601, + "lr": 0.0008498316702566826, + "time_sec": 32.60637044906616 + }, + { + "epoch": 39, + "train_loss": 1.0295844860839845, + "train_acc": 0.69618, + "test_loss": 2.1829655769348144, + "test_acc": 0.4986, + "lyapunov": null, + "grad_norm": 0.8554154024062846, + "grad_max_sv": 0.3512345805764198, + "grad_min_sv": 1.5957714531028567e-08, + "grad_condition": 62541984.17020081, + "lr": 0.0008422735529643442, + "time_sec": 32.61399698257446 + }, + { + "epoch": 40, + "train_loss": 1.0112493921279908, + "train_acc": 0.69542, + "test_loss": 2.115514920043945, + "test_acc": 0.5068, + "lyapunov": null, + "grad_norm": 0.8451701822146587, + "grad_max_sv": 0.33329174295067787, + "grad_min_sv": 1.5776219639690447e-08, + "grad_condition": 79832859.74387346, + "lr": 0.0008345653031794289, + "time_sec": 32.59746503829956 + }, + { + "epoch": 41, + "train_loss": 0.9991068764877319, + "train_acc": 0.70524, + "test_loss": 2.1873803031921386, + "test_acc": 0.5026, + "lyapunov": null, + "grad_norm": 0.8386854236688683, + "grad_max_sv": 0.3401566706597805, + "grad_min_sv": 1.5360383298634872e-08, + "grad_condition": 43801080.16344115, + "lr": 0.0008267103019950526, + "time_sec": 32.59045386314392 + }, + { + "epoch": 42, + "train_loss": 0.9736099641036987, + "train_acc": 0.70656, + "test_loss": 2.2409844583511354, + "test_acc": 0.484, + "lyapunov": null, + "grad_norm": 0.8291105761436245, + "grad_max_sv": 0.3179293151944876, + "grad_min_sv": 1.515972618756911e-08, + "grad_condition": 175687310.61382082, + "lr": 0.0008187119948743447, + "time_sec": 32.5880651473999 + }, + { + "epoch": 43, + "train_loss": 0.9563352813720704, + "train_acc": 0.71086, + "test_loss": 2.169837693977356, + "test_acc": 0.5013, + "lyapunov": null, + "grad_norm": 0.8214651478429573, + "grad_max_sv": 0.32580503448843956, + "grad_min_sv": 1.5053166909501094e-08, + "grad_condition": 45931164.8331637, + "lr": 0.000810573890139155, + "time_sec": 32.591588735580444 + }, + { + "epoch": 44, + "train_loss": 0.9295883957672119, + "train_acc": 0.71936, + "test_loss": 2.251956279373169, + "test_acc": 0.4997, + "lyapunov": null, + "grad_norm": 0.8193081635018687, + "grad_max_sv": 0.32752322033047676, + "grad_min_sv": 1.4865808058064228e-08, + "grad_condition": 254763425.4176507, + "lr": 0.0008022995574311873, + "time_sec": 32.61137008666992 + }, + { + "epoch": 45, + "train_loss": 0.9107750263214112, + "train_acc": 0.72198, + "test_loss": 2.268050945854187, + "test_acc": 0.5036, + "lyapunov": null, + "grad_norm": 0.8071951496588088, + "grad_max_sv": 0.31014049649238584, + "grad_min_sv": 1.4501045726526829e-08, + "grad_condition": 256138795.03682867, + "lr": 0.0007938926261462363, + "time_sec": 32.593836069107056 + }, + { + "epoch": 46, + "train_loss": 0.8840146226882934, + "train_acc": 0.73248, + "test_loss": 2.3333316173553467, + "test_acc": 0.4926, + "lyapunov": null, + "grad_norm": 0.8047440668964249, + "grad_max_sv": 0.31894322782754897, + "grad_min_sv": 1.4521474396306938e-08, + "grad_condition": 366185371.2855145, + "lr": 0.0007853567838422158, + "time_sec": 32.59914994239807 + }, + { + "epoch": 47, + "train_loss": 0.8691444579315185, + "train_acc": 0.73506, + "test_loss": 2.273669585800171, + "test_acc": 0.5092, + "lyapunov": null, + "grad_norm": 0.7946642486035804, + "grad_max_sv": 0.31746402755379677, + "grad_min_sv": 1.4334432538176678e-08, + "grad_condition": 162800049.316121, + "lr": 0.0007766957746216719, + "time_sec": 32.5816068649292 + }, + { + "epoch": 48, + "train_loss": 0.8467469311523438, + "train_acc": 0.741, + "test_loss": 2.3683644687652587, + "test_acc": 0.4945, + "lyapunov": null, + "grad_norm": 0.7803020466173483, + "grad_max_sv": 0.3124201364815235, + "grad_min_sv": 1.4153699946437004e-08, + "grad_condition": 81379073.14693151, + "lr": 0.0007679133974894982, + "time_sec": 32.57855439186096 + }, + { + "epoch": 49, + "train_loss": 0.8276354433059693, + "train_acc": 0.746, + "test_loss": 2.348865856933594, + "test_acc": 0.503, + "lyapunov": null, + "grad_norm": 0.7770327449715543, + "grad_max_sv": 0.30877858959138393, + "grad_min_sv": 1.405619010335507e-08, + "grad_condition": 259362022.72191978, + "lr": 0.000759013504686565, + "time_sec": 32.5961549282074 + }, + { + "epoch": 50, + "train_loss": 0.80362072599411, + "train_acc": 0.75188, + "test_loss": 2.347606075668335, + "test_acc": 0.5064, + "lyapunov": null, + "grad_norm": 0.7718135549452135, + "grad_max_sv": 0.30650909021496775, + "grad_min_sv": 1.3926891059834468e-08, + "grad_condition": 238755237.18455774, + "lr": 0.0007499999999999998, + "time_sec": 32.58652114868164 + }, + { + "epoch": 51, + "train_loss": 0.8076738609695434, + "train_acc": 0.75194, + "test_loss": 2.373729175186157, + "test_acc": 0.5041, + "lyapunov": null, + "grad_norm": 0.7691476122825985, + "grad_max_sv": 0.3075005076825619, + "grad_min_sv": 1.4049615590372433e-08, + "grad_condition": 73058100.40653792, + "lr": 0.0007408768370508575, + "time_sec": 32.58296465873718 + }, + { + "epoch": 52, + "train_loss": 0.7910924855804443, + "train_acc": 0.7557, + "test_loss": 2.5056129333496093, + "test_acc": 0.4897, + "lyapunov": null, + "grad_norm": 0.7617026431727135, + "grad_max_sv": 0.30800686217844486, + "grad_min_sv": 1.3826496124760835e-08, + "grad_condition": 189334380.72842854, + "lr": 0.0007316480175599307, + "time_sec": 32.627697229385376 + }, + { + "epoch": 53, + "train_loss": 0.7633206834983826, + "train_acc": 0.7641, + "test_loss": 2.3725709945678712, + "test_acc": 0.5126, + "lyapunov": null, + "grad_norm": 0.7544211785558737, + "grad_max_sv": 0.30351532325148584, + "grad_min_sv": 1.3343727502980462e-08, + "grad_condition": 487544076.1331793, + "lr": 0.0007223175895924635, + "time_sec": 32.59920334815979 + }, + { + "epoch": 54, + "train_loss": 0.7502616233825684, + "train_acc": 0.76742, + "test_loss": 2.359281371307373, + "test_acc": 0.5152, + "lyapunov": null, + "grad_norm": 0.7449828291399098, + "grad_max_sv": 0.2959673821926117, + "grad_min_sv": 1.3208014700916496e-08, + "grad_condition": 415965115.75810707, + "lr": 0.0007128896457825361, + "time_sec": 32.60435223579407 + }, + { + "epoch": 55, + "train_loss": 0.7417902284240723, + "train_acc": 0.7716, + "test_loss": 2.374223888015747, + "test_acc": 0.5043, + "lyapunov": null, + "grad_norm": 0.7381687420433285, + "grad_max_sv": 0.3085921786725521, + "grad_min_sv": 1.3457176572216622e-08, + "grad_condition": 355960264.02652407, + "lr": 0.0007033683215378998, + "time_sec": 32.6069917678833 + }, + { + "epoch": 56, + "train_loss": 0.7201570138549804, + "train_acc": 0.7776, + "test_loss": 2.5289041973114013, + "test_acc": 0.4991, + "lyapunov": null, + "grad_norm": 0.7319471417339568, + "grad_max_sv": 0.29403203129768374, + "grad_min_sv": 1.3126435492380462e-08, + "grad_condition": 102701306.62398617, + "lr": 0.0006937577932260512, + "time_sec": 32.61118412017822 + }, + { + "epoch": 57, + "train_loss": 0.7068166098403931, + "train_acc": 0.78014, + "test_loss": 2.4984960187911986, + "test_acc": 0.5052, + "lyapunov": null, + "grad_norm": 0.7313348821028376, + "grad_max_sv": 0.29538995064795015, + "grad_min_sv": 1.3354313459223998e-08, + "grad_condition": 518081595.0689063, + "lr": 0.0006840622763423388, + "time_sec": 32.60887265205383 + }, + { + "epoch": 58, + "train_loss": 0.6831113540458679, + "train_acc": 0.78586, + "test_loss": 2.4188764556884768, + "test_acc": 0.518, + "lyapunov": null, + "grad_norm": 0.7143603896389841, + "grad_max_sv": 0.29249175675213335, + "grad_min_sv": 1.2939957244606504e-08, + "grad_condition": 33033746.120541465, + "lr": 0.0006742860236609073, + "time_sec": 32.601460456848145 + }, + { + "epoch": 59, + "train_loss": 0.6521933509063721, + "train_acc": 0.79658, + "test_loss": 2.519079330062866, + "test_acc": 0.5081, + "lyapunov": null, + "grad_norm": 0.7094825210310041, + "grad_max_sv": 0.27764824479818345, + "grad_min_sv": 1.2391195380878628e-08, + "grad_condition": 38272959.65325786, + "lr": 0.0006644333233692913, + "time_sec": 32.58081579208374 + }, + { + "epoch": 60, + "train_loss": 0.6619705676078796, + "train_acc": 0.79326, + "test_loss": 2.333610046005249, + "test_acc": 0.5202, + "lyapunov": null, + "grad_norm": 0.7158904181821417, + "grad_max_sv": 0.29634682424366476, + "grad_min_sv": 1.2927760025221828e-08, + "grad_condition": 806783312.9815924, + "lr": 0.0006545084971874734, + "time_sec": 32.598530530929565 + }, + { + "epoch": 61, + "train_loss": 0.6327084550857544, + "train_acc": 0.80318, + "test_loss": 2.7702214424133302, + "test_acc": 0.4886, + "lyapunov": null, + "grad_norm": 0.6927365988787307, + "grad_max_sv": 0.2794598635286093, + "grad_min_sv": 1.2447203880106006e-08, + "grad_condition": 244549645.06864405, + "lr": 0.0006445158984722354, + "time_sec": 32.589969873428345 + }, + { + "epoch": 62, + "train_loss": 0.6203266059684753, + "train_acc": 0.80486, + "test_loss": 2.5082049884796143, + "test_acc": 0.5118, + "lyapunov": null, + "grad_norm": 0.6988717073980814, + "grad_max_sv": 0.2840553306043148, + "grad_min_sv": 1.2491288047325466e-08, + "grad_condition": 101912630.48903121, + "lr": 0.0006344599103076324, + "time_sec": 32.59857964515686 + }, + { + "epoch": 63, + "train_loss": 0.6090077508735656, + "train_acc": 0.80778, + "test_loss": 2.395359074211121, + "test_acc": 0.5237, + "lyapunov": null, + "grad_norm": 0.6924649230907168, + "grad_max_sv": 0.28618163615465164, + "grad_min_sv": 1.2502628839519692e-08, + "grad_condition": 86451645.85493946, + "lr": 0.0006243449435824269, + "time_sec": 32.59611201286316 + }, + { + "epoch": 64, + "train_loss": 0.5851399483680725, + "train_acc": 0.81618, + "test_loss": 2.6245384033203125, + "test_acc": 0.5032, + "lyapunov": null, + "grad_norm": 0.6839001107173612, + "grad_max_sv": 0.2753404140472412, + "grad_min_sv": 1.2281741042230454e-08, + "grad_condition": 70111759.32223424, + "lr": 0.0006141754350553275, + "time_sec": 32.60530376434326 + }, + { + "epoch": 65, + "train_loss": 0.5797093585586548, + "train_acc": 0.81722, + "test_loss": 2.4680503940582277, + "test_acc": 0.5167, + "lyapunov": null, + "grad_norm": 0.6773491015596559, + "grad_max_sv": 0.27119120582938194, + "grad_min_sv": 1.2128182125259457e-08, + "grad_condition": 29329714.921859503, + "lr": 0.0006039558454088793, + "time_sec": 32.5996458530426 + }, + { + "epoch": 66, + "train_loss": 0.5708195768547059, + "train_acc": 0.81862, + "test_loss": 2.4628547510147096, + "test_acc": 0.5236, + "lyapunov": null, + "grad_norm": 0.6613679437961346, + "grad_max_sv": 0.26192650087177755, + "grad_min_sv": 1.1950785359839815e-08, + "grad_condition": 160810765.41863006, + "lr": 0.000593690657292862, + "time_sec": 32.58818459510803 + }, + { + "epoch": 67, + "train_loss": 0.5540103606033325, + "train_acc": 0.82488, + "test_loss": 2.5581001953125, + "test_acc": 0.5113, + "lyapunov": null, + "grad_norm": 0.6580039591912937, + "grad_max_sv": 0.26643663719296456, + "grad_min_sv": 1.1754694354861039e-08, + "grad_condition": 139954745.95012397, + "lr": 0.0005833843733580507, + "time_sec": 32.588828563690186 + }, + { + "epoch": 68, + "train_loss": 0.5371956534671783, + "train_acc": 0.83146, + "test_loss": 2.4913981197357176, + "test_acc": 0.5163, + "lyapunov": null, + "grad_norm": 0.6562028097910022, + "grad_max_sv": 0.2671597957611084, + "grad_min_sv": 1.1955810450079568e-08, + "grad_condition": 199995064.23504788, + "lr": 0.0005730415142812054, + "time_sec": 32.60130739212036 + }, + { + "epoch": 69, + "train_loss": 0.5199291269493103, + "train_acc": 0.8348, + "test_loss": 2.515257999801636, + "test_acc": 0.523, + "lyapunov": null, + "grad_norm": 0.6492002375684193, + "grad_max_sv": 0.2655692081898451, + "grad_min_sv": 1.1676840729751837e-08, + "grad_condition": 55632325.70461162, + "lr": 0.0005626666167821517, + "time_sec": 32.59207487106323 + }, + { + "epoch": 70, + "train_loss": 0.5226033975219726, + "train_acc": 0.83408, + "test_loss": 2.587105647659302, + "test_acc": 0.5168, + "lyapunov": null, + "grad_norm": 0.6499925227037865, + "grad_max_sv": 0.2678232524544001, + "grad_min_sv": 1.1628125096488362e-08, + "grad_condition": 77360064.86943628, + "lr": 0.0005522642316338265, + "time_sec": 32.590487241744995 + }, + { + "epoch": 71, + "train_loss": 0.5042788141441346, + "train_acc": 0.83962, + "test_loss": 2.6780290996551512, + "test_acc": 0.5155, + "lyapunov": null, + "grad_norm": 0.6413478404511022, + "grad_max_sv": 0.27476422004401685, + "grad_min_sv": 1.1976047363526643e-08, + "grad_condition": 41599766.64955167, + "lr": 0.0005418389216661573, + "time_sec": 32.608052015304565 + }, + { + "epoch": 72, + "train_loss": 0.4914130021476746, + "train_acc": 0.84254, + "test_loss": 2.6799634628295896, + "test_acc": 0.5112, + "lyapunov": null, + "grad_norm": 0.6421521571868845, + "grad_max_sv": 0.2752946551889181, + "grad_min_sv": 1.1535952295846363e-08, + "grad_condition": 173057108.07366484, + "lr": 0.0005313952597646563, + "time_sec": 32.58746814727783 + }, + { + "epoch": 73, + "train_loss": 0.47570753255844117, + "train_acc": 0.84862, + "test_loss": 2.6893883739471436, + "test_acc": 0.5176, + "lyapunov": null, + "grad_norm": 0.6327416673284769, + "grad_max_sv": 0.26813027672469614, + "grad_min_sv": 1.1660086559998895e-08, + "grad_condition": 123233932.43288596, + "lr": 0.0005209378268645994, + "time_sec": 32.60110855102539 + }, + { + "epoch": 74, + "train_loss": 0.4707356683158875, + "train_acc": 0.84916, + "test_loss": 2.705184066772461, + "test_acc": 0.5134, + "lyapunov": null, + "grad_norm": 0.6317510073059565, + "grad_max_sv": 0.2683044508099556, + "grad_min_sv": 1.1382765011114238e-08, + "grad_condition": 37315987.94800802, + "lr": 0.0005104712099416781, + "time_sec": 32.60347580909729 + }, + { + "epoch": 75, + "train_loss": 0.4641658597373962, + "train_acc": 0.851, + "test_loss": 2.6986205451965333, + "test_acc": 0.5208, + "lyapunov": null, + "grad_norm": 0.6209909677536577, + "grad_max_sv": 0.26425978280603885, + "grad_min_sv": 1.1168030037561616e-08, + "grad_condition": 226919825.38563904, + "lr": 0.0004999999999999996, + "time_sec": 32.67061495780945 + }, + { + "epoch": 76, + "train_loss": 0.4528690433597565, + "train_acc": 0.85586, + "test_loss": 2.613859156417847, + "test_acc": 0.522, + "lyapunov": null, + "grad_norm": 0.617797835183575, + "grad_max_sv": 0.2607017453759909, + "grad_min_sv": 1.1361421214071965e-08, + "grad_condition": 237143111.14919743, + "lr": 0.0004895287900583212, + "time_sec": 32.602660179138184 + }, + { + "epoch": 77, + "train_loss": 0.43447011494636534, + "train_acc": 0.86002, + "test_loss": 2.6867597301483155, + "test_acc": 0.5196, + "lyapunov": null, + "grad_norm": 0.6028807353159102, + "grad_max_sv": 0.25386805906891824, + "grad_min_sv": 1.0792874089306064e-08, + "grad_condition": 509544290.6528182, + "lr": 0.0004790621731353997, + "time_sec": 32.60628342628479 + }, + { + "epoch": 78, + "train_loss": 0.42801210759162905, + "train_acc": 0.8611, + "test_loss": 2.7353676914215086, + "test_acc": 0.52, + "lyapunov": null, + "grad_norm": 0.6041598500376273, + "grad_max_sv": 0.2545783918350935, + "grad_min_sv": 1.0714695224773794e-08, + "grad_condition": 431729490.20616114, + "lr": 0.000468604740235343, + "time_sec": 32.59142065048218 + }, + { + "epoch": 79, + "train_loss": 0.41789625541687014, + "train_acc": 0.86464, + "test_loss": 2.693261518859863, + "test_acc": 0.524, + "lyapunov": null, + "grad_norm": 0.6071031366199182, + "grad_max_sv": 0.2566175889223814, + "grad_min_sv": 1.1114151432636614e-08, + "grad_condition": 3634833064.8054137, + "lr": 0.00045816107833384175, + "time_sec": 32.58738827705383 + }, + { + "epoch": 80, + "train_loss": 0.40703976345062254, + "train_acc": 0.87002, + "test_loss": 2.6887667331695555, + "test_acc": 0.5243, + "lyapunov": null, + "grad_norm": 0.5984471308299292, + "grad_max_sv": 0.2493945002555847, + "grad_min_sv": 1.061133420021676e-08, + "grad_condition": 80474406.45535596, + "lr": 0.0004477357683661729, + "time_sec": 32.61637735366821 + }, + { + "epoch": 81, + "train_loss": 0.40051113874435423, + "train_acc": 0.87134, + "test_loss": 2.6440505380630492, + "test_acc": 0.5185, + "lyapunov": null, + "grad_norm": 0.5907746722415285, + "grad_max_sv": 0.2511758103966713, + "grad_min_sv": 1.0482470419665486e-08, + "grad_condition": 1750678236.5886657, + "lr": 0.00043733338321784746, + "time_sec": 32.62238121032715 + }, + { + "epoch": 82, + "train_loss": 0.3885132439041138, + "train_acc": 0.87488, + "test_loss": 2.7878334438323975, + "test_acc": 0.5162, + "lyapunov": null, + "grad_norm": 0.58430027482298, + "grad_max_sv": 0.25240526124835017, + "grad_min_sv": 1.0581684940520058e-08, + "grad_condition": 269640397.6570332, + "lr": 0.0004269584857187939, + "time_sec": 32.626975536346436 + }, + { + "epoch": 83, + "train_loss": 0.3814581998252869, + "train_acc": 0.87684, + "test_loss": 2.8386356674194335, + "test_acc": 0.5142, + "lyapunov": null, + "grad_norm": 0.5766781312947917, + "grad_max_sv": 0.2504258405417204, + "grad_min_sv": 1.0411958474738914e-08, + "grad_condition": 184559288.66339245, + "lr": 0.0004166156266419484, + "time_sec": 32.611592292785645 + }, + { + "epoch": 84, + "train_loss": 0.3717445139122009, + "train_acc": 0.88038, + "test_loss": 2.814955038833618, + "test_acc": 0.5166, + "lyapunov": null, + "grad_norm": 0.5724757927650855, + "grad_max_sv": 0.23919779919087886, + "grad_min_sv": 1.010720067685334e-08, + "grad_condition": 6504970059.230141, + "lr": 0.0004063093427071373, + "time_sec": 32.595086336135864 + }, + { + "epoch": 85, + "train_loss": 0.3631134850883484, + "train_acc": 0.88234, + "test_loss": 2.896529895401001, + "test_acc": 0.517, + "lyapunov": null, + "grad_norm": 0.5716828110080233, + "grad_max_sv": 0.2572952527552843, + "grad_min_sv": 1.0620267017896757e-08, + "grad_condition": 140581074.527008, + "lr": 0.0003960441545911199, + "time_sec": 32.626396894454956 + }, + { + "epoch": 86, + "train_loss": 0.35211850923538207, + "train_acc": 0.88516, + "test_loss": 2.830642932128906, + "test_acc": 0.5181, + "lyapunov": null, + "grad_norm": 0.5652345515826299, + "grad_max_sv": 0.2406426455825567, + "grad_min_sv": 1.0035951097248087e-08, + "grad_condition": 157363298.29417515, + "lr": 0.0003858245649446718, + "time_sec": 32.61501336097717 + }, + { + "epoch": 87, + "train_loss": 0.34102174520492556, + "train_acc": 0.88968, + "test_loss": 2.76530976524353, + "test_acc": 0.5259, + "lyapunov": null, + "grad_norm": 0.5558383090650325, + "grad_max_sv": 0.2345995433628559, + "grad_min_sv": 9.800732628240105e-09, + "grad_condition": 383896288.09718305, + "lr": 0.00037565505641757235, + "time_sec": 32.634864807128906 + }, + { + "epoch": 88, + "train_loss": 0.33726214722633363, + "train_acc": 0.891, + "test_loss": 2.733760427856445, + "test_acc": 0.5244, + "lyapunov": null, + "grad_norm": 0.5538822301303683, + "grad_max_sv": 0.24563388302922248, + "grad_min_sv": 1.0018650633061843e-08, + "grad_condition": 118611521.33186904, + "lr": 0.00036554008969236695, + "time_sec": 32.63033366203308 + }, + { + "epoch": 89, + "train_loss": 0.3301980359172821, + "train_acc": 0.89216, + "test_loss": 2.918773532867432, + "test_acc": 0.5118, + "lyapunov": null, + "grad_norm": 0.5552064063111142, + "grad_max_sv": 0.24537508748471737, + "grad_min_sv": 9.913944656316995e-09, + "grad_condition": 272975400.6376897, + "lr": 0.0003554841015277638, + "time_sec": 32.60276007652283 + }, + { + "epoch": 90, + "train_loss": 0.3163340950202942, + "train_acc": 0.89878, + "test_loss": 2.7766964824676514, + "test_acc": 0.5264, + "lyapunov": null, + "grad_norm": 0.5400768317130968, + "grad_max_sv": 0.2411129016429186, + "grad_min_sv": 9.687033342576507e-09, + "grad_condition": 416321682.5560986, + "lr": 0.000345491502812526, + "time_sec": 32.60790824890137 + }, + { + "epoch": 91, + "train_loss": 0.3076762091016769, + "train_acc": 0.90074, + "test_loss": 2.825528881454468, + "test_acc": 0.5256, + "lyapunov": null, + "grad_norm": 0.5366393429500814, + "grad_max_sv": 0.24289038106799127, + "grad_min_sv": 9.893315243748933e-09, + "grad_condition": 8008206003.687421, + "lr": 0.0003355666766307081, + "time_sec": 32.62208580970764 + }, + { + "epoch": 92, + "train_loss": 0.30529593547821043, + "train_acc": 0.90092, + "test_loss": 2.869784680175781, + "test_acc": 0.5238, + "lyapunov": null, + "grad_norm": 0.5363473916144786, + "grad_max_sv": 0.23521617650985718, + "grad_min_sv": 9.505784433422663e-09, + "grad_condition": 442565148.9721116, + "lr": 0.00032571397633909225, + "time_sec": 32.64980983734131 + }, + { + "epoch": 93, + "train_loss": 0.29787114533424375, + "train_acc": 0.90402, + "test_loss": 2.8699749797821044, + "test_acc": 0.5267, + "lyapunov": null, + "grad_norm": 0.5298781438333415, + "grad_max_sv": 0.24197408594191075, + "grad_min_sv": 9.770249323687654e-09, + "grad_condition": 379108533.64883816, + "lr": 0.00031593772365766094, + "time_sec": 32.627405643463135 + }, + { + "epoch": 94, + "train_loss": 0.29400105224609374, + "train_acc": 0.9062, + "test_loss": 2.895481134033203, + "test_acc": 0.5249, + "lyapunov": null, + "grad_norm": 0.5247094262999626, + "grad_max_sv": 0.2358103074133396, + "grad_min_sv": 9.420375624100835e-09, + "grad_condition": 235198291.065983, + "lr": 0.0003062422067739483, + "time_sec": 32.62435960769653 + }, + { + "epoch": 95, + "train_loss": 0.28872565462112426, + "train_acc": 0.90588, + "test_loss": 3.11293623046875, + "test_acc": 0.5069, + "lyapunov": null, + "grad_norm": 0.5215261224841182, + "grad_max_sv": 0.25088537521660326, + "grad_min_sv": 9.650516582192756e-09, + "grad_condition": 1840672432.8984706, + "lr": 0.00029663167846209965, + "time_sec": 32.61182975769043 + }, + { + "epoch": 96, + "train_loss": 0.28140667702674865, + "train_acc": 0.91062, + "test_loss": 3.0343638908386232, + "test_acc": 0.515, + "lyapunov": null, + "grad_norm": 0.5141206525756735, + "grad_max_sv": 0.23001555018126965, + "grad_min_sv": 9.238026586018063e-09, + "grad_condition": 420023753.8812055, + "lr": 0.00028711035421746345, + "time_sec": 32.68735599517822 + }, + { + "epoch": 97, + "train_loss": 0.2734098640537262, + "train_acc": 0.91134, + "test_loss": 2.8863599807739257, + "test_acc": 0.5278, + "lyapunov": null, + "grad_norm": 0.5123884758919174, + "grad_max_sv": 0.23177284747362137, + "grad_min_sv": 9.441876753363276e-09, + "grad_condition": 389841901.45972645, + "lr": 0.00027768241040753615, + "time_sec": 32.61720895767212 + }, + { + "epoch": 98, + "train_loss": 0.26842240329742434, + "train_acc": 0.91246, + "test_loss": 3.0170704383850095, + "test_acc": 0.5129, + "lyapunov": null, + "grad_norm": 0.5119534215929997, + "grad_max_sv": 0.2332689631730318, + "grad_min_sv": 9.159953092601272e-09, + "grad_condition": 580671793.4936365, + "lr": 0.00026835198244006903, + "time_sec": 32.664491415023804 + }, + { + "epoch": 99, + "train_loss": 0.26015502326965334, + "train_acc": 0.91556, + "test_loss": 2.9550776737213136, + "test_acc": 0.5235, + "lyapunov": null, + "grad_norm": 0.5002440418943672, + "grad_max_sv": 0.23028606474399566, + "grad_min_sv": 9.332162127502312e-09, + "grad_condition": 808479124.7268131, + "lr": 0.0002591231629491421, + "time_sec": 32.647944688797 + }, + { + "epoch": 100, + "train_loss": 0.2549975943994522, + "train_acc": 0.91682, + "test_loss": 2.9257835506439207, + "test_acc": 0.5273, + "lyapunov": null, + "grad_norm": 0.49921981594604525, + "grad_max_sv": 0.23579159304499625, + "grad_min_sv": 9.433937244070211e-09, + "grad_condition": 407472481.62626183, + "lr": 0.0002499999999999997, + "time_sec": 32.635313987731934 + }, + { + "epoch": 101, + "train_loss": 0.24892131799697875, + "train_acc": 0.91962, + "test_loss": 3.0537579055786135, + "test_acc": 0.5204, + "lyapunov": null, + "grad_norm": 0.494706284038144, + "grad_max_sv": 0.23495413847267627, + "grad_min_sv": 9.133226261815851e-09, + "grad_condition": 1270457560.953787, + "lr": 0.00024098649531343477, + "time_sec": 32.63528537750244 + }, + { + "epoch": 102, + "train_loss": 0.24037195320129395, + "train_acc": 0.92222, + "test_loss": 2.9084070110321045, + "test_acc": 0.5314, + "lyapunov": null, + "grad_norm": 0.486463679580628, + "grad_max_sv": 0.22473125196993352, + "grad_min_sv": 8.789323869932975e-09, + "grad_condition": 149506255.08150166, + "lr": 0.0002320866025105016, + "time_sec": 32.62351393699646 + }, + { + "epoch": 103, + "train_loss": 0.23799612444877624, + "train_acc": 0.92292, + "test_loss": 2.9349034282684325, + "test_acc": 0.5289, + "lyapunov": null, + "grad_norm": 0.48727629294890773, + "grad_max_sv": 0.2274385754019022, + "grad_min_sv": 8.963414135660514e-09, + "grad_condition": 465258851.1966427, + "lr": 0.0002233042253783278, + "time_sec": 32.61650204658508 + }, + { + "epoch": 104, + "train_loss": 0.23054517783164977, + "train_acc": 0.92504, + "test_loss": 2.938683780670166, + "test_acc": 0.5266, + "lyapunov": null, + "grad_norm": 0.47776558566177757, + "grad_max_sv": 0.22822440713644027, + "grad_min_sv": 8.97047937394209e-09, + "grad_condition": 448967200.7070708, + "lr": 0.000214643216157784, + "time_sec": 32.62421631813049 + }, + { + "epoch": 105, + "train_loss": 0.22744343911170958, + "train_acc": 0.9273, + "test_loss": 2.9878555629730226, + "test_acc": 0.5259, + "lyapunov": null, + "grad_norm": 0.47552946244552535, + "grad_max_sv": 0.22355719469487667, + "grad_min_sv": 8.578639451193789e-09, + "grad_condition": 1230595930.5020957, + "lr": 0.00020610737385376332, + "time_sec": 32.64089250564575 + }, + { + "epoch": 106, + "train_loss": 0.2254838338279724, + "train_acc": 0.92664, + "test_loss": 2.890159453201294, + "test_acc": 0.5325, + "lyapunov": null, + "grad_norm": 0.4754280898805139, + "grad_max_sv": 0.22736473716795444, + "grad_min_sv": 8.855452674882275e-09, + "grad_condition": 227786621.55556726, + "lr": 0.00019770044256881242, + "time_sec": 32.62216234207153 + }, + { + "epoch": 107, + "train_loss": 0.21862738111495972, + "train_acc": 0.92946, + "test_loss": 2.9494735862731933, + "test_acc": 0.5339, + "lyapunov": null, + "grad_norm": 0.46844112806059024, + "grad_max_sv": 0.22530344501137733, + "grad_min_sv": 8.94512247944998e-09, + "grad_condition": 238603916.54803166, + "lr": 0.0001894261098608447, + "time_sec": 32.69642758369446 + }, + { + "epoch": 108, + "train_loss": 0.21242757941246032, + "train_acc": 0.93128, + "test_loss": 2.888539296340942, + "test_acc": 0.5374, + "lyapunov": null, + "grad_norm": 0.45815473843013677, + "grad_max_sv": 0.21505159176886082, + "grad_min_sv": 8.673661599459954e-09, + "grad_condition": 180782176.2580329, + "lr": 0.000181288005125655, + "time_sec": 32.64587926864624 + }, + { + "epoch": 109, + "train_loss": 0.20814263255119322, + "train_acc": 0.9323, + "test_loss": 2.9850453857421875, + "test_acc": 0.5313, + "lyapunov": null, + "grad_norm": 0.45710108435427255, + "grad_max_sv": 0.21654113940894604, + "grad_min_sv": 8.38159002782262e-09, + "grad_condition": 1071851437.3139431, + "lr": 0.0001732896980049473, + "time_sec": 32.6502947807312 + }, + { + "epoch": 110, + "train_loss": 0.21159317121982574, + "train_acc": 0.9313, + "test_loss": 2.9875508575439453, + "test_acc": 0.5337, + "lyapunov": null, + "grad_norm": 0.46209344732614477, + "grad_max_sv": 0.22466418109834194, + "grad_min_sv": 8.643569696542997e-09, + "grad_condition": 2628798540.5647016, + "lr": 0.00016543469682057076, + "time_sec": 32.64112162590027 + }, + { + "epoch": 111, + "train_loss": 0.20016858710289, + "train_acc": 0.93604, + "test_loss": 2.93681678276062, + "test_acc": 0.5316, + "lyapunov": null, + "grad_norm": 0.4518735980614093, + "grad_max_sv": 0.22103419229388238, + "grad_min_sv": 8.257411067674052e-09, + "grad_condition": 376107488.32890815, + "lr": 0.00015772644703565552, + "time_sec": 32.656370639801025 + }, + { + "epoch": 112, + "train_loss": 0.19515520360946656, + "train_acc": 0.9368, + "test_loss": 2.9751342456817627, + "test_acc": 0.5344, + "lyapunov": null, + "grad_norm": 0.44656573715114095, + "grad_max_sv": 0.21552282944321632, + "grad_min_sv": 8.250081655857e-09, + "grad_condition": 213559178.74106574, + "lr": 0.00015016832974331713, + "time_sec": 32.641249656677246 + }, + { + "epoch": 113, + "train_loss": 0.19505731956481934, + "train_acc": 0.9374, + "test_loss": 3.01028088684082, + "test_acc": 0.5328, + "lyapunov": null, + "grad_norm": 0.447762267994011, + "grad_max_sv": 0.22150389216840266, + "grad_min_sv": 8.272555637278515e-09, + "grad_condition": 575576846.4228761, + "lr": 0.00014276366018359834, + "time_sec": 32.61401128768921 + }, + { + "epoch": 114, + "train_loss": 0.19351220841407776, + "train_acc": 0.93888, + "test_loss": 3.0259054725646974, + "test_acc": 0.5329, + "lyapunov": null, + "grad_norm": 0.4440731938660848, + "grad_max_sv": 0.20611900761723517, + "grad_min_sv": 7.938974335932768e-09, + "grad_condition": 2117664654.6003728, + "lr": 0.00013551568628929425, + "time_sec": 32.62533736228943 + }, + { + "epoch": 115, + "train_loss": 0.18517933310508727, + "train_acc": 0.94, + "test_loss": 2.979716062164307, + "test_acc": 0.5322, + "lyapunov": null, + "grad_norm": 0.43223199561721015, + "grad_max_sv": 0.20325944386422634, + "grad_min_sv": 7.998736221349781e-09, + "grad_condition": 2267473453.6187987, + "lr": 0.00012842758726130276, + "time_sec": 32.59545683860779 + }, + { + "epoch": 116, + "train_loss": 0.18197948449134826, + "train_acc": 0.94188, + "test_loss": 3.0201827381134034, + "test_acc": 0.5299, + "lyapunov": null, + "grad_norm": 0.4333502572268812, + "grad_max_sv": 0.211935805529356, + "grad_min_sv": 7.94614953417757e-09, + "grad_condition": 758773851.5504032, + "lr": 0.0001215024721741218, + "time_sec": 32.5964834690094 + }, + { + "epoch": 117, + "train_loss": 0.18007635980367662, + "train_acc": 0.94096, + "test_loss": 3.027638053512573, + "test_acc": 0.53, + "lyapunov": null, + "grad_norm": 0.43212977193693003, + "grad_max_sv": 0.1994217723608017, + "grad_min_sv": 7.8184707179383e-09, + "grad_condition": 413386528.92379594, + "lr": 0.00011474337861210538, + "time_sec": 32.62613034248352 + }, + { + "epoch": 118, + "train_loss": 0.18450939226150512, + "train_acc": 0.9413, + "test_loss": 3.0377433166503907, + "test_acc": 0.5314, + "lyapunov": null, + "grad_norm": 0.4368133766676491, + "grad_max_sv": 0.21917820498347282, + "grad_min_sv": 8.205953756171974e-09, + "grad_condition": 451115729.3745159, + "lr": 0.00010815327133708009, + "time_sec": 32.633800745010376 + }, + { + "epoch": 119, + "train_loss": 0.17563085342884063, + "train_acc": 0.94378, + "test_loss": 3.031028490447998, + "test_acc": 0.531, + "lyapunov": null, + "grad_norm": 0.4297303205355355, + "grad_max_sv": 0.2180554073303938, + "grad_min_sv": 8.280064745706892e-09, + "grad_condition": 1295134584.8432426, + "lr": 0.00010173504098790182, + "time_sec": 32.608771324157715 + }, + { + "epoch": 120, + "train_loss": 0.1728181059885025, + "train_acc": 0.94516, + "test_loss": 3.0397233207702636, + "test_acc": 0.535, + "lyapunov": null, + "grad_norm": 0.42541267725329557, + "grad_max_sv": 0.2076257921755314, + "grad_min_sv": 7.818187247555716e-09, + "grad_condition": 538624769.2984645, + "lr": 9.549150281252629e-05, + "time_sec": 32.623777627944946 + }, + { + "epoch": 121, + "train_loss": 0.17342313063144685, + "train_acc": 0.94358, + "test_loss": 3.090806385421753, + "test_acc": 0.5259, + "lyapunov": null, + "grad_norm": 0.4279826646645282, + "grad_max_sv": 0.211811538413167, + "grad_min_sv": 8.37733668044671e-09, + "grad_condition": 2584607111.9359965, + "lr": 8.942539543314794e-05, + "time_sec": 32.60838270187378 + }, + { + "epoch": 122, + "train_loss": 0.16821347290039063, + "train_acc": 0.94568, + "test_loss": 2.970914940261841, + "test_acc": 0.5383, + "lyapunov": null, + "grad_norm": 0.4143477437049123, + "grad_max_sv": 0.2086195493116975, + "grad_min_sv": 7.770506423206147e-09, + "grad_condition": 706067729.9607236, + "lr": 8.353937964495024e-05, + "time_sec": 32.60011887550354 + }, + { + "epoch": 123, + "train_loss": 0.165188626871109, + "train_acc": 0.94708, + "test_loss": 3.146423945236206, + "test_acc": 0.5236, + "lyapunov": null, + "grad_norm": 0.4157699706699544, + "grad_max_sv": 0.2090679880231619, + "grad_min_sv": 7.940607924059733e-09, + "grad_condition": 557759889.9569094, + "lr": 7.783603724899243e-05, + "time_sec": 32.60132360458374 + }, + { + "epoch": 124, + "train_loss": 0.16185669136047362, + "train_acc": 0.94898, + "test_loss": 3.092581678771973, + "test_acc": 0.5309, + "lyapunov": null, + "grad_norm": 0.41386427981868507, + "grad_max_sv": 0.21234715208411217, + "grad_min_sv": 7.842563700820488e-09, + "grad_condition": 1249888567.8033772, + "lr": 7.231786991974666e-05, + "time_sec": 32.604347705841064 + }, + { + "epoch": 125, + "train_loss": 0.16584392420291902, + "train_acc": 0.947, + "test_loss": 3.1019040981292725, + "test_acc": 0.5267, + "lyapunov": null, + "grad_norm": 0.4192277900989539, + "grad_max_sv": 0.20565972849726677, + "grad_min_sv": 7.802029632162505e-09, + "grad_condition": 314909668.4775388, + "lr": 6.698729810778072e-05, + "time_sec": 32.616387605667114 + }, + { + "epoch": 126, + "train_loss": 0.1582554586648941, + "train_acc": 0.94992, + "test_loss": 3.092884744262695, + "test_acc": 0.5336, + "lyapunov": null, + "grad_norm": 0.40895799504788816, + "grad_max_sv": 0.20402971263974906, + "grad_min_sv": 7.793592751714762e-09, + "grad_condition": 105561894.73739907, + "lr": 6.184665997806817e-05, + "time_sec": 32.63440942764282 + }, + { + "epoch": 127, + "train_loss": 0.16116769627571106, + "train_acc": 0.94914, + "test_loss": 3.0276394256591797, + "test_acc": 0.5365, + "lyapunov": null, + "grad_norm": 0.4111628609488252, + "grad_max_sv": 0.20847035236656666, + "grad_min_sv": 7.640062939045199e-09, + "grad_condition": 818297996.510643, + "lr": 5.6898210384392595e-05, + "time_sec": 32.61918830871582 + }, + { + "epoch": 128, + "train_loss": 0.15127705811262132, + "train_acc": 0.95128, + "test_loss": 3.0493050357818605, + "test_acc": 0.53, + "lyapunov": null, + "grad_norm": 0.3977211579636293, + "grad_max_sv": 0.19759772382676602, + "grad_min_sv": 7.73080679484497e-09, + "grad_condition": 898008339.7060969, + "lr": 5.214411988029363e-05, + "time_sec": 32.60267949104309 + }, + { + "epoch": 129, + "train_loss": 0.15520440853118897, + "train_acc": 0.95012, + "test_loss": 3.1105175033569337, + "test_acc": 0.5289, + "lyapunov": null, + "grad_norm": 0.40439158508263096, + "grad_max_sv": 0.20421933494508265, + "grad_min_sv": 7.601044078008046e-09, + "grad_condition": 854191017.3859537, + "lr": 4.7586473766990294e-05, + "time_sec": 32.63329720497131 + }, + { + "epoch": 130, + "train_loss": 0.15371531970977784, + "train_acc": 0.95122, + "test_loss": 3.1062196437835694, + "test_acc": 0.5303, + "lyapunov": null, + "grad_norm": 0.40117927218947497, + "grad_max_sv": 0.20184723120182751, + "grad_min_sv": 7.375536336827384e-09, + "grad_condition": 1954247045.763169, + "lr": 4.32272711786996e-05, + "time_sec": 32.65104269981384 + }, + { + "epoch": 131, + "train_loss": 0.15117946271419525, + "train_acc": 0.95178, + "test_loss": 3.0734384868621825, + "test_acc": 0.5323, + "lyapunov": null, + "grad_norm": 0.4012856870279909, + "grad_max_sv": 0.21056946255266668, + "grad_min_sv": 7.716869526735613e-09, + "grad_condition": 1786469845.4801903, + "lr": 3.906842420574966e-05, + "time_sec": 32.60900163650513 + }, + { + "epoch": 132, + "train_loss": 0.14829608782052994, + "train_acc": 0.95304, + "test_loss": 3.1062648803710937, + "test_acc": 0.5321, + "lyapunov": null, + "grad_norm": 0.3934246590182889, + "grad_max_sv": 0.20152232367545367, + "grad_min_sv": 7.815424931572126e-09, + "grad_condition": 230026115.20600373, + "lr": 3.5111757055874305e-05, + "time_sec": 32.66224122047424 + }, + { + "epoch": 133, + "train_loss": 0.15090471013069154, + "train_acc": 0.95132, + "test_loss": 3.0866109645843505, + "test_acc": 0.5312, + "lyapunov": null, + "grad_norm": 0.3996390840824327, + "grad_max_sv": 0.20301406253129245, + "grad_min_sv": 7.4918664647039e-09, + "grad_condition": 163102203.53997582, + "lr": 3.1359005254054254e-05, + "time_sec": 32.708242893218994 + }, + { + "epoch": 134, + "train_loss": 0.14860970255374908, + "train_acc": 0.9524, + "test_loss": 3.0676291301727296, + "test_acc": 0.5382, + "lyapunov": null, + "grad_norm": 0.39867382966168935, + "grad_max_sv": 0.20453516952693462, + "grad_min_sv": 7.668875320722217e-09, + "grad_condition": 3561154814.827286, + "lr": 2.7811814881259484e-05, + "time_sec": 32.66806650161743 + }, + { + "epoch": 135, + "train_loss": 0.14866124527454377, + "train_acc": 0.95314, + "test_loss": 3.0443356689453127, + "test_acc": 0.5355, + "lyapunov": null, + "grad_norm": 0.39739197124103876, + "grad_max_sv": 0.1973813423886895, + "grad_min_sv": 7.404128056498482e-09, + "grad_condition": 129758782.41388819, + "lr": 2.4471741852423218e-05, + "time_sec": 32.678155183792114 + }, + { + "epoch": 136, + "train_loss": 0.14828838193655014, + "train_acc": 0.95252, + "test_loss": 3.123971256637573, + "test_acc": 0.529, + "lyapunov": null, + "grad_norm": 0.39827457639069835, + "grad_max_sv": 0.20285094752907754, + "grad_min_sv": 7.759793476660656e-09, + "grad_condition": 294182608.68720245, + "lr": 2.1340251233966362e-05, + "time_sec": 32.672452211380005 + }, + { + "epoch": 137, + "train_loss": 0.14890135494709014, + "train_acc": 0.95234, + "test_loss": 3.066171446609497, + "test_acc": 0.5396, + "lyapunov": null, + "grad_norm": 0.39748835107394653, + "grad_max_sv": 0.2081820584833622, + "grad_min_sv": 7.64267313203143e-09, + "grad_condition": 141448400.9724085, + "lr": 1.8418716601170932e-05, + "time_sec": 32.69361972808838 + }, + { + "epoch": 138, + "train_loss": 0.14276867793083192, + "train_acc": 0.95434, + "test_loss": 2.9989293914794923, + "test_acc": 0.5428, + "lyapunov": null, + "grad_norm": 0.38807574698322655, + "grad_max_sv": 0.1993431432172656, + "grad_min_sv": 7.447289089579367e-09, + "grad_condition": 237129012.49201822, + "lr": 1.570841943568445e-05, + "time_sec": 32.62693667411804 + }, + { + "epoch": 139, + "train_loss": 0.14445265219688416, + "train_acc": 0.9544, + "test_loss": 3.0897484813690186, + "test_acc": 0.5346, + "lyapunov": null, + "grad_norm": 0.3916453630848962, + "grad_max_sv": 0.20243223942816257, + "grad_min_sv": 7.469635450430522e-09, + "grad_condition": 1043014999.102849, + "lr": 1.3210548563419845e-05, + "time_sec": 32.64464712142944 + }, + { + "epoch": 140, + "train_loss": 0.1427642147541046, + "train_acc": 0.9543, + "test_loss": 3.031327156829834, + "test_acc": 0.535, + "lyapunov": null, + "grad_norm": 0.3886355958956018, + "grad_max_sv": 0.2018580801784992, + "grad_min_sv": 7.621796357590304e-09, + "grad_condition": 664163142.124336, + "lr": 1.0926199633097203e-05, + "time_sec": 32.660330057144165 + }, + { + "epoch": 141, + "train_loss": 0.14185610869407653, + "train_acc": 0.9552, + "test_loss": 3.0772051303863526, + "test_acc": 0.5339, + "lyapunov": null, + "grad_norm": 0.3868195908541027, + "grad_max_sv": 0.20251359287649393, + "grad_min_sv": 7.470099435509178e-09, + "grad_condition": 425734882.57352364, + "lr": 8.856374635655688e-06, + "time_sec": 32.65519666671753 + }, + { + "epoch": 142, + "train_loss": 0.14422438275337218, + "train_acc": 0.9542, + "test_loss": 3.103548192977905, + "test_acc": 0.5319, + "lyapunov": null, + "grad_norm": 0.39048104436108116, + "grad_max_sv": 0.19756273850798606, + "grad_min_sv": 7.4290536656012455e-09, + "grad_condition": 408291234.33779216, + "lr": 7.001981464747503e-06, + "time_sec": 32.636162996292114 + }, + { + "epoch": 143, + "train_loss": 0.14353974442481995, + "train_acc": 0.95526, + "test_loss": 3.060520997619629, + "test_acc": 0.5365, + "lyapunov": null, + "grad_norm": 0.3873027950363726, + "grad_max_sv": 0.19281232934445142, + "grad_min_sv": 7.347835982718376e-09, + "grad_condition": 456218223.5586403, + "lr": 5.3638335185058295e-06, + "time_sec": 32.627941608428955 + }, + { + "epoch": 144, + "train_loss": 0.13766098391532897, + "train_acc": 0.9576, + "test_loss": 3.074265901184082, + "test_acc": 0.5353, + "lyapunov": null, + "grad_norm": 0.37947012727353063, + "grad_max_sv": 0.19440167173743247, + "grad_min_sv": 7.409312191900257e-09, + "grad_condition": 2253415311.1792517, + "lr": 3.942649342761114e-06, + "time_sec": 32.63689088821411 + }, + { + "epoch": 145, + "train_loss": 0.14109201768398286, + "train_acc": 0.955, + "test_loss": 3.0755377796173096, + "test_acc": 0.5336, + "lyapunov": null, + "grad_norm": 0.38757758709785933, + "grad_max_sv": 0.19704692922532557, + "grad_min_sv": 7.600344460430633e-09, + "grad_condition": 469385402.5993269, + "lr": 2.7390523158633524e-06, + "time_sec": 32.65139961242676 + }, + { + "epoch": 146, + "train_loss": 0.14299009400129317, + "train_acc": 0.95634, + "test_loss": 3.0686098056793214, + "test_acc": 0.5358, + "lyapunov": null, + "grad_norm": 0.3850727042582934, + "grad_max_sv": 0.1909997107461095, + "grad_min_sv": 7.485124286425553e-09, + "grad_condition": 317122274.6411962, + "lr": 1.7535703752478133e-06, + "time_sec": 32.62571930885315 + }, + { + "epoch": 147, + "train_loss": 0.14365630741119384, + "train_acc": 0.95492, + "test_loss": 3.0893563858032227, + "test_acc": 0.5323, + "lyapunov": null, + "grad_norm": 0.38951329739569457, + "grad_max_sv": 0.2036223117262125, + "grad_min_sv": 7.65796798573963e-09, + "grad_condition": 1755238199.022799, + "lr": 9.866357858642196e-07, + "time_sec": 32.66820478439331 + }, + { + "epoch": 148, + "train_loss": 0.14392941450595856, + "train_acc": 0.95442, + "test_loss": 3.10996495513916, + "test_acc": 0.5333, + "lyapunov": null, + "grad_norm": 0.39173062163314015, + "grad_max_sv": 0.2063495099544525, + "grad_min_sv": 7.663834788052687e-09, + "grad_condition": 222918819.47768226, + "lr": 4.38584950570808e-07, + "time_sec": 32.634111404418945 + }, + { + "epoch": 149, + "train_loss": 0.14141702308177947, + "train_acc": 0.95578, + "test_loss": 3.0389966430664064, + "test_acc": 0.534, + "lyapunov": null, + "grad_norm": 0.38560681907582933, + "grad_max_sv": 0.19791325442492963, + "grad_min_sv": 7.532627289183036e-09, + "grad_condition": 849506689.896325, + "lr": 1.096582625772501e-07, + "time_sec": 32.64178252220154 + }, + { + "epoch": 150, + "train_loss": 0.13974891964912414, + "train_acc": 0.95672, + "test_loss": 3.210689444732666, + "test_acc": 0.5203, + "lyapunov": null, + "grad_norm": 0.38256728324762407, + "grad_max_sv": 0.20051277466118336, + "grad_min_sv": 7.596204577376211e-09, + "grad_condition": 281856943.28215134, + "lr": 0.0, + "time_sec": 32.64586281776428 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 4.859638395690918, + "train_acc": 0.03152, + "test_loss": 4.889715194702148, + "test_acc": 0.0151, + "lyapunov": null, + "grad_norm": 5.954232576741242, + "grad_max_sv": 5.307005989551544, + "grad_min_sv": 1.001358835961419e-07, + "grad_condition": 552075674.3072966, + "lr": 0.0009998903417374227, + "time_sec": 49.65645170211792 + }, + { + "epoch": 2, + "train_loss": 4.319389633789062, + "train_acc": 0.06024, + "test_loss": 5.013766458129883, + "test_acc": 0.0173, + "lyapunov": null, + "grad_norm": 4.418586259398957, + "grad_max_sv": 3.914894813299179, + "grad_min_sv": 7.522509295060376e-08, + "grad_condition": 339384355.6156703, + "lr": 0.0009995614150494292, + "time_sec": 49.6905255317688 + }, + { + "epoch": 3, + "train_loss": 4.047966442337036, + "train_acc": 0.0854, + "test_loss": 4.641720515441895, + "test_acc": 0.0253, + "lyapunov": null, + "grad_norm": 3.6205755412998126, + "grad_max_sv": 3.0519568264484405, + "grad_min_sv": 6.229751747799384e-08, + "grad_condition": 84094199.64624369, + "lr": 0.0009990133642141358, + "time_sec": 49.67904877662659 + }, + { + "epoch": 4, + "train_loss": 3.8478125959777834, + "train_acc": 0.11184, + "test_loss": 4.577606916809082, + "test_acc": 0.0413, + "lyapunov": null, + "grad_norm": 2.9979318778142026, + "grad_max_sv": 2.4593356758356095, + "grad_min_sv": 5.274777346020443e-08, + "grad_condition": 52832830.62142773, + "lr": 0.0009982464296247522, + "time_sec": 49.67163610458374 + }, + { + "epoch": 5, + "train_loss": 3.684693914794922, + "train_acc": 0.13424, + "test_loss": 4.5975259506225585, + "test_acc": 0.0484, + "lyapunov": null, + "grad_norm": 2.4914069485113255, + "grad_max_sv": 1.926499155163765, + "grad_min_sv": 4.2776759201501593e-08, + "grad_condition": 50734104.8860247, + "lr": 0.0009972609476841367, + "time_sec": 49.65700626373291 + }, + { + "epoch": 6, + "train_loss": 3.55050880859375, + "train_acc": 0.1559, + "test_loss": 4.727248001098633, + "test_acc": 0.0533, + "lyapunov": null, + "grad_norm": 2.1100231817712625, + "grad_max_sv": 1.550008636713028, + "grad_min_sv": 3.687378071770553e-08, + "grad_condition": 46855667.58563471, + "lr": 0.000996057350657239, + "time_sec": 49.679567098617554 + }, + { + "epoch": 7, + "train_loss": 3.442862378692627, + "train_acc": 0.17636, + "test_loss": 4.301828503417969, + "test_acc": 0.0729, + "lyapunov": null, + "grad_norm": 1.8012200630844488, + "grad_max_sv": 1.2357391178607942, + "grad_min_sv": 3.1382046258854325e-08, + "grad_condition": 65722163.37376006, + "lr": 0.000994636166481494, + "time_sec": 49.68814516067505 + }, + { + "epoch": 8, + "train_loss": 3.3536919964599607, + "train_acc": 0.18966, + "test_loss": 4.951620690155029, + "test_acc": 0.0532, + "lyapunov": null, + "grad_norm": 1.5680920854613782, + "grad_max_sv": 0.9788420423865318, + "grad_min_sv": 2.7002664731989868e-08, + "grad_condition": 58096765.61809726, + "lr": 0.0009929980185352525, + "time_sec": 49.675843238830566 + }, + { + "epoch": 9, + "train_loss": 3.269279045944214, + "train_acc": 0.20574, + "test_loss": 5.401820195770264, + "test_acc": 0.0537, + "lyapunov": null, + "grad_norm": 1.4267226502196788, + "grad_max_sv": 0.8291853129863739, + "grad_min_sv": 2.482418245408624e-08, + "grad_condition": 42172648.46717249, + "lr": 0.0009911436253643444, + "time_sec": 49.66762089729309 + }, + { + "epoch": 10, + "train_loss": 3.214019367523193, + "train_acc": 0.21578, + "test_loss": 4.996800016784668, + "test_acc": 0.0595, + "lyapunov": null, + "grad_norm": 1.3189803040238792, + "grad_max_sv": 0.7221315041184425, + "grad_min_sv": 2.3845375857201035e-08, + "grad_condition": 34648921.193528794, + "lr": 0.0009890738003669028, + "time_sec": 49.68191909790039 + }, + { + "epoch": 11, + "train_loss": 3.1423779235076905, + "train_acc": 0.23122, + "test_loss": 5.491759350585937, + "test_acc": 0.0514, + "lyapunov": null, + "grad_norm": 1.210815553275265, + "grad_max_sv": 0.6110412269830704, + "grad_min_sv": 2.156598551961153e-08, + "grad_condition": 36027430.82270874, + "lr": 0.00098678945143658, + "time_sec": 49.66831660270691 + }, + { + "epoch": 12, + "train_loss": 3.0939224156188967, + "train_acc": 0.23894, + "test_loss": 5.521206758117676, + "test_acc": 0.0477, + "lyapunov": null, + "grad_norm": 1.1454683736798692, + "grad_max_sv": 0.552279046177864, + "grad_min_sv": 2.1021200163895414e-08, + "grad_condition": 39875827.083382726, + "lr": 0.0009842915805643154, + "time_sec": 49.684069871902466 + }, + { + "epoch": 13, + "train_loss": 3.0491431757354737, + "train_acc": 0.24658, + "test_loss": 5.578466902160645, + "test_acc": 0.0531, + "lyapunov": null, + "grad_norm": 1.0920545496350367, + "grad_max_sv": 0.5008575700223445, + "grad_min_sv": 1.9939987251638147e-08, + "grad_condition": 78676545.0266799, + "lr": 0.000981581283398829, + "time_sec": 49.6787166595459 + }, + { + "epoch": 14, + "train_loss": 3.014207199859619, + "train_acc": 0.254, + "test_loss": 6.077666107940674, + "test_acc": 0.0514, + "lyapunov": null, + "grad_norm": 1.0343273898251877, + "grad_max_sv": 0.4525983504951, + "grad_min_sv": 1.86659577294801e-08, + "grad_condition": 28329944.590861797, + "lr": 0.0009786597487660333, + "time_sec": 49.7034227848053 + }, + { + "epoch": 15, + "train_loss": 2.9751409410095215, + "train_acc": 0.26042, + "test_loss": 6.2586611465454105, + "test_acc": 0.0429, + "lyapunov": null, + "grad_norm": 0.9902696753407212, + "grad_max_sv": 0.4210175834596157, + "grad_min_sv": 1.8090482711841106e-08, + "grad_condition": 25656377.04280036, + "lr": 0.0009755282581475766, + "time_sec": 49.6661171913147 + }, + { + "epoch": 16, + "train_loss": 2.93480419670105, + "train_acc": 0.26668, + "test_loss": 6.385146492004394, + "test_acc": 0.0363, + "lyapunov": null, + "grad_norm": 0.9387810522360384, + "grad_max_sv": 0.3934634834527969, + "grad_min_sv": 1.7115417286998197e-08, + "grad_condition": 344149202.01430434, + "lr": 0.0009721881851187403, + "time_sec": 49.67508864402771 + }, + { + "epoch": 17, + "train_loss": 2.8986016393280027, + "train_acc": 0.27286, + "test_loss": 6.562953887939453, + "test_acc": 0.0361, + "lyapunov": null, + "grad_norm": 0.9054609985871933, + "grad_max_sv": 0.35425483882427217, + "grad_min_sv": 1.6415356418608695e-08, + "grad_condition": 30574676.413671672, + "lr": 0.0009686409947459456, + "time_sec": 49.667582750320435 + }, + { + "epoch": 18, + "train_loss": 2.8772469989013674, + "train_acc": 0.2794, + "test_loss": 6.930446549987793, + "test_acc": 0.0423, + "lyapunov": null, + "grad_norm": 0.8844780733693258, + "grad_max_sv": 0.3656620219349861, + "grad_min_sv": 1.635258776149645e-08, + "grad_condition": 220836338.85584363, + "lr": 0.0009648882429441254, + "time_sec": 49.656644105911255 + }, + { + "epoch": 19, + "train_loss": 2.8373563732910156, + "train_acc": 0.28908, + "test_loss": 6.081598696136474, + "test_acc": 0.0401, + "lyapunov": null, + "grad_norm": 0.860957997804604, + "grad_max_sv": 0.3348636828362942, + "grad_min_sv": 1.5952280629782932e-08, + "grad_condition": 31599881.191394538, + "lr": 0.00096093157579425, + "time_sec": 49.67035698890686 + }, + { + "epoch": 20, + "train_loss": 2.8054893614959715, + "train_acc": 0.2914, + "test_loss": 6.01144070892334, + "test_acc": 0.0445, + "lyapunov": null, + "grad_norm": 0.8471187482170223, + "grad_max_sv": 0.3353402022272348, + "grad_min_sv": 1.5952383431577788e-08, + "grad_condition": 75803422.19622198, + "lr": 0.0009567727288213001, + "time_sec": 49.653173208236694 + }, + { + "epoch": 21, + "train_loss": 2.7821781129455565, + "train_acc": 0.29886, + "test_loss": 7.499567970275879, + "test_acc": 0.0423, + "lyapunov": null, + "grad_norm": 0.8293106417876014, + "grad_max_sv": 0.3269222855567932, + "grad_min_sv": 1.5338675737885944e-08, + "grad_condition": 29362265.48882215, + "lr": 0.0009524135262330095, + "time_sec": 49.67377185821533 + }, + { + "epoch": 22, + "train_loss": 2.7638499293518066, + "train_acc": 0.3032, + "test_loss": 6.383679943847656, + "test_acc": 0.0362, + "lyapunov": null, + "grad_norm": 0.8165833245054394, + "grad_max_sv": 0.3245947003364563, + "grad_min_sv": 1.5419339931266317e-08, + "grad_condition": 58376388.8753622, + "lr": 0.0009478558801197061, + "time_sec": 49.67671012878418 + }, + { + "epoch": 23, + "train_loss": 2.724514207687378, + "train_acc": 0.30706, + "test_loss": 5.952158892822266, + "test_acc": 0.0445, + "lyapunov": null, + "grad_norm": 0.8021101720231821, + "grad_max_sv": 0.3072248637676239, + "grad_min_sv": 1.4965002159694764e-08, + "grad_condition": 25664610.21875491, + "lr": 0.000943101789615607, + "time_sec": 49.704936265945435 + }, + { + "epoch": 24, + "train_loss": 2.708938373336792, + "train_acc": 0.31268, + "test_loss": 7.5166516456604, + "test_acc": 0.0558, + "lyapunov": null, + "grad_norm": 0.7795707854426385, + "grad_max_sv": 0.29907657466828824, + "grad_min_sv": 1.422086394337052e-08, + "grad_condition": 39674541.25272976, + "lr": 0.0009381533400219313, + "time_sec": 49.666532039642334 + }, + { + "epoch": 25, + "train_loss": 2.682072137298584, + "train_acc": 0.31728, + "test_loss": 6.62000643157959, + "test_acc": 0.0482, + "lyapunov": null, + "grad_norm": 0.7808971742139675, + "grad_max_sv": 0.29099693447351455, + "grad_min_sv": 1.4521361274555389e-08, + "grad_condition": 22205234.5206615, + "lr": 0.0009330127018922189, + "time_sec": 49.69266104698181 + }, + { + "epoch": 26, + "train_loss": 2.65549779296875, + "train_acc": 0.32384, + "test_loss": 6.58011586227417, + "test_acc": 0.052, + "lyapunov": null, + "grad_norm": 0.7695010065575659, + "grad_max_sv": 0.2835450112819672, + "grad_min_sv": 1.4190736662145209e-08, + "grad_condition": 50519202.54503296, + "lr": 0.000927682130080253, + "time_sec": 49.67102766036987 + }, + { + "epoch": 27, + "train_loss": 2.6304065126037597, + "train_acc": 0.32698, + "test_loss": 6.6322671501159665, + "test_acc": 0.0419, + "lyapunov": null, + "grad_norm": 0.750705382257285, + "grad_max_sv": 0.27432012744247913, + "grad_min_sv": 1.3865758934084037e-08, + "grad_condition": 41972624.03893653, + "lr": 0.0009221639627510072, + "time_sec": 49.66697978973389 + }, + { + "epoch": 28, + "train_loss": 2.6134433952331544, + "train_acc": 0.33008, + "test_loss": 6.623760261535645, + "test_acc": 0.0423, + "lyapunov": null, + "grad_norm": 0.7482482474592583, + "grad_max_sv": 0.27728364057838917, + "grad_min_sv": 1.3751216751400897e-08, + "grad_condition": 38932458.33089183, + "lr": 0.0009164606203550494, + "time_sec": 49.65370750427246 + }, + { + "epoch": 29, + "train_loss": 2.5960432355499266, + "train_acc": 0.33412, + "test_loss": 6.534938531494141, + "test_acc": 0.0482, + "lyapunov": null, + "grad_norm": 0.7410723983323744, + "grad_max_sv": 0.27464564964175225, + "grad_min_sv": 1.3711500621016448e-08, + "grad_condition": 42857069.88633077, + "lr": 0.0009105746045668516, + "time_sec": 49.68619203567505 + }, + { + "epoch": 30, + "train_loss": 2.5654613037872314, + "train_acc": 0.33868, + "test_loss": 6.90097837600708, + "test_acc": 0.0477, + "lyapunov": null, + "grad_norm": 0.7344540179832404, + "grad_max_sv": 0.2711446277797222, + "grad_min_sv": 1.3932310100051027e-08, + "grad_condition": 25213443.65097971, + "lr": 0.0009045084971874733, + "time_sec": 49.68855595588684 + }, + { + "epoch": 31, + "train_loss": 2.549656229248047, + "train_acc": 0.34158, + "test_loss": 6.697615758514404, + "test_acc": 0.0512, + "lyapunov": null, + "grad_norm": 0.7268186183289101, + "grad_max_sv": 0.27280680015683173, + "grad_min_sv": 1.357802058565838e-08, + "grad_condition": 23483839.830407344, + "lr": 0.0008982649590120977, + "time_sec": 49.676591873168945 + }, + { + "epoch": 32, + "train_loss": 2.5242956202697755, + "train_acc": 0.34892, + "test_loss": 6.319401416778565, + "test_acc": 0.053, + "lyapunov": null, + "grad_norm": 0.7259604933893773, + "grad_max_sv": 0.26320211961865425, + "grad_min_sv": 1.3533629053541497e-08, + "grad_condition": 39445604.10623846, + "lr": 0.0008918467286629196, + "time_sec": 49.692715883255005 + }, + { + "epoch": 33, + "train_loss": 2.5224684230804444, + "train_acc": 0.3463, + "test_loss": 7.63949846572876, + "test_acc": 0.039, + "lyapunov": null, + "grad_norm": 0.7143557279471436, + "grad_max_sv": 0.2541281133890152, + "grad_min_sv": 1.3116104637111991e-08, + "grad_condition": 39274316.41978644, + "lr": 0.0008852566213878943, + "time_sec": 49.73993396759033 + }, + { + "epoch": 34, + "train_loss": 2.497994396820068, + "train_acc": 0.35334, + "test_loss": 7.870207711791992, + "test_acc": 0.0503, + "lyapunov": null, + "grad_norm": 0.7116544610237331, + "grad_max_sv": 0.2558239698410034, + "grad_min_sv": 1.3238359958256396e-08, + "grad_condition": 21655318.49170895, + "lr": 0.000878497527825878, + "time_sec": 49.68305444717407 + }, + { + "epoch": 35, + "train_loss": 2.4686731043243406, + "train_acc": 0.35928, + "test_loss": 7.18174976348877, + "test_acc": 0.0357, + "lyapunov": null, + "grad_norm": 0.7007920609781888, + "grad_max_sv": 0.2539347130805254, + "grad_min_sv": 1.3282394706326528e-08, + "grad_condition": 21108486.486423627, + "lr": 0.000871572412738697, + "time_sec": 49.695449113845825 + }, + { + "epoch": 36, + "train_loss": 2.460664310836792, + "train_acc": 0.36364, + "test_loss": 7.128146871948243, + "test_acc": 0.0449, + "lyapunov": null, + "grad_norm": 0.69614807393942, + "grad_max_sv": 0.2554327756166458, + "grad_min_sv": 1.2980320013289415e-08, + "grad_condition": 22519369.226881642, + "lr": 0.0008644843137107055, + "time_sec": 49.66995120048523 + }, + { + "epoch": 37, + "train_loss": 2.4368207202148437, + "train_acc": 0.36728, + "test_loss": 7.258980679321289, + "test_acc": 0.0415, + "lyapunov": null, + "grad_norm": 0.6961411904435771, + "grad_max_sv": 0.24668896421790124, + "grad_min_sv": 1.2852767725113345e-08, + "grad_condition": 46202463.301736034, + "lr": 0.0008572363398164014, + "time_sec": 49.647136211395264 + }, + { + "epoch": 38, + "train_loss": 2.427408982620239, + "train_acc": 0.36802, + "test_loss": 7.733517263793945, + "test_acc": 0.048, + "lyapunov": null, + "grad_norm": 0.6919372250511854, + "grad_max_sv": 0.24009289182722568, + "grad_min_sv": 1.2789621656184025e-08, + "grad_condition": 20990751.217783477, + "lr": 0.0008498316702566826, + "time_sec": 49.67976427078247 + }, + { + "epoch": 39, + "train_loss": 2.4084082847595214, + "train_acc": 0.37116, + "test_loss": 8.442286386108398, + "test_acc": 0.0456, + "lyapunov": null, + "grad_norm": 0.6930170401512381, + "grad_max_sv": 0.24679070636630057, + "grad_min_sv": 1.2866078272222303e-08, + "grad_condition": 27175517.495315444, + "lr": 0.0008422735529643442, + "time_sec": 49.96265935897827 + }, + { + "epoch": 40, + "train_loss": 2.3789397065734863, + "train_acc": 0.377, + "test_loss": 8.60147202758789, + "test_acc": 0.0553, + "lyapunov": null, + "grad_norm": 0.6866977951205424, + "grad_max_sv": 0.2372380755841732, + "grad_min_sv": 1.2673489289960482e-08, + "grad_condition": 25134605.150391974, + "lr": 0.0008345653031794289, + "time_sec": 49.673630714416504 + }, + { + "epoch": 41, + "train_loss": 2.3719822661590575, + "train_acc": 0.37826, + "test_loss": 9.859453852844238, + "test_acc": 0.0381, + "lyapunov": null, + "grad_norm": 0.6832268983806022, + "grad_max_sv": 0.24582902267575263, + "grad_min_sv": 1.2850037944822646e-08, + "grad_condition": 24608396.69926225, + "lr": 0.0008267103019950526, + "time_sec": 49.68519139289856 + }, + { + "epoch": 42, + "train_loss": 2.3532817036437987, + "train_acc": 0.38358, + "test_loss": 7.662250825500489, + "test_acc": 0.0529, + "lyapunov": null, + "grad_norm": 0.6785583478283931, + "grad_max_sv": 0.242770054936409, + "grad_min_sv": 1.2961682474554869e-08, + "grad_condition": 22449199.409221668, + "lr": 0.0008187119948743447, + "time_sec": 49.68075966835022 + }, + { + "epoch": 43, + "train_loss": 2.330468462142944, + "train_acc": 0.3888, + "test_loss": 8.202189974975585, + "test_acc": 0.0414, + "lyapunov": null, + "grad_norm": 0.6778240032010198, + "grad_max_sv": 0.2364946186542511, + "grad_min_sv": 1.2662658638307179e-08, + "grad_condition": 81811853.66536663, + "lr": 0.000810573890139155, + "time_sec": 49.672260999679565 + }, + { + "epoch": 44, + "train_loss": 2.3200248764038087, + "train_acc": 0.39056, + "test_loss": 9.49625231628418, + "test_acc": 0.0399, + "lyapunov": null, + "grad_norm": 0.6781391809835111, + "grad_max_sv": 0.24071150235831737, + "grad_min_sv": 1.2508382562365084e-08, + "grad_condition": 46107093.29369648, + "lr": 0.0008022995574311873, + "time_sec": 49.77734994888306 + }, + { + "epoch": 45, + "train_loss": 2.3097952668762205, + "train_acc": 0.39266, + "test_loss": 8.424926385498047, + "test_acc": 0.0424, + "lyapunov": null, + "grad_norm": 0.671559529535967, + "grad_max_sv": 0.23751593232154847, + "grad_min_sv": 1.2544404863999715e-08, + "grad_condition": 159847416.163928, + "lr": 0.0007938926261462363, + "time_sec": 49.67583131790161 + }, + { + "epoch": 46, + "train_loss": 2.289791601486206, + "train_acc": 0.39376, + "test_loss": 7.675090921020508, + "test_acc": 0.0463, + "lyapunov": null, + "grad_norm": 0.6682654857478311, + "grad_max_sv": 0.23650372885167598, + "grad_min_sv": 1.2501646582535608e-08, + "grad_condition": 33733351.01726882, + "lr": 0.0007853567838422158, + "time_sec": 49.67869472503662 + }, + { + "epoch": 47, + "train_loss": 2.2834349323272707, + "train_acc": 0.39658, + "test_loss": 7.4819295173645015, + "test_acc": 0.0379, + "lyapunov": null, + "grad_norm": 0.6667226769561037, + "grad_max_sv": 0.2302993658930063, + "grad_min_sv": 1.2218414741083095e-08, + "grad_condition": 51227874.749703094, + "lr": 0.0007766957746216719, + "time_sec": 49.7194459438324 + }, + { + "epoch": 48, + "train_loss": 2.25024987701416, + "train_acc": 0.40146, + "test_loss": 8.022064225769043, + "test_acc": 0.0413, + "lyapunov": null, + "grad_norm": 0.6618464076252294, + "grad_max_sv": 0.23088047429919242, + "grad_min_sv": 1.2327867555256277e-08, + "grad_condition": 35182939.78342288, + "lr": 0.0007679133974894982, + "time_sec": 49.70452952384949 + }, + { + "epoch": 49, + "train_loss": 2.2388064471435545, + "train_acc": 0.40452, + "test_loss": 8.151009174346925, + "test_acc": 0.0628, + "lyapunov": null, + "grad_norm": 0.6630494068959804, + "grad_max_sv": 0.23379013687372208, + "grad_min_sv": 1.2465736873301658e-08, + "grad_condition": 33085394.279290985, + "lr": 0.000759013504686565, + "time_sec": 49.68948721885681 + }, + { + "epoch": 50, + "train_loss": 2.2181204542541506, + "train_acc": 0.41212, + "test_loss": 9.250449546813964, + "test_acc": 0.04, + "lyapunov": null, + "grad_norm": 0.6652991845905551, + "grad_max_sv": 0.22462675608694554, + "grad_min_sv": 1.2323866713237486e-08, + "grad_condition": 22263373.145076137, + "lr": 0.0007499999999999998, + "time_sec": 49.666321992874146 + }, + { + "epoch": 51, + "train_loss": 2.20994104057312, + "train_acc": 0.41342, + "test_loss": 9.559111304473877, + "test_acc": 0.0409, + "lyapunov": null, + "grad_norm": 0.6598918836052567, + "grad_max_sv": 0.23548415303230286, + "grad_min_sv": 1.2407575328277076e-08, + "grad_condition": 20825798.946305078, + "lr": 0.0007408768370508575, + "time_sec": 49.68445158004761 + }, + { + "epoch": 52, + "train_loss": 2.1999930603790285, + "train_acc": 0.41448, + "test_loss": 11.003676113891602, + "test_acc": 0.0334, + "lyapunov": null, + "grad_norm": 0.6588199824582822, + "grad_max_sv": 0.23691155388951302, + "grad_min_sv": 1.2400961009462197e-08, + "grad_condition": 41350669.39745356, + "lr": 0.0007316480175599307, + "time_sec": 49.71706438064575 + }, + { + "epoch": 53, + "train_loss": 2.180186467590332, + "train_acc": 0.42046, + "test_loss": 9.763460252380371, + "test_acc": 0.0326, + "lyapunov": null, + "grad_norm": 0.6586330831149164, + "grad_max_sv": 0.23136127404868603, + "grad_min_sv": 1.2327406417877996e-08, + "grad_condition": 21391463.196456783, + "lr": 0.0007223175895924635, + "time_sec": 49.695746421813965 + }, + { + "epoch": 54, + "train_loss": 2.1679266621398927, + "train_acc": 0.42156, + "test_loss": 7.939757450866699, + "test_acc": 0.0488, + "lyapunov": null, + "grad_norm": 0.6589906387540297, + "grad_max_sv": 0.2307649329304695, + "grad_min_sv": 1.2288389259623722e-08, + "grad_condition": 45621544.84620191, + "lr": 0.0007128896457825361, + "time_sec": 49.76089358329773 + }, + { + "epoch": 55, + "train_loss": 2.142840644683838, + "train_acc": 0.42656, + "test_loss": 8.888317533874512, + "test_acc": 0.0462, + "lyapunov": null, + "grad_norm": 0.6547801166710938, + "grad_max_sv": 0.22659273855388165, + "grad_min_sv": 1.2303670693381008e-08, + "grad_condition": 23597081.72903175, + "lr": 0.0007033683215378998, + "time_sec": 49.6726438999176 + }, + { + "epoch": 56, + "train_loss": 2.135846128311157, + "train_acc": 0.42756, + "test_loss": 8.83825325088501, + "test_acc": 0.0604, + "lyapunov": null, + "grad_norm": 0.657016926749893, + "grad_max_sv": 0.22309886030852794, + "grad_min_sv": 1.2188990075601147e-08, + "grad_condition": 23345059.14599296, + "lr": 0.0006937577932260512, + "time_sec": 49.6900200843811 + }, + { + "epoch": 57, + "train_loss": 2.1248773579406737, + "train_acc": 0.42806, + "test_loss": 10.463209185791015, + "test_acc": 0.0394, + "lyapunov": null, + "grad_norm": 0.6560747230768702, + "grad_max_sv": 0.22913397066295146, + "grad_min_sv": 1.2386757172744289e-08, + "grad_condition": 23336570.811041903, + "lr": 0.0006840622763423388, + "time_sec": 49.66491365432739 + }, + { + "epoch": 58, + "train_loss": 2.098032854232788, + "train_acc": 0.43608, + "test_loss": 8.402244955444337, + "test_acc": 0.0576, + "lyapunov": null, + "grad_norm": 0.6521436690740889, + "grad_max_sv": 0.22335078455507756, + "grad_min_sv": 1.2130738608930047e-08, + "grad_condition": 82226340.7870448, + "lr": 0.0006742860236609073, + "time_sec": 49.69048047065735 + }, + { + "epoch": 59, + "train_loss": 2.0929744161224364, + "train_acc": 0.43502, + "test_loss": 9.000237996673585, + "test_acc": 0.0422, + "lyapunov": null, + "grad_norm": 0.6596559776024251, + "grad_max_sv": 0.23497166410088538, + "grad_min_sv": 1.2387185107515242e-08, + "grad_condition": 84888311.49192938, + "lr": 0.0006644333233692913, + "time_sec": 49.65994358062744 + }, + { + "epoch": 60, + "train_loss": 2.065872961578369, + "train_acc": 0.43954, + "test_loss": 9.074447032165528, + "test_acc": 0.0437, + "lyapunov": null, + "grad_norm": 0.6572494317540103, + "grad_max_sv": 0.22353526391088963, + "grad_min_sv": 1.2282747853184506e-08, + "grad_condition": 47637090.98705881, + "lr": 0.0006545084971874734, + "time_sec": 49.6876540184021 + }, + { + "epoch": 61, + "train_loss": 2.0577297566223143, + "train_acc": 0.44062, + "test_loss": 9.532735338592529, + "test_acc": 0.0441, + "lyapunov": null, + "grad_norm": 0.6541690793509286, + "grad_max_sv": 0.22554977014660835, + "grad_min_sv": 1.222446728982307e-08, + "grad_condition": 40444318.030873686, + "lr": 0.0006445158984722354, + "time_sec": 49.701878786087036 + }, + { + "epoch": 62, + "train_loss": 2.043477922668457, + "train_acc": 0.4471, + "test_loss": 8.881709355926514, + "test_acc": 0.0408, + "lyapunov": null, + "grad_norm": 0.6528989117370432, + "grad_max_sv": 0.23128659874200821, + "grad_min_sv": 1.2199498941600773e-08, + "grad_condition": 25373537.768767178, + "lr": 0.0006344599103076324, + "time_sec": 49.68139433860779 + }, + { + "epoch": 63, + "train_loss": 2.0370414685821534, + "train_acc": 0.44656, + "test_loss": 8.181381430053712, + "test_acc": 0.0499, + "lyapunov": null, + "grad_norm": 0.6483431218966593, + "grad_max_sv": 0.22313697412610053, + "grad_min_sv": 1.205714866697738e-08, + "grad_condition": 41928205.378838554, + "lr": 0.0006243449435824269, + "time_sec": 49.67868185043335 + }, + { + "epoch": 64, + "train_loss": 2.023549471588135, + "train_acc": 0.45312, + "test_loss": 8.274014418029784, + "test_acc": 0.0515, + "lyapunov": null, + "grad_norm": 0.6449925645502804, + "grad_max_sv": 0.22069306187331678, + "grad_min_sv": 1.2058881553381195e-08, + "grad_condition": 93235177.09487496, + "lr": 0.0006141754350553275, + "time_sec": 49.690672397613525 + }, + { + "epoch": 65, + "train_loss": 2.0048684004974366, + "train_acc": 0.45552, + "test_loss": 9.286334159851075, + "test_acc": 0.046, + "lyapunov": null, + "grad_norm": 0.650044692049561, + "grad_max_sv": 0.23110067173838617, + "grad_min_sv": 1.2122515255985274e-08, + "grad_condition": 470414401.9889208, + "lr": 0.0006039558454088793, + "time_sec": 49.68914556503296 + }, + { + "epoch": 66, + "train_loss": 1.9918653341674806, + "train_acc": 0.4583, + "test_loss": 8.949441627502441, + "test_acc": 0.0572, + "lyapunov": null, + "grad_norm": 0.6465380976944957, + "grad_max_sv": 0.21693982630968095, + "grad_min_sv": 1.1910990151131617e-08, + "grad_condition": 25883377.52860467, + "lr": 0.000593690657292862, + "time_sec": 49.68254733085632 + }, + { + "epoch": 67, + "train_loss": 1.9803133847808838, + "train_acc": 0.46144, + "test_loss": 8.32604729232788, + "test_acc": 0.0508, + "lyapunov": null, + "grad_norm": 0.6479922287995563, + "grad_max_sv": 0.22669611796736716, + "grad_min_sv": 1.2100678287163547e-08, + "grad_condition": 28151058.773615837, + "lr": 0.0005833843733580507, + "time_sec": 49.68208575248718 + }, + { + "epoch": 68, + "train_loss": 1.9607464070892333, + "train_acc": 0.46388, + "test_loss": 9.707257481384277, + "test_acc": 0.0398, + "lyapunov": null, + "grad_norm": 0.6492114877298168, + "grad_max_sv": 0.2241646781563759, + "grad_min_sv": 1.210112051674983e-08, + "grad_condition": 25377171.051344726, + "lr": 0.0005730415142812054, + "time_sec": 49.68517184257507 + }, + { + "epoch": 69, + "train_loss": 1.9513853014373779, + "train_acc": 0.46884, + "test_loss": 8.47444464416504, + "test_acc": 0.0488, + "lyapunov": null, + "grad_norm": 0.6463513268584093, + "grad_max_sv": 0.2142929717898369, + "grad_min_sv": 1.1840976324450914e-08, + "grad_condition": 50285850.63139588, + "lr": 0.0005626666167821517, + "time_sec": 49.704482555389404 + }, + { + "epoch": 70, + "train_loss": 1.9367229152679444, + "train_acc": 0.47148, + "test_loss": 6.999028721618652, + "test_acc": 0.0484, + "lyapunov": null, + "grad_norm": 0.6501650263515466, + "grad_max_sv": 0.22791170775890351, + "grad_min_sv": 1.1914296331461127e-08, + "grad_condition": 36101160.51683195, + "lr": 0.0005522642316338265, + "time_sec": 49.665884256362915 + }, + { + "epoch": 71, + "train_loss": 1.9213849370574951, + "train_acc": 0.47454, + "test_loss": 8.607553945922852, + "test_acc": 0.046, + "lyapunov": null, + "grad_norm": 0.645136682733363, + "grad_max_sv": 0.21353928446769715, + "grad_min_sv": 1.1971198099480773e-08, + "grad_condition": 27321985.78115796, + "lr": 0.0005418389216661573, + "time_sec": 49.681238651275635 + }, + { + "epoch": 72, + "train_loss": 1.9093179278945922, + "train_acc": 0.47998, + "test_loss": 8.757230839538574, + "test_acc": 0.0444, + "lyapunov": null, + "grad_norm": 0.6452662854365648, + "grad_max_sv": 0.21823508627712726, + "grad_min_sv": 1.2026960773126038e-08, + "grad_condition": 26413534.165089346, + "lr": 0.0005313952597646563, + "time_sec": 49.692418575286865 + }, + { + "epoch": 73, + "train_loss": 1.8866335528182983, + "train_acc": 0.48264, + "test_loss": 10.402983039093018, + "test_acc": 0.0401, + "lyapunov": null, + "grad_norm": 0.6525277024285655, + "grad_max_sv": 0.23297128714621068, + "grad_min_sv": 1.2263412779017768e-08, + "grad_condition": 34782890.77935375, + "lr": 0.0005209378268645994, + "time_sec": 49.73197340965271 + }, + { + "epoch": 74, + "train_loss": 1.8747241662979126, + "train_acc": 0.48344, + "test_loss": 9.54773469543457, + "test_acc": 0.0397, + "lyapunov": null, + "grad_norm": 0.6482441280543788, + "grad_max_sv": 0.2259498331695795, + "grad_min_sv": 1.2019296095205911e-08, + "grad_condition": 47977623.301262416, + "lr": 0.0005104712099416781, + "time_sec": 49.6679584980011 + }, + { + "epoch": 75, + "train_loss": 1.8684229253387452, + "train_acc": 0.48648, + "test_loss": 9.898564820861816, + "test_acc": 0.0438, + "lyapunov": null, + "grad_norm": 0.6519077278808565, + "grad_max_sv": 0.23051740378141403, + "grad_min_sv": 1.2129807108740564e-08, + "grad_condition": 24509410.587565698, + "lr": 0.0004999999999999996, + "time_sec": 49.68412518501282 + }, + { + "epoch": 76, + "train_loss": 1.85779982421875, + "train_acc": 0.48786, + "test_loss": 9.483146997070312, + "test_acc": 0.0513, + "lyapunov": null, + "grad_norm": 0.6486728105276228, + "grad_max_sv": 0.2221123144030571, + "grad_min_sv": 1.1975807984176967e-08, + "grad_condition": 20557013.381313976, + "lr": 0.0004895287900583212, + "time_sec": 49.723254919052124 + }, + { + "epoch": 77, + "train_loss": 1.8444078363037109, + "train_acc": 0.49074, + "test_loss": 10.222208703613282, + "test_acc": 0.0465, + "lyapunov": null, + "grad_norm": 0.6454821533339739, + "grad_max_sv": 0.22238644734025, + "grad_min_sv": 1.2053597833738827e-08, + "grad_condition": 34583488.93828535, + "lr": 0.0004790621731353997, + "time_sec": 49.71964693069458 + }, + { + "epoch": 78, + "train_loss": 1.8336746375274657, + "train_acc": 0.49452, + "test_loss": 8.982472491455079, + "test_acc": 0.0428, + "lyapunov": null, + "grad_norm": 0.648872980564532, + "grad_max_sv": 0.22544824704527855, + "grad_min_sv": 1.2111463587594073e-08, + "grad_condition": 31218528.70310817, + "lr": 0.000468604740235343, + "time_sec": 49.689850091934204 + }, + { + "epoch": 79, + "train_loss": 1.8146154912948609, + "train_acc": 0.49856, + "test_loss": 9.511101889038086, + "test_acc": 0.0569, + "lyapunov": null, + "grad_norm": 0.6499657747983872, + "grad_max_sv": 0.21684016697108746, + "grad_min_sv": 1.2001167985428717e-08, + "grad_condition": 84780015.32537413, + "lr": 0.00045816107833384175, + "time_sec": 49.710490465164185 + }, + { + "epoch": 80, + "train_loss": 1.8103199542617798, + "train_acc": 0.49682, + "test_loss": 9.03535528869629, + "test_acc": 0.0596, + "lyapunov": null, + "grad_norm": 0.6479208488258928, + "grad_max_sv": 0.22531640119850635, + "grad_min_sv": 1.2292646991984846e-08, + "grad_condition": 22454640.541646004, + "lr": 0.0004477357683661729, + "time_sec": 49.691465616226196 + }, + { + "epoch": 81, + "train_loss": 1.7893104940414428, + "train_acc": 0.5054, + "test_loss": 10.460518026733398, + "test_acc": 0.0488, + "lyapunov": null, + "grad_norm": 0.644923356628824, + "grad_max_sv": 0.22309624291956426, + "grad_min_sv": 1.1942367686423872e-08, + "grad_condition": 28913062.47388742, + "lr": 0.00043733338321784746, + "time_sec": 49.66995024681091 + }, + { + "epoch": 82, + "train_loss": 1.7721799975585937, + "train_acc": 0.5086, + "test_loss": 10.09628585510254, + "test_acc": 0.0616, + "lyapunov": null, + "grad_norm": 0.6459601896535213, + "grad_max_sv": 0.22903541326522828, + "grad_min_sv": 1.2041541591623073e-08, + "grad_condition": 38183958.25474138, + "lr": 0.0004269584857187939, + "time_sec": 49.695367097854614 + }, + { + "epoch": 83, + "train_loss": 1.7660796548080444, + "train_acc": 0.51202, + "test_loss": 10.205337027740478, + "test_acc": 0.0579, + "lyapunov": null, + "grad_norm": 0.6415386933312663, + "grad_max_sv": 0.22064069882035256, + "grad_min_sv": 1.1835727964371045e-08, + "grad_condition": 49707962.67813484, + "lr": 0.0004166156266419484, + "time_sec": 49.68897724151611 + }, + { + "epoch": 84, + "train_loss": 1.7528482787322999, + "train_acc": 0.51238, + "test_loss": 10.510674937438965, + "test_acc": 0.0551, + "lyapunov": null, + "grad_norm": 0.6420313460573799, + "grad_max_sv": 0.22029150500893593, + "grad_min_sv": 1.19002487544706e-08, + "grad_condition": 28010796.791804053, + "lr": 0.0004063093427071373, + "time_sec": 49.67009973526001 + }, + { + "epoch": 85, + "train_loss": 1.7304393712615966, + "train_acc": 0.51912, + "test_loss": 10.982994299316406, + "test_acc": 0.0439, + "lyapunov": null, + "grad_norm": 0.6491775563207881, + "grad_max_sv": 0.22494816593825817, + "grad_min_sv": 1.1919110563807233e-08, + "grad_condition": 71167015.99452889, + "lr": 0.0003960441545911199, + "time_sec": 49.67024207115173 + }, + { + "epoch": 86, + "train_loss": 1.7296760926055907, + "train_acc": 0.5179, + "test_loss": 12.183889169311524, + "test_acc": 0.0429, + "lyapunov": null, + "grad_norm": 0.6457181992143765, + "grad_max_sv": 0.2269137304276228, + "grad_min_sv": 1.2231672415208283e-08, + "grad_condition": 26257302.177514024, + "lr": 0.0003858245649446718, + "time_sec": 49.69754147529602 + }, + { + "epoch": 87, + "train_loss": 1.7160073374938964, + "train_acc": 0.51966, + "test_loss": 10.396235189819336, + "test_acc": 0.0548, + "lyapunov": null, + "grad_norm": 0.6493023336876179, + "grad_max_sv": 0.22961441613733768, + "grad_min_sv": 1.215062691052593e-08, + "grad_condition": 63860503.24509815, + "lr": 0.00037565505641757235, + "time_sec": 49.73331546783447 + }, + { + "epoch": 88, + "train_loss": 1.69604633644104, + "train_acc": 0.52544, + "test_loss": 9.340446753692627, + "test_acc": 0.0728, + "lyapunov": null, + "grad_norm": 0.6443840050432499, + "grad_max_sv": 0.22305018082261086, + "grad_min_sv": 1.2058662629543803e-08, + "grad_condition": 22903366.234294124, + "lr": 0.00036554008969236695, + "time_sec": 49.68258500099182 + }, + { + "epoch": 89, + "train_loss": 1.686116159324646, + "train_acc": 0.53046, + "test_loss": 10.22809548034668, + "test_acc": 0.0669, + "lyapunov": null, + "grad_norm": 0.6527471973752481, + "grad_max_sv": 0.22662671245634555, + "grad_min_sv": 1.212674889117249e-08, + "grad_condition": 24089254.056239497, + "lr": 0.0003554841015277638, + "time_sec": 49.68924427032471 + }, + { + "epoch": 90, + "train_loss": 1.671509605369568, + "train_acc": 0.5327, + "test_loss": 9.615215731811523, + "test_acc": 0.0688, + "lyapunov": null, + "grad_norm": 0.6462652078206819, + "grad_max_sv": 0.2236987181007862, + "grad_min_sv": 1.189017963393324e-08, + "grad_condition": 27612763.066882085, + "lr": 0.000345491502812526, + "time_sec": 49.69840717315674 + }, + { + "epoch": 91, + "train_loss": 1.6624984580993651, + "train_acc": 0.536, + "test_loss": 10.048842260742187, + "test_acc": 0.0609, + "lyapunov": null, + "grad_norm": 0.6438868018824426, + "grad_max_sv": 0.22928938865661622, + "grad_min_sv": 1.231375408305979e-08, + "grad_condition": 31102496.91751959, + "lr": 0.0003355666766307081, + "time_sec": 49.69345760345459 + }, + { + "epoch": 92, + "train_loss": 1.6454121144866944, + "train_acc": 0.53824, + "test_loss": 10.659886444854736, + "test_acc": 0.0582, + "lyapunov": null, + "grad_norm": 0.6459174779206647, + "grad_max_sv": 0.22271668426692487, + "grad_min_sv": 1.1955724458709294e-08, + "grad_condition": 49431884.87251066, + "lr": 0.00032571397633909225, + "time_sec": 49.689369201660156 + }, + { + "epoch": 93, + "train_loss": 1.6353191635131836, + "train_acc": 0.53906, + "test_loss": 9.965699587249755, + "test_acc": 0.0575, + "lyapunov": null, + "grad_norm": 0.6423202651542173, + "grad_max_sv": 0.22649669870734215, + "grad_min_sv": 1.204985802111258e-08, + "grad_condition": 25156716.815343075, + "lr": 0.00031593772365766094, + "time_sec": 49.73896932601929 + }, + { + "epoch": 94, + "train_loss": 1.6325202992630006, + "train_acc": 0.5431, + "test_loss": 9.071397685241699, + "test_acc": 0.0695, + "lyapunov": null, + "grad_norm": 0.6428245517224749, + "grad_max_sv": 0.21980281323194503, + "grad_min_sv": 1.192267656546786e-08, + "grad_condition": 22650711.599471536, + "lr": 0.0003062422067739483, + "time_sec": 49.7198269367218 + }, + { + "epoch": 95, + "train_loss": 1.606196717262268, + "train_acc": 0.54818, + "test_loss": 8.367816310882569, + "test_acc": 0.0776, + "lyapunov": null, + "grad_norm": 0.6457909724289436, + "grad_max_sv": 0.2224169909954071, + "grad_min_sv": 1.1999331593626206e-08, + "grad_condition": 35216671.30915074, + "lr": 0.00029663167846209965, + "time_sec": 49.690680742263794 + }, + { + "epoch": 96, + "train_loss": 1.6063461293792725, + "train_acc": 0.54828, + "test_loss": 9.27298110961914, + "test_acc": 0.077, + "lyapunov": null, + "grad_norm": 0.6446146439502599, + "grad_max_sv": 0.2188148509711027, + "grad_min_sv": 1.2013536745437981e-08, + "grad_condition": 88105839.14324757, + "lr": 0.00028711035421746345, + "time_sec": 49.71056294441223 + }, + { + "epoch": 97, + "train_loss": 1.5933577481079102, + "train_acc": 0.55202, + "test_loss": 9.449084450531005, + "test_acc": 0.0758, + "lyapunov": null, + "grad_norm": 0.6476968381150254, + "grad_max_sv": 0.2339034289121628, + "grad_min_sv": 1.203146541908784e-08, + "grad_condition": 43551634.44199026, + "lr": 0.00027768241040753615, + "time_sec": 49.69766879081726 + }, + { + "epoch": 98, + "train_loss": 1.591065004196167, + "train_acc": 0.55214, + "test_loss": 10.3419208984375, + "test_acc": 0.0686, + "lyapunov": null, + "grad_norm": 0.6433842947219884, + "grad_max_sv": 0.22184760086238384, + "grad_min_sv": 1.171166537222712e-08, + "grad_condition": 26591015.123455554, + "lr": 0.00026835198244006903, + "time_sec": 49.6741418838501 + }, + { + "epoch": 99, + "train_loss": 1.5708992581558228, + "train_acc": 0.5541, + "test_loss": 9.679233166503906, + "test_acc": 0.0741, + "lyapunov": null, + "grad_norm": 0.6511371493998432, + "grad_max_sv": 0.2350587610155344, + "grad_min_sv": 1.220192144338328e-08, + "grad_condition": 37240674.16621633, + "lr": 0.0002591231629491421, + "time_sec": 49.696285009384155 + }, + { + "epoch": 100, + "train_loss": 1.551100101852417, + "train_acc": 0.56348, + "test_loss": 9.432355596923829, + "test_acc": 0.0791, + "lyapunov": null, + "grad_norm": 0.6453243326384995, + "grad_max_sv": 0.22425665520131588, + "grad_min_sv": 1.2029662103951732e-08, + "grad_condition": 30738494.303994678, + "lr": 0.0002499999999999997, + "time_sec": 49.68436861038208 + }, + { + "epoch": 101, + "train_loss": 1.5532271942901612, + "train_acc": 0.55978, + "test_loss": 9.434040171051025, + "test_acc": 0.0616, + "lyapunov": null, + "grad_norm": 0.639433522086335, + "grad_max_sv": 0.22706145085394383, + "grad_min_sv": 1.1892038905697566e-08, + "grad_condition": 56298122.78127275, + "lr": 0.00024098649531343477, + "time_sec": 49.683493852615356 + }, + { + "epoch": 102, + "train_loss": 1.5348824725341796, + "train_acc": 0.56456, + "test_loss": 10.389439101409913, + "test_acc": 0.0669, + "lyapunov": null, + "grad_norm": 0.6490720874290529, + "grad_max_sv": 0.23154064677655697, + "grad_min_sv": 1.2121260535569167e-08, + "grad_condition": 30682476.79699411, + "lr": 0.0002320866025105016, + "time_sec": 49.69867157936096 + }, + { + "epoch": 103, + "train_loss": 1.5266431330871582, + "train_acc": 0.56858, + "test_loss": 9.94574862060547, + "test_acc": 0.0678, + "lyapunov": null, + "grad_norm": 0.6437239166160994, + "grad_max_sv": 0.2314249102026224, + "grad_min_sv": 1.192760386778402e-08, + "grad_condition": 52932333.028864086, + "lr": 0.0002233042253783278, + "time_sec": 49.71239686012268 + }, + { + "epoch": 104, + "train_loss": 1.519191276550293, + "train_acc": 0.57046, + "test_loss": 9.50103433227539, + "test_acc": 0.0756, + "lyapunov": null, + "grad_norm": 0.6490448400504286, + "grad_max_sv": 0.23123296946287156, + "grad_min_sv": 1.2113768893540212e-08, + "grad_condition": 24236864.820650473, + "lr": 0.000214643216157784, + "time_sec": 49.689404010772705 + }, + { + "epoch": 105, + "train_loss": 1.5005081454086304, + "train_acc": 0.57444, + "test_loss": 9.965099095916749, + "test_acc": 0.0693, + "lyapunov": null, + "grad_norm": 0.6491011183929278, + "grad_max_sv": 0.22836548648774624, + "grad_min_sv": 1.202852232956575e-08, + "grad_condition": 27582529.6104938, + "lr": 0.00020610737385376332, + "time_sec": 49.67269563674927 + }, + { + "epoch": 106, + "train_loss": 1.5033813332748414, + "train_acc": 0.57306, + "test_loss": 9.635030019378663, + "test_acc": 0.0721, + "lyapunov": null, + "grad_norm": 0.6461521493499768, + "grad_max_sv": 0.2266597468405962, + "grad_min_sv": 1.2111771000022919e-08, + "grad_condition": 32769351.940291226, + "lr": 0.00019770044256881242, + "time_sec": 49.71150064468384 + }, + { + "epoch": 107, + "train_loss": 1.4887806078338623, + "train_acc": 0.577, + "test_loss": 10.65841329498291, + "test_acc": 0.0621, + "lyapunov": null, + "grad_norm": 0.6428151411383272, + "grad_max_sv": 0.22908008880913258, + "grad_min_sv": 1.1953098076264434e-08, + "grad_condition": 60404332.43394003, + "lr": 0.0001894261098608447, + "time_sec": 49.65379071235657 + }, + { + "epoch": 108, + "train_loss": 1.482557979812622, + "train_acc": 0.58012, + "test_loss": 10.995663577270507, + "test_acc": 0.0558, + "lyapunov": null, + "grad_norm": 0.6434848500971246, + "grad_max_sv": 0.22304323464632034, + "grad_min_sv": 1.1954295589533537e-08, + "grad_condition": 28308633.14617728, + "lr": 0.000181288005125655, + "time_sec": 49.6809778213501 + }, + { + "epoch": 109, + "train_loss": 1.4807045125961305, + "train_acc": 0.5761, + "test_loss": 10.382141474914551, + "test_acc": 0.0543, + "lyapunov": null, + "grad_norm": 0.6485812273480447, + "grad_max_sv": 0.22851772867143155, + "grad_min_sv": 1.2086838673680545e-08, + "grad_condition": 39819633.75962995, + "lr": 0.0001732896980049473, + "time_sec": 49.699816942214966 + }, + { + "epoch": 110, + "train_loss": 1.4687647978973388, + "train_acc": 0.5798, + "test_loss": 10.746252852630615, + "test_acc": 0.0581, + "lyapunov": null, + "grad_norm": 0.6477491765248105, + "grad_max_sv": 0.22796588242053986, + "grad_min_sv": 1.190428549864629e-08, + "grad_condition": 2481403210.897232, + "lr": 0.00016543469682057076, + "time_sec": 49.70393252372742 + }, + { + "epoch": 111, + "train_loss": 1.4610351712417602, + "train_acc": 0.58472, + "test_loss": 10.381590240478516, + "test_acc": 0.0706, + "lyapunov": null, + "grad_norm": 0.6432863166727308, + "grad_max_sv": 0.2280182782560587, + "grad_min_sv": 1.178467980700315e-08, + "grad_condition": 23561638.903859288, + "lr": 0.00015772644703565552, + "time_sec": 49.700050592422485 + }, + { + "epoch": 112, + "train_loss": 1.4397893406677247, + "train_acc": 0.58872, + "test_loss": 10.338137576293946, + "test_acc": 0.0599, + "lyapunov": null, + "grad_norm": 0.6467494327669687, + "grad_max_sv": 0.23485867716372014, + "grad_min_sv": 1.2035307057900458e-08, + "grad_condition": 31595880.944000162, + "lr": 0.00015016832974331713, + "time_sec": 49.682395696640015 + }, + { + "epoch": 113, + "train_loss": 1.437483701095581, + "train_acc": 0.58918, + "test_loss": 10.246157286834716, + "test_acc": 0.0695, + "lyapunov": null, + "grad_norm": 0.6445199386088715, + "grad_max_sv": 0.23770148158073426, + "grad_min_sv": 1.204057071199638e-08, + "grad_condition": 42814307.32532358, + "lr": 0.00014276366018359834, + "time_sec": 49.908040046691895 + }, + { + "epoch": 114, + "train_loss": 1.4359378748321534, + "train_acc": 0.59064, + "test_loss": 11.039534825134277, + "test_acc": 0.0677, + "lyapunov": null, + "grad_norm": 0.6454549822167893, + "grad_max_sv": 0.22823763974010944, + "grad_min_sv": 1.1876733774273188e-08, + "grad_condition": 291761738.736855, + "lr": 0.00013551568628929425, + "time_sec": 49.7189781665802 + }, + { + "epoch": 115, + "train_loss": 1.4275243659210206, + "train_acc": 0.59006, + "test_loss": 10.528610446166992, + "test_acc": 0.0607, + "lyapunov": null, + "grad_norm": 0.6419174836339578, + "grad_max_sv": 0.22392887100577355, + "grad_min_sv": 1.179641136994647e-08, + "grad_condition": 29644163.335674204, + "lr": 0.00012842758726130276, + "time_sec": 49.72235894203186 + }, + { + "epoch": 116, + "train_loss": 1.4133833700942993, + "train_acc": 0.5968, + "test_loss": 10.820313760375976, + "test_acc": 0.0656, + "lyapunov": null, + "grad_norm": 0.6402862784743208, + "grad_max_sv": 0.22353913970291614, + "grad_min_sv": 1.189429957625457e-08, + "grad_condition": 228542897.39170122, + "lr": 0.0001215024721741218, + "time_sec": 49.67416787147522 + }, + { + "epoch": 117, + "train_loss": 1.411485424194336, + "train_acc": 0.5969, + "test_loss": 10.931598986816406, + "test_acc": 0.0577, + "lyapunov": null, + "grad_norm": 0.6432402391559784, + "grad_max_sv": 0.23203586414456367, + "grad_min_sv": 1.2139712961961591e-08, + "grad_condition": 110163949.25366247, + "lr": 0.00011474337861210538, + "time_sec": 49.663209676742554 + }, + { + "epoch": 118, + "train_loss": 1.4068245391845704, + "train_acc": 0.59776, + "test_loss": 10.183176309204102, + "test_acc": 0.0661, + "lyapunov": null, + "grad_norm": 0.6353695968506081, + "grad_max_sv": 0.22307165674865245, + "grad_min_sv": 1.1665305550689898e-08, + "grad_condition": 28831682.14909323, + "lr": 0.00010815327133708009, + "time_sec": 49.666460037231445 + }, + { + "epoch": 119, + "train_loss": 1.402758886642456, + "train_acc": 0.59658, + "test_loss": 10.164851486968994, + "test_acc": 0.068, + "lyapunov": null, + "grad_norm": 0.6425028916342753, + "grad_max_sv": 0.22779931575059892, + "grad_min_sv": 1.1958535095502044e-08, + "grad_condition": 21934342.409149133, + "lr": 0.00010173504098790182, + "time_sec": 49.68137216567993 + }, + { + "epoch": 120, + "train_loss": 1.3951943067932129, + "train_acc": 0.60152, + "test_loss": 11.044304919433594, + "test_acc": 0.0561, + "lyapunov": null, + "grad_norm": 0.6395037593133598, + "grad_max_sv": 0.2298117656260729, + "grad_min_sv": 1.1937653743299138e-08, + "grad_condition": 30714208.442827284, + "lr": 9.549150281252629e-05, + "time_sec": 49.67395067214966 + }, + { + "epoch": 121, + "train_loss": 1.3848629484176636, + "train_acc": 0.60518, + "test_loss": 10.719858755493163, + "test_acc": 0.0613, + "lyapunov": null, + "grad_norm": 0.6409039434710538, + "grad_max_sv": 0.23021112196147442, + "grad_min_sv": 1.2000797192275591e-08, + "grad_condition": 88094665.51588485, + "lr": 8.942539543314794e-05, + "time_sec": 49.68539309501648 + }, + { + "epoch": 122, + "train_loss": 1.383416772441864, + "train_acc": 0.60336, + "test_loss": 10.908498886108399, + "test_acc": 0.0602, + "lyapunov": null, + "grad_norm": 0.6396202658591345, + "grad_max_sv": 0.22649863585829735, + "grad_min_sv": 1.1872581198724142e-08, + "grad_condition": 24190316.34547751, + "lr": 8.353937964495024e-05, + "time_sec": 49.74323534965515 + }, + { + "epoch": 123, + "train_loss": 1.3830355605316162, + "train_acc": 0.60662, + "test_loss": 11.06073507385254, + "test_acc": 0.0596, + "lyapunov": null, + "grad_norm": 0.6414185355965266, + "grad_max_sv": 0.22901145406067372, + "grad_min_sv": 1.187639367683513e-08, + "grad_condition": 38920910.596085645, + "lr": 7.783603724899243e-05, + "time_sec": 49.67411923408508 + }, + { + "epoch": 124, + "train_loss": 1.3857973796844483, + "train_acc": 0.60354, + "test_loss": 10.73814365234375, + "test_acc": 0.058, + "lyapunov": null, + "grad_norm": 0.6388025229517722, + "grad_max_sv": 0.22876498848199844, + "grad_min_sv": 1.190297436205745e-08, + "grad_condition": 61209450.617177986, + "lr": 7.231786991974666e-05, + "time_sec": 49.68229269981384 + }, + { + "epoch": 125, + "train_loss": 1.3747353953552246, + "train_acc": 0.60488, + "test_loss": 10.233182415771484, + "test_acc": 0.0698, + "lyapunov": null, + "grad_norm": 0.642290857798361, + "grad_max_sv": 0.22858595848083496, + "grad_min_sv": 1.182404016433769e-08, + "grad_condition": 50222976.90316618, + "lr": 6.698729810778072e-05, + "time_sec": 49.67239689826965 + }, + { + "epoch": 126, + "train_loss": 1.3646390200805665, + "train_acc": 0.60798, + "test_loss": 10.712554415893555, + "test_acc": 0.0619, + "lyapunov": null, + "grad_norm": 0.6444346593730015, + "grad_max_sv": 0.23416251130402088, + "grad_min_sv": 1.2051934158291423e-08, + "grad_condition": 38371603.51946256, + "lr": 6.184665997806817e-05, + "time_sec": 49.68101644515991 + }, + { + "epoch": 127, + "train_loss": 1.361701746749878, + "train_acc": 0.60984, + "test_loss": 9.981337495422363, + "test_acc": 0.0742, + "lyapunov": null, + "grad_norm": 0.6391219138584087, + "grad_max_sv": 0.23171120844781398, + "grad_min_sv": 1.1982857561071424e-08, + "grad_condition": 80290314.45824501, + "lr": 5.6898210384392595e-05, + "time_sec": 49.681220054626465 + }, + { + "epoch": 128, + "train_loss": 1.3609810097122192, + "train_acc": 0.61026, + "test_loss": 10.686243629455566, + "test_acc": 0.0651, + "lyapunov": null, + "grad_norm": 0.6439476104223152, + "grad_max_sv": 0.22856098897755145, + "grad_min_sv": 1.2080658841340242e-08, + "grad_condition": 28175177.95872122, + "lr": 5.214411988029363e-05, + "time_sec": 49.72053813934326 + }, + { + "epoch": 129, + "train_loss": 1.3554223305892945, + "train_acc": 0.61004, + "test_loss": 10.743426461791993, + "test_acc": 0.0659, + "lyapunov": null, + "grad_norm": 0.6410742403804591, + "grad_max_sv": 0.2301864292472601, + "grad_min_sv": 1.2166552429415666e-08, + "grad_condition": 26883740.735421486, + "lr": 4.7586473766990294e-05, + "time_sec": 49.71993637084961 + }, + { + "epoch": 130, + "train_loss": 1.3562946186447145, + "train_acc": 0.6077, + "test_loss": 10.435369656372071, + "test_acc": 0.07, + "lyapunov": null, + "grad_norm": 0.6419847905771429, + "grad_max_sv": 0.22915421687066556, + "grad_min_sv": 1.1826203434595062e-08, + "grad_condition": 26459291.18493547, + "lr": 4.32272711786996e-05, + "time_sec": 49.67161846160889 + }, + { + "epoch": 131, + "train_loss": 1.3406062643051146, + "train_acc": 0.61452, + "test_loss": 10.232965176391602, + "test_acc": 0.0678, + "lyapunov": null, + "grad_norm": 0.6370445726404382, + "grad_max_sv": 0.23454157300293446, + "grad_min_sv": 1.1869287505628101e-08, + "grad_condition": 26190518.474281415, + "lr": 3.906842420574966e-05, + "time_sec": 49.69346308708191 + }, + { + "epoch": 132, + "train_loss": 1.3423929140090942, + "train_acc": 0.61212, + "test_loss": 10.508147541046142, + "test_acc": 0.0657, + "lyapunov": null, + "grad_norm": 0.6410256128509625, + "grad_max_sv": 0.232170420140028, + "grad_min_sv": 1.2030591597239626e-08, + "grad_condition": 38638903.82439326, + "lr": 3.5111757055874305e-05, + "time_sec": 49.67495393753052 + }, + { + "epoch": 133, + "train_loss": 1.3460839172744752, + "train_acc": 0.61412, + "test_loss": 11.195313647460937, + "test_acc": 0.0626, + "lyapunov": null, + "grad_norm": 0.6429018549385016, + "grad_max_sv": 0.22996835298836232, + "grad_min_sv": 1.206329222035174e-08, + "grad_condition": 47960756.54148909, + "lr": 3.1359005254054254e-05, + "time_sec": 49.69527316093445 + }, + { + "epoch": 134, + "train_loss": 1.3375833387374878, + "train_acc": 0.6131, + "test_loss": 10.936044439697266, + "test_acc": 0.0556, + "lyapunov": null, + "grad_norm": 0.6427950071886837, + "grad_max_sv": 0.23044503889977933, + "grad_min_sv": 1.1702977692571587e-08, + "grad_condition": 172511605.9590092, + "lr": 2.7811814881259484e-05, + "time_sec": 49.67974376678467 + }, + { + "epoch": 135, + "train_loss": 1.3292542763519286, + "train_acc": 0.6175, + "test_loss": 11.204447370910644, + "test_acc": 0.0576, + "lyapunov": null, + "grad_norm": 0.6335156215396465, + "grad_max_sv": 0.22653024196624755, + "grad_min_sv": 1.1913050027706484e-08, + "grad_condition": 46289474.00172033, + "lr": 2.4471741852423218e-05, + "time_sec": 49.67492651939392 + }, + { + "epoch": 136, + "train_loss": 1.3332611156845093, + "train_acc": 0.61622, + "test_loss": 11.09446642150879, + "test_acc": 0.0641, + "lyapunov": null, + "grad_norm": 0.639400888793753, + "grad_max_sv": 0.2354104857891798, + "grad_min_sv": 1.1935800509066397e-08, + "grad_condition": 30595182.302482974, + "lr": 2.1340251233966362e-05, + "time_sec": 49.64705729484558 + }, + { + "epoch": 137, + "train_loss": 1.3288326668548585, + "train_acc": 0.62004, + "test_loss": 11.325076202392578, + "test_acc": 0.062, + "lyapunov": null, + "grad_norm": 0.6365332740022154, + "grad_max_sv": 0.2240052442997694, + "grad_min_sv": 1.164015398930074e-08, + "grad_condition": 27973787.98439459, + "lr": 1.8418716601170932e-05, + "time_sec": 49.68620848655701 + }, + { + "epoch": 138, + "train_loss": 1.3296554833221434, + "train_acc": 0.61622, + "test_loss": 11.250219662475587, + "test_acc": 0.0656, + "lyapunov": null, + "grad_norm": 0.6416267203331275, + "grad_max_sv": 0.232584772631526, + "grad_min_sv": 1.1945704529031654e-08, + "grad_condition": 41196373.456140414, + "lr": 1.570841943568445e-05, + "time_sec": 49.66656708717346 + }, + { + "epoch": 139, + "train_loss": 1.3251214186096192, + "train_acc": 0.61704, + "test_loss": 10.805933337402344, + "test_acc": 0.0671, + "lyapunov": null, + "grad_norm": 0.6410925237069093, + "grad_max_sv": 0.228699629381299, + "grad_min_sv": 1.1985534767444684e-08, + "grad_condition": 22417985.97103992, + "lr": 1.3210548563419845e-05, + "time_sec": 49.6790714263916 + }, + { + "epoch": 140, + "train_loss": 1.3237634344863891, + "train_acc": 0.61592, + "test_loss": 11.067021920776368, + "test_acc": 0.0679, + "lyapunov": null, + "grad_norm": 0.6375015765314956, + "grad_max_sv": 0.2266246847808361, + "grad_min_sv": 1.1820416521979294e-08, + "grad_condition": 28316613.45845435, + "lr": 1.0926199633097203e-05, + "time_sec": 49.67349076271057 + }, + { + "epoch": 141, + "train_loss": 1.3261828830718994, + "train_acc": 0.61808, + "test_loss": 11.25090906982422, + "test_acc": 0.0649, + "lyapunov": null, + "grad_norm": 0.6392179494036954, + "grad_max_sv": 0.23167021423578263, + "grad_min_sv": 1.2066529587410196e-08, + "grad_condition": 375343945.2928153, + "lr": 8.856374635655688e-06, + "time_sec": 49.67690658569336 + }, + { + "epoch": 142, + "train_loss": 1.3263437029266358, + "train_acc": 0.6176, + "test_loss": 10.572230374145509, + "test_acc": 0.07, + "lyapunov": null, + "grad_norm": 0.6394711874249032, + "grad_max_sv": 0.23341582007706166, + "grad_min_sv": 1.1937908653281148e-08, + "grad_condition": 26227900.21107275, + "lr": 7.001981464747503e-06, + "time_sec": 49.66385054588318 + }, + { + "epoch": 143, + "train_loss": 1.3200650732803345, + "train_acc": 0.6172, + "test_loss": 10.543097203826905, + "test_acc": 0.071, + "lyapunov": null, + "grad_norm": 0.6395699639233869, + "grad_max_sv": 0.23363734520971774, + "grad_min_sv": 1.2132445016341253e-08, + "grad_condition": 52550434.07017521, + "lr": 5.3638335185058295e-06, + "time_sec": 49.66163873672485 + }, + { + "epoch": 144, + "train_loss": 1.3308382055664063, + "train_acc": 0.61434, + "test_loss": 11.178705859375, + "test_acc": 0.0624, + "lyapunov": null, + "grad_norm": 0.641534220219546, + "grad_max_sv": 0.22773880399763585, + "grad_min_sv": 1.1764350836031279e-08, + "grad_condition": 191867576.52061495, + "lr": 3.942649342761114e-06, + "time_sec": 49.664501667022705 + }, + { + "epoch": 145, + "train_loss": 1.3221956774902344, + "train_acc": 0.61904, + "test_loss": 11.177163687133788, + "test_acc": 0.0661, + "lyapunov": null, + "grad_norm": 0.6396000766480665, + "grad_max_sv": 0.22918766662478446, + "grad_min_sv": 1.1855643147935802e-08, + "grad_condition": 149369487.7789059, + "lr": 2.7390523158633524e-06, + "time_sec": 49.670830965042114 + }, + { + "epoch": 146, + "train_loss": 1.319600304031372, + "train_acc": 0.62, + "test_loss": 11.415747598266602, + "test_acc": 0.0657, + "lyapunov": null, + "grad_norm": 0.6396846512615422, + "grad_max_sv": 0.22678725458681584, + "grad_min_sv": 1.1900367663866817e-08, + "grad_condition": 60665945.689223036, + "lr": 1.7535703752478133e-06, + "time_sec": 49.67027306556702 + }, + { + "epoch": 147, + "train_loss": 1.3258844360733033, + "train_acc": 0.6182, + "test_loss": 10.442874749755859, + "test_acc": 0.071, + "lyapunov": null, + "grad_norm": 0.6386988292192789, + "grad_max_sv": 0.22648476548492907, + "grad_min_sv": 1.1830113375022044e-08, + "grad_condition": 41984523.9416481, + "lr": 9.866357858642196e-07, + "time_sec": 49.676053524017334 + }, + { + "epoch": 148, + "train_loss": 1.3224727532577514, + "train_acc": 0.61936, + "test_loss": 11.328163026428223, + "test_acc": 0.0619, + "lyapunov": null, + "grad_norm": 0.6401500534411335, + "grad_max_sv": 0.23168128840625285, + "grad_min_sv": 1.199023767622107e-08, + "grad_condition": 1050894253.8704536, + "lr": 4.38584950570808e-07, + "time_sec": 49.68360710144043 + }, + { + "epoch": 149, + "train_loss": 1.3274797118377686, + "train_acc": 0.61862, + "test_loss": 10.757389901733399, + "test_acc": 0.0685, + "lyapunov": null, + "grad_norm": 0.639463631187681, + "grad_max_sv": 0.22796367555856706, + "grad_min_sv": 1.1743270168784736e-08, + "grad_condition": 77090960.9883382, + "lr": 1.096582625772501e-07, + "time_sec": 49.68101191520691 + }, + { + "epoch": 150, + "train_loss": 1.321363949546814, + "train_acc": 0.61964, + "test_loss": 10.926936387634278, + "test_acc": 0.0644, + "lyapunov": null, + "grad_norm": 0.6382758828308119, + "grad_max_sv": 0.22843386456370354, + "grad_min_sv": 1.2169918700566385e-08, + "grad_condition": 23341884.35923662, + "lr": 0.0, + "time_sec": 49.69367837905884 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 5.089254416656495, + "train_acc": 0.01344, + "test_loss": 4.870831555175781, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 5.582063459208639, + "grad_max_sv": 5.0306542873382565, + "grad_min_sv": 8.441757832766683e-08, + "grad_condition": 74707534.78681344, + "lr": 0.0009998903417374227, + "time_sec": 66.74431419372559 + }, + { + "epoch": 2, + "train_loss": 4.736304296569824, + "train_acc": 0.02172, + "test_loss": 4.92340059890747, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 4.087296772772229, + "grad_max_sv": 3.672157108783722, + "grad_min_sv": 6.109624839933935e-08, + "grad_condition": 230714811.36310124, + "lr": 0.0009995614150494292, + "time_sec": 66.75134921073914 + }, + { + "epoch": 3, + "train_loss": 4.52685978515625, + "train_acc": 0.03204, + "test_loss": 5.045831031799317, + "test_acc": 0.0094, + "lyapunov": null, + "grad_norm": 3.1470044543912175, + "grad_max_sv": 2.6447540044784548, + "grad_min_sv": 4.639755384339139e-08, + "grad_condition": 65625701.84585605, + "lr": 0.0009990133642141358, + "time_sec": 66.81799459457397 + }, + { + "epoch": 4, + "train_loss": 4.371717319641113, + "train_acc": 0.04112, + "test_loss": 4.993129699707032, + "test_acc": 0.0115, + "lyapunov": null, + "grad_norm": 2.5123688948843395, + "grad_max_sv": 2.1027904629707335, + "grad_min_sv": 3.615837387664633e-08, + "grad_condition": 418817692.03399765, + "lr": 0.0009982464296247522, + "time_sec": 66.83444166183472 + }, + { + "epoch": 5, + "train_loss": 4.27407361251831, + "train_acc": 0.0488, + "test_loss": 5.161634465789795, + "test_acc": 0.0119, + "lyapunov": null, + "grad_norm": 1.9573801826064445, + "grad_max_sv": 1.613087645173073, + "grad_min_sv": 2.8529539808364034e-08, + "grad_condition": 62747668.20627429, + "lr": 0.0009972609476841367, + "time_sec": 66.78564238548279 + }, + { + "epoch": 6, + "train_loss": 4.183251854553222, + "train_acc": 0.05812, + "test_loss": 5.447854755401611, + "test_acc": 0.0093, + "lyapunov": null, + "grad_norm": 1.436449079599314, + "grad_max_sv": 1.0459295481443405, + "grad_min_sv": 2.0654144772258576e-08, + "grad_condition": 94732574.16372415, + "lr": 0.000996057350657239, + "time_sec": 66.77538251876831 + }, + { + "epoch": 7, + "train_loss": 4.103355536193848, + "train_acc": 0.06872, + "test_loss": 5.544150679016114, + "test_acc": 0.0124, + "lyapunov": null, + "grad_norm": 1.082624040556548, + "grad_max_sv": 0.678101472556591, + "grad_min_sv": 1.6660088839048904e-08, + "grad_condition": 49338508.46283151, + "lr": 0.000994636166481494, + "time_sec": 66.75594520568848 + }, + { + "epoch": 8, + "train_loss": 4.040529095458984, + "train_acc": 0.07876, + "test_loss": 5.577163777160645, + "test_acc": 0.0172, + "lyapunov": null, + "grad_norm": 0.963869121683512, + "grad_max_sv": 0.5578698106110096, + "grad_min_sv": 1.4817374840991882e-08, + "grad_condition": 46172185.25999212, + "lr": 0.0009929980185352525, + "time_sec": 66.77279257774353 + }, + { + "epoch": 9, + "train_loss": 3.999490645446777, + "train_acc": 0.0856, + "test_loss": 5.472281336975097, + "test_acc": 0.0116, + "lyapunov": null, + "grad_norm": 0.9198022107734598, + "grad_max_sv": 0.5003849364817142, + "grad_min_sv": 1.3862486752946878e-08, + "grad_condition": 137028895.09887612, + "lr": 0.0009911436253643444, + "time_sec": 66.76341032981873 + }, + { + "epoch": 10, + "train_loss": 3.9641557629394533, + "train_acc": 0.09124, + "test_loss": 5.43024553604126, + "test_acc": 0.0112, + "lyapunov": null, + "grad_norm": 0.8539816540258655, + "grad_max_sv": 0.4397390566766262, + "grad_min_sv": 1.3177782898221579e-08, + "grad_condition": 50953468.3517745, + "lr": 0.0009890738003669028, + "time_sec": 66.75870108604431 + }, + { + "epoch": 11, + "train_loss": 3.9142907052612306, + "train_acc": 0.09788, + "test_loss": 5.24972756652832, + "test_acc": 0.0174, + "lyapunov": null, + "grad_norm": 0.8303589651826888, + "grad_max_sv": 0.4246540553867817, + "grad_min_sv": 1.288730961390705e-08, + "grad_condition": 88294678.08247125, + "lr": 0.00098678945143658, + "time_sec": 66.76091003417969 + }, + { + "epoch": 12, + "train_loss": 3.881778168411255, + "train_acc": 0.1037, + "test_loss": 5.765969756317139, + "test_acc": 0.0186, + "lyapunov": null, + "grad_norm": 0.7855031029198277, + "grad_max_sv": 0.3756070680916309, + "grad_min_sv": 1.2611303298881715e-08, + "grad_condition": 36786532.210794725, + "lr": 0.0009842915805643154, + "time_sec": 66.83831191062927 + }, + { + "epoch": 13, + "train_loss": 3.8490214154815674, + "train_acc": 0.1068, + "test_loss": 5.832162282562256, + "test_acc": 0.0138, + "lyapunov": null, + "grad_norm": 0.7681061932199776, + "grad_max_sv": 0.3604050487279892, + "grad_min_sv": 1.2243067453593382e-08, + "grad_condition": 131143000.26933214, + "lr": 0.000981581283398829, + "time_sec": 66.98098254203796 + }, + { + "epoch": 14, + "train_loss": 3.828877674636841, + "train_acc": 0.11234, + "test_loss": 6.293205305480957, + "test_acc": 0.0134, + "lyapunov": null, + "grad_norm": 0.7460407539013362, + "grad_max_sv": 0.34510768875479697, + "grad_min_sv": 1.1813573212726692e-08, + "grad_condition": 49629148.15911349, + "lr": 0.0009786597487660333, + "time_sec": 66.84203433990479 + }, + { + "epoch": 15, + "train_loss": 3.803487832107544, + "train_acc": 0.1159, + "test_loss": 6.4087516273498535, + "test_acc": 0.013, + "lyapunov": null, + "grad_norm": 0.716379034773642, + "grad_max_sv": 0.3261814657598734, + "grad_min_sv": 1.1572917107960378e-08, + "grad_condition": 31644703.4401185, + "lr": 0.0009755282581475766, + "time_sec": 66.78494954109192 + }, + { + "epoch": 16, + "train_loss": 3.7821172668457033, + "train_acc": 0.11904, + "test_loss": 6.406122239685058, + "test_acc": 0.0123, + "lyapunov": null, + "grad_norm": 0.697749546532161, + "grad_max_sv": 0.31582852490246294, + "grad_min_sv": 1.1393312793206434e-08, + "grad_condition": 39132519.74005551, + "lr": 0.0009721881851187403, + "time_sec": 66.78941893577576 + }, + { + "epoch": 17, + "train_loss": 3.7480180199432374, + "train_acc": 0.12526, + "test_loss": 6.8633532814025875, + "test_acc": 0.0132, + "lyapunov": null, + "grad_norm": 0.6758633251362415, + "grad_max_sv": 0.2994280070066452, + "grad_min_sv": 1.1069095015581176e-08, + "grad_condition": 36563832.03358241, + "lr": 0.0009686409947459456, + "time_sec": 66.86767721176147 + }, + { + "epoch": 18, + "train_loss": 3.730831000213623, + "train_acc": 0.12792, + "test_loss": 6.246407075500488, + "test_acc": 0.0177, + "lyapunov": null, + "grad_norm": 0.664831990265232, + "grad_max_sv": 0.2994547080248594, + "grad_min_sv": 1.0997234457625626e-08, + "grad_condition": 122736750.78260681, + "lr": 0.0009648882429441254, + "time_sec": 66.77909207344055 + }, + { + "epoch": 19, + "train_loss": 3.716553072052002, + "train_acc": 0.12942, + "test_loss": 5.873876965332031, + "test_acc": 0.0149, + "lyapunov": null, + "grad_norm": 0.6518241757841252, + "grad_max_sv": 0.29539270177483556, + "grad_min_sv": 1.0741561572852331e-08, + "grad_condition": 49669322.25294405, + "lr": 0.00096093157579425, + "time_sec": 66.85221266746521 + }, + { + "epoch": 20, + "train_loss": 3.6975706172180174, + "train_acc": 0.13298, + "test_loss": 6.400744886779785, + "test_acc": 0.0155, + "lyapunov": null, + "grad_norm": 0.6347864002121714, + "grad_max_sv": 0.28284979946911337, + "grad_min_sv": 1.0701284272607303e-08, + "grad_condition": 30013146.4819826, + "lr": 0.0009567727288213001, + "time_sec": 66.91982674598694 + }, + { + "epoch": 21, + "train_loss": 3.673498316040039, + "train_acc": 0.13564, + "test_loss": 6.160238801574707, + "test_acc": 0.0204, + "lyapunov": null, + "grad_norm": 0.6252581472584972, + "grad_max_sv": 0.27260397262871267, + "grad_min_sv": 1.0594542484282377e-08, + "grad_condition": 46350413.24314589, + "lr": 0.0009524135262330095, + "time_sec": 66.83625864982605 + }, + { + "epoch": 22, + "train_loss": 3.654527678833008, + "train_acc": 0.1393, + "test_loss": 6.9474281982421875, + "test_acc": 0.0176, + "lyapunov": null, + "grad_norm": 0.6149063083720292, + "grad_max_sv": 0.26224171184003353, + "grad_min_sv": 1.035294387718988e-08, + "grad_condition": 32282705.350815333, + "lr": 0.0009478558801197061, + "time_sec": 66.82992005348206 + }, + { + "epoch": 23, + "train_loss": 3.6450364729309084, + "train_acc": 0.14028, + "test_loss": 7.2393467880249025, + "test_acc": 0.0127, + "lyapunov": null, + "grad_norm": 0.6067467053692205, + "grad_max_sv": 0.26614573895931243, + "grad_min_sv": 1.0267544686692886e-08, + "grad_condition": 28213061.075003404, + "lr": 0.000943101789615607, + "time_sec": 66.82584643363953 + }, + { + "epoch": 24, + "train_loss": 3.623104200592041, + "train_acc": 0.14594, + "test_loss": 6.526107063293457, + "test_acc": 0.0187, + "lyapunov": null, + "grad_norm": 0.5980858749774747, + "grad_max_sv": 0.25203392654657364, + "grad_min_sv": 1.0098680717357534e-08, + "grad_condition": 50563247.00258337, + "lr": 0.0009381533400219313, + "time_sec": 66.82554173469543 + }, + { + "epoch": 25, + "train_loss": 3.6136645338439943, + "train_acc": 0.14728, + "test_loss": 7.030907647705078, + "test_acc": 0.0182, + "lyapunov": null, + "grad_norm": 0.594016587561951, + "grad_max_sv": 0.25378315448760985, + "grad_min_sv": 9.976338428627219e-09, + "grad_condition": 72065195.62747766, + "lr": 0.0009330127018922189, + "time_sec": 66.80855441093445 + }, + { + "epoch": 26, + "train_loss": 3.5951533477020265, + "train_acc": 0.15, + "test_loss": 6.8098891067504885, + "test_acc": 0.0193, + "lyapunov": null, + "grad_norm": 0.5888833643522708, + "grad_max_sv": 0.24365438856184482, + "grad_min_sv": 9.933017187935267e-09, + "grad_condition": 44149369.91233202, + "lr": 0.000927682130080253, + "time_sec": 66.90105819702148 + }, + { + "epoch": 27, + "train_loss": 3.5870719739532473, + "train_acc": 0.15012, + "test_loss": 6.188968405151368, + "test_acc": 0.0198, + "lyapunov": null, + "grad_norm": 0.5778870286561091, + "grad_max_sv": 0.23904258161783218, + "grad_min_sv": 9.864321945385335e-09, + "grad_condition": 29413784.94482057, + "lr": 0.0009221639627510072, + "time_sec": 66.80191397666931 + }, + { + "epoch": 28, + "train_loss": 3.5677108099365236, + "train_acc": 0.15438, + "test_loss": 7.111977198028565, + "test_acc": 0.0186, + "lyapunov": null, + "grad_norm": 0.565332521044754, + "grad_max_sv": 0.22653766870498657, + "grad_min_sv": 9.587734812674387e-09, + "grad_condition": 61781100.03898337, + "lr": 0.0009164606203550494, + "time_sec": 66.76739978790283 + }, + { + "epoch": 29, + "train_loss": 3.5525446216583254, + "train_acc": 0.1561, + "test_loss": 6.844758932495117, + "test_acc": 0.0209, + "lyapunov": null, + "grad_norm": 0.5709459777275144, + "grad_max_sv": 0.22716681994497775, + "grad_min_sv": 9.63618568827762e-09, + "grad_condition": 26044218.51829529, + "lr": 0.0009105746045668516, + "time_sec": 66.88382387161255 + }, + { + "epoch": 30, + "train_loss": 3.5511199297332765, + "train_acc": 0.15632, + "test_loss": 6.829617092895508, + "test_acc": 0.0179, + "lyapunov": null, + "grad_norm": 0.5599177583176913, + "grad_max_sv": 0.22315906584262848, + "grad_min_sv": 9.481845958392298e-09, + "grad_condition": 31696446.039096247, + "lr": 0.0009045084971874733, + "time_sec": 66.87736558914185 + }, + { + "epoch": 31, + "train_loss": 3.5346223778533936, + "train_acc": 0.15964, + "test_loss": 7.171929656982422, + "test_acc": 0.0181, + "lyapunov": null, + "grad_norm": 0.5560980115082016, + "grad_max_sv": 0.22190811820328235, + "grad_min_sv": 9.472099816998369e-09, + "grad_condition": 65999783.19253375, + "lr": 0.0008982649590120977, + "time_sec": 67.13842725753784 + }, + { + "epoch": 32, + "train_loss": 3.523619603424072, + "train_acc": 0.16298, + "test_loss": 7.11264291381836, + "test_acc": 0.0196, + "lyapunov": null, + "grad_norm": 0.5484008571230936, + "grad_max_sv": 0.21031202785670758, + "grad_min_sv": 9.324677128358382e-09, + "grad_condition": 59831756.702754, + "lr": 0.0008918467286629196, + "time_sec": 66.85003089904785 + }, + { + "epoch": 33, + "train_loss": 3.503953924026489, + "train_acc": 0.1662, + "test_loss": 6.848249008178711, + "test_acc": 0.0242, + "lyapunov": null, + "grad_norm": 0.5416204323895276, + "grad_max_sv": 0.2181798741221428, + "grad_min_sv": 9.399793365156769e-09, + "grad_condition": 389136802.1825175, + "lr": 0.0008852566213878943, + "time_sec": 66.87287449836731 + }, + { + "epoch": 34, + "train_loss": 3.505652629928589, + "train_acc": 0.16502, + "test_loss": 6.877189469909668, + "test_acc": 0.02, + "lyapunov": null, + "grad_norm": 0.5355113980631458, + "grad_max_sv": 0.20969012342393398, + "grad_min_sv": 9.270577998321538e-09, + "grad_condition": 31525454.84069126, + "lr": 0.000878497527825878, + "time_sec": 66.85899138450623 + }, + { + "epoch": 35, + "train_loss": 3.486978895339966, + "train_acc": 0.16714, + "test_loss": 7.1552359481811525, + "test_acc": 0.0172, + "lyapunov": null, + "grad_norm": 0.5346080374847578, + "grad_max_sv": 0.20298720821738242, + "grad_min_sv": 9.306896420202548e-09, + "grad_condition": 25441508.50613912, + "lr": 0.000871572412738697, + "time_sec": 66.81276679039001 + }, + { + "epoch": 36, + "train_loss": 3.481938878631592, + "train_acc": 0.1685, + "test_loss": 6.431350996398926, + "test_acc": 0.0245, + "lyapunov": null, + "grad_norm": 0.5311150175573837, + "grad_max_sv": 0.20061880052089692, + "grad_min_sv": 9.170909237576907e-09, + "grad_condition": 24479294.782169707, + "lr": 0.0008644843137107055, + "time_sec": 66.82223439216614 + }, + { + "epoch": 37, + "train_loss": 3.468437765579224, + "train_acc": 0.17124, + "test_loss": 6.530572232818604, + "test_acc": 0.0198, + "lyapunov": null, + "grad_norm": 0.5276521525054072, + "grad_max_sv": 0.19484757333993913, + "grad_min_sv": 9.140001265561804e-09, + "grad_condition": 33235283.773568917, + "lr": 0.0008572363398164014, + "time_sec": 66.81523728370667 + }, + { + "epoch": 38, + "train_loss": 3.4680467206573486, + "train_acc": 0.1688, + "test_loss": 7.093794832611084, + "test_acc": 0.0229, + "lyapunov": null, + "grad_norm": 0.5212998707352875, + "grad_max_sv": 0.19487478397786617, + "grad_min_sv": 8.903727073336642e-09, + "grad_condition": 56658397.537690006, + "lr": 0.0008498316702566826, + "time_sec": 66.73852157592773 + }, + { + "epoch": 39, + "train_loss": 3.446105847091675, + "train_acc": 0.17352, + "test_loss": 6.776045403289795, + "test_acc": 0.0237, + "lyapunov": null, + "grad_norm": 0.5212725973698809, + "grad_max_sv": 0.19792714342474937, + "grad_min_sv": 9.085871228303733e-09, + "grad_condition": 46760082.167771, + "lr": 0.0008422735529643442, + "time_sec": 67.0616934299469 + }, + { + "epoch": 40, + "train_loss": 3.4391634851837156, + "train_acc": 0.17672, + "test_loss": 7.587687799072266, + "test_acc": 0.0216, + "lyapunov": null, + "grad_norm": 0.5300570580240554, + "grad_max_sv": 0.20367281697690487, + "grad_min_sv": 9.141295443781256e-09, + "grad_condition": 126828260.46725988, + "lr": 0.0008345653031794289, + "time_sec": 66.80781960487366 + }, + { + "epoch": 41, + "train_loss": 3.4357695812988283, + "train_acc": 0.17624, + "test_loss": 7.211737112426758, + "test_acc": 0.0222, + "lyapunov": null, + "grad_norm": 0.5223568323053726, + "grad_max_sv": 0.19902292899787427, + "grad_min_sv": 9.146015303440613e-09, + "grad_condition": 25165381.505554177, + "lr": 0.0008267103019950526, + "time_sec": 66.90729665756226 + }, + { + "epoch": 42, + "train_loss": 3.426037024002075, + "train_acc": 0.17732, + "test_loss": 7.175137020874024, + "test_acc": 0.0218, + "lyapunov": null, + "grad_norm": 0.5101943237446857, + "grad_max_sv": 0.1887429542839527, + "grad_min_sv": 8.85594173063997e-09, + "grad_condition": 35650593.40143595, + "lr": 0.0008187119948743447, + "time_sec": 66.81169581413269 + }, + { + "epoch": 43, + "train_loss": 3.4184053784942625, + "train_acc": 0.17964, + "test_loss": 7.844732983398438, + "test_acc": 0.0242, + "lyapunov": null, + "grad_norm": 0.5099518428696158, + "grad_max_sv": 0.19498886093497275, + "grad_min_sv": 9.008296121548742e-09, + "grad_condition": 27266459.636599384, + "lr": 0.000810573890139155, + "time_sec": 66.85266208648682 + }, + { + "epoch": 44, + "train_loss": 3.4024582288360596, + "train_acc": 0.18462, + "test_loss": 7.218817704772949, + "test_acc": 0.0253, + "lyapunov": null, + "grad_norm": 0.5122229926391642, + "grad_max_sv": 0.19076302275061607, + "grad_min_sv": 8.938243520849321e-09, + "grad_condition": 198668402.87631398, + "lr": 0.0008022995574311873, + "time_sec": 66.91685390472412 + }, + { + "epoch": 45, + "train_loss": 3.385272266693115, + "train_acc": 0.18668, + "test_loss": 8.044592700958251, + "test_acc": 0.0186, + "lyapunov": null, + "grad_norm": 0.5074072133149611, + "grad_max_sv": 0.18489782735705376, + "grad_min_sv": 9.009793366931972e-09, + "grad_condition": 24986066.478751726, + "lr": 0.0007938926261462363, + "time_sec": 66.84079718589783 + }, + { + "epoch": 46, + "train_loss": 3.3847679064178466, + "train_acc": 0.18552, + "test_loss": 7.005147599792481, + "test_acc": 0.0259, + "lyapunov": null, + "grad_norm": 0.5036864657569943, + "grad_max_sv": 0.18339827209711074, + "grad_min_sv": 8.858673714029486e-09, + "grad_condition": 25159828.95523686, + "lr": 0.0007853567838422158, + "time_sec": 66.77542781829834 + }, + { + "epoch": 47, + "train_loss": 3.377982001876831, + "train_acc": 0.18574, + "test_loss": 6.535616015625, + "test_acc": 0.0279, + "lyapunov": null, + "grad_norm": 0.5002497348288438, + "grad_max_sv": 0.17932576797902583, + "grad_min_sv": 8.886634791926973e-09, + "grad_condition": 22814741.087062966, + "lr": 0.0007766957746216719, + "time_sec": 66.77253365516663 + }, + { + "epoch": 48, + "train_loss": 3.3632313873291015, + "train_acc": 0.19082, + "test_loss": 7.1207671043396, + "test_acc": 0.0249, + "lyapunov": null, + "grad_norm": 0.5004802145477826, + "grad_max_sv": 0.18168221227824688, + "grad_min_sv": 8.832463756474479e-09, + "grad_condition": 138537611.52251583, + "lr": 0.0007679133974894982, + "time_sec": 66.92418003082275 + }, + { + "epoch": 49, + "train_loss": 3.357747060012817, + "train_acc": 0.19018, + "test_loss": 7.041590236663819, + "test_acc": 0.0255, + "lyapunov": null, + "grad_norm": 0.49897992316233614, + "grad_max_sv": 0.18335177674889563, + "grad_min_sv": 8.811863486113402e-09, + "grad_condition": 24782694.997001432, + "lr": 0.000759013504686565, + "time_sec": 66.93407106399536 + }, + { + "epoch": 50, + "train_loss": 3.3515787353515627, + "train_acc": 0.19116, + "test_loss": 7.133926119995118, + "test_acc": 0.0241, + "lyapunov": null, + "grad_norm": 0.4972756636640684, + "grad_max_sv": 0.17776267938315868, + "grad_min_sv": 8.856038616333883e-09, + "grad_condition": 23328516.218488432, + "lr": 0.0007499999999999998, + "time_sec": 66.77817225456238 + }, + { + "epoch": 51, + "train_loss": 3.3393478485870363, + "train_acc": 0.1922, + "test_loss": 7.253289399719239, + "test_acc": 0.0224, + "lyapunov": null, + "grad_norm": 0.49524275923022765, + "grad_max_sv": 0.17880769595503807, + "grad_min_sv": 8.821089803544812e-09, + "grad_condition": 428497019.7398695, + "lr": 0.0007408768370508575, + "time_sec": 66.96121120452881 + }, + { + "epoch": 52, + "train_loss": 3.3365701832580568, + "train_acc": 0.19238, + "test_loss": 7.805395611572266, + "test_acc": 0.0253, + "lyapunov": null, + "grad_norm": 0.4956823979190034, + "grad_max_sv": 0.1680080708116293, + "grad_min_sv": 8.769059598769114e-09, + "grad_condition": 192519788.1316063, + "lr": 0.0007316480175599307, + "time_sec": 66.85345005989075 + }, + { + "epoch": 53, + "train_loss": 3.333746835784912, + "train_acc": 0.19458, + "test_loss": 7.013431349182129, + "test_acc": 0.0268, + "lyapunov": null, + "grad_norm": 0.497942870580151, + "grad_max_sv": 0.1765025958418846, + "grad_min_sv": 8.990621409854516e-09, + "grad_condition": 29640482.665341068, + "lr": 0.0007223175895924635, + "time_sec": 66.77972507476807 + }, + { + "epoch": 54, + "train_loss": 3.3229647937011717, + "train_acc": 0.19666, + "test_loss": 7.03700419921875, + "test_acc": 0.0243, + "lyapunov": null, + "grad_norm": 0.4958771639794239, + "grad_max_sv": 0.17399827837944032, + "grad_min_sv": 8.823984976036315e-09, + "grad_condition": 29997915.373120725, + "lr": 0.0007128896457825361, + "time_sec": 66.93337392807007 + }, + { + "epoch": 55, + "train_loss": 3.3078488957214356, + "train_acc": 0.19844, + "test_loss": 6.824067575836182, + "test_acc": 0.0225, + "lyapunov": null, + "grad_norm": 0.4963143606211398, + "grad_max_sv": 0.17193161956965924, + "grad_min_sv": 8.793880154622791e-09, + "grad_condition": 23806580.86720205, + "lr": 0.0007033683215378998, + "time_sec": 66.84783434867859 + }, + { + "epoch": 56, + "train_loss": 3.300284340209961, + "train_acc": 0.19964, + "test_loss": 7.3765008331298825, + "test_acc": 0.0259, + "lyapunov": null, + "grad_norm": 0.4962049364593942, + "grad_max_sv": 0.17086058780550956, + "grad_min_sv": 8.957953683691456e-09, + "grad_condition": 34088411.744767606, + "lr": 0.0006937577932260512, + "time_sec": 66.7465398311615 + }, + { + "epoch": 57, + "train_loss": 3.279534700241089, + "train_acc": 0.20396, + "test_loss": 6.880362132263183, + "test_acc": 0.031, + "lyapunov": null, + "grad_norm": 0.4942484951978682, + "grad_max_sv": 0.17122924104332923, + "grad_min_sv": 8.887839456767078e-09, + "grad_condition": 34686400.377949044, + "lr": 0.0006840622763423388, + "time_sec": 66.75685214996338 + }, + { + "epoch": 58, + "train_loss": 3.2868811530303956, + "train_acc": 0.20222, + "test_loss": 7.637865020751953, + "test_acc": 0.0253, + "lyapunov": null, + "grad_norm": 0.49584322382013707, + "grad_max_sv": 0.17295786403119565, + "grad_min_sv": 8.86787135945255e-09, + "grad_condition": 24086270.85456165, + "lr": 0.0006742860236609073, + "time_sec": 66.78707718849182 + }, + { + "epoch": 59, + "train_loss": 3.282674100265503, + "train_acc": 0.20432, + "test_loss": 7.462895319366455, + "test_acc": 0.0269, + "lyapunov": null, + "grad_norm": 0.4926536100208224, + "grad_max_sv": 0.17441818714141846, + "grad_min_sv": 8.859609179623363e-09, + "grad_condition": 42859734.61314274, + "lr": 0.0006644333233692913, + "time_sec": 66.91234374046326 + }, + { + "epoch": 60, + "train_loss": 3.2728336755371092, + "train_acc": 0.20326, + "test_loss": 6.622286376953125, + "test_acc": 0.0306, + "lyapunov": null, + "grad_norm": 0.49419543709001157, + "grad_max_sv": 0.17417771629989148, + "grad_min_sv": 9.040606460675172e-09, + "grad_condition": 21337169.661871206, + "lr": 0.0006545084971874734, + "time_sec": 66.78437662124634 + }, + { + "epoch": 61, + "train_loss": 3.264115914764404, + "train_acc": 0.2048, + "test_loss": 6.766970691680908, + "test_acc": 0.0293, + "lyapunov": null, + "grad_norm": 0.4925004615834911, + "grad_max_sv": 0.16977979727089404, + "grad_min_sv": 8.89249160695993e-09, + "grad_condition": 22271635.1746474, + "lr": 0.0006445158984722354, + "time_sec": 66.78286385536194 + }, + { + "epoch": 62, + "train_loss": 3.2519623767852783, + "train_acc": 0.2083, + "test_loss": 6.320362659454346, + "test_acc": 0.0261, + "lyapunov": null, + "grad_norm": 0.4903714138516238, + "grad_max_sv": 0.16600825376808642, + "grad_min_sv": 8.826651234396243e-09, + "grad_condition": 113841496.65664235, + "lr": 0.0006344599103076324, + "time_sec": 66.76978707313538 + }, + { + "epoch": 63, + "train_loss": 3.2406803789520264, + "train_acc": 0.20842, + "test_loss": 6.0048693046569825, + "test_acc": 0.0332, + "lyapunov": null, + "grad_norm": 0.48923288902664697, + "grad_max_sv": 0.1636019229888916, + "grad_min_sv": 8.835183994138074e-09, + "grad_condition": 28712921.926048793, + "lr": 0.0006243449435824269, + "time_sec": 66.75778698921204 + }, + { + "epoch": 64, + "train_loss": 3.2432028374481203, + "train_acc": 0.21058, + "test_loss": 5.735058168792724, + "test_acc": 0.0351, + "lyapunov": null, + "grad_norm": 0.49165310678113583, + "grad_max_sv": 0.1661746773868799, + "grad_min_sv": 8.821747320142404e-09, + "grad_condition": 24572068.94149008, + "lr": 0.0006141754350553275, + "time_sec": 66.7586920261383 + }, + { + "epoch": 65, + "train_loss": 3.2308475701141357, + "train_acc": 0.21202, + "test_loss": 6.2612747291564945, + "test_acc": 0.0295, + "lyapunov": null, + "grad_norm": 0.4897367968481375, + "grad_max_sv": 0.16482470370829105, + "grad_min_sv": 8.864288811305521e-09, + "grad_condition": 21514378.277254187, + "lr": 0.0006039558454088793, + "time_sec": 66.74698638916016 + }, + { + "epoch": 66, + "train_loss": 3.2232217138671877, + "train_acc": 0.2127, + "test_loss": 6.067545962524414, + "test_acc": 0.0269, + "lyapunov": null, + "grad_norm": 0.48745580535363076, + "grad_max_sv": 0.1623400203883648, + "grad_min_sv": 8.756487956951275e-09, + "grad_condition": 24813070.869568076, + "lr": 0.000593690657292862, + "time_sec": 66.77337288856506 + }, + { + "epoch": 67, + "train_loss": 3.215757719116211, + "train_acc": 0.21252, + "test_loss": 6.517296158599853, + "test_acc": 0.0259, + "lyapunov": null, + "grad_norm": 0.48601974882564686, + "grad_max_sv": 0.16268517263233662, + "grad_min_sv": 8.78295952078112e-09, + "grad_condition": 21989330.302483782, + "lr": 0.0005833843733580507, + "time_sec": 66.75407552719116 + }, + { + "epoch": 68, + "train_loss": 3.2091114740753173, + "train_acc": 0.21522, + "test_loss": 6.124687364196777, + "test_acc": 0.0261, + "lyapunov": null, + "grad_norm": 0.49192871254287607, + "grad_max_sv": 0.16933195553719999, + "grad_min_sv": 9.03891372028287e-09, + "grad_condition": 23334475.39073747, + "lr": 0.0005730415142812054, + "time_sec": 66.7687680721283 + }, + { + "epoch": 69, + "train_loss": 3.2083391997528077, + "train_acc": 0.2149, + "test_loss": 6.357658093261719, + "test_acc": 0.0265, + "lyapunov": null, + "grad_norm": 0.4883277257153208, + "grad_max_sv": 0.16220727227628232, + "grad_min_sv": 8.759147329673311e-09, + "grad_condition": 21650621.599965747, + "lr": 0.0005626666167821517, + "time_sec": 66.75298261642456 + }, + { + "epoch": 70, + "train_loss": 3.192287651748657, + "train_acc": 0.21884, + "test_loss": 6.329555874633789, + "test_acc": 0.026, + "lyapunov": null, + "grad_norm": 0.4902759494986014, + "grad_max_sv": 0.1623948898166418, + "grad_min_sv": 8.965784165093638e-09, + "grad_condition": 20161244.332468193, + "lr": 0.0005522642316338265, + "time_sec": 66.76123976707458 + }, + { + "epoch": 71, + "train_loss": 3.19764753616333, + "train_acc": 0.2192, + "test_loss": 6.423630954742432, + "test_acc": 0.0269, + "lyapunov": null, + "grad_norm": 0.4863979881245643, + "grad_max_sv": 0.16165782324969769, + "grad_min_sv": 8.848893565116534e-09, + "grad_condition": 22136265.711468942, + "lr": 0.0005418389216661573, + "time_sec": 66.76352262496948 + }, + { + "epoch": 72, + "train_loss": 3.1839187537384035, + "train_acc": 0.21994, + "test_loss": 6.446183979797364, + "test_acc": 0.0285, + "lyapunov": null, + "grad_norm": 0.4889041887536974, + "grad_max_sv": 0.16505594030022622, + "grad_min_sv": 8.987748037481147e-09, + "grad_condition": 43981081.25474357, + "lr": 0.0005313952597646563, + "time_sec": 66.79931592941284 + }, + { + "epoch": 73, + "train_loss": 3.187308960342407, + "train_acc": 0.21954, + "test_loss": 6.563741957092285, + "test_acc": 0.0278, + "lyapunov": null, + "grad_norm": 0.4858937570988194, + "grad_max_sv": 0.15989821515977382, + "grad_min_sv": 8.734785567066083e-09, + "grad_condition": 21403260.9126192, + "lr": 0.0005209378268645994, + "time_sec": 66.80401682853699 + }, + { + "epoch": 74, + "train_loss": 3.171525285644531, + "train_acc": 0.22096, + "test_loss": 6.3379450691223145, + "test_acc": 0.0312, + "lyapunov": null, + "grad_norm": 0.4892042607088359, + "grad_max_sv": 0.16411556918174028, + "grad_min_sv": 8.98726121578708e-09, + "grad_condition": 21168833.2418665, + "lr": 0.0005104712099416781, + "time_sec": 66.80049800872803 + }, + { + "epoch": 75, + "train_loss": 3.1646966344451903, + "train_acc": 0.22346, + "test_loss": 6.526763028717041, + "test_acc": 0.0279, + "lyapunov": null, + "grad_norm": 0.4872344212322221, + "grad_max_sv": 0.16347934678196907, + "grad_min_sv": 8.94242010440749e-09, + "grad_condition": 62502067.37877717, + "lr": 0.0004999999999999996, + "time_sec": 66.74789333343506 + }, + { + "epoch": 76, + "train_loss": 3.1487132719421385, + "train_acc": 0.22644, + "test_loss": 6.988856857299805, + "test_acc": 0.0274, + "lyapunov": null, + "grad_norm": 0.4903951810445429, + "grad_max_sv": 0.16496667228639125, + "grad_min_sv": 8.828812622652115e-09, + "grad_condition": 55142543.089542985, + "lr": 0.0004895287900583212, + "time_sec": 66.76014757156372 + }, + { + "epoch": 77, + "train_loss": 3.1434121074676513, + "train_acc": 0.22544, + "test_loss": 6.655374778747559, + "test_acc": 0.0305, + "lyapunov": null, + "grad_norm": 0.49339407231232474, + "grad_max_sv": 0.16745336949825287, + "grad_min_sv": 9.039998791204873e-09, + "grad_condition": 20500343.229206834, + "lr": 0.0004790621731353997, + "time_sec": 66.77004861831665 + }, + { + "epoch": 78, + "train_loss": 3.1347723538970946, + "train_acc": 0.22916, + "test_loss": 7.025522061920166, + "test_acc": 0.0274, + "lyapunov": null, + "grad_norm": 0.48900666073886295, + "grad_max_sv": 0.16547333262860775, + "grad_min_sv": 9.023560618159898e-09, + "grad_condition": 20661502.35707375, + "lr": 0.000468604740235343, + "time_sec": 66.81849670410156 + }, + { + "epoch": 79, + "train_loss": 3.1304521063995363, + "train_acc": 0.22772, + "test_loss": 6.83003788986206, + "test_acc": 0.0281, + "lyapunov": null, + "grad_norm": 0.49174437465380544, + "grad_max_sv": 0.16336545161902905, + "grad_min_sv": 8.888891785130416e-09, + "grad_condition": 64322103.36932512, + "lr": 0.00045816107833384175, + "time_sec": 66.78076171875 + }, + { + "epoch": 80, + "train_loss": 3.127742724685669, + "train_acc": 0.22918, + "test_loss": 6.43679395904541, + "test_acc": 0.032, + "lyapunov": null, + "grad_norm": 0.4909292517764462, + "grad_max_sv": 0.16271441541612147, + "grad_min_sv": 8.940982496041805e-09, + "grad_condition": 21211899.117706068, + "lr": 0.0004477357683661729, + "time_sec": 66.78754663467407 + }, + { + "epoch": 81, + "train_loss": 3.1236261379241945, + "train_acc": 0.23066, + "test_loss": 7.037800202178955, + "test_acc": 0.0259, + "lyapunov": null, + "grad_norm": 0.4913270876663801, + "grad_max_sv": 0.16124934926629067, + "grad_min_sv": 9.025329496259448e-09, + "grad_condition": 85362661.37288797, + "lr": 0.00043733338321784746, + "time_sec": 66.79688453674316 + }, + { + "epoch": 82, + "train_loss": 3.11507862121582, + "train_acc": 0.23056, + "test_loss": 7.101603583526611, + "test_acc": 0.0291, + "lyapunov": null, + "grad_norm": 0.4894916013523125, + "grad_max_sv": 0.16085669696331023, + "grad_min_sv": 8.950784479572205e-09, + "grad_condition": 87868876.59340149, + "lr": 0.0004269584857187939, + "time_sec": 66.7501974105835 + }, + { + "epoch": 83, + "train_loss": 3.116716618041992, + "train_acc": 0.22918, + "test_loss": 6.28887403717041, + "test_acc": 0.0294, + "lyapunov": null, + "grad_norm": 0.4925235661397028, + "grad_max_sv": 0.16220005229115486, + "grad_min_sv": 8.838474697958621e-09, + "grad_condition": 26899756.554924734, + "lr": 0.0004166156266419484, + "time_sec": 66.7679078578949 + }, + { + "epoch": 84, + "train_loss": 3.1041577443695068, + "train_acc": 0.2323, + "test_loss": 6.514328240966797, + "test_acc": 0.0292, + "lyapunov": null, + "grad_norm": 0.4889104927800163, + "grad_max_sv": 0.16120262071490288, + "grad_min_sv": 8.874711328842045e-09, + "grad_condition": 70851883.05420288, + "lr": 0.0004063093427071373, + "time_sec": 66.79031205177307 + }, + { + "epoch": 85, + "train_loss": 3.1004569428253173, + "train_acc": 0.23348, + "test_loss": 7.033082975769043, + "test_acc": 0.028, + "lyapunov": null, + "grad_norm": 0.48981351073040363, + "grad_max_sv": 0.1627339120954275, + "grad_min_sv": 8.982540034008225e-09, + "grad_condition": 21584989.23095519, + "lr": 0.0003960441545911199, + "time_sec": 66.76853013038635 + }, + { + "epoch": 86, + "train_loss": 3.0884765031433106, + "train_acc": 0.23582, + "test_loss": 6.4175174667358394, + "test_acc": 0.0319, + "lyapunov": null, + "grad_norm": 0.4909005209545173, + "grad_max_sv": 0.1606820985674858, + "grad_min_sv": 9.03317559641792e-09, + "grad_condition": 21923171.60734531, + "lr": 0.0003858245649446718, + "time_sec": 66.74095106124878 + }, + { + "epoch": 87, + "train_loss": 3.084468610839844, + "train_acc": 0.23528, + "test_loss": 6.820941673278808, + "test_acc": 0.0346, + "lyapunov": null, + "grad_norm": 0.4910444068308361, + "grad_max_sv": 0.16328486651182175, + "grad_min_sv": 9.03909012639481e-09, + "grad_condition": 20668433.24898103, + "lr": 0.00037565505641757235, + "time_sec": 66.77276849746704 + }, + { + "epoch": 88, + "train_loss": 3.077918306808472, + "train_acc": 0.23762, + "test_loss": 7.089393431091309, + "test_acc": 0.0281, + "lyapunov": null, + "grad_norm": 0.49316824021455075, + "grad_max_sv": 0.16232325807213782, + "grad_min_sv": 8.968252801500043e-09, + "grad_condition": 22046163.188841425, + "lr": 0.00036554008969236695, + "time_sec": 66.99798655509949 + }, + { + "epoch": 89, + "train_loss": 3.067122574386597, + "train_acc": 0.2422, + "test_loss": 7.214799313354492, + "test_acc": 0.0262, + "lyapunov": null, + "grad_norm": 0.4900930253460835, + "grad_max_sv": 0.16194776631891727, + "grad_min_sv": 8.92576947075785e-09, + "grad_condition": 23633440.101474784, + "lr": 0.0003554841015277638, + "time_sec": 66.8372859954834 + }, + { + "epoch": 90, + "train_loss": 3.064559158935547, + "train_acc": 0.24176, + "test_loss": 6.606956069946289, + "test_acc": 0.0311, + "lyapunov": null, + "grad_norm": 0.49500701859693813, + "grad_max_sv": 0.1596249148249626, + "grad_min_sv": 9.159110832962502e-09, + "grad_condition": 101449769.49017647, + "lr": 0.000345491502812526, + "time_sec": 66.80407047271729 + }, + { + "epoch": 91, + "train_loss": 3.0553189851379394, + "train_acc": 0.24228, + "test_loss": 6.418565266418457, + "test_acc": 0.0298, + "lyapunov": null, + "grad_norm": 0.4925589055469173, + "grad_max_sv": 0.16153519973158836, + "grad_min_sv": 9.049669121019566e-09, + "grad_condition": 25195558.577611163, + "lr": 0.0003355666766307081, + "time_sec": 66.84762644767761 + }, + { + "epoch": 92, + "train_loss": 3.056331217575073, + "train_acc": 0.24102, + "test_loss": 6.7072321174621585, + "test_acc": 0.0297, + "lyapunov": null, + "grad_norm": 0.4902092468213939, + "grad_max_sv": 0.15823189355432987, + "grad_min_sv": 9.083058827297208e-09, + "grad_condition": 19504609.540315717, + "lr": 0.00032571397633909225, + "time_sec": 66.86433339118958 + }, + { + "epoch": 93, + "train_loss": 3.0426194298553466, + "train_acc": 0.24348, + "test_loss": 6.913128755950928, + "test_acc": 0.0287, + "lyapunov": null, + "grad_norm": 0.4911735992497643, + "grad_max_sv": 0.159795406088233, + "grad_min_sv": 9.066670242363628e-09, + "grad_condition": 23214972.26169469, + "lr": 0.00031593772365766094, + "time_sec": 66.7759199142456 + }, + { + "epoch": 94, + "train_loss": 3.037528529663086, + "train_acc": 0.24504, + "test_loss": 7.106588607025146, + "test_acc": 0.0302, + "lyapunov": null, + "grad_norm": 0.4929529595332672, + "grad_max_sv": 0.1604856878519058, + "grad_min_sv": 9.051675931015524e-09, + "grad_condition": 21107425.42350878, + "lr": 0.0003062422067739483, + "time_sec": 66.78619933128357 + }, + { + "epoch": 95, + "train_loss": 3.031129434738159, + "train_acc": 0.24594, + "test_loss": 6.687380312347412, + "test_acc": 0.0343, + "lyapunov": null, + "grad_norm": 0.4953276706434929, + "grad_max_sv": 0.161559634283185, + "grad_min_sv": 9.12235032790587e-09, + "grad_condition": 20865530.968957625, + "lr": 0.00029663167846209965, + "time_sec": 66.75159859657288 + }, + { + "epoch": 96, + "train_loss": 3.0335071311950683, + "train_acc": 0.24622, + "test_loss": 6.9309969345092775, + "test_acc": 0.029, + "lyapunov": null, + "grad_norm": 0.49472621160413666, + "grad_max_sv": 0.16361592449247836, + "grad_min_sv": 9.16821370489096e-09, + "grad_condition": 19741213.590965096, + "lr": 0.00028711035421746345, + "time_sec": 66.79747915267944 + }, + { + "epoch": 97, + "train_loss": 3.02239688041687, + "train_acc": 0.24772, + "test_loss": 7.384179110717773, + "test_acc": 0.0263, + "lyapunov": null, + "grad_norm": 0.49668252150204156, + "grad_max_sv": 0.1612157329916954, + "grad_min_sv": 9.138712192546806e-09, + "grad_condition": 19515456.886604063, + "lr": 0.00027768241040753615, + "time_sec": 66.77070426940918 + }, + { + "epoch": 98, + "train_loss": 3.0209144953155516, + "train_acc": 0.2495, + "test_loss": 7.305615675354004, + "test_acc": 0.0317, + "lyapunov": null, + "grad_norm": 0.494528793101407, + "grad_max_sv": 0.16126883141696452, + "grad_min_sv": 9.159177710715839e-09, + "grad_condition": 20215757.378428128, + "lr": 0.00026835198244006903, + "time_sec": 66.74260830879211 + }, + { + "epoch": 99, + "train_loss": 3.0122002574157714, + "train_acc": 0.25114, + "test_loss": 7.417421994018555, + "test_acc": 0.0303, + "lyapunov": null, + "grad_norm": 0.49228142442927636, + "grad_max_sv": 0.16154562458395957, + "grad_min_sv": 9.115954194283127e-09, + "grad_condition": 21850408.12006226, + "lr": 0.0002591231629491421, + "time_sec": 66.74969696998596 + }, + { + "epoch": 100, + "train_loss": 3.00868815536499, + "train_acc": 0.25064, + "test_loss": 7.224837091064453, + "test_acc": 0.0274, + "lyapunov": null, + "grad_norm": 0.4973003819613091, + "grad_max_sv": 0.16211517453193663, + "grad_min_sv": 9.138123377439023e-09, + "grad_condition": 21471169.650275595, + "lr": 0.0002499999999999997, + "time_sec": 66.72979998588562 + }, + { + "epoch": 101, + "train_loss": 3.011574204711914, + "train_acc": 0.2497, + "test_loss": 6.693938585662842, + "test_acc": 0.0339, + "lyapunov": null, + "grad_norm": 0.49870597782363885, + "grad_max_sv": 0.16383521035313606, + "grad_min_sv": 9.208752457801062e-09, + "grad_condition": 21899884.68313645, + "lr": 0.00024098649531343477, + "time_sec": 66.81981372833252 + }, + { + "epoch": 102, + "train_loss": 2.9973224279022217, + "train_acc": 0.25212, + "test_loss": 7.171955642700195, + "test_acc": 0.0293, + "lyapunov": null, + "grad_norm": 0.49384909489104784, + "grad_max_sv": 0.16012208051979543, + "grad_min_sv": 9.107674342478944e-09, + "grad_condition": 20520016.087493956, + "lr": 0.0002320866025105016, + "time_sec": 66.76935577392578 + }, + { + "epoch": 103, + "train_loss": 2.995499693145752, + "train_acc": 0.25094, + "test_loss": 6.78625715637207, + "test_acc": 0.0325, + "lyapunov": null, + "grad_norm": 0.49679770851901156, + "grad_max_sv": 0.156817539408803, + "grad_min_sv": 9.188224817102685e-09, + "grad_condition": 20448268.20669184, + "lr": 0.0002233042253783278, + "time_sec": 66.76536107063293 + }, + { + "epoch": 104, + "train_loss": 2.9911633958435058, + "train_acc": 0.25294, + "test_loss": 6.982937800598145, + "test_acc": 0.0317, + "lyapunov": null, + "grad_norm": 0.5002169985890668, + "grad_max_sv": 0.16450526081025602, + "grad_min_sv": 9.203415965441941e-09, + "grad_condition": 21080045.597844083, + "lr": 0.000214643216157784, + "time_sec": 66.80186581611633 + }, + { + "epoch": 105, + "train_loss": 2.97890757850647, + "train_acc": 0.2546, + "test_loss": 6.943555125427246, + "test_acc": 0.0299, + "lyapunov": null, + "grad_norm": 0.4957530407349862, + "grad_max_sv": 0.16243297494947911, + "grad_min_sv": 9.268795320843682e-09, + "grad_condition": 36816221.64395736, + "lr": 0.00020610737385376332, + "time_sec": 66.76260590553284 + }, + { + "epoch": 106, + "train_loss": 2.9860270111846923, + "train_acc": 0.25422, + "test_loss": 6.844045399475098, + "test_acc": 0.0286, + "lyapunov": null, + "grad_norm": 0.4970903409324634, + "grad_max_sv": 0.15834328122437, + "grad_min_sv": 9.162484361502354e-09, + "grad_condition": 27996399.196730472, + "lr": 0.00019770044256881242, + "time_sec": 66.81156158447266 + }, + { + "epoch": 107, + "train_loss": 2.9742181201171873, + "train_acc": 0.25492, + "test_loss": 6.836753462219238, + "test_acc": 0.0325, + "lyapunov": null, + "grad_norm": 0.49623915815641473, + "grad_max_sv": 0.16143721528351307, + "grad_min_sv": 9.188978035423733e-09, + "grad_condition": 25866527.38494375, + "lr": 0.0001894261098608447, + "time_sec": 66.78573369979858 + }, + { + "epoch": 108, + "train_loss": 2.9732699408721923, + "train_acc": 0.25772, + "test_loss": 7.0074780044555665, + "test_acc": 0.0297, + "lyapunov": null, + "grad_norm": 0.4966129788540459, + "grad_max_sv": 0.15941952541470528, + "grad_min_sv": 9.252560334571669e-09, + "grad_condition": 21610869.60023473, + "lr": 0.000181288005125655, + "time_sec": 66.78538966178894 + }, + { + "epoch": 109, + "train_loss": 2.9633288761901855, + "train_acc": 0.25906, + "test_loss": 6.713782179260254, + "test_acc": 0.0305, + "lyapunov": null, + "grad_norm": 0.497676490763689, + "grad_max_sv": 0.16128081902861596, + "grad_min_sv": 9.127150218946057e-09, + "grad_condition": 20170938.10071696, + "lr": 0.0001732896980049473, + "time_sec": 66.74944472312927 + }, + { + "epoch": 110, + "train_loss": 2.9596293452453613, + "train_acc": 0.25876, + "test_loss": 6.65006120300293, + "test_acc": 0.0324, + "lyapunov": null, + "grad_norm": 0.49966634206789384, + "grad_max_sv": 0.15842259526252747, + "grad_min_sv": 9.107274745456806e-09, + "grad_condition": 20091051.99353394, + "lr": 0.00016543469682057076, + "time_sec": 66.75245332717896 + }, + { + "epoch": 111, + "train_loss": 2.956690885467529, + "train_acc": 0.2604, + "test_loss": 7.234065510559082, + "test_acc": 0.029, + "lyapunov": null, + "grad_norm": 0.498577335908786, + "grad_max_sv": 0.1657148886471987, + "grad_min_sv": 9.283077205546331e-09, + "grad_condition": 24350919.05095337, + "lr": 0.00015772644703565552, + "time_sec": 66.78981685638428 + }, + { + "epoch": 112, + "train_loss": 2.94970266708374, + "train_acc": 0.2611, + "test_loss": 7.461113217163086, + "test_acc": 0.0294, + "lyapunov": null, + "grad_norm": 0.49706195111887286, + "grad_max_sv": 0.15587482824921609, + "grad_min_sv": 9.14300024579262e-09, + "grad_condition": 19620425.881544393, + "lr": 0.00015016832974331713, + "time_sec": 66.73882722854614 + }, + { + "epoch": 113, + "train_loss": 2.945457241821289, + "train_acc": 0.26064, + "test_loss": 6.851638394165039, + "test_acc": 0.0317, + "lyapunov": null, + "grad_norm": 0.49829859566301316, + "grad_max_sv": 0.16474134363234044, + "grad_min_sv": 9.221820057581098e-09, + "grad_condition": 26712873.31231401, + "lr": 0.00014276366018359834, + "time_sec": 66.77810740470886 + }, + { + "epoch": 114, + "train_loss": 2.946153409576416, + "train_acc": 0.2599, + "test_loss": 7.203242881011963, + "test_acc": 0.0296, + "lyapunov": null, + "grad_norm": 0.5000583559017892, + "grad_max_sv": 0.16016064565628768, + "grad_min_sv": 9.404633910525817e-09, + "grad_condition": 23574899.530670665, + "lr": 0.00013551568628929425, + "time_sec": 66.73546171188354 + }, + { + "epoch": 115, + "train_loss": 2.948209620437622, + "train_acc": 0.25884, + "test_loss": 6.701388775634766, + "test_acc": 0.0321, + "lyapunov": null, + "grad_norm": 0.5013184028480744, + "grad_max_sv": 0.16491747684776784, + "grad_min_sv": 9.35589676079318e-09, + "grad_condition": 33018704.287756693, + "lr": 0.00012842758726130276, + "time_sec": 66.75530242919922 + }, + { + "epoch": 116, + "train_loss": 2.9463114239501955, + "train_acc": 0.26204, + "test_loss": 7.220928353881836, + "test_acc": 0.0279, + "lyapunov": null, + "grad_norm": 0.4977560347764178, + "grad_max_sv": 0.16203629337251185, + "grad_min_sv": 9.154163846392117e-09, + "grad_condition": 21822336.390723675, + "lr": 0.0001215024721741218, + "time_sec": 66.75460624694824 + }, + { + "epoch": 117, + "train_loss": 2.9339290143585206, + "train_acc": 0.26458, + "test_loss": 7.120738798522949, + "test_acc": 0.0305, + "lyapunov": null, + "grad_norm": 0.5013641420003778, + "grad_max_sv": 0.16478117741644382, + "grad_min_sv": 9.288832453213658e-09, + "grad_condition": 27324943.297664374, + "lr": 0.00011474337861210538, + "time_sec": 66.75992965698242 + }, + { + "epoch": 118, + "train_loss": 2.9379910820770263, + "train_acc": 0.26084, + "test_loss": 7.117022830200195, + "test_acc": 0.0301, + "lyapunov": null, + "grad_norm": 0.5015663149610728, + "grad_max_sv": 0.16396238505840302, + "grad_min_sv": 9.336925840819354e-09, + "grad_condition": 20705205.815624513, + "lr": 0.00010815327133708009, + "time_sec": 66.76019549369812 + }, + { + "epoch": 119, + "train_loss": 2.9290156356811523, + "train_acc": 0.26498, + "test_loss": 7.457037506103515, + "test_acc": 0.0274, + "lyapunov": null, + "grad_norm": 0.5005105565315475, + "grad_max_sv": 0.1598517183214426, + "grad_min_sv": 9.317651539220151e-09, + "grad_condition": 19474341.874121707, + "lr": 0.00010173504098790182, + "time_sec": 66.77068591117859 + }, + { + "epoch": 120, + "train_loss": 2.9241028984069826, + "train_acc": 0.26356, + "test_loss": 6.841690950012207, + "test_acc": 0.0275, + "lyapunov": null, + "grad_norm": 0.5028678839154062, + "grad_max_sv": 0.16410683281719685, + "grad_min_sv": 9.103373727059605e-09, + "grad_condition": 52015235.36119781, + "lr": 9.549150281252629e-05, + "time_sec": 66.7771668434143 + }, + { + "epoch": 121, + "train_loss": 2.916977886505127, + "train_acc": 0.26436, + "test_loss": 7.093948570251465, + "test_acc": 0.0279, + "lyapunov": null, + "grad_norm": 0.5039276644054499, + "grad_max_sv": 0.16179459281265735, + "grad_min_sv": 9.367120145167829e-09, + "grad_condition": 51831353.12293583, + "lr": 8.942539543314794e-05, + "time_sec": 67.04774737358093 + }, + { + "epoch": 122, + "train_loss": 2.9199959434509277, + "train_acc": 0.266, + "test_loss": 7.458375955200196, + "test_acc": 0.0278, + "lyapunov": null, + "grad_norm": 0.5029526689604006, + "grad_max_sv": 0.16233476884663106, + "grad_min_sv": 9.329605515917549e-09, + "grad_condition": 22157132.823347427, + "lr": 8.353937964495024e-05, + "time_sec": 66.80378198623657 + }, + { + "epoch": 123, + "train_loss": 2.9115442817687986, + "train_acc": 0.26938, + "test_loss": 6.9655703231811525, + "test_acc": 0.0314, + "lyapunov": null, + "grad_norm": 0.5030753967470114, + "grad_max_sv": 0.15974463373422623, + "grad_min_sv": 9.297508608147043e-09, + "grad_condition": 36046633.878638715, + "lr": 7.783603724899243e-05, + "time_sec": 66.80266833305359 + }, + { + "epoch": 124, + "train_loss": 2.9138562171173095, + "train_acc": 0.26954, + "test_loss": 6.97724497833252, + "test_acc": 0.0283, + "lyapunov": null, + "grad_norm": 0.5031663333888824, + "grad_max_sv": 0.16383831724524497, + "grad_min_sv": 9.310707842213883e-09, + "grad_condition": 28458147.706868507, + "lr": 7.231786991974666e-05, + "time_sec": 66.78245973587036 + }, + { + "epoch": 125, + "train_loss": 2.9108992396545412, + "train_acc": 0.26916, + "test_loss": 7.1801939224243165, + "test_acc": 0.0297, + "lyapunov": null, + "grad_norm": 0.5036349180632973, + "grad_max_sv": 0.16358038783073425, + "grad_min_sv": 9.299380029914595e-09, + "grad_condition": 19984336.2098884, + "lr": 6.698729810778072e-05, + "time_sec": 66.75985527038574 + }, + { + "epoch": 126, + "train_loss": 2.914398226470947, + "train_acc": 0.26724, + "test_loss": 7.200770987701416, + "test_acc": 0.0295, + "lyapunov": null, + "grad_norm": 0.5052014696250272, + "grad_max_sv": 0.16353870332241058, + "grad_min_sv": 9.381645610373467e-09, + "grad_condition": 21434605.046592515, + "lr": 6.184665997806817e-05, + "time_sec": 66.774897813797 + }, + { + "epoch": 127, + "train_loss": 2.900709945602417, + "train_acc": 0.27038, + "test_loss": 6.86236782836914, + "test_acc": 0.0299, + "lyapunov": null, + "grad_norm": 0.5062625750885013, + "grad_max_sv": 0.16417891010642052, + "grad_min_sv": 9.328811839681705e-09, + "grad_condition": 31439200.03537352, + "lr": 5.6898210384392595e-05, + "time_sec": 66.78050327301025 + }, + { + "epoch": 128, + "train_loss": 2.9011995401763917, + "train_acc": 0.2716, + "test_loss": 7.173482424926758, + "test_acc": 0.0289, + "lyapunov": null, + "grad_norm": 0.5054003063568236, + "grad_max_sv": 0.16145575419068336, + "grad_min_sv": 9.318279831083132e-09, + "grad_condition": 19322689.781916358, + "lr": 5.214411988029363e-05, + "time_sec": 66.76925420761108 + }, + { + "epoch": 129, + "train_loss": 2.901223872680664, + "train_acc": 0.27258, + "test_loss": 7.040973609161377, + "test_acc": 0.0316, + "lyapunov": null, + "grad_norm": 0.5048182342459864, + "grad_max_sv": 0.1658121332526207, + "grad_min_sv": 9.358181082830263e-09, + "grad_condition": 23747993.692621626, + "lr": 4.7586473766990294e-05, + "time_sec": 66.80085635185242 + }, + { + "epoch": 130, + "train_loss": 2.902728254547119, + "train_acc": 0.2709, + "test_loss": 6.8991255172729495, + "test_acc": 0.0295, + "lyapunov": null, + "grad_norm": 0.504200690210551, + "grad_max_sv": 0.16130973920226097, + "grad_min_sv": 9.333992067109276e-09, + "grad_condition": 48792402.15405806, + "lr": 4.32272711786996e-05, + "time_sec": 66.7733838558197 + }, + { + "epoch": 131, + "train_loss": 2.893923129730225, + "train_acc": 0.26964, + "test_loss": 7.059582917022705, + "test_acc": 0.0322, + "lyapunov": null, + "grad_norm": 0.5050579857883386, + "grad_max_sv": 0.16214525364339352, + "grad_min_sv": 9.388355001879386e-09, + "grad_condition": 310922612.4164163, + "lr": 3.906842420574966e-05, + "time_sec": 66.77927422523499 + }, + { + "epoch": 132, + "train_loss": 2.8922697412872314, + "train_acc": 0.27422, + "test_loss": 7.0280276306152345, + "test_acc": 0.0278, + "lyapunov": null, + "grad_norm": 0.5058650281247494, + "grad_max_sv": 0.16365451961755753, + "grad_min_sv": 9.290366345671153e-09, + "grad_condition": 19882692.340553276, + "lr": 3.5111757055874305e-05, + "time_sec": 66.77954649925232 + }, + { + "epoch": 133, + "train_loss": 2.900697283477783, + "train_acc": 0.27018, + "test_loss": 7.238303312683105, + "test_acc": 0.0317, + "lyapunov": null, + "grad_norm": 0.5051111613751295, + "grad_max_sv": 0.16027298532426357, + "grad_min_sv": 9.3600961287299e-09, + "grad_condition": 20324064.738057118, + "lr": 3.1359005254054254e-05, + "time_sec": 66.75997471809387 + }, + { + "epoch": 134, + "train_loss": 2.897649665527344, + "train_acc": 0.26928, + "test_loss": 7.020867985534668, + "test_acc": 0.0307, + "lyapunov": null, + "grad_norm": 0.5048089733174289, + "grad_max_sv": 0.16418067179620266, + "grad_min_sv": 9.411045018281605e-09, + "grad_condition": 20814583.819657672, + "lr": 2.7811814881259484e-05, + "time_sec": 66.75737643241882 + }, + { + "epoch": 135, + "train_loss": 2.8868365075683595, + "train_acc": 0.27108, + "test_loss": 7.227980157470703, + "test_acc": 0.0299, + "lyapunov": null, + "grad_norm": 0.505296469518053, + "grad_max_sv": 0.1626897618174553, + "grad_min_sv": 9.335086056938557e-09, + "grad_condition": 19121452.928086806, + "lr": 2.4471741852423218e-05, + "time_sec": 66.78665018081665 + }, + { + "epoch": 136, + "train_loss": 2.8893248936462403, + "train_acc": 0.2719, + "test_loss": 7.04058285369873, + "test_acc": 0.0299, + "lyapunov": null, + "grad_norm": 0.5047583466249539, + "grad_max_sv": 0.1616091288626194, + "grad_min_sv": 9.193184843242497e-09, + "grad_condition": 52822668.902298525, + "lr": 2.1340251233966362e-05, + "time_sec": 66.82355737686157 + }, + { + "epoch": 137, + "train_loss": 2.8932983180236818, + "train_acc": 0.2706, + "test_loss": 7.298259108734131, + "test_acc": 0.0306, + "lyapunov": null, + "grad_norm": 0.5064166482647556, + "grad_max_sv": 0.16595029644668102, + "grad_min_sv": 9.504852901964788e-09, + "grad_condition": 26232817.791797824, + "lr": 1.8418716601170932e-05, + "time_sec": 66.80469083786011 + }, + { + "epoch": 138, + "train_loss": 2.889240245513916, + "train_acc": 0.27282, + "test_loss": 7.01880281829834, + "test_acc": 0.03, + "lyapunov": null, + "grad_norm": 0.504142027582102, + "grad_max_sv": 0.16221415363252162, + "grad_min_sv": 9.365972712671589e-09, + "grad_condition": 173714150.51916546, + "lr": 1.570841943568445e-05, + "time_sec": 66.81162881851196 + }, + { + "epoch": 139, + "train_loss": 2.8894276250457764, + "train_acc": 0.2742, + "test_loss": 7.018578756713867, + "test_acc": 0.0311, + "lyapunov": null, + "grad_norm": 0.505498638767792, + "grad_max_sv": 0.16305100470781325, + "grad_min_sv": 9.436683297281423e-09, + "grad_condition": 21739786.228019442, + "lr": 1.3210548563419845e-05, + "time_sec": 66.7770791053772 + }, + { + "epoch": 140, + "train_loss": 2.889230620346069, + "train_acc": 0.27218, + "test_loss": 7.308567997741699, + "test_acc": 0.0311, + "lyapunov": null, + "grad_norm": 0.5054575022404508, + "grad_max_sv": 0.16442596912384033, + "grad_min_sv": 9.343637030756469e-09, + "grad_condition": 19925860.99628629, + "lr": 1.0926199633097203e-05, + "time_sec": 66.79729318618774 + }, + { + "epoch": 141, + "train_loss": 2.888821849899292, + "train_acc": 0.27302, + "test_loss": 7.1829338531494145, + "test_acc": 0.0314, + "lyapunov": null, + "grad_norm": 0.5047487463390119, + "grad_max_sv": 0.16437522321939468, + "grad_min_sv": 9.408711654224077e-09, + "grad_condition": 21893279.61576708, + "lr": 8.856374635655688e-06, + "time_sec": 66.86598515510559 + }, + { + "epoch": 142, + "train_loss": 2.8799402445983886, + "train_acc": 0.2742, + "test_loss": 7.140073747253418, + "test_acc": 0.0282, + "lyapunov": null, + "grad_norm": 0.5045453289237622, + "grad_max_sv": 0.1649588480591774, + "grad_min_sv": 9.320059430814598e-09, + "grad_condition": 59261198.33071508, + "lr": 7.001981464747503e-06, + "time_sec": 66.8481650352478 + }, + { + "epoch": 143, + "train_loss": 2.8898901738739013, + "train_acc": 0.27182, + "test_loss": 7.103092768859863, + "test_acc": 0.0297, + "lyapunov": null, + "grad_norm": 0.5052816774210068, + "grad_max_sv": 0.16425308547914028, + "grad_min_sv": 9.34736955476856e-09, + "grad_condition": 23461625.085362356, + "lr": 5.3638335185058295e-06, + "time_sec": 66.8002393245697 + }, + { + "epoch": 144, + "train_loss": 2.8863021937561033, + "train_acc": 0.27274, + "test_loss": 7.1982520462036135, + "test_acc": 0.0299, + "lyapunov": null, + "grad_norm": 0.5044686932866996, + "grad_max_sv": 0.16509353555738926, + "grad_min_sv": 9.324032489155254e-09, + "grad_condition": 23942258.129928373, + "lr": 3.942649342761114e-06, + "time_sec": 66.81374979019165 + }, + { + "epoch": 145, + "train_loss": 2.8919877973175048, + "train_acc": 0.27214, + "test_loss": 7.1992824775695805, + "test_acc": 0.0289, + "lyapunov": null, + "grad_norm": 0.5042030290413125, + "grad_max_sv": 0.16350974403321744, + "grad_min_sv": 9.386586871662495e-09, + "grad_condition": 23933558.25798073, + "lr": 2.7390523158633524e-06, + "time_sec": 66.84291410446167 + }, + { + "epoch": 146, + "train_loss": 2.8929362953948976, + "train_acc": 0.27134, + "test_loss": 6.984002893066406, + "test_acc": 0.031, + "lyapunov": null, + "grad_norm": 0.5043351409430421, + "grad_max_sv": 0.16246499940752984, + "grad_min_sv": 9.333080052895127e-09, + "grad_condition": 53755875.38336539, + "lr": 1.7535703752478133e-06, + "time_sec": 66.95102620124817 + }, + { + "epoch": 147, + "train_loss": 2.8877293769836427, + "train_acc": 0.2731, + "test_loss": 7.257072169494629, + "test_acc": 0.0276, + "lyapunov": null, + "grad_norm": 0.5050095295755104, + "grad_max_sv": 0.16067363917827607, + "grad_min_sv": 9.417460497540553e-09, + "grad_condition": 19033069.438820988, + "lr": 9.866357858642196e-07, + "time_sec": 66.89330506324768 + }, + { + "epoch": 148, + "train_loss": 2.882035206298828, + "train_acc": 0.27536, + "test_loss": 7.237642462921142, + "test_acc": 0.0291, + "lyapunov": null, + "grad_norm": 0.504619461339764, + "grad_max_sv": 0.16399259269237518, + "grad_min_sv": 9.271372525265776e-09, + "grad_condition": 21886094.37639584, + "lr": 4.38584950570808e-07, + "time_sec": 66.8558566570282 + }, + { + "epoch": 149, + "train_loss": 2.8901185527038575, + "train_acc": 0.2736, + "test_loss": 7.19153920135498, + "test_acc": 0.0293, + "lyapunov": null, + "grad_norm": 0.5041490164370284, + "grad_max_sv": 0.16302622966468333, + "grad_min_sv": 9.21069388537532e-09, + "grad_condition": 20816419.226421457, + "lr": 1.096582625772501e-07, + "time_sec": 66.84155035018921 + }, + { + "epoch": 150, + "train_loss": 2.8903665699005128, + "train_acc": 0.27238, + "test_loss": 7.314303421020508, + "test_acc": 0.0277, + "lyapunov": null, + "grad_norm": 0.5045790947801017, + "grad_max_sv": 0.16631755232810974, + "grad_min_sv": 9.309531870393962e-09, + "grad_condition": 20772273.137153096, + "lr": 0.0, + "time_sec": 66.80794334411621 + } + ] + }, + "lyapunov": { + "4": [ + { + "epoch": 1, + "train_loss": 4.345122828216553, + "train_acc": 0.0989, + "test_loss": 3.642047788619995, + "test_acc": 0.1654, + "lyapunov": 2.273679957670324, + "grad_norm": 6.260445856958774, + "grad_max_sv": 4.898569625616074, + "grad_min_sv": 1.1334657320505315e-07, + "grad_condition": 85222715.313173, + "lr": 0.0009998903417374227, + "time_sec": 41.848464012145996 + }, + { + "epoch": 2, + "train_loss": 3.5630809851074217, + "train_acc": 0.18086, + "test_loss": 3.667209470367432, + "test_acc": 0.1901, + "lyapunov": 2.188295935425917, + "grad_norm": 4.65558304747868, + "grad_max_sv": 3.5230118453502657, + "grad_min_sv": 8.682233273438201e-08, + "grad_condition": 88235639.3885431, + "lr": 0.0009995614150494292, + "time_sec": 41.71617341041565 + }, + { + "epoch": 3, + "train_loss": 3.1361752326202392, + "train_acc": 0.24364, + "test_loss": 3.3074075031280517, + "test_acc": 0.2233, + "lyapunov": 2.1415735132553997, + "grad_norm": 3.7913818657372738, + "grad_max_sv": 2.674958550930023, + "grad_min_sv": 7.161170632596914e-08, + "grad_condition": 63512788.56348453, + "lr": 0.0009990133642141358, + "time_sec": 41.742589712142944 + }, + { + "epoch": 4, + "train_loss": 2.818405838470459, + "train_acc": 0.29608, + "test_loss": 3.031781585693359, + "test_acc": 0.2737, + "lyapunov": 2.120552156282508, + "grad_norm": 3.1978924836574523, + "grad_max_sv": 2.1132257640361787, + "grad_min_sv": 6.140957623523846e-08, + "grad_condition": 41436248.19292988, + "lr": 0.0009982464296247522, + "time_sec": 41.72683644294739 + }, + { + "epoch": 5, + "train_loss": 2.6039978585052492, + "train_acc": 0.33664, + "test_loss": 2.8726236545562744, + "test_acc": 0.3009, + "lyapunov": 2.0960761125740186, + "grad_norm": 2.7890150706964407, + "grad_max_sv": 1.7450146913528441, + "grad_min_sv": 5.3137798772251443e-08, + "grad_condition": 39716965.918141864, + "lr": 0.0009972609476841367, + "time_sec": 41.73356294631958 + }, + { + "epoch": 6, + "train_loss": 2.4260194576263427, + "train_acc": 0.37614, + "test_loss": 2.7733699851989746, + "test_acc": 0.326, + "lyapunov": 2.0747361539879723, + "grad_norm": 2.486278628264512, + "grad_max_sv": 1.4613764017820359, + "grad_min_sv": 4.773349010500638e-08, + "grad_condition": 40788863.17353636, + "lr": 0.000996057350657239, + "time_sec": 41.7393217086792 + }, + { + "epoch": 7, + "train_loss": 2.2890482838439943, + "train_acc": 0.40624, + "test_loss": 2.7100242050170897, + "test_acc": 0.3329, + "lyapunov": 2.057765728372442, + "grad_norm": 2.2355663124824687, + "grad_max_sv": 1.2315028876066207, + "grad_min_sv": 4.287546970238587e-08, + "grad_condition": 54190799.969633564, + "lr": 0.000994636166481494, + "time_sec": 41.695188760757446 + }, + { + "epoch": 8, + "train_loss": 2.184328906326294, + "train_acc": 0.4278, + "test_loss": 3.209503977203369, + "test_acc": 0.2887, + "lyapunov": 2.03700729495729, + "grad_norm": 2.0765061614907836, + "grad_max_sv": 1.1610283195972442, + "grad_min_sv": 4.00687799953503e-08, + "grad_condition": 89249974.56926174, + "lr": 0.0009929980185352525, + "time_sec": 41.739415884017944 + }, + { + "epoch": 9, + "train_loss": 2.106717535934448, + "train_acc": 0.4439, + "test_loss": 2.8961434120178224, + "test_acc": 0.3322, + "lyapunov": 2.0108512493655506, + "grad_norm": 1.9349953574193108, + "grad_max_sv": 1.0107193812727928, + "grad_min_sv": 3.7177804969312775e-08, + "grad_condition": 73644312.6485336, + "lr": 0.0009911436253643444, + "time_sec": 41.75891327857971 + }, + { + "epoch": 10, + "train_loss": 2.046322995223999, + "train_acc": 0.4606, + "test_loss": 3.1619003036499023, + "test_acc": 0.2861, + "lyapunov": 1.9493244422976013, + "grad_norm": 1.8008338771473693, + "grad_max_sv": 0.9106233805418015, + "grad_min_sv": 3.458326265255718e-08, + "grad_condition": 426643398.8001811, + "lr": 0.0009890738003669028, + "time_sec": 41.724793434143066 + }, + { + "epoch": 11, + "train_loss": 2.0470443756866454, + "train_acc": 0.45754, + "test_loss": 4.726581622314453, + "test_acc": 0.132, + "lyapunov": 1.806359241380716, + "grad_norm": 1.6667241887950914, + "grad_max_sv": 0.8278753355145454, + "grad_min_sv": 3.192113512962003e-08, + "grad_condition": 45569948.52666045, + "lr": 0.00098678945143658, + "time_sec": 41.766194105148315 + }, + { + "epoch": 12, + "train_loss": 2.091300444564819, + "train_acc": 0.4489, + "test_loss": 6.842439665222168, + "test_acc": 0.0701, + "lyapunov": 1.6469548641873137, + "grad_norm": 1.5001429357831788, + "grad_max_sv": 0.7203063145279884, + "grad_min_sv": 2.8685982090843192e-08, + "grad_condition": 1181136343.424305, + "lr": 0.0009842915805643154, + "time_sec": 41.76103091239929 + }, + { + "epoch": 13, + "train_loss": 2.1495789795684814, + "train_acc": 0.4347, + "test_loss": 12.390533666992187, + "test_acc": 0.0332, + "lyapunov": 1.524907083157688, + "grad_norm": 1.357991065809798, + "grad_max_sv": 0.6235657155513763, + "grad_min_sv": 2.559957669179269e-08, + "grad_condition": 33454022.4653193, + "lr": 0.000981581283398829, + "time_sec": 41.74048900604248 + }, + { + "epoch": 14, + "train_loss": 2.1686959735107423, + "train_acc": 0.4331, + "test_loss": 17.324827462768553, + "test_acc": 0.0125, + "lyapunov": 1.4686146608703887, + "grad_norm": 1.2534922135501005, + "grad_max_sv": 0.5804860837757587, + "grad_min_sv": 2.377185976398799e-08, + "grad_condition": 50488785.520982705, + "lr": 0.0009786597487660333, + "time_sec": 41.79189419746399 + }, + { + "epoch": 15, + "train_loss": 2.1587823439025877, + "train_acc": 0.43484, + "test_loss": 16.184048045349122, + "test_acc": 0.0101, + "lyapunov": 1.4566279469853471, + "grad_norm": 1.2107022136349788, + "grad_max_sv": 0.5652622655034065, + "grad_min_sv": 2.2604362226452678e-08, + "grad_condition": 35806635.9763861, + "lr": 0.0009755282581475766, + "time_sec": 41.749398708343506 + }, + { + "epoch": 16, + "train_loss": 2.24028721862793, + "train_acc": 0.41504, + "test_loss": 14.463521719360351, + "test_acc": 0.0125, + "lyapunov": 1.463649024134097, + "grad_norm": 1.224268307178237, + "grad_max_sv": 0.58356414437294, + "grad_min_sv": 2.2900912488577064e-08, + "grad_condition": 61506774.8063802, + "lr": 0.0009721881851187403, + "time_sec": 41.767138719558716 + }, + { + "epoch": 17, + "train_loss": 2.197388257369995, + "train_acc": 0.42664, + "test_loss": 15.289615742492677, + "test_acc": 0.01, + "lyapunov": 1.4573698674931246, + "grad_norm": 1.1745936162015678, + "grad_max_sv": 0.5660642378032208, + "grad_min_sv": 2.2495864565597047e-08, + "grad_condition": 31210721.463894047, + "lr": 0.0009686409947459456, + "time_sec": 41.71902322769165 + }, + { + "epoch": 18, + "train_loss": 2.1406205596160888, + "train_acc": 0.43818, + "test_loss": 17.7336371963501, + "test_acc": 0.0098, + "lyapunov": 1.4560003051977328, + "grad_norm": 1.1488293447697844, + "grad_max_sv": 0.5552306786179543, + "grad_min_sv": 2.1710132396685067e-08, + "grad_condition": 64010933.751302466, + "lr": 0.0009648882429441254, + "time_sec": 41.740118980407715 + }, + { + "epoch": 19, + "train_loss": 2.1107253352355957, + "train_acc": 0.4427, + "test_loss": 16.837382061767578, + "test_acc": 0.01, + "lyapunov": 1.4612409815458995, + "grad_norm": 1.1472532791884336, + "grad_max_sv": 0.5604257300496102, + "grad_min_sv": 2.1788039477471654e-08, + "grad_condition": 171767310.90465343, + "lr": 0.00096093157579425, + "time_sec": 41.73516607284546 + }, + { + "epoch": 20, + "train_loss": 2.0478131282806395, + "train_acc": 0.4582, + "test_loss": 16.04560538024902, + "test_acc": 0.01, + "lyapunov": 1.4647965620240897, + "grad_norm": 1.1189179896122796, + "grad_max_sv": 0.5224487766623497, + "grad_min_sv": 2.0951748809505676e-08, + "grad_condition": 42033338.387387484, + "lr": 0.0009567727288213001, + "time_sec": 41.719831466674805 + }, + { + "epoch": 21, + "train_loss": 2.2204883486938476, + "train_acc": 0.42222, + "test_loss": 13.492722917175293, + "test_acc": 0.0135, + "lyapunov": 1.4607551369215825, + "grad_norm": 1.1009643643354936, + "grad_max_sv": 0.5138206973671913, + "grad_min_sv": 2.087538478884321e-08, + "grad_condition": 39625814.29055409, + "lr": 0.0009524135262330095, + "time_sec": 41.71716284751892 + }, + { + "epoch": 22, + "train_loss": 2.1108740393829346, + "train_acc": 0.44414, + "test_loss": 10.789187107849122, + "test_acc": 0.0102, + "lyapunov": 1.452153721733776, + "grad_norm": 1.1025834390700462, + "grad_max_sv": 0.5186751410365105, + "grad_min_sv": 2.0848792592342846e-08, + "grad_condition": 89011620.30312964, + "lr": 0.0009478558801197061, + "time_sec": 41.72071313858032 + }, + { + "epoch": 23, + "train_loss": 1.9906964570236205, + "train_acc": 0.47008, + "test_loss": 12.002604922485352, + "test_acc": 0.0125, + "lyapunov": 1.4538751047895389, + "grad_norm": 1.0749591459609724, + "grad_max_sv": 0.499434107542038, + "grad_min_sv": 2.0483097359913494e-08, + "grad_condition": 36067401.20949165, + "lr": 0.000943101789615607, + "time_sec": 41.73177123069763 + }, + { + "epoch": 24, + "train_loss": 1.9467369974899291, + "train_acc": 0.47928, + "test_loss": 10.21612840270996, + "test_acc": 0.012, + "lyapunov": 1.462179490977236, + "grad_norm": 1.057190624864685, + "grad_max_sv": 0.4812349632382393, + "grad_min_sv": 1.985775003971943e-08, + "grad_condition": 439122994.3278316, + "lr": 0.0009381533400219313, + "time_sec": 41.76715135574341 + }, + { + "epoch": 25, + "train_loss": 1.9274399798583985, + "train_acc": 0.48482, + "test_loss": 10.605220227050781, + "test_acc": 0.0122, + "lyapunov": 1.4777010703635642, + "grad_norm": 1.038845556697297, + "grad_max_sv": 0.4696679309010506, + "grad_min_sv": 1.937961372211472e-08, + "grad_condition": 45663315.27575115, + "lr": 0.0009330127018922189, + "time_sec": 41.754496335983276 + }, + { + "epoch": 26, + "train_loss": 1.8965490600585937, + "train_acc": 0.49088, + "test_loss": 10.196444692993165, + "test_acc": 0.0103, + "lyapunov": 1.5161671653732924, + "grad_norm": 1.0307981939853097, + "grad_max_sv": 0.4717611216008663, + "grad_min_sv": 1.9327519586512243e-08, + "grad_condition": 96461690.8495032, + "lr": 0.000927682130080253, + "time_sec": 41.737120389938354 + }, + { + "epoch": 27, + "train_loss": 1.884097469177246, + "train_acc": 0.4982, + "test_loss": 10.597889468383789, + "test_acc": 0.0123, + "lyapunov": 1.5833752179694602, + "grad_norm": 1.0146704552097585, + "grad_max_sv": 0.4673022925853729, + "grad_min_sv": 1.917618910607377e-08, + "grad_condition": 32192665.879274238, + "lr": 0.0009221639627510072, + "time_sec": 41.73063254356384 + }, + { + "epoch": 28, + "train_loss": 1.8578104418563843, + "train_acc": 0.5034, + "test_loss": 9.287236483764648, + "test_acc": 0.017, + "lyapunov": 1.6747892195611354, + "grad_norm": 0.989988586491176, + "grad_max_sv": 0.45249250531196594, + "grad_min_sv": 1.8457542250160942e-08, + "grad_condition": 32054185.63348528, + "lr": 0.0009164606203550494, + "time_sec": 41.71113634109497 + }, + { + "epoch": 29, + "train_loss": 1.834356333580017, + "train_acc": 0.50832, + "test_loss": 12.138305050659179, + "test_acc": 0.01, + "lyapunov": 1.7328125092074693, + "grad_norm": 0.9644353292361907, + "grad_max_sv": 0.4445766285061836, + "grad_min_sv": 1.826234232171764e-08, + "grad_condition": 29277750.507297922, + "lr": 0.0009105746045668516, + "time_sec": 41.737956047058105 + }, + { + "epoch": 30, + "train_loss": 1.810653836517334, + "train_acc": 0.5128, + "test_loss": 11.570760047912598, + "test_acc": 0.0167, + "lyapunov": 1.7364137608681798, + "grad_norm": 0.9545104714701855, + "grad_max_sv": 0.4332597106695175, + "grad_min_sv": 1.7821457946876064e-08, + "grad_condition": 75116898.03321448, + "lr": 0.0009045084971874733, + "time_sec": 41.73191165924072 + }, + { + "epoch": 31, + "train_loss": 1.7940360905456543, + "train_acc": 0.51942, + "test_loss": 12.05395121154785, + "test_acc": 0.0152, + "lyapunov": 1.730164911740881, + "grad_norm": 0.9424489794980085, + "grad_max_sv": 0.4163834311068058, + "grad_min_sv": 1.7580776200121217e-08, + "grad_condition": 71781634.8284968, + "lr": 0.0008982649590120977, + "time_sec": 41.76260232925415 + }, + { + "epoch": 32, + "train_loss": 1.764079447441101, + "train_acc": 0.5262, + "test_loss": 11.69735246734619, + "test_acc": 0.0133, + "lyapunov": 1.7403116387784328, + "grad_norm": 0.91821833583086, + "grad_max_sv": 0.40526579022407533, + "grad_min_sv": 1.7294268717105156e-08, + "grad_condition": 28466138.249642067, + "lr": 0.0008918467286629196, + "time_sec": 41.76823139190674 + }, + { + "epoch": 33, + "train_loss": 1.751036173324585, + "train_acc": 0.52762, + "test_loss": 11.700557440185547, + "test_acc": 0.016, + "lyapunov": 1.7537712962426188, + "grad_norm": 0.909925919391314, + "grad_max_sv": 0.39359075799584387, + "grad_min_sv": 1.6999775425199926e-08, + "grad_condition": 94547209.98642035, + "lr": 0.0008852566213878943, + "time_sec": 41.73266649246216 + }, + { + "epoch": 34, + "train_loss": 1.7285531663131715, + "train_acc": 0.53388, + "test_loss": 14.241070452880859, + "test_acc": 0.01, + "lyapunov": 1.7564430843533763, + "grad_norm": 0.9007686052485974, + "grad_max_sv": 0.3874150216579437, + "grad_min_sv": 1.662327348064818e-08, + "grad_condition": 112275201.21762475, + "lr": 0.000878497527825878, + "time_sec": 41.72823667526245 + }, + { + "epoch": 35, + "train_loss": 1.7027341010665893, + "train_acc": 0.53832, + "test_loss": 12.757903733825684, + "test_acc": 0.01, + "lyapunov": 1.7510422882826433, + "grad_norm": 0.886721330769414, + "grad_max_sv": 0.3859048821032047, + "grad_min_sv": 1.6686874249050022e-08, + "grad_condition": 44676896.67358022, + "lr": 0.000871572412738697, + "time_sec": 41.73277544975281 + }, + { + "epoch": 36, + "train_loss": 1.6989579335403442, + "train_acc": 0.53834, + "test_loss": 11.037862075805664, + "test_acc": 0.0102, + "lyapunov": 1.7443612588336095, + "grad_norm": 0.8830820544047993, + "grad_max_sv": 0.3802352599799633, + "grad_min_sv": 1.6571208601157127e-08, + "grad_condition": 40953173.268342055, + "lr": 0.0008644843137107055, + "time_sec": 41.74021887779236 + }, + { + "epoch": 37, + "train_loss": 1.6595187205123902, + "train_acc": 0.54764, + "test_loss": 13.855162429809571, + "test_acc": 0.01, + "lyapunov": 1.7497367005214057, + "grad_norm": 0.8805179443959777, + "grad_max_sv": 0.38206519186496735, + "grad_min_sv": 1.6626910238556892e-08, + "grad_condition": 79050742.35563095, + "lr": 0.0008572363398164014, + "time_sec": 41.727495431900024 + }, + { + "epoch": 38, + "train_loss": 1.6525180630493164, + "train_acc": 0.5472, + "test_loss": 10.174911602783203, + "test_acc": 0.0102, + "lyapunov": 1.755283591387522, + "grad_norm": 0.8714972087631, + "grad_max_sv": 0.3799257561564445, + "grad_min_sv": 1.6515901316016546e-08, + "grad_condition": 33472502.364460837, + "lr": 0.0008498316702566826, + "time_sec": 41.72185707092285 + }, + { + "epoch": 39, + "train_loss": 1.6343883077239991, + "train_acc": 0.55552, + "test_loss": 9.518302935791016, + "test_acc": 0.01, + "lyapunov": 1.762697722600854, + "grad_norm": 0.8650903756259212, + "grad_max_sv": 0.373224213719368, + "grad_min_sv": 1.629653018659499e-08, + "grad_condition": 242558967.4404312, + "lr": 0.0008422735529643442, + "time_sec": 41.745888233184814 + }, + { + "epoch": 40, + "train_loss": 1.6239042503738403, + "train_acc": 0.55832, + "test_loss": 10.750873959350585, + "test_acc": 0.0101, + "lyapunov": 1.7671644626675969, + "grad_norm": 0.8615165918799466, + "grad_max_sv": 0.3635469309985638, + "grad_min_sv": 1.5863799457394024e-08, + "grad_condition": 25941539.54554946, + "lr": 0.0008345653031794289, + "time_sec": 41.70173764228821 + }, + { + "epoch": 41, + "train_loss": 1.5980668620681762, + "train_acc": 0.563, + "test_loss": 11.261173056030273, + "test_acc": 0.0105, + "lyapunov": 1.7558496117286975, + "grad_norm": 0.8470729441915447, + "grad_max_sv": 0.3594608798623085, + "grad_min_sv": 1.5847214656153353e-08, + "grad_condition": 160939362.18002337, + "lr": 0.0008267103019950526, + "time_sec": 41.731508016586304 + }, + { + "epoch": 42, + "train_loss": 1.594250914001465, + "train_acc": 0.56716, + "test_loss": 10.016403302001953, + "test_acc": 0.01, + "lyapunov": 1.766978118730628, + "grad_norm": 0.8410539632359486, + "grad_max_sv": 0.35176880434155466, + "grad_min_sv": 1.5649215069635236e-08, + "grad_condition": 50077833.56187671, + "lr": 0.0008187119948743447, + "time_sec": 41.71690511703491 + }, + { + "epoch": 43, + "train_loss": 1.5708948085403442, + "train_acc": 0.57018, + "test_loss": 11.715487506103516, + "test_acc": 0.01, + "lyapunov": 1.7680624424649016, + "grad_norm": 0.8364943892646896, + "grad_max_sv": 0.353987617790699, + "grad_min_sv": 1.5521426501192982e-08, + "grad_condition": 362645019.5271845, + "lr": 0.000810573890139155, + "time_sec": 41.77493691444397 + }, + { + "epoch": 44, + "train_loss": 1.5518158061981202, + "train_acc": 0.57474, + "test_loss": 11.870717695617676, + "test_acc": 0.0103, + "lyapunov": 1.7640279894289763, + "grad_norm": 0.8329281017119827, + "grad_max_sv": 0.3474211238324642, + "grad_min_sv": 1.53803134561592e-08, + "grad_condition": 49790886.09537061, + "lr": 0.0008022995574311873, + "time_sec": 41.73730731010437 + }, + { + "epoch": 45, + "train_loss": 1.5414947969436645, + "train_acc": 0.57792, + "test_loss": 14.768106381225586, + "test_acc": 0.01, + "lyapunov": 1.772820667842465, + "grad_norm": 0.824959319471384, + "grad_max_sv": 0.346543176472187, + "grad_min_sv": 1.499499133958415e-08, + "grad_condition": 49055951.18654322, + "lr": 0.0007938926261462363, + "time_sec": 41.74028420448303 + }, + { + "epoch": 46, + "train_loss": 1.5390674185943602, + "train_acc": 0.57778, + "test_loss": 10.678796853637696, + "test_acc": 0.0106, + "lyapunov": 1.7763960602338358, + "grad_norm": 0.8259227345781174, + "grad_max_sv": 0.34485682621598246, + "grad_min_sv": 1.532375328294755e-08, + "grad_condition": 29515175.585395336, + "lr": 0.0007853567838422158, + "time_sec": 41.71578240394592 + }, + { + "epoch": 47, + "train_loss": 1.5156348711013794, + "train_acc": 0.58496, + "test_loss": 12.33722748413086, + "test_acc": 0.01, + "lyapunov": 1.778136059146403, + "grad_norm": 0.8118804272027214, + "grad_max_sv": 0.33651591315865514, + "grad_min_sv": 1.48985853015704e-08, + "grad_condition": 32427765.904840797, + "lr": 0.0007766957746216719, + "time_sec": 41.76110529899597 + }, + { + "epoch": 48, + "train_loss": 1.503568607826233, + "train_acc": 0.5869, + "test_loss": 10.218246252441407, + "test_acc": 0.0125, + "lyapunov": 1.7889400653522034, + "grad_norm": 0.8112667421683987, + "grad_max_sv": 0.3342376798391342, + "grad_min_sv": 1.5198339796060335e-08, + "grad_condition": 81110927.62072141, + "lr": 0.0007679133974894982, + "time_sec": 41.798474073410034 + }, + { + "epoch": 49, + "train_loss": 1.4914441897201538, + "train_acc": 0.59068, + "test_loss": 10.23879136352539, + "test_acc": 0.0103, + "lyapunov": 1.7940370106636105, + "grad_norm": 0.8084640817095641, + "grad_max_sv": 0.3433864340186119, + "grad_min_sv": 1.5079113801271667e-08, + "grad_condition": 259924317.05383635, + "lr": 0.000759013504686565, + "time_sec": 41.759873151779175 + }, + { + "epoch": 50, + "train_loss": 1.477221953201294, + "train_acc": 0.5921, + "test_loss": 10.929328930664063, + "test_acc": 0.0102, + "lyapunov": 1.7905599601433406, + "grad_norm": 0.8111299716185066, + "grad_max_sv": 0.3306982435286045, + "grad_min_sv": 1.4904924214992343e-08, + "grad_condition": 87306318.24085236, + "lr": 0.0007499999999999998, + "time_sec": 41.733423948287964 + }, + { + "epoch": 51, + "train_loss": 1.456133448753357, + "train_acc": 0.59808, + "test_loss": 12.16511858215332, + "test_acc": 0.01, + "lyapunov": 1.7792884236406488, + "grad_norm": 0.8005480239065623, + "grad_max_sv": 0.3357121139764786, + "grad_min_sv": 1.5030659702985893e-08, + "grad_condition": 30183370.530579127, + "lr": 0.0007408768370508575, + "time_sec": 41.806249380111694 + }, + { + "epoch": 52, + "train_loss": 1.436393115272522, + "train_acc": 0.60276, + "test_loss": 11.33924033203125, + "test_acc": 0.0142, + "lyapunov": 1.7749551976733196, + "grad_norm": 0.7982513867356777, + "grad_max_sv": 0.32782707288861274, + "grad_min_sv": 1.476541508851903e-08, + "grad_condition": 63415053.39074744, + "lr": 0.0007316480175599307, + "time_sec": 41.759939193725586 + }, + { + "epoch": 53, + "train_loss": 1.4389901905822753, + "train_acc": 0.60084, + "test_loss": 11.576705731201171, + "test_acc": 0.0113, + "lyapunov": 1.766155862747251, + "grad_norm": 0.7938768037151195, + "grad_max_sv": 0.3293768920004368, + "grad_min_sv": 1.45633583338578e-08, + "grad_condition": 98098875.28367049, + "lr": 0.0007223175895924635, + "time_sec": 41.73505473136902 + }, + { + "epoch": 54, + "train_loss": 1.4107453610610963, + "train_acc": 0.60912, + "test_loss": 11.234718688964843, + "test_acc": 0.0156, + "lyapunov": 1.7835360521550678, + "grad_norm": 0.7862863339800243, + "grad_max_sv": 0.3239886038005352, + "grad_min_sv": 1.4647660306638805e-08, + "grad_condition": 285635859.79599005, + "lr": 0.0007128896457825361, + "time_sec": 41.779306411743164 + }, + { + "epoch": 55, + "train_loss": 1.4032011807250977, + "train_acc": 0.6082, + "test_loss": 12.058402252197265, + "test_acc": 0.0107, + "lyapunov": 1.7729148389128468, + "grad_norm": 0.7877789076276893, + "grad_max_sv": 0.32600906267762186, + "grad_min_sv": 1.4553093863334255e-08, + "grad_condition": 25654915.22441258, + "lr": 0.0007033683215378998, + "time_sec": 41.73508405685425 + }, + { + "epoch": 56, + "train_loss": 1.389821086883545, + "train_acc": 0.61304, + "test_loss": 13.385974339294433, + "test_acc": 0.0115, + "lyapunov": 1.7800112602960727, + "grad_norm": 0.780097891210278, + "grad_max_sv": 0.32187015265226365, + "grad_min_sv": 1.4437614045959001e-08, + "grad_condition": 33124328.491749655, + "lr": 0.0006937577932260512, + "time_sec": 41.74309992790222 + }, + { + "epoch": 57, + "train_loss": 1.376256035270691, + "train_acc": 0.61968, + "test_loss": 10.000209881591797, + "test_acc": 0.0157, + "lyapunov": 1.7677047642905388, + "grad_norm": 0.7757298452995354, + "grad_max_sv": 0.3148633047938347, + "grad_min_sv": 1.427116047281185e-08, + "grad_condition": 52388350.904575035, + "lr": 0.0006840622763423388, + "time_sec": 41.73425316810608 + }, + { + "epoch": 58, + "train_loss": 1.3577024307250976, + "train_acc": 0.6221, + "test_loss": 11.551155778503418, + "test_acc": 0.0108, + "lyapunov": 1.766695433870301, + "grad_norm": 0.7787106519229474, + "grad_max_sv": 0.3169295161962509, + "grad_min_sv": 1.427448586104052e-08, + "grad_condition": 167873010.74021894, + "lr": 0.0006742860236609073, + "time_sec": 41.72939348220825 + }, + { + "epoch": 59, + "train_loss": 1.3431843811035156, + "train_acc": 0.62504, + "test_loss": 10.233863699340821, + "test_acc": 0.0126, + "lyapunov": 1.767587873636914, + "grad_norm": 0.7718749591390539, + "grad_max_sv": 0.3105091955512762, + "grad_min_sv": 1.4096653365089363e-08, + "grad_condition": 84346381.61884929, + "lr": 0.0006644333233692913, + "time_sec": 41.71211218833923 + }, + { + "epoch": 60, + "train_loss": 1.3301828622055054, + "train_acc": 0.62656, + "test_loss": 9.515221376037598, + "test_acc": 0.016, + "lyapunov": 1.7664891353348637, + "grad_norm": 0.7687046852005539, + "grad_max_sv": 0.31579539775848386, + "grad_min_sv": 1.4306913373451912e-08, + "grad_condition": 38941146.332359776, + "lr": 0.0006545084971874734, + "time_sec": 41.73012900352478 + }, + { + "epoch": 61, + "train_loss": 1.319080140838623, + "train_acc": 0.63132, + "test_loss": 10.18255209350586, + "test_acc": 0.01, + "lyapunov": 1.758082925206255, + "grad_norm": 0.7656519838760512, + "grad_max_sv": 0.31509713754057883, + "grad_min_sv": 1.4063286060683743e-08, + "grad_condition": 36757136.13513379, + "lr": 0.0006445158984722354, + "time_sec": 41.74629807472229 + }, + { + "epoch": 62, + "train_loss": 1.3072694900894164, + "train_acc": 0.63358, + "test_loss": 9.852577113342285, + "test_acc": 0.0157, + "lyapunov": 1.7683055998419253, + "grad_norm": 0.7632626265760565, + "grad_max_sv": 0.30540504679083824, + "grad_min_sv": 1.411255184935456e-08, + "grad_condition": 35246238.545284316, + "lr": 0.0006344599103076324, + "time_sec": 41.72388529777527 + }, + { + "epoch": 63, + "train_loss": 1.302987167930603, + "train_acc": 0.63614, + "test_loss": 10.932140390014649, + "test_acc": 0.01, + "lyapunov": 1.7677838107204193, + "grad_norm": 0.7598643821024783, + "grad_max_sv": 0.31203090995550153, + "grad_min_sv": 1.3685938854424151e-08, + "grad_condition": 39311964.1113611, + "lr": 0.0006243449435824269, + "time_sec": 41.76644206047058 + }, + { + "epoch": 64, + "train_loss": 1.285763971786499, + "train_acc": 0.64012, + "test_loss": 11.513975454711915, + "test_acc": 0.01, + "lyapunov": 1.7577931804730154, + "grad_norm": 0.7633302291016576, + "grad_max_sv": 0.31339493915438654, + "grad_min_sv": 1.4064278855419055e-08, + "grad_condition": 33195309.931640428, + "lr": 0.0006141754350553275, + "time_sec": 41.7900927066803 + }, + { + "epoch": 65, + "train_loss": 1.268479045677185, + "train_acc": 0.64226, + "test_loss": 11.874932281494141, + "test_acc": 0.0102, + "lyapunov": 1.7744586839700294, + "grad_norm": 0.7570752901436341, + "grad_max_sv": 0.3083444222807884, + "grad_min_sv": 1.406103339388065e-08, + "grad_condition": 43393899.19734432, + "lr": 0.0006039558454088793, + "time_sec": 41.74698352813721 + }, + { + "epoch": 66, + "train_loss": 1.2628416799926758, + "train_acc": 0.64434, + "test_loss": 12.747333851623535, + "test_acc": 0.0099, + "lyapunov": 1.7652160459772095, + "grad_norm": 0.7571128878479004, + "grad_max_sv": 0.3126042574644089, + "grad_min_sv": 1.4062863940011993e-08, + "grad_condition": 60733680.441956446, + "lr": 0.000593690657292862, + "time_sec": 41.72180390357971 + }, + { + "epoch": 67, + "train_loss": 1.2434362339019776, + "train_acc": 0.64988, + "test_loss": 10.704685067749024, + "test_acc": 0.0101, + "lyapunov": 1.75891925093463, + "grad_norm": 0.7495262779991995, + "grad_max_sv": 0.308939852565527, + "grad_min_sv": 1.3881026922346606e-08, + "grad_condition": 36133582.94536222, + "lr": 0.0005833843733580507, + "time_sec": 41.790682554244995 + }, + { + "epoch": 68, + "train_loss": 1.2320277339935304, + "train_acc": 0.65302, + "test_loss": 9.829946832275391, + "test_acc": 0.0113, + "lyapunov": 1.7762341871285987, + "grad_norm": 0.7453247888859125, + "grad_max_sv": 0.3007917396724224, + "grad_min_sv": 1.3786684129393767e-08, + "grad_condition": 79783709.75702718, + "lr": 0.0005730415142812054, + "time_sec": 41.743003368377686 + }, + { + "epoch": 69, + "train_loss": 1.2199441442871093, + "train_acc": 0.65628, + "test_loss": 12.249142663574219, + "test_acc": 0.0104, + "lyapunov": 1.7720091150849677, + "grad_norm": 0.7485737482328051, + "grad_max_sv": 0.30392555296421053, + "grad_min_sv": 1.3645029822012544e-08, + "grad_condition": 53570537.02263519, + "lr": 0.0005626666167821517, + "time_sec": 41.72006964683533 + }, + { + "epoch": 70, + "train_loss": 1.2144978989028932, + "train_acc": 0.65798, + "test_loss": 11.88633623046875, + "test_acc": 0.0114, + "lyapunov": 1.7648274313153514, + "grad_norm": 0.7493531394049379, + "grad_max_sv": 0.31028358563780783, + "grad_min_sv": 1.3737555910886545e-08, + "grad_condition": 63226808.635275245, + "lr": 0.0005522642316338265, + "time_sec": 41.7224395275116 + }, + { + "epoch": 71, + "train_loss": 1.192921284866333, + "train_acc": 0.66314, + "test_loss": 11.224198191833496, + "test_acc": 0.0108, + "lyapunov": 1.770425531870264, + "grad_norm": 0.7375193088344132, + "grad_max_sv": 0.29694446846842765, + "grad_min_sv": 1.3482549720417181e-08, + "grad_condition": 47701044.66392641, + "lr": 0.0005418389216661573, + "time_sec": 41.73777651786804 + }, + { + "epoch": 72, + "train_loss": 1.1844216130065919, + "train_acc": 0.66336, + "test_loss": 11.026349151611328, + "test_acc": 0.0131, + "lyapunov": 1.7741029829625279, + "grad_norm": 0.7407625768939419, + "grad_max_sv": 0.30231842771172523, + "grad_min_sv": 1.3496719990929718e-08, + "grad_condition": 51346886.185487434, + "lr": 0.0005313952597646563, + "time_sec": 41.74572229385376 + }, + { + "epoch": 73, + "train_loss": 1.1756603861618042, + "train_acc": 0.66744, + "test_loss": 9.035702542114258, + "test_acc": 0.0119, + "lyapunov": 1.7680888843658331, + "grad_norm": 0.7332870405694026, + "grad_max_sv": 0.29791994765400887, + "grad_min_sv": 1.356694562977545e-08, + "grad_condition": 67898310.26018615, + "lr": 0.0005209378268645994, + "time_sec": 41.74131917953491 + }, + { + "epoch": 74, + "train_loss": 1.165503525543213, + "train_acc": 0.66762, + "test_loss": 12.354495669555664, + "test_acc": 0.0119, + "lyapunov": 1.7657780351541232, + "grad_norm": 0.7373585150690359, + "grad_max_sv": 0.29792211577296257, + "grad_min_sv": 1.339521861626336e-08, + "grad_condition": 67921318.07855129, + "lr": 0.0005104712099416781, + "time_sec": 41.732377767562866 + }, + { + "epoch": 75, + "train_loss": 1.15907166721344, + "train_acc": 0.66996, + "test_loss": 11.736955917358399, + "test_acc": 0.0107, + "lyapunov": 1.7724456491372775, + "grad_norm": 0.7381218970383491, + "grad_max_sv": 0.30278131291270255, + "grad_min_sv": 1.3430600983611873e-08, + "grad_condition": 1590939536.616202, + "lr": 0.0004999999999999996, + "time_sec": 41.76725125312805 + }, + { + "epoch": 76, + "train_loss": 1.1549719894790649, + "train_acc": 0.673, + "test_loss": 10.820277821350098, + "test_acc": 0.0131, + "lyapunov": 1.7753572616430804, + "grad_norm": 0.7324129490101708, + "grad_max_sv": 0.29599803127348423, + "grad_min_sv": 1.3179824837755704e-08, + "grad_condition": 69530865.36553702, + "lr": 0.0004895287900583212, + "time_sec": 41.7483696937561 + }, + { + "epoch": 77, + "train_loss": 1.1430336932373046, + "train_acc": 0.67594, + "test_loss": 12.702352023315429, + "test_acc": 0.0164, + "lyapunov": 1.7649742627082883, + "grad_norm": 0.7319965225806975, + "grad_max_sv": 0.30014127865433693, + "grad_min_sv": 1.362019530493086e-08, + "grad_condition": 26983075.532588482, + "lr": 0.0004790621731353997, + "time_sec": 41.7334041595459 + }, + { + "epoch": 78, + "train_loss": 1.139764607963562, + "train_acc": 0.67532, + "test_loss": 10.281317558288574, + "test_acc": 0.0113, + "lyapunov": 1.773946383725042, + "grad_norm": 0.7270136688563837, + "grad_max_sv": 0.2866762079298496, + "grad_min_sv": 1.3297384002936008e-08, + "grad_condition": 95739532.89705701, + "lr": 0.000468604740235343, + "time_sec": 41.72801947593689 + }, + { + "epoch": 79, + "train_loss": 1.1197996570205688, + "train_acc": 0.68366, + "test_loss": 10.05328071899414, + "test_acc": 0.0193, + "lyapunov": 1.7761001812527553, + "grad_norm": 0.7245272614612472, + "grad_max_sv": 0.295285864174366, + "grad_min_sv": 1.3208504343747985e-08, + "grad_condition": 55296028.27484087, + "lr": 0.00045816107833384175, + "time_sec": 41.710914611816406 + }, + { + "epoch": 80, + "train_loss": 1.1211604401397706, + "train_acc": 0.68064, + "test_loss": 10.973610772705078, + "test_acc": 0.0147, + "lyapunov": 1.7698543568706269, + "grad_norm": 0.7308867991275836, + "grad_max_sv": 0.29655324965715407, + "grad_min_sv": 1.3334803825038044e-08, + "grad_condition": 213961832.8340079, + "lr": 0.0004477357683661729, + "time_sec": 41.752094745635986 + }, + { + "epoch": 81, + "train_loss": 1.1020245618247986, + "train_acc": 0.6878, + "test_loss": 9.28792036743164, + "test_acc": 0.0134, + "lyapunov": 1.7763843307714633, + "grad_norm": 0.7203053332920707, + "grad_max_sv": 0.29178380146622657, + "grad_min_sv": 1.3194537250640903e-08, + "grad_condition": 74692731.83944798, + "lr": 0.00043733338321784746, + "time_sec": 41.739606857299805 + }, + { + "epoch": 82, + "train_loss": 1.0891459491539002, + "train_acc": 0.6923, + "test_loss": 11.004553327941894, + "test_acc": 0.0154, + "lyapunov": 1.7708229360068242, + "grad_norm": 0.7219577932651793, + "grad_max_sv": 0.28799295648932455, + "grad_min_sv": 1.3246153596701507e-08, + "grad_condition": 1727958352.0211291, + "lr": 0.0004269584857187939, + "time_sec": 41.79018187522888 + }, + { + "epoch": 83, + "train_loss": 1.080449527873993, + "train_acc": 0.69162, + "test_loss": 11.05731633605957, + "test_acc": 0.0141, + "lyapunov": 1.7651297466834184, + "grad_norm": 0.720622015563507, + "grad_max_sv": 0.2987635262310505, + "grad_min_sv": 1.3153302928434196e-08, + "grad_condition": 84860977.6783236, + "lr": 0.0004166156266419484, + "time_sec": 41.755199909210205 + }, + { + "epoch": 84, + "train_loss": 1.0714698913002014, + "train_acc": 0.6948, + "test_loss": 10.235596168518066, + "test_acc": 0.0185, + "lyapunov": 1.7632971120917278, + "grad_norm": 0.7204291113502606, + "grad_max_sv": 0.2882640101015568, + "grad_min_sv": 1.3200813259520162e-08, + "grad_condition": 64250575.37180309, + "lr": 0.0004063093427071373, + "time_sec": 41.73304057121277 + }, + { + "epoch": 85, + "train_loss": 1.0547249691009521, + "train_acc": 0.6967, + "test_loss": 9.355292175292968, + "test_acc": 0.0126, + "lyapunov": 1.770005767607628, + "grad_norm": 0.714725740267623, + "grad_max_sv": 0.2887449931353331, + "grad_min_sv": 1.2776617198950734e-08, + "grad_condition": 32537451.724384047, + "lr": 0.0003960441545911199, + "time_sec": 41.763319969177246 + }, + { + "epoch": 86, + "train_loss": 1.0497499071884155, + "train_acc": 0.6993, + "test_loss": 11.439105712890624, + "test_acc": 0.0116, + "lyapunov": 1.769535358909451, + "grad_norm": 0.7186835197284615, + "grad_max_sv": 0.2929870404303074, + "grad_min_sv": 1.3005664252496718e-08, + "grad_condition": 50358344.56965059, + "lr": 0.0003858245649446718, + "time_sec": 41.759509563446045 + }, + { + "epoch": 87, + "train_loss": 1.0480333641815185, + "train_acc": 0.70204, + "test_loss": 10.220489350891114, + "test_acc": 0.0168, + "lyapunov": 1.7779154966554374, + "grad_norm": 0.7156736279381971, + "grad_max_sv": 0.293089197576046, + "grad_min_sv": 1.2898874929279103e-08, + "grad_condition": 38639133.94479625, + "lr": 0.00037565505641757235, + "time_sec": 41.744720458984375 + }, + { + "epoch": 88, + "train_loss": 1.0331918328857421, + "train_acc": 0.70388, + "test_loss": 10.892332235717774, + "test_acc": 0.0121, + "lyapunov": 1.759305640864555, + "grad_norm": 0.7103154164514878, + "grad_max_sv": 0.2848528869450092, + "grad_min_sv": 1.3125346690068262e-08, + "grad_condition": 28688795.02721579, + "lr": 0.00036554008969236695, + "time_sec": 41.74627327919006 + }, + { + "epoch": 89, + "train_loss": 1.0360725844573975, + "train_acc": 0.70146, + "test_loss": 10.302078147888183, + "test_acc": 0.0113, + "lyapunov": 1.777204498610533, + "grad_norm": 0.7088384915136853, + "grad_max_sv": 0.28413923680782316, + "grad_min_sv": 1.2809459053186866e-08, + "grad_condition": 52519459.50215302, + "lr": 0.0003554841015277638, + "time_sec": 41.750773191452026 + }, + { + "epoch": 90, + "train_loss": 1.0214117762374877, + "train_acc": 0.70484, + "test_loss": 10.16612608642578, + "test_acc": 0.0121, + "lyapunov": 1.7840187842278834, + "grad_norm": 0.7097566485316775, + "grad_max_sv": 0.28452762179076674, + "grad_min_sv": 1.283485556169417e-08, + "grad_condition": 36967025.92542716, + "lr": 0.000345491502812526, + "time_sec": 41.747437715530396 + }, + { + "epoch": 91, + "train_loss": 1.0132212543487549, + "train_acc": 0.70924, + "test_loss": 11.091903131103516, + "test_acc": 0.0123, + "lyapunov": 1.7805987797734681, + "grad_norm": 0.7112179098858065, + "grad_max_sv": 0.29041158556938174, + "grad_min_sv": 1.3019207038660052e-08, + "grad_condition": 118334947.19681804, + "lr": 0.0003355666766307081, + "time_sec": 41.84413456916809 + }, + { + "epoch": 92, + "train_loss": 0.9958220034408569, + "train_acc": 0.71482, + "test_loss": 10.695934730529785, + "test_acc": 0.0125, + "lyapunov": 1.7850334808954498, + "grad_norm": 0.7041520599662644, + "grad_max_sv": 0.276868636906147, + "grad_min_sv": 1.2641634730345408e-08, + "grad_condition": 108378335.09120658, + "lr": 0.00032571397633909225, + "time_sec": 41.721917152404785 + }, + { + "epoch": 93, + "train_loss": 0.9925233172988892, + "train_acc": 0.71296, + "test_loss": 9.900304016113282, + "test_acc": 0.0142, + "lyapunov": 1.7714714616765757, + "grad_norm": 0.7010252437446836, + "grad_max_sv": 0.2805999223142862, + "grad_min_sv": 1.2807822971812321e-08, + "grad_condition": 124735230.310988, + "lr": 0.00031593772365766094, + "time_sec": 41.73945736885071 + }, + { + "epoch": 94, + "train_loss": 0.985612870979309, + "train_acc": 0.71518, + "test_loss": 10.369019525146484, + "test_acc": 0.0151, + "lyapunov": 1.7871656667850817, + "grad_norm": 0.7023173867680181, + "grad_max_sv": 0.28844468407332896, + "grad_min_sv": 1.2746448550468582e-08, + "grad_condition": 63791900.761746526, + "lr": 0.0003062422067739483, + "time_sec": 41.7353515625 + }, + { + "epoch": 95, + "train_loss": 0.9805331708526611, + "train_acc": 0.72106, + "test_loss": 10.547651748657227, + "test_acc": 0.0105, + "lyapunov": 1.7860868407027495, + "grad_norm": 0.6990201105068031, + "grad_max_sv": 0.27978494167327883, + "grad_min_sv": 1.2488151815426284e-08, + "grad_condition": 35452191.78787039, + "lr": 0.00029663167846209965, + "time_sec": 41.766570806503296 + }, + { + "epoch": 96, + "train_loss": 0.9642451547813415, + "train_acc": 0.72286, + "test_loss": 11.060740502929688, + "test_acc": 0.0101, + "lyapunov": 1.7756004104833774, + "grad_norm": 0.6950929636130921, + "grad_max_sv": 0.2777584385126829, + "grad_min_sv": 1.2606516046342886e-08, + "grad_condition": 90939925.58883393, + "lr": 0.00028711035421746345, + "time_sec": 41.759474992752075 + }, + { + "epoch": 97, + "train_loss": 0.9582952698898315, + "train_acc": 0.72416, + "test_loss": 10.613461477661133, + "test_acc": 0.0114, + "lyapunov": 1.7874563033013697, + "grad_norm": 0.7012998629347693, + "grad_max_sv": 0.2896071758121252, + "grad_min_sv": 1.2955023373506513e-08, + "grad_condition": 31672949.59152009, + "lr": 0.00027768241040753615, + "time_sec": 41.737287282943726 + }, + { + "epoch": 98, + "train_loss": 0.9639710576629639, + "train_acc": 0.72214, + "test_loss": 11.234573606872559, + "test_acc": 0.0134, + "lyapunov": 1.7810891217282971, + "grad_norm": 0.6990377551445951, + "grad_max_sv": 0.2823152020573616, + "grad_min_sv": 1.2558187708830437e-08, + "grad_condition": 78167153.5339839, + "lr": 0.00026835198244006903, + "time_sec": 41.74579834938049 + }, + { + "epoch": 99, + "train_loss": 0.9447334141540528, + "train_acc": 0.72846, + "test_loss": 10.620676115417481, + "test_acc": 0.0107, + "lyapunov": 1.7829816115786656, + "grad_norm": 0.6922495069322686, + "grad_max_sv": 0.28143189325928686, + "grad_min_sv": 1.2378237203031911e-08, + "grad_condition": 377146566.75206596, + "lr": 0.0002591231629491421, + "time_sec": 41.73288822174072 + }, + { + "epoch": 100, + "train_loss": 0.9382104275894165, + "train_acc": 0.72974, + "test_loss": 10.38056852722168, + "test_acc": 0.0121, + "lyapunov": 1.7843644152516904, + "grad_norm": 0.6919660624309919, + "grad_max_sv": 0.285617096722126, + "grad_min_sv": 1.2653852852692604e-08, + "grad_condition": 70667945.3735242, + "lr": 0.0002499999999999997, + "time_sec": 41.74325895309448 + }, + { + "epoch": 101, + "train_loss": 0.9415825703430176, + "train_acc": 0.72966, + "test_loss": 10.117093821716308, + "test_acc": 0.011, + "lyapunov": 1.791993932345944, + "grad_norm": 0.6955474621308447, + "grad_max_sv": 0.2884152356535196, + "grad_min_sv": 1.265317002563382e-08, + "grad_condition": 37090841.68628693, + "lr": 0.00024098649531343477, + "time_sec": 41.7480993270874 + }, + { + "epoch": 102, + "train_loss": 0.9256098588180542, + "train_acc": 0.733, + "test_loss": 10.386307803344726, + "test_acc": 0.013, + "lyapunov": 1.7790814763139886, + "grad_norm": 0.6940683931042843, + "grad_max_sv": 0.2775864779949188, + "grad_min_sv": 1.2400528336120598e-08, + "grad_condition": 33373897.247979783, + "lr": 0.0002320866025105016, + "time_sec": 41.73914933204651 + }, + { + "epoch": 103, + "train_loss": 0.9233090299606324, + "train_acc": 0.73216, + "test_loss": 11.106814224243164, + "test_acc": 0.0129, + "lyapunov": 1.7839170090682672, + "grad_norm": 0.690896164616605, + "grad_max_sv": 0.2870456736534834, + "grad_min_sv": 1.2781738229546841e-08, + "grad_condition": 169221408.83590072, + "lr": 0.0002233042253783278, + "time_sec": 41.74682021141052 + }, + { + "epoch": 104, + "train_loss": 0.9120979603004455, + "train_acc": 0.73614, + "test_loss": 10.833344114685058, + "test_acc": 0.0133, + "lyapunov": 1.7876447039796872, + "grad_norm": 0.6871057009031657, + "grad_max_sv": 0.2755177538841963, + "grad_min_sv": 1.2216805945347575e-08, + "grad_condition": 43150197.26668272, + "lr": 0.000214643216157784, + "time_sec": 41.74007225036621 + }, + { + "epoch": 105, + "train_loss": 0.9041895580101014, + "train_acc": 0.73994, + "test_loss": 11.046577230834961, + "test_acc": 0.0157, + "lyapunov": 1.8013225211511792, + "grad_norm": 0.6905793170265356, + "grad_max_sv": 0.2767405278980732, + "grad_min_sv": 1.2463037859806319e-08, + "grad_condition": 167250138.59340933, + "lr": 0.00020610737385376332, + "time_sec": 41.76123571395874 + }, + { + "epoch": 106, + "train_loss": 0.9033575478363037, + "train_acc": 0.73812, + "test_loss": 10.144949078369141, + "test_acc": 0.0148, + "lyapunov": 1.7953374297417644, + "grad_norm": 0.6900561070003776, + "grad_max_sv": 0.2854902070015669, + "grad_min_sv": 1.2487106774983215e-08, + "grad_condition": 51823781.44791423, + "lr": 0.00019770044256881242, + "time_sec": 41.76529264450073 + }, + { + "epoch": 107, + "train_loss": 0.8958642411613464, + "train_acc": 0.74114, + "test_loss": 11.918342785644532, + "test_acc": 0.0136, + "lyapunov": 1.7949548279842757, + "grad_norm": 0.6886091368835883, + "grad_max_sv": 0.2801966678351164, + "grad_min_sv": 1.2309067401461426e-08, + "grad_condition": 58878874.82596229, + "lr": 0.0001894261098608447, + "time_sec": 41.74768304824829 + }, + { + "epoch": 108, + "train_loss": 0.8952222912597656, + "train_acc": 0.74206, + "test_loss": 11.956568659973145, + "test_acc": 0.0131, + "lyapunov": 1.7988319720148735, + "grad_norm": 0.6837928322416345, + "grad_max_sv": 0.2708371184766293, + "grad_min_sv": 1.2263186236621815e-08, + "grad_condition": 66622654.04143127, + "lr": 0.000181288005125655, + "time_sec": 41.74733638763428 + }, + { + "epoch": 109, + "train_loss": 0.8803009853363037, + "train_acc": 0.74562, + "test_loss": 11.972533184814454, + "test_acc": 0.0151, + "lyapunov": 1.7921729173196856, + "grad_norm": 0.6800898894517242, + "grad_max_sv": 0.2744845002889633, + "grad_min_sv": 1.2226625573097394e-08, + "grad_condition": 28672449.587015696, + "lr": 0.0001732896980049473, + "time_sec": 41.75131416320801 + }, + { + "epoch": 110, + "train_loss": 0.8758692720031739, + "train_acc": 0.7465, + "test_loss": 11.761042765808105, + "test_acc": 0.013, + "lyapunov": 1.7973133560336765, + "grad_norm": 0.67944647159599, + "grad_max_sv": 0.2868840988725424, + "grad_min_sv": 1.246009697572492e-08, + "grad_condition": 170689698.95698687, + "lr": 0.00016543469682057076, + "time_sec": 41.74984264373779 + }, + { + "epoch": 111, + "train_loss": 0.8721175754928588, + "train_acc": 0.7469, + "test_loss": 8.282232776641846, + "test_acc": 0.0169, + "lyapunov": 1.799062220336836, + "grad_norm": 0.6803209885009608, + "grad_max_sv": 0.27374382950365544, + "grad_min_sv": 1.2184770360745834e-08, + "grad_condition": 30675743.962345827, + "lr": 0.00015772644703565552, + "time_sec": 41.7647271156311 + }, + { + "epoch": 112, + "train_loss": 0.8774008236503601, + "train_acc": 0.74816, + "test_loss": 9.170746116638183, + "test_acc": 0.0159, + "lyapunov": 1.8109373235336654, + "grad_norm": 0.6789085557101802, + "grad_max_sv": 0.27259538881480694, + "grad_min_sv": 1.211782079124646e-08, + "grad_condition": 40567413.26570592, + "lr": 0.00015016832974331713, + "time_sec": 41.75637173652649 + }, + { + "epoch": 113, + "train_loss": 0.8622464385795593, + "train_acc": 0.75106, + "test_loss": 10.053751289367677, + "test_acc": 0.0135, + "lyapunov": 1.8100936168904804, + "grad_norm": 0.6756576122805169, + "grad_max_sv": 0.28052372448146345, + "grad_min_sv": 1.2317235831543066e-08, + "grad_condition": 178723228.29974583, + "lr": 0.00014276366018359834, + "time_sec": 41.75319814682007 + }, + { + "epoch": 114, + "train_loss": 0.8690180336761475, + "train_acc": 0.75008, + "test_loss": 10.932594900512695, + "test_acc": 0.0156, + "lyapunov": 1.816387369199787, + "grad_norm": 0.6798747706483691, + "grad_max_sv": 0.27895807549357415, + "grad_min_sv": 1.2279261825225152e-08, + "grad_condition": 153643053.21690834, + "lr": 0.00013551568628929425, + "time_sec": 41.75379729270935 + }, + { + "epoch": 115, + "train_loss": 0.851261803779602, + "train_acc": 0.7541, + "test_loss": 10.868778268432617, + "test_acc": 0.0125, + "lyapunov": 1.813281281524912, + "grad_norm": 0.6742910500951893, + "grad_max_sv": 0.28160076327621936, + "grad_min_sv": 1.2291463845348627e-08, + "grad_condition": 76180606.22388497, + "lr": 0.00012842758726130276, + "time_sec": 41.73297882080078 + }, + { + "epoch": 116, + "train_loss": 0.846489698047638, + "train_acc": 0.75568, + "test_loss": 11.865378411865235, + "test_acc": 0.0141, + "lyapunov": 1.8190875562560527, + "grad_norm": 0.6753732752106246, + "grad_max_sv": 0.2776739463210106, + "grad_min_sv": 1.2337394268875645e-08, + "grad_condition": 140857727.14932525, + "lr": 0.0001215024721741218, + "time_sec": 41.80654764175415 + }, + { + "epoch": 117, + "train_loss": 0.8436802185821534, + "train_acc": 0.75682, + "test_loss": 10.257345919799805, + "test_acc": 0.0155, + "lyapunov": 1.8196433694161418, + "grad_norm": 0.6721854001510172, + "grad_max_sv": 0.2764026470482349, + "grad_min_sv": 1.2219355385346965e-08, + "grad_condition": 215926006.70871487, + "lr": 0.00011474337861210538, + "time_sec": 41.738430976867676 + }, + { + "epoch": 118, + "train_loss": 0.8449852162742615, + "train_acc": 0.75552, + "test_loss": 11.355014642333984, + "test_acc": 0.016, + "lyapunov": 1.840445002326575, + "grad_norm": 0.6737424908515164, + "grad_max_sv": 0.2740096665918827, + "grad_min_sv": 1.2083014176364481e-08, + "grad_condition": 65280969.212004915, + "lr": 0.00010815327133708009, + "time_sec": 41.757728815078735 + }, + { + "epoch": 119, + "train_loss": 0.841961736907959, + "train_acc": 0.75586, + "test_loss": 12.117664599609375, + "test_acc": 0.0145, + "lyapunov": 1.8274321559140139, + "grad_norm": 0.6714829654797964, + "grad_max_sv": 0.2699023999273777, + "grad_min_sv": 1.214259521597279e-08, + "grad_condition": 2220969999.5357943, + "lr": 0.00010173504098790182, + "time_sec": 41.74168586730957 + }, + { + "epoch": 120, + "train_loss": 0.8366392538833618, + "train_acc": 0.75704, + "test_loss": 11.201690646362305, + "test_acc": 0.014, + "lyapunov": 1.8226751738497058, + "grad_norm": 0.6690428269683097, + "grad_max_sv": 0.27311445139348506, + "grad_min_sv": 1.2121295115113256e-08, + "grad_condition": 201741131.01603514, + "lr": 9.549150281252629e-05, + "time_sec": 41.743924617767334 + }, + { + "epoch": 121, + "train_loss": 0.8258431200599671, + "train_acc": 0.75994, + "test_loss": 9.8936986907959, + "test_acc": 0.015, + "lyapunov": 1.81260391025592, + "grad_norm": 0.6690897555850577, + "grad_max_sv": 0.2733077108860016, + "grad_min_sv": 1.1923934299662431e-08, + "grad_condition": 45131886.19417761, + "lr": 8.942539543314794e-05, + "time_sec": 41.83616232872009 + }, + { + "epoch": 122, + "train_loss": 0.811839645729065, + "train_acc": 0.76544, + "test_loss": 10.331547076416015, + "test_acc": 0.0156, + "lyapunov": 1.8212599763479989, + "grad_norm": 0.662394538196827, + "grad_max_sv": 0.27026438154280186, + "grad_min_sv": 1.2078635636125768e-08, + "grad_condition": 54626942.43840529, + "lr": 8.353937964495024e-05, + "time_sec": 41.743398666381836 + }, + { + "epoch": 123, + "train_loss": 0.8154555973815918, + "train_acc": 0.76266, + "test_loss": 11.79904609375, + "test_acc": 0.0139, + "lyapunov": 1.8156985279239353, + "grad_norm": 0.669178340006855, + "grad_max_sv": 0.2794945202767849, + "grad_min_sv": 1.224900298101017e-08, + "grad_condition": 85610889.23653656, + "lr": 7.783603724899243e-05, + "time_sec": 41.73685550689697 + }, + { + "epoch": 124, + "train_loss": 0.8137769646453857, + "train_acc": 0.76432, + "test_loss": 12.765393380737304, + "test_acc": 0.0137, + "lyapunov": 1.8307919691285819, + "grad_norm": 0.6694226801939039, + "grad_max_sv": 0.27201326824724675, + "grad_min_sv": 1.2039878503379564e-08, + "grad_condition": 121197109.98967907, + "lr": 7.231786991974666e-05, + "time_sec": 41.73531937599182 + }, + { + "epoch": 125, + "train_loss": 0.8133161567115784, + "train_acc": 0.76326, + "test_loss": 12.784655738830567, + "test_acc": 0.0122, + "lyapunov": 1.8295393410850973, + "grad_norm": 0.6670756701256625, + "grad_max_sv": 0.27261514514684676, + "grad_min_sv": 1.2221596965835898e-08, + "grad_condition": 356380023.5179373, + "lr": 6.698729810778072e-05, + "time_sec": 41.763604164123535 + }, + { + "epoch": 126, + "train_loss": 0.8129604421806336, + "train_acc": 0.7628, + "test_loss": 13.225958226013184, + "test_acc": 0.0126, + "lyapunov": 1.8302826732015975, + "grad_norm": 0.6704810236042233, + "grad_max_sv": 0.2748331677168608, + "grad_min_sv": 1.2072974203171382e-08, + "grad_condition": 99544381.5634778, + "lr": 6.184665997806817e-05, + "time_sec": 41.77600121498108 + }, + { + "epoch": 127, + "train_loss": 0.8070299044799805, + "train_acc": 0.76676, + "test_loss": 13.664459396362306, + "test_acc": 0.013, + "lyapunov": 1.8359026521672983, + "grad_norm": 0.66477658106401, + "grad_max_sv": 0.2687961976975203, + "grad_min_sv": 1.1891753388948434e-08, + "grad_condition": 37293209.03174486, + "lr": 5.6898210384392595e-05, + "time_sec": 41.80121970176697 + }, + { + "epoch": 128, + "train_loss": 0.8090053428268432, + "train_acc": 0.76872, + "test_loss": 11.426691012573242, + "test_acc": 0.0115, + "lyapunov": 1.8378520700937646, + "grad_norm": 0.6632031001917765, + "grad_max_sv": 0.27344250604510306, + "grad_min_sv": 1.2066639863694829e-08, + "grad_condition": 31243719.523715306, + "lr": 5.214411988029363e-05, + "time_sec": 41.82421827316284 + }, + { + "epoch": 129, + "train_loss": 0.8079227607917786, + "train_acc": 0.76624, + "test_loss": 12.028020672607422, + "test_acc": 0.012, + "lyapunov": 1.859219463584978, + "grad_norm": 0.6629646499999615, + "grad_max_sv": 0.27192687802016735, + "grad_min_sv": 1.2157243324886768e-08, + "grad_condition": 125856538.14945057, + "lr": 4.7586473766990294e-05, + "time_sec": 41.83568787574768 + }, + { + "epoch": 130, + "train_loss": 0.7962826109504699, + "train_acc": 0.7715, + "test_loss": 12.105734626770019, + "test_acc": 0.0127, + "lyapunov": 1.853679660945902, + "grad_norm": 0.6594694106467661, + "grad_max_sv": 0.270331434905529, + "grad_min_sv": 1.185781129120489e-08, + "grad_condition": 59035305.181543544, + "lr": 4.32272711786996e-05, + "time_sec": 41.799023389816284 + }, + { + "epoch": 131, + "train_loss": 0.797652147064209, + "train_acc": 0.76824, + "test_loss": 11.730470477294922, + "test_acc": 0.0123, + "lyapunov": 1.8584958918564154, + "grad_norm": 0.6609614524699726, + "grad_max_sv": 0.2734715912491083, + "grad_min_sv": 1.1940296155456276e-08, + "grad_condition": 342790586.28990173, + "lr": 3.906842420574966e-05, + "time_sec": 41.75147795677185 + }, + { + "epoch": 132, + "train_loss": 0.793139144744873, + "train_acc": 0.77118, + "test_loss": 12.504206140136718, + "test_acc": 0.0129, + "lyapunov": 1.8664770187319393, + "grad_norm": 0.6607237229942333, + "grad_max_sv": 0.27070250958204267, + "grad_min_sv": 1.1972255922060305e-08, + "grad_condition": 59875567.53617197, + "lr": 3.5111757055874305e-05, + "time_sec": 41.760621786117554 + }, + { + "epoch": 133, + "train_loss": 0.7921624578094483, + "train_acc": 0.7721, + "test_loss": 12.777486071777345, + "test_acc": 0.0129, + "lyapunov": 1.863871324702602, + "grad_norm": 0.6614213112629463, + "grad_max_sv": 0.27186350151896477, + "grad_min_sv": 1.1780043016051955e-08, + "grad_condition": 68024039.28497984, + "lr": 3.1359005254054254e-05, + "time_sec": 42.07219076156616 + }, + { + "epoch": 134, + "train_loss": 0.7904575923538208, + "train_acc": 0.7699, + "test_loss": 12.88651337890625, + "test_acc": 0.0124, + "lyapunov": 1.85313686385484, + "grad_norm": 0.6619654920557065, + "grad_max_sv": 0.2733634263277054, + "grad_min_sv": 1.1941254937641866e-08, + "grad_condition": 116413237.48952556, + "lr": 2.7811814881259484e-05, + "time_sec": 41.78620004653931 + }, + { + "epoch": 135, + "train_loss": 0.7903749565505982, + "train_acc": 0.77092, + "test_loss": 13.76830639038086, + "test_acc": 0.0127, + "lyapunov": 1.8625033743241255, + "grad_norm": 0.6643518372959286, + "grad_max_sv": 0.27610865905880927, + "grad_min_sv": 1.1953594105523769e-08, + "grad_condition": 200115348.94944423, + "lr": 2.4471741852423218e-05, + "time_sec": 41.75718355178833 + }, + { + "epoch": 136, + "train_loss": 0.7883218976974488, + "train_acc": 0.77036, + "test_loss": 14.292781658935548, + "test_acc": 0.0127, + "lyapunov": 1.8804230857688142, + "grad_norm": 0.6645180835916397, + "grad_max_sv": 0.28091635145246985, + "grad_min_sv": 1.2041051395891844e-08, + "grad_condition": 172293384.14691827, + "lr": 2.1340251233966362e-05, + "time_sec": 41.77325367927551 + }, + { + "epoch": 137, + "train_loss": 0.787513043346405, + "train_acc": 0.77156, + "test_loss": 13.120205474853515, + "test_acc": 0.0118, + "lyapunov": 1.869988610067636, + "grad_norm": 0.6641823083713531, + "grad_max_sv": 0.27806338407099246, + "grad_min_sv": 1.2203783432418457e-08, + "grad_condition": 53694537.43194572, + "lr": 1.8418716601170932e-05, + "time_sec": 41.80371809005737 + }, + { + "epoch": 138, + "train_loss": 0.7822375239944458, + "train_acc": 0.77296, + "test_loss": 13.03838903503418, + "test_acc": 0.0122, + "lyapunov": 1.8764891554327572, + "grad_norm": 0.6569959403511353, + "grad_max_sv": 0.2655744932591915, + "grad_min_sv": 1.172578472877911e-08, + "grad_condition": 139773556.3686706, + "lr": 1.570841943568445e-05, + "time_sec": 41.84284281730652 + }, + { + "epoch": 139, + "train_loss": 0.7805222978591919, + "train_acc": 0.77466, + "test_loss": 12.327950807189941, + "test_acc": 0.0122, + "lyapunov": 1.8656533261394257, + "grad_norm": 0.6561511087384002, + "grad_max_sv": 0.2643951024860144, + "grad_min_sv": 1.164244644025203e-08, + "grad_condition": 33491467.770252932, + "lr": 1.3210548563419845e-05, + "time_sec": 41.83727669715881 + }, + { + "epoch": 140, + "train_loss": 0.7855155965614319, + "train_acc": 0.77192, + "test_loss": 13.026101483154298, + "test_acc": 0.0126, + "lyapunov": 1.8730976965726185, + "grad_norm": 0.6599127456140818, + "grad_max_sv": 0.2667284071445465, + "grad_min_sv": 1.1937072974012308e-08, + "grad_condition": 236751331.72185326, + "lr": 1.0926199633097203e-05, + "time_sec": 41.76897358894348 + }, + { + "epoch": 141, + "train_loss": 0.7812909572029114, + "train_acc": 0.77392, + "test_loss": 12.945702696228027, + "test_acc": 0.0116, + "lyapunov": 1.8839974741801582, + "grad_norm": 0.6585613427884496, + "grad_max_sv": 0.26870384998619556, + "grad_min_sv": 1.1752219593666457e-08, + "grad_condition": 68954849.34252027, + "lr": 8.856374635655688e-06, + "time_sec": 41.76629018783569 + }, + { + "epoch": 142, + "train_loss": 0.7811300833511352, + "train_acc": 0.7739, + "test_loss": 13.049443170166015, + "test_acc": 0.0123, + "lyapunov": 1.8791520260179135, + "grad_norm": 0.6560522540980063, + "grad_max_sv": 0.25867762304842473, + "grad_min_sv": 1.1660508410921145e-08, + "grad_condition": 58969719.72517464, + "lr": 7.001981464747503e-06, + "time_sec": 41.766427993774414 + }, + { + "epoch": 143, + "train_loss": 0.7802343584060669, + "train_acc": 0.77298, + "test_loss": 12.733855395507813, + "test_acc": 0.0128, + "lyapunov": 1.8745125151046402, + "grad_norm": 0.6568021483225246, + "grad_max_sv": 0.27304218113422396, + "grad_min_sv": 1.212674725220575e-08, + "grad_condition": 31816972.621490758, + "lr": 5.3638335185058295e-06, + "time_sec": 41.75397801399231 + }, + { + "epoch": 144, + "train_loss": 0.7806536671066284, + "train_acc": 0.77476, + "test_loss": 13.288220135498047, + "test_acc": 0.0116, + "lyapunov": 1.8822029039378056, + "grad_norm": 0.65622548824943, + "grad_max_sv": 0.27500034049153327, + "grad_min_sv": 1.210616192917624e-08, + "grad_condition": 135771786.30715096, + "lr": 3.942649342761114e-06, + "time_sec": 41.74063587188721 + }, + { + "epoch": 145, + "train_loss": 0.7727476877212525, + "train_acc": 0.77868, + "test_loss": 12.771284809875489, + "test_acc": 0.0118, + "lyapunov": 1.8848708657657398, + "grad_norm": 0.6509704415359339, + "grad_max_sv": 0.2654924627393484, + "grad_min_sv": 1.1833753260290236e-08, + "grad_condition": 63253515.975026414, + "lr": 2.7390523158633524e-06, + "time_sec": 41.75493144989014 + }, + { + "epoch": 146, + "train_loss": 0.774920754032135, + "train_acc": 0.77602, + "test_loss": 11.973253411865235, + "test_acc": 0.0128, + "lyapunov": 1.8840531790652848, + "grad_norm": 0.6537579811178159, + "grad_max_sv": 0.2739882215857506, + "grad_min_sv": 1.1937398355053863e-08, + "grad_condition": 164042036.35238856, + "lr": 1.7535703752478133e-06, + "time_sec": 41.76850652694702 + }, + { + "epoch": 147, + "train_loss": 0.7788493019866943, + "train_acc": 0.77474, + "test_loss": 12.56836795654297, + "test_acc": 0.0124, + "lyapunov": 1.8825494142444543, + "grad_norm": 0.65539511893324, + "grad_max_sv": 0.2706771694123745, + "grad_min_sv": 1.1889833076428324e-08, + "grad_condition": 42159067.77639109, + "lr": 9.866357858642196e-07, + "time_sec": 41.75876569747925 + }, + { + "epoch": 148, + "train_loss": 0.7780991253089905, + "train_acc": 0.77514, + "test_loss": 12.590273434448243, + "test_acc": 0.0125, + "lyapunov": 1.8843056740968123, + "grad_norm": 0.6571517590026161, + "grad_max_sv": 0.26878498420119284, + "grad_min_sv": 1.1823980811120905e-08, + "grad_condition": 69796389.45896903, + "lr": 4.38584950570808e-07, + "time_sec": 41.74810481071472 + }, + { + "epoch": 149, + "train_loss": 0.7777692156028747, + "train_acc": 0.77424, + "test_loss": 12.223853874206544, + "test_acc": 0.0121, + "lyapunov": 1.878731128504819, + "grad_norm": 0.6563572217839131, + "grad_max_sv": 0.26671431958675385, + "grad_min_sv": 1.186011775317075e-08, + "grad_condition": 36317778.677340195, + "lr": 1.096582625772501e-07, + "time_sec": 41.766427755355835 + }, + { + "epoch": 150, + "train_loss": 0.7732272885131836, + "train_acc": 0.77688, + "test_loss": 12.616454701232911, + "test_acc": 0.0122, + "lyapunov": 1.882308801726612, + "grad_norm": 0.654964904243624, + "grad_max_sv": 0.2760881375521421, + "grad_min_sv": 1.1988547765628965e-08, + "grad_condition": 45586606.69974294, + "lr": 0.0, + "time_sec": 41.74888467788696 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 4.8868685441589355, + "train_acc": 0.0329, + "test_loss": 5.835955558013916, + "test_acc": 0.0101, + "lyapunov": 2.7220060624125058, + "grad_norm": 5.812156307696722, + "grad_max_sv": 4.963531744480133, + "grad_min_sv": 1.0063162076967558e-07, + "grad_condition": 60577381.86856198, + "lr": 0.0009998903417374227, + "time_sec": 86.98101139068604 + }, + { + "epoch": 2, + "train_loss": 4.648734102935791, + "train_acc": 0.03168, + "test_loss": 5.273272645568848, + "test_acc": 0.0116, + "lyapunov": 1.8829401371729038, + "grad_norm": 3.9271799359325903, + "grad_max_sv": 3.2593957483768463, + "grad_min_sv": 7.00168735169246e-08, + "grad_condition": 6704995243.344969, + "lr": 0.0009995614150494292, + "time_sec": 86.99141383171082 + }, + { + "epoch": 3, + "train_loss": 4.5401412484741215, + "train_acc": 0.03192, + "test_loss": 5.1823678855896, + "test_acc": 0.0116, + "lyapunov": 1.671741279189849, + "grad_norm": 2.7526576635134052, + "grad_max_sv": 2.068139410018921, + "grad_min_sv": 4.9782242339535546e-08, + "grad_condition": 46749620.52678162, + "lr": 0.0009990133642141358, + "time_sec": 86.94570183753967 + }, + { + "epoch": 4, + "train_loss": 4.482065806884766, + "train_acc": 0.03614, + "test_loss": 5.456839122009278, + "test_acc": 0.0125, + "lyapunov": 1.6732522673009302, + "grad_norm": 2.1601992771147493, + "grad_max_sv": 1.546970361471176, + "grad_min_sv": 3.8277159042365835e-08, + "grad_condition": 46214535.63818577, + "lr": 0.0009982464296247522, + "time_sec": 86.99357056617737 + }, + { + "epoch": 5, + "train_loss": 4.416459924468994, + "train_acc": 0.0383, + "test_loss": 5.042759115600586, + "test_acc": 0.01, + "lyapunov": 1.6130115248053276, + "grad_norm": 1.4004295206677062, + "grad_max_sv": 0.8645520135760307, + "grad_min_sv": 2.2672172026935722e-08, + "grad_condition": 175123112.60315904, + "lr": 0.0009972609476841367, + "time_sec": 86.97992181777954 + }, + { + "epoch": 6, + "train_loss": 4.395440086669922, + "train_acc": 0.0401, + "test_loss": 5.0634123313903805, + "test_acc": 0.0128, + "lyapunov": 1.5916716637818709, + "grad_norm": 1.1633805279920075, + "grad_max_sv": 0.6950831398367882, + "grad_min_sv": 1.925970937871613e-08, + "grad_condition": 59401457.74683033, + "lr": 0.000996057350657239, + "time_sec": 86.97495365142822 + }, + { + "epoch": 7, + "train_loss": 4.376599430084228, + "train_acc": 0.04286, + "test_loss": 4.836668630218506, + "test_acc": 0.01, + "lyapunov": 1.5702608802434428, + "grad_norm": 1.0593143318075517, + "grad_max_sv": 0.6230248108506202, + "grad_min_sv": 1.715214276026833e-08, + "grad_condition": 89004595.82522376, + "lr": 0.000994636166481494, + "time_sec": 86.94613075256348 + }, + { + "epoch": 8, + "train_loss": 4.394542444458008, + "train_acc": 0.04012, + "test_loss": 4.783828695678711, + "test_acc": 0.0105, + "lyapunov": 1.5788988356700029, + "grad_norm": 0.9409085278354143, + "grad_max_sv": 0.5376082636415959, + "grad_min_sv": 1.4977826281320494e-08, + "grad_condition": 70368024.66979258, + "lr": 0.0009929980185352525, + "time_sec": 86.9745545387268 + }, + { + "epoch": 9, + "train_loss": 4.343202932891845, + "train_acc": 0.0467, + "test_loss": 4.718369251251221, + "test_acc": 0.0143, + "lyapunov": 1.578838681930776, + "grad_norm": 0.9193794265725351, + "grad_max_sv": 0.49778390526771543, + "grad_min_sv": 1.4809389686787355e-08, + "grad_condition": 36731155.53646419, + "lr": 0.0009911436253643444, + "time_sec": 86.94329404830933 + }, + { + "epoch": 10, + "train_loss": 4.346738121795655, + "train_acc": 0.04588, + "test_loss": 4.747097400665283, + "test_acc": 0.01, + "lyapunov": 1.5699478393930304, + "grad_norm": 0.7826254315559922, + "grad_max_sv": 0.4086857602000237, + "grad_min_sv": 1.2250536137944911e-08, + "grad_condition": 104959057.67411065, + "lr": 0.0009890738003669028, + "time_sec": 87.01483154296875 + }, + { + "epoch": 11, + "train_loss": 4.332594217224121, + "train_acc": 0.04862, + "test_loss": 4.891320510864258, + "test_acc": 0.01, + "lyapunov": 1.5761606662779513, + "grad_norm": 0.7137998587271801, + "grad_max_sv": 0.3616088554263115, + "grad_min_sv": 1.1035750030474745e-08, + "grad_condition": 65298844.773746744, + "lr": 0.00098678945143658, + "time_sec": 86.96892666816711 + }, + { + "epoch": 12, + "train_loss": 4.311053582611084, + "train_acc": 0.05042, + "test_loss": 4.748805415344238, + "test_acc": 0.0136, + "lyapunov": 1.581223778102709, + "grad_norm": 0.6987786961969137, + "grad_max_sv": 0.32796674892306327, + "grad_min_sv": 1.0473264228094692e-08, + "grad_condition": 55614992.08410585, + "lr": 0.0009842915805643154, + "time_sec": 86.95039057731628 + }, + { + "epoch": 13, + "train_loss": 4.285387758483886, + "train_acc": 0.05488, + "test_loss": 4.929604747009277, + "test_acc": 0.0129, + "lyapunov": 1.5752461502314223, + "grad_norm": 0.6473775537281783, + "grad_max_sv": 0.30444829240441323, + "grad_min_sv": 1.025112739139189e-08, + "grad_condition": 33302823.81112442, + "lr": 0.000981581283398829, + "time_sec": 86.96810054779053 + }, + { + "epoch": 14, + "train_loss": 4.329002091674805, + "train_acc": 0.0484, + "test_loss": 4.722304975891113, + "test_acc": 0.0113, + "lyapunov": 1.5697952088187723, + "grad_norm": 0.6066149539852266, + "grad_max_sv": 0.29504155144095423, + "grad_min_sv": 9.069441869735683e-09, + "grad_condition": 44069945.81851731, + "lr": 0.0009786597487660333, + "time_sec": 86.94814324378967 + }, + { + "epoch": 15, + "train_loss": 4.284536777191162, + "train_acc": 0.05596, + "test_loss": 5.023597773742676, + "test_acc": 0.012, + "lyapunov": 1.5501765512749361, + "grad_norm": 0.5804776517038385, + "grad_max_sv": 0.26920728757977486, + "grad_min_sv": 9.031740475298755e-09, + "grad_condition": 89195226.73600614, + "lr": 0.0009755282581475766, + "time_sec": 86.97197031974792 + }, + { + "epoch": 16, + "train_loss": 4.265627270050049, + "train_acc": 0.05928, + "test_loss": 4.827692833709717, + "test_acc": 0.0125, + "lyapunov": 1.5593034690603271, + "grad_norm": 0.5649471876682739, + "grad_max_sv": 0.2615423481911421, + "grad_min_sv": 8.80059825986157e-09, + "grad_condition": 38662576.4691389, + "lr": 0.0009721881851187403, + "time_sec": 86.95526337623596 + }, + { + "epoch": 17, + "train_loss": 4.308344786529541, + "train_acc": 0.05356, + "test_loss": 4.86770267944336, + "test_acc": 0.0083, + "lyapunov": 1.5524270220485794, + "grad_norm": 0.5305977948653878, + "grad_max_sv": 0.25252549946308134, + "grad_min_sv": 7.983495846353162e-09, + "grad_condition": 49375193.531422, + "lr": 0.0009686409947459456, + "time_sec": 86.9186339378357 + }, + { + "epoch": 18, + "train_loss": 4.310789455413818, + "train_acc": 0.05254, + "test_loss": 4.673085025787353, + "test_acc": 0.01, + "lyapunov": 1.547373825326905, + "grad_norm": 0.505989408187644, + "grad_max_sv": 0.23108725845813752, + "grad_min_sv": 7.435956640711172e-09, + "grad_condition": 43123277.24920449, + "lr": 0.0009648882429441254, + "time_sec": 86.99692630767822 + }, + { + "epoch": 19, + "train_loss": 4.275941365509033, + "train_acc": 0.0554, + "test_loss": 5.401819254302978, + "test_acc": 0.0098, + "lyapunov": 1.575231916154437, + "grad_norm": 0.6989570502511167, + "grad_max_sv": 0.2374715338461101, + "grad_min_sv": 7.549137073746266e-09, + "grad_condition": 1516160705.4318807, + "lr": 0.00096093157579425, + "time_sec": 87.07763409614563 + }, + { + "epoch": 20, + "train_loss": 4.2160577346801755, + "train_acc": 0.06188, + "test_loss": 4.661321237182618, + "test_acc": 0.01, + "lyapunov": 1.5690500422206985, + "grad_norm": 0.5291072815364315, + "grad_max_sv": 0.24560309313237666, + "grad_min_sv": 7.844638819217916e-09, + "grad_condition": 347805291.98508245, + "lr": 0.0009567727288213001, + "time_sec": 87.01470422744751 + }, + { + "epoch": 21, + "train_loss": 4.214956321716309, + "train_acc": 0.06394, + "test_loss": 5.004168435668945, + "test_acc": 0.01, + "lyapunov": 1.55478805440771, + "grad_norm": 0.5022895827339361, + "grad_max_sv": 0.2279700841754675, + "grad_min_sv": 7.494698731069782e-09, + "grad_condition": 69056465.69243297, + "lr": 0.0009524135262330095, + "time_sec": 86.94965100288391 + }, + { + "epoch": 22, + "train_loss": 4.211716468200684, + "train_acc": 0.06272, + "test_loss": 4.793123007202149, + "test_acc": 0.01, + "lyapunov": 1.5555359359897312, + "grad_norm": 0.49162357885598756, + "grad_max_sv": 0.21602830216288565, + "grad_min_sv": 7.42661886293794e-09, + "grad_condition": 47899051.52190702, + "lr": 0.0009478558801197061, + "time_sec": 86.94232034683228 + }, + { + "epoch": 23, + "train_loss": 4.195988226165771, + "train_acc": 0.065, + "test_loss": 4.785066618347168, + "test_acc": 0.01, + "lyapunov": 1.5451125815091535, + "grad_norm": 0.48554482713506764, + "grad_max_sv": 0.20978505425155164, + "grad_min_sv": 7.308397834138169e-09, + "grad_condition": 57654580.035860874, + "lr": 0.000943101789615607, + "time_sec": 86.9649133682251 + }, + { + "epoch": 24, + "train_loss": 4.1939692004394535, + "train_acc": 0.06604, + "test_loss": 4.668301161193848, + "test_acc": 0.01, + "lyapunov": 1.5433694166905434, + "grad_norm": 0.4798986336483395, + "grad_max_sv": 0.21675167605280876, + "grad_min_sv": 7.174587644126485e-09, + "grad_condition": 50862502.06484151, + "lr": 0.0009381533400219313, + "time_sec": 86.94376063346863 + }, + { + "epoch": 25, + "train_loss": 4.19334780670166, + "train_acc": 0.06576, + "test_loss": 4.736515522766113, + "test_acc": 0.01, + "lyapunov": 1.5393451330302013, + "grad_norm": 0.4662802930400461, + "grad_max_sv": 0.20134809613227844, + "grad_min_sv": 7.031141516233852e-09, + "grad_condition": 33947861.7867923, + "lr": 0.0009330127018922189, + "time_sec": 86.96570682525635 + }, + { + "epoch": 26, + "train_loss": 4.180844131164551, + "train_acc": 0.06732, + "test_loss": 4.750217501831055, + "test_acc": 0.01, + "lyapunov": 1.5386863751789492, + "grad_norm": 0.4611088098769563, + "grad_max_sv": 0.19665082693099975, + "grad_min_sv": 6.920672646071324e-09, + "grad_condition": 36414119.70447004, + "lr": 0.000927682130080253, + "time_sec": 86.91903853416443 + }, + { + "epoch": 27, + "train_loss": 4.185037852935791, + "train_acc": 0.06616, + "test_loss": 4.6968753662109375, + "test_acc": 0.01, + "lyapunov": 1.537141337114222, + "grad_norm": 0.4445484510965817, + "grad_max_sv": 0.2015372473746538, + "grad_min_sv": 6.726753586094869e-09, + "grad_condition": 103270066.7857457, + "lr": 0.0009221639627510072, + "time_sec": 86.9379210472107 + }, + { + "epoch": 28, + "train_loss": 4.190574891281128, + "train_acc": 0.06716, + "test_loss": 4.920410514831543, + "test_acc": 0.01, + "lyapunov": 1.5525898277911994, + "grad_norm": 0.4566542078451628, + "grad_max_sv": 0.1792749162763357, + "grad_min_sv": 6.546373623045332e-09, + "grad_condition": 78356491.53621121, + "lr": 0.0009164606203550494, + "time_sec": 86.93841648101807 + }, + { + "epoch": 29, + "train_loss": 4.180019518737793, + "train_acc": 0.06908, + "test_loss": 4.91687992477417, + "test_acc": 0.01, + "lyapunov": 1.5407177566567345, + "grad_norm": 0.43344690178182577, + "grad_max_sv": 0.18290962614119052, + "grad_min_sv": 6.677244744970889e-09, + "grad_condition": 193011560.0763206, + "lr": 0.0009105746045668516, + "time_sec": 86.94041228294373 + }, + { + "epoch": 30, + "train_loss": 4.176376322937012, + "train_acc": 0.06936, + "test_loss": 4.777800242614746, + "test_acc": 0.01, + "lyapunov": 1.534477433280262, + "grad_norm": 0.42932203210281256, + "grad_max_sv": 0.18090479113161564, + "grad_min_sv": 6.6192410509789e-09, + "grad_condition": 229577220.8995716, + "lr": 0.0009045084971874733, + "time_sec": 86.93214845657349 + }, + { + "epoch": 31, + "train_loss": 4.1660814703369144, + "train_acc": 0.07102, + "test_loss": 5.056566352844238, + "test_acc": 0.01, + "lyapunov": 1.5318606555309442, + "grad_norm": 0.4239591600781453, + "grad_max_sv": 0.17118308506906033, + "grad_min_sv": 6.635534946508592e-09, + "grad_condition": 29815266.689775515, + "lr": 0.0008982649590120977, + "time_sec": 86.9801459312439 + }, + { + "epoch": 32, + "train_loss": 4.1669150354003905, + "train_acc": 0.07152, + "test_loss": 4.7432677307128905, + "test_acc": 0.01, + "lyapunov": 1.5303372562388935, + "grad_norm": 0.42192508499171244, + "grad_max_sv": 0.17523783259093761, + "grad_min_sv": 6.511007812765035e-09, + "grad_condition": 40414301.30092957, + "lr": 0.0008918467286629196, + "time_sec": 86.93055391311646 + }, + { + "epoch": 33, + "train_loss": 4.177858955383301, + "train_acc": 0.06938, + "test_loss": 4.758124336242676, + "test_acc": 0.01, + "lyapunov": 1.5353793033858394, + "grad_norm": 0.42820211396491675, + "grad_max_sv": 0.17152037434279918, + "grad_min_sv": 6.41136407800863e-09, + "grad_condition": 78795613.54081726, + "lr": 0.0008852566213878943, + "time_sec": 86.94400405883789 + }, + { + "epoch": 34, + "train_loss": 4.181727910308838, + "train_acc": 0.06804, + "test_loss": 4.683254829406739, + "test_acc": 0.01, + "lyapunov": 1.5587525105537356, + "grad_norm": 0.4154576543177753, + "grad_max_sv": 0.1630621150135994, + "grad_min_sv": 6.162790580632738e-09, + "grad_condition": 68340521.63126534, + "lr": 0.000878497527825878, + "time_sec": 86.93004965782166 + }, + { + "epoch": 35, + "train_loss": 4.208544900970459, + "train_acc": 0.06306, + "test_loss": 4.718585105895996, + "test_acc": 0.01, + "lyapunov": 1.5500410609233104, + "grad_norm": 0.3865003997673685, + "grad_max_sv": 0.15796905308961867, + "grad_min_sv": 5.649645064623176e-09, + "grad_condition": 63351773.654954754, + "lr": 0.000871572412738697, + "time_sec": 86.95951509475708 + }, + { + "epoch": 36, + "train_loss": 4.209841008148193, + "train_acc": 0.0624, + "test_loss": 4.799479325866699, + "test_acc": 0.01, + "lyapunov": 1.5291228870601605, + "grad_norm": 0.38680649491990404, + "grad_max_sv": 0.1646373827010393, + "grad_min_sv": 5.79466546829499e-09, + "grad_condition": 56823831.7925354, + "lr": 0.0008644843137107055, + "time_sec": 86.96009302139282 + }, + { + "epoch": 37, + "train_loss": 4.272466593933106, + "train_acc": 0.05266, + "test_loss": 4.855613878631591, + "test_acc": 0.01, + "lyapunov": 1.5562334264940618, + "grad_norm": 0.37061531171168033, + "grad_max_sv": 0.17256855219602585, + "grad_min_sv": 4.887432875490088e-09, + "grad_condition": 416940803.8173046, + "lr": 0.0008572363398164014, + "time_sec": 87.00441336631775 + }, + { + "epoch": 38, + "train_loss": 4.369705648193359, + "train_acc": 0.03928, + "test_loss": 4.9527251953125, + "test_acc": 0.0093, + "lyapunov": 1.6187922997242958, + "grad_norm": 0.33726725953664355, + "grad_max_sv": 0.16843934655189513, + "grad_min_sv": 2.4259941365468647e-09, + "grad_condition": 523051362.36644346, + "lr": 0.0008498316702566826, + "time_sec": 87.0337564945221 + }, + { + "epoch": 39, + "train_loss": 4.419442424468994, + "train_acc": 0.03648, + "test_loss": 4.654605149841308, + "test_acc": 0.01, + "lyapunov": 1.6483006477355957, + "grad_norm": 0.3745355743251292, + "grad_max_sv": 0.14972059521824121, + "grad_min_sv": 3.2977797229973015e-09, + "grad_condition": 225247622.29531756, + "lr": 0.0008422735529643442, + "time_sec": 87.03559732437134 + }, + { + "epoch": 40, + "train_loss": 4.342097230224609, + "train_acc": 0.04648, + "test_loss": 4.611628057861328, + "test_acc": 0.01, + "lyapunov": 1.5624720614279628, + "grad_norm": 0.340614014198837, + "grad_max_sv": 0.14854245409369468, + "grad_min_sv": 4.373499274887282e-09, + "grad_condition": 98828023.95197472, + "lr": 0.0008345653031794289, + "time_sec": 87.01033163070679 + }, + { + "epoch": 41, + "train_loss": 4.321761748199463, + "train_acc": 0.05098, + "test_loss": 4.634394804382325, + "test_acc": 0.01, + "lyapunov": 1.5627251454936268, + "grad_norm": 0.34424200245087344, + "grad_max_sv": 0.1472593817859888, + "grad_min_sv": 4.576645657589085e-09, + "grad_condition": 41582429.931975044, + "lr": 0.0008267103019950526, + "time_sec": 87.02087545394897 + }, + { + "epoch": 42, + "train_loss": 4.336793294677735, + "train_acc": 0.04814, + "test_loss": 4.750106883239746, + "test_acc": 0.01, + "lyapunov": 1.562337180842524, + "grad_norm": 0.3348951374350851, + "grad_max_sv": 0.14064551685005428, + "grad_min_sv": 4.340845933007917e-09, + "grad_condition": 200549627.53973636, + "lr": 0.0008187119948743447, + "time_sec": 87.0238869190216 + }, + { + "epoch": 43, + "train_loss": 4.405802797851562, + "train_acc": 0.03806, + "test_loss": 4.7633986679077145, + "test_acc": 0.01, + "lyapunov": 1.5599107458768293, + "grad_norm": 0.3360719439159513, + "grad_max_sv": 0.15633109211921692, + "grad_min_sv": 3.7276254510193455e-09, + "grad_condition": 70823369.716424, + "lr": 0.000810573890139155, + "time_sec": 87.02033281326294 + }, + { + "epoch": 44, + "train_loss": 4.3735290841674805, + "train_acc": 0.04124, + "test_loss": 4.801515933990479, + "test_acc": 0.01, + "lyapunov": 1.5446034419871961, + "grad_norm": 0.3233251791662432, + "grad_max_sv": 0.15177634693682193, + "grad_min_sv": 3.739056242705804e-09, + "grad_condition": 208295162.03785604, + "lr": 0.0008022995574311873, + "time_sec": 87.03142833709717 + }, + { + "epoch": 45, + "train_loss": 4.337905093994141, + "train_acc": 0.0471, + "test_loss": 4.926548869323731, + "test_acc": 0.01, + "lyapunov": 1.544969515422421, + "grad_norm": 0.33595101293068835, + "grad_max_sv": 0.1516191553324461, + "grad_min_sv": 3.987210877437475e-09, + "grad_condition": 164368190.47491115, + "lr": 0.0007938926261462363, + "time_sec": 86.99039697647095 + }, + { + "epoch": 46, + "train_loss": 4.346541597595214, + "train_acc": 0.04428, + "test_loss": 4.8608341247558595, + "test_acc": 0.01, + "lyapunov": 1.5419368658529218, + "grad_norm": 0.3159762444473148, + "grad_max_sv": 0.14429737031459808, + "grad_min_sv": 3.9462240453017395e-09, + "grad_condition": 538095319.5894905, + "lr": 0.0007853567838422158, + "time_sec": 87.01374340057373 + }, + { + "epoch": 47, + "train_loss": 4.339312688140869, + "train_acc": 0.04536, + "test_loss": 5.433785871124267, + "test_acc": 0.01, + "lyapunov": 1.5500127747845467, + "grad_norm": 0.34056795023315073, + "grad_max_sv": 0.15485984329134225, + "grad_min_sv": 3.9653568355974e-09, + "grad_condition": 112001560.11439368, + "lr": 0.0007766957746216719, + "time_sec": 87.01831102371216 + }, + { + "epoch": 48, + "train_loss": 4.32518587310791, + "train_acc": 0.046, + "test_loss": 5.1484094314575195, + "test_acc": 0.01, + "lyapunov": 1.560365958286978, + "grad_norm": 0.34490288181980205, + "grad_max_sv": 0.17489982210099697, + "grad_min_sv": 4.2351839486809425e-09, + "grad_condition": 61705070.509012245, + "lr": 0.0007679133974894982, + "time_sec": 87.04479813575745 + }, + { + "epoch": 49, + "train_loss": 4.267531641235352, + "train_acc": 0.05432, + "test_loss": 5.033274496459961, + "test_acc": 0.01, + "lyapunov": 1.5366158906151266, + "grad_norm": 0.3341919212572902, + "grad_max_sv": 0.15775893218815326, + "grad_min_sv": 4.352772933584326e-09, + "grad_condition": 91135353.40945777, + "lr": 0.000759013504686565, + "time_sec": 87.03758192062378 + }, + { + "epoch": 50, + "train_loss": 4.231792089385986, + "train_acc": 0.0574, + "test_loss": 5.012654959106445, + "test_acc": 0.01, + "lyapunov": 1.5314560354213276, + "grad_norm": 0.33835586225307046, + "grad_max_sv": 0.15273352302610874, + "grad_min_sv": 4.610002634145016e-09, + "grad_condition": 95621349.83087932, + "lr": 0.0007499999999999998, + "time_sec": 87.02117848396301 + }, + { + "epoch": 51, + "train_loss": 4.217709088897705, + "train_acc": 0.06214, + "test_loss": 4.961499259948731, + "test_acc": 0.01, + "lyapunov": 1.532185621273792, + "grad_norm": 0.3416812510567867, + "grad_max_sv": 0.14771231319755315, + "grad_min_sv": 4.692455504717863e-09, + "grad_condition": 38762044.12640218, + "lr": 0.0007408768370508575, + "time_sec": 86.99368810653687 + }, + { + "epoch": 52, + "train_loss": 4.251720480804443, + "train_acc": 0.0563, + "test_loss": 5.129425187683106, + "test_acc": 0.01, + "lyapunov": 1.5415819980909147, + "grad_norm": 0.37023392179214565, + "grad_max_sv": 0.14163506645709276, + "grad_min_sv": 4.612465075159999e-09, + "grad_condition": 38316259.45919823, + "lr": 0.0007316480175599307, + "time_sec": 87.01456809043884 + }, + { + "epoch": 53, + "train_loss": 4.253690295715332, + "train_acc": 0.0568, + "test_loss": 4.812875964355468, + "test_acc": 0.0132, + "lyapunov": 1.5413876192649003, + "grad_norm": 0.33782925041162415, + "grad_max_sv": 0.14739676434546709, + "grad_min_sv": 4.765125130590242e-09, + "grad_condition": 36325730.78579678, + "lr": 0.0007223175895924635, + "time_sec": 87.01148462295532 + }, + { + "epoch": 54, + "train_loss": 4.186111945190429, + "train_acc": 0.06596, + "test_loss": 4.7283723838806155, + "test_acc": 0.0105, + "lyapunov": 1.5397452423944498, + "grad_norm": 0.34901949980641434, + "grad_max_sv": 0.14486436657607554, + "grad_min_sv": 5.007936219880716e-09, + "grad_condition": 33957841.08981674, + "lr": 0.0007128896457825361, + "time_sec": 87.01034283638 + }, + { + "epoch": 55, + "train_loss": 4.226965001220703, + "train_acc": 0.05946, + "test_loss": 5.0994131385803225, + "test_acc": 0.01, + "lyapunov": 1.5427140854203794, + "grad_norm": 0.33574518731923997, + "grad_max_sv": 0.1379337849095464, + "grad_min_sv": 4.6546377016620785e-09, + "grad_condition": 35033403.794181205, + "lr": 0.0007033683215378998, + "time_sec": 87.02716326713562 + }, + { + "epoch": 56, + "train_loss": 4.275228694610596, + "train_acc": 0.05126, + "test_loss": 5.6790080192565915, + "test_acc": 0.0106, + "lyapunov": 1.5486624853690263, + "grad_norm": 0.32521941624733625, + "grad_max_sv": 0.1381490297615528, + "grad_min_sv": 4.0974726380101075e-09, + "grad_condition": 227289112.92801088, + "lr": 0.0006937577932260512, + "time_sec": 87.03791618347168 + }, + { + "epoch": 57, + "train_loss": 4.291394806976318, + "train_acc": 0.05138, + "test_loss": 5.555759259033203, + "test_acc": 0.01, + "lyapunov": 1.5378701308804095, + "grad_norm": 0.3069586773109854, + "grad_max_sv": 0.1346513893455267, + "grad_min_sv": 4.065951690612746e-09, + "grad_condition": 46617844.42276532, + "lr": 0.0006840622763423388, + "time_sec": 87.04759955406189 + }, + { + "epoch": 58, + "train_loss": 4.249909885101318, + "train_acc": 0.057, + "test_loss": 4.992578089141846, + "test_acc": 0.01, + "lyapunov": 1.536266983012714, + "grad_norm": 0.34838996163523644, + "grad_max_sv": 0.1345098938792944, + "grad_min_sv": 4.396801889586244e-09, + "grad_condition": 64136263.36505444, + "lr": 0.0006742860236609073, + "time_sec": 86.98516917228699 + }, + { + "epoch": 59, + "train_loss": 4.242862917938233, + "train_acc": 0.057, + "test_loss": 5.1998653221130375, + "test_acc": 0.0109, + "lyapunov": 1.5351955945534475, + "grad_norm": 0.3173941682006927, + "grad_max_sv": 0.13275786247104407, + "grad_min_sv": 4.269058501583239e-09, + "grad_condition": 108827031.14571735, + "lr": 0.0006644333233692913, + "time_sec": 86.99496340751648 + }, + { + "epoch": 60, + "train_loss": 4.358045599975586, + "train_acc": 0.04008, + "test_loss": 5.66520142211914, + "test_acc": 0.01, + "lyapunov": 1.538059144983511, + "grad_norm": 0.32769294068142363, + "grad_max_sv": 0.15341913774609567, + "grad_min_sv": 3.3530493617761613e-09, + "grad_condition": 141563570.6767326, + "lr": 0.0006545084971874734, + "time_sec": 86.98709297180176 + }, + { + "epoch": 61, + "train_loss": 4.379126887512207, + "train_acc": 0.03892, + "test_loss": 5.79373645401001, + "test_acc": 0.01, + "lyapunov": 1.5358953323510602, + "grad_norm": 0.29167390917673963, + "grad_max_sv": 0.15212837420403957, + "grad_min_sv": 3.1512680335413907e-09, + "grad_condition": 423820959.74051917, + "lr": 0.0006445158984722354, + "time_sec": 87.08233451843262 + }, + { + "epoch": 62, + "train_loss": 4.3699617782592775, + "train_acc": 0.0387, + "test_loss": 5.100420123291015, + "test_acc": 0.01, + "lyapunov": 1.5384678313189455, + "grad_norm": 0.31748131308229766, + "grad_max_sv": 0.1489308735355735, + "grad_min_sv": 2.9947165469668134e-09, + "grad_condition": 71467944.71145716, + "lr": 0.0006344599103076324, + "time_sec": 87.08040046691895 + }, + { + "epoch": 63, + "train_loss": 4.35802111907959, + "train_acc": 0.0405, + "test_loss": 5.097725323486328, + "test_acc": 0.01, + "lyapunov": 1.529050966967707, + "grad_norm": 0.29323437120463275, + "grad_max_sv": 0.1526517506688833, + "grad_min_sv": 3.053018635124083e-09, + "grad_condition": 75636072.16702321, + "lr": 0.0006243449435824269, + "time_sec": 87.12332153320312 + }, + { + "epoch": 64, + "train_loss": 4.344970562896728, + "train_acc": 0.0425, + "test_loss": 5.351859429168702, + "test_acc": 0.01, + "lyapunov": 1.5276264845562713, + "grad_norm": 0.28862904034232667, + "grad_max_sv": 0.14074937291443348, + "grad_min_sv": 3.229418670674944e-09, + "grad_condition": 58372064.62046027, + "lr": 0.0006141754350553275, + "time_sec": 87.1001365184784 + }, + { + "epoch": 65, + "train_loss": 4.348922080230713, + "train_acc": 0.04292, + "test_loss": 5.492067797851562, + "test_acc": 0.01, + "lyapunov": 1.5324354037604369, + "grad_norm": 0.2803352109178489, + "grad_max_sv": 0.13472131155431272, + "grad_min_sv": 2.467204887287612e-09, + "grad_condition": 665825207.1158358, + "lr": 0.0006039558454088793, + "time_sec": 87.11217975616455 + }, + { + "epoch": 66, + "train_loss": 4.333704286193847, + "train_acc": 0.04354, + "test_loss": 4.877685953521729, + "test_acc": 0.01, + "lyapunov": 1.534651099873321, + "grad_norm": 0.27635791494927536, + "grad_max_sv": 0.11872162725776433, + "grad_min_sv": 5.001605770283031e-10, + "grad_condition": 2355784759.8605924, + "lr": 0.000593690657292862, + "time_sec": 87.14824295043945 + }, + { + "epoch": 67, + "train_loss": 4.322627476806641, + "train_acc": 0.04472, + "test_loss": 4.8601047325134275, + "test_acc": 0.01, + "lyapunov": 1.5370692722022992, + "grad_norm": 0.2704991527712366, + "grad_max_sv": 0.12121895346790552, + "grad_min_sv": 3.3772064152387887e-10, + "grad_condition": 1436858758.7497945, + "lr": 0.0005833843733580507, + "time_sec": 87.15028619766235 + }, + { + "epoch": 68, + "train_loss": 4.326148190155029, + "train_acc": 0.04494, + "test_loss": 4.793710678100586, + "test_acc": 0.01, + "lyapunov": 1.5317091633901572, + "grad_norm": 0.2672898730595414, + "grad_max_sv": 0.11485066972672939, + "grad_min_sv": 1.6583841985768597e-10, + "grad_condition": 5336395004.707764, + "lr": 0.0005730415142812054, + "time_sec": 87.02114963531494 + }, + { + "epoch": 69, + "train_loss": 4.329122970428466, + "train_acc": 0.04536, + "test_loss": 4.8099893341064455, + "test_acc": 0.01, + "lyapunov": 1.5467721056145476, + "grad_norm": 0.32172718514384613, + "grad_max_sv": 0.11834470257163048, + "grad_min_sv": 1.1168446594628234e-09, + "grad_condition": 745395849.9775846, + "lr": 0.0005626666167821517, + "time_sec": 87.02938222885132 + }, + { + "epoch": 70, + "train_loss": 4.31241029083252, + "train_acc": 0.0463, + "test_loss": 4.952929071044922, + "test_acc": 0.01, + "lyapunov": 1.5362041597171208, + "grad_norm": 0.2753431538427545, + "grad_max_sv": 0.11906800698488951, + "grad_min_sv": 1.7476929946433003e-09, + "grad_condition": 756434714.2533172, + "lr": 0.0005522642316338265, + "time_sec": 87.02464318275452 + }, + { + "epoch": 71, + "train_loss": 4.31154488571167, + "train_acc": 0.04686, + "test_loss": 5.023902383422851, + "test_acc": 0.01, + "lyapunov": 1.5466017796255438, + "grad_norm": 0.2753267526599803, + "grad_max_sv": 0.11738765817135573, + "grad_min_sv": 2.3081605008377915e-09, + "grad_condition": 242689040.53309226, + "lr": 0.0005418389216661573, + "time_sec": 87.03318190574646 + }, + { + "epoch": 72, + "train_loss": 4.306096405944825, + "train_acc": 0.04658, + "test_loss": 5.104643942260743, + "test_acc": 0.01, + "lyapunov": 1.5303368059265645, + "grad_norm": 0.27899194256031273, + "grad_max_sv": 0.12330806013196707, + "grad_min_sv": 2.439638441677043e-09, + "grad_condition": 1381046238.5040848, + "lr": 0.0005313952597646563, + "time_sec": 87.03077554702759 + }, + { + "epoch": 73, + "train_loss": 4.311607224578857, + "train_acc": 0.04646, + "test_loss": 5.009871780395508, + "test_acc": 0.01, + "lyapunov": 1.5270253767442825, + "grad_norm": 0.27694139094749887, + "grad_max_sv": 0.11829848829656839, + "grad_min_sv": 1.4740073658175978e-09, + "grad_condition": 660054658.4010975, + "lr": 0.0005209378268645994, + "time_sec": 87.02628016471863 + }, + { + "epoch": 74, + "train_loss": 4.313855213012696, + "train_acc": 0.04592, + "test_loss": 5.476243537902832, + "test_acc": 0.01, + "lyapunov": 1.5314418053078225, + "grad_norm": 0.2784448703758454, + "grad_max_sv": 0.11976860761642456, + "grad_min_sv": 1.4007036064009327e-09, + "grad_condition": 315405562.3793217, + "lr": 0.0005104712099416781, + "time_sec": 87.02340960502625 + }, + { + "epoch": 75, + "train_loss": 4.311369212493896, + "train_acc": 0.0472, + "test_loss": 5.133029379272461, + "test_acc": 0.01, + "lyapunov": 1.5308379309866436, + "grad_norm": 0.3021498176054871, + "grad_max_sv": 0.11717559359967708, + "grad_min_sv": 1.0902342301513657e-09, + "grad_condition": 694118705.4805201, + "lr": 0.0004999999999999996, + "time_sec": 87.05124974250793 + }, + { + "epoch": 76, + "train_loss": 4.29647945022583, + "train_acc": 0.04768, + "test_loss": 4.956787372589111, + "test_acc": 0.01, + "lyapunov": 1.5325303791124192, + "grad_norm": 0.28226470528961883, + "grad_max_sv": 0.11491116061806679, + "grad_min_sv": 2.1826049294727118e-09, + "grad_condition": 851502522.821348, + "lr": 0.0004895287900583212, + "time_sec": 87.05739998817444 + }, + { + "epoch": 77, + "train_loss": 4.2993905654907225, + "train_acc": 0.04726, + "test_loss": 4.818333094787597, + "test_acc": 0.01, + "lyapunov": 1.5346041228765113, + "grad_norm": 0.27638064483217156, + "grad_max_sv": 0.11815577689558268, + "grad_min_sv": 2.18521279816801e-09, + "grad_condition": 346879910.4433508, + "lr": 0.0004790621731353997, + "time_sec": 87.03282046318054 + }, + { + "epoch": 78, + "train_loss": 4.300057550354004, + "train_acc": 0.04764, + "test_loss": 5.216551345825195, + "test_acc": 0.01, + "lyapunov": 1.5297756530439761, + "grad_norm": 0.2795747956169958, + "grad_max_sv": 0.11852586027234793, + "grad_min_sv": 1.5182026258343459e-09, + "grad_condition": 490972915.745468, + "lr": 0.000468604740235343, + "time_sec": 87.03314900398254 + }, + { + "epoch": 79, + "train_loss": 4.296518913421631, + "train_acc": 0.04822, + "test_loss": 4.796546273803711, + "test_acc": 0.01, + "lyapunov": 1.5296590721515744, + "grad_norm": 0.2795255751493857, + "grad_max_sv": 0.11349777709692717, + "grad_min_sv": 2.4189355944384187e-09, + "grad_condition": 3528233391.319597, + "lr": 0.00045816107833384175, + "time_sec": 87.05465078353882 + }, + { + "epoch": 80, + "train_loss": 4.293817173614502, + "train_acc": 0.04988, + "test_loss": 5.390813935852051, + "test_acc": 0.01, + "lyapunov": 1.5339140129821074, + "grad_norm": 0.28116623382258155, + "grad_max_sv": 0.11869933754205704, + "grad_min_sv": 2.218430284525036e-09, + "grad_condition": 239750601.46903428, + "lr": 0.0004477357683661729, + "time_sec": 87.02411317825317 + }, + { + "epoch": 81, + "train_loss": 4.308743771514893, + "train_acc": 0.04688, + "test_loss": 4.9387015426635745, + "test_acc": 0.01, + "lyapunov": 1.5359756373383504, + "grad_norm": 0.27564769795473687, + "grad_max_sv": 0.11904207207262515, + "grad_min_sv": 1.3827144019226776e-09, + "grad_condition": 1250382457.5368142, + "lr": 0.00043733338321784746, + "time_sec": 87.06971073150635 + }, + { + "epoch": 82, + "train_loss": 4.316180011596679, + "train_acc": 0.04802, + "test_loss": 4.819311853027344, + "test_acc": 0.01, + "lyapunov": 1.5405200875323752, + "grad_norm": 0.2695310056002572, + "grad_max_sv": 0.11497616600245238, + "grad_min_sv": 5.07012224977392e-10, + "grad_condition": 1003922073.3294013, + "lr": 0.0004269584857187939, + "time_sec": 87.01381373405457 + }, + { + "epoch": 83, + "train_loss": 4.3241317964172366, + "train_acc": 0.04642, + "test_loss": 5.559939542388916, + "test_acc": 0.01, + "lyapunov": 1.5336117997498768, + "grad_norm": 0.30799403664519254, + "grad_max_sv": 0.11631885562092066, + "grad_min_sv": 1.0995131752529269e-09, + "grad_condition": 2912542691.0373497, + "lr": 0.0004166156266419484, + "time_sec": 87.01211094856262 + }, + { + "epoch": 84, + "train_loss": 4.304221888427734, + "train_acc": 0.04712, + "test_loss": 5.7824999008178715, + "test_acc": 0.01, + "lyapunov": 1.5356234031565048, + "grad_norm": 0.27623908579456924, + "grad_max_sv": 0.11505712084472179, + "grad_min_sv": 1.2430747893055552e-09, + "grad_condition": 739728712.8387728, + "lr": 0.0004063093427071373, + "time_sec": 87.03186845779419 + }, + { + "epoch": 85, + "train_loss": 4.304068413696289, + "train_acc": 0.0475, + "test_loss": 5.2205657958984375, + "test_acc": 0.01, + "lyapunov": 1.548282836709181, + "grad_norm": 0.2741067528493452, + "grad_max_sv": 0.11491415649652481, + "grad_min_sv": 1.3353951820206655e-09, + "grad_condition": 457161263.0151564, + "lr": 0.0003960441545911199, + "time_sec": 87.02751231193542 + }, + { + "epoch": 86, + "train_loss": 4.307723725280762, + "train_acc": 0.04744, + "test_loss": 5.089657419586182, + "test_acc": 0.01, + "lyapunov": 1.5371347848716599, + "grad_norm": 0.2703438463012035, + "grad_max_sv": 0.11324898395687341, + "grad_min_sv": 8.378487995790769e-10, + "grad_condition": 3522705690.75045, + "lr": 0.0003858245649446718, + "time_sec": 87.02715706825256 + }, + { + "epoch": 87, + "train_loss": 4.309327346801758, + "train_acc": 0.04712, + "test_loss": 5.066932530212402, + "test_acc": 0.01, + "lyapunov": 1.535299950243567, + "grad_norm": 0.26305910205092736, + "grad_max_sv": 0.11055518221110106, + "grad_min_sv": 4.3744003958521707e-10, + "grad_condition": 3926209090.1259904, + "lr": 0.00037565505641757235, + "time_sec": 87.00939083099365 + }, + { + "epoch": 88, + "train_loss": 4.302119546661377, + "train_acc": 0.04826, + "test_loss": 4.713959245300293, + "test_acc": 0.01, + "lyapunov": 1.5447248967407305, + "grad_norm": 0.2948650300762129, + "grad_max_sv": 0.10960109252482653, + "grad_min_sv": 1.299059114424038e-09, + "grad_condition": 1649862428.0795467, + "lr": 0.00036554008969236695, + "time_sec": 86.99231100082397 + }, + { + "epoch": 89, + "train_loss": 4.222235094909668, + "train_acc": 0.05936, + "test_loss": 4.947286629486084, + "test_acc": 0.01, + "lyapunov": 1.5406827024181786, + "grad_norm": 0.29801127659352034, + "grad_max_sv": 0.11815546471625567, + "grad_min_sv": 3.884505487303062e-09, + "grad_condition": 332638345.8989955, + "lr": 0.0003554841015277638, + "time_sec": 86.96290874481201 + }, + { + "epoch": 90, + "train_loss": 4.206269663238525, + "train_acc": 0.06196, + "test_loss": 5.070217854309082, + "test_acc": 0.01, + "lyapunov": 1.5563946108683906, + "grad_norm": 0.2994269982908668, + "grad_max_sv": 0.11779715698212385, + "grad_min_sv": 3.982388553994132e-09, + "grad_condition": 53109317.27534769, + "lr": 0.000345491502812526, + "time_sec": 86.96194267272949 + }, + { + "epoch": 91, + "train_loss": 4.184974651947021, + "train_acc": 0.06586, + "test_loss": 4.788212018585205, + "test_acc": 0.01, + "lyapunov": 1.5359351665467558, + "grad_norm": 0.3140436055876291, + "grad_max_sv": 0.1192835196852684, + "grad_min_sv": 4.091862369597077e-09, + "grad_condition": 88707538.2703129, + "lr": 0.0003355666766307081, + "time_sec": 86.94303727149963 + }, + { + "epoch": 92, + "train_loss": 4.17854603012085, + "train_acc": 0.06482, + "test_loss": 4.927370552062988, + "test_acc": 0.01, + "lyapunov": 1.5374575045407581, + "grad_norm": 0.30674131521323145, + "grad_max_sv": 0.11535172853618861, + "grad_min_sv": 4.237652858393032e-09, + "grad_condition": 83659913.65034825, + "lr": 0.00032571397633909225, + "time_sec": 86.9555778503418 + }, + { + "epoch": 93, + "train_loss": 4.175330209197998, + "train_acc": 0.06626, + "test_loss": 4.7136772384643555, + "test_acc": 0.01, + "lyapunov": 1.5313739505265376, + "grad_norm": 0.3092012525879534, + "grad_max_sv": 0.11529328189790249, + "grad_min_sv": 4.273903241730492e-09, + "grad_condition": 83324467.585004, + "lr": 0.00031593772365766094, + "time_sec": 86.95363783836365 + }, + { + "epoch": 94, + "train_loss": 4.254087154998779, + "train_acc": 0.0545, + "test_loss": 6.608264208984375, + "test_acc": 0.01, + "lyapunov": 1.5392028648225242, + "grad_norm": 0.3313811080123765, + "grad_max_sv": 0.11369877494871616, + "grad_min_sv": 3.168524045134985e-09, + "grad_condition": 239544812.6275599, + "lr": 0.0003062422067739483, + "time_sec": 86.96967077255249 + }, + { + "epoch": 95, + "train_loss": 4.203709516601562, + "train_acc": 0.06272, + "test_loss": 5.2335342506408695, + "test_acc": 0.01, + "lyapunov": 1.5491435664998905, + "grad_norm": 0.2982597621611383, + "grad_max_sv": 0.11460016090422868, + "grad_min_sv": 4.0606391769892894e-09, + "grad_condition": 47941630.25136345, + "lr": 0.00029663167846209965, + "time_sec": 86.9920425415039 + }, + { + "epoch": 96, + "train_loss": 4.204792425079345, + "train_acc": 0.06306, + "test_loss": 7.403053276062011, + "test_acc": 0.01, + "lyapunov": 1.5504713561528785, + "grad_norm": 0.2973250691024306, + "grad_max_sv": 0.11604133322834968, + "grad_min_sv": 3.7637052361207474e-09, + "grad_condition": 491496513.2031948, + "lr": 0.00028711035421746345, + "time_sec": 87.00048351287842 + }, + { + "epoch": 97, + "train_loss": 4.31849955368042, + "train_acc": 0.04568, + "test_loss": 7.006944195556641, + "test_acc": 0.01, + "lyapunov": 1.5414063906120827, + "grad_norm": 0.27034960524342166, + "grad_max_sv": 0.11470378432422876, + "grad_min_sv": 1.2109832417221688e-09, + "grad_condition": 1416729003.9783182, + "lr": 0.00027768241040753615, + "time_sec": 86.98381400108337 + }, + { + "epoch": 98, + "train_loss": 4.3125907057189945, + "train_acc": 0.04504, + "test_loss": 6.8418953994750975, + "test_acc": 0.01, + "lyapunov": 1.5312741872904552, + "grad_norm": 0.2652378251823005, + "grad_max_sv": 0.11196322869509459, + "grad_min_sv": 8.317735150165442e-10, + "grad_condition": 2407386273.9108796, + "lr": 0.00026835198244006903, + "time_sec": 86.99899005889893 + }, + { + "epoch": 99, + "train_loss": 4.301244279174805, + "train_acc": 0.0473, + "test_loss": 7.093164874267578, + "test_acc": 0.01, + "lyapunov": 1.5387949861224046, + "grad_norm": 0.27009267897863193, + "grad_max_sv": 0.11189446654170751, + "grad_min_sv": 1.2108846141924145e-09, + "grad_condition": 438371071.4957386, + "lr": 0.0002591231629491421, + "time_sec": 86.9708981513977 + }, + { + "epoch": 100, + "train_loss": 4.292957291259766, + "train_acc": 0.0483, + "test_loss": 7.921586865234375, + "test_acc": 0.01, + "lyapunov": 1.5301602883716983, + "grad_norm": 0.269957629463293, + "grad_max_sv": 0.11394803524017334, + "grad_min_sv": 1.4573458890511891e-09, + "grad_condition": 922753679.5571249, + "lr": 0.0002499999999999997, + "time_sec": 86.97738790512085 + }, + { + "epoch": 101, + "train_loss": 4.287421778564453, + "train_acc": 0.0513, + "test_loss": 7.7924660919189455, + "test_acc": 0.01, + "lyapunov": 1.5450496938832277, + "grad_norm": 0.28642776215503646, + "grad_max_sv": 0.11340956594794989, + "grad_min_sv": 2.0538556702587306e-09, + "grad_condition": 238759080.3242866, + "lr": 0.00024098649531343477, + "time_sec": 86.98059034347534 + }, + { + "epoch": 102, + "train_loss": 4.232091545562744, + "train_acc": 0.05674, + "test_loss": 7.502766206359864, + "test_acc": 0.01, + "lyapunov": 1.5351537307509986, + "grad_norm": 0.2822002764723934, + "grad_max_sv": 0.11223722565919161, + "grad_min_sv": 3.631413643401249e-09, + "grad_condition": 44883366.00420923, + "lr": 0.0002320866025105016, + "time_sec": 86.98991203308105 + }, + { + "epoch": 103, + "train_loss": 4.225371129455566, + "train_acc": 0.05656, + "test_loss": 7.15355862121582, + "test_acc": 0.01, + "lyapunov": 1.5374192603103949, + "grad_norm": 0.28534078791067063, + "grad_max_sv": 0.10910792909562587, + "grad_min_sv": 3.6997169017847013e-09, + "grad_condition": 432680082.27477896, + "lr": 0.0002233042253783278, + "time_sec": 87.02942061424255 + }, + { + "epoch": 104, + "train_loss": 4.259049204101562, + "train_acc": 0.05352, + "test_loss": 5.869139344787597, + "test_acc": 0.01, + "lyapunov": 1.5383392858993061, + "grad_norm": 0.27867691558389857, + "grad_max_sv": 0.11480593234300614, + "grad_min_sv": 3.5299762349283448e-09, + "grad_condition": 70171572.71195477, + "lr": 0.000214643216157784, + "time_sec": 86.95629143714905 + }, + { + "epoch": 105, + "train_loss": 4.272113574829102, + "train_acc": 0.05168, + "test_loss": 5.520168752288819, + "test_acc": 0.01, + "lyapunov": 1.533821760541033, + "grad_norm": 0.27161597798881265, + "grad_max_sv": 0.10913974400609731, + "grad_min_sv": 3.2786617867484533e-09, + "grad_condition": 381829356.4775018, + "lr": 0.00020610737385376332, + "time_sec": 86.99734330177307 + }, + { + "epoch": 106, + "train_loss": 4.2996347805786135, + "train_acc": 0.04852, + "test_loss": 6.207507315063476, + "test_acc": 0.01, + "lyapunov": 1.542306883560727, + "grad_norm": 0.33667604894049824, + "grad_max_sv": 0.10918771754950285, + "grad_min_sv": 1.8414377505465707e-09, + "grad_condition": 388356450.963876, + "lr": 0.00019770044256881242, + "time_sec": 86.98377108573914 + }, + { + "epoch": 107, + "train_loss": 4.277384571228027, + "train_acc": 0.05192, + "test_loss": 5.813813595581054, + "test_acc": 0.01, + "lyapunov": 1.5573498227102371, + "grad_norm": 0.27065029192632944, + "grad_max_sv": 0.10987954996526242, + "grad_min_sv": 2.4647747798485496e-09, + "grad_condition": 186312821.68751103, + "lr": 0.0001894261098608447, + "time_sec": 86.97658634185791 + }, + { + "epoch": 108, + "train_loss": 4.248811683502197, + "train_acc": 0.05564, + "test_loss": 5.372588280487061, + "test_acc": 0.01, + "lyapunov": 1.5323523389713845, + "grad_norm": 0.28972275102919554, + "grad_max_sv": 0.11195205356925726, + "grad_min_sv": 3.6018193581973877e-09, + "grad_condition": 258686872.45386976, + "lr": 0.000181288005125655, + "time_sec": 86.98323941230774 + }, + { + "epoch": 109, + "train_loss": 4.248928556365967, + "train_acc": 0.05606, + "test_loss": 5.640845692443848, + "test_acc": 0.01, + "lyapunov": 1.536016465757814, + "grad_norm": 0.2788537343039685, + "grad_max_sv": 0.10843300186097622, + "grad_min_sv": 3.2726568575773553e-09, + "grad_condition": 109384835.96161847, + "lr": 0.0001732896980049473, + "time_sec": 86.99290323257446 + }, + { + "epoch": 110, + "train_loss": 4.258184987182617, + "train_acc": 0.05546, + "test_loss": 5.317471363830567, + "test_acc": 0.01, + "lyapunov": 1.5343971404882952, + "grad_norm": 0.27431191784323045, + "grad_max_sv": 0.11074544731527566, + "grad_min_sv": 3.0305070231051447e-09, + "grad_condition": 86266318.35712561, + "lr": 0.00016543469682057076, + "time_sec": 87.00314545631409 + }, + { + "epoch": 111, + "train_loss": 4.2609542189025875, + "train_acc": 0.05316, + "test_loss": 5.29417073059082, + "test_acc": 0.01, + "lyapunov": 1.5503652745195666, + "grad_norm": 0.3039662695641993, + "grad_max_sv": 0.1153217950835824, + "grad_min_sv": 3.1399053107561413e-09, + "grad_condition": 155517989.20554435, + "lr": 0.00015772644703565552, + "time_sec": 86.98289012908936 + }, + { + "epoch": 112, + "train_loss": 4.161646675872802, + "train_acc": 0.06866, + "test_loss": 4.968084820556641, + "test_acc": 0.01, + "lyapunov": 1.5330983741813913, + "grad_norm": 0.310726433856645, + "grad_max_sv": 0.11503051314502954, + "grad_min_sv": 4.5873159559145504e-09, + "grad_condition": 43329858.106001854, + "lr": 0.00015016832974331713, + "time_sec": 86.95993733406067 + }, + { + "epoch": 113, + "train_loss": 4.142913679122925, + "train_acc": 0.06906, + "test_loss": 4.971963974761963, + "test_acc": 0.01, + "lyapunov": 1.5326429456091293, + "grad_norm": 0.31597412483623394, + "grad_max_sv": 0.1160203531384468, + "grad_min_sv": 4.675401377152426e-09, + "grad_condition": 1359526359.2386715, + "lr": 0.00014276366018359834, + "time_sec": 86.9745397567749 + }, + { + "epoch": 114, + "train_loss": 4.132417506408691, + "train_acc": 0.07312, + "test_loss": 5.112189303588867, + "test_acc": 0.01, + "lyapunov": 1.5331226209240496, + "grad_norm": 0.318176263966868, + "grad_max_sv": 0.11246696598827839, + "grad_min_sv": 4.720653330042568e-09, + "grad_condition": 35846204.098323956, + "lr": 0.00013551568628929425, + "time_sec": 86.99593329429626 + }, + { + "epoch": 115, + "train_loss": 4.133183531036377, + "train_acc": 0.07248, + "test_loss": 5.057575880432129, + "test_acc": 0.01, + "lyapunov": 1.53298450857782, + "grad_norm": 0.31754098682504733, + "grad_max_sv": 0.1107523936778307, + "grad_min_sv": 4.621098260992884e-09, + "grad_condition": 36993194.345856234, + "lr": 0.00012842758726130276, + "time_sec": 87.01801228523254 + }, + { + "epoch": 116, + "train_loss": 4.1214919088745114, + "train_acc": 0.0733, + "test_loss": 5.330466777038574, + "test_acc": 0.01, + "lyapunov": 1.5355542081091411, + "grad_norm": 0.32114994194004043, + "grad_max_sv": 0.11312623880803585, + "grad_min_sv": 4.720178707617873e-09, + "grad_condition": 38967900.75172814, + "lr": 0.0001215024721741218, + "time_sec": 87.01585006713867 + }, + { + "epoch": 117, + "train_loss": 4.286661796417237, + "train_acc": 0.04898, + "test_loss": 5.4064821472167965, + "test_acc": 0.01, + "lyapunov": 1.5394237318917003, + "grad_norm": 0.26685158012091653, + "grad_max_sv": 0.10729111414402723, + "grad_min_sv": 1.8874711343571174e-09, + "grad_condition": 693536338.911531, + "lr": 0.00011474337861210538, + "time_sec": 87.01486086845398 + }, + { + "epoch": 118, + "train_loss": 4.234741138000488, + "train_acc": 0.05964, + "test_loss": 5.211770498657226, + "test_acc": 0.01, + "lyapunov": 1.5457742269081838, + "grad_norm": 0.30021925128900956, + "grad_max_sv": 0.11846681199967861, + "grad_min_sv": 3.153877188143833e-09, + "grad_condition": 188986875.56833678, + "lr": 0.00010815327133708009, + "time_sec": 87.00663447380066 + }, + { + "epoch": 119, + "train_loss": 4.11706687576294, + "train_acc": 0.07374, + "test_loss": 5.082122540283203, + "test_acc": 0.01, + "lyapunov": 1.5414114147805802, + "grad_norm": 0.3317800190412718, + "grad_max_sv": 0.11199022214859725, + "grad_min_sv": 4.8053149537610754e-09, + "grad_condition": 62930401.390989184, + "lr": 0.00010173504098790182, + "time_sec": 86.96685004234314 + }, + { + "epoch": 120, + "train_loss": 4.117903626403809, + "train_acc": 0.07546, + "test_loss": 5.197770183563232, + "test_acc": 0.01, + "lyapunov": 1.5391402732380821, + "grad_norm": 0.3199355742296335, + "grad_max_sv": 0.11221611741930246, + "grad_min_sv": 4.790622934632005e-09, + "grad_condition": 86663150.15576133, + "lr": 9.549150281252629e-05, + "time_sec": 86.98693466186523 + }, + { + "epoch": 121, + "train_loss": 4.1117572444152835, + "train_acc": 0.0731, + "test_loss": 5.003424510192871, + "test_acc": 0.01, + "lyapunov": 1.539994769084179, + "grad_norm": 0.3246450775964075, + "grad_max_sv": 0.11421162784099578, + "grad_min_sv": 4.825218762743999e-09, + "grad_condition": 33400464.678539503, + "lr": 8.942539543314794e-05, + "time_sec": 86.99330687522888 + }, + { + "epoch": 122, + "train_loss": 4.116242552490235, + "train_acc": 0.07584, + "test_loss": 4.9847313568115235, + "test_acc": 0.01, + "lyapunov": 1.5480006558206074, + "grad_norm": 0.33750598438594037, + "grad_max_sv": 0.1118525866419077, + "grad_min_sv": 4.747569511825978e-09, + "grad_condition": 47618770.58050732, + "lr": 8.353937964495024e-05, + "time_sec": 86.9736979007721 + }, + { + "epoch": 123, + "train_loss": 4.105294608764648, + "train_acc": 0.07574, + "test_loss": 5.05824465713501, + "test_acc": 0.01, + "lyapunov": 1.5419012167874504, + "grad_norm": 0.32186048919000465, + "grad_max_sv": 0.11163459308445453, + "grad_min_sv": 4.863006954980778e-09, + "grad_condition": 167271477.11441505, + "lr": 7.783603724899243e-05, + "time_sec": 86.99078607559204 + }, + { + "epoch": 124, + "train_loss": 4.099795688476562, + "train_acc": 0.07798, + "test_loss": 4.9984775840759275, + "test_acc": 0.01, + "lyapunov": 1.5369879031730125, + "grad_norm": 0.32609682562778786, + "grad_max_sv": 0.11664061844348908, + "grad_min_sv": 4.935543519539454e-09, + "grad_condition": 161438150.2658438, + "lr": 7.231786991974666e-05, + "time_sec": 86.99523687362671 + }, + { + "epoch": 125, + "train_loss": 4.098010378265381, + "train_acc": 0.07688, + "test_loss": 5.083614495849609, + "test_acc": 0.01, + "lyapunov": 1.538549063455723, + "grad_norm": 0.32299099779472384, + "grad_max_sv": 0.11511307284235954, + "grad_min_sv": 4.847106176500415e-09, + "grad_condition": 118399503.0509634, + "lr": 6.698729810778072e-05, + "time_sec": 86.96753239631653 + }, + { + "epoch": 126, + "train_loss": 4.094612486343384, + "train_acc": 0.07826, + "test_loss": 5.203778009033203, + "test_acc": 0.01, + "lyapunov": 1.5428017960180103, + "grad_norm": 0.3261007144041166, + "grad_max_sv": 0.1148404136300087, + "grad_min_sv": 4.916869680154923e-09, + "grad_condition": 37022153.39021693, + "lr": 6.184665997806817e-05, + "time_sec": 86.98804068565369 + }, + { + "epoch": 127, + "train_loss": 4.0985583738708495, + "train_acc": 0.07702, + "test_loss": 5.192792930603027, + "test_acc": 0.01, + "lyapunov": 1.5652157403623965, + "grad_norm": 0.3336587004311134, + "grad_max_sv": 0.11400137636810541, + "grad_min_sv": 4.8697245479123465e-09, + "grad_condition": 38028939.52694424, + "lr": 5.6898210384392595e-05, + "time_sec": 86.96705031394958 + }, + { + "epoch": 128, + "train_loss": 4.100992156219482, + "train_acc": 0.07846, + "test_loss": 5.085048861694336, + "test_acc": 0.01, + "lyapunov": 1.545605825036383, + "grad_norm": 0.3441323941200468, + "grad_max_sv": 0.11070230975747108, + "grad_min_sv": 4.843600412071658e-09, + "grad_condition": 56323581.22712644, + "lr": 5.214411988029363e-05, + "time_sec": 86.94498491287231 + }, + { + "epoch": 129, + "train_loss": 4.094791182403564, + "train_acc": 0.07688, + "test_loss": 5.265383574676513, + "test_acc": 0.01, + "lyapunov": 1.5531313541295277, + "grad_norm": 0.3267910766524594, + "grad_max_sv": 0.11236317530274391, + "grad_min_sv": 4.964851743616272e-09, + "grad_condition": 30209344.81093415, + "lr": 4.7586473766990294e-05, + "time_sec": 86.97897577285767 + }, + { + "epoch": 130, + "train_loss": 4.105339503173828, + "train_acc": 0.07892, + "test_loss": 5.464303984069824, + "test_acc": 0.01, + "lyapunov": 1.5928938599193798, + "grad_norm": 0.33640610863256226, + "grad_max_sv": 0.11975565832108259, + "grad_min_sv": 4.956666326168258e-09, + "grad_condition": 86093709.20654145, + "lr": 4.32272711786996e-05, + "time_sec": 86.97181296348572 + }, + { + "epoch": 131, + "train_loss": 4.1202142849731445, + "train_acc": 0.07638, + "test_loss": 5.086045352935791, + "test_acc": 0.01, + "lyapunov": 1.5752554455071763, + "grad_norm": 0.3476235527969191, + "grad_max_sv": 0.11470571290701628, + "grad_min_sv": 4.997092051955976e-09, + "grad_condition": 31166624.08007102, + "lr": 3.906842420574966e-05, + "time_sec": 86.96465158462524 + }, + { + "epoch": 132, + "train_loss": 4.098140075073243, + "train_acc": 0.07802, + "test_loss": 5.1546881439208985, + "test_acc": 0.01, + "lyapunov": 1.5599672675437635, + "grad_norm": 0.32910420756324915, + "grad_max_sv": 0.11396387908607722, + "grad_min_sv": 4.9758276735034634e-09, + "grad_condition": 28755480.58760929, + "lr": 3.5111757055874305e-05, + "time_sec": 86.97234416007996 + }, + { + "epoch": 133, + "train_loss": 4.097319039764404, + "train_acc": 0.07744, + "test_loss": 5.266991318511963, + "test_acc": 0.01, + "lyapunov": 1.5720745212281757, + "grad_norm": 0.3282133242838952, + "grad_max_sv": 0.11390211284160615, + "grad_min_sv": 5.047047665386606e-09, + "grad_condition": 79107620.94797075, + "lr": 3.1359005254054254e-05, + "time_sec": 86.98829984664917 + }, + { + "epoch": 134, + "train_loss": 4.099240714569092, + "train_acc": 0.07868, + "test_loss": 5.1082003204345705, + "test_acc": 0.01, + "lyapunov": 1.5893634911388388, + "grad_norm": 0.3513961369367751, + "grad_max_sv": 0.11567155160009861, + "grad_min_sv": 4.942956948264521e-09, + "grad_condition": 40535527.74084098, + "lr": 2.7811814881259484e-05, + "time_sec": 86.98272204399109 + }, + { + "epoch": 135, + "train_loss": 4.1100962098693845, + "train_acc": 0.07696, + "test_loss": 5.428898550415039, + "test_acc": 0.01, + "lyapunov": 1.5772409259205888, + "grad_norm": 0.32817769566527, + "grad_max_sv": 0.11089312192052603, + "grad_min_sv": 4.81819233365266e-09, + "grad_condition": 72686358.78433864, + "lr": 2.4471741852423218e-05, + "time_sec": 86.96906805038452 + }, + { + "epoch": 136, + "train_loss": 4.10700753326416, + "train_acc": 0.07708, + "test_loss": 5.684621694946289, + "test_acc": 0.01, + "lyapunov": 1.5801607196593224, + "grad_norm": 0.37785274061951857, + "grad_max_sv": 0.11316521279513836, + "grad_min_sv": 4.891583017460621e-09, + "grad_condition": 36465991.89449505, + "lr": 2.1340251233966362e-05, + "time_sec": 86.95840525627136 + }, + { + "epoch": 137, + "train_loss": 4.110885810089111, + "train_acc": 0.07508, + "test_loss": 5.579570821380615, + "test_acc": 0.01, + "lyapunov": 1.5708883823946005, + "grad_norm": 0.35149637028258535, + "grad_max_sv": 0.11634646914899349, + "grad_min_sv": 4.938844544639422e-09, + "grad_condition": 434569881.7137464, + "lr": 1.8418716601170932e-05, + "time_sec": 86.98812198638916 + }, + { + "epoch": 138, + "train_loss": 4.113671342010498, + "train_acc": 0.0751, + "test_loss": 5.221417890930176, + "test_acc": 0.01, + "lyapunov": 1.57883699501262, + "grad_norm": 0.3623192907836632, + "grad_max_sv": 0.11387990918010474, + "grad_min_sv": 4.910508299982297e-09, + "grad_condition": 42512106.818557374, + "lr": 1.570841943568445e-05, + "time_sec": 86.95657277107239 + }, + { + "epoch": 139, + "train_loss": 4.103298903198242, + "train_acc": 0.07658, + "test_loss": 5.294570021057129, + "test_acc": 0.01, + "lyapunov": 1.5839106051818184, + "grad_norm": 0.3338199572610109, + "grad_max_sv": 0.11476525086909532, + "grad_min_sv": 5.07050121750785e-09, + "grad_condition": 33506825.866475124, + "lr": 1.3210548563419845e-05, + "time_sec": 86.98819351196289 + }, + { + "epoch": 140, + "train_loss": 4.1040088185119625, + "train_acc": 0.07604, + "test_loss": 5.578106262207031, + "test_acc": 0.01, + "lyapunov": 1.5838946707718207, + "grad_norm": 0.3724797130647997, + "grad_max_sv": 0.11343933567404747, + "grad_min_sv": 4.96071488574612e-09, + "grad_condition": 36377482.2674368, + "lr": 1.0926199633097203e-05, + "time_sec": 87.02139043807983 + }, + { + "epoch": 141, + "train_loss": 4.112641759033203, + "train_acc": 0.07624, + "test_loss": 5.450056053161621, + "test_acc": 0.01, + "lyapunov": 1.5760344766899752, + "grad_norm": 0.36533164109272187, + "grad_max_sv": 0.11488107666373253, + "grad_min_sv": 4.998170264475244e-09, + "grad_condition": 39248086.6371146, + "lr": 8.856374635655688e-06, + "time_sec": 87.09755373001099 + }, + { + "epoch": 142, + "train_loss": 4.110099713745117, + "train_acc": 0.0751, + "test_loss": 5.3746546951293945, + "test_acc": 0.01, + "lyapunov": 1.5799316128196619, + "grad_norm": 0.33882488413102924, + "grad_max_sv": 0.1149375718086958, + "grad_min_sv": 4.975581699429021e-09, + "grad_condition": 27873380.275928926, + "lr": 7.001981464747503e-06, + "time_sec": 86.98368120193481 + }, + { + "epoch": 143, + "train_loss": 4.111169652252197, + "train_acc": 0.07464, + "test_loss": 5.482430593109131, + "test_acc": 0.01, + "lyapunov": 1.5838617754104498, + "grad_norm": 0.3907525660486928, + "grad_max_sv": 0.11294344365596772, + "grad_min_sv": 4.972342661051232e-09, + "grad_condition": 56574066.27463861, + "lr": 5.3638335185058295e-06, + "time_sec": 86.98776912689209 + }, + { + "epoch": 144, + "train_loss": 4.109548569641113, + "train_acc": 0.07474, + "test_loss": 5.386999281311035, + "test_acc": 0.01, + "lyapunov": 1.5824109358555825, + "grad_norm": 0.35450816124488377, + "grad_max_sv": 0.11456675231456756, + "grad_min_sv": 5.040034656289549e-09, + "grad_condition": 28129116.053885616, + "lr": 3.942649342761114e-06, + "time_sec": 86.98024988174438 + }, + { + "epoch": 145, + "train_loss": 4.105895345153809, + "train_acc": 0.07646, + "test_loss": 5.404526988220215, + "test_acc": 0.01, + "lyapunov": 1.5782298480763155, + "grad_norm": 0.32890225856019717, + "grad_max_sv": 0.11459225825965405, + "grad_min_sv": 4.992372309303716e-09, + "grad_condition": 30352933.747849993, + "lr": 2.7390523158633524e-06, + "time_sec": 87.0038857460022 + }, + { + "epoch": 146, + "train_loss": 4.105062242279053, + "train_acc": 0.07688, + "test_loss": 5.344121000671387, + "test_acc": 0.01, + "lyapunov": 1.580697044387193, + "grad_norm": 0.3835574914516311, + "grad_max_sv": 0.11529699396342039, + "grad_min_sv": 5.024812839427017e-09, + "grad_condition": 28505555.903579652, + "lr": 1.7535703752478133e-06, + "time_sec": 87.02643275260925 + }, + { + "epoch": 147, + "train_loss": 4.105375043106079, + "train_acc": 0.0774, + "test_loss": 5.325290232849121, + "test_acc": 0.01, + "lyapunov": 1.5789403549545562, + "grad_norm": 0.37968984215300994, + "grad_max_sv": 0.1154880104586482, + "grad_min_sv": 5.0540397828185285e-09, + "grad_condition": 236800965.07524818, + "lr": 9.866357858642196e-07, + "time_sec": 86.96237063407898 + }, + { + "epoch": 148, + "train_loss": 4.106910405731202, + "train_acc": 0.07802, + "test_loss": 5.253315858459473, + "test_acc": 0.01, + "lyapunov": 1.5811021160286711, + "grad_norm": 0.34326106915213195, + "grad_max_sv": 0.11614184193313122, + "grad_min_sv": 4.994901469171364e-09, + "grad_condition": 56096271.31483416, + "lr": 4.38584950570808e-07, + "time_sec": 86.99004936218262 + }, + { + "epoch": 149, + "train_loss": 4.101930983581543, + "train_acc": 0.07612, + "test_loss": 5.252623239898682, + "test_acc": 0.01, + "lyapunov": 1.5808270389161756, + "grad_norm": 0.32890029512732105, + "grad_max_sv": 0.11511041391640901, + "grad_min_sv": 4.989588534010103e-09, + "grad_condition": 32283184.00572153, + "lr": 1.096582625772501e-07, + "time_sec": 86.9653422832489 + }, + { + "epoch": 150, + "train_loss": 4.105507068939209, + "train_acc": 0.0767, + "test_loss": 5.325356979370117, + "test_acc": 0.01, + "lyapunov": 1.5831530841110308, + "grad_norm": 0.32872424704094605, + "grad_max_sv": 0.11464270018041134, + "grad_min_sv": 4.984313861991496e-09, + "grad_condition": 47970236.10911851, + "lr": 0.0, + "time_sec": 86.95947980880737 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 5.044638243713379, + "train_acc": 0.01744, + "test_loss": 4.888737399291992, + "test_acc": 0.0101, + "lyapunov": 2.5438788614004775, + "grad_norm": 5.194417701604951, + "grad_max_sv": 4.519656705856323, + "grad_min_sv": 8.791217535053519e-08, + "grad_condition": 76276812.51647735, + "lr": 0.0009998903417374227, + "time_sec": 132.28263092041016 + }, + { + "epoch": 2, + "train_loss": 4.746561761016846, + "train_acc": 0.02068, + "test_loss": 4.932491451263428, + "test_acc": 0.01, + "lyapunov": 1.9478983812015076, + "grad_norm": 3.62057951672503, + "grad_max_sv": 3.0427515387535093, + "grad_min_sv": 5.900428634852961e-08, + "grad_condition": 108761794.84725586, + "lr": 0.0009995614150494292, + "time_sec": 132.22165322303772 + }, + { + "epoch": 3, + "train_loss": 4.653761597747803, + "train_acc": 0.02044, + "test_loss": 4.652680480194092, + "test_acc": 0.0096, + "lyapunov": 1.728618367858555, + "grad_norm": 2.625722747628417, + "grad_max_sv": 1.9487905293703078, + "grad_min_sv": 4.100720090924326e-08, + "grad_condition": 220787964.58006114, + "lr": 0.0009990133642141358, + "time_sec": 132.218932390213 + }, + { + "epoch": 4, + "train_loss": 4.566257968444824, + "train_acc": 0.0202, + "test_loss": 4.701637998962402, + "test_acc": 0.01, + "lyapunov": 1.6333425154771342, + "grad_norm": 1.4991148871931466, + "grad_max_sv": 1.0714565500617028, + "grad_min_sv": 2.3121158282402022e-08, + "grad_condition": 84114314.08530891, + "lr": 0.0009982464296247522, + "time_sec": 132.2167730331421 + }, + { + "epoch": 5, + "train_loss": 4.541309765777588, + "train_acc": 0.02008, + "test_loss": 4.857759108734131, + "test_acc": 0.01, + "lyapunov": 1.6103907890636902, + "grad_norm": 1.1537501690229268, + "grad_max_sv": 0.8224508740007878, + "grad_min_sv": 1.6470128196970384e-08, + "grad_condition": 6997774636.897303, + "lr": 0.0009972609476841367, + "time_sec": 132.19794130325317 + }, + { + "epoch": 6, + "train_loss": 4.527589833526611, + "train_acc": 0.02172, + "test_loss": 4.70167085723877, + "test_acc": 0.01, + "lyapunov": 1.603051292621876, + "grad_norm": 0.9225520766276066, + "grad_max_sv": 0.6318209424614907, + "grad_min_sv": 1.1189797109089012e-08, + "grad_condition": 15636425112.20934, + "lr": 0.000996057350657239, + "time_sec": 132.21913647651672 + }, + { + "epoch": 7, + "train_loss": 4.515393820343018, + "train_acc": 0.02164, + "test_loss": 4.6568979660034175, + "test_acc": 0.01, + "lyapunov": 1.6002115541711792, + "grad_norm": 0.7369887244582876, + "grad_max_sv": 0.47892343774437907, + "grad_min_sv": 9.288682374783072e-09, + "grad_condition": 1455935385.8148131, + "lr": 0.000994636166481494, + "time_sec": 132.2325894832611 + }, + { + "epoch": 8, + "train_loss": 4.524283535614014, + "train_acc": 0.01938, + "test_loss": 4.6134964424133305, + "test_acc": 0.01, + "lyapunov": 1.5902926510252307, + "grad_norm": 0.5859004013732186, + "grad_max_sv": 0.3847638428211212, + "grad_min_sv": 2.614369980990735e-09, + "grad_condition": 29450829204.572437, + "lr": 0.0009929980185352525, + "time_sec": 132.23444652557373 + }, + { + "epoch": 9, + "train_loss": 4.526760426940918, + "train_acc": 0.01954, + "test_loss": 5.032786169433594, + "test_acc": 0.01, + "lyapunov": 1.591223902714527, + "grad_norm": 0.4921248583152587, + "grad_max_sv": 0.3309405084699392, + "grad_min_sv": 2.1669457121848862e-11, + "grad_condition": 86120259747.67252, + "lr": 0.0009911436253643444, + "time_sec": 132.28951215744019 + }, + { + "epoch": 10, + "train_loss": 4.5441475662231445, + "train_acc": 0.0174, + "test_loss": 5.262818550109864, + "test_acc": 0.01, + "lyapunov": 1.583890141123701, + "grad_norm": 0.41054293976266754, + "grad_max_sv": 0.2887417145073414, + "grad_min_sv": 5.969573957265053e-12, + "grad_condition": 78485792436.92993, + "lr": 0.0009890738003669028, + "time_sec": 132.22699999809265 + }, + { + "epoch": 11, + "train_loss": 4.54200564666748, + "train_acc": 0.01774, + "test_loss": 5.034979447937012, + "test_acc": 0.01, + "lyapunov": 1.5821573923310965, + "grad_norm": 0.4337541463718868, + "grad_max_sv": 0.3208182599395514, + "grad_min_sv": 3.2558498354953734e-12, + "grad_condition": 117922392029.53934, + "lr": 0.00098678945143658, + "time_sec": 132.25113081932068 + }, + { + "epoch": 12, + "train_loss": 4.547267101287842, + "train_acc": 0.0172, + "test_loss": 5.292049045562744, + "test_acc": 0.01, + "lyapunov": 1.581516192087432, + "grad_norm": 0.44629110826721646, + "grad_max_sv": 0.3241798661649227, + "grad_min_sv": 2.88259236333764e-12, + "grad_condition": 126579855744.97647, + "lr": 0.0009842915805643154, + "time_sec": 132.24692058563232 + }, + { + "epoch": 13, + "train_loss": 4.548395246429443, + "train_acc": 0.01726, + "test_loss": 5.0098185729980464, + "test_acc": 0.01, + "lyapunov": 1.5924869388570566, + "grad_norm": 0.3910527009838956, + "grad_max_sv": 0.290815357491374, + "grad_min_sv": 2.0179616276645193e-12, + "grad_condition": 131462303728.17729, + "lr": 0.000981581283398829, + "time_sec": 132.21567606925964 + }, + { + "epoch": 14, + "train_loss": 4.550349577026367, + "train_acc": 0.01826, + "test_loss": 5.525635553741455, + "test_acc": 0.01, + "lyapunov": 1.5734444621883694, + "grad_norm": 0.4381363141951614, + "grad_max_sv": 0.3424963358789682, + "grad_min_sv": 2.742631590449884e-12, + "grad_condition": 138381932658.16568, + "lr": 0.0009786597487660333, + "time_sec": 132.20392966270447 + }, + { + "epoch": 15, + "train_loss": 4.590004445495605, + "train_acc": 0.01372, + "test_loss": 4.605991929626465, + "test_acc": 0.01, + "lyapunov": 1.5673531516433676, + "grad_norm": 0.3466932806170291, + "grad_max_sv": 0.296209704503417, + "grad_min_sv": 3.2570735841952816e-13, + "grad_condition": 270379718997.00928, + "lr": 0.0009755282581475766, + "time_sec": 132.15680313110352 + }, + { + "epoch": 16, + "train_loss": 4.597338052825927, + "train_acc": 0.0123, + "test_loss": 4.6062582565307615, + "test_acc": 0.01, + "lyapunov": 1.5659459106757512, + "grad_norm": 0.3244936237553927, + "grad_max_sv": 0.2445746913552284, + "grad_min_sv": 1.14503196614307e-19, + "grad_condition": 244574661202.029, + "lr": 0.0009721881851187403, + "time_sec": 132.18825936317444 + }, + { + "epoch": 17, + "train_loss": 4.604924670715332, + "train_acc": 0.01142, + "test_loss": 5.089439725494385, + "test_acc": 0.01, + "lyapunov": 1.5628269779712647, + "grad_norm": 0.2220918074967122, + "grad_max_sv": 0.18584942631423473, + "grad_min_sv": 8.34177981161767e-21, + "grad_condition": 185849424343.33807, + "lr": 0.0009686409947459456, + "time_sec": 132.16283059120178 + }, + { + "epoch": 18, + "train_loss": 4.607286578063965, + "train_acc": 0.0112, + "test_loss": 5.187530244445801, + "test_acc": 0.01, + "lyapunov": 1.565722727714597, + "grad_norm": 0.2311884649663066, + "grad_max_sv": 0.19543762858957053, + "grad_min_sv": 5.1574374327507394e-20, + "grad_condition": 195437615290.85724, + "lr": 0.0009648882429441254, + "time_sec": 132.13635730743408 + }, + { + "epoch": 19, + "train_loss": 4.61034327545166, + "train_acc": 0.01174, + "test_loss": 5.394132858276367, + "test_acc": 0.01, + "lyapunov": 1.5600875893517223, + "grad_norm": 0.23851905207608506, + "grad_max_sv": 0.19998206980526448, + "grad_min_sv": 9.380418376861012e-20, + "grad_condition": 199982048153.8069, + "lr": 0.00096093157579425, + "time_sec": 132.16015791893005 + }, + { + "epoch": 20, + "train_loss": 4.607679443969727, + "train_acc": 0.01172, + "test_loss": 4.606257467651367, + "test_acc": 0.01, + "lyapunov": 1.5657494985843863, + "grad_norm": 0.28750715745925254, + "grad_max_sv": 0.22121081724762917, + "grad_min_sv": 1.7508908480303667e-20, + "grad_condition": 221210813068.7792, + "lr": 0.0009567727288213001, + "time_sec": 132.14381384849548 + }, + { + "epoch": 21, + "train_loss": 4.609621345062256, + "train_acc": 0.01162, + "test_loss": 6.805993372344971, + "test_acc": 0.01, + "lyapunov": 1.578941965651939, + "grad_norm": 0.2550578056439405, + "grad_max_sv": 0.21259882654994727, + "grad_min_sv": 7.00398727115791e-21, + "grad_condition": 212598825342.705, + "lr": 0.0009524135262330095, + "time_sec": 132.12960958480835 + }, + { + "epoch": 22, + "train_loss": 4.614004552154541, + "train_acc": 0.01174, + "test_loss": 6.928626864624023, + "test_acc": 0.01, + "lyapunov": 1.6368295936023487, + "grad_norm": 0.2863339336037474, + "grad_max_sv": 0.24568271338939668, + "grad_min_sv": 4.005824711625119e-19, + "grad_condition": 245682611000.0279, + "lr": 0.0009478558801197061, + "time_sec": 132.13737630844116 + }, + { + "epoch": 23, + "train_loss": 4.61306428604126, + "train_acc": 0.01084, + "test_loss": 7.185849070739746, + "test_acc": 0.01, + "lyapunov": 1.602015091330194, + "grad_norm": 0.28964762988733644, + "grad_max_sv": 0.23221975527703761, + "grad_min_sv": 1.2140301096546425e-19, + "grad_condition": 232219726205.52304, + "lr": 0.000943101789615607, + "time_sec": 132.11901998519897 + }, + { + "epoch": 24, + "train_loss": 4.609514785614014, + "train_acc": 0.01176, + "test_loss": 7.9425787109375, + "test_acc": 0.01, + "lyapunov": 1.5803568689414607, + "grad_norm": 0.30490617252608776, + "grad_max_sv": 0.2639826502650976, + "grad_min_sv": 5.796963872806471e-14, + "grad_condition": 255773552256.2649, + "lr": 0.0009381533400219313, + "time_sec": 132.1163353919983 + }, + { + "epoch": 25, + "train_loss": 4.610168565826416, + "train_acc": 0.01216, + "test_loss": 4.606657133483886, + "test_acc": 0.01, + "lyapunov": 1.6174019660486285, + "grad_norm": 0.4338889523406446, + "grad_max_sv": 0.352421772480011, + "grad_min_sv": 2.858652179792795e-14, + "grad_condition": 343985739223.6239, + "lr": 0.0009330127018922189, + "time_sec": 132.1448836326599 + }, + { + "epoch": 26, + "train_loss": 4.602957373809814, + "train_acc": 0.0139, + "test_loss": 4.60689501876831, + "test_acc": 0.01, + "lyapunov": 1.5834840398920162, + "grad_norm": 0.37408666176662725, + "grad_max_sv": 0.32772524692118166, + "grad_min_sv": 3.749828378124787e-15, + "grad_condition": 326905798885.44763, + "lr": 0.000927682130080253, + "time_sec": 132.18161749839783 + }, + { + "epoch": 27, + "train_loss": 4.602288271179199, + "train_acc": 0.0127, + "test_loss": 4.607086447143555, + "test_acc": 0.01, + "lyapunov": 1.6033268727914756, + "grad_norm": 0.3133873934549926, + "grad_max_sv": 0.28318417854607103, + "grad_min_sv": 1.4053103231960982e-19, + "grad_condition": 283184135871.7739, + "lr": 0.0009221639627510072, + "time_sec": 132.15349626541138 + }, + { + "epoch": 28, + "train_loss": 4.599534628295898, + "train_acc": 0.01238, + "test_loss": 4.607179332733154, + "test_acc": 0.01, + "lyapunov": 1.5838783384893862, + "grad_norm": 0.28044203644676124, + "grad_max_sv": 0.22863162867724895, + "grad_min_sv": 1.6998404058293805e-14, + "grad_condition": 225932681740.85928, + "lr": 0.0009164606203550494, + "time_sec": 132.16895461082458 + }, + { + "epoch": 29, + "train_loss": 4.6137677600097655, + "train_acc": 0.01148, + "test_loss": 4.6071212936401365, + "test_acc": 0.01, + "lyapunov": 1.5793116610983144, + "grad_norm": 0.4043334896103637, + "grad_max_sv": 0.2792932067066431, + "grad_min_sv": 6.979785668152621e-20, + "grad_condition": 279293193161.8634, + "lr": 0.0009105746045668516, + "time_sec": 132.12517476081848 + }, + { + "epoch": 30, + "train_loss": 4.6109746827697755, + "train_acc": 0.01164, + "test_loss": 4.60712117767334, + "test_acc": 0.01, + "lyapunov": 1.567364613418384, + "grad_norm": 0.4163703836042532, + "grad_max_sv": 0.36478146240115167, + "grad_min_sv": 7.22918393975139e-20, + "grad_condition": 364781435101.6523, + "lr": 0.0009045084971874733, + "time_sec": 132.16352105140686 + }, + { + "epoch": 31, + "train_loss": 4.605944149169922, + "train_acc": 0.01204, + "test_loss": 4.607294147491455, + "test_acc": 0.01, + "lyapunov": 1.5633528936854408, + "grad_norm": 0.4282661754861825, + "grad_max_sv": 0.37428555004298686, + "grad_min_sv": 3.523726329651146e-15, + "grad_condition": 372947347297.6079, + "lr": 0.0008982649590120977, + "time_sec": 132.1736705303192 + }, + { + "epoch": 32, + "train_loss": 4.607151614837647, + "train_acc": 0.01174, + "test_loss": 4.965260970306397, + "test_acc": 0.01, + "lyapunov": 1.567151257753982, + "grad_norm": 0.6871731859307328, + "grad_max_sv": 0.3966732671484351, + "grad_min_sv": 2.459540269323706e-13, + "grad_condition": 337927969229.285, + "lr": 0.0008918467286629196, + "time_sec": 132.1509928703308 + }, + { + "epoch": 33, + "train_loss": 4.572849920349121, + "train_acc": 0.01594, + "test_loss": 5.434487845611573, + "test_acc": 0.01, + "lyapunov": 1.5909836267876198, + "grad_norm": 0.4983392948901186, + "grad_max_sv": 0.39813167229294777, + "grad_min_sv": 1.161873685556449e-12, + "grad_condition": 227702269317.0141, + "lr": 0.0008852566213878943, + "time_sec": 132.19490098953247 + }, + { + "epoch": 34, + "train_loss": 4.5529717526245115, + "train_acc": 0.01786, + "test_loss": 7.468867630004882, + "test_acc": 0.01, + "lyapunov": 1.6261070256342973, + "grad_norm": 0.46191117234345114, + "grad_max_sv": 0.372063222900033, + "grad_min_sv": 6.055017475914798e-12, + "grad_condition": 194339316548.4907, + "lr": 0.000878497527825878, + "time_sec": 132.1919345855713 + }, + { + "epoch": 35, + "train_loss": 4.552744539794922, + "train_acc": 0.01796, + "test_loss": 7.381356469726563, + "test_acc": 0.01, + "lyapunov": 1.6300754760537306, + "grad_norm": 0.3913335269838584, + "grad_max_sv": 0.3187441911548376, + "grad_min_sv": 1.2147101427236567e-12, + "grad_condition": 181094396927.97137, + "lr": 0.000871572412738697, + "time_sec": 132.2208890914917 + }, + { + "epoch": 36, + "train_loss": 4.545732378387451, + "train_acc": 0.0185, + "test_loss": 6.369435263061524, + "test_acc": 0.01, + "lyapunov": 1.6891264677657496, + "grad_norm": 0.4023421314839126, + "grad_max_sv": 0.27849661782383917, + "grad_min_sv": 1.2045309520203572e-12, + "grad_condition": 162600481647.82434, + "lr": 0.0008644843137107055, + "time_sec": 132.2405445575714 + }, + { + "epoch": 37, + "train_loss": 4.548228894195557, + "train_acc": 0.01722, + "test_loss": 7.595510809326172, + "test_acc": 0.01, + "lyapunov": 1.6399826683351755, + "grad_norm": 0.32785947279892635, + "grad_max_sv": 0.24646181836724282, + "grad_min_sv": 1.1144540376717887e-12, + "grad_condition": 142996724505.05634, + "lr": 0.0008572363398164014, + "time_sec": 132.20914554595947 + }, + { + "epoch": 38, + "train_loss": 4.543028886108399, + "train_acc": 0.01816, + "test_loss": 4.888543309783936, + "test_acc": 0.01, + "lyapunov": 1.6415274277367555, + "grad_norm": 0.36725544979363267, + "grad_max_sv": 0.2625227510929108, + "grad_min_sv": 8.083071810175235e-13, + "grad_condition": 172740531071.31885, + "lr": 0.0008498316702566826, + "time_sec": 132.20954966545105 + }, + { + "epoch": 39, + "train_loss": 4.5178536532592775, + "train_acc": 0.01904, + "test_loss": 4.854824586486816, + "test_acc": 0.01, + "lyapunov": 1.6600466051979748, + "grad_norm": 0.3442219346031078, + "grad_max_sv": 0.26818443052470686, + "grad_min_sv": 1.2392144997831455e-10, + "grad_condition": 139625061390.49585, + "lr": 0.0008422735529643442, + "time_sec": 132.19685912132263 + }, + { + "epoch": 40, + "train_loss": 4.505179956970215, + "train_acc": 0.02088, + "test_loss": 4.844048503112793, + "test_acc": 0.01, + "lyapunov": 1.6231690346432464, + "grad_norm": 0.3308248689472589, + "grad_max_sv": 0.24531208872795104, + "grad_min_sv": 8.70188674038036e-13, + "grad_condition": 148735283472.73764, + "lr": 0.0008345653031794289, + "time_sec": 132.2236189842224 + }, + { + "epoch": 41, + "train_loss": 4.506130592651367, + "train_acc": 0.01928, + "test_loss": 4.914672109222412, + "test_acc": 0.01, + "lyapunov": 1.6156310108311647, + "grad_norm": 0.34666559565319927, + "grad_max_sv": 0.2545319116441533, + "grad_min_sv": 1.2733801445553737e-12, + "grad_condition": 149523748665.4712, + "lr": 0.0008267103019950526, + "time_sec": 132.2104136943817 + }, + { + "epoch": 42, + "train_loss": 4.5101413671875, + "train_acc": 0.02056, + "test_loss": 4.621368215942383, + "test_acc": 0.01, + "lyapunov": 1.6336908840462374, + "grad_norm": 0.3241366255110596, + "grad_max_sv": 0.21891080848872663, + "grad_min_sv": 1.1512116090779195e-12, + "grad_condition": 122009848246.22696, + "lr": 0.0008187119948743447, + "time_sec": 132.2324824333191 + }, + { + "epoch": 43, + "train_loss": 4.500468269653321, + "train_acc": 0.02002, + "test_loss": 4.619631646728515, + "test_acc": 0.01, + "lyapunov": 1.6379705243708227, + "grad_norm": 0.29206231901196783, + "grad_max_sv": 0.21775328405201436, + "grad_min_sv": 9.075425390948639e-13, + "grad_condition": 137264678374.34676, + "lr": 0.000810573890139155, + "time_sec": 132.2273235321045 + }, + { + "epoch": 44, + "train_loss": 4.504369869842529, + "train_acc": 0.0207, + "test_loss": 5.01533042755127, + "test_acc": 0.01, + "lyapunov": 1.6450194870419514, + "grad_norm": 0.2763803917772913, + "grad_max_sv": 0.21316498667001724, + "grad_min_sv": 1.673849618721596e-10, + "grad_condition": 126175785035.09848, + "lr": 0.0008022995574311873, + "time_sec": 132.22698497772217 + }, + { + "epoch": 45, + "train_loss": 4.489227379150391, + "train_acc": 0.02202, + "test_loss": 5.281286546325684, + "test_acc": 0.01, + "lyapunov": 1.6374380149499839, + "grad_norm": 0.3176279571801955, + "grad_max_sv": 0.17873445823788642, + "grad_min_sv": 1.2304303497600637e-12, + "grad_condition": 101202509036.36377, + "lr": 0.0007938926261462363, + "time_sec": 132.20335817337036 + }, + { + "epoch": 46, + "train_loss": 4.4754781695556645, + "train_acc": 0.02428, + "test_loss": 4.921717021179199, + "test_acc": 0.01, + "lyapunov": 1.6464493341763, + "grad_norm": 0.2681280301001706, + "grad_max_sv": 0.17985644955188035, + "grad_min_sv": 1.3362588847965504e-12, + "grad_condition": 93386854989.08954, + "lr": 0.0007853567838422158, + "time_sec": 132.2294237613678 + }, + { + "epoch": 47, + "train_loss": 4.4843887727355956, + "train_acc": 0.02234, + "test_loss": 7.356022555541992, + "test_acc": 0.01, + "lyapunov": 1.6308888724392943, + "grad_norm": 0.25384939635010767, + "grad_max_sv": 0.1692765463143587, + "grad_min_sv": 1.1116489597414646e-12, + "grad_condition": 95479012299.0026, + "lr": 0.0007766957746216719, + "time_sec": 132.17389154434204 + }, + { + "epoch": 48, + "train_loss": 4.489932708587647, + "train_acc": 0.02146, + "test_loss": 5.591143609619141, + "test_acc": 0.01, + "lyapunov": 1.624904204207613, + "grad_norm": 0.2834282328300824, + "grad_max_sv": 0.1764419574290514, + "grad_min_sv": 1.0379873725135676e-12, + "grad_condition": 105037245989.42903, + "lr": 0.0007679133974894982, + "time_sec": 132.2243902683258 + }, + { + "epoch": 49, + "train_loss": 4.4929616583251955, + "train_acc": 0.02276, + "test_loss": 6.3275483657836915, + "test_acc": 0.01, + "lyapunov": 1.6448206410688513, + "grad_norm": 0.2655085596039743, + "grad_max_sv": 0.1556264752522111, + "grad_min_sv": 1.3565563953662412e-12, + "grad_condition": 78993279462.78845, + "lr": 0.000759013504686565, + "time_sec": 132.23448371887207 + }, + { + "epoch": 50, + "train_loss": 4.493864802551269, + "train_acc": 0.0218, + "test_loss": 6.973974436950684, + "test_acc": 0.01, + "lyapunov": 1.659627731803738, + "grad_norm": 0.28425424073935585, + "grad_max_sv": 0.18429967994743493, + "grad_min_sv": 9.384450563735499e-13, + "grad_condition": 110532937320.3837, + "lr": 0.0007499999999999998, + "time_sec": 132.25930857658386 + }, + { + "epoch": 51, + "train_loss": 4.522420733642578, + "train_acc": 0.01868, + "test_loss": 4.937375754547119, + "test_acc": 0.01, + "lyapunov": 1.6338805454161467, + "grad_norm": 0.2832378081788649, + "grad_max_sv": 0.16554471366107465, + "grad_min_sv": 6.399005349884901e-13, + "grad_condition": 111941095169.29214, + "lr": 0.0007408768370508575, + "time_sec": 132.2530381679535 + }, + { + "epoch": 52, + "train_loss": 4.51394544265747, + "train_acc": 0.02004, + "test_loss": 4.949947265625, + "test_acc": 0.01, + "lyapunov": 1.6564022866661285, + "grad_norm": 0.2569974808081301, + "grad_max_sv": 0.16093138251453637, + "grad_min_sv": 6.63987584789182e-13, + "grad_condition": 110129904934.76086, + "lr": 0.0007316480175599307, + "time_sec": 132.27379298210144 + }, + { + "epoch": 53, + "train_loss": 4.515902042236328, + "train_acc": 0.0184, + "test_loss": 4.71345171508789, + "test_acc": 0.01, + "lyapunov": 1.7566138798623439, + "grad_norm": 0.2369986362168349, + "grad_max_sv": 0.13799025900661946, + "grad_min_sv": 3.938872182723276e-13, + "grad_condition": 103706230571.64572, + "lr": 0.0007223175895924635, + "time_sec": 132.24648523330688 + }, + { + "epoch": 54, + "train_loss": 4.507343007507324, + "train_acc": 0.01962, + "test_loss": 5.815953979492187, + "test_acc": 0.01, + "lyapunov": 1.7070205742135987, + "grad_norm": 0.21837291714877805, + "grad_max_sv": 0.14667334891855716, + "grad_min_sv": 7.159830807848235e-13, + "grad_condition": 99331750298.19199, + "lr": 0.0007128896457825361, + "time_sec": 132.25679302215576 + }, + { + "epoch": 55, + "train_loss": 4.52220260848999, + "train_acc": 0.01892, + "test_loss": 5.452748155212403, + "test_acc": 0.01, + "lyapunov": 1.6943485148422552, + "grad_norm": 0.21823199412254568, + "grad_max_sv": 0.14726879578083754, + "grad_min_sv": 4.993786788159144e-13, + "grad_condition": 110125627629.77768, + "lr": 0.0007033683215378998, + "time_sec": 132.24295473098755 + }, + { + "epoch": 56, + "train_loss": 4.517760644073486, + "train_acc": 0.01966, + "test_loss": 5.310019548034668, + "test_acc": 0.01, + "lyapunov": 1.666598134028637, + "grad_norm": 0.27575481022856835, + "grad_max_sv": 0.159072039835155, + "grad_min_sv": 8.19140483448747e-13, + "grad_condition": 98455503499.05495, + "lr": 0.0006937577932260512, + "time_sec": 132.24738717079163 + }, + { + "epoch": 57, + "train_loss": 4.517431168060303, + "train_acc": 0.0187, + "test_loss": 5.330130297088623, + "test_acc": 0.01, + "lyapunov": 1.6996850147271705, + "grad_norm": 0.2142938814263498, + "grad_max_sv": 0.15296285804361104, + "grad_min_sv": 5.46731619541962e-13, + "grad_condition": 107334669590.86357, + "lr": 0.0006840622763423388, + "time_sec": 132.25556707382202 + }, + { + "epoch": 58, + "train_loss": 4.524203992919922, + "train_acc": 0.01934, + "test_loss": 4.631337239074707, + "test_acc": 0.01, + "lyapunov": 1.6601122535403123, + "grad_norm": 0.38071312115160016, + "grad_max_sv": 0.1478794915601611, + "grad_min_sv": 5.737511134361469e-13, + "grad_condition": 105672598616.59512, + "lr": 0.0006742860236609073, + "time_sec": 132.21588516235352 + }, + { + "epoch": 59, + "train_loss": 4.533112649688721, + "train_acc": 0.01928, + "test_loss": 4.614070481872559, + "test_acc": 0.01, + "lyapunov": 1.6871729802597515, + "grad_norm": 0.22354549091325823, + "grad_max_sv": 0.1491293204948306, + "grad_min_sv": 5.561086742052611e-13, + "grad_condition": 106804687973.686, + "lr": 0.0006644333233692913, + "time_sec": 132.242027759552 + }, + { + "epoch": 60, + "train_loss": 4.5315521173095705, + "train_acc": 0.02022, + "test_loss": 4.8204547218322755, + "test_acc": 0.01, + "lyapunov": 1.6951440185537119, + "grad_norm": 0.2356177440109697, + "grad_max_sv": 0.1612277302891016, + "grad_min_sv": 5.374582387388506e-13, + "grad_condition": 117853729696.05392, + "lr": 0.0006545084971874734, + "time_sec": 132.19956374168396 + }, + { + "epoch": 61, + "train_loss": 4.624313970794677, + "train_acc": 0.01444, + "test_loss": 4.884371475982666, + "test_acc": 0.01, + "lyapunov": 1.8478093199107959, + "grad_norm": 0.6446062497850988, + "grad_max_sv": 0.13153424933552743, + "grad_min_sv": 4.43307425435177e-14, + "grad_condition": 126286920468.29468, + "lr": 0.0006445158984722354, + "time_sec": 132.2351415157318 + }, + { + "epoch": 62, + "train_loss": 4.584010941925049, + "train_acc": 0.0165, + "test_loss": 4.894680688476562, + "test_acc": 0.01, + "lyapunov": 1.7962361311973514, + "grad_norm": 0.3379422383623765, + "grad_max_sv": 0.14229719250288325, + "grad_min_sv": 3.853968397876282e-12, + "grad_condition": 119719885249.69711, + "lr": 0.0006344599103076324, + "time_sec": 132.2427797317505 + }, + { + "epoch": 63, + "train_loss": 4.571224823150635, + "train_acc": 0.01708, + "test_loss": 4.933466084289551, + "test_acc": 0.01, + "lyapunov": 1.7701643421826765, + "grad_norm": 0.29406061735388944, + "grad_max_sv": 0.1290382323481026, + "grad_min_sv": 3.384297744674036e-13, + "grad_condition": 102886417299.77242, + "lr": 0.0006243449435824269, + "time_sec": 132.27230858802795 + }, + { + "epoch": 64, + "train_loss": 4.572176381378174, + "train_acc": 0.01692, + "test_loss": 4.925536454772949, + "test_acc": 0.01, + "lyapunov": 1.7125693093175474, + "grad_norm": 0.31642107319747337, + "grad_max_sv": 0.12633156184165273, + "grad_min_sv": 3.844361968486623e-13, + "grad_condition": 100339022775.7365, + "lr": 0.0006141754350553275, + "time_sec": 132.2755582332611 + }, + { + "epoch": 65, + "train_loss": 4.566539025421142, + "train_acc": 0.01724, + "test_loss": 4.8255180152893065, + "test_acc": 0.01, + "lyapunov": 1.6813567855473979, + "grad_norm": 0.21217215097591452, + "grad_max_sv": 0.12823735997080804, + "grad_min_sv": 7.340280172423425e-13, + "grad_condition": 91502730084.41678, + "lr": 0.0006039558454088793, + "time_sec": 132.2553505897522 + }, + { + "epoch": 66, + "train_loss": 4.561831217956543, + "train_acc": 0.01774, + "test_loss": 4.8608188064575195, + "test_acc": 0.01, + "lyapunov": 1.6523664268996099, + "grad_norm": 0.20210281079232253, + "grad_max_sv": 0.11968965604901313, + "grad_min_sv": 4.079266689805691e-13, + "grad_condition": 94202890917.05841, + "lr": 0.000593690657292862, + "time_sec": 132.31720495224 + }, + { + "epoch": 67, + "train_loss": 4.559810174102783, + "train_acc": 0.01622, + "test_loss": 5.090761659240723, + "test_acc": 0.01, + "lyapunov": 1.7058433745523243, + "grad_norm": 0.23830013952325338, + "grad_max_sv": 0.12983359694480895, + "grad_min_sv": 5.25592816536707e-13, + "grad_condition": 97314361174.40314, + "lr": 0.0005833843733580507, + "time_sec": 132.32061171531677 + }, + { + "epoch": 68, + "train_loss": 4.554318789825439, + "train_acc": 0.01838, + "test_loss": 4.8764984359741215, + "test_acc": 0.01, + "lyapunov": 1.6370756315148396, + "grad_norm": 0.24307746265962757, + "grad_max_sv": 0.1385297266766429, + "grad_min_sv": 9.516272992157032e-13, + "grad_condition": 89505578683.61617, + "lr": 0.0005730415142812054, + "time_sec": 132.23725128173828 + }, + { + "epoch": 69, + "train_loss": 4.550240862579345, + "train_acc": 0.01842, + "test_loss": 4.706728840637207, + "test_acc": 0.01, + "lyapunov": 1.663184766574284, + "grad_norm": 0.21914449833420702, + "grad_max_sv": 0.13847338538616896, + "grad_min_sv": 1.7555114994722528e-12, + "grad_condition": 84509930269.4158, + "lr": 0.0005626666167821517, + "time_sec": 132.21598196029663 + }, + { + "epoch": 70, + "train_loss": 4.543930948791504, + "train_acc": 0.01884, + "test_loss": 4.77112534942627, + "test_acc": 0.01, + "lyapunov": 1.6348076089263877, + "grad_norm": 0.22655722248414084, + "grad_max_sv": 0.13967302590608596, + "grad_min_sv": 1.7844730483685788e-12, + "grad_condition": 70169493780.52583, + "lr": 0.0005522642316338265, + "time_sec": 132.24659180641174 + }, + { + "epoch": 71, + "train_loss": 4.550147514495849, + "train_acc": 0.01862, + "test_loss": 4.834368143463135, + "test_acc": 0.01, + "lyapunov": 1.7937614118961422, + "grad_norm": 0.24793040499268879, + "grad_max_sv": 0.1327341727912426, + "grad_min_sv": 1.5079386468906054e-12, + "grad_condition": 74829595372.89197, + "lr": 0.0005418389216661573, + "time_sec": 132.2455804347992 + }, + { + "epoch": 72, + "train_loss": 4.552345445098877, + "train_acc": 0.01912, + "test_loss": 4.769914060974121, + "test_acc": 0.01, + "lyapunov": 1.8443064695733893, + "grad_norm": 0.24815260715084336, + "grad_max_sv": 0.13855412546545268, + "grad_min_sv": 1.2129411714186336e-12, + "grad_condition": 77310077550.77002, + "lr": 0.0005313952597646563, + "time_sec": 132.23443746566772 + }, + { + "epoch": 73, + "train_loss": 4.553061253204346, + "train_acc": 0.01776, + "test_loss": 4.776901901245117, + "test_acc": 0.01, + "lyapunov": 1.8784060618456673, + "grad_norm": 0.24206848836729325, + "grad_max_sv": 0.13422367088496684, + "grad_min_sv": 1.5502055586231123e-12, + "grad_condition": 74418694767.02853, + "lr": 0.0005209378268645994, + "time_sec": 132.2477297782898 + }, + { + "epoch": 74, + "train_loss": 4.5650504145812985, + "train_acc": 0.01726, + "test_loss": 4.677373085021973, + "test_acc": 0.01, + "lyapunov": 2.036505249760035, + "grad_norm": 0.32979269230794855, + "grad_max_sv": 0.1318796591833234, + "grad_min_sv": 1.646385209418448e-12, + "grad_condition": 63836897876.012314, + "lr": 0.0005104712099416781, + "time_sec": 132.22952890396118 + }, + { + "epoch": 75, + "train_loss": 4.57617336807251, + "train_acc": 0.01786, + "test_loss": 4.616835848999023, + "test_acc": 0.01, + "lyapunov": 2.030317187004382, + "grad_norm": 0.2938483296643333, + "grad_max_sv": 0.13414279446005822, + "grad_min_sv": 1.9340055446416965e-12, + "grad_condition": 73082641730.47269, + "lr": 0.0004999999999999996, + "time_sec": 132.25613594055176 + }, + { + "epoch": 76, + "train_loss": 4.565168632965088, + "train_acc": 0.0181, + "test_loss": 4.6201394668579105, + "test_acc": 0.01, + "lyapunov": 2.036142018749891, + "grad_norm": 0.5803969427460377, + "grad_max_sv": 0.13362037800252438, + "grad_min_sv": 6.107379101776952e-11, + "grad_condition": 60506096476.786255, + "lr": 0.0004895287900583212, + "time_sec": 132.27694129943848 + }, + { + "epoch": 77, + "train_loss": 4.553473384246826, + "train_acc": 0.01976, + "test_loss": 4.620628718566895, + "test_acc": 0.01, + "lyapunov": 2.0780328457312818, + "grad_norm": 0.2782704985845232, + "grad_max_sv": 0.14284589197486638, + "grad_min_sv": 1.854976659335083e-10, + "grad_condition": 42847233488.325554, + "lr": 0.0004790621731353997, + "time_sec": 132.26103115081787 + }, + { + "epoch": 78, + "train_loss": 4.5616140226745605, + "train_acc": 0.01792, + "test_loss": 4.626071022033692, + "test_acc": 0.01, + "lyapunov": 1.9671210581079468, + "grad_norm": 0.3415997663590008, + "grad_max_sv": 0.12938279159352534, + "grad_min_sv": 2.1680093232892384e-12, + "grad_condition": 62778606980.34462, + "lr": 0.000468604740235343, + "time_sec": 132.24888706207275 + }, + { + "epoch": 79, + "train_loss": 4.549584400177002, + "train_acc": 0.01758, + "test_loss": 4.6499050521850585, + "test_acc": 0.01, + "lyapunov": 1.6479191719113713, + "grad_norm": 0.22768486883056455, + "grad_max_sv": 0.13782267570495604, + "grad_min_sv": 2.2589190836196397e-12, + "grad_condition": 58187815931.14058, + "lr": 0.00045816107833384175, + "time_sec": 132.21508741378784 + }, + { + "epoch": 80, + "train_loss": 4.540716835632324, + "train_acc": 0.0182, + "test_loss": 4.6769668510437015, + "test_acc": 0.01, + "lyapunov": 1.6410039263917966, + "grad_norm": 0.22539273820118624, + "grad_max_sv": 0.1366339573636651, + "grad_min_sv": 2.3197873492747292e-12, + "grad_condition": 57510828453.82015, + "lr": 0.0004477357683661729, + "time_sec": 132.27885460853577 + }, + { + "epoch": 81, + "train_loss": 4.533609462127686, + "train_acc": 0.01882, + "test_loss": 4.681292281341553, + "test_acc": 0.01, + "lyapunov": 1.6682149348661417, + "grad_norm": 0.22496286921066277, + "grad_max_sv": 0.13073906544595956, + "grad_min_sv": 3.693996283659785e-12, + "grad_condition": 54723789821.69408, + "lr": 0.00043733338321784746, + "time_sec": 132.25836849212646 + }, + { + "epoch": 82, + "train_loss": 4.51605119140625, + "train_acc": 0.02174, + "test_loss": 4.7835935256958, + "test_acc": 0.01, + "lyapunov": 1.6646205598436048, + "grad_norm": 0.22712967887738475, + "grad_max_sv": 0.12587737049907446, + "grad_min_sv": 2.648945604018108e-11, + "grad_condition": 30196840277.8026, + "lr": 0.0004269584857187939, + "time_sec": 132.24180698394775 + }, + { + "epoch": 83, + "train_loss": 4.507941231689453, + "train_acc": 0.02448, + "test_loss": 4.827603370666504, + "test_acc": 0.01, + "lyapunov": 1.6704938301954733, + "grad_norm": 0.2269977774248034, + "grad_max_sv": 0.12395998779684306, + "grad_min_sv": 1.905802010946644e-11, + "grad_condition": 34294495028.09624, + "lr": 0.0004166156266419484, + "time_sec": 132.24390172958374 + }, + { + "epoch": 84, + "train_loss": 4.500372490997314, + "train_acc": 0.02542, + "test_loss": 4.876207922363281, + "test_acc": 0.01, + "lyapunov": 1.7214652272441504, + "grad_norm": 0.23132806515179782, + "grad_max_sv": 0.1210111577063799, + "grad_min_sv": 9.387468116625564e-11, + "grad_condition": 9621041096.566025, + "lr": 0.0004063093427071373, + "time_sec": 132.30067777633667 + }, + { + "epoch": 85, + "train_loss": 4.506775596313476, + "train_acc": 0.0252, + "test_loss": 5.014707362365723, + "test_acc": 0.01, + "lyapunov": 1.7590646134008228, + "grad_norm": 0.22830756689472873, + "grad_max_sv": 0.12346377000212669, + "grad_min_sv": 6.280843614910677e-11, + "grad_condition": 20432945180.96639, + "lr": 0.0003960441545911199, + "time_sec": 132.24875044822693 + }, + { + "epoch": 86, + "train_loss": 4.503674255065918, + "train_acc": 0.02502, + "test_loss": 5.123861147308349, + "test_acc": 0.01, + "lyapunov": 1.7873460773921683, + "grad_norm": 0.22793289150199839, + "grad_max_sv": 0.11887687053531408, + "grad_min_sv": 2.6847267894328664e-10, + "grad_condition": 7838790213.069723, + "lr": 0.0003858245649446718, + "time_sec": 132.22668957710266 + }, + { + "epoch": 87, + "train_loss": 4.497553546142578, + "train_acc": 0.02546, + "test_loss": 5.000641200256347, + "test_acc": 0.01, + "lyapunov": 1.7931315877553446, + "grad_norm": 0.2712504132074006, + "grad_max_sv": 0.11843320988118648, + "grad_min_sv": 4.4306743149992746e-10, + "grad_condition": 10999789171.998688, + "lr": 0.00037565505641757235, + "time_sec": 132.27767729759216 + }, + { + "epoch": 88, + "train_loss": 4.504041076202393, + "train_acc": 0.02544, + "test_loss": 4.800168603515625, + "test_acc": 0.01, + "lyapunov": 1.7431830390335044, + "grad_norm": 0.4357562034559732, + "grad_max_sv": 0.13997758310288191, + "grad_min_sv": 1.599969276164237e-09, + "grad_condition": 215412127.35240164, + "lr": 0.00036554008969236695, + "time_sec": 132.29276990890503 + }, + { + "epoch": 89, + "train_loss": 4.475532397766114, + "train_acc": 0.02664, + "test_loss": 4.715342008972168, + "test_acc": 0.01, + "lyapunov": 1.6543668587799267, + "grad_norm": 0.2534739131949124, + "grad_max_sv": 0.13988024070858956, + "grad_min_sv": 1.6967725441157342e-09, + "grad_condition": 1816488902.9373162, + "lr": 0.0003554841015277638, + "time_sec": 132.33469939231873 + }, + { + "epoch": 90, + "train_loss": 4.5014734359741215, + "train_acc": 0.02494, + "test_loss": 4.766956174468994, + "test_acc": 0.01, + "lyapunov": 1.6369030182928686, + "grad_norm": 0.2405872458143331, + "grad_max_sv": 0.13693566247820854, + "grad_min_sv": 1.1299910191672644e-09, + "grad_condition": 7905736012.59196, + "lr": 0.000345491502812526, + "time_sec": 132.27467131614685 + }, + { + "epoch": 91, + "train_loss": 4.4850330815124515, + "train_acc": 0.02662, + "test_loss": 4.801043357849121, + "test_acc": 0.01, + "lyapunov": 1.6205377401903158, + "grad_norm": 0.25251912836936496, + "grad_max_sv": 0.13310890551656485, + "grad_min_sv": 1.7584631463408647e-09, + "grad_condition": 410912188.385899, + "lr": 0.0003355666766307081, + "time_sec": 132.3292293548584 + }, + { + "epoch": 92, + "train_loss": 4.478285171203614, + "train_acc": 0.02732, + "test_loss": 4.725028746032715, + "test_acc": 0.01, + "lyapunov": 1.6160098134404253, + "grad_norm": 0.25441873002388926, + "grad_max_sv": 0.13993064705282449, + "grad_min_sv": 1.93155749849544e-09, + "grad_condition": 199751821.86601692, + "lr": 0.00032571397633909225, + "time_sec": 132.2692050933838 + }, + { + "epoch": 93, + "train_loss": 4.4908812908935545, + "train_acc": 0.02836, + "test_loss": 4.671359706878662, + "test_acc": 0.01, + "lyapunov": 1.6600854970000285, + "grad_norm": 0.2444473076879741, + "grad_max_sv": 0.1248008267953992, + "grad_min_sv": 1.7864780033766125e-09, + "grad_condition": 120785367.48652825, + "lr": 0.00031593772365766094, + "time_sec": 132.25391960144043 + }, + { + "epoch": 94, + "train_loss": 4.4584466459655765, + "train_acc": 0.03008, + "test_loss": 4.773041061401367, + "test_acc": 0.01, + "lyapunov": 1.7164468176834418, + "grad_norm": 0.28467917727076003, + "grad_max_sv": 0.1313628673553467, + "grad_min_sv": 2.0522267858182062e-09, + "grad_condition": 150691171.6565817, + "lr": 0.0003062422067739483, + "time_sec": 132.28487992286682 + }, + { + "epoch": 95, + "train_loss": 4.462513684997559, + "train_acc": 0.03022, + "test_loss": 4.732938203430176, + "test_acc": 0.01, + "lyapunov": 1.7166713040198207, + "grad_norm": 0.2757729585206691, + "grad_max_sv": 0.12017263405959966, + "grad_min_sv": 1.947814394511939e-09, + "grad_condition": 261551685.50113732, + "lr": 0.00029663167846209965, + "time_sec": 132.2222764492035 + }, + { + "epoch": 96, + "train_loss": 4.513658727264405, + "train_acc": 0.02456, + "test_loss": 4.7326889297485355, + "test_acc": 0.01, + "lyapunov": 1.7018064461705629, + "grad_norm": 0.2822470578312882, + "grad_max_sv": 0.12428085524588824, + "grad_min_sv": 1.1056017166490043e-09, + "grad_condition": 12431115528.428802, + "lr": 0.00028711035421746345, + "time_sec": 132.26545095443726 + }, + { + "epoch": 97, + "train_loss": 4.516728609924316, + "train_acc": 0.0237, + "test_loss": 4.853408081817627, + "test_acc": 0.01, + "lyapunov": 1.653851221284598, + "grad_norm": 0.27107311593465117, + "grad_max_sv": 0.12758918832987548, + "grad_min_sv": 3.289233621468757e-10, + "grad_condition": 28681461916.937225, + "lr": 0.00027768241040753615, + "time_sec": 132.2840976715088 + }, + { + "epoch": 98, + "train_loss": 4.533613332366944, + "train_acc": 0.02008, + "test_loss": 4.757841390228272, + "test_acc": 0.01, + "lyapunov": 1.6602956071839003, + "grad_norm": 0.24937887404647158, + "grad_max_sv": 0.12755668330937625, + "grad_min_sv": 1.637392221351119e-11, + "grad_condition": 35891878690.01149, + "lr": 0.00026835198244006903, + "time_sec": 132.26396775245667 + }, + { + "epoch": 99, + "train_loss": 4.516425126495362, + "train_acc": 0.02204, + "test_loss": 5.0689602409362795, + "test_acc": 0.01, + "lyapunov": 1.649671731397624, + "grad_norm": 0.3760428152634102, + "grad_max_sv": 0.12145681547117419, + "grad_min_sv": 2.465238532103251e-10, + "grad_condition": 26484335910.020866, + "lr": 0.0002591231629491421, + "time_sec": 132.25630021095276 + }, + { + "epoch": 100, + "train_loss": 4.46243141571045, + "train_acc": 0.02698, + "test_loss": 5.080750173950196, + "test_acc": 0.01, + "lyapunov": 1.683909809497921, + "grad_norm": 0.24604819581470147, + "grad_max_sv": 0.12949452698230743, + "grad_min_sv": 1.3873823402621444e-09, + "grad_condition": 205935504.09920138, + "lr": 0.0002499999999999997, + "time_sec": 132.31890201568604 + }, + { + "epoch": 101, + "train_loss": 4.479820979156494, + "train_acc": 0.02656, + "test_loss": 5.241960939025879, + "test_acc": 0.01, + "lyapunov": 1.6413938111966224, + "grad_norm": 0.26545021941029495, + "grad_max_sv": 0.12426532283425332, + "grad_min_sv": 1.1097413117838826e-09, + "grad_condition": 6543202862.376254, + "lr": 0.00024098649531343477, + "time_sec": 132.3456118106842 + }, + { + "epoch": 102, + "train_loss": 4.48857103805542, + "train_acc": 0.02512, + "test_loss": 4.846586625671387, + "test_acc": 0.01, + "lyapunov": 1.6577006459541028, + "grad_norm": 0.2771691413716041, + "grad_max_sv": 0.11552865523844957, + "grad_min_sv": 8.681243191128172e-10, + "grad_condition": 11207902327.633982, + "lr": 0.0002320866025105016, + "time_sec": 132.33533692359924 + }, + { + "epoch": 103, + "train_loss": 4.532757512359619, + "train_acc": 0.02206, + "test_loss": 4.91052190246582, + "test_acc": 0.01, + "lyapunov": 1.7228632836085755, + "grad_norm": 0.26346543636546327, + "grad_max_sv": 0.11417562378883303, + "grad_min_sv": 8.0661757120252e-11, + "grad_condition": 32678271343.199852, + "lr": 0.0002233042253783278, + "time_sec": 132.22725749015808 + }, + { + "epoch": 104, + "train_loss": 4.517958878479004, + "train_acc": 0.0249, + "test_loss": 5.279689112854004, + "test_acc": 0.01, + "lyapunov": 1.713277810065033, + "grad_norm": 0.21405138195083573, + "grad_max_sv": 0.11346618756651879, + "grad_min_sv": 8.99416673544361e-12, + "grad_condition": 26709079521.762756, + "lr": 0.000214643216157784, + "time_sec": 132.2524712085724 + }, + { + "epoch": 105, + "train_loss": 4.522473559875488, + "train_acc": 0.02324, + "test_loss": 4.910793183135986, + "test_acc": 0.01, + "lyapunov": 1.760302792119858, + "grad_norm": 0.2193211536414268, + "grad_max_sv": 0.12119325567036868, + "grad_min_sv": 4.266613421611516e-11, + "grad_condition": 41317958682.32074, + "lr": 0.00020610737385376332, + "time_sec": 132.2919180393219 + }, + { + "epoch": 106, + "train_loss": 4.5262701414489745, + "train_acc": 0.02212, + "test_loss": 4.780918911743164, + "test_acc": 0.01, + "lyapunov": 1.8881931195173727, + "grad_norm": 0.22447681715550066, + "grad_max_sv": 0.12109036315232516, + "grad_min_sv": 2.540523981257295e-10, + "grad_condition": 22443327399.1386, + "lr": 0.00019770044256881242, + "time_sec": 132.2804832458496 + }, + { + "epoch": 107, + "train_loss": 4.517831496887207, + "train_acc": 0.02178, + "test_loss": 4.859129156494141, + "test_acc": 0.01, + "lyapunov": 1.7496231952896508, + "grad_norm": 0.24404950114508223, + "grad_max_sv": 0.10989357913349522, + "grad_min_sv": 1.2062066598699504e-10, + "grad_condition": 24861620610.77468, + "lr": 0.0001894261098608447, + "time_sec": 132.2669916152954 + }, + { + "epoch": 108, + "train_loss": 4.524006955108643, + "train_acc": 0.022, + "test_loss": 4.818874195861817, + "test_acc": 0.01, + "lyapunov": 1.7341366472756465, + "grad_norm": 0.26306425817630436, + "grad_max_sv": 0.11322787757962942, + "grad_min_sv": 8.81599610096784e-11, + "grad_condition": 29169330613.728638, + "lr": 0.000181288005125655, + "time_sec": 132.24967575073242 + }, + { + "epoch": 109, + "train_loss": 4.523561717224121, + "train_acc": 0.02132, + "test_loss": 4.89949398727417, + "test_acc": 0.01, + "lyapunov": 1.7583422078500928, + "grad_norm": 0.2680652540380179, + "grad_max_sv": 0.11568452939391136, + "grad_min_sv": 1.8575990422427677e-10, + "grad_condition": 29865077677.922016, + "lr": 0.0001732896980049473, + "time_sec": 132.27372288703918 + }, + { + "epoch": 110, + "train_loss": 4.523985668182373, + "train_acc": 0.02156, + "test_loss": 4.934449282073975, + "test_acc": 0.01, + "lyapunov": 1.7785463793503353, + "grad_norm": 0.29105138013714615, + "grad_max_sv": 0.11333111306885257, + "grad_min_sv": 1.1142799980158278e-10, + "grad_condition": 32626806046.198414, + "lr": 0.00016543469682057076, + "time_sec": 132.35266971588135 + }, + { + "epoch": 111, + "train_loss": 4.5137792361450195, + "train_acc": 0.02256, + "test_loss": 5.328282705688476, + "test_acc": 0.01, + "lyapunov": 1.784282084316244, + "grad_norm": 0.2718568628101196, + "grad_max_sv": 0.11029190895551437, + "grad_min_sv": 3.2994620465780594e-11, + "grad_condition": 21435932574.82325, + "lr": 0.00015772644703565552, + "time_sec": 132.29639315605164 + }, + { + "epoch": 112, + "train_loss": 4.5287425050354, + "train_acc": 0.02154, + "test_loss": 4.866233026885986, + "test_acc": 0.01, + "lyapunov": 1.8234167659983915, + "grad_norm": 0.7181696676152709, + "grad_max_sv": 0.11080491679967963, + "grad_min_sv": 9.598411841196433e-11, + "grad_condition": 21131646151.302395, + "lr": 0.00015016832974331713, + "time_sec": 132.22785329818726 + }, + { + "epoch": 113, + "train_loss": 4.53446008102417, + "train_acc": 0.02172, + "test_loss": 4.7556414230346675, + "test_acc": 0.01, + "lyapunov": 1.8720827319128128, + "grad_norm": 0.2982424838317109, + "grad_max_sv": 0.11564233805984259, + "grad_min_sv": 1.1366100612204778e-11, + "grad_condition": 33297559189.110718, + "lr": 0.00014276366018359834, + "time_sec": 132.28487348556519 + }, + { + "epoch": 114, + "train_loss": 4.532152935791015, + "train_acc": 0.02186, + "test_loss": 4.865617831420899, + "test_acc": 0.01, + "lyapunov": 1.8749572075236485, + "grad_norm": 0.3128369100696859, + "grad_max_sv": 0.10889359122447786, + "grad_min_sv": 1.121567636669266e-11, + "grad_condition": 32329751107.46931, + "lr": 0.00013551568628929425, + "time_sec": 132.27337980270386 + }, + { + "epoch": 115, + "train_loss": 4.53541379989624, + "train_acc": 0.02112, + "test_loss": 4.741897981262207, + "test_acc": 0.01, + "lyapunov": 1.9057784431120928, + "grad_norm": 0.2745511633601485, + "grad_max_sv": 0.12013480849564076, + "grad_min_sv": 1.335206909740819e-10, + "grad_condition": 26511680388.403683, + "lr": 0.00012842758726130276, + "time_sec": 132.32796025276184 + }, + { + "epoch": 116, + "train_loss": 4.528167925415039, + "train_acc": 0.02226, + "test_loss": 4.780342037963867, + "test_acc": 0.01, + "lyapunov": 1.8732325488039294, + "grad_norm": 0.26257944903115926, + "grad_max_sv": 0.1154415562748909, + "grad_min_sv": 1.6041397823653636e-11, + "grad_condition": 34787258241.614006, + "lr": 0.0001215024721741218, + "time_sec": 132.2490336894989 + }, + { + "epoch": 117, + "train_loss": 4.522953644866943, + "train_acc": 0.02162, + "test_loss": 4.739641496276856, + "test_acc": 0.01, + "lyapunov": 1.8529656442534892, + "grad_norm": 0.2727268094706684, + "grad_max_sv": 0.11305988898384385, + "grad_min_sv": 1.9489078277227068e-11, + "grad_condition": 18271460472.81977, + "lr": 0.00011474337861210538, + "time_sec": 132.25032210350037 + }, + { + "epoch": 118, + "train_loss": 4.522515398864746, + "train_acc": 0.0218, + "test_loss": 4.743156268310547, + "test_acc": 0.01, + "lyapunov": 1.8354669568483786, + "grad_norm": 0.21812995158496862, + "grad_max_sv": 0.11335933059453965, + "grad_min_sv": 1.7770811345629422e-11, + "grad_condition": 24365563841.45679, + "lr": 0.00010815327133708009, + "time_sec": 132.2527687549591 + }, + { + "epoch": 119, + "train_loss": 4.525841431427002, + "train_acc": 0.02164, + "test_loss": 4.714016912841797, + "test_acc": 0.01, + "lyapunov": 1.8096261015328605, + "grad_norm": 0.2933400535775977, + "grad_max_sv": 0.1168335797265172, + "grad_min_sv": 1.6312611610585672e-10, + "grad_condition": 20918604889.922924, + "lr": 0.00010173504098790182, + "time_sec": 132.267231464386 + }, + { + "epoch": 120, + "train_loss": 4.51864777267456, + "train_acc": 0.02246, + "test_loss": 4.818260918426514, + "test_acc": 0.01, + "lyapunov": 1.7693779590489613, + "grad_norm": 0.20718951240601688, + "grad_max_sv": 0.10794953405857086, + "grad_min_sv": 1.1165816146560076e-11, + "grad_condition": 26004625908.123756, + "lr": 9.549150281252629e-05, + "time_sec": 132.24092316627502 + }, + { + "epoch": 121, + "train_loss": 4.513626610717774, + "train_acc": 0.02172, + "test_loss": 4.7877141441345215, + "test_acc": 0.01, + "lyapunov": 1.7112558006935412, + "grad_norm": 0.20441382058891275, + "grad_max_sv": 0.10070603135973215, + "grad_min_sv": 5.326116745754119e-12, + "grad_condition": 32954861968.91792, + "lr": 8.942539543314794e-05, + "time_sec": 132.32292103767395 + }, + { + "epoch": 122, + "train_loss": 4.511023434753418, + "train_acc": 0.02162, + "test_loss": 4.857227470397949, + "test_acc": 0.01, + "lyapunov": 1.7272964283023649, + "grad_norm": 0.2021428518858731, + "grad_max_sv": 0.10296436455100774, + "grad_min_sv": 1.5577700448207808e-11, + "grad_condition": 18482807609.52593, + "lr": 8.353937964495024e-05, + "time_sec": 132.6510660648346 + }, + { + "epoch": 123, + "train_loss": 4.514791604614258, + "train_acc": 0.02288, + "test_loss": 4.8252052871704105, + "test_acc": 0.01, + "lyapunov": 1.740580289565084, + "grad_norm": 0.22696240060148393, + "grad_max_sv": 0.09938969779759646, + "grad_min_sv": 1.1437882548238259e-11, + "grad_condition": 16302265342.370092, + "lr": 7.783603724899243e-05, + "time_sec": 132.3826994895935 + }, + { + "epoch": 124, + "train_loss": 4.514339904327392, + "train_acc": 0.0222, + "test_loss": 4.813984481048584, + "test_acc": 0.01, + "lyapunov": 1.689259083984453, + "grad_norm": 0.19852103630620363, + "grad_max_sv": 0.09858787786215543, + "grad_min_sv": 1.0750563341485877e-11, + "grad_condition": 22030501554.32871, + "lr": 7.231786991974666e-05, + "time_sec": 132.5738594532013 + }, + { + "epoch": 125, + "train_loss": 4.514390753021241, + "train_acc": 0.02248, + "test_loss": 4.80667377166748, + "test_acc": 0.01, + "lyapunov": 1.7182339295706786, + "grad_norm": 0.19942460460386832, + "grad_max_sv": 0.100060392357409, + "grad_min_sv": 1.1270956048217663e-11, + "grad_condition": 22823012362.790337, + "lr": 6.698729810778072e-05, + "time_sec": 132.50823545455933 + }, + { + "epoch": 126, + "train_loss": 4.515155561218262, + "train_acc": 0.02208, + "test_loss": 4.83121703338623, + "test_acc": 0.01, + "lyapunov": 1.7485487692801238, + "grad_norm": 0.19913025130743606, + "grad_max_sv": 0.10064963772892951, + "grad_min_sv": 6.303761677791352e-12, + "grad_condition": 29996291803.755657, + "lr": 6.184665997806817e-05, + "time_sec": 132.32139468193054 + }, + { + "epoch": 127, + "train_loss": 4.519498745880127, + "train_acc": 0.0222, + "test_loss": 4.82270682220459, + "test_acc": 0.01, + "lyapunov": 1.753368593542777, + "grad_norm": 0.19807610716386245, + "grad_max_sv": 0.09752303529530763, + "grad_min_sv": 8.666520092513058e-12, + "grad_condition": 19023641146.62214, + "lr": 5.6898210384392595e-05, + "time_sec": 132.26067113876343 + }, + { + "epoch": 128, + "train_loss": 4.52323801864624, + "train_acc": 0.02056, + "test_loss": 5.1514449867248535, + "test_acc": 0.01, + "lyapunov": 1.7695821017560447, + "grad_norm": 0.22231031444321495, + "grad_max_sv": 0.09464265571295982, + "grad_min_sv": 3.8691049872084295e-12, + "grad_condition": 37862315656.40668, + "lr": 5.214411988029363e-05, + "time_sec": 132.34855723381042 + }, + { + "epoch": 129, + "train_loss": 4.52958849609375, + "train_acc": 0.02132, + "test_loss": 4.817114677429199, + "test_acc": 0.01, + "lyapunov": 1.8197325367451933, + "grad_norm": 0.22038917478813003, + "grad_max_sv": 0.09654771145433187, + "grad_min_sv": 3.837805751108681e-12, + "grad_condition": 34720840003.96797, + "lr": 4.7586473766990294e-05, + "time_sec": 132.38166642189026 + }, + { + "epoch": 130, + "train_loss": 4.534138793182373, + "train_acc": 0.02068, + "test_loss": 4.817256965637207, + "test_acc": 0.01, + "lyapunov": 1.8883260424484682, + "grad_norm": 0.197257535011672, + "grad_max_sv": 0.09597008451819419, + "grad_min_sv": 3.749032975950144e-12, + "grad_condition": 35630604171.973366, + "lr": 4.32272711786996e-05, + "time_sec": 132.3463578224182 + }, + { + "epoch": 131, + "train_loss": 4.560665507507324, + "train_acc": 0.0201, + "test_loss": 7.84898078994751, + "test_acc": 0.01, + "lyapunov": 2.1612947828629436, + "grad_norm": 0.898704109268479, + "grad_max_sv": 0.09020924572396324, + "grad_min_sv": 2.4590256743041826e-12, + "grad_condition": 40183040789.80008, + "lr": 3.906842420574966e-05, + "time_sec": 132.34411454200745 + }, + { + "epoch": 132, + "train_loss": 4.662711235961914, + "train_acc": 0.00912, + "test_loss": 4.675270185089111, + "test_acc": 0.01, + "lyapunov": 1.9170365873200204, + "grad_norm": 0.985529140055845, + "grad_max_sv": 0.052365996095613807, + "grad_min_sv": 5.043138273528284e-14, + "grad_condition": 49945086388.40376, + "lr": 3.5111757055874305e-05, + "time_sec": 132.29924774169922 + }, + { + "epoch": 133, + "train_loss": 4.558833842926026, + "train_acc": 0.0205, + "test_loss": 4.983620196533203, + "test_acc": 0.01, + "lyapunov": 2.437913965081315, + "grad_norm": 0.21719174539007674, + "grad_max_sv": 0.08432087264955043, + "grad_min_sv": 1.9419044561864295e-11, + "grad_condition": 24698029231.81626, + "lr": 3.1359005254054254e-05, + "time_sec": 132.27533149719238 + }, + { + "epoch": 134, + "train_loss": 4.549310289154053, + "train_acc": 0.02206, + "test_loss": 4.795253966522217, + "test_acc": 0.01, + "lyapunov": 2.4131780234749054, + "grad_norm": 0.22633597958807397, + "grad_max_sv": 0.09607531521469355, + "grad_min_sv": 3.153909599474668e-11, + "grad_condition": 21769631631.395184, + "lr": 2.7811814881259484e-05, + "time_sec": 132.20576786994934 + }, + { + "epoch": 135, + "train_loss": 4.550494029846192, + "train_acc": 0.02158, + "test_loss": 4.974422496032715, + "test_acc": 0.01, + "lyapunov": 2.2027124742717694, + "grad_norm": 0.37152128441369414, + "grad_max_sv": 0.0963487543962401, + "grad_min_sv": 9.98336880508485e-12, + "grad_condition": 36623182309.58069, + "lr": 2.4471741852423218e-05, + "time_sec": 132.19467067718506 + }, + { + "epoch": 136, + "train_loss": 4.6452084017944335, + "train_acc": 0.01278, + "test_loss": 4.613780563354492, + "test_acc": 0.01, + "lyapunov": 2.255611063574281, + "grad_norm": 1.8213468014305785, + "grad_max_sv": 0.053157788801672726, + "grad_min_sv": 1.0857787411328158e-12, + "grad_condition": 28889157844.30957, + "lr": 2.1340251233966362e-05, + "time_sec": 132.17661714553833 + }, + { + "epoch": 137, + "train_loss": 4.607472053527832, + "train_acc": 0.01634, + "test_loss": 4.916742666625977, + "test_acc": 0.01, + "lyapunov": 2.1947204740456, + "grad_norm": 1.1710449526904079, + "grad_max_sv": 0.07145409461636518, + "grad_min_sv": 1.5808348310341834e-12, + "grad_condition": 36654784264.39657, + "lr": 1.8418716601170932e-05, + "time_sec": 132.27569031715393 + }, + { + "epoch": 138, + "train_loss": 4.559258212890625, + "train_acc": 0.01984, + "test_loss": 4.965542991638183, + "test_acc": 0.01, + "lyapunov": 1.9919700287187192, + "grad_norm": 0.3580203625288606, + "grad_max_sv": 0.08741460712626577, + "grad_min_sv": 2.8563584239449506e-12, + "grad_condition": 35594890478.84314, + "lr": 1.570841943568445e-05, + "time_sec": 132.1866273880005 + }, + { + "epoch": 139, + "train_loss": 4.539822565460205, + "train_acc": 0.02032, + "test_loss": 4.894291995239258, + "test_acc": 0.01, + "lyapunov": 1.8103657451736959, + "grad_norm": 0.23861458794790022, + "grad_max_sv": 0.09107699207961559, + "grad_min_sv": 2.0939648879582646e-12, + "grad_condition": 40673153141.73503, + "lr": 1.3210548563419845e-05, + "time_sec": 132.21299076080322 + }, + { + "epoch": 140, + "train_loss": 4.528692821044922, + "train_acc": 0.0213, + "test_loss": 4.894965370178222, + "test_acc": 0.01, + "lyapunov": 1.788401810714351, + "grad_norm": 0.1949135712264777, + "grad_max_sv": 0.10017000269144774, + "grad_min_sv": 9.242681210645215e-12, + "grad_condition": 31313851187.813477, + "lr": 1.0926199633097203e-05, + "time_sec": 132.26792335510254 + }, + { + "epoch": 141, + "train_loss": 4.521334162139892, + "train_acc": 0.02234, + "test_loss": 4.86794594039917, + "test_acc": 0.01, + "lyapunov": 1.7388252769894612, + "grad_norm": 0.19475066885733908, + "grad_max_sv": 0.09781918786466122, + "grad_min_sv": 5.0263400937862384e-12, + "grad_condition": 31987601671.577065, + "lr": 8.856374635655688e-06, + "time_sec": 132.1968493461609 + }, + { + "epoch": 142, + "train_loss": 4.519183606109619, + "train_acc": 0.02114, + "test_loss": 4.901071472930909, + "test_acc": 0.01, + "lyapunov": 1.728894598343793, + "grad_norm": 0.19584047962539464, + "grad_max_sv": 0.09894849732518196, + "grad_min_sv": 9.404661996883385e-12, + "grad_condition": 29714150029.761383, + "lr": 7.001981464747503e-06, + "time_sec": 132.22681641578674 + }, + { + "epoch": 143, + "train_loss": 4.51677712387085, + "train_acc": 0.0226, + "test_loss": 4.950763639068604, + "test_acc": 0.01, + "lyapunov": 1.7029225710407851, + "grad_norm": 0.1968831393258508, + "grad_max_sv": 0.09533613510429859, + "grad_min_sv": 6.3565684754222856e-12, + "grad_condition": 27338799720.47678, + "lr": 5.3638335185058295e-06, + "time_sec": 132.20126152038574 + }, + { + "epoch": 144, + "train_loss": 4.518185277557373, + "train_acc": 0.02152, + "test_loss": 4.9513655952453615, + "test_acc": 0.01, + "lyapunov": 1.715206102946835, + "grad_norm": 0.19730468315875627, + "grad_max_sv": 0.09847171790897846, + "grad_min_sv": 8.042904299650991e-12, + "grad_condition": 25412259314.74212, + "lr": 3.942649342761114e-06, + "time_sec": 132.23193264007568 + }, + { + "epoch": 145, + "train_loss": 4.517314046325684, + "train_acc": 0.02308, + "test_loss": 5.002078984069824, + "test_acc": 0.01, + "lyapunov": 1.7169002776255693, + "grad_norm": 0.19706530472999553, + "grad_max_sv": 0.09748229458928108, + "grad_min_sv": 7.765136579259477e-12, + "grad_condition": 27711081726.502644, + "lr": 2.7390523158633524e-06, + "time_sec": 132.21612977981567 + }, + { + "epoch": 146, + "train_loss": 4.518855401306152, + "train_acc": 0.02096, + "test_loss": 5.010985830688477, + "test_acc": 0.01, + "lyapunov": 1.7291874501406383, + "grad_norm": 0.19669875555858216, + "grad_max_sv": 0.09733824878931045, + "grad_min_sv": 8.8679570698952e-12, + "grad_condition": 26609168229.480072, + "lr": 1.7535703752478133e-06, + "time_sec": 132.23784112930298 + }, + { + "epoch": 147, + "train_loss": 4.521316411132813, + "train_acc": 0.02082, + "test_loss": 5.031257997131347, + "test_acc": 0.01, + "lyapunov": 1.750539176604327, + "grad_norm": 0.19820855844552607, + "grad_max_sv": 0.09823240488767623, + "grad_min_sv": 5.8439703333718986e-12, + "grad_condition": 26546075710.87718, + "lr": 9.866357858642196e-07, + "time_sec": 132.26315879821777 + }, + { + "epoch": 148, + "train_loss": 4.521538203735352, + "train_acc": 0.02092, + "test_loss": 4.780371436309815, + "test_acc": 0.01, + "lyapunov": 1.7696317013572245, + "grad_norm": 0.20015199634206132, + "grad_max_sv": 0.0979210464283824, + "grad_min_sv": 6.957044250287782e-12, + "grad_condition": 28364480954.837574, + "lr": 4.38584950570808e-07, + "time_sec": 132.29415655136108 + }, + { + "epoch": 149, + "train_loss": 4.519690438537598, + "train_acc": 0.02194, + "test_loss": 4.993109432983398, + "test_acc": 0.01, + "lyapunov": 1.785507148489013, + "grad_norm": 0.20307877192283708, + "grad_max_sv": 0.10153117403388023, + "grad_min_sv": 6.7784031204093226e-12, + "grad_condition": 28739201400.2667, + "lr": 1.096582625772501e-07, + "time_sec": 132.2059965133667 + }, + { + "epoch": 150, + "train_loss": 4.520359083557129, + "train_acc": 0.02202, + "test_loss": 4.901946855926513, + "test_acc": 0.01, + "lyapunov": 1.799182962883464, + "grad_norm": 0.2039110690313897, + "grad_max_sv": 0.09756326731294393, + "grad_min_sv": 4.4820535969792195e-12, + "grad_condition": 30003518175.60987, + "lr": 0.0, + "time_sec": 132.2337782382965 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 5.048916976470947, + "train_acc": 0.01594, + "test_loss": 4.9240590103149415, + "test_acc": 0.0102, + "lyapunov": 2.4990125623200554, + "grad_norm": 5.2089414732509765, + "grad_max_sv": 4.538620001077652, + "grad_min_sv": 8.666914707022854e-08, + "grad_condition": 71759294.12196848, + "lr": 0.0009998903417374227, + "time_sec": 177.55314326286316 + }, + { + "epoch": 2, + "train_loss": 4.772639881439209, + "train_acc": 0.01864, + "test_loss": 4.818304029846192, + "test_acc": 0.0099, + "lyapunov": 2.0309148563448427, + "grad_norm": 3.4409358068870906, + "grad_max_sv": 2.870414561033249, + "grad_min_sv": 5.6283518207189687e-08, + "grad_condition": 73586735.46131077, + "lr": 0.0009995614150494292, + "time_sec": 177.54819798469543 + }, + { + "epoch": 3, + "train_loss": 4.669093980712891, + "train_acc": 0.01662, + "test_loss": 4.840026252746582, + "test_acc": 0.01, + "lyapunov": 1.8127321257920521, + "grad_norm": 3.5740462449452233, + "grad_max_sv": 1.5858038313788256, + "grad_min_sv": 3.197712202629892e-08, + "grad_condition": 124519530.3269566, + "lr": 0.0009990133642141358, + "time_sec": 177.56600260734558 + }, + { + "epoch": 4, + "train_loss": 4.6450184385681155, + "train_acc": 0.01972, + "test_loss": 4.742011805725098, + "test_acc": 0.01, + "lyapunov": 1.7917253379626652, + "grad_norm": 2.17612890921667, + "grad_max_sv": 1.7586730420589447, + "grad_min_sv": 3.2549927386771314e-08, + "grad_condition": 64076200.61726785, + "lr": 0.0009982464296247522, + "time_sec": 177.51368522644043 + }, + { + "epoch": 5, + "train_loss": 4.594644748687744, + "train_acc": 0.01754, + "test_loss": 4.605577088928222, + "test_acc": 0.01, + "lyapunov": 1.7579119772557408, + "grad_norm": 1.333506716487397, + "grad_max_sv": 1.0378288313746453, + "grad_min_sv": 1.8859317916021556e-08, + "grad_condition": 28097615866.07615, + "lr": 0.0009972609476841367, + "time_sec": 177.39786744117737 + }, + { + "epoch": 6, + "train_loss": 4.566596083679199, + "train_acc": 0.01696, + "test_loss": 4.624316529083252, + "test_acc": 0.01, + "lyapunov": 1.725943365670226, + "grad_norm": 0.9295373030977598, + "grad_max_sv": 0.5246448639780283, + "grad_min_sv": 5.9647606552511474e-09, + "grad_condition": 27370389371.584316, + "lr": 0.000996057350657239, + "time_sec": 177.5635268688202 + }, + { + "epoch": 7, + "train_loss": 4.573716998138428, + "train_acc": 0.01464, + "test_loss": 4.612767818450927, + "test_acc": 0.01, + "lyapunov": 1.7216917270284784, + "grad_norm": 0.48102952278246336, + "grad_max_sv": 0.38973032161593435, + "grad_min_sv": 3.736115294508798e-12, + "grad_condition": 134717305996.98454, + "lr": 0.000994636166481494, + "time_sec": 177.48547768592834 + }, + { + "epoch": 8, + "train_loss": 4.579797831115723, + "train_acc": 0.0145, + "test_loss": 4.623975819396972, + "test_acc": 0.01, + "lyapunov": 1.7258502177875061, + "grad_norm": 0.47333241602721, + "grad_max_sv": 0.37056842595338824, + "grad_min_sv": 1.4536960770203518e-12, + "grad_condition": 195457646315.7444, + "lr": 0.0009929980185352525, + "time_sec": 177.41426181793213 + }, + { + "epoch": 9, + "train_loss": 4.584737917633056, + "train_acc": 0.01374, + "test_loss": 4.618178663635254, + "test_acc": 0.01, + "lyapunov": 1.7207769378066977, + "grad_norm": 0.3840862596529102, + "grad_max_sv": 0.3212647676467896, + "grad_min_sv": 6.28349602709914e-13, + "grad_condition": 221408206735.65436, + "lr": 0.0009911436253643444, + "time_sec": 177.4136345386505 + }, + { + "epoch": 10, + "train_loss": 4.587927213897705, + "train_acc": 0.01364, + "test_loss": 4.62291756439209, + "test_acc": 0.01, + "lyapunov": 1.7215617986591272, + "grad_norm": 0.34052724634366244, + "grad_max_sv": 0.2760568205267191, + "grad_min_sv": 4.4077968183598767e-13, + "grad_condition": 207542599082.03424, + "lr": 0.0009890738003669028, + "time_sec": 177.3738307952881 + }, + { + "epoch": 11, + "train_loss": 4.5979031567382815, + "train_acc": 0.01294, + "test_loss": 4.6055679046630855, + "test_acc": 0.01, + "lyapunov": 1.7119133194999012, + "grad_norm": 0.28533253906361805, + "grad_max_sv": 0.22682507038116456, + "grad_min_sv": 3.0256303555137105e-13, + "grad_condition": 192169493993.88373, + "lr": 0.00098678945143658, + "time_sec": 177.4079394340515 + }, + { + "epoch": 12, + "train_loss": 4.60866346786499, + "train_acc": 0.01188, + "test_loss": 4.643439791870117, + "test_acc": 0.01, + "lyapunov": 1.7418107398025824, + "grad_norm": 0.22796411790946616, + "grad_max_sv": 0.18424283824861049, + "grad_min_sv": 6.381518018275396e-15, + "grad_condition": 183152957950.82562, + "lr": 0.0009842915805643154, + "time_sec": 177.39781975746155 + }, + { + "epoch": 13, + "train_loss": 4.610555019989014, + "train_acc": 0.01114, + "test_loss": 4.886381156921387, + "test_acc": 0.01, + "lyapunov": 1.781030819239214, + "grad_norm": 0.2991067631049297, + "grad_max_sv": 0.16204121466726065, + "grad_min_sv": 9.856118836595678e-18, + "grad_condition": 162039129961.8548, + "lr": 0.000981581283398829, + "time_sec": 177.444970369339 + }, + { + "epoch": 14, + "train_loss": 4.6126707130432125, + "train_acc": 0.01126, + "test_loss": 4.628372909545899, + "test_acc": 0.01, + "lyapunov": 1.725750547235884, + "grad_norm": 0.26417721241928865, + "grad_max_sv": 0.2243590321391821, + "grad_min_sv": 3.902749481375659e-15, + "grad_condition": 223472966711.7526, + "lr": 0.0009786597487660333, + "time_sec": 177.3752899169922 + }, + { + "epoch": 15, + "train_loss": 4.617655180206299, + "train_acc": 0.01182, + "test_loss": 4.621595803833007, + "test_acc": 0.01, + "lyapunov": 1.718031684151086, + "grad_norm": 0.30598909964825266, + "grad_max_sv": 0.27787347659468653, + "grad_min_sv": 8.767420220263753e-19, + "grad_condition": 277873177485.7358, + "lr": 0.0009755282581475766, + "time_sec": 177.3603708744049 + }, + { + "epoch": 16, + "train_loss": 4.622196079406739, + "train_acc": 0.01076, + "test_loss": 4.607522448730469, + "test_acc": 0.01, + "lyapunov": 1.7246177007475167, + "grad_norm": 0.3521789068955868, + "grad_max_sv": 0.3038882542401552, + "grad_min_sv": 1.2016902643201833e-15, + "grad_condition": 303454077086.20264, + "lr": 0.0009721881851187403, + "time_sec": 177.4582462310791 + }, + { + "epoch": 17, + "train_loss": 4.624571969909668, + "train_acc": 0.01036, + "test_loss": 4.606505413818359, + "test_acc": 0.01, + "lyapunov": 1.723605226982585, + "grad_norm": 0.38326593546292337, + "grad_max_sv": 0.3560586102306843, + "grad_min_sv": 2.0395849787621002e-18, + "grad_condition": 356057690991.14233, + "lr": 0.0009686409947459456, + "time_sec": 177.44416284561157 + }, + { + "epoch": 18, + "train_loss": 4.621964686126709, + "train_acc": 0.01194, + "test_loss": 4.6524422760009765, + "test_acc": 0.01, + "lyapunov": 1.7237175431702754, + "grad_norm": 0.42933412334227883, + "grad_max_sv": 0.34594915360212325, + "grad_min_sv": 2.951910203399657e-14, + "grad_condition": 338685423000.5939, + "lr": 0.0009648882429441254, + "time_sec": 177.52524948120117 + }, + { + "epoch": 19, + "train_loss": 4.627113620605469, + "train_acc": 0.0119, + "test_loss": 4.723296948242187, + "test_acc": 0.01, + "lyapunov": 1.729295022042511, + "grad_norm": 0.4059603924941295, + "grad_max_sv": 0.3793640684336424, + "grad_min_sv": 1.8575480189516096e-14, + "grad_condition": 373763779828.7423, + "lr": 0.00096093157579425, + "time_sec": 177.42243647575378 + }, + { + "epoch": 20, + "train_loss": 4.629038185424805, + "train_acc": 0.01024, + "test_loss": 4.753069805908203, + "test_acc": 0.01, + "lyapunov": 1.7227031398002448, + "grad_norm": 0.4075854332347789, + "grad_max_sv": 0.3644769866019487, + "grad_min_sv": 5.198212783961593e-17, + "grad_condition": 364460664015.28894, + "lr": 0.0009567727288213001, + "time_sec": 177.4082248210907 + }, + { + "epoch": 21, + "train_loss": 4.631191472625733, + "train_acc": 0.01058, + "test_loss": 4.638436957550049, + "test_acc": 0.01, + "lyapunov": 1.7267242444445714, + "grad_norm": 0.5086938418182457, + "grad_max_sv": 0.3896265499293804, + "grad_min_sv": 1.5346327658226146e-14, + "grad_condition": 383817509478.4017, + "lr": 0.0009524135262330095, + "time_sec": 177.36780858039856 + }, + { + "epoch": 22, + "train_loss": 4.62202378829956, + "train_acc": 0.01184, + "test_loss": 4.953248652648925, + "test_acc": 0.01, + "lyapunov": 1.73959963461932, + "grad_norm": 0.5026420951215756, + "grad_max_sv": 0.46916041933000086, + "grad_min_sv": 1.0611509345471128e-13, + "grad_condition": 433404810081.4076, + "lr": 0.0009478558801197061, + "time_sec": 177.39120984077454 + }, + { + "epoch": 23, + "train_loss": 4.655561924285888, + "train_acc": 0.01134, + "test_loss": 4.614388928985596, + "test_acc": 0.01, + "lyapunov": 1.7158038116172147, + "grad_norm": 1.1810184586126122, + "grad_max_sv": 0.4519379799548915, + "grad_min_sv": 7.408418462277921e-13, + "grad_condition": 323219770597.8288, + "lr": 0.000943101789615607, + "time_sec": 177.46234154701233 + }, + { + "epoch": 24, + "train_loss": 4.6525478160095215, + "train_acc": 0.01046, + "test_loss": 4.583759087371826, + "test_acc": 0.0136, + "lyapunov": 1.7016837676162915, + "grad_norm": 0.4223871229931315, + "grad_max_sv": 0.35212441682815554, + "grad_min_sv": 4.57826367676092e-13, + "grad_condition": 268725051834.9417, + "lr": 0.0009381533400219313, + "time_sec": 177.38567519187927 + }, + { + "epoch": 25, + "train_loss": 4.6400556893920895, + "train_acc": 0.01044, + "test_loss": 4.616389656829834, + "test_acc": 0.0099, + "lyapunov": 1.6980437918392288, + "grad_norm": 0.3628094150674986, + "grad_max_sv": 0.27896470986306665, + "grad_min_sv": 5.204616277156684e-13, + "grad_condition": 221304273008.43808, + "lr": 0.0009330127018922189, + "time_sec": 177.43163585662842 + }, + { + "epoch": 26, + "train_loss": 4.6332687809753414, + "train_acc": 0.01132, + "test_loss": 4.6006186569213865, + "test_acc": 0.0101, + "lyapunov": 1.6927479645785164, + "grad_norm": 0.24641839586724976, + "grad_max_sv": 0.19274084214121104, + "grad_min_sv": 1.5204884707303638e-13, + "grad_condition": 172697545598.00262, + "lr": 0.000927682130080253, + "time_sec": 177.42988181114197 + }, + { + "epoch": 27, + "train_loss": 4.6304932633972165, + "train_acc": 0.01176, + "test_loss": 4.600824389648437, + "test_acc": 0.0121, + "lyapunov": 1.689094999257256, + "grad_norm": 0.2106371658308628, + "grad_max_sv": 0.15872270464897156, + "grad_min_sv": 4.327200917175986e-14, + "grad_condition": 152902715496.53714, + "lr": 0.0009221639627510072, + "time_sec": 177.39303278923035 + }, + { + "epoch": 28, + "train_loss": 4.629396923675537, + "train_acc": 0.01166, + "test_loss": 4.604616398620606, + "test_acc": 0.0101, + "lyapunov": 1.6858887992551566, + "grad_norm": 0.18811331479099205, + "grad_max_sv": 0.1278645334765315, + "grad_min_sv": 3.0763842290774553e-15, + "grad_condition": 127437261984.96709, + "lr": 0.0009164606203550494, + "time_sec": 177.44443678855896 + }, + { + "epoch": 29, + "train_loss": 4.630837202911377, + "train_acc": 0.01124, + "test_loss": 4.605790467834472, + "test_acc": 0.0112, + "lyapunov": 1.698096739056775, + "grad_norm": 0.16407795456021065, + "grad_max_sv": 0.12659106738865375, + "grad_min_sv": 1.499613032946564e-14, + "grad_condition": 124587249155.51591, + "lr": 0.0009105746045668516, + "time_sec": 209.39057421684265 + }, + { + "epoch": 30, + "train_loss": 4.632938845672608, + "train_acc": 0.01078, + "test_loss": 4.605535964965821, + "test_acc": 0.01, + "lyapunov": 1.721212680992263, + "grad_norm": 0.14623452805810844, + "grad_max_sv": 0.0895103589631617, + "grad_min_sv": 2.4454116563252743e-17, + "grad_condition": 89508236588.70316, + "lr": 0.0009045084971874733, + "time_sec": 263.71145844459534 + }, + { + "epoch": 31, + "train_loss": 4.6352485572814945, + "train_acc": 0.0112, + "test_loss": 4.6054604011535645, + "test_acc": 0.01, + "lyapunov": 1.7183927132955292, + "grad_norm": 0.13735986593200813, + "grad_max_sv": 0.08641289453953505, + "grad_min_sv": 2.1599208623445815e-19, + "grad_condition": 86412869689.33823, + "lr": 0.0008982649590120977, + "time_sec": 311.83074378967285 + }, + { + "epoch": 32, + "train_loss": 4.635748368225098, + "train_acc": 0.00974, + "test_loss": 4.605395234680175, + "test_acc": 0.01, + "lyapunov": 1.7134143931176655, + "grad_norm": 0.17446187936414212, + "grad_max_sv": 0.07230882924050093, + "grad_min_sv": 2.0499702352325113e-18, + "grad_condition": 72308666455.08424, + "lr": 0.0008918467286629196, + "time_sec": 206.80873680114746 + }, + { + "epoch": 33, + "train_loss": 4.636022796936035, + "train_acc": 0.01104, + "test_loss": 4.605342939758301, + "test_acc": 0.01, + "lyapunov": 1.7072797111233178, + "grad_norm": 0.12775485225316266, + "grad_max_sv": 0.07838721368461847, + "grad_min_sv": 2.0077524348038727e-25, + "grad_condition": 78387213684.59717, + "lr": 0.0008852566213878943, + "time_sec": 177.3796088695526 + }, + { + "epoch": 34, + "train_loss": 4.633528546752929, + "train_acc": 0.01178, + "test_loss": 4.788667023468018, + "test_acc": 0.01, + "lyapunov": 1.7240971656101745, + "grad_norm": 0.16026338484780192, + "grad_max_sv": 0.10473363827913999, + "grad_min_sv": 2.938795050870516e-28, + "grad_condition": 104733638279.13995, + "lr": 0.000878497527825878, + "time_sec": 177.41194081306458 + }, + { + "epoch": 35, + "train_loss": 4.624666329345703, + "train_acc": 0.01136, + "test_loss": 5.226200386047363, + "test_acc": 0.01, + "lyapunov": 1.7259136810327125, + "grad_norm": 0.2569739718933783, + "grad_max_sv": 0.19082484748214484, + "grad_min_sv": 7.582241190689211e-21, + "grad_condition": 190824845966.0855, + "lr": 0.000871572412738697, + "time_sec": 177.39700889587402 + }, + { + "epoch": 36, + "train_loss": 4.627123330841065, + "train_acc": 0.01106, + "test_loss": 5.197575033569336, + "test_acc": 0.01, + "lyapunov": 1.7035798697215516, + "grad_norm": 0.2342701437740273, + "grad_max_sv": 0.1933449748903513, + "grad_min_sv": 4.0435418388449323e-16, + "grad_condition": 193267665932.28574, + "lr": 0.0008644843137107055, + "time_sec": 177.41947269439697 + }, + { + "epoch": 37, + "train_loss": 4.623688429870605, + "train_acc": 0.01228, + "test_loss": 5.3434977600097655, + "test_acc": 0.01, + "lyapunov": 1.7014210852210785, + "grad_norm": 0.2435898200695919, + "grad_max_sv": 0.19552289135754108, + "grad_min_sv": 1.9710870713741913e-14, + "grad_condition": 192339314767.31424, + "lr": 0.0008572363398164014, + "time_sec": 177.4062840938568 + }, + { + "epoch": 38, + "train_loss": 4.627209045410156, + "train_acc": 0.0116, + "test_loss": 4.930310776519775, + "test_acc": 0.01, + "lyapunov": 1.6914129315129935, + "grad_norm": 0.2434207416268828, + "grad_max_sv": 0.20356647074222564, + "grad_min_sv": 2.6648892114403326e-15, + "grad_condition": 203134465277.43094, + "lr": 0.0008498316702566826, + "time_sec": 177.36271357536316 + }, + { + "epoch": 39, + "train_loss": 4.628314941101074, + "train_acc": 0.01184, + "test_loss": 5.388680703735352, + "test_acc": 0.01, + "lyapunov": 1.7209080369271281, + "grad_norm": 0.24108489909819544, + "grad_max_sv": 0.1765925135463476, + "grad_min_sv": 4.7069473123967913e-17, + "grad_condition": 176582466610.76913, + "lr": 0.0008422735529643442, + "time_sec": 177.39468216896057 + }, + { + "epoch": 40, + "train_loss": 4.625946524658203, + "train_acc": 0.0119, + "test_loss": 4.863273342895508, + "test_acc": 0.01, + "lyapunov": 1.7870670105795117, + "grad_norm": 0.727001364303807, + "grad_max_sv": 0.1741473102461896, + "grad_min_sv": 5.483372577200482e-14, + "grad_condition": 174132598195.0865, + "lr": 0.0008345653031794289, + "time_sec": 177.38460063934326 + }, + { + "epoch": 41, + "train_loss": 4.618370082702636, + "train_acc": 0.01084, + "test_loss": 4.950934140014648, + "test_acc": 0.01, + "lyapunov": 1.7732248605059846, + "grad_norm": 0.2521209265558111, + "grad_max_sv": 0.21080664210021496, + "grad_min_sv": 2.1801601211656184e-15, + "grad_condition": 210412027690.9943, + "lr": 0.0008267103019950526, + "time_sec": 177.40589833259583 + }, + { + "epoch": 42, + "train_loss": 4.610718942565918, + "train_acc": 0.01212, + "test_loss": 7.700952398681641, + "test_acc": 0.01, + "lyapunov": 1.758358538303229, + "grad_norm": 0.2262926279020941, + "grad_max_sv": 0.20302451718598605, + "grad_min_sv": 1.10600662607193e-20, + "grad_condition": 203024514656.03546, + "lr": 0.0008187119948743447, + "time_sec": 177.34876775741577 + }, + { + "epoch": 43, + "train_loss": 4.606141467590332, + "train_acc": 0.0126, + "test_loss": 7.260737210083008, + "test_acc": 0.01, + "lyapunov": 1.744447447454838, + "grad_norm": 0.2851542550522695, + "grad_max_sv": 0.21981305070221424, + "grad_min_sv": 1.9235494463794543e-14, + "grad_condition": 216499492432.9622, + "lr": 0.000810573890139155, + "time_sec": 177.40913462638855 + }, + { + "epoch": 44, + "train_loss": 4.601487475891113, + "train_acc": 0.0128, + "test_loss": 5.16635424118042, + "test_acc": 0.01, + "lyapunov": 1.7291340120613117, + "grad_norm": 0.2699440262729163, + "grad_max_sv": 0.20689585730433463, + "grad_min_sv": 2.466958009425939e-19, + "grad_condition": 206895790884.03778, + "lr": 0.0008022995574311873, + "time_sec": 177.38782215118408 + }, + { + "epoch": 45, + "train_loss": 4.591192651062012, + "train_acc": 0.01422, + "test_loss": 6.655834066772461, + "test_acc": 0.01, + "lyapunov": 1.7150692890977006, + "grad_norm": 0.28144601635584615, + "grad_max_sv": 0.2269132848829031, + "grad_min_sv": 1.6461330492232466e-14, + "grad_condition": 223218018112.7304, + "lr": 0.0007938926261462363, + "time_sec": 177.46803164482117 + }, + { + "epoch": 46, + "train_loss": 4.602867374725342, + "train_acc": 0.01316, + "test_loss": 5.490540980529786, + "test_acc": 0.01, + "lyapunov": 1.693292896156116, + "grad_norm": 0.24534699162408347, + "grad_max_sv": 0.1824163768440485, + "grad_min_sv": 1.6389164265652973e-20, + "grad_condition": 182416373255.75787, + "lr": 0.0007853567838422158, + "time_sec": 177.46002006530762 + }, + { + "epoch": 47, + "train_loss": 4.597328397674561, + "train_acc": 0.01258, + "test_loss": 5.6005713050842285, + "test_acc": 0.01, + "lyapunov": 1.6882270821525007, + "grad_norm": 0.24736766244091873, + "grad_max_sv": 0.1808805840089917, + "grad_min_sv": 4.4237792356896464e-16, + "grad_condition": 180794446745.3838, + "lr": 0.0007766957746216719, + "time_sec": 177.49080419540405 + }, + { + "epoch": 48, + "train_loss": 4.582484985198975, + "train_acc": 0.01414, + "test_loss": 7.804601565551758, + "test_acc": 0.01, + "lyapunov": 1.677145477451022, + "grad_norm": 0.31722883706252114, + "grad_max_sv": 0.18667313270270824, + "grad_min_sv": 2.1003055486041867e-13, + "grad_condition": 164603162469.27765, + "lr": 0.0007679133974894982, + "time_sec": 177.4645369052887 + }, + { + "epoch": 49, + "train_loss": 4.577538666992187, + "train_acc": 0.0158, + "test_loss": 7.338934902954102, + "test_acc": 0.01, + "lyapunov": 1.6737191381356906, + "grad_norm": 0.27176948764450615, + "grad_max_sv": 0.21167084556072951, + "grad_min_sv": 1.3977730616832926e-13, + "grad_condition": 191144552719.7922, + "lr": 0.000759013504686565, + "time_sec": 177.49126935005188 + }, + { + "epoch": 50, + "train_loss": 4.59638880569458, + "train_acc": 0.01404, + "test_loss": 5.10722823638916, + "test_acc": 0.01, + "lyapunov": 1.671956715986247, + "grad_norm": 0.26939370533382595, + "grad_max_sv": 0.18750572949647903, + "grad_min_sv": 1.0450817113169082e-14, + "grad_condition": 185231728343.9213, + "lr": 0.0007499999999999998, + "time_sec": 177.43870544433594 + }, + { + "epoch": 51, + "train_loss": 4.668072533721924, + "train_acc": 0.00928, + "test_loss": 4.642842518615723, + "test_acc": 0.01, + "lyapunov": 1.7506864070892334, + "grad_norm": 4.20723126700393, + "grad_max_sv": 0.11143864877340093, + "grad_min_sv": 2.2844781948394107e-10, + "grad_condition": 90916894288.0092, + "lr": 0.0007408768370508575, + "time_sec": 177.38196682929993 + }, + { + "epoch": 52, + "train_loss": 4.656653161315918, + "train_acc": 0.01026, + "test_loss": 4.606846702575684, + "test_acc": 0.0109, + "lyapunov": 2.0379096894617885, + "grad_norm": 0.22584328878851162, + "grad_max_sv": 0.15865185912698507, + "grad_min_sv": 4.237939432829755e-14, + "grad_condition": 154812579370.5941, + "lr": 0.0007316480175599307, + "time_sec": 177.4069049358368 + }, + { + "epoch": 53, + "train_loss": 4.624548539581299, + "train_acc": 0.01206, + "test_loss": 4.591988240051269, + "test_acc": 0.0108, + "lyapunov": 1.9380365915005775, + "grad_norm": 0.18455669546764147, + "grad_max_sv": 0.144264667481184, + "grad_min_sv": 3.0135369837472823e-29, + "grad_condition": 144264667481.18402, + "lr": 0.0007223175895924635, + "time_sec": 177.3831648826599 + }, + { + "epoch": 54, + "train_loss": 4.62523192489624, + "train_acc": 0.01196, + "test_loss": 4.662603539276123, + "test_acc": 0.0115, + "lyapunov": 1.8538690906046602, + "grad_norm": 0.16875203065739722, + "grad_max_sv": 0.13258629180490972, + "grad_min_sv": 2.1261935993346854e-27, + "grad_condition": 132586291804.90942, + "lr": 0.0007128896457825361, + "time_sec": 177.39837741851807 + }, + { + "epoch": 55, + "train_loss": 4.618103570709229, + "train_acc": 0.01224, + "test_loss": 4.662747817993164, + "test_acc": 0.01, + "lyapunov": 1.818430106048389, + "grad_norm": 0.17848961414208012, + "grad_max_sv": 0.13809755481779576, + "grad_min_sv": 8.087096112362802e-21, + "grad_condition": 138097553610.04034, + "lr": 0.0007033683215378998, + "time_sec": 177.52203607559204 + }, + { + "epoch": 56, + "train_loss": 4.618657445373535, + "train_acc": 0.0124, + "test_loss": 4.87407505645752, + "test_acc": 0.0093, + "lyapunov": 1.823894908666001, + "grad_norm": 0.18543750572118317, + "grad_max_sv": 0.14992212541401387, + "grad_min_sv": 4.755824959031378e-20, + "grad_condition": 149922118173.12308, + "lr": 0.0006937577932260512, + "time_sec": 177.47833228111267 + }, + { + "epoch": 57, + "train_loss": 4.638716118164062, + "train_acc": 0.01132, + "test_loss": 4.697380699157715, + "test_acc": 0.0074, + "lyapunov": 1.9301730455340023, + "grad_norm": 1.1327037595020617, + "grad_max_sv": 0.10352908921777271, + "grad_min_sv": 1.4672657972174837e-15, + "grad_condition": 103275171970.27998, + "lr": 0.0006840622763423388, + "time_sec": 177.41063523292542 + }, + { + "epoch": 58, + "train_loss": 4.634389620513916, + "train_acc": 0.01308, + "test_loss": 4.868174443054199, + "test_acc": 0.0059, + "lyapunov": 1.9861629070223445, + "grad_norm": 0.1816396260328979, + "grad_max_sv": 0.12703904695808887, + "grad_min_sv": 9.108337282597643e-15, + "grad_condition": 125828577100.05904, + "lr": 0.0006742860236609073, + "time_sec": 177.45663285255432 + }, + { + "epoch": 59, + "train_loss": 4.6284795446777345, + "train_acc": 0.01374, + "test_loss": 5.1286182189941405, + "test_acc": 0.01, + "lyapunov": 1.9755443913857345, + "grad_norm": 0.20559100585355392, + "grad_max_sv": 0.1231135094538331, + "grad_min_sv": 1.2082700014990789e-14, + "grad_condition": 121596604673.82451, + "lr": 0.0006644333233692913, + "time_sec": 177.5128185749054 + }, + { + "epoch": 60, + "train_loss": 4.636205641326904, + "train_acc": 0.0115, + "test_loss": 4.707932521057129, + "test_acc": 0.01, + "lyapunov": 1.9764311627658737, + "grad_norm": 0.7528431503344459, + "grad_max_sv": 0.0953290374513017, + "grad_min_sv": 1.3276092129806932e-14, + "grad_condition": 93818089169.88062, + "lr": 0.0006545084971874734, + "time_sec": 177.4649202823639 + }, + { + "epoch": 61, + "train_loss": 4.609165121765137, + "train_acc": 0.0159, + "test_loss": 4.821864377593994, + "test_acc": 0.01, + "lyapunov": 1.9811749872953996, + "grad_norm": 0.21292025221505723, + "grad_max_sv": 0.09851566717252354, + "grad_min_sv": 1.2602267966756725e-13, + "grad_condition": 89959075908.7258, + "lr": 0.0006445158984722354, + "time_sec": 177.52925729751587 + }, + { + "epoch": 62, + "train_loss": 4.598135734863281, + "train_acc": 0.0165, + "test_loss": 4.7484822311401365, + "test_acc": 0.01, + "lyapunov": 2.0011070024631823, + "grad_norm": 0.25450255496206214, + "grad_max_sv": 0.1375024238601327, + "grad_min_sv": 1.2085104144187479e-13, + "grad_condition": 125436319300.4956, + "lr": 0.0006344599103076324, + "time_sec": 177.7304708957672 + }, + { + "epoch": 63, + "train_loss": 4.582272465057373, + "train_acc": 0.01704, + "test_loss": 4.8034347106933595, + "test_acc": 0.01, + "lyapunov": 1.9771778574380119, + "grad_norm": 0.2819579473518796, + "grad_max_sv": 0.14798616897314787, + "grad_min_sv": 2.917529686243967e-13, + "grad_condition": 121925482876.5081, + "lr": 0.0006243449435824269, + "time_sec": 177.5029547214508 + }, + { + "epoch": 64, + "train_loss": 4.5768210922241215, + "train_acc": 0.0185, + "test_loss": 4.794427262878418, + "test_acc": 0.01, + "lyapunov": 2.010085624197255, + "grad_norm": 0.2618373163486269, + "grad_max_sv": 0.13441164009273052, + "grad_min_sv": 2.818035869891495e-13, + "grad_condition": 114689570193.70369, + "lr": 0.0006141754350553275, + "time_sec": 177.46915483474731 + }, + { + "epoch": 65, + "train_loss": 4.581459019012451, + "train_acc": 0.01888, + "test_loss": 5.156883710479736, + "test_acc": 0.01, + "lyapunov": 1.996271950509542, + "grad_norm": 0.2772106238829377, + "grad_max_sv": 0.14674038868397474, + "grad_min_sv": 8.548366859722039e-13, + "grad_condition": 97732212277.66531, + "lr": 0.0006039558454088793, + "time_sec": 177.51422119140625 + }, + { + "epoch": 66, + "train_loss": 4.634421834564209, + "train_acc": 0.0126, + "test_loss": 4.81665114440918, + "test_acc": 0.01, + "lyapunov": 1.9383242672971448, + "grad_norm": 0.47617376682330925, + "grad_max_sv": 0.09843250698449993, + "grad_min_sv": 2.901256298607784e-14, + "grad_condition": 95396589397.15808, + "lr": 0.000593690657292862, + "time_sec": 177.50902652740479 + }, + { + "epoch": 67, + "train_loss": 4.612115941772461, + "train_acc": 0.0124, + "test_loss": 6.130619789886475, + "test_acc": 0.01, + "lyapunov": 1.7900500773164012, + "grad_norm": 0.1447788566664678, + "grad_max_sv": 0.10258051082491874, + "grad_min_sv": 4.432823598739315e-21, + "grad_condition": 102580510304.29665, + "lr": 0.0005833843733580507, + "time_sec": 177.45989155769348 + }, + { + "epoch": 68, + "train_loss": 4.601067236480713, + "train_acc": 0.01444, + "test_loss": 5.2316818511962895, + "test_acc": 0.01, + "lyapunov": 1.7777380013404904, + "grad_norm": 0.1520716462338762, + "grad_max_sv": 0.10410952400416136, + "grad_min_sv": 4.077326777723326e-15, + "grad_condition": 103565610079.67209, + "lr": 0.0005730415142812054, + "time_sec": 177.397207736969 + }, + { + "epoch": 69, + "train_loss": 4.598657707672119, + "train_acc": 0.013, + "test_loss": 5.097503046417236, + "test_acc": 0.01, + "lyapunov": 1.7404629303061443, + "grad_norm": 0.3871184457082642, + "grad_max_sv": 0.10422442324358058, + "grad_min_sv": 1.8154889959708973e-15, + "grad_condition": 103993314127.14293, + "lr": 0.0005626666167821517, + "time_sec": 177.44370555877686 + }, + { + "epoch": 70, + "train_loss": 4.64778597290039, + "train_acc": 0.0105, + "test_loss": 4.608603437805176, + "test_acc": 0.01, + "lyapunov": 1.7865622293613757, + "grad_norm": 2.3876786696903674, + "grad_max_sv": 0.09057229645604821, + "grad_min_sv": 1.53610898160012e-14, + "grad_condition": 88973114810.24387, + "lr": 0.0005522642316338265, + "time_sec": 177.42748093605042 + }, + { + "epoch": 71, + "train_loss": 4.598184258270264, + "train_acc": 0.01846, + "test_loss": 4.666911703491211, + "test_acc": 0.0112, + "lyapunov": 1.7932748675651258, + "grad_norm": 0.20106908445398256, + "grad_max_sv": 0.10719632245600223, + "grad_min_sv": 6.574236923292381e-13, + "grad_condition": 78243664083.21777, + "lr": 0.0005418389216661573, + "time_sec": 177.554673910141 + }, + { + "epoch": 72, + "train_loss": 4.589409804992676, + "train_acc": 0.0177, + "test_loss": 4.711094479370117, + "test_acc": 0.0097, + "lyapunov": 1.7896817514048817, + "grad_norm": 0.21964566445756573, + "grad_max_sv": 0.11253391858190298, + "grad_min_sv": 2.509497274764375e-12, + "grad_condition": 45783533854.40356, + "lr": 0.0005313952597646563, + "time_sec": 177.50412464141846 + }, + { + "epoch": 73, + "train_loss": 4.590103494720459, + "train_acc": 0.01788, + "test_loss": 4.630348364257813, + "test_acc": 0.0085, + "lyapunov": 1.790948787918481, + "grad_norm": 0.2220262076302429, + "grad_max_sv": 0.11815547421574593, + "grad_min_sv": 2.216876602499167e-12, + "grad_condition": 47452843482.59845, + "lr": 0.0005209378268645994, + "time_sec": 177.48806595802307 + }, + { + "epoch": 74, + "train_loss": 4.584798228759766, + "train_acc": 0.01806, + "test_loss": 4.731997722625732, + "test_acc": 0.0079, + "lyapunov": 1.7995114512455739, + "grad_norm": 0.22846540438439775, + "grad_max_sv": 0.1254099266603589, + "grad_min_sv": 9.066272885534926e-12, + "grad_condition": 40745914092.667564, + "lr": 0.0005104712099416781, + "time_sec": 177.5059473514557 + }, + { + "epoch": 75, + "train_loss": 4.595231973876953, + "train_acc": 0.01808, + "test_loss": 4.700939775085449, + "test_acc": 0.0083, + "lyapunov": 1.8095452175725757, + "grad_norm": 0.2192950837077278, + "grad_max_sv": 0.11508929487317801, + "grad_min_sv": 3.2825933404008327e-12, + "grad_condition": 50350606741.80017, + "lr": 0.0004999999999999996, + "time_sec": 177.50167965888977 + }, + { + "epoch": 76, + "train_loss": 4.581764100189209, + "train_acc": 0.01914, + "test_loss": 5.021898673248291, + "test_acc": 0.0136, + "lyapunov": 1.8122548505168437, + "grad_norm": 0.2207773307030423, + "grad_max_sv": 0.11397518068552018, + "grad_min_sv": 4.64014528772541e-12, + "grad_condition": 38904780932.69551, + "lr": 0.0004895287900583212, + "time_sec": 177.48214983940125 + }, + { + "epoch": 77, + "train_loss": 4.6112875914001465, + "train_acc": 0.01686, + "test_loss": 4.777989421081543, + "test_acc": 0.01, + "lyapunov": 1.8042393660606326, + "grad_norm": 0.20227736558382023, + "grad_max_sv": 0.11082722675055265, + "grad_min_sv": 4.1238775813024016e-12, + "grad_condition": 51771877886.454735, + "lr": 0.0004790621731353997, + "time_sec": 177.53421211242676 + }, + { + "epoch": 78, + "train_loss": 4.6304528376770016, + "train_acc": 0.01232, + "test_loss": 4.631612042236328, + "test_acc": 0.01, + "lyapunov": 1.7989057473209509, + "grad_norm": 0.17321951374234873, + "grad_max_sv": 0.11129376739263534, + "grad_min_sv": 1.8656762395422398e-13, + "grad_condition": 96477935168.63983, + "lr": 0.000468604740235343, + "time_sec": 177.469135761261 + }, + { + "epoch": 79, + "train_loss": 4.637705051422119, + "train_acc": 0.01126, + "test_loss": 4.632591462707519, + "test_acc": 0.01, + "lyapunov": 1.8160393945396405, + "grad_norm": 0.15699976023895548, + "grad_max_sv": 0.09548703515902161, + "grad_min_sv": 3.6497327768533775e-14, + "grad_condition": 91848039978.0037, + "lr": 0.00045816107833384175, + "time_sec": 177.4849989414215 + }, + { + "epoch": 80, + "train_loss": 4.641419131469727, + "train_acc": 0.01162, + "test_loss": 4.678064388275146, + "test_acc": 0.0113, + "lyapunov": 1.824865699119275, + "grad_norm": 0.34179817206126445, + "grad_max_sv": 0.10052354910603753, + "grad_min_sv": 4.310724816473457e-14, + "grad_condition": 97515647880.38889, + "lr": 0.0004477357683661729, + "time_sec": 177.4347095489502 + }, + { + "epoch": 81, + "train_loss": 4.626089483337402, + "train_acc": 0.01368, + "test_loss": 4.690298704528809, + "test_acc": 0.01, + "lyapunov": 1.8297587465447234, + "grad_norm": 0.19555822827695532, + "grad_max_sv": 0.12354116216301918, + "grad_min_sv": 3.412182233661048e-14, + "grad_condition": 120065771293.66782, + "lr": 0.00043733338321784746, + "time_sec": 177.5001676082611 + }, + { + "epoch": 82, + "train_loss": 4.590725216827392, + "train_acc": 0.01764, + "test_loss": 4.650773342895508, + "test_acc": 0.01, + "lyapunov": 1.8378781321103617, + "grad_norm": 0.20562924895848395, + "grad_max_sv": 0.11650247611105442, + "grad_min_sv": 3.1390578721014945e-13, + "grad_condition": 93506800941.94165, + "lr": 0.0004269584857187939, + "time_sec": 177.5188705921173 + }, + { + "epoch": 83, + "train_loss": 4.604648815155029, + "train_acc": 0.01452, + "test_loss": 4.742064354705811, + "test_acc": 0.01, + "lyapunov": 1.8501020215661323, + "grad_norm": 0.18456790602625103, + "grad_max_sv": 0.1151590246707201, + "grad_min_sv": 9.825957860555914e-14, + "grad_condition": 105847408109.60861, + "lr": 0.0004166156266419484, + "time_sec": 177.4660234451294 + }, + { + "epoch": 84, + "train_loss": 4.62983644317627, + "train_acc": 0.01318, + "test_loss": 5.077652665710449, + "test_acc": 0.01, + "lyapunov": 1.8849806194110295, + "grad_norm": 0.8125052512079809, + "grad_max_sv": 0.1045217255308156, + "grad_min_sv": 1.9072799584091284e-14, + "grad_condition": 101190098103.28586, + "lr": 0.0004063093427071373, + "time_sec": 177.4631519317627 + }, + { + "epoch": 85, + "train_loss": 4.610348142547608, + "train_acc": 0.01316, + "test_loss": 5.118058528137207, + "test_acc": 0.01, + "lyapunov": 1.871642042608822, + "grad_norm": 0.13933948706358035, + "grad_max_sv": 0.08974340837448835, + "grad_min_sv": 3.535425966726085e-27, + "grad_condition": 89743408374.48799, + "lr": 0.0003960441545911199, + "time_sec": 177.49748611450195 + }, + { + "epoch": 86, + "train_loss": 4.6110903297424315, + "train_acc": 0.01186, + "test_loss": 4.606361127471923, + "test_acc": 0.01, + "lyapunov": 1.8742803606535772, + "grad_norm": 0.14070329420704014, + "grad_max_sv": 0.09362018778920174, + "grad_min_sv": 6.952521961113038e-27, + "grad_condition": 93620187789.20113, + "lr": 0.0003858245649446718, + "time_sec": 177.50401282310486 + }, + { + "epoch": 87, + "train_loss": 4.613140257873535, + "train_acc": 0.01238, + "test_loss": 4.60641729888916, + "test_acc": 0.01, + "lyapunov": 1.8914529496751478, + "grad_norm": 0.14272725180676682, + "grad_max_sv": 0.08532685413956642, + "grad_min_sv": 5.950646978711828e-29, + "grad_condition": 85326854139.5664, + "lr": 0.00037565505641757235, + "time_sec": 177.63836789131165 + }, + { + "epoch": 88, + "train_loss": 4.616064016113281, + "train_acc": 0.01246, + "test_loss": 4.606465660095215, + "test_acc": 0.01, + "lyapunov": 1.9161930334232653, + "grad_norm": 0.13682970540188208, + "grad_max_sv": 0.09302938226610422, + "grad_min_sv": 7.072211804876899e-22, + "grad_condition": 93029382200.03003, + "lr": 0.00036554008969236695, + "time_sec": 177.45394277572632 + }, + { + "epoch": 89, + "train_loss": 4.6237612547302245, + "train_acc": 0.01166, + "test_loss": 4.6070164260864255, + "test_acc": 0.01, + "lyapunov": 2.1093987549662283, + "grad_norm": 0.13799970697477412, + "grad_max_sv": 0.08960749246180058, + "grad_min_sv": 6.981451179333121e-34, + "grad_condition": 89607492461.80057, + "lr": 0.0003554841015277638, + "time_sec": 177.4078447818756 + }, + { + "epoch": 90, + "train_loss": 4.64829606048584, + "train_acc": 0.01024, + "test_loss": 5.948853401184082, + "test_acc": 0.01, + "lyapunov": 1.8291754908573903, + "grad_norm": 1.3850611722503907, + "grad_max_sv": 0.1480995684862137, + "grad_min_sv": 4.606550655942372e-13, + "grad_condition": 114502964953.56998, + "lr": 0.000345491502812526, + "time_sec": 177.4575469493866 + }, + { + "epoch": 91, + "train_loss": 4.65536180480957, + "train_acc": 0.0089, + "test_loss": 5.329740146636963, + "test_acc": 0.01, + "lyapunov": 1.605381081171353, + "grad_norm": 0.974011977531608, + "grad_max_sv": 0.1478642074391246, + "grad_min_sv": 5.969162338227209e-10, + "grad_condition": 103863030721.42941, + "lr": 0.0003355666766307081, + "time_sec": 177.46386551856995 + }, + { + "epoch": 92, + "train_loss": 4.703534996643066, + "train_acc": 0.00968, + "test_loss": 6.427504180145264, + "test_acc": 0.01, + "lyapunov": 1.6079340096934678, + "grad_norm": 0.9722235577486973, + "grad_max_sv": 0.43087365981191394, + "grad_min_sv": 5.453390171592937e-09, + "grad_condition": 53113359044.8774, + "lr": 0.00032571397633909225, + "time_sec": 177.4694640636444 + }, + { + "epoch": 93, + "train_loss": 4.741092784576416, + "train_acc": 0.01008, + "test_loss": 4.898286245727539, + "test_acc": 0.01, + "lyapunov": 1.613801842150481, + "grad_norm": 1.6346890836346257, + "grad_max_sv": 0.6007082311436533, + "grad_min_sv": 8.501025247468166e-09, + "grad_condition": 15194027505.731958, + "lr": 0.00031593772365766094, + "time_sec": 177.60008549690247 + }, + { + "epoch": 94, + "train_loss": 4.64530430480957, + "train_acc": 0.00986, + "test_loss": 5.429140309143066, + "test_acc": 0.01, + "lyapunov": 1.5927760421162676, + "grad_norm": 0.2835894618084608, + "grad_max_sv": 0.15550447292625905, + "grad_min_sv": 7.553917717978667e-11, + "grad_condition": 129696614880.15556, + "lr": 0.0003062422067739483, + "time_sec": 177.51860213279724 + }, + { + "epoch": 95, + "train_loss": 4.638549526367187, + "train_acc": 0.0096, + "test_loss": 5.36515055770874, + "test_acc": 0.01, + "lyapunov": 1.5965131021216703, + "grad_norm": 0.20103446780697812, + "grad_max_sv": 0.1225690545514226, + "grad_min_sv": 9.654140498962059e-15, + "grad_condition": 121117921461.00528, + "lr": 0.00029663167846209965, + "time_sec": 177.52199840545654 + }, + { + "epoch": 96, + "train_loss": 4.638137784576416, + "train_acc": 0.0096, + "test_loss": 5.453123988342285, + "test_acc": 0.01, + "lyapunov": 1.5985023829028429, + "grad_norm": 0.18515787532724406, + "grad_max_sv": 0.11847074571996927, + "grad_min_sv": 8.552124032474723e-15, + "grad_condition": 117420626795.55217, + "lr": 0.00028711035421746345, + "time_sec": 177.4717402458191 + }, + { + "epoch": 97, + "train_loss": 4.636066844940186, + "train_acc": 0.01012, + "test_loss": 5.206941423034668, + "test_acc": 0.01, + "lyapunov": 1.599738584455017, + "grad_norm": 0.14221303873971214, + "grad_max_sv": 0.08317648619413376, + "grad_min_sv": 3.77452327693783e-16, + "grad_condition": 83144162799.83102, + "lr": 0.00027768241040753615, + "time_sec": 177.56506752967834 + }, + { + "epoch": 98, + "train_loss": 4.638936366577148, + "train_acc": 0.00954, + "test_loss": 7.9013794311523435, + "test_acc": 0.01, + "lyapunov": 1.628589593845865, + "grad_norm": 0.5961373706705821, + "grad_max_sv": 0.09680306557030463, + "grad_min_sv": 9.111214004746707e-11, + "grad_condition": 74975500149.68642, + "lr": 0.00026835198244006903, + "time_sec": 177.54391860961914 + }, + { + "epoch": 99, + "train_loss": 4.645994584197998, + "train_acc": 0.00976, + "test_loss": 5.960794914245605, + "test_acc": 0.01, + "lyapunov": 1.627340192685042, + "grad_norm": 0.4369750740410589, + "grad_max_sv": 0.15774182938039302, + "grad_min_sv": 1.8558587643080683e-10, + "grad_condition": 122819757394.17741, + "lr": 0.0002591231629491421, + "time_sec": 177.57049465179443 + }, + { + "epoch": 100, + "train_loss": 4.6382358056640625, + "train_acc": 0.01, + "test_loss": 5.899705020141601, + "test_acc": 0.01, + "lyapunov": 1.6051212756530098, + "grad_norm": 0.18412206012129323, + "grad_max_sv": 0.1038605472072959, + "grad_min_sv": 1.422221530597745e-13, + "grad_condition": 99036113090.37741, + "lr": 0.0002499999999999997, + "time_sec": 177.5935730934143 + }, + { + "epoch": 101, + "train_loss": 4.636023253479004, + "train_acc": 0.01014, + "test_loss": 6.029523161315918, + "test_acc": 0.01, + "lyapunov": 1.5906122072273507, + "grad_norm": 0.15318188656484213, + "grad_max_sv": 0.08877538926899434, + "grad_min_sv": 1.5779396501070167e-15, + "grad_condition": 88609247842.85104, + "lr": 0.00024098649531343477, + "time_sec": 177.56322169303894 + }, + { + "epoch": 102, + "train_loss": 4.639331659088135, + "train_acc": 0.00952, + "test_loss": 6.312074471282959, + "test_acc": 0.01, + "lyapunov": 1.5965099304228487, + "grad_norm": 0.21149544585382213, + "grad_max_sv": 0.12334259878844023, + "grad_min_sv": 1.4106560095489824e-13, + "grad_condition": 115526265000.40161, + "lr": 0.0002320866025105016, + "time_sec": 177.52338194847107 + }, + { + "epoch": 103, + "train_loss": 4.638908295288086, + "train_acc": 0.00948, + "test_loss": 4.882051207733154, + "test_acc": 0.01, + "lyapunov": 1.5894694816121056, + "grad_norm": 0.19092665368829964, + "grad_max_sv": 0.11500742509961129, + "grad_min_sv": 1.2131027142320157e-11, + "grad_condition": 107231941467.1062, + "lr": 0.0002233042253783278, + "time_sec": 177.51379299163818 + }, + { + "epoch": 104, + "train_loss": 4.6372373811340335, + "train_acc": 0.00962, + "test_loss": 5.414011867523193, + "test_acc": 0.01, + "lyapunov": 1.6031087450968944, + "grad_norm": 0.15294842248264393, + "grad_max_sv": 0.0859173422679305, + "grad_min_sv": 5.657292991931931e-14, + "grad_condition": 82522117185.93742, + "lr": 0.000214643216157784, + "time_sec": 177.51268887519836 + }, + { + "epoch": 105, + "train_loss": 4.635795275115967, + "train_acc": 0.00952, + "test_loss": 5.624617222595215, + "test_acc": 0.01, + "lyapunov": 1.5992870769842202, + "grad_norm": 0.14345400220333562, + "grad_max_sv": 0.0836037619970739, + "grad_min_sv": 4.952751755143825e-16, + "grad_condition": 83551071814.55841, + "lr": 0.00020610737385376332, + "time_sec": 177.4938223361969 + }, + { + "epoch": 106, + "train_loss": 4.635631282043457, + "train_acc": 0.00978, + "test_loss": 4.902723191833496, + "test_acc": 0.01, + "lyapunov": 1.6039166020615327, + "grad_norm": 0.13863679536098605, + "grad_max_sv": 0.07681595571339131, + "grad_min_sv": 2.972097177575839e-16, + "grad_condition": 76791636577.80779, + "lr": 0.00019770044256881242, + "time_sec": 177.68779873847961 + }, + { + "epoch": 107, + "train_loss": 4.645384068603516, + "train_acc": 0.0093, + "test_loss": 6.211756886291504, + "test_acc": 0.01, + "lyapunov": 1.6040416663260106, + "grad_norm": 0.4285837495694049, + "grad_max_sv": 0.13404025603085756, + "grad_min_sv": 7.59142371404923e-11, + "grad_condition": 124305006830.62077, + "lr": 0.0001894261098608447, + "time_sec": 177.70811343193054 + }, + { + "epoch": 108, + "train_loss": 4.649419489746093, + "train_acc": 0.00958, + "test_loss": 6.113496919250489, + "test_acc": 0.01, + "lyapunov": 1.6134913239027837, + "grad_norm": 0.4190137316614345, + "grad_max_sv": 0.17006937153637408, + "grad_min_sv": 2.99484826746914e-10, + "grad_condition": 110894680139.56035, + "lr": 0.000181288005125655, + "time_sec": 177.45785975456238 + }, + { + "epoch": 109, + "train_loss": 4.6518434753417965, + "train_acc": 0.00938, + "test_loss": 9.096184700012207, + "test_acc": 0.01, + "lyapunov": 1.6035581257032312, + "grad_norm": 0.3602645131442418, + "grad_max_sv": 0.21420479603111744, + "grad_min_sv": 8.198111248635677e-10, + "grad_condition": 72870526404.21088, + "lr": 0.0001732896980049473, + "time_sec": 177.46639800071716 + }, + { + "epoch": 110, + "train_loss": 4.641265626678467, + "train_acc": 0.0101, + "test_loss": 5.671052789306641, + "test_acc": 0.01, + "lyapunov": 1.615362436875053, + "grad_norm": 0.3716773742209685, + "grad_max_sv": 0.1214295782148838, + "grad_min_sv": 1.687510135228703e-14, + "grad_condition": 119109674941.48811, + "lr": 0.00016543469682057076, + "time_sec": 177.45601773262024 + }, + { + "epoch": 111, + "train_loss": 4.637753919525147, + "train_acc": 0.01002, + "test_loss": 6.3604964195251465, + "test_acc": 0.01, + "lyapunov": 1.5998067453389277, + "grad_norm": 0.20564624198536263, + "grad_max_sv": 0.09355268320068717, + "grad_min_sv": 6.394734869912112e-15, + "grad_condition": 92596418403.32889, + "lr": 0.00015772644703565552, + "time_sec": 177.40109944343567 + }, + { + "epoch": 112, + "train_loss": 4.6369399143981935, + "train_acc": 0.00954, + "test_loss": 6.245291988372803, + "test_acc": 0.01, + "lyapunov": 1.6006381612299654, + "grad_norm": 0.20224259148430365, + "grad_max_sv": 0.09645014414563775, + "grad_min_sv": 3.2489140728988684e-15, + "grad_condition": 96032457790.44434, + "lr": 0.00015016832974331713, + "time_sec": 177.41747522354126 + }, + { + "epoch": 113, + "train_loss": 4.637875361938477, + "train_acc": 0.00982, + "test_loss": 6.2253476379394534, + "test_acc": 0.01, + "lyapunov": 1.6173809291151784, + "grad_norm": 0.1994460538798247, + "grad_max_sv": 0.07964600441046059, + "grad_min_sv": 2.077123703886266e-14, + "grad_condition": 76603550085.65251, + "lr": 0.00014276366018359834, + "time_sec": 177.3594732284546 + }, + { + "epoch": 114, + "train_loss": 4.642988829956055, + "train_acc": 0.00916, + "test_loss": 5.641693086242676, + "test_acc": 0.01, + "lyapunov": 1.6124064763793555, + "grad_norm": 0.48468190481153556, + "grad_max_sv": 0.11619603158906103, + "grad_min_sv": 4.451716550246969e-11, + "grad_condition": 96077444915.60593, + "lr": 0.00013551568628929425, + "time_sec": 177.40932750701904 + }, + { + "epoch": 115, + "train_loss": 4.6442307968139644, + "train_acc": 0.01012, + "test_loss": 8.254900483703613, + "test_acc": 0.01, + "lyapunov": 1.608978744358053, + "grad_norm": 1.159165197770711, + "grad_max_sv": 0.13953377436846495, + "grad_min_sv": 4.497630394164946e-10, + "grad_condition": 84381423123.14908, + "lr": 0.00012842758726130276, + "time_sec": 177.39953756332397 + }, + { + "epoch": 116, + "train_loss": 4.636619221801758, + "train_acc": 0.00994, + "test_loss": 4.987443087005615, + "test_acc": 0.01, + "lyapunov": 1.6049028973445258, + "grad_norm": 0.446186009268613, + "grad_max_sv": 0.08837665086612105, + "grad_min_sv": 6.211874251106184e-11, + "grad_condition": 80804066614.84586, + "lr": 0.0001215024721741218, + "time_sec": 177.44137263298035 + }, + { + "epoch": 117, + "train_loss": 4.641505916442871, + "train_acc": 0.01016, + "test_loss": 4.949208921813965, + "test_acc": 0.01, + "lyapunov": 1.6085841079502154, + "grad_norm": 0.9725925367613142, + "grad_max_sv": 0.13967048060148954, + "grad_min_sv": 2.628647794184182e-10, + "grad_condition": 100637194728.04265, + "lr": 0.00011474337861210538, + "time_sec": 177.48751759529114 + }, + { + "epoch": 118, + "train_loss": 4.642201548309326, + "train_acc": 0.01054, + "test_loss": 5.226166139221191, + "test_acc": 0.01, + "lyapunov": 1.5997687919670358, + "grad_norm": 0.6972051835342679, + "grad_max_sv": 0.14701552018523217, + "grad_min_sv": 4.760884983617464e-11, + "grad_condition": 108994613515.33463, + "lr": 0.00010815327133708009, + "time_sec": 177.41592502593994 + }, + { + "epoch": 119, + "train_loss": 4.641398347625732, + "train_acc": 0.00996, + "test_loss": 5.12651353149414, + "test_acc": 0.01, + "lyapunov": 1.6191631671412827, + "grad_norm": 0.6848881343974178, + "grad_max_sv": 0.12515094466507434, + "grad_min_sv": 1.017373253136728e-10, + "grad_condition": 89472197284.59195, + "lr": 0.00010173504098790182, + "time_sec": 177.522531747818 + }, + { + "epoch": 120, + "train_loss": 4.639837428436279, + "train_acc": 0.00926, + "test_loss": 4.960876380157471, + "test_acc": 0.01, + "lyapunov": 1.6132944505232985, + "grad_norm": 0.44673930804252565, + "grad_max_sv": 0.10939746093936265, + "grad_min_sv": 1.0394761958741514e-14, + "grad_condition": 107693815501.36168, + "lr": 9.549150281252629e-05, + "time_sec": 177.40511012077332 + }, + { + "epoch": 121, + "train_loss": 4.6363514524841305, + "train_acc": 0.00966, + "test_loss": 5.175967210388183, + "test_acc": 0.01, + "lyapunov": 1.6238462918859613, + "grad_norm": 0.27652956652143607, + "grad_max_sv": 0.0465963042806834, + "grad_min_sv": 1.4721026716962783e-19, + "grad_condition": 46596285417.10557, + "lr": 8.942539543314794e-05, + "time_sec": 177.41101145744324 + }, + { + "epoch": 122, + "train_loss": 4.637189597320557, + "train_acc": 0.00952, + "test_loss": 4.859474555969238, + "test_acc": 0.01, + "lyapunov": 1.6088723078408205, + "grad_norm": 0.46187274354590935, + "grad_max_sv": 0.0683113451115787, + "grad_min_sv": 1.1281507971595486e-13, + "grad_condition": 61105449666.2855, + "lr": 8.353937964495024e-05, + "time_sec": 177.4073166847229 + }, + { + "epoch": 123, + "train_loss": 4.63709145324707, + "train_acc": 0.00984, + "test_loss": 5.632948218536377, + "test_acc": 0.01, + "lyapunov": 1.6050320531401183, + "grad_norm": 0.4533137974661839, + "grad_max_sv": 0.05574926282279193, + "grad_min_sv": 8.137487913081367e-16, + "grad_condition": 55654933351.81663, + "lr": 7.783603724899243e-05, + "time_sec": 177.38157057762146 + }, + { + "epoch": 124, + "train_loss": 4.637026580200195, + "train_acc": 0.00978, + "test_loss": 5.898529278564453, + "test_acc": 0.01, + "lyapunov": 1.6208249144541942, + "grad_norm": 0.5996176667008037, + "grad_max_sv": 0.0704139634501189, + "grad_min_sv": 4.8966876246396745e-16, + "grad_condition": 70361497723.57747, + "lr": 7.231786991974666e-05, + "time_sec": 177.72577548027039 + }, + { + "epoch": 125, + "train_loss": 4.6363291398620605, + "train_acc": 0.0089, + "test_loss": 5.236582487487793, + "test_acc": 0.01, + "lyapunov": 1.616811472436656, + "grad_norm": 0.33831176878400027, + "grad_max_sv": 0.046196744637563826, + "grad_min_sv": 1.4909370990647944e-32, + "grad_condition": 46196744637.56383, + "lr": 6.698729810778072e-05, + "time_sec": 177.48478984832764 + }, + { + "epoch": 126, + "train_loss": 4.636370783996582, + "train_acc": 0.01004, + "test_loss": 4.870031663513184, + "test_acc": 0.01, + "lyapunov": 1.6279964572023553, + "grad_norm": 0.37885020203826125, + "grad_max_sv": 0.05249005830846727, + "grad_min_sv": 1.1755456595782039e-18, + "grad_condition": 52489920943.6446, + "lr": 6.184665997806817e-05, + "time_sec": 177.4620487689972 + }, + { + "epoch": 127, + "train_loss": 4.635390359954834, + "train_acc": 0.01016, + "test_loss": 4.962027810668945, + "test_acc": 0.01, + "lyapunov": 1.611984146830371, + "grad_norm": 0.28972201295303096, + "grad_max_sv": 0.03446305748075247, + "grad_min_sv": 7.006492321624086e-47, + "grad_condition": 34463057480.752464, + "lr": 5.6898210384392595e-05, + "time_sec": 177.48631811141968 + }, + { + "epoch": 128, + "train_loss": 4.63566765335083, + "train_acc": 0.01038, + "test_loss": 4.9268453125, + "test_acc": 0.01, + "lyapunov": 1.6156681068717975, + "grad_norm": 0.30554545477243994, + "grad_max_sv": 0.04931030767038465, + "grad_min_sv": 1.0509738482436128e-46, + "grad_condition": 49310307670.38464, + "lr": 5.214411988029363e-05, + "time_sec": 177.44504189491272 + }, + { + "epoch": 129, + "train_loss": 4.635161056823731, + "train_acc": 0.01062, + "test_loss": 5.005131581878662, + "test_acc": 0.01, + "lyapunov": 1.603255180446693, + "grad_norm": 0.29597045222639246, + "grad_max_sv": 0.04633630895987153, + "grad_min_sv": 0.0, + "grad_condition": 46336308959.87154, + "lr": 4.7586473766990294e-05, + "time_sec": 177.4482295513153 + }, + { + "epoch": 130, + "train_loss": 4.635268541412353, + "train_acc": 0.00968, + "test_loss": 5.536978643035889, + "test_acc": 0.01, + "lyapunov": 1.6035685374608735, + "grad_norm": 0.3228889258229885, + "grad_max_sv": 0.050575141236186026, + "grad_min_sv": 2.8294806150482074e-24, + "grad_condition": 50575141235.93922, + "lr": 4.32272711786996e-05, + "time_sec": 177.43854761123657 + }, + { + "epoch": 131, + "train_loss": 4.635657294921875, + "train_acc": 0.00976, + "test_loss": 5.356072675323486, + "test_acc": 0.01, + "lyapunov": 1.607055471681268, + "grad_norm": 0.35518242144595247, + "grad_max_sv": 0.054671825980767606, + "grad_min_sv": 0.0, + "grad_condition": 54671825980.76761, + "lr": 3.906842420574966e-05, + "time_sec": 177.40531492233276 + }, + { + "epoch": 132, + "train_loss": 4.634914422302246, + "train_acc": 0.01088, + "test_loss": 4.779349794006348, + "test_acc": 0.01, + "lyapunov": 1.6039032625115437, + "grad_norm": 0.2990292675719232, + "grad_max_sv": 0.05361205390654504, + "grad_min_sv": 7.006492321624086e-47, + "grad_condition": 53612053906.54505, + "lr": 3.5111757055874305e-05, + "time_sec": 177.36806797981262 + }, + { + "epoch": 133, + "train_loss": 4.635733027191162, + "train_acc": 0.00964, + "test_loss": 4.856661106109619, + "test_acc": 0.01, + "lyapunov": 1.6130791512291756, + "grad_norm": 0.39511036979335445, + "grad_max_sv": 0.03940709177404642, + "grad_min_sv": 1.5677411879976878e-18, + "grad_condition": 39406908308.73201, + "lr": 3.1359005254054254e-05, + "time_sec": 177.4022798538208 + }, + { + "epoch": 134, + "train_loss": 4.63543024017334, + "train_acc": 0.0089, + "test_loss": 5.608733610534668, + "test_acc": 0.01, + "lyapunov": 1.6037682285699089, + "grad_norm": 0.3528315736091379, + "grad_max_sv": 0.05010063648223877, + "grad_min_sv": 1.6209519986077321e-43, + "grad_condition": 50100636482.23877, + "lr": 2.7811814881259484e-05, + "time_sec": 177.53771209716797 + }, + { + "epoch": 135, + "train_loss": 4.634734027557373, + "train_acc": 0.01036, + "test_loss": 5.453004119873047, + "test_acc": 0.01, + "lyapunov": 1.5970036806657797, + "grad_norm": 0.3306302998394907, + "grad_max_sv": 0.04091830984689295, + "grad_min_sv": 0.0, + "grad_condition": 40918309846.89295, + "lr": 2.4471741852423218e-05, + "time_sec": 177.73491024971008 + }, + { + "epoch": 136, + "train_loss": 4.634889769287109, + "train_acc": 0.01012, + "test_loss": 5.61275626373291, + "test_acc": 0.01, + "lyapunov": 1.6030333359223192, + "grad_norm": 0.3584868339271938, + "grad_max_sv": 0.04813642092049122, + "grad_min_sv": 0.0, + "grad_condition": 48136420920.49122, + "lr": 2.1340251233966362e-05, + "time_sec": 177.47666192054749 + }, + { + "epoch": 137, + "train_loss": 4.634823101654053, + "train_acc": 0.00898, + "test_loss": 5.494492791748047, + "test_acc": 0.01, + "lyapunov": 1.6009076339814363, + "grad_norm": 0.3442665566972448, + "grad_max_sv": 0.04324088403955102, + "grad_min_sv": 1.302727355514694e-16, + "grad_condition": 43227112318.92408, + "lr": 1.8418716601170932e-05, + "time_sec": 177.43186950683594 + }, + { + "epoch": 138, + "train_loss": 4.634750337219239, + "train_acc": 0.0096, + "test_loss": 5.465321458435058, + "test_acc": 0.01, + "lyapunov": 1.5992854443352547, + "grad_norm": 0.3114275638976126, + "grad_max_sv": 0.048599824076518416, + "grad_min_sv": 0.0, + "grad_condition": 48599824076.51842, + "lr": 1.570841943568445e-05, + "time_sec": 177.44206428527832 + }, + { + "epoch": 139, + "train_loss": 4.634701194000244, + "train_acc": 0.00994, + "test_loss": 5.445890211486817, + "test_acc": 0.01, + "lyapunov": 1.6023394165136624, + "grad_norm": 0.2984385666013259, + "grad_max_sv": 0.05471824295818806, + "grad_min_sv": 0.0, + "grad_condition": 54718242958.18806, + "lr": 1.3210548563419845e-05, + "time_sec": 177.45291948318481 + }, + { + "epoch": 140, + "train_loss": 4.635435326690674, + "train_acc": 0.01046, + "test_loss": 5.564372345733642, + "test_acc": 0.01, + "lyapunov": 1.6224369688716995, + "grad_norm": 0.356965982379088, + "grad_max_sv": 0.056407551001757386, + "grad_min_sv": 0.0, + "grad_condition": 56407551001.75737, + "lr": 1.0926199633097203e-05, + "time_sec": 177.42662239074707 + }, + { + "epoch": 141, + "train_loss": 4.635846597747803, + "train_acc": 0.01002, + "test_loss": 5.543685975646973, + "test_acc": 0.01, + "lyapunov": 1.6100939362860092, + "grad_norm": 0.6161070696788626, + "grad_max_sv": 0.04843842182308435, + "grad_min_sv": 2.0466509781533097e-18, + "grad_condition": 48438179590.49863, + "lr": 8.856374635655688e-06, + "time_sec": 177.483336687088 + }, + { + "epoch": 142, + "train_loss": 4.635108641204834, + "train_acc": 0.00982, + "test_loss": 5.731918490600586, + "test_acc": 0.01, + "lyapunov": 1.6129589291179882, + "grad_norm": 0.4083627218006193, + "grad_max_sv": 0.0446367921307683, + "grad_min_sv": 0.0, + "grad_condition": 44636792130.768295, + "lr": 7.001981464747503e-06, + "time_sec": 177.6863830089569 + }, + { + "epoch": 143, + "train_loss": 4.6343530229187015, + "train_acc": 0.00962, + "test_loss": 5.7064342742919925, + "test_acc": 0.01, + "lyapunov": 1.592842397787382, + "grad_norm": 0.3611323272348268, + "grad_max_sv": 0.040892344107851385, + "grad_min_sv": 0.0, + "grad_condition": 40892344107.85139, + "lr": 5.3638335185058295e-06, + "time_sec": 177.3921821117401 + }, + { + "epoch": 144, + "train_loss": 4.635800823974609, + "train_acc": 0.00984, + "test_loss": 5.901004859924316, + "test_acc": 0.01, + "lyapunov": 1.6111305766093456, + "grad_norm": 0.39027129071011346, + "grad_max_sv": 0.029163534101098777, + "grad_min_sv": 3.767791857425129e-21, + "grad_condition": 29163533831.10316, + "lr": 3.942649342761114e-06, + "time_sec": 177.42438793182373 + }, + { + "epoch": 145, + "train_loss": 4.635555237579346, + "train_acc": 0.01048, + "test_loss": 6.551739215087891, + "test_acc": 0.01, + "lyapunov": 1.6097711714942131, + "grad_norm": 0.36320203627531283, + "grad_max_sv": 0.017124367970973255, + "grad_min_sv": 0.0, + "grad_condition": 17124367970.973255, + "lr": 2.7390523158633524e-06, + "time_sec": 177.391455411911 + }, + { + "epoch": 146, + "train_loss": 4.6350125201416015, + "train_acc": 0.01, + "test_loss": 6.558631394958496, + "test_acc": 0.01, + "lyapunov": 1.6042376372515392, + "grad_norm": 0.26973086922695555, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 177.3625590801239 + }, + { + "epoch": 147, + "train_loss": 4.63512279953003, + "train_acc": 0.01002, + "test_loss": 5.517122210693359, + "test_acc": 0.01, + "lyapunov": 1.6108765181373148, + "grad_norm": 0.3057820136734528, + "grad_max_sv": 0.01200369345024228, + "grad_min_sv": 0.0, + "grad_condition": 12003693450.242281, + "lr": 9.866357858642196e-07, + "time_sec": 177.3631980419159 + }, + { + "epoch": 148, + "train_loss": 4.635027763061523, + "train_acc": 0.01052, + "test_loss": 5.6589608489990235, + "test_acc": 0.01, + "lyapunov": 1.6133907487630235, + "grad_norm": 0.3601184521971321, + "grad_max_sv": 0.03321786336600781, + "grad_min_sv": 0.0, + "grad_condition": 33217863366.007805, + "lr": 4.38584950570808e-07, + "time_sec": 177.42798614501953 + }, + { + "epoch": 149, + "train_loss": 4.63441861694336, + "train_acc": 0.00996, + "test_loss": 5.65132034072876, + "test_acc": 0.01, + "lyapunov": 1.5955471047355085, + "grad_norm": 0.31320719504990036, + "grad_max_sv": 0.025702585512772203, + "grad_min_sv": 0.0, + "grad_condition": 25702585512.7722, + "lr": 1.096582625772501e-07, + "time_sec": 177.36553716659546 + }, + { + "epoch": 150, + "train_loss": 4.633809689025879, + "train_acc": 0.01, + "test_loss": 5.651321833801269, + "test_acc": 0.01, + "lyapunov": 1.5837058953921814, + "grad_norm": 0.3206105198094455, + "grad_max_sv": 0.025445178616791964, + "grad_min_sv": 0.0, + "grad_condition": 25445178616.79196, + "lr": 0.0, + "time_sec": 177.3372402191162 + } + ] + } +} \ No newline at end of file -- cgit v1.2.3