diff options
| author | YurenHao0426 <blackhao0426@gmail.com> | 2026-01-13 23:50:59 -0600 |
|---|---|---|
| committer | YurenHao0426 <blackhao0426@gmail.com> | 2026-01-13 23:50:59 -0600 |
| commit | 00cf667cee7ffacb144d5805fc7e0ef443f3583a (patch) | |
| tree | 77d20a3adaecf96bf3aff0612bdd3b5fa1a7dc7e /runs/depth_scaling_extreme/cifar100_20260102-133536 | |
| parent | c53c04aa1d6ff75cb478a9498c370baa929c74b6 (diff) | |
| parent | cd99d6b874d9d09b3bb87b8485cc787885af71f1 (diff) | |
Merge master into main
Diffstat (limited to 'runs/depth_scaling_extreme/cifar100_20260102-133536')
| -rw-r--r-- | runs/depth_scaling_extreme/cifar100_20260102-133536/config.json | 23 | ||||
| -rw-r--r-- | runs/depth_scaling_extreme/cifar100_20260102-133536/results.json | 16822 |
2 files changed, 16845 insertions, 0 deletions
diff --git a/runs/depth_scaling_extreme/cifar100_20260102-133536/config.json b/runs/depth_scaling_extreme/cifar100_20260102-133536/config.json new file mode 100644 index 0000000..232b971 --- /dev/null +++ b/runs/depth_scaling_extreme/cifar100_20260102-133536/config.json @@ -0,0 +1,23 @@ +{ + "dataset": "cifar100", + "depths": [ + 4, + 8, + 12, + 16 + ], + "T": 4, + "epochs": 150, + "batch_size": 128, + "lr": 0.001, + "lambda_reg": 0.3, + "lambda_target": -0.1, + "data_dir": "./data", + "out_dir": "runs/depth_scaling_extreme", + "device": "cuda", + "seed": 42, + "no_progress": false, + "reg_type": "extreme", + "warmup_epochs": 10, + "stable_init": false +}
\ No newline at end of file diff --git a/runs/depth_scaling_extreme/cifar100_20260102-133536/results.json b/runs/depth_scaling_extreme/cifar100_20260102-133536/results.json new file mode 100644 index 0000000..da04f1d --- /dev/null +++ b/runs/depth_scaling_extreme/cifar100_20260102-133536/results.json @@ -0,0 +1,16822 @@ +{ + "vanilla": { + "4": [ + { + "epoch": 1, + "train_loss": 4.343964076461792, + "train_acc": 0.09708, + "test_loss": 3.543811529159546, + "test_acc": 0.178, + "lyapunov": null, + "grad_norm": 6.269401750352016, + "grad_max_sv": 4.853389507532119, + "grad_min_sv": 1.1399991213245642e-07, + "grad_condition": 49410459.259546064, + "lr": 0.0009998903417374227, + "time_sec": 17.48967719078064 + }, + { + "epoch": 2, + "train_loss": 3.498634079360962, + "train_acc": 0.18618, + "test_loss": 3.3043576583862304, + "test_acc": 0.2285, + "lyapunov": null, + "grad_norm": 4.48015812427802, + "grad_max_sv": 3.2765842854976652, + "grad_min_sv": 8.259257237019923e-08, + "grad_condition": 56768723.65171113, + "lr": 0.0009995614150494292, + "time_sec": 15.768706798553467 + }, + { + "epoch": 3, + "train_loss": 3.04044310256958, + "train_acc": 0.2548, + "test_loss": 2.8725222999572755, + "test_acc": 0.2924, + "lyapunov": null, + "grad_norm": 3.55888024814135, + "grad_max_sv": 2.3841808408498766, + "grad_min_sv": 6.6423866895704e-08, + "grad_condition": 55751994.429944515, + "lr": 0.0009990133642141358, + "time_sec": 15.510985374450684 + }, + { + "epoch": 4, + "train_loss": 2.7263157293701172, + "train_acc": 0.31422, + "test_loss": 2.7711315670013428, + "test_acc": 0.3186, + "lyapunov": null, + "grad_norm": 3.0054712784081077, + "grad_max_sv": 1.889515644311905, + "grad_min_sv": 5.657657032864805e-08, + "grad_condition": 39985039.73570454, + "lr": 0.0009982464296247522, + "time_sec": 15.517443418502808 + }, + { + "epoch": 5, + "train_loss": 2.501125616989136, + "train_acc": 0.35674, + "test_loss": 2.9253446578979494, + "test_acc": 0.3025, + "lyapunov": null, + "grad_norm": 2.6770187452123904, + "grad_max_sv": 1.6576285094022751, + "grad_min_sv": 5.1110754423905336e-08, + "grad_condition": 249213918.1838016, + "lr": 0.0009972609476841367, + "time_sec": 15.491940259933472 + }, + { + "epoch": 6, + "train_loss": 2.3297713035583496, + "train_acc": 0.39482, + "test_loss": 2.711188589477539, + "test_acc": 0.34, + "lyapunov": null, + "grad_norm": 2.4392881408652602, + "grad_max_sv": 1.3794412553310393, + "grad_min_sv": 4.6258278196820155e-08, + "grad_condition": 50327201.70401787, + "lr": 0.000996057350657239, + "time_sec": 15.4960355758667 + }, + { + "epoch": 7, + "train_loss": 2.1826580730438234, + "train_acc": 0.4237, + "test_loss": 2.9240353355407716, + "test_acc": 0.3138, + "lyapunov": null, + "grad_norm": 2.2647319573746367, + "grad_max_sv": 1.2694885402917861, + "grad_min_sv": 4.374653217176228e-08, + "grad_condition": 82278933.47227272, + "lr": 0.000994636166481494, + "time_sec": 15.493408203125 + }, + { + "epoch": 8, + "train_loss": 2.069816835021973, + "train_acc": 0.44902, + "test_loss": 2.372804375076294, + "test_acc": 0.4002, + "lyapunov": null, + "grad_norm": 2.1218192129795908, + "grad_max_sv": 1.1551768705248833, + "grad_min_sv": 4.046462118295624e-08, + "grad_condition": 85303714.17850836, + "lr": 0.0009929980185352525, + "time_sec": 15.50551438331604 + }, + { + "epoch": 9, + "train_loss": 1.9601647052764892, + "train_acc": 0.47258, + "test_loss": 2.7926211294174195, + "test_acc": 0.3302, + "lyapunov": null, + "grad_norm": 1.9879560065804707, + "grad_max_sv": 1.0480679154396058, + "grad_min_sv": 3.809713652880298e-08, + "grad_condition": 38148248.122299984, + "lr": 0.0009911436253643444, + "time_sec": 15.502174854278564 + }, + { + "epoch": 10, + "train_loss": 1.8568961290740966, + "train_acc": 0.4985, + "test_loss": 2.1515496990203857, + "test_acc": 0.4359, + "lyapunov": null, + "grad_norm": 1.8704034599240067, + "grad_max_sv": 0.954660838842392, + "grad_min_sv": 3.557788916253024e-08, + "grad_condition": 33434616.307420492, + "lr": 0.0009890738003669028, + "time_sec": 15.494043350219727 + }, + { + "epoch": 11, + "train_loss": 1.776247345046997, + "train_acc": 0.51626, + "test_loss": 3.0507505104064943, + "test_acc": 0.3238, + "lyapunov": null, + "grad_norm": 1.7890241739741972, + "grad_max_sv": 0.9063720315694809, + "grad_min_sv": 3.426323008787202e-08, + "grad_condition": 61761681.99942608, + "lr": 0.00098678945143658, + "time_sec": 15.514922618865967 + }, + { + "epoch": 12, + "train_loss": 1.7078360842895508, + "train_acc": 0.53048, + "test_loss": 2.31292974319458, + "test_acc": 0.4166, + "lyapunov": null, + "grad_norm": 1.70263132913962, + "grad_max_sv": 0.8448627695441246, + "grad_min_sv": 3.25305420267874e-08, + "grad_condition": 39762836.002720095, + "lr": 0.0009842915805643154, + "time_sec": 15.512236833572388 + }, + { + "epoch": 13, + "train_loss": 1.642545406112671, + "train_acc": 0.54468, + "test_loss": 2.1151635683059693, + "test_acc": 0.4542, + "lyapunov": null, + "grad_norm": 1.6326153323712562, + "grad_max_sv": 0.7792091608047486, + "grad_min_sv": 3.072967421080541e-08, + "grad_condition": 40398724.5062742, + "lr": 0.000981581283398829, + "time_sec": 15.52775263786316 + }, + { + "epoch": 14, + "train_loss": 1.5822788066482545, + "train_acc": 0.55844, + "test_loss": 2.1901147899627684, + "test_acc": 0.4442, + "lyapunov": null, + "grad_norm": 1.5714664236307732, + "grad_max_sv": 0.7666790142655373, + "grad_min_sv": 3.014917712151899e-08, + "grad_condition": 36440259.864575304, + "lr": 0.0009786597487660333, + "time_sec": 15.49522066116333 + }, + { + "epoch": 15, + "train_loss": 1.527083348121643, + "train_acc": 0.57474, + "test_loss": 2.207253874206543, + "test_acc": 0.4434, + "lyapunov": null, + "grad_norm": 1.5166965472664673, + "grad_max_sv": 0.7205035746097564, + "grad_min_sv": 2.8671640864286196e-08, + "grad_condition": 37644067.41259916, + "lr": 0.0009755282581475766, + "time_sec": 15.527036190032959 + }, + { + "epoch": 16, + "train_loss": 1.4771566902542115, + "train_acc": 0.58396, + "test_loss": 2.773860432815552, + "test_acc": 0.3614, + "lyapunov": null, + "grad_norm": 1.4643992166233941, + "grad_max_sv": 0.6832035273313523, + "grad_min_sv": 2.7150941947495787e-08, + "grad_condition": 54840700.39935936, + "lr": 0.0009721881851187403, + "time_sec": 15.509675741195679 + }, + { + "epoch": 17, + "train_loss": 1.428199899368286, + "train_acc": 0.59866, + "test_loss": 1.870191947555542, + "test_acc": 0.5152, + "lyapunov": null, + "grad_norm": 1.4232653571860572, + "grad_max_sv": 0.6645245268940926, + "grad_min_sv": 2.659839218738247e-08, + "grad_condition": 64765374.33171377, + "lr": 0.0009686409947459456, + "time_sec": 15.501691102981567 + }, + { + "epoch": 18, + "train_loss": 1.389814187927246, + "train_acc": 0.60686, + "test_loss": 1.9965633613586427, + "test_acc": 0.4906, + "lyapunov": null, + "grad_norm": 1.3736002352381822, + "grad_max_sv": 0.6367693401873111, + "grad_min_sv": 2.6041243064711672e-08, + "grad_condition": 38440962.91151965, + "lr": 0.0009648882429441254, + "time_sec": 15.50187873840332 + }, + { + "epoch": 19, + "train_loss": 1.3393130651092529, + "train_acc": 0.61704, + "test_loss": 1.9167281112670898, + "test_acc": 0.5019, + "lyapunov": null, + "grad_norm": 1.3427044997656652, + "grad_max_sv": 0.6211640179157257, + "grad_min_sv": 2.5033208689295706e-08, + "grad_condition": 100572765.61964989, + "lr": 0.00096093157579425, + "time_sec": 15.509443521499634 + }, + { + "epoch": 20, + "train_loss": 1.301365068283081, + "train_acc": 0.62906, + "test_loss": 1.810260859489441, + "test_acc": 0.5266, + "lyapunov": null, + "grad_norm": 1.3098878923784198, + "grad_max_sv": 0.5800249859690666, + "grad_min_sv": 2.400288523080052e-08, + "grad_condition": 59053795.8657949, + "lr": 0.0009567727288213001, + "time_sec": 15.525721073150635 + }, + { + "epoch": 21, + "train_loss": 1.2668152516555786, + "train_acc": 0.6385, + "test_loss": 2.1314996585845947, + "test_acc": 0.4677, + "lyapunov": null, + "grad_norm": 1.2730143826705373, + "grad_max_sv": 0.583588981628418, + "grad_min_sv": 2.4066221931962062e-08, + "grad_condition": 47275977.76230677, + "lr": 0.0009524135262330095, + "time_sec": 15.537385940551758 + }, + { + "epoch": 22, + "train_loss": 1.2356283584213257, + "train_acc": 0.6435, + "test_loss": 2.3030094453811647, + "test_acc": 0.4421, + "lyapunov": null, + "grad_norm": 1.2444276915676225, + "grad_max_sv": 0.5592368848621845, + "grad_min_sv": 2.3396670312259005e-08, + "grad_condition": 36650347.80275386, + "lr": 0.0009478558801197061, + "time_sec": 15.518898010253906 + }, + { + "epoch": 23, + "train_loss": 1.1962122634124757, + "train_acc": 0.65402, + "test_loss": 1.903352946662903, + "test_acc": 0.5168, + "lyapunov": null, + "grad_norm": 1.2244482194430535, + "grad_max_sv": 0.565939775109291, + "grad_min_sv": 2.3091259931246056e-08, + "grad_condition": 114104274.6151524, + "lr": 0.000943101789615607, + "time_sec": 15.571439027786255 + }, + { + "epoch": 24, + "train_loss": 1.1680951973342895, + "train_acc": 0.66134, + "test_loss": 2.0708827129364016, + "test_acc": 0.4957, + "lyapunov": null, + "grad_norm": 1.1965046095155352, + "grad_max_sv": 0.5413284927606583, + "grad_min_sv": 2.2230258531208412e-08, + "grad_condition": 32505035.94000066, + "lr": 0.0009381533400219313, + "time_sec": 15.524654865264893 + }, + { + "epoch": 25, + "train_loss": 1.1349483573532104, + "train_acc": 0.66956, + "test_loss": 1.9736009086608888, + "test_acc": 0.5102, + "lyapunov": null, + "grad_norm": 1.173400055119284, + "grad_max_sv": 0.5170449152588844, + "grad_min_sv": 2.16096693705925e-08, + "grad_condition": 39903559.78864221, + "lr": 0.0009330127018922189, + "time_sec": 15.542013883590698 + }, + { + "epoch": 26, + "train_loss": 1.1114656055831909, + "train_acc": 0.67594, + "test_loss": 1.9610388065338136, + "test_acc": 0.5082, + "lyapunov": null, + "grad_norm": 1.1552341739969219, + "grad_max_sv": 0.5210843287408352, + "grad_min_sv": 2.1618911905801898e-08, + "grad_condition": 115120503.79287314, + "lr": 0.000927682130080253, + "time_sec": 15.560054302215576 + }, + { + "epoch": 27, + "train_loss": 1.0816866703414918, + "train_acc": 0.68394, + "test_loss": 2.300510933303833, + "test_acc": 0.4608, + "lyapunov": null, + "grad_norm": 1.1270487628668246, + "grad_max_sv": 0.4985874108970165, + "grad_min_sv": 2.0799132844501188e-08, + "grad_condition": 82987435.7224399, + "lr": 0.0009221639627510072, + "time_sec": 15.573202133178711 + }, + { + "epoch": 28, + "train_loss": 1.059952162437439, + "train_acc": 0.6847, + "test_loss": 2.2763154903411866, + "test_acc": 0.4701, + "lyapunov": null, + "grad_norm": 1.1150940189037992, + "grad_max_sv": 0.4915841057896614, + "grad_min_sv": 2.0457985560815017e-08, + "grad_condition": 117138590.05599073, + "lr": 0.0009164606203550494, + "time_sec": 15.515011310577393 + }, + { + "epoch": 29, + "train_loss": 1.0306231698989867, + "train_acc": 0.69368, + "test_loss": 2.2471272750854494, + "test_acc": 0.4707, + "lyapunov": null, + "grad_norm": 1.091561834500795, + "grad_max_sv": 0.4975287884473801, + "grad_min_sv": 2.0274326531250635e-08, + "grad_condition": 343496136.58176744, + "lr": 0.0009105746045668516, + "time_sec": 15.50270962715149 + }, + { + "epoch": 30, + "train_loss": 1.006490296974182, + "train_acc": 0.7012, + "test_loss": 1.8151188419342041, + "test_acc": 0.5457, + "lyapunov": null, + "grad_norm": 1.0808034685161583, + "grad_max_sv": 0.48289466872811315, + "grad_min_sv": 2.0060075225404596e-08, + "grad_condition": 257401984.85631984, + "lr": 0.0009045084971874733, + "time_sec": 15.53312873840332 + }, + { + "epoch": 31, + "train_loss": 0.988988881187439, + "train_acc": 0.70468, + "test_loss": 1.8404255100250244, + "test_acc": 0.5381, + "lyapunov": null, + "grad_norm": 1.0748571288249447, + "grad_max_sv": 0.462377443164587, + "grad_min_sv": 1.9635248512447217e-08, + "grad_condition": 489140401.5860785, + "lr": 0.0008982649590120977, + "time_sec": 15.555314302444458 + }, + { + "epoch": 32, + "train_loss": 0.9635062801361084, + "train_acc": 0.71196, + "test_loss": 1.854098903274536, + "test_acc": 0.5419, + "lyapunov": null, + "grad_norm": 1.0495776449246816, + "grad_max_sv": 0.46274676769971845, + "grad_min_sv": 1.9459323465434443e-08, + "grad_condition": 92041194.40983152, + "lr": 0.0008918467286629196, + "time_sec": 15.513479948043823 + }, + { + "epoch": 33, + "train_loss": 0.9340785507965088, + "train_acc": 0.71992, + "test_loss": 1.8356395168304442, + "test_acc": 0.5433, + "lyapunov": null, + "grad_norm": 1.0398072613772185, + "grad_max_sv": 0.45619562119245527, + "grad_min_sv": 1.9050715303545184e-08, + "grad_condition": 87747830.56401631, + "lr": 0.0008852566213878943, + "time_sec": 15.517829418182373 + }, + { + "epoch": 34, + "train_loss": 0.9129554526519775, + "train_acc": 0.72572, + "test_loss": 1.8661289739608764, + "test_acc": 0.5416, + "lyapunov": null, + "grad_norm": 1.0199118426522369, + "grad_max_sv": 0.4442473478615284, + "grad_min_sv": 1.868702746710138e-08, + "grad_condition": 42913421.35168691, + "lr": 0.000878497527825878, + "time_sec": 15.533827304840088 + }, + { + "epoch": 35, + "train_loss": 0.9028591692924499, + "train_acc": 0.72924, + "test_loss": 1.7551298860549926, + "test_acc": 0.5597, + "lyapunov": null, + "grad_norm": 1.0089778262788507, + "grad_max_sv": 0.43264786079525946, + "grad_min_sv": 1.8316780511090648e-08, + "grad_condition": 63331133.73701396, + "lr": 0.000871572412738697, + "time_sec": 15.518927574157715 + }, + { + "epoch": 36, + "train_loss": 0.8709456444358825, + "train_acc": 0.7382, + "test_loss": 2.1472765481948852, + "test_acc": 0.5006, + "lyapunov": null, + "grad_norm": 0.9875463001166137, + "grad_max_sv": 0.430005656927824, + "grad_min_sv": 1.7798811584313068e-08, + "grad_condition": 90940963.83708307, + "lr": 0.0008644843137107055, + "time_sec": 15.526814699172974 + }, + { + "epoch": 37, + "train_loss": 0.8505911663246155, + "train_acc": 0.74218, + "test_loss": 1.8331342267990112, + "test_acc": 0.5523, + "lyapunov": null, + "grad_norm": 0.9791897305898843, + "grad_max_sv": 0.42675754353404044, + "grad_min_sv": 1.792359621902162e-08, + "grad_condition": 59272698.42367653, + "lr": 0.0008572363398164014, + "time_sec": 15.521918296813965 + }, + { + "epoch": 38, + "train_loss": 0.8315802090644836, + "train_acc": 0.7475, + "test_loss": 1.9036517213821411, + "test_acc": 0.5476, + "lyapunov": null, + "grad_norm": 0.9724844009666125, + "grad_max_sv": 0.42650427520275114, + "grad_min_sv": 1.7940990758476273e-08, + "grad_condition": 152760168.97703806, + "lr": 0.0008498316702566826, + "time_sec": 15.582866907119751 + }, + { + "epoch": 39, + "train_loss": 0.8243685752487183, + "train_acc": 0.74852, + "test_loss": 1.7936948488235473, + "test_acc": 0.5677, + "lyapunov": null, + "grad_norm": 0.9598921490017479, + "grad_max_sv": 0.4138942167162895, + "grad_min_sv": 1.7613742333156407e-08, + "grad_condition": 533618066.1366825, + "lr": 0.0008422735529643442, + "time_sec": 15.516271352767944 + }, + { + "epoch": 40, + "train_loss": 0.8057044812202454, + "train_acc": 0.7565, + "test_loss": 1.808411812210083, + "test_acc": 0.5658, + "lyapunov": null, + "grad_norm": 0.9538542272130858, + "grad_max_sv": 0.4244484819471836, + "grad_min_sv": 1.7626790971107808e-08, + "grad_condition": 163829749.9020123, + "lr": 0.0008345653031794289, + "time_sec": 15.51979684829712 + }, + { + "epoch": 41, + "train_loss": 0.7841885061645508, + "train_acc": 0.76222, + "test_loss": 1.8520248830795287, + "test_acc": 0.5592, + "lyapunov": null, + "grad_norm": 0.9398877148073365, + "grad_max_sv": 0.4056116588413715, + "grad_min_sv": 1.7369371559106117e-08, + "grad_condition": 54614245.02585721, + "lr": 0.0008267103019950526, + "time_sec": 15.515657424926758 + }, + { + "epoch": 42, + "train_loss": 0.765489040851593, + "train_acc": 0.76578, + "test_loss": 1.7736550596237182, + "test_acc": 0.5652, + "lyapunov": null, + "grad_norm": 0.9287734138199644, + "grad_max_sv": 0.40227611660957335, + "grad_min_sv": 1.7095986799831042e-08, + "grad_condition": 62696596.41944494, + "lr": 0.0008187119948743447, + "time_sec": 15.531492233276367 + }, + { + "epoch": 43, + "train_loss": 0.7523658062362671, + "train_acc": 0.76828, + "test_loss": 1.862604800415039, + "test_acc": 0.5527, + "lyapunov": null, + "grad_norm": 0.9192011925193997, + "grad_max_sv": 0.4043716721236706, + "grad_min_sv": 1.6709370530276767e-08, + "grad_condition": 50276838.15174754, + "lr": 0.000810573890139155, + "time_sec": 15.519644498825073 + }, + { + "epoch": 44, + "train_loss": 0.7335971118927002, + "train_acc": 0.77418, + "test_loss": 1.7547655418395995, + "test_acc": 0.5764, + "lyapunov": null, + "grad_norm": 0.9104057799361107, + "grad_max_sv": 0.39035323858261106, + "grad_min_sv": 1.6815737483022453e-08, + "grad_condition": 45228087.284967735, + "lr": 0.0008022995574311873, + "time_sec": 15.519366025924683 + }, + { + "epoch": 45, + "train_loss": 0.7196475598526001, + "train_acc": 0.7789, + "test_loss": 1.9343164527893066, + "test_acc": 0.5574, + "lyapunov": null, + "grad_norm": 0.9044725461231161, + "grad_max_sv": 0.39498561918735503, + "grad_min_sv": 1.610284234183912e-08, + "grad_condition": 79566359.88657416, + "lr": 0.0007938926261462363, + "time_sec": 15.51046633720398 + }, + { + "epoch": 46, + "train_loss": 0.7023829959106446, + "train_acc": 0.7836, + "test_loss": 1.8175951471328735, + "test_acc": 0.5704, + "lyapunov": null, + "grad_norm": 0.886027952458362, + "grad_max_sv": 0.383831874281168, + "grad_min_sv": 1.5835774637169147e-08, + "grad_condition": 277232736.60907316, + "lr": 0.0007853567838422158, + "time_sec": 15.502201318740845 + }, + { + "epoch": 47, + "train_loss": 0.692379617729187, + "train_acc": 0.7858, + "test_loss": 1.7909827726364136, + "test_acc": 0.5739, + "lyapunov": null, + "grad_norm": 0.8854139862941175, + "grad_max_sv": 0.3877114519476891, + "grad_min_sv": 1.60303614979429e-08, + "grad_condition": 56967588.242197834, + "lr": 0.0007766957746216719, + "time_sec": 15.53445816040039 + }, + { + "epoch": 48, + "train_loss": 0.6760443294715881, + "train_acc": 0.78938, + "test_loss": 1.9196774244308472, + "test_acc": 0.5563, + "lyapunov": null, + "grad_norm": 0.8760915073960837, + "grad_max_sv": 0.37504774928092954, + "grad_min_sv": 1.5830848163617128e-08, + "grad_condition": 63604699.64347188, + "lr": 0.0007679133974894982, + "time_sec": 15.531822443008423 + }, + { + "epoch": 49, + "train_loss": 0.6715626827049256, + "train_acc": 0.79074, + "test_loss": 1.9189249057769775, + "test_acc": 0.5548, + "lyapunov": null, + "grad_norm": 0.8712413577717205, + "grad_max_sv": 0.37739116996526717, + "grad_min_sv": 1.5668840121219052e-08, + "grad_condition": 35881824.87652787, + "lr": 0.000759013504686565, + "time_sec": 15.530819416046143 + }, + { + "epoch": 50, + "train_loss": 0.6447899807167053, + "train_acc": 0.79878, + "test_loss": 1.8417208972930907, + "test_acc": 0.5658, + "lyapunov": null, + "grad_norm": 0.8504083091663698, + "grad_max_sv": 0.36688936948776246, + "grad_min_sv": 1.517037322221193e-08, + "grad_condition": 71999401.07754412, + "lr": 0.0007499999999999998, + "time_sec": 15.513152837753296 + }, + { + "epoch": 51, + "train_loss": 0.6371639384269714, + "train_acc": 0.80052, + "test_loss": 1.9895338836669922, + "test_acc": 0.5435, + "lyapunov": null, + "grad_norm": 0.854000723051651, + "grad_max_sv": 0.3801948450505733, + "grad_min_sv": 1.544281589879043e-08, + "grad_condition": 196822188.685167, + "lr": 0.0007408768370508575, + "time_sec": 15.535704851150513 + }, + { + "epoch": 52, + "train_loss": 0.627970908241272, + "train_acc": 0.80326, + "test_loss": 1.7884189123153686, + "test_acc": 0.5795, + "lyapunov": null, + "grad_norm": 0.8489707889885099, + "grad_max_sv": 0.3610515870153904, + "grad_min_sv": 1.4917008953757583e-08, + "grad_condition": 116011092.17479134, + "lr": 0.0007316480175599307, + "time_sec": 15.520502090454102 + }, + { + "epoch": 53, + "train_loss": 0.6110728459739685, + "train_acc": 0.80756, + "test_loss": 1.9764576913833618, + "test_acc": 0.5586, + "lyapunov": null, + "grad_norm": 0.83239953497766, + "grad_max_sv": 0.35885564237833023, + "grad_min_sv": 1.4919259355011816e-08, + "grad_condition": 85456100.45031682, + "lr": 0.0007223175895924635, + "time_sec": 15.510826349258423 + }, + { + "epoch": 54, + "train_loss": 0.6081169471359253, + "train_acc": 0.8092, + "test_loss": 1.787416721534729, + "test_acc": 0.5872, + "lyapunov": null, + "grad_norm": 0.8301465677354521, + "grad_max_sv": 0.35901840403676033, + "grad_min_sv": 1.4836248149463494e-08, + "grad_condition": 71846187.92798834, + "lr": 0.0007128896457825361, + "time_sec": 15.538878440856934 + }, + { + "epoch": 55, + "train_loss": 0.5831116440963745, + "train_acc": 0.81676, + "test_loss": 1.870977353286743, + "test_acc": 0.5758, + "lyapunov": null, + "grad_norm": 0.8161779632209265, + "grad_max_sv": 0.3469956606626511, + "grad_min_sv": 1.4283351100312369e-08, + "grad_condition": 205730158.31150857, + "lr": 0.0007033683215378998, + "time_sec": 15.520758628845215 + }, + { + "epoch": 56, + "train_loss": 0.5736992453193664, + "train_acc": 0.81948, + "test_loss": 1.9110374048233032, + "test_acc": 0.5654, + "lyapunov": null, + "grad_norm": 0.8163787482015537, + "grad_max_sv": 0.35173602402210236, + "grad_min_sv": 1.4616037320724918e-08, + "grad_condition": 110269032.9871988, + "lr": 0.0006937577932260512, + "time_sec": 15.527177333831787 + }, + { + "epoch": 57, + "train_loss": 0.5601261650466919, + "train_acc": 0.82286, + "test_loss": 1.9212758470535278, + "test_acc": 0.5714, + "lyapunov": null, + "grad_norm": 0.8024223025099775, + "grad_max_sv": 0.3423969805240631, + "grad_min_sv": 1.4464966059321572e-08, + "grad_condition": 145895975.18417415, + "lr": 0.0006840622763423388, + "time_sec": 15.54552149772644 + }, + { + "epoch": 58, + "train_loss": 0.5606306306457519, + "train_acc": 0.8221, + "test_loss": 2.0131147371292113, + "test_acc": 0.5621, + "lyapunov": null, + "grad_norm": 0.8035713080677088, + "grad_max_sv": 0.3485363688319921, + "grad_min_sv": 1.4229694939721371e-08, + "grad_condition": 57271115.05511497, + "lr": 0.0006742860236609073, + "time_sec": 15.549937725067139 + }, + { + "epoch": 59, + "train_loss": 0.5377489028739929, + "train_acc": 0.82924, + "test_loss": 1.8628471519470216, + "test_acc": 0.5826, + "lyapunov": null, + "grad_norm": 0.791423222073838, + "grad_max_sv": 0.3482122249901295, + "grad_min_sv": 1.4126948262929705e-08, + "grad_condition": 419338835.22695076, + "lr": 0.0006644333233692913, + "time_sec": 15.527005434036255 + }, + { + "epoch": 60, + "train_loss": 0.5309908809089661, + "train_acc": 0.83234, + "test_loss": 1.8920386169433594, + "test_acc": 0.5797, + "lyapunov": null, + "grad_norm": 0.7863919696739998, + "grad_max_sv": 0.34046448543667795, + "grad_min_sv": 1.4143183188443028e-08, + "grad_condition": 568996122.5074177, + "lr": 0.0006545084971874734, + "time_sec": 15.548128843307495 + }, + { + "epoch": 61, + "train_loss": 0.5203311266136169, + "train_acc": 0.83484, + "test_loss": 1.9649493141174317, + "test_acc": 0.5687, + "lyapunov": null, + "grad_norm": 0.7768824997531635, + "grad_max_sv": 0.33470223769545554, + "grad_min_sv": 1.3756740831205594e-08, + "grad_condition": 127184951.10137768, + "lr": 0.0006445158984722354, + "time_sec": 15.560498714447021 + }, + { + "epoch": 62, + "train_loss": 0.5145069622135162, + "train_acc": 0.83484, + "test_loss": 1.9193354610443116, + "test_acc": 0.5768, + "lyapunov": null, + "grad_norm": 0.7768992242165623, + "grad_max_sv": 0.3374949935823679, + "grad_min_sv": 1.392062900142793e-08, + "grad_condition": 269252680.5306621, + "lr": 0.0006344599103076324, + "time_sec": 15.54216456413269 + }, + { + "epoch": 63, + "train_loss": 0.4961839492988586, + "train_acc": 0.84094, + "test_loss": 1.9531686166763305, + "test_acc": 0.5774, + "lyapunov": null, + "grad_norm": 0.7656554601321728, + "grad_max_sv": 0.3305441617965698, + "grad_min_sv": 1.350646871936149e-08, + "grad_condition": 6718951699.483927, + "lr": 0.0006243449435824269, + "time_sec": 15.524494886398315 + }, + { + "epoch": 64, + "train_loss": 0.4901823128700256, + "train_acc": 0.84378, + "test_loss": 1.916199884033203, + "test_acc": 0.5838, + "lyapunov": null, + "grad_norm": 0.7568470873721883, + "grad_max_sv": 0.3358922269195318, + "grad_min_sv": 1.3828968241716421e-08, + "grad_condition": 105377056.99567077, + "lr": 0.0006141754350553275, + "time_sec": 15.523052453994751 + }, + { + "epoch": 65, + "train_loss": 0.4791102393913269, + "train_acc": 0.84696, + "test_loss": 1.966923655128479, + "test_acc": 0.5744, + "lyapunov": null, + "grad_norm": 0.7524565950871801, + "grad_max_sv": 0.3334443997591734, + "grad_min_sv": 1.3628257438660571e-08, + "grad_condition": 1358568690.118565, + "lr": 0.0006039558454088793, + "time_sec": 15.542505741119385 + }, + { + "epoch": 66, + "train_loss": 0.4763075370979309, + "train_acc": 0.8466, + "test_loss": 2.0256323554992677, + "test_acc": 0.5715, + "lyapunov": null, + "grad_norm": 0.7479103571543138, + "grad_max_sv": 0.3313276808708906, + "grad_min_sv": 1.3539888895144903e-08, + "grad_condition": 95123075.17637601, + "lr": 0.000593690657292862, + "time_sec": 15.52782130241394 + }, + { + "epoch": 67, + "train_loss": 0.46114027640342714, + "train_acc": 0.85298, + "test_loss": 1.9059690628051758, + "test_acc": 0.5841, + "lyapunov": null, + "grad_norm": 0.7326621356364718, + "grad_max_sv": 0.31032404750585557, + "grad_min_sv": 1.290734452954437e-08, + "grad_condition": 1707779953.730576, + "lr": 0.0005833843733580507, + "time_sec": 15.55374813079834 + }, + { + "epoch": 68, + "train_loss": 0.44383577558517456, + "train_acc": 0.8584, + "test_loss": 1.9568644897460938, + "test_acc": 0.5843, + "lyapunov": null, + "grad_norm": 0.725687077482003, + "grad_max_sv": 0.3219859037548304, + "grad_min_sv": 1.2856303070697337e-08, + "grad_condition": 703953775.4983035, + "lr": 0.0005730415142812054, + "time_sec": 15.519795656204224 + }, + { + "epoch": 69, + "train_loss": 0.4424840718173981, + "train_acc": 0.85716, + "test_loss": 1.9289333599090577, + "test_acc": 0.5821, + "lyapunov": null, + "grad_norm": 0.7262659565623177, + "grad_max_sv": 0.3170352976769209, + "grad_min_sv": 1.2696636278106133e-08, + "grad_condition": 98778791.72991131, + "lr": 0.0005626666167821517, + "time_sec": 15.529230833053589 + }, + { + "epoch": 70, + "train_loss": 0.4398577031803131, + "train_acc": 0.85766, + "test_loss": 2.0977408306121825, + "test_acc": 0.5633, + "lyapunov": null, + "grad_norm": 0.728893181798991, + "grad_max_sv": 0.31492993645370004, + "grad_min_sv": 1.2796445524737576e-08, + "grad_condition": 90590113.78796592, + "lr": 0.0005522642316338265, + "time_sec": 15.529253244400024 + }, + { + "epoch": 71, + "train_loss": 0.4278151651573181, + "train_acc": 0.86234, + "test_loss": 1.921709558868408, + "test_acc": 0.5935, + "lyapunov": null, + "grad_norm": 0.7119527931237094, + "grad_max_sv": 0.31725598126649857, + "grad_min_sv": 1.2717853704533044e-08, + "grad_condition": 86258191.35057445, + "lr": 0.0005418389216661573, + "time_sec": 15.547401189804077 + }, + { + "epoch": 72, + "train_loss": 0.4124197146320343, + "train_acc": 0.86642, + "test_loss": 1.924353583908081, + "test_acc": 0.5915, + "lyapunov": null, + "grad_norm": 0.7082065157708266, + "grad_max_sv": 0.31442847587168216, + "grad_min_sv": 1.2634722947654082e-08, + "grad_condition": 597381800.0220104, + "lr": 0.0005313952597646563, + "time_sec": 15.526617527008057 + }, + { + "epoch": 73, + "train_loss": 0.40527023687362673, + "train_acc": 0.86938, + "test_loss": 1.971421655845642, + "test_acc": 0.5873, + "lyapunov": null, + "grad_norm": 0.6972509597964054, + "grad_max_sv": 0.30321186445653436, + "grad_min_sv": 1.2183027311507902e-08, + "grad_condition": 659840426.4881967, + "lr": 0.0005209378268645994, + "time_sec": 15.524028062820435 + }, + { + "epoch": 74, + "train_loss": 0.4031702409172058, + "train_acc": 0.86922, + "test_loss": 1.8892217210769653, + "test_acc": 0.5929, + "lyapunov": null, + "grad_norm": 0.6960139640264162, + "grad_max_sv": 0.31964847445487976, + "grad_min_sv": 1.2496163657663021e-08, + "grad_condition": 5526093760.284935, + "lr": 0.0005104712099416781, + "time_sec": 15.541268587112427 + }, + { + "epoch": 75, + "train_loss": 0.39247145907402037, + "train_acc": 0.8737, + "test_loss": 1.9193254402160644, + "test_acc": 0.5911, + "lyapunov": null, + "grad_norm": 0.6938082468572513, + "grad_max_sv": 0.306133383885026, + "grad_min_sv": 1.243469968555122e-08, + "grad_condition": 90770008.46636352, + "lr": 0.0004999999999999996, + "time_sec": 15.528103828430176 + }, + { + "epoch": 76, + "train_loss": 0.3918505529499054, + "train_acc": 0.87434, + "test_loss": 1.9542344440460204, + "test_acc": 0.5867, + "lyapunov": null, + "grad_norm": 0.6912213215583259, + "grad_max_sv": 0.30644708313047886, + "grad_min_sv": 1.2129230076178207e-08, + "grad_condition": 656508646.5699027, + "lr": 0.0004895287900583212, + "time_sec": 15.522168397903442 + }, + { + "epoch": 77, + "train_loss": 0.3794186065292358, + "train_acc": 0.87798, + "test_loss": 1.9260537242889404, + "test_acc": 0.5966, + "lyapunov": null, + "grad_norm": 0.6834830854985271, + "grad_max_sv": 0.3064906165003777, + "grad_min_sv": 1.1955120489751114e-08, + "grad_condition": 122103850.24004915, + "lr": 0.0004790621731353997, + "time_sec": 15.545487880706787 + }, + { + "epoch": 78, + "train_loss": 0.3696615171527863, + "train_acc": 0.8798, + "test_loss": 1.946743204498291, + "test_acc": 0.5926, + "lyapunov": null, + "grad_norm": 0.6767619134211336, + "grad_max_sv": 0.2977776523679495, + "grad_min_sv": 1.1791637707144615e-08, + "grad_condition": 372588324.2891523, + "lr": 0.000468604740235343, + "time_sec": 15.535629272460938 + }, + { + "epoch": 79, + "train_loss": 0.36537619757652284, + "train_acc": 0.88174, + "test_loss": 1.9460959537506104, + "test_acc": 0.5885, + "lyapunov": null, + "grad_norm": 0.6711953545344299, + "grad_max_sv": 0.2986964497715235, + "grad_min_sv": 1.177440820238594e-08, + "grad_condition": 589214191.9810541, + "lr": 0.00045816107833384175, + "time_sec": 15.525192499160767 + }, + { + "epoch": 80, + "train_loss": 0.3601113852787018, + "train_acc": 0.88298, + "test_loss": 1.987246592903137, + "test_acc": 0.5835, + "lyapunov": null, + "grad_norm": 0.6681297057813997, + "grad_max_sv": 0.2975290589034557, + "grad_min_sv": 1.1789076133361665e-08, + "grad_condition": 1583385514.8496976, + "lr": 0.0004477357683661729, + "time_sec": 15.530385732650757 + }, + { + "epoch": 81, + "train_loss": 0.3518340720653534, + "train_acc": 0.8847, + "test_loss": 1.9567889921188355, + "test_acc": 0.5931, + "lyapunov": null, + "grad_norm": 0.6659585947439052, + "grad_max_sv": 0.295102783292532, + "grad_min_sv": 1.1431068634628477e-08, + "grad_condition": 804368035.7057787, + "lr": 0.00043733338321784746, + "time_sec": 15.546995878219604 + }, + { + "epoch": 82, + "train_loss": 0.3462408744335175, + "train_acc": 0.88646, + "test_loss": 2.007093822479248, + "test_acc": 0.5852, + "lyapunov": null, + "grad_norm": 0.6586634750679704, + "grad_max_sv": 0.2972933381795883, + "grad_min_sv": 1.1704448067500172e-08, + "grad_condition": 977173625.5351397, + "lr": 0.0004269584857187939, + "time_sec": 15.535587310791016 + }, + { + "epoch": 83, + "train_loss": 0.33747674790382387, + "train_acc": 0.89044, + "test_loss": 1.9526693616867066, + "test_acc": 0.5917, + "lyapunov": null, + "grad_norm": 0.6508247061578019, + "grad_max_sv": 0.297639737278223, + "grad_min_sv": 1.1361412798581439e-08, + "grad_condition": 128555083.59517927, + "lr": 0.0004166156266419484, + "time_sec": 15.536566257476807 + }, + { + "epoch": 84, + "train_loss": 0.3325590915679932, + "train_acc": 0.89126, + "test_loss": 1.9067222114562987, + "test_acc": 0.6011, + "lyapunov": null, + "grad_norm": 0.6522973167379151, + "grad_max_sv": 0.281706926971674, + "grad_min_sv": 1.10261386872864e-08, + "grad_condition": 623262716.1426824, + "lr": 0.0004063093427071373, + "time_sec": 15.52798342704773 + }, + { + "epoch": 85, + "train_loss": 0.3278141854572296, + "train_acc": 0.89518, + "test_loss": 1.9726215780258178, + "test_acc": 0.594, + "lyapunov": null, + "grad_norm": 0.643823853564667, + "grad_max_sv": 0.2927782468497753, + "grad_min_sv": 1.1309383348302033e-08, + "grad_condition": 547831013.5772574, + "lr": 0.0003960441545911199, + "time_sec": 15.53898549079895 + }, + { + "epoch": 86, + "train_loss": 0.317587457818985, + "train_acc": 0.89712, + "test_loss": 1.9282952379226685, + "test_acc": 0.5968, + "lyapunov": null, + "grad_norm": 0.6371168124609629, + "grad_max_sv": 0.29028595611453056, + "grad_min_sv": 1.147984300944524e-08, + "grad_condition": 268906193.5734116, + "lr": 0.0003858245649446718, + "time_sec": 15.529613733291626 + }, + { + "epoch": 87, + "train_loss": 0.3119666923427582, + "train_acc": 0.89872, + "test_loss": 1.991708751106262, + "test_acc": 0.5956, + "lyapunov": null, + "grad_norm": 0.6329581145453558, + "grad_max_sv": 0.2849379751831293, + "grad_min_sv": 1.1153094022810228e-08, + "grad_condition": 266977673.1074769, + "lr": 0.00037565505641757235, + "time_sec": 15.539918661117554 + }, + { + "epoch": 88, + "train_loss": 0.304864205904007, + "train_acc": 0.90146, + "test_loss": 1.9851121433258057, + "test_acc": 0.595, + "lyapunov": null, + "grad_norm": 0.6285460294125618, + "grad_max_sv": 0.28998454511165617, + "grad_min_sv": 1.1332873445842746e-08, + "grad_condition": 289764591.30223703, + "lr": 0.00036554008969236695, + "time_sec": 15.521661520004272 + }, + { + "epoch": 89, + "train_loss": 0.30015240715026853, + "train_acc": 0.90194, + "test_loss": 2.0606800762176514, + "test_acc": 0.5865, + "lyapunov": null, + "grad_norm": 0.6267515983958646, + "grad_max_sv": 0.2926571309566498, + "grad_min_sv": 1.1169707006541962e-08, + "grad_condition": 128543979.97327559, + "lr": 0.0003554841015277638, + "time_sec": 15.544517040252686 + }, + { + "epoch": 90, + "train_loss": 0.2928112324333191, + "train_acc": 0.90618, + "test_loss": 1.9894328233718872, + "test_acc": 0.5946, + "lyapunov": null, + "grad_norm": 0.6130362562659067, + "grad_max_sv": 0.278825618699193, + "grad_min_sv": 1.0737035230270337e-08, + "grad_condition": 293449090.58323187, + "lr": 0.000345491502812526, + "time_sec": 15.550155401229858 + }, + { + "epoch": 91, + "train_loss": 0.2888556646347046, + "train_acc": 0.9048, + "test_loss": 2.049033945083618, + "test_acc": 0.5946, + "lyapunov": null, + "grad_norm": 0.6141720017951389, + "grad_max_sv": 0.2722177982330322, + "grad_min_sv": 1.0853245450406431e-08, + "grad_condition": 416564856.83874714, + "lr": 0.0003355666766307081, + "time_sec": 15.540212392807007 + }, + { + "epoch": 92, + "train_loss": 0.28862955547332764, + "train_acc": 0.90606, + "test_loss": 1.9920015350341798, + "test_acc": 0.5932, + "lyapunov": null, + "grad_norm": 0.6131904596449147, + "grad_max_sv": 0.27554026171565055, + "grad_min_sv": 1.072076380140459e-08, + "grad_condition": 1434525113.8124838, + "lr": 0.00032571397633909225, + "time_sec": 15.533208847045898 + }, + { + "epoch": 93, + "train_loss": 0.27849696086883546, + "train_acc": 0.9088, + "test_loss": 2.040655344772339, + "test_acc": 0.5953, + "lyapunov": null, + "grad_norm": 0.6038389917635373, + "grad_max_sv": 0.28117162361741066, + "grad_min_sv": 1.0650112780303394e-08, + "grad_condition": 424978967.5658449, + "lr": 0.00031593772365766094, + "time_sec": 15.551164865493774 + }, + { + "epoch": 94, + "train_loss": 0.2785502600288391, + "train_acc": 0.90902, + "test_loss": 2.0051936563491823, + "test_acc": 0.5956, + "lyapunov": null, + "grad_norm": 0.6035472955614215, + "grad_max_sv": 0.2856413472443819, + "grad_min_sv": 1.0634489876464731e-08, + "grad_condition": 208372273.8776492, + "lr": 0.0003062422067739483, + "time_sec": 15.564072608947754 + }, + { + "epoch": 95, + "train_loss": 0.26930244629859923, + "train_acc": 0.91258, + "test_loss": 2.040685438156128, + "test_acc": 0.594, + "lyapunov": null, + "grad_norm": 0.5913034236526281, + "grad_max_sv": 0.2773492123931646, + "grad_min_sv": 1.0436666836267581e-08, + "grad_condition": 707180505.7410402, + "lr": 0.00029663167846209965, + "time_sec": 15.536799669265747 + }, + { + "epoch": 96, + "train_loss": 0.2629419521713257, + "train_acc": 0.91478, + "test_loss": 2.049863017845154, + "test_acc": 0.5955, + "lyapunov": null, + "grad_norm": 0.5892858525841755, + "grad_max_sv": 0.2767842046916485, + "grad_min_sv": 1.0442346364686328e-08, + "grad_condition": 614093660.6555232, + "lr": 0.00028711035421746345, + "time_sec": 15.535489082336426 + }, + { + "epoch": 97, + "train_loss": 0.2566527827835083, + "train_acc": 0.91688, + "test_loss": 1.9312515392303466, + "test_acc": 0.61, + "lyapunov": null, + "grad_norm": 0.5789114105636759, + "grad_max_sv": 0.27370760031044483, + "grad_min_sv": 1.0440373288947078e-08, + "grad_condition": 395918905.44726604, + "lr": 0.00027768241040753615, + "time_sec": 15.557752132415771 + }, + { + "epoch": 98, + "train_loss": 0.2562578124713898, + "train_acc": 0.91532, + "test_loss": 1.9752160369873046, + "test_acc": 0.6068, + "lyapunov": null, + "grad_norm": 0.5860500863606897, + "grad_max_sv": 0.2706368513405323, + "grad_min_sv": 1.0393827978068954e-08, + "grad_condition": 238197929.67103285, + "lr": 0.00026835198244006903, + "time_sec": 15.544656753540039 + }, + { + "epoch": 99, + "train_loss": 0.24837030095100404, + "train_acc": 0.91922, + "test_loss": 2.085749612236023, + "test_acc": 0.5979, + "lyapunov": null, + "grad_norm": 0.5764803222767428, + "grad_max_sv": 0.27518525198101995, + "grad_min_sv": 1.0323591131044738e-08, + "grad_condition": 442181147.42095405, + "lr": 0.0002591231629491421, + "time_sec": 15.551199913024902 + }, + { + "epoch": 100, + "train_loss": 0.24750245269298554, + "train_acc": 0.91996, + "test_loss": 2.0216005535125734, + "test_acc": 0.5971, + "lyapunov": null, + "grad_norm": 0.5732281028086655, + "grad_max_sv": 0.2629762265831232, + "grad_min_sv": 1.018690741006259e-08, + "grad_condition": 228438659.32854, + "lr": 0.0002499999999999997, + "time_sec": 15.537281274795532 + }, + { + "epoch": 101, + "train_loss": 0.2413197231388092, + "train_acc": 0.9207, + "test_loss": 2.0327822509765623, + "test_acc": 0.5987, + "lyapunov": null, + "grad_norm": 0.5699929454007691, + "grad_max_sv": 0.2677549198269844, + "grad_min_sv": 1.0395906519314324e-08, + "grad_condition": 135340876.85474354, + "lr": 0.00024098649531343477, + "time_sec": 15.584813833236694 + }, + { + "epoch": 102, + "train_loss": 0.23438371506214142, + "train_acc": 0.92444, + "test_loss": 1.9691780755996704, + "test_acc": 0.6057, + "lyapunov": null, + "grad_norm": 0.5568861771033957, + "grad_max_sv": 0.26255625002086164, + "grad_min_sv": 1.0066820231081387e-08, + "grad_condition": 827084993.1357218, + "lr": 0.0002320866025105016, + "time_sec": 15.564095973968506 + }, + { + "epoch": 103, + "train_loss": 0.23686029078006746, + "train_acc": 0.9227, + "test_loss": 2.033883098602295, + "test_acc": 0.5965, + "lyapunov": null, + "grad_norm": 0.5613045577897411, + "grad_max_sv": 0.26336216777563093, + "grad_min_sv": 1.018771148546694e-08, + "grad_condition": 1162624760.318234, + "lr": 0.0002233042253783278, + "time_sec": 15.555514812469482 + }, + { + "epoch": 104, + "train_loss": 0.232201413936615, + "train_acc": 0.92396, + "test_loss": 1.9919283714294433, + "test_acc": 0.6038, + "lyapunov": null, + "grad_norm": 0.5589204345244685, + "grad_max_sv": 0.2624808818101883, + "grad_min_sv": 9.888480128086537e-09, + "grad_condition": 5125006664.350008, + "lr": 0.000214643216157784, + "time_sec": 15.55103611946106 + }, + { + "epoch": 105, + "train_loss": 0.22536927486419678, + "train_acc": 0.92692, + "test_loss": 2.0385340311050415, + "test_acc": 0.5947, + "lyapunov": null, + "grad_norm": 0.5535124902950697, + "grad_max_sv": 0.2575108613818884, + "grad_min_sv": 9.755115641402884e-09, + "grad_condition": 166338617.99336535, + "lr": 0.00020610737385376332, + "time_sec": 15.542803525924683 + }, + { + "epoch": 106, + "train_loss": 0.22605940510749817, + "train_acc": 0.92676, + "test_loss": 2.030563621902466, + "test_acc": 0.6007, + "lyapunov": null, + "grad_norm": 0.547779700018845, + "grad_max_sv": 0.25856886617839336, + "grad_min_sv": 9.660613463965267e-09, + "grad_condition": 255054607.73465315, + "lr": 0.00019770044256881242, + "time_sec": 15.550171136856079 + }, + { + "epoch": 107, + "train_loss": 0.22419200974464418, + "train_acc": 0.92824, + "test_loss": 1.9967736017227173, + "test_acc": 0.6058, + "lyapunov": null, + "grad_norm": 0.5499143700914649, + "grad_max_sv": 0.2611769150942564, + "grad_min_sv": 9.635462525471942e-09, + "grad_condition": 860011953.8858073, + "lr": 0.0001894261098608447, + "time_sec": 15.55410885810852 + }, + { + "epoch": 108, + "train_loss": 0.21630392609596252, + "train_acc": 0.9302, + "test_loss": 2.0519058053970336, + "test_acc": 0.5999, + "lyapunov": null, + "grad_norm": 0.5416266971698476, + "grad_max_sv": 0.26166511699557304, + "grad_min_sv": 9.752643477891654e-09, + "grad_condition": 3236269240.990809, + "lr": 0.000181288005125655, + "time_sec": 15.574140548706055 + }, + { + "epoch": 109, + "train_loss": 0.21062327845573425, + "train_acc": 0.93214, + "test_loss": 2.0300213758468626, + "test_acc": 0.6092, + "lyapunov": null, + "grad_norm": 0.5343489109994392, + "grad_max_sv": 0.25067234598100185, + "grad_min_sv": 9.564686373475517e-09, + "grad_condition": 72260141.60705423, + "lr": 0.0001732896980049473, + "time_sec": 15.548709154129028 + }, + { + "epoch": 110, + "train_loss": 0.21378290111541748, + "train_acc": 0.93186, + "test_loss": 1.967118263244629, + "test_acc": 0.6118, + "lyapunov": null, + "grad_norm": 0.5338327962076629, + "grad_max_sv": 0.25025314278900623, + "grad_min_sv": 9.40962894390579e-09, + "grad_condition": 170096554.9122977, + "lr": 0.00016543469682057076, + "time_sec": 15.540042638778687 + }, + { + "epoch": 111, + "train_loss": 0.201287554397583, + "train_acc": 0.9354, + "test_loss": 2.038306018638611, + "test_acc": 0.6008, + "lyapunov": null, + "grad_norm": 0.5239300445404682, + "grad_max_sv": 0.2577681414783001, + "grad_min_sv": 9.631198439469246e-09, + "grad_condition": 1749324651.4574604, + "lr": 0.00015772644703565552, + "time_sec": 15.548538446426392 + }, + { + "epoch": 112, + "train_loss": 0.2000931690311432, + "train_acc": 0.9347, + "test_loss": 2.0612026218414305, + "test_acc": 0.6032, + "lyapunov": null, + "grad_norm": 0.5260259376709223, + "grad_max_sv": 0.24985811933875085, + "grad_min_sv": 9.245042727136672e-09, + "grad_condition": 648150053.3842711, + "lr": 0.00015016832974331713, + "time_sec": 15.553885459899902 + }, + { + "epoch": 113, + "train_loss": 0.19753471722126006, + "train_acc": 0.93784, + "test_loss": 2.022400039100647, + "test_acc": 0.608, + "lyapunov": null, + "grad_norm": 0.5176321747709245, + "grad_max_sv": 0.2558797553181648, + "grad_min_sv": 9.707446643920925e-09, + "grad_condition": 315709221.54881674, + "lr": 0.00014276366018359834, + "time_sec": 15.539334297180176 + }, + { + "epoch": 114, + "train_loss": 0.19809397587776184, + "train_acc": 0.93654, + "test_loss": 2.0101557178497313, + "test_acc": 0.6125, + "lyapunov": null, + "grad_norm": 0.5250620048665217, + "grad_max_sv": 0.26220443546772004, + "grad_min_sv": 9.708422499471806e-09, + "grad_condition": 1735224596.1306622, + "lr": 0.00013551568628929425, + "time_sec": 15.544908046722412 + }, + { + "epoch": 115, + "train_loss": 0.19545854469299317, + "train_acc": 0.93772, + "test_loss": 2.030077984619141, + "test_acc": 0.6083, + "lyapunov": null, + "grad_norm": 0.5159095993296826, + "grad_max_sv": 0.25392336696386336, + "grad_min_sv": 9.075509158204195e-09, + "grad_condition": 387258285.34785974, + "lr": 0.00012842758726130276, + "time_sec": 15.545970439910889 + }, + { + "epoch": 116, + "train_loss": 0.1940010940551758, + "train_acc": 0.93664, + "test_loss": 2.055483460998535, + "test_acc": 0.6076, + "lyapunov": null, + "grad_norm": 0.5167827048953452, + "grad_max_sv": 0.24668554440140725, + "grad_min_sv": 9.22858311314806e-09, + "grad_condition": 143532705.50095612, + "lr": 0.0001215024721741218, + "time_sec": 15.540485620498657 + }, + { + "epoch": 117, + "train_loss": 0.19125311409950257, + "train_acc": 0.93884, + "test_loss": 2.056917554664612, + "test_acc": 0.6091, + "lyapunov": null, + "grad_norm": 0.5127430440891717, + "grad_max_sv": 0.2540026530623436, + "grad_min_sv": 9.185630342012189e-09, + "grad_condition": 963637817.0719798, + "lr": 0.00011474337861210538, + "time_sec": 15.524260759353638 + }, + { + "epoch": 118, + "train_loss": 0.19195901846885682, + "train_acc": 0.93844, + "test_loss": 2.0476279891967772, + "test_acc": 0.6091, + "lyapunov": null, + "grad_norm": 0.5143264365358208, + "grad_max_sv": 0.24739750139415265, + "grad_min_sv": 9.107876060114595e-09, + "grad_condition": 132060377.42390358, + "lr": 0.00010815327133708009, + "time_sec": 15.53121542930603 + }, + { + "epoch": 119, + "train_loss": 0.18706596221923827, + "train_acc": 0.9397, + "test_loss": 2.0857824016571045, + "test_acc": 0.6034, + "lyapunov": null, + "grad_norm": 0.5075097810084265, + "grad_max_sv": 0.24752915948629378, + "grad_min_sv": 9.200760431879798e-09, + "grad_condition": 434415663.04498273, + "lr": 0.00010173504098790182, + "time_sec": 15.540568828582764 + }, + { + "epoch": 120, + "train_loss": 0.18225831587314606, + "train_acc": 0.94122, + "test_loss": 2.0366894691467285, + "test_acc": 0.6099, + "lyapunov": null, + "grad_norm": 0.5003733018103885, + "grad_max_sv": 0.24654436334967614, + "grad_min_sv": 8.9422030484336e-09, + "grad_condition": 211858931.75925827, + "lr": 9.549150281252629e-05, + "time_sec": 15.564785957336426 + }, + { + "epoch": 121, + "train_loss": 0.18144633610725402, + "train_acc": 0.94162, + "test_loss": 2.018186179161072, + "test_acc": 0.6095, + "lyapunov": null, + "grad_norm": 0.4997667364187892, + "grad_max_sv": 0.2531637907028198, + "grad_min_sv": 9.341298896859903e-09, + "grad_condition": 464581409.54865587, + "lr": 8.942539543314794e-05, + "time_sec": 15.542123794555664 + }, + { + "epoch": 122, + "train_loss": 0.17677358429670334, + "train_acc": 0.94476, + "test_loss": 2.0442467012405396, + "test_acc": 0.6104, + "lyapunov": null, + "grad_norm": 0.4916910301577915, + "grad_max_sv": 0.24300660379230976, + "grad_min_sv": 9.315408781591233e-09, + "grad_condition": 418841824.3271101, + "lr": 8.353937964495024e-05, + "time_sec": 15.552602052688599 + }, + { + "epoch": 123, + "train_loss": 0.17309163184165954, + "train_acc": 0.94522, + "test_loss": 2.0207081670761107, + "test_acc": 0.615, + "lyapunov": null, + "grad_norm": 0.48870360224982806, + "grad_max_sv": 0.24264803603291513, + "grad_min_sv": 9.069228867680454e-09, + "grad_condition": 399150476.4316398, + "lr": 7.783603724899243e-05, + "time_sec": 15.560430765151978 + }, + { + "epoch": 124, + "train_loss": 0.17446059901714325, + "train_acc": 0.9439, + "test_loss": 2.080603874015808, + "test_acc": 0.6085, + "lyapunov": null, + "grad_norm": 0.49174251747904896, + "grad_max_sv": 0.24468368366360665, + "grad_min_sv": 8.949146113480106e-09, + "grad_condition": 452231631.8653839, + "lr": 7.231786991974666e-05, + "time_sec": 15.547534704208374 + }, + { + "epoch": 125, + "train_loss": 0.17117922018289566, + "train_acc": 0.94586, + "test_loss": 2.0775406326293946, + "test_acc": 0.6076, + "lyapunov": null, + "grad_norm": 0.4857512368977778, + "grad_max_sv": 0.23816991709172725, + "grad_min_sv": 8.740880118790266e-09, + "grad_condition": 1742259896.8071132, + "lr": 6.698729810778072e-05, + "time_sec": 15.556484937667847 + }, + { + "epoch": 126, + "train_loss": 0.17421807815074922, + "train_acc": 0.94434, + "test_loss": 2.0295333658218384, + "test_acc": 0.6116, + "lyapunov": null, + "grad_norm": 0.49199845150851745, + "grad_max_sv": 0.24616678878664972, + "grad_min_sv": 9.086304337581342e-09, + "grad_condition": 154095678.05538416, + "lr": 6.184665997806817e-05, + "time_sec": 15.563019275665283 + }, + { + "epoch": 127, + "train_loss": 0.17114187426567076, + "train_acc": 0.94642, + "test_loss": 2.01974128074646, + "test_acc": 0.6149, + "lyapunov": null, + "grad_norm": 0.48631942594512845, + "grad_max_sv": 0.23593781404197217, + "grad_min_sv": 8.839875137618692e-09, + "grad_condition": 362954270.15696913, + "lr": 5.6898210384392595e-05, + "time_sec": 15.550469160079956 + }, + { + "epoch": 128, + "train_loss": 0.1715845184803009, + "train_acc": 0.94614, + "test_loss": 2.067046044540405, + "test_acc": 0.6099, + "lyapunov": null, + "grad_norm": 0.4851851184655616, + "grad_max_sv": 0.22355937864631414, + "grad_min_sv": 8.763929938444131e-09, + "grad_condition": 162449459.43029913, + "lr": 5.214411988029363e-05, + "time_sec": 15.565791606903076 + }, + { + "epoch": 129, + "train_loss": 0.166365064535141, + "train_acc": 0.94706, + "test_loss": 2.0589212400436403, + "test_acc": 0.6117, + "lyapunov": null, + "grad_norm": 0.47650662112386427, + "grad_max_sv": 0.23299637958407401, + "grad_min_sv": 8.58995321821772e-09, + "grad_condition": 1187890269.5555089, + "lr": 4.7586473766990294e-05, + "time_sec": 15.547842264175415 + }, + { + "epoch": 130, + "train_loss": 0.16652157067775727, + "train_acc": 0.94746, + "test_loss": 2.0411241458892824, + "test_acc": 0.6139, + "lyapunov": null, + "grad_norm": 0.4829880385745403, + "grad_max_sv": 0.24537450559437274, + "grad_min_sv": 9.046333961733235e-09, + "grad_condition": 1491166621.1768012, + "lr": 4.32272711786996e-05, + "time_sec": 15.533848285675049 + }, + { + "epoch": 131, + "train_loss": 0.1641612592983246, + "train_acc": 0.9484, + "test_loss": 2.0629710180282594, + "test_acc": 0.6096, + "lyapunov": null, + "grad_norm": 0.4752395509385486, + "grad_max_sv": 0.2307592399418354, + "grad_min_sv": 8.615267874231488e-09, + "grad_condition": 711173370.4649035, + "lr": 3.906842420574966e-05, + "time_sec": 15.540260791778564 + }, + { + "epoch": 132, + "train_loss": 0.1616754886674881, + "train_acc": 0.94878, + "test_loss": 2.035876292037964, + "test_acc": 0.6125, + "lyapunov": null, + "grad_norm": 0.47295961532945835, + "grad_max_sv": 0.22868038788437844, + "grad_min_sv": 8.732005874520065e-09, + "grad_condition": 3251118426.1160374, + "lr": 3.5111757055874305e-05, + "time_sec": 15.562166213989258 + }, + { + "epoch": 133, + "train_loss": 0.16217615643501282, + "train_acc": 0.9476, + "test_loss": 2.0445367414474487, + "test_acc": 0.6137, + "lyapunov": null, + "grad_norm": 0.4778570288031603, + "grad_max_sv": 0.2444434817880392, + "grad_min_sv": 8.748851171471025e-09, + "grad_condition": 3796858345.264998, + "lr": 3.1359005254054254e-05, + "time_sec": 15.558940887451172 + }, + { + "epoch": 134, + "train_loss": 0.16224241252422333, + "train_acc": 0.94872, + "test_loss": 1.9999371147155762, + "test_acc": 0.6168, + "lyapunov": null, + "grad_norm": 0.47303885509046817, + "grad_max_sv": 0.24165684916079044, + "grad_min_sv": 9.011136297039368e-09, + "grad_condition": 657651631.009668, + "lr": 2.7811814881259484e-05, + "time_sec": 15.577393770217896 + }, + { + "epoch": 135, + "train_loss": 0.15856130658626558, + "train_acc": 0.94956, + "test_loss": 2.088929622459412, + "test_acc": 0.6086, + "lyapunov": null, + "grad_norm": 0.4705351818898507, + "grad_max_sv": 0.2420681372284889, + "grad_min_sv": 8.753394663621461e-09, + "grad_condition": 235691633.53025714, + "lr": 2.4471741852423218e-05, + "time_sec": 15.547684907913208 + }, + { + "epoch": 136, + "train_loss": 0.16095407760620117, + "train_acc": 0.9499, + "test_loss": 2.0105459590911865, + "test_acc": 0.6149, + "lyapunov": null, + "grad_norm": 0.47206684611132954, + "grad_max_sv": 0.2325299184769392, + "grad_min_sv": 8.340716379021119e-09, + "grad_condition": 213490150.3850596, + "lr": 2.1340251233966362e-05, + "time_sec": 15.550458431243896 + }, + { + "epoch": 137, + "train_loss": 0.15780925776958465, + "train_acc": 0.95028, + "test_loss": 2.0596799072265624, + "test_acc": 0.614, + "lyapunov": null, + "grad_norm": 0.46749802407213686, + "grad_max_sv": 0.23526970595121383, + "grad_min_sv": 8.684439107555993e-09, + "grad_condition": 462893579.51175565, + "lr": 1.8418716601170932e-05, + "time_sec": 15.548266649246216 + }, + { + "epoch": 138, + "train_loss": 0.1587288973045349, + "train_acc": 0.94948, + "test_loss": 2.0551964706420898, + "test_acc": 0.612, + "lyapunov": null, + "grad_norm": 0.47153455446201703, + "grad_max_sv": 0.24219317138195037, + "grad_min_sv": 8.867532288450372e-09, + "grad_condition": 354919003.0421229, + "lr": 1.570841943568445e-05, + "time_sec": 15.554182291030884 + }, + { + "epoch": 139, + "train_loss": 0.15548983236789704, + "train_acc": 0.95098, + "test_loss": 2.1055332246780396, + "test_acc": 0.6091, + "lyapunov": null, + "grad_norm": 0.4659621334711714, + "grad_max_sv": 0.22630110755562782, + "grad_min_sv": 8.369765158895704e-09, + "grad_condition": 288025216.3140677, + "lr": 1.3210548563419845e-05, + "time_sec": 15.554279565811157 + }, + { + "epoch": 140, + "train_loss": 0.15722209004878998, + "train_acc": 0.94932, + "test_loss": 2.0253973304748536, + "test_acc": 0.6144, + "lyapunov": null, + "grad_norm": 0.4671213285512787, + "grad_max_sv": 0.24112530723214148, + "grad_min_sv": 8.799361414860152e-09, + "grad_condition": 101473942.51670267, + "lr": 1.0926199633097203e-05, + "time_sec": 15.565106630325317 + }, + { + "epoch": 141, + "train_loss": 0.1592700968503952, + "train_acc": 0.94924, + "test_loss": 2.0313080627441407, + "test_acc": 0.6149, + "lyapunov": null, + "grad_norm": 0.4699275136234054, + "grad_max_sv": 0.2444250423461199, + "grad_min_sv": 8.847973696464798e-09, + "grad_condition": 908448270.9616123, + "lr": 8.856374635655688e-06, + "time_sec": 15.55463194847107 + }, + { + "epoch": 142, + "train_loss": 0.15532747163295746, + "train_acc": 0.95118, + "test_loss": 2.008699178314209, + "test_acc": 0.6192, + "lyapunov": null, + "grad_norm": 0.4610184251231722, + "grad_max_sv": 0.23061554618179797, + "grad_min_sv": 8.748990629626335e-09, + "grad_condition": 241893946.02809772, + "lr": 7.001981464747503e-06, + "time_sec": 15.561474323272705 + }, + { + "epoch": 143, + "train_loss": 0.15437357861995696, + "train_acc": 0.95214, + "test_loss": 2.0192801219940186, + "test_acc": 0.6131, + "lyapunov": null, + "grad_norm": 0.46171489792310033, + "grad_max_sv": 0.244815981015563, + "grad_min_sv": 8.664128418862618e-09, + "grad_condition": 8281447108.810431, + "lr": 5.3638335185058295e-06, + "time_sec": 15.572490692138672 + }, + { + "epoch": 144, + "train_loss": 0.16084941333293915, + "train_acc": 0.9486, + "test_loss": 2.0608045083999635, + "test_acc": 0.6113, + "lyapunov": null, + "grad_norm": 0.47339200023885886, + "grad_max_sv": 0.2388457827270031, + "grad_min_sv": 9.052978236327724e-09, + "grad_condition": 144494301.9918833, + "lr": 3.942649342761114e-06, + "time_sec": 15.550712585449219 + }, + { + "epoch": 145, + "train_loss": 0.15398479302883147, + "train_acc": 0.95164, + "test_loss": 2.015725050163269, + "test_acc": 0.6168, + "lyapunov": null, + "grad_norm": 0.4622016974922406, + "grad_max_sv": 0.23529170602560043, + "grad_min_sv": 8.609785807759709e-09, + "grad_condition": 1465136062.1413925, + "lr": 2.7390523158633524e-06, + "time_sec": 15.54736614227295 + }, + { + "epoch": 146, + "train_loss": 0.15756463160991668, + "train_acc": 0.94924, + "test_loss": 2.0068264724731444, + "test_acc": 0.6149, + "lyapunov": null, + "grad_norm": 0.4677425501468377, + "grad_max_sv": 0.23726253286004068, + "grad_min_sv": 9.065553345998738e-09, + "grad_condition": 1852729982.027478, + "lr": 1.7535703752478133e-06, + "time_sec": 15.577149868011475 + }, + { + "epoch": 147, + "train_loss": 0.15230673624992372, + "train_acc": 0.95226, + "test_loss": 2.0538794567108156, + "test_acc": 0.6143, + "lyapunov": null, + "grad_norm": 0.46178217514626596, + "grad_max_sv": 0.23420043475925922, + "grad_min_sv": 8.910292598023062e-09, + "grad_condition": 1115752222.2799745, + "lr": 9.866357858642196e-07, + "time_sec": 15.582788944244385 + }, + { + "epoch": 148, + "train_loss": 0.15486355890750886, + "train_acc": 0.95204, + "test_loss": 2.0418140579223634, + "test_acc": 0.611, + "lyapunov": null, + "grad_norm": 0.4626677417444915, + "grad_max_sv": 0.2311597354710102, + "grad_min_sv": 8.61424796008703e-09, + "grad_condition": 292353255.78508246, + "lr": 4.38584950570808e-07, + "time_sec": 15.558593273162842 + }, + { + "epoch": 149, + "train_loss": 0.15376032871723175, + "train_acc": 0.95072, + "test_loss": 2.0254113912582397, + "test_acc": 0.6152, + "lyapunov": null, + "grad_norm": 0.46378445338582247, + "grad_max_sv": 0.23868124112486838, + "grad_min_sv": 8.802115413756421e-09, + "grad_condition": 8819983975.28751, + "lr": 1.096582625772501e-07, + "time_sec": 15.582695960998535 + }, + { + "epoch": 150, + "train_loss": 0.15166712173461913, + "train_acc": 0.95298, + "test_loss": 2.0302507425308227, + "test_acc": 0.6145, + "lyapunov": null, + "grad_norm": 0.4579039358283547, + "grad_max_sv": 0.23529550824314355, + "grad_min_sv": 8.516837371203706e-09, + "grad_condition": 498601418.09154, + "lr": 0.0, + "time_sec": 15.550086498260498 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 4.614874582061767, + "train_acc": 0.06156, + "test_loss": 4.38669578704834, + "test_acc": 0.0657, + "lyapunov": null, + "grad_norm": 6.323308428814374, + "grad_max_sv": 5.359960746765137, + "grad_min_sv": 1.1092787926547665e-07, + "grad_condition": 241840462.01864615, + "lr": 0.0009998903417374227, + "time_sec": 32.694570779800415 + }, + { + "epoch": 2, + "train_loss": 3.912782407989502, + "train_acc": 0.12028, + "test_loss": 3.848427723312378, + "test_acc": 0.118, + "lyapunov": null, + "grad_norm": 4.77324154514733, + "grad_max_sv": 4.041838210821152, + "grad_min_sv": 8.605790392801627e-08, + "grad_condition": 202220647.26193482, + "lr": 0.0009995614150494292, + "time_sec": 32.55419659614563 + }, + { + "epoch": 3, + "train_loss": 3.5573863899230957, + "train_acc": 0.1643, + "test_loss": 3.6023266105651857, + "test_acc": 0.1585, + "lyapunov": null, + "grad_norm": 3.9026523361265673, + "grad_max_sv": 3.171142542362213, + "grad_min_sv": 7.174145993937842e-08, + "grad_condition": 60006708.94719837, + "lr": 0.0009990133642141358, + "time_sec": 32.57006239891052 + }, + { + "epoch": 4, + "train_loss": 3.2918895013427734, + "train_acc": 0.20484, + "test_loss": 3.40032841796875, + "test_acc": 0.1921, + "lyapunov": null, + "grad_norm": 3.296225475753861, + "grad_max_sv": 2.489927414059639, + "grad_min_sv": 6.087895453865678e-08, + "grad_condition": 84801852.08756194, + "lr": 0.0009982464296247522, + "time_sec": 32.551385164260864 + }, + { + "epoch": 5, + "train_loss": 3.0701215673065185, + "train_acc": 0.24178, + "test_loss": 3.1757254974365234, + "test_acc": 0.2263, + "lyapunov": null, + "grad_norm": 2.80278826466115, + "grad_max_sv": 1.9542321234941482, + "grad_min_sv": 5.1833250980237724e-08, + "grad_condition": 47076784.610062554, + "lr": 0.0009972609476841367, + "time_sec": 32.58115863800049 + }, + { + "epoch": 6, + "train_loss": 2.87079267288208, + "train_acc": 0.28012, + "test_loss": 3.024337570953369, + "test_acc": 0.2535, + "lyapunov": null, + "grad_norm": 2.403603088144213, + "grad_max_sv": 1.5701265573501586, + "grad_min_sv": 4.505473518712222e-08, + "grad_condition": 43327775.32023618, + "lr": 0.000996057350657239, + "time_sec": 32.5962495803833 + }, + { + "epoch": 7, + "train_loss": 2.693065844192505, + "train_acc": 0.31204, + "test_loss": 2.797925431442261, + "test_acc": 0.299, + "lyapunov": null, + "grad_norm": 2.107409497681618, + "grad_max_sv": 1.2474446296691895, + "grad_min_sv": 3.9491370495969844e-08, + "grad_condition": 40839114.91512512, + "lr": 0.000994636166481494, + "time_sec": 32.57605028152466 + }, + { + "epoch": 8, + "train_loss": 2.5460816731262206, + "train_acc": 0.34202, + "test_loss": 2.8177419860839845, + "test_acc": 0.3075, + "lyapunov": null, + "grad_norm": 1.9185526453264143, + "grad_max_sv": 1.0886232659220696, + "grad_min_sv": 3.5954989208164534e-08, + "grad_condition": 44071046.37090768, + "lr": 0.0009929980185352525, + "time_sec": 32.57583284378052 + }, + { + "epoch": 9, + "train_loss": 2.4140372009277344, + "train_acc": 0.3688, + "test_loss": 2.758051406097412, + "test_acc": 0.3113, + "lyapunov": null, + "grad_norm": 1.7735238166617053, + "grad_max_sv": 0.9418965801596642, + "grad_min_sv": 3.343987546311489e-08, + "grad_condition": 37679396.49383304, + "lr": 0.0009911436253643444, + "time_sec": 32.5771210193634 + }, + { + "epoch": 10, + "train_loss": 2.3149025343322753, + "train_acc": 0.38952, + "test_loss": 2.5977179332733153, + "test_acc": 0.3498, + "lyapunov": null, + "grad_norm": 1.6539870844732698, + "grad_max_sv": 0.8096891433000565, + "grad_min_sv": 3.0428849770447466e-08, + "grad_condition": 55575107.16143187, + "lr": 0.0009890738003669028, + "time_sec": 32.575756549835205 + }, + { + "epoch": 11, + "train_loss": 2.2090103378295898, + "train_acc": 0.41384, + "test_loss": 2.433280467605591, + "test_acc": 0.3762, + "lyapunov": null, + "grad_norm": 1.577041450877292, + "grad_max_sv": 0.7548397138714791, + "grad_min_sv": 2.9747529839418973e-08, + "grad_condition": 56618819.85903641, + "lr": 0.00098678945143658, + "time_sec": 32.57857155799866 + }, + { + "epoch": 12, + "train_loss": 2.1233900618743897, + "train_acc": 0.43214, + "test_loss": 2.3755472507476805, + "test_acc": 0.386, + "lyapunov": null, + "grad_norm": 1.5044133367483754, + "grad_max_sv": 0.6831597968935966, + "grad_min_sv": 2.8413930716619794e-08, + "grad_condition": 41935056.41931399, + "lr": 0.0009842915805643154, + "time_sec": 32.54568076133728 + }, + { + "epoch": 13, + "train_loss": 2.043979794654846, + "train_acc": 0.44964, + "test_loss": 2.540247434997559, + "test_acc": 0.3648, + "lyapunov": null, + "grad_norm": 1.43967816059591, + "grad_max_sv": 0.6475866869091987, + "grad_min_sv": 2.696438781979449e-08, + "grad_condition": 43955910.519633256, + "lr": 0.000981581283398829, + "time_sec": 32.56134867668152 + }, + { + "epoch": 14, + "train_loss": 1.9673399011611938, + "train_acc": 0.46626, + "test_loss": 2.2459139568328856, + "test_acc": 0.4145, + "lyapunov": null, + "grad_norm": 1.3886751914647821, + "grad_max_sv": 0.6111714348196984, + "grad_min_sv": 2.6264031974254642e-08, + "grad_condition": 36876705.401329875, + "lr": 0.0009786597487660333, + "time_sec": 32.547099351882935 + }, + { + "epoch": 15, + "train_loss": 1.9078269149398803, + "train_acc": 0.48202, + "test_loss": 2.468334749221802, + "test_acc": 0.3845, + "lyapunov": null, + "grad_norm": 1.333110821458258, + "grad_max_sv": 0.5854640513658523, + "grad_min_sv": 2.525855827828494e-08, + "grad_condition": 27365790.268571116, + "lr": 0.0009755282581475766, + "time_sec": 32.56628441810608 + }, + { + "epoch": 16, + "train_loss": 1.8472498971557618, + "train_acc": 0.49456, + "test_loss": 2.555999464797974, + "test_acc": 0.3705, + "lyapunov": null, + "grad_norm": 1.2983395893318297, + "grad_max_sv": 0.5621073499321938, + "grad_min_sv": 2.4648157814777248e-08, + "grad_condition": 27578711.41483445, + "lr": 0.0009721881851187403, + "time_sec": 32.56448459625244 + }, + { + "epoch": 17, + "train_loss": 1.7835501139068604, + "train_acc": 0.51166, + "test_loss": 2.653551648712158, + "test_acc": 0.3654, + "lyapunov": null, + "grad_norm": 1.250317149271239, + "grad_max_sv": 0.5256498865783215, + "grad_min_sv": 2.348344140257197e-08, + "grad_condition": 38306307.793817885, + "lr": 0.0009686409947459456, + "time_sec": 32.56841444969177 + }, + { + "epoch": 18, + "train_loss": 1.7303552620697022, + "train_acc": 0.52022, + "test_loss": 2.3404946056365965, + "test_acc": 0.4104, + "lyapunov": null, + "grad_norm": 1.2085559049781143, + "grad_max_sv": 0.5072395980358124, + "grad_min_sv": 2.2847334307796176e-08, + "grad_condition": 29171562.514913738, + "lr": 0.0009648882429441254, + "time_sec": 32.573736906051636 + }, + { + "epoch": 19, + "train_loss": 1.6674356607818603, + "train_acc": 0.53394, + "test_loss": 2.226296877670288, + "test_acc": 0.4375, + "lyapunov": null, + "grad_norm": 1.185830951207799, + "grad_max_sv": 0.49710184782743455, + "grad_min_sv": 2.2381147740668794e-08, + "grad_condition": 34905981.02477727, + "lr": 0.00096093157579425, + "time_sec": 32.58779191970825 + }, + { + "epoch": 20, + "train_loss": 1.6300001000213622, + "train_acc": 0.54574, + "test_loss": 2.212609383773804, + "test_acc": 0.4351, + "lyapunov": null, + "grad_norm": 1.1542781853931883, + "grad_max_sv": 0.482192575186491, + "grad_min_sv": 2.1483287293566634e-08, + "grad_condition": 31533011.261073686, + "lr": 0.0009567727288213001, + "time_sec": 32.56883144378662 + }, + { + "epoch": 21, + "train_loss": 1.589516068534851, + "train_acc": 0.55464, + "test_loss": 2.2913735172271728, + "test_acc": 0.4287, + "lyapunov": null, + "grad_norm": 1.128778182838579, + "grad_max_sv": 0.4631856270134449, + "grad_min_sv": 2.142580146080597e-08, + "grad_condition": 68091690.30679637, + "lr": 0.0009524135262330095, + "time_sec": 32.607911109924316 + }, + { + "epoch": 22, + "train_loss": 1.5522697276306152, + "train_acc": 0.56402, + "test_loss": 2.289428851890564, + "test_acc": 0.4342, + "lyapunov": null, + "grad_norm": 1.0966310847677752, + "grad_max_sv": 0.4329535707831383, + "grad_min_sv": 2.0387107224628664e-08, + "grad_condition": 31129076.225362398, + "lr": 0.0009478558801197061, + "time_sec": 32.591989040374756 + }, + { + "epoch": 23, + "train_loss": 1.506177180366516, + "train_acc": 0.57534, + "test_loss": 2.096093315887451, + "test_acc": 0.4714, + "lyapunov": null, + "grad_norm": 1.0828727243356455, + "grad_max_sv": 0.4337243750691414, + "grad_min_sv": 2.007666646819395e-08, + "grad_condition": 33110941.610705175, + "lr": 0.000943101789615607, + "time_sec": 32.58827042579651 + }, + { + "epoch": 24, + "train_loss": 1.4734246160507203, + "train_acc": 0.58362, + "test_loss": 2.0975764724731447, + "test_acc": 0.4708, + "lyapunov": null, + "grad_norm": 1.0667027948745171, + "grad_max_sv": 0.4297290474176407, + "grad_min_sv": 1.9938237383332336e-08, + "grad_condition": 41061577.72693956, + "lr": 0.0009381533400219313, + "time_sec": 32.577072858810425 + }, + { + "epoch": 25, + "train_loss": 1.426221365737915, + "train_acc": 0.5929, + "test_loss": 2.439549380493164, + "test_acc": 0.4145, + "lyapunov": null, + "grad_norm": 1.0428597208556587, + "grad_max_sv": 0.42340651378035543, + "grad_min_sv": 1.9947459928282284e-08, + "grad_condition": 27265596.43101754, + "lr": 0.0009330127018922189, + "time_sec": 32.561912059783936 + }, + { + "epoch": 26, + "train_loss": 1.4011604743194581, + "train_acc": 0.60118, + "test_loss": 2.060020211982727, + "test_acc": 0.4858, + "lyapunov": null, + "grad_norm": 1.0269989373175274, + "grad_max_sv": 0.40288332775235175, + "grad_min_sv": 1.900946326183206e-08, + "grad_condition": 47845234.271266595, + "lr": 0.000927682130080253, + "time_sec": 32.59456205368042 + }, + { + "epoch": 27, + "train_loss": 1.3614013753509522, + "train_acc": 0.61062, + "test_loss": 2.1725204816818238, + "test_acc": 0.4667, + "lyapunov": null, + "grad_norm": 1.0054165995388842, + "grad_max_sv": 0.3903233461081982, + "grad_min_sv": 1.854361656519754e-08, + "grad_condition": 51137688.38204093, + "lr": 0.0009221639627510072, + "time_sec": 32.562586307525635 + }, + { + "epoch": 28, + "train_loss": 1.3270175664520263, + "train_acc": 0.61688, + "test_loss": 2.1210414403915405, + "test_acc": 0.478, + "lyapunov": null, + "grad_norm": 0.9906491367639, + "grad_max_sv": 0.4020383097231388, + "grad_min_sv": 1.8380152456282105e-08, + "grad_condition": 60388301.6208367, + "lr": 0.0009164606203550494, + "time_sec": 32.578895807266235 + }, + { + "epoch": 29, + "train_loss": 1.2999025858688356, + "train_acc": 0.62384, + "test_loss": 2.3048962493896483, + "test_acc": 0.4513, + "lyapunov": null, + "grad_norm": 0.975821767543555, + "grad_max_sv": 0.3911690965294838, + "grad_min_sv": 1.8094355357448076e-08, + "grad_condition": 100917843.71111672, + "lr": 0.0009105746045668516, + "time_sec": 32.59432291984558 + }, + { + "epoch": 30, + "train_loss": 1.2684820668792725, + "train_acc": 0.63206, + "test_loss": 2.1987584600448606, + "test_acc": 0.4727, + "lyapunov": null, + "grad_norm": 0.963246322308275, + "grad_max_sv": 0.3789860099554062, + "grad_min_sv": 1.777753648804503e-08, + "grad_condition": 145169036.35257816, + "lr": 0.0009045084971874733, + "time_sec": 32.589643239974976 + }, + { + "epoch": 31, + "train_loss": 1.2416481491851807, + "train_acc": 0.63746, + "test_loss": 2.083261219024658, + "test_acc": 0.4955, + "lyapunov": null, + "grad_norm": 0.9468279342117294, + "grad_max_sv": 0.37791052013635634, + "grad_min_sv": 1.781307417403344e-08, + "grad_condition": 85288818.95068645, + "lr": 0.0008982649590120977, + "time_sec": 32.572959661483765 + }, + { + "epoch": 32, + "train_loss": 1.2152235523986816, + "train_acc": 0.64516, + "test_loss": 2.1265861782073974, + "test_acc": 0.4922, + "lyapunov": null, + "grad_norm": 0.939638022156826, + "grad_max_sv": 0.3743736259639263, + "grad_min_sv": 1.7475726503402013e-08, + "grad_condition": 39937766.35757337, + "lr": 0.0008918467286629196, + "time_sec": 32.5776686668396 + }, + { + "epoch": 33, + "train_loss": 1.1890566221237182, + "train_acc": 0.65154, + "test_loss": 2.1362180561065673, + "test_acc": 0.4933, + "lyapunov": null, + "grad_norm": 0.9223244191335361, + "grad_max_sv": 0.36790077239274976, + "grad_min_sv": 1.7170638504093728e-08, + "grad_condition": 50816815.42980307, + "lr": 0.0008852566213878943, + "time_sec": 32.575252056121826 + }, + { + "epoch": 34, + "train_loss": 1.1525033961486817, + "train_acc": 0.65804, + "test_loss": 2.156662327384949, + "test_acc": 0.4845, + "lyapunov": null, + "grad_norm": 0.9154670377021281, + "grad_max_sv": 0.3625148110091686, + "grad_min_sv": 1.652857618550385e-08, + "grad_condition": 49706014.6712556, + "lr": 0.000878497527825878, + "time_sec": 32.57192873954773 + }, + { + "epoch": 35, + "train_loss": 1.1320337384033203, + "train_acc": 0.66704, + "test_loss": 2.1313774436950683, + "test_acc": 0.4957, + "lyapunov": null, + "grad_norm": 0.9014519580175137, + "grad_max_sv": 0.3490591965615749, + "grad_min_sv": 1.6729596369856326e-08, + "grad_condition": 154412057.84985176, + "lr": 0.000871572412738697, + "time_sec": 32.586177349090576 + }, + { + "epoch": 36, + "train_loss": 1.1130982945632935, + "train_acc": 0.6707, + "test_loss": 2.174855179977417, + "test_acc": 0.4908, + "lyapunov": null, + "grad_norm": 0.8973976114979956, + "grad_max_sv": 0.35180609598755835, + "grad_min_sv": 1.6370007285826384e-08, + "grad_condition": 29099389.365660794, + "lr": 0.0008644843137107055, + "time_sec": 32.571165323257446 + }, + { + "epoch": 37, + "train_loss": 1.084113529548645, + "train_acc": 0.67904, + "test_loss": 2.0568256214141845, + "test_acc": 0.5104, + "lyapunov": null, + "grad_norm": 0.8758712018155839, + "grad_max_sv": 0.3535146668553352, + "grad_min_sv": 1.6385845152608324e-08, + "grad_condition": 92458916.02555758, + "lr": 0.0008572363398164014, + "time_sec": 32.58438062667847 + }, + { + "epoch": 38, + "train_loss": 1.051520336074829, + "train_acc": 0.6886, + "test_loss": 2.4247959348678587, + "test_acc": 0.4582, + "lyapunov": null, + "grad_norm": 0.8714219991625363, + "grad_max_sv": 0.33501161485910413, + "grad_min_sv": 1.58045286191566e-08, + "grad_condition": 26464429.978207294, + "lr": 0.0008498316702566826, + "time_sec": 32.62254238128662 + }, + { + "epoch": 39, + "train_loss": 1.0364685526657105, + "train_acc": 0.69124, + "test_loss": 2.1632789428710937, + "test_acc": 0.4967, + "lyapunov": null, + "grad_norm": 0.8652837401519792, + "grad_max_sv": 0.35404162034392356, + "grad_min_sv": 1.6141110134593185e-08, + "grad_condition": 128261357.3854497, + "lr": 0.0008422735529643442, + "time_sec": 32.600173234939575 + }, + { + "epoch": 40, + "train_loss": 1.0119728073120118, + "train_acc": 0.69654, + "test_loss": 2.117138882064819, + "test_acc": 0.5128, + "lyapunov": null, + "grad_norm": 0.8544168683475741, + "grad_max_sv": 0.3287078306078911, + "grad_min_sv": 1.551416066725153e-08, + "grad_condition": 36426750.154306374, + "lr": 0.0008345653031794289, + "time_sec": 32.560556173324585 + }, + { + "epoch": 41, + "train_loss": 0.9916562337112427, + "train_acc": 0.702, + "test_loss": 2.236895450210571, + "test_acc": 0.4897, + "lyapunov": null, + "grad_norm": 0.8467352944256887, + "grad_max_sv": 0.33691341876983644, + "grad_min_sv": 1.5836235171817757e-08, + "grad_condition": 44640488.00286798, + "lr": 0.0008267103019950526, + "time_sec": 32.5704402923584 + }, + { + "epoch": 42, + "train_loss": 0.9654732009506226, + "train_acc": 0.70762, + "test_loss": 2.1829694009780884, + "test_acc": 0.5012, + "lyapunov": null, + "grad_norm": 0.8362309446374243, + "grad_max_sv": 0.3233294114470482, + "grad_min_sv": 1.5228746941958747e-08, + "grad_condition": 51066866.33295958, + "lr": 0.0008187119948743447, + "time_sec": 32.580946922302246 + }, + { + "epoch": 43, + "train_loss": 0.9421817608642579, + "train_acc": 0.71428, + "test_loss": 2.195651917266846, + "test_acc": 0.5008, + "lyapunov": null, + "grad_norm": 0.826453683553485, + "grad_max_sv": 0.32826076112687586, + "grad_min_sv": 1.528739334566431e-08, + "grad_condition": 48228756.461630754, + "lr": 0.000810573890139155, + "time_sec": 32.58583116531372 + }, + { + "epoch": 44, + "train_loss": 0.9207255261230469, + "train_acc": 0.722, + "test_loss": 2.238926205635071, + "test_acc": 0.4977, + "lyapunov": null, + "grad_norm": 0.8269944395334025, + "grad_max_sv": 0.34641635976731777, + "grad_min_sv": 1.530284474415833e-08, + "grad_condition": 51107054.3673956, + "lr": 0.0008022995574311873, + "time_sec": 32.61741900444031 + }, + { + "epoch": 45, + "train_loss": 0.904716330947876, + "train_acc": 0.7249, + "test_loss": 2.275478556442261, + "test_acc": 0.4991, + "lyapunov": null, + "grad_norm": 0.8189924677653038, + "grad_max_sv": 0.3279395066201687, + "grad_min_sv": 1.51308111286802e-08, + "grad_condition": 78780549.87765977, + "lr": 0.0007938926261462363, + "time_sec": 32.5772967338562 + }, + { + "epoch": 46, + "train_loss": 0.8899834023284912, + "train_acc": 0.72848, + "test_loss": 2.3693980892181394, + "test_acc": 0.4868, + "lyapunov": null, + "grad_norm": 0.8092081146753185, + "grad_max_sv": 0.32307616621255875, + "grad_min_sv": 1.485347370837678e-08, + "grad_condition": 526886784.5179695, + "lr": 0.0007853567838422158, + "time_sec": 32.59701919555664 + }, + { + "epoch": 47, + "train_loss": 0.8707863888549805, + "train_acc": 0.7357, + "test_loss": 2.217044024658203, + "test_acc": 0.5125, + "lyapunov": null, + "grad_norm": 0.7942459076291833, + "grad_max_sv": 0.3131110444664955, + "grad_min_sv": 1.4527805920760972e-08, + "grad_condition": 40320257.63417223, + "lr": 0.0007766957746216719, + "time_sec": 32.601186990737915 + }, + { + "epoch": 48, + "train_loss": 0.843968966217041, + "train_acc": 0.74056, + "test_loss": 2.3307279125213625, + "test_acc": 0.4947, + "lyapunov": null, + "grad_norm": 0.7940745602376812, + "grad_max_sv": 0.32453064769506457, + "grad_min_sv": 1.4832890384008924e-08, + "grad_condition": 85497386.34462628, + "lr": 0.0007679133974894982, + "time_sec": 32.589070081710815 + }, + { + "epoch": 49, + "train_loss": 0.837805420036316, + "train_acc": 0.74426, + "test_loss": 2.2644015617370608, + "test_acc": 0.5075, + "lyapunov": null, + "grad_norm": 0.7804335428675169, + "grad_max_sv": 0.30536644347012043, + "grad_min_sv": 1.4050063589302054e-08, + "grad_condition": 84147442.26342316, + "lr": 0.000759013504686565, + "time_sec": 32.581034660339355 + }, + { + "epoch": 50, + "train_loss": 0.8142583678817749, + "train_acc": 0.752, + "test_loss": 2.269890809249878, + "test_acc": 0.5121, + "lyapunov": null, + "grad_norm": 0.7727513754535821, + "grad_max_sv": 0.31201698929071425, + "grad_min_sv": 1.4192447476664774e-08, + "grad_condition": 529475085.89009637, + "lr": 0.0007499999999999998, + "time_sec": 32.5786030292511 + }, + { + "epoch": 51, + "train_loss": 0.8065035782051087, + "train_acc": 0.75184, + "test_loss": 2.3187968933105467, + "test_acc": 0.5007, + "lyapunov": null, + "grad_norm": 0.7669314147862671, + "grad_max_sv": 0.3042456738650799, + "grad_min_sv": 1.3945495271061592e-08, + "grad_condition": 53477017.00064084, + "lr": 0.0007408768370508575, + "time_sec": 32.59546518325806 + }, + { + "epoch": 52, + "train_loss": 0.7823376733016968, + "train_acc": 0.75794, + "test_loss": 2.3489084259033204, + "test_acc": 0.5023, + "lyapunov": null, + "grad_norm": 0.7660884224056164, + "grad_max_sv": 0.3124966356903315, + "grad_min_sv": 1.4163892245178111e-08, + "grad_condition": 82942735.9050788, + "lr": 0.0007316480175599307, + "time_sec": 32.57622933387756 + }, + { + "epoch": 53, + "train_loss": 0.7739577153205871, + "train_acc": 0.75914, + "test_loss": 2.2757296672821044, + "test_acc": 0.5111, + "lyapunov": null, + "grad_norm": 0.7639316577777043, + "grad_max_sv": 0.30771007128059863, + "grad_min_sv": 1.3752394600712037e-08, + "grad_condition": 138666525.75968605, + "lr": 0.0007223175895924635, + "time_sec": 32.598307847976685 + }, + { + "epoch": 54, + "train_loss": 0.743152338142395, + "train_acc": 0.76718, + "test_loss": 2.3196601219177246, + "test_acc": 0.5129, + "lyapunov": null, + "grad_norm": 0.7528299785896518, + "grad_max_sv": 0.30092642940580844, + "grad_min_sv": 1.3266748091073088e-08, + "grad_condition": 63385725.469119295, + "lr": 0.0007128896457825361, + "time_sec": 32.58740997314453 + }, + { + "epoch": 55, + "train_loss": 0.7354863517570496, + "train_acc": 0.77182, + "test_loss": 2.3526000537872314, + "test_acc": 0.5126, + "lyapunov": null, + "grad_norm": 0.7451404222927475, + "grad_max_sv": 0.2990843068808317, + "grad_min_sv": 1.3328501980835322e-08, + "grad_condition": 285693408.6471442, + "lr": 0.0007033683215378998, + "time_sec": 32.598177671432495 + }, + { + "epoch": 56, + "train_loss": 0.7073092913246155, + "train_acc": 0.7807, + "test_loss": 2.3621452728271484, + "test_acc": 0.5099, + "lyapunov": null, + "grad_norm": 0.7373713712392547, + "grad_max_sv": 0.2979133691638708, + "grad_min_sv": 1.3183412926869725e-08, + "grad_condition": 238359097.8032841, + "lr": 0.0006937577932260512, + "time_sec": 32.583340883255005 + }, + { + "epoch": 57, + "train_loss": 0.6987956598091125, + "train_acc": 0.78072, + "test_loss": 2.3795434368133543, + "test_acc": 0.5118, + "lyapunov": null, + "grad_norm": 0.7319099756388497, + "grad_max_sv": 0.296065080165863, + "grad_min_sv": 1.3287117493418487e-08, + "grad_condition": 66678748.48095138, + "lr": 0.0006840622763423388, + "time_sec": 32.58512043952942 + }, + { + "epoch": 58, + "train_loss": 0.6792643665313721, + "train_acc": 0.78798, + "test_loss": 2.2789505527496337, + "test_acc": 0.5232, + "lyapunov": null, + "grad_norm": 0.7216342954651443, + "grad_max_sv": 0.29178132936358453, + "grad_min_sv": 1.2998765469215966e-08, + "grad_condition": 143960328.82346174, + "lr": 0.0006742860236609073, + "time_sec": 32.59812808036804 + }, + { + "epoch": 59, + "train_loss": 0.6515239137840271, + "train_acc": 0.79768, + "test_loss": 2.420798418426514, + "test_acc": 0.5115, + "lyapunov": null, + "grad_norm": 0.709630733203499, + "grad_max_sv": 0.28213805221021176, + "grad_min_sv": 1.2757892067435939e-08, + "grad_condition": 123971646.4732101, + "lr": 0.0006644333233692913, + "time_sec": 32.58280849456787 + }, + { + "epoch": 60, + "train_loss": 0.6553487308883666, + "train_acc": 0.79488, + "test_loss": 2.3734813625335693, + "test_acc": 0.5197, + "lyapunov": null, + "grad_norm": 0.7171951395685539, + "grad_max_sv": 0.29653852954506876, + "grad_min_sv": 1.3082359766325436e-08, + "grad_condition": 106198804.16444652, + "lr": 0.0006545084971874734, + "time_sec": 32.588764905929565 + }, + { + "epoch": 61, + "train_loss": 0.6462248212051391, + "train_acc": 0.79646, + "test_loss": 2.4995255168914796, + "test_acc": 0.5069, + "lyapunov": null, + "grad_norm": 0.7130456736602092, + "grad_max_sv": 0.2883887976408005, + "grad_min_sv": 1.2833410909310338e-08, + "grad_condition": 64162524.858568884, + "lr": 0.0006445158984722354, + "time_sec": 32.58893823623657 + }, + { + "epoch": 62, + "train_loss": 0.6120539363479615, + "train_acc": 0.80664, + "test_loss": 2.3868945693969725, + "test_acc": 0.5195, + "lyapunov": null, + "grad_norm": 0.6980011712580467, + "grad_max_sv": 0.2836525205522776, + "grad_min_sv": 1.238731829091011e-08, + "grad_condition": 64812932.89195301, + "lr": 0.0006344599103076324, + "time_sec": 32.590434312820435 + }, + { + "epoch": 63, + "train_loss": 0.5959844853591919, + "train_acc": 0.8111, + "test_loss": 2.3468752334594725, + "test_acc": 0.525, + "lyapunov": null, + "grad_norm": 0.6905636194872752, + "grad_max_sv": 0.28761959373950957, + "grad_min_sv": 1.2442233669057723e-08, + "grad_condition": 86059845.92255709, + "lr": 0.0006243449435824269, + "time_sec": 32.59946584701538 + }, + { + "epoch": 64, + "train_loss": 0.5868798995113372, + "train_acc": 0.814, + "test_loss": 2.3779570838928223, + "test_acc": 0.5301, + "lyapunov": null, + "grad_norm": 0.6807645033255275, + "grad_max_sv": 0.2786863997578621, + "grad_min_sv": 1.2551345890746136e-08, + "grad_condition": 61300128.303581215, + "lr": 0.0006141754350553275, + "time_sec": 32.58964800834656 + }, + { + "epoch": 65, + "train_loss": 0.579564445438385, + "train_acc": 0.81814, + "test_loss": 2.3675758209228515, + "test_acc": 0.5276, + "lyapunov": null, + "grad_norm": 0.6762152018324795, + "grad_max_sv": 0.26890397146344186, + "grad_min_sv": 1.2056215335787267e-08, + "grad_condition": 47300154.119489506, + "lr": 0.0006039558454088793, + "time_sec": 32.60079860687256 + }, + { + "epoch": 66, + "train_loss": 0.5755131871032715, + "train_acc": 0.81776, + "test_loss": 2.368547018814087, + "test_acc": 0.5303, + "lyapunov": null, + "grad_norm": 0.6799789031556194, + "grad_max_sv": 0.2802586030215025, + "grad_min_sv": 1.238221065554511e-08, + "grad_condition": 356778807.6018594, + "lr": 0.000593690657292862, + "time_sec": 32.591476917266846 + }, + { + "epoch": 67, + "train_loss": 0.5571317762947082, + "train_acc": 0.8247, + "test_loss": 2.4634271934509275, + "test_acc": 0.5205, + "lyapunov": null, + "grad_norm": 0.6677678505131144, + "grad_max_sv": 0.27768109291791915, + "grad_min_sv": 1.2071005670282603e-08, + "grad_condition": 480662632.86813325, + "lr": 0.0005833843733580507, + "time_sec": 32.58660840988159 + }, + { + "epoch": 68, + "train_loss": 0.5370455453109741, + "train_acc": 0.8293, + "test_loss": 2.459835057449341, + "test_acc": 0.5237, + "lyapunov": null, + "grad_norm": 0.6604613288412575, + "grad_max_sv": 0.2757783461362123, + "grad_min_sv": 1.1747383642929376e-08, + "grad_condition": 108487664.68233645, + "lr": 0.0005730415142812054, + "time_sec": 32.60331964492798 + }, + { + "epoch": 69, + "train_loss": 0.5335728300857544, + "train_acc": 0.82814, + "test_loss": 2.4432239379882814, + "test_acc": 0.5263, + "lyapunov": null, + "grad_norm": 0.6551820571178028, + "grad_max_sv": 0.2737420566380024, + "grad_min_sv": 1.1939705933487754e-08, + "grad_condition": 196906328.1819435, + "lr": 0.0005626666167821517, + "time_sec": 32.599244356155396 + }, + { + "epoch": 70, + "train_loss": 0.5145312023544312, + "train_acc": 0.83578, + "test_loss": 2.4909321453094484, + "test_acc": 0.526, + "lyapunov": null, + "grad_norm": 0.6472480309847657, + "grad_max_sv": 0.27335426174104216, + "grad_min_sv": 1.1793601722293045e-08, + "grad_condition": 68789489.73226814, + "lr": 0.0005522642316338265, + "time_sec": 32.63460826873779 + }, + { + "epoch": 71, + "train_loss": 0.5043477191543579, + "train_acc": 0.83958, + "test_loss": 2.553674084854126, + "test_acc": 0.5226, + "lyapunov": null, + "grad_norm": 0.6420259011516274, + "grad_max_sv": 0.2746612638235092, + "grad_min_sv": 1.1955708306352065e-08, + "grad_condition": 100316513.67004016, + "lr": 0.0005418389216661573, + "time_sec": 32.58567404747009 + }, + { + "epoch": 72, + "train_loss": 0.49948640129089356, + "train_acc": 0.84136, + "test_loss": 2.539296279144287, + "test_acc": 0.5233, + "lyapunov": null, + "grad_norm": 0.6383489418019058, + "grad_max_sv": 0.26922862641513345, + "grad_min_sv": 1.1503295074908466e-08, + "grad_condition": 354877772.1306223, + "lr": 0.0005313952597646563, + "time_sec": 32.625067949295044 + }, + { + "epoch": 73, + "train_loss": 0.47933840072631834, + "train_acc": 0.84752, + "test_loss": 2.595202964782715, + "test_acc": 0.5203, + "lyapunov": null, + "grad_norm": 0.6293105937361914, + "grad_max_sv": 0.26696190387010577, + "grad_min_sv": 1.1379859076203134e-08, + "grad_condition": 769443742.0120881, + "lr": 0.0005209378268645994, + "time_sec": 32.59942388534546 + }, + { + "epoch": 74, + "train_loss": 0.4770963186454773, + "train_acc": 0.8476, + "test_loss": 2.5404656970977784, + "test_acc": 0.5272, + "lyapunov": null, + "grad_norm": 0.6301014080106567, + "grad_max_sv": 0.2688163876533508, + "grad_min_sv": 1.135137725717314e-08, + "grad_condition": 215980241.0253767, + "lr": 0.0005104712099416781, + "time_sec": 32.577284812927246 + }, + { + "epoch": 75, + "train_loss": 0.4582629628944397, + "train_acc": 0.8522, + "test_loss": 2.6312942310333254, + "test_acc": 0.5218, + "lyapunov": null, + "grad_norm": 0.6260768127745926, + "grad_max_sv": 0.2644084498286247, + "grad_min_sv": 1.1460068141547555e-08, + "grad_condition": 441089953.66541755, + "lr": 0.0004999999999999996, + "time_sec": 32.60153841972351 + }, + { + "epoch": 76, + "train_loss": 0.45087591842651364, + "train_acc": 0.85542, + "test_loss": 2.606955569458008, + "test_acc": 0.5288, + "lyapunov": null, + "grad_norm": 0.6203644998630469, + "grad_max_sv": 0.25496261939406395, + "grad_min_sv": 1.1111845732349885e-08, + "grad_condition": 287467347.4027728, + "lr": 0.0004895287900583212, + "time_sec": 32.59224033355713 + }, + { + "epoch": 77, + "train_loss": 0.43747104292869565, + "train_acc": 0.85884, + "test_loss": 2.619938083267212, + "test_acc": 0.5268, + "lyapunov": null, + "grad_norm": 0.6157815434735789, + "grad_max_sv": 0.2686824891716242, + "grad_min_sv": 1.1295069601846564e-08, + "grad_condition": 54772967.39514383, + "lr": 0.0004790621731353997, + "time_sec": 32.588496685028076 + }, + { + "epoch": 78, + "train_loss": 0.42626130981445315, + "train_acc": 0.8639, + "test_loss": 2.7211667629241942, + "test_acc": 0.5166, + "lyapunov": null, + "grad_norm": 0.6100571736377234, + "grad_max_sv": 0.2599440861493349, + "grad_min_sv": 1.0853403832307776e-08, + "grad_condition": 774281553.8716226, + "lr": 0.000468604740235343, + "time_sec": 32.59684610366821 + }, + { + "epoch": 79, + "train_loss": 0.42017824411392213, + "train_acc": 0.86548, + "test_loss": 2.654300415802002, + "test_acc": 0.5221, + "lyapunov": null, + "grad_norm": 0.6001051149057299, + "grad_max_sv": 0.24722935520112516, + "grad_min_sv": 1.0637084493000242e-08, + "grad_condition": 458650799.53520596, + "lr": 0.00045816107833384175, + "time_sec": 32.60820508003235 + }, + { + "epoch": 80, + "train_loss": 0.4099808219718933, + "train_acc": 0.86866, + "test_loss": 2.584393338012695, + "test_acc": 0.5329, + "lyapunov": null, + "grad_norm": 0.5982008707692702, + "grad_max_sv": 0.25515949316322806, + "grad_min_sv": 1.0970911762039904e-08, + "grad_condition": 81697562.26452604, + "lr": 0.0004477357683661729, + "time_sec": 32.600223541259766 + }, + { + "epoch": 81, + "train_loss": 0.40091643369674684, + "train_acc": 0.87054, + "test_loss": 2.5790781299591066, + "test_acc": 0.5299, + "lyapunov": null, + "grad_norm": 0.5921623366892947, + "grad_max_sv": 0.2506237640976906, + "grad_min_sv": 1.07448340562759e-08, + "grad_condition": 1595967011.5033295, + "lr": 0.00043733338321784746, + "time_sec": 32.58992123603821 + }, + { + "epoch": 82, + "train_loss": 0.3906331276321411, + "train_acc": 0.87322, + "test_loss": 2.7007477321624758, + "test_acc": 0.5241, + "lyapunov": null, + "grad_norm": 0.5856158821091417, + "grad_max_sv": 0.2561802566051483, + "grad_min_sv": 1.0621720123753427e-08, + "grad_condition": 3931509005.8314238, + "lr": 0.0004269584857187939, + "time_sec": 32.60382795333862 + }, + { + "epoch": 83, + "train_loss": 0.3784799990653992, + "train_acc": 0.87816, + "test_loss": 2.7430577102661133, + "test_acc": 0.5207, + "lyapunov": null, + "grad_norm": 0.5840749227648773, + "grad_max_sv": 0.2521792113780975, + "grad_min_sv": 1.029234232418231e-08, + "grad_condition": 657974148.7642715, + "lr": 0.0004166156266419484, + "time_sec": 32.62590169906616 + }, + { + "epoch": 84, + "train_loss": 0.36473722780227663, + "train_acc": 0.88094, + "test_loss": 2.780077816390991, + "test_acc": 0.5253, + "lyapunov": null, + "grad_norm": 0.5771142116801258, + "grad_max_sv": 0.2527416229248047, + "grad_min_sv": 1.0504097070797302e-08, + "grad_condition": 275469675.99291694, + "lr": 0.0004063093427071373, + "time_sec": 32.60086488723755 + }, + { + "epoch": 85, + "train_loss": 0.3594164635372162, + "train_acc": 0.8828, + "test_loss": 2.728798849487305, + "test_acc": 0.53, + "lyapunov": null, + "grad_norm": 0.5699653767219048, + "grad_max_sv": 0.24389564469456673, + "grad_min_sv": 1.0148122779260471e-08, + "grad_condition": 81276062.17564048, + "lr": 0.0003960441545911199, + "time_sec": 32.61606812477112 + }, + { + "epoch": 86, + "train_loss": 0.35691798246383666, + "train_acc": 0.88444, + "test_loss": 2.667480911254883, + "test_acc": 0.5372, + "lyapunov": null, + "grad_norm": 0.5686015085963011, + "grad_max_sv": 0.24499542228877544, + "grad_min_sv": 1.018558375277638e-08, + "grad_condition": 533473379.8045244, + "lr": 0.0003858245649446718, + "time_sec": 32.58942675590515 + }, + { + "epoch": 87, + "train_loss": 0.3461787840080261, + "train_acc": 0.88862, + "test_loss": 2.7013081783294677, + "test_acc": 0.5331, + "lyapunov": null, + "grad_norm": 0.5662786550881038, + "grad_max_sv": 0.25225193947553637, + "grad_min_sv": 1.0258767205173492e-08, + "grad_condition": 57498974.23126312, + "lr": 0.00037565505641757235, + "time_sec": 32.62986612319946 + }, + { + "epoch": 88, + "train_loss": 0.3378766645145416, + "train_acc": 0.891, + "test_loss": 2.6787281810760497, + "test_acc": 0.5332, + "lyapunov": null, + "grad_norm": 0.5559997977216727, + "grad_max_sv": 0.24743575379252433, + "grad_min_sv": 1.0120435695037954e-08, + "grad_condition": 63021079.96171679, + "lr": 0.00036554008969236695, + "time_sec": 32.606411933898926 + }, + { + "epoch": 89, + "train_loss": 0.3277571000003815, + "train_acc": 0.8939, + "test_loss": 2.8289716995239256, + "test_acc": 0.5233, + "lyapunov": null, + "grad_norm": 0.5536940020063074, + "grad_max_sv": 0.24743517786264418, + "grad_min_sv": 9.960347746671566e-09, + "grad_condition": 378961859.9507846, + "lr": 0.0003554841015277638, + "time_sec": 32.61576008796692 + }, + { + "epoch": 90, + "train_loss": 0.31579964986801146, + "train_acc": 0.897, + "test_loss": 2.811709595108032, + "test_acc": 0.5249, + "lyapunov": null, + "grad_norm": 0.543683168726444, + "grad_max_sv": 0.24388404116034507, + "grad_min_sv": 9.773315148321748e-09, + "grad_condition": 122611563.57289734, + "lr": 0.000345491502812526, + "time_sec": 32.60401773452759 + }, + { + "epoch": 91, + "train_loss": 0.31306590376853943, + "train_acc": 0.89988, + "test_loss": 2.8455798820495604, + "test_acc": 0.5245, + "lyapunov": null, + "grad_norm": 0.5417887903872176, + "grad_max_sv": 0.24360701441764832, + "grad_min_sv": 9.947092209638963e-09, + "grad_condition": 83220580.4179602, + "lr": 0.0003355666766307081, + "time_sec": 32.57031607627869 + }, + { + "epoch": 92, + "train_loss": 0.30877333124160766, + "train_acc": 0.90048, + "test_loss": 2.828940309906006, + "test_acc": 0.525, + "lyapunov": null, + "grad_norm": 0.5415049670354658, + "grad_max_sv": 0.24773363061249257, + "grad_min_sv": 9.660245593604358e-09, + "grad_condition": 384286531.30052173, + "lr": 0.00032571397633909225, + "time_sec": 32.60402154922485 + }, + { + "epoch": 93, + "train_loss": 0.30664673944473264, + "train_acc": 0.90068, + "test_loss": 2.8073126644134523, + "test_acc": 0.5318, + "lyapunov": null, + "grad_norm": 0.5429616923879481, + "grad_max_sv": 0.2421899013221264, + "grad_min_sv": 9.822492379792797e-09, + "grad_condition": 831379739.8417737, + "lr": 0.00031593772365766094, + "time_sec": 32.604076623916626 + }, + { + "epoch": 94, + "train_loss": 0.2941160817909241, + "train_acc": 0.9056, + "test_loss": 2.787534133911133, + "test_acc": 0.5376, + "lyapunov": null, + "grad_norm": 0.5279598892402736, + "grad_max_sv": 0.2383882984519005, + "grad_min_sv": 9.415061244001654e-09, + "grad_condition": 160263524.9470215, + "lr": 0.0003062422067739483, + "time_sec": 32.60323166847229 + }, + { + "epoch": 95, + "train_loss": 0.28154629373550416, + "train_acc": 0.90866, + "test_loss": 2.893843098831177, + "test_acc": 0.5233, + "lyapunov": null, + "grad_norm": 0.5211541759637133, + "grad_max_sv": 0.23834086805582047, + "grad_min_sv": 9.38503141147476e-09, + "grad_condition": 587375608.3111145, + "lr": 0.00029663167846209965, + "time_sec": 32.61985802650452 + }, + { + "epoch": 96, + "train_loss": 0.2798216311311722, + "train_acc": 0.90954, + "test_loss": 2.857046318817139, + "test_acc": 0.5271, + "lyapunov": null, + "grad_norm": 0.5141615815369457, + "grad_max_sv": 0.22582133412361144, + "grad_min_sv": 9.48394347243843e-09, + "grad_condition": 354823428.4324465, + "lr": 0.00028711035421746345, + "time_sec": 32.58983588218689 + }, + { + "epoch": 97, + "train_loss": 0.2703013199234009, + "train_acc": 0.91322, + "test_loss": 2.82070970993042, + "test_acc": 0.5312, + "lyapunov": null, + "grad_norm": 0.5069094286336273, + "grad_max_sv": 0.23691595830023288, + "grad_min_sv": 9.323161761533304e-09, + "grad_condition": 145454324.17040363, + "lr": 0.00027768241040753615, + "time_sec": 32.62266421318054 + }, + { + "epoch": 98, + "train_loss": 0.26267928913116456, + "train_acc": 0.91478, + "test_loss": 2.831645970153809, + "test_acc": 0.5278, + "lyapunov": null, + "grad_norm": 0.5043739635219361, + "grad_max_sv": 0.2209805216640234, + "grad_min_sv": 8.822150978791878e-09, + "grad_condition": 1815220943.9156146, + "lr": 0.00026835198244006903, + "time_sec": 32.700286865234375 + }, + { + "epoch": 99, + "train_loss": 0.26799847937583926, + "train_acc": 0.91178, + "test_loss": 2.846790531921387, + "test_acc": 0.5325, + "lyapunov": null, + "grad_norm": 0.5097425849436117, + "grad_max_sv": 0.2252878088504076, + "grad_min_sv": 9.071544386052114e-09, + "grad_condition": 935108016.3819262, + "lr": 0.0002591231629491421, + "time_sec": 32.652007818222046 + }, + { + "epoch": 100, + "train_loss": 0.25687388509750364, + "train_acc": 0.91572, + "test_loss": 2.844114168548584, + "test_acc": 0.5301, + "lyapunov": null, + "grad_norm": 0.5030132191434431, + "grad_max_sv": 0.23471550829708576, + "grad_min_sv": 9.359147224233256e-09, + "grad_condition": 1089949405.9437118, + "lr": 0.0002499999999999997, + "time_sec": 32.63126802444458 + }, + { + "epoch": 101, + "train_loss": 0.2520920184612274, + "train_acc": 0.91798, + "test_loss": 2.8608716987609863, + "test_acc": 0.5348, + "lyapunov": null, + "grad_norm": 0.4963346315979647, + "grad_max_sv": 0.23927163816988467, + "grad_min_sv": 9.324820984531016e-09, + "grad_condition": 894019527.4128025, + "lr": 0.00024098649531343477, + "time_sec": 32.602155923843384 + }, + { + "epoch": 102, + "train_loss": 0.24177431715488434, + "train_acc": 0.92186, + "test_loss": 2.85232082862854, + "test_acc": 0.5306, + "lyapunov": null, + "grad_norm": 0.4891645436848551, + "grad_max_sv": 0.23208856917917728, + "grad_min_sv": 9.070336430615049e-09, + "grad_condition": 413341508.33558476, + "lr": 0.0002320866025105016, + "time_sec": 32.62471413612366 + }, + { + "epoch": 103, + "train_loss": 0.23854983226776122, + "train_acc": 0.9226, + "test_loss": 2.7920223457336424, + "test_acc": 0.5382, + "lyapunov": null, + "grad_norm": 0.48644276366286593, + "grad_max_sv": 0.22603111676871776, + "grad_min_sv": 8.893254901942704e-09, + "grad_condition": 414227262.00470644, + "lr": 0.0002233042253783278, + "time_sec": 32.613913774490356 + }, + { + "epoch": 104, + "train_loss": 0.23433040732383728, + "train_acc": 0.92414, + "test_loss": 2.901957023239136, + "test_acc": 0.5291, + "lyapunov": null, + "grad_norm": 0.48806246595990077, + "grad_max_sv": 0.23023997843265534, + "grad_min_sv": 8.815287426454724e-09, + "grad_condition": 346964056.15115684, + "lr": 0.000214643216157784, + "time_sec": 32.60389828681946 + }, + { + "epoch": 105, + "train_loss": 0.22986493856430054, + "train_acc": 0.92466, + "test_loss": 2.877705308151245, + "test_acc": 0.5327, + "lyapunov": null, + "grad_norm": 0.48085142050632557, + "grad_max_sv": 0.2137234926223755, + "grad_min_sv": 8.60617813108061e-09, + "grad_condition": 239445377.3352519, + "lr": 0.00020610737385376332, + "time_sec": 32.59467577934265 + }, + { + "epoch": 106, + "train_loss": 0.22199077575683593, + "train_acc": 0.9278, + "test_loss": 2.9010587142944337, + "test_acc": 0.5324, + "lyapunov": null, + "grad_norm": 0.4714371705778469, + "grad_max_sv": 0.21498987674713135, + "grad_min_sv": 8.473469289768664e-09, + "grad_condition": 350116894.28952634, + "lr": 0.00019770044256881242, + "time_sec": 32.608004570007324 + }, + { + "epoch": 107, + "train_loss": 0.2181517135620117, + "train_acc": 0.92994, + "test_loss": 2.878814113616943, + "test_acc": 0.534, + "lyapunov": null, + "grad_norm": 0.46943044216954516, + "grad_max_sv": 0.22595015838742255, + "grad_min_sv": 8.52424024444542e-09, + "grad_condition": 2514218217.9067893, + "lr": 0.0001894261098608447, + "time_sec": 32.63431739807129 + }, + { + "epoch": 108, + "train_loss": 0.21434411600112915, + "train_acc": 0.93118, + "test_loss": 2.866080297088623, + "test_acc": 0.5373, + "lyapunov": null, + "grad_norm": 0.46576217269588654, + "grad_max_sv": 0.22655029892921447, + "grad_min_sv": 8.725328624979017e-09, + "grad_condition": 801868312.6810858, + "lr": 0.000181288005125655, + "time_sec": 32.72058939933777 + }, + { + "epoch": 109, + "train_loss": 0.21005438403129578, + "train_acc": 0.93288, + "test_loss": 2.965788179779053, + "test_acc": 0.5307, + "lyapunov": null, + "grad_norm": 0.4614119226295971, + "grad_max_sv": 0.21423224844038485, + "grad_min_sv": 8.608944879022473e-09, + "grad_condition": 134715840.19015014, + "lr": 0.0001732896980049473, + "time_sec": 32.673903703689575 + }, + { + "epoch": 110, + "train_loss": 0.20861490973472596, + "train_acc": 0.93278, + "test_loss": 2.9108359115600586, + "test_acc": 0.5392, + "lyapunov": null, + "grad_norm": 0.4597024280145315, + "grad_max_sv": 0.22719990834593773, + "grad_min_sv": 8.59908984851554e-09, + "grad_condition": 192075671.7922108, + "lr": 0.00016543469682057076, + "time_sec": 32.63886094093323 + }, + { + "epoch": 111, + "train_loss": 0.2031750131702423, + "train_acc": 0.93542, + "test_loss": 2.8907776355743406, + "test_acc": 0.5398, + "lyapunov": null, + "grad_norm": 0.45125686654286246, + "grad_max_sv": 0.22084927894175052, + "grad_min_sv": 8.343052723680523e-09, + "grad_condition": 71193395.67698285, + "lr": 0.00015772644703565552, + "time_sec": 32.66804528236389 + }, + { + "epoch": 112, + "train_loss": 0.19805964677333832, + "train_acc": 0.93602, + "test_loss": 2.9214791831970213, + "test_acc": 0.535, + "lyapunov": null, + "grad_norm": 0.45121533997052793, + "grad_max_sv": 0.21654316522181033, + "grad_min_sv": 8.534410304156247e-09, + "grad_condition": 123620364.78518677, + "lr": 0.00015016832974331713, + "time_sec": 32.630356788635254 + }, + { + "epoch": 113, + "train_loss": 0.19659865329265594, + "train_acc": 0.93762, + "test_loss": 2.9189121520996095, + "test_acc": 0.5351, + "lyapunov": null, + "grad_norm": 0.4470395785797104, + "grad_max_sv": 0.2213457129895687, + "grad_min_sv": 8.339549602883605e-09, + "grad_condition": 274275470.40875286, + "lr": 0.00014276366018359834, + "time_sec": 32.62499737739563 + }, + { + "epoch": 114, + "train_loss": 0.18809852215766906, + "train_acc": 0.94016, + "test_loss": 2.985582607650757, + "test_acc": 0.5391, + "lyapunov": null, + "grad_norm": 0.43730893802732856, + "grad_max_sv": 0.21652991212904454, + "grad_min_sv": 8.204354757737229e-09, + "grad_condition": 2228692765.7982726, + "lr": 0.00013551568628929425, + "time_sec": 32.614506244659424 + }, + { + "epoch": 115, + "train_loss": 0.18862985968112947, + "train_acc": 0.93876, + "test_loss": 2.9296891693115232, + "test_acc": 0.5368, + "lyapunov": null, + "grad_norm": 0.43770037867272366, + "grad_max_sv": 0.21719331182539464, + "grad_min_sv": 8.40034150819866e-09, + "grad_condition": 1611148910.6771781, + "lr": 0.00012842758726130276, + "time_sec": 32.590333461761475 + }, + { + "epoch": 116, + "train_loss": 0.18695058307647705, + "train_acc": 0.94064, + "test_loss": 2.939223755645752, + "test_acc": 0.5384, + "lyapunov": null, + "grad_norm": 0.43433429186466, + "grad_max_sv": 0.21495764441788195, + "grad_min_sv": 8.100361084303062e-09, + "grad_condition": 5854028568.391862, + "lr": 0.0001215024721741218, + "time_sec": 32.61627745628357 + }, + { + "epoch": 117, + "train_loss": 0.18401632172584534, + "train_acc": 0.9416, + "test_loss": 2.9178254318237307, + "test_acc": 0.5382, + "lyapunov": null, + "grad_norm": 0.43458268972910447, + "grad_max_sv": 0.20661589913070202, + "grad_min_sv": 8.147711854419176e-09, + "grad_condition": 262010143.0723486, + "lr": 0.00011474337861210538, + "time_sec": 32.634137868881226 + }, + { + "epoch": 118, + "train_loss": 0.18033663163661956, + "train_acc": 0.9427, + "test_loss": 2.925826823425293, + "test_acc": 0.539, + "lyapunov": null, + "grad_norm": 0.42900090579769123, + "grad_max_sv": 0.20246973335742952, + "grad_min_sv": 7.991756401180133e-09, + "grad_condition": 630593044.3332715, + "lr": 0.00010815327133708009, + "time_sec": 32.62991404533386 + }, + { + "epoch": 119, + "train_loss": 0.1756329579257965, + "train_acc": 0.94382, + "test_loss": 2.9575962375640867, + "test_acc": 0.5364, + "lyapunov": null, + "grad_norm": 0.4245989192148294, + "grad_max_sv": 0.2097363706678152, + "grad_min_sv": 7.790207755134851e-09, + "grad_condition": 541328819.7909198, + "lr": 0.00010173504098790182, + "time_sec": 32.61990714073181 + }, + { + "epoch": 120, + "train_loss": 0.17752074500083923, + "train_acc": 0.943, + "test_loss": 2.984402207183838, + "test_acc": 0.5371, + "lyapunov": null, + "grad_norm": 0.42907850411654186, + "grad_max_sv": 0.2176469974219799, + "grad_min_sv": 8.196141195761492e-09, + "grad_condition": 1455305736.9709456, + "lr": 9.549150281252629e-05, + "time_sec": 32.62009358406067 + }, + { + "epoch": 121, + "train_loss": 0.1725271897983551, + "train_acc": 0.9447, + "test_loss": 2.9743667400360105, + "test_acc": 0.536, + "lyapunov": null, + "grad_norm": 0.422262051092585, + "grad_max_sv": 0.2079501125961542, + "grad_min_sv": 8.144436731624682e-09, + "grad_condition": 111029107.13270342, + "lr": 8.942539543314794e-05, + "time_sec": 32.66842198371887 + }, + { + "epoch": 122, + "train_loss": 0.16868778264045714, + "train_acc": 0.94718, + "test_loss": 2.9566415885925292, + "test_acc": 0.5371, + "lyapunov": null, + "grad_norm": 0.4165223870702016, + "grad_max_sv": 0.21388004645705222, + "grad_min_sv": 7.734497603701426e-09, + "grad_condition": 1329317698.2948136, + "lr": 8.353937964495024e-05, + "time_sec": 32.607342004776 + }, + { + "epoch": 123, + "train_loss": 0.1640772273159027, + "train_acc": 0.94856, + "test_loss": 3.0534807071685792, + "test_acc": 0.5337, + "lyapunov": null, + "grad_norm": 0.4100147528165505, + "grad_max_sv": 0.1933290047571063, + "grad_min_sv": 7.296350446246193e-09, + "grad_condition": 1444451901.4148755, + "lr": 7.783603724899243e-05, + "time_sec": 32.607924461364746 + }, + { + "epoch": 124, + "train_loss": 0.16604973594665529, + "train_acc": 0.94688, + "test_loss": 2.993713487243652, + "test_acc": 0.54, + "lyapunov": null, + "grad_norm": 0.41823426199952496, + "grad_max_sv": 0.207075222954154, + "grad_min_sv": 7.85820164139403e-09, + "grad_condition": 872896834.085886, + "lr": 7.231786991974666e-05, + "time_sec": 32.627970695495605 + }, + { + "epoch": 125, + "train_loss": 0.16303624733448027, + "train_acc": 0.94812, + "test_loss": 2.9622394554138185, + "test_acc": 0.5379, + "lyapunov": null, + "grad_norm": 0.41485915412359053, + "grad_max_sv": 0.21287606805562972, + "grad_min_sv": 8.07270578787045e-09, + "grad_condition": 94878921.53501868, + "lr": 6.698729810778072e-05, + "time_sec": 32.615166664123535 + }, + { + "epoch": 126, + "train_loss": 0.15940380114555358, + "train_acc": 0.94878, + "test_loss": 3.0216664451599122, + "test_acc": 0.5337, + "lyapunov": null, + "grad_norm": 0.40940184983431466, + "grad_max_sv": 0.2009254779666662, + "grad_min_sv": 7.574520318137742e-09, + "grad_condition": 1245573678.537202, + "lr": 6.184665997806817e-05, + "time_sec": 32.612011194229126 + }, + { + "epoch": 127, + "train_loss": 0.1607292701244354, + "train_acc": 0.94828, + "test_loss": 2.9907255443573, + "test_acc": 0.5383, + "lyapunov": null, + "grad_norm": 0.41311295177571106, + "grad_max_sv": 0.2103022612631321, + "grad_min_sv": 7.934495516734655e-09, + "grad_condition": 1981045820.0113425, + "lr": 5.6898210384392595e-05, + "time_sec": 32.62311267852783 + }, + { + "epoch": 128, + "train_loss": 0.15786261336803437, + "train_acc": 0.94878, + "test_loss": 2.959605949783325, + "test_acc": 0.541, + "lyapunov": null, + "grad_norm": 0.4074882653467691, + "grad_max_sv": 0.20439293198287486, + "grad_min_sv": 7.960480044827237e-09, + "grad_condition": 1396938529.2383535, + "lr": 5.214411988029363e-05, + "time_sec": 32.609647274017334 + }, + { + "epoch": 129, + "train_loss": 0.1574666795539856, + "train_acc": 0.94934, + "test_loss": 3.0880021881103517, + "test_acc": 0.5308, + "lyapunov": null, + "grad_norm": 0.4064826656284929, + "grad_max_sv": 0.20818514116108416, + "grad_min_sv": 7.770407870052663e-09, + "grad_condition": 375538570.58313566, + "lr": 4.7586473766990294e-05, + "time_sec": 32.61731743812561 + }, + { + "epoch": 130, + "train_loss": 0.152870930018425, + "train_acc": 0.95204, + "test_loss": 2.9848262096405027, + "test_acc": 0.5413, + "lyapunov": null, + "grad_norm": 0.3986563904029011, + "grad_max_sv": 0.20530760996043682, + "grad_min_sv": 7.818889642327836e-09, + "grad_condition": 2154043424.783707, + "lr": 4.32272711786996e-05, + "time_sec": 32.61918234825134 + }, + { + "epoch": 131, + "train_loss": 0.15438154235363005, + "train_acc": 0.95114, + "test_loss": 2.9789710178375244, + "test_acc": 0.5426, + "lyapunov": null, + "grad_norm": 0.4024417070574959, + "grad_max_sv": 0.2022467188537121, + "grad_min_sv": 7.597278266105283e-09, + "grad_condition": 1950086327.38053, + "lr": 3.906842420574966e-05, + "time_sec": 32.62202835083008 + }, + { + "epoch": 132, + "train_loss": 0.14874254384994506, + "train_acc": 0.95352, + "test_loss": 3.0375037422180178, + "test_acc": 0.5392, + "lyapunov": null, + "grad_norm": 0.3968136288986809, + "grad_max_sv": 0.19865386020392178, + "grad_min_sv": 7.604900639605893e-09, + "grad_condition": 140807357.42866144, + "lr": 3.5111757055874305e-05, + "time_sec": 32.67011499404907 + }, + { + "epoch": 133, + "train_loss": 0.15038901710510255, + "train_acc": 0.95308, + "test_loss": 3.0484798206329344, + "test_acc": 0.5354, + "lyapunov": null, + "grad_norm": 0.3985676191358705, + "grad_max_sv": 0.20562310479581355, + "grad_min_sv": 7.646398656867975e-09, + "grad_condition": 319304882.8675577, + "lr": 3.1359005254054254e-05, + "time_sec": 32.78828406333923 + }, + { + "epoch": 134, + "train_loss": 0.15090011917114257, + "train_acc": 0.95174, + "test_loss": 3.0233553348541258, + "test_acc": 0.5357, + "lyapunov": null, + "grad_norm": 0.4020500198756977, + "grad_max_sv": 0.2069926530122757, + "grad_min_sv": 7.71680147117551e-09, + "grad_condition": 341575666.7348074, + "lr": 2.7811814881259484e-05, + "time_sec": 32.81893181800842 + }, + { + "epoch": 135, + "train_loss": 0.14922723328590393, + "train_acc": 0.9526, + "test_loss": 2.9659065586090088, + "test_acc": 0.5445, + "lyapunov": null, + "grad_norm": 0.3978329464364341, + "grad_max_sv": 0.20179392956197262, + "grad_min_sv": 7.6255731287821e-09, + "grad_condition": 604174754.4278083, + "lr": 2.4471741852423218e-05, + "time_sec": 32.72992444038391 + }, + { + "epoch": 136, + "train_loss": 0.14605165558099747, + "train_acc": 0.95318, + "test_loss": 3.032598412322998, + "test_acc": 0.5366, + "lyapunov": null, + "grad_norm": 0.39366184589938236, + "grad_max_sv": 0.20618147775530815, + "grad_min_sv": 7.671137043554348e-09, + "grad_condition": 752388403.3630235, + "lr": 2.1340251233966362e-05, + "time_sec": 32.72515845298767 + }, + { + "epoch": 137, + "train_loss": 0.1457787049126625, + "train_acc": 0.95488, + "test_loss": 2.982140077209473, + "test_acc": 0.5406, + "lyapunov": null, + "grad_norm": 0.392743050498304, + "grad_max_sv": 0.1938252303749323, + "grad_min_sv": 7.403916825921182e-09, + "grad_condition": 1607378766.3872442, + "lr": 1.8418716601170932e-05, + "time_sec": 32.67524719238281 + }, + { + "epoch": 138, + "train_loss": 0.14674076547145842, + "train_acc": 0.95378, + "test_loss": 2.9361204231262206, + "test_acc": 0.5457, + "lyapunov": null, + "grad_norm": 0.3943262767319053, + "grad_max_sv": 0.20511250533163547, + "grad_min_sv": 7.68757224003068e-09, + "grad_condition": 733229682.6270201, + "lr": 1.570841943568445e-05, + "time_sec": 32.61559200286865 + }, + { + "epoch": 139, + "train_loss": 0.1475331647014618, + "train_acc": 0.95308, + "test_loss": 2.9983725143432616, + "test_acc": 0.5419, + "lyapunov": null, + "grad_norm": 0.3977778989458554, + "grad_max_sv": 0.20930965878069402, + "grad_min_sv": 7.65672412022828e-09, + "grad_condition": 5701863242.822145, + "lr": 1.3210548563419845e-05, + "time_sec": 32.61395025253296 + }, + { + "epoch": 140, + "train_loss": 0.14115534113407135, + "train_acc": 0.95556, + "test_loss": 2.991393402481079, + "test_acc": 0.5383, + "lyapunov": null, + "grad_norm": 0.3856384013171982, + "grad_max_sv": 0.21204831618815662, + "grad_min_sv": 7.897306178970832e-09, + "grad_condition": 127085133.9642816, + "lr": 1.0926199633097203e-05, + "time_sec": 32.646509408950806 + }, + { + "epoch": 141, + "train_loss": 0.14105249459266664, + "train_acc": 0.95562, + "test_loss": 2.9878240463256835, + "test_acc": 0.5392, + "lyapunov": null, + "grad_norm": 0.3871284997514462, + "grad_max_sv": 0.19716619774699212, + "grad_min_sv": 7.4092277403084874e-09, + "grad_condition": 1741040756.3705597, + "lr": 8.856374635655688e-06, + "time_sec": 32.647289991378784 + }, + { + "epoch": 142, + "train_loss": 0.14375008130550385, + "train_acc": 0.95434, + "test_loss": 2.9892458240509034, + "test_acc": 0.5392, + "lyapunov": null, + "grad_norm": 0.39243471184880735, + "grad_max_sv": 0.19629243165254592, + "grad_min_sv": 7.433162857537617e-09, + "grad_condition": 663172897.7860893, + "lr": 7.001981464747503e-06, + "time_sec": 32.63037371635437 + }, + { + "epoch": 143, + "train_loss": 0.14484988966464996, + "train_acc": 0.95374, + "test_loss": 3.005078562164307, + "test_acc": 0.541, + "lyapunov": null, + "grad_norm": 0.3927315675537109, + "grad_max_sv": 0.2067640382796526, + "grad_min_sv": 7.717835019151447e-09, + "grad_condition": 1087074704.470426, + "lr": 5.3638335185058295e-06, + "time_sec": 32.61275553703308 + }, + { + "epoch": 144, + "train_loss": 0.14234967883110047, + "train_acc": 0.95496, + "test_loss": 3.0190634880065916, + "test_acc": 0.5414, + "lyapunov": null, + "grad_norm": 0.389407660522802, + "grad_max_sv": 0.20883082449436188, + "grad_min_sv": 8.042504822162143e-09, + "grad_condition": 735296934.3497548, + "lr": 3.942649342761114e-06, + "time_sec": 32.630709171295166 + }, + { + "epoch": 145, + "train_loss": 0.14072841548681259, + "train_acc": 0.95612, + "test_loss": 2.974396339797974, + "test_acc": 0.5471, + "lyapunov": null, + "grad_norm": 0.3856929046195898, + "grad_max_sv": 0.19544588010758163, + "grad_min_sv": 7.138718509419373e-09, + "grad_condition": 5122409203.533503, + "lr": 2.7390523158633524e-06, + "time_sec": 32.635247468948364 + }, + { + "epoch": 146, + "train_loss": 0.14273023663520812, + "train_acc": 0.95578, + "test_loss": 2.9820834175109865, + "test_acc": 0.5441, + "lyapunov": null, + "grad_norm": 0.38656080604918364, + "grad_max_sv": 0.19659673869609834, + "grad_min_sv": 7.49241984375872e-09, + "grad_condition": 1201872260.69681, + "lr": 1.7535703752478133e-06, + "time_sec": 32.603397846221924 + }, + { + "epoch": 147, + "train_loss": 0.1410405499458313, + "train_acc": 0.95602, + "test_loss": 2.981495775222778, + "test_acc": 0.5419, + "lyapunov": null, + "grad_norm": 0.38881206566607257, + "grad_max_sv": 0.2015583546832204, + "grad_min_sv": 7.439259361047973e-09, + "grad_condition": 256637353.65744433, + "lr": 9.866357858642196e-07, + "time_sec": 32.6153359413147 + }, + { + "epoch": 148, + "train_loss": 0.14087454816818237, + "train_acc": 0.95532, + "test_loss": 3.0337733306884767, + "test_acc": 0.5407, + "lyapunov": null, + "grad_norm": 0.3869718856403076, + "grad_max_sv": 0.19626722503453492, + "grad_min_sv": 7.585891737774825e-09, + "grad_condition": 302680426.52042615, + "lr": 4.38584950570808e-07, + "time_sec": 32.6186146736145 + }, + { + "epoch": 149, + "train_loss": 0.14316360823869706, + "train_acc": 0.9544, + "test_loss": 2.9880101596832276, + "test_acc": 0.5412, + "lyapunov": null, + "grad_norm": 0.38865105056961796, + "grad_max_sv": 0.19493291191756726, + "grad_min_sv": 7.605263678024666e-09, + "grad_condition": 306741159.12086093, + "lr": 1.096582625772501e-07, + "time_sec": 32.618191719055176 + }, + { + "epoch": 150, + "train_loss": 0.14250738074302674, + "train_acc": 0.95574, + "test_loss": 3.0972991127014162, + "test_acc": 0.5341, + "lyapunov": null, + "grad_norm": 0.3882942108015414, + "grad_max_sv": 0.19360920544713736, + "grad_min_sv": 7.484912623034746e-09, + "grad_condition": 357186326.3835002, + "lr": 0.0, + "time_sec": 32.628779888153076 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 4.867076681213379, + "train_acc": 0.03032, + "test_loss": 4.947764100646973, + "test_acc": 0.0143, + "lyapunov": null, + "grad_norm": 5.924245355453859, + "grad_max_sv": 5.3032482981681826, + "grad_min_sv": 9.857900156173826e-08, + "grad_condition": 120242043.4723398, + "lr": 0.0009998903417374227, + "time_sec": 49.66225481033325 + }, + { + "epoch": 2, + "train_loss": 4.318109408493042, + "train_acc": 0.06186, + "test_loss": 4.948859809875488, + "test_acc": 0.0174, + "lyapunov": null, + "grad_norm": 4.473512739659572, + "grad_max_sv": 3.9397098541259767, + "grad_min_sv": 7.701884252586666e-08, + "grad_condition": 92549960.7307589, + "lr": 0.0009995614150494292, + "time_sec": 49.65573835372925 + }, + { + "epoch": 3, + "train_loss": 4.0393469068145755, + "train_acc": 0.0882, + "test_loss": 4.525526016235352, + "test_acc": 0.0246, + "lyapunov": null, + "grad_norm": 3.6557165978450756, + "grad_max_sv": 3.079137885570526, + "grad_min_sv": 6.436294224696979e-08, + "grad_condition": 7967774280.57207, + "lr": 0.0009990133642141358, + "time_sec": 49.633265256881714 + }, + { + "epoch": 4, + "train_loss": 3.846205193939209, + "train_acc": 0.11228, + "test_loss": 4.975083946228027, + "test_acc": 0.0275, + "lyapunov": null, + "grad_norm": 3.0659734946782295, + "grad_max_sv": 2.538968473672867, + "grad_min_sv": 5.467855347107697e-08, + "grad_condition": 79535259.28538653, + "lr": 0.0009982464296247522, + "time_sec": 49.63123106956482 + }, + { + "epoch": 5, + "train_loss": 3.691332396774292, + "train_acc": 0.13532, + "test_loss": 4.783598860931397, + "test_acc": 0.0369, + "lyapunov": null, + "grad_norm": 2.5536363471778976, + "grad_max_sv": 1.9760044306516646, + "grad_min_sv": 4.422183020880155e-08, + "grad_condition": 55126695.2664963, + "lr": 0.0009972609476841367, + "time_sec": 49.65209197998047 + }, + { + "epoch": 6, + "train_loss": 3.553630540008545, + "train_acc": 0.15754, + "test_loss": 4.568445386505127, + "test_acc": 0.0515, + "lyapunov": null, + "grad_norm": 2.12606891362942, + "grad_max_sv": 1.535008716583252, + "grad_min_sv": 3.7017866963418025e-08, + "grad_condition": 62102559.602248274, + "lr": 0.000996057350657239, + "time_sec": 49.673683881759644 + }, + { + "epoch": 7, + "train_loss": 3.4504250329589845, + "train_acc": 0.17538, + "test_loss": 4.65118264465332, + "test_acc": 0.054, + "lyapunov": null, + "grad_norm": 1.7701880091120692, + "grad_max_sv": 1.1685818210244179, + "grad_min_sv": 3.10900929667568e-08, + "grad_condition": 45005559.93922474, + "lr": 0.000994636166481494, + "time_sec": 49.64739394187927 + }, + { + "epoch": 8, + "train_loss": 3.3565325438690183, + "train_acc": 0.18776, + "test_loss": 4.876012271118164, + "test_acc": 0.0618, + "lyapunov": null, + "grad_norm": 1.5044376035669447, + "grad_max_sv": 0.8775043487548828, + "grad_min_sv": 2.6667509315028702e-08, + "grad_condition": 296430114.23387814, + "lr": 0.0009929980185352525, + "time_sec": 49.67679190635681 + }, + { + "epoch": 9, + "train_loss": 3.2745797639465333, + "train_acc": 0.20542, + "test_loss": 4.9326918502807615, + "test_acc": 0.0585, + "lyapunov": null, + "grad_norm": 1.3684138082571995, + "grad_max_sv": 0.7371457561850547, + "grad_min_sv": 2.4749053777195497e-08, + "grad_condition": 108871951.31387982, + "lr": 0.0009911436253643444, + "time_sec": 49.64658999443054 + }, + { + "epoch": 10, + "train_loss": 3.2189149342346193, + "train_acc": 0.214, + "test_loss": 5.03325620727539, + "test_acc": 0.0482, + "lyapunov": null, + "grad_norm": 1.2561694315834724, + "grad_max_sv": 0.6284460850059986, + "grad_min_sv": 2.2645430747258998e-08, + "grad_condition": 33572562.13603835, + "lr": 0.0009890738003669028, + "time_sec": 49.653048038482666 + }, + { + "epoch": 11, + "train_loss": 3.160115333251953, + "train_acc": 0.22594, + "test_loss": 6.272148492431641, + "test_acc": 0.0577, + "lyapunov": null, + "grad_norm": 1.1714413648507938, + "grad_max_sv": 0.5426148362457752, + "grad_min_sv": 2.1134999422800506e-08, + "grad_condition": 35214728.31695752, + "lr": 0.00098678945143658, + "time_sec": 49.695106506347656 + }, + { + "epoch": 12, + "train_loss": 3.109646647338867, + "train_acc": 0.23608, + "test_loss": 5.98844441986084, + "test_acc": 0.059, + "lyapunov": null, + "grad_norm": 1.106248438723714, + "grad_max_sv": 0.49079802110791204, + "grad_min_sv": 2.0135022657519207e-08, + "grad_condition": 43550673.1602456, + "lr": 0.0009842915805643154, + "time_sec": 49.64777135848999 + }, + { + "epoch": 13, + "train_loss": 3.0679126654815674, + "train_acc": 0.2429, + "test_loss": 5.38669468536377, + "test_acc": 0.0708, + "lyapunov": null, + "grad_norm": 1.0617767580006516, + "grad_max_sv": 0.4556848853826523, + "grad_min_sv": 1.974578255903303e-08, + "grad_condition": 49450086.08919337, + "lr": 0.000981581283398829, + "time_sec": 49.64315605163574 + }, + { + "epoch": 14, + "train_loss": 3.0292836235046385, + "train_acc": 0.2538, + "test_loss": 6.410186988830566, + "test_acc": 0.064, + "lyapunov": null, + "grad_norm": 1.0060226416432052, + "grad_max_sv": 0.4245763570070267, + "grad_min_sv": 1.8506429388942536e-08, + "grad_condition": 29580219.072595894, + "lr": 0.0009786597487660333, + "time_sec": 49.65712118148804 + }, + { + "epoch": 15, + "train_loss": 2.981404140319824, + "train_acc": 0.26162, + "test_loss": 5.5522136199951175, + "test_acc": 0.079, + "lyapunov": null, + "grad_norm": 0.9679737211436894, + "grad_max_sv": 0.39273724481463435, + "grad_min_sv": 1.7817760378235903e-08, + "grad_condition": 32708581.020238895, + "lr": 0.0009755282581475766, + "time_sec": 49.653464555740356 + }, + { + "epoch": 16, + "train_loss": 2.9441302935791014, + "train_acc": 0.2679, + "test_loss": 6.076311396789551, + "test_acc": 0.0558, + "lyapunov": null, + "grad_norm": 0.9232353580914646, + "grad_max_sv": 0.38061617463827135, + "grad_min_sv": 1.7214085454297924e-08, + "grad_condition": 27316628.630247217, + "lr": 0.0009721881851187403, + "time_sec": 49.67597222328186 + }, + { + "epoch": 17, + "train_loss": 2.9048094971466063, + "train_acc": 0.27692, + "test_loss": 6.079456564331054, + "test_acc": 0.0518, + "lyapunov": null, + "grad_norm": 0.891467290044791, + "grad_max_sv": 0.35018269568681715, + "grad_min_sv": 1.634932137728473e-08, + "grad_condition": 28285527.48074588, + "lr": 0.0009686409947459456, + "time_sec": 49.64990592002869 + }, + { + "epoch": 18, + "train_loss": 2.873079645462036, + "train_acc": 0.28224, + "test_loss": 6.066175770568847, + "test_acc": 0.0625, + "lyapunov": null, + "grad_norm": 0.8741844485503868, + "grad_max_sv": 0.35380034893751144, + "grad_min_sv": 1.5966123728672343e-08, + "grad_condition": 26291846.20197839, + "lr": 0.0009648882429441254, + "time_sec": 49.651339292526245 + }, + { + "epoch": 19, + "train_loss": 2.8434903021240236, + "train_acc": 0.28858, + "test_loss": 5.494677745056152, + "test_acc": 0.0941, + "lyapunov": null, + "grad_norm": 0.8557741380724747, + "grad_max_sv": 0.33219739720225333, + "grad_min_sv": 1.5816609089114308e-08, + "grad_condition": 24041708.13006859, + "lr": 0.00096093157579425, + "time_sec": 49.64615201950073 + }, + { + "epoch": 20, + "train_loss": 2.811087503204346, + "train_acc": 0.29328, + "test_loss": 5.656059492492676, + "test_acc": 0.0669, + "lyapunov": null, + "grad_norm": 0.8378343962997097, + "grad_max_sv": 0.3294540926814079, + "grad_min_sv": 1.5615107101796256e-08, + "grad_condition": 23976517.599521335, + "lr": 0.0009567727288213001, + "time_sec": 49.66048049926758 + }, + { + "epoch": 21, + "train_loss": 2.7742867500305177, + "train_acc": 0.3027, + "test_loss": 6.2807419387817385, + "test_acc": 0.0551, + "lyapunov": null, + "grad_norm": 0.822907042227662, + "grad_max_sv": 0.32042085379362106, + "grad_min_sv": 1.541958866979609e-08, + "grad_condition": 29484885.89671857, + "lr": 0.0009524135262330095, + "time_sec": 49.64675235748291 + }, + { + "epoch": 22, + "train_loss": 2.739880838623047, + "train_acc": 0.3066, + "test_loss": 6.388288533782959, + "test_acc": 0.0798, + "lyapunov": null, + "grad_norm": 0.8148392052716305, + "grad_max_sv": 0.3069480281323195, + "grad_min_sv": 1.4950799290258664e-08, + "grad_condition": 28309244.564152516, + "lr": 0.0009478558801197061, + "time_sec": 49.636857986450195 + }, + { + "epoch": 23, + "train_loss": 2.7262359308624267, + "train_acc": 0.30728, + "test_loss": 6.219175268554688, + "test_acc": 0.0797, + "lyapunov": null, + "grad_norm": 0.8001185522050407, + "grad_max_sv": 0.3042060166597366, + "grad_min_sv": 1.4733078970707858e-08, + "grad_condition": 48731628.77458956, + "lr": 0.000943101789615607, + "time_sec": 49.66920614242554 + }, + { + "epoch": 24, + "train_loss": 2.6896444255828857, + "train_acc": 0.31514, + "test_loss": 6.950405953216553, + "test_acc": 0.0681, + "lyapunov": null, + "grad_norm": 0.7902335651209668, + "grad_max_sv": 0.29678248390555384, + "grad_min_sv": 1.436923254514999e-08, + "grad_condition": 81486274.86742768, + "lr": 0.0009381533400219313, + "time_sec": 49.63133692741394 + }, + { + "epoch": 25, + "train_loss": 2.665062588043213, + "train_acc": 0.3211, + "test_loss": 5.463366045379638, + "test_acc": 0.0757, + "lyapunov": null, + "grad_norm": 0.7787106056593633, + "grad_max_sv": 0.289703868702054, + "grad_min_sv": 1.4815912328935976e-08, + "grad_condition": 29288675.239432998, + "lr": 0.0009330127018922189, + "time_sec": 49.62003183364868 + }, + { + "epoch": 26, + "train_loss": 2.6504075561523437, + "train_acc": 0.32334, + "test_loss": 5.581960006713867, + "test_acc": 0.076, + "lyapunov": null, + "grad_norm": 0.7765862590110221, + "grad_max_sv": 0.28965611904859545, + "grad_min_sv": 1.4621520069701965e-08, + "grad_condition": 49486165.52351975, + "lr": 0.000927682130080253, + "time_sec": 49.6389901638031 + }, + { + "epoch": 27, + "train_loss": 2.614381739425659, + "train_acc": 0.33194, + "test_loss": 5.60806091003418, + "test_acc": 0.0885, + "lyapunov": null, + "grad_norm": 0.7661123169926689, + "grad_max_sv": 0.2778739959001541, + "grad_min_sv": 1.4021614884798805e-08, + "grad_condition": 102919623.43599749, + "lr": 0.0009221639627510072, + "time_sec": 49.65237808227539 + }, + { + "epoch": 28, + "train_loss": 2.5988771228027345, + "train_acc": 0.3362, + "test_loss": 6.30830428314209, + "test_acc": 0.0788, + "lyapunov": null, + "grad_norm": 0.7544297292202896, + "grad_max_sv": 0.2770185124129057, + "grad_min_sv": 1.3951304235482187e-08, + "grad_condition": 27284734.9190725, + "lr": 0.0009164606203550494, + "time_sec": 49.64512538909912 + }, + { + "epoch": 29, + "train_loss": 2.568229464645386, + "train_acc": 0.3408, + "test_loss": 5.634605416870118, + "test_acc": 0.0881, + "lyapunov": null, + "grad_norm": 0.7537783086566691, + "grad_max_sv": 0.2754373669624329, + "grad_min_sv": 1.3882328608882944e-08, + "grad_condition": 36037607.075076535, + "lr": 0.0009105746045668516, + "time_sec": 49.83354067802429 + }, + { + "epoch": 30, + "train_loss": 2.5549702234649656, + "train_acc": 0.34176, + "test_loss": 5.78983073425293, + "test_acc": 0.0864, + "lyapunov": null, + "grad_norm": 0.7445001459037723, + "grad_max_sv": 0.26923939362168314, + "grad_min_sv": 1.3596951929650824e-08, + "grad_condition": 73994361.61909707, + "lr": 0.0009045084971874733, + "time_sec": 49.652652740478516 + }, + { + "epoch": 31, + "train_loss": 2.5326190648651123, + "train_acc": 0.34786, + "test_loss": 5.288684108734131, + "test_acc": 0.1055, + "lyapunov": null, + "grad_norm": 0.730348375021092, + "grad_max_sv": 0.2727065395563841, + "grad_min_sv": 1.3760889167047097e-08, + "grad_condition": 25673617.10480373, + "lr": 0.0008982649590120977, + "time_sec": 49.65483999252319 + }, + { + "epoch": 32, + "train_loss": 2.509755255126953, + "train_acc": 0.3526, + "test_loss": 5.09135297241211, + "test_acc": 0.1149, + "lyapunov": null, + "grad_norm": 0.7268611503644146, + "grad_max_sv": 0.2648207053542137, + "grad_min_sv": 1.3383840203815001e-08, + "grad_condition": 61829916.4522686, + "lr": 0.0008918467286629196, + "time_sec": 49.64020490646362 + }, + { + "epoch": 33, + "train_loss": 2.4931492380523683, + "train_acc": 0.3535, + "test_loss": 4.8521054679870605, + "test_acc": 0.0905, + "lyapunov": null, + "grad_norm": 0.7252118638296635, + "grad_max_sv": 0.26214006505906584, + "grad_min_sv": 1.3575532927401907e-08, + "grad_condition": 334808266.5462513, + "lr": 0.0008852566213878943, + "time_sec": 49.64065432548523 + }, + { + "epoch": 34, + "train_loss": 2.4606708142852782, + "train_acc": 0.36322, + "test_loss": 5.382892584228515, + "test_acc": 0.0873, + "lyapunov": null, + "grad_norm": 0.7248019714395398, + "grad_max_sv": 0.2584072381258011, + "grad_min_sv": 1.338938943051815e-08, + "grad_condition": 22159216.767137464, + "lr": 0.000878497527825878, + "time_sec": 49.6495418548584 + }, + { + "epoch": 35, + "train_loss": 2.4486713790893555, + "train_acc": 0.36274, + "test_loss": 6.107360326385498, + "test_acc": 0.088, + "lyapunov": null, + "grad_norm": 0.7179387338095772, + "grad_max_sv": 0.257593410089612, + "grad_min_sv": 1.3255892609975727e-08, + "grad_condition": 31085602.136499394, + "lr": 0.000871572412738697, + "time_sec": 49.6601026058197 + }, + { + "epoch": 36, + "train_loss": 2.4229932917785644, + "train_acc": 0.36894, + "test_loss": 5.342076141357422, + "test_acc": 0.1032, + "lyapunov": null, + "grad_norm": 0.7096950968080892, + "grad_max_sv": 0.2630200952291489, + "grad_min_sv": 1.3239768038332544e-08, + "grad_condition": 127101703.7953295, + "lr": 0.0008644843137107055, + "time_sec": 49.6635947227478 + }, + { + "epoch": 37, + "train_loss": 2.402267124176025, + "train_acc": 0.37332, + "test_loss": 5.335811291503906, + "test_acc": 0.094, + "lyapunov": null, + "grad_norm": 0.7120085793949865, + "grad_max_sv": 0.2575002573430538, + "grad_min_sv": 1.3368413254166712e-08, + "grad_condition": 22240358.280464128, + "lr": 0.0008572363398164014, + "time_sec": 49.641186237335205 + }, + { + "epoch": 38, + "train_loss": 2.3891987635040284, + "train_acc": 0.37632, + "test_loss": 5.805789661407471, + "test_acc": 0.0868, + "lyapunov": null, + "grad_norm": 0.7035846040354297, + "grad_max_sv": 0.24730649814009667, + "grad_min_sv": 1.3207518079205727e-08, + "grad_condition": 21910824.96396754, + "lr": 0.0008498316702566826, + "time_sec": 49.62650012969971 + }, + { + "epoch": 39, + "train_loss": 2.3623206945037842, + "train_acc": 0.38086, + "test_loss": 5.062893334960937, + "test_acc": 0.1092, + "lyapunov": null, + "grad_norm": 0.7017695804872179, + "grad_max_sv": 0.2500867433845997, + "grad_min_sv": 1.3118892544516925e-08, + "grad_condition": 25255887.129776128, + "lr": 0.0008422735529643442, + "time_sec": 49.67772555351257 + }, + { + "epoch": 40, + "train_loss": 2.3529662413024903, + "train_acc": 0.38294, + "test_loss": 5.610953298950196, + "test_acc": 0.0967, + "lyapunov": null, + "grad_norm": 0.6977946259413065, + "grad_max_sv": 0.24688060581684113, + "grad_min_sv": 1.2960891920821282e-08, + "grad_condition": 56123099.644835316, + "lr": 0.0008345653031794289, + "time_sec": 49.639814615249634 + }, + { + "epoch": 41, + "train_loss": 2.333562068939209, + "train_acc": 0.3903, + "test_loss": 5.925393104553223, + "test_acc": 0.091, + "lyapunov": null, + "grad_norm": 0.6938463445534568, + "grad_max_sv": 0.24459562487900258, + "grad_min_sv": 1.2906656435274221e-08, + "grad_condition": 25427891.502809733, + "lr": 0.0008267103019950526, + "time_sec": 49.65977430343628 + }, + { + "epoch": 42, + "train_loss": 2.3124754654693604, + "train_acc": 0.39228, + "test_loss": 5.738756129455567, + "test_acc": 0.0944, + "lyapunov": null, + "grad_norm": 0.6937138646925527, + "grad_max_sv": 0.24724075458943845, + "grad_min_sv": 1.319203219302123e-08, + "grad_condition": 45185002.54128989, + "lr": 0.0008187119948743447, + "time_sec": 49.621787548065186 + }, + { + "epoch": 43, + "train_loss": 2.297122774810791, + "train_acc": 0.39518, + "test_loss": 5.558856762695313, + "test_acc": 0.1069, + "lyapunov": null, + "grad_norm": 0.6954023940661026, + "grad_max_sv": 0.23504742681980134, + "grad_min_sv": 1.2803007077774598e-08, + "grad_condition": 74752626.21660146, + "lr": 0.000810573890139155, + "time_sec": 49.636855125427246 + }, + { + "epoch": 44, + "train_loss": 2.2821614197540283, + "train_acc": 0.3971, + "test_loss": 5.645317272186279, + "test_acc": 0.1193, + "lyapunov": null, + "grad_norm": 0.6907205928765684, + "grad_max_sv": 0.24622961431741713, + "grad_min_sv": 1.2981342747964141e-08, + "grad_condition": 26199709.677898668, + "lr": 0.0008022995574311873, + "time_sec": 49.64198565483093 + }, + { + "epoch": 45, + "train_loss": 2.2713894058227537, + "train_acc": 0.39952, + "test_loss": 5.601718740844727, + "test_acc": 0.115, + "lyapunov": null, + "grad_norm": 0.6820910668916103, + "grad_max_sv": 0.23520345650613309, + "grad_min_sv": 1.248807580886413e-08, + "grad_condition": 31636031.288275667, + "lr": 0.0007938926261462363, + "time_sec": 49.67773389816284 + }, + { + "epoch": 46, + "train_loss": 2.257637547302246, + "train_acc": 0.40164, + "test_loss": 6.1034967262268065, + "test_acc": 0.0963, + "lyapunov": null, + "grad_norm": 0.6857789433621205, + "grad_max_sv": 0.2412054430693388, + "grad_min_sv": 1.2735198454127961e-08, + "grad_condition": 23495873.85592956, + "lr": 0.0007853567838422158, + "time_sec": 49.70046591758728 + }, + { + "epoch": 47, + "train_loss": 2.2420009886932375, + "train_acc": 0.40796, + "test_loss": 6.0141721504211425, + "test_acc": 0.0994, + "lyapunov": null, + "grad_norm": 0.6884466036918674, + "grad_max_sv": 0.23858897313475608, + "grad_min_sv": 1.279806305862219e-08, + "grad_condition": 32602369.53036396, + "lr": 0.0007766957746216719, + "time_sec": 49.64759612083435 + }, + { + "epoch": 48, + "train_loss": 2.221109953689575, + "train_acc": 0.41348, + "test_loss": 5.113736025238037, + "test_acc": 0.1051, + "lyapunov": null, + "grad_norm": 0.6799436836768571, + "grad_max_sv": 0.23215029686689376, + "grad_min_sv": 1.2702428098948504e-08, + "grad_condition": 30660390.224244833, + "lr": 0.0007679133974894982, + "time_sec": 49.63391995429993 + }, + { + "epoch": 49, + "train_loss": 2.205668955535889, + "train_acc": 0.41396, + "test_loss": 5.725731170654297, + "test_acc": 0.1127, + "lyapunov": null, + "grad_norm": 0.6800157289733184, + "grad_max_sv": 0.23190808668732643, + "grad_min_sv": 1.2591927725513764e-08, + "grad_condition": 25226269.11831253, + "lr": 0.000759013504686565, + "time_sec": 49.659985303878784 + }, + { + "epoch": 50, + "train_loss": 2.178990175933838, + "train_acc": 0.41954, + "test_loss": 6.77099367980957, + "test_acc": 0.08, + "lyapunov": null, + "grad_norm": 0.6859317460073948, + "grad_max_sv": 0.24390893206000328, + "grad_min_sv": 1.3008656658125562e-08, + "grad_condition": 45710128.91239187, + "lr": 0.0007499999999999998, + "time_sec": 49.67057538032532 + }, + { + "epoch": 51, + "train_loss": 2.1731418634796142, + "train_acc": 0.42034, + "test_loss": 5.4437935821533205, + "test_acc": 0.1355, + "lyapunov": null, + "grad_norm": 0.6797845917426844, + "grad_max_sv": 0.23709770888090134, + "grad_min_sv": 1.2489326947640045e-08, + "grad_condition": 71005409.6953965, + "lr": 0.0007408768370508575, + "time_sec": 49.65837097167969 + }, + { + "epoch": 52, + "train_loss": 2.1565717080688476, + "train_acc": 0.42326, + "test_loss": 6.098255497741699, + "test_acc": 0.104, + "lyapunov": null, + "grad_norm": 0.6814943332144482, + "grad_max_sv": 0.24653270244598388, + "grad_min_sv": 1.2720437771694681e-08, + "grad_condition": 194840995.8680305, + "lr": 0.0007316480175599307, + "time_sec": 49.66200804710388 + }, + { + "epoch": 53, + "train_loss": 2.1340223332977293, + "train_acc": 0.42998, + "test_loss": 6.049259701538086, + "test_acc": 0.0861, + "lyapunov": null, + "grad_norm": 0.6777001479734457, + "grad_max_sv": 0.23873055540025234, + "grad_min_sv": 1.2421411374474723e-08, + "grad_condition": 32226811.25325196, + "lr": 0.0007223175895924635, + "time_sec": 49.665961027145386 + }, + { + "epoch": 54, + "train_loss": 2.126938176651001, + "train_acc": 0.43106, + "test_loss": 6.562160124969482, + "test_acc": 0.0789, + "lyapunov": null, + "grad_norm": 0.6759930609089722, + "grad_max_sv": 0.23779002986848355, + "grad_min_sv": 1.28305379175353e-08, + "grad_condition": 35566779.08443637, + "lr": 0.0007128896457825361, + "time_sec": 49.65031957626343 + }, + { + "epoch": 55, + "train_loss": 2.1051641911315917, + "train_acc": 0.43512, + "test_loss": 5.5847692222595215, + "test_acc": 0.094, + "lyapunov": null, + "grad_norm": 0.6809336732903097, + "grad_max_sv": 0.23433455340564252, + "grad_min_sv": 1.2507266784755888e-08, + "grad_condition": 39814021.79378623, + "lr": 0.0007033683215378998, + "time_sec": 49.65074586868286 + }, + { + "epoch": 56, + "train_loss": 2.092265638580322, + "train_acc": 0.43686, + "test_loss": 6.618711474609375, + "test_acc": 0.0951, + "lyapunov": null, + "grad_norm": 0.6774035816145235, + "grad_max_sv": 0.23422617167234422, + "grad_min_sv": 1.2562931204357363e-08, + "grad_condition": 42511854.242542446, + "lr": 0.0006937577932260512, + "time_sec": 49.67660713195801 + }, + { + "epoch": 57, + "train_loss": 2.0827418495941163, + "train_acc": 0.4403, + "test_loss": 6.194670201873779, + "test_acc": 0.0994, + "lyapunov": null, + "grad_norm": 0.6678254293340489, + "grad_max_sv": 0.2269128028303385, + "grad_min_sv": 1.2401744986512142e-08, + "grad_condition": 21973869.575117223, + "lr": 0.0006840622763423388, + "time_sec": 49.783742904663086 + }, + { + "epoch": 58, + "train_loss": 2.0623908683013914, + "train_acc": 0.44656, + "test_loss": 6.666766788482666, + "test_acc": 0.0993, + "lyapunov": null, + "grad_norm": 0.6720634537783472, + "grad_max_sv": 0.24044986441731453, + "grad_min_sv": 1.2775585303548275e-08, + "grad_condition": 25485277.371963684, + "lr": 0.0006742860236609073, + "time_sec": 49.669817209243774 + }, + { + "epoch": 59, + "train_loss": 2.0514604888153074, + "train_acc": 0.44538, + "test_loss": 6.695825149536133, + "test_acc": 0.1151, + "lyapunov": null, + "grad_norm": 0.6809315885518872, + "grad_max_sv": 0.24165161401033403, + "grad_min_sv": 1.2788197974178406e-08, + "grad_condition": 35590192.68303648, + "lr": 0.0006644333233692913, + "time_sec": 49.650195837020874 + }, + { + "epoch": 60, + "train_loss": 2.0252186447906495, + "train_acc": 0.45138, + "test_loss": 5.913940372467041, + "test_acc": 0.1163, + "lyapunov": null, + "grad_norm": 0.6772762313116852, + "grad_max_sv": 0.23192268945276737, + "grad_min_sv": 1.260488815824079e-08, + "grad_condition": 36769303.52556603, + "lr": 0.0006545084971874734, + "time_sec": 49.664047718048096 + }, + { + "epoch": 61, + "train_loss": 2.007682227020264, + "train_acc": 0.45666, + "test_loss": 5.868577780151367, + "test_acc": 0.115, + "lyapunov": null, + "grad_norm": 0.6759522840384884, + "grad_max_sv": 0.22865727171301842, + "grad_min_sv": 1.2542224199496577e-08, + "grad_condition": 24304675.366521474, + "lr": 0.0006445158984722354, + "time_sec": 49.672890186309814 + }, + { + "epoch": 62, + "train_loss": 1.995171699295044, + "train_acc": 0.46184, + "test_loss": 6.737825399017334, + "test_acc": 0.118, + "lyapunov": null, + "grad_norm": 0.6771801071307233, + "grad_max_sv": 0.23842737562954425, + "grad_min_sv": 1.2555753026860517e-08, + "grad_condition": 76751681.04997593, + "lr": 0.0006344599103076324, + "time_sec": 49.647465467453 + }, + { + "epoch": 63, + "train_loss": 1.981292818222046, + "train_acc": 0.46314, + "test_loss": 7.100067088317871, + "test_acc": 0.1095, + "lyapunov": null, + "grad_norm": 0.6713695448222669, + "grad_max_sv": 0.2343658696860075, + "grad_min_sv": 1.26902626518266e-08, + "grad_condition": 28181773.273861475, + "lr": 0.0006243449435824269, + "time_sec": 49.649380683898926 + }, + { + "epoch": 64, + "train_loss": 1.9733019332122803, + "train_acc": 0.46438, + "test_loss": 5.759408002471924, + "test_acc": 0.1153, + "lyapunov": null, + "grad_norm": 0.6738823550588381, + "grad_max_sv": 0.2319059170782566, + "grad_min_sv": 1.2463900067594125e-08, + "grad_condition": 40112949.74296764, + "lr": 0.0006141754350553275, + "time_sec": 49.66850161552429 + }, + { + "epoch": 65, + "train_loss": 1.9568941514587401, + "train_acc": 0.46904, + "test_loss": 7.127551719665528, + "test_acc": 0.0848, + "lyapunov": null, + "grad_norm": 0.6742441227866462, + "grad_max_sv": 0.23397597223520278, + "grad_min_sv": 1.25213092679044e-08, + "grad_condition": 46515106.210851446, + "lr": 0.0006039558454088793, + "time_sec": 49.66012144088745 + }, + { + "epoch": 66, + "train_loss": 1.9348979427337647, + "train_acc": 0.47398, + "test_loss": 6.236616806030273, + "test_acc": 0.1078, + "lyapunov": null, + "grad_norm": 0.6734446447786178, + "grad_max_sv": 0.23539532758295537, + "grad_min_sv": 1.2652164015081179e-08, + "grad_condition": 28579248.32682752, + "lr": 0.000593690657292862, + "time_sec": 49.64537501335144 + }, + { + "epoch": 67, + "train_loss": 1.9291245281600953, + "train_acc": 0.47196, + "test_loss": 6.798108719635009, + "test_acc": 0.094, + "lyapunov": null, + "grad_norm": 0.6760498050370345, + "grad_max_sv": 0.2377512652426958, + "grad_min_sv": 1.2435551444145432e-08, + "grad_condition": 25305099.629897654, + "lr": 0.0005833843733580507, + "time_sec": 49.67935347557068 + }, + { + "epoch": 68, + "train_loss": 1.9192953534317017, + "train_acc": 0.4772, + "test_loss": 6.608765222930908, + "test_acc": 0.0882, + "lyapunov": null, + "grad_norm": 0.6717332361493707, + "grad_max_sv": 0.23620884753763677, + "grad_min_sv": 1.2707171583026255e-08, + "grad_condition": 49129599.72542394, + "lr": 0.0005730415142812054, + "time_sec": 49.64025044441223 + }, + { + "epoch": 69, + "train_loss": 1.8987758751678467, + "train_acc": 0.47966, + "test_loss": 5.653663331604004, + "test_acc": 0.1227, + "lyapunov": null, + "grad_norm": 0.6705292453226563, + "grad_max_sv": 0.2265289269387722, + "grad_min_sv": 1.2440874884792063e-08, + "grad_condition": 96538400.80037068, + "lr": 0.0005626666167821517, + "time_sec": 49.66509675979614 + }, + { + "epoch": 70, + "train_loss": 1.884353363494873, + "train_acc": 0.48414, + "test_loss": 6.035382391357422, + "test_acc": 0.1021, + "lyapunov": null, + "grad_norm": 0.6680799244712567, + "grad_max_sv": 0.23454298377037047, + "grad_min_sv": 1.2329038198699571e-08, + "grad_condition": 23720736.796809513, + "lr": 0.0005522642316338265, + "time_sec": 49.65922212600708 + }, + { + "epoch": 71, + "train_loss": 1.8602378274917601, + "train_acc": 0.48812, + "test_loss": 6.718938314819336, + "test_acc": 0.0974, + "lyapunov": null, + "grad_norm": 0.6690275979174782, + "grad_max_sv": 0.22686633579432963, + "grad_min_sv": 1.2291359120092382e-08, + "grad_condition": 33025361.562200826, + "lr": 0.0005418389216661573, + "time_sec": 49.67633080482483 + }, + { + "epoch": 72, + "train_loss": 1.8526426247406005, + "train_acc": 0.49134, + "test_loss": 6.2294830772399905, + "test_acc": 0.1148, + "lyapunov": null, + "grad_norm": 0.6720197173871366, + "grad_max_sv": 0.23030848391354083, + "grad_min_sv": 1.2546923280204458e-08, + "grad_condition": 32378085.898901425, + "lr": 0.0005313952597646563, + "time_sec": 49.64814281463623 + }, + { + "epoch": 73, + "train_loss": 1.8410167992782593, + "train_acc": 0.4922, + "test_loss": 6.237728077697754, + "test_acc": 0.1122, + "lyapunov": null, + "grad_norm": 0.6700291325745232, + "grad_max_sv": 0.2350303005427122, + "grad_min_sv": 1.2499374603576474e-08, + "grad_condition": 114488188.85089114, + "lr": 0.0005209378268645994, + "time_sec": 49.64322113990784 + }, + { + "epoch": 74, + "train_loss": 1.8187053978729248, + "train_acc": 0.49946, + "test_loss": 6.824303936767578, + "test_acc": 0.097, + "lyapunov": null, + "grad_norm": 0.672244343544663, + "grad_max_sv": 0.23095075972378254, + "grad_min_sv": 1.2445574060215848e-08, + "grad_condition": 22890357.9667615, + "lr": 0.0005104712099416781, + "time_sec": 49.6670081615448 + }, + { + "epoch": 75, + "train_loss": 1.813272426071167, + "train_acc": 0.49968, + "test_loss": 5.798268667602539, + "test_acc": 0.1047, + "lyapunov": null, + "grad_norm": 0.6721278079431174, + "grad_max_sv": 0.23032179288566113, + "grad_min_sv": 1.2480348247911888e-08, + "grad_condition": 37321408.338354364, + "lr": 0.0004999999999999996, + "time_sec": 49.65290307998657 + }, + { + "epoch": 76, + "train_loss": 1.7899452612304687, + "train_acc": 0.50648, + "test_loss": 6.24032091217041, + "test_acc": 0.1125, + "lyapunov": null, + "grad_norm": 0.6727269345754596, + "grad_max_sv": 0.23410010598599912, + "grad_min_sv": 1.2507147805623786e-08, + "grad_condition": 71365024.07798055, + "lr": 0.0004895287900583212, + "time_sec": 49.65421724319458 + }, + { + "epoch": 77, + "train_loss": 1.7827668267822265, + "train_acc": 0.50734, + "test_loss": 6.399443918609619, + "test_acc": 0.1091, + "lyapunov": null, + "grad_norm": 0.6741506035504011, + "grad_max_sv": 0.230082393810153, + "grad_min_sv": 1.2451498095089608e-08, + "grad_condition": 36256669.36254879, + "lr": 0.0004790621731353997, + "time_sec": 49.70512247085571 + }, + { + "epoch": 78, + "train_loss": 1.7687860860443114, + "train_acc": 0.51008, + "test_loss": 6.445651992797852, + "test_acc": 0.1052, + "lyapunov": null, + "grad_norm": 0.6697954996039798, + "grad_max_sv": 0.22649035081267357, + "grad_min_sv": 1.2488184172876337e-08, + "grad_condition": 23806277.12272833, + "lr": 0.000468604740235343, + "time_sec": 49.662657499313354 + }, + { + "epoch": 79, + "train_loss": 1.7489702334594726, + "train_acc": 0.51562, + "test_loss": 6.530778681182861, + "test_acc": 0.117, + "lyapunov": null, + "grad_norm": 0.6739375451558363, + "grad_max_sv": 0.22849502116441728, + "grad_min_sv": 1.245096855617689e-08, + "grad_condition": 28709311.845186163, + "lr": 0.00045816107833384175, + "time_sec": 49.67883372306824 + }, + { + "epoch": 80, + "train_loss": 1.7359050400161744, + "train_acc": 0.51766, + "test_loss": 6.335304261016845, + "test_acc": 0.1135, + "lyapunov": null, + "grad_norm": 0.673084733583316, + "grad_max_sv": 0.23147543855011463, + "grad_min_sv": 1.262345546010346e-08, + "grad_condition": 67753848.58025023, + "lr": 0.0004477357683661729, + "time_sec": 49.67265200614929 + }, + { + "epoch": 81, + "train_loss": 1.728564892616272, + "train_acc": 0.5189, + "test_loss": 6.764313927459717, + "test_acc": 0.1148, + "lyapunov": null, + "grad_norm": 0.6723535831800918, + "grad_max_sv": 0.23651552833616735, + "grad_min_sv": 1.2691624282079595e-08, + "grad_condition": 48499713.46620417, + "lr": 0.00043733338321784746, + "time_sec": 49.660566329956055 + }, + { + "epoch": 82, + "train_loss": 1.7069255582427978, + "train_acc": 0.52546, + "test_loss": 6.82549387664795, + "test_acc": 0.1045, + "lyapunov": null, + "grad_norm": 0.6714222489059333, + "grad_max_sv": 0.23965975381433963, + "grad_min_sv": 1.2654725708646785e-08, + "grad_condition": 78105112.66743548, + "lr": 0.0004269584857187939, + "time_sec": 49.84282612800598 + }, + { + "epoch": 83, + "train_loss": 1.7002278206634522, + "train_acc": 0.52806, + "test_loss": 7.086389317321777, + "test_acc": 0.099, + "lyapunov": null, + "grad_norm": 0.6733522471613737, + "grad_max_sv": 0.23215787783265113, + "grad_min_sv": 1.2419085829162846e-08, + "grad_condition": 22634568.424719356, + "lr": 0.0004166156266419484, + "time_sec": 49.650322914123535 + }, + { + "epoch": 84, + "train_loss": 1.6763646780395507, + "train_acc": 0.5308, + "test_loss": 6.611732363891601, + "test_acc": 0.118, + "lyapunov": null, + "grad_norm": 0.6733553577608795, + "grad_max_sv": 0.2272573009133339, + "grad_min_sv": 1.2343867245023787e-08, + "grad_condition": 23864640.71802464, + "lr": 0.0004063093427071373, + "time_sec": 49.691351890563965 + }, + { + "epoch": 85, + "train_loss": 1.6756745571517944, + "train_acc": 0.53228, + "test_loss": 6.4739246078491215, + "test_acc": 0.1015, + "lyapunov": null, + "grad_norm": 0.6746656074581188, + "grad_max_sv": 0.23839143104851246, + "grad_min_sv": 1.2371040583429582e-08, + "grad_condition": 132338471.9659415, + "lr": 0.0003960441545911199, + "time_sec": 49.67355513572693 + }, + { + "epoch": 86, + "train_loss": 1.6653836363983154, + "train_acc": 0.53528, + "test_loss": 6.292951089477539, + "test_acc": 0.1177, + "lyapunov": null, + "grad_norm": 0.6721776058240324, + "grad_max_sv": 0.22739280313253402, + "grad_min_sv": 1.2439889082727084e-08, + "grad_condition": 50660277.29149826, + "lr": 0.0003858245649446718, + "time_sec": 49.70143532752991 + }, + { + "epoch": 87, + "train_loss": 1.6428289547348023, + "train_acc": 0.53956, + "test_loss": 6.49584349975586, + "test_acc": 0.1211, + "lyapunov": null, + "grad_norm": 0.6670785293463617, + "grad_max_sv": 0.23538414649665357, + "grad_min_sv": 1.2516606368029315e-08, + "grad_condition": 32919772.982234925, + "lr": 0.00037565505641757235, + "time_sec": 49.68615436553955 + }, + { + "epoch": 88, + "train_loss": 1.634814398727417, + "train_acc": 0.54118, + "test_loss": 6.50436838684082, + "test_acc": 0.1187, + "lyapunov": null, + "grad_norm": 0.6745663524438923, + "grad_max_sv": 0.23613668605685234, + "grad_min_sv": 1.2677799557381241e-08, + "grad_condition": 44607655.03080545, + "lr": 0.00036554008969236695, + "time_sec": 49.649219274520874 + }, + { + "epoch": 89, + "train_loss": 1.6165026095581054, + "train_acc": 0.54594, + "test_loss": 6.791359812164306, + "test_acc": 0.1115, + "lyapunov": null, + "grad_norm": 0.6737081832476569, + "grad_max_sv": 0.23479382395744325, + "grad_min_sv": 1.2516244720078146e-08, + "grad_condition": 190811782.4744936, + "lr": 0.0003554841015277638, + "time_sec": 49.683497190475464 + }, + { + "epoch": 90, + "train_loss": 1.6110337893676758, + "train_acc": 0.54666, + "test_loss": 6.632439305114746, + "test_acc": 0.1183, + "lyapunov": null, + "grad_norm": 0.6713968186469105, + "grad_max_sv": 0.22974373511970042, + "grad_min_sv": 1.2277071293614883e-08, + "grad_condition": 37068924.71238396, + "lr": 0.000345491502812526, + "time_sec": 49.636313676834106 + }, + { + "epoch": 91, + "train_loss": 1.5944184198379516, + "train_acc": 0.55296, + "test_loss": 6.748670170593262, + "test_acc": 0.1158, + "lyapunov": null, + "grad_norm": 0.6694050704454773, + "grad_max_sv": 0.23858524970710276, + "grad_min_sv": 1.2643264604705885e-08, + "grad_condition": 25877894.916739095, + "lr": 0.0003355666766307081, + "time_sec": 49.687766790390015 + }, + { + "epoch": 92, + "train_loss": 1.582156534500122, + "train_acc": 0.55502, + "test_loss": 7.055152958679199, + "test_acc": 0.125, + "lyapunov": null, + "grad_norm": 0.6711245974179065, + "grad_max_sv": 0.2372837509959936, + "grad_min_sv": 1.250213053222149e-08, + "grad_condition": 41995114.905596815, + "lr": 0.00032571397633909225, + "time_sec": 49.64969778060913 + }, + { + "epoch": 93, + "train_loss": 1.570514686050415, + "train_acc": 0.557, + "test_loss": 6.646953351593018, + "test_acc": 0.1247, + "lyapunov": null, + "grad_norm": 0.6694032992923055, + "grad_max_sv": 0.23712432235479355, + "grad_min_sv": 1.2480553441543071e-08, + "grad_condition": 337358114.5037104, + "lr": 0.00031593772365766094, + "time_sec": 49.64657950401306 + }, + { + "epoch": 94, + "train_loss": 1.5698510019683838, + "train_acc": 0.55662, + "test_loss": 6.813129180908203, + "test_acc": 0.1211, + "lyapunov": null, + "grad_norm": 0.6745313526600484, + "grad_max_sv": 0.23206005096435547, + "grad_min_sv": 1.2231206397012028e-08, + "grad_condition": 59878977.27942028, + "lr": 0.0003062422067739483, + "time_sec": 49.649224519729614 + }, + { + "epoch": 95, + "train_loss": 1.5525139013290405, + "train_acc": 0.56018, + "test_loss": 6.746605987548828, + "test_acc": 0.1185, + "lyapunov": null, + "grad_norm": 0.6673893510246934, + "grad_max_sv": 0.22761529460549354, + "grad_min_sv": 1.2434594947111078e-08, + "grad_condition": 55398196.865595676, + "lr": 0.00029663167846209965, + "time_sec": 49.65047597885132 + }, + { + "epoch": 96, + "train_loss": 1.5430318810653687, + "train_acc": 0.56506, + "test_loss": 7.396685010528564, + "test_acc": 0.1069, + "lyapunov": null, + "grad_norm": 0.6632435694537989, + "grad_max_sv": 0.22706211358308792, + "grad_min_sv": 1.2345683975036742e-08, + "grad_condition": 149601623.8160465, + "lr": 0.00028711035421746345, + "time_sec": 49.66360521316528 + }, + { + "epoch": 97, + "train_loss": 1.5200880788803102, + "train_acc": 0.57142, + "test_loss": 7.5394327842712405, + "test_acc": 0.1061, + "lyapunov": null, + "grad_norm": 0.6643317104321547, + "grad_max_sv": 0.23884013146162034, + "grad_min_sv": 1.2467270498123847e-08, + "grad_condition": 1731039266.2526886, + "lr": 0.00027768241040753615, + "time_sec": 49.65261173248291 + }, + { + "epoch": 98, + "train_loss": 1.518323214111328, + "train_acc": 0.5696, + "test_loss": 7.21264954071045, + "test_acc": 0.108, + "lyapunov": null, + "grad_norm": 0.6651950927793007, + "grad_max_sv": 0.23549152724444866, + "grad_min_sv": 1.2395403968501994e-08, + "grad_condition": 573884799.872338, + "lr": 0.00026835198244006903, + "time_sec": 49.66014313697815 + }, + { + "epoch": 99, + "train_loss": 1.5111107628631593, + "train_acc": 0.57066, + "test_loss": 7.129739350891113, + "test_acc": 0.1072, + "lyapunov": null, + "grad_norm": 0.6628965844959802, + "grad_max_sv": 0.23341625332832336, + "grad_min_sv": 1.2492304993921844e-08, + "grad_condition": 46595001.70183447, + "lr": 0.0002591231629491421, + "time_sec": 49.679956912994385 + }, + { + "epoch": 100, + "train_loss": 1.4924037743759155, + "train_acc": 0.57592, + "test_loss": 6.886035611724854, + "test_acc": 0.1178, + "lyapunov": null, + "grad_norm": 0.6657266029095829, + "grad_max_sv": 0.230366924777627, + "grad_min_sv": 1.2321952966298788e-08, + "grad_condition": 25117301.167941064, + "lr": 0.0002499999999999997, + "time_sec": 49.66248035430908 + }, + { + "epoch": 101, + "train_loss": 1.4861050595092773, + "train_acc": 0.57828, + "test_loss": 6.799741802978516, + "test_acc": 0.1228, + "lyapunov": null, + "grad_norm": 0.6686905715905375, + "grad_max_sv": 0.23545245304703713, + "grad_min_sv": 1.234361735047429e-08, + "grad_condition": 29444253.12861086, + "lr": 0.00024098649531343477, + "time_sec": 49.66140055656433 + }, + { + "epoch": 102, + "train_loss": 1.4725512704849244, + "train_acc": 0.58142, + "test_loss": 7.177790800476075, + "test_acc": 0.1098, + "lyapunov": null, + "grad_norm": 0.6650535279389591, + "grad_max_sv": 0.2346459224820137, + "grad_min_sv": 1.2347895218811633e-08, + "grad_condition": 32027930.26552541, + "lr": 0.0002320866025105016, + "time_sec": 49.670332193374634 + }, + { + "epoch": 103, + "train_loss": 1.4619587004852295, + "train_acc": 0.58584, + "test_loss": 6.925167604064941, + "test_acc": 0.1244, + "lyapunov": null, + "grad_norm": 0.6611290754227804, + "grad_max_sv": 0.23446624241769315, + "grad_min_sv": 1.2205713886457268e-08, + "grad_condition": 816637504.324081, + "lr": 0.0002233042253783278, + "time_sec": 49.66000247001648 + }, + { + "epoch": 104, + "train_loss": 1.4553011770248414, + "train_acc": 0.5884, + "test_loss": 6.954682211303711, + "test_acc": 0.1251, + "lyapunov": null, + "grad_norm": 0.6632380519638201, + "grad_max_sv": 0.2356626283377409, + "grad_min_sv": 1.2399409735769362e-08, + "grad_condition": 60742416.672109105, + "lr": 0.000214643216157784, + "time_sec": 49.647239685058594 + }, + { + "epoch": 105, + "train_loss": 1.4439967386245727, + "train_acc": 0.59044, + "test_loss": 6.935120243835449, + "test_acc": 0.1288, + "lyapunov": null, + "grad_norm": 0.6633451028650943, + "grad_max_sv": 0.2364518467336893, + "grad_min_sv": 1.255814783829301e-08, + "grad_condition": 22935173.07316313, + "lr": 0.00020610737385376332, + "time_sec": 49.683613300323486 + }, + { + "epoch": 106, + "train_loss": 1.4366886682128905, + "train_acc": 0.59094, + "test_loss": 7.093826289367676, + "test_acc": 0.1231, + "lyapunov": null, + "grad_norm": 0.663271217932332, + "grad_max_sv": 0.23506820090115071, + "grad_min_sv": 1.2124915337724529e-08, + "grad_condition": 42573443.94560614, + "lr": 0.00019770044256881242, + "time_sec": 49.66502928733826 + }, + { + "epoch": 107, + "train_loss": 1.4277326443862914, + "train_acc": 0.59332, + "test_loss": 7.7529417953491215, + "test_acc": 0.1059, + "lyapunov": null, + "grad_norm": 0.6635081985078852, + "grad_max_sv": 0.23835694566369056, + "grad_min_sv": 1.2204500224669013e-08, + "grad_condition": 105007030.04684536, + "lr": 0.0001894261098608447, + "time_sec": 49.66994285583496 + }, + { + "epoch": 108, + "train_loss": 1.422326604423523, + "train_acc": 0.59542, + "test_loss": 8.043737371826172, + "test_acc": 0.1043, + "lyapunov": null, + "grad_norm": 0.6616785437081295, + "grad_max_sv": 0.22960531041026117, + "grad_min_sv": 1.2122151026028316e-08, + "grad_condition": 29839800.824967705, + "lr": 0.000181288005125655, + "time_sec": 49.680773973464966 + }, + { + "epoch": 109, + "train_loss": 1.4067108069610597, + "train_acc": 0.60132, + "test_loss": 7.882626647949219, + "test_acc": 0.1069, + "lyapunov": null, + "grad_norm": 0.6582920448837728, + "grad_max_sv": 0.22414382882416248, + "grad_min_sv": 1.2327173726234264e-08, + "grad_condition": 31881244.227357633, + "lr": 0.0001732896980049473, + "time_sec": 49.65671181678772 + }, + { + "epoch": 110, + "train_loss": 1.4055479312515258, + "train_acc": 0.59848, + "test_loss": 7.415324240112304, + "test_acc": 0.1141, + "lyapunov": null, + "grad_norm": 0.661679386884237, + "grad_max_sv": 0.23660207092761992, + "grad_min_sv": 1.2329166683595904e-08, + "grad_condition": 108272302.88749842, + "lr": 0.00016543469682057076, + "time_sec": 49.66524934768677 + }, + { + "epoch": 111, + "train_loss": 1.384641782722473, + "train_acc": 0.60062, + "test_loss": 7.77435883102417, + "test_acc": 0.1081, + "lyapunov": null, + "grad_norm": 0.6613834178297813, + "grad_max_sv": 0.23533825390040874, + "grad_min_sv": 1.2306671472086388e-08, + "grad_condition": 187030204.42945534, + "lr": 0.00015772644703565552, + "time_sec": 49.685218334198 + }, + { + "epoch": 112, + "train_loss": 1.381474980392456, + "train_acc": 0.60532, + "test_loss": 7.833615634155273, + "test_acc": 0.104, + "lyapunov": null, + "grad_norm": 0.6615988288597077, + "grad_max_sv": 0.2345717329531908, + "grad_min_sv": 1.2362300387189217e-08, + "grad_condition": 73162687.85149845, + "lr": 0.00015016832974331713, + "time_sec": 49.6341872215271 + }, + { + "epoch": 113, + "train_loss": 1.3749549925613402, + "train_acc": 0.6076, + "test_loss": 8.104566619873047, + "test_acc": 0.1025, + "lyapunov": null, + "grad_norm": 0.6604353164865508, + "grad_max_sv": 0.2384736143052578, + "grad_min_sv": 1.2292912274919354e-08, + "grad_condition": 52201296.24398358, + "lr": 0.00014276366018359834, + "time_sec": 49.64921832084656 + }, + { + "epoch": 114, + "train_loss": 1.3708936805725098, + "train_acc": 0.6097, + "test_loss": 7.838578803253174, + "test_acc": 0.1036, + "lyapunov": null, + "grad_norm": 0.6597496756028915, + "grad_max_sv": 0.23329505324363708, + "grad_min_sv": 1.2220082992731029e-08, + "grad_condition": 32976955.71673715, + "lr": 0.00013551568628929425, + "time_sec": 49.66742539405823 + }, + { + "epoch": 115, + "train_loss": 1.3580178193664552, + "train_acc": 0.6117, + "test_loss": 7.769389814758301, + "test_acc": 0.106, + "lyapunov": null, + "grad_norm": 0.6591668477181649, + "grad_max_sv": 0.231846559420228, + "grad_min_sv": 1.2077120317699475e-08, + "grad_condition": 27076158.4162421, + "lr": 0.00012842758726130276, + "time_sec": 49.66256380081177 + }, + { + "epoch": 116, + "train_loss": 1.3422759653091432, + "train_acc": 0.6159, + "test_loss": 7.609967884063721, + "test_acc": 0.1141, + "lyapunov": null, + "grad_norm": 0.6579812947199307, + "grad_max_sv": 0.23519065380096435, + "grad_min_sv": 1.2230205650217568e-08, + "grad_condition": 189591095.93009597, + "lr": 0.0001215024721741218, + "time_sec": 49.634645223617554 + }, + { + "epoch": 117, + "train_loss": 1.345062205543518, + "train_acc": 0.61326, + "test_loss": 7.671285011291504, + "test_acc": 0.105, + "lyapunov": null, + "grad_norm": 0.6573840865317447, + "grad_max_sv": 0.23232375495135785, + "grad_min_sv": 1.2127244358728361e-08, + "grad_condition": 27041308.62698097, + "lr": 0.00011474337861210538, + "time_sec": 49.721657037734985 + }, + { + "epoch": 118, + "train_loss": 1.3362547462463379, + "train_acc": 0.61754, + "test_loss": 7.603790494537353, + "test_acc": 0.118, + "lyapunov": null, + "grad_norm": 0.6535680641186965, + "grad_max_sv": 0.23125030547380448, + "grad_min_sv": 1.2125971138310377e-08, + "grad_condition": 30576924.72097805, + "lr": 0.00010815327133708009, + "time_sec": 49.65640139579773 + }, + { + "epoch": 119, + "train_loss": 1.324526766090393, + "train_acc": 0.6202, + "test_loss": 7.146679705810547, + "test_acc": 0.1277, + "lyapunov": null, + "grad_norm": 0.6537238175763526, + "grad_max_sv": 0.23054058961570262, + "grad_min_sv": 1.1861389216487329e-08, + "grad_condition": 94056785.7170029, + "lr": 0.00010173504098790182, + "time_sec": 49.64234375953674 + }, + { + "epoch": 120, + "train_loss": 1.3227774859619141, + "train_acc": 0.61932, + "test_loss": 7.841625230407715, + "test_acc": 0.1097, + "lyapunov": null, + "grad_norm": 0.6585881553925022, + "grad_max_sv": 0.23253618888556957, + "grad_min_sv": 1.2248489228428027e-08, + "grad_condition": 25671104.344326176, + "lr": 9.549150281252629e-05, + "time_sec": 49.64756202697754 + }, + { + "epoch": 121, + "train_loss": 1.3257021924591064, + "train_acc": 0.6197, + "test_loss": 7.281103452301025, + "test_acc": 0.118, + "lyapunov": null, + "grad_norm": 0.6606694721410599, + "grad_max_sv": 0.23401161096990108, + "grad_min_sv": 1.23878893578018e-08, + "grad_condition": 375331062.1698051, + "lr": 8.942539543314794e-05, + "time_sec": 49.69174933433533 + }, + { + "epoch": 122, + "train_loss": 1.3191473028182983, + "train_acc": 0.62362, + "test_loss": 7.608569123077393, + "test_acc": 0.1148, + "lyapunov": null, + "grad_norm": 0.6562147201330847, + "grad_max_sv": 0.2345144312828779, + "grad_min_sv": 1.2236037863488924e-08, + "grad_condition": 24169304.63512346, + "lr": 8.353937964495024e-05, + "time_sec": 49.66494059562683 + }, + { + "epoch": 123, + "train_loss": 1.3161669417953492, + "train_acc": 0.6228, + "test_loss": 7.431023121643066, + "test_acc": 0.1205, + "lyapunov": null, + "grad_norm": 0.655746689623802, + "grad_max_sv": 0.23210358433425426, + "grad_min_sv": 1.2093831353032769e-08, + "grad_condition": 27166665.91640096, + "lr": 7.783603724899243e-05, + "time_sec": 49.67143940925598 + }, + { + "epoch": 124, + "train_loss": 1.3053954098510743, + "train_acc": 0.62686, + "test_loss": 7.388921417236328, + "test_acc": 0.1239, + "lyapunov": null, + "grad_norm": 0.6544340773431996, + "grad_max_sv": 0.23393282927572728, + "grad_min_sv": 1.2000262163830433e-08, + "grad_condition": 40293302.03059441, + "lr": 7.231786991974666e-05, + "time_sec": 49.67071533203125 + }, + { + "epoch": 125, + "train_loss": 1.2986741017913819, + "train_acc": 0.62652, + "test_loss": 7.625472329711914, + "test_acc": 0.1109, + "lyapunov": null, + "grad_norm": 0.654291047734432, + "grad_max_sv": 0.233845991268754, + "grad_min_sv": 1.2233166646336002e-08, + "grad_condition": 32432564.646282505, + "lr": 6.698729810778072e-05, + "time_sec": 49.684485912323 + }, + { + "epoch": 126, + "train_loss": 1.2981608987426758, + "train_acc": 0.62768, + "test_loss": 7.55356981124878, + "test_acc": 0.1134, + "lyapunov": null, + "grad_norm": 0.6532735495423818, + "grad_max_sv": 0.23108058460056782, + "grad_min_sv": 1.2223132362862432e-08, + "grad_condition": 55869279.53066347, + "lr": 6.184665997806817e-05, + "time_sec": 49.673479080200195 + }, + { + "epoch": 127, + "train_loss": 1.284857452430725, + "train_acc": 0.6299, + "test_loss": 7.630035566711426, + "test_acc": 0.1177, + "lyapunov": null, + "grad_norm": 0.6535000654947392, + "grad_max_sv": 0.2305291261523962, + "grad_min_sv": 1.2025161797574179e-08, + "grad_condition": 38563624.65048842, + "lr": 5.6898210384392595e-05, + "time_sec": 49.65974545478821 + }, + { + "epoch": 128, + "train_loss": 1.2872473387527466, + "train_acc": 0.63074, + "test_loss": 7.816648463439941, + "test_acc": 0.1074, + "lyapunov": null, + "grad_norm": 0.6556232897791993, + "grad_max_sv": 0.23139363788068296, + "grad_min_sv": 1.2139861799154162e-08, + "grad_condition": 21620449.375102155, + "lr": 5.214411988029363e-05, + "time_sec": 49.67285084724426 + }, + { + "epoch": 129, + "train_loss": 1.2839203270721435, + "train_acc": 0.63198, + "test_loss": 7.686043922424316, + "test_acc": 0.1107, + "lyapunov": null, + "grad_norm": 0.6538397116362318, + "grad_max_sv": 0.23078379295766355, + "grad_min_sv": 1.2263055679251344e-08, + "grad_condition": 30132651.96333309, + "lr": 4.7586473766990294e-05, + "time_sec": 49.65816259384155 + }, + { + "epoch": 130, + "train_loss": 1.2879181386947631, + "train_acc": 0.6295, + "test_loss": 7.284703018951416, + "test_acc": 0.1212, + "lyapunov": null, + "grad_norm": 0.6543551128708801, + "grad_max_sv": 0.23338331654667854, + "grad_min_sv": 1.225495914608521e-08, + "grad_condition": 40111704.746262416, + "lr": 4.32272711786996e-05, + "time_sec": 49.689605712890625 + }, + { + "epoch": 131, + "train_loss": 1.2772941580581665, + "train_acc": 0.63226, + "test_loss": 7.628822850036621, + "test_acc": 0.1251, + "lyapunov": null, + "grad_norm": 0.6541078094500179, + "grad_max_sv": 0.23095286451280117, + "grad_min_sv": 1.2264368622755262e-08, + "grad_condition": 38044131.14626959, + "lr": 3.906842420574966e-05, + "time_sec": 49.65666127204895 + }, + { + "epoch": 132, + "train_loss": 1.2753728385543823, + "train_acc": 0.63298, + "test_loss": 7.4228827728271485, + "test_acc": 0.1168, + "lyapunov": null, + "grad_norm": 0.6518818291602195, + "grad_max_sv": 0.23020194619894027, + "grad_min_sv": 1.1869802908626159e-08, + "grad_condition": 130095361.367623, + "lr": 3.5111757055874305e-05, + "time_sec": 49.62563371658325 + }, + { + "epoch": 133, + "train_loss": 1.2734521606826783, + "train_acc": 0.63348, + "test_loss": 7.479303890991211, + "test_acc": 0.1168, + "lyapunov": null, + "grad_norm": 0.6504483122691227, + "grad_max_sv": 0.227764842659235, + "grad_min_sv": 1.2072418637681936e-08, + "grad_condition": 37256695.60868154, + "lr": 3.1359005254054254e-05, + "time_sec": 49.64572739601135 + }, + { + "epoch": 134, + "train_loss": 1.274392656326294, + "train_acc": 0.63436, + "test_loss": 7.501944967651367, + "test_acc": 0.1116, + "lyapunov": null, + "grad_norm": 0.6533051303811023, + "grad_max_sv": 0.2328547578305006, + "grad_min_sv": 1.2034401706412234e-08, + "grad_condition": 40122252.46818484, + "lr": 2.7811814881259484e-05, + "time_sec": 49.688488245010376 + }, + { + "epoch": 135, + "train_loss": 1.2655631539154053, + "train_acc": 0.63618, + "test_loss": 7.9619408744812015, + "test_acc": 0.1138, + "lyapunov": null, + "grad_norm": 0.6522208349357006, + "grad_max_sv": 0.22971462085843086, + "grad_min_sv": 1.197521229817644e-08, + "grad_condition": 29822770.962131202, + "lr": 2.4471741852423218e-05, + "time_sec": 49.65588617324829 + }, + { + "epoch": 136, + "train_loss": 1.268963059539795, + "train_acc": 0.6335, + "test_loss": 8.084682507324219, + "test_acc": 0.1141, + "lyapunov": null, + "grad_norm": 0.6529862474718996, + "grad_max_sv": 0.23661385849118233, + "grad_min_sv": 1.2099510114660372e-08, + "grad_condition": 34094776.57419702, + "lr": 2.1340251233966362e-05, + "time_sec": 49.656200885772705 + }, + { + "epoch": 137, + "train_loss": 1.2612542757034302, + "train_acc": 0.6373, + "test_loss": 7.560983388519287, + "test_acc": 0.1146, + "lyapunov": null, + "grad_norm": 0.6508053534033943, + "grad_max_sv": 0.22569148056209087, + "grad_min_sv": 1.1914575683696915e-08, + "grad_condition": 280667265.68574333, + "lr": 1.8418716601170932e-05, + "time_sec": 49.65742373466492 + }, + { + "epoch": 138, + "train_loss": 1.2553864584732055, + "train_acc": 0.63724, + "test_loss": 7.584266532897949, + "test_acc": 0.1163, + "lyapunov": null, + "grad_norm": 0.64933795247114, + "grad_max_sv": 0.23180973641574382, + "grad_min_sv": 1.2025156179151786e-08, + "grad_condition": 23289105.71118166, + "lr": 1.570841943568445e-05, + "time_sec": 49.662779092788696 + }, + { + "epoch": 139, + "train_loss": 1.2552764698028565, + "train_acc": 0.63738, + "test_loss": 7.664991424560547, + "test_acc": 0.1161, + "lyapunov": null, + "grad_norm": 0.647861365438169, + "grad_max_sv": 0.22521368972957134, + "grad_min_sv": 1.1958369547371284e-08, + "grad_condition": 24157211.07512205, + "lr": 1.3210548563419845e-05, + "time_sec": 49.63586139678955 + }, + { + "epoch": 140, + "train_loss": 1.2617371710586547, + "train_acc": 0.637, + "test_loss": 7.432257106018066, + "test_acc": 0.1164, + "lyapunov": null, + "grad_norm": 0.6509496619387883, + "grad_max_sv": 0.23083123862743377, + "grad_min_sv": 1.2025924561731571e-08, + "grad_condition": 23207394.355445042, + "lr": 1.0926199633097203e-05, + "time_sec": 49.651548862457275 + }, + { + "epoch": 141, + "train_loss": 1.25511916847229, + "train_acc": 0.63894, + "test_loss": 7.457573948669434, + "test_acc": 0.116, + "lyapunov": null, + "grad_norm": 0.6479708388764596, + "grad_max_sv": 0.23126726895570754, + "grad_min_sv": 1.2012513458253826e-08, + "grad_condition": 40012529.005553745, + "lr": 8.856374635655688e-06, + "time_sec": 49.65609169006348 + }, + { + "epoch": 142, + "train_loss": 1.2660139290618897, + "train_acc": 0.63534, + "test_loss": 7.780697847747803, + "test_acc": 0.1123, + "lyapunov": null, + "grad_norm": 0.6502312911760466, + "grad_max_sv": 0.2311037950217724, + "grad_min_sv": 1.2062704925208667e-08, + "grad_condition": 28805083.114098005, + "lr": 7.001981464747503e-06, + "time_sec": 49.662680864334106 + }, + { + "epoch": 143, + "train_loss": 1.253378801651001, + "train_acc": 0.63776, + "test_loss": 7.479852529907227, + "test_acc": 0.1136, + "lyapunov": null, + "grad_norm": 0.6474110087943552, + "grad_max_sv": 0.22780719213187695, + "grad_min_sv": 1.1970692369040608e-08, + "grad_condition": 894266882.7813612, + "lr": 5.3638335185058295e-06, + "time_sec": 49.69564867019653 + }, + { + "epoch": 144, + "train_loss": 1.2509675663757325, + "train_acc": 0.63908, + "test_loss": 7.574235760498047, + "test_acc": 0.1164, + "lyapunov": null, + "grad_norm": 0.648587834005495, + "grad_max_sv": 0.2315014570951462, + "grad_min_sv": 1.190292156366679e-08, + "grad_condition": 45610481.34808161, + "lr": 3.942649342761114e-06, + "time_sec": 49.65193223953247 + }, + { + "epoch": 145, + "train_loss": 1.2546575288009643, + "train_acc": 0.63926, + "test_loss": 7.842446206665039, + "test_acc": 0.1159, + "lyapunov": null, + "grad_norm": 0.6487401792218206, + "grad_max_sv": 0.23385348841547965, + "grad_min_sv": 1.184119967564956e-08, + "grad_condition": 37894572.43827629, + "lr": 2.7390523158633524e-06, + "time_sec": 49.66033387184143 + }, + { + "epoch": 146, + "train_loss": 1.256413402404785, + "train_acc": 0.6386, + "test_loss": 7.555493270874023, + "test_acc": 0.117, + "lyapunov": null, + "grad_norm": 0.6501641349918278, + "grad_max_sv": 0.23139567412436007, + "grad_min_sv": 1.2211040111703708e-08, + "grad_condition": 35059735.49931946, + "lr": 1.7535703752478133e-06, + "time_sec": 49.66970777511597 + }, + { + "epoch": 147, + "train_loss": 1.2524045500564576, + "train_acc": 0.64112, + "test_loss": 7.473281847381592, + "test_acc": 0.1172, + "lyapunov": null, + "grad_norm": 0.6478005484529865, + "grad_max_sv": 0.23428054936230183, + "grad_min_sv": 1.2012692547636039e-08, + "grad_condition": 64301722.17238464, + "lr": 9.866357858642196e-07, + "time_sec": 49.649775981903076 + }, + { + "epoch": 148, + "train_loss": 1.250693888015747, + "train_acc": 0.64042, + "test_loss": 8.20074097442627, + "test_acc": 0.1071, + "lyapunov": null, + "grad_norm": 0.6494618630292652, + "grad_max_sv": 0.23039772994816304, + "grad_min_sv": 1.1898679564727177e-08, + "grad_condition": 127077986.43711999, + "lr": 4.38584950570808e-07, + "time_sec": 49.63900947570801 + }, + { + "epoch": 149, + "train_loss": 1.253049038734436, + "train_acc": 0.63926, + "test_loss": 7.87840643157959, + "test_acc": 0.1119, + "lyapunov": null, + "grad_norm": 0.6507655723273512, + "grad_max_sv": 0.2329292245209217, + "grad_min_sv": 1.2133096874422655e-08, + "grad_condition": 34964952.175665215, + "lr": 1.096582625772501e-07, + "time_sec": 49.65436911582947 + }, + { + "epoch": 150, + "train_loss": 1.25349819355011, + "train_acc": 0.63778, + "test_loss": 7.748453028106689, + "test_acc": 0.1159, + "lyapunov": null, + "grad_norm": 0.6513717977450576, + "grad_max_sv": 0.2340761035680771, + "grad_min_sv": 1.2247920957737107e-08, + "grad_condition": 580487852.1798013, + "lr": 0.0, + "time_sec": 49.66983723640442 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 5.089254416656495, + "train_acc": 0.01344, + "test_loss": 4.870831555175781, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 5.582063459208639, + "grad_max_sv": 5.0306542873382565, + "grad_min_sv": 8.441757832766683e-08, + "grad_condition": 74707534.78681344, + "lr": 0.0009998903417374227, + "time_sec": 66.72781872749329 + }, + { + "epoch": 2, + "train_loss": 4.736304296569824, + "train_acc": 0.02172, + "test_loss": 4.92340059890747, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 4.087296772772229, + "grad_max_sv": 3.672157108783722, + "grad_min_sv": 6.109624839933935e-08, + "grad_condition": 230714811.36310124, + "lr": 0.0009995614150494292, + "time_sec": 66.72452092170715 + }, + { + "epoch": 3, + "train_loss": 4.52685978515625, + "train_acc": 0.03204, + "test_loss": 5.045831031799317, + "test_acc": 0.0094, + "lyapunov": null, + "grad_norm": 3.1470044543912175, + "grad_max_sv": 2.6447540044784548, + "grad_min_sv": 4.639755384339139e-08, + "grad_condition": 65625701.84585605, + "lr": 0.0009990133642141358, + "time_sec": 66.75468754768372 + }, + { + "epoch": 4, + "train_loss": 4.371717319641113, + "train_acc": 0.04112, + "test_loss": 4.993129699707032, + "test_acc": 0.0115, + "lyapunov": null, + "grad_norm": 2.5123688948843395, + "grad_max_sv": 2.1027904629707335, + "grad_min_sv": 3.615837387664633e-08, + "grad_condition": 418817692.03399765, + "lr": 0.0009982464296247522, + "time_sec": 66.7680299282074 + }, + { + "epoch": 5, + "train_loss": 4.27407361251831, + "train_acc": 0.0488, + "test_loss": 5.161634465789795, + "test_acc": 0.0119, + "lyapunov": null, + "grad_norm": 1.9573801826064445, + "grad_max_sv": 1.613087645173073, + "grad_min_sv": 2.8529539808364034e-08, + "grad_condition": 62747668.20627429, + "lr": 0.0009972609476841367, + "time_sec": 66.75485754013062 + }, + { + "epoch": 6, + "train_loss": 4.183251854553222, + "train_acc": 0.05812, + "test_loss": 5.447854755401611, + "test_acc": 0.0093, + "lyapunov": null, + "grad_norm": 1.436449079599314, + "grad_max_sv": 1.0459295481443405, + "grad_min_sv": 2.0654144772258576e-08, + "grad_condition": 94732574.16372415, + "lr": 0.000996057350657239, + "time_sec": 66.76473689079285 + }, + { + "epoch": 7, + "train_loss": 4.103355536193848, + "train_acc": 0.06872, + "test_loss": 5.544150679016114, + "test_acc": 0.0124, + "lyapunov": null, + "grad_norm": 1.082624040556548, + "grad_max_sv": 0.678101472556591, + "grad_min_sv": 1.6660088839048904e-08, + "grad_condition": 49338508.46283151, + "lr": 0.000994636166481494, + "time_sec": 66.74250817298889 + }, + { + "epoch": 8, + "train_loss": 4.040529095458984, + "train_acc": 0.07876, + "test_loss": 5.577163777160645, + "test_acc": 0.0172, + "lyapunov": null, + "grad_norm": 0.963869121683512, + "grad_max_sv": 0.5578698106110096, + "grad_min_sv": 1.4817374840991882e-08, + "grad_condition": 46172185.25999212, + "lr": 0.0009929980185352525, + "time_sec": 66.75457096099854 + }, + { + "epoch": 9, + "train_loss": 3.999490645446777, + "train_acc": 0.0856, + "test_loss": 5.472281336975097, + "test_acc": 0.0116, + "lyapunov": null, + "grad_norm": 0.9198022107734598, + "grad_max_sv": 0.5003849364817142, + "grad_min_sv": 1.3862486752946878e-08, + "grad_condition": 137028895.09887612, + "lr": 0.0009911436253643444, + "time_sec": 66.73336434364319 + }, + { + "epoch": 10, + "train_loss": 3.9641557629394533, + "train_acc": 0.09124, + "test_loss": 5.43024553604126, + "test_acc": 0.0112, + "lyapunov": null, + "grad_norm": 0.8539816540258655, + "grad_max_sv": 0.4397390566766262, + "grad_min_sv": 1.3177782898221579e-08, + "grad_condition": 50953468.3517745, + "lr": 0.0009890738003669028, + "time_sec": 66.74955892562866 + }, + { + "epoch": 11, + "train_loss": 3.912582547149658, + "train_acc": 0.09724, + "test_loss": 5.977069612121582, + "test_acc": 0.0115, + "lyapunov": null, + "grad_norm": 0.8304366482521061, + "grad_max_sv": 0.4253105387091637, + "grad_min_sv": 1.2851445623657253e-08, + "grad_condition": 192581837.7575304, + "lr": 0.00098678945143658, + "time_sec": 66.74551677703857 + }, + { + "epoch": 12, + "train_loss": 3.885940095291138, + "train_acc": 0.10388, + "test_loss": 5.707202329254151, + "test_acc": 0.0161, + "lyapunov": null, + "grad_norm": 0.7930567752358824, + "grad_max_sv": 0.3784016497433186, + "grad_min_sv": 1.2496499026196095e-08, + "grad_condition": 121475679.84002523, + "lr": 0.0009842915805643154, + "time_sec": 66.76995825767517 + }, + { + "epoch": 13, + "train_loss": 3.848949595184326, + "train_acc": 0.10982, + "test_loss": 5.604932201385498, + "test_acc": 0.0138, + "lyapunov": null, + "grad_norm": 0.7694655756397059, + "grad_max_sv": 0.36012797653675077, + "grad_min_sv": 1.2309415998654205e-08, + "grad_condition": 96913763.80192877, + "lr": 0.000981581283398829, + "time_sec": 66.89632487297058 + }, + { + "epoch": 14, + "train_loss": 3.822469270477295, + "train_acc": 0.11176, + "test_loss": 5.5594536964416505, + "test_acc": 0.0144, + "lyapunov": null, + "grad_norm": 0.751737952115685, + "grad_max_sv": 0.34815125875175, + "grad_min_sv": 1.1860258068707719e-08, + "grad_condition": 63821387.65591574, + "lr": 0.0009786597487660333, + "time_sec": 66.8272774219513 + }, + { + "epoch": 15, + "train_loss": 3.8008637019348144, + "train_acc": 0.11732, + "test_loss": 5.8510744079589845, + "test_acc": 0.0165, + "lyapunov": null, + "grad_norm": 0.7274896957635634, + "grad_max_sv": 0.3341310672461987, + "grad_min_sv": 1.185839371142805e-08, + "grad_condition": 51068114.03076443, + "lr": 0.0009755282581475766, + "time_sec": 66.75787544250488 + }, + { + "epoch": 16, + "train_loss": 3.7793116706085206, + "train_acc": 0.12078, + "test_loss": 6.094802139282226, + "test_acc": 0.0135, + "lyapunov": null, + "grad_norm": 0.7029997372387793, + "grad_max_sv": 0.31635181941092017, + "grad_min_sv": 1.1313535006052256e-08, + "grad_condition": 34061221.316739336, + "lr": 0.0009721881851187403, + "time_sec": 66.73489236831665 + }, + { + "epoch": 17, + "train_loss": 3.756349168548584, + "train_acc": 0.12318, + "test_loss": 6.524116158294678, + "test_acc": 0.0149, + "lyapunov": null, + "grad_norm": 0.6891476510098721, + "grad_max_sv": 0.30746029056608676, + "grad_min_sv": 1.1205093228272567e-08, + "grad_condition": 55101632.74828547, + "lr": 0.0009686409947459456, + "time_sec": 66.7347002029419 + }, + { + "epoch": 18, + "train_loss": 3.736860103225708, + "train_acc": 0.12666, + "test_loss": 6.334092637634277, + "test_acc": 0.0151, + "lyapunov": null, + "grad_norm": 0.6735913591792417, + "grad_max_sv": 0.3038469754159451, + "grad_min_sv": 1.1184529693109707e-08, + "grad_condition": 266599149.22808576, + "lr": 0.0009648882429441254, + "time_sec": 66.79292225837708 + }, + { + "epoch": 19, + "train_loss": 3.721009854812622, + "train_acc": 0.13104, + "test_loss": 6.503785885620117, + "test_acc": 0.0158, + "lyapunov": null, + "grad_norm": 0.6543898752326373, + "grad_max_sv": 0.2952485930174589, + "grad_min_sv": 1.0702305973386839e-08, + "grad_condition": 36178987.94815246, + "lr": 0.00096093157579425, + "time_sec": 66.92458534240723 + }, + { + "epoch": 20, + "train_loss": 3.6978233711242674, + "train_acc": 0.13484, + "test_loss": 7.133095213317871, + "test_acc": 0.014, + "lyapunov": null, + "grad_norm": 0.6416047326169007, + "grad_max_sv": 0.2835653819143772, + "grad_min_sv": 1.061290202941656e-08, + "grad_condition": 29580333.508830875, + "lr": 0.0009567727288213001, + "time_sec": 66.78373384475708 + }, + { + "epoch": 21, + "train_loss": 3.678186371612549, + "train_acc": 0.13804, + "test_loss": 6.526899772644043, + "test_acc": 0.0165, + "lyapunov": null, + "grad_norm": 0.6346445495636812, + "grad_max_sv": 0.2758004698902369, + "grad_min_sv": 1.0650165743059103e-08, + "grad_condition": 50339413.533409506, + "lr": 0.0009524135262330095, + "time_sec": 66.93581771850586 + }, + { + "epoch": 22, + "train_loss": 3.6615531184387207, + "train_acc": 0.13652, + "test_loss": 7.463528224182129, + "test_acc": 0.0149, + "lyapunov": null, + "grad_norm": 0.6211761686754148, + "grad_max_sv": 0.2590024430304766, + "grad_min_sv": 1.0093259970866963e-08, + "grad_condition": 54350139.527433194, + "lr": 0.0009478558801197061, + "time_sec": 66.7949447631836 + }, + { + "epoch": 23, + "train_loss": 3.646244419708252, + "train_acc": 0.14018, + "test_loss": 7.247557836151123, + "test_acc": 0.0133, + "lyapunov": null, + "grad_norm": 0.6087560504487702, + "grad_max_sv": 0.26471212282776835, + "grad_min_sv": 1.0175153231789525e-08, + "grad_condition": 76037868.51400027, + "lr": 0.000943101789615607, + "time_sec": 66.79549622535706 + }, + { + "epoch": 24, + "train_loss": 3.6286012983703615, + "train_acc": 0.14502, + "test_loss": 7.168135193634034, + "test_acc": 0.0191, + "lyapunov": null, + "grad_norm": 0.5998778506859267, + "grad_max_sv": 0.24980814158916473, + "grad_min_sv": 1.0037150326158706e-08, + "grad_condition": 32920800.60529256, + "lr": 0.0009381533400219313, + "time_sec": 66.869384765625 + }, + { + "epoch": 25, + "train_loss": 3.6192829264831543, + "train_acc": 0.14634, + "test_loss": 7.535636337280273, + "test_acc": 0.0161, + "lyapunov": null, + "grad_norm": 0.5983012708829252, + "grad_max_sv": 0.2530865453183651, + "grad_min_sv": 9.982956203358206e-09, + "grad_condition": 29219670.862144046, + "lr": 0.0009330127018922189, + "time_sec": 66.76451802253723 + }, + { + "epoch": 26, + "train_loss": 3.6001767744445803, + "train_acc": 0.1487, + "test_loss": 6.850593623352051, + "test_acc": 0.0151, + "lyapunov": null, + "grad_norm": 0.5947140415117098, + "grad_max_sv": 0.24490244090557098, + "grad_min_sv": 9.946103620567249e-09, + "grad_condition": 94915701.68580723, + "lr": 0.000927682130080253, + "time_sec": 66.80610680580139 + }, + { + "epoch": 27, + "train_loss": 3.5885346211242677, + "train_acc": 0.15218, + "test_loss": 7.121657147216797, + "test_acc": 0.0175, + "lyapunov": null, + "grad_norm": 0.5825348653665754, + "grad_max_sv": 0.2360658310353756, + "grad_min_sv": 9.758478072829923e-09, + "grad_condition": 28325624.288454544, + "lr": 0.0009221639627510072, + "time_sec": 66.7368016242981 + }, + { + "epoch": 28, + "train_loss": 3.5699786253356933, + "train_acc": 0.15318, + "test_loss": 7.339261558532715, + "test_acc": 0.0157, + "lyapunov": null, + "grad_norm": 0.5731165313342855, + "grad_max_sv": 0.23213129304349422, + "grad_min_sv": 9.869128861361709e-09, + "grad_condition": 27851276.279406942, + "lr": 0.0009164606203550494, + "time_sec": 66.76568675041199 + }, + { + "epoch": 29, + "train_loss": 3.562197733078003, + "train_acc": 0.15604, + "test_loss": 7.580322309875489, + "test_acc": 0.0165, + "lyapunov": null, + "grad_norm": 0.5656101207986921, + "grad_max_sv": 0.21968504451215268, + "grad_min_sv": 9.579083420918621e-09, + "grad_condition": 25012099.962059125, + "lr": 0.0009105746045668516, + "time_sec": 66.8453516960144 + }, + { + "epoch": 30, + "train_loss": 3.560017660369873, + "train_acc": 0.15662, + "test_loss": 7.44054066619873, + "test_acc": 0.0173, + "lyapunov": null, + "grad_norm": 0.5599580597173339, + "grad_max_sv": 0.2209590796381235, + "grad_min_sv": 9.39374856998021e-09, + "grad_condition": 61658396.11314602, + "lr": 0.0009045084971874733, + "time_sec": 66.75297498703003 + }, + { + "epoch": 31, + "train_loss": 3.5422336725616455, + "train_acc": 0.1599, + "test_loss": 7.076059481048584, + "test_acc": 0.0198, + "lyapunov": null, + "grad_norm": 0.5515859229373342, + "grad_max_sv": 0.21789075396955013, + "grad_min_sv": 9.395337015327687e-09, + "grad_condition": 33141907.468724538, + "lr": 0.0008982649590120977, + "time_sec": 66.84002542495728 + }, + { + "epoch": 32, + "train_loss": 3.5323507067108153, + "train_acc": 0.16226, + "test_loss": 7.484644064331055, + "test_acc": 0.0181, + "lyapunov": null, + "grad_norm": 0.5491148394893098, + "grad_max_sv": 0.20811132229864598, + "grad_min_sv": 9.385871152511883e-09, + "grad_condition": 32793140.01706022, + "lr": 0.0008918467286629196, + "time_sec": 66.76462388038635 + }, + { + "epoch": 33, + "train_loss": 3.5161914233398437, + "train_acc": 0.16196, + "test_loss": 7.1630567352294925, + "test_acc": 0.0192, + "lyapunov": null, + "grad_norm": 0.5439550193507326, + "grad_max_sv": 0.21854646913707257, + "grad_min_sv": 9.405872293880014e-09, + "grad_condition": 66461999.0202436, + "lr": 0.0008852566213878943, + "time_sec": 66.75850176811218 + }, + { + "epoch": 34, + "train_loss": 3.5097799615478515, + "train_acc": 0.16602, + "test_loss": 7.106797317504883, + "test_acc": 0.0188, + "lyapunov": null, + "grad_norm": 0.5400742997304219, + "grad_max_sv": 0.2044513113796711, + "grad_min_sv": 9.253371524575726e-09, + "grad_condition": 26988718.534539413, + "lr": 0.000878497527825878, + "time_sec": 66.7507495880127 + }, + { + "epoch": 35, + "train_loss": 3.496268680496216, + "train_acc": 0.16568, + "test_loss": 7.082461839294433, + "test_acc": 0.0204, + "lyapunov": null, + "grad_norm": 0.5336117204770247, + "grad_max_sv": 0.20079954750835896, + "grad_min_sv": 9.20759104378055e-09, + "grad_condition": 28862147.41901524, + "lr": 0.000871572412738697, + "time_sec": 66.73531174659729 + }, + { + "epoch": 36, + "train_loss": 3.4916924793243407, + "train_acc": 0.16696, + "test_loss": 6.652525229644775, + "test_acc": 0.0254, + "lyapunov": null, + "grad_norm": 0.5305570334287781, + "grad_max_sv": 0.20064033418893815, + "grad_min_sv": 9.168744452558997e-09, + "grad_condition": 25026310.55810722, + "lr": 0.0008644843137107055, + "time_sec": 66.75055170059204 + }, + { + "epoch": 37, + "train_loss": 3.4758248693847658, + "train_acc": 0.16888, + "test_loss": 6.896866636657715, + "test_acc": 0.0173, + "lyapunov": null, + "grad_norm": 0.5330249264322945, + "grad_max_sv": 0.19781249463558198, + "grad_min_sv": 9.083170277035535e-09, + "grad_condition": 32783382.382080305, + "lr": 0.0008572363398164014, + "time_sec": 66.77334451675415 + }, + { + "epoch": 38, + "train_loss": 3.4695195873260496, + "train_acc": 0.17072, + "test_loss": 6.4400072814941405, + "test_acc": 0.0218, + "lyapunov": null, + "grad_norm": 0.5334319968311563, + "grad_max_sv": 0.20071442537009715, + "grad_min_sv": 9.163169936710069e-09, + "grad_condition": 25885863.511335682, + "lr": 0.0008498316702566826, + "time_sec": 66.7480320930481 + }, + { + "epoch": 39, + "train_loss": 3.45369920539856, + "train_acc": 0.17284, + "test_loss": 6.579633006286621, + "test_acc": 0.0202, + "lyapunov": null, + "grad_norm": 0.5329158861774494, + "grad_max_sv": 0.2015998687595129, + "grad_min_sv": 9.256902752663443e-09, + "grad_condition": 26314550.539648045, + "lr": 0.0008422735529643442, + "time_sec": 66.74337792396545 + }, + { + "epoch": 40, + "train_loss": 3.4462957423400877, + "train_acc": 0.17424, + "test_loss": 7.142499053955079, + "test_acc": 0.0205, + "lyapunov": null, + "grad_norm": 0.5296803296301241, + "grad_max_sv": 0.2004535213112831, + "grad_min_sv": 9.085983729284486e-09, + "grad_condition": 25132983.42064634, + "lr": 0.0008345653031794289, + "time_sec": 66.76149940490723 + }, + { + "epoch": 41, + "train_loss": 3.4409220630645754, + "train_acc": 0.17582, + "test_loss": 6.420920026397705, + "test_acc": 0.024, + "lyapunov": null, + "grad_norm": 0.5226482078086451, + "grad_max_sv": 0.1943317238241434, + "grad_min_sv": 9.049205283717666e-09, + "grad_condition": 27231402.34700817, + "lr": 0.0008267103019950526, + "time_sec": 66.75436353683472 + }, + { + "epoch": 42, + "train_loss": 3.4290409894561766, + "train_acc": 0.17698, + "test_loss": 7.220374629211426, + "test_acc": 0.0174, + "lyapunov": null, + "grad_norm": 0.5173855625677775, + "grad_max_sv": 0.19160303175449372, + "grad_min_sv": 8.971642997566628e-09, + "grad_condition": 222494191.59464812, + "lr": 0.0008187119948743447, + "time_sec": 66.7648994922638 + }, + { + "epoch": 43, + "train_loss": 3.416502248687744, + "train_acc": 0.18008, + "test_loss": 7.530539099884034, + "test_acc": 0.0202, + "lyapunov": null, + "grad_norm": 0.5140331017302348, + "grad_max_sv": 0.19175201803445815, + "grad_min_sv": 8.97330940247132e-09, + "grad_condition": 29821043.95148312, + "lr": 0.000810573890139155, + "time_sec": 66.78211045265198 + }, + { + "epoch": 44, + "train_loss": 3.413407900466919, + "train_acc": 0.1816, + "test_loss": 7.1156943313598635, + "test_acc": 0.0201, + "lyapunov": null, + "grad_norm": 0.5124027236392854, + "grad_max_sv": 0.18782692924141883, + "grad_min_sv": 8.988729655046157e-09, + "grad_condition": 25204778.510354124, + "lr": 0.0008022995574311873, + "time_sec": 66.81727170944214 + }, + { + "epoch": 45, + "train_loss": 3.3979202405548095, + "train_acc": 0.18222, + "test_loss": 6.318179810333252, + "test_acc": 0.0237, + "lyapunov": null, + "grad_norm": 0.5136539539386744, + "grad_max_sv": 0.18584301508963108, + "grad_min_sv": 8.876791780104699e-09, + "grad_condition": 37149562.99360152, + "lr": 0.0007938926261462363, + "time_sec": 66.74810814857483 + }, + { + "epoch": 46, + "train_loss": 3.391953636016846, + "train_acc": 0.18298, + "test_loss": 7.084993099975586, + "test_acc": 0.0223, + "lyapunov": null, + "grad_norm": 0.5118541612022541, + "grad_max_sv": 0.1917757984250784, + "grad_min_sv": 9.094181770141763e-09, + "grad_condition": 26842380.582427092, + "lr": 0.0007853567838422158, + "time_sec": 66.83485198020935 + }, + { + "epoch": 47, + "train_loss": 3.389229907913208, + "train_acc": 0.18506, + "test_loss": 6.78128480834961, + "test_acc": 0.0241, + "lyapunov": null, + "grad_norm": 0.5056241017082704, + "grad_max_sv": 0.17950649335980415, + "grad_min_sv": 9.024113689637402e-09, + "grad_condition": 22964418.65515138, + "lr": 0.0007766957746216719, + "time_sec": 66.7919397354126 + }, + { + "epoch": 48, + "train_loss": 3.372904341278076, + "train_acc": 0.18704, + "test_loss": 6.391386576843262, + "test_acc": 0.0213, + "lyapunov": null, + "grad_norm": 0.5018522792286711, + "grad_max_sv": 0.18420623578131198, + "grad_min_sv": 8.819236223256421e-09, + "grad_condition": 26329876.204275317, + "lr": 0.0007679133974894982, + "time_sec": 66.75698065757751 + }, + { + "epoch": 49, + "train_loss": 3.366441840133667, + "train_acc": 0.18952, + "test_loss": 7.556707070922852, + "test_acc": 0.0203, + "lyapunov": null, + "grad_norm": 0.504873475902597, + "grad_max_sv": 0.18459936529397963, + "grad_min_sv": 8.905453205074187e-09, + "grad_condition": 61624690.824258946, + "lr": 0.000759013504686565, + "time_sec": 66.79050326347351 + }, + { + "epoch": 50, + "train_loss": 3.3588487029266356, + "train_acc": 0.1897, + "test_loss": 7.536667886352539, + "test_acc": 0.0215, + "lyapunov": null, + "grad_norm": 0.4999300274080182, + "grad_max_sv": 0.1777935169637203, + "grad_min_sv": 8.829480036692815e-09, + "grad_condition": 40978971.99995713, + "lr": 0.0007499999999999998, + "time_sec": 66.8765435218811 + }, + { + "epoch": 51, + "train_loss": 3.351222337188721, + "train_acc": 0.18978, + "test_loss": 6.873462453460693, + "test_acc": 0.0236, + "lyapunov": null, + "grad_norm": 0.5007634827757871, + "grad_max_sv": 0.17949126586318015, + "grad_min_sv": 8.87983942765569e-09, + "grad_condition": 30553440.958018053, + "lr": 0.0007408768370508575, + "time_sec": 66.94956064224243 + }, + { + "epoch": 52, + "train_loss": 3.3438973377227783, + "train_acc": 0.19176, + "test_loss": 7.438332663726807, + "test_acc": 0.0224, + "lyapunov": null, + "grad_norm": 0.4966107450536984, + "grad_max_sv": 0.16910983845591546, + "grad_min_sv": 8.771072661228896e-09, + "grad_condition": 25705757.21881602, + "lr": 0.0007316480175599307, + "time_sec": 66.745934009552 + }, + { + "epoch": 53, + "train_loss": 3.3359473081970217, + "train_acc": 0.19448, + "test_loss": 6.782886152648926, + "test_acc": 0.0224, + "lyapunov": null, + "grad_norm": 0.49739939827662283, + "grad_max_sv": 0.17322255671024323, + "grad_min_sv": 8.82698187598674e-09, + "grad_condition": 24618710.928996503, + "lr": 0.0007223175895924635, + "time_sec": 66.78721380233765 + }, + { + "epoch": 54, + "train_loss": 3.326069559173584, + "train_acc": 0.19428, + "test_loss": 6.960753924560547, + "test_acc": 0.0255, + "lyapunov": null, + "grad_norm": 0.49604963126677376, + "grad_max_sv": 0.17417073659598828, + "grad_min_sv": 8.839123402659687e-09, + "grad_condition": 29263354.504204772, + "lr": 0.0007128896457825361, + "time_sec": 66.76385855674744 + }, + { + "epoch": 55, + "train_loss": 3.314086589889526, + "train_acc": 0.19676, + "test_loss": 7.05631950302124, + "test_acc": 0.0224, + "lyapunov": null, + "grad_norm": 0.49743016792725503, + "grad_max_sv": 0.17294535413384438, + "grad_min_sv": 8.920064298312269e-09, + "grad_condition": 23485167.953053717, + "lr": 0.0007033683215378998, + "time_sec": 66.7790584564209 + }, + { + "epoch": 56, + "train_loss": 3.315660849761963, + "train_acc": 0.19834, + "test_loss": 7.533245965576172, + "test_acc": 0.0218, + "lyapunov": null, + "grad_norm": 0.4931603787421123, + "grad_max_sv": 0.16750396378338336, + "grad_min_sv": 8.777685531202728e-09, + "grad_condition": 32655019.620684423, + "lr": 0.0006937577932260512, + "time_sec": 66.7556324005127 + }, + { + "epoch": 57, + "train_loss": 3.296080042266846, + "train_acc": 0.1983, + "test_loss": 7.345844306945801, + "test_acc": 0.0232, + "lyapunov": null, + "grad_norm": 0.4959620105957853, + "grad_max_sv": 0.1722776312381029, + "grad_min_sv": 8.79561782296534e-09, + "grad_condition": 24522492.400894172, + "lr": 0.0006840622763423388, + "time_sec": 66.75379252433777 + }, + { + "epoch": 58, + "train_loss": 3.2960589750671385, + "train_acc": 0.20076, + "test_loss": 7.738760015869141, + "test_acc": 0.0196, + "lyapunov": null, + "grad_norm": 0.4942958965299343, + "grad_max_sv": 0.17266131974756718, + "grad_min_sv": 8.839166923402252e-09, + "grad_condition": 22698276.146803144, + "lr": 0.0006742860236609073, + "time_sec": 66.74808430671692 + }, + { + "epoch": 59, + "train_loss": 3.294140084838867, + "train_acc": 0.2011, + "test_loss": 8.235951368713378, + "test_acc": 0.0196, + "lyapunov": null, + "grad_norm": 0.4929354288942166, + "grad_max_sv": 0.17219605818390846, + "grad_min_sv": 8.801463230456718e-09, + "grad_condition": 22079089.27572272, + "lr": 0.0006644333233692913, + "time_sec": 66.85729193687439 + }, + { + "epoch": 60, + "train_loss": 3.2903015409851073, + "train_acc": 0.20054, + "test_loss": 8.185438388061524, + "test_acc": 0.0227, + "lyapunov": null, + "grad_norm": 0.4946800837020447, + "grad_max_sv": 0.17233065664768218, + "grad_min_sv": 8.800618653270754e-09, + "grad_condition": 22666981.105484493, + "lr": 0.0006545084971874734, + "time_sec": 66.75132822990417 + }, + { + "epoch": 61, + "train_loss": 3.276741645050049, + "train_acc": 0.20444, + "test_loss": 7.014369299316407, + "test_acc": 0.0228, + "lyapunov": null, + "grad_norm": 0.4931363277005086, + "grad_max_sv": 0.1697451215237379, + "grad_min_sv": 8.873947368592816e-09, + "grad_condition": 26044808.200629316, + "lr": 0.0006445158984722354, + "time_sec": 66.73762321472168 + }, + { + "epoch": 62, + "train_loss": 3.2659665531921385, + "train_acc": 0.20444, + "test_loss": 7.380694603729248, + "test_acc": 0.0226, + "lyapunov": null, + "grad_norm": 0.49455688688820293, + "grad_max_sv": 0.16783221252262592, + "grad_min_sv": 8.77998669948643e-09, + "grad_condition": 37851467.31001024, + "lr": 0.0006344599103076324, + "time_sec": 66.75685262680054 + }, + { + "epoch": 63, + "train_loss": 3.2631328678894045, + "train_acc": 0.2052, + "test_loss": 7.237985221862793, + "test_acc": 0.0192, + "lyapunov": null, + "grad_norm": 0.4903630545564288, + "grad_max_sv": 0.16607676334679128, + "grad_min_sv": 8.788113892155281e-09, + "grad_condition": 22055295.31402096, + "lr": 0.0006243449435824269, + "time_sec": 66.78277540206909 + }, + { + "epoch": 64, + "train_loss": 3.257690904006958, + "train_acc": 0.20818, + "test_loss": 7.568940380859375, + "test_acc": 0.0213, + "lyapunov": null, + "grad_norm": 0.49342286662603607, + "grad_max_sv": 0.16695081815123558, + "grad_min_sv": 8.641428320133037e-09, + "grad_condition": 25506042.428760856, + "lr": 0.0006141754350553275, + "time_sec": 66.72653698921204 + }, + { + "epoch": 65, + "train_loss": 3.2442443402099608, + "train_acc": 0.21066, + "test_loss": 7.542497647094726, + "test_acc": 0.0234, + "lyapunov": null, + "grad_norm": 0.4954106045513822, + "grad_max_sv": 0.16896731182932853, + "grad_min_sv": 8.944364218721467e-09, + "grad_condition": 23810878.34586061, + "lr": 0.0006039558454088793, + "time_sec": 66.74552130699158 + }, + { + "epoch": 66, + "train_loss": 3.23546903755188, + "train_acc": 0.21082, + "test_loss": 8.086076991271973, + "test_acc": 0.0251, + "lyapunov": null, + "grad_norm": 0.4907488060159097, + "grad_max_sv": 0.16671691313385964, + "grad_min_sv": 8.83017001740427e-09, + "grad_condition": 21923974.968150117, + "lr": 0.000593690657292862, + "time_sec": 66.7405595779419 + }, + { + "epoch": 67, + "train_loss": 3.233769822845459, + "train_acc": 0.20992, + "test_loss": 8.55976441040039, + "test_acc": 0.0196, + "lyapunov": null, + "grad_norm": 0.4915441182599445, + "grad_max_sv": 0.1651388220489025, + "grad_min_sv": 8.849489993578707e-09, + "grad_condition": 25245256.560124103, + "lr": 0.0005833843733580507, + "time_sec": 66.77745580673218 + }, + { + "epoch": 68, + "train_loss": 3.224519323272705, + "train_acc": 0.21164, + "test_loss": 8.099955255126954, + "test_acc": 0.0214, + "lyapunov": null, + "grad_norm": 0.489617423603527, + "grad_max_sv": 0.16721767224371434, + "grad_min_sv": 8.79801871772612e-09, + "grad_condition": 24956132.811081767, + "lr": 0.0005730415142812054, + "time_sec": 66.79847407341003 + }, + { + "epoch": 69, + "train_loss": 3.216005241088867, + "train_acc": 0.2156, + "test_loss": 7.735234213256836, + "test_acc": 0.0227, + "lyapunov": null, + "grad_norm": 0.49097769549114934, + "grad_max_sv": 0.16438619494438172, + "grad_min_sv": 8.896314591770594e-09, + "grad_condition": 85889334.34257694, + "lr": 0.0005626666167821517, + "time_sec": 66.74724221229553 + }, + { + "epoch": 70, + "train_loss": 3.2113763916778564, + "train_acc": 0.21408, + "test_loss": 7.496349983215332, + "test_acc": 0.0259, + "lyapunov": null, + "grad_norm": 0.4930174859602223, + "grad_max_sv": 0.16231456249952317, + "grad_min_sv": 8.889525562882917e-09, + "grad_condition": 24169515.547079507, + "lr": 0.0005522642316338265, + "time_sec": 66.74811506271362 + }, + { + "epoch": 71, + "train_loss": 3.207403873062134, + "train_acc": 0.21444, + "test_loss": 8.061796890258789, + "test_acc": 0.0212, + "lyapunov": null, + "grad_norm": 0.48698435301726867, + "grad_max_sv": 0.16013988479971886, + "grad_min_sv": 8.797687520156749e-09, + "grad_condition": 21159472.558239408, + "lr": 0.0005418389216661573, + "time_sec": 66.73536777496338 + }, + { + "epoch": 72, + "train_loss": 3.1910123835754396, + "train_acc": 0.21772, + "test_loss": 7.805322082519531, + "test_acc": 0.0239, + "lyapunov": null, + "grad_norm": 0.4923736982588088, + "grad_max_sv": 0.16533413231372834, + "grad_min_sv": 8.9249454009524e-09, + "grad_condition": 96828590.79503393, + "lr": 0.0005313952597646563, + "time_sec": 66.72183275222778 + }, + { + "epoch": 73, + "train_loss": 3.1902407261657717, + "train_acc": 0.21958, + "test_loss": 8.222962713623048, + "test_acc": 0.0213, + "lyapunov": null, + "grad_norm": 0.4905281203653412, + "grad_max_sv": 0.16278306022286415, + "grad_min_sv": 8.840706555712785e-09, + "grad_condition": 23093911.6390755, + "lr": 0.0005209378268645994, + "time_sec": 66.76905274391174 + }, + { + "epoch": 74, + "train_loss": 3.186945252761841, + "train_acc": 0.22042, + "test_loss": 7.4509780258178715, + "test_acc": 0.0254, + "lyapunov": null, + "grad_norm": 0.49080682735084724, + "grad_max_sv": 0.16444684211164712, + "grad_min_sv": 8.886749067182898e-09, + "grad_condition": 21069601.509122115, + "lr": 0.0005104712099416781, + "time_sec": 66.73268365859985 + }, + { + "epoch": 75, + "train_loss": 3.1751693920898436, + "train_acc": 0.21962, + "test_loss": 7.327089692687989, + "test_acc": 0.0239, + "lyapunov": null, + "grad_norm": 0.4907412049602907, + "grad_max_sv": 0.16229031533002852, + "grad_min_sv": 8.930995210043591e-09, + "grad_condition": 20447215.168563277, + "lr": 0.0004999999999999996, + "time_sec": 66.7269811630249 + }, + { + "epoch": 76, + "train_loss": 3.1633840226745606, + "train_acc": 0.22144, + "test_loss": 7.650527050018311, + "test_acc": 0.0232, + "lyapunov": null, + "grad_norm": 0.491245861328977, + "grad_max_sv": 0.16391390115022658, + "grad_min_sv": 8.910306775744558e-09, + "grad_condition": 31218789.734865714, + "lr": 0.0004895287900583212, + "time_sec": 66.74638271331787 + }, + { + "epoch": 77, + "train_loss": 3.154373671417236, + "train_acc": 0.22488, + "test_loss": 7.602050260925293, + "test_acc": 0.0264, + "lyapunov": null, + "grad_norm": 0.4892558751617366, + "grad_max_sv": 0.16490486972033977, + "grad_min_sv": 8.892741539673343e-09, + "grad_condition": 39253729.389955655, + "lr": 0.0004790621731353997, + "time_sec": 66.74076318740845 + }, + { + "epoch": 78, + "train_loss": 3.1485520709991457, + "train_acc": 0.2247, + "test_loss": 8.166537579345704, + "test_acc": 0.0241, + "lyapunov": null, + "grad_norm": 0.48686800079497317, + "grad_max_sv": 0.16167105846107005, + "grad_min_sv": 8.878994577077304e-09, + "grad_condition": 37064220.10033677, + "lr": 0.000468604740235343, + "time_sec": 66.75325560569763 + }, + { + "epoch": 79, + "train_loss": 3.146766557769775, + "train_acc": 0.22844, + "test_loss": 7.90411237487793, + "test_acc": 0.0278, + "lyapunov": null, + "grad_norm": 0.49040174515071594, + "grad_max_sv": 0.16053182780742645, + "grad_min_sv": 8.884301404277206e-09, + "grad_condition": 24364113.225008838, + "lr": 0.00045816107833384175, + "time_sec": 66.74130415916443 + }, + { + "epoch": 80, + "train_loss": 3.145488730316162, + "train_acc": 0.22804, + "test_loss": 7.780512563323975, + "test_acc": 0.0252, + "lyapunov": null, + "grad_norm": 0.4943972569981926, + "grad_max_sv": 0.1629514317959547, + "grad_min_sv": 8.936118334190724e-09, + "grad_condition": 38891856.037547626, + "lr": 0.0004477357683661729, + "time_sec": 66.734290599823 + }, + { + "epoch": 81, + "train_loss": 3.1335752784729003, + "train_acc": 0.2256, + "test_loss": 7.793076400756836, + "test_acc": 0.0231, + "lyapunov": null, + "grad_norm": 0.4939390356782499, + "grad_max_sv": 0.15955338068306446, + "grad_min_sv": 8.997340913974305e-09, + "grad_condition": 21171055.698999647, + "lr": 0.00043733338321784746, + "time_sec": 66.73108649253845 + }, + { + "epoch": 82, + "train_loss": 3.1309402253723144, + "train_acc": 0.22804, + "test_loss": 7.9182415901184084, + "test_acc": 0.0286, + "lyapunov": null, + "grad_norm": 0.49237561983191397, + "grad_max_sv": 0.15897708609700203, + "grad_min_sv": 8.919429018983126e-09, + "grad_condition": 24130255.734166417, + "lr": 0.0004269584857187939, + "time_sec": 66.74584746360779 + }, + { + "epoch": 83, + "train_loss": 3.1320227099609377, + "train_acc": 0.23082, + "test_loss": 8.17084792022705, + "test_acc": 0.0274, + "lyapunov": null, + "grad_norm": 0.4923723854198216, + "grad_max_sv": 0.16074697338044644, + "grad_min_sv": 8.95209650297879e-09, + "grad_condition": 21250707.48315563, + "lr": 0.0004166156266419484, + "time_sec": 66.75584173202515 + }, + { + "epoch": 84, + "train_loss": 3.116801164550781, + "train_acc": 0.23106, + "test_loss": 8.594211498260497, + "test_acc": 0.0256, + "lyapunov": null, + "grad_norm": 0.4937123379502474, + "grad_max_sv": 0.16294312290847301, + "grad_min_sv": 8.918351879910746e-09, + "grad_condition": 32523875.43833986, + "lr": 0.0004063093427071373, + "time_sec": 66.74527430534363 + }, + { + "epoch": 85, + "train_loss": 3.1138555347442627, + "train_acc": 0.23154, + "test_loss": 7.848691880035401, + "test_acc": 0.0242, + "lyapunov": null, + "grad_norm": 0.49437474598710707, + "grad_max_sv": 0.1639211293309927, + "grad_min_sv": 8.966596980186648e-09, + "grad_condition": 29105331.398801915, + "lr": 0.0003960441545911199, + "time_sec": 66.72178506851196 + }, + { + "epoch": 86, + "train_loss": 3.0959864405822755, + "train_acc": 0.23314, + "test_loss": 7.94962300491333, + "test_acc": 0.0271, + "lyapunov": null, + "grad_norm": 0.4933773113271138, + "grad_max_sv": 0.1572486527264118, + "grad_min_sv": 8.887307614141582e-09, + "grad_condition": 60627728.54777368, + "lr": 0.0003858245649446718, + "time_sec": 66.73936724662781 + }, + { + "epoch": 87, + "train_loss": 3.1002150044250487, + "train_acc": 0.23374, + "test_loss": 8.25519141845703, + "test_acc": 0.0258, + "lyapunov": null, + "grad_norm": 0.4923201649178117, + "grad_max_sv": 0.16258857287466527, + "grad_min_sv": 9.065216627357487e-09, + "grad_condition": 23403653.876579102, + "lr": 0.00037565505641757235, + "time_sec": 66.7319266796112 + }, + { + "epoch": 88, + "train_loss": 3.0908289854431152, + "train_acc": 0.23508, + "test_loss": 8.057901398468017, + "test_acc": 0.0254, + "lyapunov": null, + "grad_norm": 0.49157293018855497, + "grad_max_sv": 0.16135855726897716, + "grad_min_sv": 8.947001231551788e-09, + "grad_condition": 44687527.86973098, + "lr": 0.00036554008969236695, + "time_sec": 66.73309588432312 + }, + { + "epoch": 89, + "train_loss": 3.0786484061431887, + "train_acc": 0.23678, + "test_loss": 7.728022393798828, + "test_acc": 0.0239, + "lyapunov": null, + "grad_norm": 0.496481999420392, + "grad_max_sv": 0.16325689144432545, + "grad_min_sv": 9.071061696924732e-09, + "grad_condition": 33780242.920800135, + "lr": 0.0003554841015277638, + "time_sec": 66.7649736404419 + }, + { + "epoch": 90, + "train_loss": 3.080343514328003, + "train_acc": 0.23796, + "test_loss": 7.649538640594482, + "test_acc": 0.0273, + "lyapunov": null, + "grad_norm": 0.4958853581872073, + "grad_max_sv": 0.15821573026478292, + "grad_min_sv": 9.068041348890554e-09, + "grad_condition": 99443661.9604651, + "lr": 0.000345491502812526, + "time_sec": 66.75938820838928 + }, + { + "epoch": 91, + "train_loss": 3.0665194551086428, + "train_acc": 0.23906, + "test_loss": 7.882036618041992, + "test_acc": 0.0256, + "lyapunov": null, + "grad_norm": 0.49404821675883814, + "grad_max_sv": 0.16070808731019498, + "grad_min_sv": 8.97562283178055e-09, + "grad_condition": 43916780.79243892, + "lr": 0.0003355666766307081, + "time_sec": 66.87539291381836 + }, + { + "epoch": 92, + "train_loss": 3.067614875793457, + "train_acc": 0.23864, + "test_loss": 7.817445317077636, + "test_acc": 0.0233, + "lyapunov": null, + "grad_norm": 0.49506578954377534, + "grad_max_sv": 0.1606835663318634, + "grad_min_sv": 9.140586166439535e-09, + "grad_condition": 32597225.524517875, + "lr": 0.00032571397633909225, + "time_sec": 66.78059506416321 + }, + { + "epoch": 93, + "train_loss": 3.0596435570526124, + "train_acc": 0.24158, + "test_loss": 8.042932987976075, + "test_acc": 0.0225, + "lyapunov": null, + "grad_norm": 0.4959998942206781, + "grad_max_sv": 0.1597288616001606, + "grad_min_sv": 9.08612836081346e-09, + "grad_condition": 31733250.071886934, + "lr": 0.00031593772365766094, + "time_sec": 66.82975125312805 + }, + { + "epoch": 94, + "train_loss": 3.0495442120361327, + "train_acc": 0.2429, + "test_loss": 7.59449294052124, + "test_acc": 0.0259, + "lyapunov": null, + "grad_norm": 0.4982536551750556, + "grad_max_sv": 0.16117390170693396, + "grad_min_sv": 9.039274752840887e-09, + "grad_condition": 82000533.38506715, + "lr": 0.0003062422067739483, + "time_sec": 66.78579998016357 + }, + { + "epoch": 95, + "train_loss": 3.0474711390686036, + "train_acc": 0.24268, + "test_loss": 8.05243324584961, + "test_acc": 0.0241, + "lyapunov": null, + "grad_norm": 0.4987374169285617, + "grad_max_sv": 0.1600899651646614, + "grad_min_sv": 9.17260397914621e-09, + "grad_condition": 20457204.833973993, + "lr": 0.00029663167846209965, + "time_sec": 66.88967680931091 + }, + { + "epoch": 96, + "train_loss": 3.043592535858154, + "train_acc": 0.24712, + "test_loss": 8.085104446411133, + "test_acc": 0.0236, + "lyapunov": null, + "grad_norm": 0.495196191233677, + "grad_max_sv": 0.1615884281694889, + "grad_min_sv": 9.055856260709039e-09, + "grad_condition": 22431222.93985162, + "lr": 0.00028711035421746345, + "time_sec": 66.75688600540161 + }, + { + "epoch": 97, + "train_loss": 3.037664843826294, + "train_acc": 0.24506, + "test_loss": 7.9920450149536135, + "test_acc": 0.0247, + "lyapunov": null, + "grad_norm": 0.49669572478665774, + "grad_max_sv": 0.16185057312250137, + "grad_min_sv": 9.08467869542573e-09, + "grad_condition": 21200545.010530062, + "lr": 0.00027768241040753615, + "time_sec": 66.7662045955658 + }, + { + "epoch": 98, + "train_loss": 3.031687122955322, + "train_acc": 0.2451, + "test_loss": 7.918573980712891, + "test_acc": 0.027, + "lyapunov": null, + "grad_norm": 0.49913703885454763, + "grad_max_sv": 0.16182911209762096, + "grad_min_sv": 9.20874306739594e-09, + "grad_condition": 45645019.87124987, + "lr": 0.00026835198244006903, + "time_sec": 66.7293975353241 + }, + { + "epoch": 99, + "train_loss": 3.0274880534362794, + "train_acc": 0.2473, + "test_loss": 7.841742308807373, + "test_acc": 0.0301, + "lyapunov": null, + "grad_norm": 0.49642185350492907, + "grad_max_sv": 0.1603651110082865, + "grad_min_sv": 9.093327535403262e-09, + "grad_condition": 19719511.10750369, + "lr": 0.0002591231629491421, + "time_sec": 66.7403724193573 + }, + { + "epoch": 100, + "train_loss": 3.0153498964691163, + "train_acc": 0.24856, + "test_loss": 8.214636975097656, + "test_acc": 0.0254, + "lyapunov": null, + "grad_norm": 0.4985021553240975, + "grad_max_sv": 0.16094849184155463, + "grad_min_sv": 9.110507272203083e-09, + "grad_condition": 30803607.03022697, + "lr": 0.0002499999999999997, + "time_sec": 66.77785897254944 + }, + { + "epoch": 101, + "train_loss": 3.016648301010132, + "train_acc": 0.24796, + "test_loss": 8.018017488098145, + "test_acc": 0.024, + "lyapunov": null, + "grad_norm": 0.49781758634911777, + "grad_max_sv": 0.1628634061664343, + "grad_min_sv": 9.167758632799838e-09, + "grad_condition": 29242095.541800775, + "lr": 0.00024098649531343477, + "time_sec": 66.75502634048462 + }, + { + "epoch": 102, + "train_loss": 3.0057240830993655, + "train_acc": 0.2494, + "test_loss": 7.966342135620117, + "test_acc": 0.0248, + "lyapunov": null, + "grad_norm": 0.49727001747907607, + "grad_max_sv": 0.1595818493515253, + "grad_min_sv": 9.158894652416816e-09, + "grad_condition": 25050549.493724942, + "lr": 0.0002320866025105016, + "time_sec": 66.73536777496338 + }, + { + "epoch": 103, + "train_loss": 3.0083345415496825, + "train_acc": 0.24916, + "test_loss": 7.602651586914062, + "test_acc": 0.027, + "lyapunov": null, + "grad_norm": 0.4972675096226543, + "grad_max_sv": 0.15909511968493462, + "grad_min_sv": 9.152518881542019e-09, + "grad_condition": 176611520.9765485, + "lr": 0.0002233042253783278, + "time_sec": 66.78067326545715 + }, + { + "epoch": 104, + "train_loss": 3.0043220927429197, + "train_acc": 0.25416, + "test_loss": 7.736685781860351, + "test_acc": 0.0283, + "lyapunov": null, + "grad_norm": 0.4991979838174823, + "grad_max_sv": 0.16091925352811814, + "grad_min_sv": 9.099881177754288e-09, + "grad_condition": 26326830.964460164, + "lr": 0.000214643216157784, + "time_sec": 66.8768937587738 + }, + { + "epoch": 105, + "train_loss": 2.990384366760254, + "train_acc": 0.2549, + "test_loss": 7.9314300880432125, + "test_acc": 0.0257, + "lyapunov": null, + "grad_norm": 0.4989399321110013, + "grad_max_sv": 0.16301956586539745, + "grad_min_sv": 9.068342649021233e-09, + "grad_condition": 22164317.14735137, + "lr": 0.00020610737385376332, + "time_sec": 66.72530388832092 + }, + { + "epoch": 106, + "train_loss": 2.9880060688781738, + "train_acc": 0.2559, + "test_loss": 7.935620104980469, + "test_acc": 0.0239, + "lyapunov": null, + "grad_norm": 0.5020971657629898, + "grad_max_sv": 0.158639619871974, + "grad_min_sv": 9.218992125248349e-09, + "grad_condition": 19751045.24452741, + "lr": 0.00019770044256881242, + "time_sec": 66.74578857421875 + }, + { + "epoch": 107, + "train_loss": 2.9826569903564453, + "train_acc": 0.25612, + "test_loss": 7.572006935119629, + "test_acc": 0.0258, + "lyapunov": null, + "grad_norm": 0.5015635447032545, + "grad_max_sv": 0.16168206445872785, + "grad_min_sv": 9.25978992372123e-09, + "grad_condition": 20545972.245303817, + "lr": 0.0001894261098608447, + "time_sec": 66.7324481010437 + }, + { + "epoch": 108, + "train_loss": 2.9888600968170165, + "train_acc": 0.25294, + "test_loss": 8.053074099731445, + "test_acc": 0.0251, + "lyapunov": null, + "grad_norm": 0.5009802565861355, + "grad_max_sv": 0.1584490414708853, + "grad_min_sv": 9.149287724663502e-09, + "grad_condition": 21503521.68923875, + "lr": 0.000181288005125655, + "time_sec": 66.72810864448547 + }, + { + "epoch": 109, + "train_loss": 2.975886121902466, + "train_acc": 0.25652, + "test_loss": 7.477262289428711, + "test_acc": 0.0284, + "lyapunov": null, + "grad_norm": 0.503925091244166, + "grad_max_sv": 0.16282350979745389, + "grad_min_sv": 9.335586921566108e-09, + "grad_condition": 35447222.499738775, + "lr": 0.0001732896980049473, + "time_sec": 66.72842764854431 + }, + { + "epoch": 110, + "train_loss": 2.9755415910339353, + "train_acc": 0.25556, + "test_loss": 7.165874292755127, + "test_acc": 0.0287, + "lyapunov": null, + "grad_norm": 0.5037804832276148, + "grad_max_sv": 0.15851956307888032, + "grad_min_sv": 9.099825162839359e-09, + "grad_condition": 20173486.309247635, + "lr": 0.00016543469682057076, + "time_sec": 66.74954080581665 + }, + { + "epoch": 111, + "train_loss": 2.959470086517334, + "train_acc": 0.2599, + "test_loss": 7.450650096130371, + "test_acc": 0.0262, + "lyapunov": null, + "grad_norm": 0.503654089312831, + "grad_max_sv": 0.16573349833488465, + "grad_min_sv": 9.32649130147567e-09, + "grad_condition": 21752264.314719558, + "lr": 0.00015772644703565552, + "time_sec": 66.74236154556274 + }, + { + "epoch": 112, + "train_loss": 2.965289024734497, + "train_acc": 0.25718, + "test_loss": 7.889770016479492, + "test_acc": 0.0266, + "lyapunov": null, + "grad_norm": 0.502653464675152, + "grad_max_sv": 0.15698793567717076, + "grad_min_sv": 9.185129989930374e-09, + "grad_condition": 21947654.317370795, + "lr": 0.00015016832974331713, + "time_sec": 66.72698640823364 + }, + { + "epoch": 113, + "train_loss": 2.9564146237182616, + "train_acc": 0.25944, + "test_loss": 7.50577006072998, + "test_acc": 0.0263, + "lyapunov": null, + "grad_norm": 0.5025800570896282, + "grad_max_sv": 0.16476120464503766, + "grad_min_sv": 9.262197631261515e-09, + "grad_condition": 64643866.275285676, + "lr": 0.00014276366018359834, + "time_sec": 66.73694157600403 + }, + { + "epoch": 114, + "train_loss": 2.9632557470703125, + "train_acc": 0.2588, + "test_loss": 7.324433947753906, + "test_acc": 0.0267, + "lyapunov": null, + "grad_norm": 0.5032433350827459, + "grad_max_sv": 0.1614664951339364, + "grad_min_sv": 9.332686041335635e-09, + "grad_condition": 25925973.16098608, + "lr": 0.00013551568628929425, + "time_sec": 66.73091220855713 + }, + { + "epoch": 115, + "train_loss": 2.960151859741211, + "train_acc": 0.25964, + "test_loss": 7.166713363647461, + "test_acc": 0.0281, + "lyapunov": null, + "grad_norm": 0.5041184948364359, + "grad_max_sv": 0.16642464362084866, + "grad_min_sv": 9.282518911857273e-09, + "grad_condition": 25859258.01788441, + "lr": 0.00012842758726130276, + "time_sec": 66.74849343299866 + }, + { + "epoch": 116, + "train_loss": 2.953709926071167, + "train_acc": 0.26278, + "test_loss": 7.547538887786866, + "test_acc": 0.0249, + "lyapunov": null, + "grad_norm": 0.5046521011193764, + "grad_max_sv": 0.16437436863780022, + "grad_min_sv": 9.262822032313211e-09, + "grad_condition": 32398308.30398508, + "lr": 0.0001215024721741218, + "time_sec": 66.71618747711182 + }, + { + "epoch": 117, + "train_loss": 2.944321136703491, + "train_acc": 0.26162, + "test_loss": 7.580604026031494, + "test_acc": 0.0258, + "lyapunov": null, + "grad_norm": 0.505619534605041, + "grad_max_sv": 0.1670211985707283, + "grad_min_sv": 9.292541550826039e-09, + "grad_condition": 38518888.53739685, + "lr": 0.00011474337861210538, + "time_sec": 66.73683166503906 + }, + { + "epoch": 118, + "train_loss": 2.9500590826416015, + "train_acc": 0.26096, + "test_loss": 7.419709242248535, + "test_acc": 0.0247, + "lyapunov": null, + "grad_norm": 0.5042339990258256, + "grad_max_sv": 0.1646095708012581, + "grad_min_sv": 9.212309370898452e-09, + "grad_condition": 21855283.7419735, + "lr": 0.00010815327133708009, + "time_sec": 66.74755263328552 + }, + { + "epoch": 119, + "train_loss": 2.935969953994751, + "train_acc": 0.26214, + "test_loss": 7.739272484588623, + "test_acc": 0.0234, + "lyapunov": null, + "grad_norm": 0.5050901894066223, + "grad_max_sv": 0.16230421848595142, + "grad_min_sv": 9.406476235429561e-09, + "grad_condition": 23432734.062338997, + "lr": 0.00010173504098790182, + "time_sec": 66.73239493370056 + }, + { + "epoch": 120, + "train_loss": 2.9394694520568847, + "train_acc": 0.26124, + "test_loss": 7.496024851226807, + "test_acc": 0.0273, + "lyapunov": null, + "grad_norm": 0.5041839504858715, + "grad_max_sv": 0.16297951228916646, + "grad_min_sv": 9.110734936618182e-09, + "grad_condition": 45276046.40189681, + "lr": 9.549150281252629e-05, + "time_sec": 66.73548793792725 + }, + { + "epoch": 121, + "train_loss": 2.9316130532836913, + "train_acc": 0.2664, + "test_loss": 7.61925634765625, + "test_acc": 0.0271, + "lyapunov": null, + "grad_norm": 0.5023886352582314, + "grad_max_sv": 0.15873938724398612, + "grad_min_sv": 9.294875413790039e-09, + "grad_condition": 20138059.978483208, + "lr": 8.942539543314794e-05, + "time_sec": 66.74223852157593 + }, + { + "epoch": 122, + "train_loss": 2.9368685430145263, + "train_acc": 0.26608, + "test_loss": 7.860937660217285, + "test_acc": 0.0261, + "lyapunov": null, + "grad_norm": 0.5039830709868471, + "grad_max_sv": 0.16210089661180974, + "grad_min_sv": 9.378378940105847e-09, + "grad_condition": 20479652.910540055, + "lr": 8.353937964495024e-05, + "time_sec": 66.74034976959229 + }, + { + "epoch": 123, + "train_loss": 2.926223219604492, + "train_acc": 0.26618, + "test_loss": 7.657449048614502, + "test_acc": 0.0276, + "lyapunov": null, + "grad_norm": 0.5037732278957073, + "grad_max_sv": 0.15904913768172263, + "grad_min_sv": 9.340245438194117e-09, + "grad_condition": 20095366.0692247, + "lr": 7.783603724899243e-05, + "time_sec": 66.75890016555786 + }, + { + "epoch": 124, + "train_loss": 2.927701270751953, + "train_acc": 0.26618, + "test_loss": 7.6647051956176755, + "test_acc": 0.0261, + "lyapunov": null, + "grad_norm": 0.5038337975979664, + "grad_max_sv": 0.16181248128414155, + "grad_min_sv": 9.28121109827762e-09, + "grad_condition": 42446050.42012946, + "lr": 7.231786991974666e-05, + "time_sec": 66.76168918609619 + }, + { + "epoch": 125, + "train_loss": 2.930084992752075, + "train_acc": 0.26502, + "test_loss": 7.625859857177734, + "test_acc": 0.0328, + "lyapunov": null, + "grad_norm": 0.5068469898138476, + "grad_max_sv": 0.1638263937085867, + "grad_min_sv": 9.328329653168766e-09, + "grad_condition": 19841078.364509214, + "lr": 6.698729810778072e-05, + "time_sec": 66.7655291557312 + }, + { + "epoch": 126, + "train_loss": 2.9266408013916014, + "train_acc": 0.26464, + "test_loss": 7.402858703613282, + "test_acc": 0.0283, + "lyapunov": null, + "grad_norm": 0.505889509702572, + "grad_max_sv": 0.16251356080174445, + "grad_min_sv": 9.373523023568919e-09, + "grad_condition": 93221533.70102426, + "lr": 6.184665997806817e-05, + "time_sec": 66.73502945899963 + }, + { + "epoch": 127, + "train_loss": 2.9134882929229735, + "train_acc": 0.26768, + "test_loss": 7.378057833862305, + "test_acc": 0.0287, + "lyapunov": null, + "grad_norm": 0.506715553420855, + "grad_max_sv": 0.16353526711463928, + "grad_min_sv": 9.384702157055891e-09, + "grad_condition": 20359698.916846666, + "lr": 5.6898210384392595e-05, + "time_sec": 66.77921509742737 + }, + { + "epoch": 128, + "train_loss": 2.9213341883850097, + "train_acc": 0.26664, + "test_loss": 7.712895046997071, + "test_acc": 0.0278, + "lyapunov": null, + "grad_norm": 0.5063760234244125, + "grad_max_sv": 0.1611122377216816, + "grad_min_sv": 9.26308537929632e-09, + "grad_condition": 20248767.57568174, + "lr": 5.214411988029363e-05, + "time_sec": 66.77419829368591 + }, + { + "epoch": 129, + "train_loss": 2.920669847869873, + "train_acc": 0.26896, + "test_loss": 7.742536703491211, + "test_acc": 0.0294, + "lyapunov": null, + "grad_norm": 0.5050452367296605, + "grad_max_sv": 0.16588766500353813, + "grad_min_sv": 9.188665948955955e-09, + "grad_condition": 25535623.034593392, + "lr": 4.7586473766990294e-05, + "time_sec": 66.74674034118652 + }, + { + "epoch": 130, + "train_loss": 2.9166115370178223, + "train_acc": 0.27046, + "test_loss": 7.745564926147461, + "test_acc": 0.0268, + "lyapunov": null, + "grad_norm": 0.5042584300860155, + "grad_max_sv": 0.15993600897490978, + "grad_min_sv": 9.22239243722478e-09, + "grad_condition": 30040595.585581142, + "lr": 4.32272711786996e-05, + "time_sec": 66.75978875160217 + }, + { + "epoch": 131, + "train_loss": 2.907492437210083, + "train_acc": 0.26916, + "test_loss": 7.649399880218506, + "test_acc": 0.0284, + "lyapunov": null, + "grad_norm": 0.5070808120078898, + "grad_max_sv": 0.1605027388781309, + "grad_min_sv": 9.278778108356978e-09, + "grad_condition": 24457159.000251405, + "lr": 3.906842420574966e-05, + "time_sec": 66.75747895240784 + }, + { + "epoch": 132, + "train_loss": 2.9026521766662596, + "train_acc": 0.272, + "test_loss": 7.8230515625, + "test_acc": 0.0265, + "lyapunov": null, + "grad_norm": 0.5063112060998534, + "grad_max_sv": 0.16093650609254836, + "grad_min_sv": 9.186510611935982e-09, + "grad_condition": 42276385.55766246, + "lr": 3.5111757055874305e-05, + "time_sec": 66.77963304519653 + }, + { + "epoch": 133, + "train_loss": 2.911207528076172, + "train_acc": 0.26944, + "test_loss": 7.760893005371094, + "test_acc": 0.0283, + "lyapunov": null, + "grad_norm": 0.5056301711850308, + "grad_max_sv": 0.15996609181165694, + "grad_min_sv": 9.24704448498903e-09, + "grad_condition": 28608092.489089973, + "lr": 3.1359005254054254e-05, + "time_sec": 66.76844477653503 + }, + { + "epoch": 134, + "train_loss": 2.906010355911255, + "train_acc": 0.26984, + "test_loss": 8.008016571044921, + "test_acc": 0.0277, + "lyapunov": null, + "grad_norm": 0.5057626039215439, + "grad_max_sv": 0.16315203942358494, + "grad_min_sv": 9.36498750769843e-09, + "grad_condition": 27854382.101013802, + "lr": 2.7811814881259484e-05, + "time_sec": 66.71080470085144 + }, + { + "epoch": 135, + "train_loss": 2.9123083544921875, + "train_acc": 0.2708, + "test_loss": 7.937577700805664, + "test_acc": 0.0259, + "lyapunov": null, + "grad_norm": 0.507430486691674, + "grad_max_sv": 0.16183615513145924, + "grad_min_sv": 9.295077910143057e-09, + "grad_condition": 35641637.9216369, + "lr": 2.4471741852423218e-05, + "time_sec": 66.70258069038391 + }, + { + "epoch": 136, + "train_loss": 2.9030120794677736, + "train_acc": 0.26876, + "test_loss": 7.929943086242676, + "test_acc": 0.0264, + "lyapunov": null, + "grad_norm": 0.5047150022788596, + "grad_max_sv": 0.159928035736084, + "grad_min_sv": 9.18635804370016e-09, + "grad_condition": 24708684.685064685, + "lr": 2.1340251233966362e-05, + "time_sec": 66.80279207229614 + }, + { + "epoch": 137, + "train_loss": 2.8984097245788574, + "train_acc": 0.27096, + "test_loss": 7.787900932312012, + "test_acc": 0.0252, + "lyapunov": null, + "grad_norm": 0.5057579673029589, + "grad_max_sv": 0.16343264877796174, + "grad_min_sv": 9.42844148223848e-09, + "grad_condition": 68103682.6831769, + "lr": 1.8418716601170932e-05, + "time_sec": 66.79385328292847 + }, + { + "epoch": 138, + "train_loss": 2.9015779782867432, + "train_acc": 0.27052, + "test_loss": 7.685623684692382, + "test_acc": 0.0285, + "lyapunov": null, + "grad_norm": 0.5052475881253131, + "grad_max_sv": 0.16178990341722965, + "grad_min_sv": 9.403153949927301e-09, + "grad_condition": 21529766.30441346, + "lr": 1.570841943568445e-05, + "time_sec": 66.79542922973633 + }, + { + "epoch": 139, + "train_loss": 2.9034746910095213, + "train_acc": 0.26858, + "test_loss": 7.7811192077636715, + "test_acc": 0.0264, + "lyapunov": null, + "grad_norm": 0.5067466784573343, + "grad_max_sv": 0.16502070650458336, + "grad_min_sv": 9.381726348567377e-09, + "grad_condition": 23363276.54143712, + "lr": 1.3210548563419845e-05, + "time_sec": 66.82312655448914 + }, + { + "epoch": 140, + "train_loss": 2.90350335647583, + "train_acc": 0.27, + "test_loss": 7.9639368255615235, + "test_acc": 0.0269, + "lyapunov": null, + "grad_norm": 0.5063255238101101, + "grad_max_sv": 0.16305876486003398, + "grad_min_sv": 9.320621746633506e-09, + "grad_condition": 19763781.55112334, + "lr": 1.0926199633097203e-05, + "time_sec": 66.94665789604187 + }, + { + "epoch": 141, + "train_loss": 2.905441074523926, + "train_acc": 0.27062, + "test_loss": 7.834839343261719, + "test_acc": 0.0272, + "lyapunov": null, + "grad_norm": 0.5065610335232089, + "grad_max_sv": 0.16221509799361228, + "grad_min_sv": 9.371092498950546e-09, + "grad_condition": 143044385.21136397, + "lr": 8.856374635655688e-06, + "time_sec": 66.75584673881531 + }, + { + "epoch": 142, + "train_loss": 2.8884568811035156, + "train_acc": 0.27424, + "test_loss": 7.891295666503907, + "test_acc": 0.0275, + "lyapunov": null, + "grad_norm": 0.5049742628293102, + "grad_max_sv": 0.16406644098460674, + "grad_min_sv": 9.222863864809249e-09, + "grad_condition": 104466753.44108576, + "lr": 7.001981464747503e-06, + "time_sec": 66.83577418327332 + }, + { + "epoch": 143, + "train_loss": 2.89968453956604, + "train_acc": 0.2687, + "test_loss": 7.587808401489258, + "test_acc": 0.026, + "lyapunov": null, + "grad_norm": 0.5066200115515498, + "grad_max_sv": 0.16335729993879794, + "grad_min_sv": 9.35185720529752e-09, + "grad_condition": 21201534.185457647, + "lr": 5.3638335185058295e-06, + "time_sec": 66.86586809158325 + }, + { + "epoch": 144, + "train_loss": 2.9001665770721434, + "train_acc": 0.27342, + "test_loss": 7.801967292785645, + "test_acc": 0.0275, + "lyapunov": null, + "grad_norm": 0.5068696147722536, + "grad_max_sv": 0.16632004491984845, + "grad_min_sv": 9.407527784555114e-09, + "grad_condition": 28416722.547434002, + "lr": 3.942649342761114e-06, + "time_sec": 66.81737685203552 + }, + { + "epoch": 145, + "train_loss": 2.9069715209197997, + "train_acc": 0.26842, + "test_loss": 7.833915914916992, + "test_acc": 0.0264, + "lyapunov": null, + "grad_norm": 0.5072129956219519, + "grad_max_sv": 0.16434708684682847, + "grad_min_sv": 9.273034223128417e-09, + "grad_condition": 28838252.01997738, + "lr": 2.7390523158633524e-06, + "time_sec": 66.8349096775055 + }, + { + "epoch": 146, + "train_loss": 2.8987478762054444, + "train_acc": 0.27234, + "test_loss": 7.62391605682373, + "test_acc": 0.0297, + "lyapunov": null, + "grad_norm": 0.5057465664592161, + "grad_max_sv": 0.16144540309906005, + "grad_min_sv": 9.35427735687666e-09, + "grad_condition": 30743326.442479603, + "lr": 1.7535703752478133e-06, + "time_sec": 66.83043193817139 + }, + { + "epoch": 147, + "train_loss": 2.903320244064331, + "train_acc": 0.27186, + "test_loss": 7.7698071029663085, + "test_acc": 0.027, + "lyapunov": null, + "grad_norm": 0.5064754333352515, + "grad_max_sv": 0.1591943196952343, + "grad_min_sv": 9.42194651465389e-09, + "grad_condition": 19579097.33375772, + "lr": 9.866357858642196e-07, + "time_sec": 66.99268507957458 + }, + { + "epoch": 148, + "train_loss": 2.8968810515594483, + "train_acc": 0.27114, + "test_loss": 7.890472512817383, + "test_acc": 0.0269, + "lyapunov": null, + "grad_norm": 0.5064792087675245, + "grad_max_sv": 0.16383817605674267, + "grad_min_sv": 9.303890557976757e-09, + "grad_condition": 20672685.281352926, + "lr": 4.38584950570808e-07, + "time_sec": 66.84124112129211 + }, + { + "epoch": 149, + "train_loss": 2.9055178635406493, + "train_acc": 0.26998, + "test_loss": 7.986205418395996, + "test_acc": 0.0248, + "lyapunov": null, + "grad_norm": 0.506757696244553, + "grad_max_sv": 0.1625267457216978, + "grad_min_sv": 9.227836753056274e-09, + "grad_condition": 22246592.926524755, + "lr": 1.096582625772501e-07, + "time_sec": 66.75054454803467 + }, + { + "epoch": 150, + "train_loss": 2.9042972522735595, + "train_acc": 0.27168, + "test_loss": 7.824682766723633, + "test_acc": 0.027, + "lyapunov": null, + "grad_norm": 0.5067642000471761, + "grad_max_sv": 0.16473121605813504, + "grad_min_sv": 9.266963207216206e-09, + "grad_condition": 38426194.43824513, + "lr": 0.0, + "time_sec": 66.75282382965088 + } + ] + }, + "lyapunov": { + "4": [ + { + "epoch": 1, + "train_loss": 4.402453376159668, + "train_acc": 0.09068, + "test_loss": 3.647318689727783, + "test_acc": 0.1599, + "lyapunov": 2.275165726156796, + "grad_norm": 6.3193677906118335, + "grad_max_sv": 4.972608983516693, + "grad_min_sv": 1.1423275143029876e-07, + "grad_condition": 106438558.78809075, + "lr": 0.0009998903417374227, + "time_sec": 41.85859131813049 + }, + { + "epoch": 2, + "train_loss": 3.6593205111694336, + "train_acc": 0.16428, + "test_loss": 3.411211491394043, + "test_acc": 0.2035, + "lyapunov": 2.1582698181766986, + "grad_norm": 4.644400986379697, + "grad_max_sv": 3.4886934638023375, + "grad_min_sv": 8.646843122905868e-08, + "grad_condition": 120977117.93021207, + "lr": 0.0009995614150494292, + "time_sec": 41.73804235458374 + }, + { + "epoch": 3, + "train_loss": 3.308978451004028, + "train_acc": 0.20998, + "test_loss": 3.1940381771087645, + "test_acc": 0.2372, + "lyapunov": 2.093446350158633, + "grad_norm": 3.7153186701227567, + "grad_max_sv": 2.5730993062257768, + "grad_min_sv": 6.944630572824906e-08, + "grad_condition": 44436928.378804766, + "lr": 0.0009990133642141358, + "time_sec": 41.72993302345276 + }, + { + "epoch": 4, + "train_loss": 3.0701835554504395, + "train_acc": 0.24742, + "test_loss": 3.0969710327148436, + "test_acc": 0.2537, + "lyapunov": 2.040784895267633, + "grad_norm": 3.06563581854696, + "grad_max_sv": 1.9565235763788222, + "grad_min_sv": 5.723270060375985e-08, + "grad_condition": 70190432.33127163, + "lr": 0.0009982464296247522, + "time_sec": 41.73050355911255 + }, + { + "epoch": 5, + "train_loss": 2.9189507540130615, + "train_acc": 0.2716, + "test_loss": 2.918551559829712, + "test_acc": 0.2808, + "lyapunov": 2.0341829082849996, + "grad_norm": 2.651388374004006, + "grad_max_sv": 1.6357308089733125, + "grad_min_sv": 5.089967798355133e-08, + "grad_condition": 37371144.51391194, + "lr": 0.0009972609476841367, + "time_sec": 41.74047303199768 + }, + { + "epoch": 6, + "train_loss": 2.741786095199585, + "train_acc": 0.30958, + "test_loss": 2.7842771644592283, + "test_acc": 0.3068, + "lyapunov": 2.012049251200293, + "grad_norm": 2.376654222106478, + "grad_max_sv": 1.3564517319202423, + "grad_min_sv": 4.5076624693995984e-08, + "grad_condition": 44513934.45114143, + "lr": 0.000996057350657239, + "time_sec": 41.71632218360901 + }, + { + "epoch": 7, + "train_loss": 2.5753888706970214, + "train_acc": 0.34372, + "test_loss": 2.7615582008361814, + "test_acc": 0.3086, + "lyapunov": 2.007953660567398, + "grad_norm": 2.1602223715226843, + "grad_max_sv": 1.1779062479734421, + "grad_min_sv": 4.122792165439648e-08, + "grad_condition": 44826268.11284047, + "lr": 0.000994636166481494, + "time_sec": 41.72747349739075 + }, + { + "epoch": 8, + "train_loss": 2.468557521286011, + "train_acc": 0.36452, + "test_loss": 2.653182541656494, + "test_acc": 0.3324, + "lyapunov": 1.9948931578784952, + "grad_norm": 2.0073198059721875, + "grad_max_sv": 1.0865133196115493, + "grad_min_sv": 3.855332622038077e-08, + "grad_condition": 43669185.113960825, + "lr": 0.0009929980185352525, + "time_sec": 41.73755121231079 + }, + { + "epoch": 9, + "train_loss": 2.350626865539551, + "train_acc": 0.38764, + "test_loss": 2.836592961883545, + "test_acc": 0.3099, + "lyapunov": 1.9819872019540927, + "grad_norm": 1.8849515867179252, + "grad_max_sv": 0.990830908715725, + "grad_min_sv": 3.6664210431580635e-08, + "grad_condition": 48804777.56163528, + "lr": 0.0009911436253643444, + "time_sec": 41.74427247047424 + }, + { + "epoch": 10, + "train_loss": 2.232207765197754, + "train_acc": 0.41502, + "test_loss": 6.005580019378662, + "test_acc": 0.1198, + "lyapunov": 1.973588870919269, + "grad_norm": 1.795724371022914, + "grad_max_sv": 0.895367507636547, + "grad_min_sv": 3.4024029961499114e-08, + "grad_condition": 56137324.74168767, + "lr": 0.0009890738003669028, + "time_sec": 41.73108172416687 + }, + { + "epoch": 11, + "train_loss": 2.2177761376953127, + "train_acc": 0.41552, + "test_loss": 2.757076937866211, + "test_acc": 0.3297, + "lyapunov": 1.9674199688465088, + "grad_norm": 1.7014618441403062, + "grad_max_sv": 0.8264698967337608, + "grad_min_sv": 3.289183631016712e-08, + "grad_condition": 31290581.06717081, + "lr": 0.00098678945143658, + "time_sec": 41.73191976547241 + }, + { + "epoch": 12, + "train_loss": 2.07756498046875, + "train_acc": 0.44758, + "test_loss": 2.4285128423690794, + "test_acc": 0.3776, + "lyapunov": 1.9612870170637164, + "grad_norm": 1.6299132393626308, + "grad_max_sv": 0.7798347935080528, + "grad_min_sv": 3.11786861995067e-08, + "grad_condition": 35260018.784767784, + "lr": 0.0009842915805643154, + "time_sec": 41.73758554458618 + }, + { + "epoch": 13, + "train_loss": 2.0029664388275146, + "train_acc": 0.4627, + "test_loss": 2.394765958404541, + "test_acc": 0.3877, + "lyapunov": 1.9591088959628054, + "grad_norm": 1.5753571075909552, + "grad_max_sv": 0.737843057513237, + "grad_min_sv": 2.9724672816894282e-08, + "grad_condition": 75029315.64952049, + "lr": 0.000981581283398829, + "time_sec": 41.75543141365051 + }, + { + "epoch": 14, + "train_loss": 1.9314122444152833, + "train_acc": 0.48014, + "test_loss": 2.494458251953125, + "test_acc": 0.3794, + "lyapunov": 1.95977995493223, + "grad_norm": 1.5223678763290471, + "grad_max_sv": 0.7179754331707955, + "grad_min_sv": 2.9007061810859547e-08, + "grad_condition": 45859489.60778977, + "lr": 0.0009786597487660333, + "time_sec": 41.764060497283936 + }, + { + "epoch": 15, + "train_loss": 1.8691918286132811, + "train_acc": 0.49388, + "test_loss": 2.6827464235305785, + "test_acc": 0.3491, + "lyapunov": 1.9565891402456768, + "grad_norm": 1.4758165731208024, + "grad_max_sv": 0.6874889254570007, + "grad_min_sv": 2.8080017771409117e-08, + "grad_condition": 100775627.80158803, + "lr": 0.0009755282581475766, + "time_sec": 41.739460945129395 + }, + { + "epoch": 16, + "train_loss": 1.8350643015670776, + "train_acc": 0.50486, + "test_loss": 2.473033560180664, + "test_acc": 0.3885, + "lyapunov": 1.9510287967179438, + "grad_norm": 1.4300731390012025, + "grad_max_sv": 0.6442486211657524, + "grad_min_sv": 2.706107265007529e-08, + "grad_condition": 91373101.9091527, + "lr": 0.0009721881851187403, + "time_sec": 41.718268632888794 + }, + { + "epoch": 17, + "train_loss": 1.762912439842224, + "train_acc": 0.51876, + "test_loss": 2.2700052513122557, + "test_acc": 0.4251, + "lyapunov": 1.9505040874261685, + "grad_norm": 1.3848095474137985, + "grad_max_sv": 0.6225782200694084, + "grad_min_sv": 2.618359110292956e-08, + "grad_condition": 74496958.8790254, + "lr": 0.0009686409947459456, + "time_sec": 41.724280834198 + }, + { + "epoch": 18, + "train_loss": 1.7018197515487672, + "train_acc": 0.53204, + "test_loss": 2.353795319747925, + "test_acc": 0.412, + "lyapunov": 1.9468479519305022, + "grad_norm": 1.353559766643193, + "grad_max_sv": 0.6109417073428631, + "grad_min_sv": 2.558382817263727e-08, + "grad_condition": 38470934.80593135, + "lr": 0.0009648882429441254, + "time_sec": 41.72322702407837 + }, + { + "epoch": 19, + "train_loss": 1.664328369178772, + "train_acc": 0.5418, + "test_loss": 2.362927633666992, + "test_acc": 0.4075, + "lyapunov": 1.9501073872646713, + "grad_norm": 1.323458416808866, + "grad_max_sv": 0.6041884273290634, + "grad_min_sv": 2.519698935610215e-08, + "grad_condition": 33066628.42882558, + "lr": 0.00096093157579425, + "time_sec": 41.76836347579956 + }, + { + "epoch": 20, + "train_loss": 1.625159342651367, + "train_acc": 0.55094, + "test_loss": 2.3062631443023682, + "test_acc": 0.4138, + "lyapunov": 1.943288565291773, + "grad_norm": 1.29233886993043, + "grad_max_sv": 0.5701985210180283, + "grad_min_sv": 2.444946393675984e-08, + "grad_condition": 37960247.61471464, + "lr": 0.0009567727288213001, + "time_sec": 41.72097706794739 + }, + { + "epoch": 21, + "train_loss": 1.596832010192871, + "train_acc": 0.55774, + "test_loss": 3.380753642654419, + "test_acc": 0.277, + "lyapunov": 1.938459638744364, + "grad_norm": 1.2589299533251497, + "grad_max_sv": 0.5499200604856014, + "grad_min_sv": 2.3781619607962658e-08, + "grad_condition": 91436448.31120124, + "lr": 0.0009524135262330095, + "time_sec": 41.7327356338501 + }, + { + "epoch": 22, + "train_loss": 1.562855760269165, + "train_acc": 0.56626, + "test_loss": 2.9307581508636473, + "test_acc": 0.3111, + "lyapunov": 1.9406123039362682, + "grad_norm": 1.241425743050732, + "grad_max_sv": 0.5555930100381374, + "grad_min_sv": 2.3678109623004317e-08, + "grad_condition": 50716060.86165904, + "lr": 0.0009478558801197061, + "time_sec": 41.73275923728943 + }, + { + "epoch": 23, + "train_loss": 1.6072356412506104, + "train_acc": 0.55254, + "test_loss": 2.2621861825942995, + "test_acc": 0.4296, + "lyapunov": 1.9443157017993196, + "grad_norm": 1.2234319330661123, + "grad_max_sv": 0.5390392452478409, + "grad_min_sv": 2.321677808753142e-08, + "grad_condition": 49922944.04769093, + "lr": 0.000943101789615607, + "time_sec": 41.73086071014404 + }, + { + "epoch": 24, + "train_loss": 1.5153026651382446, + "train_acc": 0.57702, + "test_loss": 2.1956796672821044, + "test_acc": 0.4481, + "lyapunov": 1.9344317580732848, + "grad_norm": 1.190552794742183, + "grad_max_sv": 0.5149525038897991, + "grad_min_sv": 2.253187114734101e-08, + "grad_condition": 127046418.74079685, + "lr": 0.0009381533400219313, + "time_sec": 41.734899282455444 + }, + { + "epoch": 25, + "train_loss": 1.4858929053878784, + "train_acc": 0.58118, + "test_loss": 2.2958973640441895, + "test_acc": 0.4294, + "lyapunov": 1.9265085903884809, + "grad_norm": 1.1651463746568211, + "grad_max_sv": 0.49507031962275505, + "grad_min_sv": 2.175962801054254e-08, + "grad_condition": 47886846.443262614, + "lr": 0.0009330127018922189, + "time_sec": 41.743216037750244 + }, + { + "epoch": 26, + "train_loss": 1.4500890027999878, + "train_acc": 0.59236, + "test_loss": 2.1691157886505126, + "test_acc": 0.4522, + "lyapunov": 1.9298277998824254, + "grad_norm": 1.14471446432319, + "grad_max_sv": 0.4816065445542336, + "grad_min_sv": 2.120719223008827e-08, + "grad_condition": 207464491.0347305, + "lr": 0.000927682130080253, + "time_sec": 41.736358404159546 + }, + { + "epoch": 27, + "train_loss": 1.3898312545394897, + "train_acc": 0.60436, + "test_loss": 2.1529868070602416, + "test_acc": 0.4542, + "lyapunov": 1.9273115341620677, + "grad_norm": 1.132063260634141, + "grad_max_sv": 0.483544921875, + "grad_min_sv": 2.1037810878088426e-08, + "grad_condition": 75636823.96295121, + "lr": 0.0009221639627510072, + "time_sec": 41.904048681259155 + }, + { + "epoch": 28, + "train_loss": 1.3611045029067994, + "train_acc": 0.6133, + "test_loss": 2.1179029682159425, + "test_acc": 0.4696, + "lyapunov": 1.9238266844273832, + "grad_norm": 1.115677971738466, + "grad_max_sv": 0.47497326210141183, + "grad_min_sv": 2.075745057054934e-08, + "grad_condition": 101106197.99800023, + "lr": 0.0009164606203550494, + "time_sec": 41.733999490737915 + }, + { + "epoch": 29, + "train_loss": 1.325206062850952, + "train_acc": 0.62252, + "test_loss": 2.226005189323425, + "test_acc": 0.4459, + "lyapunov": 1.9295200911324348, + "grad_norm": 1.0960133455946792, + "grad_max_sv": 0.48051142767071725, + "grad_min_sv": 2.054557136504931e-08, + "grad_condition": 40520134.72078063, + "lr": 0.0009105746045668516, + "time_sec": 41.72044110298157 + }, + { + "epoch": 30, + "train_loss": 1.2888097004318237, + "train_acc": 0.63098, + "test_loss": 2.0181628200531008, + "test_acc": 0.4794, + "lyapunov": 1.9217432499541651, + "grad_norm": 1.0858874791311768, + "grad_max_sv": 0.4642782934010029, + "grad_min_sv": 2.0495078399684895e-08, + "grad_condition": 88671009.78788772, + "lr": 0.0009045084971874733, + "time_sec": 41.716856479644775 + }, + { + "epoch": 31, + "train_loss": 1.2502998229980469, + "train_acc": 0.6408, + "test_loss": 2.2429887283325196, + "test_acc": 0.4503, + "lyapunov": 1.922774575555416, + "grad_norm": 1.0748895050730505, + "grad_max_sv": 0.4512033395469189, + "grad_min_sv": 2.0210702748879596e-08, + "grad_condition": 43556480.38088348, + "lr": 0.0008982649590120977, + "time_sec": 41.73362612724304 + }, + { + "epoch": 32, + "train_loss": 1.2372033821868897, + "train_acc": 0.64594, + "test_loss": 2.1298938304901123, + "test_acc": 0.4605, + "lyapunov": 1.925371012419386, + "grad_norm": 1.0634688792667035, + "grad_max_sv": 0.4533583827316761, + "grad_min_sv": 1.969395504730631e-08, + "grad_condition": 66439793.43201858, + "lr": 0.0008918467286629196, + "time_sec": 41.73435115814209 + }, + { + "epoch": 33, + "train_loss": 1.2053633908462524, + "train_acc": 0.6516, + "test_loss": 2.3437958654403688, + "test_acc": 0.4421, + "lyapunov": 1.9254186299755751, + "grad_norm": 1.05209489056104, + "grad_max_sv": 0.44990424290299413, + "grad_min_sv": 1.9769683148873617e-08, + "grad_condition": 82804669.4982578, + "lr": 0.0008852566213878943, + "time_sec": 41.762763023376465 + }, + { + "epoch": 34, + "train_loss": 1.2061978987121582, + "train_acc": 0.65046, + "test_loss": 2.372113970756531, + "test_acc": 0.4298, + "lyapunov": 1.9202916914849635, + "grad_norm": 1.046307959951425, + "grad_max_sv": 0.4367548406124115, + "grad_min_sv": 1.9302947323884823e-08, + "grad_condition": 31344720.942354918, + "lr": 0.000878497527825878, + "time_sec": 41.73297643661499 + }, + { + "epoch": 35, + "train_loss": 1.1511029064559937, + "train_acc": 0.66476, + "test_loss": 2.2585899780273437, + "test_acc": 0.4491, + "lyapunov": 1.9170936425323681, + "grad_norm": 1.024495483747724, + "grad_max_sv": 0.43175056800246236, + "grad_min_sv": 1.90148727416406e-08, + "grad_condition": 44349967.927345894, + "lr": 0.000871572412738697, + "time_sec": 41.72303080558777 + }, + { + "epoch": 36, + "train_loss": 1.1435650005722047, + "train_acc": 0.66498, + "test_loss": 2.3082976978302003, + "test_acc": 0.4449, + "lyapunov": 1.9124643171534819, + "grad_norm": 1.010954120317237, + "grad_max_sv": 0.4223634794354439, + "grad_min_sv": 1.8588104889333267e-08, + "grad_condition": 76069054.1612477, + "lr": 0.0008644843137107055, + "time_sec": 41.72624754905701 + }, + { + "epoch": 37, + "train_loss": 1.1196837075805663, + "train_acc": 0.67186, + "test_loss": 2.4391525012969972, + "test_acc": 0.4274, + "lyapunov": 1.913648688274881, + "grad_norm": 1.0018970676650854, + "grad_max_sv": 0.4204524204134941, + "grad_min_sv": 1.8693978807993174e-08, + "grad_condition": 40402274.52996386, + "lr": 0.0008572363398164014, + "time_sec": 41.74878001213074 + }, + { + "epoch": 38, + "train_loss": 1.0952399520874023, + "train_acc": 0.67804, + "test_loss": 2.5844401374816894, + "test_acc": 0.4157, + "lyapunov": 1.9180302019314388, + "grad_norm": 0.9894651423227762, + "grad_max_sv": 0.4199659042060375, + "grad_min_sv": 1.837818106812522e-08, + "grad_condition": 260857764.359212, + "lr": 0.0008498316702566826, + "time_sec": 41.74680805206299 + }, + { + "epoch": 39, + "train_loss": 1.0627006562042236, + "train_acc": 0.68668, + "test_loss": 2.7415998706817626, + "test_acc": 0.4015, + "lyapunov": 1.9058937633129032, + "grad_norm": 0.9809260985523547, + "grad_max_sv": 0.40667932853102684, + "grad_min_sv": 1.812777311299002e-08, + "grad_condition": 244897287.65822238, + "lr": 0.0008422735529643442, + "time_sec": 41.75808906555176 + }, + { + "epoch": 40, + "train_loss": 1.0391249797439575, + "train_acc": 0.69176, + "test_loss": 2.7787880683898925, + "test_acc": 0.3939, + "lyapunov": 1.9083486545421278, + "grad_norm": 0.9750828470525472, + "grad_max_sv": 0.41750494614243505, + "grad_min_sv": 1.8325020090248502e-08, + "grad_condition": 31807877.730814517, + "lr": 0.0008345653031794289, + "time_sec": 41.722562313079834 + }, + { + "epoch": 41, + "train_loss": 1.0108007943916322, + "train_acc": 0.70096, + "test_loss": 2.499814228439331, + "test_acc": 0.4253, + "lyapunov": 1.9111734753679437, + "grad_norm": 0.9620542008359738, + "grad_max_sv": 0.39485047459602357, + "grad_min_sv": 1.7690556127977765e-08, + "grad_condition": 106971193.48807144, + "lr": 0.0008267103019950526, + "time_sec": 41.71957492828369 + }, + { + "epoch": 42, + "train_loss": 1.0110623504638672, + "train_acc": 0.70168, + "test_loss": 2.424097459793091, + "test_acc": 0.4384, + "lyapunov": 1.9121353684179008, + "grad_norm": 0.9598148784544778, + "grad_max_sv": 0.3985880985856056, + "grad_min_sv": 1.7510208861429982e-08, + "grad_condition": 241797453.4696713, + "lr": 0.0008187119948743447, + "time_sec": 41.724589109420776 + }, + { + "epoch": 43, + "train_loss": 0.9982641059112549, + "train_acc": 0.70184, + "test_loss": 2.483708995056152, + "test_acc": 0.4375, + "lyapunov": 1.909155901435696, + "grad_norm": 0.9506160023368213, + "grad_max_sv": 0.40187592804431915, + "grad_min_sv": 1.785357471792426e-08, + "grad_condition": 60385213.424743295, + "lr": 0.000810573890139155, + "time_sec": 41.74249339103699 + }, + { + "epoch": 44, + "train_loss": 0.9965381250762939, + "train_acc": 0.7027, + "test_loss": 2.795687140274048, + "test_acc": 0.3911, + "lyapunov": 1.9044793124698922, + "grad_norm": 0.9395738384441539, + "grad_max_sv": 0.39191935360431673, + "grad_min_sv": 1.7274444058523742e-08, + "grad_condition": 45224982.34490965, + "lr": 0.0008022995574311873, + "time_sec": 41.73937010765076 + }, + { + "epoch": 45, + "train_loss": 0.9683418419647217, + "train_acc": 0.70942, + "test_loss": 2.4733401664733887, + "test_acc": 0.445, + "lyapunov": 1.9045238778414324, + "grad_norm": 0.9219171735102869, + "grad_max_sv": 0.3813773214817047, + "grad_min_sv": 1.6867463496078593e-08, + "grad_condition": 108828712.50016733, + "lr": 0.0007938926261462363, + "time_sec": 41.75324892997742 + }, + { + "epoch": 46, + "train_loss": 0.9805485520553588, + "train_acc": 0.70914, + "test_loss": 2.31701719455719, + "test_acc": 0.4594, + "lyapunov": 1.9050119078677634, + "grad_norm": 0.9175512318527826, + "grad_max_sv": 0.3853737100958824, + "grad_min_sv": 1.672956074852405e-08, + "grad_condition": 168972117.70333335, + "lr": 0.0007853567838422158, + "time_sec": 41.743704319000244 + }, + { + "epoch": 47, + "train_loss": 0.9310689119720459, + "train_acc": 0.72066, + "test_loss": 2.309445872116089, + "test_acc": 0.4671, + "lyapunov": 1.898601669484697, + "grad_norm": 0.9054984582662673, + "grad_max_sv": 0.3751869909465313, + "grad_min_sv": 1.6639817324417063e-08, + "grad_condition": 838715300.6314169, + "lr": 0.0007766957746216719, + "time_sec": 41.74590611457825 + }, + { + "epoch": 48, + "train_loss": 0.8996099283027649, + "train_acc": 0.73198, + "test_loss": 2.8926421657562256, + "test_acc": 0.3964, + "lyapunov": 1.9078812385763964, + "grad_norm": 0.9035452379371108, + "grad_max_sv": 0.370052120834589, + "grad_min_sv": 1.6593997936159566e-08, + "grad_condition": 63519300.25874162, + "lr": 0.0007679133974894982, + "time_sec": 41.767823219299316 + }, + { + "epoch": 49, + "train_loss": 0.8779695009231567, + "train_acc": 0.73534, + "test_loss": 2.5444780319213867, + "test_acc": 0.4456, + "lyapunov": 1.910392487750334, + "grad_norm": 0.8959995200973341, + "grad_max_sv": 0.3752055235207081, + "grad_min_sv": 1.6205076294739662e-08, + "grad_condition": 33654601.36183037, + "lr": 0.000759013504686565, + "time_sec": 41.75288200378418 + }, + { + "epoch": 50, + "train_loss": 0.8604569892501831, + "train_acc": 0.73878, + "test_loss": 2.7883367189407346, + "test_acc": 0.4183, + "lyapunov": 1.9094159654949023, + "grad_norm": 0.8941278995375711, + "grad_max_sv": 0.3705851808190346, + "grad_min_sv": 1.6047344859708433e-08, + "grad_condition": 138603429.49724263, + "lr": 0.0007499999999999998, + "time_sec": 41.72500133514404 + }, + { + "epoch": 51, + "train_loss": 0.8416437990188599, + "train_acc": 0.74344, + "test_loss": 2.746726350402832, + "test_acc": 0.4108, + "lyapunov": 1.9145060311193052, + "grad_norm": 0.8808437513085351, + "grad_max_sv": 0.37436478212475777, + "grad_min_sv": 1.6171273435269808e-08, + "grad_condition": 179566441.60046786, + "lr": 0.0007408768370508575, + "time_sec": 41.74752902984619 + }, + { + "epoch": 52, + "train_loss": 0.820111142578125, + "train_acc": 0.75174, + "test_loss": 2.4467312171936033, + "test_acc": 0.4663, + "lyapunov": 1.910064988124096, + "grad_norm": 0.880437067439811, + "grad_max_sv": 0.36293432787060736, + "grad_min_sv": 1.5746691332807483e-08, + "grad_condition": 179789739.16053975, + "lr": 0.0007316480175599307, + "time_sec": 41.7735435962677 + }, + { + "epoch": 53, + "train_loss": 0.8140859049987793, + "train_acc": 0.75356, + "test_loss": 2.9469207336425782, + "test_acc": 0.4004, + "lyapunov": 1.9099171506169508, + "grad_norm": 0.8741677915368938, + "grad_max_sv": 0.37706185728311536, + "grad_min_sv": 1.6255310596180462e-08, + "grad_condition": 51250955.562284306, + "lr": 0.0007223175895924635, + "time_sec": 41.76830744743347 + }, + { + "epoch": 54, + "train_loss": 0.797414921245575, + "train_acc": 0.75706, + "test_loss": 2.59845022354126, + "test_acc": 0.4344, + "lyapunov": 1.9113083166234635, + "grad_norm": 0.8662096832265834, + "grad_max_sv": 0.3637803480029106, + "grad_min_sv": 1.592472985874338e-08, + "grad_condition": 78602783.87625492, + "lr": 0.0007128896457825361, + "time_sec": 41.77692222595215 + }, + { + "epoch": 55, + "train_loss": 0.7699506399154663, + "train_acc": 0.76474, + "test_loss": 2.452611435890198, + "test_acc": 0.4574, + "lyapunov": 1.9056391063553597, + "grad_norm": 0.8551615410550228, + "grad_max_sv": 0.3565914809703827, + "grad_min_sv": 1.5535208886668928e-08, + "grad_condition": 58261874.95313827, + "lr": 0.0007033683215378998, + "time_sec": 41.74821591377258 + }, + { + "epoch": 56, + "train_loss": 0.7388520823860169, + "train_acc": 0.77042, + "test_loss": 2.4759717765808107, + "test_acc": 0.4595, + "lyapunov": 1.9136662239308857, + "grad_norm": 0.8463088224698184, + "grad_max_sv": 0.35618705451488497, + "grad_min_sv": 1.5355412906177883e-08, + "grad_condition": 1209264968.6456847, + "lr": 0.0006937577932260512, + "time_sec": 41.73610758781433 + }, + { + "epoch": 57, + "train_loss": 0.7569624709701538, + "train_acc": 0.76814, + "test_loss": 2.3143113048553468, + "test_acc": 0.4746, + "lyapunov": 1.9175606316617688, + "grad_norm": 0.8518490658229559, + "grad_max_sv": 0.35069304183125494, + "grad_min_sv": 1.529794265444327e-08, + "grad_condition": 4456282580.150646, + "lr": 0.0006840622763423388, + "time_sec": 41.726720571517944 + }, + { + "epoch": 58, + "train_loss": 0.7390606773376465, + "train_acc": 0.7708, + "test_loss": 2.433010138130188, + "test_acc": 0.4673, + "lyapunov": 1.9161848207873762, + "grad_norm": 0.8471212829897161, + "grad_max_sv": 0.3454029098153114, + "grad_min_sv": 1.5223766105338863e-08, + "grad_condition": 489851337.6565568, + "lr": 0.0006742860236609073, + "time_sec": 41.74778985977173 + }, + { + "epoch": 59, + "train_loss": 0.7225271960830688, + "train_acc": 0.77766, + "test_loss": 2.476504100227356, + "test_acc": 0.4644, + "lyapunov": 1.9161952419963943, + "grad_norm": 0.8355419434677147, + "grad_max_sv": 0.34493052437901495, + "grad_min_sv": 1.4839035536494751e-08, + "grad_condition": 436813395.5045742, + "lr": 0.0006644333233692913, + "time_sec": 41.74501943588257 + }, + { + "epoch": 60, + "train_loss": 0.7100051165390014, + "train_acc": 0.77968, + "test_loss": 2.623545463180542, + "test_acc": 0.4462, + "lyapunov": 1.917024619743952, + "grad_norm": 0.8337880287503584, + "grad_max_sv": 0.35577779933810233, + "grad_min_sv": 1.5173673202639738e-08, + "grad_condition": 76369527.43553363, + "lr": 0.0006545084971874734, + "time_sec": 41.75426197052002 + }, + { + "epoch": 61, + "train_loss": 0.6912109909248352, + "train_acc": 0.78626, + "test_loss": 2.539391030693054, + "test_acc": 0.4593, + "lyapunov": 1.9186238227293009, + "grad_norm": 0.8193245175241345, + "grad_max_sv": 0.3327420450747013, + "grad_min_sv": 1.4762172681221513e-08, + "grad_condition": 222644067.44861478, + "lr": 0.0006445158984722354, + "time_sec": 41.74089074134827 + }, + { + "epoch": 62, + "train_loss": 0.6812233833694458, + "train_acc": 0.78942, + "test_loss": 2.3871022064208987, + "test_acc": 0.4774, + "lyapunov": 1.914946661580859, + "grad_norm": 0.8166344353267739, + "grad_max_sv": 0.34046063795685766, + "grad_min_sv": 1.4884670004877698e-08, + "grad_condition": 70123083.83702484, + "lr": 0.0006344599103076324, + "time_sec": 41.76645374298096 + }, + { + "epoch": 63, + "train_loss": 0.6683249555969238, + "train_acc": 0.79194, + "test_loss": 2.352469948577881, + "test_acc": 0.4844, + "lyapunov": 1.9207763571263579, + "grad_norm": 0.8134465519827773, + "grad_max_sv": 0.33852725103497505, + "grad_min_sv": 1.4292673627893e-08, + "grad_condition": 1043657787.5004251, + "lr": 0.0006243449435824269, + "time_sec": 41.75386071205139 + }, + { + "epoch": 64, + "train_loss": 0.6555111625862121, + "train_acc": 0.79462, + "test_loss": 2.3883603565216065, + "test_acc": 0.4793, + "lyapunov": 1.9168409045090151, + "grad_norm": 0.8105482202188788, + "grad_max_sv": 0.3407238692045212, + "grad_min_sv": 1.4592515325652713e-08, + "grad_condition": 448726137.26567876, + "lr": 0.0006141754350553275, + "time_sec": 41.782273292541504 + }, + { + "epoch": 65, + "train_loss": 0.6423080613708496, + "train_acc": 0.79788, + "test_loss": 2.599993039703369, + "test_acc": 0.4553, + "lyapunov": 1.9109126295884857, + "grad_norm": 0.8019063430431282, + "grad_max_sv": 0.3350201122462749, + "grad_min_sv": 1.4804530349028788e-08, + "grad_condition": 173720955.30947796, + "lr": 0.0006039558454088793, + "time_sec": 41.746013879776 + }, + { + "epoch": 66, + "train_loss": 0.6266677593612671, + "train_acc": 0.8052, + "test_loss": 2.433604884719849, + "test_acc": 0.4798, + "lyapunov": 1.9193745555780124, + "grad_norm": 0.7946069802068467, + "grad_max_sv": 0.3393189825117588, + "grad_min_sv": 1.4602912156574944e-08, + "grad_condition": 62071459.860591695, + "lr": 0.000593690657292862, + "time_sec": 41.7394495010376 + }, + { + "epoch": 67, + "train_loss": 0.6094798414611816, + "train_acc": 0.80856, + "test_loss": 2.396722966766357, + "test_acc": 0.4837, + "lyapunov": 1.9150565887046287, + "grad_norm": 0.7859000358672813, + "grad_max_sv": 0.3356419734656811, + "grad_min_sv": 1.4121937252573048e-08, + "grad_condition": 181810970.80928102, + "lr": 0.0005833843733580507, + "time_sec": 41.75516724586487 + }, + { + "epoch": 68, + "train_loss": 0.5999105793190003, + "train_acc": 0.81248, + "test_loss": 2.446664057159424, + "test_acc": 0.483, + "lyapunov": 1.9211967817657745, + "grad_norm": 0.7831815361001928, + "grad_max_sv": 0.3327556479722261, + "grad_min_sv": 1.4034283608854725e-08, + "grad_condition": 78476832.00824165, + "lr": 0.0005730415142812054, + "time_sec": 41.781288146972656 + }, + { + "epoch": 69, + "train_loss": 0.5935948301315308, + "train_acc": 0.8132, + "test_loss": 2.3918896797180174, + "test_acc": 0.491, + "lyapunov": 1.914429887786241, + "grad_norm": 0.7813354211317349, + "grad_max_sv": 0.3260443016886711, + "grad_min_sv": 1.3618330424458592e-08, + "grad_condition": 46650464.37711043, + "lr": 0.0005626666167821517, + "time_sec": 41.73920011520386 + }, + { + "epoch": 70, + "train_loss": 0.5843463416194916, + "train_acc": 0.81546, + "test_loss": 2.6817255722045896, + "test_acc": 0.4581, + "lyapunov": 1.9144641691461548, + "grad_norm": 0.7699117020841023, + "grad_max_sv": 0.328417931497097, + "grad_min_sv": 1.3631501394502365e-08, + "grad_condition": 129818603.96291387, + "lr": 0.0005522642316338265, + "time_sec": 41.736809730529785 + }, + { + "epoch": 71, + "train_loss": 0.5763696609115601, + "train_acc": 0.82078, + "test_loss": 2.5401578393936157, + "test_acc": 0.4677, + "lyapunov": 1.9133489470347724, + "grad_norm": 0.764712938126372, + "grad_max_sv": 0.32092626169323923, + "grad_min_sv": 1.3779004780223315e-08, + "grad_condition": 36042926.25966102, + "lr": 0.0005418389216661573, + "time_sec": 41.749176025390625 + }, + { + "epoch": 72, + "train_loss": 0.5613589873886108, + "train_acc": 0.82394, + "test_loss": 2.6585654582977294, + "test_acc": 0.4642, + "lyapunov": 1.9165738116749718, + "grad_norm": 0.7561452726240956, + "grad_max_sv": 0.3221577055752277, + "grad_min_sv": 1.3559068421341302e-08, + "grad_condition": 195511311.9984496, + "lr": 0.0005313952597646563, + "time_sec": 41.7347617149353 + }, + { + "epoch": 73, + "train_loss": 0.5599145156478882, + "train_acc": 0.82492, + "test_loss": 2.7406621421813964, + "test_acc": 0.4603, + "lyapunov": 1.9185552828757049, + "grad_norm": 0.7588854096769289, + "grad_max_sv": 0.32260433249175546, + "grad_min_sv": 1.4095438387318194e-08, + "grad_condition": 41201054.198086895, + "lr": 0.0005209378268645994, + "time_sec": 41.74638390541077 + }, + { + "epoch": 74, + "train_loss": 0.5376129404258728, + "train_acc": 0.82944, + "test_loss": 2.4721676399230956, + "test_acc": 0.4799, + "lyapunov": 1.9179751610816898, + "grad_norm": 0.7480764764212195, + "grad_max_sv": 0.3109534688293934, + "grad_min_sv": 1.3455031369451198e-08, + "grad_condition": 149094968.70418516, + "lr": 0.0005104712099416781, + "time_sec": 41.730305671691895 + }, + { + "epoch": 75, + "train_loss": 0.5237712098312378, + "train_acc": 0.83388, + "test_loss": 2.397841025161743, + "test_acc": 0.4966, + "lyapunov": 1.9220011475141092, + "grad_norm": 0.7416005314030649, + "grad_max_sv": 0.31333489045500756, + "grad_min_sv": 1.331565547381744e-08, + "grad_condition": 415186471.2442873, + "lr": 0.0004999999999999996, + "time_sec": 41.73826336860657 + }, + { + "epoch": 76, + "train_loss": 0.5300501476287842, + "train_acc": 0.8323, + "test_loss": 2.5804484046936036, + "test_acc": 0.4727, + "lyapunov": 1.9251569838779967, + "grad_norm": 0.7507739522438411, + "grad_max_sv": 0.3152198389172554, + "grad_min_sv": 1.327232550621686e-08, + "grad_condition": 3546860698.254091, + "lr": 0.0004895287900583212, + "time_sec": 41.737696170806885 + }, + { + "epoch": 77, + "train_loss": 0.5159329537963867, + "train_acc": 0.83542, + "test_loss": 2.4313048795700074, + "test_acc": 0.4913, + "lyapunov": 1.925811360559195, + "grad_norm": 0.7427051247628867, + "grad_max_sv": 0.319369000941515, + "grad_min_sv": 1.315879346250326e-08, + "grad_condition": 136344488.07483166, + "lr": 0.0004790621731353997, + "time_sec": 41.74639177322388 + }, + { + "epoch": 78, + "train_loss": 0.5110208293533325, + "train_acc": 0.83718, + "test_loss": 2.6526639022827148, + "test_acc": 0.4722, + "lyapunov": 1.9213380045293238, + "grad_norm": 0.7375218819003904, + "grad_max_sv": 0.32032484784722326, + "grad_min_sv": 1.3357332261446086e-08, + "grad_condition": 124809479.79969828, + "lr": 0.000468604740235343, + "time_sec": 41.75381779670715 + }, + { + "epoch": 79, + "train_loss": 0.4978685107421875, + "train_acc": 0.84272, + "test_loss": 2.5780771820068358, + "test_acc": 0.4824, + "lyapunov": 1.9186263599664048, + "grad_norm": 0.7297066594126903, + "grad_max_sv": 0.3142619103193283, + "grad_min_sv": 1.2722505653497973e-08, + "grad_condition": 79029553.67487936, + "lr": 0.00045816107833384175, + "time_sec": 41.72344255447388 + }, + { + "epoch": 80, + "train_loss": 0.49247674268722536, + "train_acc": 0.84458, + "test_loss": 2.5446572189331054, + "test_acc": 0.4799, + "lyapunov": 1.9232349865271916, + "grad_norm": 0.7275951858607266, + "grad_max_sv": 0.3104961056262255, + "grad_min_sv": 1.3169045832983617e-08, + "grad_condition": 248307092.67052037, + "lr": 0.0004477357683661729, + "time_sec": 41.76416063308716 + }, + { + "epoch": 81, + "train_loss": 0.48337669410705564, + "train_acc": 0.84848, + "test_loss": 2.5547529037475587, + "test_acc": 0.4899, + "lyapunov": 1.9256743460969852, + "grad_norm": 0.7207093399917843, + "grad_max_sv": 0.304505006223917, + "grad_min_sv": 1.2912396260989639e-08, + "grad_condition": 761193569.252575, + "lr": 0.00043733338321784746, + "time_sec": 41.735899925231934 + }, + { + "epoch": 82, + "train_loss": 0.47038244450569155, + "train_acc": 0.85108, + "test_loss": 2.644123673629761, + "test_acc": 0.4786, + "lyapunov": 1.930096074443339, + "grad_norm": 0.7144800079200238, + "grad_max_sv": 0.2952072460204363, + "grad_min_sv": 1.2669713050743325e-08, + "grad_condition": 114675121.44426188, + "lr": 0.0004269584857187939, + "time_sec": 41.7294647693634 + }, + { + "epoch": 83, + "train_loss": 0.4745187729072571, + "train_acc": 0.8504, + "test_loss": 2.425137010765076, + "test_acc": 0.5084, + "lyapunov": 1.9276282580002495, + "grad_norm": 0.7212549588812428, + "grad_max_sv": 0.30666181854903696, + "grad_min_sv": 1.3082162746429378e-08, + "grad_condition": 904844779.252668, + "lr": 0.0004166156266419484, + "time_sec": 41.81492853164673 + }, + { + "epoch": 84, + "train_loss": 0.4549512226009369, + "train_acc": 0.85492, + "test_loss": 2.538830058670044, + "test_acc": 0.4869, + "lyapunov": 1.9258351478430316, + "grad_norm": 0.7060628623584708, + "grad_max_sv": 0.3005705580115318, + "grad_min_sv": 1.2579670287090131e-08, + "grad_condition": 581415836.450834, + "lr": 0.0004063093427071373, + "time_sec": 41.79721474647522 + }, + { + "epoch": 85, + "train_loss": 0.4378455565452576, + "train_acc": 0.86152, + "test_loss": 2.403009338760376, + "test_acc": 0.5053, + "lyapunov": 1.9211271891508566, + "grad_norm": 0.6915986515440182, + "grad_max_sv": 0.29778869934380053, + "grad_min_sv": 1.2116298254809255e-08, + "grad_condition": 168424059.958263, + "lr": 0.0003960441545911199, + "time_sec": 41.778464555740356 + }, + { + "epoch": 86, + "train_loss": 0.44116118485450745, + "train_acc": 0.8581, + "test_loss": 2.5981835475921633, + "test_acc": 0.4849, + "lyapunov": 1.9242132054570387, + "grad_norm": 0.695658599371694, + "grad_max_sv": 0.3008798252791166, + "grad_min_sv": 1.2512174167936263e-08, + "grad_condition": 90708710.16389017, + "lr": 0.0003858245649446718, + "time_sec": 41.74471735954285 + }, + { + "epoch": 87, + "train_loss": 0.4308753871154785, + "train_acc": 0.86306, + "test_loss": 2.6437651992797853, + "test_acc": 0.4849, + "lyapunov": 1.9249147149303076, + "grad_norm": 0.6871040939444923, + "grad_max_sv": 0.2963280539959669, + "grad_min_sv": 1.2314203955317294e-08, + "grad_condition": 235479442.6243511, + "lr": 0.00037565505641757235, + "time_sec": 41.74060416221619 + }, + { + "epoch": 88, + "train_loss": 0.42922929346084593, + "train_acc": 0.8624, + "test_loss": 2.7029798751831056, + "test_acc": 0.4783, + "lyapunov": 1.9280765681620449, + "grad_norm": 0.6902892364270126, + "grad_max_sv": 0.29961013570427897, + "grad_min_sv": 1.2467451820583065e-08, + "grad_condition": 83771929.29604985, + "lr": 0.00036554008969236695, + "time_sec": 41.73495125770569 + }, + { + "epoch": 89, + "train_loss": 0.42102145546913144, + "train_acc": 0.8664, + "test_loss": 2.652896765899658, + "test_acc": 0.4788, + "lyapunov": 1.9265515252452372, + "grad_norm": 0.6826413064481601, + "grad_max_sv": 0.28691675662994387, + "grad_min_sv": 1.2127424076427418e-08, + "grad_condition": 95695289.58802594, + "lr": 0.0003554841015277638, + "time_sec": 41.7242865562439 + }, + { + "epoch": 90, + "train_loss": 0.41206748454093933, + "train_acc": 0.86824, + "test_loss": 2.6346706451416018, + "test_acc": 0.4864, + "lyapunov": 1.9194746419901738, + "grad_norm": 0.673396257277482, + "grad_max_sv": 0.29285924062132834, + "grad_min_sv": 1.1979546579721224e-08, + "grad_condition": 109743659.6901602, + "lr": 0.000345491502812526, + "time_sec": 41.755749225616455 + }, + { + "epoch": 91, + "train_loss": 0.4055181764316559, + "train_acc": 0.87004, + "test_loss": 2.6682676147460938, + "test_acc": 0.491, + "lyapunov": 1.9270745613385953, + "grad_norm": 0.6709435953060504, + "grad_max_sv": 0.2939354989677668, + "grad_min_sv": 1.235212860437214e-08, + "grad_condition": 1190331582.4196603, + "lr": 0.0003355666766307081, + "time_sec": 41.775524854660034 + }, + { + "epoch": 92, + "train_loss": 0.40252040519714355, + "train_acc": 0.8713, + "test_loss": 2.8629150386810305, + "test_acc": 0.4675, + "lyapunov": 1.9212740391416623, + "grad_norm": 0.6682127031915542, + "grad_max_sv": 0.2836850434541702, + "grad_min_sv": 1.1869678317143196e-08, + "grad_condition": 291933170.3921443, + "lr": 0.00032571397633909225, + "time_sec": 41.75170874595642 + }, + { + "epoch": 93, + "train_loss": 0.3905279335021973, + "train_acc": 0.87384, + "test_loss": 2.869659869003296, + "test_acc": 0.4716, + "lyapunov": 1.9229713644822846, + "grad_norm": 0.662730757253173, + "grad_max_sv": 0.286379961296916, + "grad_min_sv": 1.1959134642975343e-08, + "grad_condition": 1480240895.0819964, + "lr": 0.00031593772365766094, + "time_sec": 41.732693672180176 + }, + { + "epoch": 94, + "train_loss": 0.38746253270149233, + "train_acc": 0.87604, + "test_loss": 2.7872890632629392, + "test_acc": 0.4755, + "lyapunov": 1.9311103025055907, + "grad_norm": 0.6611852629580202, + "grad_max_sv": 0.2878059033304453, + "grad_min_sv": 1.2017589580599637e-08, + "grad_condition": 1407737610.2401586, + "lr": 0.0003062422067739483, + "time_sec": 41.764424085617065 + }, + { + "epoch": 95, + "train_loss": 0.37622571551322936, + "train_acc": 0.8805, + "test_loss": 2.7488246644973753, + "test_acc": 0.4812, + "lyapunov": 1.9282519402711287, + "grad_norm": 0.650610171245445, + "grad_max_sv": 0.27731936909258365, + "grad_min_sv": 1.1181425138865816e-08, + "grad_condition": 541851565.3391017, + "lr": 0.00029663167846209965, + "time_sec": 41.73838663101196 + }, + { + "epoch": 96, + "train_loss": 0.3805333632850647, + "train_acc": 0.87832, + "test_loss": 2.7933618152618407, + "test_acc": 0.4737, + "lyapunov": 1.9210287707540996, + "grad_norm": 0.6546558120083016, + "grad_max_sv": 0.293675172701478, + "grad_min_sv": 1.1850324428160217e-08, + "grad_condition": 1899448088.2640438, + "lr": 0.00028711035421746345, + "time_sec": 41.75114345550537 + }, + { + "epoch": 97, + "train_loss": 0.3698344562911987, + "train_acc": 0.8821, + "test_loss": 2.626072149658203, + "test_acc": 0.4933, + "lyapunov": 1.9215583484191114, + "grad_norm": 0.6455625049641249, + "grad_max_sv": 0.2753082763403654, + "grad_min_sv": 1.140981761606208e-08, + "grad_condition": 102441123.60054779, + "lr": 0.00027768241040753615, + "time_sec": 41.779812812805176 + }, + { + "epoch": 98, + "train_loss": 0.36370936042785645, + "train_acc": 0.8827, + "test_loss": 2.7376982440948487, + "test_acc": 0.4819, + "lyapunov": 1.9254729970336875, + "grad_norm": 0.6429896465869342, + "grad_max_sv": 0.275909772887826, + "grad_min_sv": 1.1198205342871636e-08, + "grad_condition": 96379650.54540862, + "lr": 0.00026835198244006903, + "time_sec": 41.74297332763672 + }, + { + "epoch": 99, + "train_loss": 0.35008830539703367, + "train_acc": 0.88708, + "test_loss": 2.672455603027344, + "test_acc": 0.4932, + "lyapunov": 1.925299749349999, + "grad_norm": 0.63374512447599, + "grad_max_sv": 0.2778238713741302, + "grad_min_sv": 1.1432909302220781e-08, + "grad_condition": 362637559.40708697, + "lr": 0.0002591231629491421, + "time_sec": 41.739681243896484 + }, + { + "epoch": 100, + "train_loss": 0.3549016403007507, + "train_acc": 0.88744, + "test_loss": 2.7878278060913084, + "test_acc": 0.4803, + "lyapunov": 1.9233372269384086, + "grad_norm": 0.6389150356661637, + "grad_max_sv": 0.27901838831603526, + "grad_min_sv": 1.1473734666788684e-08, + "grad_condition": 2639061362.898227, + "lr": 0.0002499999999999997, + "time_sec": 41.74522304534912 + }, + { + "epoch": 101, + "train_loss": 0.34493496802330015, + "train_acc": 0.88894, + "test_loss": 2.78032173538208, + "test_acc": 0.4838, + "lyapunov": 1.9269454619463753, + "grad_norm": 0.6295472923198826, + "grad_max_sv": 0.2820887628942728, + "grad_min_sv": 1.1113912810022109e-08, + "grad_condition": 624324453.2508206, + "lr": 0.00024098649531343477, + "time_sec": 41.743125915527344 + }, + { + "epoch": 102, + "train_loss": 0.3421867981338501, + "train_acc": 0.89074, + "test_loss": 2.7059894664764403, + "test_acc": 0.4876, + "lyapunov": 1.9258580113310948, + "grad_norm": 0.628687088973467, + "grad_max_sv": 0.2694883894175291, + "grad_min_sv": 1.0822553434680638e-08, + "grad_condition": 46651489.8878482, + "lr": 0.0002320866025105016, + "time_sec": 41.76480436325073 + }, + { + "epoch": 103, + "train_loss": 0.3384503825998306, + "train_acc": 0.89086, + "test_loss": 2.8318667066574097, + "test_acc": 0.4741, + "lyapunov": 1.9292250283233954, + "grad_norm": 0.6271743664174141, + "grad_max_sv": 0.2730583131313324, + "grad_min_sv": 1.1385578555065008e-08, + "grad_condition": 563435206.0433385, + "lr": 0.0002233042253783278, + "time_sec": 41.741034269332886 + }, + { + "epoch": 104, + "train_loss": 0.33336328342437743, + "train_acc": 0.89252, + "test_loss": 2.634573328399658, + "test_acc": 0.4951, + "lyapunov": 1.931383354279696, + "grad_norm": 0.6210016202001825, + "grad_max_sv": 0.27210688553750517, + "grad_min_sv": 1.1000466340616021e-08, + "grad_condition": 92010665.89314088, + "lr": 0.000214643216157784, + "time_sec": 41.75269269943237 + }, + { + "epoch": 105, + "train_loss": 0.3197405033969879, + "train_acc": 0.899, + "test_loss": 2.884822589111328, + "test_acc": 0.4682, + "lyapunov": 1.9301893150105196, + "grad_norm": 0.609586933280062, + "grad_max_sv": 0.27548312693834304, + "grad_min_sv": 1.118888890011549e-08, + "grad_condition": 131626322.2514697, + "lr": 0.00020610737385376332, + "time_sec": 41.73700475692749 + }, + { + "epoch": 106, + "train_loss": 0.3236599215316772, + "train_acc": 0.89716, + "test_loss": 2.7713792285919188, + "test_acc": 0.488, + "lyapunov": 1.9288730526824132, + "grad_norm": 0.6135037710408716, + "grad_max_sv": 0.2704245876520872, + "grad_min_sv": 1.085851556751824e-08, + "grad_condition": 215829565.18721938, + "lr": 0.00019770044256881242, + "time_sec": 41.75580883026123 + }, + { + "epoch": 107, + "train_loss": 0.3160914605522156, + "train_acc": 0.89788, + "test_loss": 2.76917931137085, + "test_acc": 0.488, + "lyapunov": 1.9280755730236279, + "grad_norm": 0.606491129447243, + "grad_max_sv": 0.26502735577523706, + "grad_min_sv": 1.0846700593866027e-08, + "grad_condition": 610346687.9366983, + "lr": 0.0001894261098608447, + "time_sec": 41.76302671432495 + }, + { + "epoch": 108, + "train_loss": 0.3119147304725647, + "train_acc": 0.90094, + "test_loss": 2.7750482391357423, + "test_acc": 0.4835, + "lyapunov": 1.9312091818855852, + "grad_norm": 0.6043924060421743, + "grad_max_sv": 0.274587269499898, + "grad_min_sv": 1.0853883777514617e-08, + "grad_condition": 170249620.6656044, + "lr": 0.000181288005125655, + "time_sec": 41.80406713485718 + }, + { + "epoch": 109, + "train_loss": 0.31209370684623716, + "train_acc": 0.90148, + "test_loss": 2.8157909286499025, + "test_acc": 0.4794, + "lyapunov": 1.9337092665455224, + "grad_norm": 0.6050202865224388, + "grad_max_sv": 0.2639197990298271, + "grad_min_sv": 1.0996519571445859e-08, + "grad_condition": 575625785.574527, + "lr": 0.0001732896980049473, + "time_sec": 41.73463416099548 + }, + { + "epoch": 110, + "train_loss": 0.3082316113948822, + "train_acc": 0.90204, + "test_loss": 2.702104316520691, + "test_acc": 0.489, + "lyapunov": 1.9290470900133139, + "grad_norm": 0.6042001043838351, + "grad_max_sv": 0.2752346571534872, + "grad_min_sv": 1.0839321291054859e-08, + "grad_condition": 250403471.48285875, + "lr": 0.00016543469682057076, + "time_sec": 41.76645040512085 + }, + { + "epoch": 111, + "train_loss": 0.30120701184272763, + "train_acc": 0.90372, + "test_loss": 2.748506890106201, + "test_acc": 0.4882, + "lyapunov": 1.9334574395128528, + "grad_norm": 0.5954562498399162, + "grad_max_sv": 0.2545849312096834, + "grad_min_sv": 1.070429428322913e-08, + "grad_condition": 664921377.0965778, + "lr": 0.00015772644703565552, + "time_sec": 41.757800579071045 + }, + { + "epoch": 112, + "train_loss": 0.296090919880867, + "train_acc": 0.90562, + "test_loss": 2.8513975952148436, + "test_acc": 0.4822, + "lyapunov": 1.9362541113972969, + "grad_norm": 0.5909410329046563, + "grad_max_sv": 0.2773400656878948, + "grad_min_sv": 1.0838356696504792e-08, + "grad_condition": 251394061.463588, + "lr": 0.00015016832974331713, + "time_sec": 41.770912170410156 + }, + { + "epoch": 113, + "train_loss": 0.2947556733894348, + "train_acc": 0.90598, + "test_loss": 2.7514869749069213, + "test_acc": 0.4896, + "lyapunov": 1.9318870656630571, + "grad_norm": 0.5943988573865283, + "grad_max_sv": 0.27221206203103065, + "grad_min_sv": 1.0821243565713873e-08, + "grad_condition": 302031136.5804342, + "lr": 0.00014276366018359834, + "time_sec": 41.773146629333496 + }, + { + "epoch": 114, + "train_loss": 0.29452732785224917, + "train_acc": 0.90454, + "test_loss": 2.858088223838806, + "test_acc": 0.48, + "lyapunov": 1.9324586171933147, + "grad_norm": 0.593702860983604, + "grad_max_sv": 0.2621223747730255, + "grad_min_sv": 1.0779565017985998e-08, + "grad_condition": 3257642951.5839953, + "lr": 0.00013551568628929425, + "time_sec": 41.75748801231384 + }, + { + "epoch": 115, + "train_loss": 0.2846847169780731, + "train_acc": 0.90822, + "test_loss": 2.8158035331726072, + "test_acc": 0.4877, + "lyapunov": 1.938668950134531, + "grad_norm": 0.5835151609835706, + "grad_max_sv": 0.26009339913725854, + "grad_min_sv": 1.0696786583233586e-08, + "grad_condition": 111398610.47337827, + "lr": 0.00012842758726130276, + "time_sec": 41.738929271698 + }, + { + "epoch": 116, + "train_loss": 0.286880124874115, + "train_acc": 0.90824, + "test_loss": 2.9191000652313233, + "test_acc": 0.4748, + "lyapunov": 1.9339045792284524, + "grad_norm": 0.5858453870641945, + "grad_max_sv": 0.2665789842605591, + "grad_min_sv": 1.0711847837202841e-08, + "grad_condition": 1320713444.8020804, + "lr": 0.0001215024721741218, + "time_sec": 41.768064737319946 + }, + { + "epoch": 117, + "train_loss": 0.27806476739883423, + "train_acc": 0.91212, + "test_loss": 2.9575212314605714, + "test_acc": 0.466, + "lyapunov": 1.9268688045804152, + "grad_norm": 0.5769703196978114, + "grad_max_sv": 0.2631434515118599, + "grad_min_sv": 1.0619501080583182e-08, + "grad_condition": 176638250.39521796, + "lr": 0.00011474337861210538, + "time_sec": 41.77944993972778 + }, + { + "epoch": 118, + "train_loss": 0.28147749565124514, + "train_acc": 0.90956, + "test_loss": 2.902259288787842, + "test_acc": 0.4773, + "lyapunov": 1.926734477052908, + "grad_norm": 0.5830821972377033, + "grad_max_sv": 0.2594000995159149, + "grad_min_sv": 1.0544785641018739e-08, + "grad_condition": 689316939.9163088, + "lr": 0.00010815327133708009, + "time_sec": 41.77560567855835 + }, + { + "epoch": 119, + "train_loss": 0.2722447591972351, + "train_acc": 0.91258, + "test_loss": 2.931415486526489, + "test_acc": 0.4709, + "lyapunov": 1.9345182488336587, + "grad_norm": 0.572763731033364, + "grad_max_sv": 0.2539283610880375, + "grad_min_sv": 1.0309096255833612e-08, + "grad_condition": 1377511789.4658034, + "lr": 0.00010173504098790182, + "time_sec": 41.76324152946472 + }, + { + "epoch": 120, + "train_loss": 0.27617920718193056, + "train_acc": 0.91258, + "test_loss": 2.973516095352173, + "test_acc": 0.4674, + "lyapunov": 1.925510235149842, + "grad_norm": 0.5773926888156061, + "grad_max_sv": 0.2658484969288111, + "grad_min_sv": 1.0499199683570646e-08, + "grad_condition": 374501076.1017169, + "lr": 9.549150281252629e-05, + "time_sec": 41.767186403274536 + }, + { + "epoch": 121, + "train_loss": 0.27251530948638913, + "train_acc": 0.91296, + "test_loss": 2.8450429317474364, + "test_acc": 0.4802, + "lyapunov": 1.9281866379711023, + "grad_norm": 0.5717886428343918, + "grad_max_sv": 0.2499128393828869, + "grad_min_sv": 1.0331575387616601e-08, + "grad_condition": 434199923.9134222, + "lr": 8.942539543314794e-05, + "time_sec": 42.006184816360474 + }, + { + "epoch": 122, + "train_loss": 0.2621309459686279, + "train_acc": 0.91672, + "test_loss": 2.9349596824645996, + "test_acc": 0.4718, + "lyapunov": 1.9293642839812257, + "grad_norm": 0.5633585392065859, + "grad_max_sv": 0.2584250021725893, + "grad_min_sv": 1.0407827803239622e-08, + "grad_condition": 156669157.0178101, + "lr": 8.353937964495024e-05, + "time_sec": 41.74145746231079 + }, + { + "epoch": 123, + "train_loss": 0.2615852005672455, + "train_acc": 0.91608, + "test_loss": 2.7961125595092775, + "test_acc": 0.4893, + "lyapunov": 1.9358660528422011, + "grad_norm": 0.5637925697976807, + "grad_max_sv": 0.25874742604792117, + "grad_min_sv": 1.032914649661985e-08, + "grad_condition": 1660430573.0575848, + "lr": 7.783603724899243e-05, + "time_sec": 41.76014065742493 + }, + { + "epoch": 124, + "train_loss": 0.26532973320961, + "train_acc": 0.91602, + "test_loss": 2.8865388355255126, + "test_acc": 0.4822, + "lyapunov": 1.934482484522378, + "grad_norm": 0.5661055598868787, + "grad_max_sv": 0.253901906684041, + "grad_min_sv": 1.037683180745222e-08, + "grad_condition": 461832455.3376358, + "lr": 7.231786991974666e-05, + "time_sec": 41.72244453430176 + }, + { + "epoch": 125, + "train_loss": 0.26151716954231263, + "train_acc": 0.91778, + "test_loss": 2.8506041109085083, + "test_acc": 0.4845, + "lyapunov": 1.9337351691082616, + "grad_norm": 0.5623776376124604, + "grad_max_sv": 0.24803672395646573, + "grad_min_sv": 9.977197801182975e-09, + "grad_condition": 220737122.69380316, + "lr": 6.698729810778072e-05, + "time_sec": 41.73867464065552 + }, + { + "epoch": 126, + "train_loss": 0.2597654493045807, + "train_acc": 0.91768, + "test_loss": 2.8917087631225584, + "test_acc": 0.4821, + "lyapunov": 1.9302716776538078, + "grad_norm": 0.5629102340404084, + "grad_max_sv": 0.2492838267236948, + "grad_min_sv": 1.0013882490236825e-08, + "grad_condition": 476014349.4220117, + "lr": 6.184665997806817e-05, + "time_sec": 41.76627588272095 + }, + { + "epoch": 127, + "train_loss": 0.25805088083267214, + "train_acc": 0.91756, + "test_loss": 2.8765572607040406, + "test_acc": 0.4834, + "lyapunov": 1.9315851753020226, + "grad_norm": 0.5592154441844838, + "grad_max_sv": 0.2544619936496019, + "grad_min_sv": 1.0077015917086923e-08, + "grad_condition": 783149549.4386375, + "lr": 5.6898210384392595e-05, + "time_sec": 41.87174725532532 + }, + { + "epoch": 128, + "train_loss": 0.2577546704006195, + "train_acc": 0.91874, + "test_loss": 3.0074226676940916, + "test_acc": 0.471, + "lyapunov": 1.934407904629817, + "grad_norm": 0.5594357059695831, + "grad_max_sv": 0.25228654518723487, + "grad_min_sv": 1.0156657575058087e-08, + "grad_condition": 1008188371.837209, + "lr": 5.214411988029363e-05, + "time_sec": 41.916406869888306 + }, + { + "epoch": 129, + "train_loss": 0.25312234355926516, + "train_acc": 0.9199, + "test_loss": 2.8548696338653565, + "test_acc": 0.4856, + "lyapunov": 1.9328541795311072, + "grad_norm": 0.555008814003618, + "grad_max_sv": 0.2534768160432577, + "grad_min_sv": 1.0178250110966237e-08, + "grad_condition": 143839991.3649338, + "lr": 4.7586473766990294e-05, + "time_sec": 41.82679748535156 + }, + { + "epoch": 130, + "train_loss": 0.250835018787384, + "train_acc": 0.91954, + "test_loss": 2.906131639289856, + "test_acc": 0.4791, + "lyapunov": 1.9312424421920191, + "grad_norm": 0.5528140940454066, + "grad_max_sv": 0.2588647808879614, + "grad_min_sv": 1.0268260352414017e-08, + "grad_condition": 509072962.47948426, + "lr": 4.32272711786996e-05, + "time_sec": 41.91203331947327 + }, + { + "epoch": 131, + "train_loss": 0.25008735834121704, + "train_acc": 0.92054, + "test_loss": 2.92816100769043, + "test_acc": 0.4772, + "lyapunov": 1.9284685694653054, + "grad_norm": 0.5548065863249975, + "grad_max_sv": 0.2578789483755827, + "grad_min_sv": 9.949257935831097e-09, + "grad_condition": 323013200.7705888, + "lr": 3.906842420574966e-05, + "time_sec": 41.81468987464905 + }, + { + "epoch": 132, + "train_loss": 0.24849324222564698, + "train_acc": 0.92134, + "test_loss": 2.8456837230682375, + "test_acc": 0.4816, + "lyapunov": 1.9316642177684227, + "grad_norm": 0.55172841455075, + "grad_max_sv": 0.250290111079812, + "grad_min_sv": 9.853710934964316e-09, + "grad_condition": 322476561.6918553, + "lr": 3.5111757055874305e-05, + "time_sec": 41.77635145187378 + }, + { + "epoch": 133, + "train_loss": 0.24915866560935973, + "train_acc": 0.92132, + "test_loss": 2.901075325012207, + "test_acc": 0.4789, + "lyapunov": 1.9320397776411014, + "grad_norm": 0.5474895998750056, + "grad_max_sv": 0.24624281339347362, + "grad_min_sv": 9.830540990182074e-09, + "grad_condition": 623620626.9707788, + "lr": 3.1359005254054254e-05, + "time_sec": 41.84829306602478 + }, + { + "epoch": 134, + "train_loss": 0.24534906030654907, + "train_acc": 0.92328, + "test_loss": 2.85434139919281, + "test_acc": 0.485, + "lyapunov": 1.930702987534311, + "grad_norm": 0.5483867358779149, + "grad_max_sv": 0.25784828178584573, + "grad_min_sv": 1.0019850669020035e-08, + "grad_condition": 3586444175.3568053, + "lr": 2.7811814881259484e-05, + "time_sec": 41.77039647102356 + }, + { + "epoch": 135, + "train_loss": 0.24960718570709228, + "train_acc": 0.92082, + "test_loss": 2.9888268871307373, + "test_acc": 0.4742, + "lyapunov": 1.929203321561789, + "grad_norm": 0.5527946736547813, + "grad_max_sv": 0.2546125616878271, + "grad_min_sv": 1.0004818609351835e-08, + "grad_condition": 1860575432.817696, + "lr": 2.4471741852423218e-05, + "time_sec": 41.771665811538696 + }, + { + "epoch": 136, + "train_loss": 0.24571303916931153, + "train_acc": 0.92212, + "test_loss": 2.855561435317993, + "test_acc": 0.4836, + "lyapunov": 1.9275208034783677, + "grad_norm": 0.5483578499169555, + "grad_max_sv": 0.2608003545552492, + "grad_min_sv": 1.0308928769832416e-08, + "grad_condition": 157360659.1727987, + "lr": 2.1340251233966362e-05, + "time_sec": 41.765148401260376 + }, + { + "epoch": 137, + "train_loss": 0.2372880220603943, + "train_acc": 0.9246, + "test_loss": 2.8222301815032957, + "test_acc": 0.4912, + "lyapunov": 1.9333144886719296, + "grad_norm": 0.5405053222263085, + "grad_max_sv": 0.2489485152065754, + "grad_min_sv": 9.955221673754732e-09, + "grad_condition": 144936356.89202416, + "lr": 1.8418716601170932e-05, + "time_sec": 41.924315214157104 + }, + { + "epoch": 138, + "train_loss": 0.24242675877571107, + "train_acc": 0.923, + "test_loss": 2.9303861391067505, + "test_acc": 0.4749, + "lyapunov": 1.9311096826782617, + "grad_norm": 0.5452114116385087, + "grad_max_sv": 0.2530204698443413, + "grad_min_sv": 9.918986039556682e-09, + "grad_condition": 493617409.4262516, + "lr": 1.570841943568445e-05, + "time_sec": 41.81815791130066 + }, + { + "epoch": 139, + "train_loss": 0.2430030436182022, + "train_acc": 0.92424, + "test_loss": 3.007392513656616, + "test_acc": 0.4702, + "lyapunov": 1.925496112355186, + "grad_norm": 0.5452105368622537, + "grad_max_sv": 0.2529194738715887, + "grad_min_sv": 1.0028199618448974e-08, + "grad_condition": 155790807.15890232, + "lr": 1.3210548563419845e-05, + "time_sec": 41.84099984169006 + }, + { + "epoch": 140, + "train_loss": 0.2422716226863861, + "train_acc": 0.92382, + "test_loss": 2.854384679031372, + "test_acc": 0.4826, + "lyapunov": 1.9280666451320014, + "grad_norm": 0.5442266316973285, + "grad_max_sv": 0.2506759535521269, + "grad_min_sv": 9.808605576019924e-09, + "grad_condition": 133627211.11637631, + "lr": 1.0926199633097203e-05, + "time_sec": 41.865853786468506 + }, + { + "epoch": 141, + "train_loss": 0.24081885069847106, + "train_acc": 0.9238, + "test_loss": 2.7676011840820314, + "test_acc": 0.4943, + "lyapunov": 1.9324955101818075, + "grad_norm": 0.5425632444902094, + "grad_max_sv": 0.2467295128852129, + "grad_min_sv": 9.574480816162967e-09, + "grad_condition": 576306909.6284522, + "lr": 8.856374635655688e-06, + "time_sec": 41.76636242866516 + }, + { + "epoch": 142, + "train_loss": 0.24086300157546997, + "train_acc": 0.92522, + "test_loss": 2.8614378929138184, + "test_acc": 0.4836, + "lyapunov": 1.9337395066800325, + "grad_norm": 0.5404771137173922, + "grad_max_sv": 0.2464255016297102, + "grad_min_sv": 9.947362959207561e-09, + "grad_condition": 114228686.58834465, + "lr": 7.001981464747503e-06, + "time_sec": 41.761412620544434 + }, + { + "epoch": 143, + "train_loss": 0.2395897879266739, + "train_acc": 0.92414, + "test_loss": 2.896664640045166, + "test_acc": 0.478, + "lyapunov": 1.9352869106375652, + "grad_norm": 0.5416892903185835, + "grad_max_sv": 0.2529788102954626, + "grad_min_sv": 1.0238048510618353e-08, + "grad_condition": 1532576908.8286607, + "lr": 5.3638335185058295e-06, + "time_sec": 41.76142954826355 + }, + { + "epoch": 144, + "train_loss": 0.24413162813663483, + "train_acc": 0.92276, + "test_loss": 2.901497490310669, + "test_acc": 0.4825, + "lyapunov": 1.932041302971218, + "grad_norm": 0.5467390531621076, + "grad_max_sv": 0.25547480322420596, + "grad_min_sv": 1.001782952095992e-08, + "grad_condition": 1305106323.795214, + "lr": 3.942649342761114e-06, + "time_sec": 41.75995445251465 + }, + { + "epoch": 145, + "train_loss": 0.24082909001350403, + "train_acc": 0.9238, + "test_loss": 2.8805097682952883, + "test_acc": 0.4828, + "lyapunov": 1.9317203464410495, + "grad_norm": 0.5424165341158477, + "grad_max_sv": 0.24744903817772865, + "grad_min_sv": 9.918928221570172e-09, + "grad_condition": 331363007.2769295, + "lr": 2.7390523158633524e-06, + "time_sec": 41.773282051086426 + }, + { + "epoch": 146, + "train_loss": 0.2425065231323242, + "train_acc": 0.92434, + "test_loss": 2.8091441358566285, + "test_acc": 0.4894, + "lyapunov": 1.9370027018325102, + "grad_norm": 0.541973717932011, + "grad_max_sv": 0.25062944628298284, + "grad_min_sv": 9.777612066850205e-09, + "grad_condition": 683683044.9455674, + "lr": 1.7535703752478133e-06, + "time_sec": 41.779646158218384 + }, + { + "epoch": 147, + "train_loss": 0.243648607006073, + "train_acc": 0.92394, + "test_loss": 2.9627289031982422, + "test_acc": 0.4747, + "lyapunov": 1.9350933790816676, + "grad_norm": 0.5460094108296196, + "grad_max_sv": 0.25854056514799595, + "grad_min_sv": 1.0052750944698763e-08, + "grad_condition": 163297918.53123143, + "lr": 9.866357858642196e-07, + "time_sec": 41.752511978149414 + }, + { + "epoch": 148, + "train_loss": 0.24173086163520813, + "train_acc": 0.92284, + "test_loss": 2.897349497795105, + "test_acc": 0.4763, + "lyapunov": 1.934230356265212, + "grad_norm": 0.5430565308059258, + "grad_max_sv": 0.2540682602673769, + "grad_min_sv": 9.93330022628497e-09, + "grad_condition": 117573005.28624102, + "lr": 4.38584950570808e-07, + "time_sec": 41.760454416275024 + }, + { + "epoch": 149, + "train_loss": 0.23882179662227632, + "train_acc": 0.92438, + "test_loss": 2.773164476585388, + "test_acc": 0.4939, + "lyapunov": 1.9274460501073267, + "grad_norm": 0.5410357160833368, + "grad_max_sv": 0.24793715849518777, + "grad_min_sv": 1.0011503008122008e-08, + "grad_condition": 273235188.66167367, + "lr": 1.096582625772501e-07, + "time_sec": 41.756510972976685 + }, + { + "epoch": 150, + "train_loss": 0.23481016640663147, + "train_acc": 0.92526, + "test_loss": 2.940252774810791, + "test_acc": 0.4748, + "lyapunov": 1.9373228156658084, + "grad_norm": 0.5375246640619566, + "grad_max_sv": 0.24730135016143323, + "grad_min_sv": 9.855697390148688e-09, + "grad_condition": 100621205.51330084, + "lr": 0.0, + "time_sec": 41.74098205566406 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 5.039967026519776, + "train_acc": 0.0234, + "test_loss": 4.748602368164063, + "test_acc": 0.0246, + "lyapunov": 2.415693138566468, + "grad_norm": 5.6811829629604595, + "grad_max_sv": 4.614773678779602, + "grad_min_sv": 9.740753990072903e-08, + "grad_condition": 72131656.66698691, + "lr": 0.0009998903417374227, + "time_sec": 86.94209289550781 + }, + { + "epoch": 2, + "train_loss": 4.660584386291504, + "train_acc": 0.03056, + "test_loss": 4.660949175262451, + "test_acc": 0.0193, + "lyapunov": 2.0534968525552384, + "grad_norm": 3.9531656806343887, + "grad_max_sv": 3.2878769516944883, + "grad_min_sv": 7.153735092080282e-08, + "grad_condition": 55276484.92766464, + "lr": 0.0009995614150494292, + "time_sec": 86.9403190612793 + }, + { + "epoch": 3, + "train_loss": 4.518558804626465, + "train_acc": 0.03996, + "test_loss": 4.602233891296387, + "test_acc": 0.0216, + "lyapunov": 1.9753954017253788, + "grad_norm": 3.2461558800665022, + "grad_max_sv": 2.6165521502494813, + "grad_min_sv": 5.880856221995856e-08, + "grad_condition": 49165967.40808712, + "lr": 0.0009990133642141358, + "time_sec": 86.943772315979 + }, + { + "epoch": 4, + "train_loss": 4.400333577575684, + "train_acc": 0.04772, + "test_loss": 4.644777604675293, + "test_acc": 0.0185, + "lyapunov": 1.9347219668385927, + "grad_norm": 2.6695735080987517, + "grad_max_sv": 2.0608615189790727, + "grad_min_sv": 4.778128466914611e-08, + "grad_condition": 100833441.58651581, + "lr": 0.0009982464296247522, + "time_sec": 86.92900562286377 + }, + { + "epoch": 5, + "train_loss": 4.304982159423828, + "train_acc": 0.0577, + "test_loss": 4.64799471282959, + "test_acc": 0.0219, + "lyapunov": 1.9172774044144185, + "grad_norm": 2.212895811679079, + "grad_max_sv": 1.6046739518642426, + "grad_min_sv": 4.02720649161914e-08, + "grad_condition": 43918089.42599782, + "lr": 0.0009972609476841367, + "time_sec": 86.92955732345581 + }, + { + "epoch": 6, + "train_loss": 4.24821193572998, + "train_acc": 0.061, + "test_loss": 4.873469715118408, + "test_acc": 0.0157, + "lyapunov": 1.8960081256564012, + "grad_norm": 1.8434311476217744, + "grad_max_sv": 1.245962518453598, + "grad_min_sv": 3.368539798070946e-08, + "grad_condition": 71333711.70341551, + "lr": 0.000996057350657239, + "time_sec": 86.92592644691467 + }, + { + "epoch": 7, + "train_loss": 4.20261858505249, + "train_acc": 0.06626, + "test_loss": 5.144480117797851, + "test_acc": 0.0188, + "lyapunov": 1.88111193039838, + "grad_norm": 1.5313271927636798, + "grad_max_sv": 0.944209098815918, + "grad_min_sv": 2.798817304583423e-08, + "grad_condition": 39003783.16712481, + "lr": 0.000994636166481494, + "time_sec": 86.92185950279236 + }, + { + "epoch": 8, + "train_loss": 4.1438394500732425, + "train_acc": 0.0751, + "test_loss": 5.032337890625, + "test_acc": 0.0141, + "lyapunov": 1.8621377231519851, + "grad_norm": 1.3161558027962967, + "grad_max_sv": 0.7394168883562088, + "grad_min_sv": 2.3590278237090035e-08, + "grad_condition": 126443373.08524604, + "lr": 0.0009929980185352525, + "time_sec": 86.92974424362183 + }, + { + "epoch": 9, + "train_loss": 4.16818371459961, + "train_acc": 0.06928, + "test_loss": 4.927943510437012, + "test_acc": 0.0182, + "lyapunov": 1.809592140909961, + "grad_norm": 1.1597578429016548, + "grad_max_sv": 0.6403187781572341, + "grad_min_sv": 2.0104599846373917e-08, + "grad_condition": 111889878.19754401, + "lr": 0.0009911436253643444, + "time_sec": 86.95329403877258 + }, + { + "epoch": 10, + "train_loss": 4.111661215133667, + "train_acc": 0.07776, + "test_loss": 4.8633566635131835, + "test_acc": 0.016, + "lyapunov": 1.7768644954237487, + "grad_norm": 1.0165520732353868, + "grad_max_sv": 0.5169711500406265, + "grad_min_sv": 1.7817343992213018e-08, + "grad_condition": 107821917.2277194, + "lr": 0.0009890738003669028, + "time_sec": 86.95670914649963 + }, + { + "epoch": 11, + "train_loss": 4.0691275752258305, + "train_acc": 0.0855, + "test_loss": 4.7518052474975585, + "test_acc": 0.0169, + "lyapunov": 1.7679451768050718, + "grad_norm": 0.9493897318707837, + "grad_max_sv": 0.45400294065475466, + "grad_min_sv": 1.6694678489637128e-08, + "grad_condition": 31838708.54694582, + "lr": 0.00098678945143658, + "time_sec": 86.93720006942749 + }, + { + "epoch": 12, + "train_loss": 4.034702708816528, + "train_acc": 0.08814, + "test_loss": 5.479588261413574, + "test_acc": 0.0123, + "lyapunov": 1.7663455802156491, + "grad_norm": 0.8808410471680627, + "grad_max_sv": 0.3934314988553524, + "grad_min_sv": 1.5704706926578105e-08, + "grad_condition": 30835153.967395704, + "lr": 0.0009842915805643154, + "time_sec": 86.9490315914154 + }, + { + "epoch": 13, + "train_loss": 4.048135414123535, + "train_acc": 0.08836, + "test_loss": 4.974241854858398, + "test_acc": 0.0169, + "lyapunov": 1.7277408698025871, + "grad_norm": 0.81749912551401, + "grad_max_sv": 0.3647046275436878, + "grad_min_sv": 1.4469071707434723e-08, + "grad_condition": 32885789.444102954, + "lr": 0.000981581283398829, + "time_sec": 86.9477162361145 + }, + { + "epoch": 14, + "train_loss": 4.007062616577149, + "train_acc": 0.09308, + "test_loss": 5.175263416290283, + "test_acc": 0.0179, + "lyapunov": 1.7213959389025597, + "grad_norm": 0.8054334315170423, + "grad_max_sv": 0.35222369581460955, + "grad_min_sv": 1.444329909248976e-08, + "grad_condition": 139409691.4248375, + "lr": 0.0009786597487660333, + "time_sec": 86.96184515953064 + }, + { + "epoch": 15, + "train_loss": 3.9827566871643065, + "train_acc": 0.09794, + "test_loss": 5.18627349243164, + "test_acc": 0.0187, + "lyapunov": 1.693825739119059, + "grad_norm": 0.7837766909064864, + "grad_max_sv": 0.3384371198713779, + "grad_min_sv": 1.3973741483375157e-08, + "grad_condition": 50065133.66460046, + "lr": 0.0009755282581475766, + "time_sec": 86.94620490074158 + }, + { + "epoch": 16, + "train_loss": 3.9400778434753416, + "train_acc": 0.10408, + "test_loss": 4.960375379943848, + "test_acc": 0.0174, + "lyapunov": 1.6991827442213092, + "grad_norm": 0.7567286839010319, + "grad_max_sv": 0.312929293513298, + "grad_min_sv": 1.3506557952625008e-08, + "grad_condition": 29222307.9960937, + "lr": 0.0009721881851187403, + "time_sec": 86.91192412376404 + }, + { + "epoch": 17, + "train_loss": 3.9045276139831544, + "train_acc": 0.11088, + "test_loss": 5.235349552154541, + "test_acc": 0.0174, + "lyapunov": 1.6982373008337777, + "grad_norm": 0.7392884239500572, + "grad_max_sv": 0.3013958476483822, + "grad_min_sv": 1.3578178978401745e-08, + "grad_condition": 27215698.462923646, + "lr": 0.0009686409947459456, + "time_sec": 86.93992710113525 + }, + { + "epoch": 18, + "train_loss": 3.8835918949890136, + "train_acc": 0.1134, + "test_loss": 5.087286140441894, + "test_acc": 0.0195, + "lyapunov": 1.6984837890585975, + "grad_norm": 0.7186603276952775, + "grad_max_sv": 0.28467160686850546, + "grad_min_sv": 1.3039492818833764e-08, + "grad_condition": 26314799.87610542, + "lr": 0.0009648882429441254, + "time_sec": 86.9040048122406 + }, + { + "epoch": 19, + "train_loss": 3.8570830113983154, + "train_acc": 0.11826, + "test_loss": 6.674520197296142, + "test_acc": 0.0173, + "lyapunov": 1.6999077053021288, + "grad_norm": 0.7026232910975622, + "grad_max_sv": 0.27488165274262427, + "grad_min_sv": 1.283411938390877e-08, + "grad_condition": 26337722.201227866, + "lr": 0.00096093157579425, + "time_sec": 86.91653943061829 + }, + { + "epoch": 20, + "train_loss": 3.8434328467559813, + "train_acc": 0.121, + "test_loss": 7.015249626159668, + "test_acc": 0.0161, + "lyapunov": 1.693351267243895, + "grad_norm": 0.6879076559096091, + "grad_max_sv": 0.26263708993792534, + "grad_min_sv": 1.253635875664294e-08, + "grad_condition": 24660500.29128598, + "lr": 0.0009567727288213001, + "time_sec": 86.92068099975586 + }, + { + "epoch": 21, + "train_loss": 3.8179317529296877, + "train_acc": 0.1257, + "test_loss": 6.28823071899414, + "test_acc": 0.0185, + "lyapunov": 1.6938256860694008, + "grad_norm": 0.6757265173689927, + "grad_max_sv": 0.25746239386498926, + "grad_min_sv": 1.2419204706293208e-08, + "grad_condition": 25406294.540930398, + "lr": 0.0009524135262330095, + "time_sec": 86.93524384498596 + }, + { + "epoch": 22, + "train_loss": 3.8040669440460206, + "train_acc": 0.1284, + "test_loss": 8.06924171295166, + "test_acc": 0.0166, + "lyapunov": 1.6944642524280207, + "grad_norm": 0.6682498057483773, + "grad_max_sv": 0.24842105731368064, + "grad_min_sv": 1.2251500509236068e-08, + "grad_condition": 52595932.16292306, + "lr": 0.0009478558801197061, + "time_sec": 86.9219081401825 + }, + { + "epoch": 23, + "train_loss": 3.7754980906677247, + "train_acc": 0.13074, + "test_loss": 7.648980326843262, + "test_acc": 0.0179, + "lyapunov": 1.68954312892826, + "grad_norm": 0.6627552369735249, + "grad_max_sv": 0.24308762773871423, + "grad_min_sv": 1.2224439144281619e-08, + "grad_condition": 26069608.693543784, + "lr": 0.000943101789615607, + "time_sec": 86.92962980270386 + }, + { + "epoch": 24, + "train_loss": 3.757672622756958, + "train_acc": 0.13536, + "test_loss": 10.094123184204102, + "test_acc": 0.0136, + "lyapunov": 1.6893348980437763, + "grad_norm": 0.6509659030167023, + "grad_max_sv": 0.23957434706389905, + "grad_min_sv": 1.1972296423690132e-08, + "grad_condition": 35042882.52366346, + "lr": 0.0009381533400219313, + "time_sec": 86.94270205497742 + }, + { + "epoch": 25, + "train_loss": 3.745845176925659, + "train_acc": 0.1359, + "test_loss": 10.251738159179688, + "test_acc": 0.0109, + "lyapunov": 1.6898620018873678, + "grad_norm": 0.6431888749879414, + "grad_max_sv": 0.23203770853579045, + "grad_min_sv": 1.1944590111445664e-08, + "grad_condition": 23832395.262813084, + "lr": 0.0009330127018922189, + "time_sec": 86.90723633766174 + }, + { + "epoch": 26, + "train_loss": 3.757319142456055, + "train_acc": 0.13366, + "test_loss": 10.66865923614502, + "test_acc": 0.0146, + "lyapunov": 1.6835024338549056, + "grad_norm": 0.6410880035698076, + "grad_max_sv": 0.23329635970294477, + "grad_min_sv": 1.174126548486587e-08, + "grad_condition": 23303893.927329373, + "lr": 0.000927682130080253, + "time_sec": 86.91796827316284 + }, + { + "epoch": 27, + "train_loss": 3.7259509687805177, + "train_acc": 0.14096, + "test_loss": 11.372069906616211, + "test_acc": 0.0108, + "lyapunov": 1.6789292700760199, + "grad_norm": 0.637193430729985, + "grad_max_sv": 0.23361454606056214, + "grad_min_sv": 1.1879951530846533e-08, + "grad_condition": 22346839.26764655, + "lr": 0.0009221639627510072, + "time_sec": 86.91676592826843 + }, + { + "epoch": 28, + "train_loss": 3.698563914642334, + "train_acc": 0.14288, + "test_loss": 9.61096866607666, + "test_acc": 0.0175, + "lyapunov": 1.6802275357648844, + "grad_norm": 0.6369229701056937, + "grad_max_sv": 0.23090845197439194, + "grad_min_sv": 1.1949775535757822e-08, + "grad_condition": 24088097.27975302, + "lr": 0.0009164606203550494, + "time_sec": 86.93027591705322 + }, + { + "epoch": 29, + "train_loss": 3.6756981072235106, + "train_acc": 0.14616, + "test_loss": 7.848679396057129, + "test_acc": 0.0222, + "lyapunov": 1.677167893370704, + "grad_norm": 0.632152271917333, + "grad_max_sv": 0.23140450604259968, + "grad_min_sv": 1.177944211616655e-08, + "grad_condition": 28079672.887612868, + "lr": 0.0009105746045668516, + "time_sec": 86.92681694030762 + }, + { + "epoch": 30, + "train_loss": 3.720569337844849, + "train_acc": 0.14278, + "test_loss": 9.134829057312011, + "test_acc": 0.0199, + "lyapunov": 1.6958239910852573, + "grad_norm": 0.6124497377273601, + "grad_max_sv": 0.2226740188896656, + "grad_min_sv": 1.1438976671440671e-08, + "grad_condition": 43710559.09775521, + "lr": 0.0009045084971874733, + "time_sec": 86.95414066314697 + }, + { + "epoch": 31, + "train_loss": 3.681295146942139, + "train_acc": 0.14548, + "test_loss": 10.644169580078126, + "test_acc": 0.0148, + "lyapunov": 1.6929164042558207, + "grad_norm": 0.6160471255082475, + "grad_max_sv": 0.21768128015100957, + "grad_min_sv": 1.1538898583851597e-08, + "grad_condition": 25936536.78372231, + "lr": 0.0008982649590120977, + "time_sec": 86.9529333114624 + }, + { + "epoch": 32, + "train_loss": 3.649655858154297, + "train_acc": 0.15334, + "test_loss": 9.779230001831055, + "test_acc": 0.021, + "lyapunov": 1.700419718042359, + "grad_norm": 0.6173882196636933, + "grad_max_sv": 0.216496866568923, + "grad_min_sv": 1.1471159777620698e-08, + "grad_condition": 21546411.015841365, + "lr": 0.0008918467286629196, + "time_sec": 86.93373703956604 + }, + { + "epoch": 33, + "train_loss": 3.6238256622314453, + "train_acc": 0.15508, + "test_loss": 10.813010598754882, + "test_acc": 0.0186, + "lyapunov": 1.6949882888428085, + "grad_norm": 0.6156784672925573, + "grad_max_sv": 0.21453518383204936, + "grad_min_sv": 1.1543558284254907e-08, + "grad_condition": 24951627.83384871, + "lr": 0.0008852566213878943, + "time_sec": 86.92384076118469 + }, + { + "epoch": 34, + "train_loss": 3.6053655114746093, + "train_acc": 0.15724, + "test_loss": 9.250387573242188, + "test_acc": 0.0255, + "lyapunov": 1.695445427504342, + "grad_norm": 0.617504909683498, + "grad_max_sv": 0.21871747858822346, + "grad_min_sv": 1.1392037478630268e-08, + "grad_condition": 28052156.083601933, + "lr": 0.000878497527825878, + "time_sec": 86.95940613746643 + }, + { + "epoch": 35, + "train_loss": 3.6839909051513673, + "train_acc": 0.14544, + "test_loss": 12.814430276489258, + "test_acc": 0.0193, + "lyapunov": 1.6773092118675446, + "grad_norm": 0.5848508181366305, + "grad_max_sv": 0.2025191828608513, + "grad_min_sv": 1.0841579529442813e-08, + "grad_condition": 603233703.1966207, + "lr": 0.000871572412738697, + "time_sec": 86.93837785720825 + }, + { + "epoch": 36, + "train_loss": 3.651795174102783, + "train_acc": 0.15336, + "test_loss": 12.996923107910156, + "test_acc": 0.0169, + "lyapunov": 1.6706123025825872, + "grad_norm": 0.5876590475710954, + "grad_max_sv": 0.20529181137681007, + "grad_min_sv": 1.0850184412047881e-08, + "grad_condition": 56083508.24967704, + "lr": 0.0008644843137107055, + "time_sec": 86.96726322174072 + }, + { + "epoch": 37, + "train_loss": 3.620498941192627, + "train_acc": 0.15712, + "test_loss": 12.176803886413575, + "test_acc": 0.0229, + "lyapunov": 1.6697818211582311, + "grad_norm": 0.5856419520299609, + "grad_max_sv": 0.20430892258882521, + "grad_min_sv": 1.0912001915941439e-08, + "grad_condition": 27196656.907481592, + "lr": 0.0008572363398164014, + "time_sec": 86.96672797203064 + }, + { + "epoch": 38, + "train_loss": 3.677903451385498, + "train_acc": 0.1468, + "test_loss": 12.39649211730957, + "test_acc": 0.0144, + "lyapunov": 1.6644693802079886, + "grad_norm": 0.5783673224303225, + "grad_max_sv": 0.1985822133719921, + "grad_min_sv": 1.076888991730085e-08, + "grad_condition": 23536064.4273279, + "lr": 0.0008498316702566826, + "time_sec": 87.00131368637085 + }, + { + "epoch": 39, + "train_loss": 3.691991829376221, + "train_acc": 0.14584, + "test_loss": 11.931999853515626, + "test_acc": 0.0208, + "lyapunov": 1.6525612225008133, + "grad_norm": 0.5655243790126536, + "grad_max_sv": 0.19517179019749165, + "grad_min_sv": 1.04696434827245e-08, + "grad_condition": 51128562.33142143, + "lr": 0.0008422735529643442, + "time_sec": 87.03218030929565 + }, + { + "epoch": 40, + "train_loss": 3.662434649810791, + "train_acc": 0.14718, + "test_loss": 10.6877273147583, + "test_acc": 0.0134, + "lyapunov": 1.6567843743907216, + "grad_norm": 0.560115163053598, + "grad_max_sv": 0.1857254110276699, + "grad_min_sv": 1.0581942576359803e-08, + "grad_condition": 26626262.04447771, + "lr": 0.0008345653031794289, + "time_sec": 87.00236964225769 + }, + { + "epoch": 41, + "train_loss": 3.6978988871765135, + "train_acc": 0.14564, + "test_loss": 8.053759545898437, + "test_acc": 0.0127, + "lyapunov": 1.6674467590458864, + "grad_norm": 0.5635968355151927, + "grad_max_sv": 0.19086987487971782, + "grad_min_sv": 1.0342714669431263e-08, + "grad_condition": 60525350.06225469, + "lr": 0.0008267103019950526, + "time_sec": 86.98331022262573 + }, + { + "epoch": 42, + "train_loss": 3.7973634886932373, + "train_acc": 0.12868, + "test_loss": 7.096838776397705, + "test_acc": 0.0177, + "lyapunov": 1.6500295220738481, + "grad_norm": 0.5368482526961335, + "grad_max_sv": 0.17560299709439278, + "grad_min_sv": 9.971410369624678e-09, + "grad_condition": 21547551.84721183, + "lr": 0.0008187119948743447, + "time_sec": 86.9593575000763 + }, + { + "epoch": 43, + "train_loss": 3.760347054901123, + "train_acc": 0.13548, + "test_loss": 7.536987094879151, + "test_acc": 0.0166, + "lyapunov": 1.6433212754061766, + "grad_norm": 0.539360284345072, + "grad_max_sv": 0.18257700726389886, + "grad_min_sv": 9.841167401651584e-09, + "grad_condition": 136858195.99864033, + "lr": 0.000810573890139155, + "time_sec": 86.99102926254272 + }, + { + "epoch": 44, + "train_loss": 3.787106593475342, + "train_acc": 0.13046, + "test_loss": 11.951196694946288, + "test_acc": 0.0102, + "lyapunov": 1.6692767094468217, + "grad_norm": 0.5545505027239148, + "grad_max_sv": 0.17591703571379186, + "grad_min_sv": 9.760416913758007e-09, + "grad_condition": 105743782.14909813, + "lr": 0.0008022995574311873, + "time_sec": 87.00538802146912 + }, + { + "epoch": 45, + "train_loss": 3.977849741363525, + "train_acc": 0.09838, + "test_loss": 9.744494529724122, + "test_acc": 0.0107, + "lyapunov": 1.6796196854632834, + "grad_norm": 0.4973188576403794, + "grad_max_sv": 0.1785931583493948, + "grad_min_sv": 8.718851197964117e-09, + "grad_condition": 28913205.331663024, + "lr": 0.0007938926261462363, + "time_sec": 86.97129440307617 + }, + { + "epoch": 46, + "train_loss": 3.8713095574951173, + "train_acc": 0.11528, + "test_loss": 6.836954457855224, + "test_acc": 0.0136, + "lyapunov": 1.6516431606639073, + "grad_norm": 0.49363589472795627, + "grad_max_sv": 0.17069513574242592, + "grad_min_sv": 8.777947649307728e-09, + "grad_condition": 22630513.20924943, + "lr": 0.0007853567838422158, + "time_sec": 86.9545829296112 + }, + { + "epoch": 47, + "train_loss": 3.8064515753936767, + "train_acc": 0.12602, + "test_loss": 7.460648231506347, + "test_acc": 0.0118, + "lyapunov": 1.6438198812172542, + "grad_norm": 0.5024311046380698, + "grad_max_sv": 0.1723852265626192, + "grad_min_sv": 8.95505288672771e-09, + "grad_condition": 34224410.246411264, + "lr": 0.0007766957746216719, + "time_sec": 86.9643166065216 + }, + { + "epoch": 48, + "train_loss": 3.7720379662322996, + "train_acc": 0.12956, + "test_loss": 8.679229983520507, + "test_acc": 0.0126, + "lyapunov": 1.6496837785481797, + "grad_norm": 0.5043295950696797, + "grad_max_sv": 0.17149083018302919, + "grad_min_sv": 8.865516073623984e-09, + "grad_condition": 1222026243.8555462, + "lr": 0.0007679133974894982, + "time_sec": 86.97412467002869 + }, + { + "epoch": 49, + "train_loss": 3.751894903640747, + "train_acc": 0.13492, + "test_loss": 8.066148229980469, + "test_acc": 0.0123, + "lyapunov": 1.64509734961078, + "grad_norm": 0.49766714010424734, + "grad_max_sv": 0.17132410928606986, + "grad_min_sv": 9.049689823903417e-09, + "grad_condition": 24581412.475744545, + "lr": 0.000759013504686565, + "time_sec": 86.98210406303406 + }, + { + "epoch": 50, + "train_loss": 3.7796132605743407, + "train_acc": 0.12948, + "test_loss": 6.275712922668457, + "test_acc": 0.0123, + "lyapunov": 1.65870054542561, + "grad_norm": 0.4920202538672966, + "grad_max_sv": 0.16835491731762886, + "grad_min_sv": 8.871015866329657e-09, + "grad_condition": 21789647.601223223, + "lr": 0.0007499999999999998, + "time_sec": 86.96125483512878 + }, + { + "epoch": 51, + "train_loss": 3.7543009240722656, + "train_acc": 0.13288, + "test_loss": 9.307511892700195, + "test_acc": 0.0102, + "lyapunov": 1.644919433557164, + "grad_norm": 0.4905167344021336, + "grad_max_sv": 0.16338985599577427, + "grad_min_sv": 8.878451215887928e-09, + "grad_condition": 21466518.22147739, + "lr": 0.0007408768370508575, + "time_sec": 86.97321915626526 + }, + { + "epoch": 52, + "train_loss": 3.7144092133331297, + "train_acc": 0.13956, + "test_loss": 7.959958459472657, + "test_acc": 0.0116, + "lyapunov": 1.6429758294464072, + "grad_norm": 0.49277268788151807, + "grad_max_sv": 0.1628257032483816, + "grad_min_sv": 9.033670800295824e-09, + "grad_condition": 21921113.04524386, + "lr": 0.0007316480175599307, + "time_sec": 87.00878667831421 + }, + { + "epoch": 53, + "train_loss": 3.6915715643310545, + "train_acc": 0.14434, + "test_loss": 7.135662438964844, + "test_acc": 0.0131, + "lyapunov": 1.6323093544796605, + "grad_norm": 0.4979492481271785, + "grad_max_sv": 0.16630124859511852, + "grad_min_sv": 9.105897960312582e-09, + "grad_condition": 50284759.18612621, + "lr": 0.0007223175895924635, + "time_sec": 87.01037693023682 + }, + { + "epoch": 54, + "train_loss": 3.7443332249450685, + "train_acc": 0.13556, + "test_loss": 8.249568377685547, + "test_acc": 0.0131, + "lyapunov": 1.6371140284916323, + "grad_norm": 0.49695792584680404, + "grad_max_sv": 0.16298682950437068, + "grad_min_sv": 8.935503098723985e-09, + "grad_condition": 89099472.7569754, + "lr": 0.0007128896457825361, + "time_sec": 86.96064949035645 + }, + { + "epoch": 55, + "train_loss": 3.682590077972412, + "train_acc": 0.14482, + "test_loss": 6.493008503723145, + "test_acc": 0.0139, + "lyapunov": 1.6443470704281116, + "grad_norm": 0.504908521633717, + "grad_max_sv": 0.1629489880055189, + "grad_min_sv": 9.216769875086683e-09, + "grad_condition": 22104189.00960083, + "lr": 0.0007033683215378998, + "time_sec": 86.97486233711243 + }, + { + "epoch": 56, + "train_loss": 3.6545884216308595, + "train_acc": 0.14948, + "test_loss": 7.142836791992187, + "test_acc": 0.0143, + "lyapunov": 1.62088993778619, + "grad_norm": 0.5059800396027672, + "grad_max_sv": 0.16476057544350625, + "grad_min_sv": 9.248405038325691e-09, + "grad_condition": 38862529.28438302, + "lr": 0.0006937577932260512, + "time_sec": 87.0516619682312 + }, + { + "epoch": 57, + "train_loss": 3.648748851928711, + "train_acc": 0.14874, + "test_loss": 6.9171292694091795, + "test_acc": 0.0138, + "lyapunov": 1.6256865439817423, + "grad_norm": 0.500177420691686, + "grad_max_sv": 0.1641532715409994, + "grad_min_sv": 9.27983705573121e-09, + "grad_condition": 22867156.07272685, + "lr": 0.0006840622763423388, + "time_sec": 87.07263231277466 + }, + { + "epoch": 58, + "train_loss": 3.7093204387664795, + "train_acc": 0.13914, + "test_loss": 6.941782995605469, + "test_acc": 0.0115, + "lyapunov": 1.63103087936216, + "grad_norm": 0.4955991883426222, + "grad_max_sv": 0.16259282156825067, + "grad_min_sv": 9.022654627165865e-09, + "grad_condition": 138363363.53721, + "lr": 0.0006742860236609073, + "time_sec": 86.96074366569519 + }, + { + "epoch": 59, + "train_loss": 3.684690574798584, + "train_acc": 0.1428, + "test_loss": 7.981631962585449, + "test_acc": 0.0127, + "lyapunov": 1.62094318104522, + "grad_norm": 0.49563124296662386, + "grad_max_sv": 0.16301960796117781, + "grad_min_sv": 9.04448190369722e-09, + "grad_condition": 24972620.17904968, + "lr": 0.0006644333233692913, + "time_sec": 86.96800327301025 + }, + { + "epoch": 60, + "train_loss": 3.7217326124572754, + "train_acc": 0.13682, + "test_loss": 6.620712623596192, + "test_acc": 0.011, + "lyapunov": 1.6251535635165242, + "grad_norm": 0.484928081673614, + "grad_max_sv": 0.15391864404082298, + "grad_min_sv": 8.803339172913648e-09, + "grad_condition": 25300255.327375304, + "lr": 0.0006545084971874734, + "time_sec": 86.97639203071594 + }, + { + "epoch": 61, + "train_loss": 3.836674650802612, + "train_acc": 0.12034, + "test_loss": 7.289911544799804, + "test_acc": 0.0149, + "lyapunov": 1.613660539202678, + "grad_norm": 0.45820651801306833, + "grad_max_sv": 0.14781750719994308, + "grad_min_sv": 8.241427132404944e-09, + "grad_condition": 20774740.46227048, + "lr": 0.0006445158984722354, + "time_sec": 87.0773253440857 + }, + { + "epoch": 62, + "train_loss": 3.7829781243896483, + "train_acc": 0.12784, + "test_loss": 5.955834550476074, + "test_acc": 0.0113, + "lyapunov": 1.6045690771868772, + "grad_norm": 0.4631191106662181, + "grad_max_sv": 0.1513774987310171, + "grad_min_sv": 8.341488429153276e-09, + "grad_condition": 26609503.623661477, + "lr": 0.0006344599103076324, + "time_sec": 87.06490015983582 + }, + { + "epoch": 63, + "train_loss": 3.709426063232422, + "train_acc": 0.13916, + "test_loss": 6.786815286254883, + "test_acc": 0.0105, + "lyapunov": 1.5976358277108662, + "grad_norm": 0.4749105641193412, + "grad_max_sv": 0.15383654683828354, + "grad_min_sv": 8.618015233385901e-09, + "grad_condition": 31012479.28524846, + "lr": 0.0006243449435824269, + "time_sec": 87.08106398582458 + }, + { + "epoch": 64, + "train_loss": 3.679068829269409, + "train_acc": 0.14238, + "test_loss": 6.114537014770508, + "test_acc": 0.0104, + "lyapunov": 1.5980056701108927, + "grad_norm": 0.47838572521954287, + "grad_max_sv": 0.15162084400653839, + "grad_min_sv": 8.810203933062865e-09, + "grad_condition": 21274478.103174634, + "lr": 0.0006141754350553275, + "time_sec": 87.03664231300354 + }, + { + "epoch": 65, + "train_loss": 3.7201092626190184, + "train_acc": 0.13754, + "test_loss": 6.025243463897705, + "test_acc": 0.0098, + "lyapunov": 1.602358661344289, + "grad_norm": 0.4778587789544339, + "grad_max_sv": 0.15611788518726827, + "grad_min_sv": 8.63006196141075e-09, + "grad_condition": 78613098.80228965, + "lr": 0.0006039558454088793, + "time_sec": 87.02543997764587 + }, + { + "epoch": 66, + "train_loss": 3.7001313134765623, + "train_acc": 0.14098, + "test_loss": 6.2105860412597655, + "test_acc": 0.0121, + "lyapunov": 1.5974808227070763, + "grad_norm": 0.4718935364343528, + "grad_max_sv": 0.1544180303812027, + "grad_min_sv": 8.637516658860367e-09, + "grad_condition": 26381632.051760912, + "lr": 0.000593690657292862, + "time_sec": 87.0075671672821 + }, + { + "epoch": 67, + "train_loss": 3.6958953248596194, + "train_acc": 0.14228, + "test_loss": 7.906288302612305, + "test_acc": 0.011, + "lyapunov": 1.6165290275193236, + "grad_norm": 0.4729240319685535, + "grad_max_sv": 0.14935983307659625, + "grad_min_sv": 8.422997328783044e-09, + "grad_condition": 103481664.66824803, + "lr": 0.0005833843733580507, + "time_sec": 87.03533220291138 + }, + { + "epoch": 68, + "train_loss": 3.669604234466553, + "train_acc": 0.14592, + "test_loss": 8.88355927886963, + "test_acc": 0.0082, + "lyapunov": 1.6127500518813462, + "grad_norm": 0.4780100279787231, + "grad_max_sv": 0.1534903097897768, + "grad_min_sv": 8.637573695180478e-09, + "grad_condition": 21443199.319011845, + "lr": 0.0005730415142812054, + "time_sec": 86.98495316505432 + }, + { + "epoch": 69, + "train_loss": 3.7872955700683595, + "train_acc": 0.12714, + "test_loss": 11.25625125732422, + "test_acc": 0.01, + "lyapunov": 1.5893510244691464, + "grad_norm": 0.8037765366589226, + "grad_max_sv": 0.14677802547812463, + "grad_min_sv": 8.186407714910748e-09, + "grad_condition": 45154369.52746147, + "lr": 0.0005626666167821517, + "time_sec": 86.9665298461914 + }, + { + "epoch": 70, + "train_loss": 4.064214197998047, + "train_acc": 0.08242, + "test_loss": 12.454515402221679, + "test_acc": 0.0088, + "lyapunov": 1.5885208153053927, + "grad_norm": 0.393495870054543, + "grad_max_sv": 0.131903138384223, + "grad_min_sv": 6.539090802171188e-09, + "grad_condition": 23695704.110266972, + "lr": 0.0005522642316338265, + "time_sec": 86.97868394851685 + }, + { + "epoch": 71, + "train_loss": 3.9644073529052735, + "train_acc": 0.09628, + "test_loss": 10.848277130126952, + "test_acc": 0.01, + "lyapunov": 1.5856929057089568, + "grad_norm": 0.4161566543824354, + "grad_max_sv": 0.146684742346406, + "grad_min_sv": 7.117523364436051e-09, + "grad_condition": 40553732.46325208, + "lr": 0.0005418389216661573, + "time_sec": 86.94270300865173 + }, + { + "epoch": 72, + "train_loss": 3.9191373210144045, + "train_acc": 0.10142, + "test_loss": 14.071105361938477, + "test_acc": 0.01, + "lyapunov": 1.5867945410101616, + "grad_norm": 0.4256377546947174, + "grad_max_sv": 0.15357364155352116, + "grad_min_sv": 7.264279759146286e-09, + "grad_condition": 949577214.7436682, + "lr": 0.0005313952597646563, + "time_sec": 86.9540867805481 + }, + { + "epoch": 73, + "train_loss": 3.894068261871338, + "train_acc": 0.10488, + "test_loss": 18.658797454833984, + "test_acc": 0.01, + "lyapunov": 1.586326296981948, + "grad_norm": 0.42639443694889123, + "grad_max_sv": 0.15087650418281556, + "grad_min_sv": 7.270475468196258e-09, + "grad_condition": 36000827.05117835, + "lr": 0.0005209378268645994, + "time_sec": 86.95636653900146 + }, + { + "epoch": 74, + "train_loss": 3.8784976776885984, + "train_acc": 0.1089, + "test_loss": 18.57114639892578, + "test_acc": 0.0101, + "lyapunov": 1.5917559593839719, + "grad_norm": 0.4248071521185912, + "grad_max_sv": 0.14780581016093491, + "grad_min_sv": 7.161140411215961e-09, + "grad_condition": 23335758.84633479, + "lr": 0.0005104712099416781, + "time_sec": 87.14426589012146 + }, + { + "epoch": 75, + "train_loss": 3.861637345504761, + "train_acc": 0.1122, + "test_loss": 15.879781237792969, + "test_acc": 0.01, + "lyapunov": 1.5892035942858138, + "grad_norm": 0.42720133114034003, + "grad_max_sv": 0.14710958655923606, + "grad_min_sv": 7.42298774530914e-09, + "grad_condition": 27285273.48026234, + "lr": 0.0004999999999999996, + "time_sec": 86.95125460624695 + }, + { + "epoch": 76, + "train_loss": 3.830299222946167, + "train_acc": 0.11708, + "test_loss": 16.76611838989258, + "test_acc": 0.0099, + "lyapunov": 1.5912379123975553, + "grad_norm": 0.431476084915652, + "grad_max_sv": 0.14528207313269376, + "grad_min_sv": 7.4023330423611535e-09, + "grad_condition": 31795981.76308779, + "lr": 0.0004895287900583212, + "time_sec": 86.94743990898132 + }, + { + "epoch": 77, + "train_loss": 3.8078982507324217, + "train_acc": 0.12066, + "test_loss": 20.0999603515625, + "test_acc": 0.0101, + "lyapunov": 1.5911254754761601, + "grad_norm": 0.4312143312914805, + "grad_max_sv": 0.14594154562801123, + "grad_min_sv": 7.3831466392004774e-09, + "grad_condition": 29148555.72123132, + "lr": 0.0004790621731353997, + "time_sec": 86.93247842788696 + }, + { + "epoch": 78, + "train_loss": 3.7942108618164063, + "train_acc": 0.12064, + "test_loss": 19.366783633422852, + "test_acc": 0.0094, + "lyapunov": 1.591662799610811, + "grad_norm": 0.43533821755274854, + "grad_max_sv": 0.1457790955901146, + "grad_min_sv": 7.497610187215398e-09, + "grad_condition": 39012225.543659545, + "lr": 0.000468604740235343, + "time_sec": 86.94203901290894 + }, + { + "epoch": 79, + "train_loss": 3.778176818237305, + "train_acc": 0.1247, + "test_loss": 18.744433993530272, + "test_acc": 0.01, + "lyapunov": 1.5908222671055123, + "grad_norm": 0.4355330984071009, + "grad_max_sv": 0.1430677803233266, + "grad_min_sv": 7.61817114669494e-09, + "grad_condition": 25370511.046323996, + "lr": 0.00045816107833384175, + "time_sec": 86.95873808860779 + }, + { + "epoch": 80, + "train_loss": 3.76448169631958, + "train_acc": 0.12718, + "test_loss": 16.775007608032226, + "test_acc": 0.0109, + "lyapunov": 1.5896995302356418, + "grad_norm": 0.43792266509710825, + "grad_max_sv": 0.14181964825838805, + "grad_min_sv": 7.62938894560694e-09, + "grad_condition": 21222206.527802683, + "lr": 0.0004477357683661729, + "time_sec": 86.95050120353699 + }, + { + "epoch": 81, + "train_loss": 3.7475227643585205, + "train_acc": 0.12978, + "test_loss": 14.160825512695313, + "test_acc": 0.01, + "lyapunov": 1.5942986712736242, + "grad_norm": 0.4370937722961794, + "grad_max_sv": 0.1431336086243391, + "grad_min_sv": 7.701322295161628e-09, + "grad_condition": 33598688.58716972, + "lr": 0.00043733338321784746, + "time_sec": 86.9794499874115 + }, + { + "epoch": 82, + "train_loss": 3.7305331897735594, + "train_acc": 0.13106, + "test_loss": 13.912216326904296, + "test_acc": 0.0101, + "lyapunov": 1.5953164524434473, + "grad_norm": 0.44173148929337547, + "grad_max_sv": 0.14520521014928817, + "grad_min_sv": 7.755290833827421e-09, + "grad_condition": 30924579.10592314, + "lr": 0.0004269584857187939, + "time_sec": 87.0003228187561 + }, + { + "epoch": 83, + "train_loss": 3.7147515576171877, + "train_acc": 0.13188, + "test_loss": 14.445767102050782, + "test_acc": 0.009, + "lyapunov": 1.59371292987443, + "grad_norm": 0.4439421454501282, + "grad_max_sv": 0.14203465301543475, + "grad_min_sv": 7.84910630551635e-09, + "grad_condition": 611757052.2788166, + "lr": 0.0004166156266419484, + "time_sec": 86.9797739982605 + }, + { + "epoch": 84, + "train_loss": 3.706479062423706, + "train_acc": 0.13416, + "test_loss": 11.980558978271484, + "test_acc": 0.0088, + "lyapunov": 1.5939265678605765, + "grad_norm": 0.4417289260925103, + "grad_max_sv": 0.14147576484829189, + "grad_min_sv": 7.820818669068697e-09, + "grad_condition": 26530590.58024422, + "lr": 0.0004063093427071373, + "time_sec": 87.00698661804199 + }, + { + "epoch": 85, + "train_loss": 3.7477826470184326, + "train_acc": 0.12758, + "test_loss": 13.546329722595216, + "test_acc": 0.009, + "lyapunov": 1.6077222897268622, + "grad_norm": 0.4416377935400416, + "grad_max_sv": 0.13991490099579096, + "grad_min_sv": 7.882191255421944e-09, + "grad_condition": 61609587.98453593, + "lr": 0.0003960441545911199, + "time_sec": 86.96598291397095 + }, + { + "epoch": 86, + "train_loss": 3.720520766067505, + "train_acc": 0.13278, + "test_loss": 16.74704148864746, + "test_acc": 0.0096, + "lyapunov": 1.6138804544268361, + "grad_norm": 0.4421801273249669, + "grad_max_sv": 0.14129837341606616, + "grad_min_sv": 7.776938862336102e-09, + "grad_condition": 38892541.45117955, + "lr": 0.0003858245649446718, + "time_sec": 86.95254611968994 + }, + { + "epoch": 87, + "train_loss": 3.711577749786377, + "train_acc": 0.13428, + "test_loss": 22.594557598876953, + "test_acc": 0.0098, + "lyapunov": 1.6033829984152714, + "grad_norm": 0.4512462726867504, + "grad_max_sv": 0.14761524014174937, + "grad_min_sv": 8.091291020528857e-09, + "grad_condition": 22853002.151385926, + "lr": 0.00037565505641757235, + "time_sec": 86.93402934074402 + }, + { + "epoch": 88, + "train_loss": 3.678959339599609, + "train_acc": 0.1377, + "test_loss": 23.849026098632812, + "test_acc": 0.01, + "lyapunov": 1.6056159249961834, + "grad_norm": 0.45182933207932163, + "grad_max_sv": 0.14614916127175093, + "grad_min_sv": 8.171810636503629e-09, + "grad_condition": 23947568.92733029, + "lr": 0.00036554008969236695, + "time_sec": 86.95433020591736 + }, + { + "epoch": 89, + "train_loss": 3.6683367713165285, + "train_acc": 0.13906, + "test_loss": 20.367259674072265, + "test_acc": 0.01, + "lyapunov": 1.6064209029497698, + "grad_norm": 0.45219688997072166, + "grad_max_sv": 0.14644892439246177, + "grad_min_sv": 8.048351576861457e-09, + "grad_condition": 22571841.054483928, + "lr": 0.0003554841015277638, + "time_sec": 86.96333193778992 + }, + { + "epoch": 90, + "train_loss": 3.6530249962615966, + "train_acc": 0.14202, + "test_loss": 17.6921991394043, + "test_acc": 0.0091, + "lyapunov": 1.6094138329596166, + "grad_norm": 0.4524854227912199, + "grad_max_sv": 0.14466388188302517, + "grad_min_sv": 8.253811646652398e-09, + "grad_condition": 31524432.880272698, + "lr": 0.000345491502812526, + "time_sec": 86.94082713127136 + }, + { + "epoch": 91, + "train_loss": 3.637232744674683, + "train_acc": 0.1456, + "test_loss": 20.56831607055664, + "test_acc": 0.0109, + "lyapunov": 1.6082729372526983, + "grad_norm": 0.4556775683867131, + "grad_max_sv": 0.14616837427020074, + "grad_min_sv": 8.160595244000036e-09, + "grad_condition": 28754963.532174416, + "lr": 0.0003355666766307081, + "time_sec": 86.94279336929321 + }, + { + "epoch": 92, + "train_loss": 3.6490048527526855, + "train_acc": 0.14432, + "test_loss": 18.724969110107423, + "test_acc": 0.009, + "lyapunov": 1.5913407104399504, + "grad_norm": 0.45437861427310544, + "grad_max_sv": 0.14675606675446035, + "grad_min_sv": 8.173822554913279e-09, + "grad_condition": 21225585.088906057, + "lr": 0.00032571397633909225, + "time_sec": 86.94307732582092 + }, + { + "epoch": 93, + "train_loss": 3.630709340133667, + "train_acc": 0.14534, + "test_loss": 18.29774376220703, + "test_acc": 0.0096, + "lyapunov": 1.5943918630595098, + "grad_norm": 0.4572074659138503, + "grad_max_sv": 0.14428534246981145, + "grad_min_sv": 8.233453231698551e-09, + "grad_condition": 24019985.151417702, + "lr": 0.00031593772365766094, + "time_sec": 86.94932794570923 + }, + { + "epoch": 94, + "train_loss": 3.6242483766174316, + "train_acc": 0.14782, + "test_loss": 20.522399169921876, + "test_acc": 0.0142, + "lyapunov": 1.5947073164498409, + "grad_norm": 0.45501588896754536, + "grad_max_sv": 0.14271920640021563, + "grad_min_sv": 8.317351417319596e-09, + "grad_condition": 24040639.16855276, + "lr": 0.0003062422067739483, + "time_sec": 86.94991445541382 + }, + { + "epoch": 95, + "train_loss": 3.6074996049499513, + "train_acc": 0.15148, + "test_loss": 19.390435940551757, + "test_acc": 0.013, + "lyapunov": 1.5944416712007254, + "grad_norm": 0.4568634402332776, + "grad_max_sv": 0.14528488460928202, + "grad_min_sv": 8.272740019757418e-09, + "grad_condition": 56145775.598184526, + "lr": 0.00029663167846209965, + "time_sec": 86.97137951850891 + }, + { + "epoch": 96, + "train_loss": 3.6031181813049318, + "train_acc": 0.15196, + "test_loss": 17.69250036010742, + "test_acc": 0.0104, + "lyapunov": 1.6009117489885492, + "grad_norm": 0.46132600242451327, + "grad_max_sv": 0.14789858758449553, + "grad_min_sv": 8.220308266720933e-09, + "grad_condition": 25988170.943460304, + "lr": 0.00028711035421746345, + "time_sec": 86.9358479976654 + }, + { + "epoch": 97, + "train_loss": 3.618217834320068, + "train_acc": 0.14622, + "test_loss": 19.237579772949218, + "test_acc": 0.0095, + "lyapunov": 1.5942770809773594, + "grad_norm": 0.45626783207883664, + "grad_max_sv": 0.14236079752445222, + "grad_min_sv": 8.25946486829321e-09, + "grad_condition": 29611273.407984328, + "lr": 0.00027768241040753615, + "time_sec": 86.9272072315216 + }, + { + "epoch": 98, + "train_loss": 3.6665315843200683, + "train_acc": 0.14364, + "test_loss": 18.6544664855957, + "test_acc": 0.0102, + "lyapunov": 1.5918195894002305, + "grad_norm": 0.4470253327198404, + "grad_max_sv": 0.13931705933064223, + "grad_min_sv": 8.053131270169266e-09, + "grad_condition": 21125243.818313595, + "lr": 0.00026835198244006903, + "time_sec": 86.96563053131104 + }, + { + "epoch": 99, + "train_loss": 3.652189131011963, + "train_acc": 0.14424, + "test_loss": 20.11543081665039, + "test_acc": 0.0117, + "lyapunov": 1.5925892926847842, + "grad_norm": 0.4490609059275306, + "grad_max_sv": 0.1407471911981702, + "grad_min_sv": 8.079158519969098e-09, + "grad_condition": 20647713.041492444, + "lr": 0.0002591231629491421, + "time_sec": 86.94651627540588 + }, + { + "epoch": 100, + "train_loss": 3.631007031326294, + "train_acc": 0.1475, + "test_loss": 16.71507637939453, + "test_acc": 0.012, + "lyapunov": 1.5903882019964934, + "grad_norm": 0.45126212090689816, + "grad_max_sv": 0.14112005103379488, + "grad_min_sv": 8.093771391992633e-09, + "grad_condition": 42885627.74013588, + "lr": 0.0002499999999999997, + "time_sec": 86.9404718875885 + }, + { + "epoch": 101, + "train_loss": 3.6124810808563232, + "train_acc": 0.1499, + "test_loss": 15.476232440185546, + "test_acc": 0.01, + "lyapunov": 1.5941168749728776, + "grad_norm": 0.45743872759540244, + "grad_max_sv": 0.14450851678848267, + "grad_min_sv": 8.251514057970588e-09, + "grad_condition": 77117071.59388432, + "lr": 0.00024098649531343477, + "time_sec": 86.94936323165894 + }, + { + "epoch": 102, + "train_loss": 3.601418228302002, + "train_acc": 0.15264, + "test_loss": 15.486841659545899, + "test_acc": 0.0103, + "lyapunov": 1.5978375228164752, + "grad_norm": 0.45514018316868876, + "grad_max_sv": 0.14419761635363101, + "grad_min_sv": 8.20662132833272e-09, + "grad_condition": 31401694.163503457, + "lr": 0.0002320866025105016, + "time_sec": 86.9201922416687 + }, + { + "epoch": 103, + "train_loss": 3.6135065021514894, + "train_acc": 0.15064, + "test_loss": 15.01775616455078, + "test_acc": 0.0098, + "lyapunov": 1.614576053741338, + "grad_norm": 0.45664748231787383, + "grad_max_sv": 0.14336710162460803, + "grad_min_sv": 8.186609938565237e-09, + "grad_condition": 25695126.93993938, + "lr": 0.0002233042253783278, + "time_sec": 86.95599412918091 + }, + { + "epoch": 104, + "train_loss": 3.648608812866211, + "train_acc": 0.1439, + "test_loss": 20.221762030029296, + "test_acc": 0.011, + "lyapunov": 1.629351832067875, + "grad_norm": 0.45357224145156544, + "grad_max_sv": 0.143721086345613, + "grad_min_sv": 8.055545831775478e-09, + "grad_condition": 29079777.748796843, + "lr": 0.000214643216157784, + "time_sec": 86.93540620803833 + }, + { + "epoch": 105, + "train_loss": 3.637598281326294, + "train_acc": 0.14576, + "test_loss": 19.01300486450195, + "test_acc": 0.01, + "lyapunov": 1.6094059605732598, + "grad_norm": 0.4502613347675905, + "grad_max_sv": 0.137011787481606, + "grad_min_sv": 8.03301990204286e-09, + "grad_condition": 22015837.082748365, + "lr": 0.00020610737385376332, + "time_sec": 86.95102834701538 + }, + { + "epoch": 106, + "train_loss": 3.618973631591797, + "train_acc": 0.1495, + "test_loss": 16.085577545166014, + "test_acc": 0.01, + "lyapunov": 1.6128625138031552, + "grad_norm": 0.4556214841977421, + "grad_max_sv": 0.14623862877488136, + "grad_min_sv": 8.35081238742541e-09, + "grad_condition": 22897456.2787645, + "lr": 0.00019770044256881242, + "time_sec": 86.94620418548584 + }, + { + "epoch": 107, + "train_loss": 3.6474036177062987, + "train_acc": 0.14436, + "test_loss": 16.341380340576173, + "test_acc": 0.01, + "lyapunov": 1.6005805322276356, + "grad_norm": 0.4558707065978972, + "grad_max_sv": 0.1438352506607771, + "grad_min_sv": 8.153306160774143e-09, + "grad_condition": 28678862.20354884, + "lr": 0.0001894261098608447, + "time_sec": 86.92901086807251 + }, + { + "epoch": 108, + "train_loss": 3.64195158744812, + "train_acc": 0.14854, + "test_loss": 16.13983441772461, + "test_acc": 0.01, + "lyapunov": 1.5959153809510838, + "grad_norm": 0.44978366312692825, + "grad_max_sv": 0.14036127552390099, + "grad_min_sv": 8.045889865124223e-09, + "grad_condition": 58306956.06627731, + "lr": 0.000181288005125655, + "time_sec": 86.98011660575867 + }, + { + "epoch": 109, + "train_loss": 3.6266686278533937, + "train_acc": 0.15044, + "test_loss": 13.34403349609375, + "test_acc": 0.01, + "lyapunov": 1.5974578250704519, + "grad_norm": 0.44922727432413695, + "grad_max_sv": 0.14036725666373967, + "grad_min_sv": 8.066583009891381e-09, + "grad_condition": 21363445.86062481, + "lr": 0.0001732896980049473, + "time_sec": 86.92482805252075 + }, + { + "epoch": 110, + "train_loss": 3.6173717938995362, + "train_acc": 0.15206, + "test_loss": 13.922172198486328, + "test_acc": 0.01, + "lyapunov": 1.5978824046566664, + "grad_norm": 0.4481646742398913, + "grad_max_sv": 0.1430126352235675, + "grad_min_sv": 8.061564414629796e-09, + "grad_condition": 23420444.96340143, + "lr": 0.00016543469682057076, + "time_sec": 86.95183658599854 + }, + { + "epoch": 111, + "train_loss": 3.6168490284729002, + "train_acc": 0.15164, + "test_loss": 12.300112701416015, + "test_acc": 0.01, + "lyapunov": 1.6014556332927226, + "grad_norm": 0.4490755550093575, + "grad_max_sv": 0.1372088748961687, + "grad_min_sv": 8.051073664694375e-09, + "grad_condition": 25036223.25955468, + "lr": 0.00015772644703565552, + "time_sec": 86.93953967094421 + }, + { + "epoch": 112, + "train_loss": 3.6116537487030027, + "train_acc": 0.15298, + "test_loss": 13.514413836669922, + "test_acc": 0.01, + "lyapunov": 1.5957695931729758, + "grad_norm": 0.44693782668430027, + "grad_max_sv": 0.13832484576851128, + "grad_min_sv": 8.078373675557415e-09, + "grad_condition": 20791514.24093638, + "lr": 0.00015016832974331713, + "time_sec": 86.95485806465149 + }, + { + "epoch": 113, + "train_loss": 3.6070840077209474, + "train_acc": 0.15356, + "test_loss": 12.948514440917968, + "test_acc": 0.01, + "lyapunov": 1.5965250980518664, + "grad_norm": 0.4489570991887171, + "grad_max_sv": 0.13833273742347957, + "grad_min_sv": 8.10550010998945e-09, + "grad_condition": 19843219.32987036, + "lr": 0.00014276366018359834, + "time_sec": 86.9850001335144 + }, + { + "epoch": 114, + "train_loss": 3.597067463912964, + "train_acc": 0.15536, + "test_loss": 12.993196331787109, + "test_acc": 0.01, + "lyapunov": 1.5981119883334851, + "grad_norm": 0.44825309627638765, + "grad_max_sv": 0.13965518064796925, + "grad_min_sv": 8.13492008408523e-09, + "grad_condition": 35153718.804865494, + "lr": 0.00013551568628929425, + "time_sec": 86.96869111061096 + }, + { + "epoch": 115, + "train_loss": 3.59910719619751, + "train_acc": 0.15512, + "test_loss": 13.8083347946167, + "test_acc": 0.01, + "lyapunov": 1.5909668856569568, + "grad_norm": 0.4487286545501095, + "grad_max_sv": 0.13403443209826946, + "grad_min_sv": 8.086047226241177e-09, + "grad_condition": 22208009.194598757, + "lr": 0.00012842758726130276, + "time_sec": 86.98436570167542 + }, + { + "epoch": 116, + "train_loss": 3.614414676589966, + "train_acc": 0.15304, + "test_loss": 13.193821392822265, + "test_acc": 0.01, + "lyapunov": 1.6072389957545055, + "grad_norm": 0.44606534157464744, + "grad_max_sv": 0.13655881509184836, + "grad_min_sv": 8.107296081694137e-09, + "grad_condition": 19574927.631571237, + "lr": 0.0001215024721741218, + "time_sec": 86.9653697013855 + }, + { + "epoch": 117, + "train_loss": 3.5979878522491453, + "train_acc": 0.1557, + "test_loss": 12.478252127075196, + "test_acc": 0.01, + "lyapunov": 1.5981775647234124, + "grad_norm": 0.4508722951740394, + "grad_max_sv": 0.13530571274459363, + "grad_min_sv": 8.099007993422891e-09, + "grad_condition": 93528307.44650176, + "lr": 0.00011474337861210538, + "time_sec": 86.95283102989197 + }, + { + "epoch": 118, + "train_loss": 3.6169362755584715, + "train_acc": 0.15154, + "test_loss": 13.820507278442383, + "test_acc": 0.01, + "lyapunov": 1.6159481843719092, + "grad_norm": 0.4739834554035624, + "grad_max_sv": 0.13695121873170138, + "grad_min_sv": 8.070444825080303e-09, + "grad_condition": 2839427454.718379, + "lr": 0.00010815327133708009, + "time_sec": 86.95242261886597 + }, + { + "epoch": 119, + "train_loss": 3.586508418045044, + "train_acc": 0.15522, + "test_loss": 12.320869653320312, + "test_acc": 0.01, + "lyapunov": 1.6099912086716088, + "grad_norm": 0.45808687918480023, + "grad_max_sv": 0.13901935014873743, + "grad_min_sv": 8.365241294105986e-09, + "grad_condition": 20497333.66126097, + "lr": 0.00010173504098790182, + "time_sec": 86.95068407058716 + }, + { + "epoch": 120, + "train_loss": 3.594565878448486, + "train_acc": 0.15554, + "test_loss": 12.566050117492676, + "test_acc": 0.01, + "lyapunov": 1.592419114564081, + "grad_norm": 0.45179367321174574, + "grad_max_sv": 0.13976030256599187, + "grad_min_sv": 8.21819581223876e-09, + "grad_condition": 236027859.13267118, + "lr": 9.549150281252629e-05, + "time_sec": 86.94811153411865 + }, + { + "epoch": 121, + "train_loss": 3.571910457839966, + "train_acc": 0.16, + "test_loss": 13.28653671875, + "test_acc": 0.01, + "lyapunov": 1.594237220866601, + "grad_norm": 0.45599158951422275, + "grad_max_sv": 0.1383255071938038, + "grad_min_sv": 8.310267510247549e-09, + "grad_condition": 22424462.588012565, + "lr": 8.942539543314794e-05, + "time_sec": 86.97603249549866 + }, + { + "epoch": 122, + "train_loss": 3.576590520477295, + "train_acc": 0.15836, + "test_loss": 12.382398129272461, + "test_acc": 0.01, + "lyapunov": 1.5904823736766416, + "grad_norm": 0.45552095622752037, + "grad_max_sv": 0.13581450190395117, + "grad_min_sv": 8.293209310950011e-09, + "grad_condition": 20678746.83844463, + "lr": 8.353937964495024e-05, + "time_sec": 86.98238325119019 + }, + { + "epoch": 123, + "train_loss": 3.5637081575012206, + "train_acc": 0.15918, + "test_loss": 13.356674835205078, + "test_acc": 0.01, + "lyapunov": 1.5919670043394083, + "grad_norm": 0.4543696402957075, + "grad_max_sv": 0.13669848274439572, + "grad_min_sv": 8.274563620294489e-09, + "grad_condition": 530363976.123411, + "lr": 7.783603724899243e-05, + "time_sec": 86.97274160385132 + }, + { + "epoch": 124, + "train_loss": 3.5656386724853517, + "train_acc": 0.156, + "test_loss": 12.923330947875977, + "test_acc": 0.01, + "lyapunov": 1.585750177388301, + "grad_norm": 0.45582905257879397, + "grad_max_sv": 0.14233403466641903, + "grad_min_sv": 8.433538600804979e-09, + "grad_condition": 20568679.386500545, + "lr": 7.231786991974666e-05, + "time_sec": 87.00073099136353 + }, + { + "epoch": 125, + "train_loss": 3.56113921333313, + "train_acc": 0.16064, + "test_loss": 12.912995344543457, + "test_acc": 0.01, + "lyapunov": 1.5937265608926563, + "grad_norm": 0.4559850954417373, + "grad_max_sv": 0.14103519525378944, + "grad_min_sv": 8.227180888897151e-09, + "grad_condition": 845919413.8164043, + "lr": 6.698729810778072e-05, + "time_sec": 86.962557554245 + }, + { + "epoch": 126, + "train_loss": 3.5613428678131105, + "train_acc": 0.16236, + "test_loss": 13.346916006469726, + "test_acc": 0.01, + "lyapunov": 1.5917792411716394, + "grad_norm": 0.4552534127580613, + "grad_max_sv": 0.1387007746845484, + "grad_min_sv": 8.233278634209306e-09, + "grad_condition": 55753253.31191778, + "lr": 6.184665997806817e-05, + "time_sec": 86.96297550201416 + }, + { + "epoch": 127, + "train_loss": 3.5623228128051756, + "train_acc": 0.16182, + "test_loss": 12.482252976989747, + "test_acc": 0.01, + "lyapunov": 1.5930519658891136, + "grad_norm": 0.4571494156872022, + "grad_max_sv": 0.13955486342310905, + "grad_min_sv": 8.368131113045685e-09, + "grad_condition": 18887704.93686148, + "lr": 5.6898210384392595e-05, + "time_sec": 86.93619394302368 + }, + { + "epoch": 128, + "train_loss": 3.5547854151916503, + "train_acc": 0.16194, + "test_loss": 12.04546644897461, + "test_acc": 0.01, + "lyapunov": 1.596600215148438, + "grad_norm": 0.4528871946129552, + "grad_max_sv": 0.13451121244579553, + "grad_min_sv": 8.421135419545145e-09, + "grad_condition": 19083239.514846243, + "lr": 5.214411988029363e-05, + "time_sec": 86.9260938167572 + }, + { + "epoch": 129, + "train_loss": 3.55141931640625, + "train_acc": 0.16244, + "test_loss": 11.020759634399415, + "test_acc": 0.01, + "lyapunov": 1.5903867144718804, + "grad_norm": 0.4563521421157675, + "grad_max_sv": 0.13569981120526792, + "grad_min_sv": 8.371482823621434e-09, + "grad_condition": 23747932.223175477, + "lr": 4.7586473766990294e-05, + "time_sec": 86.95992183685303 + }, + { + "epoch": 130, + "train_loss": 3.5459538854217527, + "train_acc": 0.16244, + "test_loss": 11.208521502685548, + "test_acc": 0.01, + "lyapunov": 1.5891283159060856, + "grad_norm": 0.4580085602032628, + "grad_max_sv": 0.1428094120696187, + "grad_min_sv": 8.349487273795475e-09, + "grad_condition": 19461475.588800896, + "lr": 4.32272711786996e-05, + "time_sec": 86.93538308143616 + }, + { + "epoch": 131, + "train_loss": 3.558525732421875, + "train_acc": 0.15972, + "test_loss": 12.568882592773438, + "test_acc": 0.01, + "lyapunov": 1.5841145484953585, + "grad_norm": 0.48081196791485864, + "grad_max_sv": 0.13814902417361735, + "grad_min_sv": 8.270589697823016e-09, + "grad_condition": 24037113.0692943, + "lr": 3.906842420574966e-05, + "time_sec": 86.94438147544861 + }, + { + "epoch": 132, + "train_loss": 3.5661671807098387, + "train_acc": 0.16126, + "test_loss": 12.68510948486328, + "test_acc": 0.01, + "lyapunov": 1.5863902437717408, + "grad_norm": 0.45601709800858026, + "grad_max_sv": 0.13818404618650676, + "grad_min_sv": 8.232326872970041e-09, + "grad_condition": 23552868.195127018, + "lr": 3.5111757055874305e-05, + "time_sec": 86.92369508743286 + }, + { + "epoch": 133, + "train_loss": 3.558476961517334, + "train_acc": 0.16144, + "test_loss": 12.19923288269043, + "test_acc": 0.01, + "lyapunov": 1.5869078831294614, + "grad_norm": 0.4813384001420275, + "grad_max_sv": 0.13685211148113013, + "grad_min_sv": 8.395861997301246e-09, + "grad_condition": 21548117.02208554, + "lr": 3.1359005254054254e-05, + "time_sec": 87.053964138031 + }, + { + "epoch": 134, + "train_loss": 3.553262917404175, + "train_acc": 0.16388, + "test_loss": 13.270139483642579, + "test_acc": 0.01, + "lyapunov": 1.5872592282722064, + "grad_norm": 0.4564815483885395, + "grad_max_sv": 0.13975560273975135, + "grad_min_sv": 8.42094450559383e-09, + "grad_condition": 22619871.333677623, + "lr": 2.7811814881259484e-05, + "time_sec": 87.00632071495056 + }, + { + "epoch": 135, + "train_loss": 3.550828792724609, + "train_acc": 0.16302, + "test_loss": 12.738151782226563, + "test_acc": 0.01, + "lyapunov": 1.5826656888513004, + "grad_norm": 0.455201814869344, + "grad_max_sv": 0.13967375233769416, + "grad_min_sv": 8.311341058442334e-09, + "grad_condition": 20879397.228604488, + "lr": 2.4471741852423218e-05, + "time_sec": 86.95437407493591 + }, + { + "epoch": 136, + "train_loss": 3.551168853302002, + "train_acc": 0.1632, + "test_loss": 12.151814176940919, + "test_acc": 0.01, + "lyapunov": 1.5836480416910117, + "grad_norm": 0.4554914291491391, + "grad_max_sv": 0.13944239709526302, + "grad_min_sv": 8.338976177635349e-09, + "grad_condition": 22102603.436589945, + "lr": 2.1340251233966362e-05, + "time_sec": 86.91853213310242 + }, + { + "epoch": 137, + "train_loss": 3.5524956353759767, + "train_acc": 0.16306, + "test_loss": 12.044658526611329, + "test_acc": 0.01, + "lyapunov": 1.588264409233542, + "grad_norm": 0.45593430306024324, + "grad_max_sv": 0.14212556090205908, + "grad_min_sv": 8.474210927422731e-09, + "grad_condition": 19220785.781618483, + "lr": 1.8418716601170932e-05, + "time_sec": 87.0023365020752 + }, + { + "epoch": 138, + "train_loss": 3.5443750843811035, + "train_acc": 0.16446, + "test_loss": 12.686626306152343, + "test_acc": 0.01, + "lyapunov": 1.5809197684992915, + "grad_norm": 0.45547983858246405, + "grad_max_sv": 0.13838534355163573, + "grad_min_sv": 8.251677251908118e-09, + "grad_condition": 26051046.712826222, + "lr": 1.570841943568445e-05, + "time_sec": 86.97056412696838 + }, + { + "epoch": 139, + "train_loss": 3.546086183013916, + "train_acc": 0.16506, + "test_loss": 12.577361032104491, + "test_acc": 0.01, + "lyapunov": 1.5876071007965167, + "grad_norm": 0.4815643162649342, + "grad_max_sv": 0.13984339833259582, + "grad_min_sv": 8.30150362340909e-09, + "grad_condition": 22471111.660606384, + "lr": 1.3210548563419845e-05, + "time_sec": 86.9632363319397 + }, + { + "epoch": 140, + "train_loss": 3.5484837767028807, + "train_acc": 0.16252, + "test_loss": 12.433845492553711, + "test_acc": 0.01, + "lyapunov": 1.583712893678709, + "grad_norm": 0.455815896192293, + "grad_max_sv": 0.13972379975020885, + "grad_min_sv": 8.472806470316563e-09, + "grad_condition": 20692266.86175378, + "lr": 1.0926199633097203e-05, + "time_sec": 87.00575137138367 + }, + { + "epoch": 141, + "train_loss": 3.549246969680786, + "train_acc": 0.16378, + "test_loss": 12.216989669799805, + "test_acc": 0.01, + "lyapunov": 1.5795855665450815, + "grad_norm": 0.4563113035389347, + "grad_max_sv": 0.13676640279591085, + "grad_min_sv": 8.292400613830325e-09, + "grad_condition": 166938163.47655272, + "lr": 8.856374635655688e-06, + "time_sec": 87.0329806804657 + }, + { + "epoch": 142, + "train_loss": 3.5504096357727053, + "train_acc": 0.16228, + "test_loss": 12.457387181091308, + "test_acc": 0.01, + "lyapunov": 1.5839585102427647, + "grad_norm": 0.45750694546517895, + "grad_max_sv": 0.13983552623540163, + "grad_min_sv": 8.294693049082369e-09, + "grad_condition": 19557640.433229152, + "lr": 7.001981464747503e-06, + "time_sec": 87.01735019683838 + }, + { + "epoch": 143, + "train_loss": 3.550999901123047, + "train_acc": 0.16328, + "test_loss": 11.619247952270507, + "test_acc": 0.01, + "lyapunov": 1.581841357223823, + "grad_norm": 0.5056335656044699, + "grad_max_sv": 0.1368855085223913, + "grad_min_sv": 8.29868041507531e-09, + "grad_condition": 20268360.65968836, + "lr": 5.3638335185058295e-06, + "time_sec": 87.04096722602844 + }, + { + "epoch": 144, + "train_loss": 3.551519507369995, + "train_acc": 0.16406, + "test_loss": 12.968487936401367, + "test_acc": 0.01, + "lyapunov": 1.5792252258266635, + "grad_norm": 0.45788022217526314, + "grad_max_sv": 0.1386097924783826, + "grad_min_sv": 8.452128945346526e-09, + "grad_condition": 25730976.14914393, + "lr": 3.942649342761114e-06, + "time_sec": 86.95848679542542 + }, + { + "epoch": 145, + "train_loss": 3.5502905805206297, + "train_acc": 0.1632, + "test_loss": 11.44388599090576, + "test_acc": 0.01, + "lyapunov": 1.5817355405339195, + "grad_norm": 0.45750383482996937, + "grad_max_sv": 0.1386595867574215, + "grad_min_sv": 8.300189706378357e-09, + "grad_condition": 28768914.37405598, + "lr": 2.7390523158633524e-06, + "time_sec": 86.94220089912415 + }, + { + "epoch": 146, + "train_loss": 3.5512858894348143, + "train_acc": 0.16488, + "test_loss": 11.365958471679688, + "test_acc": 0.01, + "lyapunov": 1.581334916222126, + "grad_norm": 0.45822887700481946, + "grad_max_sv": 0.14089943766593932, + "grad_min_sv": 8.327259416740507e-09, + "grad_condition": 44970764.53328274, + "lr": 1.7535703752478133e-06, + "time_sec": 86.94011187553406 + }, + { + "epoch": 147, + "train_loss": 3.550200090789795, + "train_acc": 0.16272, + "test_loss": 11.458188932800294, + "test_acc": 0.01, + "lyapunov": 1.5809953587744243, + "grad_norm": 0.48194488873837205, + "grad_max_sv": 0.1371115766465664, + "grad_min_sv": 8.368186586206471e-09, + "grad_condition": 90078475.94101183, + "lr": 9.866357858642196e-07, + "time_sec": 86.92108464241028 + }, + { + "epoch": 148, + "train_loss": 3.5539947522735598, + "train_acc": 0.16328, + "test_loss": 12.301221487426758, + "test_acc": 0.01, + "lyapunov": 1.582784356058711, + "grad_norm": 0.45804937695495906, + "grad_max_sv": 0.13778063971549273, + "grad_min_sv": 8.387954587851798e-09, + "grad_condition": 20647087.073492076, + "lr": 4.38584950570808e-07, + "time_sec": 86.95030283927917 + }, + { + "epoch": 149, + "train_loss": 3.552806600189209, + "train_acc": 0.1621, + "test_loss": 11.484873080444336, + "test_acc": 0.01, + "lyapunov": 1.583863987947059, + "grad_norm": 0.4577095154493945, + "grad_max_sv": 0.13773377276957036, + "grad_min_sv": 8.27446097056983e-09, + "grad_condition": 23606522.33603049, + "lr": 1.096582625772501e-07, + "time_sec": 86.98065185546875 + }, + { + "epoch": 150, + "train_loss": 3.552337872467041, + "train_acc": 0.16344, + "test_loss": 11.95844083557129, + "test_acc": 0.01, + "lyapunov": 1.5831444952494043, + "grad_norm": 0.4571571171897792, + "grad_max_sv": 0.13750182762742041, + "grad_min_sv": 8.272403564935082e-09, + "grad_condition": 20799248.812125724, + "lr": 0.0, + "time_sec": 86.96866011619568 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 5.093480541229248, + "train_acc": 0.0164, + "test_loss": 4.951779422760009, + "test_acc": 0.0114, + "lyapunov": 2.5258567003947694, + "grad_norm": 5.272969058209084, + "grad_max_sv": 4.536009293794632, + "grad_min_sv": 9.025351698950524e-08, + "grad_condition": 1008753690.9335768, + "lr": 0.0009998903417374227, + "time_sec": 132.1505901813507 + }, + { + "epoch": 2, + "train_loss": 4.783717939453125, + "train_acc": 0.01934, + "test_loss": 4.956400106048584, + "test_acc": 0.0099, + "lyapunov": 2.113569995326459, + "grad_norm": 3.7387776933061354, + "grad_max_sv": 3.181053787469864, + "grad_min_sv": 6.103191964590415e-08, + "grad_condition": 76830667.42994572, + "lr": 0.0009995614150494292, + "time_sec": 132.10792446136475 + }, + { + "epoch": 3, + "train_loss": 4.682052931213379, + "train_acc": 0.02242, + "test_loss": 4.794901498413086, + "test_acc": 0.01, + "lyapunov": 1.9766119901481491, + "grad_norm": 3.1862358950156584, + "grad_max_sv": 2.7251826524734497, + "grad_min_sv": 4.940198838065957e-08, + "grad_condition": 239516990.12236896, + "lr": 0.0009990133642141358, + "time_sec": 132.10769820213318 + }, + { + "epoch": 4, + "train_loss": 4.638096351318359, + "train_acc": 0.02338, + "test_loss": 4.6849861915588376, + "test_acc": 0.0088, + "lyapunov": 1.9358430570348755, + "grad_norm": 2.8278763341247104, + "grad_max_sv": 2.3887839674949647, + "grad_min_sv": 4.29566129223069e-08, + "grad_condition": 70058075.61594215, + "lr": 0.0009982464296247522, + "time_sec": 132.1413631439209 + }, + { + "epoch": 5, + "train_loss": 4.5945222178649905, + "train_acc": 0.02476, + "test_loss": 4.694830523681641, + "test_acc": 0.01, + "lyapunov": 1.873431063064224, + "grad_norm": 2.542418399235304, + "grad_max_sv": 2.1823901772499084, + "grad_min_sv": 3.936586880914916e-08, + "grad_condition": 65028799.05268152, + "lr": 0.0009972609476841367, + "time_sec": 132.11404299736023 + }, + { + "epoch": 6, + "train_loss": 4.542771276245118, + "train_acc": 0.02718, + "test_loss": 4.6554784561157225, + "test_acc": 0.011, + "lyapunov": 1.846754339344971, + "grad_norm": 2.186253756892433, + "grad_max_sv": 1.796432802081108, + "grad_min_sv": 3.4262639014848165e-08, + "grad_condition": 58220592.492028, + "lr": 0.000996057350657239, + "time_sec": 132.1098918914795 + }, + { + "epoch": 7, + "train_loss": 4.4942261624145505, + "train_acc": 0.029, + "test_loss": 4.681510513305664, + "test_acc": 0.0096, + "lyapunov": 1.8624430949730642, + "grad_norm": 1.5614358774754566, + "grad_max_sv": 1.1527211368083954, + "grad_min_sv": 2.6364993480076926e-08, + "grad_condition": 182614297.81623182, + "lr": 0.000994636166481494, + "time_sec": 132.12222027778625 + }, + { + "epoch": 8, + "train_loss": 4.46247056640625, + "train_acc": 0.02884, + "test_loss": 4.662567490386963, + "test_acc": 0.0108, + "lyapunov": 1.844880536389168, + "grad_norm": 1.147583575655559, + "grad_max_sv": 0.7361248254776, + "grad_min_sv": 1.841648028869103e-08, + "grad_condition": 124584859.33962445, + "lr": 0.0009929980185352525, + "time_sec": 132.15038108825684 + }, + { + "epoch": 9, + "train_loss": 4.470439504089356, + "train_acc": 0.02862, + "test_loss": 4.67383145904541, + "test_acc": 0.01, + "lyapunov": 1.7943601166195882, + "grad_norm": 0.9387495812629724, + "grad_max_sv": 0.5604371950030327, + "grad_min_sv": 1.4283977281537297e-08, + "grad_condition": 69021346.84748732, + "lr": 0.0009911436253643444, + "time_sec": 132.14666748046875 + }, + { + "epoch": 10, + "train_loss": 4.444021055908203, + "train_acc": 0.03062, + "test_loss": 4.703793017578125, + "test_acc": 0.0117, + "lyapunov": 1.7941059179013343, + "grad_norm": 0.7750659560319146, + "grad_max_sv": 0.43930391520261763, + "grad_min_sv": 1.1478437037665268e-08, + "grad_condition": 99153608.6568211, + "lr": 0.0009890738003669028, + "time_sec": 132.10582995414734 + }, + { + "epoch": 11, + "train_loss": 4.432285560607911, + "train_acc": 0.033, + "test_loss": 4.697426881408691, + "test_acc": 0.01, + "lyapunov": 1.7903570470297734, + "grad_norm": 0.6893504146482624, + "grad_max_sv": 0.372271079570055, + "grad_min_sv": 1.0017648831295301e-08, + "grad_condition": 53264269.98770611, + "lr": 0.00098678945143658, + "time_sec": 132.1349811553955 + }, + { + "epoch": 12, + "train_loss": 4.423722417602539, + "train_acc": 0.03148, + "test_loss": 4.848358657073975, + "test_acc": 0.01, + "lyapunov": 1.747073896705647, + "grad_norm": 0.6359958118399717, + "grad_max_sv": 0.35021247938275335, + "grad_min_sv": 8.759130606939003e-09, + "grad_condition": 49917776.1229025, + "lr": 0.0009842915805643154, + "time_sec": 132.14347434043884 + }, + { + "epoch": 13, + "train_loss": 4.415838943786621, + "train_acc": 0.03384, + "test_loss": 5.315225978088379, + "test_acc": 0.01, + "lyapunov": 1.7329754283666001, + "grad_norm": 0.5727006271295083, + "grad_max_sv": 0.2875354364514351, + "grad_min_sv": 7.870123534814422e-09, + "grad_condition": 45065343.610956885, + "lr": 0.000981581283398829, + "time_sec": 132.1161012649536 + }, + { + "epoch": 14, + "train_loss": 4.405268566894531, + "train_acc": 0.03726, + "test_loss": 5.051113725280762, + "test_acc": 0.0089, + "lyapunov": 1.7365910598384144, + "grad_norm": 0.5567815422728497, + "grad_max_sv": 0.2535946353689383, + "grad_min_sv": 7.466976926111848e-09, + "grad_condition": 33242443.419912286, + "lr": 0.0009786597487660333, + "time_sec": 132.19835686683655 + }, + { + "epoch": 15, + "train_loss": 4.4498287826538085, + "train_acc": 0.0298, + "test_loss": 5.018837545776367, + "test_acc": 0.01, + "lyapunov": 1.7563624720439277, + "grad_norm": 0.48061471025200103, + "grad_max_sv": 0.25300529673695565, + "grad_min_sv": 5.973170774317693e-09, + "grad_condition": 232434311.93740588, + "lr": 0.0009755282581475766, + "time_sec": 132.13766241073608 + }, + { + "epoch": 16, + "train_loss": 4.4404813890075685, + "train_acc": 0.03136, + "test_loss": 4.949696199035644, + "test_acc": 0.0072, + "lyapunov": 1.7201906845087895, + "grad_norm": 0.4494383370244252, + "grad_max_sv": 0.2241064589470625, + "grad_min_sv": 5.623495152873304e-09, + "grad_condition": 49482042.46895528, + "lr": 0.0009721881851187403, + "time_sec": 132.1307873725891 + }, + { + "epoch": 17, + "train_loss": 4.423229548950196, + "train_acc": 0.03264, + "test_loss": 4.881808558654785, + "test_acc": 0.0075, + "lyapunov": 1.7098296539252982, + "grad_norm": 0.439640280455229, + "grad_max_sv": 0.21520022340118886, + "grad_min_sv": 5.494700056063451e-09, + "grad_condition": 50360167.53711064, + "lr": 0.0009686409947459456, + "time_sec": 132.12213110923767 + }, + { + "epoch": 18, + "train_loss": 4.425767096099854, + "train_acc": 0.03428, + "test_loss": 4.762300608825684, + "test_acc": 0.0141, + "lyapunov": 1.7254444985743373, + "grad_norm": 0.43102682256118363, + "grad_max_sv": 0.21962687484920024, + "grad_min_sv": 5.481251717787128e-09, + "grad_condition": 62403316.997678205, + "lr": 0.0009648882429441254, + "time_sec": 132.1801242828369 + }, + { + "epoch": 19, + "train_loss": 4.439898339691162, + "train_acc": 0.03102, + "test_loss": 4.7574590133667, + "test_acc": 0.01, + "lyapunov": 1.7191586774938248, + "grad_norm": 0.4103540622399138, + "grad_max_sv": 0.2047900702804327, + "grad_min_sv": 5.2553816437539425e-09, + "grad_condition": 45680253.996666625, + "lr": 0.00096093157579425, + "time_sec": 132.14622616767883 + }, + { + "epoch": 20, + "train_loss": 4.457335680847168, + "train_acc": 0.0282, + "test_loss": 4.84942807006836, + "test_acc": 0.0085, + "lyapunov": 1.71052074920186, + "grad_norm": 0.38215996406438607, + "grad_max_sv": 0.1988411284983158, + "grad_min_sv": 4.469477583868287e-09, + "grad_condition": 64442697.301740505, + "lr": 0.0009567727288213001, + "time_sec": 132.18120908737183 + }, + { + "epoch": 21, + "train_loss": 4.468818942108154, + "train_acc": 0.02682, + "test_loss": 4.99621100616455, + "test_acc": 0.01, + "lyapunov": 1.689738617528735, + "grad_norm": 0.3607957385038194, + "grad_max_sv": 0.19746851846575736, + "grad_min_sv": 3.811521070637425e-09, + "grad_condition": 89818594.76751825, + "lr": 0.0009524135262330095, + "time_sec": 132.16746854782104 + }, + { + "epoch": 22, + "train_loss": 4.462937829284668, + "train_acc": 0.0266, + "test_loss": 5.021303575897217, + "test_acc": 0.0118, + "lyapunov": 1.6899086160732961, + "grad_norm": 0.33217592351402775, + "grad_max_sv": 0.16988870538771153, + "grad_min_sv": 3.581840562170979e-09, + "grad_condition": 178046345.73741922, + "lr": 0.0009478558801197061, + "time_sec": 132.1549870967865 + }, + { + "epoch": 23, + "train_loss": 4.464460679016113, + "train_acc": 0.02638, + "test_loss": 4.941819158172607, + "test_acc": 0.0103, + "lyapunov": 1.6879293180792534, + "grad_norm": 0.324019456404472, + "grad_max_sv": 0.1607154045253992, + "grad_min_sv": 3.337528521954458e-09, + "grad_condition": 109495681.75814696, + "lr": 0.000943101789615607, + "time_sec": 132.1468689441681 + }, + { + "epoch": 24, + "train_loss": 4.463202658996582, + "train_acc": 0.02798, + "test_loss": 4.871240232849121, + "test_acc": 0.0131, + "lyapunov": 1.6886080326631552, + "grad_norm": 0.3201027734589547, + "grad_max_sv": 0.15962571650743484, + "grad_min_sv": 3.349112888981296e-09, + "grad_condition": 1306218372.160006, + "lr": 0.0009381533400219313, + "time_sec": 132.12717270851135 + }, + { + "epoch": 25, + "train_loss": 4.460873207702637, + "train_acc": 0.0277, + "test_loss": 4.803280967712403, + "test_acc": 0.0103, + "lyapunov": 1.6859856490283975, + "grad_norm": 0.3149311014522828, + "grad_max_sv": 0.16311234198510646, + "grad_min_sv": 3.1627192715460993e-09, + "grad_condition": 77293700.78383549, + "lr": 0.0009330127018922189, + "time_sec": 132.17411255836487 + }, + { + "epoch": 26, + "train_loss": 4.45674253692627, + "train_acc": 0.0297, + "test_loss": 4.796747819519043, + "test_acc": 0.0106, + "lyapunov": 1.6874452579356825, + "grad_norm": 0.31292294309713004, + "grad_max_sv": 0.15273103043437003, + "grad_min_sv": 3.1780742041492836e-09, + "grad_condition": 81020390.34111668, + "lr": 0.000927682130080253, + "time_sec": 132.11353087425232 + }, + { + "epoch": 27, + "train_loss": 4.4604747364807125, + "train_acc": 0.02898, + "test_loss": 4.734377107238769, + "test_acc": 0.0101, + "lyapunov": 1.6862671268565574, + "grad_norm": 0.30060678348737635, + "grad_max_sv": 0.14766201358288528, + "grad_min_sv": 2.926658054726479e-09, + "grad_condition": 343084596.85497886, + "lr": 0.0009221639627510072, + "time_sec": 132.19565391540527 + }, + { + "epoch": 28, + "train_loss": 4.4614792274475095, + "train_acc": 0.0267, + "test_loss": 5.034359852600097, + "test_acc": 0.0096, + "lyapunov": 1.6969501737438504, + "grad_norm": 0.3030134158153995, + "grad_max_sv": 0.15624292846769094, + "grad_min_sv": 2.7683598695545097e-09, + "grad_condition": 202791872.97820872, + "lr": 0.0009164606203550494, + "time_sec": 132.1659483909607 + }, + { + "epoch": 29, + "train_loss": 4.464634677429199, + "train_acc": 0.02846, + "test_loss": 5.127542732238769, + "test_acc": 0.0117, + "lyapunov": 1.6796985815857988, + "grad_norm": 0.28779678730535624, + "grad_max_sv": 0.1401840390637517, + "grad_min_sv": 2.6427347623626807e-09, + "grad_condition": 281045279.9265651, + "lr": 0.0009105746045668516, + "time_sec": 132.14807105064392 + }, + { + "epoch": 30, + "train_loss": 4.459805185546875, + "train_acc": 0.02844, + "test_loss": 4.91892096862793, + "test_acc": 0.01, + "lyapunov": 1.683965052180278, + "grad_norm": 0.2837122801189051, + "grad_max_sv": 0.13645010702311994, + "grad_min_sv": 2.726112462722932e-09, + "grad_condition": 380763623.0580058, + "lr": 0.0009045084971874733, + "time_sec": 132.15507793426514 + }, + { + "epoch": 31, + "train_loss": 4.4911380870056155, + "train_acc": 0.02476, + "test_loss": 4.659154684448242, + "test_acc": 0.01, + "lyapunov": 1.693469688105766, + "grad_norm": 0.28637996974953944, + "grad_max_sv": 0.15418015364557505, + "grad_min_sv": 6.907299599802872e-10, + "grad_condition": 12934974978.13471, + "lr": 0.0008982649590120977, + "time_sec": 132.18995237350464 + }, + { + "epoch": 32, + "train_loss": 4.482972508544922, + "train_acc": 0.02506, + "test_loss": 5.101610327148437, + "test_acc": 0.01, + "lyapunov": 1.6612950267694186, + "grad_norm": 0.2762288427327109, + "grad_max_sv": 0.1509731261059642, + "grad_min_sv": 9.70621287791002e-10, + "grad_condition": 13596800140.398924, + "lr": 0.0008918467286629196, + "time_sec": 132.18785095214844 + }, + { + "epoch": 33, + "train_loss": 4.4797290808105465, + "train_acc": 0.02606, + "test_loss": 5.204112957000732, + "test_acc": 0.01, + "lyapunov": 1.6838472977928494, + "grad_norm": 0.3035201213508976, + "grad_max_sv": 0.14257617406547068, + "grad_min_sv": 8.308813689400204e-10, + "grad_condition": 13333320908.238403, + "lr": 0.0008852566213878943, + "time_sec": 132.16928958892822 + }, + { + "epoch": 34, + "train_loss": 4.488282367706299, + "train_acc": 0.024, + "test_loss": 5.69198985748291, + "test_acc": 0.01, + "lyapunov": 1.7140263745851834, + "grad_norm": 0.2759733723719535, + "grad_max_sv": 0.14591740891337396, + "grad_min_sv": 1.4200952253830224e-10, + "grad_condition": 25323234687.437927, + "lr": 0.000878497527825878, + "time_sec": 132.15029501914978 + }, + { + "epoch": 35, + "train_loss": 4.4768339254760745, + "train_acc": 0.02612, + "test_loss": 4.774974635314941, + "test_acc": 0.01, + "lyapunov": 1.7011144554523556, + "grad_norm": 0.2659547607598113, + "grad_max_sv": 0.13555025830864906, + "grad_min_sv": 6.972633117993632e-11, + "grad_condition": 14291413228.467663, + "lr": 0.000871572412738697, + "time_sec": 132.14557480812073 + }, + { + "epoch": 36, + "train_loss": 4.471775978088379, + "train_acc": 0.02596, + "test_loss": 5.075145365905762, + "test_acc": 0.01, + "lyapunov": 1.6838966897686425, + "grad_norm": 0.26348784767210515, + "grad_max_sv": 0.1345422573387623, + "grad_min_sv": 1.3983107736550223e-10, + "grad_condition": 12903386886.183636, + "lr": 0.0008644843137107055, + "time_sec": 132.14007782936096 + }, + { + "epoch": 37, + "train_loss": 4.479115681304932, + "train_acc": 0.02618, + "test_loss": 4.726371655273438, + "test_acc": 0.01, + "lyapunov": 1.6780877332858113, + "grad_norm": 0.267538901796918, + "grad_max_sv": 0.13495051376521588, + "grad_min_sv": 6.580729305752577e-10, + "grad_condition": 12150689800.856388, + "lr": 0.0008572363398164014, + "time_sec": 132.15209221839905 + }, + { + "epoch": 38, + "train_loss": 4.478568660888672, + "train_acc": 0.02988, + "test_loss": 4.669603369140625, + "test_acc": 0.01, + "lyapunov": 1.666163631107496, + "grad_norm": 0.27272372501848424, + "grad_max_sv": 0.13440994173288345, + "grad_min_sv": 2.0660542240645324e-09, + "grad_condition": 3722412312.3171625, + "lr": 0.0008498316702566826, + "time_sec": 132.16476106643677 + }, + { + "epoch": 39, + "train_loss": 4.487948446044922, + "train_acc": 0.02578, + "test_loss": 4.682211064147949, + "test_acc": 0.0094, + "lyapunov": 1.6648545499957736, + "grad_norm": 0.2514286157801758, + "grad_max_sv": 0.11860510352998972, + "grad_min_sv": 4.3644481818254777e-10, + "grad_condition": 28131413125.823936, + "lr": 0.0008422735529643442, + "time_sec": 132.1238396167755 + }, + { + "epoch": 40, + "train_loss": 4.4965964364624025, + "train_acc": 0.02266, + "test_loss": 4.682315950012207, + "test_acc": 0.0065, + "lyapunov": 1.6533517648496896, + "grad_norm": 0.23799752688026737, + "grad_max_sv": 0.11859588380903005, + "grad_min_sv": 4.517485330074683e-12, + "grad_condition": 41227263318.357445, + "lr": 0.0008345653031794289, + "time_sec": 132.11933135986328 + }, + { + "epoch": 41, + "train_loss": 4.484913978118897, + "train_acc": 0.02434, + "test_loss": 5.27199638595581, + "test_acc": 0.0099, + "lyapunov": 1.6664402661725992, + "grad_norm": 0.2566848603997265, + "grad_max_sv": 0.1298685621470213, + "grad_min_sv": 2.1326498270807758e-10, + "grad_condition": 17297931540.42852, + "lr": 0.0008267103019950526, + "time_sec": 132.143639087677 + }, + { + "epoch": 42, + "train_loss": 4.468604016418457, + "train_acc": 0.02626, + "test_loss": 5.080777891540527, + "test_acc": 0.01, + "lyapunov": 1.6653691447909227, + "grad_norm": 0.2764724970011725, + "grad_max_sv": 0.1291674818491174, + "grad_min_sv": 2.4026422252279896e-10, + "grad_condition": 23562794758.6484, + "lr": 0.0008187119948743447, + "time_sec": 132.13302302360535 + }, + { + "epoch": 43, + "train_loss": 4.446361914978027, + "train_acc": 0.02884, + "test_loss": 5.657773085784912, + "test_acc": 0.01, + "lyapunov": 1.6601061516100792, + "grad_norm": 0.25862337095253085, + "grad_max_sv": 0.12544651236385107, + "grad_min_sv": 5.367278505023993e-10, + "grad_condition": 10343213894.571672, + "lr": 0.000810573890139155, + "time_sec": 132.15784335136414 + }, + { + "epoch": 44, + "train_loss": 4.449865913238526, + "train_acc": 0.02946, + "test_loss": 5.434759209442139, + "test_acc": 0.01, + "lyapunov": 1.6606884228299037, + "grad_norm": 0.2501064909683511, + "grad_max_sv": 0.11750353146344424, + "grad_min_sv": 1.2351212005197107e-09, + "grad_condition": 2224069634.7043643, + "lr": 0.0008022995574311873, + "time_sec": 132.12399125099182 + }, + { + "epoch": 45, + "train_loss": 4.446895042724609, + "train_acc": 0.03078, + "test_loss": 5.662740403747558, + "test_acc": 0.01, + "lyapunov": 1.6508479164079632, + "grad_norm": 0.2542409538334788, + "grad_max_sv": 0.11570314355194569, + "grad_min_sv": 2.1666247507906577e-09, + "grad_condition": 1071116412.2051876, + "lr": 0.0007938926261462363, + "time_sec": 132.11558651924133 + }, + { + "epoch": 46, + "train_loss": 4.429976853942871, + "train_acc": 0.03192, + "test_loss": 6.447593637084961, + "test_acc": 0.01, + "lyapunov": 1.6503230879068984, + "grad_norm": 0.2629192843171559, + "grad_max_sv": 0.11958245150744914, + "grad_min_sv": 2.3712545399456886e-09, + "grad_condition": 795552608.2400708, + "lr": 0.0007853567838422158, + "time_sec": 132.13859677314758 + }, + { + "epoch": 47, + "train_loss": 4.440141257476807, + "train_acc": 0.0315, + "test_loss": 6.175933732604981, + "test_acc": 0.01, + "lyapunov": 1.643082844021985, + "grad_norm": 0.25077715487573377, + "grad_max_sv": 0.11236163638532162, + "grad_min_sv": 1.9769814967645554e-09, + "grad_condition": 4225399967.4466867, + "lr": 0.0007766957746216719, + "time_sec": 132.15062427520752 + }, + { + "epoch": 48, + "train_loss": 4.432960889587402, + "train_acc": 0.03282, + "test_loss": 7.094407357025147, + "test_acc": 0.01, + "lyapunov": 1.6440330926719529, + "grad_norm": 0.2559939552032393, + "grad_max_sv": 0.11997251566499471, + "grad_min_sv": 1.7538637819883545e-09, + "grad_condition": 3837004229.4805055, + "lr": 0.0007679133974894982, + "time_sec": 132.150963306427 + }, + { + "epoch": 49, + "train_loss": 4.4246444262695315, + "train_acc": 0.03332, + "test_loss": 6.304141744995118, + "test_acc": 0.01, + "lyapunov": 1.6639957580420062, + "grad_norm": 0.2677119064717794, + "grad_max_sv": 0.12199657559394836, + "grad_min_sv": 2.0906602498033456e-09, + "grad_condition": 2737740786.830507, + "lr": 0.000759013504686565, + "time_sec": 132.123437166214 + }, + { + "epoch": 50, + "train_loss": 4.388952998504639, + "train_acc": 0.03744, + "test_loss": 5.989702935028077, + "test_acc": 0.01, + "lyapunov": 1.6675343476902798, + "grad_norm": 0.2684555234949212, + "grad_max_sv": 0.11272672358900308, + "grad_min_sv": 2.712914801529867e-09, + "grad_condition": 241378009.45196733, + "lr": 0.0007499999999999998, + "time_sec": 132.18075037002563 + }, + { + "epoch": 51, + "train_loss": 4.425981845855713, + "train_acc": 0.03336, + "test_loss": 7.33361047668457, + "test_acc": 0.01, + "lyapunov": 1.663260484900316, + "grad_norm": 0.23880288436504032, + "grad_max_sv": 0.10996924396604299, + "grad_min_sv": 1.0324483909303964e-09, + "grad_condition": 21905066283.747993, + "lr": 0.0007408768370508575, + "time_sec": 132.20320773124695 + }, + { + "epoch": 52, + "train_loss": 4.474253611450195, + "train_acc": 0.02502, + "test_loss": 6.494455329895019, + "test_acc": 0.01, + "lyapunov": 1.6608991122916532, + "grad_norm": 0.21753362561600204, + "grad_max_sv": 0.10691614132374525, + "grad_min_sv": 1.5011627757471705e-11, + "grad_condition": 43394603515.75684, + "lr": 0.0007316480175599307, + "time_sec": 132.25971579551697 + }, + { + "epoch": 53, + "train_loss": 4.456141750946045, + "train_acc": 0.02862, + "test_loss": 6.2588445053100585, + "test_acc": 0.01, + "lyapunov": 1.6519648303156313, + "grad_norm": 0.22382376691509692, + "grad_max_sv": 0.10342430509626865, + "grad_min_sv": 6.169010558440421e-10, + "grad_condition": 35234547156.053955, + "lr": 0.0007223175895924635, + "time_sec": 132.24691557884216 + }, + { + "epoch": 54, + "train_loss": 4.481432471771241, + "train_acc": 0.02352, + "test_loss": 7.138134167480469, + "test_acc": 0.01, + "lyapunov": 1.6530556858652998, + "grad_norm": 0.23466419364577004, + "grad_max_sv": 0.10738010462373496, + "grad_min_sv": 2.21828635072755e-10, + "grad_condition": 52124830959.794014, + "lr": 0.0007128896457825361, + "time_sec": 132.16068625450134 + }, + { + "epoch": 55, + "train_loss": 4.481100361480713, + "train_acc": 0.022, + "test_loss": 7.534436863708496, + "test_acc": 0.01, + "lyapunov": 1.6422339604638727, + "grad_norm": 0.2006843818925739, + "grad_max_sv": 0.10320896934717894, + "grad_min_sv": 1.4001555500584635e-12, + "grad_condition": 56896253352.46786, + "lr": 0.0007033683215378998, + "time_sec": 132.18253254890442 + }, + { + "epoch": 56, + "train_loss": 4.465066035308838, + "train_acc": 0.02478, + "test_loss": 8.372714093017578, + "test_acc": 0.01, + "lyapunov": 1.6449412500766842, + "grad_norm": 0.23729119573244947, + "grad_max_sv": 0.10855503529310226, + "grad_min_sv": 2.2295564792341074e-12, + "grad_condition": 48629747045.42187, + "lr": 0.0006937577932260512, + "time_sec": 132.19158124923706 + }, + { + "epoch": 57, + "train_loss": 4.44365045288086, + "train_acc": 0.02604, + "test_loss": 8.35657233428955, + "test_acc": 0.01, + "lyapunov": 1.6452401361197158, + "grad_norm": 0.2245469225888597, + "grad_max_sv": 0.11490330714732408, + "grad_min_sv": 4.570529843944725e-12, + "grad_condition": 30449041453.168568, + "lr": 0.0006840622763423388, + "time_sec": 132.28182673454285 + }, + { + "epoch": 58, + "train_loss": 4.435514926147461, + "train_acc": 0.02592, + "test_loss": 7.728030586242676, + "test_acc": 0.01, + "lyapunov": 1.6485694628542342, + "grad_norm": 0.24858691157522766, + "grad_max_sv": 0.11334360390901566, + "grad_min_sv": 6.15407037006158e-12, + "grad_condition": 42417111885.625084, + "lr": 0.0006742860236609073, + "time_sec": 132.19542050361633 + }, + { + "epoch": 59, + "train_loss": 4.423215726165772, + "train_acc": 0.02842, + "test_loss": 7.240084691619873, + "test_acc": 0.01, + "lyapunov": 1.6464358674900612, + "grad_norm": 0.22968346464590486, + "grad_max_sv": 0.11179302539676428, + "grad_min_sv": 8.359720202319107e-12, + "grad_condition": 30290262945.665997, + "lr": 0.0006644333233692913, + "time_sec": 132.14637756347656 + }, + { + "epoch": 60, + "train_loss": 4.4195901382446285, + "train_acc": 0.02862, + "test_loss": 6.608919538879395, + "test_acc": 0.01, + "lyapunov": 1.6463265995235394, + "grad_norm": 0.2265519248830367, + "grad_max_sv": 0.11119911409914493, + "grad_min_sv": 8.317048035656272e-12, + "grad_condition": 30940581230.279675, + "lr": 0.0006545084971874734, + "time_sec": 132.19125843048096 + }, + { + "epoch": 61, + "train_loss": 4.417482298431397, + "train_acc": 0.02964, + "test_loss": 7.226232168579101, + "test_acc": 0.01, + "lyapunov": 1.6559016469799344, + "grad_norm": 0.22328050027519591, + "grad_max_sv": 0.10708067342638969, + "grad_min_sv": 6.643318285144196e-12, + "grad_condition": 27586814388.82783, + "lr": 0.0006445158984722354, + "time_sec": 132.20896816253662 + }, + { + "epoch": 62, + "train_loss": 4.417002453308106, + "train_acc": 0.03006, + "test_loss": 7.585696318054199, + "test_acc": 0.01, + "lyapunov": 1.6613401942850683, + "grad_norm": 0.22320537548539296, + "grad_max_sv": 0.10366554521024227, + "grad_min_sv": 1.0478788054824918e-11, + "grad_condition": 26948870287.17867, + "lr": 0.0006344599103076324, + "time_sec": 132.14733290672302 + }, + { + "epoch": 63, + "train_loss": 4.385719082489014, + "train_acc": 0.03458, + "test_loss": 5.228900546264648, + "test_acc": 0.01, + "lyapunov": 1.6645121260372269, + "grad_norm": 0.24853253845087553, + "grad_max_sv": 0.11708337739109993, + "grad_min_sv": 6.967468372327139e-10, + "grad_condition": 10567682701.05836, + "lr": 0.0006243449435824269, + "time_sec": 132.29192066192627 + }, + { + "epoch": 64, + "train_loss": 4.404363639678955, + "train_acc": 0.03296, + "test_loss": 4.7274385276794435, + "test_acc": 0.01, + "lyapunov": 1.6773027696877794, + "grad_norm": 0.7690147759354938, + "grad_max_sv": 0.10654795486257171, + "grad_min_sv": 1.971293366237014e-09, + "grad_condition": 13907648097.405878, + "lr": 0.0006141754350553275, + "time_sec": 132.13429880142212 + }, + { + "epoch": 65, + "train_loss": 4.558996030426026, + "train_acc": 0.01586, + "test_loss": 4.642805049133301, + "test_acc": 0.01, + "lyapunov": 1.8215271088168443, + "grad_norm": 0.16748472313271695, + "grad_max_sv": 0.1105620770715177, + "grad_min_sv": 8.787289494739994e-14, + "grad_condition": 102651332408.88431, + "lr": 0.0006039558454088793, + "time_sec": 132.16812777519226 + }, + { + "epoch": 66, + "train_loss": 4.543730935058594, + "train_acc": 0.01844, + "test_loss": 4.649595483398437, + "test_acc": 0.01, + "lyapunov": 1.8075619405492798, + "grad_norm": 0.19988328524296653, + "grad_max_sv": 0.12379183731973172, + "grad_min_sv": 1.04127554881492e-13, + "grad_condition": 112836624201.79141, + "lr": 0.000593690657292862, + "time_sec": 132.21350002288818 + }, + { + "epoch": 67, + "train_loss": 4.542862183990478, + "train_acc": 0.0185, + "test_loss": 4.6684130096435545, + "test_acc": 0.01, + "lyapunov": 1.8110374151288395, + "grad_norm": 0.20198224436322607, + "grad_max_sv": 0.12510044891387223, + "grad_min_sv": 1.6897107442398038e-13, + "grad_condition": 110315569576.42929, + "lr": 0.0005833843733580507, + "time_sec": 132.21303582191467 + }, + { + "epoch": 68, + "train_loss": 4.533297353515625, + "train_acc": 0.01836, + "test_loss": 4.948698665618896, + "test_acc": 0.01, + "lyapunov": 1.8091393379908998, + "grad_norm": 0.20393830283581765, + "grad_max_sv": 0.12409924473613501, + "grad_min_sv": 1.9688814026908198e-13, + "grad_condition": 106600141201.27957, + "lr": 0.0005730415142812054, + "time_sec": 132.2160370349884 + }, + { + "epoch": 69, + "train_loss": 4.524203167419434, + "train_acc": 0.01924, + "test_loss": 5.146536360931396, + "test_acc": 0.01, + "lyapunov": 1.745428860035089, + "grad_norm": 0.21505692197339663, + "grad_max_sv": 0.1343175122514367, + "grad_min_sv": 4.1179497063756466e-13, + "grad_condition": 104835550128.83902, + "lr": 0.0005626666167821517, + "time_sec": 132.1414828300476 + }, + { + "epoch": 70, + "train_loss": 4.517985006103515, + "train_acc": 0.02132, + "test_loss": 5.5230685882568356, + "test_acc": 0.01, + "lyapunov": 1.7269622227724861, + "grad_norm": 0.21930603503908438, + "grad_max_sv": 0.12969524934887885, + "grad_min_sv": 5.027037874784802e-13, + "grad_condition": 94485385916.61972, + "lr": 0.0005522642316338265, + "time_sec": 132.12957501411438 + }, + { + "epoch": 71, + "train_loss": 4.513141716461182, + "train_acc": 0.02148, + "test_loss": 5.14728856048584, + "test_acc": 0.01, + "lyapunov": 1.7201101194562205, + "grad_norm": 0.2108768945832789, + "grad_max_sv": 0.1154132118448615, + "grad_min_sv": 4.582415659043439e-13, + "grad_condition": 86628312707.01842, + "lr": 0.0005418389216661573, + "time_sec": 132.16575050354004 + }, + { + "epoch": 72, + "train_loss": 4.518121377105713, + "train_acc": 0.02086, + "test_loss": 5.867084600830078, + "test_acc": 0.01, + "lyapunov": 1.7361170272997883, + "grad_norm": 0.2013470383123874, + "grad_max_sv": 0.11099338140338659, + "grad_min_sv": 7.679591307357047e-13, + "grad_condition": 71594062592.2271, + "lr": 0.0005313952597646563, + "time_sec": 132.19545316696167 + }, + { + "epoch": 73, + "train_loss": 4.523569106903076, + "train_acc": 0.02002, + "test_loss": 5.884369519042969, + "test_acc": 0.01, + "lyapunov": 1.7111626808600657, + "grad_norm": 0.1862626190339828, + "grad_max_sv": 0.0956994505599141, + "grad_min_sv": 5.615634920372618e-13, + "grad_condition": 67775819992.42169, + "lr": 0.0005209378268645994, + "time_sec": 132.16929745674133 + }, + { + "epoch": 74, + "train_loss": 4.524184910888672, + "train_acc": 0.0207, + "test_loss": 6.031040227508545, + "test_acc": 0.01, + "lyapunov": 1.7097601433239324, + "grad_norm": 0.1884016511929612, + "grad_max_sv": 0.09857390448451042, + "grad_min_sv": 4.2370344190951513e-13, + "grad_condition": 75293714883.4113, + "lr": 0.0005104712099416781, + "time_sec": 132.1468484401703 + }, + { + "epoch": 75, + "train_loss": 4.520278462219238, + "train_acc": 0.02068, + "test_loss": 6.038993734741211, + "test_acc": 0.01, + "lyapunov": 1.7097111705623929, + "grad_norm": 0.18388358122389875, + "grad_max_sv": 0.09903657622635365, + "grad_min_sv": 3.207687284743533e-13, + "grad_condition": 77688785793.72481, + "lr": 0.0004999999999999996, + "time_sec": 132.16273522377014 + }, + { + "epoch": 76, + "train_loss": 4.519440199432373, + "train_acc": 0.02034, + "test_loss": 6.213510666656494, + "test_acc": 0.01, + "lyapunov": 1.7116832178267067, + "grad_norm": 0.1858679701216664, + "grad_max_sv": 0.09789907988160848, + "grad_min_sv": 6.112542465882311e-13, + "grad_condition": 68567172089.116356, + "lr": 0.0004895287900583212, + "time_sec": 132.1939127445221 + }, + { + "epoch": 77, + "train_loss": 4.518037851409912, + "train_acc": 0.0214, + "test_loss": 5.786403080749512, + "test_acc": 0.01, + "lyapunov": 1.7145553226666073, + "grad_norm": 0.18574695316884535, + "grad_max_sv": 0.09128198456019163, + "grad_min_sv": 4.946589302257e-13, + "grad_condition": 67591746834.44646, + "lr": 0.0004790621731353997, + "time_sec": 132.15240120887756 + }, + { + "epoch": 78, + "train_loss": 4.501732761535645, + "train_acc": 0.02256, + "test_loss": 5.505255569458008, + "test_acc": 0.01, + "lyapunov": 1.7250188009818193, + "grad_norm": 0.19980626014881434, + "grad_max_sv": 0.09609800074249505, + "grad_min_sv": 1.0398673891179978e-12, + "grad_condition": 57566435538.51784, + "lr": 0.000468604740235343, + "time_sec": 132.12926125526428 + }, + { + "epoch": 79, + "train_loss": 4.501669064941407, + "train_acc": 0.02324, + "test_loss": 6.070380794525146, + "test_acc": 0.01, + "lyapunov": 1.735146647524041, + "grad_norm": 0.20106875052773868, + "grad_max_sv": 0.09831586424261332, + "grad_min_sv": 9.935335330325552e-13, + "grad_condition": 58796511684.76035, + "lr": 0.00045816107833384175, + "time_sec": 132.16433572769165 + }, + { + "epoch": 80, + "train_loss": 4.4981083242797855, + "train_acc": 0.0241, + "test_loss": 5.620106427001953, + "test_acc": 0.01, + "lyapunov": 1.7485203517367467, + "grad_norm": 0.20191528885284654, + "grad_max_sv": 0.10116043519228697, + "grad_min_sv": 9.397264041022328e-13, + "grad_condition": 60757002594.674866, + "lr": 0.0004477357683661729, + "time_sec": 132.17495608329773 + }, + { + "epoch": 81, + "train_loss": 4.493218509216309, + "train_acc": 0.02376, + "test_loss": 5.300303136444092, + "test_acc": 0.01, + "lyapunov": 1.6853597962947757, + "grad_norm": 0.20823744684579867, + "grad_max_sv": 0.10085432399064302, + "grad_min_sv": 1.8721769452817893e-12, + "grad_condition": 48739518835.89932, + "lr": 0.00043733338321784746, + "time_sec": 132.22597217559814 + }, + { + "epoch": 82, + "train_loss": 4.491092452697754, + "train_acc": 0.0244, + "test_loss": 5.484540922546387, + "test_acc": 0.01, + "lyapunov": 1.6777428748357632, + "grad_norm": 0.2050457380120937, + "grad_max_sv": 0.1014392027631402, + "grad_min_sv": 1.6302461105309582e-12, + "grad_condition": 48298106057.62421, + "lr": 0.0004269584857187939, + "time_sec": 132.1523575782776 + }, + { + "epoch": 83, + "train_loss": 4.488150163726806, + "train_acc": 0.0244, + "test_loss": 5.661939654541015, + "test_acc": 0.01, + "lyapunov": 1.6749736963940398, + "grad_norm": 0.20418321117537733, + "grad_max_sv": 0.09827770255506038, + "grad_min_sv": 1.251075866354586e-12, + "grad_condition": 57969859270.98726, + "lr": 0.0004166156266419484, + "time_sec": 132.168292760849 + }, + { + "epoch": 84, + "train_loss": 4.488186374206543, + "train_acc": 0.02342, + "test_loss": 5.563153546142578, + "test_acc": 0.01, + "lyapunov": 1.674497790043921, + "grad_norm": 0.2035608057982943, + "grad_max_sv": 0.10094663016498089, + "grad_min_sv": 2.0619277823357323e-12, + "grad_condition": 48466905022.9367, + "lr": 0.0004063093427071373, + "time_sec": 132.16950011253357 + }, + { + "epoch": 85, + "train_loss": 4.485201366271973, + "train_acc": 0.0241, + "test_loss": 5.480735997772217, + "test_acc": 0.01, + "lyapunov": 1.6744796751100388, + "grad_norm": 0.20427635969499436, + "grad_max_sv": 0.09893963132053614, + "grad_min_sv": 1.3937446199220963e-12, + "grad_condition": 52585051637.81031, + "lr": 0.0003960441545911199, + "time_sec": 132.16970133781433 + }, + { + "epoch": 86, + "train_loss": 4.471947127380371, + "train_acc": 0.0246, + "test_loss": 6.341788235473633, + "test_acc": 0.01, + "lyapunov": 1.7030728238317974, + "grad_norm": 0.23549883852282946, + "grad_max_sv": 0.10309729054570198, + "grad_min_sv": 1.865658646350171e-12, + "grad_condition": 50287808814.10475, + "lr": 0.0003858245649446718, + "time_sec": 132.15209889411926 + }, + { + "epoch": 87, + "train_loss": 4.45871408706665, + "train_acc": 0.02508, + "test_loss": 6.5574141830444335, + "test_acc": 0.01, + "lyapunov": 1.7015497336912033, + "grad_norm": 0.20706345186144237, + "grad_max_sv": 0.10086965002119541, + "grad_min_sv": 2.0960061870473903e-12, + "grad_condition": 44893407653.08879, + "lr": 0.00037565505641757235, + "time_sec": 132.1981644630432 + }, + { + "epoch": 88, + "train_loss": 4.4560191854858395, + "train_acc": 0.02594, + "test_loss": 6.111994355773926, + "test_acc": 0.01, + "lyapunov": 1.7030071026224005, + "grad_norm": 0.2056716140989914, + "grad_max_sv": 0.09794572051614522, + "grad_min_sv": 3.489873766253165e-12, + "grad_condition": 37468804044.8835, + "lr": 0.00036554008969236695, + "time_sec": 132.18566298484802 + }, + { + "epoch": 89, + "train_loss": 4.466955214233399, + "train_acc": 0.02466, + "test_loss": 7.051888754272461, + "test_acc": 0.01, + "lyapunov": 1.682900452552854, + "grad_norm": 0.1940717753557399, + "grad_max_sv": 0.09164916388690472, + "grad_min_sv": 1.4839058306084107e-12, + "grad_condition": 48362788591.79397, + "lr": 0.0003554841015277638, + "time_sec": 132.16932582855225 + }, + { + "epoch": 90, + "train_loss": 4.48257959991455, + "train_acc": 0.02168, + "test_loss": 8.26663565673828, + "test_acc": 0.01, + "lyapunov": 1.6648904085159302, + "grad_norm": 0.18466858617264814, + "grad_max_sv": 0.08782129287719727, + "grad_min_sv": 9.054104359032705e-13, + "grad_condition": 55234893471.5977, + "lr": 0.000345491502812526, + "time_sec": 132.1772141456604 + }, + { + "epoch": 91, + "train_loss": 4.476146142120362, + "train_acc": 0.02456, + "test_loss": 9.070208990478516, + "test_acc": 0.01, + "lyapunov": 1.6594186563930853, + "grad_norm": 0.18755828093129312, + "grad_max_sv": 0.08745833095163107, + "grad_min_sv": 1.2909392503343921e-12, + "grad_condition": 50892831636.92212, + "lr": 0.0003355666766307081, + "time_sec": 132.27485394477844 + }, + { + "epoch": 92, + "train_loss": 4.486352113952637, + "train_acc": 0.02176, + "test_loss": 8.653399160766602, + "test_acc": 0.0102, + "lyapunov": 1.6659517510772666, + "grad_norm": 0.1792378899563532, + "grad_max_sv": 0.08171754404902458, + "grad_min_sv": 7.820352245418777e-13, + "grad_condition": 52421997853.347336, + "lr": 0.00032571397633909225, + "time_sec": 132.17684316635132 + }, + { + "epoch": 93, + "train_loss": 4.493307136535645, + "train_acc": 0.02156, + "test_loss": 8.168136666870117, + "test_acc": 0.01, + "lyapunov": 1.6586454442090086, + "grad_norm": 0.17235526056914746, + "grad_max_sv": 0.07756552556529642, + "grad_min_sv": 7.947691420212043e-13, + "grad_condition": 49300927673.13883, + "lr": 0.00031593772365766094, + "time_sec": 132.19673776626587 + }, + { + "epoch": 94, + "train_loss": 4.49889531829834, + "train_acc": 0.0203, + "test_loss": 8.989650103759766, + "test_acc": 0.01, + "lyapunov": 1.6598583097043245, + "grad_norm": 0.1936371985956393, + "grad_max_sv": 0.07813195139169693, + "grad_min_sv": 5.93403713321534e-13, + "grad_condition": 55312577703.14712, + "lr": 0.0003062422067739483, + "time_sec": 132.24237537384033 + }, + { + "epoch": 95, + "train_loss": 4.492598588867187, + "train_acc": 0.0215, + "test_loss": 7.961930172729492, + "test_acc": 0.01, + "lyapunov": 1.6501619547529294, + "grad_norm": 0.17022870698506898, + "grad_max_sv": 0.07985126227140427, + "grad_min_sv": 7.433303273493305e-13, + "grad_condition": 52713816577.99087, + "lr": 0.00029663167846209965, + "time_sec": 132.14930176734924 + }, + { + "epoch": 96, + "train_loss": 4.489167682800293, + "train_acc": 0.0212, + "test_loss": 9.875268710327148, + "test_acc": 0.01, + "lyapunov": 1.6512981820899202, + "grad_norm": 0.17077151687298275, + "grad_max_sv": 0.08098559230566024, + "grad_min_sv": 7.203028542340039e-13, + "grad_condition": 55167315362.48393, + "lr": 0.00028711035421746345, + "time_sec": 132.15733528137207 + }, + { + "epoch": 97, + "train_loss": 4.488607182769775, + "train_acc": 0.0208, + "test_loss": 9.499038198852539, + "test_acc": 0.01, + "lyapunov": 1.6502791972416442, + "grad_norm": 0.17108539080702187, + "grad_max_sv": 0.07986859362572432, + "grad_min_sv": 6.120358092673219e-13, + "grad_condition": 53300232476.72379, + "lr": 0.00027768241040753615, + "time_sec": 132.24549341201782 + }, + { + "epoch": 98, + "train_loss": 4.4901776986694335, + "train_acc": 0.02154, + "test_loss": 8.216125820922851, + "test_acc": 0.01, + "lyapunov": 1.6494739058682375, + "grad_norm": 0.16951910310360138, + "grad_max_sv": 0.07793897418305278, + "grad_min_sv": 6.258507944948885e-13, + "grad_condition": 51950548109.229416, + "lr": 0.00026835198244006903, + "time_sec": 132.17059445381165 + }, + { + "epoch": 99, + "train_loss": 4.491983847351074, + "train_acc": 0.02168, + "test_loss": 8.09697102355957, + "test_acc": 0.01, + "lyapunov": 1.6644236773176266, + "grad_norm": 0.17033780677205843, + "grad_max_sv": 0.0777206091210246, + "grad_min_sv": 9.776283290056205e-13, + "grad_condition": 48345596943.6561, + "lr": 0.0002591231629491421, + "time_sec": 132.22015237808228 + }, + { + "epoch": 100, + "train_loss": 4.491883171386719, + "train_acc": 0.02156, + "test_loss": 9.202599882507323, + "test_acc": 0.01, + "lyapunov": 1.676265578440693, + "grad_norm": 0.16987071721382468, + "grad_max_sv": 0.07617421075701714, + "grad_min_sv": 9.138110471633042e-13, + "grad_condition": 45716951113.780594, + "lr": 0.0002499999999999997, + "time_sec": 132.17183017730713 + }, + { + "epoch": 101, + "train_loss": 4.502107236328125, + "train_acc": 0.02148, + "test_loss": 8.877014265441895, + "test_acc": 0.01, + "lyapunov": 1.6693046135670693, + "grad_norm": 0.16216294695961178, + "grad_max_sv": 0.06937387129291891, + "grad_min_sv": 6.833370538703013e-13, + "grad_condition": 45861961359.593346, + "lr": 0.00024098649531343477, + "time_sec": 132.23760414123535 + }, + { + "epoch": 102, + "train_loss": 4.499898295898437, + "train_acc": 0.02174, + "test_loss": 8.436487481689452, + "test_acc": 0.01, + "lyapunov": 1.6575999412390277, + "grad_norm": 0.1640898699770385, + "grad_max_sv": 0.07209301171824337, + "grad_min_sv": 5.67201842765988e-13, + "grad_condition": 50399333888.00142, + "lr": 0.0002320866025105016, + "time_sec": 132.28947830200195 + }, + { + "epoch": 103, + "train_loss": 4.49589670135498, + "train_acc": 0.02166, + "test_loss": 8.791377081298828, + "test_acc": 0.01, + "lyapunov": 1.6821342990221575, + "grad_norm": 0.1642275448165301, + "grad_max_sv": 0.07227097311988473, + "grad_min_sv": 8.173785106263955e-13, + "grad_condition": 46969951461.32619, + "lr": 0.0002233042253783278, + "time_sec": 132.1418879032135 + }, + { + "epoch": 104, + "train_loss": 4.485214436340332, + "train_acc": 0.0218, + "test_loss": 7.897974142456055, + "test_acc": 0.01, + "lyapunov": 1.678378782308925, + "grad_norm": 0.22118138085111713, + "grad_max_sv": 0.08063290994614362, + "grad_min_sv": 7.583065334713665e-13, + "grad_condition": 51857595723.53325, + "lr": 0.000214643216157784, + "time_sec": 132.1506576538086 + }, + { + "epoch": 105, + "train_loss": 4.469979349365234, + "train_acc": 0.02326, + "test_loss": 8.37761021118164, + "test_acc": 0.01, + "lyapunov": 1.6728657965769853, + "grad_norm": 0.17551703666999802, + "grad_max_sv": 0.0846982304006815, + "grad_min_sv": 1.0180233818444844e-12, + "grad_condition": 49287737749.07934, + "lr": 0.00020610737385376332, + "time_sec": 132.18390417099 + }, + { + "epoch": 106, + "train_loss": 4.473400472564697, + "train_acc": 0.02402, + "test_loss": 7.748300148010254, + "test_acc": 0.01, + "lyapunov": 1.6795688824885338, + "grad_norm": 0.17847414349700472, + "grad_max_sv": 0.08211751151829957, + "grad_min_sv": 9.852367027585543e-13, + "grad_condition": 50172782007.06673, + "lr": 0.00019770044256881242, + "time_sec": 132.18465375900269 + }, + { + "epoch": 107, + "train_loss": 4.470222578125, + "train_acc": 0.0236, + "test_loss": 8.448894213867188, + "test_acc": 0.01, + "lyapunov": 1.6689351574539224, + "grad_norm": 0.20809152753228893, + "grad_max_sv": 0.08809565398842097, + "grad_min_sv": 8.603923254027034e-13, + "grad_condition": 57999001174.971756, + "lr": 0.0001894261098608447, + "time_sec": 132.17956495285034 + }, + { + "epoch": 108, + "train_loss": 4.459717525024414, + "train_acc": 0.02268, + "test_loss": 8.36234213104248, + "test_acc": 0.01, + "lyapunov": 1.644672902343828, + "grad_norm": 0.1764653926066368, + "grad_max_sv": 0.08436396401375532, + "grad_min_sv": 1.1760666999790127e-12, + "grad_condition": 48331131760.11851, + "lr": 0.000181288005125655, + "time_sec": 132.16263604164124 + }, + { + "epoch": 109, + "train_loss": 4.45738801651001, + "train_acc": 0.0224, + "test_loss": 9.078446282958984, + "test_acc": 0.01, + "lyapunov": 1.6396975398368543, + "grad_norm": 0.17670685100672429, + "grad_max_sv": 0.08786458019167184, + "grad_min_sv": 8.563761716652081e-13, + "grad_condition": 57350066983.85077, + "lr": 0.0001732896980049473, + "time_sec": 132.1655683517456 + }, + { + "epoch": 110, + "train_loss": 4.4555519541931154, + "train_acc": 0.02452, + "test_loss": 8.74792897491455, + "test_acc": 0.01, + "lyapunov": 1.6595004513440534, + "grad_norm": 0.17949574405885257, + "grad_max_sv": 0.08448744211345911, + "grad_min_sv": 1.3969123108783706e-12, + "grad_condition": 44076467962.04108, + "lr": 0.00016543469682057076, + "time_sec": 132.23805284500122 + }, + { + "epoch": 111, + "train_loss": 4.452196352539063, + "train_acc": 0.02374, + "test_loss": 8.00354757232666, + "test_acc": 0.01, + "lyapunov": 1.6580178502880398, + "grad_norm": 0.17995085401659994, + "grad_max_sv": 0.08801313545554876, + "grad_min_sv": 1.216669788614879e-12, + "grad_condition": 50895520703.46747, + "lr": 0.00015772644703565552, + "time_sec": 132.17279314994812 + }, + { + "epoch": 112, + "train_loss": 4.448547237548828, + "train_acc": 0.02418, + "test_loss": 9.011292713928222, + "test_acc": 0.01, + "lyapunov": 1.6592172176941582, + "grad_norm": 0.18251147032098386, + "grad_max_sv": 0.08963290825486184, + "grad_min_sv": 1.4949865538305105e-12, + "grad_condition": 48228429173.65173, + "lr": 0.00015016832974331713, + "time_sec": 132.16365575790405 + }, + { + "epoch": 113, + "train_loss": 4.44851509475708, + "train_acc": 0.024, + "test_loss": 7.425234848022461, + "test_acc": 0.01, + "lyapunov": 1.6541204080557275, + "grad_norm": 0.17988180288453134, + "grad_max_sv": 0.08577104695141316, + "grad_min_sv": 1.7064885513720195e-12, + "grad_condition": 42496707596.45669, + "lr": 0.00014276366018359834, + "time_sec": 132.17237329483032 + }, + { + "epoch": 114, + "train_loss": 4.4484559083557125, + "train_acc": 0.0247, + "test_loss": 7.573656594848633, + "test_acc": 0.01, + "lyapunov": 1.6490926172422327, + "grad_norm": 0.17961098442925355, + "grad_max_sv": 0.086801771633327, + "grad_min_sv": 1.846744935242827e-12, + "grad_condition": 41227142123.03452, + "lr": 0.00013551568628929425, + "time_sec": 132.22268390655518 + }, + { + "epoch": 115, + "train_loss": 4.447767953491211, + "train_acc": 0.0244, + "test_loss": 7.697570289611816, + "test_acc": 0.01, + "lyapunov": 1.6411334446933874, + "grad_norm": 0.17899446180570205, + "grad_max_sv": 0.08778086788952351, + "grad_min_sv": 1.912777123157754e-12, + "grad_condition": 44133900284.67078, + "lr": 0.00012842758726130276, + "time_sec": 132.18531441688538 + }, + { + "epoch": 116, + "train_loss": 4.447214733581543, + "train_acc": 0.02514, + "test_loss": 8.197078015136718, + "test_acc": 0.01, + "lyapunov": 1.6453799378231664, + "grad_norm": 0.17838449775067347, + "grad_max_sv": 0.08597556184977292, + "grad_min_sv": 1.2002783937589755e-12, + "grad_condition": 48052209169.14538, + "lr": 0.0001215024721741218, + "time_sec": 132.20826029777527 + }, + { + "epoch": 117, + "train_loss": 4.445804840393066, + "train_acc": 0.02476, + "test_loss": 7.459493585205078, + "test_acc": 0.01, + "lyapunov": 1.6700239077858303, + "grad_norm": 0.17826309113638003, + "grad_max_sv": 0.08523292336612939, + "grad_min_sv": 1.43561713598312e-12, + "grad_condition": 43897229051.608284, + "lr": 0.00011474337861210538, + "time_sec": 132.27570056915283 + }, + { + "epoch": 118, + "train_loss": 4.44613270904541, + "train_acc": 0.02494, + "test_loss": 7.857499731445312, + "test_acc": 0.01, + "lyapunov": 1.634896194538497, + "grad_norm": 0.17842754835213456, + "grad_max_sv": 0.08666675891727209, + "grad_min_sv": 1.7234741086537276e-12, + "grad_condition": 39879322556.25903, + "lr": 0.00010815327133708009, + "time_sec": 132.14366149902344 + }, + { + "epoch": 119, + "train_loss": 4.453590765686035, + "train_acc": 0.02506, + "test_loss": 9.074451724243165, + "test_acc": 0.01, + "lyapunov": 1.6355371264850391, + "grad_norm": 0.17703387614060243, + "grad_max_sv": 0.08299594167619943, + "grad_min_sv": 1.0971823872512062e-12, + "grad_condition": 47469697165.520645, + "lr": 0.00010173504098790182, + "time_sec": 132.20703506469727 + }, + { + "epoch": 120, + "train_loss": 4.449643159942627, + "train_acc": 0.02384, + "test_loss": 7.864449021911621, + "test_acc": 0.01, + "lyapunov": 1.626808090892899, + "grad_norm": 0.17535649768391584, + "grad_max_sv": 0.08262888118624687, + "grad_min_sv": 1.3016816308302772e-12, + "grad_condition": 43366132426.244, + "lr": 9.549150281252629e-05, + "time_sec": 132.15547442436218 + }, + { + "epoch": 121, + "train_loss": 4.447579947814941, + "train_acc": 0.0251, + "test_loss": 8.218537933349609, + "test_acc": 0.01, + "lyapunov": 1.6481489638233429, + "grad_norm": 0.17575759558855317, + "grad_max_sv": 0.07947007808834314, + "grad_min_sv": 1.2257565823825079e-12, + "grad_condition": 42809654336.64394, + "lr": 8.942539543314794e-05, + "time_sec": 132.21557140350342 + }, + { + "epoch": 122, + "train_loss": 4.451288205871582, + "train_acc": 0.02486, + "test_loss": 9.786827795410156, + "test_acc": 0.01, + "lyapunov": 1.634647862685611, + "grad_norm": 0.1748657725986785, + "grad_max_sv": 0.0811953267082572, + "grad_min_sv": 1.232418852351204e-12, + "grad_condition": 45425996224.86906, + "lr": 8.353937964495024e-05, + "time_sec": 132.58023762702942 + }, + { + "epoch": 123, + "train_loss": 4.45665797164917, + "train_acc": 0.02292, + "test_loss": 8.08002472076416, + "test_acc": 0.01, + "lyapunov": 1.640638170034989, + "grad_norm": 0.19951484695796856, + "grad_max_sv": 0.0797580998390913, + "grad_min_sv": 1.1283924413595944e-12, + "grad_condition": 45899924461.005104, + "lr": 7.783603724899243e-05, + "time_sec": 132.2773494720459 + }, + { + "epoch": 124, + "train_loss": 4.452873533630371, + "train_acc": 0.02336, + "test_loss": 9.092270526123047, + "test_acc": 0.01, + "lyapunov": 1.6443614947521472, + "grad_norm": 0.17315643932230268, + "grad_max_sv": 0.0823759377002716, + "grad_min_sv": 1.3724199566157753e-12, + "grad_condition": 48335702196.43469, + "lr": 7.231786991974666e-05, + "time_sec": 132.3210871219635 + }, + { + "epoch": 125, + "train_loss": 4.4542430857849125, + "train_acc": 0.02352, + "test_loss": 8.764940815734864, + "test_acc": 0.01, + "lyapunov": 1.663006810885866, + "grad_norm": 0.19582765959122034, + "grad_max_sv": 0.081761784106493, + "grad_min_sv": 8.076158731506219e-13, + "grad_condition": 51379464353.44197, + "lr": 6.698729810778072e-05, + "time_sec": 132.4144446849823 + }, + { + "epoch": 126, + "train_loss": 4.449181112213135, + "train_acc": 0.02354, + "test_loss": 8.464842572021483, + "test_acc": 0.01, + "lyapunov": 1.6743557538522784, + "grad_norm": 0.17141955117067212, + "grad_max_sv": 0.08278838153928518, + "grad_min_sv": 9.343163889556585e-13, + "grad_condition": 50028040865.10504, + "lr": 6.184665997806817e-05, + "time_sec": 132.24264407157898 + }, + { + "epoch": 127, + "train_loss": 4.448994424133301, + "train_acc": 0.02352, + "test_loss": 8.130727629089355, + "test_acc": 0.01, + "lyapunov": 1.6350413380986284, + "grad_norm": 0.17329659307204753, + "grad_max_sv": 0.08032873682677746, + "grad_min_sv": 1.1334150344781164e-12, + "grad_condition": 45698735238.160416, + "lr": 5.6898210384392595e-05, + "time_sec": 132.1239423751831 + }, + { + "epoch": 128, + "train_loss": 4.450544538269043, + "train_acc": 0.02434, + "test_loss": 8.467534092712402, + "test_acc": 0.01, + "lyapunov": 1.6441292976174513, + "grad_norm": 0.17372897225844472, + "grad_max_sv": 0.08003925699740648, + "grad_min_sv": 1.37686231795248e-12, + "grad_condition": 42113279225.534874, + "lr": 5.214411988029363e-05, + "time_sec": 132.30834007263184 + }, + { + "epoch": 129, + "train_loss": 4.450699962158203, + "train_acc": 0.02354, + "test_loss": 9.638625686645508, + "test_acc": 0.01, + "lyapunov": 1.6521275854476578, + "grad_norm": 0.17278236638845632, + "grad_max_sv": 0.0785352012142539, + "grad_min_sv": 1.2115131568787917e-12, + "grad_condition": 42101040125.73087, + "lr": 4.7586473766990294e-05, + "time_sec": 132.2434434890747 + }, + { + "epoch": 130, + "train_loss": 4.455087382965088, + "train_acc": 0.02386, + "test_loss": 8.756081176757812, + "test_acc": 0.01, + "lyapunov": 1.6631780207309577, + "grad_norm": 0.17377142693511546, + "grad_max_sv": 0.08205142095685006, + "grad_min_sv": 7.963760756481321e-13, + "grad_condition": 52011409179.79567, + "lr": 4.32272711786996e-05, + "time_sec": 132.2769739627838 + }, + { + "epoch": 131, + "train_loss": 4.434134347686768, + "train_acc": 0.02574, + "test_loss": 7.352558810424805, + "test_acc": 0.01, + "lyapunov": 1.6523698214679727, + "grad_norm": 0.20773326710793708, + "grad_max_sv": 0.08667766228318215, + "grad_min_sv": 1.919706897523786e-12, + "grad_condition": 42704655554.58238, + "lr": 3.906842420574966e-05, + "time_sec": 132.55578327178955 + }, + { + "epoch": 132, + "train_loss": 4.4243296493530275, + "train_acc": 0.02678, + "test_loss": 7.780651908874511, + "test_acc": 0.01, + "lyapunov": 1.6417261416954763, + "grad_norm": 0.21158187573943782, + "grad_max_sv": 0.09079265538603068, + "grad_min_sv": 2.443299247835716e-12, + "grad_condition": 37955657652.24723, + "lr": 3.5111757055874305e-05, + "time_sec": 132.18799567222595 + }, + { + "epoch": 133, + "train_loss": 4.422502294006348, + "train_acc": 0.02692, + "test_loss": 7.376312741088867, + "test_acc": 0.01, + "lyapunov": 1.6381114767030682, + "grad_norm": 0.18790104013196945, + "grad_max_sv": 0.09083432145416737, + "grad_min_sv": 3.798563978689657e-12, + "grad_condition": 27418807522.98039, + "lr": 3.1359005254054254e-05, + "time_sec": 132.15543341636658 + }, + { + "epoch": 134, + "train_loss": 4.422092590026855, + "train_acc": 0.02692, + "test_loss": 8.377299313354492, + "test_acc": 0.01, + "lyapunov": 1.636994728956686, + "grad_norm": 0.1869528840778772, + "grad_max_sv": 0.0903508085757494, + "grad_min_sv": 3.6880654496379876e-12, + "grad_condition": 36996850808.571785, + "lr": 2.7811814881259484e-05, + "time_sec": 132.38520789146423 + }, + { + "epoch": 135, + "train_loss": 4.418914005279541, + "train_acc": 0.02742, + "test_loss": 6.906009614562988, + "test_acc": 0.01, + "lyapunov": 1.6363926659459653, + "grad_norm": 0.18668160978325551, + "grad_max_sv": 0.08737325388938189, + "grad_min_sv": 4.087354528458948e-12, + "grad_condition": 36144831519.89355, + "lr": 2.4471741852423218e-05, + "time_sec": 132.16233372688293 + }, + { + "epoch": 136, + "train_loss": 4.418727052154541, + "train_acc": 0.02834, + "test_loss": 6.848020628356934, + "test_acc": 0.01, + "lyapunov": 1.637757837924811, + "grad_norm": 0.185957498259351, + "grad_max_sv": 0.08990161214023829, + "grad_min_sv": 2.5635452047007446e-12, + "grad_condition": 36608541775.97405, + "lr": 2.1340251233966362e-05, + "time_sec": 132.16730999946594 + }, + { + "epoch": 137, + "train_loss": 4.417813260803222, + "train_acc": 0.02786, + "test_loss": 6.513410632324219, + "test_acc": 0.01, + "lyapunov": 1.6581665283578741, + "grad_norm": 0.18752054423192302, + "grad_max_sv": 0.0908197382465005, + "grad_min_sv": 4.3158261947546074e-12, + "grad_condition": 34752028067.51683, + "lr": 1.8418716601170932e-05, + "time_sec": 132.1503939628601 + }, + { + "epoch": 138, + "train_loss": 4.418873815612793, + "train_acc": 0.02748, + "test_loss": 8.087532058715821, + "test_acc": 0.01, + "lyapunov": 1.6522157362964758, + "grad_norm": 0.1866907350713941, + "grad_max_sv": 0.09033620022237301, + "grad_min_sv": 3.213381299999981e-12, + "grad_condition": 35778325534.10133, + "lr": 1.570841943568445e-05, + "time_sec": 132.1567280292511 + }, + { + "epoch": 139, + "train_loss": 4.4161333633422855, + "train_acc": 0.0276, + "test_loss": 8.191026416015625, + "test_acc": 0.01, + "lyapunov": 1.6455879296793048, + "grad_norm": 0.18557542490300608, + "grad_max_sv": 0.0889211179688573, + "grad_min_sv": 3.4593583989002204e-12, + "grad_condition": 31832374202.184643, + "lr": 1.3210548563419845e-05, + "time_sec": 132.19401907920837 + }, + { + "epoch": 140, + "train_loss": 4.418262011413574, + "train_acc": 0.02782, + "test_loss": 6.895318252563476, + "test_acc": 0.01, + "lyapunov": 1.6439879275953677, + "grad_norm": 0.18789652999107584, + "grad_max_sv": 0.09223881866782904, + "grad_min_sv": 3.672034370543509e-12, + "grad_condition": 40996113464.226456, + "lr": 1.0926199633097203e-05, + "time_sec": 132.21073389053345 + }, + { + "epoch": 141, + "train_loss": 4.419678017578125, + "train_acc": 0.02784, + "test_loss": 7.980368154907227, + "test_acc": 0.01, + "lyapunov": 1.645956871454673, + "grad_norm": 0.21175718737651955, + "grad_max_sv": 0.08853729460388422, + "grad_min_sv": 2.6680971420802367e-12, + "grad_condition": 35434715047.637245, + "lr": 8.856374635655688e-06, + "time_sec": 132.18874335289001 + }, + { + "epoch": 142, + "train_loss": 4.419177203826904, + "train_acc": 0.02822, + "test_loss": 8.440240577697754, + "test_acc": 0.01, + "lyapunov": 1.6426525015355375, + "grad_norm": 0.21316019440493214, + "grad_max_sv": 0.09124803766608239, + "grad_min_sv": 3.1175798344336993e-12, + "grad_condition": 37708867557.074486, + "lr": 7.001981464747503e-06, + "time_sec": 132.1491301059723 + }, + { + "epoch": 143, + "train_loss": 4.417434323425293, + "train_acc": 0.0287, + "test_loss": 8.240262408447265, + "test_acc": 0.01, + "lyapunov": 1.6469836302120666, + "grad_norm": 0.23784439046283262, + "grad_max_sv": 0.08761858381393735, + "grad_min_sv": 2.8977386848827147e-12, + "grad_condition": 31187653416.850555, + "lr": 5.3638335185058295e-06, + "time_sec": 132.19097757339478 + }, + { + "epoch": 144, + "train_loss": 4.4156618258666995, + "train_acc": 0.02716, + "test_loss": 7.953450819396973, + "test_acc": 0.01, + "lyapunov": 1.6425745645752343, + "grad_norm": 0.2132245435585326, + "grad_max_sv": 0.09185097869485617, + "grad_min_sv": 3.537113060367509e-12, + "grad_condition": 32291439470.48501, + "lr": 3.942649342761114e-06, + "time_sec": 132.152756690979 + }, + { + "epoch": 145, + "train_loss": 4.41735453491211, + "train_acc": 0.0271, + "test_loss": 7.392109161376953, + "test_acc": 0.01, + "lyapunov": 1.6465119641760122, + "grad_norm": 0.23771171614973002, + "grad_max_sv": 0.08877957258382163, + "grad_min_sv": 3.662623052098543e-12, + "grad_condition": 31444571536.71527, + "lr": 2.7390523158633524e-06, + "time_sec": 132.1491425037384 + }, + { + "epoch": 146, + "train_loss": 4.415992105712891, + "train_acc": 0.02742, + "test_loss": 6.790036075592041, + "test_acc": 0.01, + "lyapunov": 1.644826771962978, + "grad_norm": 0.21400476621867578, + "grad_max_sv": 0.08692030832172612, + "grad_min_sv": 3.319846017557227e-12, + "grad_condition": 29566198204.48894, + "lr": 1.7535703752478133e-06, + "time_sec": 132.18849802017212 + }, + { + "epoch": 147, + "train_loss": 4.416711021881103, + "train_acc": 0.02778, + "test_loss": 7.807013403320313, + "test_acc": 0.01, + "lyapunov": 1.6477658370571673, + "grad_norm": 0.21346132066680912, + "grad_max_sv": 0.08974210694432258, + "grad_min_sv": 5.421937878324293e-12, + "grad_condition": 29100830389.359028, + "lr": 9.866357858642196e-07, + "time_sec": 132.17349576950073 + }, + { + "epoch": 148, + "train_loss": 4.41632912033081, + "train_acc": 0.02642, + "test_loss": 8.702448477172851, + "test_acc": 0.01, + "lyapunov": 1.6435345963139059, + "grad_norm": 0.18869590013180013, + "grad_max_sv": 0.09069793857634068, + "grad_min_sv": 4.757087619330392e-12, + "grad_condition": 28639879790.87664, + "lr": 4.38584950570808e-07, + "time_sec": 132.17170405387878 + }, + { + "epoch": 149, + "train_loss": 4.416911704406738, + "train_acc": 0.02792, + "test_loss": 8.205855052185058, + "test_acc": 0.01, + "lyapunov": 1.644007340416579, + "grad_norm": 0.18838710040912585, + "grad_max_sv": 0.09058569818735122, + "grad_min_sv": 3.918862079919358e-12, + "grad_condition": 32422642045.613342, + "lr": 1.096582625772501e-07, + "time_sec": 132.21703672409058 + }, + { + "epoch": 150, + "train_loss": 4.41457652420044, + "train_acc": 0.02912, + "test_loss": 6.916353001403809, + "test_acc": 0.01, + "lyapunov": 1.6468722286736568, + "grad_norm": 0.2136131575554095, + "grad_max_sv": 0.09045024197548628, + "grad_min_sv": 2.8993581546385765e-12, + "grad_condition": 37658621623.085915, + "lr": 0.0, + "time_sec": 132.163569688797 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 5.0571779737854, + "train_acc": 0.0167, + "test_loss": 4.827515266418457, + "test_acc": 0.0103, + "lyapunov": 2.5426446635399937, + "grad_norm": 5.177109420411488, + "grad_max_sv": 4.456318712234497, + "grad_min_sv": 8.815798068217972e-08, + "grad_condition": 71118350.91380733, + "lr": 0.0009998903417374227, + "time_sec": 177.42072987556458 + }, + { + "epoch": 2, + "train_loss": 4.794301163787842, + "train_acc": 0.01928, + "test_loss": 4.913976379394532, + "test_acc": 0.0098, + "lyapunov": 2.146181991033237, + "grad_norm": 3.8113808421044735, + "grad_max_sv": 3.2804768919944762, + "grad_min_sv": 6.144172830513383e-08, + "grad_condition": 124696669.38204697, + "lr": 0.0009995614150494292, + "time_sec": 177.39710330963135 + }, + { + "epoch": 3, + "train_loss": 4.714878952331543, + "train_acc": 0.02056, + "test_loss": 4.878452481079101, + "test_acc": 0.01, + "lyapunov": 2.031570847382021, + "grad_norm": 3.2388790745039397, + "grad_max_sv": 2.687403079867363, + "grad_min_sv": 4.841258302024087e-08, + "grad_condition": 67027882.134094395, + "lr": 0.0009990133642141358, + "time_sec": 177.59884071350098 + }, + { + "epoch": 4, + "train_loss": 4.614759566802978, + "train_acc": 0.02084, + "test_loss": 4.775185641479492, + "test_acc": 0.01, + "lyapunov": 2.0082532993667876, + "grad_norm": 2.31316695814439, + "grad_max_sv": 1.8651121258735657, + "grad_min_sv": 3.571143663352871e-08, + "grad_condition": 204953264.94047222, + "lr": 0.0009982464296247522, + "time_sec": 177.37947058677673 + }, + { + "epoch": 5, + "train_loss": 4.589800308074951, + "train_acc": 0.02068, + "test_loss": 4.687682948303222, + "test_acc": 0.01, + "lyapunov": 1.938017784482073, + "grad_norm": 1.9987537203533734, + "grad_max_sv": 1.574848594448015, + "grad_min_sv": 2.9562581094213007e-08, + "grad_condition": 52112524.45563479, + "lr": 0.0009972609476841367, + "time_sec": 177.36336994171143 + }, + { + "epoch": 6, + "train_loss": 4.652974959869384, + "train_acc": 0.01726, + "test_loss": 4.774779940032959, + "test_acc": 0.01, + "lyapunov": 1.9519087929859795, + "grad_norm": 2.9045684670979504, + "grad_max_sv": 1.4192959418629243, + "grad_min_sv": 2.5302831723207163e-08, + "grad_condition": 131080187.01219621, + "lr": 0.000996057350657239, + "time_sec": 177.5318386554718 + }, + { + "epoch": 7, + "train_loss": 4.625725547790528, + "train_acc": 0.01736, + "test_loss": 4.689012890625, + "test_acc": 0.01, + "lyapunov": 1.9375105041372196, + "grad_norm": 1.5277710541195855, + "grad_max_sv": 1.2430943816900253, + "grad_min_sv": 2.3127187931404337e-08, + "grad_condition": 59132800.22834401, + "lr": 0.000994636166481494, + "time_sec": 177.40680027008057 + }, + { + "epoch": 8, + "train_loss": 4.59545005279541, + "train_acc": 0.0184, + "test_loss": 4.622309016418457, + "test_acc": 0.01, + "lyapunov": 1.90919562312953, + "grad_norm": 1.1571484961155014, + "grad_max_sv": 0.9085995584726334, + "grad_min_sv": 1.753208326293887e-08, + "grad_condition": 63281521.14917536, + "lr": 0.0009929980185352525, + "time_sec": 177.37006545066833 + }, + { + "epoch": 9, + "train_loss": 4.573944561767578, + "train_acc": 0.01842, + "test_loss": 4.613925296020508, + "test_acc": 0.01, + "lyapunov": 1.8943235874176025, + "grad_norm": 0.8555279904880331, + "grad_max_sv": 0.640322944521904, + "grad_min_sv": 1.2160011294420903e-08, + "grad_condition": 472846876.7219082, + "lr": 0.0009911436253643444, + "time_sec": 177.3669729232788 + }, + { + "epoch": 10, + "train_loss": 4.557105533752441, + "train_acc": 0.01916, + "test_loss": 4.630582081604004, + "test_acc": 0.01, + "lyapunov": 1.8911274043495392, + "grad_norm": 0.6003404196903899, + "grad_max_sv": 0.40814377516508105, + "grad_min_sv": 7.962132173022773e-09, + "grad_condition": 409893898.93701446, + "lr": 0.0009890738003669028, + "time_sec": 177.38054275512695 + }, + { + "epoch": 11, + "train_loss": 4.5531344345092775, + "train_acc": 0.01868, + "test_loss": 4.641956332397461, + "test_acc": 0.01, + "lyapunov": 1.8781378772252662, + "grad_norm": 0.5034026990569981, + "grad_max_sv": 0.3208323583006859, + "grad_min_sv": 6.321780935542032e-09, + "grad_condition": 82621551.93098283, + "lr": 0.00098678945143658, + "time_sec": 177.42141723632812 + }, + { + "epoch": 12, + "train_loss": 4.547563322296143, + "train_acc": 0.01892, + "test_loss": 4.729993551635742, + "test_acc": 0.01, + "lyapunov": 1.8725779699852398, + "grad_norm": 0.4483811990593719, + "grad_max_sv": 0.2632142174988985, + "grad_min_sv": 5.238542990018691e-09, + "grad_condition": 95216592.46384116, + "lr": 0.0009842915805643154, + "time_sec": 177.37878227233887 + }, + { + "epoch": 13, + "train_loss": 4.5486574642944335, + "train_acc": 0.01906, + "test_loss": 4.699863485717773, + "test_acc": 0.01, + "lyapunov": 1.8532407667935658, + "grad_norm": 0.39800720402294987, + "grad_max_sv": 0.22830541394650936, + "grad_min_sv": 4.325602678822982e-09, + "grad_condition": 62768951.54790844, + "lr": 0.000981581283398829, + "time_sec": 177.41713428497314 + }, + { + "epoch": 14, + "train_loss": 4.5485781225585935, + "train_acc": 0.01988, + "test_loss": 4.687981828308105, + "test_acc": 0.01, + "lyapunov": 1.847328654640471, + "grad_norm": 0.3599420829816771, + "grad_max_sv": 0.20616305619478226, + "grad_min_sv": 3.66715160494426e-09, + "grad_condition": 1685364735.2603889, + "lr": 0.0009786597487660333, + "time_sec": 177.4442057609558 + }, + { + "epoch": 15, + "train_loss": 4.5476718295288086, + "train_acc": 0.01874, + "test_loss": 4.701715921020508, + "test_acc": 0.01, + "lyapunov": 1.8475938474430758, + "grad_norm": 0.33386250842414883, + "grad_max_sv": 0.1797737404704094, + "grad_min_sv": 2.714262508024881e-09, + "grad_condition": 585609298.807006, + "lr": 0.0009755282581475766, + "time_sec": 177.42870712280273 + }, + { + "epoch": 16, + "train_loss": 4.548249047546387, + "train_acc": 0.0189, + "test_loss": 4.644176796722412, + "test_acc": 0.01, + "lyapunov": 1.8449231233743146, + "grad_norm": 0.32722540388947124, + "grad_max_sv": 0.179276442527771, + "grad_min_sv": 1.834452784208601e-09, + "grad_condition": 645613430.8556594, + "lr": 0.0009721881851187403, + "time_sec": 177.38376188278198 + }, + { + "epoch": 17, + "train_loss": 4.550977543945312, + "train_acc": 0.01832, + "test_loss": 4.657319927978516, + "test_acc": 0.01, + "lyapunov": 1.849775262805812, + "grad_norm": 0.33594781658650263, + "grad_max_sv": 0.18930808678269387, + "grad_min_sv": 1.4419275515460163e-09, + "grad_condition": 4245912877.7031355, + "lr": 0.0009686409947459456, + "time_sec": 177.45769500732422 + }, + { + "epoch": 18, + "train_loss": 4.547336664581299, + "train_acc": 0.01872, + "test_loss": 4.824257318115234, + "test_acc": 0.01, + "lyapunov": 1.8506155117698337, + "grad_norm": 0.3186463239410211, + "grad_max_sv": 0.17492111679166555, + "grad_min_sv": 7.962825707957659e-10, + "grad_condition": 9665444897.108833, + "lr": 0.0009648882429441254, + "time_sec": 177.42497754096985 + }, + { + "epoch": 19, + "train_loss": 4.546553368988037, + "train_acc": 0.01988, + "test_loss": 4.634449420166016, + "test_acc": 0.01, + "lyapunov": 1.8629403315541688, + "grad_norm": 0.3141817916987218, + "grad_max_sv": 0.16888962239027022, + "grad_min_sv": 3.100283911986281e-10, + "grad_condition": 12395580054.184483, + "lr": 0.00096093157579425, + "time_sec": 177.42066621780396 + }, + { + "epoch": 20, + "train_loss": 4.547896039733887, + "train_acc": 0.01812, + "test_loss": 4.648453699493408, + "test_acc": 0.01, + "lyapunov": 1.8530689130353806, + "grad_norm": 0.28037051032867333, + "grad_max_sv": 0.14884913954883813, + "grad_min_sv": 4.734970479464422e-11, + "grad_condition": 18706013342.103394, + "lr": 0.0009567727288213001, + "time_sec": 177.42734503746033 + }, + { + "epoch": 21, + "train_loss": 4.553228437805176, + "train_acc": 0.01954, + "test_loss": 4.630985579681396, + "test_acc": 0.01, + "lyapunov": 1.8692577284620242, + "grad_norm": 0.27792900087884953, + "grad_max_sv": 0.1554839551448822, + "grad_min_sv": 4.666823285874219e-10, + "grad_condition": 10008180168.250607, + "lr": 0.0009524135262330095, + "time_sec": 177.4381377696991 + }, + { + "epoch": 22, + "train_loss": 4.543763105773926, + "train_acc": 0.01912, + "test_loss": 4.765555903625488, + "test_acc": 0.01, + "lyapunov": 1.9279104334009274, + "grad_norm": 0.34897259806693026, + "grad_max_sv": 0.19015887528657913, + "grad_min_sv": 9.161465612835251e-10, + "grad_condition": 31310287662.675404, + "lr": 0.0009478558801197061, + "time_sec": 177.40688180923462 + }, + { + "epoch": 23, + "train_loss": 4.545391994476319, + "train_acc": 0.01994, + "test_loss": 4.95503201751709, + "test_acc": 0.01, + "lyapunov": 1.8897823964238472, + "grad_norm": 0.27635093198837796, + "grad_max_sv": 0.15679910629987717, + "grad_min_sv": 1.1278384804314264e-11, + "grad_condition": 32001206389.390984, + "lr": 0.000943101789615607, + "time_sec": 177.41873931884766 + }, + { + "epoch": 24, + "train_loss": 4.537924372406006, + "train_acc": 0.0205, + "test_loss": 4.933882556152343, + "test_acc": 0.01, + "lyapunov": 1.8677331318940653, + "grad_norm": 0.2629499333333197, + "grad_max_sv": 0.1345283007249236, + "grad_min_sv": 1.752183104503964e-11, + "grad_condition": 25761086750.586906, + "lr": 0.0009381533400219313, + "time_sec": 177.39337539672852 + }, + { + "epoch": 25, + "train_loss": 4.5395216925048825, + "train_acc": 0.01982, + "test_loss": 4.7553122573852535, + "test_acc": 0.01, + "lyapunov": 1.892893662233182, + "grad_norm": 0.2494252365663538, + "grad_max_sv": 0.13098876383155583, + "grad_min_sv": 1.1539255091408414e-11, + "grad_condition": 30731634106.521202, + "lr": 0.0009330127018922189, + "time_sec": 177.424161195755 + }, + { + "epoch": 26, + "train_loss": 4.542462890625, + "train_acc": 0.01866, + "test_loss": 4.6617726119995115, + "test_acc": 0.01, + "lyapunov": 1.9029778931146997, + "grad_norm": 0.2418496821532437, + "grad_max_sv": 0.12933116126805544, + "grad_min_sv": 9.016501046764554e-12, + "grad_condition": 32681444533.636635, + "lr": 0.000927682130080253, + "time_sec": 177.39467239379883 + }, + { + "epoch": 27, + "train_loss": 4.546353931274414, + "train_acc": 0.01994, + "test_loss": 4.629417378997803, + "test_acc": 0.01, + "lyapunov": 1.9228146170716152, + "grad_norm": 0.22440941486234903, + "grad_max_sv": 0.11987878885120154, + "grad_min_sv": 3.394249909837516e-12, + "grad_condition": 44184424949.13588, + "lr": 0.0009221639627510072, + "time_sec": 177.37777948379517 + }, + { + "epoch": 28, + "train_loss": 4.5504691630554195, + "train_acc": 0.01782, + "test_loss": 4.6430878219604494, + "test_acc": 0.01, + "lyapunov": 1.9203921748549126, + "grad_norm": 0.21316860601896545, + "grad_max_sv": 0.11068132277578116, + "grad_min_sv": 4.163510696961453e-12, + "grad_condition": 34578779717.74602, + "lr": 0.0009164606203550494, + "time_sec": 177.41506218910217 + }, + { + "epoch": 29, + "train_loss": 4.553192196807862, + "train_acc": 0.01922, + "test_loss": 4.620924549865722, + "test_acc": 0.01, + "lyapunov": 1.9486115564165822, + "grad_norm": 0.21532419740547218, + "grad_max_sv": 0.11121681984513998, + "grad_min_sv": 2.174767523116755e-12, + "grad_condition": 58590467046.06332, + "lr": 0.0009105746045668516, + "time_sec": 177.46036434173584 + }, + { + "epoch": 30, + "train_loss": 4.577628551177979, + "train_acc": 0.01554, + "test_loss": 4.931937181854248, + "test_acc": 0.01, + "lyapunov": 2.03825170487699, + "grad_norm": 0.3192255588212213, + "grad_max_sv": 0.10931874038651586, + "grad_min_sv": 1.0787309123520735e-12, + "grad_condition": 67436360062.25419, + "lr": 0.0009045084971874733, + "time_sec": 177.45620775222778 + }, + { + "epoch": 31, + "train_loss": 4.562947151641846, + "train_acc": 0.01402, + "test_loss": 4.855396501159668, + "test_acc": 0.01, + "lyapunov": 1.9520337072479756, + "grad_norm": 0.24947493243538413, + "grad_max_sv": 0.14996777512133122, + "grad_min_sv": 2.8222605364129484e-13, + "grad_condition": 123865525225.74072, + "lr": 0.0008982649590120977, + "time_sec": 177.510662317276 + }, + { + "epoch": 32, + "train_loss": 4.565983801574707, + "train_acc": 0.01418, + "test_loss": 4.638044543457031, + "test_acc": 0.01, + "lyapunov": 1.9589825380793617, + "grad_norm": 0.21745675305184037, + "grad_max_sv": 0.15418258607387542, + "grad_min_sv": 1.8288951448041711e-13, + "grad_condition": 135201632895.44336, + "lr": 0.0008918467286629196, + "time_sec": 225.82675528526306 + }, + { + "epoch": 33, + "train_loss": 4.574427026519776, + "train_acc": 0.01298, + "test_loss": 4.7455434860229495, + "test_acc": 0.01, + "lyapunov": 2.0786097866799826, + "grad_norm": 0.3011912270329583, + "grad_max_sv": 0.1479480130597949, + "grad_min_sv": 4.040295423662463e-14, + "grad_condition": 143547262648.40558, + "lr": 0.0008852566213878943, + "time_sec": 212.4946165084839 + }, + { + "epoch": 34, + "train_loss": 4.598861814422607, + "train_acc": 0.0115, + "test_loss": 4.605647972869873, + "test_acc": 0.01, + "lyapunov": 2.040311818537505, + "grad_norm": 0.6761833343202188, + "grad_max_sv": 0.11083788472460583, + "grad_min_sv": 4.110164680606927e-11, + "grad_condition": 99834085699.46811, + "lr": 0.000878497527825878, + "time_sec": 177.3635172843933 + }, + { + "epoch": 35, + "train_loss": 4.5978329862976075, + "train_acc": 0.0123, + "test_loss": 4.612800787353516, + "test_acc": 0.01, + "lyapunov": 1.964153668459724, + "grad_norm": 0.17049612065492592, + "grad_max_sv": 0.12097362177446484, + "grad_min_sv": 3.637372272135023e-13, + "grad_condition": 115726872832.26929, + "lr": 0.000871572412738697, + "time_sec": 177.3725883960724 + }, + { + "epoch": 36, + "train_loss": 4.590414097595215, + "train_acc": 0.01364, + "test_loss": 4.613982511901855, + "test_acc": 0.0106, + "lyapunov": 1.940161881849284, + "grad_norm": 0.17661965085230752, + "grad_max_sv": 0.12085543926805258, + "grad_min_sv": 1.7141639479141907e-14, + "grad_condition": 118832574895.3577, + "lr": 0.0008644843137107055, + "time_sec": 177.36169910430908 + }, + { + "epoch": 37, + "train_loss": 4.603200916442871, + "train_acc": 0.01144, + "test_loss": 4.682376429748535, + "test_acc": 0.0099, + "lyapunov": 1.912264422077657, + "grad_norm": 0.19292967799281205, + "grad_max_sv": 0.11742573268711567, + "grad_min_sv": 2.57803301802478e-13, + "grad_condition": 107518420442.89116, + "lr": 0.0008572363398164014, + "time_sec": 177.35389232635498 + }, + { + "epoch": 38, + "train_loss": 4.60353625869751, + "train_acc": 0.01232, + "test_loss": 4.6085469467163085, + "test_acc": 0.0117, + "lyapunov": 1.8644801216662084, + "grad_norm": 0.16293184045510936, + "grad_max_sv": 0.10393068259581924, + "grad_min_sv": 1.7559085685112726e-13, + "grad_condition": 90992351147.92781, + "lr": 0.0008498316702566826, + "time_sec": 177.3858036994934 + }, + { + "epoch": 39, + "train_loss": 4.600621211242676, + "train_acc": 0.0113, + "test_loss": 4.628137604522705, + "test_acc": 0.0059, + "lyapunov": 1.854224362336766, + "grad_norm": 0.14764433538203306, + "grad_max_sv": 0.09894248126074671, + "grad_min_sv": 1.89273452355483e-14, + "grad_condition": 96895515749.60886, + "lr": 0.0008422735529643442, + "time_sec": 177.37866950035095 + }, + { + "epoch": 40, + "train_loss": 4.5831811744689945, + "train_acc": 0.01556, + "test_loss": 4.6161288673400875, + "test_acc": 0.0075, + "lyapunov": 1.8447816320087598, + "grad_norm": 0.16789998934338032, + "grad_max_sv": 0.09656790103763342, + "grad_min_sv": 4.938935938182056e-14, + "grad_condition": 92410869013.77493, + "lr": 0.0008345653031794289, + "time_sec": 177.36352348327637 + }, + { + "epoch": 41, + "train_loss": 4.576951338043213, + "train_acc": 0.01544, + "test_loss": 4.626422532653809, + "test_acc": 0.0059, + "lyapunov": 1.8409895357268546, + "grad_norm": 0.16650132931853925, + "grad_max_sv": 0.09661551136523486, + "grad_min_sv": 5.5311883046546714e-14, + "grad_condition": 91973842148.10474, + "lr": 0.0008267103019950526, + "time_sec": 177.44510340690613 + }, + { + "epoch": 42, + "train_loss": 4.596107442321777, + "train_acc": 0.01286, + "test_loss": 4.609375232696533, + "test_acc": 0.0103, + "lyapunov": 1.867913676039947, + "grad_norm": 0.32255950644628917, + "grad_max_sv": 0.10478700120002031, + "grad_min_sv": 7.395428917744707e-14, + "grad_condition": 99110681649.70932, + "lr": 0.0008187119948743447, + "time_sec": 177.37195253372192 + }, + { + "epoch": 43, + "train_loss": 4.576052311859131, + "train_acc": 0.01216, + "test_loss": 4.605898602294922, + "test_acc": 0.01, + "lyapunov": 1.8121510469700064, + "grad_norm": 0.1682335228453255, + "grad_max_sv": 0.13096272256225347, + "grad_min_sv": 2.325299366018125e-38, + "grad_condition": 130962722562.25346, + "lr": 0.000810573890139155, + "time_sec": 177.3363115787506 + }, + { + "epoch": 44, + "train_loss": 4.575016804962158, + "train_acc": 0.01204, + "test_loss": 4.6531572357177735, + "test_acc": 0.01, + "lyapunov": 1.844909136557518, + "grad_norm": 0.16339088520861647, + "grad_max_sv": 0.12486125733703375, + "grad_min_sv": 7.854270886048278e-41, + "grad_condition": 124861257337.03374, + "lr": 0.0008022995574311873, + "time_sec": 177.3388659954071 + }, + { + "epoch": 45, + "train_loss": 4.571797399902343, + "train_acc": 0.01312, + "test_loss": 4.6326898643493655, + "test_acc": 0.01, + "lyapunov": 1.7807648858755751, + "grad_norm": 0.1583001371978669, + "grad_max_sv": 0.11400312408804894, + "grad_min_sv": 2.0150044461101764e-34, + "grad_condition": 114003124088.04892, + "lr": 0.0007938926261462363, + "time_sec": 177.2870581150055 + }, + { + "epoch": 46, + "train_loss": 4.571164744415284, + "train_acc": 0.01216, + "test_loss": 4.7157730285644535, + "test_acc": 0.0055, + "lyapunov": 1.770619028364606, + "grad_norm": 0.155372177767644, + "grad_max_sv": 0.11489532180130482, + "grad_min_sv": 4.586223596317033e-32, + "grad_condition": 114895321801.30481, + "lr": 0.0007853567838422158, + "time_sec": 177.31609582901 + }, + { + "epoch": 47, + "train_loss": 4.573118797912597, + "train_acc": 0.0127, + "test_loss": 4.652663481140137, + "test_acc": 0.0083, + "lyapunov": 1.755919989112698, + "grad_norm": 0.15694602621142137, + "grad_max_sv": 0.10912387128919362, + "grad_min_sv": 1.082265400009604e-33, + "grad_condition": 109123871289.19363, + "lr": 0.0007766957746216719, + "time_sec": 177.30992484092712 + }, + { + "epoch": 48, + "train_loss": 4.571219747619629, + "train_acc": 0.01276, + "test_loss": 4.659695971679687, + "test_acc": 0.01, + "lyapunov": 1.7550827587961846, + "grad_norm": 0.15287442171405372, + "grad_max_sv": 0.10996787585318088, + "grad_min_sv": 4.670549970125493e-34, + "grad_condition": 109967875853.18088, + "lr": 0.0007679133974894982, + "time_sec": 177.28727316856384 + }, + { + "epoch": 49, + "train_loss": 4.569807028045655, + "train_acc": 0.01218, + "test_loss": 4.636177100372315, + "test_acc": 0.0106, + "lyapunov": 1.7690098404579455, + "grad_norm": 0.18153616207574144, + "grad_max_sv": 0.11563525255769491, + "grad_min_sv": 5.486901725583568e-31, + "grad_condition": 115635252557.6949, + "lr": 0.000759013504686565, + "time_sec": 177.29954981803894 + }, + { + "epoch": 50, + "train_loss": 4.570931665344238, + "train_acc": 0.0121, + "test_loss": 4.6071569503784175, + "test_acc": 0.01, + "lyapunov": 1.807037060218089, + "grad_norm": 0.15845522676178395, + "grad_max_sv": 0.11082600858062505, + "grad_min_sv": 3.3545771830237645e-27, + "grad_condition": 110826008580.62471, + "lr": 0.0007499999999999998, + "time_sec": 177.3009307384491 + }, + { + "epoch": 51, + "train_loss": 4.56821715423584, + "train_acc": 0.01356, + "test_loss": 4.607294733428955, + "test_acc": 0.01, + "lyapunov": 1.7960190611422215, + "grad_norm": 0.15291941879574358, + "grad_max_sv": 0.1085304556414485, + "grad_min_sv": 5.234550087037553e-32, + "grad_condition": 108530455641.44849, + "lr": 0.0007408768370508575, + "time_sec": 177.30324840545654 + }, + { + "epoch": 52, + "train_loss": 4.5681144180297855, + "train_acc": 0.01254, + "test_loss": 4.7746817504882815, + "test_acc": 0.01, + "lyapunov": 1.8113833918900746, + "grad_norm": 0.1551325385716633, + "grad_max_sv": 0.10723174829035997, + "grad_min_sv": 1.156681276768738e-32, + "grad_condition": 107231748290.35995, + "lr": 0.0007316480175599307, + "time_sec": 177.29757356643677 + }, + { + "epoch": 53, + "train_loss": 4.5682883798217775, + "train_acc": 0.01308, + "test_loss": 4.607502725982666, + "test_acc": 0.01, + "lyapunov": 1.797081575064403, + "grad_norm": 0.15424179509635785, + "grad_max_sv": 0.11033043321222066, + "grad_min_sv": 5.555574632007681e-26, + "grad_condition": 110330433212.21455, + "lr": 0.0007223175895924635, + "time_sec": 177.38000464439392 + }, + { + "epoch": 54, + "train_loss": 4.567883385925293, + "train_acc": 0.01308, + "test_loss": 4.6075471481323245, + "test_acc": 0.01, + "lyapunov": 1.795134693155508, + "grad_norm": 0.1479095088192472, + "grad_max_sv": 0.09978982489556074, + "grad_min_sv": 3.0716585923057893e-27, + "grad_condition": 99789824895.56044, + "lr": 0.0007128896457825361, + "time_sec": 177.3199532032013 + }, + { + "epoch": 55, + "train_loss": 4.567380355072022, + "train_acc": 0.0132, + "test_loss": 4.913865223693848, + "test_acc": 0.0071, + "lyapunov": 1.800114458784118, + "grad_norm": 0.15088025535341454, + "grad_max_sv": 0.10508234314620495, + "grad_min_sv": 1.1828436654684573e-20, + "grad_condition": 105082341975.71126, + "lr": 0.0007033683215378998, + "time_sec": 177.33242273330688 + }, + { + "epoch": 56, + "train_loss": 4.568105935058594, + "train_acc": 0.01288, + "test_loss": 4.9639324310302735, + "test_acc": 0.01, + "lyapunov": 1.791341680395024, + "grad_norm": 0.14880666313188015, + "grad_max_sv": 0.10149468388408422, + "grad_min_sv": 3.988422583995241e-33, + "grad_condition": 101494683884.08423, + "lr": 0.0006937577932260512, + "time_sec": 177.3845407962799 + }, + { + "epoch": 57, + "train_loss": 4.5689506640625, + "train_acc": 0.01226, + "test_loss": 5.048221938323975, + "test_acc": 0.01, + "lyapunov": 1.7925406188306297, + "grad_norm": 0.14694104547076697, + "grad_max_sv": 0.1024689320474863, + "grad_min_sv": 4.175795156156322e-27, + "grad_condition": 102468932047.48581, + "lr": 0.0006840622763423388, + "time_sec": 177.35671710968018 + }, + { + "epoch": 58, + "train_loss": 4.567952045135498, + "train_acc": 0.01224, + "test_loss": 4.918060597991944, + "test_acc": 0.01, + "lyapunov": 1.7935436262803919, + "grad_norm": 0.1442604888179717, + "grad_max_sv": 0.0956211369484663, + "grad_min_sv": 8.965700522898849e-35, + "grad_condition": 95621136948.46631, + "lr": 0.0006742860236609073, + "time_sec": 177.30539679527283 + }, + { + "epoch": 59, + "train_loss": 4.567556964111328, + "train_acc": 0.01166, + "test_loss": 4.784052313995361, + "test_acc": 0.01, + "lyapunov": 1.792896061297268, + "grad_norm": 0.14339216567625596, + "grad_max_sv": 0.0998681552708149, + "grad_min_sv": 1.6267929360545776e-33, + "grad_condition": 99868155270.8149, + "lr": 0.0006644333233692913, + "time_sec": 177.3021900653839 + }, + { + "epoch": 60, + "train_loss": 4.566637614135742, + "train_acc": 0.01302, + "test_loss": 4.939413081359863, + "test_acc": 0.0089, + "lyapunov": 1.800732863223766, + "grad_norm": 0.14639646943889295, + "grad_max_sv": 0.1006914485245943, + "grad_min_sv": 2.587203260121448e-28, + "grad_condition": 100691448524.59428, + "lr": 0.0006545084971874734, + "time_sec": 177.3246009349823 + }, + { + "epoch": 61, + "train_loss": 4.5677985464477535, + "train_acc": 0.01204, + "test_loss": 4.689374994659424, + "test_acc": 0.01, + "lyapunov": 1.7923528779193263, + "grad_norm": 0.146856512803808, + "grad_max_sv": 0.10027224402874708, + "grad_min_sv": 3.265638135928119e-34, + "grad_condition": 100272244028.74707, + "lr": 0.0006445158984722354, + "time_sec": 177.3465657234192 + }, + { + "epoch": 62, + "train_loss": 4.568169707183838, + "train_acc": 0.01322, + "test_loss": 4.92401081085205, + "test_acc": 0.01, + "lyapunov": 1.793337759764298, + "grad_norm": 0.14830246569432107, + "grad_max_sv": 0.10649488009512424, + "grad_min_sv": 3.947983458120654e-34, + "grad_condition": 106494880095.12425, + "lr": 0.0006344599103076324, + "time_sec": 177.33594274520874 + }, + { + "epoch": 63, + "train_loss": 4.601692415466308, + "train_acc": 0.01128, + "test_loss": 4.622838488769531, + "test_acc": 0.0093, + "lyapunov": 1.8888863468414072, + "grad_norm": 2.097389221606069, + "grad_max_sv": 0.07372891843697289, + "grad_min_sv": 5.8291273285268636e-15, + "grad_condition": 73088343924.37703, + "lr": 0.0006243449435824269, + "time_sec": 177.34169101715088 + }, + { + "epoch": 64, + "train_loss": 4.564995886535645, + "train_acc": 0.0142, + "test_loss": 4.609309208679199, + "test_acc": 0.01, + "lyapunov": 1.8677834397386712, + "grad_norm": 0.16075228694903138, + "grad_max_sv": 0.10515890400856734, + "grad_min_sv": 1.3911072942013711e-14, + "grad_condition": 104125866183.20358, + "lr": 0.0006141754350553275, + "time_sec": 177.36707615852356 + }, + { + "epoch": 65, + "train_loss": 4.570636109161377, + "train_acc": 0.01426, + "test_loss": 4.607698435211182, + "test_acc": 0.01, + "lyapunov": 1.8525302056461344, + "grad_norm": 0.15426152152539457, + "grad_max_sv": 0.09303022520616651, + "grad_min_sv": 6.8773627432224e-15, + "grad_condition": 92279415120.89612, + "lr": 0.0006039558454088793, + "time_sec": 177.31724667549133 + }, + { + "epoch": 66, + "train_loss": 4.599106399993897, + "train_acc": 0.01154, + "test_loss": 4.633498463439941, + "test_acc": 0.01, + "lyapunov": 1.8344569968445528, + "grad_norm": 0.9455828211740803, + "grad_max_sv": 0.07013371546672716, + "grad_min_sv": 1.507808105341429e-14, + "grad_condition": 68152625137.74638, + "lr": 0.000593690657292862, + "time_sec": 177.32066535949707 + }, + { + "epoch": 67, + "train_loss": 4.580814336547852, + "train_acc": 0.01532, + "test_loss": 4.626534017944336, + "test_acc": 0.01, + "lyapunov": 1.8290482561301697, + "grad_norm": 0.19517115706214946, + "grad_max_sv": 0.12490405924618245, + "grad_min_sv": 1.9444856202991992e-14, + "grad_condition": 122467391557.71028, + "lr": 0.0005833843733580507, + "time_sec": 177.35997676849365 + }, + { + "epoch": 68, + "train_loss": 4.5921751937866215, + "train_acc": 0.01364, + "test_loss": 4.638207249450684, + "test_acc": 0.01, + "lyapunov": 1.8349919072197527, + "grad_norm": 0.460492968119845, + "grad_max_sv": 0.10702236535289558, + "grad_min_sv": 2.2123450599644305e-13, + "grad_condition": 95625261975.70398, + "lr": 0.0005730415142812054, + "time_sec": 177.36813497543335 + }, + { + "epoch": 69, + "train_loss": 4.5961358061218265, + "train_acc": 0.01298, + "test_loss": 4.607077551269532, + "test_acc": 0.01, + "lyapunov": 1.8598975065114247, + "grad_norm": 2.546438567786095, + "grad_max_sv": 0.07785456163189224, + "grad_min_sv": 6.18159561539687e-13, + "grad_condition": 53349256888.33342, + "lr": 0.0005626666167821517, + "time_sec": 177.58047890663147 + }, + { + "epoch": 70, + "train_loss": 4.584916583099365, + "train_acc": 0.0129, + "test_loss": 4.605791180419922, + "test_acc": 0.01, + "lyapunov": 2.063964778809901, + "grad_norm": 1.1269952121140787, + "grad_max_sv": 0.13612028946643875, + "grad_min_sv": 9.475902483685454e-16, + "grad_condition": 135984520961.8097, + "lr": 0.0005522642316338265, + "time_sec": 177.3025302886963 + }, + { + "epoch": 71, + "train_loss": 4.5657632319641115, + "train_acc": 0.015, + "test_loss": 4.6077304992675785, + "test_acc": 0.01, + "lyapunov": 2.048694342908347, + "grad_norm": 0.19880801120613076, + "grad_max_sv": 0.162659665197134, + "grad_min_sv": 9.790377361004964e-35, + "grad_condition": 162659665197.134, + "lr": 0.0005418389216661573, + "time_sec": 177.31212949752808 + }, + { + "epoch": 72, + "train_loss": 4.565562518768311, + "train_acc": 0.0147, + "test_loss": 4.6131870063781735, + "test_acc": 0.01, + "lyapunov": 2.0358364441815544, + "grad_norm": 0.17659979704367984, + "grad_max_sv": 0.1367532407864928, + "grad_min_sv": 1.0813565460063155e-35, + "grad_condition": 136753240786.49283, + "lr": 0.0005313952597646563, + "time_sec": 177.30756258964539 + }, + { + "epoch": 73, + "train_loss": 4.5637111499023435, + "train_acc": 0.01468, + "test_loss": 4.662373492431641, + "test_acc": 0.01, + "lyapunov": 2.0378534354822104, + "grad_norm": 0.16730731102883323, + "grad_max_sv": 0.1271504819393158, + "grad_min_sv": 8.141531004288703e-19, + "grad_condition": 127150364914.09229, + "lr": 0.0005209378268645994, + "time_sec": 177.32029056549072 + }, + { + "epoch": 74, + "train_loss": 4.565951173248291, + "train_acc": 0.0149, + "test_loss": 5.167428440093994, + "test_acc": 0.01, + "lyapunov": 2.034459155233925, + "grad_norm": 0.1598356266166805, + "grad_max_sv": 0.11188621651381254, + "grad_min_sv": 7.956263056308037e-17, + "grad_condition": 111877428680.18631, + "lr": 0.0005104712099416781, + "time_sec": 177.3263282775879 + }, + { + "epoch": 75, + "train_loss": 4.554299867095947, + "train_acc": 0.0148, + "test_loss": 4.670576226043702, + "test_acc": 0.01, + "lyapunov": 2.0256418004974988, + "grad_norm": 0.6425048437317492, + "grad_max_sv": 0.11874032808700577, + "grad_min_sv": 9.53469126201266e-28, + "grad_condition": 118740328087.00566, + "lr": 0.0004999999999999996, + "time_sec": 177.33032536506653 + }, + { + "epoch": 76, + "train_loss": 4.544258031005859, + "train_acc": 0.01582, + "test_loss": 4.7919898590087895, + "test_acc": 0.01, + "lyapunov": 1.9940624051081859, + "grad_norm": 0.18376329495268384, + "grad_max_sv": 0.12770626787096262, + "grad_min_sv": 1.5320719029212827e-14, + "grad_condition": 125850928802.59525, + "lr": 0.0004895287900583212, + "time_sec": 177.3431053161621 + }, + { + "epoch": 77, + "train_loss": 4.53702930557251, + "train_acc": 0.01814, + "test_loss": 5.09228942565918, + "test_acc": 0.01, + "lyapunov": 2.004529595070178, + "grad_norm": 0.23332342855727387, + "grad_max_sv": 0.11955075059086084, + "grad_min_sv": 3.3454590497014467e-14, + "grad_condition": 115784635862.96426, + "lr": 0.0004790621731353997, + "time_sec": 177.3438844680786 + }, + { + "epoch": 78, + "train_loss": 4.534572752380371, + "train_acc": 0.01882, + "test_loss": 4.832008946228028, + "test_acc": 0.01, + "lyapunov": 2.0158191958961584, + "grad_norm": 0.1920573866361736, + "grad_max_sv": 0.1183493785560131, + "grad_min_sv": 4.1988661863109933e-14, + "grad_condition": 113783080933.4834, + "lr": 0.000468604740235343, + "time_sec": 177.35729384422302 + }, + { + "epoch": 79, + "train_loss": 4.529569886932373, + "train_acc": 0.01952, + "test_loss": 5.048179293823242, + "test_acc": 0.01, + "lyapunov": 2.015618150496422, + "grad_norm": 0.1967256476510768, + "grad_max_sv": 0.11198066771030427, + "grad_min_sv": 4.758873523897381e-14, + "grad_condition": 107147740579.17552, + "lr": 0.00045816107833384175, + "time_sec": 177.3638677597046 + }, + { + "epoch": 80, + "train_loss": 4.524784006042481, + "train_acc": 0.02006, + "test_loss": 5.219789337158203, + "test_acc": 0.01, + "lyapunov": 2.054618088790523, + "grad_norm": 0.1882303336778061, + "grad_max_sv": 0.11063385736197233, + "grad_min_sv": 7.36556254526723e-14, + "grad_condition": 103919529913.31416, + "lr": 0.0004477357683661729, + "time_sec": 177.3434329032898 + }, + { + "epoch": 81, + "train_loss": 4.513287781219482, + "train_acc": 0.02046, + "test_loss": 5.4127315925598145, + "test_acc": 0.01, + "lyapunov": 2.0582806338434634, + "grad_norm": 0.2031727105378663, + "grad_max_sv": 0.11583145018666982, + "grad_min_sv": 7.805375957945844e-14, + "grad_condition": 107587810958.66092, + "lr": 0.00043733338321784746, + "time_sec": 177.3602488040924 + }, + { + "epoch": 82, + "train_loss": 4.552439326629639, + "train_acc": 0.01516, + "test_loss": 5.182042855834961, + "test_acc": 0.01, + "lyapunov": 2.0503602448631737, + "grad_norm": 0.17073610088297192, + "grad_max_sv": 0.09705250952392816, + "grad_min_sv": 3.4896408906750006e-14, + "grad_condition": 93852286781.79861, + "lr": 0.0004269584857187939, + "time_sec": 177.36704516410828 + }, + { + "epoch": 83, + "train_loss": 4.540618519439697, + "train_acc": 0.01836, + "test_loss": 4.887316487121582, + "test_acc": 0.01, + "lyapunov": 2.036365619096, + "grad_norm": 0.178925255596835, + "grad_max_sv": 0.09582959767431021, + "grad_min_sv": 6.999946611445171e-14, + "grad_condition": 90352299888.03552, + "lr": 0.0004166156266419484, + "time_sec": 177.42960810661316 + }, + { + "epoch": 84, + "train_loss": 4.5301704800415035, + "train_acc": 0.0202, + "test_loss": 4.911700419616699, + "test_acc": 0.01, + "lyapunov": 2.0310050584471133, + "grad_norm": 0.21956147144261412, + "grad_max_sv": 0.10685321651399135, + "grad_min_sv": 1.6599147474968171e-13, + "grad_condition": 95120504962.38972, + "lr": 0.0004063093427071373, + "time_sec": 177.41741013526917 + }, + { + "epoch": 85, + "train_loss": 4.521631349945069, + "train_acc": 0.02046, + "test_loss": 4.9735999771118165, + "test_acc": 0.01, + "lyapunov": 2.0944621767229434, + "grad_norm": 0.20639357879920123, + "grad_max_sv": 0.1097319820895791, + "grad_min_sv": 3.0481061771537406e-13, + "grad_condition": 89595141799.5074, + "lr": 0.0003960441545911199, + "time_sec": 177.35863280296326 + }, + { + "epoch": 86, + "train_loss": 4.515884091491699, + "train_acc": 0.0226, + "test_loss": 5.020805032348632, + "test_acc": 0.01, + "lyapunov": 2.1580070205356763, + "grad_norm": 0.2171400925836118, + "grad_max_sv": 0.10496667213737965, + "grad_min_sv": 2.3929384956391853e-13, + "grad_condition": 88693595920.06924, + "lr": 0.0003858245649446718, + "time_sec": 177.35719203948975 + }, + { + "epoch": 87, + "train_loss": 4.508240751953125, + "train_acc": 0.02188, + "test_loss": 5.056581590270996, + "test_acc": 0.01, + "lyapunov": 2.179570354159226, + "grad_norm": 0.2117802030762919, + "grad_max_sv": 0.11064628288149833, + "grad_min_sv": 5.629122443043941e-13, + "grad_condition": 82119787484.41371, + "lr": 0.00037565505641757235, + "time_sec": 177.43662810325623 + }, + { + "epoch": 88, + "train_loss": 4.602668369903564, + "train_acc": 0.01458, + "test_loss": 4.645070762634277, + "test_acc": 0.01, + "lyapunov": 2.2725740960796776, + "grad_norm": 0.2810721756625388, + "grad_max_sv": 0.13397499950602879, + "grad_min_sv": 2.3262272314478417e-13, + "grad_condition": 122835138094.28622, + "lr": 0.00036554008969236695, + "time_sec": 177.45580291748047 + }, + { + "epoch": 89, + "train_loss": 4.593976813964844, + "train_acc": 0.01338, + "test_loss": 4.794082858276367, + "test_acc": 0.01, + "lyapunov": 2.147210692200819, + "grad_norm": 0.759058846561603, + "grad_max_sv": 0.1211125890877156, + "grad_min_sv": 2.0899380256263837e-14, + "grad_condition": 118616769495.28653, + "lr": 0.0003554841015277638, + "time_sec": 177.35196542739868 + }, + { + "epoch": 90, + "train_loss": 4.546598121643067, + "train_acc": 0.01692, + "test_loss": 5.085714856719971, + "test_acc": 0.01, + "lyapunov": 1.959295385633893, + "grad_norm": 0.18801319046748138, + "grad_max_sv": 0.12013570107519626, + "grad_min_sv": 1.556443286149524e-13, + "grad_condition": 105681804007.33401, + "lr": 0.000345491502812526, + "time_sec": 177.3326654434204 + }, + { + "epoch": 91, + "train_loss": 4.52639261138916, + "train_acc": 0.02024, + "test_loss": 5.4292246536254885, + "test_acc": 0.01, + "lyapunov": 1.9528833008788127, + "grad_norm": 0.19744289771043935, + "grad_max_sv": 0.11147539932280778, + "grad_min_sv": 1.6081849520359716e-13, + "grad_condition": 97964228191.25418, + "lr": 0.0003355666766307081, + "time_sec": 177.3534951210022 + }, + { + "epoch": 92, + "train_loss": 4.517257850189209, + "train_acc": 0.02166, + "test_loss": 5.752269718933105, + "test_acc": 0.01, + "lyapunov": 1.942441391518049, + "grad_norm": 0.20327679889782116, + "grad_max_sv": 0.10881670657545328, + "grad_min_sv": 2.8148071332918877e-13, + "grad_condition": 88241447588.50455, + "lr": 0.00032571397633909225, + "time_sec": 177.31370544433594 + }, + { + "epoch": 93, + "train_loss": 4.51958215789795, + "train_acc": 0.02058, + "test_loss": 6.215483041381836, + "test_acc": 0.01, + "lyapunov": 1.9454329702860254, + "grad_norm": 0.20233841637212174, + "grad_max_sv": 0.10735675729811192, + "grad_min_sv": 5.437789853487922e-13, + "grad_condition": 80677948091.06416, + "lr": 0.00031593772365766094, + "time_sec": 177.35208916664124 + }, + { + "epoch": 94, + "train_loss": 4.527246778869629, + "train_acc": 0.01882, + "test_loss": 6.593671340942382, + "test_acc": 0.01, + "lyapunov": 1.9411613587528238, + "grad_norm": 0.19160068088300194, + "grad_max_sv": 0.10174073036760092, + "grad_min_sv": 2.793891541001816e-13, + "grad_condition": 85085942332.55312, + "lr": 0.0003062422067739483, + "time_sec": 177.32164216041565 + }, + { + "epoch": 95, + "train_loss": 4.522369806365967, + "train_acc": 0.02012, + "test_loss": 7.235169104003906, + "test_acc": 0.01, + "lyapunov": 1.9293771396817454, + "grad_norm": 0.18883083291584565, + "grad_max_sv": 0.09721812345087529, + "grad_min_sv": 6.229525809297941e-13, + "grad_condition": 70200603277.04945, + "lr": 0.00029663167846209965, + "time_sec": 177.37938117980957 + }, + { + "epoch": 96, + "train_loss": 4.515466445007324, + "train_acc": 0.02094, + "test_loss": 6.755592398834229, + "test_acc": 0.01, + "lyapunov": 1.9193610050489225, + "grad_norm": 0.19450416199611387, + "grad_max_sv": 0.09956333581358194, + "grad_min_sv": 9.974038708528621e-13, + "grad_condition": 65838294277.60075, + "lr": 0.00028711035421746345, + "time_sec": 177.39440894126892 + }, + { + "epoch": 97, + "train_loss": 4.5159863470458985, + "train_acc": 0.02106, + "test_loss": 6.925238887023926, + "test_acc": 0.01, + "lyapunov": 1.9178373036177263, + "grad_norm": 0.19020558899728204, + "grad_max_sv": 0.09718397427350282, + "grad_min_sv": 7.581572850683028e-13, + "grad_condition": 66877963121.29408, + "lr": 0.00027768241040753615, + "time_sec": 177.3824520111084 + }, + { + "epoch": 98, + "train_loss": 4.521075716247559, + "train_acc": 0.02202, + "test_loss": 8.121050939941407, + "test_acc": 0.01, + "lyapunov": 1.9147872854681576, + "grad_norm": 0.1934243158960077, + "grad_max_sv": 0.10121007524430752, + "grad_min_sv": 8.450979273160665e-13, + "grad_condition": 68354558422.48958, + "lr": 0.00026835198244006903, + "time_sec": 177.35862588882446 + }, + { + "epoch": 99, + "train_loss": 4.522917724304199, + "train_acc": 0.01976, + "test_loss": 7.095849452972412, + "test_acc": 0.01, + "lyapunov": 1.8851848322412241, + "grad_norm": 0.18661608851957018, + "grad_max_sv": 0.09974390026181937, + "grad_min_sv": 2.3609410447217e-13, + "grad_condition": 85270551657.5321, + "lr": 0.0002591231629491421, + "time_sec": 177.40244436264038 + }, + { + "epoch": 100, + "train_loss": 4.519071618957519, + "train_acc": 0.02182, + "test_loss": 7.258035105895996, + "test_acc": 0.01, + "lyapunov": 1.8870434898244755, + "grad_norm": 0.18955381594835574, + "grad_max_sv": 0.10142176356166602, + "grad_min_sv": 4.18530860082457e-13, + "grad_condition": 81448255883.87708, + "lr": 0.0002499999999999997, + "time_sec": 177.34263491630554 + }, + { + "epoch": 101, + "train_loss": 4.517442984466553, + "train_acc": 0.021, + "test_loss": 7.576486515808106, + "test_acc": 0.01, + "lyapunov": 1.8868652429727033, + "grad_norm": 0.19157320547777273, + "grad_max_sv": 0.10139708835631608, + "grad_min_sv": 5.327901829573975e-13, + "grad_condition": 82743365215.91306, + "lr": 0.00024098649531343477, + "time_sec": 177.37268996238708 + }, + { + "epoch": 102, + "train_loss": 4.516081234130859, + "train_acc": 0.02092, + "test_loss": 7.540461968994141, + "test_acc": 0.01, + "lyapunov": 1.886926714111777, + "grad_norm": 0.19361816812032298, + "grad_max_sv": 0.10115151274949312, + "grad_min_sv": 7.893692691836129e-13, + "grad_condition": 67614807097.32371, + "lr": 0.0002320866025105016, + "time_sec": 177.4215235710144 + }, + { + "epoch": 103, + "train_loss": 4.51589251953125, + "train_acc": 0.02184, + "test_loss": 6.735574526977539, + "test_acc": 0.01, + "lyapunov": 1.8953558365097436, + "grad_norm": 0.18905125681480797, + "grad_max_sv": 0.0964373467490077, + "grad_min_sv": 6.672119305288094e-13, + "grad_condition": 67264211388.955826, + "lr": 0.0002233042253783278, + "time_sec": 177.44301295280457 + }, + { + "epoch": 104, + "train_loss": 4.510274680633545, + "train_acc": 0.02228, + "test_loss": 6.947120163726806, + "test_acc": 0.01, + "lyapunov": 1.8925634592085543, + "grad_norm": 0.19050377836817628, + "grad_max_sv": 0.10047796424478292, + "grad_min_sv": 6.43513976450922e-13, + "grad_condition": 72543317845.92526, + "lr": 0.000214643216157784, + "time_sec": 177.43615889549255 + }, + { + "epoch": 105, + "train_loss": 4.507045760345459, + "train_acc": 0.02344, + "test_loss": 6.44128829498291, + "test_acc": 0.01, + "lyapunov": 1.8931523140738993, + "grad_norm": 0.1941896672080212, + "grad_max_sv": 0.10169495549052954, + "grad_min_sv": 1.197506250216646e-12, + "grad_condition": 57976645954.3195, + "lr": 0.00020610737385376332, + "time_sec": 177.3762686252594 + }, + { + "epoch": 106, + "train_loss": 4.50908245300293, + "train_acc": 0.02272, + "test_loss": 6.410396545410157, + "test_acc": 0.01, + "lyapunov": 1.891097482512979, + "grad_norm": 0.19224977770583887, + "grad_max_sv": 0.09774007555097342, + "grad_min_sv": 1.6075280263693056e-12, + "grad_condition": 51460468274.59027, + "lr": 0.00019770044256881242, + "time_sec": 177.36651515960693 + }, + { + "epoch": 107, + "train_loss": 4.5151639590454105, + "train_acc": 0.02132, + "test_loss": 6.411097073364258, + "test_acc": 0.01, + "lyapunov": 1.8785841452801013, + "grad_norm": 0.18870212425613683, + "grad_max_sv": 0.09599546585232019, + "grad_min_sv": 9.996112506671593e-13, + "grad_condition": 60403834048.275345, + "lr": 0.0001894261098608447, + "time_sec": 177.41180038452148 + }, + { + "epoch": 108, + "train_loss": 4.512421267089843, + "train_acc": 0.02116, + "test_loss": 6.5682136413574215, + "test_acc": 0.01, + "lyapunov": 1.874200306889956, + "grad_norm": 0.18878498506944777, + "grad_max_sv": 0.09599304348230361, + "grad_min_sv": 5.58528019253264e-13, + "grad_condition": 70564017992.73062, + "lr": 0.000181288005125655, + "time_sec": 177.57528257369995 + }, + { + "epoch": 109, + "train_loss": 4.513136726989746, + "train_acc": 0.02048, + "test_loss": 6.481448352813721, + "test_acc": 0.01, + "lyapunov": 1.8818576552373978, + "grad_norm": 0.1848350031636926, + "grad_max_sv": 0.09705327395349742, + "grad_min_sv": 6.54183362728495e-13, + "grad_condition": 64781627362.86159, + "lr": 0.0001732896980049473, + "time_sec": 177.35780382156372 + }, + { + "epoch": 110, + "train_loss": 4.524208149719239, + "train_acc": 0.01906, + "test_loss": 6.643166270446778, + "test_acc": 0.01, + "lyapunov": 1.8807388602010429, + "grad_norm": 0.1785425192947475, + "grad_max_sv": 0.09457366839051247, + "grad_min_sv": 4.767008084434052e-13, + "grad_condition": 72129851609.04678, + "lr": 0.00016543469682057076, + "time_sec": 177.36579298973083 + }, + { + "epoch": 111, + "train_loss": 4.53040064529419, + "train_acc": 0.01832, + "test_loss": 8.910856002807618, + "test_acc": 0.01, + "lyapunov": 1.8765558891589074, + "grad_norm": 0.17026394073665702, + "grad_max_sv": 0.08836164027452469, + "grad_min_sv": 5.85781253685973e-13, + "grad_condition": 67943464027.98218, + "lr": 0.00015772644703565552, + "time_sec": 177.34918975830078 + }, + { + "epoch": 112, + "train_loss": 4.545937302246093, + "train_acc": 0.01522, + "test_loss": 6.681547387695312, + "test_acc": 0.01, + "lyapunov": 1.8712620235160184, + "grad_norm": 0.14905345779494544, + "grad_max_sv": 0.0828567205928266, + "grad_min_sv": 4.8920962306457093e-14, + "grad_condition": 79387022595.5743, + "lr": 0.00015016832974331713, + "time_sec": 177.32487964630127 + }, + { + "epoch": 113, + "train_loss": 4.547554450683593, + "train_acc": 0.0151, + "test_loss": 6.779077651977539, + "test_acc": 0.01, + "lyapunov": 1.8724847394792015, + "grad_norm": 0.14631715030660067, + "grad_max_sv": 0.08086532177403569, + "grad_min_sv": 5.074463102689055e-14, + "grad_condition": 77175005196.30495, + "lr": 0.00014276366018359834, + "time_sec": 177.30155324935913 + }, + { + "epoch": 114, + "train_loss": 4.5489697427368165, + "train_acc": 0.01486, + "test_loss": 6.522304327392578, + "test_acc": 0.01, + "lyapunov": 1.8717568207274922, + "grad_norm": 0.14324923492777344, + "grad_max_sv": 0.08171637607738376, + "grad_min_sv": 1.3242329414875363e-14, + "grad_condition": 80721246516.98701, + "lr": 0.00013551568628929425, + "time_sec": 177.28179287910461 + }, + { + "epoch": 115, + "train_loss": 4.5471634547424316, + "train_acc": 0.01502, + "test_loss": 7.095610357666016, + "test_acc": 0.01, + "lyapunov": 1.8744507893881834, + "grad_norm": 0.14485837543714783, + "grad_max_sv": 0.08132082503288984, + "grad_min_sv": 1.81078836536911e-14, + "grad_condition": 79919868204.71088, + "lr": 0.00012842758726130276, + "time_sec": 177.33235454559326 + }, + { + "epoch": 116, + "train_loss": 4.548014427185058, + "train_acc": 0.01534, + "test_loss": 6.714404089355469, + "test_acc": 0.01, + "lyapunov": 1.8738381951056478, + "grad_norm": 0.1417318979444601, + "grad_max_sv": 0.08069097753614188, + "grad_min_sv": 2.1261185647335962e-14, + "grad_condition": 79080599236.9338, + "lr": 0.0001215024721741218, + "time_sec": 177.3581359386444 + }, + { + "epoch": 117, + "train_loss": 4.5475594778442385, + "train_acc": 0.0162, + "test_loss": 7.012126634216308, + "test_acc": 0.01, + "lyapunov": 1.8802398299926992, + "grad_norm": 0.14427127432715559, + "grad_max_sv": 0.07751598162576556, + "grad_min_sv": 2.5871283722113393e-14, + "grad_condition": 75660417804.99104, + "lr": 0.00011474337861210538, + "time_sec": 177.34602308273315 + }, + { + "epoch": 118, + "train_loss": 4.547483818054199, + "train_acc": 0.01608, + "test_loss": 6.870603955078125, + "test_acc": 0.01, + "lyapunov": 1.880126509215216, + "grad_norm": 0.14323919878529856, + "grad_max_sv": 0.08231749897822738, + "grad_min_sv": 2.5404315299191894e-14, + "grad_condition": 80539374605.35417, + "lr": 0.00010815327133708009, + "time_sec": 177.37712860107422 + }, + { + "epoch": 119, + "train_loss": 4.534606270751953, + "train_acc": 0.01762, + "test_loss": 6.911497918701172, + "test_acc": 0.01, + "lyapunov": 1.88580509128473, + "grad_norm": 0.1554868932808185, + "grad_max_sv": 0.08145476067438721, + "grad_min_sv": 1.1376842374815623e-13, + "grad_condition": 74485842851.95381, + "lr": 0.00010173504098790182, + "time_sec": 177.39225101470947 + }, + { + "epoch": 120, + "train_loss": 4.53310412185669, + "train_acc": 0.01794, + "test_loss": 6.387413667297364, + "test_acc": 0.01, + "lyapunov": 1.8892596264934296, + "grad_norm": 0.15631372022176057, + "grad_max_sv": 0.08103838972747326, + "grad_min_sv": 9.497261372236228e-14, + "grad_condition": 74695089213.60704, + "lr": 9.549150281252629e-05, + "time_sec": 177.4245948791504 + }, + { + "epoch": 121, + "train_loss": 4.534973322906494, + "train_acc": 0.01776, + "test_loss": 7.1422959945678715, + "test_acc": 0.01, + "lyapunov": 1.881148859972844, + "grad_norm": 0.15666055516425273, + "grad_max_sv": 0.0814055297523737, + "grad_min_sv": 5.697649748368235e-14, + "grad_condition": 77327196032.91525, + "lr": 8.942539543314794e-05, + "time_sec": 177.39071822166443 + }, + { + "epoch": 122, + "train_loss": 4.5416329475402835, + "train_acc": 0.01768, + "test_loss": 7.760357019042969, + "test_acc": 0.01, + "lyapunov": 1.8941616911412504, + "grad_norm": 0.15303806595082975, + "grad_max_sv": 0.08280573170632125, + "grad_min_sv": 7.190334186608317e-14, + "grad_condition": 77551212396.10873, + "lr": 8.353937964495024e-05, + "time_sec": 177.39379000663757 + }, + { + "epoch": 123, + "train_loss": 4.532209703369141, + "train_acc": 0.0188, + "test_loss": 7.213145608520508, + "test_acc": 0.01, + "lyapunov": 1.8783490920005856, + "grad_norm": 0.1570128750865918, + "grad_max_sv": 0.07976588718593121, + "grad_min_sv": 5.378207270335454e-14, + "grad_condition": 75947991946.02742, + "lr": 7.783603724899243e-05, + "time_sec": 177.3858504295349 + }, + { + "epoch": 124, + "train_loss": 4.532452094421386, + "train_acc": 0.01822, + "test_loss": 8.867930480957032, + "test_acc": 0.01, + "lyapunov": 1.8961719725747852, + "grad_norm": 0.1565922966382055, + "grad_max_sv": 0.08160738497972489, + "grad_min_sv": 1.0257821202629168e-13, + "grad_condition": 75250370482.7287, + "lr": 7.231786991974666e-05, + "time_sec": 177.35063314437866 + }, + { + "epoch": 125, + "train_loss": 4.543888686676025, + "train_acc": 0.0169, + "test_loss": 9.472554348754883, + "test_acc": 0.01, + "lyapunov": 1.9082237808295832, + "grad_norm": 0.1517076219008134, + "grad_max_sv": 0.08182584447786212, + "grad_min_sv": 5.187792751512962e-14, + "grad_condition": 78115492846.74008, + "lr": 6.698729810778072e-05, + "time_sec": 177.37032294273376 + }, + { + "epoch": 126, + "train_loss": 4.547970936279297, + "train_acc": 0.01554, + "test_loss": 9.686561820983886, + "test_acc": 0.01, + "lyapunov": 1.913945980693983, + "grad_norm": 0.14499806750062244, + "grad_max_sv": 0.07566633233800531, + "grad_min_sv": 3.1772195777593184e-14, + "grad_condition": 73493387748.77896, + "lr": 6.184665997806817e-05, + "time_sec": 177.35547280311584 + }, + { + "epoch": 127, + "train_loss": 4.546605653076172, + "train_acc": 0.01548, + "test_loss": 10.238512472534179, + "test_acc": 0.01, + "lyapunov": 1.9275426837184546, + "grad_norm": 0.14554790749081933, + "grad_max_sv": 0.07929007997736334, + "grad_min_sv": 3.9511653602873453e-14, + "grad_condition": 76467572800.43704, + "lr": 5.6898210384392595e-05, + "time_sec": 177.30883407592773 + }, + { + "epoch": 128, + "train_loss": 4.548374371185303, + "train_acc": 0.01518, + "test_loss": 7.331470336914062, + "test_acc": 0.01, + "lyapunov": 1.917976202257454, + "grad_norm": 0.14194847208901806, + "grad_max_sv": 0.07561489585787058, + "grad_min_sv": 3.018860197535905e-14, + "grad_condition": 73686654080.81082, + "lr": 5.214411988029363e-05, + "time_sec": 177.29406332969666 + }, + { + "epoch": 129, + "train_loss": 4.552641819152832, + "train_acc": 0.01424, + "test_loss": 10.299223823547363, + "test_acc": 0.01, + "lyapunov": 1.8986562542293384, + "grad_norm": 0.14097964129344484, + "grad_max_sv": 0.07945991829037666, + "grad_min_sv": 3.098126402642908e-14, + "grad_condition": 77295952152.37424, + "lr": 4.7586473766990294e-05, + "time_sec": 177.30149126052856 + }, + { + "epoch": 130, + "train_loss": 4.558454217224121, + "train_acc": 0.01442, + "test_loss": 9.414859741210938, + "test_acc": 0.01, + "lyapunov": 1.8917262898686598, + "grad_norm": 0.13750644159550615, + "grad_max_sv": 0.07227576579898595, + "grad_min_sv": 1.4186463557681784e-14, + "grad_condition": 71301232315.57674, + "lr": 4.32272711786996e-05, + "time_sec": 177.28755593299866 + }, + { + "epoch": 131, + "train_loss": 4.555461906433106, + "train_acc": 0.01466, + "test_loss": 12.041324650573731, + "test_acc": 0.01, + "lyapunov": 1.8987445102628235, + "grad_norm": 0.13757460865371804, + "grad_max_sv": 0.07397228116169571, + "grad_min_sv": 2.319644706817993e-14, + "grad_condition": 72489319776.39827, + "lr": 3.906842420574966e-05, + "time_sec": 177.29019808769226 + }, + { + "epoch": 132, + "train_loss": 4.554803800964356, + "train_acc": 0.01564, + "test_loss": 11.094451065063476, + "test_acc": 0.01, + "lyapunov": 1.8878093031056398, + "grad_norm": 0.13783764545536042, + "grad_max_sv": 0.07386947749182582, + "grad_min_sv": 1.6515898138230524e-14, + "grad_condition": 72754577205.38591, + "lr": 3.5111757055874305e-05, + "time_sec": 177.31085658073425 + }, + { + "epoch": 133, + "train_loss": 4.550925143280029, + "train_acc": 0.01498, + "test_loss": 9.74743147277832, + "test_acc": 0.01, + "lyapunov": 1.878229211663346, + "grad_norm": 0.13768130602715348, + "grad_max_sv": 0.06898155501112342, + "grad_min_sv": 1.0546519595933137e-14, + "grad_condition": 68298184996.095604, + "lr": 3.1359005254054254e-05, + "time_sec": 177.30499482154846 + }, + { + "epoch": 134, + "train_loss": 4.553356967468262, + "train_acc": 0.0149, + "test_loss": 11.778760961914063, + "test_acc": 0.01, + "lyapunov": 1.8766485382528866, + "grad_norm": 0.13736454806799486, + "grad_max_sv": 0.070872993580997, + "grad_min_sv": 2.157465270254722e-14, + "grad_condition": 69432477834.60878, + "lr": 2.7811814881259484e-05, + "time_sec": 177.2809820175171 + }, + { + "epoch": 135, + "train_loss": 4.551636660461425, + "train_acc": 0.01592, + "test_loss": 11.783082652282715, + "test_acc": 0.01, + "lyapunov": 1.8882967026337334, + "grad_norm": 0.13717586705825502, + "grad_max_sv": 0.07159899128600955, + "grad_min_sv": 1.2450805578708491e-14, + "grad_condition": 70660590568.42424, + "lr": 2.4471741852423218e-05, + "time_sec": 177.30125308036804 + }, + { + "epoch": 136, + "train_loss": 4.548730396881104, + "train_acc": 0.01516, + "test_loss": 11.388315562438965, + "test_acc": 0.01, + "lyapunov": 1.8989758704934279, + "grad_norm": 0.1379291481732077, + "grad_max_sv": 0.07207101676613092, + "grad_min_sv": 1.5291750620388887e-14, + "grad_condition": 71063065982.77095, + "lr": 2.1340251233966362e-05, + "time_sec": 177.31817770004272 + }, + { + "epoch": 137, + "train_loss": 4.5493795796203615, + "train_acc": 0.0156, + "test_loss": 11.34073727722168, + "test_acc": 0.01, + "lyapunov": 1.8913398648771789, + "grad_norm": 0.13897953191218543, + "grad_max_sv": 0.07152581168338656, + "grad_min_sv": 1.8546912289041328e-14, + "grad_condition": 70226087635.57034, + "lr": 1.8418716601170932e-05, + "time_sec": 177.3131880760193 + }, + { + "epoch": 138, + "train_loss": 4.553489802398682, + "train_acc": 0.01516, + "test_loss": 12.222237545776368, + "test_acc": 0.01, + "lyapunov": 1.8923300303461608, + "grad_norm": 0.1422578907831012, + "grad_max_sv": 0.07421789932996034, + "grad_min_sv": 2.2511905546267236e-14, + "grad_condition": 72655119204.59192, + "lr": 1.570841943568445e-05, + "time_sec": 177.3508095741272 + }, + { + "epoch": 139, + "train_loss": 4.551329365997314, + "train_acc": 0.01604, + "test_loss": 11.567996215820312, + "test_acc": 0.01, + "lyapunov": 1.896789355351187, + "grad_norm": 0.13857216280793205, + "grad_max_sv": 0.0750581487081945, + "grad_min_sv": 2.7187812199729122e-14, + "grad_condition": 73193036998.8267, + "lr": 1.3210548563419845e-05, + "time_sec": 177.3199553489685 + }, + { + "epoch": 140, + "train_loss": 4.551639187316894, + "train_acc": 0.0152, + "test_loss": 10.962099948120118, + "test_acc": 0.01, + "lyapunov": 1.8980579516466927, + "grad_norm": 0.13913098758019468, + "grad_max_sv": 0.07022048626095057, + "grad_min_sv": 1.6254623784336123e-14, + "grad_condition": 69176986727.67476, + "lr": 1.0926199633097203e-05, + "time_sec": 177.31917572021484 + }, + { + "epoch": 141, + "train_loss": 4.551450812072754, + "train_acc": 0.01548, + "test_loss": 11.749597540283203, + "test_acc": 0.01, + "lyapunov": 1.8976749087233677, + "grad_norm": 0.13543146683337492, + "grad_max_sv": 0.07132029384374619, + "grad_min_sv": 1.2937733568789232e-14, + "grad_condition": 70483725874.9921, + "lr": 8.856374635655688e-06, + "time_sec": 177.30270528793335 + }, + { + "epoch": 142, + "train_loss": 4.550458405609131, + "train_acc": 0.01508, + "test_loss": 11.127458859252929, + "test_acc": 0.01, + "lyapunov": 1.8944645882262598, + "grad_norm": 0.13718078797014463, + "grad_max_sv": 0.07173966113477945, + "grad_min_sv": 5.362134975133005e-15, + "grad_condition": 71343601385.1819, + "lr": 7.001981464747503e-06, + "time_sec": 177.33799290657043 + }, + { + "epoch": 143, + "train_loss": 4.549646302642822, + "train_acc": 0.01504, + "test_loss": 9.781423010253906, + "test_acc": 0.01, + "lyapunov": 1.896026461325643, + "grad_norm": 0.13690028772364582, + "grad_max_sv": 0.07180424155667424, + "grad_min_sv": 9.235488076157911e-15, + "grad_condition": 71150894694.0915, + "lr": 5.3638335185058295e-06, + "time_sec": 177.29442596435547 + }, + { + "epoch": 144, + "train_loss": 4.550904609680176, + "train_acc": 0.01478, + "test_loss": 11.654512042236329, + "test_acc": 0.01, + "lyapunov": 1.8981691126323417, + "grad_norm": 0.13847308318144802, + "grad_max_sv": 0.0707651729695499, + "grad_min_sv": 1.0486687491927528e-14, + "grad_condition": 70068302270.75797, + "lr": 3.942649342761114e-06, + "time_sec": 177.31189107894897 + }, + { + "epoch": 145, + "train_loss": 4.549078409271241, + "train_acc": 0.01536, + "test_loss": 10.245002896118164, + "test_acc": 0.01, + "lyapunov": 1.8977412525040414, + "grad_norm": 0.1380191070864239, + "grad_max_sv": 0.07147834841161967, + "grad_min_sv": 2.442390129201921e-14, + "grad_condition": 69865965621.40735, + "lr": 2.7390523158633524e-06, + "time_sec": 177.3547399044037 + }, + { + "epoch": 146, + "train_loss": 4.549764898529053, + "train_acc": 0.0153, + "test_loss": 12.586336196899413, + "test_acc": 0.01, + "lyapunov": 1.9022346853905017, + "grad_norm": 0.1378382427841838, + "grad_max_sv": 0.07094019828364254, + "grad_min_sv": 4.088156870147558e-14, + "grad_condition": 68488698134.9881, + "lr": 1.7535703752478133e-06, + "time_sec": 177.33843970298767 + }, + { + "epoch": 147, + "train_loss": 4.549026966247559, + "train_acc": 0.01498, + "test_loss": 10.552986677551269, + "test_acc": 0.01, + "lyapunov": 1.8973304896098573, + "grad_norm": 0.1383607211573884, + "grad_max_sv": 0.07058861535042524, + "grad_min_sv": 1.1701259109026522e-14, + "grad_condition": 69871097743.06229, + "lr": 9.866357858642196e-07, + "time_sec": 177.30922889709473 + }, + { + "epoch": 148, + "train_loss": 4.548874216003418, + "train_acc": 0.01538, + "test_loss": 13.164787545776367, + "test_acc": 0.01, + "lyapunov": 1.8975342713353578, + "grad_norm": 0.13819467947797637, + "grad_max_sv": 0.07126009510830045, + "grad_min_sv": 1.3301168495645157e-14, + "grad_condition": 70402076766.28023, + "lr": 4.38584950570808e-07, + "time_sec": 177.32940936088562 + }, + { + "epoch": 149, + "train_loss": 4.548271210632325, + "train_acc": 0.01458, + "test_loss": 13.447799993896485, + "test_acc": 0.01, + "lyapunov": 1.8944333886246547, + "grad_norm": 0.13826879828472308, + "grad_max_sv": 0.07108921753242611, + "grad_min_sv": 1.4796796962166793e-14, + "grad_condition": 70104972764.94934, + "lr": 1.096582625772501e-07, + "time_sec": 177.3080608844757 + }, + { + "epoch": 150, + "train_loss": 4.550895355377198, + "train_acc": 0.01514, + "test_loss": 11.285707998657227, + "test_acc": 0.01, + "lyapunov": 1.899481255684972, + "grad_norm": 0.1383326475891396, + "grad_max_sv": 0.07153223417699336, + "grad_min_sv": 1.1750268769105188e-14, + "grad_condition": 70754427782.17505, + "lr": 0.0, + "time_sec": 177.31517815589905 + } + ] + } +}
\ No newline at end of file |
