{ "vanilla": { "4": [ { "epoch": 1, "train_loss": 3.8700216691589358, "train_acc": 0.12266, "test_loss": 3.471041242599487, "test_acc": 0.1892, "lyapunov": null, "grad_norm": 5.871605597993606, "grad_max_sv": 4.127117091417313, "grad_min_sv": 1.0455270382792037e-07, "grad_condition": 49062288.68792993, "lr": 0.0009998903417374227, "time_sec": 16.27198028564453 }, { "epoch": 2, "train_loss": 3.1769318112182616, "train_acc": 0.22848, "test_loss": 3.0822217151641844, "test_acc": 0.2623, "lyapunov": null, "grad_norm": 4.062262644221631, "grad_max_sv": 2.610152545571327, "grad_min_sv": 7.51297792088955e-08, "grad_condition": 5467508398.9579, "lr": 0.0009995614150494292, "time_sec": 15.849408626556396 }, { "epoch": 3, "train_loss": 2.7716760053253173, "train_acc": 0.30112, "test_loss": 2.786010754776001, "test_acc": 0.3025, "lyapunov": null, "grad_norm": 3.306849913177874, "grad_max_sv": 1.982076707482338, "grad_min_sv": 6.276024400175828e-08, "grad_condition": 35650611.42411845, "lr": 0.0009990133642141358, "time_sec": 15.585639715194702 }, { "epoch": 4, "train_loss": 2.52623803855896, "train_acc": 0.34808, "test_loss": 2.753477826690674, "test_acc": 0.31, "lyapunov": null, "grad_norm": 2.9097492182391815, "grad_max_sv": 1.6385449588298797, "grad_min_sv": 5.4328751075694014e-08, "grad_condition": 39318936.04767501, "lr": 0.0009982464296247522, "time_sec": 15.567962408065796 }, { "epoch": 5, "train_loss": 2.336665892715454, "train_acc": 0.38814, "test_loss": 2.762642176055908, "test_acc": 0.3278, "lyapunov": null, "grad_norm": 2.633575942359962, "grad_max_sv": 1.4780948996543883, "grad_min_sv": 4.9716202832339465e-08, "grad_condition": 36374716.14412971, "lr": 0.0009972609476841367, "time_sec": 15.589628219604492 }, { "epoch": 6, "train_loss": 2.1819915383148194, "train_acc": 0.42402, "test_loss": 2.879850026321411, "test_acc": 0.3169, "lyapunov": null, "grad_norm": 2.4016337956595826, "grad_max_sv": 1.2914279341697692, "grad_min_sv": 4.639223961377947e-08, "grad_condition": 67967054.09377375, "lr": 0.000996057350657239, "time_sec": 15.569096803665161 }, { "epoch": 7, "train_loss": 2.051711977081299, "train_acc": 0.45262, "test_loss": 2.3678430866241453, "test_acc": 0.3932, "lyapunov": null, "grad_norm": 2.226191538130221, "grad_max_sv": 1.1724753439426423, "grad_min_sv": 4.296711672013842e-08, "grad_condition": 36498738.129443035, "lr": 0.000994636166481494, "time_sec": 15.596983671188354 }, { "epoch": 8, "train_loss": 1.940541718597412, "train_acc": 0.47698, "test_loss": 2.2571875411987303, "test_acc": 0.4255, "lyapunov": null, "grad_norm": 2.0805351562913987, "grad_max_sv": 1.1051331430673599, "grad_min_sv": 4.002405433189971e-08, "grad_condition": 35597702.92584355, "lr": 0.0009929980185352525, "time_sec": 15.578535795211792 }, { "epoch": 9, "train_loss": 1.8394872580337525, "train_acc": 0.49896, "test_loss": 2.447062807273865, "test_acc": 0.3908, "lyapunov": null, "grad_norm": 1.95549418174433, "grad_max_sv": 0.9836901038885116, "grad_min_sv": 3.7306198631681385e-08, "grad_condition": 62081794.94354477, "lr": 0.0009911436253643444, "time_sec": 15.615386486053467 }, { "epoch": 10, "train_loss": 1.7619124493789673, "train_acc": 0.51634, "test_loss": 2.1738934711456297, "test_acc": 0.4315, "lyapunov": null, "grad_norm": 1.8481164153982472, "grad_max_sv": 0.9101693272590637, "grad_min_sv": 3.497988239065109e-08, "grad_condition": 46371834.68583612, "lr": 0.0009890738003669028, "time_sec": 15.591166496276855 }, { "epoch": 11, "train_loss": 1.6779080270385742, "train_acc": 0.5374, "test_loss": 2.1254464902877808, "test_acc": 0.4554, "lyapunov": null, "grad_norm": 1.761015251152075, "grad_max_sv": 0.8580568209290504, "grad_min_sv": 3.36019686630884e-08, "grad_condition": 43516726.56073545, "lr": 0.00098678945143658, "time_sec": 15.584970235824585 }, { "epoch": 12, "train_loss": 1.6224668700790406, "train_acc": 0.5503, "test_loss": 2.1070931062698364, "test_acc": 0.4572, "lyapunov": null, "grad_norm": 1.6795284434799669, "grad_max_sv": 0.8227274164557457, "grad_min_sv": 3.2408061501065785e-08, "grad_condition": 46743715.81403457, "lr": 0.0009842915805643154, "time_sec": 15.587612390518188 }, { "epoch": 13, "train_loss": 1.5589283563995362, "train_acc": 0.56658, "test_loss": 2.109080162811279, "test_acc": 0.4555, "lyapunov": null, "grad_norm": 1.6107025543208409, "grad_max_sv": 0.7555071026086807, "grad_min_sv": 3.021804662181257e-08, "grad_condition": 771669383.9576478, "lr": 0.000981581283398829, "time_sec": 15.570199012756348 }, { "epoch": 14, "train_loss": 1.5079251358795167, "train_acc": 0.57552, "test_loss": 2.0982689178466796, "test_acc": 0.4612, "lyapunov": null, "grad_norm": 1.5561237300872648, "grad_max_sv": 0.7464557528495789, "grad_min_sv": 2.9360349014517782e-08, "grad_condition": 57384357.84720645, "lr": 0.0009786597487660333, "time_sec": 15.58092999458313 }, { "epoch": 15, "train_loss": 1.4521892065048219, "train_acc": 0.59046, "test_loss": 2.311817477607727, "test_acc": 0.4302, "lyapunov": null, "grad_norm": 1.5030460275712159, "grad_max_sv": 0.6973782196640969, "grad_min_sv": 2.806552138745477e-08, "grad_condition": 50094988.442197144, "lr": 0.0009755282581475766, "time_sec": 15.59303069114685 }, { "epoch": 16, "train_loss": 1.4043401465606689, "train_acc": 0.6018, "test_loss": 1.9470401285171508, "test_acc": 0.4966, "lyapunov": null, "grad_norm": 1.4501603734300015, "grad_max_sv": 0.6692761570215225, "grad_min_sv": 2.707263816043026e-08, "grad_condition": 123937233.96376769, "lr": 0.0009721881851187403, "time_sec": 15.581094026565552 }, { "epoch": 17, "train_loss": 1.3696716709136962, "train_acc": 0.61152, "test_loss": 1.937501217842102, "test_acc": 0.499, "lyapunov": null, "grad_norm": 1.4220829625575298, "grad_max_sv": 0.6630528435111046, "grad_min_sv": 2.6855075777043603e-08, "grad_condition": 85926301.07871899, "lr": 0.0009686409947459456, "time_sec": 15.594961643218994 }, { "epoch": 18, "train_loss": 1.3274028357696532, "train_acc": 0.62202, "test_loss": 2.163087944793701, "test_acc": 0.4562, "lyapunov": null, "grad_norm": 1.3749658522523285, "grad_max_sv": 0.6294455677270889, "grad_min_sv": 2.59231922022235e-08, "grad_condition": 301195911.7425653, "lr": 0.0009648882429441254, "time_sec": 15.60923433303833 }, { "epoch": 19, "train_loss": 1.2825380062484741, "train_acc": 0.63366, "test_loss": 2.012470700645447, "test_acc": 0.4881, "lyapunov": null, "grad_norm": 1.3365974210853477, "grad_max_sv": 0.6173068635165692, "grad_min_sv": 2.522445298643039e-08, "grad_condition": 107736394.99929431, "lr": 0.00096093157579425, "time_sec": 15.59559416770935 }, { "epoch": 20, "train_loss": 1.2454956715774537, "train_acc": 0.63962, "test_loss": 1.862760306930542, "test_acc": 0.5166, "lyapunov": null, "grad_norm": 1.3087654259412098, "grad_max_sv": 0.583590354025364, "grad_min_sv": 2.470869329140868e-08, "grad_condition": 28538129.547009837, "lr": 0.0009567727288213001, "time_sec": 15.578768253326416 }, { "epoch": 21, "train_loss": 1.2203223657226563, "train_acc": 0.64712, "test_loss": 1.8641546312332153, "test_acc": 0.5193, "lyapunov": null, "grad_norm": 1.2837238048732729, "grad_max_sv": 0.5924517832696438, "grad_min_sv": 2.4348954538039312e-08, "grad_condition": 93781869.91679552, "lr": 0.0009524135262330095, "time_sec": 15.614121198654175 }, { "epoch": 22, "train_loss": 1.1865811985397339, "train_acc": 0.65476, "test_loss": 2.0345648471832276, "test_acc": 0.4893, "lyapunov": null, "grad_norm": 1.2512260920694542, "grad_max_sv": 0.5759196959435939, "grad_min_sv": 2.384011341116654e-08, "grad_condition": 30288258.368695997, "lr": 0.0009478558801197061, "time_sec": 15.612670183181763 }, { "epoch": 23, "train_loss": 1.1597199523544313, "train_acc": 0.66328, "test_loss": 1.7475012817382813, "test_acc": 0.5456, "lyapunov": null, "grad_norm": 1.22099214296503, "grad_max_sv": 0.550060736387968, "grad_min_sv": 2.259520101161039e-08, "grad_condition": 44796813.002676345, "lr": 0.000943101789615607, "time_sec": 15.634280920028687 }, { "epoch": 24, "train_loss": 1.1278974151992798, "train_acc": 0.67306, "test_loss": 1.9481268964767455, "test_acc": 0.5126, "lyapunov": null, "grad_norm": 1.204438554486539, "grad_max_sv": 0.5349243931472302, "grad_min_sv": 2.225912898324439e-08, "grad_condition": 183220898.93468145, "lr": 0.0009381533400219313, "time_sec": 15.649690389633179 }, { "epoch": 25, "train_loss": 1.096091796951294, "train_acc": 0.68, "test_loss": 2.0196787605285644, "test_acc": 0.5038, "lyapunov": null, "grad_norm": 1.1805395110366357, "grad_max_sv": 0.5209554739296436, "grad_min_sv": 2.1478067243539635e-08, "grad_condition": 4139399544.237787, "lr": 0.0009330127018922189, "time_sec": 15.62510895729065 }, { "epoch": 26, "train_loss": 1.0776387982559203, "train_acc": 0.6821, "test_loss": 1.9688811008453369, "test_acc": 0.5111, "lyapunov": null, "grad_norm": 1.1581479939567827, "grad_max_sv": 0.5094197139143943, "grad_min_sv": 2.1775440942062298e-08, "grad_condition": 34416173.97374034, "lr": 0.000927682130080253, "time_sec": 15.616900444030762 }, { "epoch": 27, "train_loss": 1.039057155227661, "train_acc": 0.69314, "test_loss": 1.9735270919799806, "test_acc": 0.5109, "lyapunov": null, "grad_norm": 1.1358478872536777, "grad_max_sv": 0.49843145087361335, "grad_min_sv": 2.0908967124713685e-08, "grad_condition": 147733329.90615898, "lr": 0.0009221639627510072, "time_sec": 15.589634418487549 }, { "epoch": 28, "train_loss": 1.0186366636657715, "train_acc": 0.698, "test_loss": 1.849167727470398, "test_acc": 0.5327, "lyapunov": null, "grad_norm": 1.1179885484776635, "grad_max_sv": 0.4846231251955032, "grad_min_sv": 2.064624871154358e-08, "grad_condition": 187535295.68791586, "lr": 0.0009164606203550494, "time_sec": 15.606561422348022 }, { "epoch": 29, "train_loss": 0.9894418817901611, "train_acc": 0.70704, "test_loss": 1.9159385116577148, "test_acc": 0.5256, "lyapunov": null, "grad_norm": 1.1033010317922292, "grad_max_sv": 0.49175669252872467, "grad_min_sv": 2.0545614226596954e-08, "grad_condition": 28139106.19650669, "lr": 0.0009105746045668516, "time_sec": 15.596401453018188 }, { "epoch": 30, "train_loss": 0.9679239891052246, "train_acc": 0.7117, "test_loss": 1.7626015129089356, "test_acc": 0.5579, "lyapunov": null, "grad_norm": 1.0852050474778043, "grad_max_sv": 0.4818247281014919, "grad_min_sv": 2.036887303824564e-08, "grad_condition": 39564164.33428894, "lr": 0.0009045084971874733, "time_sec": 15.594120025634766 }, { "epoch": 31, "train_loss": 0.9477154457473755, "train_acc": 0.71644, "test_loss": 2.001366552734375, "test_acc": 0.5184, "lyapunov": null, "grad_norm": 1.0714526476916026, "grad_max_sv": 0.45983982309699056, "grad_min_sv": 1.9430452840446533e-08, "grad_condition": 51624978.6905687, "lr": 0.0008982649590120977, "time_sec": 15.600859880447388 }, { "epoch": 32, "train_loss": 0.922220166015625, "train_acc": 0.72322, "test_loss": 1.8274271976470948, "test_acc": 0.552, "lyapunov": null, "grad_norm": 1.0486432180828922, "grad_max_sv": 0.4561096005141735, "grad_min_sv": 1.9119260000893812e-08, "grad_condition": 81358962.64807202, "lr": 0.0008918467286629196, "time_sec": 15.56894040107727 }, { "epoch": 33, "train_loss": 0.9045637095451355, "train_acc": 0.72804, "test_loss": 1.885004960823059, "test_acc": 0.543, "lyapunov": null, "grad_norm": 1.0374896564588747, "grad_max_sv": 0.4518023140728474, "grad_min_sv": 1.917957178319829e-08, "grad_condition": 182673348.7808311, "lr": 0.0008852566213878943, "time_sec": 15.568547010421753 }, { "epoch": 34, "train_loss": 0.8857564904785157, "train_acc": 0.7319, "test_loss": 1.9111962642669678, "test_acc": 0.5412, "lyapunov": null, "grad_norm": 1.0274666482550194, "grad_max_sv": 0.4493935935199261, "grad_min_sv": 1.881604217469912e-08, "grad_condition": 248617918.33796087, "lr": 0.000878497527825878, "time_sec": 15.588915586471558 }, { "epoch": 35, "train_loss": 0.8623492621994019, "train_acc": 0.73752, "test_loss": 1.9594444644927977, "test_acc": 0.5265, "lyapunov": null, "grad_norm": 1.0169882023721266, "grad_max_sv": 0.4450283505022526, "grad_min_sv": 1.8621021413700588e-08, "grad_condition": 51970835.60873811, "lr": 0.000871572412738697, "time_sec": 15.614988565444946 }, { "epoch": 36, "train_loss": 0.847761401977539, "train_acc": 0.7438, "test_loss": 1.8443275575637816, "test_acc": 0.549, "lyapunov": null, "grad_norm": 0.9972656465889882, "grad_max_sv": 0.42991913110017776, "grad_min_sv": 1.8110683554228845e-08, "grad_condition": 63643440.089395806, "lr": 0.0008644843137107055, "time_sec": 15.585567474365234 }, { "epoch": 37, "train_loss": 0.8332586885261536, "train_acc": 0.74546, "test_loss": 1.8331810934066772, "test_acc": 0.5565, "lyapunov": null, "grad_norm": 0.986142343180959, "grad_max_sv": 0.43020778223872186, "grad_min_sv": 1.820308022093542e-08, "grad_condition": 38440650.114556134, "lr": 0.0008572363398164014, "time_sec": 15.585892915725708 }, { "epoch": 38, "train_loss": 0.808667633934021, "train_acc": 0.75458, "test_loss": 1.8140192237854005, "test_acc": 0.563, "lyapunov": null, "grad_norm": 0.9767417084572454, "grad_max_sv": 0.43866117894649503, "grad_min_sv": 1.805343496832229e-08, "grad_condition": 246839591.75793108, "lr": 0.0008498316702566826, "time_sec": 15.576987028121948 }, { "epoch": 39, "train_loss": 0.7920477479743957, "train_acc": 0.75774, "test_loss": 1.998388723373413, "test_acc": 0.5317, "lyapunov": null, "grad_norm": 0.9634949356985317, "grad_max_sv": 0.41083301454782484, "grad_min_sv": 1.7408181231248764e-08, "grad_condition": 207856381.9830411, "lr": 0.0008422735529643442, "time_sec": 15.604882955551147 }, { "epoch": 40, "train_loss": 0.783684113292694, "train_acc": 0.76062, "test_loss": 1.8349973222732543, "test_acc": 0.5584, "lyapunov": null, "grad_norm": 0.9543715044222432, "grad_max_sv": 0.4067095577716827, "grad_min_sv": 1.715405322372243e-08, "grad_condition": 38065468.34049429, "lr": 0.0008345653031794289, "time_sec": 15.61448359489441 }, { "epoch": 41, "train_loss": 0.756040623588562, "train_acc": 0.76704, "test_loss": 1.8635019605636596, "test_acc": 0.5623, "lyapunov": null, "grad_norm": 0.9400945005657612, "grad_max_sv": 0.4006481133401394, "grad_min_sv": 1.706379215496434e-08, "grad_condition": 129917875.15326138, "lr": 0.0008267103019950526, "time_sec": 15.605446100234985 }, { "epoch": 42, "train_loss": 0.747281655292511, "train_acc": 0.77008, "test_loss": 1.804893379020691, "test_acc": 0.5637, "lyapunov": null, "grad_norm": 0.9342754196581016, "grad_max_sv": 0.4069997236132622, "grad_min_sv": 1.690411219660258e-08, "grad_condition": 833088985.4088073, "lr": 0.0008187119948743447, "time_sec": 15.598352432250977 }, { "epoch": 43, "train_loss": 0.7258966027832031, "train_acc": 0.7753, "test_loss": 1.808250590133667, "test_acc": 0.5688, "lyapunov": null, "grad_norm": 0.916899863328162, "grad_max_sv": 0.39457144513726233, "grad_min_sv": 1.6684048499693294e-08, "grad_condition": 39061518.56268385, "lr": 0.000810573890139155, "time_sec": 15.596754550933838 }, { "epoch": 44, "train_loss": 0.7053343192100525, "train_acc": 0.78078, "test_loss": 1.9365575828552246, "test_acc": 0.5516, "lyapunov": null, "grad_norm": 0.909458464797614, "grad_max_sv": 0.38970902636647226, "grad_min_sv": 1.6407527701767232e-08, "grad_condition": 42244499.19662833, "lr": 0.0008022995574311873, "time_sec": 15.606269836425781 }, { "epoch": 45, "train_loss": 0.6963989092254639, "train_acc": 0.7839, "test_loss": 1.8283310445785523, "test_acc": 0.5639, "lyapunov": null, "grad_norm": 0.9004438327166017, "grad_max_sv": 0.39948956444859507, "grad_min_sv": 1.6195382334174836e-08, "grad_condition": 362020379.02432, "lr": 0.0007938926261462363, "time_sec": 15.588224411010742 }, { "epoch": 46, "train_loss": 0.690151353931427, "train_acc": 0.78312, "test_loss": 1.838386841392517, "test_acc": 0.5656, "lyapunov": null, "grad_norm": 0.8990022149636615, "grad_max_sv": 0.3958965942263603, "grad_min_sv": 1.6439048992683212e-08, "grad_condition": 739976934.4713734, "lr": 0.0007853567838422158, "time_sec": 15.608047008514404 }, { "epoch": 47, "train_loss": 0.6644145600509643, "train_acc": 0.79316, "test_loss": 1.7317404174804687, "test_acc": 0.5881, "lyapunov": null, "grad_norm": 0.8888942071856848, "grad_max_sv": 0.3830097340047359, "grad_min_sv": 1.5947025791551715e-08, "grad_condition": 43737023.5418247, "lr": 0.0007766957746216719, "time_sec": 15.61106562614441 }, { "epoch": 48, "train_loss": 0.6501899867248535, "train_acc": 0.7961, "test_loss": 2.0301314384460447, "test_acc": 0.5481, "lyapunov": null, "grad_norm": 0.8710848056333472, "grad_max_sv": 0.37484541684389117, "grad_min_sv": 1.568856004691144e-08, "grad_condition": 71400760.33312531, "lr": 0.0007679133974894982, "time_sec": 15.616482496261597 }, { "epoch": 49, "train_loss": 0.6407210964202881, "train_acc": 0.79878, "test_loss": 1.8660895137786866, "test_acc": 0.5703, "lyapunov": null, "grad_norm": 0.8631402634979823, "grad_max_sv": 0.3794224761426449, "grad_min_sv": 1.5698247981393855e-08, "grad_condition": 48831357.42187855, "lr": 0.000759013504686565, "time_sec": 15.608244180679321 }, { "epoch": 50, "train_loss": 0.635532203464508, "train_acc": 0.79966, "test_loss": 1.8019765382766724, "test_acc": 0.5773, "lyapunov": null, "grad_norm": 0.8639281681323187, "grad_max_sv": 0.3756891183555126, "grad_min_sv": 1.5385762375426383e-08, "grad_condition": 443886531.5137703, "lr": 0.0007499999999999998, "time_sec": 15.595497369766235 }, { "epoch": 51, "train_loss": 0.6136586366081238, "train_acc": 0.8078, "test_loss": 1.985259211730957, "test_acc": 0.5541, "lyapunov": null, "grad_norm": 0.8502360335489318, "grad_max_sv": 0.38991634622216226, "grad_min_sv": 1.589003087859586e-08, "grad_condition": 36685688.17597731, "lr": 0.0007408768370508575, "time_sec": 15.606870174407959 }, { "epoch": 52, "train_loss": 0.6016868180465699, "train_acc": 0.81054, "test_loss": 1.9059622749328613, "test_acc": 0.5677, "lyapunov": null, "grad_norm": 0.839451980682905, "grad_max_sv": 0.3655779927968979, "grad_min_sv": 1.50471602150537e-08, "grad_condition": 68824107.55111663, "lr": 0.0007316480175599307, "time_sec": 15.595157861709595 }, { "epoch": 53, "train_loss": 0.5874249538040162, "train_acc": 0.81406, "test_loss": 1.9880520868301392, "test_acc": 0.5586, "lyapunov": null, "grad_norm": 0.8317551917480781, "grad_max_sv": 0.3655713267624378, "grad_min_sv": 1.5141927978482016e-08, "grad_condition": 349299867.91202754, "lr": 0.0007223175895924635, "time_sec": 15.589019060134888 }, { "epoch": 54, "train_loss": 0.577422985610962, "train_acc": 0.8184, "test_loss": 1.9396752899169922, "test_acc": 0.5636, "lyapunov": null, "grad_norm": 0.8261938394130597, "grad_max_sv": 0.3618521079421043, "grad_min_sv": 1.4864520584507642e-08, "grad_condition": 553216070.5433874, "lr": 0.0007128896457825361, "time_sec": 15.610572338104248 }, { "epoch": 55, "train_loss": 0.5702339578819275, "train_acc": 0.81924, "test_loss": 1.8778120471954345, "test_acc": 0.5713, "lyapunov": null, "grad_norm": 0.8242148097122628, "grad_max_sv": 0.36288107857108115, "grad_min_sv": 1.4883936903103966e-08, "grad_condition": 52140637.21728975, "lr": 0.0007033683215378998, "time_sec": 15.605257749557495 }, { "epoch": 56, "train_loss": 0.5589845707130432, "train_acc": 0.82372, "test_loss": 1.8699417673110963, "test_acc": 0.5751, "lyapunov": null, "grad_norm": 0.8186771944690047, "grad_max_sv": 0.346701592952013, "grad_min_sv": 1.459523215271985e-08, "grad_condition": 46853728.14353165, "lr": 0.0006937577932260512, "time_sec": 15.589865684509277 }, { "epoch": 57, "train_loss": 0.5443892800807952, "train_acc": 0.82776, "test_loss": 1.965821966934204, "test_acc": 0.5664, "lyapunov": null, "grad_norm": 0.8036351010817813, "grad_max_sv": 0.3483227726072073, "grad_min_sv": 1.4410761232583335e-08, "grad_condition": 73431270.59891501, "lr": 0.0006840622763423388, "time_sec": 15.590615510940552 }, { "epoch": 58, "train_loss": 0.5372896729660034, "train_acc": 0.82954, "test_loss": 1.876914355659485, "test_acc": 0.5811, "lyapunov": null, "grad_norm": 0.7997423554449953, "grad_max_sv": 0.34569344371557237, "grad_min_sv": 1.4015608398366443e-08, "grad_condition": 828306651.3532289, "lr": 0.0006742860236609073, "time_sec": 15.640390872955322 }, { "epoch": 59, "train_loss": 0.5291300660514832, "train_acc": 0.83176, "test_loss": 1.8113979286193849, "test_acc": 0.5866, "lyapunov": null, "grad_norm": 0.7903239162734349, "grad_max_sv": 0.34317835718393325, "grad_min_sv": 1.4270118212610095e-08, "grad_condition": 130381299.82028241, "lr": 0.0006644333233692913, "time_sec": 15.598358869552612 }, { "epoch": 60, "train_loss": 0.5121459530830383, "train_acc": 0.83708, "test_loss": 1.8623944423675538, "test_acc": 0.5809, "lyapunov": null, "grad_norm": 0.7828571196598214, "grad_max_sv": 0.33372929617762565, "grad_min_sv": 1.3842122733448425e-08, "grad_condition": 47391163.99310992, "lr": 0.0006545084971874734, "time_sec": 15.594441413879395 }, { "epoch": 61, "train_loss": 0.5045927854156494, "train_acc": 0.83722, "test_loss": 1.868363607597351, "test_acc": 0.5833, "lyapunov": null, "grad_norm": 0.782632751951769, "grad_max_sv": 0.3441222012042999, "grad_min_sv": 1.4132956021933527e-08, "grad_condition": 770221957.2190915, "lr": 0.0006445158984722354, "time_sec": 15.625693082809448 }, { "epoch": 62, "train_loss": 0.4909844134426117, "train_acc": 0.84268, "test_loss": 1.9616632486343384, "test_acc": 0.5686, "lyapunov": null, "grad_norm": 0.7640706557919354, "grad_max_sv": 0.3262421116232872, "grad_min_sv": 1.3609901451661078e-08, "grad_condition": 70578003.89460334, "lr": 0.0006344599103076324, "time_sec": 15.61337399482727 }, { "epoch": 63, "train_loss": 0.47858007513046263, "train_acc": 0.84808, "test_loss": 1.8504299934387207, "test_acc": 0.5864, "lyapunov": null, "grad_norm": 0.7612944717059198, "grad_max_sv": 0.3300259932875633, "grad_min_sv": 1.34369991692607e-08, "grad_condition": 1366561815.948382, "lr": 0.0006243449435824269, "time_sec": 15.618177652359009 }, { "epoch": 64, "train_loss": 0.47501785024642945, "train_acc": 0.84756, "test_loss": 1.8781955436706543, "test_acc": 0.5869, "lyapunov": null, "grad_norm": 0.7572180647827939, "grad_max_sv": 0.3278561718761921, "grad_min_sv": 1.3324545805690896e-08, "grad_condition": 581046380.377969, "lr": 0.0006141754350553275, "time_sec": 15.624166488647461 }, { "epoch": 65, "train_loss": 0.4702414323043823, "train_acc": 0.84926, "test_loss": 1.892370820426941, "test_acc": 0.586, "lyapunov": null, "grad_norm": 0.7563650221448377, "grad_max_sv": 0.3307614929974079, "grad_min_sv": 1.3784487005921026e-08, "grad_condition": 464200921.7045374, "lr": 0.0006039558454088793, "time_sec": 15.617845058441162 }, { "epoch": 66, "train_loss": 0.45756534008026123, "train_acc": 0.85312, "test_loss": 1.9519972061157227, "test_acc": 0.5808, "lyapunov": null, "grad_norm": 0.7420841565788096, "grad_max_sv": 0.33202062249183656, "grad_min_sv": 1.338400364191486e-08, "grad_condition": 499395104.1034541, "lr": 0.000593690657292862, "time_sec": 15.611196994781494 }, { "epoch": 67, "train_loss": 0.44467548862457273, "train_acc": 0.85686, "test_loss": 1.9216414470672607, "test_acc": 0.5822, "lyapunov": null, "grad_norm": 0.7382025740357703, "grad_max_sv": 0.3282777763903141, "grad_min_sv": 1.3046149181881323e-08, "grad_condition": 346705862.33150136, "lr": 0.0005833843733580507, "time_sec": 15.611254215240479 }, { "epoch": 68, "train_loss": 0.43985233959198, "train_acc": 0.85918, "test_loss": 1.8851093154907226, "test_acc": 0.5926, "lyapunov": null, "grad_norm": 0.7289145095731725, "grad_max_sv": 0.32352428287267687, "grad_min_sv": 1.3040011394684428e-08, "grad_condition": 442041574.8141201, "lr": 0.0005730415142812054, "time_sec": 15.625309467315674 }, { "epoch": 69, "train_loss": 0.4362604184055328, "train_acc": 0.85998, "test_loss": 1.8714712146759034, "test_acc": 0.5926, "lyapunov": null, "grad_norm": 0.7311888404996788, "grad_max_sv": 0.31886391565203664, "grad_min_sv": 1.2968906573272102e-08, "grad_condition": 3567171952.0862184, "lr": 0.0005626666167821517, "time_sec": 15.61151123046875 }, { "epoch": 70, "train_loss": 0.42215480308532716, "train_acc": 0.86416, "test_loss": 2.019381594085693, "test_acc": 0.5791, "lyapunov": null, "grad_norm": 0.721768423243528, "grad_max_sv": 0.3247049540281296, "grad_min_sv": 1.2853580642424936e-08, "grad_condition": 450059064.02256596, "lr": 0.0005522642316338265, "time_sec": 15.629756689071655 }, { "epoch": 71, "train_loss": 0.4138381930923462, "train_acc": 0.8672, "test_loss": 1.8805969470977784, "test_acc": 0.5939, "lyapunov": null, "grad_norm": 0.7122183187054967, "grad_max_sv": 0.31785007640719415, "grad_min_sv": 1.2996066436378461e-08, "grad_condition": 197171308.1464749, "lr": 0.0005418389216661573, "time_sec": 15.619616270065308 }, { "epoch": 72, "train_loss": 0.40292635828018186, "train_acc": 0.86882, "test_loss": 1.9322007545471191, "test_acc": 0.5786, "lyapunov": null, "grad_norm": 0.7085910743884665, "grad_max_sv": 0.3134432151913643, "grad_min_sv": 1.2498033243762453e-08, "grad_condition": 793091340.8871062, "lr": 0.0005313952597646563, "time_sec": 15.617356300354004 }, { "epoch": 73, "train_loss": 0.40141631307601927, "train_acc": 0.86948, "test_loss": 1.8957605976104737, "test_acc": 0.599, "lyapunov": null, "grad_norm": 0.7091751625468098, "grad_max_sv": 0.3174535669386387, "grad_min_sv": 1.2447811244958862e-08, "grad_condition": 249741254.61747846, "lr": 0.0005209378268645994, "time_sec": 15.621675968170166 }, { "epoch": 74, "train_loss": 0.3882115649795532, "train_acc": 0.87366, "test_loss": 1.98493223361969, "test_acc": 0.5838, "lyapunov": null, "grad_norm": 0.6962545006972763, "grad_max_sv": 0.31799899972975254, "grad_min_sv": 1.2635416091113378e-08, "grad_condition": 228682453.11998367, "lr": 0.0005104712099416781, "time_sec": 15.613324403762817 }, { "epoch": 75, "train_loss": 0.3784026951885223, "train_acc": 0.8775, "test_loss": 1.9258492612838745, "test_acc": 0.5894, "lyapunov": null, "grad_norm": 0.6897862834083666, "grad_max_sv": 0.3025407921522856, "grad_min_sv": 1.191642424076822e-08, "grad_condition": 517580765.4604114, "lr": 0.0004999999999999996, "time_sec": 15.604532957077026 }, { "epoch": 76, "train_loss": 0.3745850126075745, "train_acc": 0.87942, "test_loss": 1.8862019395828247, "test_acc": 0.597, "lyapunov": null, "grad_norm": 0.6831871296489548, "grad_max_sv": 0.30832933597266676, "grad_min_sv": 1.2160173869495832e-08, "grad_condition": 947775184.6338822, "lr": 0.0004895287900583212, "time_sec": 15.608951568603516 }, { "epoch": 77, "train_loss": 0.3610551133441925, "train_acc": 0.88172, "test_loss": 1.880063851928711, "test_acc": 0.6012, "lyapunov": null, "grad_norm": 0.6743453354187542, "grad_max_sv": 0.29855253025889394, "grad_min_sv": 1.2030242225015767e-08, "grad_condition": 516312299.61059207, "lr": 0.0004790621731353997, "time_sec": 15.615072250366211 }, { "epoch": 78, "train_loss": 0.3575943685531616, "train_acc": 0.88478, "test_loss": 1.9622120880126954, "test_acc": 0.5938, "lyapunov": null, "grad_norm": 0.6751503647014531, "grad_max_sv": 0.30869465619325637, "grad_min_sv": 1.1962258270568903e-08, "grad_condition": 156961942.34190208, "lr": 0.000468604740235343, "time_sec": 15.620108127593994 }, { "epoch": 79, "train_loss": 0.356780963382721, "train_acc": 0.88514, "test_loss": 1.9785774551391602, "test_acc": 0.5895, "lyapunov": null, "grad_norm": 0.6750273249196351, "grad_max_sv": 0.29922002404928205, "grad_min_sv": 1.1769536231547029e-08, "grad_condition": 159293637.70185965, "lr": 0.00045816107833384175, "time_sec": 15.615866899490356 }, { "epoch": 80, "train_loss": 0.34938912315368653, "train_acc": 0.8876, "test_loss": 1.9177911525726319, "test_acc": 0.5916, "lyapunov": null, "grad_norm": 0.6633930537019016, "grad_max_sv": 0.29133019372820856, "grad_min_sv": 1.1681813408617736e-08, "grad_condition": 263364196.96272945, "lr": 0.0004477357683661729, "time_sec": 15.618734359741211 }, { "epoch": 81, "train_loss": 0.34074662324905397, "train_acc": 0.8899, "test_loss": 1.947013536453247, "test_acc": 0.5907, "lyapunov": null, "grad_norm": 0.6597022593428697, "grad_max_sv": 0.29191571436822417, "grad_min_sv": 1.156299900565089e-08, "grad_condition": 1345147447.952278, "lr": 0.00043733338321784746, "time_sec": 15.646045923233032 }, { "epoch": 82, "train_loss": 0.33476794362068174, "train_acc": 0.89196, "test_loss": 1.995362993812561, "test_acc": 0.5918, "lyapunov": null, "grad_norm": 0.6563550515125143, "grad_max_sv": 0.28989207223057745, "grad_min_sv": 1.1521310828500105e-08, "grad_condition": 1549368517.9852664, "lr": 0.0004269584857187939, "time_sec": 15.651390075683594 }, { "epoch": 83, "train_loss": 0.32779589292526246, "train_acc": 0.89466, "test_loss": 1.9326098243713379, "test_acc": 0.5984, "lyapunov": null, "grad_norm": 0.6471640564495617, "grad_max_sv": 0.29146968461573125, "grad_min_sv": 1.1487493853379327e-08, "grad_condition": 92617304.39349434, "lr": 0.0004166156266419484, "time_sec": 15.611905336380005 }, { "epoch": 84, "train_loss": 0.3205149848842621, "train_acc": 0.89636, "test_loss": 2.084268938064575, "test_acc": 0.5809, "lyapunov": null, "grad_norm": 0.6452842014274853, "grad_max_sv": 0.2868046831339598, "grad_min_sv": 1.1289359868812965e-08, "grad_condition": 186807946.77140856, "lr": 0.0004063093427071373, "time_sec": 15.605120658874512 }, { "epoch": 85, "train_loss": 0.31429147192001344, "train_acc": 0.89772, "test_loss": 1.8867773443222047, "test_acc": 0.6067, "lyapunov": null, "grad_norm": 0.6402388209165808, "grad_max_sv": 0.29072388894855977, "grad_min_sv": 1.1252009047418853e-08, "grad_condition": 102815726.30519769, "lr": 0.0003960441545911199, "time_sec": 15.619008302688599 }, { "epoch": 86, "train_loss": 0.3057248209381104, "train_acc": 0.90034, "test_loss": 1.9401320112228393, "test_acc": 0.5983, "lyapunov": null, "grad_norm": 0.6311267078269261, "grad_max_sv": 0.2907364759594202, "grad_min_sv": 1.1278600659490879e-08, "grad_condition": 156533701.22010937, "lr": 0.0003858245649446718, "time_sec": 15.645244359970093 }, { "epoch": 87, "train_loss": 0.3014916487598419, "train_acc": 0.9024, "test_loss": 1.9676358179092408, "test_acc": 0.5951, "lyapunov": null, "grad_norm": 0.6286377862812311, "grad_max_sv": 0.29410710372030735, "grad_min_sv": 1.117144211807558e-08, "grad_condition": 1243341457.898049, "lr": 0.00037565505641757235, "time_sec": 15.613637685775757 }, { "epoch": 88, "train_loss": 0.2975629404449463, "train_acc": 0.90206, "test_loss": 1.9475040822982788, "test_acc": 0.6007, "lyapunov": null, "grad_norm": 0.6288857771151286, "grad_max_sv": 0.29210252575576306, "grad_min_sv": 1.1327018099556787e-08, "grad_condition": 449577659.23919934, "lr": 0.00036554008969236695, "time_sec": 15.627456188201904 }, { "epoch": 89, "train_loss": 0.2940291863822937, "train_acc": 0.90424, "test_loss": 1.9751218059539795, "test_acc": 0.6041, "lyapunov": null, "grad_norm": 0.624248588717073, "grad_max_sv": 0.27752059176564214, "grad_min_sv": 1.0839235129161267e-08, "grad_condition": 328108890.12738866, "lr": 0.0003554841015277638, "time_sec": 15.661294221878052 }, { "epoch": 90, "train_loss": 0.28330512808799746, "train_acc": 0.90742, "test_loss": 1.9922785207748412, "test_acc": 0.6018, "lyapunov": null, "grad_norm": 0.6169602856180438, "grad_max_sv": 0.2886409737169743, "grad_min_sv": 1.0983499523081752e-08, "grad_condition": 97610883.30544701, "lr": 0.000345491502812526, "time_sec": 15.610979795455933 }, { "epoch": 91, "train_loss": 0.2814662490653992, "train_acc": 0.90908, "test_loss": 1.9960870874404908, "test_acc": 0.5995, "lyapunov": null, "grad_norm": 0.6132865794782463, "grad_max_sv": 0.28339540734887125, "grad_min_sv": 1.0941020271021395e-08, "grad_condition": 145384408.70816708, "lr": 0.0003355666766307081, "time_sec": 15.639533281326294 }, { "epoch": 92, "train_loss": 0.2761197953605652, "train_acc": 0.91006, "test_loss": 1.993612285232544, "test_acc": 0.6007, "lyapunov": null, "grad_norm": 0.6073672916952068, "grad_max_sv": 0.2746456813067198, "grad_min_sv": 1.0572886616905252e-08, "grad_condition": 62093577.47245115, "lr": 0.00032571397633909225, "time_sec": 15.616953611373901 }, { "epoch": 93, "train_loss": 0.2773143856334686, "train_acc": 0.90906, "test_loss": 1.9627196998596192, "test_acc": 0.5993, "lyapunov": null, "grad_norm": 0.6057396266879189, "grad_max_sv": 0.27635425254702567, "grad_min_sv": 1.0533270900208586e-08, "grad_condition": 200919941.49428365, "lr": 0.00031593772365766094, "time_sec": 15.62587594985962 }, { "epoch": 94, "train_loss": 0.2620466177368164, "train_acc": 0.91416, "test_loss": 2.0111697412490845, "test_acc": 0.602, "lyapunov": null, "grad_norm": 0.5926928515974628, "grad_max_sv": 0.28529031090438367, "grad_min_sv": 1.0650170428677317e-08, "grad_condition": 743433094.0082552, "lr": 0.0003062422067739483, "time_sec": 15.626370191574097 }, { "epoch": 95, "train_loss": 0.2537871124172211, "train_acc": 0.91762, "test_loss": 1.9979699476242065, "test_acc": 0.5996, "lyapunov": null, "grad_norm": 0.5795471657923094, "grad_max_sv": 0.27274232916533947, "grad_min_sv": 1.036865705178816e-08, "grad_condition": 309294232.0879529, "lr": 0.00029663167846209965, "time_sec": 15.634578943252563 }, { "epoch": 96, "train_loss": 0.2604071279144287, "train_acc": 0.91558, "test_loss": 2.0250939807891846, "test_acc": 0.5981, "lyapunov": null, "grad_norm": 0.5880459177262352, "grad_max_sv": 0.27270981669425964, "grad_min_sv": 1.0527747556186851e-08, "grad_condition": 634008594.0035694, "lr": 0.00028711035421746345, "time_sec": 15.610902070999146 }, { "epoch": 97, "train_loss": 0.25580399082183836, "train_acc": 0.91794, "test_loss": 1.9363522800445556, "test_acc": 0.611, "lyapunov": null, "grad_norm": 0.5834698969226986, "grad_max_sv": 0.2803939372301102, "grad_min_sv": 1.0679914613353353e-08, "grad_condition": 719199780.3413004, "lr": 0.00027768241040753615, "time_sec": 15.64728569984436 }, { "epoch": 98, "train_loss": 0.24704306831359862, "train_acc": 0.92026, "test_loss": 1.959199716567993, "test_acc": 0.6064, "lyapunov": null, "grad_norm": 0.5767069189645235, "grad_max_sv": 0.2719736970961094, "grad_min_sv": 1.0407105681484868e-08, "grad_condition": 507738893.5347587, "lr": 0.00026835198244006903, "time_sec": 15.606433153152466 }, { "epoch": 99, "train_loss": 0.23963388308048247, "train_acc": 0.92232, "test_loss": 2.0193208892822265, "test_acc": 0.604, "lyapunov": null, "grad_norm": 0.5636948581506628, "grad_max_sv": 0.2563767429441214, "grad_min_sv": 9.613457626483913e-09, "grad_condition": 152598313.52871948, "lr": 0.0002591231629491421, "time_sec": 15.63752031326294 }, { "epoch": 100, "train_loss": 0.24343088443756103, "train_acc": 0.92086, "test_loss": 1.9747429904937743, "test_acc": 0.6041, "lyapunov": null, "grad_norm": 0.5699300559096447, "grad_max_sv": 0.270798621699214, "grad_min_sv": 1.0453353890187232e-08, "grad_condition": 2642582699.9195356, "lr": 0.0002499999999999997, "time_sec": 15.625839710235596 }, { "epoch": 101, "train_loss": 0.2352629409980774, "train_acc": 0.92396, "test_loss": 1.989087490463257, "test_acc": 0.6026, "lyapunov": null, "grad_norm": 0.5635783773655396, "grad_max_sv": 0.2760987766087055, "grad_min_sv": 1.0676657122982158e-08, "grad_condition": 230608448.0042146, "lr": 0.00024098649531343477, "time_sec": 15.618889093399048 }, { "epoch": 102, "train_loss": 0.23230449400901795, "train_acc": 0.9242, "test_loss": 2.011552722930908, "test_acc": 0.6012, "lyapunov": null, "grad_norm": 0.5597262828511032, "grad_max_sv": 0.2676333624869585, "grad_min_sv": 1.013142310103167e-08, "grad_condition": 765944599.5566685, "lr": 0.0002320866025105016, "time_sec": 15.619239091873169 }, { "epoch": 103, "train_loss": 0.22586535712242126, "train_acc": 0.92702, "test_loss": 1.984936227798462, "test_acc": 0.6064, "lyapunov": null, "grad_norm": 0.5525662827107412, "grad_max_sv": 0.26978373192250726, "grad_min_sv": 1.0020810805059718e-08, "grad_condition": 426927099.4434453, "lr": 0.0002233042253783278, "time_sec": 15.617717981338501 }, { "epoch": 104, "train_loss": 0.2259028799390793, "train_acc": 0.92724, "test_loss": 1.9414194402694702, "test_acc": 0.6138, "lyapunov": null, "grad_norm": 0.5552198456176712, "grad_max_sv": 0.2549734696745872, "grad_min_sv": 9.559075114318542e-09, "grad_condition": 2183845809.503984, "lr": 0.000214643216157784, "time_sec": 15.639457702636719 }, { "epoch": 105, "train_loss": 0.21585512964725495, "train_acc": 0.93068, "test_loss": 1.9875489110946656, "test_acc": 0.606, "lyapunov": null, "grad_norm": 0.545110676363793, "grad_max_sv": 0.2662647683173418, "grad_min_sv": 9.966519613335139e-09, "grad_condition": 304520020.74158037, "lr": 0.00020610737385376332, "time_sec": 15.633507013320923 }, { "epoch": 106, "train_loss": 0.2177306656885147, "train_acc": 0.92888, "test_loss": 2.001543083000183, "test_acc": 0.6039, "lyapunov": null, "grad_norm": 0.550439381212866, "grad_max_sv": 0.2616906825453043, "grad_min_sv": 9.792636692686207e-09, "grad_condition": 257664085.8931566, "lr": 0.00019770044256881242, "time_sec": 15.617624759674072 }, { "epoch": 107, "train_loss": 0.21544821160316469, "train_acc": 0.93026, "test_loss": 1.982275790977478, "test_acc": 0.6101, "lyapunov": null, "grad_norm": 0.5459895500350969, "grad_max_sv": 0.25458521842956544, "grad_min_sv": 9.842609948471428e-09, "grad_condition": 482597026.39869213, "lr": 0.0001894261098608447, "time_sec": 15.647446632385254 }, { "epoch": 108, "train_loss": 0.2111588809776306, "train_acc": 0.93214, "test_loss": 1.9962615560531616, "test_acc": 0.6122, "lyapunov": null, "grad_norm": 0.5418984142700298, "grad_max_sv": 0.2645403627306223, "grad_min_sv": 9.923241169051967e-09, "grad_condition": 365555925.75439864, "lr": 0.000181288005125655, "time_sec": 15.624069213867188 }, { "epoch": 109, "train_loss": 0.20284160462856293, "train_acc": 0.9356, "test_loss": 1.9948909492492677, "test_acc": 0.6088, "lyapunov": null, "grad_norm": 0.528437343256151, "grad_max_sv": 0.259377746284008, "grad_min_sv": 9.446828402957103e-09, "grad_condition": 445873699.40050447, "lr": 0.0001732896980049473, "time_sec": 15.619670867919922 }, { "epoch": 110, "train_loss": 0.20353743035316468, "train_acc": 0.93482, "test_loss": 1.986756645965576, "test_acc": 0.6055, "lyapunov": null, "grad_norm": 0.5264966046483858, "grad_max_sv": 0.2641640670597553, "grad_min_sv": 9.887280825321421e-09, "grad_condition": 138912649.1504107, "lr": 0.00016543469682057076, "time_sec": 15.631803512573242 }, { "epoch": 111, "train_loss": 0.20074854846000673, "train_acc": 0.93586, "test_loss": 1.9947669797897338, "test_acc": 0.6121, "lyapunov": null, "grad_norm": 0.5275548784671268, "grad_max_sv": 0.2535504408180714, "grad_min_sv": 9.46079494620021e-09, "grad_condition": 547036967.0533922, "lr": 0.00015772644703565552, "time_sec": 15.61940598487854 }, { "epoch": 112, "train_loss": 0.19321160237312318, "train_acc": 0.9385, "test_loss": 2.0327499378204346, "test_acc": 0.6062, "lyapunov": null, "grad_norm": 0.5166537604057669, "grad_max_sv": 0.25912084989249706, "grad_min_sv": 9.35720720976474e-09, "grad_condition": 95478514.06504653, "lr": 0.00015016832974331713, "time_sec": 15.630404233932495 }, { "epoch": 113, "train_loss": 0.19881929339408874, "train_acc": 0.93676, "test_loss": 1.9957002614974975, "test_acc": 0.6131, "lyapunov": null, "grad_norm": 0.5256468964094271, "grad_max_sv": 0.26186227425932884, "grad_min_sv": 9.776758263992796e-09, "grad_condition": 531930595.36185646, "lr": 0.00014276366018359834, "time_sec": 15.610270023345947 }, { "epoch": 114, "train_loss": 0.19278850085735322, "train_acc": 0.93894, "test_loss": 1.9826040161132812, "test_acc": 0.6131, "lyapunov": null, "grad_norm": 0.5148800122190731, "grad_max_sv": 0.2489961117506027, "grad_min_sv": 9.322825122396599e-09, "grad_condition": 159545806.21783024, "lr": 0.00013551568628929425, "time_sec": 15.641097784042358 }, { "epoch": 115, "train_loss": 0.18285285237312318, "train_acc": 0.9414, "test_loss": 1.991772039604187, "test_acc": 0.6142, "lyapunov": null, "grad_norm": 0.5028991850276996, "grad_max_sv": 0.25001580603420737, "grad_min_sv": 9.509952834441983e-09, "grad_condition": 842043304.8653241, "lr": 0.00012842758726130276, "time_sec": 15.624920845031738 }, { "epoch": 116, "train_loss": 0.18698999623775484, "train_acc": 0.94058, "test_loss": 2.0126701816558836, "test_acc": 0.6119, "lyapunov": null, "grad_norm": 0.5095041564276453, "grad_max_sv": 0.26496921889483926, "grad_min_sv": 9.780998184343373e-09, "grad_condition": 568079773.7667667, "lr": 0.0001215024721741218, "time_sec": 15.629492282867432 }, { "epoch": 117, "train_loss": 0.18326869733810425, "train_acc": 0.94208, "test_loss": 2.0141338161468507, "test_acc": 0.6109, "lyapunov": null, "grad_norm": 0.5053898511223723, "grad_max_sv": 0.25150991678237916, "grad_min_sv": 9.336200610613604e-09, "grad_condition": 1717749653.6011043, "lr": 0.00011474337861210538, "time_sec": 15.634049415588379 }, { "epoch": 118, "train_loss": 0.18224171819210053, "train_acc": 0.94188, "test_loss": 2.0296729431152345, "test_acc": 0.6105, "lyapunov": null, "grad_norm": 0.5029285155771278, "grad_max_sv": 0.23879224769771099, "grad_min_sv": 8.82893005297973e-09, "grad_condition": 239804345.46782646, "lr": 0.00010815327133708009, "time_sec": 15.628947496414185 }, { "epoch": 119, "train_loss": 0.18119296488761902, "train_acc": 0.94198, "test_loss": 2.0246818908691404, "test_acc": 0.6087, "lyapunov": null, "grad_norm": 0.5032702983874193, "grad_max_sv": 0.24678345806896687, "grad_min_sv": 9.113220317789883e-09, "grad_condition": 857312795.1343833, "lr": 0.00010173504098790182, "time_sec": 15.6134774684906 }, { "epoch": 120, "train_loss": 0.17719127690315248, "train_acc": 0.9427, "test_loss": 2.01081164188385, "test_acc": 0.6174, "lyapunov": null, "grad_norm": 0.5004254149003725, "grad_max_sv": 0.246440602093935, "grad_min_sv": 9.41313048775233e-09, "grad_condition": 138861626.69393042, "lr": 9.549150281252629e-05, "time_sec": 15.636605978012085 }, { "epoch": 121, "train_loss": 0.17499777765274047, "train_acc": 0.94382, "test_loss": 1.9586133924484252, "test_acc": 0.6191, "lyapunov": null, "grad_norm": 0.49798749889404575, "grad_max_sv": 0.24333747774362563, "grad_min_sv": 8.965640931665048e-09, "grad_condition": 199036180.79499412, "lr": 8.942539543314794e-05, "time_sec": 15.640979051589966 }, { "epoch": 122, "train_loss": 0.17186202396392822, "train_acc": 0.94454, "test_loss": 2.0166892234802245, "test_acc": 0.6135, "lyapunov": null, "grad_norm": 0.49330378790067125, "grad_max_sv": 0.25466611608862877, "grad_min_sv": 9.453950847171378e-09, "grad_condition": 478328271.5351636, "lr": 8.353937964495024e-05, "time_sec": 15.646830320358276 }, { "epoch": 123, "train_loss": 0.16818810626506805, "train_acc": 0.94736, "test_loss": 2.019712274169922, "test_acc": 0.6142, "lyapunov": null, "grad_norm": 0.48351538018550005, "grad_max_sv": 0.23057686612010003, "grad_min_sv": 8.829706591578778e-09, "grad_condition": 119186809.27894473, "lr": 7.783603724899243e-05, "time_sec": 15.61932897567749 }, { "epoch": 124, "train_loss": 0.1690133387851715, "train_acc": 0.94626, "test_loss": 2.0480916412353514, "test_acc": 0.6128, "lyapunov": null, "grad_norm": 0.48572744080768737, "grad_max_sv": 0.23872192315757274, "grad_min_sv": 8.860755323661872e-09, "grad_condition": 3145605466.955108, "lr": 7.231786991974666e-05, "time_sec": 15.644042730331421 }, { "epoch": 125, "train_loss": 0.168843046336174, "train_acc": 0.94632, "test_loss": 2.0204298835754395, "test_acc": 0.6129, "lyapunov": null, "grad_norm": 0.4870048472763099, "grad_max_sv": 0.23674570098519326, "grad_min_sv": 8.746680829206827e-09, "grad_condition": 1043463046.0193933, "lr": 6.698729810778072e-05, "time_sec": 15.637329578399658 }, { "epoch": 126, "train_loss": 0.1671668215227127, "train_acc": 0.94594, "test_loss": 2.002202911376953, "test_acc": 0.6131, "lyapunov": null, "grad_norm": 0.48754920878473634, "grad_max_sv": 0.24048108272254468, "grad_min_sv": 9.09920443853407e-09, "grad_condition": 222641480.08621296, "lr": 6.184665997806817e-05, "time_sec": 15.630179405212402 }, { "epoch": 127, "train_loss": 0.1643574129629135, "train_acc": 0.94886, "test_loss": 1.9984551259994507, "test_acc": 0.6156, "lyapunov": null, "grad_norm": 0.47845542032939736, "grad_max_sv": 0.24418257176876068, "grad_min_sv": 9.058184188338348e-09, "grad_condition": 1384258325.8409991, "lr": 5.6898210384392595e-05, "time_sec": 15.670144081115723 }, { "epoch": 128, "train_loss": 0.16359006194114686, "train_acc": 0.9479, "test_loss": 2.0345991184234617, "test_acc": 0.6179, "lyapunov": null, "grad_norm": 0.48011615670673446, "grad_max_sv": 0.2456669148057699, "grad_min_sv": 9.08018520576876e-09, "grad_condition": 6539583536.661702, "lr": 5.214411988029363e-05, "time_sec": 15.629289150238037 }, { "epoch": 129, "train_loss": 0.16212649368047713, "train_acc": 0.94982, "test_loss": 2.010682648849487, "test_acc": 0.6175, "lyapunov": null, "grad_norm": 0.4761536550945564, "grad_max_sv": 0.232033634185791, "grad_min_sv": 8.589821504130924e-09, "grad_condition": 3119446573.9156704, "lr": 4.7586473766990294e-05, "time_sec": 15.64078950881958 }, { "epoch": 130, "train_loss": 0.16086667060375215, "train_acc": 0.94958, "test_loss": 1.9803698434829713, "test_acc": 0.6147, "lyapunov": null, "grad_norm": 0.47391205330881436, "grad_max_sv": 0.2445445589721203, "grad_min_sv": 8.864201939140243e-09, "grad_condition": 1504896403.9424946, "lr": 4.32272711786996e-05, "time_sec": 15.639111280441284 }, { "epoch": 131, "train_loss": 0.1630353739786148, "train_acc": 0.94778, "test_loss": 2.0161276233673098, "test_acc": 0.6182, "lyapunov": null, "grad_norm": 0.47703771588416854, "grad_max_sv": 0.24524084888398648, "grad_min_sv": 8.949330069585661e-09, "grad_condition": 366306191.4994844, "lr": 3.906842420574966e-05, "time_sec": 15.648417472839355 }, { "epoch": 132, "train_loss": 0.1624550827550888, "train_acc": 0.94854, "test_loss": 2.0064841974258423, "test_acc": 0.6153, "lyapunov": null, "grad_norm": 0.4818820971540279, "grad_max_sv": 0.24392225965857506, "grad_min_sv": 9.014241386749028e-09, "grad_condition": 324500193.81381315, "lr": 3.5111757055874305e-05, "time_sec": 15.652456998825073 }, { "epoch": 133, "train_loss": 0.15666789950847626, "train_acc": 0.95052, "test_loss": 2.004924358177185, "test_acc": 0.614, "lyapunov": null, "grad_norm": 0.4692967462799058, "grad_max_sv": 0.23394662290811538, "grad_min_sv": 8.633084696250959e-09, "grad_condition": 738953051.583332, "lr": 3.1359005254054254e-05, "time_sec": 15.626720190048218 }, { "epoch": 134, "train_loss": 0.15714832616329194, "train_acc": 0.951, "test_loss": 1.9721798049926758, "test_acc": 0.6189, "lyapunov": null, "grad_norm": 0.4708593375349624, "grad_max_sv": 0.2399698007851839, "grad_min_sv": 8.714008907333149e-09, "grad_condition": 459943684.01348275, "lr": 2.7811814881259484e-05, "time_sec": 15.634363174438477 }, { "epoch": 135, "train_loss": 0.15481690949440002, "train_acc": 0.95178, "test_loss": 2.056765143966675, "test_acc": 0.6141, "lyapunov": null, "grad_norm": 0.46512649923966126, "grad_max_sv": 0.23735021129250528, "grad_min_sv": 8.604525054706907e-09, "grad_condition": 441311318.94657505, "lr": 2.4471741852423218e-05, "time_sec": 15.641301155090332 }, { "epoch": 136, "train_loss": 0.15590213608264922, "train_acc": 0.95074, "test_loss": 1.9664541049957276, "test_acc": 0.615, "lyapunov": null, "grad_norm": 0.4718253897994526, "grad_max_sv": 0.24445511549711227, "grad_min_sv": 8.92059932467576e-09, "grad_condition": 155779083.2595345, "lr": 2.1340251233966362e-05, "time_sec": 15.650960445404053 }, { "epoch": 137, "train_loss": 0.15185086236953735, "train_acc": 0.95326, "test_loss": 2.047826315307617, "test_acc": 0.6137, "lyapunov": null, "grad_norm": 0.46215794046576214, "grad_max_sv": 0.2249258290976286, "grad_min_sv": 8.299157507572763e-09, "grad_condition": 391195089.613189, "lr": 1.8418716601170932e-05, "time_sec": 15.619166374206543 }, { "epoch": 138, "train_loss": 0.15070438093185426, "train_acc": 0.95262, "test_loss": 2.030345579147339, "test_acc": 0.6129, "lyapunov": null, "grad_norm": 0.4608066254891212, "grad_max_sv": 0.234202978387475, "grad_min_sv": 8.521646538895875e-09, "grad_condition": 5129724937.383492, "lr": 1.570841943568445e-05, "time_sec": 15.623726606369019 }, { "epoch": 139, "train_loss": 0.15612281042575837, "train_acc": 0.95076, "test_loss": 2.0557478452682494, "test_acc": 0.612, "lyapunov": null, "grad_norm": 0.47103497229286695, "grad_max_sv": 0.23263695724308492, "grad_min_sv": 8.57658385075566e-09, "grad_condition": 101811752.76010731, "lr": 1.3210548563419845e-05, "time_sec": 15.65443754196167 }, { "epoch": 140, "train_loss": 0.15597544308423997, "train_acc": 0.95086, "test_loss": 1.9863805370330812, "test_acc": 0.6151, "lyapunov": null, "grad_norm": 0.46515955894700917, "grad_max_sv": 0.22864672914147377, "grad_min_sv": 8.669487886083091e-09, "grad_condition": 2093311134.8373718, "lr": 1.0926199633097203e-05, "time_sec": 15.636597394943237 }, { "epoch": 141, "train_loss": 0.15137063200950623, "train_acc": 0.95232, "test_loss": 2.0044470993041994, "test_acc": 0.6185, "lyapunov": null, "grad_norm": 0.4628286057156769, "grad_max_sv": 0.24093721210956573, "grad_min_sv": 8.729446927135563e-09, "grad_condition": 3146827225.783096, "lr": 8.856374635655688e-06, "time_sec": 15.6335289478302 }, { "epoch": 142, "train_loss": 0.15115962938308716, "train_acc": 0.95278, "test_loss": 1.9897070358276367, "test_acc": 0.6186, "lyapunov": null, "grad_norm": 0.45849067649845243, "grad_max_sv": 0.22538469620049, "grad_min_sv": 8.402085760331798e-09, "grad_condition": 1185010790.8687212, "lr": 7.001981464747503e-06, "time_sec": 15.64037299156189 }, { "epoch": 143, "train_loss": 0.15024116450309755, "train_acc": 0.95378, "test_loss": 1.9762957132339478, "test_acc": 0.62, "lyapunov": null, "grad_norm": 0.4584088819764392, "grad_max_sv": 0.22209009900689125, "grad_min_sv": 8.452660355321145e-09, "grad_condition": 1556012288.1682973, "lr": 5.3638335185058295e-06, "time_sec": 15.659480571746826 }, { "epoch": 144, "train_loss": 0.1521627188205719, "train_acc": 0.95232, "test_loss": 2.0099195236206056, "test_acc": 0.615, "lyapunov": null, "grad_norm": 0.46494782588161737, "grad_max_sv": 0.238496233522892, "grad_min_sv": 8.729236520774175e-09, "grad_condition": 69857580.46396288, "lr": 3.942649342761114e-06, "time_sec": 15.64352297782898 }, { "epoch": 145, "train_loss": 0.15200012585163117, "train_acc": 0.95196, "test_loss": 1.98911852684021, "test_acc": 0.6161, "lyapunov": null, "grad_norm": 0.46350518405517277, "grad_max_sv": 0.22944532111287116, "grad_min_sv": 8.441616768887356e-09, "grad_condition": 1044568693.4332545, "lr": 2.7390523158633524e-06, "time_sec": 15.670719385147095 }, { "epoch": 146, "train_loss": 0.1524506710958481, "train_acc": 0.95248, "test_loss": 1.9624867490768432, "test_acc": 0.6194, "lyapunov": null, "grad_norm": 0.46296967599985495, "grad_max_sv": 0.24031115397810937, "grad_min_sv": 8.944420498528671e-09, "grad_condition": 254633054.1592765, "lr": 1.7535703752478133e-06, "time_sec": 15.643468141555786 }, { "epoch": 147, "train_loss": 0.15344970943927766, "train_acc": 0.95206, "test_loss": 2.0164750316619875, "test_acc": 0.6171, "lyapunov": null, "grad_norm": 0.4641053248109342, "grad_max_sv": 0.24226672500371932, "grad_min_sv": 8.89504937415242e-09, "grad_condition": 221436071.47224984, "lr": 9.866357858642196e-07, "time_sec": 15.642008066177368 }, { "epoch": 148, "train_loss": 0.15008926822185517, "train_acc": 0.95316, "test_loss": 2.007580140686035, "test_acc": 0.6105, "lyapunov": null, "grad_norm": 0.4593316495579621, "grad_max_sv": 0.23314933404326438, "grad_min_sv": 8.37392370464738e-09, "grad_condition": 1235759721.5215242, "lr": 4.38584950570808e-07, "time_sec": 15.637904644012451 }, { "epoch": 149, "train_loss": 0.1545172585248947, "train_acc": 0.95082, "test_loss": 1.9932567636489869, "test_acc": 0.6167, "lyapunov": null, "grad_norm": 0.46711595173344705, "grad_max_sv": 0.24011613838374615, "grad_min_sv": 9.01919292514708e-09, "grad_condition": 533582982.17976344, "lr": 1.096582625772501e-07, "time_sec": 15.649343013763428 }, { "epoch": 150, "train_loss": 0.15159378504276275, "train_acc": 0.95298, "test_loss": 1.981881332397461, "test_acc": 0.6151, "lyapunov": null, "grad_norm": 0.4631918119140012, "grad_max_sv": 0.23626054041087627, "grad_min_sv": 8.505257114788459e-09, "grad_condition": 368578452.6540891, "lr": 0.0, "time_sec": 15.655460119247437 } ], "8": [ { "epoch": 1, "train_loss": 4.193410815277099, "train_acc": 0.07754, "test_loss": 4.000027540588379, "test_acc": 0.1084, "lyapunov": null, "grad_norm": 5.824766820168824, "grad_max_sv": 4.574610841274262, "grad_min_sv": 1.0190309995827818e-07, "grad_condition": 64142283.19081552, "lr": 0.0009998903417374227, "time_sec": 32.83128619194031 }, { "epoch": 2, "train_loss": 3.561303809967041, "train_acc": 0.15712, "test_loss": 3.590533604812622, "test_acc": 0.1573, "lyapunov": null, "grad_norm": 3.9411000996615257, "grad_max_sv": 2.8509309351444245, "grad_min_sv": 7.158311222943414e-08, "grad_condition": 97792152.02989444, "lr": 0.0009995614150494292, "time_sec": 32.72442889213562 }, { "epoch": 3, "train_loss": 3.1933692501068114, "train_acc": 0.21822, "test_loss": 3.4406786922454833, "test_acc": 0.1888, "lyapunov": null, "grad_norm": 2.91352219919842, "grad_max_sv": 1.9122859120368958, "grad_min_sv": 5.4513909730768975e-08, "grad_condition": 41901882.724198125, "lr": 0.0009990133642141358, "time_sec": 32.71043276786804 }, { "epoch": 4, "train_loss": 2.9170604755401612, "train_acc": 0.266, "test_loss": 3.0161821269989013, "test_acc": 0.2662, "lyapunov": null, "grad_norm": 2.4579814839971488, "grad_max_sv": 1.375921016931534, "grad_min_sv": 4.532563397940948e-08, "grad_condition": 34954497.395048514, "lr": 0.0009982464296247522, "time_sec": 32.71440148353577 }, { "epoch": 5, "train_loss": 2.6815094689941406, "train_acc": 0.31454, "test_loss": 3.171553889846802, "test_acc": 0.2379, "lyapunov": null, "grad_norm": 2.19104728864566, "grad_max_sv": 1.1679374247789382, "grad_min_sv": 4.075679240767016e-08, "grad_condition": 34176946.0056582, "lr": 0.0009972609476841367, "time_sec": 32.70787262916565 }, { "epoch": 6, "train_loss": 2.512476542663574, "train_acc": 0.34722, "test_loss": 2.8388263694763185, "test_acc": 0.2956, "lyapunov": null, "grad_norm": 2.024852807897748, "grad_max_sv": 1.048439186811447, "grad_min_sv": 3.766053036924344e-08, "grad_condition": 110646045.40063909, "lr": 0.000996057350657239, "time_sec": 32.716644048690796 }, { "epoch": 7, "train_loss": 2.3700338256072997, "train_acc": 0.37646, "test_loss": 2.664342771148682, "test_acc": 0.3267, "lyapunov": null, "grad_norm": 1.8863637744279735, "grad_max_sv": 0.9381255134940147, "grad_min_sv": 3.53045587958567e-08, "grad_condition": 91691166.21261387, "lr": 0.000994636166481494, "time_sec": 32.70954084396362 }, { "epoch": 8, "train_loss": 2.241964275894165, "train_acc": 0.40536, "test_loss": 2.3703575309753417, "test_acc": 0.3827, "lyapunov": null, "grad_norm": 1.79442458506404, "grad_max_sv": 0.8764713048934937, "grad_min_sv": 3.357538055498432e-08, "grad_condition": 85483165.80410945, "lr": 0.0009929980185352525, "time_sec": 32.705676794052124 }, { "epoch": 9, "train_loss": 2.1290865299224855, "train_acc": 0.43074, "test_loss": 2.346775402069092, "test_acc": 0.3898, "lyapunov": null, "grad_norm": 1.6946660597355347, "grad_max_sv": 0.8082527592778206, "grad_min_sv": 3.168056596919433e-08, "grad_condition": 84022920.74591663, "lr": 0.0009911436253643444, "time_sec": 32.81319451332092 }, { "epoch": 10, "train_loss": 2.0410905982208254, "train_acc": 0.45114, "test_loss": 2.352191310119629, "test_acc": 0.4016, "lyapunov": null, "grad_norm": 1.6077351393537498, "grad_max_sv": 0.7309410408139229, "grad_min_sv": 2.985739961935963e-08, "grad_condition": 36398179.92957014, "lr": 0.0009890738003669028, "time_sec": 32.67559885978699 }, { "epoch": 11, "train_loss": 1.9488755139160157, "train_acc": 0.47108, "test_loss": 2.292022847747803, "test_acc": 0.4149, "lyapunov": null, "grad_norm": 1.5472074192305951, "grad_max_sv": 0.6999917805194855, "grad_min_sv": 2.931911482484395e-08, "grad_condition": 29185684.451776367, "lr": 0.00098678945143658, "time_sec": 32.67131185531616 }, { "epoch": 12, "train_loss": 1.8751110802459716, "train_acc": 0.48868, "test_loss": 2.234260977935791, "test_acc": 0.4219, "lyapunov": null, "grad_norm": 1.477638716923594, "grad_max_sv": 0.647687041759491, "grad_min_sv": 2.7830199432477e-08, "grad_condition": 45906260.41435587, "lr": 0.0009842915805643154, "time_sec": 32.67626142501831 }, { "epoch": 13, "train_loss": 1.8070984636688232, "train_acc": 0.50424, "test_loss": 2.1869627113342287, "test_acc": 0.4348, "lyapunov": null, "grad_norm": 1.4268137700999757, "grad_max_sv": 0.6230859503149986, "grad_min_sv": 2.6403634246358056e-08, "grad_condition": 81962325.61583482, "lr": 0.000981581283398829, "time_sec": 32.71280646324158 }, { "epoch": 14, "train_loss": 1.7594015161895753, "train_acc": 0.51666, "test_loss": 2.225412437438965, "test_acc": 0.4269, "lyapunov": null, "grad_norm": 1.3750641538015655, "grad_max_sv": 0.5909776814281941, "grad_min_sv": 2.5812447444067965e-08, "grad_condition": 110809015.48631673, "lr": 0.0009786597487660333, "time_sec": 32.71353602409363 }, { "epoch": 15, "train_loss": 1.7050045301437378, "train_acc": 0.5265, "test_loss": 2.2115724647521975, "test_acc": 0.4374, "lyapunov": null, "grad_norm": 1.3299355868966125, "grad_max_sv": 0.5802051067352295, "grad_min_sv": 2.5246993384797634e-08, "grad_condition": 26653204.194885753, "lr": 0.0009755282581475766, "time_sec": 32.709041357040405 }, { "epoch": 16, "train_loss": 1.6458034181976318, "train_acc": 0.54052, "test_loss": 2.3288159313201904, "test_acc": 0.4224, "lyapunov": null, "grad_norm": 1.2807898189857698, "grad_max_sv": 0.5446614563465119, "grad_min_sv": 2.4021811557278783e-08, "grad_condition": 91338509.7437632, "lr": 0.0009721881851187403, "time_sec": 32.697059869766235 }, { "epoch": 17, "train_loss": 1.5929106069946288, "train_acc": 0.55406, "test_loss": 2.1113224380493163, "test_acc": 0.4616, "lyapunov": null, "grad_norm": 1.2337526465020512, "grad_max_sv": 0.5095916628837586, "grad_min_sv": 2.2903062109336237e-08, "grad_condition": 57294649.60211961, "lr": 0.0009686409947459456, "time_sec": 32.683470726013184 }, { "epoch": 18, "train_loss": 1.5314323492813111, "train_acc": 0.5677, "test_loss": 2.091776432800293, "test_acc": 0.47, "lyapunov": null, "grad_norm": 1.1978845665370097, "grad_max_sv": 0.5015841260552406, "grad_min_sv": 2.2305156793800408e-08, "grad_condition": 29492886.216326892, "lr": 0.0009648882429441254, "time_sec": 32.737040281295776 }, { "epoch": 19, "train_loss": 1.5103012445449828, "train_acc": 0.57236, "test_loss": 2.0679006351470948, "test_acc": 0.4779, "lyapunov": null, "grad_norm": 1.1728126223162796, "grad_max_sv": 0.4839314170181751, "grad_min_sv": 2.174818596739625e-08, "grad_condition": 107997783.86314659, "lr": 0.00096093157579425, "time_sec": 32.67225241661072 }, { "epoch": 20, "train_loss": 1.4595962884140015, "train_acc": 0.58662, "test_loss": 2.1169062660217284, "test_acc": 0.4706, "lyapunov": null, "grad_norm": 1.1438665670784203, "grad_max_sv": 0.469496750831604, "grad_min_sv": 2.1164104392623617e-08, "grad_condition": 64696771.4776402, "lr": 0.0009567727288213001, "time_sec": 32.6800582408905 }, { "epoch": 21, "train_loss": 1.42210446144104, "train_acc": 0.59338, "test_loss": 2.0751025535583496, "test_acc": 0.4744, "lyapunov": null, "grad_norm": 1.1159812479247186, "grad_max_sv": 0.45728652998805047, "grad_min_sv": 2.1470654895661135e-08, "grad_condition": 28760658.649009824, "lr": 0.0009524135262330095, "time_sec": 32.680222272872925 }, { "epoch": 22, "train_loss": 1.3733370163345338, "train_acc": 0.60568, "test_loss": 2.1397033340454104, "test_acc": 0.4725, "lyapunov": null, "grad_norm": 1.0820101912101088, "grad_max_sv": 0.4380739636719227, "grad_min_sv": 2.027442237706456e-08, "grad_condition": 33804989.22411772, "lr": 0.0009478558801197061, "time_sec": 32.683854818344116 }, { "epoch": 23, "train_loss": 1.3259621669006347, "train_acc": 0.61976, "test_loss": 2.082161441612244, "test_acc": 0.4868, "lyapunov": null, "grad_norm": 1.0590598804772053, "grad_max_sv": 0.4320934973657131, "grad_min_sv": 1.9754895681789452e-08, "grad_condition": 49199633.36386584, "lr": 0.000943101789615607, "time_sec": 32.705042362213135 }, { "epoch": 24, "train_loss": 1.3155639976882934, "train_acc": 0.62032, "test_loss": 2.108880234527588, "test_acc": 0.4823, "lyapunov": null, "grad_norm": 1.046890854380851, "grad_max_sv": 0.42886915877461435, "grad_min_sv": 1.9609551714372398e-08, "grad_condition": 41053712.713573575, "lr": 0.0009381533400219313, "time_sec": 32.71632719039917 }, { "epoch": 25, "train_loss": 1.273603660621643, "train_acc": 0.63364, "test_loss": 2.0933273361206055, "test_acc": 0.4852, "lyapunov": null, "grad_norm": 1.024436079028184, "grad_max_sv": 0.41587754189968107, "grad_min_sv": 1.9385000169652723e-08, "grad_condition": 51992204.20794226, "lr": 0.0009330127018922189, "time_sec": 32.702069997787476 }, { "epoch": 26, "train_loss": 1.2419982319259644, "train_acc": 0.6399, "test_loss": 2.1144972944259646, "test_acc": 0.4865, "lyapunov": null, "grad_norm": 1.0088705466095338, "grad_max_sv": 0.39710880219936373, "grad_min_sv": 1.870035526846392e-08, "grad_condition": 181692609.81395656, "lr": 0.000927682130080253, "time_sec": 32.707526445388794 }, { "epoch": 27, "train_loss": 1.2189629228973389, "train_acc": 0.6436, "test_loss": 2.204226477432251, "test_acc": 0.476, "lyapunov": null, "grad_norm": 0.9979053902708439, "grad_max_sv": 0.3974333480000496, "grad_min_sv": 1.8178674205185376e-08, "grad_condition": 88033285.18865582, "lr": 0.0009221639627510072, "time_sec": 32.74215221405029 }, { "epoch": 28, "train_loss": 1.196308147392273, "train_acc": 0.65004, "test_loss": 2.3723191680908204, "test_acc": 0.4591, "lyapunov": null, "grad_norm": 0.975077074369322, "grad_max_sv": 0.40025187358260156, "grad_min_sv": 1.829182182389033e-08, "grad_condition": 38849966.98297453, "lr": 0.0009164606203550494, "time_sec": 32.70245599746704 }, { "epoch": 29, "train_loss": 1.1692425540161133, "train_acc": 0.65714, "test_loss": 2.2748174949645996, "test_acc": 0.4746, "lyapunov": null, "grad_norm": 0.9656994259472406, "grad_max_sv": 0.3973592549562454, "grad_min_sv": 1.812226688574503e-08, "grad_condition": 39408166.232041776, "lr": 0.0009105746045668516, "time_sec": 32.71292495727539 }, { "epoch": 30, "train_loss": 1.1311084144973755, "train_acc": 0.66644, "test_loss": 2.1602066425323487, "test_acc": 0.4933, "lyapunov": null, "grad_norm": 0.9503788281741601, "grad_max_sv": 0.3813568793237209, "grad_min_sv": 1.7537509381174154e-08, "grad_condition": 91136622.64604397, "lr": 0.0009045084971874733, "time_sec": 32.729275941848755 }, { "epoch": 31, "train_loss": 1.107859415283203, "train_acc": 0.67202, "test_loss": 2.088518197631836, "test_acc": 0.5149, "lyapunov": null, "grad_norm": 0.946846205217341, "grad_max_sv": 0.38662919625639913, "grad_min_sv": 1.787647136014536e-08, "grad_condition": 37247674.11503151, "lr": 0.0008982649590120977, "time_sec": 32.724801540374756 }, { "epoch": 32, "train_loss": 1.075172028541565, "train_acc": 0.68254, "test_loss": 2.11543652381897, "test_acc": 0.5052, "lyapunov": null, "grad_norm": 0.919583751793241, "grad_max_sv": 0.37590193301439284, "grad_min_sv": 1.7335351598646298e-08, "grad_condition": 32173699.63890195, "lr": 0.0008918467286629196, "time_sec": 32.70777225494385 }, { "epoch": 33, "train_loss": 1.0526020958709716, "train_acc": 0.68626, "test_loss": 2.283646846008301, "test_acc": 0.4816, "lyapunov": null, "grad_norm": 0.9156820464594853, "grad_max_sv": 0.37288443073630334, "grad_min_sv": 1.682198175895211e-08, "grad_condition": 41766926.72855186, "lr": 0.0008852566213878943, "time_sec": 32.71830630302429 }, { "epoch": 34, "train_loss": 1.0363747980117797, "train_acc": 0.69038, "test_loss": 2.207733528137207, "test_acc": 0.4943, "lyapunov": null, "grad_norm": 0.9077261463073804, "grad_max_sv": 0.3598011791706085, "grad_min_sv": 1.6353098675377097e-08, "grad_condition": 114742140.57000451, "lr": 0.000878497527825878, "time_sec": 32.70716309547424 }, { "epoch": 35, "train_loss": 1.0068622560119629, "train_acc": 0.69648, "test_loss": 2.274261113357544, "test_acc": 0.489, "lyapunov": null, "grad_norm": 0.8883949473822523, "grad_max_sv": 0.3505275271832943, "grad_min_sv": 1.6455692852801463e-08, "grad_condition": 31982637.47738139, "lr": 0.000871572412738697, "time_sec": 32.704782009124756 }, { "epoch": 36, "train_loss": 0.9864518771362305, "train_acc": 0.7021, "test_loss": 2.3541188930511474, "test_acc": 0.4898, "lyapunov": null, "grad_norm": 0.8736045940658475, "grad_max_sv": 0.3457980893552303, "grad_min_sv": 1.5842762313145187e-08, "grad_condition": 32188123.411770713, "lr": 0.0008644843137107055, "time_sec": 32.691269397735596 }, { "epoch": 37, "train_loss": 0.9681263439178467, "train_acc": 0.7075, "test_loss": 2.195126131439209, "test_acc": 0.5033, "lyapunov": null, "grad_norm": 0.8711424558239054, "grad_max_sv": 0.34736732244491575, "grad_min_sv": 1.5827014727270993e-08, "grad_condition": 66500862.978035614, "lr": 0.0008572363398164014, "time_sec": 32.69683265686035 }, { "epoch": 38, "train_loss": 0.9408467683601379, "train_acc": 0.71608, "test_loss": 2.1800164726257325, "test_acc": 0.5109, "lyapunov": null, "grad_norm": 0.8497079289449048, "grad_max_sv": 0.33491997644305227, "grad_min_sv": 1.5505913916746828e-08, "grad_condition": 37981645.21243934, "lr": 0.0008498316702566826, "time_sec": 32.67169213294983 }, { "epoch": 39, "train_loss": 0.9174955882263184, "train_acc": 0.7231, "test_loss": 2.332292454910278, "test_acc": 0.4984, "lyapunov": null, "grad_norm": 0.8483669541798352, "grad_max_sv": 0.3449387975037098, "grad_min_sv": 1.5716625918760217e-08, "grad_condition": 38753621.785681486, "lr": 0.0008422735529643442, "time_sec": 32.668078660964966 }, { "epoch": 40, "train_loss": 0.8970937779045105, "train_acc": 0.72826, "test_loss": 2.282168871688843, "test_acc": 0.5053, "lyapunov": null, "grad_norm": 0.8354606142013189, "grad_max_sv": 0.3270870424807072, "grad_min_sv": 1.5267581635058926e-08, "grad_condition": 95751205.07057047, "lr": 0.0008345653031794289, "time_sec": 32.70110583305359 }, { "epoch": 41, "train_loss": 0.8763418362236023, "train_acc": 0.73382, "test_loss": 2.3397656742095947, "test_acc": 0.504, "lyapunov": null, "grad_norm": 0.8300379125306362, "grad_max_sv": 0.33984693363308904, "grad_min_sv": 1.5102269786126942e-08, "grad_condition": 36575363.166415855, "lr": 0.0008267103019950526, "time_sec": 32.68285536766052 }, { "epoch": 42, "train_loss": 0.8614973092651367, "train_acc": 0.73702, "test_loss": 2.217091986083984, "test_acc": 0.513, "lyapunov": null, "grad_norm": 0.8218045461669631, "grad_max_sv": 0.32567850723862646, "grad_min_sv": 1.507071445694397e-08, "grad_condition": 48789917.15280264, "lr": 0.0008187119948743447, "time_sec": 32.685330867767334 }, { "epoch": 43, "train_loss": 0.8463610815429687, "train_acc": 0.74162, "test_loss": 2.238330067062378, "test_acc": 0.5145, "lyapunov": null, "grad_norm": 0.8111621240187793, "grad_max_sv": 0.3245612893253565, "grad_min_sv": 1.4757356182567606e-08, "grad_condition": 2265212011.074665, "lr": 0.000810573890139155, "time_sec": 32.6937038898468 }, { "epoch": 44, "train_loss": 0.8388264699935913, "train_acc": 0.7425, "test_loss": 2.2916201137542727, "test_acc": 0.5146, "lyapunov": null, "grad_norm": 0.806013800687461, "grad_max_sv": 0.3360877387225628, "grad_min_sv": 1.4701122835053537e-08, "grad_condition": 56062708.17707713, "lr": 0.0008022995574311873, "time_sec": 32.70379972457886 }, { "epoch": 45, "train_loss": 0.8080853428649902, "train_acc": 0.75246, "test_loss": 2.31492944984436, "test_acc": 0.519, "lyapunov": null, "grad_norm": 0.7954463291291034, "grad_max_sv": 0.3197424054145813, "grad_min_sv": 1.4746050645180267e-08, "grad_condition": 648957804.3057442, "lr": 0.0007938926261462363, "time_sec": 32.704816579818726 }, { "epoch": 46, "train_loss": 0.8025041796875, "train_acc": 0.753, "test_loss": 2.3807359542846678, "test_acc": 0.5181, "lyapunov": null, "grad_norm": 0.7945005415191121, "grad_max_sv": 0.31871558651328086, "grad_min_sv": 1.4457539215806392e-08, "grad_condition": 62012558.50813458, "lr": 0.0007853567838422158, "time_sec": 32.7154860496521 }, { "epoch": 47, "train_loss": 0.7847597545051574, "train_acc": 0.75886, "test_loss": 2.305859538269043, "test_acc": 0.5185, "lyapunov": null, "grad_norm": 0.7791668550262338, "grad_max_sv": 0.3171059262007475, "grad_min_sv": 1.4160447076028148e-08, "grad_condition": 51678874.24460314, "lr": 0.0007766957746216719, "time_sec": 32.71022868156433 }, { "epoch": 48, "train_loss": 0.7660661986160279, "train_acc": 0.7635, "test_loss": 2.373494161605835, "test_acc": 0.5197, "lyapunov": null, "grad_norm": 0.7662493930118918, "grad_max_sv": 0.3144552931189537, "grad_min_sv": 1.4124776402668626e-08, "grad_condition": 42937106.53672977, "lr": 0.0007679133974894982, "time_sec": 32.722716093063354 }, { "epoch": 49, "train_loss": 0.7557950233268738, "train_acc": 0.76584, "test_loss": 2.2862959323883056, "test_acc": 0.5222, "lyapunov": null, "grad_norm": 0.7719008014476091, "grad_max_sv": 0.3158703289926052, "grad_min_sv": 1.4232268583103113e-08, "grad_condition": 39203631.14441905, "lr": 0.000759013504686565, "time_sec": 32.71821331977844 }, { "epoch": 50, "train_loss": 0.7287120180892944, "train_acc": 0.77398, "test_loss": 2.2880530021667482, "test_acc": 0.5331, "lyapunov": null, "grad_norm": 0.7580370777565381, "grad_max_sv": 0.31812012754380703, "grad_min_sv": 1.3956443738194491e-08, "grad_condition": 56488826.56667278, "lr": 0.0007499999999999998, "time_sec": 32.74500012397766 }, { "epoch": 51, "train_loss": 0.7047131567382813, "train_acc": 0.77944, "test_loss": 2.3342226333618163, "test_acc": 0.5242, "lyapunov": null, "grad_norm": 0.7467723064599141, "grad_max_sv": 0.3062335759401321, "grad_min_sv": 1.365980890968843e-08, "grad_condition": 48288096.27243978, "lr": 0.0007408768370508575, "time_sec": 32.73174715042114 }, { "epoch": 52, "train_loss": 0.701608234500885, "train_acc": 0.78146, "test_loss": 2.4530138679504394, "test_acc": 0.5151, "lyapunov": null, "grad_norm": 0.744474034267783, "grad_max_sv": 0.31273389905691146, "grad_min_sv": 1.386061017072393e-08, "grad_condition": 128824936.60768087, "lr": 0.0007316480175599307, "time_sec": 32.70361828804016 }, { "epoch": 53, "train_loss": 0.6784094618415832, "train_acc": 0.7874, "test_loss": 2.3597243209838865, "test_acc": 0.5275, "lyapunov": null, "grad_norm": 0.7374795544632287, "grad_max_sv": 0.30512114986777306, "grad_min_sv": 1.3410438691116578e-08, "grad_condition": 185757572.3538422, "lr": 0.0007223175895924635, "time_sec": 32.71756291389465 }, { "epoch": 54, "train_loss": 0.6558182954406738, "train_acc": 0.795, "test_loss": 2.376951601028442, "test_acc": 0.5316, "lyapunov": null, "grad_norm": 0.7251324903072741, "grad_max_sv": 0.2987603921443224, "grad_min_sv": 1.2931078906264214e-08, "grad_condition": 35614928.216609366, "lr": 0.0007128896457825361, "time_sec": 32.73335146903992 }, { "epoch": 55, "train_loss": 0.6438722687911987, "train_acc": 0.79842, "test_loss": 2.4439307792663576, "test_acc": 0.5237, "lyapunov": null, "grad_norm": 0.7208427013257759, "grad_max_sv": 0.2992406666278839, "grad_min_sv": 1.321393890141298e-08, "grad_condition": 86775812.1538335, "lr": 0.0007033683215378998, "time_sec": 32.714346408843994 }, { "epoch": 56, "train_loss": 0.6417430144309998, "train_acc": 0.7972, "test_loss": 2.3790397010803224, "test_acc": 0.5275, "lyapunov": null, "grad_norm": 0.7192864641522134, "grad_max_sv": 0.2877038486301899, "grad_min_sv": 1.3027487994767515e-08, "grad_condition": 758527469.2650627, "lr": 0.0006937577932260512, "time_sec": 32.70229887962341 }, { "epoch": 57, "train_loss": 0.6262681634902955, "train_acc": 0.803, "test_loss": 2.401387868881226, "test_acc": 0.5319, "lyapunov": null, "grad_norm": 0.7121380891152584, "grad_max_sv": 0.2965920139104128, "grad_min_sv": 1.279559212457454e-08, "grad_condition": 184239403.66627008, "lr": 0.0006840622763423388, "time_sec": 32.71753239631653 }, { "epoch": 58, "train_loss": 0.6120203521347046, "train_acc": 0.80732, "test_loss": 2.503086555862427, "test_acc": 0.5165, "lyapunov": null, "grad_norm": 0.7090038692309348, "grad_max_sv": 0.2882195271551609, "grad_min_sv": 1.2676824923812945e-08, "grad_condition": 64942214.60915594, "lr": 0.0006742860236609073, "time_sec": 32.75395059585571 }, { "epoch": 59, "train_loss": 0.5998075243473053, "train_acc": 0.81224, "test_loss": 2.4825798515319826, "test_acc": 0.5223, "lyapunov": null, "grad_norm": 0.7030307704517706, "grad_max_sv": 0.28765259496867657, "grad_min_sv": 1.2779274688370229e-08, "grad_condition": 182642047.07290906, "lr": 0.0006644333233692913, "time_sec": 32.70982766151428 }, { "epoch": 60, "train_loss": 0.5948525179862976, "train_acc": 0.81162, "test_loss": 2.5030276454925535, "test_acc": 0.5207, "lyapunov": null, "grad_norm": 0.7026252294626018, "grad_max_sv": 0.2934992775321007, "grad_min_sv": 1.284481914573185e-08, "grad_condition": 541914476.4363593, "lr": 0.0006545084971874734, "time_sec": 32.69038796424866 }, { "epoch": 61, "train_loss": 0.572040382938385, "train_acc": 0.81932, "test_loss": 2.5733165519714354, "test_acc": 0.5197, "lyapunov": null, "grad_norm": 0.6845429439823613, "grad_max_sv": 0.28906508460640906, "grad_min_sv": 1.2416446168797556e-08, "grad_condition": 83143739.39889392, "lr": 0.0006445158984722354, "time_sec": 32.70990490913391 }, { "epoch": 62, "train_loss": 0.5523873634338379, "train_acc": 0.82446, "test_loss": 2.563892342758179, "test_acc": 0.5248, "lyapunov": null, "grad_norm": 0.677689496712232, "grad_max_sv": 0.2810227505862713, "grad_min_sv": 1.2061726063945787e-08, "grad_condition": 161335990.45839816, "lr": 0.0006344599103076324, "time_sec": 32.714717864990234 }, { "epoch": 63, "train_loss": 0.537570647277832, "train_acc": 0.82928, "test_loss": 2.5110877151489257, "test_acc": 0.5309, "lyapunov": null, "grad_norm": 0.6752075838217867, "grad_max_sv": 0.2918707847595215, "grad_min_sv": 1.2428116336060669e-08, "grad_condition": 62614290.824099444, "lr": 0.0006243449435824269, "time_sec": 32.73838663101196 }, { "epoch": 64, "train_loss": 0.525590337715149, "train_acc": 0.83162, "test_loss": 2.5260006717681884, "test_acc": 0.5365, "lyapunov": null, "grad_norm": 0.6614195891575191, "grad_max_sv": 0.2785448797047138, "grad_min_sv": 1.2074160667119305e-08, "grad_condition": 68726347.69115171, "lr": 0.0006141754350553275, "time_sec": 32.716681241989136 }, { "epoch": 65, "train_loss": 0.506968226633072, "train_acc": 0.83974, "test_loss": 2.4551146259307863, "test_acc": 0.5332, "lyapunov": null, "grad_norm": 0.6515058246983421, "grad_max_sv": 0.28096592277288435, "grad_min_sv": 1.183612223995545e-08, "grad_condition": 56796145.61117469, "lr": 0.0006039558454088793, "time_sec": 32.72992730140686 }, { "epoch": 66, "train_loss": 0.5121252582931518, "train_acc": 0.8359, "test_loss": 2.4647022022247316, "test_acc": 0.5374, "lyapunov": null, "grad_norm": 0.6569185851243321, "grad_max_sv": 0.2686118472367525, "grad_min_sv": 1.1671607616763752e-08, "grad_condition": 198976036.41965005, "lr": 0.000593690657292862, "time_sec": 32.737778425216675 }, { "epoch": 67, "train_loss": 0.5035950432968139, "train_acc": 0.83814, "test_loss": 2.5104728435516357, "test_acc": 0.5334, "lyapunov": null, "grad_norm": 0.6543970572426195, "grad_max_sv": 0.27697036042809486, "grad_min_sv": 1.1793683101109492e-08, "grad_condition": 2176927259.024586, "lr": 0.0005833843733580507, "time_sec": 32.73714327812195 }, { "epoch": 68, "train_loss": 0.4827924027252197, "train_acc": 0.8449, "test_loss": 2.483680333328247, "test_acc": 0.5362, "lyapunov": null, "grad_norm": 0.6424274790982618, "grad_max_sv": 0.26836494021117685, "grad_min_sv": 1.1452091713826107e-08, "grad_condition": 64248156.31133513, "lr": 0.0005730415142812054, "time_sec": 32.73483109474182 }, { "epoch": 69, "train_loss": 0.463097783498764, "train_acc": 0.85106, "test_loss": 2.5873930728912353, "test_acc": 0.5352, "lyapunov": null, "grad_norm": 0.6283493250843613, "grad_max_sv": 0.26704199202358725, "grad_min_sv": 1.1449700967197662e-08, "grad_condition": 133571192.62172851, "lr": 0.0005626666167821517, "time_sec": 32.76736545562744 }, { "epoch": 70, "train_loss": 0.45964255402565, "train_acc": 0.8516, "test_loss": 2.4906038509368895, "test_acc": 0.5466, "lyapunov": null, "grad_norm": 0.6392818623657084, "grad_max_sv": 0.2811981987208128, "grad_min_sv": 1.1691557246645834e-08, "grad_condition": 83552341.63512965, "lr": 0.0005522642316338265, "time_sec": 32.76137971878052 }, { "epoch": 71, "train_loss": 0.44885221929550173, "train_acc": 0.85536, "test_loss": 2.5581497470855714, "test_acc": 0.5417, "lyapunov": null, "grad_norm": 0.627505222045094, "grad_max_sv": 0.2669704511761665, "grad_min_sv": 1.135505285909666e-08, "grad_condition": 55019996.6299631, "lr": 0.0005418389216661573, "time_sec": 32.754613161087036 }, { "epoch": 72, "train_loss": 0.4373334138870239, "train_acc": 0.85988, "test_loss": 2.5293708190917967, "test_acc": 0.5385, "lyapunov": null, "grad_norm": 0.6228439231508988, "grad_max_sv": 0.27325935252010825, "grad_min_sv": 1.1285354627535438e-08, "grad_condition": 404302529.70424557, "lr": 0.0005313952597646563, "time_sec": 32.747488260269165 }, { "epoch": 73, "train_loss": 0.43413398032188416, "train_acc": 0.86118, "test_loss": 2.59562434463501, "test_acc": 0.5355, "lyapunov": null, "grad_norm": 0.6246623504935193, "grad_max_sv": 0.26360294707119464, "grad_min_sv": 1.0827903220485963e-08, "grad_condition": 202498413.83885324, "lr": 0.0005209378268645994, "time_sec": 32.75055932998657 }, { "epoch": 74, "train_loss": 0.42070443333625795, "train_acc": 0.86404, "test_loss": 2.620591529083252, "test_acc": 0.5311, "lyapunov": null, "grad_norm": 0.6160094351570171, "grad_max_sv": 0.2604650367051363, "grad_min_sv": 1.0893297332399688e-08, "grad_condition": 109053309.86634846, "lr": 0.0005104712099416781, "time_sec": 32.766777753829956 }, { "epoch": 75, "train_loss": 0.41482046060562133, "train_acc": 0.86586, "test_loss": 2.6253975078582763, "test_acc": 0.5364, "lyapunov": null, "grad_norm": 0.614383474689519, "grad_max_sv": 0.2657254245132208, "grad_min_sv": 1.1066643729282667e-08, "grad_condition": 1358046707.310991, "lr": 0.0004999999999999996, "time_sec": 32.753093004226685 }, { "epoch": 76, "train_loss": 0.40771523109436036, "train_acc": 0.8674, "test_loss": 2.7234753631591797, "test_acc": 0.5307, "lyapunov": null, "grad_norm": 0.6089832611690313, "grad_max_sv": 0.2631608698517084, "grad_min_sv": 1.1065733136576827e-08, "grad_condition": 124518956.20538023, "lr": 0.0004895287900583212, "time_sec": 32.7672004699707 }, { "epoch": 77, "train_loss": 0.3850809427070618, "train_acc": 0.87682, "test_loss": 2.6585358211517334, "test_acc": 0.5378, "lyapunov": null, "grad_norm": 0.5905288728439135, "grad_max_sv": 0.2512054055929184, "grad_min_sv": 1.0597189950382891e-08, "grad_condition": 141685910.93483096, "lr": 0.0004790621731353997, "time_sec": 32.75537824630737 }, { "epoch": 78, "train_loss": 0.3790111728191376, "train_acc": 0.87892, "test_loss": 2.6925399055480956, "test_acc": 0.5368, "lyapunov": null, "grad_norm": 0.5936477423986493, "grad_max_sv": 0.2708817757666111, "grad_min_sv": 1.0561610550192946e-08, "grad_condition": 244253851.38396016, "lr": 0.000468604740235343, "time_sec": 32.734121561050415 }, { "epoch": 79, "train_loss": 0.376044921131134, "train_acc": 0.87726, "test_loss": 2.6398166637420655, "test_acc": 0.5322, "lyapunov": null, "grad_norm": 0.5949427297273714, "grad_max_sv": 0.2605267588049173, "grad_min_sv": 1.0820864476679404e-08, "grad_condition": 62663126.18808526, "lr": 0.00045816107833384175, "time_sec": 32.72508406639099 }, { "epoch": 80, "train_loss": 0.3590127901649475, "train_acc": 0.88356, "test_loss": 2.6562103397369383, "test_acc": 0.5313, "lyapunov": null, "grad_norm": 0.57614839106705, "grad_max_sv": 0.2479171995073557, "grad_min_sv": 1.0216514026700069e-08, "grad_condition": 168918888.0387075, "lr": 0.0004477357683661729, "time_sec": 32.7580771446228 }, { "epoch": 81, "train_loss": 0.35495832427978513, "train_acc": 0.88512, "test_loss": 2.6037187816619873, "test_acc": 0.5424, "lyapunov": null, "grad_norm": 0.5731602731960765, "grad_max_sv": 0.2532364260405302, "grad_min_sv": 1.0580176048897299e-08, "grad_condition": 286643189.9936029, "lr": 0.00043733338321784746, "time_sec": 32.72826409339905 }, { "epoch": 82, "train_loss": 0.3466758195114136, "train_acc": 0.88818, "test_loss": 2.6409978286743163, "test_acc": 0.5399, "lyapunov": null, "grad_norm": 0.5643305573749353, "grad_max_sv": 0.25191599801182746, "grad_min_sv": 9.937639448582419e-09, "grad_condition": 418028032.15621006, "lr": 0.0004269584857187939, "time_sec": 32.73789381980896 }, { "epoch": 83, "train_loss": 0.337517634677887, "train_acc": 0.89068, "test_loss": 2.6804797424316407, "test_acc": 0.5387, "lyapunov": null, "grad_norm": 0.5635653171134332, "grad_max_sv": 0.24921411760151385, "grad_min_sv": 1.007469917777351e-08, "grad_condition": 232954348.7021001, "lr": 0.0004166156266419484, "time_sec": 32.75311326980591 }, { "epoch": 84, "train_loss": 0.32895935908317564, "train_acc": 0.89278, "test_loss": 2.670875820159912, "test_acc": 0.5417, "lyapunov": null, "grad_norm": 0.5604425901768842, "grad_max_sv": 0.25350802317261695, "grad_min_sv": 1.0073376105132481e-08, "grad_condition": 810741849.6024733, "lr": 0.0004063093427071373, "time_sec": 32.75568342208862 }, { "epoch": 85, "train_loss": 0.31874533922195436, "train_acc": 0.89668, "test_loss": 2.726188472366333, "test_acc": 0.5437, "lyapunov": null, "grad_norm": 0.5474219905771217, "grad_max_sv": 0.24635729603469372, "grad_min_sv": 9.822750767244857e-09, "grad_condition": 407705693.9191896, "lr": 0.0003960441545911199, "time_sec": 32.74805927276611 }, { "epoch": 86, "train_loss": 0.3149368803215027, "train_acc": 0.89756, "test_loss": 2.7214178714752197, "test_acc": 0.5419, "lyapunov": null, "grad_norm": 0.5494081042104078, "grad_max_sv": 0.2415832221508026, "grad_min_sv": 9.84441673934286e-09, "grad_condition": 259925587.23227444, "lr": 0.0003858245649446718, "time_sec": 32.80679273605347 }, { "epoch": 87, "train_loss": 0.3021876361656189, "train_acc": 0.9004, "test_loss": 2.7706982093811034, "test_acc": 0.5429, "lyapunov": null, "grad_norm": 0.5427208210607071, "grad_max_sv": 0.24498338885605336, "grad_min_sv": 9.92075648437174e-09, "grad_condition": 232757368.44567218, "lr": 0.00037565505641757235, "time_sec": 32.76810097694397 }, { "epoch": 88, "train_loss": 0.297262005405426, "train_acc": 0.90436, "test_loss": 2.736396257019043, "test_acc": 0.5423, "lyapunov": null, "grad_norm": 0.5343970285585263, "grad_max_sv": 0.24844259656965734, "grad_min_sv": 9.910514466504247e-09, "grad_condition": 1110263065.3705904, "lr": 0.00036554008969236695, "time_sec": 32.74753546714783 }, { "epoch": 89, "train_loss": 0.28578209706306457, "train_acc": 0.90734, "test_loss": 2.850689685058594, "test_acc": 0.5399, "lyapunov": null, "grad_norm": 0.5254402888094797, "grad_max_sv": 0.23409140817821025, "grad_min_sv": 9.523284056017854e-09, "grad_condition": 1231623659.8277283, "lr": 0.0003554841015277638, "time_sec": 32.79159116744995 }, { "epoch": 90, "train_loss": 0.2832814686203003, "train_acc": 0.90616, "test_loss": 2.8175382946014405, "test_acc": 0.537, "lyapunov": null, "grad_norm": 0.5216211125471195, "grad_max_sv": 0.23542476668953896, "grad_min_sv": 9.459231551322244e-09, "grad_condition": 1301223464.6618998, "lr": 0.000345491502812526, "time_sec": 32.78084850311279 }, { "epoch": 91, "train_loss": 0.28347388619422914, "train_acc": 0.90788, "test_loss": 2.831140581512451, "test_acc": 0.5444, "lyapunov": null, "grad_norm": 0.5319613521776031, "grad_max_sv": 0.23012890443205833, "grad_min_sv": 9.377407441096135e-09, "grad_condition": 228524276.50434837, "lr": 0.0003355666766307081, "time_sec": 32.71651744842529 }, { "epoch": 92, "train_loss": 0.27393528344631196, "train_acc": 0.91052, "test_loss": 2.775809415435791, "test_acc": 0.545, "lyapunov": null, "grad_norm": 0.5149918732183307, "grad_max_sv": 0.23977560102939605, "grad_min_sv": 9.41244274865055e-09, "grad_condition": 202495109.8759535, "lr": 0.00032571397633909225, "time_sec": 32.70667123794556 }, { "epoch": 93, "train_loss": 0.2638559838104248, "train_acc": 0.9163, "test_loss": 2.7468856441497804, "test_acc": 0.5537, "lyapunov": null, "grad_norm": 0.5066198396238114, "grad_max_sv": 0.23251476027071477, "grad_min_sv": 9.16693782366737e-09, "grad_condition": 232699226.05631667, "lr": 0.00031593772365766094, "time_sec": 32.71683645248413 }, { "epoch": 94, "train_loss": 0.25781995408058167, "train_acc": 0.9156, "test_loss": 2.771767431640625, "test_acc": 0.5456, "lyapunov": null, "grad_norm": 0.5052996090758677, "grad_max_sv": 0.23510573096573353, "grad_min_sv": 8.963649589916433e-09, "grad_condition": 1701543645.1210911, "lr": 0.0003062422067739483, "time_sec": 32.713576555252075 }, { "epoch": 95, "train_loss": 0.25086621726989744, "train_acc": 0.91784, "test_loss": 2.8765688217163086, "test_acc": 0.5451, "lyapunov": null, "grad_norm": 0.49975532415921886, "grad_max_sv": 0.236967783421278, "grad_min_sv": 9.25259010277346e-09, "grad_condition": 145241238.20565036, "lr": 0.00029663167846209965, "time_sec": 32.73633694648743 }, { "epoch": 96, "train_loss": 0.24672197101354598, "train_acc": 0.91946, "test_loss": 2.8446786346435546, "test_acc": 0.5438, "lyapunov": null, "grad_norm": 0.49641090183932196, "grad_max_sv": 0.22625510580837727, "grad_min_sv": 8.7457359089553e-09, "grad_condition": 1836850483.766, "lr": 0.00028711035421746345, "time_sec": 32.76619052886963 }, { "epoch": 97, "train_loss": 0.23921704626083373, "train_acc": 0.92148, "test_loss": 2.797951399230957, "test_acc": 0.5532, "lyapunov": null, "grad_norm": 0.49423071935175245, "grad_max_sv": 0.24016087874770164, "grad_min_sv": 8.990743178508703e-09, "grad_condition": 210059856.3178285, "lr": 0.00027768241040753615, "time_sec": 32.82350516319275 }, { "epoch": 98, "train_loss": 0.23695792595386506, "train_acc": 0.9223, "test_loss": 2.8982477020263673, "test_acc": 0.5432, "lyapunov": null, "grad_norm": 0.4903348629723419, "grad_max_sv": 0.22139078341424465, "grad_min_sv": 8.704557989333561e-09, "grad_condition": 233405578.91055053, "lr": 0.00026835198244006903, "time_sec": 32.75874900817871 }, { "epoch": 99, "train_loss": 0.22282506870508195, "train_acc": 0.92698, "test_loss": 2.896362300491333, "test_acc": 0.544, "lyapunov": null, "grad_norm": 0.4754599951900147, "grad_max_sv": 0.22327796779572964, "grad_min_sv": 8.601119547287876e-09, "grad_condition": 868925326.22085, "lr": 0.0002591231629491421, "time_sec": 32.74084424972534 }, { "epoch": 100, "train_loss": 0.22439868947982788, "train_acc": 0.92668, "test_loss": 2.888060118484497, "test_acc": 0.553, "lyapunov": null, "grad_norm": 0.4789261726309551, "grad_max_sv": 0.22355457432568074, "grad_min_sv": 8.837810024564172e-09, "grad_condition": 804604193.8746045, "lr": 0.0002499999999999997, "time_sec": 32.76948523521423 }, { "epoch": 101, "train_loss": 0.21471880633354187, "train_acc": 0.93042, "test_loss": 2.926622017288208, "test_acc": 0.5459, "lyapunov": null, "grad_norm": 0.46758839629635496, "grad_max_sv": 0.2257686872035265, "grad_min_sv": 8.604181156836657e-09, "grad_condition": 364480196.7882508, "lr": 0.00024098649531343477, "time_sec": 32.761115312576294 }, { "epoch": 102, "train_loss": 0.20999815567016603, "train_acc": 0.93128, "test_loss": 2.7882490966796873, "test_acc": 0.5578, "lyapunov": null, "grad_norm": 0.46851254306004025, "grad_max_sv": 0.21838495172560216, "grad_min_sv": 8.37696591199713e-09, "grad_condition": 1510396720.662658, "lr": 0.0002320866025105016, "time_sec": 32.72404432296753 }, { "epoch": 103, "train_loss": 0.20526846901893617, "train_acc": 0.93262, "test_loss": 2.8693388496398926, "test_acc": 0.554, "lyapunov": null, "grad_norm": 0.4589602275699082, "grad_max_sv": 0.22509709745645523, "grad_min_sv": 8.420789482605027e-09, "grad_condition": 1371218202.1419, "lr": 0.0002233042253783278, "time_sec": 32.752496004104614 }, { "epoch": 104, "train_loss": 0.20646339273929595, "train_acc": 0.9335, "test_loss": 2.89330929107666, "test_acc": 0.5483, "lyapunov": null, "grad_norm": 0.46636768633733616, "grad_max_sv": 0.22183220721781255, "grad_min_sv": 8.39393208819329e-09, "grad_condition": 1827094910.9746387, "lr": 0.000214643216157784, "time_sec": 32.74421238899231 }, { "epoch": 105, "train_loss": 0.20053612211227417, "train_acc": 0.93402, "test_loss": 2.904328105926514, "test_acc": 0.5506, "lyapunov": null, "grad_norm": 0.45700070764272066, "grad_max_sv": 0.21747002471238375, "grad_min_sv": 8.216160540282366e-09, "grad_condition": 1664593727.1128445, "lr": 0.00020610737385376332, "time_sec": 32.724817991256714 }, { "epoch": 106, "train_loss": 0.1944782396030426, "train_acc": 0.9362, "test_loss": 2.8657500442504884, "test_acc": 0.5488, "lyapunov": null, "grad_norm": 0.44687014031192024, "grad_max_sv": 0.2213790450245142, "grad_min_sv": 8.454356608192382e-09, "grad_condition": 127028340.10294946, "lr": 0.00019770044256881242, "time_sec": 32.7451388835907 }, { "epoch": 107, "train_loss": 0.19279775314331055, "train_acc": 0.93688, "test_loss": 2.898486404800415, "test_acc": 0.5523, "lyapunov": null, "grad_norm": 0.44614463029775897, "grad_max_sv": 0.2167466938495636, "grad_min_sv": 8.415876304873615e-09, "grad_condition": 262012758.78866345, "lr": 0.0001894261098608447, "time_sec": 32.76267623901367 }, { "epoch": 108, "train_loss": 0.1886401759147644, "train_acc": 0.93904, "test_loss": 2.833827450942993, "test_acc": 0.5567, "lyapunov": null, "grad_norm": 0.4435964290199411, "grad_max_sv": 0.2225849311798811, "grad_min_sv": 8.340220883015782e-09, "grad_condition": 118785929.89668731, "lr": 0.000181288005125655, "time_sec": 32.86235594749451 }, { "epoch": 109, "train_loss": 0.1890174783563614, "train_acc": 0.93882, "test_loss": 2.941585520553589, "test_acc": 0.5491, "lyapunov": null, "grad_norm": 0.4464239579148638, "grad_max_sv": 0.21364586874842645, "grad_min_sv": 8.245146911967442e-09, "grad_condition": 716792612.4830931, "lr": 0.0001732896980049473, "time_sec": 32.74325895309448 }, { "epoch": 110, "train_loss": 0.18055749108314514, "train_acc": 0.94126, "test_loss": 2.9359549655914305, "test_acc": 0.5517, "lyapunov": null, "grad_norm": 0.4349334962787559, "grad_max_sv": 0.2089217260479927, "grad_min_sv": 8.043115946556504e-09, "grad_condition": 2200871643.370809, "lr": 0.00016543469682057076, "time_sec": 32.756227016448975 }, { "epoch": 111, "train_loss": 0.17659846026420592, "train_acc": 0.9445, "test_loss": 2.904285785675049, "test_acc": 0.5552, "lyapunov": null, "grad_norm": 0.4288194869102633, "grad_max_sv": 0.2133932262659073, "grad_min_sv": 7.951804889029523e-09, "grad_condition": 127160230.15537345, "lr": 0.00015772644703565552, "time_sec": 32.73052453994751 }, { "epoch": 112, "train_loss": 0.17598180088996887, "train_acc": 0.9431, "test_loss": 2.916234812545776, "test_acc": 0.5566, "lyapunov": null, "grad_norm": 0.43046200088706854, "grad_max_sv": 0.21027521118521691, "grad_min_sv": 8.006027082247107e-09, "grad_condition": 1303838738.9934053, "lr": 0.00015016832974331713, "time_sec": 32.737369775772095 }, { "epoch": 113, "train_loss": 0.167477658700943, "train_acc": 0.94562, "test_loss": 2.930574794006348, "test_acc": 0.5492, "lyapunov": null, "grad_norm": 0.4188552255465725, "grad_max_sv": 0.2074826244264841, "grad_min_sv": 7.807182782865966e-09, "grad_condition": 1013028230.5722786, "lr": 0.00014276366018359834, "time_sec": 32.78035497665405 }, { "epoch": 114, "train_loss": 0.16470729023933411, "train_acc": 0.94658, "test_loss": 2.9235076808929445, "test_acc": 0.55, "lyapunov": null, "grad_norm": 0.4196468917250276, "grad_max_sv": 0.2061817307025194, "grad_min_sv": 7.639872719872321e-09, "grad_condition": 147774842.88971734, "lr": 0.00013551568628929425, "time_sec": 32.71555685997009 }, { "epoch": 115, "train_loss": 0.15979129463195801, "train_acc": 0.95014, "test_loss": 2.8977687450408935, "test_acc": 0.5554, "lyapunov": null, "grad_norm": 0.4109842368882969, "grad_max_sv": 0.20125124976038933, "grad_min_sv": 7.641511092990049e-09, "grad_condition": 152806383.8905374, "lr": 0.00012842758726130276, "time_sec": 32.74684023857117 }, { "epoch": 116, "train_loss": 0.15650701507091522, "train_acc": 0.94994, "test_loss": 2.963372290420532, "test_acc": 0.5536, "lyapunov": null, "grad_norm": 0.40714256168185947, "grad_max_sv": 0.21380255445837976, "grad_min_sv": 7.601124127343262e-09, "grad_condition": 187963441.14469656, "lr": 0.0001215024721741218, "time_sec": 32.740856885910034 }, { "epoch": 117, "train_loss": 0.15483391536712646, "train_acc": 0.95134, "test_loss": 2.9223466384887695, "test_acc": 0.5589, "lyapunov": null, "grad_norm": 0.4061085309679021, "grad_max_sv": 0.20323452018201352, "grad_min_sv": 7.630000256912337e-09, "grad_condition": 541093755.1409919, "lr": 0.00011474337861210538, "time_sec": 32.71646022796631 }, { "epoch": 118, "train_loss": 0.15986083958148956, "train_acc": 0.9476, "test_loss": 2.890314678955078, "test_acc": 0.5619, "lyapunov": null, "grad_norm": 0.4176419876084519, "grad_max_sv": 0.20986161157488822, "grad_min_sv": 7.767054953627256e-09, "grad_condition": 181416124.9826005, "lr": 0.00010815327133708009, "time_sec": 32.71689772605896 }, { "epoch": 119, "train_loss": 0.15443852434635164, "train_acc": 0.95028, "test_loss": 2.9833076015472413, "test_acc": 0.5504, "lyapunov": null, "grad_norm": 0.4094461556500699, "grad_max_sv": 0.20980317294597625, "grad_min_sv": 7.66585938392992e-09, "grad_condition": 1289363850.184981, "lr": 0.00010173504098790182, "time_sec": 32.76529359817505 }, { "epoch": 120, "train_loss": 0.1513664803981781, "train_acc": 0.95076, "test_loss": 2.9521168746948243, "test_acc": 0.5535, "lyapunov": null, "grad_norm": 0.40458507675773164, "grad_max_sv": 0.2091453868895769, "grad_min_sv": 7.546225789991506e-09, "grad_condition": 191790265.63931364, "lr": 9.549150281252629e-05, "time_sec": 32.75906276702881 }, { "epoch": 121, "train_loss": 0.1482712536096573, "train_acc": 0.95224, "test_loss": 3.008343357849121, "test_acc": 0.5524, "lyapunov": null, "grad_norm": 0.40250293552115596, "grad_max_sv": 0.20429235510528088, "grad_min_sv": 7.4167842699346915e-09, "grad_condition": 1004863133.4087012, "lr": 8.942539543314794e-05, "time_sec": 32.738195180892944 }, { "epoch": 122, "train_loss": 0.1433233982515335, "train_acc": 0.95406, "test_loss": 2.8811149784088137, "test_acc": 0.5615, "lyapunov": null, "grad_norm": 0.3918685762307977, "grad_max_sv": 0.21150657180696725, "grad_min_sv": 7.566205814736106e-09, "grad_condition": 4864615061.542827, "lr": 8.353937964495024e-05, "time_sec": 32.760249853134155 }, { "epoch": 123, "train_loss": 0.140904153547287, "train_acc": 0.95554, "test_loss": 3.0434706832885743, "test_acc": 0.5488, "lyapunov": null, "grad_norm": 0.39134340646439314, "grad_max_sv": 0.21096068248152733, "grad_min_sv": 7.420657745899582e-09, "grad_condition": 474788541.70389444, "lr": 7.783603724899243e-05, "time_sec": 32.84018850326538 }, { "epoch": 124, "train_loss": 0.1424632687997818, "train_acc": 0.95448, "test_loss": 3.006509048843384, "test_acc": 0.5549, "lyapunov": null, "grad_norm": 0.3952350465926858, "grad_max_sv": 0.20579442996531724, "grad_min_sv": 7.2102639599776894e-09, "grad_condition": 640121523.7171735, "lr": 7.231786991974666e-05, "time_sec": 32.73241114616394 }, { "epoch": 125, "train_loss": 0.13608443251609803, "train_acc": 0.95782, "test_loss": 2.9692224075317384, "test_acc": 0.5578, "lyapunov": null, "grad_norm": 0.38466881950137, "grad_max_sv": 0.19782444536685945, "grad_min_sv": 7.223557173946516e-09, "grad_condition": 248263306.50433522, "lr": 6.698729810778072e-05, "time_sec": 32.678467988967896 }, { "epoch": 126, "train_loss": 0.13552211750030518, "train_acc": 0.95626, "test_loss": 3.032096587371826, "test_acc": 0.5536, "lyapunov": null, "grad_norm": 0.3837934860475664, "grad_max_sv": 0.19592427872121335, "grad_min_sv": 7.1880338589928525e-09, "grad_condition": 1098788620.3456562, "lr": 6.184665997806817e-05, "time_sec": 32.70717906951904 }, { "epoch": 127, "train_loss": 0.1351850691795349, "train_acc": 0.95776, "test_loss": 2.9195703174591063, "test_acc": 0.5604, "lyapunov": null, "grad_norm": 0.3835199995919498, "grad_max_sv": 0.19671063385903836, "grad_min_sv": 7.301026294463924e-09, "grad_condition": 998102013.5820692, "lr": 5.6898210384392595e-05, "time_sec": 32.741135597229004 }, { "epoch": 128, "train_loss": 0.13267261865139007, "train_acc": 0.95764, "test_loss": 2.9626207927703856, "test_acc": 0.5545, "lyapunov": null, "grad_norm": 0.3832565427194031, "grad_max_sv": 0.2010548248887062, "grad_min_sv": 7.084323496310118e-09, "grad_condition": 1908110316.0124466, "lr": 5.214411988029363e-05, "time_sec": 32.724841356277466 }, { "epoch": 129, "train_loss": 0.13098865546941757, "train_acc": 0.95846, "test_loss": 3.011842226791382, "test_acc": 0.5506, "lyapunov": null, "grad_norm": 0.37939468237880797, "grad_max_sv": 0.20046190060675145, "grad_min_sv": 7.379042803222838e-09, "grad_condition": 356098689.45926607, "lr": 4.7586473766990294e-05, "time_sec": 32.721606492996216 }, { "epoch": 130, "train_loss": 0.12933046006202698, "train_acc": 0.95886, "test_loss": 3.0411768558502197, "test_acc": 0.5527, "lyapunov": null, "grad_norm": 0.37924053294163973, "grad_max_sv": 0.20988954231142998, "grad_min_sv": 7.388776484596772e-09, "grad_condition": 554124327.4297839, "lr": 4.32272711786996e-05, "time_sec": 32.76217794418335 }, { "epoch": 131, "train_loss": 0.12891825794219972, "train_acc": 0.95952, "test_loss": 3.000077504730225, "test_acc": 0.5546, "lyapunov": null, "grad_norm": 0.3741869428415791, "grad_max_sv": 0.1881616409868002, "grad_min_sv": 7.156842123405213e-09, "grad_condition": 312499495.3085783, "lr": 3.906842420574966e-05, "time_sec": 32.74306511878967 }, { "epoch": 132, "train_loss": 0.12583676107883454, "train_acc": 0.96062, "test_loss": 3.0664391510009765, "test_acc": 0.5534, "lyapunov": null, "grad_norm": 0.3704229743876738, "grad_max_sv": 0.19701430164277553, "grad_min_sv": 7.223526106328419e-09, "grad_condition": 1413194923.3587193, "lr": 3.5111757055874305e-05, "time_sec": 32.808775424957275 }, { "epoch": 133, "train_loss": 0.13008767341136931, "train_acc": 0.95896, "test_loss": 3.0139704319000242, "test_acc": 0.5574, "lyapunov": null, "grad_norm": 0.3764215368002029, "grad_max_sv": 0.18944438602775335, "grad_min_sv": 7.082572564553764e-09, "grad_condition": 874087736.501687, "lr": 3.1359005254054254e-05, "time_sec": 32.82065176963806 }, { "epoch": 134, "train_loss": 0.1276783154821396, "train_acc": 0.95996, "test_loss": 3.022883545303345, "test_acc": 0.5532, "lyapunov": null, "grad_norm": 0.375861463579636, "grad_max_sv": 0.20601846650242805, "grad_min_sv": 6.996468762177945e-09, "grad_condition": 1890410555.4428897, "lr": 2.7811814881259484e-05, "time_sec": 32.80414128303528 }, { "epoch": 135, "train_loss": 0.12308010986804963, "train_acc": 0.9606, "test_loss": 2.9876843898773195, "test_acc": 0.5593, "lyapunov": null, "grad_norm": 0.36736730687062175, "grad_max_sv": 0.19790339954197406, "grad_min_sv": 7.039625574654928e-09, "grad_condition": 157775177.85623857, "lr": 2.4471741852423218e-05, "time_sec": 32.851438760757446 }, { "epoch": 136, "train_loss": 0.12776446427345275, "train_acc": 0.96144, "test_loss": 3.0140146301269533, "test_acc": 0.5535, "lyapunov": null, "grad_norm": 0.3714043891983977, "grad_max_sv": 0.19383110255002975, "grad_min_sv": 7.2285312062653555e-09, "grad_condition": 999433479.7051426, "lr": 2.1340251233966362e-05, "time_sec": 32.794949769973755 }, { "epoch": 137, "train_loss": 0.12337936633110047, "train_acc": 0.96152, "test_loss": 2.9756490589141844, "test_acc": 0.5589, "lyapunov": null, "grad_norm": 0.36599462716404635, "grad_max_sv": 0.18621533513069152, "grad_min_sv": 6.8799666707621e-09, "grad_condition": 2633273626.2954164, "lr": 1.8418716601170932e-05, "time_sec": 32.78418707847595 }, { "epoch": 138, "train_loss": 0.12530339601516724, "train_acc": 0.96096, "test_loss": 2.9389760871887205, "test_acc": 0.5643, "lyapunov": null, "grad_norm": 0.36857224147370304, "grad_max_sv": 0.19519462659955025, "grad_min_sv": 7.2010847566817904e-09, "grad_condition": 1104132755.735764, "lr": 1.570841943568445e-05, "time_sec": 32.72880840301514 }, { "epoch": 139, "train_loss": 0.12289305024623871, "train_acc": 0.9611, "test_loss": 3.0236512790679932, "test_acc": 0.5543, "lyapunov": null, "grad_norm": 0.3682552501598832, "grad_max_sv": 0.20100074261426926, "grad_min_sv": 7.34378154774052e-09, "grad_condition": 1520683884.3197339, "lr": 1.3210548563419845e-05, "time_sec": 32.78127360343933 }, { "epoch": 140, "train_loss": 0.12596595900058746, "train_acc": 0.95946, "test_loss": 2.973658073425293, "test_acc": 0.561, "lyapunov": null, "grad_norm": 0.3717079213334779, "grad_max_sv": 0.1950546268373728, "grad_min_sv": 7.189997905268728e-09, "grad_condition": 1974792452.4561849, "lr": 1.0926199633097203e-05, "time_sec": 32.781864643096924 }, { "epoch": 141, "train_loss": 0.12001886625289918, "train_acc": 0.96264, "test_loss": 2.990137744522095, "test_acc": 0.5583, "lyapunov": null, "grad_norm": 0.3612101803004304, "grad_max_sv": 0.19684142302721738, "grad_min_sv": 7.084273648266673e-09, "grad_condition": 1957601954.2835248, "lr": 8.856374635655688e-06, "time_sec": 32.77344870567322 }, { "epoch": 142, "train_loss": 0.12250841891288758, "train_acc": 0.96208, "test_loss": 3.0072501789093016, "test_acc": 0.557, "lyapunov": null, "grad_norm": 0.3656411150745857, "grad_max_sv": 0.18694628309458494, "grad_min_sv": 6.765250024683839e-09, "grad_condition": 728041100.7004558, "lr": 7.001981464747503e-06, "time_sec": 32.78335380554199 }, { "epoch": 143, "train_loss": 0.12062059470653534, "train_acc": 0.96196, "test_loss": 2.9649132221221923, "test_acc": 0.5592, "lyapunov": null, "grad_norm": 0.36372343649597894, "grad_max_sv": 0.19535562619566918, "grad_min_sv": 6.99444468851753e-09, "grad_condition": 1233101804.7440555, "lr": 5.3638335185058295e-06, "time_sec": 32.80367183685303 }, { "epoch": 144, "train_loss": 0.12207864775896073, "train_acc": 0.96178, "test_loss": 3.036870691680908, "test_acc": 0.5574, "lyapunov": null, "grad_norm": 0.3636070415011162, "grad_max_sv": 0.20035785287618638, "grad_min_sv": 7.128019625154275e-09, "grad_condition": 171713281.12199268, "lr": 3.942649342761114e-06, "time_sec": 32.81153345108032 }, { "epoch": 145, "train_loss": 0.11943841837644577, "train_acc": 0.96326, "test_loss": 2.9936345024108886, "test_acc": 0.5606, "lyapunov": null, "grad_norm": 0.3616987855339011, "grad_max_sv": 0.19010693076997995, "grad_min_sv": 6.951608487104404e-09, "grad_condition": 4475866647.186778, "lr": 2.7390523158633524e-06, "time_sec": 32.77432584762573 }, { "epoch": 146, "train_loss": 0.12161365668535233, "train_acc": 0.96184, "test_loss": 3.0051653202056885, "test_acc": 0.5534, "lyapunov": null, "grad_norm": 0.36606365240898514, "grad_max_sv": 0.19566274229437114, "grad_min_sv": 7.090793683911957e-09, "grad_condition": 1292263099.7971816, "lr": 1.7535703752478133e-06, "time_sec": 32.722100257873535 }, { "epoch": 147, "train_loss": 0.11985450011253357, "train_acc": 0.96366, "test_loss": 2.9604510833740236, "test_acc": 0.5575, "lyapunov": null, "grad_norm": 0.36142233410993513, "grad_max_sv": 0.19281328432261943, "grad_min_sv": 7.25558266457792e-09, "grad_condition": 7387609214.887906, "lr": 9.866357858642196e-07, "time_sec": 32.73111319541931 }, { "epoch": 148, "train_loss": 0.11937485624313354, "train_acc": 0.96304, "test_loss": 3.0363352073669434, "test_acc": 0.555, "lyapunov": null, "grad_norm": 0.3611567529216887, "grad_max_sv": 0.1957642961293459, "grad_min_sv": 7.231622295303733e-09, "grad_condition": 393022755.7130184, "lr": 4.38584950570808e-07, "time_sec": 32.739211320877075 }, { "epoch": 149, "train_loss": 0.11994361319065094, "train_acc": 0.96282, "test_loss": 2.9720828590393067, "test_acc": 0.5586, "lyapunov": null, "grad_norm": 0.36260803003121506, "grad_max_sv": 0.19581739362329245, "grad_min_sv": 6.825674283401049e-09, "grad_condition": 640655030.4564087, "lr": 1.096582625772501e-07, "time_sec": 32.73686075210571 }, { "epoch": 150, "train_loss": 0.12198109043121338, "train_acc": 0.96096, "test_loss": 3.0690538398742677, "test_acc": 0.5514, "lyapunov": null, "grad_norm": 0.3640908774200121, "grad_max_sv": 0.19363359715789558, "grad_min_sv": 6.96894196785744e-09, "grad_condition": 273507263.305566, "lr": 0.0, "time_sec": 32.99615716934204 } ], "12": [ { "epoch": 1, "train_loss": 4.494552028656006, "train_acc": 0.03786, "test_loss": 4.61479503326416, "test_acc": 0.0201, "lyapunov": null, "grad_norm": 4.970128680900294, "grad_max_sv": 4.1727720379829405, "grad_min_sv": 8.289555068485832e-08, "grad_condition": 76452781.51601897, "lr": 0.0009998903417374227, "time_sec": 49.85722231864929 }, { "epoch": 2, "train_loss": 3.9854862425994875, "train_acc": 0.08822, "test_loss": 4.992143798828125, "test_acc": 0.0271, "lyapunov": null, "grad_norm": 3.054976721991771, "grad_max_sv": 2.33364659845829, "grad_min_sv": 4.921280333802791e-08, "grad_condition": 63442313.555687234, "lr": 0.0009995614150494292, "time_sec": 49.82543992996216 }, { "epoch": 3, "train_loss": 3.6997953691101073, "train_acc": 0.12854, "test_loss": 4.995684532165527, "test_acc": 0.0293, "lyapunov": null, "grad_norm": 2.062296620286874, "grad_max_sv": 1.3390462696552277, "grad_min_sv": 3.588550117061828e-08, "grad_condition": 44525979.84656793, "lr": 0.0009990133642141358, "time_sec": 49.824538707733154 }, { "epoch": 4, "train_loss": 3.5368371379089356, "train_acc": 0.15444, "test_loss": 5.110721218109131, "test_acc": 0.0304, "lyapunov": null, "grad_norm": 1.6796942132426855, "grad_max_sv": 0.9513197481632233, "grad_min_sv": 2.9029874798469635e-08, "grad_condition": 38187587.0072392, "lr": 0.0009982464296247522, "time_sec": 49.857542514801025 }, { "epoch": 5, "train_loss": 3.4063741930389404, "train_acc": 0.1804, "test_loss": 4.820973803710937, "test_acc": 0.0488, "lyapunov": null, "grad_norm": 1.5228591587706575, "grad_max_sv": 0.8078360810875893, "grad_min_sv": 2.6718039813911078e-08, "grad_condition": 36188290.78873479, "lr": 0.0009972609476841367, "time_sec": 49.83380579948425 }, { "epoch": 6, "train_loss": 3.298316816482544, "train_acc": 0.19704, "test_loss": 4.687854388427734, "test_acc": 0.063, "lyapunov": null, "grad_norm": 1.430907384491558, "grad_max_sv": 0.7338306248188019, "grad_min_sv": 2.5322855712328617e-08, "grad_condition": 32479596.327881176, "lr": 0.000996057350657239, "time_sec": 49.85435748100281 }, { "epoch": 7, "train_loss": 3.212421199264526, "train_acc": 0.21768, "test_loss": 5.175653315734864, "test_acc": 0.0504, "lyapunov": null, "grad_norm": 1.336875610023359, "grad_max_sv": 0.649027307331562, "grad_min_sv": 2.378195060326327e-08, "grad_condition": 32637118.77699437, "lr": 0.000994636166481494, "time_sec": 49.8446729183197 }, { "epoch": 8, "train_loss": 3.138554875640869, "train_acc": 0.22894, "test_loss": 5.807579966735839, "test_acc": 0.0462, "lyapunov": null, "grad_norm": 1.2679659601013358, "grad_max_sv": 0.5943921484053135, "grad_min_sv": 2.2575583161904557e-08, "grad_condition": 97277800.55107144, "lr": 0.0009929980185352525, "time_sec": 49.8536856174469 }, { "epoch": 9, "train_loss": 3.0594152055358887, "train_acc": 0.24342, "test_loss": 5.896516481018066, "test_acc": 0.0504, "lyapunov": null, "grad_norm": 1.1948384399270802, "grad_max_sv": 0.5371919803321361, "grad_min_sv": 2.1378302061947352e-08, "grad_condition": 43411043.09074741, "lr": 0.0009911436253643444, "time_sec": 49.826568365097046 }, { "epoch": 10, "train_loss": 3.0018548110961913, "train_acc": 0.25334, "test_loss": 6.065813122558594, "test_acc": 0.0461, "lyapunov": null, "grad_norm": 1.1307569845828864, "grad_max_sv": 0.49591890424489976, "grad_min_sv": 2.0269659145588648e-08, "grad_condition": 137243724.22937468, "lr": 0.0009890738003669028, "time_sec": 49.83774471282959 }, { "epoch": 11, "train_loss": 2.955089698944092, "train_acc": 0.2653, "test_loss": 5.9151001647949215, "test_acc": 0.0512, "lyapunov": null, "grad_norm": 1.067241785689624, "grad_max_sv": 0.4469477400183678, "grad_min_sv": 1.8805797574739103e-08, "grad_condition": 39379357.71574137, "lr": 0.00098678945143658, "time_sec": 49.843921184539795 }, { "epoch": 12, "train_loss": 2.9137347607421873, "train_acc": 0.27164, "test_loss": 6.294404597473145, "test_acc": 0.0476, "lyapunov": null, "grad_norm": 1.0355748395798314, "grad_max_sv": 0.4451711155474186, "grad_min_sv": 1.9072327144360128e-08, "grad_condition": 11465758103.108255, "lr": 0.0009842915805643154, "time_sec": 49.864059925079346 }, { "epoch": 13, "train_loss": 2.8780907594299316, "train_acc": 0.2771, "test_loss": 5.592148977661132, "test_acc": 0.0478, "lyapunov": null, "grad_norm": 0.9968605810380445, "grad_max_sv": 0.42295421436429026, "grad_min_sv": 1.8676737473244386e-08, "grad_condition": 25252476.39695831, "lr": 0.000981581283398829, "time_sec": 49.83604097366333 }, { "epoch": 14, "train_loss": 2.83197486907959, "train_acc": 0.28466, "test_loss": 5.6323877784729, "test_acc": 0.0609, "lyapunov": null, "grad_norm": 0.9600893848651761, "grad_max_sv": 0.40282900631427765, "grad_min_sv": 1.79312983100699e-08, "grad_condition": 46420938.26971118, "lr": 0.0009786597487660333, "time_sec": 49.834007263183594 }, { "epoch": 15, "train_loss": 2.8022082035064697, "train_acc": 0.29582, "test_loss": 6.161382629394531, "test_acc": 0.067, "lyapunov": null, "grad_norm": 0.9375482131775189, "grad_max_sv": 0.38931420594453814, "grad_min_sv": 1.7493153070535784e-08, "grad_condition": 36503130.621698126, "lr": 0.0009755282581475766, "time_sec": 49.843669176101685 }, { "epoch": 16, "train_loss": 2.7717318687438963, "train_acc": 0.29786, "test_loss": 6.750612663269043, "test_acc": 0.0319, "lyapunov": null, "grad_norm": 0.914689907325661, "grad_max_sv": 0.3722547680139542, "grad_min_sv": 1.6777755511981906e-08, "grad_condition": 56626372.0449656, "lr": 0.0009721881851187403, "time_sec": 49.83157706260681 }, { "epoch": 17, "train_loss": 2.737800383453369, "train_acc": 0.30562, "test_loss": 6.416880516052246, "test_acc": 0.0612, "lyapunov": null, "grad_norm": 0.8943352214027238, "grad_max_sv": 0.35389882922172544, "grad_min_sv": 1.6637817648601504e-08, "grad_condition": 27086037.56335088, "lr": 0.0009686409947459456, "time_sec": 49.84391736984253 }, { "epoch": 18, "train_loss": 2.726037522125244, "train_acc": 0.30952, "test_loss": 6.604639881896973, "test_acc": 0.0459, "lyapunov": null, "grad_norm": 0.8840199433360627, "grad_max_sv": 0.35427382588386536, "grad_min_sv": 1.631152495851218e-08, "grad_condition": 30779446.928706445, "lr": 0.0009648882429441254, "time_sec": 49.85922360420227 }, { "epoch": 19, "train_loss": 2.6859044135284424, "train_acc": 0.31622, "test_loss": 5.795512687683106, "test_acc": 0.057, "lyapunov": null, "grad_norm": 0.8549569769936459, "grad_max_sv": 0.33466122299432755, "grad_min_sv": 1.565257393698616e-08, "grad_condition": 29386830.435270645, "lr": 0.00096093157579425, "time_sec": 49.82556509971619 }, { "epoch": 20, "train_loss": 2.6536119274902346, "train_acc": 0.3221, "test_loss": 6.344257983398437, "test_acc": 0.044, "lyapunov": null, "grad_norm": 0.8449773123460955, "grad_max_sv": 0.3348921127617359, "grad_min_sv": 1.5790628153482257e-08, "grad_condition": 98318741.07961987, "lr": 0.0009567727288213001, "time_sec": 49.83516526222229 }, { "epoch": 21, "train_loss": 2.6361696144104005, "train_acc": 0.32656, "test_loss": 7.515093251800537, "test_acc": 0.0334, "lyapunov": null, "grad_norm": 0.8336479900582607, "grad_max_sv": 0.3216260939836502, "grad_min_sv": 1.536505757071538e-08, "grad_condition": 26686558.28517064, "lr": 0.0009524135262330095, "time_sec": 49.80964422225952 }, { "epoch": 22, "train_loss": 2.609321441345215, "train_acc": 0.33038, "test_loss": 6.987834294128418, "test_acc": 0.0336, "lyapunov": null, "grad_norm": 0.8111631557338365, "grad_max_sv": 0.32318604178726673, "grad_min_sv": 1.552950264216424e-08, "grad_condition": 31459791.97556909, "lr": 0.0009478558801197061, "time_sec": 49.83420443534851 }, { "epoch": 23, "train_loss": 2.5819150804138182, "train_acc": 0.33626, "test_loss": 5.626160023498535, "test_acc": 0.0597, "lyapunov": null, "grad_norm": 0.7975730239086433, "grad_max_sv": 0.2971249621361494, "grad_min_sv": 1.4598027968382166e-08, "grad_condition": 29388140.880233955, "lr": 0.000943101789615607, "time_sec": 49.84738302230835 }, { "epoch": 24, "train_loss": 2.563654583282471, "train_acc": 0.34112, "test_loss": 8.088758407592774, "test_acc": 0.0365, "lyapunov": null, "grad_norm": 0.7820981992902372, "grad_max_sv": 0.30556059442460537, "grad_min_sv": 1.4405372743275802e-08, "grad_condition": 36896273.106267676, "lr": 0.0009381533400219313, "time_sec": 49.83872365951538 }, { "epoch": 25, "train_loss": 2.5395704370880128, "train_acc": 0.3453, "test_loss": 6.280784951782227, "test_acc": 0.0419, "lyapunov": null, "grad_norm": 0.7796352290200003, "grad_max_sv": 0.29107407070696356, "grad_min_sv": 1.438702274536574e-08, "grad_condition": 23506322.84645006, "lr": 0.0009330127018922189, "time_sec": 49.84307074546814 }, { "epoch": 26, "train_loss": 2.516899804611206, "train_acc": 0.34914, "test_loss": 6.8854626892089845, "test_acc": 0.0472, "lyapunov": null, "grad_norm": 0.7654504890703723, "grad_max_sv": 0.2898920584470034, "grad_min_sv": 1.4131242567771985e-08, "grad_condition": 36962656.131567374, "lr": 0.000927682130080253, "time_sec": 49.82866811752319 }, { "epoch": 27, "train_loss": 2.486618924636841, "train_acc": 0.35846, "test_loss": 6.096959390258789, "test_acc": 0.0526, "lyapunov": null, "grad_norm": 0.7544470177982979, "grad_max_sv": 0.2747815653681755, "grad_min_sv": 1.4021938565811353e-08, "grad_condition": 22894223.22709341, "lr": 0.0009221639627510072, "time_sec": 49.833322048187256 }, { "epoch": 28, "train_loss": 2.4692860332489013, "train_acc": 0.35872, "test_loss": 7.058197943115235, "test_acc": 0.0368, "lyapunov": null, "grad_norm": 0.7556141642776453, "grad_max_sv": 0.2829656444489956, "grad_min_sv": 1.4026384997922747e-08, "grad_condition": 24010034.28343827, "lr": 0.0009164606203550494, "time_sec": 49.853132247924805 }, { "epoch": 29, "train_loss": 2.458679496536255, "train_acc": 0.36202, "test_loss": 5.932370195007325, "test_acc": 0.0515, "lyapunov": null, "grad_norm": 0.7489931312284205, "grad_max_sv": 0.2846912644803524, "grad_min_sv": 1.3950906180867743e-08, "grad_condition": 759126756.028516, "lr": 0.0009105746045668516, "time_sec": 49.815508127212524 }, { "epoch": 30, "train_loss": 2.440240175704956, "train_acc": 0.3643, "test_loss": 5.7076008422851565, "test_acc": 0.0545, "lyapunov": null, "grad_norm": 0.7451604093710013, "grad_max_sv": 0.27726204246282576, "grad_min_sv": 1.3802408763141649e-08, "grad_condition": 25518721.12854769, "lr": 0.0009045084971874733, "time_sec": 49.83587169647217 }, { "epoch": 31, "train_loss": 2.413286708908081, "train_acc": 0.37092, "test_loss": 5.388267793273926, "test_acc": 0.0567, "lyapunov": null, "grad_norm": 0.734602471620392, "grad_max_sv": 0.2801205262541771, "grad_min_sv": 1.3700489934209691e-08, "grad_condition": 70621872.17100011, "lr": 0.0008982649590120977, "time_sec": 49.82285523414612 }, { "epoch": 32, "train_loss": 2.3982598586273194, "train_acc": 0.37454, "test_loss": 4.8633959762573244, "test_acc": 0.0614, "lyapunov": null, "grad_norm": 0.7317568960693007, "grad_max_sv": 0.27396991699934004, "grad_min_sv": 1.3639147818100827e-08, "grad_condition": 29568703.15011265, "lr": 0.0008918467286629196, "time_sec": 49.83714246749878 }, { "epoch": 33, "train_loss": 2.3700755281066894, "train_acc": 0.37942, "test_loss": 5.800725856018066, "test_acc": 0.062, "lyapunov": null, "grad_norm": 0.7363325475877537, "grad_max_sv": 0.27091147713363173, "grad_min_sv": 1.3641409607467736e-08, "grad_condition": 23422095.65938937, "lr": 0.0008852566213878943, "time_sec": 49.85065937042236 }, { "epoch": 34, "train_loss": 2.3484229640197753, "train_acc": 0.38438, "test_loss": 5.51493988494873, "test_acc": 0.0489, "lyapunov": null, "grad_norm": 0.7318255060238914, "grad_max_sv": 0.2700826805084944, "grad_min_sv": 1.3733222553602431e-08, "grad_condition": 23110083.817654673, "lr": 0.000878497527825878, "time_sec": 49.825148820877075 }, { "epoch": 35, "train_loss": 2.332993766708374, "train_acc": 0.38728, "test_loss": 6.365867942047119, "test_acc": 0.0266, "lyapunov": null, "grad_norm": 0.7235217593940582, "grad_max_sv": 0.26724731288850306, "grad_min_sv": 1.3652239799766264e-08, "grad_condition": 21635340.607584503, "lr": 0.000871572412738697, "time_sec": 49.830586194992065 }, { "epoch": 36, "train_loss": 2.306020415649414, "train_acc": 0.39186, "test_loss": 5.792026341247559, "test_acc": 0.0452, "lyapunov": null, "grad_norm": 0.7128640395593397, "grad_max_sv": 0.26750593855977056, "grad_min_sv": 1.3493218886662105e-08, "grad_condition": 28714487.625810385, "lr": 0.0008644843137107055, "time_sec": 49.84518265724182 }, { "epoch": 37, "train_loss": 2.2972560415649412, "train_acc": 0.39398, "test_loss": 6.719418971252441, "test_acc": 0.0336, "lyapunov": null, "grad_norm": 0.7133630215784597, "grad_max_sv": 0.2599464699625969, "grad_min_sv": 1.321531789555408e-08, "grad_condition": 23431301.61775563, "lr": 0.0008572363398164014, "time_sec": 49.80765676498413 }, { "epoch": 38, "train_loss": 2.2751118283843996, "train_acc": 0.39982, "test_loss": 5.9905416282653805, "test_acc": 0.0405, "lyapunov": null, "grad_norm": 0.711317525951205, "grad_max_sv": 0.25357839167118074, "grad_min_sv": 1.3227913819857662e-08, "grad_condition": 22136545.95270278, "lr": 0.0008498316702566826, "time_sec": 49.8195858001709 }, { "epoch": 39, "train_loss": 2.2572131638336184, "train_acc": 0.40186, "test_loss": 5.522994046783447, "test_acc": 0.0292, "lyapunov": null, "grad_norm": 0.7046395490795619, "grad_max_sv": 0.2534454546868801, "grad_min_sv": 1.3053050565425828e-08, "grad_condition": 23267030.12204785, "lr": 0.0008422735529643442, "time_sec": 49.82005977630615 }, { "epoch": 40, "train_loss": 2.247441282196045, "train_acc": 0.40386, "test_loss": 6.156334571838379, "test_acc": 0.0459, "lyapunov": null, "grad_norm": 0.7028096798670115, "grad_max_sv": 0.2492887545377016, "grad_min_sv": 1.295731734268779e-08, "grad_condition": 27228242.583258677, "lr": 0.0008345653031794289, "time_sec": 49.840070724487305 }, { "epoch": 41, "train_loss": 2.240987236175537, "train_acc": 0.4064, "test_loss": 6.480609422302246, "test_acc": 0.03, "lyapunov": null, "grad_norm": 0.6963939273563242, "grad_max_sv": 0.25355591997504234, "grad_min_sv": 1.3210752133896442e-08, "grad_condition": 51874622.58196541, "lr": 0.0008267103019950526, "time_sec": 49.89214468002319 }, { "epoch": 42, "train_loss": 2.2241448893737794, "train_acc": 0.40938, "test_loss": 7.472731929016113, "test_acc": 0.0364, "lyapunov": null, "grad_norm": 0.6886576186838276, "grad_max_sv": 0.24406687431037427, "grad_min_sv": 1.2965910546614001e-08, "grad_condition": 26237426.90185051, "lr": 0.0008187119948743447, "time_sec": 49.831929445266724 }, { "epoch": 43, "train_loss": 2.195390332183838, "train_acc": 0.41482, "test_loss": 6.986102354431153, "test_acc": 0.0354, "lyapunov": null, "grad_norm": 0.692064929980546, "grad_max_sv": 0.24136908873915672, "grad_min_sv": 1.287102841251997e-08, "grad_condition": 29191367.16539036, "lr": 0.000810573890139155, "time_sec": 49.820056438446045 }, { "epoch": 44, "train_loss": 2.1865518129730224, "train_acc": 0.41708, "test_loss": 6.7771270584106444, "test_acc": 0.0393, "lyapunov": null, "grad_norm": 0.6868416402158027, "grad_max_sv": 0.2486371211707592, "grad_min_sv": 1.2717046270899201e-08, "grad_condition": 39400931.65148838, "lr": 0.0008022995574311873, "time_sec": 49.82724571228027 }, { "epoch": 45, "train_loss": 2.176023401031494, "train_acc": 0.41766, "test_loss": 6.5321983726501465, "test_acc": 0.0329, "lyapunov": null, "grad_norm": 0.688101634481696, "grad_max_sv": 0.2483655706048012, "grad_min_sv": 1.2939461641048311e-08, "grad_condition": 24745167.039308526, "lr": 0.0007938926261462363, "time_sec": 49.83728241920471 }, { "epoch": 46, "train_loss": 2.157371569519043, "train_acc": 0.42422, "test_loss": 5.901077621459961, "test_acc": 0.0536, "lyapunov": null, "grad_norm": 0.6810937554159694, "grad_max_sv": 0.2453255333006382, "grad_min_sv": 1.2790355725933455e-08, "grad_condition": 42427572.437124, "lr": 0.0007853567838422158, "time_sec": 49.83260989189148 }, { "epoch": 47, "train_loss": 2.1449081243896484, "train_acc": 0.42456, "test_loss": 6.075893556213379, "test_acc": 0.042, "lyapunov": null, "grad_norm": 0.677274699872145, "grad_max_sv": 0.23359011709690095, "grad_min_sv": 1.2604452173659019e-08, "grad_condition": 23439756.57327797, "lr": 0.0007766957746216719, "time_sec": 49.81248760223389 }, { "epoch": 48, "train_loss": 2.121114821166992, "train_acc": 0.43062, "test_loss": 6.324017465209961, "test_acc": 0.0699, "lyapunov": null, "grad_norm": 0.6768119432582711, "grad_max_sv": 0.23583042696118356, "grad_min_sv": 1.2428631641914211e-08, "grad_condition": 26576129.087632615, "lr": 0.0007679133974894982, "time_sec": 49.85111737251282 }, { "epoch": 49, "train_loss": 2.1201681073760987, "train_acc": 0.43092, "test_loss": 5.493146458435058, "test_acc": 0.0673, "lyapunov": null, "grad_norm": 0.6795448834334495, "grad_max_sv": 0.24224164076149463, "grad_min_sv": 1.2691686027133109e-08, "grad_condition": 24348457.963241145, "lr": 0.000759013504686565, "time_sec": 49.81028628349304 }, { "epoch": 50, "train_loss": 2.082837229309082, "train_acc": 0.4386, "test_loss": 6.459659493255615, "test_acc": 0.0616, "lyapunov": null, "grad_norm": 0.6728576224616372, "grad_max_sv": 0.23022082336246968, "grad_min_sv": 1.2368064503109899e-08, "grad_condition": 23985269.670404635, "lr": 0.0007499999999999998, "time_sec": 49.82207798957825 }, { "epoch": 51, "train_loss": 2.0762338228607176, "train_acc": 0.43984, "test_loss": 6.028357986450195, "test_acc": 0.0474, "lyapunov": null, "grad_norm": 0.671786463321322, "grad_max_sv": 0.23933242298662663, "grad_min_sv": 1.2453496028852485e-08, "grad_condition": 27468424.752658807, "lr": 0.0007408768370508575, "time_sec": 49.839146852493286 }, { "epoch": 52, "train_loss": 2.068026172409058, "train_acc": 0.44324, "test_loss": 6.386326299285889, "test_acc": 0.0521, "lyapunov": null, "grad_norm": 0.6708600139651663, "grad_max_sv": 0.24169348366558552, "grad_min_sv": 1.2435446072878164e-08, "grad_condition": 53682617.89361428, "lr": 0.0007316480175599307, "time_sec": 49.84106373786926 }, { "epoch": 53, "train_loss": 2.0512850422668456, "train_acc": 0.44514, "test_loss": 5.693611965942383, "test_acc": 0.0412, "lyapunov": null, "grad_norm": 0.6693562330574987, "grad_max_sv": 0.23974683545529843, "grad_min_sv": 1.2387516072631665e-08, "grad_condition": 26566156.55520319, "lr": 0.0007223175895924635, "time_sec": 49.83973002433777 }, { "epoch": 54, "train_loss": 2.0340771446990966, "train_acc": 0.45072, "test_loss": 6.135411253356933, "test_acc": 0.0562, "lyapunov": null, "grad_norm": 0.6690638479693323, "grad_max_sv": 0.23783069401979445, "grad_min_sv": 1.2572742053018614e-08, "grad_condition": 21778321.765234537, "lr": 0.0007128896457825361, "time_sec": 49.87506914138794 }, { "epoch": 55, "train_loss": 2.0094136617279053, "train_acc": 0.45566, "test_loss": 5.745096834564209, "test_acc": 0.0572, "lyapunov": null, "grad_norm": 0.6669166301057209, "grad_max_sv": 0.23878032267093657, "grad_min_sv": 1.231176157273639e-08, "grad_condition": 29310923.371788334, "lr": 0.0007033683215378998, "time_sec": 49.82778191566467 }, { "epoch": 56, "train_loss": 2.0006568963241578, "train_acc": 0.457, "test_loss": 6.5824570434570315, "test_acc": 0.0501, "lyapunov": null, "grad_norm": 0.6683455061699762, "grad_max_sv": 0.23399036526679992, "grad_min_sv": 1.2379160156672509e-08, "grad_condition": 42922377.98757514, "lr": 0.0006937577932260512, "time_sec": 49.85116100311279 }, { "epoch": 57, "train_loss": 1.9894362976074218, "train_acc": 0.45838, "test_loss": 6.51012366104126, "test_acc": 0.0442, "lyapunov": null, "grad_norm": 0.6646066170012002, "grad_max_sv": 0.23274879157543182, "grad_min_sv": 1.238940085523943e-08, "grad_condition": 24070465.15252796, "lr": 0.0006840622763423388, "time_sec": 49.8274929523468 }, { "epoch": 58, "train_loss": 1.9678663694000245, "train_acc": 0.46314, "test_loss": 6.619851453399658, "test_acc": 0.0576, "lyapunov": null, "grad_norm": 0.6643541450786883, "grad_max_sv": 0.23393345512449742, "grad_min_sv": 1.2389777363092103e-08, "grad_condition": 38285129.517120846, "lr": 0.0006742860236609073, "time_sec": 49.837411880493164 }, { "epoch": 59, "train_loss": 1.965532445755005, "train_acc": 0.46532, "test_loss": 7.184655822753906, "test_acc": 0.0412, "lyapunov": null, "grad_norm": 0.6645069826423124, "grad_max_sv": 0.23921045735478402, "grad_min_sv": 1.2522070774040328e-08, "grad_condition": 95635689.47436689, "lr": 0.0006644333233692913, "time_sec": 49.82288122177124 }, { "epoch": 60, "train_loss": 1.9421441039657592, "train_acc": 0.46942, "test_loss": 6.0968818130493165, "test_acc": 0.0396, "lyapunov": null, "grad_norm": 0.6647686483063734, "grad_max_sv": 0.23022540807723998, "grad_min_sv": 1.2435142121569597e-08, "grad_condition": 36516212.89900361, "lr": 0.0006545084971874734, "time_sec": 49.836525440216064 }, { "epoch": 61, "train_loss": 1.9307384226989746, "train_acc": 0.4713, "test_loss": 7.351404643249512, "test_acc": 0.0467, "lyapunov": null, "grad_norm": 0.6598071015542969, "grad_max_sv": 0.23300293684005738, "grad_min_sv": 1.2553449488250656e-08, "grad_condition": 21336349.83542385, "lr": 0.0006445158984722354, "time_sec": 49.81679058074951 }, { "epoch": 62, "train_loss": 1.9107242463684082, "train_acc": 0.47584, "test_loss": 7.41353745803833, "test_acc": 0.0564, "lyapunov": null, "grad_norm": 0.6632922829797736, "grad_max_sv": 0.23702187687158585, "grad_min_sv": 1.256866596290214e-08, "grad_condition": 414252068.6680373, "lr": 0.0006344599103076324, "time_sec": 49.81079959869385 }, { "epoch": 63, "train_loss": 1.906180576171875, "train_acc": 0.47704, "test_loss": 8.345553895568848, "test_acc": 0.0514, "lyapunov": null, "grad_norm": 0.6641303546175715, "grad_max_sv": 0.23919319920241833, "grad_min_sv": 1.2445030603269736e-08, "grad_condition": 48181552.89073322, "lr": 0.0006243449435824269, "time_sec": 49.834824323654175 }, { "epoch": 64, "train_loss": 1.896571351852417, "train_acc": 0.48022, "test_loss": 7.706241481018067, "test_acc": 0.0495, "lyapunov": null, "grad_norm": 0.6580911542263143, "grad_max_sv": 0.233155807107687, "grad_min_sv": 1.2258548102821176e-08, "grad_condition": 147912368.09627536, "lr": 0.0006141754350553275, "time_sec": 49.827706813812256 }, { "epoch": 65, "train_loss": 1.8689342678833007, "train_acc": 0.48694, "test_loss": 7.604910266113281, "test_acc": 0.068, "lyapunov": null, "grad_norm": 0.6601961376883955, "grad_max_sv": 0.24266679622232915, "grad_min_sv": 1.2337946858967385e-08, "grad_condition": 109479288.75078002, "lr": 0.0006039558454088793, "time_sec": 49.847835063934326 }, { "epoch": 66, "train_loss": 1.8541412976837157, "train_acc": 0.4913, "test_loss": 7.621131346130371, "test_acc": 0.0502, "lyapunov": null, "grad_norm": 0.6526859807082246, "grad_max_sv": 0.22503522336483, "grad_min_sv": 1.1999139423735094e-08, "grad_condition": 27658012.606830657, "lr": 0.000593690657292862, "time_sec": 49.83453869819641 }, { "epoch": 67, "train_loss": 1.8500203356170655, "train_acc": 0.4895, "test_loss": 8.448241088867187, "test_acc": 0.0602, "lyapunov": null, "grad_norm": 0.654584216781727, "grad_max_sv": 0.23166645579040052, "grad_min_sv": 1.2144356195328832e-08, "grad_condition": 57526231.39027766, "lr": 0.0005833843733580507, "time_sec": 49.87798357009888 }, { "epoch": 68, "train_loss": 1.8333191384887695, "train_acc": 0.49588, "test_loss": 7.663671650695801, "test_acc": 0.0539, "lyapunov": null, "grad_norm": 0.6550869721940646, "grad_max_sv": 0.23333334550261497, "grad_min_sv": 1.2233289833907257e-08, "grad_condition": 24346438.395213075, "lr": 0.0005730415142812054, "time_sec": 49.82582187652588 }, { "epoch": 69, "train_loss": 1.8119923030090332, "train_acc": 0.50032, "test_loss": 7.175043432617188, "test_acc": 0.0712, "lyapunov": null, "grad_norm": 0.6513215911180641, "grad_max_sv": 0.2193699970841408, "grad_min_sv": 1.1865115855103081e-08, "grad_condition": 26929150.493882775, "lr": 0.0005626666167821517, "time_sec": 49.80794405937195 }, { "epoch": 70, "train_loss": 1.8089694079589844, "train_acc": 0.49764, "test_loss": 7.612014476013184, "test_acc": 0.0538, "lyapunov": null, "grad_norm": 0.6557711961342083, "grad_max_sv": 0.23481616117060183, "grad_min_sv": 1.21222042414465e-08, "grad_condition": 49730665.95439996, "lr": 0.0005522642316338265, "time_sec": 49.81162214279175 }, { "epoch": 71, "train_loss": 1.794535770225525, "train_acc": 0.50302, "test_loss": 8.002939363861085, "test_acc": 0.054, "lyapunov": null, "grad_norm": 0.6530360122929442, "grad_max_sv": 0.22891747988760472, "grad_min_sv": 1.2135645938160522e-08, "grad_condition": 30239652.54848214, "lr": 0.0005418389216661573, "time_sec": 49.83351969718933 }, { "epoch": 72, "train_loss": 1.7888313204574584, "train_acc": 0.50272, "test_loss": 7.378663352966308, "test_acc": 0.0477, "lyapunov": null, "grad_norm": 0.6515803468137452, "grad_max_sv": 0.223580015450716, "grad_min_sv": 1.2234114341730384e-08, "grad_condition": 31177170.11021496, "lr": 0.0005313952597646563, "time_sec": 49.80682587623596 }, { "epoch": 73, "train_loss": 1.7610743871688843, "train_acc": 0.51094, "test_loss": 7.5734631568908695, "test_acc": 0.0456, "lyapunov": null, "grad_norm": 0.6471442109164438, "grad_max_sv": 0.23298447765409946, "grad_min_sv": 1.2235564984808267e-08, "grad_condition": 30205955.557135515, "lr": 0.0005209378268645994, "time_sec": 49.8284707069397 }, { "epoch": 74, "train_loss": 1.743510553855896, "train_acc": 0.51648, "test_loss": 8.115744052124024, "test_acc": 0.0597, "lyapunov": null, "grad_norm": 0.6470361414945306, "grad_max_sv": 0.22419601753354074, "grad_min_sv": 1.175036056857981e-08, "grad_condition": 44883670.89626708, "lr": 0.0005104712099416781, "time_sec": 49.81434655189514 }, { "epoch": 75, "train_loss": 1.732315214996338, "train_acc": 0.5162, "test_loss": 8.69449387588501, "test_acc": 0.0443, "lyapunov": null, "grad_norm": 0.6534168175273212, "grad_max_sv": 0.22915640994906425, "grad_min_sv": 1.2120835880813362e-08, "grad_condition": 30203938.86272805, "lr": 0.0004999999999999996, "time_sec": 49.822524070739746 }, { "epoch": 76, "train_loss": 1.7280053578186034, "train_acc": 0.51708, "test_loss": 8.161399678039551, "test_acc": 0.0506, "lyapunov": null, "grad_norm": 0.6519718595623971, "grad_max_sv": 0.22868257723748683, "grad_min_sv": 1.1916949028967227e-08, "grad_condition": 27392099.189085342, "lr": 0.0004895287900583212, "time_sec": 49.806185245513916 }, { "epoch": 77, "train_loss": 1.707364101486206, "train_acc": 0.52106, "test_loss": 8.635691497802734, "test_acc": 0.0553, "lyapunov": null, "grad_norm": 0.6489518165829526, "grad_max_sv": 0.22707784324884414, "grad_min_sv": 1.21318999957154e-08, "grad_condition": 22161799.719214164, "lr": 0.0004790621731353997, "time_sec": 49.8337197303772 }, { "epoch": 78, "train_loss": 1.699185922279358, "train_acc": 0.52508, "test_loss": 8.116340428161621, "test_acc": 0.059, "lyapunov": null, "grad_norm": 0.6466631616175401, "grad_max_sv": 0.2242755901068449, "grad_min_sv": 1.197350978088263e-08, "grad_condition": 22907889.143189352, "lr": 0.000468604740235343, "time_sec": 49.84882068634033 }, { "epoch": 79, "train_loss": 1.6851876223754882, "train_acc": 0.53002, "test_loss": 7.6594300460815425, "test_acc": 0.0668, "lyapunov": null, "grad_norm": 0.6508056360794745, "grad_max_sv": 0.22947054952383042, "grad_min_sv": 1.2146863270084962e-08, "grad_condition": 50400181.57036874, "lr": 0.00045816107833384175, "time_sec": 49.81526827812195 }, { "epoch": 80, "train_loss": 1.6667000872421265, "train_acc": 0.53166, "test_loss": 7.577922117614746, "test_acc": 0.0581, "lyapunov": null, "grad_norm": 0.6484594553766964, "grad_max_sv": 0.22649560272693633, "grad_min_sv": 1.2028468630853606e-08, "grad_condition": 33979879.18367102, "lr": 0.0004477357683661729, "time_sec": 49.79970574378967 }, { "epoch": 81, "train_loss": 1.6529949746704102, "train_acc": 0.53676, "test_loss": 7.7760236434936525, "test_acc": 0.061, "lyapunov": null, "grad_norm": 0.6501069318076672, "grad_max_sv": 0.22972256727516652, "grad_min_sv": 1.196574576337213e-08, "grad_condition": 396215587.1427422, "lr": 0.00043733338321784746, "time_sec": 49.81192994117737 }, { "epoch": 82, "train_loss": 1.6425591729736329, "train_acc": 0.53686, "test_loss": 7.6887285552978515, "test_acc": 0.0449, "lyapunov": null, "grad_norm": 0.6461003642754752, "grad_max_sv": 0.23114448301494123, "grad_min_sv": 1.2002917063394513e-08, "grad_condition": 58155843.95520236, "lr": 0.0004269584857187939, "time_sec": 49.80897355079651 }, { "epoch": 83, "train_loss": 1.6318637802124023, "train_acc": 0.54154, "test_loss": 7.384182490539551, "test_acc": 0.0735, "lyapunov": null, "grad_norm": 0.639611071259903, "grad_max_sv": 0.22576675675809382, "grad_min_sv": 1.1820984322299943e-08, "grad_condition": 61458281.56309018, "lr": 0.0004166156266419484, "time_sec": 49.81825590133667 }, { "epoch": 84, "train_loss": 1.6224907682418823, "train_acc": 0.54502, "test_loss": 6.842728860473633, "test_acc": 0.0545, "lyapunov": null, "grad_norm": 0.6421226956015884, "grad_max_sv": 0.21887084767222403, "grad_min_sv": 1.1874146338408664e-08, "grad_condition": 36085101.45868175, "lr": 0.0004063093427071373, "time_sec": 49.907301902770996 }, { "epoch": 85, "train_loss": 1.6129507275390624, "train_acc": 0.5441, "test_loss": 8.217321695709229, "test_acc": 0.0637, "lyapunov": null, "grad_norm": 0.6427366718485839, "grad_max_sv": 0.23318556658923625, "grad_min_sv": 1.2124754387304871e-08, "grad_condition": 42339311.94718243, "lr": 0.0003960441545911199, "time_sec": 49.83733892440796 }, { "epoch": 86, "train_loss": 1.5975109223556518, "train_acc": 0.54868, "test_loss": 7.930374978637695, "test_acc": 0.0457, "lyapunov": null, "grad_norm": 0.648213394339368, "grad_max_sv": 0.23059269934892654, "grad_min_sv": 1.2111861368707676e-08, "grad_condition": 42084970.06037265, "lr": 0.0003858245649446718, "time_sec": 49.827972412109375 }, { "epoch": 87, "train_loss": 1.5812813794708251, "train_acc": 0.55458, "test_loss": 7.960672058105469, "test_acc": 0.0501, "lyapunov": null, "grad_norm": 0.6429264180119875, "grad_max_sv": 0.2283397376537323, "grad_min_sv": 1.2037938704190233e-08, "grad_condition": 24951514.668881785, "lr": 0.00037565505641757235, "time_sec": 49.82942318916321 }, { "epoch": 88, "train_loss": 1.573117269897461, "train_acc": 0.55398, "test_loss": 8.257780656433106, "test_acc": 0.0591, "lyapunov": null, "grad_norm": 0.6443323703742537, "grad_max_sv": 0.22722676433622838, "grad_min_sv": 1.201048842325303e-08, "grad_condition": 22188712.23632911, "lr": 0.00036554008969236695, "time_sec": 49.86358904838562 }, { "epoch": 89, "train_loss": 1.5576643622207642, "train_acc": 0.55992, "test_loss": 8.274403761291504, "test_acc": 0.041, "lyapunov": null, "grad_norm": 0.6402469644123193, "grad_max_sv": 0.22650128416717052, "grad_min_sv": 1.1862416463004343e-08, "grad_condition": 35019834.9168684, "lr": 0.0003554841015277638, "time_sec": 49.83419132232666 }, { "epoch": 90, "train_loss": 1.549127948036194, "train_acc": 0.56466, "test_loss": 7.301855851745605, "test_acc": 0.0718, "lyapunov": null, "grad_norm": 0.6449275085704251, "grad_max_sv": 0.22556735202670097, "grad_min_sv": 1.1762558954631075e-08, "grad_condition": 21940981.03509561, "lr": 0.000345491502812526, "time_sec": 49.81568884849548 }, { "epoch": 91, "train_loss": 1.5344566452407837, "train_acc": 0.56436, "test_loss": 8.916962014770508, "test_acc": 0.0515, "lyapunov": null, "grad_norm": 0.6463598068323441, "grad_max_sv": 0.23813196495175362, "grad_min_sv": 1.2199751642932855e-08, "grad_condition": 45733250.122319184, "lr": 0.0003355666766307081, "time_sec": 49.839728355407715 }, { "epoch": 92, "train_loss": 1.5208702486419678, "train_acc": 0.56684, "test_loss": 8.993258874511719, "test_acc": 0.054, "lyapunov": null, "grad_norm": 0.6391383040365451, "grad_max_sv": 0.22249663844704629, "grad_min_sv": 1.166908096122965e-08, "grad_condition": 28597379.63678825, "lr": 0.00032571397633909225, "time_sec": 49.850322008132935 }, { "epoch": 93, "train_loss": 1.5081010787582398, "train_acc": 0.57028, "test_loss": 9.433806256103516, "test_acc": 0.0535, "lyapunov": null, "grad_norm": 0.6456709453433311, "grad_max_sv": 0.23419931791722776, "grad_min_sv": 1.195185940633392e-08, "grad_condition": 29245401.732327044, "lr": 0.00031593772365766094, "time_sec": 49.83537983894348 }, { "epoch": 94, "train_loss": 1.4969723129653931, "train_acc": 0.57362, "test_loss": 8.755092433166505, "test_acc": 0.0528, "lyapunov": null, "grad_norm": 0.6461658506271033, "grad_max_sv": 0.22756082080304624, "grad_min_sv": 1.1912134220692926e-08, "grad_condition": 23423387.436489962, "lr": 0.0003062422067739483, "time_sec": 49.80311179161072 }, { "epoch": 95, "train_loss": 2.9494932527923585, "train_acc": 0.411, "test_loss": 4.676254756927491, "test_acc": 0.0505, "lyapunov": null, "grad_norm": 0.8335419963078607, "grad_max_sv": 0.3271928407251835, "grad_min_sv": 1.4720300411941168e-08, "grad_condition": 24067860.441598095, "lr": 0.00029663167846209965, "time_sec": 49.814762115478516 }, { "epoch": 96, "train_loss": 3.6572426443481447, "train_acc": 0.1492, "test_loss": 5.234876950836181, "test_acc": 0.0688, "lyapunov": null, "grad_norm": 0.5523560840003197, "grad_max_sv": 0.18005239982157945, "grad_min_sv": 9.93911985318341e-09, "grad_condition": 91354773.39239445, "lr": 0.00028711035421746345, "time_sec": 49.84577131271362 }, { "epoch": 97, "train_loss": 3.3812893244171143, "train_acc": 0.19184, "test_loss": 4.862454182434082, "test_acc": 0.077, "lyapunov": null, "grad_norm": 0.5636212270422577, "grad_max_sv": 0.18343333192169667, "grad_min_sv": 1.0359513497038009e-08, "grad_condition": 20784291.458693452, "lr": 0.00027768241040753615, "time_sec": 49.83091354370117 }, { "epoch": 98, "train_loss": 3.179550113220215, "train_acc": 0.2255, "test_loss": 4.858168863677979, "test_acc": 0.0807, "lyapunov": null, "grad_norm": 0.5839200776735536, "grad_max_sv": 0.18244810923933982, "grad_min_sv": 1.037966059214135e-08, "grad_condition": 22427331.372158233, "lr": 0.00026835198244006903, "time_sec": 49.867558002471924 }, { "epoch": 99, "train_loss": 3.02292495223999, "train_acc": 0.25396, "test_loss": 5.169387593078613, "test_acc": 0.0881, "lyapunov": null, "grad_norm": 0.595907429260728, "grad_max_sv": 0.1938932089135051, "grad_min_sv": 1.105600735823442e-08, "grad_condition": 39890639.04859903, "lr": 0.0002591231629491421, "time_sec": 49.82200026512146 }, { "epoch": 100, "train_loss": 2.9043469207000734, "train_acc": 0.27584, "test_loss": 4.884814841461182, "test_acc": 0.0989, "lyapunov": null, "grad_norm": 0.5987053513470115, "grad_max_sv": 0.1915395434945822, "grad_min_sv": 1.0967718520123356e-08, "grad_condition": 507391317.2637795, "lr": 0.0002499999999999997, "time_sec": 49.835878133773804 }, { "epoch": 101, "train_loss": 2.8044686096191405, "train_acc": 0.29558, "test_loss": 4.889270275497436, "test_acc": 0.0981, "lyapunov": null, "grad_norm": 0.6096838460034203, "grad_max_sv": 0.20316330213099718, "grad_min_sv": 1.1341824002197854e-08, "grad_condition": 19853325.836087834, "lr": 0.00024098649531343477, "time_sec": 49.85874676704407 }, { "epoch": 102, "train_loss": 2.697149913482666, "train_acc": 0.3167, "test_loss": 4.92620325088501, "test_acc": 0.1009, "lyapunov": null, "grad_norm": 0.6154909980411829, "grad_max_sv": 0.20256872698664666, "grad_min_sv": 1.1648207248748933e-08, "grad_condition": 19320886.90158599, "lr": 0.0002320866025105016, "time_sec": 50.07639527320862 }, { "epoch": 103, "train_loss": 2.618629614944458, "train_acc": 0.33036, "test_loss": 5.49400161895752, "test_acc": 0.1068, "lyapunov": null, "grad_norm": 0.6217563116117207, "grad_max_sv": 0.20746214482933284, "grad_min_sv": 1.1507716859981975e-08, "grad_condition": 25949652.78149998, "lr": 0.0002233042253783278, "time_sec": 49.818949460983276 }, { "epoch": 104, "train_loss": 2.540534757156372, "train_acc": 0.34564, "test_loss": 4.9159078086853025, "test_acc": 0.1126, "lyapunov": null, "grad_norm": 0.6217698336501172, "grad_max_sv": 0.20552988573908806, "grad_min_sv": 1.1522777731975964e-08, "grad_condition": 21899890.551626954, "lr": 0.000214643216157784, "time_sec": 49.87585234642029 }, { "epoch": 105, "train_loss": 2.479596985321045, "train_acc": 0.35746, "test_loss": 5.100056993484497, "test_acc": 0.1253, "lyapunov": null, "grad_norm": 0.6287156405132894, "grad_max_sv": 0.2140802226960659, "grad_min_sv": 1.1805095190275949e-08, "grad_condition": 26208309.323742133, "lr": 0.00020610737385376332, "time_sec": 49.82085204124451 }, { "epoch": 106, "train_loss": 2.415481425552368, "train_acc": 0.36924, "test_loss": 4.742834524536133, "test_acc": 0.1225, "lyapunov": null, "grad_norm": 0.6282670457594898, "grad_max_sv": 0.21101173125207423, "grad_min_sv": 1.1938832567004453e-08, "grad_condition": 33782298.89931901, "lr": 0.00019770044256881242, "time_sec": 49.805906534194946 }, { "epoch": 107, "train_loss": 2.3521559171295165, "train_acc": 0.38442, "test_loss": 5.213879206848144, "test_acc": 0.1211, "lyapunov": null, "grad_norm": 0.6335700941216259, "grad_max_sv": 0.21410419717431067, "grad_min_sv": 1.1941749475385954e-08, "grad_condition": 22110752.957356386, "lr": 0.0001894261098608447, "time_sec": 49.83317017555237 }, { "epoch": 108, "train_loss": 2.302857539215088, "train_acc": 0.39628, "test_loss": 5.207193740844726, "test_acc": 0.1285, "lyapunov": null, "grad_norm": 0.6359374602349686, "grad_max_sv": 0.21151717714965343, "grad_min_sv": 1.187537558844376e-08, "grad_condition": 37488925.60398644, "lr": 0.000181288005125655, "time_sec": 49.82870650291443 }, { "epoch": 109, "train_loss": 2.2536745275878904, "train_acc": 0.40138, "test_loss": 5.2042837226867675, "test_acc": 0.1322, "lyapunov": null, "grad_norm": 0.6289692207235398, "grad_max_sv": 0.20782952345907688, "grad_min_sv": 1.1739032497459779e-08, "grad_condition": 29358916.829315763, "lr": 0.0001732896980049473, "time_sec": 49.83245229721069 }, { "epoch": 110, "train_loss": 2.2073010168457032, "train_acc": 0.40866, "test_loss": 5.739359895324707, "test_acc": 0.1227, "lyapunov": null, "grad_norm": 0.6385992521842959, "grad_max_sv": 0.2127275388687849, "grad_min_sv": 1.1950131779958628e-08, "grad_condition": 28764337.97746384, "lr": 0.00016543469682057076, "time_sec": 49.83092474937439 }, { "epoch": 111, "train_loss": 2.1692623610687254, "train_acc": 0.41942, "test_loss": 6.2040216323852535, "test_acc": 0.1309, "lyapunov": null, "grad_norm": 0.6444316866103925, "grad_max_sv": 0.21499809809029102, "grad_min_sv": 1.1752886208693526e-08, "grad_condition": 31962706.67450107, "lr": 0.00015772644703565552, "time_sec": 49.85021710395813 }, { "epoch": 112, "train_loss": 2.1302712613677977, "train_acc": 0.42516, "test_loss": 5.75790121383667, "test_acc": 0.1399, "lyapunov": null, "grad_norm": 0.6329896331917518, "grad_max_sv": 0.21649966202676296, "grad_min_sv": 1.2179612900176106e-08, "grad_condition": 34093436.46700279, "lr": 0.00015016832974331713, "time_sec": 49.81994557380676 }, { "epoch": 113, "train_loss": 2.1065593459701537, "train_acc": 0.43386, "test_loss": 6.140606423950195, "test_acc": 0.1364, "lyapunov": null, "grad_norm": 0.6373030825503643, "grad_max_sv": 0.2152324143797159, "grad_min_sv": 1.191059096350422e-08, "grad_condition": 24786528.45697539, "lr": 0.00014276366018359834, "time_sec": 49.832173347473145 }, { "epoch": 114, "train_loss": 2.0826868451690674, "train_acc": 0.43754, "test_loss": 7.314329501342773, "test_acc": 0.1193, "lyapunov": null, "grad_norm": 0.6350963671857877, "grad_max_sv": 0.2231900453567505, "grad_min_sv": 1.2137735866390998e-08, "grad_condition": 27948227.054936886, "lr": 0.00013551568628929425, "time_sec": 49.82054424285889 }, { "epoch": 115, "train_loss": 2.057500901184082, "train_acc": 0.44596, "test_loss": 5.995877742004395, "test_acc": 0.1372, "lyapunov": null, "grad_norm": 0.6319121818844147, "grad_max_sv": 0.2083717118948698, "grad_min_sv": 1.1799914823723556e-08, "grad_condition": 35488295.07860346, "lr": 0.00012842758726130276, "time_sec": 49.81160569190979 }, { "epoch": 116, "train_loss": 2.027409094619751, "train_acc": 0.452, "test_loss": 7.286285119628906, "test_acc": 0.122, "lyapunov": null, "grad_norm": 0.639785065376269, "grad_max_sv": 0.2164283238351345, "grad_min_sv": 1.1941236867721305e-08, "grad_condition": 66360354.77809191, "lr": 0.0001215024721741218, "time_sec": 49.836623191833496 }, { "epoch": 117, "train_loss": 1.998638267250061, "train_acc": 0.45694, "test_loss": 6.76222890625, "test_acc": 0.1205, "lyapunov": null, "grad_norm": 0.6411689060332757, "grad_max_sv": 0.21728002466261387, "grad_min_sv": 1.186145185405607e-08, "grad_condition": 25472303.080288395, "lr": 0.00011474337861210538, "time_sec": 49.835474252700806 }, { "epoch": 118, "train_loss": 1.9871974803924561, "train_acc": 0.46078, "test_loss": 6.990749812316895, "test_acc": 0.1306, "lyapunov": null, "grad_norm": 0.6401613879770299, "grad_max_sv": 0.21996232829988002, "grad_min_sv": 1.212309715947768e-08, "grad_condition": 43599185.89621965, "lr": 0.00010815327133708009, "time_sec": 49.82992196083069 }, { "epoch": 119, "train_loss": 1.9558954917144775, "train_acc": 0.46806, "test_loss": 6.338745205688476, "test_acc": 0.1423, "lyapunov": null, "grad_norm": 0.6380666956188763, "grad_max_sv": 0.21726358123123646, "grad_min_sv": 1.1924941875629536e-08, "grad_condition": 23332267.546088994, "lr": 0.00010173504098790182, "time_sec": 49.8153715133667 }, { "epoch": 120, "train_loss": 1.9510743766784668, "train_acc": 0.46974, "test_loss": 6.733411245727539, "test_acc": 0.1243, "lyapunov": null, "grad_norm": 0.6418284890195846, "grad_max_sv": 0.22671268545091153, "grad_min_sv": 1.199444485400214e-08, "grad_condition": 24711059.275352217, "lr": 9.549150281252629e-05, "time_sec": 49.81182289123535 }, { "epoch": 121, "train_loss": 1.9362508995819092, "train_acc": 0.47356, "test_loss": 6.134232345581054, "test_acc": 0.1378, "lyapunov": null, "grad_norm": 0.6346296231277031, "grad_max_sv": 0.21598901376128196, "grad_min_sv": 1.1970328496480053e-08, "grad_condition": 25346274.751641985, "lr": 8.942539543314794e-05, "time_sec": 49.83584427833557 }, { "epoch": 122, "train_loss": 1.9162643937683106, "train_acc": 0.4749, "test_loss": 7.639575733947754, "test_acc": 0.1265, "lyapunov": null, "grad_norm": 0.6378739210927734, "grad_max_sv": 0.21739229559898376, "grad_min_sv": 1.1819409628278932e-08, "grad_condition": 181332693.33855394, "lr": 8.353937964495024e-05, "time_sec": 49.82065296173096 }, { "epoch": 123, "train_loss": 1.9041280354309083, "train_acc": 0.47994, "test_loss": 6.308480444335937, "test_acc": 0.1392, "lyapunov": null, "grad_norm": 0.6332843460906636, "grad_max_sv": 0.21474863290786744, "grad_min_sv": 1.1848325226493373e-08, "grad_condition": 30395117.45243178, "lr": 7.783603724899243e-05, "time_sec": 49.83568549156189 }, { "epoch": 124, "train_loss": 1.888980817489624, "train_acc": 0.48018, "test_loss": 6.931203792572021, "test_acc": 0.1361, "lyapunov": null, "grad_norm": 0.6468989904611825, "grad_max_sv": 0.22639431655406952, "grad_min_sv": 1.2179835734427157e-08, "grad_condition": 27031913.997842442, "lr": 7.231786991974666e-05, "time_sec": 49.86228370666504 }, { "epoch": 125, "train_loss": 1.8688794164657592, "train_acc": 0.48822, "test_loss": 7.4782632530212405, "test_acc": 0.132, "lyapunov": null, "grad_norm": 0.6436381282742432, "grad_max_sv": 0.21808561868965626, "grad_min_sv": 1.21570175322383e-08, "grad_condition": 33380104.6057067, "lr": 6.698729810778072e-05, "time_sec": 49.83109521865845 }, { "epoch": 126, "train_loss": 1.8640016136932374, "train_acc": 0.491, "test_loss": 6.5455432174682615, "test_acc": 0.1403, "lyapunov": null, "grad_norm": 0.6367336212592833, "grad_max_sv": 0.22216320559382438, "grad_min_sv": 1.1826145895899032e-08, "grad_condition": 33022831.75443542, "lr": 6.184665997806817e-05, "time_sec": 49.83457159996033 }, { "epoch": 127, "train_loss": 1.8510954288101196, "train_acc": 0.4882, "test_loss": 7.0682084793090825, "test_acc": 0.1326, "lyapunov": null, "grad_norm": 0.6431259646730736, "grad_max_sv": 0.22209820635616778, "grad_min_sv": 1.2136436526935524e-08, "grad_condition": 66497220.94224206, "lr": 5.6898210384392595e-05, "time_sec": 49.83670258522034 }, { "epoch": 128, "train_loss": 1.8453027178573609, "train_acc": 0.49042, "test_loss": 6.2842555938720706, "test_acc": 0.1305, "lyapunov": null, "grad_norm": 0.6383805845227949, "grad_max_sv": 0.21130143105983734, "grad_min_sv": 1.1917887206280842e-08, "grad_condition": 43204631.05359116, "lr": 5.214411988029363e-05, "time_sec": 49.81800961494446 }, { "epoch": 129, "train_loss": 1.8346676333618164, "train_acc": 0.4945, "test_loss": 6.274330713653565, "test_acc": 0.1391, "lyapunov": null, "grad_norm": 0.6376052549176046, "grad_max_sv": 0.2089413482695818, "grad_min_sv": 1.1727769512470676e-08, "grad_condition": 27159660.544945084, "lr": 4.7586473766990294e-05, "time_sec": 49.845595598220825 }, { "epoch": 130, "train_loss": 1.830022028465271, "train_acc": 0.49474, "test_loss": 6.249729978942871, "test_acc": 0.1459, "lyapunov": null, "grad_norm": 0.6453711202585213, "grad_max_sv": 0.2190984409302473, "grad_min_sv": 1.2224324771881178e-08, "grad_condition": 22960059.51271691, "lr": 4.32272711786996e-05, "time_sec": 49.87020516395569 }, { "epoch": 131, "train_loss": 1.8177084483337402, "train_acc": 0.49802, "test_loss": 6.943641340637207, "test_acc": 0.1332, "lyapunov": null, "grad_norm": 0.6440523788025603, "grad_max_sv": 0.21554723903536796, "grad_min_sv": 1.1872820722402811e-08, "grad_condition": 25176936.12047171, "lr": 3.906842420574966e-05, "time_sec": 49.89444398880005 }, { "epoch": 132, "train_loss": 1.8117612997817993, "train_acc": 0.4992, "test_loss": 7.735134202575684, "test_acc": 0.1244, "lyapunov": null, "grad_norm": 0.6458623734804945, "grad_max_sv": 0.2287333384156227, "grad_min_sv": 1.2116058153988085e-08, "grad_condition": 23082329.335862808, "lr": 3.5111757055874305e-05, "time_sec": 49.84588980674744 }, { "epoch": 133, "train_loss": 1.811845332069397, "train_acc": 0.50014, "test_loss": 7.118609297180176, "test_acc": 0.1331, "lyapunov": null, "grad_norm": 0.638841020277806, "grad_max_sv": 0.21471160911023618, "grad_min_sv": 1.1894429352565794e-08, "grad_condition": 24148328.84591496, "lr": 3.1359005254054254e-05, "time_sec": 49.831459283828735 }, { "epoch": 134, "train_loss": 1.8001032112121582, "train_acc": 0.50294, "test_loss": 7.107429740142822, "test_acc": 0.1282, "lyapunov": null, "grad_norm": 0.6464497671620558, "grad_max_sv": 0.23182750679552555, "grad_min_sv": 1.2161121044212964e-08, "grad_condition": 54577461.874021314, "lr": 2.7811814881259484e-05, "time_sec": 49.83904433250427 }, { "epoch": 135, "train_loss": 1.7929331283569336, "train_acc": 0.50366, "test_loss": 7.344893767547608, "test_acc": 0.1271, "lyapunov": null, "grad_norm": 0.6435222264694869, "grad_max_sv": 0.2192435622215271, "grad_min_sv": 1.2271505814287487e-08, "grad_condition": 22236846.49951817, "lr": 2.4471741852423218e-05, "time_sec": 49.82794523239136 }, { "epoch": 136, "train_loss": 1.8045927509307862, "train_acc": 0.49886, "test_loss": 8.085471559143066, "test_acc": 0.1207, "lyapunov": null, "grad_norm": 0.6382347842581513, "grad_max_sv": 0.22427703253924847, "grad_min_sv": 1.216163273837223e-08, "grad_condition": 28207277.011594873, "lr": 2.1340251233966362e-05, "time_sec": 49.88175678253174 }, { "epoch": 137, "train_loss": 1.7832990637588502, "train_acc": 0.50496, "test_loss": 6.688453459167481, "test_acc": 0.1334, "lyapunov": null, "grad_norm": 0.6418151086385053, "grad_max_sv": 0.21794002875685692, "grad_min_sv": 1.2034389010318058e-08, "grad_condition": 22793569.96555335, "lr": 1.8418716601170932e-05, "time_sec": 49.84071898460388 }, { "epoch": 138, "train_loss": 1.7905620854187012, "train_acc": 0.50572, "test_loss": 7.2380154365539555, "test_acc": 0.129, "lyapunov": null, "grad_norm": 0.6407824951102813, "grad_max_sv": 0.22645330876111985, "grad_min_sv": 1.2214871658589033e-08, "grad_condition": 20569116.284954578, "lr": 1.570841943568445e-05, "time_sec": 49.84640121459961 }, { "epoch": 139, "train_loss": 1.788800776901245, "train_acc": 0.50604, "test_loss": 7.676028425598145, "test_acc": 0.1308, "lyapunov": null, "grad_norm": 0.6393065831907885, "grad_max_sv": 0.2201111435890198, "grad_min_sv": 1.206703041933821e-08, "grad_condition": 28068636.701712035, "lr": 1.3210548563419845e-05, "time_sec": 49.82333970069885 }, { "epoch": 140, "train_loss": 1.7775352002334595, "train_acc": 0.50992, "test_loss": 6.824903617858887, "test_acc": 0.1382, "lyapunov": null, "grad_norm": 0.6429938723422318, "grad_max_sv": 0.21460832096636295, "grad_min_sv": 1.17411291786218e-08, "grad_condition": 31960287.943684638, "lr": 1.0926199633097203e-05, "time_sec": 49.83107376098633 }, { "epoch": 141, "train_loss": 1.7772767013931274, "train_acc": 0.50912, "test_loss": 8.417906446838378, "test_acc": 0.1201, "lyapunov": null, "grad_norm": 0.6414560412377437, "grad_max_sv": 0.22789728231728076, "grad_min_sv": 1.2347990069327964e-08, "grad_condition": 21519591.2698054, "lr": 8.856374635655688e-06, "time_sec": 49.830055475234985 }, { "epoch": 142, "train_loss": 1.7722079333496095, "train_acc": 0.5074, "test_loss": 7.479126264190674, "test_acc": 0.1332, "lyapunov": null, "grad_norm": 0.6492349389016402, "grad_max_sv": 0.23224957659840584, "grad_min_sv": 1.2359584963816949e-08, "grad_condition": 23310731.56809649, "lr": 7.001981464747503e-06, "time_sec": 49.821824073791504 }, { "epoch": 143, "train_loss": 1.7706715833282471, "train_acc": 0.50882, "test_loss": 6.759830638885498, "test_acc": 0.1312, "lyapunov": null, "grad_norm": 0.6386303224852788, "grad_max_sv": 0.21973421648144723, "grad_min_sv": 1.2129359658330508e-08, "grad_condition": 22303453.162939433, "lr": 5.3638335185058295e-06, "time_sec": 49.82608699798584 }, { "epoch": 144, "train_loss": 1.770061126937866, "train_acc": 0.51042, "test_loss": 8.168591398620606, "test_acc": 0.1265, "lyapunov": null, "grad_norm": 0.6443170070907279, "grad_max_sv": 0.22507050447165966, "grad_min_sv": 1.2152392936393141e-08, "grad_condition": 22873019.852206793, "lr": 3.942649342761114e-06, "time_sec": 49.8205029964447 }, { "epoch": 145, "train_loss": 1.7649179027938844, "train_acc": 0.509, "test_loss": 7.854398386383057, "test_acc": 0.1211, "lyapunov": null, "grad_norm": 0.63938639247204, "grad_max_sv": 0.22039102129638194, "grad_min_sv": 1.1966107968386375e-08, "grad_condition": 29791248.29023991, "lr": 2.7390523158633524e-06, "time_sec": 49.8352313041687 }, { "epoch": 146, "train_loss": 1.771636342201233, "train_acc": 0.50926, "test_loss": 7.595294637298584, "test_acc": 0.1263, "lyapunov": null, "grad_norm": 0.6439134858087602, "grad_max_sv": 0.22073593139648437, "grad_min_sv": 1.1903592189027589e-08, "grad_condition": 36630674.258442916, "lr": 1.7535703752478133e-06, "time_sec": 49.85316801071167 }, { "epoch": 147, "train_loss": 1.7654109023666382, "train_acc": 0.50992, "test_loss": 7.858496125793457, "test_acc": 0.1228, "lyapunov": null, "grad_norm": 0.6452120448477214, "grad_max_sv": 0.21640395522117614, "grad_min_sv": 1.1791314735720703e-08, "grad_condition": 36184836.96072569, "lr": 9.866357858642196e-07, "time_sec": 49.80920720100403 }, { "epoch": 148, "train_loss": 1.76628436378479, "train_acc": 0.50766, "test_loss": 8.274021264648438, "test_acc": 0.1088, "lyapunov": null, "grad_norm": 0.6448148716908921, "grad_max_sv": 0.22330073527991773, "grad_min_sv": 1.2051270137369841e-08, "grad_condition": 21403660.781028073, "lr": 4.38584950570808e-07, "time_sec": 49.84639763832092 }, { "epoch": 149, "train_loss": 1.7641568323135377, "train_acc": 0.50932, "test_loss": 7.1706701782226565, "test_acc": 0.1418, "lyapunov": null, "grad_norm": 0.6419761185100763, "grad_max_sv": 0.22420972734689712, "grad_min_sv": 1.2012330221494726e-08, "grad_condition": 44951323.39984313, "lr": 1.096582625772501e-07, "time_sec": 49.835381269454956 }, { "epoch": 150, "train_loss": 1.7616498372650147, "train_acc": 0.51152, "test_loss": 7.837383623504639, "test_acc": 0.1182, "lyapunov": null, "grad_norm": 0.6426676505435569, "grad_max_sv": 0.21811567358672618, "grad_min_sv": 1.1744335026014906e-08, "grad_condition": 40653937.072005436, "lr": 0.0, "time_sec": 49.85364270210266 } ], "16": [ { "epoch": 1, "train_loss": 4.790666111755371, "train_acc": 0.0165, "test_loss": 4.9503300064086915, "test_acc": 0.01, "lyapunov": null, "grad_norm": 5.291697588876432, "grad_max_sv": 4.663330984115601, "grad_min_sv": 7.994122603882659e-08, "grad_condition": 204227559.8068969, "lr": 0.0009998903417374227, "time_sec": 66.97809171676636 }, { "epoch": 2, "train_loss": 4.437635167236328, "train_acc": 0.03372, "test_loss": 4.9434486038208005, "test_acc": 0.0109, "lyapunov": null, "grad_norm": 3.3795440241281205, "grad_max_sv": 2.9110051512718202, "grad_min_sv": 5.2089944511252154e-08, "grad_condition": 566186137.812573, "lr": 0.0009995614150494292, "time_sec": 66.91377472877502 }, { "epoch": 3, "train_loss": 4.26833670211792, "train_acc": 0.04816, "test_loss": 4.993957643127441, "test_acc": 0.0118, "lyapunov": null, "grad_norm": 2.265691942587348, "grad_max_sv": 1.775827443599701, "grad_min_sv": 3.447322165783806e-08, "grad_condition": 193597124.56597418, "lr": 0.0009990133642141358, "time_sec": 66.95397591590881 }, { "epoch": 4, "train_loss": 4.126825766448975, "train_acc": 0.0657, "test_loss": 5.033058495330811, "test_acc": 0.0133, "lyapunov": null, "grad_norm": 1.503639209245557, "grad_max_sv": 0.996296688914299, "grad_min_sv": 2.3224798484378083e-08, "grad_condition": 47352815.280070126, "lr": 0.0009982464296247522, "time_sec": 66.94082856178284 }, { "epoch": 5, "train_loss": 4.033032944335938, "train_acc": 0.07788, "test_loss": 5.366096397399902, "test_acc": 0.0146, "lyapunov": null, "grad_norm": 1.2167707155197347, "grad_max_sv": 0.7315087422728539, "grad_min_sv": 1.914776174977151e-08, "grad_condition": 65647468.63073953, "lr": 0.0009972609476841367, "time_sec": 66.9649748802185 }, { "epoch": 6, "train_loss": 3.9636214042663576, "train_acc": 0.08816, "test_loss": 5.34757041015625, "test_acc": 0.0149, "lyapunov": null, "grad_norm": 1.109160273746945, "grad_max_sv": 0.6089150205254554, "grad_min_sv": 1.7710445950058773e-08, "grad_condition": 77884060.5331116, "lr": 0.000996057350657239, "time_sec": 66.97061657905579 }, { "epoch": 7, "train_loss": 3.9122159162902834, "train_acc": 0.09544, "test_loss": 5.439447886657715, "test_acc": 0.013, "lyapunov": null, "grad_norm": 1.0363457541084344, "grad_max_sv": 0.5376138880848884, "grad_min_sv": 1.6374132377761085e-08, "grad_condition": 48186425.879532695, "lr": 0.000994636166481494, "time_sec": 67.02947664260864 }, { "epoch": 8, "train_loss": 3.860605283126831, "train_acc": 0.10604, "test_loss": 5.774677875518798, "test_acc": 0.0152, "lyapunov": null, "grad_norm": 0.9855402112805093, "grad_max_sv": 0.5275192707777023, "grad_min_sv": 1.6650217127267554e-08, "grad_condition": 36767266.40486912, "lr": 0.0009929980185352525, "time_sec": 66.97124218940735 }, { "epoch": 9, "train_loss": 3.8149237147521973, "train_acc": 0.11454, "test_loss": 5.3070202072143555, "test_acc": 0.0222, "lyapunov": null, "grad_norm": 0.9330412728543993, "grad_max_sv": 0.4647836610674858, "grad_min_sv": 1.5222168972539585e-08, "grad_condition": 49307207.804101914, "lr": 0.0009911436253643444, "time_sec": 67.01966977119446 }, { "epoch": 10, "train_loss": 3.7818530071258545, "train_acc": 0.12014, "test_loss": 5.634545847320557, "test_acc": 0.0199, "lyapunov": null, "grad_norm": 0.8719008089031304, "grad_max_sv": 0.40649077892303465, "grad_min_sv": 1.4515182727992126e-08, "grad_condition": 38341756.409908436, "lr": 0.0009890738003669028, "time_sec": 67.23870015144348 }, { "epoch": 11, "train_loss": 3.743896211090088, "train_acc": 0.12462, "test_loss": 5.8831702270507815, "test_acc": 0.0241, "lyapunov": null, "grad_norm": 0.8436698179223415, "grad_max_sv": 0.39998230785131456, "grad_min_sv": 1.4137996530785845e-08, "grad_condition": 231359110.35725895, "lr": 0.00098678945143658, "time_sec": 67.23693895339966 }, { "epoch": 12, "train_loss": 3.7158116050720214, "train_acc": 0.12962, "test_loss": 5.8489625442504884, "test_acc": 0.0182, "lyapunov": null, "grad_norm": 0.8103156188684312, "grad_max_sv": 0.36918022111058235, "grad_min_sv": 1.3637384886633352e-08, "grad_condition": 38409273.56149448, "lr": 0.0009842915805643154, "time_sec": 67.05321264266968 }, { "epoch": 13, "train_loss": 3.690355722808838, "train_acc": 0.13444, "test_loss": 5.952298941802979, "test_acc": 0.0139, "lyapunov": null, "grad_norm": 0.7799393076966175, "grad_max_sv": 0.3450939729809761, "grad_min_sv": 1.3063578439224261e-08, "grad_condition": 267805312.78349906, "lr": 0.000981581283398829, "time_sec": 67.01498341560364 }, { "epoch": 14, "train_loss": 3.660913709640503, "train_acc": 0.13974, "test_loss": 5.962563812255859, "test_acc": 0.0157, "lyapunov": null, "grad_norm": 0.7562346727823589, "grad_max_sv": 0.3272464439272881, "grad_min_sv": 1.2569073787327411e-08, "grad_condition": 28603602.411010243, "lr": 0.0009786597487660333, "time_sec": 67.02658581733704 }, { "epoch": 15, "train_loss": 3.6474139246368407, "train_acc": 0.14148, "test_loss": 6.562283952331543, "test_acc": 0.0135, "lyapunov": null, "grad_norm": 0.7393349403998549, "grad_max_sv": 0.33356437757611274, "grad_min_sv": 1.2411575255055763e-08, "grad_condition": 43624327.61961842, "lr": 0.0009755282581475766, "time_sec": 67.03324222564697 }, { "epoch": 16, "train_loss": 3.625168949737549, "train_acc": 0.1432, "test_loss": 6.292130155944824, "test_acc": 0.0141, "lyapunov": null, "grad_norm": 0.7144248820011195, "grad_max_sv": 0.31020588912069796, "grad_min_sv": 1.2080284056414925e-08, "grad_condition": 29549483.252300274, "lr": 0.0009721881851187403, "time_sec": 66.97783041000366 }, { "epoch": 17, "train_loss": 3.597680552520752, "train_acc": 0.14858, "test_loss": 6.235865226745606, "test_acc": 0.0101, "lyapunov": null, "grad_norm": 0.6905264720289787, "grad_max_sv": 0.2911532886326313, "grad_min_sv": 1.1886577161446255e-08, "grad_condition": 31227215.280764975, "lr": 0.0009686409947459456, "time_sec": 67.08970355987549 }, { "epoch": 18, "train_loss": 3.5831439966583254, "train_acc": 0.1503, "test_loss": 5.975571099853515, "test_acc": 0.0174, "lyapunov": null, "grad_norm": 0.6807202195385632, "grad_max_sv": 0.28772652372717855, "grad_min_sv": 1.1393226486029751e-08, "grad_condition": 137655636.45168823, "lr": 0.0009648882429441254, "time_sec": 66.99836611747742 }, { "epoch": 19, "train_loss": 3.5665633306121824, "train_acc": 0.15322, "test_loss": 5.7967665618896485, "test_acc": 0.0147, "lyapunov": null, "grad_norm": 0.6692239217191613, "grad_max_sv": 0.289702807366848, "grad_min_sv": 1.1524174722138403e-08, "grad_condition": 43837157.90767797, "lr": 0.00096093157579425, "time_sec": 66.98469638824463 }, { "epoch": 20, "train_loss": 3.5485270121765136, "train_acc": 0.15842, "test_loss": 6.38743748626709, "test_acc": 0.0106, "lyapunov": null, "grad_norm": 0.6524234858247975, "grad_max_sv": 0.2710107877850533, "grad_min_sv": 1.1343318032097648e-08, "grad_condition": 27194748.912352692, "lr": 0.0009567727288213001, "time_sec": 66.97950530052185 }, { "epoch": 21, "train_loss": 3.5387647283172607, "train_acc": 0.15974, "test_loss": 6.142497198486328, "test_acc": 0.0122, "lyapunov": null, "grad_norm": 0.6404971752730705, "grad_max_sv": 0.25612146519124507, "grad_min_sv": 1.1065940866417101e-08, "grad_condition": 27020698.902072392, "lr": 0.0009524135262330095, "time_sec": 67.06527757644653 }, { "epoch": 22, "train_loss": 3.5167810900115968, "train_acc": 0.16126, "test_loss": 5.6688673957824705, "test_acc": 0.0192, "lyapunov": null, "grad_norm": 0.6273838486372684, "grad_max_sv": 0.253273681178689, "grad_min_sv": 1.0633086347869302e-08, "grad_condition": 63663927.521495186, "lr": 0.0009478558801197061, "time_sec": 67.08625936508179 }, { "epoch": 23, "train_loss": 3.505348560180664, "train_acc": 0.16408, "test_loss": 6.704450527191162, "test_acc": 0.0106, "lyapunov": null, "grad_norm": 0.6205013434735249, "grad_max_sv": 0.24795704074203967, "grad_min_sv": 1.0544875683748956e-08, "grad_condition": 26930900.301938236, "lr": 0.000943101789615607, "time_sec": 67.07537865638733 }, { "epoch": 24, "train_loss": 3.487646808624268, "train_acc": 0.16852, "test_loss": 6.14088282699585, "test_acc": 0.0215, "lyapunov": null, "grad_norm": 0.614195126220202, "grad_max_sv": 0.24658647775650025, "grad_min_sv": 1.0614721224211365e-08, "grad_condition": 25409602.645818073, "lr": 0.0009381533400219313, "time_sec": 67.04035305976868 }, { "epoch": 25, "train_loss": 3.476624384918213, "train_acc": 0.16722, "test_loss": 6.3985797378540035, "test_acc": 0.0153, "lyapunov": null, "grad_norm": 0.6065663518942211, "grad_max_sv": 0.24001154042780398, "grad_min_sv": 1.0449337081719356e-08, "grad_condition": 26892625.00106412, "lr": 0.0009330127018922189, "time_sec": 66.98434329032898 }, { "epoch": 26, "train_loss": 3.451528890914917, "train_acc": 0.17194, "test_loss": 7.005337218475342, "test_acc": 0.0161, "lyapunov": null, "grad_norm": 0.5958316341461533, "grad_max_sv": 0.23011010847985744, "grad_min_sv": 1.0420057322546583e-08, "grad_condition": 25092916.983647533, "lr": 0.000927682130080253, "time_sec": 67.00863981246948 }, { "epoch": 27, "train_loss": 3.438732011184692, "train_acc": 0.17512, "test_loss": 6.713776673126221, "test_acc": 0.0158, "lyapunov": null, "grad_norm": 0.5885432606585439, "grad_max_sv": 0.22313685715198517, "grad_min_sv": 1.0256330273961112e-08, "grad_condition": 25498257.67463268, "lr": 0.0009221639627510072, "time_sec": 66.99373292922974 }, { "epoch": 28, "train_loss": 3.425728820877075, "train_acc": 0.17648, "test_loss": 6.706079711914063, "test_acc": 0.0161, "lyapunov": null, "grad_norm": 0.5776306796513797, "grad_max_sv": 0.21763003207743167, "grad_min_sv": 1.0131521277489953e-08, "grad_condition": 25502860.727228213, "lr": 0.0009164606203550494, "time_sec": 66.99960255622864 }, { "epoch": 29, "train_loss": 3.415288860321045, "train_acc": 0.18104, "test_loss": 7.00422691116333, "test_acc": 0.0154, "lyapunov": null, "grad_norm": 0.5811456709025584, "grad_max_sv": 0.2154564827680588, "grad_min_sv": 1.0227832727971453e-08, "grad_condition": 23155291.155594237, "lr": 0.0009105746045668516, "time_sec": 67.00278520584106 }, { "epoch": 30, "train_loss": 3.3993768449401855, "train_acc": 0.18168, "test_loss": 6.7661912048339845, "test_acc": 0.0159, "lyapunov": null, "grad_norm": 0.5774334611780905, "grad_max_sv": 0.21602067165076733, "grad_min_sv": 9.999383252662363e-09, "grad_condition": 46830102.49335132, "lr": 0.0009045084971874733, "time_sec": 67.01802110671997 }, { "epoch": 31, "train_loss": 3.39102335395813, "train_acc": 0.183, "test_loss": 6.575534628295898, "test_acc": 0.0259, "lyapunov": null, "grad_norm": 0.5750391869831528, "grad_max_sv": 0.21328589245676993, "grad_min_sv": 1.0037052611266972e-08, "grad_condition": 25219793.844095282, "lr": 0.0008982649590120977, "time_sec": 66.98685121536255 }, { "epoch": 32, "train_loss": 3.3709024705505373, "train_acc": 0.1847, "test_loss": 6.773156211090088, "test_acc": 0.0241, "lyapunov": null, "grad_norm": 0.5682008127495727, "grad_max_sv": 0.20905940011143684, "grad_min_sv": 9.929261479690864e-09, "grad_condition": 24026442.614084087, "lr": 0.0008918467286629196, "time_sec": 66.98118853569031 }, { "epoch": 33, "train_loss": 3.35322883605957, "train_acc": 0.19048, "test_loss": 6.544390415191651, "test_acc": 0.0174, "lyapunov": null, "grad_norm": 0.5641011790857979, "grad_max_sv": 0.21131759136915207, "grad_min_sv": 9.970292436448092e-09, "grad_condition": 108439933.80954358, "lr": 0.0008852566213878943, "time_sec": 67.0021116733551 }, { "epoch": 34, "train_loss": 3.346888256225586, "train_acc": 0.1906, "test_loss": 6.572783890533447, "test_acc": 0.0249, "lyapunov": null, "grad_norm": 0.5631657519504247, "grad_max_sv": 0.20612632147967816, "grad_min_sv": 9.939895384558639e-09, "grad_condition": 27859013.00420784, "lr": 0.000878497527825878, "time_sec": 66.99292349815369 }, { "epoch": 35, "train_loss": 3.3364852532958986, "train_acc": 0.19192, "test_loss": 6.624941380310059, "test_acc": 0.0267, "lyapunov": null, "grad_norm": 0.5605769760458655, "grad_max_sv": 0.20491612255573272, "grad_min_sv": 9.870486683549728e-09, "grad_condition": 23146292.907969765, "lr": 0.000871572412738697, "time_sec": 66.99680066108704 }, { "epoch": 36, "train_loss": 3.3320838648986815, "train_acc": 0.19194, "test_loss": 6.509025389099121, "test_acc": 0.0338, "lyapunov": null, "grad_norm": 0.5514752672797416, "grad_max_sv": 0.19631769321858883, "grad_min_sv": 9.801347783389147e-09, "grad_condition": 22925424.744912885, "lr": 0.0008644843137107055, "time_sec": 67.00271224975586 }, { "epoch": 37, "train_loss": 3.3248722314453123, "train_acc": 0.19368, "test_loss": 6.660050495910644, "test_acc": 0.0232, "lyapunov": null, "grad_norm": 0.5549782000253485, "grad_max_sv": 0.20016637705266477, "grad_min_sv": 9.80520761806325e-09, "grad_condition": 43150496.42441137, "lr": 0.0008572363398164014, "time_sec": 67.00392818450928 }, { "epoch": 38, "train_loss": 3.3040303685760497, "train_acc": 0.1978, "test_loss": 6.438115409851074, "test_acc": 0.0278, "lyapunov": null, "grad_norm": 0.552679160616354, "grad_max_sv": 0.20150073878467084, "grad_min_sv": 9.978901688301178e-09, "grad_condition": 24404614.851154737, "lr": 0.0008498316702566826, "time_sec": 66.97884392738342 }, { "epoch": 39, "train_loss": 3.295093801422119, "train_acc": 0.2004, "test_loss": 6.857768655395508, "test_acc": 0.0356, "lyapunov": null, "grad_norm": 0.5456414300888803, "grad_max_sv": 0.19542820267379285, "grad_min_sv": 9.64108341980352e-09, "grad_condition": 38418267.99625971, "lr": 0.0008422735529643442, "time_sec": 66.989262342453 }, { "epoch": 40, "train_loss": 3.2807973724365236, "train_acc": 0.20254, "test_loss": 7.183624605560302, "test_acc": 0.0288, "lyapunov": null, "grad_norm": 0.5502236317298648, "grad_max_sv": 0.20073941312730312, "grad_min_sv": 9.736421222039659e-09, "grad_condition": 23971099.963185668, "lr": 0.0008345653031794289, "time_sec": 67.05479025840759 }, { "epoch": 41, "train_loss": 3.27089994934082, "train_acc": 0.20396, "test_loss": 7.336966199493408, "test_acc": 0.0235, "lyapunov": null, "grad_norm": 0.5476662910413355, "grad_max_sv": 0.19763046652078628, "grad_min_sv": 9.775574641435192e-09, "grad_condition": 23640934.778466806, "lr": 0.0008267103019950526, "time_sec": 67.02259588241577 }, { "epoch": 42, "train_loss": 3.2620423323059082, "train_acc": 0.20586, "test_loss": 6.97865482788086, "test_acc": 0.0258, "lyapunov": null, "grad_norm": 0.5434507884263167, "grad_max_sv": 0.19267416559159756, "grad_min_sv": 9.676590862622846e-09, "grad_condition": 32692140.861607928, "lr": 0.0008187119948743447, "time_sec": 67.11938738822937 }, { "epoch": 43, "train_loss": 3.246746938018799, "train_acc": 0.20984, "test_loss": 7.017108020019531, "test_acc": 0.027, "lyapunov": null, "grad_norm": 0.5396772430481056, "grad_max_sv": 0.1911445375531912, "grad_min_sv": 9.706909992468482e-09, "grad_condition": 22347408.62738797, "lr": 0.000810573890139155, "time_sec": 67.11671566963196 }, { "epoch": 44, "train_loss": 3.2492278230285643, "train_acc": 0.20804, "test_loss": 6.893268182373047, "test_acc": 0.0274, "lyapunov": null, "grad_norm": 0.5383084022428465, "grad_max_sv": 0.18535939790308475, "grad_min_sv": 9.539425227522713e-09, "grad_condition": 74582506.47418927, "lr": 0.0008022995574311873, "time_sec": 67.00796937942505 }, { "epoch": 45, "train_loss": 3.2271074884796143, "train_acc": 0.2125, "test_loss": 6.6321695571899415, "test_acc": 0.0298, "lyapunov": null, "grad_norm": 0.5350882941371298, "grad_max_sv": 0.18614536896348, "grad_min_sv": 9.520675481561152e-09, "grad_condition": 519972815.1749519, "lr": 0.0007938926261462363, "time_sec": 67.05224251747131 }, { "epoch": 46, "train_loss": 3.223205012207031, "train_acc": 0.21378, "test_loss": 8.111690937805175, "test_acc": 0.0245, "lyapunov": null, "grad_norm": 0.5313315491107766, "grad_max_sv": 0.18769054301083088, "grad_min_sv": 9.561545546987737e-09, "grad_condition": 22558726.834869802, "lr": 0.0007853567838422158, "time_sec": 67.02692914009094 }, { "epoch": 47, "train_loss": 3.2102231874084475, "train_acc": 0.21366, "test_loss": 7.20476734161377, "test_acc": 0.0268, "lyapunov": null, "grad_norm": 0.5300596779522426, "grad_max_sv": 0.18552429899573325, "grad_min_sv": 9.575782686233047e-09, "grad_condition": 21495882.964656584, "lr": 0.0007766957746216719, "time_sec": 67.0929958820343 }, { "epoch": 48, "train_loss": 3.202328568191528, "train_acc": 0.21738, "test_loss": 7.143350020599366, "test_acc": 0.0275, "lyapunov": null, "grad_norm": 0.5275781384357864, "grad_max_sv": 0.18636706620454788, "grad_min_sv": 9.551907610705345e-09, "grad_condition": 33257654.14790963, "lr": 0.0007679133974894982, "time_sec": 67.10289525985718 }, { "epoch": 49, "train_loss": 3.1964333237457274, "train_acc": 0.21696, "test_loss": 7.0859999771118165, "test_acc": 0.0354, "lyapunov": null, "grad_norm": 0.5290459768999093, "grad_max_sv": 0.18547305800020694, "grad_min_sv": 9.539052431978278e-09, "grad_condition": 34652740.14328016, "lr": 0.000759013504686565, "time_sec": 67.11912679672241 }, { "epoch": 50, "train_loss": 3.1868507556152346, "train_acc": 0.2195, "test_loss": 7.204959943389893, "test_acc": 0.0247, "lyapunov": null, "grad_norm": 0.5304998310773968, "grad_max_sv": 0.1833030626177788, "grad_min_sv": 9.589407306935527e-09, "grad_condition": 93768948.14927751, "lr": 0.0007499999999999998, "time_sec": 67.06959462165833 }, { "epoch": 51, "train_loss": 3.1883190923309326, "train_acc": 0.21784, "test_loss": 7.328389108276367, "test_acc": 0.0303, "lyapunov": null, "grad_norm": 0.5248467282170762, "grad_max_sv": 0.18131516128778458, "grad_min_sv": 9.465690375617952e-09, "grad_condition": 47668215.59636396, "lr": 0.0007408768370508575, "time_sec": 67.01846742630005 }, { "epoch": 52, "train_loss": 3.1719473053741454, "train_acc": 0.22166, "test_loss": 8.36594852142334, "test_acc": 0.025, "lyapunov": null, "grad_norm": 0.5248103969653446, "grad_max_sv": 0.17532115392386913, "grad_min_sv": 9.532304753867572e-09, "grad_condition": 26041874.469802074, "lr": 0.0007316480175599307, "time_sec": 67.03516387939453 }, { "epoch": 53, "train_loss": 3.1698596488952635, "train_acc": 0.22132, "test_loss": 8.36387837677002, "test_acc": 0.0251, "lyapunov": null, "grad_norm": 0.5233372908286834, "grad_max_sv": 0.17466790974140167, "grad_min_sv": 9.286205268632663e-09, "grad_condition": 21363168.099911686, "lr": 0.0007223175895924635, "time_sec": 67.02187657356262 }, { "epoch": 54, "train_loss": 3.152655903167725, "train_acc": 0.22722, "test_loss": 8.196963485717774, "test_acc": 0.0261, "lyapunov": null, "grad_norm": 0.5285400405038103, "grad_max_sv": 0.17916450947523116, "grad_min_sv": 9.4594759324218e-09, "grad_condition": 82291006.99579689, "lr": 0.0007128896457825361, "time_sec": 66.97509050369263 }, { "epoch": 55, "train_loss": 3.1408946729278564, "train_acc": 0.22896, "test_loss": 8.031216970825195, "test_acc": 0.0238, "lyapunov": null, "grad_norm": 0.5251164499697153, "grad_max_sv": 0.17466633953154087, "grad_min_sv": 9.452194638104316e-09, "grad_condition": 22653052.01456701, "lr": 0.0007033683215378998, "time_sec": 67.00176858901978 }, { "epoch": 56, "train_loss": 3.1348105377960205, "train_acc": 0.22832, "test_loss": 8.950087960815429, "test_acc": 0.0204, "lyapunov": null, "grad_norm": 0.5200008300943049, "grad_max_sv": 0.17119008600711821, "grad_min_sv": 9.414464659240895e-09, "grad_condition": 31689823.38588159, "lr": 0.0006937577932260512, "time_sec": 66.97579646110535 }, { "epoch": 57, "train_loss": 3.1169134953308104, "train_acc": 0.23282, "test_loss": 8.065475146484374, "test_acc": 0.0311, "lyapunov": null, "grad_norm": 0.5241244870526487, "grad_max_sv": 0.17154259756207466, "grad_min_sv": 9.529985643685902e-09, "grad_condition": 28312826.48374013, "lr": 0.0006840622763423388, "time_sec": 66.9856812953949 }, { "epoch": 58, "train_loss": 3.1234397563171385, "train_acc": 0.22962, "test_loss": 8.583345112609864, "test_acc": 0.0222, "lyapunov": null, "grad_norm": 0.5197452718406793, "grad_max_sv": 0.17415275909006595, "grad_min_sv": 9.31348687893685e-09, "grad_condition": 21270072.13306666, "lr": 0.0006742860236609073, "time_sec": 66.99910068511963 }, { "epoch": 59, "train_loss": 3.1087922663879395, "train_acc": 0.23302, "test_loss": 8.37566005859375, "test_acc": 0.0239, "lyapunov": null, "grad_norm": 0.5182628480059946, "grad_max_sv": 0.17543886601924896, "grad_min_sv": 9.358361164474304e-09, "grad_condition": 31647391.583267204, "lr": 0.0006644333233692913, "time_sec": 66.97189855575562 }, { "epoch": 60, "train_loss": 3.0956507678985594, "train_acc": 0.23662, "test_loss": 7.7532292655944826, "test_acc": 0.0248, "lyapunov": null, "grad_norm": 0.5195814358053482, "grad_max_sv": 0.1776260558515787, "grad_min_sv": 9.643665624392561e-09, "grad_condition": 22666276.356990974, "lr": 0.0006545084971874734, "time_sec": 67.00041198730469 }, { "epoch": 61, "train_loss": 3.092038777694702, "train_acc": 0.23596, "test_loss": 7.946604266357422, "test_acc": 0.0245, "lyapunov": null, "grad_norm": 0.5196921425232948, "grad_max_sv": 0.17445886991918086, "grad_min_sv": 9.508607204389285e-09, "grad_condition": 21427055.017691903, "lr": 0.0006445158984722354, "time_sec": 67.06589937210083 }, { "epoch": 62, "train_loss": 3.079979831466675, "train_acc": 0.23898, "test_loss": 9.319492291259765, "test_acc": 0.0213, "lyapunov": null, "grad_norm": 0.5186454829421666, "grad_max_sv": 0.16986236572265626, "grad_min_sv": 9.32054670874094e-09, "grad_condition": 31246817.26616311, "lr": 0.0006344599103076324, "time_sec": 66.99018096923828 }, { "epoch": 63, "train_loss": 3.0727787420654296, "train_acc": 0.23906, "test_loss": 8.948303262329102, "test_acc": 0.0269, "lyapunov": null, "grad_norm": 0.5175233947350019, "grad_max_sv": 0.16513913124799728, "grad_min_sv": 9.338011380810585e-09, "grad_condition": 24005876.4941143, "lr": 0.0006243449435824269, "time_sec": 66.9405734539032 }, { "epoch": 64, "train_loss": 3.074298862915039, "train_acc": 0.23708, "test_loss": 9.195949301147461, "test_acc": 0.0262, "lyapunov": null, "grad_norm": 0.5221855467062518, "grad_max_sv": 0.17083160430192948, "grad_min_sv": 9.452190228090296e-09, "grad_condition": 48343788.07302423, "lr": 0.0006141754350553275, "time_sec": 67.0041880607605 }, { "epoch": 65, "train_loss": 3.0613560808563234, "train_acc": 0.24008, "test_loss": 8.735752813720703, "test_acc": 0.0271, "lyapunov": null, "grad_norm": 0.5207095947451149, "grad_max_sv": 0.1693739652633667, "grad_min_sv": 9.425346239599897e-09, "grad_condition": 23106579.847053923, "lr": 0.0006039558454088793, "time_sec": 66.9728434085846 }, { "epoch": 66, "train_loss": 3.050594620132446, "train_acc": 0.243, "test_loss": 8.672268884277344, "test_acc": 0.0298, "lyapunov": null, "grad_norm": 0.5161820441185401, "grad_max_sv": 0.1685989484190941, "grad_min_sv": 9.325516864278071e-09, "grad_condition": 20646125.746492933, "lr": 0.000593690657292862, "time_sec": 66.97670912742615 }, { "epoch": 67, "train_loss": 3.0404045782470703, "train_acc": 0.2468, "test_loss": 9.001078883361817, "test_acc": 0.0227, "lyapunov": null, "grad_norm": 0.5184119200981759, "grad_max_sv": 0.1701225485652685, "grad_min_sv": 9.472868531257284e-09, "grad_condition": 23517656.45251561, "lr": 0.0005833843733580507, "time_sec": 66.96425604820251 }, { "epoch": 68, "train_loss": 3.0347717694091796, "train_acc": 0.24578, "test_loss": 8.55764455871582, "test_acc": 0.0204, "lyapunov": null, "grad_norm": 0.5177787618737804, "grad_max_sv": 0.17245440557599068, "grad_min_sv": 9.351008802005456e-09, "grad_condition": 26504498.6419156, "lr": 0.0005730415142812054, "time_sec": 66.987557888031 }, { "epoch": 69, "train_loss": 3.0343177091979983, "train_acc": 0.24472, "test_loss": 8.6480171875, "test_acc": 0.0252, "lyapunov": null, "grad_norm": 0.5144704452610198, "grad_max_sv": 0.16564900018274784, "grad_min_sv": 9.403833016452534e-09, "grad_condition": 27296778.54875686, "lr": 0.0005626666167821517, "time_sec": 66.97946643829346 }, { "epoch": 70, "train_loss": 3.019142656097412, "train_acc": 0.25006, "test_loss": 8.915339315795899, "test_acc": 0.0291, "lyapunov": null, "grad_norm": 0.5199788677371252, "grad_max_sv": 0.16652515456080436, "grad_min_sv": 9.64339011144677e-09, "grad_condition": 23020050.410736304, "lr": 0.0005522642316338265, "time_sec": 66.97834086418152 }, { "epoch": 71, "train_loss": 3.0120436127471923, "train_acc": 0.25124, "test_loss": 9.489800686645507, "test_acc": 0.0229, "lyapunov": null, "grad_norm": 0.5170392758240284, "grad_max_sv": 0.16549308113753797, "grad_min_sv": 9.466763362109277e-09, "grad_condition": 23186013.564122196, "lr": 0.0005418389216661573, "time_sec": 66.98612070083618 }, { "epoch": 72, "train_loss": 3.005094768676758, "train_acc": 0.25262, "test_loss": 9.240029809570313, "test_acc": 0.0228, "lyapunov": null, "grad_norm": 0.5193656479358113, "grad_max_sv": 0.16801112554967404, "grad_min_sv": 9.608471449040756e-09, "grad_condition": 72045711.1919595, "lr": 0.0005313952597646563, "time_sec": 66.99170446395874 }, { "epoch": 73, "train_loss": 2.9903506928253174, "train_acc": 0.25404, "test_loss": 9.075869140625, "test_acc": 0.0255, "lyapunov": null, "grad_norm": 0.517195719023633, "grad_max_sv": 0.16475822702050208, "grad_min_sv": 9.421488161853731e-09, "grad_condition": 20088448.14143536, "lr": 0.0005209378268645994, "time_sec": 66.99337768554688 }, { "epoch": 74, "train_loss": 2.9886431184387208, "train_acc": 0.25206, "test_loss": 8.946782205200195, "test_acc": 0.0216, "lyapunov": null, "grad_norm": 0.5156132053442515, "grad_max_sv": 0.1671187650412321, "grad_min_sv": 9.546754539679903e-09, "grad_condition": 20526453.312863432, "lr": 0.0005104712099416781, "time_sec": 66.97370409965515 }, { "epoch": 75, "train_loss": 2.978247420654297, "train_acc": 0.25748, "test_loss": 8.795244805908203, "test_acc": 0.0265, "lyapunov": null, "grad_norm": 0.5172367229977752, "grad_max_sv": 0.16712253615260125, "grad_min_sv": 9.516156018046784e-09, "grad_condition": 30249731.938419342, "lr": 0.0004999999999999996, "time_sec": 67.0042519569397 }, { "epoch": 76, "train_loss": 2.975222046432495, "train_acc": 0.2575, "test_loss": 7.9467042022705074, "test_acc": 0.0274, "lyapunov": null, "grad_norm": 0.5205213451239863, "grad_max_sv": 0.16927127800881864, "grad_min_sv": 9.570786241308582e-09, "grad_condition": 21297706.844217338, "lr": 0.0004895287900583212, "time_sec": 66.98396968841553 }, { "epoch": 77, "train_loss": 2.9694722108459475, "train_acc": 0.25688, "test_loss": 8.63839992980957, "test_acc": 0.027, "lyapunov": null, "grad_norm": 0.5171656548088565, "grad_max_sv": 0.16773934625089168, "grad_min_sv": 9.45730138160461e-09, "grad_condition": 53792449.33116071, "lr": 0.0004790621731353997, "time_sec": 67.06471967697144 }, { "epoch": 78, "train_loss": 2.954387292098999, "train_acc": 0.26136, "test_loss": 8.785921076965332, "test_acc": 0.0231, "lyapunov": null, "grad_norm": 0.5158257600732294, "grad_max_sv": 0.16913142390549182, "grad_min_sv": 9.432701836287194e-09, "grad_condition": 22764076.692523666, "lr": 0.000468604740235343, "time_sec": 66.98979210853577 }, { "epoch": 79, "train_loss": 2.951801152191162, "train_acc": 0.26352, "test_loss": 8.070646887207031, "test_acc": 0.0255, "lyapunov": null, "grad_norm": 0.5174682191745558, "grad_max_sv": 0.16524536907672882, "grad_min_sv": 9.502134473704515e-09, "grad_condition": 19794117.95628558, "lr": 0.00045816107833384175, "time_sec": 67.00397682189941 }, { "epoch": 80, "train_loss": 2.945303405151367, "train_acc": 0.25934, "test_loss": 8.538162045288086, "test_acc": 0.0261, "lyapunov": null, "grad_norm": 0.5164921536500987, "grad_max_sv": 0.16473788283765317, "grad_min_sv": 9.313295684654222e-09, "grad_condition": 20076070.15299391, "lr": 0.0004477357683661729, "time_sec": 66.99750208854675 }, { "epoch": 81, "train_loss": 2.9330507093811033, "train_acc": 0.26472, "test_loss": 9.089803251647949, "test_acc": 0.0256, "lyapunov": null, "grad_norm": 0.5182949552264074, "grad_max_sv": 0.16235619597136974, "grad_min_sv": 9.617397696282115e-09, "grad_condition": 30543590.097258378, "lr": 0.00043733338321784746, "time_sec": 66.96942782402039 }, { "epoch": 82, "train_loss": 2.931871794204712, "train_acc": 0.26478, "test_loss": 9.64152674560547, "test_acc": 0.0219, "lyapunov": null, "grad_norm": 0.5176276155464238, "grad_max_sv": 0.16380822993814945, "grad_min_sv": 9.444439504069369e-09, "grad_condition": 55360326.762117185, "lr": 0.0004269584857187939, "time_sec": 66.98204827308655 }, { "epoch": 83, "train_loss": 2.9243045820617675, "train_acc": 0.2654, "test_loss": 8.998370599365234, "test_acc": 0.0286, "lyapunov": null, "grad_norm": 0.5221359210821417, "grad_max_sv": 0.16723665855824948, "grad_min_sv": 9.730227464033181e-09, "grad_condition": 37510081.93776859, "lr": 0.0004166156266419484, "time_sec": 67.03800463676453 }, { "epoch": 84, "train_loss": 2.910555010223389, "train_acc": 0.26936, "test_loss": 9.721973526000976, "test_acc": 0.0313, "lyapunov": null, "grad_norm": 0.519552420362012, "grad_max_sv": 0.16508992463350297, "grad_min_sv": 9.647469361231953e-09, "grad_condition": 55059867.79942672, "lr": 0.0004063093427071373, "time_sec": 67.02205467224121 }, { "epoch": 85, "train_loss": 2.908977954711914, "train_acc": 0.26772, "test_loss": 9.513397438049317, "test_acc": 0.0262, "lyapunov": null, "grad_norm": 0.5225336336313486, "grad_max_sv": 0.1674807954579592, "grad_min_sv": 9.611194474665185e-09, "grad_condition": 61660610.28358656, "lr": 0.0003960441545911199, "time_sec": 66.98397827148438 }, { "epoch": 86, "train_loss": 2.9070045388793946, "train_acc": 0.26946, "test_loss": 9.42815225982666, "test_acc": 0.0253, "lyapunov": null, "grad_norm": 0.5163838704970162, "grad_max_sv": 0.15979891866445542, "grad_min_sv": 9.371719027900793e-09, "grad_condition": 27067310.492935486, "lr": 0.0003858245649446718, "time_sec": 67.00940752029419 }, { "epoch": 87, "train_loss": 2.8997818164825437, "train_acc": 0.27182, "test_loss": 9.99990376586914, "test_acc": 0.0235, "lyapunov": null, "grad_norm": 0.5185938331206461, "grad_max_sv": 0.1670172270387411, "grad_min_sv": 9.72940567521563e-09, "grad_condition": 41690290.30450606, "lr": 0.00037565505641757235, "time_sec": 66.98136639595032 }, { "epoch": 88, "train_loss": 2.8861678593444826, "train_acc": 0.27088, "test_loss": 9.440834574890136, "test_acc": 0.0223, "lyapunov": null, "grad_norm": 0.5210845021802476, "grad_max_sv": 0.16573623865842818, "grad_min_sv": 9.66025861803832e-09, "grad_condition": 21401152.005565703, "lr": 0.00036554008969236695, "time_sec": 66.97698450088501 }, { "epoch": 89, "train_loss": 2.879338860092163, "train_acc": 0.2741, "test_loss": 9.169851208496095, "test_acc": 0.0199, "lyapunov": null, "grad_norm": 0.5207447841157706, "grad_max_sv": 0.16667181067168713, "grad_min_sv": 9.689165991755289e-09, "grad_condition": 26973958.650769584, "lr": 0.0003554841015277638, "time_sec": 67.01995515823364 }, { "epoch": 90, "train_loss": 2.8748147813415525, "train_acc": 0.27324, "test_loss": 10.077813652038575, "test_acc": 0.022, "lyapunov": null, "grad_norm": 0.5199671563562479, "grad_max_sv": 0.16343193501234055, "grad_min_sv": 9.647999926754025e-09, "grad_condition": 21023683.920218416, "lr": 0.000345491502812526, "time_sec": 67.06868648529053 }, { "epoch": 91, "train_loss": 2.8696892933654787, "train_acc": 0.27466, "test_loss": 9.565517497253419, "test_acc": 0.0229, "lyapunov": null, "grad_norm": 0.5208386545074176, "grad_max_sv": 0.16384688578546047, "grad_min_sv": 9.741156603571e-09, "grad_condition": 20234282.31156399, "lr": 0.0003355666766307081, "time_sec": 67.05189514160156 }, { "epoch": 92, "train_loss": 2.8643893748474123, "train_acc": 0.27506, "test_loss": 9.676446484375, "test_acc": 0.0222, "lyapunov": null, "grad_norm": 0.5227536692673017, "grad_max_sv": 0.16562484614551068, "grad_min_sv": 9.696238559286918e-09, "grad_condition": 19364268.060319778, "lr": 0.00032571397633909225, "time_sec": 67.04055285453796 }, { "epoch": 93, "train_loss": 2.9157111973571777, "train_acc": 0.2694, "test_loss": 10.502802850341796, "test_acc": 0.016, "lyapunov": null, "grad_norm": 0.5304583427147314, "grad_max_sv": 0.16479565128684043, "grad_min_sv": 9.75800383412606e-09, "grad_condition": 23919445.487485204, "lr": 0.00031593772365766094, "time_sec": 67.07202672958374 }, { "epoch": 94, "train_loss": 3.5718225437927247, "train_acc": 0.14984, "test_loss": 8.342486605834962, "test_acc": 0.0173, "lyapunov": null, "grad_norm": 0.47865396629415263, "grad_max_sv": 0.146741402707994, "grad_min_sv": 8.774483893636553e-09, "grad_condition": 22076860.426247958, "lr": 0.0003062422067739483, "time_sec": 66.99063777923584 }, { "epoch": 95, "train_loss": 3.3590557197570803, "train_acc": 0.18824, "test_loss": 9.117096383666992, "test_acc": 0.018, "lyapunov": null, "grad_norm": 0.47849958749977733, "grad_max_sv": 0.14531232379376888, "grad_min_sv": 8.800075565473798e-09, "grad_condition": 21940629.92360129, "lr": 0.00029663167846209965, "time_sec": 66.97514224052429 }, { "epoch": 96, "train_loss": 3.2702466972351076, "train_acc": 0.2019, "test_loss": 9.76727836151123, "test_acc": 0.0196, "lyapunov": null, "grad_norm": 0.47937534710610474, "grad_max_sv": 0.14464113656431438, "grad_min_sv": 8.792039801926166e-09, "grad_condition": 89660660.43121836, "lr": 0.00028711035421746345, "time_sec": 66.99873089790344 }, { "epoch": 97, "train_loss": 3.2227031265258788, "train_acc": 0.21062, "test_loss": 9.626097766113281, "test_acc": 0.02, "lyapunov": null, "grad_norm": 0.4871680253381029, "grad_max_sv": 0.15086784306913614, "grad_min_sv": 9.198363076778903e-09, "grad_condition": 18446455.013218474, "lr": 0.00027768241040753615, "time_sec": 67.01664638519287 }, { "epoch": 98, "train_loss": 3.1770834211730956, "train_acc": 0.21918, "test_loss": 9.366678713989257, "test_acc": 0.0189, "lyapunov": null, "grad_norm": 0.48983757815120343, "grad_max_sv": 0.14779492281377316, "grad_min_sv": 9.026428729463909e-09, "grad_condition": 18794227.40584495, "lr": 0.00026835198244006903, "time_sec": 66.9809033870697 }, { "epoch": 99, "train_loss": 3.154748341598511, "train_acc": 0.22074, "test_loss": 8.755814114379882, "test_acc": 0.0203, "lyapunov": null, "grad_norm": 0.49142802947586006, "grad_max_sv": 0.14894249550998212, "grad_min_sv": 9.186921921030405e-09, "grad_condition": 243665710.2249507, "lr": 0.0002591231629491421, "time_sec": 66.99194574356079 }, { "epoch": 100, "train_loss": 3.120311908035278, "train_acc": 0.229, "test_loss": 9.377279025268555, "test_acc": 0.019, "lyapunov": null, "grad_norm": 0.49378455655907144, "grad_max_sv": 0.1519782803952694, "grad_min_sv": 9.117503733946376e-09, "grad_condition": 21901137.13681825, "lr": 0.0002499999999999997, "time_sec": 66.99540328979492 }, { "epoch": 101, "train_loss": 3.102491766357422, "train_acc": 0.23234, "test_loss": 9.32430498046875, "test_acc": 0.0219, "lyapunov": null, "grad_norm": 0.49627664046313075, "grad_max_sv": 0.15419429913163185, "grad_min_sv": 9.201821271620503e-09, "grad_condition": 21776686.85204944, "lr": 0.00024098649531343477, "time_sec": 66.98357772827148 }, { "epoch": 102, "train_loss": 3.085017224731445, "train_acc": 0.23322, "test_loss": 9.753949787902831, "test_acc": 0.0193, "lyapunov": null, "grad_norm": 0.49406280305370465, "grad_max_sv": 0.15118828602135181, "grad_min_sv": 9.171319623191288e-09, "grad_condition": 24151283.383643005, "lr": 0.0002320866025105016, "time_sec": 66.97265934944153 }, { "epoch": 103, "train_loss": 3.066944828414917, "train_acc": 0.23798, "test_loss": 9.439580722045898, "test_acc": 0.0198, "lyapunov": null, "grad_norm": 0.49800148183033643, "grad_max_sv": 0.15005342811346054, "grad_min_sv": 9.260063320998268e-09, "grad_condition": 32769732.654720783, "lr": 0.0002233042253783278, "time_sec": 67.00615048408508 }, { "epoch": 104, "train_loss": 3.0457233097839356, "train_acc": 0.24206, "test_loss": 9.283833685302735, "test_acc": 0.022, "lyapunov": null, "grad_norm": 0.5005816660320969, "grad_max_sv": 0.15397185049951076, "grad_min_sv": 9.2347574705276e-09, "grad_condition": 39740043.841383025, "lr": 0.000214643216157784, "time_sec": 66.98598265647888 }, { "epoch": 105, "train_loss": 3.0319893937683107, "train_acc": 0.24054, "test_loss": 9.208142726135254, "test_acc": 0.0215, "lyapunov": null, "grad_norm": 0.4998792272266736, "grad_max_sv": 0.15734503231942654, "grad_min_sv": 9.254817884274402e-09, "grad_condition": 23445108.874561593, "lr": 0.00020610737385376332, "time_sec": 66.97633767127991 }, { "epoch": 106, "train_loss": 3.0231310614013673, "train_acc": 0.2459, "test_loss": 9.397696965026855, "test_acc": 0.0216, "lyapunov": null, "grad_norm": 0.5036514636560196, "grad_max_sv": 0.15039666295051574, "grad_min_sv": 9.292655003714615e-09, "grad_condition": 456660482.4660243, "lr": 0.00019770044256881242, "time_sec": 66.97969722747803 }, { "epoch": 107, "train_loss": 3.015210195846558, "train_acc": 0.24924, "test_loss": 9.136646028137207, "test_acc": 0.0253, "lyapunov": null, "grad_norm": 0.5044102710994137, "grad_max_sv": 0.15338496044278144, "grad_min_sv": 9.416407534962313e-09, "grad_condition": 29814119.267252993, "lr": 0.0001894261098608447, "time_sec": 66.9929895401001 }, { "epoch": 108, "train_loss": 2.992950742034912, "train_acc": 0.25076, "test_loss": 9.683133767700195, "test_acc": 0.0206, "lyapunov": null, "grad_norm": 0.5024766427018658, "grad_max_sv": 0.15207941457629204, "grad_min_sv": 9.368817296961928e-09, "grad_condition": 25707665.821010012, "lr": 0.000181288005125655, "time_sec": 67.04599475860596 }, { "epoch": 109, "train_loss": 2.9911826483917237, "train_acc": 0.25182, "test_loss": 9.541546542358398, "test_acc": 0.0216, "lyapunov": null, "grad_norm": 0.5050428635829171, "grad_max_sv": 0.1559975240379572, "grad_min_sv": 9.425568786580741e-09, "grad_condition": 29011942.837490637, "lr": 0.0001732896980049473, "time_sec": 66.9745888710022 }, { "epoch": 110, "train_loss": 2.9719406244659425, "train_acc": 0.25626, "test_loss": 9.304527082824707, "test_acc": 0.0239, "lyapunov": null, "grad_norm": 0.50709757758927, "grad_max_sv": 0.15366660207509994, "grad_min_sv": 9.407841375375093e-09, "grad_condition": 20259210.324132033, "lr": 0.00016543469682057076, "time_sec": 67.00725531578064 }, { "epoch": 111, "train_loss": 2.9610974934387206, "train_acc": 0.25892, "test_loss": 9.905137655639649, "test_acc": 0.0233, "lyapunov": null, "grad_norm": 0.5069510646769094, "grad_max_sv": 0.16044184900820255, "grad_min_sv": 9.517911378487121e-09, "grad_condition": 20572867.320830267, "lr": 0.00015772644703565552, "time_sec": 66.96853518486023 }, { "epoch": 112, "train_loss": 2.956413153839111, "train_acc": 0.25946, "test_loss": 10.164678506469727, "test_acc": 0.0226, "lyapunov": null, "grad_norm": 0.5077720159938983, "grad_max_sv": 0.15506692193448543, "grad_min_sv": 9.397505702779529e-09, "grad_condition": 22578916.073937874, "lr": 0.00015016832974331713, "time_sec": 67.01250433921814 }, { "epoch": 113, "train_loss": 2.9505707207489014, "train_acc": 0.26056, "test_loss": 9.862203175354004, "test_acc": 0.0237, "lyapunov": null, "grad_norm": 0.508430292455553, "grad_max_sv": 0.1596985150128603, "grad_min_sv": 9.460744607170391e-09, "grad_condition": 18853883.48562253, "lr": 0.00014276366018359834, "time_sec": 66.99557614326477 }, { "epoch": 114, "train_loss": 2.9415723051452636, "train_acc": 0.2616, "test_loss": 9.63483480834961, "test_acc": 0.0232, "lyapunov": null, "grad_norm": 0.5104303932486228, "grad_max_sv": 0.1552283179014921, "grad_min_sv": 9.445251571464034e-09, "grad_condition": 693766580.7640529, "lr": 0.00013551568628929425, "time_sec": 66.99906969070435 }, { "epoch": 115, "train_loss": 2.9388054510498045, "train_acc": 0.26148, "test_loss": 9.398469245910645, "test_acc": 0.0231, "lyapunov": null, "grad_norm": 0.5141390434712518, "grad_max_sv": 0.16008906662464142, "grad_min_sv": 9.453520891100631e-09, "grad_condition": 21355980.767428003, "lr": 0.00012842758726130276, "time_sec": 66.97847414016724 }, { "epoch": 116, "train_loss": 2.9283171284484864, "train_acc": 0.26438, "test_loss": 9.456967205810546, "test_acc": 0.0244, "lyapunov": null, "grad_norm": 0.5133058115565678, "grad_max_sv": 0.15975738912820817, "grad_min_sv": 9.5292529520008e-09, "grad_condition": 22298576.095964633, "lr": 0.0001215024721741218, "time_sec": 66.9903039932251 }, { "epoch": 117, "train_loss": 2.919693772506714, "train_acc": 0.26682, "test_loss": 9.649295095825195, "test_acc": 0.0229, "lyapunov": null, "grad_norm": 0.5098040600332114, "grad_max_sv": 0.15964976735413075, "grad_min_sv": 9.535333161947435e-09, "grad_condition": 18488699.782394268, "lr": 0.00011474337861210538, "time_sec": 66.98530316352844 }, { "epoch": 118, "train_loss": 2.9129154638671877, "train_acc": 0.26648, "test_loss": 9.582696447753905, "test_acc": 0.0252, "lyapunov": null, "grad_norm": 0.5137327165981059, "grad_max_sv": 0.15674266032874584, "grad_min_sv": 9.422415092608106e-09, "grad_condition": 21769035.1047443, "lr": 0.00010815327133708009, "time_sec": 67.0712718963623 }, { "epoch": 119, "train_loss": 2.90771673576355, "train_acc": 0.26738, "test_loss": 9.686517756652831, "test_acc": 0.0223, "lyapunov": null, "grad_norm": 0.5112636160904589, "grad_max_sv": 0.15690986551344394, "grad_min_sv": 9.557581368002666e-09, "grad_condition": 65271422.15119822, "lr": 0.00010173504098790182, "time_sec": 66.99134540557861 }, { "epoch": 120, "train_loss": 2.903361056442261, "train_acc": 0.26626, "test_loss": 9.534084574890137, "test_acc": 0.025, "lyapunov": null, "grad_norm": 0.5139337490910202, "grad_max_sv": 0.16002687215805053, "grad_min_sv": 9.488575995753035e-09, "grad_condition": 26500108.07568959, "lr": 9.549150281252629e-05, "time_sec": 66.98560166358948 }, { "epoch": 121, "train_loss": 2.8838987274169923, "train_acc": 0.27268, "test_loss": 9.002799011230469, "test_acc": 0.0286, "lyapunov": null, "grad_norm": 0.5181242234216702, "grad_max_sv": 0.15681598484516143, "grad_min_sv": 9.58419937996391e-09, "grad_condition": 21911011.850442223, "lr": 8.942539543314794e-05, "time_sec": 66.99542880058289 }, { "epoch": 122, "train_loss": 2.8907574623107912, "train_acc": 0.27284, "test_loss": 9.40299231262207, "test_acc": 0.023, "lyapunov": null, "grad_norm": 0.5154755058010533, "grad_max_sv": 0.16150307320058346, "grad_min_sv": 9.692825331253373e-09, "grad_condition": 20117302.380122818, "lr": 8.353937964495024e-05, "time_sec": 66.98236727714539 }, { "epoch": 123, "train_loss": 2.8763803490448, "train_acc": 0.2739, "test_loss": 9.18796940612793, "test_acc": 0.0263, "lyapunov": null, "grad_norm": 0.514194573203304, "grad_max_sv": 0.15613614898175002, "grad_min_sv": 9.584234908488477e-09, "grad_condition": 18777275.99405461, "lr": 7.783603724899243e-05, "time_sec": 66.99689793586731 }, { "epoch": 124, "train_loss": 2.8843617086029054, "train_acc": 0.27144, "test_loss": 9.370162466430664, "test_acc": 0.0248, "lyapunov": null, "grad_norm": 0.5136262444075659, "grad_max_sv": 0.15881695374846458, "grad_min_sv": 9.587037638758567e-09, "grad_condition": 18534833.152038723, "lr": 7.231786991974666e-05, "time_sec": 66.98831605911255 }, { "epoch": 125, "train_loss": 2.8742648021697996, "train_acc": 0.27246, "test_loss": 9.4968570602417, "test_acc": 0.0258, "lyapunov": null, "grad_norm": 0.5172296409721588, "grad_max_sv": 0.15975196473300457, "grad_min_sv": 9.493101107982404e-09, "grad_condition": 20120176.988574862, "lr": 6.698729810778072e-05, "time_sec": 66.98702692985535 }, { "epoch": 126, "train_loss": 2.868820255508423, "train_acc": 0.27476, "test_loss": 9.60731820678711, "test_acc": 0.0243, "lyapunov": null, "grad_norm": 0.5204414887458292, "grad_max_sv": 0.16092863790690898, "grad_min_sv": 9.674041201446215e-09, "grad_condition": 18855250.862980247, "lr": 6.184665997806817e-05, "time_sec": 66.97707200050354 }, { "epoch": 127, "train_loss": 2.8692937660217286, "train_acc": 0.27484, "test_loss": 9.273512542724609, "test_acc": 0.0252, "lyapunov": null, "grad_norm": 0.5162971653606119, "grad_max_sv": 0.16184906139969826, "grad_min_sv": 9.668298800447062e-09, "grad_condition": 21519277.77695776, "lr": 5.6898210384392595e-05, "time_sec": 67.0102117061615 }, { "epoch": 128, "train_loss": 2.8623614330291747, "train_acc": 0.27702, "test_loss": 9.566067819213867, "test_acc": 0.0239, "lyapunov": null, "grad_norm": 0.5161277911748794, "grad_max_sv": 0.1572089247405529, "grad_min_sv": 9.598460455964574e-09, "grad_condition": 40264946.42458854, "lr": 5.214411988029363e-05, "time_sec": 66.9910991191864 }, { "epoch": 129, "train_loss": 2.8542457569122313, "train_acc": 0.27896, "test_loss": 9.585708435058594, "test_acc": 0.0242, "lyapunov": null, "grad_norm": 0.5185536839510844, "grad_max_sv": 0.16669968273490668, "grad_min_sv": 9.84268076209549e-09, "grad_condition": 20409849.055229448, "lr": 4.7586473766990294e-05, "time_sec": 67.02374720573425 }, { "epoch": 130, "train_loss": 2.8572039877319337, "train_acc": 0.27668, "test_loss": 9.687789022827149, "test_acc": 0.0255, "lyapunov": null, "grad_norm": 0.5186381052419109, "grad_max_sv": 0.15739406496286393, "grad_min_sv": 9.484110215923769e-09, "grad_condition": 32956127.450649947, "lr": 4.32272711786996e-05, "time_sec": 67.0042040348053 }, { "epoch": 131, "train_loss": 2.8510476612854005, "train_acc": 0.27938, "test_loss": 9.569248272705078, "test_acc": 0.0242, "lyapunov": null, "grad_norm": 0.5207995350849649, "grad_max_sv": 0.16004110053181647, "grad_min_sv": 9.74696345579229e-09, "grad_condition": 19170988.284027696, "lr": 3.906842420574966e-05, "time_sec": 67.01241946220398 }, { "epoch": 132, "train_loss": 2.846966871871948, "train_acc": 0.28012, "test_loss": 9.591386764526368, "test_acc": 0.0255, "lyapunov": null, "grad_norm": 0.5190948064684937, "grad_max_sv": 0.16090917438268662, "grad_min_sv": 9.59687692925204e-09, "grad_condition": 19916201.19002537, "lr": 3.5111757055874305e-05, "time_sec": 66.99244403839111 }, { "epoch": 133, "train_loss": 2.849546993560791, "train_acc": 0.2807, "test_loss": 9.568466381835938, "test_acc": 0.0256, "lyapunov": null, "grad_norm": 0.5185948998509293, "grad_max_sv": 0.1592203661799431, "grad_min_sv": 9.741048792588635e-09, "grad_condition": 21889901.09234864, "lr": 3.1359005254054254e-05, "time_sec": 66.98589158058167 }, { "epoch": 134, "train_loss": 2.8438784635925294, "train_acc": 0.28108, "test_loss": 9.896654699707032, "test_acc": 0.0239, "lyapunov": null, "grad_norm": 0.5160935862439748, "grad_max_sv": 0.1570783667266369, "grad_min_sv": 9.671757885201804e-09, "grad_condition": 260951372.1762239, "lr": 2.7811814881259484e-05, "time_sec": 66.98548531532288 }, { "epoch": 135, "train_loss": 2.834603865356445, "train_acc": 0.28228, "test_loss": 9.507378176879882, "test_acc": 0.0279, "lyapunov": null, "grad_norm": 0.5182545697342097, "grad_max_sv": 0.16007349267601967, "grad_min_sv": 9.658516472721423e-09, "grad_condition": 19713617.954316415, "lr": 2.4471741852423218e-05, "time_sec": 67.04329872131348 }, { "epoch": 136, "train_loss": 2.839189874649048, "train_acc": 0.28064, "test_loss": 9.359465802001953, "test_acc": 0.0248, "lyapunov": null, "grad_norm": 0.5169244988974169, "grad_max_sv": 0.16038464941084385, "grad_min_sv": 9.551935577917225e-09, "grad_condition": 92654982.50365481, "lr": 2.1340251233966362e-05, "time_sec": 67.0141191482544 }, { "epoch": 137, "train_loss": 2.8397282981109617, "train_acc": 0.28072, "test_loss": 9.637136407470702, "test_acc": 0.0232, "lyapunov": null, "grad_norm": 0.5171965418231472, "grad_max_sv": 0.1600246898829937, "grad_min_sv": 9.73793786961108e-09, "grad_condition": 49688363.904323384, "lr": 1.8418716601170932e-05, "time_sec": 67.01152467727661 }, { "epoch": 138, "train_loss": 2.832450699005127, "train_acc": 0.2818, "test_loss": 9.6108934967041, "test_acc": 0.0257, "lyapunov": null, "grad_norm": 0.5180887909699459, "grad_max_sv": 0.15756660997867583, "grad_min_sv": 9.721027080522582e-09, "grad_condition": 111964333.48758218, "lr": 1.570841943568445e-05, "time_sec": 66.98093700408936 }, { "epoch": 139, "train_loss": 2.831738001098633, "train_acc": 0.28372, "test_loss": 9.70671376953125, "test_acc": 0.0243, "lyapunov": null, "grad_norm": 0.5175564205755943, "grad_max_sv": 0.15984287559986116, "grad_min_sv": 9.567414729211298e-09, "grad_condition": 30908421.83810656, "lr": 1.3210548563419845e-05, "time_sec": 66.98836731910706 }, { "epoch": 140, "train_loss": 2.8314741302490236, "train_acc": 0.2828, "test_loss": 9.671274719238282, "test_acc": 0.0253, "lyapunov": null, "grad_norm": 0.5195292394658827, "grad_max_sv": 0.16055516712367535, "grad_min_sv": 9.656845009232972e-09, "grad_condition": 116770748.01439288, "lr": 1.0926199633097203e-05, "time_sec": 67.06937670707703 }, { "epoch": 141, "train_loss": 2.8331345532226564, "train_acc": 0.28274, "test_loss": 9.6149158203125, "test_acc": 0.0254, "lyapunov": null, "grad_norm": 0.5200947221378508, "grad_max_sv": 0.1620084557682276, "grad_min_sv": 9.736931689749428e-09, "grad_condition": 45631030.28761599, "lr": 8.856374635655688e-06, "time_sec": 67.04308843612671 }, { "epoch": 142, "train_loss": 2.8309748402404784, "train_acc": 0.28162, "test_loss": 9.762360348510741, "test_acc": 0.0236, "lyapunov": null, "grad_norm": 0.5193749464503752, "grad_max_sv": 0.16398511864244938, "grad_min_sv": 9.725219179967937e-09, "grad_condition": 21389461.650285553, "lr": 7.001981464747503e-06, "time_sec": 66.99746632575989 }, { "epoch": 143, "train_loss": 2.8280009740447998, "train_acc": 0.28424, "test_loss": 9.46468698425293, "test_acc": 0.0236, "lyapunov": null, "grad_norm": 0.5183118315610563, "grad_max_sv": 0.15934774614870548, "grad_min_sv": 9.612720197615943e-09, "grad_condition": 28184363.311956126, "lr": 5.3638335185058295e-06, "time_sec": 67.1207172870636 }, { "epoch": 144, "train_loss": 2.8344388133239744, "train_acc": 0.27982, "test_loss": 9.481146864318848, "test_acc": 0.0253, "lyapunov": null, "grad_norm": 0.5191802199413043, "grad_max_sv": 0.16139711774885654, "grad_min_sv": 9.682644661057616e-09, "grad_condition": 19530671.727896534, "lr": 3.942649342761114e-06, "time_sec": 67.00769138336182 }, { "epoch": 145, "train_loss": 2.8336991081237795, "train_acc": 0.28372, "test_loss": 9.66582228088379, "test_acc": 0.0261, "lyapunov": null, "grad_norm": 0.5185987884305854, "grad_max_sv": 0.16210929341614247, "grad_min_sv": 9.609004592014969e-09, "grad_condition": 19136474.88235427, "lr": 2.7390523158633524e-06, "time_sec": 67.0150043964386 }, { "epoch": 146, "train_loss": 2.8299831028747557, "train_acc": 0.28278, "test_loss": 9.453235021972656, "test_acc": 0.0257, "lyapunov": null, "grad_norm": 0.5191689479196915, "grad_max_sv": 0.16032814532518386, "grad_min_sv": 9.704305628868703e-09, "grad_condition": 46973186.46224795, "lr": 1.7535703752478133e-06, "time_sec": 67.00002098083496 }, { "epoch": 147, "train_loss": 2.825070192184448, "train_acc": 0.28334, "test_loss": 9.736306394958497, "test_acc": 0.0241, "lyapunov": null, "grad_norm": 0.5194004947332557, "grad_max_sv": 0.15663104616105555, "grad_min_sv": 9.712660245519977e-09, "grad_condition": 19953974.129073095, "lr": 9.866357858642196e-07, "time_sec": 67.0251133441925 }, { "epoch": 148, "train_loss": 2.8285147483825686, "train_acc": 0.28494, "test_loss": 9.718778967285155, "test_acc": 0.0232, "lyapunov": null, "grad_norm": 0.519735769986064, "grad_max_sv": 0.16175503246486186, "grad_min_sv": 9.61004464027082e-09, "grad_condition": 41640518.28457622, "lr": 4.38584950570808e-07, "time_sec": 66.99386191368103 }, { "epoch": 149, "train_loss": 2.8338044094085695, "train_acc": 0.2828, "test_loss": 9.769097790527344, "test_acc": 0.025, "lyapunov": null, "grad_norm": 0.518369855767956, "grad_max_sv": 0.16054188311100007, "grad_min_sv": 9.553421861929757e-09, "grad_condition": 19432504.243999995, "lr": 1.096582625772501e-07, "time_sec": 66.99177241325378 }, { "epoch": 150, "train_loss": 2.8278376667022704, "train_acc": 0.28346, "test_loss": 9.647385183715821, "test_acc": 0.0242, "lyapunov": null, "grad_norm": 0.5190962063342817, "grad_max_sv": 0.16339128278195858, "grad_min_sv": 9.625854724415461e-09, "grad_condition": 26849402.241447162, "lr": 0.0, "time_sec": 66.99396753311157 } ] }, "lyapunov": { "4": [ { "epoch": 1, "train_loss": 4.0711297009277345, "train_acc": 0.09922, "test_loss": 3.9652711036682127, "test_acc": 0.106, "lyapunov": 2.009106175978775, "grad_norm": 5.770356961936896, "grad_max_sv": 4.216659033298493, "grad_min_sv": 1.0549574099294467e-07, "grad_condition": 83568782.62868212, "lr": 0.0009998903417374227, "time_sec": 41.888622999191284 }, { "epoch": 2, "train_loss": 3.7634158575439454, "train_acc": 0.13558, "test_loss": 4.481808354949951, "test_acc": 0.0542, "lyapunov": 1.6958206730425511, "grad_norm": 3.6343119962391017, "grad_max_sv": 2.4889110922813416, "grad_min_sv": 6.732413328491837e-08, "grad_condition": 91225677.18337384, "lr": 0.0009995614150494292, "time_sec": 41.84356164932251 }, { "epoch": 3, "train_loss": 3.6647304371643066, "train_acc": 0.1493, "test_loss": 4.3052373779296875, "test_acc": 0.0762, "lyapunov": 1.6261345663338975, "grad_norm": 2.8093749766197624, "grad_max_sv": 1.7556122809648513, "grad_min_sv": 5.287189366841305e-08, "grad_condition": 314142006.47060126, "lr": 0.0009990133642141358, "time_sec": 41.84758758544922 }, { "epoch": 4, "train_loss": 3.546524167175293, "train_acc": 0.16742, "test_loss": 5.702491674804688, "test_acc": 0.0294, "lyapunov": 1.5553575302938671, "grad_norm": 2.385940862508357, "grad_max_sv": 1.40236736536026, "grad_min_sv": 4.480527846517646e-08, "grad_condition": 43664896.37977407, "lr": 0.0009982464296247522, "time_sec": 41.83865737915039 }, { "epoch": 5, "train_loss": 3.4743005490112306, "train_acc": 0.18312, "test_loss": 8.196367356872559, "test_acc": 0.019, "lyapunov": 1.5279129725283065, "grad_norm": 2.072916387891114, "grad_max_sv": 1.1730020090937614, "grad_min_sv": 3.8785105194172334e-08, "grad_condition": 32346211.56806183, "lr": 0.0009972609476841367, "time_sec": 41.85976266860962 }, { "epoch": 6, "train_loss": 3.4256133052062987, "train_acc": 0.19342, "test_loss": 9.553438766479491, "test_acc": 0.0187, "lyapunov": 1.5210750066410854, "grad_norm": 1.8439895228569763, "grad_max_sv": 0.9858661040663719, "grad_min_sv": 3.4533098991484934e-08, "grad_condition": 35319864.79656621, "lr": 0.000996057350657239, "time_sec": 41.841728925704956 }, { "epoch": 7, "train_loss": 3.4064867937469483, "train_acc": 0.2019, "test_loss": 11.607983041381836, "test_acc": 0.0152, "lyapunov": 1.523884119280159, "grad_norm": 1.687138246958699, "grad_max_sv": 0.8869923338294029, "grad_min_sv": 3.151686688296351e-08, "grad_condition": 33789366.4765297, "lr": 0.000994636166481494, "time_sec": 41.84767436981201 }, { "epoch": 8, "train_loss": 3.434463021774292, "train_acc": 0.19834, "test_loss": 11.012699322509766, "test_acc": 0.0218, "lyapunov": 1.5377070940364048, "grad_norm": 1.5753285999803672, "grad_max_sv": 0.8568978801369667, "grad_min_sv": 2.9292211212172958e-08, "grad_condition": 38247647.23104979, "lr": 0.0009929980185352525, "time_sec": 41.83318567276001 }, { "epoch": 9, "train_loss": 3.4525474771118163, "train_acc": 0.19694, "test_loss": 13.244960899353027, "test_acc": 0.0188, "lyapunov": 1.5521414874459776, "grad_norm": 1.4910263576831584, "grad_max_sv": 0.7901037082076072, "grad_min_sv": 2.7871724133082115e-08, "grad_condition": 652853959.565771, "lr": 0.0009911436253643444, "time_sec": 41.85349941253662 }, { "epoch": 10, "train_loss": 3.4827073947906495, "train_acc": 0.19456, "test_loss": 13.097009005737304, "test_acc": 0.0142, "lyapunov": 1.54852739807285, "grad_norm": 1.3918276084929038, "grad_max_sv": 0.7072893396019936, "grad_min_sv": 2.5679541396095296e-08, "grad_condition": 39117704.605187416, "lr": 0.0009890738003669028, "time_sec": 41.853031635284424 }, { "epoch": 11, "train_loss": 3.502148910446167, "train_acc": 0.19276, "test_loss": 14.30014864807129, "test_acc": 0.0163, "lyapunov": 1.5574408672044955, "grad_norm": 1.3267443475145169, "grad_max_sv": 0.6856341227889061, "grad_min_sv": 2.4468690279499938e-08, "grad_condition": 36359188.54410316, "lr": 0.00098678945143658, "time_sec": 41.87047362327576 }, { "epoch": 12, "train_loss": 3.5455151155090334, "train_acc": 0.1879, "test_loss": 12.457445967102052, "test_acc": 0.0197, "lyapunov": 1.5671831793187525, "grad_norm": 1.2480528019241246, "grad_max_sv": 0.6239843934774398, "grad_min_sv": 2.3005261242953905e-08, "grad_condition": 526118663.91773003, "lr": 0.0009842915805643154, "time_sec": 41.888609409332275 }, { "epoch": 13, "train_loss": 3.6091552614593505, "train_acc": 0.17994, "test_loss": 12.732378463745118, "test_acc": 0.0121, "lyapunov": 1.568660382419596, "grad_norm": 1.1583490651743926, "grad_max_sv": 0.581366877257824, "grad_min_sv": 2.1129029859068282e-08, "grad_condition": 32416771.726506818, "lr": 0.000981581283398829, "time_sec": 41.91386127471924 }, { "epoch": 14, "train_loss": 3.791756629562378, "train_acc": 0.15402, "test_loss": 15.130843069458008, "test_acc": 0.0119, "lyapunov": 1.616871199034669, "grad_norm": 1.087286539710877, "grad_max_sv": 0.572893675416708, "grad_min_sv": 1.9829283692818224e-08, "grad_condition": 32374293.19268779, "lr": 0.0009786597487660333, "time_sec": 41.84876489639282 }, { "epoch": 15, "train_loss": 3.8399617958068846, "train_acc": 0.14724, "test_loss": 17.94291413269043, "test_acc": 0.0166, "lyapunov": 1.6528625835847977, "grad_norm": 1.0379429629839805, "grad_max_sv": 0.5574500106275082, "grad_min_sv": 1.8863349182662857e-08, "grad_condition": 39761225.70266014, "lr": 0.0009755282581475766, "time_sec": 41.82764172554016 }, { "epoch": 16, "train_loss": 3.8371740995025636, "train_acc": 0.15152, "test_loss": 13.5413774017334, "test_acc": 0.01, "lyapunov": 1.648486807218293, "grad_norm": 0.9596716866271199, "grad_max_sv": 0.5051649369299411, "grad_min_sv": 1.7647910632856423e-08, "grad_condition": 34020323.13172309, "lr": 0.0009721881851187403, "time_sec": 41.84924578666687 }, { "epoch": 17, "train_loss": 3.890597806930542, "train_acc": 0.14732, "test_loss": 14.242138269042968, "test_acc": 0.0132, "lyapunov": 1.6423247948936794, "grad_norm": 0.8982590539538886, "grad_max_sv": 0.46011053323745726, "grad_min_sv": 1.6221578684992576e-08, "grad_condition": 227922899.83540225, "lr": 0.0009686409947459456, "time_sec": 41.824068784713745 }, { "epoch": 18, "train_loss": 3.8945003430938723, "train_acc": 0.14424, "test_loss": 12.652154109191894, "test_acc": 0.009, "lyapunov": 1.6140738649441457, "grad_norm": 0.8509250568629757, "grad_max_sv": 0.4146191440522671, "grad_min_sv": 1.5334739790484608e-08, "grad_condition": 46249959.20615914, "lr": 0.0009648882429441254, "time_sec": 41.92591094970703 }, { "epoch": 19, "train_loss": 3.911494416732788, "train_acc": 0.14534, "test_loss": 10.313947262573242, "test_acc": 0.01, "lyapunov": 1.6057381596406708, "grad_norm": 0.8291056062070911, "grad_max_sv": 0.39902378544211387, "grad_min_sv": 1.5037980047316603e-08, "grad_condition": 51800842.237051465, "lr": 0.00096093157579425, "time_sec": 41.85994362831116 }, { "epoch": 20, "train_loss": 3.9858800520324706, "train_acc": 0.13508, "test_loss": 9.495584085083008, "test_acc": 0.0117, "lyapunov": 1.5699561761163385, "grad_norm": 0.8464930976238112, "grad_max_sv": 0.4136614315211773, "grad_min_sv": 1.490709049438779e-08, "grad_condition": 522735678.0721162, "lr": 0.0009567727288213001, "time_sec": 41.85805010795593 }, { "epoch": 21, "train_loss": 4.023155120925903, "train_acc": 0.12818, "test_loss": 10.004813737487792, "test_acc": 0.0135, "lyapunov": 1.5752095285888827, "grad_norm": 0.8291979613527221, "grad_max_sv": 0.38449598476290703, "grad_min_sv": 1.4266561158826629e-08, "grad_condition": 100203024.77550165, "lr": 0.0009524135262330095, "time_sec": 41.84737300872803 }, { "epoch": 22, "train_loss": 4.029212285461425, "train_acc": 0.12438, "test_loss": 12.173621334838867, "test_acc": 0.01, "lyapunov": 1.5598359254315077, "grad_norm": 0.7501647761926934, "grad_max_sv": 0.36557952016592027, "grad_min_sv": 1.3507705134974124e-08, "grad_condition": 32668036.703706127, "lr": 0.0009478558801197061, "time_sec": 41.83857583999634 }, { "epoch": 23, "train_loss": 4.038732503051758, "train_acc": 0.12626, "test_loss": 8.940043533325195, "test_acc": 0.011, "lyapunov": 1.5640881744492086, "grad_norm": 0.7404717741571084, "grad_max_sv": 0.36797516867518426, "grad_min_sv": 1.314027773258175e-08, "grad_condition": 31266761.905169785, "lr": 0.000943101789615607, "time_sec": 41.82795524597168 }, { "epoch": 24, "train_loss": 4.0988731300354, "train_acc": 0.11452, "test_loss": 12.849692756652832, "test_acc": 0.0107, "lyapunov": 1.550421966311267, "grad_norm": 0.7098563411237487, "grad_max_sv": 0.36257990449666977, "grad_min_sv": 1.25359189376284e-08, "grad_condition": 40983554.09727303, "lr": 0.0009381533400219313, "time_sec": 41.85472393035889 }, { "epoch": 25, "train_loss": 4.209664036712646, "train_acc": 0.09956, "test_loss": 13.292383435058595, "test_acc": 0.01, "lyapunov": 1.5532953726970935, "grad_norm": 0.6761784984779601, "grad_max_sv": 0.3498499631881714, "grad_min_sv": 1.1860140708419564e-08, "grad_condition": 35321140.57939846, "lr": 0.0009330127018922189, "time_sec": 41.83675241470337 }, { "epoch": 26, "train_loss": 4.387504685211182, "train_acc": 0.06822, "test_loss": 13.442844244384766, "test_acc": 0.01, "lyapunov": 1.5123424859303038, "grad_norm": 0.613666343544254, "grad_max_sv": 0.312596595287323, "grad_min_sv": 9.974056802697362e-09, "grad_condition": 73223482.84978306, "lr": 0.000927682130080253, "time_sec": 41.83025002479553 }, { "epoch": 27, "train_loss": 4.494176885528565, "train_acc": 0.0543, "test_loss": 11.84754227294922, "test_acc": 0.0094, "lyapunov": 1.4815948003393304, "grad_norm": 0.5747479343845562, "grad_max_sv": 0.3057863064110279, "grad_min_sv": 8.438247317554826e-09, "grad_condition": 38945619.0197791, "lr": 0.0009221639627510072, "time_sec": 41.84781360626221 }, { "epoch": 28, "train_loss": 4.46251156829834, "train_acc": 0.05616, "test_loss": 11.681759558105469, "test_acc": 0.01, "lyapunov": 1.4850436720396856, "grad_norm": 0.5367103881878276, "grad_max_sv": 0.27574604004621506, "grad_min_sv": 7.970707525950527e-09, "grad_condition": 43556131.981196605, "lr": 0.0009164606203550494, "time_sec": 41.85157370567322 }, { "epoch": 29, "train_loss": 4.478804314422607, "train_acc": 0.05546, "test_loss": 13.70535901184082, "test_acc": 0.01, "lyapunov": 1.4930339225417817, "grad_norm": 0.4922959043886969, "grad_max_sv": 0.26684653796255586, "grad_min_sv": 7.476301915054772e-09, "grad_condition": 50660877.44966361, "lr": 0.0009105746045668516, "time_sec": 41.84281659126282 }, { "epoch": 30, "train_loss": 4.461830242156982, "train_acc": 0.05732, "test_loss": 16.430956909179688, "test_acc": 0.01, "lyapunov": 1.4880318653857922, "grad_norm": 0.463062312015885, "grad_max_sv": 0.24580183289945126, "grad_min_sv": 6.99083638443232e-09, "grad_condition": 91544069.9810532, "lr": 0.0009045084971874733, "time_sec": 41.85340070724487 }, { "epoch": 31, "train_loss": 4.449828500366211, "train_acc": 0.06014, "test_loss": 16.980024148559572, "test_acc": 0.01, "lyapunov": 1.515285712068953, "grad_norm": 0.46991707412670536, "grad_max_sv": 0.24059981070458888, "grad_min_sv": 7.035010417960619e-09, "grad_condition": 75974624.60279362, "lr": 0.0008982649590120977, "time_sec": 41.8510844707489 }, { "epoch": 32, "train_loss": 4.437514468383789, "train_acc": 0.06294, "test_loss": 18.52886298980713, "test_acc": 0.01, "lyapunov": 1.5204427940461336, "grad_norm": 0.45125734819245583, "grad_max_sv": 0.22053336799144746, "grad_min_sv": 6.6175200534590585e-09, "grad_condition": 48917947.725726604, "lr": 0.0008918467286629196, "time_sec": 41.869179248809814 }, { "epoch": 33, "train_loss": 4.40278786529541, "train_acc": 0.06556, "test_loss": 18.846385064697266, "test_acc": 0.01, "lyapunov": 1.4883441946390645, "grad_norm": 0.45666973025646995, "grad_max_sv": 0.21949558071792125, "grad_min_sv": 6.802780549985954e-09, "grad_condition": 36143230.241273426, "lr": 0.0008852566213878943, "time_sec": 41.84911870956421 }, { "epoch": 34, "train_loss": 4.40820367401123, "train_acc": 0.06462, "test_loss": 20.250594232177736, "test_acc": 0.01, "lyapunov": 1.4780629108019192, "grad_norm": 0.4533983560833586, "grad_max_sv": 0.21924315206706524, "grad_min_sv": 6.449878905967488e-09, "grad_condition": 45022497.55124281, "lr": 0.000878497527825878, "time_sec": 41.82957434654236 }, { "epoch": 35, "train_loss": 4.416326632080078, "train_acc": 0.06346, "test_loss": 18.319365844726562, "test_acc": 0.01, "lyapunov": 1.4840021791970333, "grad_norm": 0.44153691028523245, "grad_max_sv": 0.20659824572503566, "grad_min_sv": 6.229376612806869e-09, "grad_condition": 59088146.05455335, "lr": 0.000871572412738697, "time_sec": 41.850478410720825 }, { "epoch": 36, "train_loss": 4.408258157043457, "train_acc": 0.064, "test_loss": 20.95832971191406, "test_acc": 0.01, "lyapunov": 1.479226511152809, "grad_norm": 0.4410718020248668, "grad_max_sv": 0.2093581147491932, "grad_min_sv": 6.282209370940539e-09, "grad_condition": 105188788.23632967, "lr": 0.0008644843137107055, "time_sec": 41.878541469573975 }, { "epoch": 37, "train_loss": 4.407336394348144, "train_acc": 0.06656, "test_loss": 16.102902310180664, "test_acc": 0.01, "lyapunov": 1.4862678380268615, "grad_norm": 0.44349953997935043, "grad_max_sv": 0.215363934263587, "grad_min_sv": 6.384406239789975e-09, "grad_condition": 37599506.61324627, "lr": 0.0008572363398164014, "time_sec": 41.84441637992859 }, { "epoch": 38, "train_loss": 4.39930072052002, "train_acc": 0.06716, "test_loss": 14.936711614990234, "test_acc": 0.01, "lyapunov": 1.4831183868296005, "grad_norm": 0.45835307206344844, "grad_max_sv": 0.22024714946746826, "grad_min_sv": 6.405372059842263e-09, "grad_condition": 66702014.21939925, "lr": 0.0008498316702566826, "time_sec": 41.848416805267334 }, { "epoch": 39, "train_loss": 4.400538181915283, "train_acc": 0.06598, "test_loss": 16.468564752197267, "test_acc": 0.01, "lyapunov": 1.4876915777430815, "grad_norm": 0.4485664393328264, "grad_max_sv": 0.22156519442796707, "grad_min_sv": 6.4785729367994316e-09, "grad_condition": 280429030.69459355, "lr": 0.0008422735529643442, "time_sec": 41.86299443244934 }, { "epoch": 40, "train_loss": 4.397091385955811, "train_acc": 0.06734, "test_loss": 18.54481873931885, "test_acc": 0.01, "lyapunov": 1.4808301129914305, "grad_norm": 0.4299005955382572, "grad_max_sv": 0.2034155208617449, "grad_min_sv": 6.2005965799361015e-09, "grad_condition": 44401112.87668381, "lr": 0.0008345653031794289, "time_sec": 41.8275043964386 }, { "epoch": 41, "train_loss": 4.386424259796143, "train_acc": 0.06824, "test_loss": 21.206073614501953, "test_acc": 0.01, "lyapunov": 1.4804525152801553, "grad_norm": 0.4248718447548538, "grad_max_sv": 0.20124743394553662, "grad_min_sv": 6.046653282243408e-09, "grad_condition": 40043238.334212705, "lr": 0.0008267103019950526, "time_sec": 41.85425305366516 }, { "epoch": 42, "train_loss": 4.386167093048096, "train_acc": 0.0676, "test_loss": 19.16770219116211, "test_acc": 0.01, "lyapunov": 1.4792915119234558, "grad_norm": 0.4093890186492107, "grad_max_sv": 0.1878580778837204, "grad_min_sv": 5.876780584390673e-09, "grad_condition": 44144026.50569831, "lr": 0.0008187119948743447, "time_sec": 41.865527868270874 }, { "epoch": 43, "train_loss": 4.397055397033691, "train_acc": 0.06784, "test_loss": 18.22021773529053, "test_acc": 0.01, "lyapunov": 1.4911047723287207, "grad_norm": 0.42408941793691435, "grad_max_sv": 0.1856762148439884, "grad_min_sv": 5.8528611551061925e-09, "grad_condition": 150471528.47198898, "lr": 0.000810573890139155, "time_sec": 41.851991176605225 }, { "epoch": 44, "train_loss": 4.418051720123291, "train_acc": 0.06534, "test_loss": 18.890657635498048, "test_acc": 0.01, "lyapunov": 1.506059860634377, "grad_norm": 0.41379860519627926, "grad_max_sv": 0.1912920583039522, "grad_min_sv": 5.7118770109554354e-09, "grad_condition": 70799416.84221649, "lr": 0.0008022995574311873, "time_sec": 41.855762004852295 }, { "epoch": 45, "train_loss": 4.555874091186523, "train_acc": 0.05074, "test_loss": 16.445907543945314, "test_acc": 0.01, "lyapunov": 1.5668693082716765, "grad_norm": 0.421064301771623, "grad_max_sv": 0.20280106514692306, "grad_min_sv": 5.1596785455299e-09, "grad_condition": 50522308.14501454, "lr": 0.0007938926261462363, "time_sec": 41.843982219696045 }, { "epoch": 46, "train_loss": 4.56307541015625, "train_acc": 0.04834, "test_loss": 15.170621519470215, "test_acc": 0.01, "lyapunov": 1.5478406470754873, "grad_norm": 0.4022239019959698, "grad_max_sv": 0.20177871510386466, "grad_min_sv": 4.925644440934018e-09, "grad_condition": 51504299.42247386, "lr": 0.0007853567838422158, "time_sec": 41.843809366226196 }, { "epoch": 47, "train_loss": 4.461052338867187, "train_acc": 0.06168, "test_loss": 13.590689770507813, "test_acc": 0.01, "lyapunov": 1.539207870698036, "grad_norm": 0.39483180875809476, "grad_max_sv": 0.18038341253995896, "grad_min_sv": 5.225175523509984e-09, "grad_condition": 48416053.199461475, "lr": 0.0007766957746216719, "time_sec": 41.86233711242676 }, { "epoch": 48, "train_loss": 4.483129704589844, "train_acc": 0.06082, "test_loss": 15.866412992858887, "test_acc": 0.01, "lyapunov": 1.5564451214602537, "grad_norm": 0.4001213731670661, "grad_max_sv": 0.17479643113911153, "grad_min_sv": 4.983967312466309e-09, "grad_condition": 45597451.14778058, "lr": 0.0007679133974894982, "time_sec": 41.860371828079224 }, { "epoch": 49, "train_loss": 4.563996811523437, "train_acc": 0.05704, "test_loss": 14.467741319274902, "test_acc": 0.01, "lyapunov": 1.7151714895692323, "grad_norm": 0.35765858704843245, "grad_max_sv": 0.17724147401750087, "grad_min_sv": 4.611558551666846e-09, "grad_condition": 3652674833.016098, "lr": 0.000759013504686565, "time_sec": 41.88652062416077 }, { "epoch": 50, "train_loss": 4.699548272705078, "train_acc": 0.04798, "test_loss": 14.650819215393067, "test_acc": 0.01, "lyapunov": 1.8773073610442375, "grad_norm": 0.3237139765922586, "grad_max_sv": 0.18019139617681504, "grad_min_sv": 4.004119223688374e-09, "grad_condition": 56553030.085173145, "lr": 0.0007499999999999998, "time_sec": 41.8651602268219 }, { "epoch": 51, "train_loss": 4.856528885040283, "train_acc": 0.01108, "test_loss": 13.696816278076172, "test_acc": 0.01, "lyapunov": 1.4683626176756057, "grad_norm": 0.238328597603378, "grad_max_sv": 0.17753527872264385, "grad_min_sv": 2.2218590706860787e-10, "grad_condition": 124996343340.03922, "lr": 0.0007408768370508575, "time_sec": 41.89140796661377 }, { "epoch": 52, "train_loss": 4.859013377990722, "train_acc": 0.0091, "test_loss": 13.624913540649414, "test_acc": 0.01, "lyapunov": 1.465970806453539, "grad_norm": 0.16106795495349294, "grad_max_sv": 0.1110096687451005, "grad_min_sv": 6.2731757239434485e-15, "grad_condition": 110304236489.90335, "lr": 0.0007316480175599307, "time_sec": 41.900989294052124 }, { "epoch": 53, "train_loss": 4.851568754730224, "train_acc": 0.00906, "test_loss": 15.073454458618164, "test_acc": 0.01, "lyapunov": 1.456499196684269, "grad_norm": 0.1430055471916021, "grad_max_sv": 0.09564914535731077, "grad_min_sv": 1.5236447104070445e-15, "grad_condition": 95502112628.56236, "lr": 0.0007223175895924635, "time_sec": 41.87765717506409 }, { "epoch": 54, "train_loss": 4.851486787261963, "train_acc": 0.0096, "test_loss": 15.396797889709473, "test_acc": 0.01, "lyapunov": 1.4582891162399136, "grad_norm": 0.1275918494558622, "grad_max_sv": 0.07877833610400557, "grad_min_sv": 1.1071724086990746e-23, "grad_condition": 78778336103.16934, "lr": 0.0007128896457825361, "time_sec": 41.84445524215698 }, { "epoch": 55, "train_loss": 4.850928226623535, "train_acc": 0.00872, "test_loss": 14.606024462890625, "test_acc": 0.01, "lyapunov": 1.4591175653135684, "grad_norm": 0.12323118676067203, "grad_max_sv": 0.07178116273134946, "grad_min_sv": 2.5052708059998736e-20, "grad_condition": 71781161032.94218, "lr": 0.0007033683215378998, "time_sec": 41.84666895866394 }, { "epoch": 56, "train_loss": 4.852352551269531, "train_acc": 0.0098, "test_loss": 14.902420947265625, "test_acc": 0.01, "lyapunov": 1.4618816878789527, "grad_norm": 0.114352449118403, "grad_max_sv": 0.06100161336362362, "grad_min_sv": 6.896960539960325e-27, "grad_condition": 61001613363.62309, "lr": 0.0006937577932260512, "time_sec": 41.880367279052734 }, { "epoch": 57, "train_loss": 4.852858272247315, "train_acc": 0.01102, "test_loss": 14.057881980895996, "test_acc": 0.01, "lyapunov": 1.4654078419556094, "grad_norm": 0.10881533107486291, "grad_max_sv": 0.05331473303958774, "grad_min_sv": 1.4012984643248171e-46, "grad_condition": 53314733039.58773, "lr": 0.0006840622763423388, "time_sec": 41.84727120399475 }, { "epoch": 58, "train_loss": 4.851343263397217, "train_acc": 0.01044, "test_loss": 14.620996353149414, "test_acc": 0.01, "lyapunov": 1.4605532884597778, "grad_norm": 0.11574598071345925, "grad_max_sv": 0.06319006895646453, "grad_min_sv": 2.802712535772941e-41, "grad_condition": 63190068956.46452, "lr": 0.0006742860236609073, "time_sec": 41.8674533367157 }, { "epoch": 59, "train_loss": 4.852657847747802, "train_acc": 0.0102, "test_loss": 14.391234281921387, "test_acc": 0.01, "lyapunov": 1.4630218619275885, "grad_norm": 0.1117850897535104, "grad_max_sv": 0.057737766206264494, "grad_min_sv": 8.962900509942182e-33, "grad_condition": 57737766206.2645, "lr": 0.0006644333233692913, "time_sec": 41.853941679000854 }, { "epoch": 60, "train_loss": 4.851071483917236, "train_acc": 0.00948, "test_loss": 14.590808624267579, "test_acc": 0.01, "lyapunov": 1.4618642052726063, "grad_norm": 0.10400000692897449, "grad_max_sv": 0.04577720589004457, "grad_min_sv": 0.0, "grad_condition": 45777205890.04457, "lr": 0.0006545084971874734, "time_sec": 41.848552227020264 }, { "epoch": 61, "train_loss": 4.852240568084717, "train_acc": 0.0095, "test_loss": 14.59047717590332, "test_acc": 0.01, "lyapunov": 1.4638908500866512, "grad_norm": 0.10799934715249591, "grad_max_sv": 0.05035868901759386, "grad_min_sv": 0.0, "grad_condition": 50358689017.59386, "lr": 0.0006445158984722354, "time_sec": 41.850308418273926 }, { "epoch": 62, "train_loss": 4.852433279266357, "train_acc": 0.01012, "test_loss": 15.986171211242675, "test_acc": 0.01, "lyapunov": 1.4649500645639952, "grad_norm": 0.10733331744324738, "grad_max_sv": 0.05229583606123924, "grad_min_sv": 0.0, "grad_condition": 52295836061.23924, "lr": 0.0006344599103076324, "time_sec": 41.855886936187744 }, { "epoch": 63, "train_loss": 4.85242006362915, "train_acc": 0.00952, "test_loss": 13.999450773620605, "test_acc": 0.01, "lyapunov": 1.4631946355180667, "grad_norm": 0.10887508886634635, "grad_max_sv": 0.05549173932522535, "grad_min_sv": 0.0, "grad_condition": 55491739325.22536, "lr": 0.0006243449435824269, "time_sec": 41.875603675842285 }, { "epoch": 64, "train_loss": 4.852031197509765, "train_acc": 0.00988, "test_loss": 13.823671005249023, "test_acc": 0.01, "lyapunov": 1.46498492947015, "grad_norm": 0.10631816229605466, "grad_max_sv": 0.050992762017995116, "grad_min_sv": 0.0, "grad_condition": 50992762017.99512, "lr": 0.0006141754350553275, "time_sec": 41.84609389305115 }, { "epoch": 65, "train_loss": 4.851191096801758, "train_acc": 0.01018, "test_loss": 13.375173307800292, "test_acc": 0.01, "lyapunov": 1.4641655095093085, "grad_norm": 0.1010577343573765, "grad_max_sv": 0.042480578925460574, "grad_min_sv": 0.0, "grad_condition": 42480578925.46058, "lr": 0.0006039558454088793, "time_sec": 41.83738660812378 }, { "epoch": 66, "train_loss": 4.852197050323486, "train_acc": 0.00882, "test_loss": 14.165961294555665, "test_acc": 0.01, "lyapunov": 1.4664015864472255, "grad_norm": 0.09792907198844746, "grad_max_sv": 0.036209277296438816, "grad_min_sv": 0.0, "grad_condition": 36209277296.43882, "lr": 0.000593690657292862, "time_sec": 41.797043323516846 }, { "epoch": 67, "train_loss": 4.85130561340332, "train_acc": 0.0101, "test_loss": 14.011718264770508, "test_acc": 0.01, "lyapunov": 1.4650892686965826, "grad_norm": 0.09456101481889781, "grad_max_sv": 0.02113236514851451, "grad_min_sv": 0.0, "grad_condition": 21132365148.514507, "lr": 0.0005833843733580507, "time_sec": 41.754011154174805 }, { "epoch": 68, "train_loss": 4.852421583099365, "train_acc": 0.00954, "test_loss": 13.768776727294922, "test_acc": 0.01, "lyapunov": 1.4679525093654233, "grad_norm": 0.09464764660731555, "grad_max_sv": 0.025787328323349356, "grad_min_sv": 0.0, "grad_condition": 25787328323.349358, "lr": 0.0005730415142812054, "time_sec": 42.026938676834106 }, { "epoch": 69, "train_loss": 4.85272935760498, "train_acc": 0.00984, "test_loss": 13.534171914672852, "test_acc": 0.01, "lyapunov": 1.4685536226653078, "grad_norm": 0.09557086506346626, "grad_max_sv": 0.026282459730282426, "grad_min_sv": 0.0, "grad_condition": 26282459730.282425, "lr": 0.0005626666167821517, "time_sec": 41.802675008773804 }, { "epoch": 70, "train_loss": 4.851980906524658, "train_acc": 0.01004, "test_loss": 13.33881396484375, "test_acc": 0.01, "lyapunov": 1.4669674391026997, "grad_norm": 0.09715157690608033, "grad_max_sv": 0.03565134848468006, "grad_min_sv": 0.0, "grad_condition": 35651348484.68006, "lr": 0.0005522642316338265, "time_sec": 41.813010931015015 }, { "epoch": 71, "train_loss": 4.85278720413208, "train_acc": 0.01006, "test_loss": 12.802179231262206, "test_acc": 0.01, "lyapunov": 1.468117561791559, "grad_norm": 0.09992948652871142, "grad_max_sv": 0.03685425859875977, "grad_min_sv": 0.0, "grad_condition": 36854258598.759766, "lr": 0.0005418389216661573, "time_sec": 41.84488320350647 }, { "epoch": 72, "train_loss": 4.851398905639648, "train_acc": 0.00926, "test_loss": 13.120699348449707, "test_acc": 0.01, "lyapunov": 1.4663349237588361, "grad_norm": 0.0922810139338614, "grad_max_sv": 0.021838864544406533, "grad_min_sv": 0.0, "grad_condition": 21838864544.406532, "lr": 0.0005313952597646563, "time_sec": 41.80693006515503 }, { "epoch": 73, "train_loss": 4.852625637207031, "train_acc": 0.01006, "test_loss": 14.170262338256835, "test_acc": 0.01, "lyapunov": 1.4684231619700752, "grad_norm": 0.09725476129415889, "grad_max_sv": 0.03474617879837751, "grad_min_sv": 0.0, "grad_condition": 34746178798.37752, "lr": 0.0005209378268645994, "time_sec": 41.80283856391907 }, { "epoch": 74, "train_loss": 4.854615002288818, "train_acc": 0.01012, "test_loss": 13.06523247833252, "test_acc": 0.01, "lyapunov": 1.4741113576132927, "grad_norm": 0.09355435634576315, "grad_max_sv": 0.026293953135609626, "grad_min_sv": 0.0, "grad_condition": 26293953135.609627, "lr": 0.0005104712099416781, "time_sec": 41.77813935279846 }, { "epoch": 75, "train_loss": 4.8521118782043455, "train_acc": 0.01014, "test_loss": 13.227028475952148, "test_acc": 0.01, "lyapunov": 1.4683185632881302, "grad_norm": 0.09873531057612077, "grad_max_sv": 0.029217457259073855, "grad_min_sv": 0.0, "grad_condition": 29217457259.073853, "lr": 0.0004999999999999996, "time_sec": 41.80186319351196 }, { "epoch": 76, "train_loss": 4.8521026638793945, "train_acc": 0.00974, "test_loss": 13.727623275756835, "test_acc": 0.01, "lyapunov": 1.4683916117529126, "grad_norm": 0.09359089364340291, "grad_max_sv": 0.019284735713154078, "grad_min_sv": 0.0, "grad_condition": 19284735713.154076, "lr": 0.0004895287900583212, "time_sec": 41.79860997200012 }, { "epoch": 77, "train_loss": 4.85240275100708, "train_acc": 0.00924, "test_loss": 13.845351657104493, "test_acc": 0.01, "lyapunov": 1.469331070285319, "grad_norm": 0.09291177556896672, "grad_max_sv": 0.02184786768630147, "grad_min_sv": 0.0, "grad_condition": 21847867686.30147, "lr": 0.0004790621731353997, "time_sec": 41.78152871131897 }, { "epoch": 78, "train_loss": 4.853202556762695, "train_acc": 0.0094, "test_loss": 12.943718765258788, "test_acc": 0.01, "lyapunov": 1.4710808498475252, "grad_norm": 0.09560356806636944, "grad_max_sv": 0.024571862118318678, "grad_min_sv": 0.0, "grad_condition": 24571862118.318676, "lr": 0.000468604740235343, "time_sec": 41.800830364227295 }, { "epoch": 79, "train_loss": 4.852821475524903, "train_acc": 0.00916, "test_loss": 13.06967273864746, "test_acc": 0.01, "lyapunov": 1.4714962222691996, "grad_norm": 0.09286348407291162, "grad_max_sv": 0.01579846618697047, "grad_min_sv": 0.0, "grad_condition": 15798466186.97047, "lr": 0.00045816107833384175, "time_sec": 41.79053092002869 }, { "epoch": 80, "train_loss": 4.852609764556885, "train_acc": 0.00954, "test_loss": 13.320957052612306, "test_acc": 0.01, "lyapunov": 1.4709682016421461, "grad_norm": 0.09107911624268931, "grad_max_sv": 0.013279847288504242, "grad_min_sv": 0.0, "grad_condition": 13279847288.504242, "lr": 0.0004477357683661729, "time_sec": 41.762046813964844 }, { "epoch": 81, "train_loss": 4.851465040130615, "train_acc": 0.00952, "test_loss": 13.012565188598632, "test_acc": 0.01, "lyapunov": 1.468221844004853, "grad_norm": 0.09041003134861456, "grad_max_sv": 0.007651371089741588, "grad_min_sv": 0.0, "grad_condition": 7651371089.741588, "lr": 0.00043733338321784746, "time_sec": 41.751330614089966 }, { "epoch": 82, "train_loss": 4.852081020355224, "train_acc": 0.00966, "test_loss": 12.822627255249023, "test_acc": 0.01, "lyapunov": 1.4696848944324972, "grad_norm": 0.09065480177880879, "grad_max_sv": 0.01019995305687189, "grad_min_sv": 0.0, "grad_condition": 10199953056.871891, "lr": 0.0004269584857187939, "time_sec": 41.86999726295471 }, { "epoch": 83, "train_loss": 4.852022810516358, "train_acc": 0.00996, "test_loss": 12.253762084960938, "test_acc": 0.01, "lyapunov": 1.4689973016529132, "grad_norm": 0.09460842094540753, "grad_max_sv": 0.029235992394387723, "grad_min_sv": 0.0, "grad_condition": 29235992394.38772, "lr": 0.0004166156266419484, "time_sec": 41.76723504066467 }, { "epoch": 84, "train_loss": 4.852035647277832, "train_acc": 0.01024, "test_loss": 12.115891886901855, "test_acc": 0.01, "lyapunov": 1.4691770165167806, "grad_norm": 0.09360646750239629, "grad_max_sv": 0.019934501592069866, "grad_min_sv": 0.0, "grad_condition": 19934501592.069862, "lr": 0.0004063093427071373, "time_sec": 41.82295870780945 }, { "epoch": 85, "train_loss": 4.852076805419922, "train_acc": 0.00986, "test_loss": 12.878702352905274, "test_acc": 0.01, "lyapunov": 1.4699803453577145, "grad_norm": 0.09050948837033777, "grad_max_sv": 0.010260828444734216, "grad_min_sv": 0.0, "grad_condition": 10260828444.734217, "lr": 0.0003960441545911199, "time_sec": 41.740272521972656 }, { "epoch": 86, "train_loss": 4.853503344268799, "train_acc": 0.00942, "test_loss": 13.130225515747071, "test_acc": 0.01, "lyapunov": 1.473677592204355, "grad_norm": 0.08911124738850405, "grad_max_sv": 0.0034935059491544964, "grad_min_sv": 0.0, "grad_condition": 3493505949.154496, "lr": 0.0003858245649446718, "time_sec": 41.71459937095642 }, { "epoch": 87, "train_loss": 4.852846223449707, "train_acc": 0.0098, "test_loss": 13.668508865356445, "test_acc": 0.01, "lyapunov": 1.4720799718671442, "grad_norm": 0.09028155404620607, "grad_max_sv": 0.008756613591685891, "grad_min_sv": 0.0, "grad_condition": 8756613591.685892, "lr": 0.00037565505641757235, "time_sec": 41.74625873565674 }, { "epoch": 88, "train_loss": 4.852147266693115, "train_acc": 0.01, "test_loss": 13.016764665222167, "test_acc": 0.01, "lyapunov": 1.4709450503444428, "grad_norm": 0.08907329873744592, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00036554008969236695, "time_sec": 41.72583556175232 }, { "epoch": 89, "train_loss": 4.854143925933838, "train_acc": 0.00968, "test_loss": 13.080362130737305, "test_acc": 0.01, "lyapunov": 1.4749400249832427, "grad_norm": 0.09887236057674029, "grad_max_sv": 0.017000502441078424, "grad_min_sv": 0.0, "grad_condition": 17000502441.078424, "lr": 0.0003554841015277638, "time_sec": 41.776273250579834 }, { "epoch": 90, "train_loss": 4.852338234405518, "train_acc": 0.00894, "test_loss": 13.206872094726563, "test_acc": 0.01, "lyapunov": 1.470992279784454, "grad_norm": 0.08990915500150026, "grad_max_sv": 0.004822738515213132, "grad_min_sv": 0.0, "grad_condition": 4822738515.213132, "lr": 0.000345491502812526, "time_sec": 41.74059700965881 }, { "epoch": 91, "train_loss": 4.854439675140381, "train_acc": 0.0098, "test_loss": 13.193742947387696, "test_acc": 0.01, "lyapunov": 1.4752069266555865, "grad_norm": 0.09195463137068469, "grad_max_sv": 0.016309724561870097, "grad_min_sv": 0.0, "grad_condition": 16309724561.870098, "lr": 0.0003355666766307081, "time_sec": 41.72685122489929 }, { "epoch": 92, "train_loss": 4.852755132141113, "train_acc": 0.00966, "test_loss": 12.651437782287598, "test_acc": 0.01, "lyapunov": 1.4722728369485996, "grad_norm": 0.09031090314491075, "grad_max_sv": 0.013889235025271774, "grad_min_sv": 0.0, "grad_condition": 13889235025.27177, "lr": 0.00032571397633909225, "time_sec": 41.76129865646362 }, { "epoch": 93, "train_loss": 4.852394995727539, "train_acc": 0.00978, "test_loss": 13.140398934936524, "test_acc": 0.01, "lyapunov": 1.4706439609112947, "grad_norm": 0.09896021199497843, "grad_max_sv": 0.012632346572354436, "grad_min_sv": 0.0, "grad_condition": 12632346572.354437, "lr": 0.00031593772365766094, "time_sec": 41.7473201751709 }, { "epoch": 94, "train_loss": 4.853237281036377, "train_acc": 0.00878, "test_loss": 12.807959544372558, "test_acc": 0.01, "lyapunov": 1.4736966973985248, "grad_norm": 0.09036941229411612, "grad_max_sv": 0.008218426816165447, "grad_min_sv": 0.0, "grad_condition": 8218426816.165448, "lr": 0.0003062422067739483, "time_sec": 41.732847452163696 }, { "epoch": 95, "train_loss": 4.852389494171143, "train_acc": 0.00908, "test_loss": 12.560802192687989, "test_acc": 0.01, "lyapunov": 1.471325798412723, "grad_norm": 0.08925054999698791, "grad_max_sv": 0.00795787493698299, "grad_min_sv": 0.0, "grad_condition": 7957874936.982989, "lr": 0.00029663167846209965, "time_sec": 41.743444204330444 }, { "epoch": 96, "train_loss": 4.852095717926026, "train_acc": 0.00964, "test_loss": 12.698743003845214, "test_acc": 0.01, "lyapunov": 1.4707305251484941, "grad_norm": 0.08980211873044659, "grad_max_sv": 0.006079048849642277, "grad_min_sv": 0.0, "grad_condition": 6079048849.642277, "lr": 0.00028711035421746345, "time_sec": 41.744508266448975 }, { "epoch": 97, "train_loss": 4.852325097198486, "train_acc": 0.00998, "test_loss": 12.385714389038085, "test_acc": 0.01, "lyapunov": 1.4707067143886596, "grad_norm": 0.09303110633276697, "grad_max_sv": 0.013369420357048512, "grad_min_sv": 0.0, "grad_condition": 13369420357.048512, "lr": 0.00027768241040753615, "time_sec": 41.777459383010864 }, { "epoch": 98, "train_loss": 4.852114578399658, "train_acc": 0.00946, "test_loss": 12.616465420532226, "test_acc": 0.01, "lyapunov": 1.4709890193646522, "grad_norm": 0.08982717043210414, "grad_max_sv": 0.011742619890719652, "grad_min_sv": 0.0, "grad_condition": 11742619890.719652, "lr": 0.00026835198244006903, "time_sec": 41.74090838432312 }, { "epoch": 99, "train_loss": 4.852081492767334, "train_acc": 0.00914, "test_loss": 12.773276670837403, "test_acc": 0.01, "lyapunov": 1.4708703545963062, "grad_norm": 0.08820725715813042, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002591231629491421, "time_sec": 41.70957374572754 }, { "epoch": 100, "train_loss": 4.852057821807861, "train_acc": 0.00854, "test_loss": 12.903013801574707, "test_acc": 0.01, "lyapunov": 1.470713365718227, "grad_norm": 0.08831333485556404, "grad_max_sv": 0.001176884165033698, "grad_min_sv": 0.0, "grad_condition": 1176884165.033698, "lr": 0.0002499999999999997, "time_sec": 41.70664095878601 }, { "epoch": 101, "train_loss": 4.852297632446289, "train_acc": 0.0088, "test_loss": 12.991321166992188, "test_acc": 0.01, "lyapunov": 1.471470196838574, "grad_norm": 0.08844546443228318, "grad_max_sv": 0.0007792085409164429, "grad_min_sv": 0.0, "grad_condition": 779208540.9164429, "lr": 0.00024098649531343477, "time_sec": 41.72946095466614 }, { "epoch": 102, "train_loss": 4.85340077835083, "train_acc": 0.00928, "test_loss": 12.494372912597656, "test_acc": 0.01, "lyapunov": 1.4734248584493652, "grad_norm": 0.0904122316991309, "grad_max_sv": 0.01403848035261035, "grad_min_sv": 0.0, "grad_condition": 14038480352.610352, "lr": 0.0002320866025105016, "time_sec": 41.72011160850525 }, { "epoch": 103, "train_loss": 4.8527667138671875, "train_acc": 0.00854, "test_loss": 13.111592295837402, "test_acc": 0.01, "lyapunov": 1.4726007445084164, "grad_norm": 0.08932121120200033, "grad_max_sv": 0.004739455413073301, "grad_min_sv": 0.0, "grad_condition": 4739455413.073301, "lr": 0.0002233042253783278, "time_sec": 41.74779987335205 }, { "epoch": 104, "train_loss": 4.852004501037598, "train_acc": 0.00946, "test_loss": 12.720405123901367, "test_acc": 0.01, "lyapunov": 1.4705228412242801, "grad_norm": 0.08860158464501969, "grad_max_sv": 0.006343359779566527, "grad_min_sv": 0.0, "grad_condition": 6343359779.566526, "lr": 0.000214643216157784, "time_sec": 41.75279927253723 }, { "epoch": 105, "train_loss": 4.852732130584717, "train_acc": 0.00936, "test_loss": 12.728569932556152, "test_acc": 0.01, "lyapunov": 1.4726796906317592, "grad_norm": 0.08858840001436137, "grad_max_sv": 0.0021229078993201256, "grad_min_sv": 0.0, "grad_condition": 2122907899.3201256, "lr": 0.00020610737385376332, "time_sec": 41.71723484992981 }, { "epoch": 106, "train_loss": 4.852207695922852, "train_acc": 0.00926, "test_loss": 12.709718621826172, "test_acc": 0.01, "lyapunov": 1.4712865084333493, "grad_norm": 0.08830963721683445, "grad_max_sv": 0.0027129428926855326, "grad_min_sv": 0.0, "grad_condition": 2712942892.6855326, "lr": 0.00019770044256881242, "time_sec": 41.71148443222046 }, { "epoch": 107, "train_loss": 4.85225803314209, "train_acc": 0.00982, "test_loss": 12.837951531982421, "test_acc": 0.01, "lyapunov": 1.4712638537902052, "grad_norm": 0.08902472521530928, "grad_max_sv": 0.008135201036930084, "grad_min_sv": 0.0, "grad_condition": 8135201036.930084, "lr": 0.0001894261098608447, "time_sec": 41.72528624534607 }, { "epoch": 108, "train_loss": 4.852549499511719, "train_acc": 0.00936, "test_loss": 13.247559573364258, "test_acc": 0.01, "lyapunov": 1.4724893740680822, "grad_norm": 0.08825387718460724, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000181288005125655, "time_sec": 41.74774885177612 }, { "epoch": 109, "train_loss": 4.85227595916748, "train_acc": 0.00946, "test_loss": 13.13632116241455, "test_acc": 0.01, "lyapunov": 1.471560059910845, "grad_norm": 0.08956498900691849, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001732896980049473, "time_sec": 41.7323522567749 }, { "epoch": 110, "train_loss": 4.852233708801269, "train_acc": 0.00902, "test_loss": 13.550802612304688, "test_acc": 0.01, "lyapunov": 1.4712924996910193, "grad_norm": 0.08901901086212888, "grad_max_sv": 0.004322580248117447, "grad_min_sv": 0.0, "grad_condition": 4322580248.117447, "lr": 0.00016543469682057076, "time_sec": 41.74680209159851 }, { "epoch": 111, "train_loss": 4.852689293060303, "train_acc": 0.00916, "test_loss": 13.372785118103028, "test_acc": 0.01, "lyapunov": 1.4729326292681877, "grad_norm": 0.08862372209724671, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015772644703565552, "time_sec": 41.72367000579834 }, { "epoch": 112, "train_loss": 4.855245245056152, "train_acc": 0.00918, "test_loss": 13.167806037902832, "test_acc": 0.01, "lyapunov": 1.4768958594792945, "grad_norm": 0.08841785458131039, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015016832974331713, "time_sec": 41.73188829421997 }, { "epoch": 113, "train_loss": 4.852458833618164, "train_acc": 0.00882, "test_loss": 13.374362356567383, "test_acc": 0.01, "lyapunov": 1.4722495371728297, "grad_norm": 0.08871568614447918, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00014276366018359834, "time_sec": 41.71817493438721 }, { "epoch": 114, "train_loss": 4.851942072448731, "train_acc": 0.00902, "test_loss": 13.413740673828125, "test_acc": 0.01, "lyapunov": 1.4704074313878404, "grad_norm": 0.08870214010553126, "grad_max_sv": 0.0019620250910520553, "grad_min_sv": 0.0, "grad_condition": 1962025091.0520554, "lr": 0.00013551568628929425, "time_sec": 41.72637939453125 }, { "epoch": 115, "train_loss": 4.853842346343994, "train_acc": 0.00876, "test_loss": 13.078753887939452, "test_acc": 0.01, "lyapunov": 1.4757750683733264, "grad_norm": 0.08934074054242225, "grad_max_sv": 0.0054347761906683445, "grad_min_sv": 0.0, "grad_condition": 5434776190.6683445, "lr": 0.00012842758726130276, "time_sec": 41.711642265319824 }, { "epoch": 116, "train_loss": 4.852122984466552, "train_acc": 0.0092, "test_loss": 13.219519885253906, "test_acc": 0.01, "lyapunov": 1.4712010920809968, "grad_norm": 0.08808712563631747, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001215024721741218, "time_sec": 41.74567747116089 }, { "epoch": 117, "train_loss": 4.8583870220947265, "train_acc": 0.00938, "test_loss": 13.296599545288085, "test_acc": 0.01, "lyapunov": 1.4836899404940398, "grad_norm": 0.08878474499083394, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210538, "time_sec": 41.72996282577515 }, { "epoch": 118, "train_loss": 4.8542758628845215, "train_acc": 0.0095, "test_loss": 13.232178741455078, "test_acc": 0.01, "lyapunov": 1.476102854284789, "grad_norm": 0.08869739853760654, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010815327133708009, "time_sec": 41.73535418510437 }, { "epoch": 119, "train_loss": 4.852905385437012, "train_acc": 0.00894, "test_loss": 13.59550298614502, "test_acc": 0.01, "lyapunov": 1.4737293317799678, "grad_norm": 0.08826212131432655, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010173504098790182, "time_sec": 41.72545409202576 }, { "epoch": 120, "train_loss": 4.852262009429932, "train_acc": 0.0092, "test_loss": 13.53664966430664, "test_acc": 0.01, "lyapunov": 1.471702798248252, "grad_norm": 0.08816229564695008, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252629e-05, "time_sec": 41.747995376586914 }, { "epoch": 121, "train_loss": 4.852286165924072, "train_acc": 0.00938, "test_loss": 13.543427288818359, "test_acc": 0.01, "lyapunov": 1.4718451771284917, "grad_norm": 0.0882556097544163, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.942539543314794e-05, "time_sec": 41.71251606941223 }, { "epoch": 122, "train_loss": 4.852815079193115, "train_acc": 0.00866, "test_loss": 13.50841277770996, "test_acc": 0.01, "lyapunov": 1.4734657941876774, "grad_norm": 0.08834171363916951, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.353937964495024e-05, "time_sec": 41.828593492507935 }, { "epoch": 123, "train_loss": 4.8519872172546386, "train_acc": 0.0097, "test_loss": 13.492674378967285, "test_acc": 0.01, "lyapunov": 1.470838068696239, "grad_norm": 0.08874014439548912, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.783603724899243e-05, "time_sec": 41.981213331222534 }, { "epoch": 124, "train_loss": 4.853034484252929, "train_acc": 0.009, "test_loss": 13.126736920166016, "test_acc": 0.01, "lyapunov": 1.4740290989351394, "grad_norm": 0.08813885370977613, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.231786991974666e-05, "time_sec": 41.71132040023804 }, { "epoch": 125, "train_loss": 4.85233381652832, "train_acc": 0.00952, "test_loss": 13.397762631225586, "test_acc": 0.01, "lyapunov": 1.471941991230411, "grad_norm": 0.08812641091996891, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.698729810778072e-05, "time_sec": 41.72543954849243 }, { "epoch": 126, "train_loss": 4.8525572804260255, "train_acc": 0.0096, "test_loss": 13.308763629150391, "test_acc": 0.01, "lyapunov": 1.472656028349991, "grad_norm": 0.08840738704987161, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806817e-05, "time_sec": 41.72384238243103 }, { "epoch": 127, "train_loss": 4.855584846191406, "train_acc": 0.00946, "test_loss": 13.759437710571289, "test_acc": 0.01, "lyapunov": 1.4782639266279958, "grad_norm": 0.08826506573029154, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.6898210384392595e-05, "time_sec": 41.73837852478027 }, { "epoch": 128, "train_loss": 4.85253405090332, "train_acc": 0.00946, "test_loss": 13.737331958007813, "test_acc": 0.01, "lyapunov": 1.4725991725311864, "grad_norm": 0.08806307055084844, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.214411988029363e-05, "time_sec": 41.761263847351074 }, { "epoch": 129, "train_loss": 4.852324590759277, "train_acc": 0.01, "test_loss": 13.721236633300782, "test_acc": 0.01, "lyapunov": 1.4719348380632717, "grad_norm": 0.08813587403770864, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.7586473766990294e-05, "time_sec": 41.74943208694458 }, { "epoch": 130, "train_loss": 4.85221561340332, "train_acc": 0.00954, "test_loss": 13.78914153137207, "test_acc": 0.01, "lyapunov": 1.4716954301385319, "grad_norm": 0.08851547081560074, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.32272711786996e-05, "time_sec": 41.76015615463257 }, { "epoch": 131, "train_loss": 4.852464799957275, "train_acc": 0.00878, "test_loss": 13.605609268188477, "test_acc": 0.01, "lyapunov": 1.4723939121226826, "grad_norm": 0.08823360335901036, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.906842420574966e-05, "time_sec": 41.77037334442139 }, { "epoch": 132, "train_loss": 4.852380610198975, "train_acc": 0.00896, "test_loss": 13.703162010192871, "test_acc": 0.01, "lyapunov": 1.4721423701557053, "grad_norm": 0.08806535417914078, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.5111757055874305e-05, "time_sec": 41.78282904624939 }, { "epoch": 133, "train_loss": 4.853441643676758, "train_acc": 0.00924, "test_loss": 13.780622036743164, "test_acc": 0.01, "lyapunov": 1.4737608521185872, "grad_norm": 0.08786943886020787, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.1359005254054254e-05, "time_sec": 41.94830918312073 }, { "epoch": 134, "train_loss": 4.8520362255859375, "train_acc": 0.00954, "test_loss": 13.83701887512207, "test_acc": 0.01, "lyapunov": 1.471004798284272, "grad_norm": 0.08837937530648805, "grad_max_sv": 0.000659800786525011, "grad_min_sv": 0.0, "grad_condition": 659800786.5250111, "lr": 2.7811814881259484e-05, "time_sec": 41.915955781936646 }, { "epoch": 135, "train_loss": 4.852150169067383, "train_acc": 0.00958, "test_loss": 13.836302838134765, "test_acc": 0.01, "lyapunov": 1.471451068473289, "grad_norm": 0.0887060490050228, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.4471741852423218e-05, "time_sec": 41.69927930831909 }, { "epoch": 136, "train_loss": 4.853155226898194, "train_acc": 0.00916, "test_loss": 13.758418685913085, "test_acc": 0.01, "lyapunov": 1.4742048859901136, "grad_norm": 0.09745955508136325, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.1340251233966362e-05, "time_sec": 41.71672034263611 }, { "epoch": 137, "train_loss": 4.85282894165039, "train_acc": 0.00928, "test_loss": 13.801075386047364, "test_acc": 0.01, "lyapunov": 1.4736028842608948, "grad_norm": 0.08838780479254947, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.8418716601170932e-05, "time_sec": 41.86513018608093 }, { "epoch": 138, "train_loss": 4.852049649047852, "train_acc": 0.00982, "test_loss": 13.844301895141601, "test_acc": 0.01, "lyapunov": 1.4711221602871596, "grad_norm": 0.0886793780466303, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568445e-05, "time_sec": 41.807748317718506 }, { "epoch": 139, "train_loss": 4.853534520874024, "train_acc": 0.01, "test_loss": 13.770389680480957, "test_acc": 0.01, "lyapunov": 1.4747250278282653, "grad_norm": 0.08808641740018294, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.3210548563419845e-05, "time_sec": 41.780285596847534 }, { "epoch": 140, "train_loss": 4.851904624481201, "train_acc": 0.0096, "test_loss": 13.713402738952636, "test_acc": 0.01, "lyapunov": 1.4706565852055464, "grad_norm": 0.08806158709361275, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.0926199633097203e-05, "time_sec": 41.71153283119202 }, { "epoch": 141, "train_loss": 4.852294711456299, "train_acc": 0.00974, "test_loss": 13.674919595336915, "test_acc": 0.01, "lyapunov": 1.4719334886507, "grad_norm": 0.08848605705342659, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.856374635655688e-06, "time_sec": 41.75360417366028 }, { "epoch": 142, "train_loss": 4.852051578979492, "train_acc": 0.00986, "test_loss": 13.683543762207032, "test_acc": 0.01, "lyapunov": 1.4711576669722262, "grad_norm": 0.08814132937210956, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.001981464747503e-06, "time_sec": 41.73791003227234 }, { "epoch": 143, "train_loss": 4.852365187683105, "train_acc": 0.00984, "test_loss": 13.635780154418946, "test_acc": 0.01, "lyapunov": 1.4721494221016573, "grad_norm": 0.08862731675513442, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.3638335185058295e-06, "time_sec": 41.75744414329529 }, { "epoch": 144, "train_loss": 4.852421789550781, "train_acc": 0.00964, "test_loss": 13.633413438415527, "test_acc": 0.01, "lyapunov": 1.4723204545047888, "grad_norm": 0.08863761801039138, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761114e-06, "time_sec": 41.74138283729553 }, { "epoch": 145, "train_loss": 4.852283345336914, "train_acc": 0.00988, "test_loss": 13.618844378662109, "test_acc": 0.01, "lyapunov": 1.471912037990892, "grad_norm": 0.08829552590637708, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7390523158633524e-06, "time_sec": 41.73318958282471 }, { "epoch": 146, "train_loss": 4.852081503601074, "train_acc": 0.00942, "test_loss": 13.636005783081055, "test_acc": 0.01, "lyapunov": 1.4712535944741096, "grad_norm": 0.0881891115278494, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.7535703752478133e-06, "time_sec": 41.7281494140625 }, { "epoch": 147, "train_loss": 4.851804008331299, "train_acc": 0.00964, "test_loss": 13.61884249420166, "test_acc": 0.01, "lyapunov": 1.4703791028703266, "grad_norm": 0.08816211822553004, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642196e-07, "time_sec": 41.74032163619995 }, { "epoch": 148, "train_loss": 4.8529896348571775, "train_acc": 0.0097, "test_loss": 13.650962756347656, "test_acc": 0.01, "lyapunov": 1.4741563284793473, "grad_norm": 0.08847924183215054, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.38584950570808e-07, "time_sec": 41.70267343521118 }, { "epoch": 149, "train_loss": 4.851896666412354, "train_acc": 0.01, "test_loss": 13.636007565307617, "test_acc": 0.01, "lyapunov": 1.470671361669555, "grad_norm": 0.08871972262513622, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.096582625772501e-07, "time_sec": 41.72864389419556 }, { "epoch": 150, "train_loss": 4.852557410736084, "train_acc": 0.01, "test_loss": 13.636007955932618, "test_acc": 0.01, "lyapunov": 1.4727459463012187, "grad_norm": 0.08844840269295245, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 41.74263858795166 } ], "8": [ { "epoch": 1, "train_loss": 4.735240103759765, "train_acc": 0.02524, "test_loss": 4.866816416931153, "test_acc": 0.0196, "lyapunov": 2.026013672809162, "grad_norm": 5.2515251679689285, "grad_max_sv": 4.178838831186295, "grad_min_sv": 9.041712029367321e-08, "grad_condition": 179649161.33195654, "lr": 0.0009998903417374227, "time_sec": 87.18950843811035 }, { "epoch": 2, "train_loss": 4.5068304737854, "train_acc": 0.03554, "test_loss": 5.026126983642578, "test_acc": 0.0173, "lyapunov": 1.7496998066182636, "grad_norm": 3.127286126154696, "grad_max_sv": 2.359567102789879, "grad_min_sv": 5.685370215550989e-08, "grad_condition": 519592009.8775345, "lr": 0.0009995614150494292, "time_sec": 87.2297294139862 }, { "epoch": 3, "train_loss": 4.461366838684082, "train_acc": 0.03612, "test_loss": 4.588225796508789, "test_acc": 0.0214, "lyapunov": 1.5944948662882266, "grad_norm": 1.7421788335036872, "grad_max_sv": 1.159491127729416, "grad_min_sv": 3.012503119736998e-08, "grad_condition": 46872158.840100154, "lr": 0.0009990133642141358, "time_sec": 87.14756369590759 }, { "epoch": 4, "train_loss": 4.419443615722656, "train_acc": 0.0416, "test_loss": 5.286386401367188, "test_acc": 0.01, "lyapunov": 1.5645387861734765, "grad_norm": 1.1211397301440151, "grad_max_sv": 0.6769661128520965, "grad_min_sv": 1.748986164784583e-08, "grad_condition": 61425339.07877908, "lr": 0.0009982464296247522, "time_sec": 87.12213373184204 }, { "epoch": 5, "train_loss": 4.423492089996338, "train_acc": 0.04338, "test_loss": 6.2819957962036135, "test_acc": 0.01, "lyapunov": 1.5490608950100286, "grad_norm": 0.8706870069158426, "grad_max_sv": 0.5114456944167614, "grad_min_sv": 1.31196238317699e-08, "grad_condition": 53181583.053102724, "lr": 0.0009972609476841367, "time_sec": 87.13790082931519 }, { "epoch": 6, "train_loss": 4.523505429840088, "train_acc": 0.03268, "test_loss": 5.438013370513916, "test_acc": 0.0125, "lyapunov": 1.5594564731163747, "grad_norm": 0.857804226532666, "grad_max_sv": 0.49648181200027464, "grad_min_sv": 1.1631784305188297e-08, "grad_condition": 65912570.425740495, "lr": 0.000996057350657239, "time_sec": 87.11513113975525 }, { "epoch": 7, "train_loss": 4.491675056762696, "train_acc": 0.03868, "test_loss": 4.85823662109375, "test_acc": 0.01, "lyapunov": 1.5649392903613313, "grad_norm": 0.922475970431733, "grad_max_sv": 0.5282619304955005, "grad_min_sv": 1.3700025544571837e-08, "grad_condition": 115221136.73324652, "lr": 0.000994636166481494, "time_sec": 87.11052560806274 }, { "epoch": 8, "train_loss": 4.458245279388428, "train_acc": 0.04286, "test_loss": 5.0693019569396975, "test_acc": 0.01, "lyapunov": 1.564261608416467, "grad_norm": 0.8247796151577914, "grad_max_sv": 0.4666087761521339, "grad_min_sv": 1.2590186138083937e-08, "grad_condition": 80951881.02073678, "lr": 0.0009929980185352525, "time_sec": 87.10055899620056 }, { "epoch": 9, "train_loss": 4.479283211364746, "train_acc": 0.04164, "test_loss": 4.6463909927368165, "test_acc": 0.01, "lyapunov": 1.5368007479421317, "grad_norm": 0.7899216729609227, "grad_max_sv": 0.41627604588866235, "grad_min_sv": 1.04147358570561e-08, "grad_condition": 47679788.12689672, "lr": 0.0009911436253643444, "time_sec": 87.12877798080444 }, { "epoch": 10, "train_loss": 4.452324397583008, "train_acc": 0.0458, "test_loss": 4.653008950805664, "test_acc": 0.01, "lyapunov": 1.5427158729499564, "grad_norm": 0.693102659392051, "grad_max_sv": 0.39028600230813026, "grad_min_sv": 9.917548506044316e-09, "grad_condition": 50871255.950711094, "lr": 0.0009890738003669028, "time_sec": 87.09939312934875 }, { "epoch": 11, "train_loss": 4.498550581054688, "train_acc": 0.04238, "test_loss": 4.798313717651367, "test_acc": 0.01, "lyapunov": 1.562767594061849, "grad_norm": 0.7157991404315234, "grad_max_sv": 0.3735340617597103, "grad_min_sv": 9.18097689817099e-09, "grad_condition": 76046170.48271176, "lr": 0.00098678945143658, "time_sec": 87.10426044464111 }, { "epoch": 12, "train_loss": 4.4704539869689945, "train_acc": 0.04582, "test_loss": 4.7863667205810545, "test_acc": 0.01, "lyapunov": 1.5232323402029169, "grad_norm": 0.6028364454937816, "grad_max_sv": 0.332496403157711, "grad_min_sv": 8.755317024156106e-09, "grad_condition": 43134971.96461357, "lr": 0.0009842915805643154, "time_sec": 87.09469079971313 }, { "epoch": 13, "train_loss": 4.537702497558594, "train_acc": 0.03896, "test_loss": 4.654966796875, "test_acc": 0.01, "lyapunov": 1.54529083567812, "grad_norm": 0.6292726486160667, "grad_max_sv": 0.3057276763021946, "grad_min_sv": 6.5090396415661e-09, "grad_condition": 700356710.9321487, "lr": 0.000981581283398829, "time_sec": 87.09531950950623 }, { "epoch": 14, "train_loss": 4.620839001159668, "train_acc": 0.0303, "test_loss": 4.868439013671875, "test_acc": 0.01, "lyapunov": 1.5458131620036366, "grad_norm": 0.5338695301373511, "grad_max_sv": 0.29795307405292987, "grad_min_sv": 5.120543077052897e-09, "grad_condition": 339314023.7111832, "lr": 0.0009786597487660333, "time_sec": 87.12465906143188 }, { "epoch": 15, "train_loss": 4.513916426849366, "train_acc": 0.04438, "test_loss": 4.835803776550293, "test_acc": 0.01, "lyapunov": 1.5507933197119046, "grad_norm": 0.6007957930506477, "grad_max_sv": 0.3038324311375618, "grad_min_sv": 6.934315210233022e-09, "grad_condition": 198097346.8229193, "lr": 0.0009755282581475766, "time_sec": 87.08587527275085 }, { "epoch": 16, "train_loss": 4.492137908630371, "train_acc": 0.04818, "test_loss": 4.887235678100586, "test_acc": 0.01, "lyapunov": 1.5494948896910528, "grad_norm": 0.5976636149826597, "grad_max_sv": 0.30106121934950353, "grad_min_sv": 7.290029437057033e-09, "grad_condition": 63284303.580263734, "lr": 0.0009721881851187403, "time_sec": 87.09524250030518 }, { "epoch": 17, "train_loss": 4.575829989471435, "train_acc": 0.03854, "test_loss": 4.948842854309082, "test_acc": 0.01, "lyapunov": 1.53777074539448, "grad_norm": 0.5014123935951768, "grad_max_sv": 0.29032444581389427, "grad_min_sv": 5.414256840086118e-09, "grad_condition": 69838858.70858149, "lr": 0.0009686409947459456, "time_sec": 87.14909029006958 }, { "epoch": 18, "train_loss": 4.597054883728028, "train_acc": 0.03624, "test_loss": 4.844102088165283, "test_acc": 0.01, "lyapunov": 1.5350244057452893, "grad_norm": 0.5123739316899657, "grad_max_sv": 0.26398728154599665, "grad_min_sv": 5.243455172138089e-09, "grad_condition": 119920046.5630234, "lr": 0.0009648882429441254, "time_sec": 87.09620761871338 }, { "epoch": 19, "train_loss": 4.620368363647461, "train_acc": 0.03384, "test_loss": 4.720510952758789, "test_acc": 0.01, "lyapunov": 1.5356951705025286, "grad_norm": 0.47243607957213, "grad_max_sv": 0.24507929012179375, "grad_min_sv": 5.088020715859898e-09, "grad_condition": 57785330.0936975, "lr": 0.00096093157579425, "time_sec": 87.11660838127136 }, { "epoch": 20, "train_loss": 4.613923555145264, "train_acc": 0.03756, "test_loss": 5.093030418395996, "test_acc": 0.01, "lyapunov": 1.5330088199556942, "grad_norm": 0.5270298408202432, "grad_max_sv": 0.2416334819048643, "grad_min_sv": 4.882703122420853e-09, "grad_condition": 311593743.69228464, "lr": 0.0009567727288213001, "time_sec": 87.09937357902527 }, { "epoch": 21, "train_loss": 4.636924856567383, "train_acc": 0.036, "test_loss": 5.04784955368042, "test_acc": 0.01, "lyapunov": 1.5540363645309683, "grad_norm": 0.526606906737193, "grad_max_sv": 0.24690264500677586, "grad_min_sv": 5.1651495895903985e-09, "grad_condition": 691559676.1292815, "lr": 0.0009524135262330095, "time_sec": 87.11412358283997 }, { "epoch": 22, "train_loss": 4.679128698577881, "train_acc": 0.02896, "test_loss": 4.895172619628906, "test_acc": 0.01, "lyapunov": 1.547908184778355, "grad_norm": 0.44727272149588615, "grad_max_sv": 0.24925720058381556, "grad_min_sv": 4.642139438126858e-09, "grad_condition": 66478210.43898354, "lr": 0.0009478558801197061, "time_sec": 87.11094355583191 }, { "epoch": 23, "train_loss": 4.662371476287841, "train_acc": 0.03188, "test_loss": 4.795903799438476, "test_acc": 0.01, "lyapunov": 1.5548140889848285, "grad_norm": 0.5260267923584394, "grad_max_sv": 0.23556945472955704, "grad_min_sv": 4.337634041588854e-09, "grad_condition": 1025805594.4440111, "lr": 0.000943101789615607, "time_sec": 87.11297392845154 }, { "epoch": 24, "train_loss": 4.6645262229919435, "train_acc": 0.03214, "test_loss": 5.057237059783936, "test_acc": 0.01, "lyapunov": 1.5496064592200471, "grad_norm": 0.6505246940270789, "grad_max_sv": 0.2576914459466934, "grad_min_sv": 4.8245041350813974e-09, "grad_condition": 94704831.81255548, "lr": 0.0009381533400219313, "time_sec": 87.10920405387878 }, { "epoch": 25, "train_loss": 4.654648971710205, "train_acc": 0.0322, "test_loss": 5.318339912414551, "test_acc": 0.01, "lyapunov": 1.565699156592874, "grad_norm": 0.4161938321621143, "grad_max_sv": 0.2134155698120594, "grad_min_sv": 3.946434762314155e-09, "grad_condition": 254671281.05499464, "lr": 0.0009330127018922189, "time_sec": 87.13201785087585 }, { "epoch": 26, "train_loss": 4.791520259552002, "train_acc": 0.02372, "test_loss": 4.959452788543701, "test_acc": 0.01, "lyapunov": 1.600033207012869, "grad_norm": 0.9779964796296537, "grad_max_sv": 0.2255085190758109, "grad_min_sv": 3.1466205011160244e-09, "grad_condition": 11039609220.08119, "lr": 0.000927682130080253, "time_sec": 87.18698191642761 }, { "epoch": 27, "train_loss": 4.69488529296875, "train_acc": 0.03142, "test_loss": 5.3654563461303715, "test_acc": 0.01, "lyapunov": 1.5987402142771066, "grad_norm": 0.6442328720311332, "grad_max_sv": 0.23703443501144647, "grad_min_sv": 3.5609615074683707e-09, "grad_condition": 1745246073.6363997, "lr": 0.0009221639627510072, "time_sec": 87.134925365448 }, { "epoch": 28, "train_loss": 4.606881724700928, "train_acc": 0.03926, "test_loss": 4.73573546295166, "test_acc": 0.0103, "lyapunov": 1.5937491731570506, "grad_norm": 0.4194063933325514, "grad_max_sv": 0.21865120753645897, "grad_min_sv": 3.87901320235591e-09, "grad_condition": 523863784.21676093, "lr": 0.0009164606203550494, "time_sec": 87.14774799346924 }, { "epoch": 29, "train_loss": 4.617493250274658, "train_acc": 0.03728, "test_loss": 4.662520077514649, "test_acc": 0.01, "lyapunov": 1.596246981559812, "grad_norm": 0.3789306278435458, "grad_max_sv": 0.19524494409561158, "grad_min_sv": 3.4768166591418737e-09, "grad_condition": 236541357.234686, "lr": 0.0009105746045668516, "time_sec": 87.11421346664429 }, { "epoch": 30, "train_loss": 4.631677906799316, "train_acc": 0.03778, "test_loss": 6.121908515167236, "test_acc": 0.01, "lyapunov": 1.6226924099885593, "grad_norm": 0.44716784199095383, "grad_max_sv": 0.1934027548879385, "grad_min_sv": 3.3855620726374116e-09, "grad_condition": 581199629.6704518, "lr": 0.0009045084971874733, "time_sec": 87.11589574813843 }, { "epoch": 31, "train_loss": 4.7931158798217774, "train_acc": 0.02286, "test_loss": 4.620251409912109, "test_acc": 0.0092, "lyapunov": 1.6308694739475884, "grad_norm": 0.550187770618441, "grad_max_sv": 0.18949946835637094, "grad_min_sv": 1.786556805578803e-09, "grad_condition": 42877123442.64499, "lr": 0.0008982649590120977, "time_sec": 87.1836428642273 }, { "epoch": 32, "train_loss": 4.760539370574951, "train_acc": 0.02752, "test_loss": 4.657791676330566, "test_acc": 0.01, "lyapunov": 1.6191697065787547, "grad_norm": 0.3614365919222485, "grad_max_sv": 0.17497441843152045, "grad_min_sv": 1.779506375100445e-09, "grad_condition": 13836124253.01267, "lr": 0.0008918467286629196, "time_sec": 87.18445110321045 }, { "epoch": 33, "train_loss": 4.739889914245605, "train_acc": 0.029, "test_loss": 4.71790985031128, "test_acc": 0.0111, "lyapunov": 1.6113197523004867, "grad_norm": 0.3353632004468733, "grad_max_sv": 0.1673861812800169, "grad_min_sv": 7.641599533418533e-10, "grad_condition": 13965803361.130926, "lr": 0.0008852566213878943, "time_sec": 87.21766877174377 }, { "epoch": 34, "train_loss": 4.753917649078369, "train_acc": 0.02908, "test_loss": 6.4435778312683105, "test_acc": 0.01, "lyapunov": 1.6236087751510504, "grad_norm": 0.32686722214079433, "grad_max_sv": 0.16869123242795467, "grad_min_sv": 5.19174209905656e-10, "grad_condition": 25949866712.408104, "lr": 0.000878497527825878, "time_sec": 87.14275527000427 }, { "epoch": 35, "train_loss": 4.802844509124756, "train_acc": 0.0244, "test_loss": 6.557575407409668, "test_acc": 0.01, "lyapunov": 1.6418090259937375, "grad_norm": 0.4988110566872576, "grad_max_sv": 0.1611970603466034, "grad_min_sv": 7.265029261023372e-10, "grad_condition": 19350605239.471405, "lr": 0.000871572412738697, "time_sec": 87.16936993598938 }, { "epoch": 36, "train_loss": 4.776907616271973, "train_acc": 0.02782, "test_loss": 4.822451950073242, "test_acc": 0.01, "lyapunov": 1.649027470737467, "grad_norm": 0.342256043849884, "grad_max_sv": 0.15263066124171018, "grad_min_sv": 1.2339334798351036e-10, "grad_condition": 9338850661.261333, "lr": 0.0008644843137107055, "time_sec": 87.186208486557 }, { "epoch": 37, "train_loss": 4.772866481628418, "train_acc": 0.0269, "test_loss": 6.221601684570312, "test_acc": 0.01, "lyapunov": 1.6788606286963539, "grad_norm": 0.6629649981625318, "grad_max_sv": 0.17593900030478835, "grad_min_sv": 2.304191549799707e-09, "grad_condition": 9259298449.8995, "lr": 0.0008572363398164014, "time_sec": 87.18624091148376 }, { "epoch": 38, "train_loss": 4.77164099029541, "train_acc": 0.02672, "test_loss": 4.766420809936523, "test_acc": 0.01, "lyapunov": 1.7235305708692508, "grad_norm": 0.3937581266699412, "grad_max_sv": 0.17076923064887523, "grad_min_sv": 4.0183006136103404e-10, "grad_condition": 16063615551.021002, "lr": 0.0008498316702566826, "time_sec": 87.20626258850098 }, { "epoch": 39, "train_loss": 4.807452021179199, "train_acc": 0.02832, "test_loss": 4.899550021362304, "test_acc": 0.01, "lyapunov": 1.8249543252808358, "grad_norm": 0.5715574182036978, "grad_max_sv": 0.16177968972187956, "grad_min_sv": 3.793029192220455e-10, "grad_condition": 8307565763.804538, "lr": 0.0008422735529643442, "time_sec": 87.19903802871704 }, { "epoch": 40, "train_loss": 4.760174724121094, "train_acc": 0.0279, "test_loss": 5.857627616119385, "test_acc": 0.01, "lyapunov": 1.7056615718490327, "grad_norm": 0.4256172750988047, "grad_max_sv": 0.16561466939747332, "grad_min_sv": 2.058724911119941e-09, "grad_condition": 512180966.31238127, "lr": 0.0008345653031794289, "time_sec": 87.21863722801208 }, { "epoch": 41, "train_loss": 4.69559801071167, "train_acc": 0.02966, "test_loss": 5.604364262390137, "test_acc": 0.01, "lyapunov": 1.5935010431367722, "grad_norm": 0.35011105073884097, "grad_max_sv": 0.18168312907218934, "grad_min_sv": 2.4247929442111626e-09, "grad_condition": 93356754.736842, "lr": 0.0008267103019950526, "time_sec": 87.22393608093262 }, { "epoch": 42, "train_loss": 4.709802615814209, "train_acc": 0.02616, "test_loss": 4.870189538574219, "test_acc": 0.01, "lyapunov": 1.615870985228692, "grad_norm": 0.31755349221985774, "grad_max_sv": 0.17116790413856506, "grad_min_sv": 2.5351133262074833e-09, "grad_condition": 220960563.35692176, "lr": 0.0008187119948743447, "time_sec": 87.20640540122986 }, { "epoch": 43, "train_loss": 4.793043034057617, "train_acc": 0.02262, "test_loss": 5.881324156951904, "test_acc": 0.01, "lyapunov": 1.7521904277069795, "grad_norm": 0.5590339405433944, "grad_max_sv": 0.14497370515600777, "grad_min_sv": 3.9279086975103414e-10, "grad_condition": 19019670561.939625, "lr": 0.000810573890139155, "time_sec": 87.31258749961853 }, { "epoch": 44, "train_loss": 4.844116692810059, "train_acc": 0.02276, "test_loss": 5.395824824523926, "test_acc": 0.01, "lyapunov": 1.8710771832624664, "grad_norm": 0.5293965973008694, "grad_max_sv": 0.1555709108710289, "grad_min_sv": 4.2711866910149697e-10, "grad_condition": 14548258948.991043, "lr": 0.0008022995574311873, "time_sec": 87.18556952476501 }, { "epoch": 45, "train_loss": 4.8768616571044925, "train_acc": 0.02038, "test_loss": 4.61512779083252, "test_acc": 0.01, "lyapunov": 1.8506627338926505, "grad_norm": 0.6998099846191761, "grad_max_sv": 0.13765994729474187, "grad_min_sv": 5.812380418716187e-11, "grad_condition": 29846677946.806488, "lr": 0.0007938926261462363, "time_sec": 87.2240195274353 }, { "epoch": 46, "train_loss": 4.969230243377686, "train_acc": 0.01168, "test_loss": 7.386215936279297, "test_acc": 0.01, "lyapunov": 1.8457061924288034, "grad_norm": 1.2406105764459343, "grad_max_sv": 0.11906649246811866, "grad_min_sv": 3.98718814026065e-11, "grad_condition": 92245006784.32524, "lr": 0.0007853567838422158, "time_sec": 87.17690944671631 }, { "epoch": 47, "train_loss": 4.875964500274658, "train_acc": 0.01072, "test_loss": 6.527316121673584, "test_acc": 0.01, "lyapunov": 1.5310816859345302, "grad_norm": 0.16182231228887384, "grad_max_sv": 0.08984448052942753, "grad_min_sv": 1.0441322375968024e-16, "grad_condition": 89835727617.94872, "lr": 0.0007766957746216719, "time_sec": 87.1852126121521 }, { "epoch": 48, "train_loss": 4.875588766021728, "train_acc": 0.00916, "test_loss": 6.651647409820557, "test_acc": 0.01, "lyapunov": 1.5314356905724995, "grad_norm": 0.17879068685955746, "grad_max_sv": 0.09055437743663788, "grad_min_sv": 2.807460538981671e-16, "grad_condition": 90529399768.58862, "lr": 0.0007679133974894982, "time_sec": 87.19542217254639 }, { "epoch": 49, "train_loss": 4.874160293884278, "train_acc": 0.00928, "test_loss": 6.9806133621215825, "test_acc": 0.01, "lyapunov": 1.5310221773279293, "grad_norm": 0.15914063982748972, "grad_max_sv": 0.0841954169794917, "grad_min_sv": 1.1028138256059021e-16, "grad_condition": 84186278073.27275, "lr": 0.000759013504686565, "time_sec": 87.18294835090637 }, { "epoch": 50, "train_loss": 4.874967584228516, "train_acc": 0.0088, "test_loss": 7.2512130996704105, "test_acc": 0.01, "lyapunov": 1.531926109052985, "grad_norm": 0.13359997166294424, "grad_max_sv": 0.07885234858840703, "grad_min_sv": 1.5449564137240798e-17, "grad_condition": 78851261996.51497, "lr": 0.0007499999999999998, "time_sec": 87.1744954586029 }, { "epoch": 51, "train_loss": 4.873049064331055, "train_acc": 0.00894, "test_loss": 7.2680836700439455, "test_acc": 0.01, "lyapunov": 1.5300328816904132, "grad_norm": 0.13566663059488987, "grad_max_sv": 0.06801612647250295, "grad_min_sv": 3.3721854663294077e-28, "grad_condition": 68016126472.50293, "lr": 0.0007408768370508575, "time_sec": 87.2090744972229 }, { "epoch": 52, "train_loss": 4.8752045971679685, "train_acc": 0.00998, "test_loss": 7.319013902282715, "test_acc": 0.01, "lyapunov": 1.5358237284223746, "grad_norm": 0.15295505609252377, "grad_max_sv": 0.07399358823895455, "grad_min_sv": 4.036005675649565e-34, "grad_condition": 73993588238.95454, "lr": 0.0007316480175599307, "time_sec": 87.17916941642761 }, { "epoch": 53, "train_loss": 4.875089646759033, "train_acc": 0.00932, "test_loss": 6.708341079711914, "test_acc": 0.01, "lyapunov": 1.535219712025674, "grad_norm": 0.15337946692641713, "grad_max_sv": 0.0786401204764843, "grad_min_sv": 9.418872962396182e-34, "grad_condition": 78640120476.4843, "lr": 0.0007223175895924635, "time_sec": 87.19920134544373 }, { "epoch": 54, "train_loss": 4.8763134245300295, "train_acc": 0.00954, "test_loss": 7.893965859985352, "test_acc": 0.01, "lyapunov": 1.5382219912755826, "grad_norm": 0.14430315662174414, "grad_max_sv": 0.0842284008860588, "grad_min_sv": 1.4016176262153585e-17, "grad_condition": 84227307606.50656, "lr": 0.0007128896457825361, "time_sec": 87.16732549667358 }, { "epoch": 55, "train_loss": 4.880924655761719, "train_acc": 0.00986, "test_loss": 8.769433529663086, "test_acc": 0.01, "lyapunov": 1.5441064075435824, "grad_norm": 0.16740838552751033, "grad_max_sv": 0.08879097644239664, "grad_min_sv": 3.0302474954849e-15, "grad_condition": 88489187160.01863, "lr": 0.0007033683215378998, "time_sec": 87.23270034790039 }, { "epoch": 56, "train_loss": 4.880691115722656, "train_acc": 0.00984, "test_loss": 8.956744931030274, "test_acc": 0.01, "lyapunov": 1.5440428296623327, "grad_norm": 0.169681128943872, "grad_max_sv": 0.08683812469244004, "grad_min_sv": 2.6780771295629216e-16, "grad_condition": 86810744990.1141, "lr": 0.0006937577932260512, "time_sec": 87.5180823802948 }, { "epoch": 57, "train_loss": 4.875461320648193, "train_acc": 0.00882, "test_loss": 7.914718838500977, "test_acc": 0.01, "lyapunov": 1.5361771690266213, "grad_norm": 0.13744745585086549, "grad_max_sv": 0.08106257226318121, "grad_min_sv": 4.602306454836924e-17, "grad_condition": 81058882088.7789, "lr": 0.0006840622763423388, "time_sec": 87.23774647712708 }, { "epoch": 58, "train_loss": 4.876462248229981, "train_acc": 0.0086, "test_loss": 7.521480532836914, "test_acc": 0.01, "lyapunov": 1.5380861676867357, "grad_norm": 0.1308094426729998, "grad_max_sv": 0.07691145669668913, "grad_min_sv": 5.2512441923478546e-21, "grad_condition": 76911456255.58595, "lr": 0.0006742860236609073, "time_sec": 87.19443416595459 }, { "epoch": 59, "train_loss": 4.876125813751221, "train_acc": 0.00958, "test_loss": 9.108944590759277, "test_acc": 0.01, "lyapunov": 1.5374773286492622, "grad_norm": 0.13065965995697965, "grad_max_sv": 0.07693316899240017, "grad_min_sv": 4.628041294277668e-28, "grad_condition": 76933168992.40013, "lr": 0.0006644333233692913, "time_sec": 87.11430335044861 }, { "epoch": 60, "train_loss": 4.876531585845948, "train_acc": 0.01002, "test_loss": 8.708165438842773, "test_acc": 0.01, "lyapunov": 1.540081706193402, "grad_norm": 0.12514364110494514, "grad_max_sv": 0.04278304530307651, "grad_min_sv": 5.111839701214236e-27, "grad_condition": 42783045303.07613, "lr": 0.0006545084971874734, "time_sec": 87.08950901031494 }, { "epoch": 61, "train_loss": 4.876955277404785, "train_acc": 0.00986, "test_loss": 9.633759455871582, "test_acc": 0.01, "lyapunov": 1.5432406968777748, "grad_norm": 0.13030696119131907, "grad_max_sv": 0.01869940897449851, "grad_min_sv": 0.0, "grad_condition": 18699408974.498512, "lr": 0.0006445158984722354, "time_sec": 87.06369233131409 }, { "epoch": 62, "train_loss": 4.880256801300049, "train_acc": 0.00914, "test_loss": 8.106962710571288, "test_acc": 0.01, "lyapunov": 1.5493804704197838, "grad_norm": 0.13707953455281482, "grad_max_sv": 0.05703742457553744, "grad_min_sv": 2.412788074144182e-18, "grad_condition": 57037235841.35691, "lr": 0.0006344599103076324, "time_sec": 87.23956346511841 }, { "epoch": 63, "train_loss": 4.877262191009521, "train_acc": 0.00972, "test_loss": 9.24615108947754, "test_acc": 0.01, "lyapunov": 1.5415991502039879, "grad_norm": 0.13665560919633327, "grad_max_sv": 0.0726124294102192, "grad_min_sv": 2.0682456318226844e-23, "grad_condition": 72612429408.54066, "lr": 0.0006243449435824269, "time_sec": 87.23054909706116 }, { "epoch": 64, "train_loss": 4.87730983215332, "train_acc": 0.00936, "test_loss": 10.058143447875976, "test_acc": 0.01, "lyapunov": 1.5422342823594428, "grad_norm": 0.12004208587403144, "grad_max_sv": 0.06160930292680859, "grad_min_sv": 0.0, "grad_condition": 61609302926.80859, "lr": 0.0006141754350553275, "time_sec": 87.30030584335327 }, { "epoch": 65, "train_loss": 4.878948260040283, "train_acc": 0.0093, "test_loss": 9.260436712646484, "test_acc": 0.01, "lyapunov": 1.5483233312816571, "grad_norm": 0.12423135486220072, "grad_max_sv": 0.0546061669010669, "grad_min_sv": 0.0, "grad_condition": 54606166901.066895, "lr": 0.0006039558454088793, "time_sec": 87.31754422187805 }, { "epoch": 66, "train_loss": 4.881117270965576, "train_acc": 0.00976, "test_loss": 7.955686111450195, "test_acc": 0.01, "lyapunov": 1.5531517626989224, "grad_norm": 0.1466609355894601, "grad_max_sv": 0.05231738574802876, "grad_min_sv": 0.0, "grad_condition": 52317385748.02876, "lr": 0.000593690657292862, "time_sec": 87.25684475898743 }, { "epoch": 67, "train_loss": 4.87848960723877, "train_acc": 0.0093, "test_loss": 8.291721563720703, "test_acc": 0.01, "lyapunov": 1.5488468536635493, "grad_norm": 0.13358884588524558, "grad_max_sv": 0.046516909170895814, "grad_min_sv": 0.0, "grad_condition": 46516909170.89581, "lr": 0.0005833843733580507, "time_sec": 87.23024368286133 }, { "epoch": 68, "train_loss": 4.876251863098145, "train_acc": 0.00948, "test_loss": 8.313035414123535, "test_acc": 0.01, "lyapunov": 1.5433335642680488, "grad_norm": 0.10782264609925914, "grad_max_sv": 0.04402522062882781, "grad_min_sv": 0.0, "grad_condition": 44025220628.827805, "lr": 0.0005730415142812054, "time_sec": 87.16200470924377 }, { "epoch": 69, "train_loss": 4.877121996459961, "train_acc": 0.00992, "test_loss": 6.634935369110107, "test_acc": 0.01, "lyapunov": 1.5465551251950471, "grad_norm": 0.10524482896626382, "grad_max_sv": 0.03552310774102807, "grad_min_sv": 0.0, "grad_condition": 35523107741.02806, "lr": 0.0005626666167821517, "time_sec": 87.16768336296082 }, { "epoch": 70, "train_loss": 4.877148870697021, "train_acc": 0.00924, "test_loss": 5.170057612609863, "test_acc": 0.01, "lyapunov": 1.544044288223052, "grad_norm": 0.12272040694034365, "grad_max_sv": 0.042177446838468316, "grad_min_sv": 0.0, "grad_condition": 42177446838.46831, "lr": 0.0005522642316338265, "time_sec": 87.17852282524109 }, { "epoch": 71, "train_loss": 4.878114613800049, "train_acc": 0.00918, "test_loss": 5.881608570861816, "test_acc": 0.01, "lyapunov": 1.5485444328059321, "grad_norm": 0.1267744759308649, "grad_max_sv": 0.03348520016297698, "grad_min_sv": 0.0, "grad_condition": 33485200162.97698, "lr": 0.0005418389216661573, "time_sec": 87.12145924568176 }, { "epoch": 72, "train_loss": 4.877243146057129, "train_acc": 0.00954, "test_loss": 4.831268686676025, "test_acc": 0.01, "lyapunov": 1.5455416965362665, "grad_norm": 0.11162604722177562, "grad_max_sv": 0.04829189190641046, "grad_min_sv": 0.0, "grad_condition": 48291891906.41045, "lr": 0.0005313952597646563, "time_sec": 87.20591306686401 }, { "epoch": 73, "train_loss": 4.877523553466797, "train_acc": 0.00916, "test_loss": 5.21819946975708, "test_acc": 0.01, "lyapunov": 1.5469345262898204, "grad_norm": 0.1695274830056392, "grad_max_sv": 0.03528429148718715, "grad_min_sv": 0.0, "grad_condition": 35284291487.18715, "lr": 0.0005209378268645994, "time_sec": 87.15492391586304 }, { "epoch": 74, "train_loss": 4.878687818603516, "train_acc": 0.00902, "test_loss": 7.045982824707031, "test_acc": 0.01, "lyapunov": 1.548920457320445, "grad_norm": 0.11876165619339213, "grad_max_sv": 0.0398634166456759, "grad_min_sv": 0.0, "grad_condition": 39863416645.675896, "lr": 0.0005104712099416781, "time_sec": 87.20987892150879 }, { "epoch": 75, "train_loss": 4.8802404374694826, "train_acc": 0.00952, "test_loss": 5.816082705688476, "test_acc": 0.01, "lyapunov": 1.5510207057913856, "grad_norm": 0.11814260313160607, "grad_max_sv": 0.04241896355524659, "grad_min_sv": 0.0, "grad_condition": 42418963555.24659, "lr": 0.0004999999999999996, "time_sec": 87.17034125328064 }, { "epoch": 76, "train_loss": 4.877049774017334, "train_acc": 0.01008, "test_loss": 5.791509801483154, "test_acc": 0.01, "lyapunov": 1.545583454544282, "grad_norm": 0.10644494843061181, "grad_max_sv": 0.044637566059827806, "grad_min_sv": 0.0, "grad_condition": 44637566059.827805, "lr": 0.0004895287900583212, "time_sec": 87.17367744445801 }, { "epoch": 77, "train_loss": 4.876323641052246, "train_acc": 0.00964, "test_loss": 5.184193676757812, "test_acc": 0.01, "lyapunov": 1.5437548282506215, "grad_norm": 0.10450293107653293, "grad_max_sv": 0.04073738274164498, "grad_min_sv": 0.0, "grad_condition": 40737382741.64498, "lr": 0.0004790621731353997, "time_sec": 87.17853283882141 }, { "epoch": 78, "train_loss": 4.8809456416320804, "train_acc": 0.00946, "test_loss": 4.926686591339111, "test_acc": 0.01, "lyapunov": 1.5541882484465304, "grad_norm": 0.12051319198728945, "grad_max_sv": 0.033642015885561705, "grad_min_sv": 0.0, "grad_condition": 33642015885.561707, "lr": 0.000468604740235343, "time_sec": 87.15360975265503 }, { "epoch": 79, "train_loss": 4.878056556091309, "train_acc": 0.00886, "test_loss": 4.698637203979493, "test_acc": 0.01, "lyapunov": 1.5484835391154375, "grad_norm": 0.11143972892340351, "grad_max_sv": 0.03221007520332932, "grad_min_sv": 0.0, "grad_condition": 32210075203.329323, "lr": 0.00045816107833384175, "time_sec": 87.12274217605591 }, { "epoch": 80, "train_loss": 4.877688450622559, "train_acc": 0.00998, "test_loss": 4.708519946289062, "test_acc": 0.01, "lyapunov": 1.5479903696747996, "grad_norm": 0.10853834057327462, "grad_max_sv": 0.03808168638497591, "grad_min_sv": 0.0, "grad_condition": 38081686384.97591, "lr": 0.0004477357683661729, "time_sec": 87.16511940956116 }, { "epoch": 81, "train_loss": 4.877410650787353, "train_acc": 0.00924, "test_loss": 5.326217936706543, "test_acc": 0.01, "lyapunov": 1.5462311384318126, "grad_norm": 0.1078272819076305, "grad_max_sv": 0.0341941992752254, "grad_min_sv": 0.0, "grad_condition": 34194199275.225403, "lr": 0.00043733338321784746, "time_sec": 87.13259315490723 }, { "epoch": 82, "train_loss": 4.878852579498291, "train_acc": 0.00992, "test_loss": 5.124214416503906, "test_acc": 0.01, "lyapunov": 1.551578131783039, "grad_norm": 0.11924540172549285, "grad_max_sv": 0.032149143144488336, "grad_min_sv": 0.0, "grad_condition": 32149143144.488342, "lr": 0.0004269584857187939, "time_sec": 87.15441107749939 }, { "epoch": 83, "train_loss": 4.877541376647949, "train_acc": 0.00962, "test_loss": 5.2295348327636715, "test_acc": 0.01, "lyapunov": 1.5478261575064696, "grad_norm": 0.1053498185299808, "grad_max_sv": 0.026044291676953435, "grad_min_sv": 0.0, "grad_condition": 26044291676.953438, "lr": 0.0004166156266419484, "time_sec": 87.16295027732849 }, { "epoch": 84, "train_loss": 4.877119447631836, "train_acc": 0.00984, "test_loss": 5.116746160888672, "test_acc": 0.01, "lyapunov": 1.5470911304054358, "grad_norm": 0.10156236054846617, "grad_max_sv": 0.028701860643923282, "grad_min_sv": 0.0, "grad_condition": 28701860643.92328, "lr": 0.0004063093427071373, "time_sec": 87.13170576095581 }, { "epoch": 85, "train_loss": 4.878303242034912, "train_acc": 0.01008, "test_loss": 4.748899824523925, "test_acc": 0.01, "lyapunov": 1.5509575178556125, "grad_norm": 0.1141388454907746, "grad_max_sv": 0.033817021455615756, "grad_min_sv": 0.0, "grad_condition": 33817021455.61576, "lr": 0.0003960441545911199, "time_sec": 87.10089588165283 }, { "epoch": 86, "train_loss": 4.87876032699585, "train_acc": 0.0097, "test_loss": 4.651885162353516, "test_acc": 0.01, "lyapunov": 1.5511503161676705, "grad_norm": 0.09785209813867382, "grad_max_sv": 0.027630697237327695, "grad_min_sv": 0.0, "grad_condition": 27630697237.32769, "lr": 0.0003858245649446718, "time_sec": 87.0941972732544 }, { "epoch": 87, "train_loss": 4.877712865142822, "train_acc": 0.00998, "test_loss": 5.250769630432129, "test_acc": 0.01, "lyapunov": 1.548732325549016, "grad_norm": 0.1974258085478382, "grad_max_sv": 0.02602379145100713, "grad_min_sv": 0.0, "grad_condition": 26023791451.00713, "lr": 0.00037565505641757235, "time_sec": 87.11909556388855 }, { "epoch": 88, "train_loss": 4.877790277404785, "train_acc": 0.00996, "test_loss": 5.091197055053711, "test_acc": 0.01, "lyapunov": 1.5483774038227014, "grad_norm": 0.10333331120218883, "grad_max_sv": 0.03042559456080198, "grad_min_sv": 0.0, "grad_condition": 30425594560.801983, "lr": 0.00036554008969236695, "time_sec": 87.1078622341156 }, { "epoch": 89, "train_loss": 4.877677908020019, "train_acc": 0.0099, "test_loss": 5.058323477935791, "test_acc": 0.01, "lyapunov": 1.5483884863231494, "grad_norm": 0.09905622622525881, "grad_max_sv": 0.03069272106513381, "grad_min_sv": 0.0, "grad_condition": 30692721065.133812, "lr": 0.0003554841015277638, "time_sec": 87.05663800239563 }, { "epoch": 90, "train_loss": 4.881804440917969, "train_acc": 0.0106, "test_loss": 5.362990502166748, "test_acc": 0.01, "lyapunov": 1.553605647648082, "grad_norm": 0.10267946386955158, "grad_max_sv": 0.030273563507944346, "grad_min_sv": 0.0, "grad_condition": 30273563507.944347, "lr": 0.000345491502812526, "time_sec": 87.06899333000183 }, { "epoch": 91, "train_loss": 4.879398302917481, "train_acc": 0.01, "test_loss": 5.126827237701416, "test_acc": 0.01, "lyapunov": 1.5521758828321686, "grad_norm": 0.12087522031268683, "grad_max_sv": 0.03009325391612947, "grad_min_sv": 0.0, "grad_condition": 30093253916.129467, "lr": 0.0003355666766307081, "time_sec": 87.05256390571594 }, { "epoch": 92, "train_loss": 4.880291121673584, "train_acc": 0.00988, "test_loss": 5.26154695892334, "test_acc": 0.01, "lyapunov": 1.5549428770914102, "grad_norm": 0.13231588784429352, "grad_max_sv": 0.03350330209359527, "grad_min_sv": 0.0, "grad_condition": 33503302093.595264, "lr": 0.00032571397633909225, "time_sec": 87.10619926452637 }, { "epoch": 93, "train_loss": 4.8782078823852535, "train_acc": 0.00968, "test_loss": 5.271252917480469, "test_acc": 0.01, "lyapunov": 1.5495562916216643, "grad_norm": 0.12175801600529883, "grad_max_sv": 0.03186503546312451, "grad_min_sv": 0.0, "grad_condition": 31865035463.12451, "lr": 0.00031593772365766094, "time_sec": 87.12923264503479 }, { "epoch": 94, "train_loss": 4.87740290222168, "train_acc": 0.00982, "test_loss": 5.075842178344726, "test_acc": 0.01, "lyapunov": 1.547658307473068, "grad_norm": 0.11436426699794455, "grad_max_sv": 0.02530919690616429, "grad_min_sv": 0.0, "grad_condition": 25309196906.164288, "lr": 0.0003062422067739483, "time_sec": 87.08783769607544 }, { "epoch": 95, "train_loss": 4.877675037384034, "train_acc": 0.00952, "test_loss": 5.33029627532959, "test_acc": 0.01, "lyapunov": 1.5485165667960712, "grad_norm": 0.10074303038813699, "grad_max_sv": 0.03554986314848065, "grad_min_sv": 0.0, "grad_condition": 35549863148.48065, "lr": 0.00029663167846209965, "time_sec": 87.08289909362793 }, { "epoch": 96, "train_loss": 4.877177648620606, "train_acc": 0.01022, "test_loss": 5.369173509216308, "test_acc": 0.01, "lyapunov": 1.5468677212210262, "grad_norm": 0.1013436246118025, "grad_max_sv": 0.03922831532545388, "grad_min_sv": 0.0, "grad_condition": 39228315325.45387, "lr": 0.00028711035421746345, "time_sec": 87.09603428840637 }, { "epoch": 97, "train_loss": 4.881449295959473, "train_acc": 0.00942, "test_loss": 4.928601164245605, "test_acc": 0.01, "lyapunov": 1.5567159265508432, "grad_norm": 0.10170216841041604, "grad_max_sv": 0.021827650628983973, "grad_min_sv": 0.0, "grad_condition": 21827650628.98397, "lr": 0.00027768241040753615, "time_sec": 87.07169818878174 }, { "epoch": 98, "train_loss": 4.8775743408203125, "train_acc": 0.00984, "test_loss": 4.987854670715332, "test_acc": 0.01, "lyapunov": 1.548287238916168, "grad_norm": 0.12626493811946907, "grad_max_sv": 0.03011642089113593, "grad_min_sv": 0.0, "grad_condition": 30116420891.135933, "lr": 0.00026835198244006903, "time_sec": 87.164879322052 }, { "epoch": 99, "train_loss": 4.878459322357178, "train_acc": 0.00968, "test_loss": 4.931130755615234, "test_acc": 0.01, "lyapunov": 1.5513008421339343, "grad_norm": 0.1050431882077805, "grad_max_sv": 0.026918977173045276, "grad_min_sv": 0.0, "grad_condition": 26918977173.045277, "lr": 0.0002591231629491421, "time_sec": 87.06193971633911 }, { "epoch": 100, "train_loss": 4.877405020904541, "train_acc": 0.00972, "test_loss": 4.892998168182373, "test_acc": 0.01, "lyapunov": 1.5485746119638233, "grad_norm": 0.10391039157029125, "grad_max_sv": 0.009399653738364577, "grad_min_sv": 0.0, "grad_condition": 9399653738.364578, "lr": 0.0002499999999999997, "time_sec": 86.99319124221802 }, { "epoch": 101, "train_loss": 4.878013845367431, "train_acc": 0.00972, "test_loss": 4.892334498596192, "test_acc": 0.01, "lyapunov": 1.549886227568702, "grad_norm": 0.10312805970588344, "grad_max_sv": 0.020510493777692318, "grad_min_sv": 0.0, "grad_condition": 20510493777.692318, "lr": 0.00024098649531343477, "time_sec": 87.05790066719055 }, { "epoch": 102, "train_loss": 4.878095693969726, "train_acc": 0.00976, "test_loss": 4.820429385375976, "test_acc": 0.01, "lyapunov": 1.5501237391206004, "grad_norm": 0.11558211080028734, "grad_max_sv": 0.024952154234051706, "grad_min_sv": 0.0, "grad_condition": 24952154234.051704, "lr": 0.0002320866025105016, "time_sec": 87.05184125900269 }, { "epoch": 103, "train_loss": 4.878661685333252, "train_acc": 0.01018, "test_loss": 5.300121360015869, "test_acc": 0.01, "lyapunov": 1.551538582957919, "grad_norm": 0.12567932831666664, "grad_max_sv": 0.012993747182190419, "grad_min_sv": 0.0, "grad_condition": 12993747182.190418, "lr": 0.0002233042253783278, "time_sec": 87.06061792373657 }, { "epoch": 104, "train_loss": 4.877294933776856, "train_acc": 0.0099, "test_loss": 5.135670352172852, "test_acc": 0.01, "lyapunov": 1.5485212714470866, "grad_norm": 0.09250410480818645, "grad_max_sv": 0.004851618967950344, "grad_min_sv": 0.0, "grad_condition": 4851618967.950345, "lr": 0.000214643216157784, "time_sec": 87.05238747596741 }, { "epoch": 105, "train_loss": 4.877063808746338, "train_acc": 0.00988, "test_loss": 5.725478736877442, "test_acc": 0.01, "lyapunov": 1.5481484466806397, "grad_norm": 0.09550603539231842, "grad_max_sv": 0.011385573633015155, "grad_min_sv": 0.0, "grad_condition": 11385573633.015156, "lr": 0.00020610737385376332, "time_sec": 87.0910587310791 }, { "epoch": 106, "train_loss": 4.877282638549804, "train_acc": 0.00984, "test_loss": 5.60465906829834, "test_acc": 0.01, "lyapunov": 1.5483009687165166, "grad_norm": 0.10354511535570549, "grad_max_sv": 0.02720399503596127, "grad_min_sv": 0.0, "grad_condition": 27203995035.961273, "lr": 0.00019770044256881242, "time_sec": 87.10812902450562 }, { "epoch": 107, "train_loss": 4.876681364440918, "train_acc": 0.00976, "test_loss": 5.2093520240783695, "test_acc": 0.01, "lyapunov": 1.5473160725420394, "grad_norm": 0.09575843142426103, "grad_max_sv": 0.007643958646804094, "grad_min_sv": 0.0, "grad_condition": 7643958646.804095, "lr": 0.0001894261098608447, "time_sec": 87.00347948074341 }, { "epoch": 108, "train_loss": 4.878350821228027, "train_acc": 0.01052, "test_loss": 4.913621876525879, "test_acc": 0.01, "lyapunov": 1.5520180210737926, "grad_norm": 0.1307850708492295, "grad_max_sv": 0.016565991286188363, "grad_min_sv": 0.0, "grad_condition": 16565991286.188366, "lr": 0.000181288005125655, "time_sec": 87.0159866809845 }, { "epoch": 109, "train_loss": 4.876669662628174, "train_acc": 0.01016, "test_loss": 4.88301672668457, "test_acc": 0.01, "lyapunov": 1.5467288201422338, "grad_norm": 0.09856162731459642, "grad_max_sv": 0.014887689799070358, "grad_min_sv": 0.0, "grad_condition": 14887689799.070358, "lr": 0.0001732896980049473, "time_sec": 86.99599003791809 }, { "epoch": 110, "train_loss": 4.877418764038086, "train_acc": 0.00988, "test_loss": 5.01456753540039, "test_acc": 0.01, "lyapunov": 1.549457520170285, "grad_norm": 0.11878011333313225, "grad_max_sv": 0.005905823782086372, "grad_min_sv": 0.0, "grad_condition": 5905823782.086372, "lr": 0.00016543469682057076, "time_sec": 87.00050139427185 }, { "epoch": 111, "train_loss": 4.877375203704834, "train_acc": 0.01016, "test_loss": 4.923972444152832, "test_acc": 0.01, "lyapunov": 1.549215167074862, "grad_norm": 0.11051840491520531, "grad_max_sv": 0.007604151451960206, "grad_min_sv": 0.0, "grad_condition": 7604151451.960205, "lr": 0.00015772644703565552, "time_sec": 87.03872609138489 }, { "epoch": 112, "train_loss": 4.87747160736084, "train_acc": 0.0097, "test_loss": 4.956568124389649, "test_acc": 0.01, "lyapunov": 1.5494032619554368, "grad_norm": 0.11381662366828246, "grad_max_sv": 0.01119147464632988, "grad_min_sv": 0.0, "grad_condition": 11191474646.32988, "lr": 0.00015016832974331713, "time_sec": 87.11299419403076 }, { "epoch": 113, "train_loss": 4.87979639755249, "train_acc": 0.01012, "test_loss": 4.926776232910156, "test_acc": 0.01, "lyapunov": 1.5544771361533942, "grad_norm": 0.15709933765078352, "grad_max_sv": 0.00347123583778739, "grad_min_sv": 0.0, "grad_condition": 3471235837.78739, "lr": 0.00014276366018359834, "time_sec": 87.06232452392578 }, { "epoch": 114, "train_loss": 4.878047005310059, "train_acc": 0.00952, "test_loss": 4.92212592086792, "test_acc": 0.01, "lyapunov": 1.5507129702116826, "grad_norm": 0.10294832245991155, "grad_max_sv": 0.012609629379585385, "grad_min_sv": 0.0, "grad_condition": 12609629379.585384, "lr": 0.00013551568628929425, "time_sec": 87.06694340705872 }, { "epoch": 115, "train_loss": 4.877151131134033, "train_acc": 0.0092, "test_loss": 4.918728126525879, "test_acc": 0.01, "lyapunov": 1.548615127878116, "grad_norm": 0.10263613090186025, "grad_max_sv": 0.006314583634957671, "grad_min_sv": 0.0, "grad_condition": 6314583634.957671, "lr": 0.00012842758726130276, "time_sec": 87.03067350387573 }, { "epoch": 116, "train_loss": 4.87786820098877, "train_acc": 0.00982, "test_loss": 5.00487536239624, "test_acc": 0.01, "lyapunov": 1.5504866353691082, "grad_norm": 0.12269127259842373, "grad_max_sv": 0.014170486759394408, "grad_min_sv": 0.0, "grad_condition": 14170486759.39441, "lr": 0.0001215024721741218, "time_sec": 87.00306367874146 }, { "epoch": 117, "train_loss": 4.876784671478272, "train_acc": 0.00974, "test_loss": 5.023514326477051, "test_acc": 0.01, "lyapunov": 1.5474366047193326, "grad_norm": 0.10427521316985092, "grad_max_sv": 0.004411047184839844, "grad_min_sv": 0.0, "grad_condition": 4411047184.839845, "lr": 0.00011474337861210538, "time_sec": 87.03306269645691 }, { "epoch": 118, "train_loss": 4.877164349365234, "train_acc": 0.01002, "test_loss": 4.991419695281983, "test_acc": 0.01, "lyapunov": 1.5484020453889658, "grad_norm": 0.10471789513305493, "grad_max_sv": 0.008587307529523969, "grad_min_sv": 0.0, "grad_condition": 8587307529.523969, "lr": 0.00010815327133708009, "time_sec": 87.06011486053467 }, { "epoch": 119, "train_loss": 4.876861254577637, "train_acc": 0.00988, "test_loss": 5.089453727722168, "test_acc": 0.01, "lyapunov": 1.5475890602906952, "grad_norm": 0.10992180658040822, "grad_max_sv": 0.009593591233715415, "grad_min_sv": 0.0, "grad_condition": 9593591233.715414, "lr": 0.00010173504098790182, "time_sec": 87.0181610584259 }, { "epoch": 120, "train_loss": 4.87691458618164, "train_acc": 0.00984, "test_loss": 5.0014659088134765, "test_acc": 0.01, "lyapunov": 1.5480926106957829, "grad_norm": 0.10767138662291806, "grad_max_sv": 0.0038278432097285987, "grad_min_sv": 0.0, "grad_condition": 3827843209.728598, "lr": 9.549150281252629e-05, "time_sec": 86.99478530883789 }, { "epoch": 121, "train_loss": 4.877940362548828, "train_acc": 0.00962, "test_loss": 4.935777435302734, "test_acc": 0.01, "lyapunov": 1.5509431261540678, "grad_norm": 0.13054112707845358, "grad_max_sv": 0.006552627170458436, "grad_min_sv": 0.0, "grad_condition": 6552627170.458437, "lr": 8.942539543314794e-05, "time_sec": 87.0364146232605 }, { "epoch": 122, "train_loss": 4.877626941223144, "train_acc": 0.01018, "test_loss": 4.956711478424072, "test_acc": 0.01, "lyapunov": 1.549799994434542, "grad_norm": 0.12579422138988705, "grad_max_sv": 0.012472250685095786, "grad_min_sv": 0.0, "grad_condition": 12472250685.095787, "lr": 8.353937964495024e-05, "time_sec": 87.04438400268555 }, { "epoch": 123, "train_loss": 4.8773612213134765, "train_acc": 0.01028, "test_loss": 5.112759294128418, "test_acc": 0.01, "lyapunov": 1.5493231264831464, "grad_norm": 0.11869948278714595, "grad_max_sv": 0.006990070082247257, "grad_min_sv": 0.0, "grad_condition": 6990070082.247256, "lr": 7.783603724899243e-05, "time_sec": 87.04442477226257 }, { "epoch": 124, "train_loss": 4.876904801330566, "train_acc": 0.00974, "test_loss": 5.0848597717285156, "test_acc": 0.01, "lyapunov": 1.547949957725642, "grad_norm": 0.11622328135609243, "grad_max_sv": 0.00592916551977396, "grad_min_sv": 0.0, "grad_condition": 5929165519.773959, "lr": 7.231786991974666e-05, "time_sec": 87.02583312988281 }, { "epoch": 125, "train_loss": 4.876884867248535, "train_acc": 0.00994, "test_loss": 5.093001669311524, "test_acc": 0.01, "lyapunov": 1.5479519553196706, "grad_norm": 0.11394234129927898, "grad_max_sv": 0.003486808715388179, "grad_min_sv": 0.0, "grad_condition": 3486808715.388179, "lr": 6.698729810778072e-05, "time_sec": 87.01634311676025 }, { "epoch": 126, "train_loss": 4.87686362991333, "train_acc": 0.00962, "test_loss": 5.044818876647949, "test_acc": 0.01, "lyapunov": 1.5478015985635236, "grad_norm": 0.11528475995319568, "grad_max_sv": 0.01741538755595684, "grad_min_sv": 0.0, "grad_condition": 17415387555.95684, "lr": 6.184665997806817e-05, "time_sec": 87.03749418258667 }, { "epoch": 127, "train_loss": 4.877244481811523, "train_acc": 0.00992, "test_loss": 5.0011329849243165, "test_acc": 0.01, "lyapunov": 1.5490661807682202, "grad_norm": 0.11235050252375584, "grad_max_sv": 0.0023714601527899505, "grad_min_sv": 0.0, "grad_condition": 2371460152.7899504, "lr": 5.6898210384392595e-05, "time_sec": 87.06668877601624 }, { "epoch": 128, "train_loss": 4.877482815856934, "train_acc": 0.01004, "test_loss": 5.234975555419922, "test_acc": 0.01, "lyapunov": 1.549882313784431, "grad_norm": 0.11546242652617031, "grad_max_sv": 0.0007256413344293832, "grad_min_sv": 0.0, "grad_condition": 725641334.4293833, "lr": 5.214411988029363e-05, "time_sec": 87.02991795539856 }, { "epoch": 129, "train_loss": 4.8767640072631835, "train_acc": 0.01006, "test_loss": 5.377161560821533, "test_acc": 0.01, "lyapunov": 1.5474718257289408, "grad_norm": 0.12203371483427425, "grad_max_sv": 0.016016411827877164, "grad_min_sv": 0.0, "grad_condition": 16016411827.877163, "lr": 4.7586473766990294e-05, "time_sec": 87.09737348556519 }, { "epoch": 130, "train_loss": 4.8772621307373045, "train_acc": 0.00994, "test_loss": 5.146733520507812, "test_acc": 0.01, "lyapunov": 1.5492317725325484, "grad_norm": 0.13239853793431725, "grad_max_sv": 0.007805489096790552, "grad_min_sv": 0.0, "grad_condition": 7805489096.790552, "lr": 4.32272711786996e-05, "time_sec": 87.02493596076965 }, { "epoch": 131, "train_loss": 4.878482946472168, "train_acc": 0.01002, "test_loss": 5.187312270355225, "test_acc": 0.01, "lyapunov": 1.5515824739280564, "grad_norm": 0.13050261520417258, "grad_max_sv": 0.003781923418864608, "grad_min_sv": 0.0, "grad_condition": 3781923418.8646073, "lr": 3.906842420574966e-05, "time_sec": 87.00766158103943 }, { "epoch": 132, "train_loss": 4.8773687062072755, "train_acc": 0.01038, "test_loss": 5.233526524353027, "test_acc": 0.01, "lyapunov": 1.5493864241768331, "grad_norm": 0.13275623808990364, "grad_max_sv": 0.00900785457342863, "grad_min_sv": 0.0, "grad_condition": 9007854573.42863, "lr": 3.5111757055874305e-05, "time_sec": 87.07332277297974 }, { "epoch": 133, "train_loss": 4.877119999389649, "train_acc": 0.01, "test_loss": 5.208364566040039, "test_acc": 0.01, "lyapunov": 1.5486897553324395, "grad_norm": 0.13669667117137443, "grad_max_sv": 0.0031375800725072624, "grad_min_sv": 0.0, "grad_condition": 3137580072.507262, "lr": 3.1359005254054254e-05, "time_sec": 87.08415913581848 }, { "epoch": 134, "train_loss": 4.876680097198486, "train_acc": 0.01026, "test_loss": 5.228788011169434, "test_acc": 0.01, "lyapunov": 1.5476158646976246, "grad_norm": 0.1315586247563803, "grad_max_sv": 0.0019336893223226071, "grad_min_sv": 0.0, "grad_condition": 1933689322.322607, "lr": 2.7811814881259484e-05, "time_sec": 87.04997158050537 }, { "epoch": 135, "train_loss": 4.877045626525879, "train_acc": 0.00998, "test_loss": 5.150844607543945, "test_acc": 0.01, "lyapunov": 1.5484065021700262, "grad_norm": 0.16019208167708357, "grad_max_sv": 0.0067828110419213775, "grad_min_sv": 0.0, "grad_condition": 6782811041.921377, "lr": 2.4471741852423218e-05, "time_sec": 87.07145261764526 }, { "epoch": 136, "train_loss": 4.877011717224121, "train_acc": 0.00942, "test_loss": 5.185321200561523, "test_acc": 0.01, "lyapunov": 1.5481893522355257, "grad_norm": 0.16513336675938264, "grad_max_sv": 0.006155044818297028, "grad_min_sv": 0.0, "grad_condition": 6155044818.297029, "lr": 2.1340251233966362e-05, "time_sec": 87.08501839637756 }, { "epoch": 137, "train_loss": 4.877299792480469, "train_acc": 0.00994, "test_loss": 5.153644463348389, "test_acc": 0.01, "lyapunov": 1.5492148905458962, "grad_norm": 0.14657870229772474, "grad_max_sv": 0.007406354090198875, "grad_min_sv": 0.0, "grad_condition": 7406354090.1988735, "lr": 1.8418716601170932e-05, "time_sec": 87.17517495155334 }, { "epoch": 138, "train_loss": 4.877124798736572, "train_acc": 0.01016, "test_loss": 5.164669793701172, "test_acc": 0.01, "lyapunov": 1.548459598170522, "grad_norm": 0.15457514508897918, "grad_max_sv": 0.012952858628705145, "grad_min_sv": 0.0, "grad_condition": 12952858628.705143, "lr": 1.570841943568445e-05, "time_sec": 87.19324207305908 }, { "epoch": 139, "train_loss": 4.877282972564697, "train_acc": 0.00982, "test_loss": 5.207451676940918, "test_acc": 0.01, "lyapunov": 1.5492830764302208, "grad_norm": 0.18425099220738375, "grad_max_sv": 0.0019508119206875564, "grad_min_sv": 0.0, "grad_condition": 1950811920.6875565, "lr": 1.3210548563419845e-05, "time_sec": 87.13183116912842 }, { "epoch": 140, "train_loss": 4.877498146057129, "train_acc": 0.00968, "test_loss": 5.200590103149414, "test_acc": 0.01, "lyapunov": 1.5491700614504802, "grad_norm": 0.1734732516042842, "grad_max_sv": 0.01371888890862465, "grad_min_sv": 0.0, "grad_condition": 13718888908.62465, "lr": 1.0926199633097203e-05, "time_sec": 87.21231150627136 }, { "epoch": 141, "train_loss": 4.8770866912841795, "train_acc": 0.00992, "test_loss": 5.190837601470947, "test_acc": 0.01, "lyapunov": 1.548795386653422, "grad_norm": 0.14753103772737095, "grad_max_sv": 0.005145562486723066, "grad_min_sv": 0.0, "grad_condition": 5145562486.723065, "lr": 8.856374635655688e-06, "time_sec": 87.26526665687561 }, { "epoch": 142, "train_loss": 4.8766608699035645, "train_acc": 0.00968, "test_loss": 5.162030874633789, "test_acc": 0.01, "lyapunov": 1.5475660821665889, "grad_norm": 0.15219397900813178, "grad_max_sv": 0.005608938308432699, "grad_min_sv": 0.0, "grad_condition": 5608938308.432698, "lr": 7.001981464747503e-06, "time_sec": 87.12494492530823 }, { "epoch": 143, "train_loss": 4.8769151321411135, "train_acc": 0.01004, "test_loss": 5.153072937011719, "test_acc": 0.01, "lyapunov": 1.5482893115114373, "grad_norm": 0.15346228098731488, "grad_max_sv": 0.001303949998691678, "grad_min_sv": 0.0, "grad_condition": 1303949998.691678, "lr": 5.3638335185058295e-06, "time_sec": 87.097491979599 }, { "epoch": 144, "train_loss": 4.877143389892578, "train_acc": 0.0097, "test_loss": 5.164535620117188, "test_acc": 0.01, "lyapunov": 1.5487491736936447, "grad_norm": 0.15811775595604075, "grad_max_sv": 0.008902552211657167, "grad_min_sv": 0.0, "grad_condition": 8902552211.657166, "lr": 3.942649342761114e-06, "time_sec": 87.06983470916748 }, { "epoch": 145, "train_loss": 4.876982822113037, "train_acc": 0.00984, "test_loss": 5.165194831848145, "test_acc": 0.01, "lyapunov": 1.5484599853720507, "grad_norm": 0.1582019401241392, "grad_max_sv": 0.004445526329800486, "grad_min_sv": 0.0, "grad_condition": 4445526329.800487, "lr": 2.7390523158633524e-06, "time_sec": 87.08561754226685 }, { "epoch": 146, "train_loss": 4.876878872375488, "train_acc": 0.00992, "test_loss": 5.165199098205567, "test_acc": 0.01, "lyapunov": 1.5481780770489626, "grad_norm": 0.16041164237051417, "grad_max_sv": 0.003941980935633182, "grad_min_sv": 0.0, "grad_condition": 3941980935.6331825, "lr": 1.7535703752478133e-06, "time_sec": 87.0421531200409 }, { "epoch": 147, "train_loss": 4.8771999089050295, "train_acc": 0.01004, "test_loss": 5.164550498199463, "test_acc": 0.01, "lyapunov": 1.5491338004846402, "grad_norm": 0.16309259034155005, "grad_max_sv": 0.004459652304649353, "grad_min_sv": 0.0, "grad_condition": 4459652304.649353, "lr": 9.866357858642196e-07, "time_sec": 87.06988906860352 }, { "epoch": 148, "train_loss": 4.876641088562011, "train_acc": 0.00982, "test_loss": 5.164551524353027, "test_acc": 0.01, "lyapunov": 1.5472115714226842, "grad_norm": 0.15826813584085664, "grad_max_sv": 0.008349275542423129, "grad_min_sv": 0.0, "grad_condition": 8349275542.423129, "lr": 4.38584950570808e-07, "time_sec": 87.10272812843323 }, { "epoch": 149, "train_loss": 4.877132370300293, "train_acc": 0.01012, "test_loss": 5.164552142333984, "test_acc": 0.01, "lyapunov": 1.5489305702926557, "grad_norm": 0.15991562154962183, "grad_max_sv": 0.0012625465169548988, "grad_min_sv": 0.0, "grad_condition": 1262546516.9548988, "lr": 1.096582625772501e-07, "time_sec": 87.08622741699219 }, { "epoch": 150, "train_loss": 4.876020973968505, "train_acc": 0.0099, "test_loss": 5.164552197265625, "test_acc": 0.01, "lyapunov": 1.545588637251988, "grad_norm": 0.16382667555465003, "grad_max_sv": 0.008686219714581967, "grad_min_sv": 0.0, "grad_condition": 8686219714.581966, "lr": 0.0, "time_sec": 87.09966802597046 } ], "12": [ { "epoch": 1, "train_loss": 4.855030886230469, "train_acc": 0.0148, "test_loss": 4.869620406341553, "test_acc": 0.01, "lyapunov": 2.2862052685769316, "grad_norm": 4.935339749560766, "grad_max_sv": 4.1397371053695675, "grad_min_sv": 8.49077093301176e-08, "grad_condition": 60021939.87195291, "lr": 0.0009998903417374227, "time_sec": 132.66977620124817 }, { "epoch": 2, "train_loss": 4.676363162231445, "train_acc": 0.01706, "test_loss": 4.653746462249756, "test_acc": 0.01, "lyapunov": 1.9439213897870935, "grad_norm": 2.813935189124443, "grad_max_sv": 2.2243280917406083, "grad_min_sv": 4.668241500582759e-08, "grad_condition": 69883158.92021513, "lr": 0.0009995614150494292, "time_sec": 132.62859869003296 }, { "epoch": 3, "train_loss": 4.635125137634278, "train_acc": 0.0156, "test_loss": 4.85989921875, "test_acc": 0.01, "lyapunov": 1.709093817359651, "grad_norm": 1.402581704275357, "grad_max_sv": 1.0371076561510564, "grad_min_sv": 1.9744334944187383e-08, "grad_condition": 12965122527.521233, "lr": 0.0009990133642141358, "time_sec": 132.57633781433105 }, { "epoch": 4, "train_loss": 4.640354335479737, "train_acc": 0.01534, "test_loss": 4.637619474792481, "test_acc": 0.01, "lyapunov": 1.6715390605999685, "grad_norm": 0.9398579368308534, "grad_max_sv": 0.6633182838559151, "grad_min_sv": 1.2069862256511819e-08, "grad_condition": 8530355196.976077, "lr": 0.0009982464296247522, "time_sec": 132.54676032066345 }, { "epoch": 5, "train_loss": 4.64221305480957, "train_acc": 0.01564, "test_loss": 4.680573092651367, "test_acc": 0.01, "lyapunov": 1.657093484688293, "grad_norm": 0.552135234831364, "grad_max_sv": 0.3695975001901388, "grad_min_sv": 2.375610143283509e-09, "grad_condition": 53738580663.96106, "lr": 0.0009972609476841367, "time_sec": 132.5168435573578 }, { "epoch": 6, "train_loss": 4.6413539511108395, "train_acc": 0.01584, "test_loss": 5.049699407958984, "test_acc": 0.0103, "lyapunov": 1.6153722675255193, "grad_norm": 0.5032723336212916, "grad_max_sv": 0.3346161611378193, "grad_min_sv": 1.7202862416924891e-09, "grad_condition": 61330096051.013405, "lr": 0.000996057350657239, "time_sec": 132.53665018081665 }, { "epoch": 7, "train_loss": 4.6673028504943845, "train_acc": 0.01474, "test_loss": 4.570369634246826, "test_acc": 0.0114, "lyapunov": 1.6155120164841947, "grad_norm": 0.406883512526028, "grad_max_sv": 0.2576971501111984, "grad_min_sv": 1.9000999133456468e-10, "grad_condition": 77661364868.79805, "lr": 0.000994636166481494, "time_sec": 132.51018714904785 }, { "epoch": 8, "train_loss": 4.760079259643555, "train_acc": 0.01052, "test_loss": 4.907698545074463, "test_acc": 0.01, "lyapunov": 1.5642740458173825, "grad_norm": 0.7987649812847755, "grad_max_sv": 0.6862246070057154, "grad_min_sv": 1.0877307097171696e-08, "grad_condition": 32321166738.690815, "lr": 0.0009929980185352525, "time_sec": 132.5572907924652 }, { "epoch": 9, "train_loss": 4.772606210021973, "train_acc": 0.00996, "test_loss": 4.704743336486817, "test_acc": 0.01, "lyapunov": 1.5716174904952573, "grad_norm": 0.8148548143851404, "grad_max_sv": 0.6870301708579063, "grad_min_sv": 1.1020205989789069e-08, "grad_condition": 2417926250.6670694, "lr": 0.0009911436253643444, "time_sec": 132.52283430099487 }, { "epoch": 10, "train_loss": 4.773616914978027, "train_acc": 0.01062, "test_loss": 4.874710052490235, "test_acc": 0.01, "lyapunov": 1.562704872292326, "grad_norm": 0.6675097799983111, "grad_max_sv": 0.5464496180415154, "grad_min_sv": 7.172653980753015e-09, "grad_condition": 20965681724.308956, "lr": 0.0009890738003669028, "time_sec": 132.5459840297699 }, { "epoch": 11, "train_loss": 4.773348721618652, "train_acc": 0.01024, "test_loss": 4.6200670059204105, "test_acc": 0.01, "lyapunov": 1.562029262637848, "grad_norm": 0.5488543058826973, "grad_max_sv": 0.4311558365821838, "grad_min_sv": 2.9074530078217566e-09, "grad_condition": 49435903159.65074, "lr": 0.00098678945143658, "time_sec": 132.52372455596924 }, { "epoch": 12, "train_loss": 4.780688554229736, "train_acc": 0.01046, "test_loss": 4.7990555023193355, "test_acc": 0.01, "lyapunov": 1.557410420359248, "grad_norm": 0.39735835708243683, "grad_max_sv": 0.29783011190593245, "grad_min_sv": 2.955632668999543e-10, "grad_condition": 137320228990.74185, "lr": 0.0009842915805643154, "time_sec": 132.52459120750427 }, { "epoch": 13, "train_loss": 4.794568827362061, "train_acc": 0.00944, "test_loss": 4.6620225440979, "test_acc": 0.01, "lyapunov": 1.5579908677684071, "grad_norm": 0.3760550232574214, "grad_max_sv": 0.27942878790199754, "grad_min_sv": 7.445462603040203e-10, "grad_condition": 105013083205.519, "lr": 0.000981581283398829, "time_sec": 132.5209527015686 }, { "epoch": 14, "train_loss": 4.809564754486084, "train_acc": 0.00862, "test_loss": 4.655567189025879, "test_acc": 0.01, "lyapunov": 1.571449481007998, "grad_norm": 0.33124516886493516, "grad_max_sv": 0.21216185558587314, "grad_min_sv": 5.858595327667813e-10, "grad_condition": 110751878933.28384, "lr": 0.0009786597487660333, "time_sec": 132.577819108963 }, { "epoch": 15, "train_loss": 4.816427656860352, "train_acc": 0.00936, "test_loss": 4.6545363082885745, "test_acc": 0.01, "lyapunov": 1.5565597386006504, "grad_norm": 0.2791973343426611, "grad_max_sv": 0.1684179350733757, "grad_min_sv": 6.917982259102923e-13, "grad_condition": 127223674978.58926, "lr": 0.0009755282581475766, "time_sec": 132.58430194854736 }, { "epoch": 16, "train_loss": 4.829237567138672, "train_acc": 0.00908, "test_loss": 4.629003553771972, "test_acc": 0.01, "lyapunov": 1.5557427775219579, "grad_norm": 0.2712716184485074, "grad_max_sv": 0.1436759451404214, "grad_min_sv": 3.50392380214562e-13, "grad_condition": 118193912798.78633, "lr": 0.0009721881851187403, "time_sec": 132.49679327011108 }, { "epoch": 17, "train_loss": 4.842587297058105, "train_acc": 0.00944, "test_loss": 4.633112139892578, "test_acc": 0.01, "lyapunov": 1.554307114742601, "grad_norm": 0.26245775185719383, "grad_max_sv": 0.140065660700202, "grad_min_sv": 2.6676405041443376e-15, "grad_condition": 139703664535.0272, "lr": 0.0009686409947459456, "time_sec": 132.52488541603088 }, { "epoch": 18, "train_loss": 4.85334480545044, "train_acc": 0.0098, "test_loss": 4.6145305236816405, "test_acc": 0.01, "lyapunov": 1.5502319726187859, "grad_norm": 0.20648576741983057, "grad_max_sv": 0.11613305620849132, "grad_min_sv": 2.4641309551932607e-14, "grad_condition": 112456376406.20891, "lr": 0.0009648882429441254, "time_sec": 132.53546261787415 }, { "epoch": 19, "train_loss": 4.8756606997680665, "train_acc": 0.00972, "test_loss": 4.63894914932251, "test_acc": 0.01, "lyapunov": 1.5529851959184613, "grad_norm": 0.29909579690838006, "grad_max_sv": 0.2365069929510355, "grad_min_sv": 8.824648532682828e-14, "grad_condition": 223546987940.7954, "lr": 0.00096093157579425, "time_sec": 132.5408227443695 }, { "epoch": 20, "train_loss": 4.8827299949646, "train_acc": 0.01024, "test_loss": 4.622587729644775, "test_acc": 0.01, "lyapunov": 1.556399286555512, "grad_norm": 0.15272550856176187, "grad_max_sv": 0.08741383519954979, "grad_min_sv": 8.699695565641333e-15, "grad_condition": 85913025020.82304, "lr": 0.0009567727288213001, "time_sec": 132.51366233825684 }, { "epoch": 21, "train_loss": 4.884711999969483, "train_acc": 0.00998, "test_loss": 4.606764881896972, "test_acc": 0.01, "lyapunov": 1.5493811259184347, "grad_norm": 0.2280734728397927, "grad_max_sv": 0.17737758290022612, "grad_min_sv": 1.7983389117226294e-14, "grad_condition": 174310016585.06476, "lr": 0.0009524135262330095, "time_sec": 132.5240728855133 }, { "epoch": 22, "train_loss": 4.88518779006958, "train_acc": 0.00898, "test_loss": 4.625405541229248, "test_acc": 0.01, "lyapunov": 1.5538233515551634, "grad_norm": 0.21224774170023955, "grad_max_sv": 0.15938115157186986, "grad_min_sv": 3.1749157935371154e-14, "grad_condition": 154547913667.9044, "lr": 0.0009478558801197061, "time_sec": 132.49090003967285 }, { "epoch": 23, "train_loss": 4.87999728149414, "train_acc": 0.01018, "test_loss": 4.662280471801758, "test_acc": 0.01, "lyapunov": 1.5508448772723107, "grad_norm": 0.15119163863092763, "grad_max_sv": 0.08865232784301043, "grad_min_sv": 7.005994597272193e-16, "grad_condition": 88575401119.44853, "lr": 0.000943101789615607, "time_sec": 132.47974038124084 }, { "epoch": 24, "train_loss": 4.881147270202637, "train_acc": 0.00976, "test_loss": 4.615948718261719, "test_acc": 0.01, "lyapunov": 1.5512399081988713, "grad_norm": 0.15770676446584825, "grad_max_sv": 0.10294295214116574, "grad_min_sv": 5.7741339454657465e-15, "grad_condition": 102285384766.49887, "lr": 0.0009381533400219313, "time_sec": 132.52317762374878 }, { "epoch": 25, "train_loss": 4.880569260253906, "train_acc": 0.00984, "test_loss": 4.610492027282715, "test_acc": 0.01, "lyapunov": 1.5512746035900262, "grad_norm": 0.14554815906091484, "grad_max_sv": 0.08865004125982523, "grad_min_sv": 2.6778839672578997e-16, "grad_condition": 88627301882.68987, "lr": 0.0009330127018922189, "time_sec": 132.56079196929932 }, { "epoch": 26, "train_loss": 4.881224513397217, "train_acc": 0.01002, "test_loss": 4.747660410308838, "test_acc": 0.01, "lyapunov": 1.5542162702516522, "grad_norm": 0.1391562981495577, "grad_max_sv": 0.08203545394353569, "grad_min_sv": 2.822381678288234e-15, "grad_condition": 81722256507.78954, "lr": 0.000927682130080253, "time_sec": 132.5239975452423 }, { "epoch": 27, "train_loss": 4.881258678741455, "train_acc": 0.0098, "test_loss": 4.790026293182373, "test_acc": 0.01, "lyapunov": 1.5510657614149401, "grad_norm": 0.14725967817424349, "grad_max_sv": 0.09194991793483495, "grad_min_sv": 4.568772527401975e-15, "grad_condition": 91398390464.57925, "lr": 0.0009221639627510072, "time_sec": 132.526837348938 }, { "epoch": 28, "train_loss": 4.880898860931397, "train_acc": 0.0102, "test_loss": 4.802646064758301, "test_acc": 0.01, "lyapunov": 1.5514030862037482, "grad_norm": 0.14347689217252269, "grad_max_sv": 0.09245897587388754, "grad_min_sv": 1.0843861076282981e-15, "grad_condition": 92342187840.9415, "lr": 0.0009164606203550494, "time_sec": 132.5042200088501 }, { "epoch": 29, "train_loss": 4.880448774719238, "train_acc": 0.01046, "test_loss": 4.7516579360961915, "test_acc": 0.01, "lyapunov": 1.5519556474807623, "grad_norm": 0.13309334546952373, "grad_max_sv": 0.08154573319479823, "grad_min_sv": 9.282067880476938e-16, "grad_condition": 81454842058.19734, "lr": 0.0009105746045668516, "time_sec": 132.52633500099182 }, { "epoch": 30, "train_loss": 4.883071630401611, "train_acc": 0.00954, "test_loss": 4.771951943206787, "test_acc": 0.01, "lyapunov": 1.554316602399587, "grad_norm": 0.14789859288021653, "grad_max_sv": 0.09579872786998749, "grad_min_sv": 3.051331237308755e-15, "grad_condition": 95468711969.6211, "lr": 0.0009045084971874733, "time_sec": 132.5885534286499 }, { "epoch": 31, "train_loss": 4.881176261901856, "train_acc": 0.00888, "test_loss": 4.774106753540039, "test_acc": 0.01, "lyapunov": 1.5536001310933887, "grad_norm": 0.13112482323923252, "grad_max_sv": 0.07564891651272773, "grad_min_sv": 2.107048715412855e-15, "grad_condition": 75454097088.2188, "lr": 0.0008982649590120977, "time_sec": 132.49479031562805 }, { "epoch": 32, "train_loss": 4.880477762145996, "train_acc": 0.00962, "test_loss": 4.746245973968506, "test_acc": 0.01, "lyapunov": 1.5537874387658162, "grad_norm": 0.12461403839681509, "grad_max_sv": 0.062327271420508625, "grad_min_sv": 1.0725391843424482e-20, "grad_condition": 62327270693.35764, "lr": 0.0008918467286629196, "time_sec": 132.4852647781372 }, { "epoch": 33, "train_loss": 4.881243226470947, "train_acc": 0.00888, "test_loss": 4.736703532409668, "test_acc": 0.01, "lyapunov": 1.556170121788064, "grad_norm": 0.1148317700659679, "grad_max_sv": 0.05345285767689347, "grad_min_sv": 0.0, "grad_condition": 53452857676.89348, "lr": 0.0008852566213878943, "time_sec": 132.53890919685364 }, { "epoch": 34, "train_loss": 4.881585180969238, "train_acc": 0.01008, "test_loss": 4.703427969360352, "test_acc": 0.01, "lyapunov": 1.5578572292766912, "grad_norm": 0.11335239335552806, "grad_max_sv": 0.052668086066842076, "grad_min_sv": 0.0, "grad_condition": 52668086066.84208, "lr": 0.000878497527825878, "time_sec": 132.64637637138367 }, { "epoch": 35, "train_loss": 4.882511229858398, "train_acc": 0.0097, "test_loss": 4.681371363830566, "test_acc": 0.01, "lyapunov": 1.5592110135671122, "grad_norm": 0.12058968555924836, "grad_max_sv": 0.06217097630724311, "grad_min_sv": 0.0, "grad_condition": 62170976307.2431, "lr": 0.000871572412738697, "time_sec": 132.43680119514465 }, { "epoch": 36, "train_loss": 4.881192719268799, "train_acc": 0.00946, "test_loss": 4.697506471252441, "test_acc": 0.01, "lyapunov": 1.5561128973655993, "grad_norm": 0.11655881819882306, "grad_max_sv": 0.058859458193182945, "grad_min_sv": 8.230737425630695e-40, "grad_condition": 58859458193.182945, "lr": 0.0008644843137107055, "time_sec": 132.4848039150238 }, { "epoch": 37, "train_loss": 4.8825209786987305, "train_acc": 0.00972, "test_loss": 4.694917836761475, "test_acc": 0.01, "lyapunov": 1.5584492564506238, "grad_norm": 0.13341533833277566, "grad_max_sv": 0.07657676143571734, "grad_min_sv": 1.687390330982044e-16, "grad_condition": 76560751213.82744, "lr": 0.0008572363398164014, "time_sec": 132.51812028884888 }, { "epoch": 38, "train_loss": 4.882141689910888, "train_acc": 0.01016, "test_loss": 4.688916626739502, "test_acc": 0.01, "lyapunov": 1.5593435761263914, "grad_norm": 0.11853299040694154, "grad_max_sv": 0.055678781820461154, "grad_min_sv": 6.767910398009686e-40, "grad_condition": 55678781820.46116, "lr": 0.0008498316702566826, "time_sec": 132.56456470489502 }, { "epoch": 39, "train_loss": 4.8832370683288575, "train_acc": 0.01006, "test_loss": 4.7038502136230465, "test_acc": 0.01, "lyapunov": 1.5620976924286474, "grad_norm": 0.11941743088728123, "grad_max_sv": 0.05502237342298031, "grad_min_sv": 8.246841147582715e-40, "grad_condition": 55022373422.9803, "lr": 0.0008422735529643442, "time_sec": 132.5043168067932 }, { "epoch": 40, "train_loss": 4.884805080718994, "train_acc": 0.00916, "test_loss": 4.710450775146485, "test_acc": 0.01, "lyapunov": 1.5655303751416219, "grad_norm": 0.12619034606889276, "grad_max_sv": 0.06059649083763361, "grad_min_sv": 2.3062997125157342e-34, "grad_condition": 60596490837.63362, "lr": 0.0008345653031794289, "time_sec": 132.5351688861847 }, { "epoch": 41, "train_loss": 4.886436430511474, "train_acc": 0.00842, "test_loss": 4.693475389099121, "test_acc": 0.01, "lyapunov": 1.566963563794675, "grad_norm": 0.13196364661308996, "grad_max_sv": 0.06961128637194633, "grad_min_sv": 1.1737794876080507e-22, "grad_condition": 69611286362.64899, "lr": 0.0008267103019950526, "time_sec": 132.51111769676208 }, { "epoch": 42, "train_loss": 4.882716519012451, "train_acc": 0.00938, "test_loss": 4.694032908630371, "test_acc": 0.01, "lyapunov": 1.5620074573990024, "grad_norm": 0.11781162776823918, "grad_max_sv": 0.046270584035664794, "grad_min_sv": 0.0, "grad_condition": 46270584035.664795, "lr": 0.0008187119948743447, "time_sec": 132.5160994529724 }, { "epoch": 43, "train_loss": 4.8821180502319335, "train_acc": 0.00952, "test_loss": 4.7027722869873045, "test_acc": 0.01, "lyapunov": 1.561017348638276, "grad_norm": 0.11312831534529132, "grad_max_sv": 0.04106818297877908, "grad_min_sv": 0.0, "grad_condition": 41068182978.77908, "lr": 0.000810573890139155, "time_sec": 132.5087025165558 }, { "epoch": 44, "train_loss": 4.883875316619873, "train_acc": 0.00868, "test_loss": 4.726299923706055, "test_acc": 0.01, "lyapunov": 1.5633756574767326, "grad_norm": 0.12667296790156193, "grad_max_sv": 0.0658588983118534, "grad_min_sv": 1.0092078216956858e-18, "grad_condition": 65858810617.60825, "lr": 0.0008022995574311873, "time_sec": 132.5128674507141 }, { "epoch": 45, "train_loss": 4.883541934661865, "train_acc": 0.00932, "test_loss": 4.7017227630615235, "test_acc": 0.01, "lyapunov": 1.5632145856042652, "grad_norm": 0.12309109072630019, "grad_max_sv": 0.05839173295535147, "grad_min_sv": 3.503246160812043e-47, "grad_condition": 58391732955.35146, "lr": 0.0007938926261462363, "time_sec": 132.53016304969788 }, { "epoch": 46, "train_loss": 4.888793373718261, "train_acc": 0.00888, "test_loss": 4.696292651367187, "test_acc": 0.01, "lyapunov": 1.5750811136592076, "grad_norm": 0.13746736535152312, "grad_max_sv": 0.058484140876680614, "grad_min_sv": 0.0, "grad_condition": 58484140876.68062, "lr": 0.0007853567838422158, "time_sec": 132.50724458694458 }, { "epoch": 47, "train_loss": 4.883440639190674, "train_acc": 0.00972, "test_loss": 4.701148196411133, "test_acc": 0.01, "lyapunov": 1.564275365351411, "grad_norm": 0.12158899868830998, "grad_max_sv": 0.05122774885967374, "grad_min_sv": 0.0, "grad_condition": 51227748859.673744, "lr": 0.0007766957746216719, "time_sec": 132.50299715995789 }, { "epoch": 48, "train_loss": 4.884719120330811, "train_acc": 0.00906, "test_loss": 4.729176859283447, "test_acc": 0.01, "lyapunov": 1.5687132698800557, "grad_norm": 0.12254448404539135, "grad_max_sv": 0.040120215015485884, "grad_min_sv": 0.0, "grad_condition": 40120215015.485886, "lr": 0.0007679133974894982, "time_sec": 132.46641159057617 }, { "epoch": 49, "train_loss": 4.884110562133789, "train_acc": 0.00872, "test_loss": 4.725056867980957, "test_acc": 0.01, "lyapunov": 1.5669305754439604, "grad_norm": 0.1149187900499572, "grad_max_sv": 0.03382976925931871, "grad_min_sv": 0.0, "grad_condition": 33829769259.318707, "lr": 0.000759013504686565, "time_sec": 132.51045417785645 }, { "epoch": 50, "train_loss": 4.883614390563965, "train_acc": 0.00966, "test_loss": 4.709762881469727, "test_acc": 0.01, "lyapunov": 1.566156323608535, "grad_norm": 0.12258255087018385, "grad_max_sv": 0.034629582427442074, "grad_min_sv": 0.0, "grad_condition": 34629582427.44206, "lr": 0.0007499999999999998, "time_sec": 132.5417709350586 }, { "epoch": 51, "train_loss": 4.8839620613098145, "train_acc": 0.0093, "test_loss": 4.6980411888122555, "test_acc": 0.01, "lyapunov": 1.5664365087323786, "grad_norm": 0.13769170593996222, "grad_max_sv": 0.04753138842061162, "grad_min_sv": 0.0, "grad_condition": 47531388420.61162, "lr": 0.0007408768370508575, "time_sec": 132.5473415851593 }, { "epoch": 52, "train_loss": 4.883951457366943, "train_acc": 0.0097, "test_loss": 4.7330233673095705, "test_acc": 0.01, "lyapunov": 1.5676923822563933, "grad_norm": 0.12914534017358148, "grad_max_sv": 0.03236106717959046, "grad_min_sv": 0.0, "grad_condition": 32361067179.590466, "lr": 0.0007316480175599307, "time_sec": 132.50377297401428 }, { "epoch": 53, "train_loss": 4.883413257293701, "train_acc": 0.00908, "test_loss": 4.7225365089416504, "test_acc": 0.01, "lyapunov": 1.5648496943666501, "grad_norm": 0.1255861922278266, "grad_max_sv": 0.04178534299135208, "grad_min_sv": 0.0, "grad_condition": 41785342991.35208, "lr": 0.0007223175895924635, "time_sec": 132.52618622779846 }, { "epoch": 54, "train_loss": 4.8835242868041995, "train_acc": 0.00984, "test_loss": 4.827378164672852, "test_acc": 0.01, "lyapunov": 1.5652363522888144, "grad_norm": 0.11717740789911417, "grad_max_sv": 0.04349024128168821, "grad_min_sv": 0.0, "grad_condition": 43490241281.68822, "lr": 0.0007128896457825361, "time_sec": 132.49181389808655 }, { "epoch": 55, "train_loss": 4.885148456573487, "train_acc": 0.00938, "test_loss": 4.805696286010742, "test_acc": 0.01, "lyapunov": 1.5694574946942537, "grad_norm": 0.11719591784462954, "grad_max_sv": 0.027647955063730478, "grad_min_sv": 0.0, "grad_condition": 27647955063.73048, "lr": 0.0007033683215378998, "time_sec": 132.4630925655365 }, { "epoch": 56, "train_loss": 4.8840925729370115, "train_acc": 0.00916, "test_loss": 4.817810218048096, "test_acc": 0.01, "lyapunov": 1.5679599275369474, "grad_norm": 0.10763202558448146, "grad_max_sv": 0.024515782250091434, "grad_min_sv": 0.0, "grad_condition": 24515782250.09143, "lr": 0.0006937577932260512, "time_sec": 132.42955470085144 }, { "epoch": 57, "train_loss": 4.883760057678223, "train_acc": 0.0095, "test_loss": 4.856276947784424, "test_acc": 0.01, "lyapunov": 1.5672943607315688, "grad_norm": 0.11038524447317109, "grad_max_sv": 0.031160860368981958, "grad_min_sv": 0.0, "grad_condition": 31160860368.981956, "lr": 0.0006840622763423388, "time_sec": 132.52315950393677 }, { "epoch": 58, "train_loss": 4.884222667388916, "train_acc": 0.00974, "test_loss": 4.874290851593018, "test_acc": 0.01, "lyapunov": 1.567508033779271, "grad_norm": 0.11849561013061653, "grad_max_sv": 0.03593655498698354, "grad_min_sv": 0.0, "grad_condition": 35936554986.983536, "lr": 0.0006742860236609073, "time_sec": 132.47893905639648 }, { "epoch": 59, "train_loss": 4.88414927734375, "train_acc": 0.00932, "test_loss": 4.812584387207031, "test_acc": 0.01, "lyapunov": 1.5678569962606406, "grad_norm": 0.11036912590820531, "grad_max_sv": 0.028424020344391464, "grad_min_sv": 0.0, "grad_condition": 28424020344.391468, "lr": 0.0006644333233692913, "time_sec": 132.4449987411499 }, { "epoch": 60, "train_loss": 4.8860119464111325, "train_acc": 0.00866, "test_loss": 4.839297940826416, "test_acc": 0.01, "lyapunov": 1.5727104262622726, "grad_norm": 0.12489417029089354, "grad_max_sv": 0.0449837657622993, "grad_min_sv": 0.0, "grad_condition": 44983765762.2993, "lr": 0.0006545084971874734, "time_sec": 132.52293181419373 }, { "epoch": 61, "train_loss": 4.884305205383301, "train_acc": 0.01046, "test_loss": 4.857601212310791, "test_acc": 0.01, "lyapunov": 1.5686972680908944, "grad_norm": 0.11135287490998455, "grad_max_sv": 0.04157614354044199, "grad_min_sv": 0.0, "grad_condition": 41576143540.44199, "lr": 0.0006445158984722354, "time_sec": 132.51698970794678 }, { "epoch": 62, "train_loss": 4.884398639678955, "train_acc": 0.00944, "test_loss": 4.833207711791992, "test_acc": 0.01, "lyapunov": 1.5687918172163122, "grad_norm": 0.11243013251101783, "grad_max_sv": 0.043204908631742, "grad_min_sv": 0.0, "grad_condition": 43204908631.742004, "lr": 0.0006344599103076324, "time_sec": 132.51721620559692 }, { "epoch": 63, "train_loss": 4.884688519744873, "train_acc": 0.00908, "test_loss": 4.811236346435547, "test_acc": 0.01, "lyapunov": 1.570080169326509, "grad_norm": 0.11662661682539925, "grad_max_sv": 0.02772782016545534, "grad_min_sv": 0.0, "grad_condition": 27727820165.455345, "lr": 0.0006243449435824269, "time_sec": 132.50267052650452 }, { "epoch": 64, "train_loss": 4.8855357188415525, "train_acc": 0.0096, "test_loss": 4.834980075073243, "test_acc": 0.01, "lyapunov": 1.5721226451951829, "grad_norm": 0.12180207356240787, "grad_max_sv": 0.013557582441717387, "grad_min_sv": 0.0, "grad_condition": 13557582441.717386, "lr": 0.0006141754350553275, "time_sec": 132.6969666481018 }, { "epoch": 65, "train_loss": 4.884502696838379, "train_acc": 0.00962, "test_loss": 4.815651828765869, "test_acc": 0.01, "lyapunov": 1.5692061444987422, "grad_norm": 0.13731619014897972, "grad_max_sv": 0.036923335213214156, "grad_min_sv": 0.0, "grad_condition": 36923335213.21416, "lr": 0.0006039558454088793, "time_sec": 132.4734799861908 }, { "epoch": 66, "train_loss": 4.88990579711914, "train_acc": 0.00978, "test_loss": 4.791162698364258, "test_acc": 0.01, "lyapunov": 1.581291075862582, "grad_norm": 0.14075282121769883, "grad_max_sv": 0.039619889203459026, "grad_min_sv": 0.0, "grad_condition": 39619889203.45903, "lr": 0.000593690657292862, "time_sec": 132.52782583236694 }, { "epoch": 67, "train_loss": 4.888191639251709, "train_acc": 0.00998, "test_loss": 4.805363137054443, "test_acc": 0.01, "lyapunov": 1.5781969777153582, "grad_norm": 0.11852732787787948, "grad_max_sv": 0.03636179021559656, "grad_min_sv": 0.0, "grad_condition": 36361790215.59656, "lr": 0.0005833843733580507, "time_sec": 132.50655126571655 }, { "epoch": 68, "train_loss": 4.885113808746338, "train_acc": 0.0092, "test_loss": 4.790876692962646, "test_acc": 0.01, "lyapunov": 1.5712030659551206, "grad_norm": 0.11464904106569235, "grad_max_sv": 0.02942234524525702, "grad_min_sv": 0.0, "grad_condition": 29422345245.25702, "lr": 0.0005730415142812054, "time_sec": 132.44155955314636 }, { "epoch": 69, "train_loss": 4.886073732910156, "train_acc": 0.00874, "test_loss": 4.788568280029297, "test_acc": 0.01, "lyapunov": 1.5744608549205847, "grad_norm": 0.11158557694696751, "grad_max_sv": 0.004607879696413875, "grad_min_sv": 0.0, "grad_condition": 4607879696.413875, "lr": 0.0005626666167821517, "time_sec": 132.44937348365784 }, { "epoch": 70, "train_loss": 4.885406183319092, "train_acc": 0.00988, "test_loss": 4.791419393157959, "test_acc": 0.01, "lyapunov": 1.5723789460823665, "grad_norm": 0.1093341588876136, "grad_max_sv": 0.013379927957430482, "grad_min_sv": 0.0, "grad_condition": 13379927957.430483, "lr": 0.0005522642316338265, "time_sec": 132.44818544387817 }, { "epoch": 71, "train_loss": 4.885112988128662, "train_acc": 0.00898, "test_loss": 4.807086729431153, "test_acc": 0.01, "lyapunov": 1.5718346922598836, "grad_norm": 0.12168415122862028, "grad_max_sv": 0.014193862210959196, "grad_min_sv": 0.0, "grad_condition": 14193862210.959198, "lr": 0.0005418389216661573, "time_sec": 132.46469593048096 }, { "epoch": 72, "train_loss": 4.888309308624268, "train_acc": 0.00942, "test_loss": 4.786458195495605, "test_acc": 0.01, "lyapunov": 1.5786126913012142, "grad_norm": 0.1257472430943546, "grad_max_sv": 0.00992818851955235, "grad_min_sv": 0.0, "grad_condition": 9928188519.55235, "lr": 0.0005313952597646563, "time_sec": 132.4868745803833 }, { "epoch": 73, "train_loss": 4.8883187344360355, "train_acc": 0.01008, "test_loss": 4.763764072418213, "test_acc": 0.01, "lyapunov": 1.5783945306792588, "grad_norm": 0.16063770590325258, "grad_max_sv": 0.02905639265663922, "grad_min_sv": 0.0, "grad_condition": 29056392656.63922, "lr": 0.0005209378268645994, "time_sec": 132.40988731384277 }, { "epoch": 74, "train_loss": 4.885095281524658, "train_acc": 0.00904, "test_loss": 4.771036297607422, "test_acc": 0.01, "lyapunov": 1.5722466762108571, "grad_norm": 0.332703681561214, "grad_max_sv": 0.009321404900401831, "grad_min_sv": 0.0, "grad_condition": 9321404900.40183, "lr": 0.0005104712099416781, "time_sec": 132.41944670677185 }, { "epoch": 75, "train_loss": 4.8858135334777835, "train_acc": 0.00924, "test_loss": 4.7793162803649905, "test_acc": 0.01, "lyapunov": 1.573599765367825, "grad_norm": 0.3785245081976868, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004999999999999996, "time_sec": 132.43439865112305 }, { "epoch": 76, "train_loss": 4.885755948486328, "train_acc": 0.00894, "test_loss": 4.775339208984375, "test_acc": 0.01, "lyapunov": 1.5738494380965562, "grad_norm": 0.26809830726413736, "grad_max_sv": 0.00972625520080328, "grad_min_sv": 0.0, "grad_condition": 9726255200.80328, "lr": 0.0004895287900583212, "time_sec": 132.4453580379486 }, { "epoch": 77, "train_loss": 4.886971358032227, "train_acc": 0.0088, "test_loss": 4.780246302032471, "test_acc": 0.01, "lyapunov": 1.576519505447134, "grad_norm": 0.5857000867492739, "grad_max_sv": 0.015286983083933591, "grad_min_sv": 0.0, "grad_condition": 15286983083.933594, "lr": 0.0004790621731353997, "time_sec": 132.4340922832489 }, { "epoch": 78, "train_loss": 4.8857606088256835, "train_acc": 0.00878, "test_loss": 4.796332804870605, "test_acc": 0.01, "lyapunov": 1.574093949764281, "grad_norm": 0.19474925059694603, "grad_max_sv": 0.007740102289244532, "grad_min_sv": 0.0, "grad_condition": 7740102289.244532, "lr": 0.000468604740235343, "time_sec": 132.4252007007599 }, { "epoch": 79, "train_loss": 4.8854332868957515, "train_acc": 0.00904, "test_loss": 4.7431994110107425, "test_acc": 0.01, "lyapunov": 1.5728687746140657, "grad_norm": 0.2002833929164076, "grad_max_sv": 0.018612090731039643, "grad_min_sv": 0.0, "grad_condition": 18612090731.039646, "lr": 0.00045816107833384175, "time_sec": 132.41635990142822 }, { "epoch": 80, "train_loss": 4.88607871963501, "train_acc": 0.00908, "test_loss": 4.782230687713623, "test_acc": 0.01, "lyapunov": 1.5748912559445862, "grad_norm": 0.2663292726664251, "grad_max_sv": 0.0006320734973996878, "grad_min_sv": 0.0, "grad_condition": 632073497.3996878, "lr": 0.0004477357683661729, "time_sec": 132.3943703174591 }, { "epoch": 81, "train_loss": 4.885633817596435, "train_acc": 0.00894, "test_loss": 4.773731129455566, "test_acc": 0.01, "lyapunov": 1.5739493342616675, "grad_norm": 0.19467627817910108, "grad_max_sv": 0.004234243137761951, "grad_min_sv": 0.0, "grad_condition": 4234243137.7619505, "lr": 0.00043733338321784746, "time_sec": 132.42148518562317 }, { "epoch": 82, "train_loss": 4.890183934631348, "train_acc": 0.00922, "test_loss": 4.80019803237915, "test_acc": 0.01, "lyapunov": 1.58174940356818, "grad_norm": 0.2693904362677404, "grad_max_sv": 0.023508542357012628, "grad_min_sv": 0.0, "grad_condition": 23508542357.01263, "lr": 0.0004269584857187939, "time_sec": 132.48368287086487 }, { "epoch": 83, "train_loss": 4.887686183624267, "train_acc": 0.00988, "test_loss": 4.6776658203125, "test_acc": 0.01, "lyapunov": 1.574008427922378, "grad_norm": 0.2293228968062561, "grad_max_sv": 0.06707085431553424, "grad_min_sv": 5.322572622808566e-16, "grad_condition": 67002509647.244484, "lr": 0.0004166156266419484, "time_sec": 132.49965047836304 }, { "epoch": 84, "train_loss": 4.887849067077637, "train_acc": 0.01004, "test_loss": 4.733781813049316, "test_acc": 0.01, "lyapunov": 1.573820165356102, "grad_norm": 0.14901481902367925, "grad_max_sv": 0.09299901695922017, "grad_min_sv": 1.6405075679230025e-16, "grad_condition": 92982403383.72546, "lr": 0.0004063093427071373, "time_sec": 132.49851322174072 }, { "epoch": 85, "train_loss": 4.891140226135254, "train_acc": 0.00994, "test_loss": 4.79980509262085, "test_acc": 0.01, "lyapunov": 1.5841534381632305, "grad_norm": 0.14782164130887582, "grad_max_sv": 0.07909845747053623, "grad_min_sv": 4.4865151314265836e-26, "grad_condition": 79098457470.53198, "lr": 0.0003960441545911199, "time_sec": 132.5316731929779 }, { "epoch": 86, "train_loss": 4.887021747589111, "train_acc": 0.00944, "test_loss": 4.776346062469482, "test_acc": 0.01, "lyapunov": 1.5762594874252749, "grad_norm": 0.12848068900948553, "grad_max_sv": 0.05206927340477705, "grad_min_sv": 0.0, "grad_condition": 52069273404.777054, "lr": 0.0003858245649446718, "time_sec": 132.53142595291138 }, { "epoch": 87, "train_loss": 4.889097787322998, "train_acc": 0.00868, "test_loss": 4.707060712432861, "test_acc": 0.01, "lyapunov": 1.5793669498180185, "grad_norm": 0.1548551396628501, "grad_max_sv": 0.07543672090396285, "grad_min_sv": 1.994722925254039e-23, "grad_condition": 75436720902.41975, "lr": 0.00037565505641757235, "time_sec": 132.56474471092224 }, { "epoch": 88, "train_loss": 4.887517103881836, "train_acc": 0.00934, "test_loss": 4.697494779968261, "test_acc": 0.01, "lyapunov": 1.5769202114675966, "grad_norm": 0.12499428379004662, "grad_max_sv": 0.06417224258184433, "grad_min_sv": 3.819406582541987e-27, "grad_condition": 64172242581.844055, "lr": 0.00036554008969236695, "time_sec": 132.5758376121521 }, { "epoch": 89, "train_loss": 4.889558787384034, "train_acc": 0.00908, "test_loss": 4.738901914978027, "test_acc": 0.01, "lyapunov": 1.5814725813048576, "grad_norm": 0.1259682508249713, "grad_max_sv": 0.05729179736226797, "grad_min_sv": 0.0, "grad_condition": 57291797362.26797, "lr": 0.0003554841015277638, "time_sec": 132.55631971359253 }, { "epoch": 90, "train_loss": 4.887118022155762, "train_acc": 0.00926, "test_loss": 4.745434680175781, "test_acc": 0.01, "lyapunov": 1.57591240881654, "grad_norm": 0.12675049544335418, "grad_max_sv": 0.0551216053776443, "grad_min_sv": 0.0, "grad_condition": 55121605377.64431, "lr": 0.000345491502812526, "time_sec": 132.52520608901978 }, { "epoch": 91, "train_loss": 4.886403057098389, "train_acc": 0.01032, "test_loss": 4.728809788513184, "test_acc": 0.01, "lyapunov": 1.575149437045807, "grad_norm": 0.12166328349782148, "grad_max_sv": 0.04358728057704866, "grad_min_sv": 0.0, "grad_condition": 43587280577.04866, "lr": 0.0003355666766307081, "time_sec": 132.5356101989746 }, { "epoch": 92, "train_loss": 4.886422184295654, "train_acc": 0.00926, "test_loss": 4.738454541015625, "test_acc": 0.01, "lyapunov": 1.5745899811425172, "grad_norm": 0.11920532388570855, "grad_max_sv": 0.05519997598603368, "grad_min_sv": 0.0, "grad_condition": 55199975986.033676, "lr": 0.00032571397633909225, "time_sec": 132.55407977104187 }, { "epoch": 93, "train_loss": 4.886163410339355, "train_acc": 0.00948, "test_loss": 4.729941507720947, "test_acc": 0.01, "lyapunov": 1.5739426192115336, "grad_norm": 0.13075040975965602, "grad_max_sv": 0.051908688899129626, "grad_min_sv": 0.0, "grad_condition": 51908688899.12963, "lr": 0.00031593772365766094, "time_sec": 132.55454182624817 }, { "epoch": 94, "train_loss": 4.889471523284912, "train_acc": 0.00938, "test_loss": 4.726048579406738, "test_acc": 0.01, "lyapunov": 1.5820539750711387, "grad_norm": 0.13111792932705457, "grad_max_sv": 0.04076082408428192, "grad_min_sv": 0.0, "grad_condition": 40760824084.28192, "lr": 0.0003062422067739483, "time_sec": 132.50855350494385 }, { "epoch": 95, "train_loss": 4.886597353057861, "train_acc": 0.00966, "test_loss": 4.721816172790527, "test_acc": 0.01, "lyapunov": 1.5761216878890991, "grad_norm": 0.10242530878744271, "grad_max_sv": 0.018115377286449075, "grad_min_sv": 0.0, "grad_condition": 18115377286.449074, "lr": 0.00029663167846209965, "time_sec": 132.52085852622986 }, { "epoch": 96, "train_loss": 4.8871041314697266, "train_acc": 0.00878, "test_loss": 4.708365040588379, "test_acc": 0.01, "lyapunov": 1.5773879777440025, "grad_norm": 0.11832202769749675, "grad_max_sv": 0.01925608702003956, "grad_min_sv": 0.0, "grad_condition": 19256087020.03956, "lr": 0.00028711035421746345, "time_sec": 132.48231029510498 }, { "epoch": 97, "train_loss": 4.885575797424316, "train_acc": 0.00956, "test_loss": 4.758969999694824, "test_acc": 0.01, "lyapunov": 1.5739980253112285, "grad_norm": 0.102958848729015, "grad_max_sv": 0.00836998880840838, "grad_min_sv": 0.0, "grad_condition": 8369988808.4083805, "lr": 0.00027768241040753615, "time_sec": 132.4623761177063 }, { "epoch": 98, "train_loss": 4.885688443298339, "train_acc": 0.00946, "test_loss": 4.7685779739379885, "test_acc": 0.01, "lyapunov": 1.5737464616975516, "grad_norm": 0.11414360687104802, "grad_max_sv": 0.033959317160770296, "grad_min_sv": 0.0, "grad_condition": 33959317160.770294, "lr": 0.00026835198244006903, "time_sec": 132.65263080596924 }, { "epoch": 99, "train_loss": 4.888634443054199, "train_acc": 0.00974, "test_loss": 4.754720726013184, "test_acc": 0.01, "lyapunov": 1.5796314081572511, "grad_norm": 0.11056614929218114, "grad_max_sv": 0.034730975748971105, "grad_min_sv": 0.0, "grad_condition": 34730975748.9711, "lr": 0.0002591231629491421, "time_sec": 132.53659439086914 }, { "epoch": 100, "train_loss": 4.888005011444092, "train_acc": 0.00978, "test_loss": 4.7091091361999515, "test_acc": 0.01, "lyapunov": 1.5793088131853381, "grad_norm": 0.11538715899109499, "grad_max_sv": 0.027404929930344223, "grad_min_sv": 0.0, "grad_condition": 27404929930.344227, "lr": 0.0002499999999999997, "time_sec": 132.47063946723938 }, { "epoch": 101, "train_loss": 4.890101184844971, "train_acc": 0.00978, "test_loss": 4.713412440490723, "test_acc": 0.01, "lyapunov": 1.583473697037953, "grad_norm": 0.14124961194918514, "grad_max_sv": 0.030058392463251947, "grad_min_sv": 0.0, "grad_condition": 30058392463.251945, "lr": 0.00024098649531343477, "time_sec": 132.50555539131165 }, { "epoch": 102, "train_loss": 4.887625363464355, "train_acc": 0.01148, "test_loss": 4.7020545562744145, "test_acc": 0.01, "lyapunov": 1.579564877178358, "grad_norm": 0.1297826697220666, "grad_max_sv": 0.019950845977291465, "grad_min_sv": 0.0, "grad_condition": 19950845977.291466, "lr": 0.0002320866025105016, "time_sec": 132.43331456184387 }, { "epoch": 103, "train_loss": 4.889458109130859, "train_acc": 0.00924, "test_loss": 4.700020100402832, "test_acc": 0.01, "lyapunov": 1.5832947227351195, "grad_norm": 0.16304165123375366, "grad_max_sv": 0.00834191357716918, "grad_min_sv": 0.0, "grad_condition": 8341913577.16918, "lr": 0.0002233042253783278, "time_sec": 132.42489337921143 }, { "epoch": 104, "train_loss": 4.888043740234375, "train_acc": 0.00976, "test_loss": 4.690122833251953, "test_acc": 0.01, "lyapunov": 1.580241550874832, "grad_norm": 0.16164115490422049, "grad_max_sv": 0.00892186602577567, "grad_min_sv": 0.0, "grad_condition": 8921866025.775671, "lr": 0.000214643216157784, "time_sec": 132.40913486480713 }, { "epoch": 105, "train_loss": 4.885801515350342, "train_acc": 0.00962, "test_loss": 4.70759442062378, "test_acc": 0.01, "lyapunov": 1.5747494935379613, "grad_norm": 0.10757507074973427, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00020610737385376332, "time_sec": 132.41837000846863 }, { "epoch": 106, "train_loss": 4.886232281951904, "train_acc": 0.00966, "test_loss": 4.676759211730957, "test_acc": 0.01, "lyapunov": 1.5755804490555279, "grad_norm": 0.11054714782321104, "grad_max_sv": 0.016818781569600105, "grad_min_sv": 0.0, "grad_condition": 16818781569.600103, "lr": 0.00019770044256881242, "time_sec": 132.38776516914368 }, { "epoch": 107, "train_loss": 4.889010899200439, "train_acc": 0.00964, "test_loss": 4.686521159362793, "test_acc": 0.01, "lyapunov": 1.5793325800420073, "grad_norm": 0.5205851606002122, "grad_max_sv": 0.027481868257746102, "grad_min_sv": 0.0, "grad_condition": 27481868257.7461, "lr": 0.0001894261098608447, "time_sec": 132.4469666481018 }, { "epoch": 108, "train_loss": 4.885496775512696, "train_acc": 0.00916, "test_loss": 4.701310534667969, "test_acc": 0.01, "lyapunov": 1.5739044819951362, "grad_norm": 0.9976131592675321, "grad_max_sv": 0.010380421532317996, "grad_min_sv": 0.0, "grad_condition": 10380421532.317997, "lr": 0.000181288005125655, "time_sec": 132.34952044487 }, { "epoch": 109, "train_loss": 4.88569960144043, "train_acc": 0.00982, "test_loss": 4.704411970520019, "test_acc": 0.01, "lyapunov": 1.574234271598289, "grad_norm": 0.9761047066143378, "grad_max_sv": 0.026565171172842385, "grad_min_sv": 0.0, "grad_condition": 26565171172.842384, "lr": 0.0001732896980049473, "time_sec": 132.45858502388 }, { "epoch": 110, "train_loss": 4.885857049255371, "train_acc": 0.00906, "test_loss": 4.700390522766114, "test_acc": 0.01, "lyapunov": 1.5747647572051533, "grad_norm": 1.1449227675806375, "grad_max_sv": 0.025618467247113585, "grad_min_sv": 0.0, "grad_condition": 25618467247.113586, "lr": 0.00016543469682057076, "time_sec": 132.4441635608673 }, { "epoch": 111, "train_loss": 4.886974509887695, "train_acc": 0.00982, "test_loss": 4.78629910736084, "test_acc": 0.01, "lyapunov": 1.5769317887933052, "grad_norm": 0.9679265494141023, "grad_max_sv": 0.03804315887391567, "grad_min_sv": 0.0, "grad_condition": 38043158873.91567, "lr": 0.00015772644703565552, "time_sec": 132.5875232219696 }, { "epoch": 112, "train_loss": 4.886453926544189, "train_acc": 0.00974, "test_loss": 4.8048784591674805, "test_acc": 0.01, "lyapunov": 1.5754460748809074, "grad_norm": 0.8807920950548352, "grad_max_sv": 0.03984132050536573, "grad_min_sv": 0.0, "grad_condition": 39841320505.36573, "lr": 0.00015016832974331713, "time_sec": 132.5120551586151 }, { "epoch": 113, "train_loss": 4.885906947784424, "train_acc": 0.00966, "test_loss": 4.798358418273926, "test_acc": 0.01, "lyapunov": 1.5747274245752398, "grad_norm": 0.8637882261226464, "grad_max_sv": 0.033320454647764564, "grad_min_sv": 0.0, "grad_condition": 33320454647.764565, "lr": 0.00014276366018359834, "time_sec": 132.50000762939453 }, { "epoch": 114, "train_loss": 4.885719304962159, "train_acc": 0.00982, "test_loss": 4.793103702545166, "test_acc": 0.01, "lyapunov": 1.5744778527628125, "grad_norm": 0.782099951820462, "grad_max_sv": 0.03417456489987671, "grad_min_sv": 0.0, "grad_condition": 34174564899.87671, "lr": 0.00013551568628929425, "time_sec": 132.49124789237976 }, { "epoch": 115, "train_loss": 4.8859512828063965, "train_acc": 0.00934, "test_loss": 4.802629745483398, "test_acc": 0.01, "lyapunov": 1.575113305960165, "grad_norm": 0.7049115792540724, "grad_max_sv": 0.018358896067366005, "grad_min_sv": 0.0, "grad_condition": 18358896067.366005, "lr": 0.00012842758726130276, "time_sec": 132.44965839385986 }, { "epoch": 116, "train_loss": 4.886716898498535, "train_acc": 0.01, "test_loss": 4.802504382324218, "test_acc": 0.01, "lyapunov": 1.5769645506158814, "grad_norm": 0.7070432983143201, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001215024721741218, "time_sec": 132.43424487113953 }, { "epoch": 117, "train_loss": 4.8879242680358885, "train_acc": 0.00916, "test_loss": 4.805041016387939, "test_acc": 0.01, "lyapunov": 1.5800700291343357, "grad_norm": 0.7061830114700672, "grad_max_sv": 0.02115973932668567, "grad_min_sv": 0.0, "grad_condition": 21159739326.68567, "lr": 0.00011474337861210538, "time_sec": 132.52493023872375 }, { "epoch": 118, "train_loss": 4.885882244415283, "train_acc": 0.01036, "test_loss": 4.74331266784668, "test_acc": 0.01, "lyapunov": 1.5747067300255035, "grad_norm": 0.7245826894780792, "grad_max_sv": 0.03378571714274585, "grad_min_sv": 0.0, "grad_condition": 33785717142.745857, "lr": 0.00010815327133708009, "time_sec": 132.48710799217224 }, { "epoch": 119, "train_loss": 4.886389665374756, "train_acc": 0.00962, "test_loss": 4.740865539550781, "test_acc": 0.01, "lyapunov": 1.5762843387511076, "grad_norm": 0.7753676227893881, "grad_max_sv": 0.03039190392009914, "grad_min_sv": 0.0, "grad_condition": 30391903920.09914, "lr": 0.00010173504098790182, "time_sec": 132.4465343952179 }, { "epoch": 120, "train_loss": 4.886249551086426, "train_acc": 0.00964, "test_loss": 4.7418055305480955, "test_acc": 0.01, "lyapunov": 1.5757878259624667, "grad_norm": 0.7403330417590244, "grad_max_sv": 0.03614077656529844, "grad_min_sv": 0.0, "grad_condition": 36140776565.29844, "lr": 9.549150281252629e-05, "time_sec": 132.79633259773254 }, { "epoch": 121, "train_loss": 4.886320632019043, "train_acc": 0.0099, "test_loss": 4.7293956802368164, "test_acc": 0.01, "lyapunov": 1.5760322620191842, "grad_norm": 0.7505635192152501, "grad_max_sv": 0.026077959313988687, "grad_min_sv": 0.0, "grad_condition": 26077959313.988686, "lr": 8.942539543314794e-05, "time_sec": 133.23189043998718 }, { "epoch": 122, "train_loss": 4.887943274230957, "train_acc": 0.00948, "test_loss": 4.919895000457764, "test_acc": 0.01, "lyapunov": 1.5784789354295072, "grad_norm": 0.6996628561837273, "grad_max_sv": 0.0160073421895504, "grad_min_sv": 0.0, "grad_condition": 16007342189.550396, "lr": 8.353937964495024e-05, "time_sec": 132.61993741989136 }, { "epoch": 123, "train_loss": 4.886383193359375, "train_acc": 0.01012, "test_loss": 4.8154360328674315, "test_acc": 0.01, "lyapunov": 1.5765104918833583, "grad_norm": 0.8202114075319168, "grad_max_sv": 0.0287565924692899, "grad_min_sv": 0.0, "grad_condition": 28756592469.289906, "lr": 7.783603724899243e-05, "time_sec": 132.69449758529663 }, { "epoch": 124, "train_loss": 4.885598735046386, "train_acc": 0.01062, "test_loss": 4.811818315124512, "test_acc": 0.01, "lyapunov": 1.5741741837138106, "grad_norm": 0.7110817230064039, "grad_max_sv": 0.04011002266779542, "grad_min_sv": 0.0, "grad_condition": 40110022667.795425, "lr": 7.231786991974666e-05, "time_sec": 132.79418468475342 }, { "epoch": 125, "train_loss": 4.887531413879395, "train_acc": 0.00998, "test_loss": 4.798822694396972, "test_acc": 0.01, "lyapunov": 1.5775156819911869, "grad_norm": 0.6755952206914222, "grad_max_sv": 0.03821564754471183, "grad_min_sv": 0.0, "grad_condition": 38215647544.71183, "lr": 6.698729810778072e-05, "time_sec": 132.56555151939392 }, { "epoch": 126, "train_loss": 4.885848933258057, "train_acc": 0.0096, "test_loss": 4.79271836013794, "test_acc": 0.01, "lyapunov": 1.5746296488720437, "grad_norm": 0.783689796852182, "grad_max_sv": 0.0219818449113518, "grad_min_sv": 0.0, "grad_condition": 21981844911.3518, "lr": 6.184665997806817e-05, "time_sec": 132.44697856903076 }, { "epoch": 127, "train_loss": 4.885011657409668, "train_acc": 0.0099, "test_loss": 4.796478929901123, "test_acc": 0.01, "lyapunov": 1.5726598202420012, "grad_norm": 0.746827927020454, "grad_max_sv": 0.006885465793311596, "grad_min_sv": 0.0, "grad_condition": 6885465793.311597, "lr": 5.6898210384392595e-05, "time_sec": 132.4967279434204 }, { "epoch": 128, "train_loss": 4.885314655151367, "train_acc": 0.00972, "test_loss": 4.764711624908447, "test_acc": 0.01, "lyapunov": 1.5735664736584325, "grad_norm": 0.7327332821536672, "grad_max_sv": 0.000560962175950408, "grad_min_sv": 0.0, "grad_condition": 560962175.950408, "lr": 5.214411988029363e-05, "time_sec": 132.5673258304596 }, { "epoch": 129, "train_loss": 4.886808303070068, "train_acc": 0.00958, "test_loss": 4.767883946990967, "test_acc": 0.01, "lyapunov": 1.5768778150343834, "grad_norm": 0.7089376244924456, "grad_max_sv": 0.0005988820921629667, "grad_min_sv": 0.0, "grad_condition": 598882092.1629667, "lr": 4.7586473766990294e-05, "time_sec": 132.46098804473877 }, { "epoch": 130, "train_loss": 4.886055064697266, "train_acc": 0.00958, "test_loss": 4.76520872039795, "test_acc": 0.01, "lyapunov": 1.575562137167167, "grad_norm": 0.8017477597198375, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.32272711786996e-05, "time_sec": 132.55271816253662 }, { "epoch": 131, "train_loss": 4.8861244363403324, "train_acc": 0.0098, "test_loss": 4.774403156280518, "test_acc": 0.01, "lyapunov": 1.5755851704751134, "grad_norm": 0.8346593666537984, "grad_max_sv": 0.0012377811130136252, "grad_min_sv": 0.0, "grad_condition": 1237781113.0136251, "lr": 3.906842420574966e-05, "time_sec": 132.4554464817047 }, { "epoch": 132, "train_loss": 4.8852793449401855, "train_acc": 0.00998, "test_loss": 4.771010957336426, "test_acc": 0.01, "lyapunov": 1.573425286566205, "grad_norm": 0.7375330331800295, "grad_max_sv": 0.006311370152980089, "grad_min_sv": 0.0, "grad_condition": 6311370152.980089, "lr": 3.5111757055874305e-05, "time_sec": 132.4216513633728 }, { "epoch": 133, "train_loss": 4.884971447448731, "train_acc": 0.00938, "test_loss": 4.771634101104737, "test_acc": 0.01, "lyapunov": 1.572620025985991, "grad_norm": 0.6774345796584929, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.1359005254054254e-05, "time_sec": 132.4028835296631 }, { "epoch": 134, "train_loss": 4.885691842803955, "train_acc": 0.01002, "test_loss": 4.844159544372559, "test_acc": 0.01, "lyapunov": 1.57454265353015, "grad_norm": 0.7944955115704805, "grad_max_sv": 0.02395228371024132, "grad_min_sv": 0.0, "grad_condition": 23952283710.241318, "lr": 2.7811814881259484e-05, "time_sec": 132.41754722595215 }, { "epoch": 135, "train_loss": 4.8864432501220705, "train_acc": 0.0101, "test_loss": 4.844892832946777, "test_acc": 0.01, "lyapunov": 1.575845740945138, "grad_norm": 0.7437160641154223, "grad_max_sv": 0.020727850822731854, "grad_min_sv": 0.0, "grad_condition": 20727850822.731853, "lr": 2.4471741852423218e-05, "time_sec": 132.44422578811646 }, { "epoch": 136, "train_loss": 4.8851325263977055, "train_acc": 0.0098, "test_loss": 4.8378851570129395, "test_acc": 0.01, "lyapunov": 1.5731066611721694, "grad_norm": 0.6658420197701125, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.1340251233966362e-05, "time_sec": 132.38768362998962 }, { "epoch": 137, "train_loss": 4.885479872436523, "train_acc": 0.01006, "test_loss": 4.843586358642578, "test_acc": 0.01, "lyapunov": 1.5740535426932527, "grad_norm": 0.7299510564419838, "grad_max_sv": 0.003957807831466198, "grad_min_sv": 0.0, "grad_condition": 3957807831.466198, "lr": 1.8418716601170932e-05, "time_sec": 132.38154101371765 }, { "epoch": 138, "train_loss": 4.884863400421143, "train_acc": 0.01014, "test_loss": 4.843053856658935, "test_acc": 0.01, "lyapunov": 1.5721587311581273, "grad_norm": 0.6927716154040414, "grad_max_sv": 0.017578842211514713, "grad_min_sv": 0.0, "grad_condition": 17578842211.51471, "lr": 1.570841943568445e-05, "time_sec": 132.4182834625244 }, { "epoch": 139, "train_loss": 4.884934008331299, "train_acc": 0.01022, "test_loss": 4.844250295257568, "test_acc": 0.01, "lyapunov": 1.5725375057181434, "grad_norm": 0.6981880900264675, "grad_max_sv": 0.0031383157707750796, "grad_min_sv": 0.0, "grad_condition": 3138315770.7750797, "lr": 1.3210548563419845e-05, "time_sec": 132.41427326202393 }, { "epoch": 140, "train_loss": 4.885497499389649, "train_acc": 0.00972, "test_loss": 4.844135813903809, "test_acc": 0.01, "lyapunov": 1.574064860868332, "grad_norm": 0.774635016593933, "grad_max_sv": 0.005403042444959283, "grad_min_sv": 0.0, "grad_condition": 5403042444.959283, "lr": 1.0926199633097203e-05, "time_sec": 132.38426899909973 }, { "epoch": 141, "train_loss": 4.885045772247315, "train_acc": 0.01014, "test_loss": 4.8358864456176756, "test_acc": 0.01, "lyapunov": 1.5727792880724154, "grad_norm": 0.7412742981630644, "grad_max_sv": 0.011697014886885881, "grad_min_sv": 0.0, "grad_condition": 11697014886.885881, "lr": 8.856374635655688e-06, "time_sec": 132.46910786628723 }, { "epoch": 142, "train_loss": 4.884702201538086, "train_acc": 0.01002, "test_loss": 4.838421836090088, "test_acc": 0.01, "lyapunov": 1.5717649999481942, "grad_norm": 0.7113065718119301, "grad_max_sv": 0.00798416011966765, "grad_min_sv": 0.0, "grad_condition": 7984160119.66765, "lr": 7.001981464747503e-06, "time_sec": 132.44912910461426 }, { "epoch": 143, "train_loss": 4.885199571380615, "train_acc": 0.00982, "test_loss": 4.841495401763916, "test_acc": 0.01, "lyapunov": 1.5731582995265951, "grad_norm": 0.705829448061863, "grad_max_sv": 0.021906211972236633, "grad_min_sv": 0.0, "grad_condition": 21906211972.236633, "lr": 5.3638335185058295e-06, "time_sec": 132.39459085464478 }, { "epoch": 144, "train_loss": 4.884931218566894, "train_acc": 0.01002, "test_loss": 4.842521714782714, "test_acc": 0.01, "lyapunov": 1.5725436259413619, "grad_norm": 0.7770696416339791, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761114e-06, "time_sec": 132.33704686164856 }, { "epoch": 145, "train_loss": 4.885003453521729, "train_acc": 0.01038, "test_loss": 4.84215620880127, "test_acc": 0.01, "lyapunov": 1.5727140568101499, "grad_norm": 0.7469803441120764, "grad_max_sv": 0.007154888892546296, "grad_min_sv": 0.0, "grad_condition": 7154888892.546295, "lr": 2.7390523158633524e-06, "time_sec": 132.3757495880127 }, { "epoch": 146, "train_loss": 4.885197346801758, "train_acc": 0.00996, "test_loss": 4.842266304016113, "test_acc": 0.01, "lyapunov": 1.5733027034403417, "grad_norm": 0.7332908840273178, "grad_max_sv": 0.0006548997946083546, "grad_min_sv": 0.0, "grad_condition": 654899794.6083546, "lr": 1.7535703752478133e-06, "time_sec": 132.45014452934265 }, { "epoch": 147, "train_loss": 4.885225572662353, "train_acc": 0.01, "test_loss": 4.841919314575195, "test_acc": 0.01, "lyapunov": 1.5734141430891384, "grad_norm": 0.7407542017866708, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642196e-07, "time_sec": 132.37303113937378 }, { "epoch": 148, "train_loss": 4.885419764556885, "train_acc": 0.01, "test_loss": 4.841919337463379, "test_acc": 0.01, "lyapunov": 1.5739776710110247, "grad_norm": 0.7868248231615788, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.38584950570808e-07, "time_sec": 132.36948442459106 }, { "epoch": 149, "train_loss": 4.884984393463135, "train_acc": 0.01, "test_loss": 4.841919581604004, "test_acc": 0.01, "lyapunov": 1.5726999001734703, "grad_norm": 0.7663497621598592, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.096582625772501e-07, "time_sec": 132.3525311946869 }, { "epoch": 150, "train_loss": 4.8838786590576175, "train_acc": 0.01, "test_loss": 4.841919624328614, "test_acc": 0.01, "lyapunov": 1.5694036883161502, "grad_norm": 0.6984069616734725, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 132.51661276817322 } ], "16": [ { "epoch": 1, "train_loss": 4.785678502502441, "train_acc": 0.01854, "test_loss": 4.888219262695313, "test_acc": 0.0096, "lyapunov": 2.2034229628570245, "grad_norm": 4.9662527525898525, "grad_max_sv": 4.1295246422290806, "grad_min_sv": 8.43239183145883e-08, "grad_condition": 57848709.59664528, "lr": 0.0009998903417374227, "time_sec": 178.03496599197388 }, { "epoch": 2, "train_loss": 4.6398111044311525, "train_acc": 0.0207, "test_loss": 4.653040969085693, "test_acc": 0.01, "lyapunov": 1.9294306939215307, "grad_norm": 3.0185365178654044, "grad_max_sv": 2.4029204517602922, "grad_min_sv": 5.100535853952426e-08, "grad_condition": 482708945.8134031, "lr": 0.0009995614150494292, "time_sec": 178.04272985458374 }, { "epoch": 3, "train_loss": 4.587504278259277, "train_acc": 0.01798, "test_loss": 4.565644731140137, "test_acc": 0.0158, "lyapunov": 1.7756437584567253, "grad_norm": 1.468640621914821, "grad_max_sv": 0.8633963579282863, "grad_min_sv": 1.4697805644365008e-08, "grad_condition": 29354955308.653522, "lr": 0.0009990133642141358, "time_sec": 177.90911650657654 }, { "epoch": 4, "train_loss": 4.609674820861817, "train_acc": 0.01586, "test_loss": 5.16701375579834, "test_acc": 0.0101, "lyapunov": 1.7137653553272452, "grad_norm": 0.7203838648352618, "grad_max_sv": 0.5238488506525755, "grad_min_sv": 2.2053512622504097e-09, "grad_condition": 75198729364.04495, "lr": 0.0009982464296247522, "time_sec": 177.86139965057373 }, { "epoch": 5, "train_loss": 4.638868305969238, "train_acc": 0.01426, "test_loss": 5.560866254425049, "test_acc": 0.01, "lyapunov": 1.6978333834796915, "grad_norm": 0.5502157339199643, "grad_max_sv": 0.44361272603273394, "grad_min_sv": 2.7029428141806377e-12, "grad_condition": 181889969040.05048, "lr": 0.0009972609476841367, "time_sec": 177.9277467727661 }, { "epoch": 6, "train_loss": 4.669847656402588, "train_acc": 0.01332, "test_loss": 4.8178652496337895, "test_acc": 0.01, "lyapunov": 1.7381863307465069, "grad_norm": 0.5563091323848212, "grad_max_sv": 0.37752934321761134, "grad_min_sv": 1.4602178925586487e-12, "grad_condition": 201992262866.57877, "lr": 0.000996057350657239, "time_sec": 177.8438265323639 }, { "epoch": 7, "train_loss": 4.702823111572266, "train_acc": 0.01186, "test_loss": 4.627877201843262, "test_acc": 0.01, "lyapunov": 1.7552724058365883, "grad_norm": 0.4233607461027203, "grad_max_sv": 0.35499467700719833, "grad_min_sv": 3.8501282054302263e-13, "grad_condition": 282171382589.46027, "lr": 0.000994636166481494, "time_sec": 177.7493600845337 }, { "epoch": 8, "train_loss": 4.722017111511231, "train_acc": 0.01098, "test_loss": 6.090566035461426, "test_acc": 0.01, "lyapunov": 1.7357035292993725, "grad_norm": 0.3850039806872663, "grad_max_sv": 0.3226898044347763, "grad_min_sv": 7.113592445244562e-14, "grad_condition": 304348428639.08154, "lr": 0.0009929980185352525, "time_sec": 177.78767728805542 }, { "epoch": 9, "train_loss": 4.741448409118652, "train_acc": 0.01154, "test_loss": 5.83977333984375, "test_acc": 0.01, "lyapunov": 1.7204718992228398, "grad_norm": 0.4078264807422899, "grad_max_sv": 0.31335003934800626, "grad_min_sv": 1.9402458265888006e-13, "grad_condition": 298038507715.96027, "lr": 0.0009911436253643444, "time_sec": 177.80518293380737 }, { "epoch": 10, "train_loss": 4.747990810241699, "train_acc": 0.01106, "test_loss": 6.513046632385254, "test_acc": 0.01, "lyapunov": 1.6953654838035175, "grad_norm": 0.4292578477364445, "grad_max_sv": 0.3652988448739052, "grad_min_sv": 1.2809375813436604e-13, "grad_condition": 342642686942.9036, "lr": 0.0009890738003669028, "time_sec": 177.78542613983154 }, { "epoch": 11, "train_loss": 4.765809431610108, "train_acc": 0.01214, "test_loss": 7.22933176574707, "test_acc": 0.01, "lyapunov": 1.7186210655495333, "grad_norm": 0.4487253545215033, "grad_max_sv": 0.3868314690887928, "grad_min_sv": 3.013939023123918e-13, "grad_condition": 329330315777.6491, "lr": 0.00098678945143658, "time_sec": 177.81605434417725 }, { "epoch": 12, "train_loss": 4.784488880615235, "train_acc": 0.00986, "test_loss": 4.611177786254883, "test_acc": 0.01, "lyapunov": 1.652159307009119, "grad_norm": 0.4707826268774683, "grad_max_sv": 0.3026094869710505, "grad_min_sv": 3.8656478774921674e-15, "grad_condition": 301420540269.25793, "lr": 0.0009842915805643154, "time_sec": 177.8059630393982 }, { "epoch": 13, "train_loss": 4.809918058624268, "train_acc": 0.00966, "test_loss": 5.106430908203125, "test_acc": 0.01, "lyapunov": 1.6707328871997726, "grad_norm": 0.667273831565697, "grad_max_sv": 0.24273031912744045, "grad_min_sv": 1.0572839902934006e-10, "grad_condition": 229305129700.13013, "lr": 0.000981581283398829, "time_sec": 177.8098611831665 }, { "epoch": 14, "train_loss": 4.825652238159179, "train_acc": 0.01056, "test_loss": 10.256812258911133, "test_acc": 0.01, "lyapunov": 1.6938227213861998, "grad_norm": 1.331380545313032, "grad_max_sv": 0.26493136398494244, "grad_min_sv": 2.65579091596793e-10, "grad_condition": 237101921206.0838, "lr": 0.0009786597487660333, "time_sec": 177.74433708190918 }, { "epoch": 15, "train_loss": 4.858567563171387, "train_acc": 0.01086, "test_loss": 4.6056615829467775, "test_acc": 0.01, "lyapunov": 1.7649985844521876, "grad_norm": 0.6838854666615405, "grad_max_sv": 0.34980414882302285, "grad_min_sv": 2.1796140399673834e-13, "grad_condition": 312022583270.1326, "lr": 0.0009755282581475766, "time_sec": 177.7609293460846 }, { "epoch": 16, "train_loss": 4.88505381439209, "train_acc": 0.01104, "test_loss": 4.605761392211914, "test_acc": 0.01, "lyapunov": 1.8020565973218445, "grad_norm": 0.5845356530706413, "grad_max_sv": 0.2943306349217892, "grad_min_sv": 4.369502606031448e-14, "grad_condition": 287139369751.0244, "lr": 0.0009721881851187403, "time_sec": 177.8197786808014 }, { "epoch": 17, "train_loss": 4.893186149749756, "train_acc": 0.01036, "test_loss": 4.605876076507569, "test_acc": 0.01, "lyapunov": 1.7787105851161205, "grad_norm": 0.4680659078828573, "grad_max_sv": 0.2733098614960909, "grad_min_sv": 4.296774163499721e-19, "grad_condition": 273309717860.49023, "lr": 0.0009686409947459456, "time_sec": 177.79044127464294 }, { "epoch": 18, "train_loss": 4.893065974731445, "train_acc": 0.0107, "test_loss": 4.6065135696411135, "test_acc": 0.01, "lyapunov": 1.718729690822494, "grad_norm": 0.5727929210621684, "grad_max_sv": 0.30122888199985026, "grad_min_sv": 4.424719830275789e-19, "grad_condition": 301228714224.6802, "lr": 0.0009648882429441254, "time_sec": 177.80086708068848 }, { "epoch": 19, "train_loss": 4.88860928604126, "train_acc": 0.01, "test_loss": 4.702660593414307, "test_acc": 0.01, "lyapunov": 1.6696165498260342, "grad_norm": 0.42342867331427436, "grad_max_sv": 0.34960081316530706, "grad_min_sv": 2.8274243075655694e-14, "grad_condition": 340909047209.5011, "lr": 0.00096093157579425, "time_sec": 177.7979953289032 }, { "epoch": 20, "train_loss": 4.903309204711914, "train_acc": 0.01068, "test_loss": 5.4670142036437985, "test_acc": 0.01, "lyapunov": 1.6678839117059927, "grad_norm": 0.5364190790754718, "grad_max_sv": 0.3460624013096094, "grad_min_sv": 1.5815154140131103e-14, "grad_condition": 341291954932.3224, "lr": 0.0009567727288213001, "time_sec": 177.79369568824768 }, { "epoch": 21, "train_loss": 4.915025991210937, "train_acc": 0.01106, "test_loss": 4.692510232543945, "test_acc": 0.01, "lyapunov": 1.6982163163402197, "grad_norm": 0.5511803995310802, "grad_max_sv": 0.34619002789258957, "grad_min_sv": 4.733950722420789e-14, "grad_condition": 333444655591.8086, "lr": 0.0009524135262330095, "time_sec": 177.79608535766602 }, { "epoch": 22, "train_loss": 4.909840554809571, "train_acc": 0.01084, "test_loss": 4.6062485778808595, "test_acc": 0.01, "lyapunov": 1.6909822228619509, "grad_norm": 0.4483805706207121, "grad_max_sv": 0.3018789976027193, "grad_min_sv": 3.421304159357815e-14, "grad_condition": 293400173556.4137, "lr": 0.0009478558801197061, "time_sec": 177.81299710273743 }, { "epoch": 23, "train_loss": 4.909692084808349, "train_acc": 0.01108, "test_loss": 4.6094023056030275, "test_acc": 0.01, "lyapunov": 1.6835671846214157, "grad_norm": 0.45426031851013016, "grad_max_sv": 0.3322039857506752, "grad_min_sv": 6.560297434150338e-15, "grad_condition": 330632003336.626, "lr": 0.000943101789615607, "time_sec": 177.8134524822235 }, { "epoch": 24, "train_loss": 4.901827787475586, "train_acc": 0.011, "test_loss": 4.606396533203125, "test_acc": 0.01, "lyapunov": 1.6725571582384426, "grad_norm": 0.5007132528772561, "grad_max_sv": 0.3051792338490486, "grad_min_sv": 2.976912647072195e-14, "grad_condition": 299276387943.3783, "lr": 0.0009381533400219313, "time_sec": 177.7837200164795 }, { "epoch": 25, "train_loss": 4.899776871948243, "train_acc": 0.0109, "test_loss": 4.606364790344238, "test_acc": 0.01, "lyapunov": 1.6670247737099142, "grad_norm": 0.4224268025378797, "grad_max_sv": 0.2703032233530493, "grad_min_sv": 5.37251515366592e-15, "grad_condition": 268629366269.90933, "lr": 0.0009330127018922189, "time_sec": 177.82209467887878 }, { "epoch": 26, "train_loss": 4.896821321258545, "train_acc": 0.0107, "test_loss": 4.722185048675537, "test_acc": 0.01, "lyapunov": 1.6472089549769526, "grad_norm": 0.48011762637076694, "grad_max_sv": 0.2670708648860455, "grad_min_sv": 3.756115387104417e-15, "grad_condition": 266170283847.3038, "lr": 0.000927682130080253, "time_sec": 177.78438448905945 }, { "epoch": 27, "train_loss": 4.906476246490478, "train_acc": 0.01086, "test_loss": 5.412735247802734, "test_acc": 0.01, "lyapunov": 1.6813617880691958, "grad_norm": 0.4406715400059857, "grad_max_sv": 0.25074354074895383, "grad_min_sv": 6.093407208933511e-20, "grad_condition": 250743525278.97955, "lr": 0.0009221639627510072, "time_sec": 177.7901487350464 }, { "epoch": 28, "train_loss": 4.893644842224121, "train_acc": 0.01172, "test_loss": 5.005291435241699, "test_acc": 0.01, "lyapunov": 1.6454817526175847, "grad_norm": 0.3605258439803559, "grad_max_sv": 0.2296090517193079, "grad_min_sv": 8.79898850927057e-21, "grad_condition": 229609049604.029, "lr": 0.0009164606203550494, "time_sec": 177.8756561279297 }, { "epoch": 29, "train_loss": 4.886972426452637, "train_acc": 0.01162, "test_loss": 5.60837995223999, "test_acc": 0.01, "lyapunov": 1.6373517272417502, "grad_norm": 0.35252531034326595, "grad_max_sv": 0.2174192801117897, "grad_min_sv": 1.7514629554834846e-20, "grad_condition": 217419276581.3401, "lr": 0.0009105746045668516, "time_sec": 177.83988404273987 }, { "epoch": 30, "train_loss": 4.887171002197266, "train_acc": 0.011, "test_loss": 5.029856091308594, "test_acc": 0.01, "lyapunov": 1.6322715209268244, "grad_norm": 0.3694860441565804, "grad_max_sv": 0.1933195549994707, "grad_min_sv": 2.0216060912179585e-20, "grad_condition": 193319550988.26825, "lr": 0.0009045084971874733, "time_sec": 177.91060781478882 }, { "epoch": 31, "train_loss": 4.882497029418945, "train_acc": 0.01094, "test_loss": 4.946529456329346, "test_acc": 0.01, "lyapunov": 1.6160695430872691, "grad_norm": 0.3009086445042491, "grad_max_sv": 0.17770135290920736, "grad_min_sv": 3.24419256482409e-21, "grad_condition": 177701352269.52295, "lr": 0.0008982649590120977, "time_sec": 179.66105842590332 }, { "epoch": 32, "train_loss": 4.880725912780762, "train_acc": 0.01128, "test_loss": 5.578618463897705, "test_acc": 0.01, "lyapunov": 1.62386571232925, "grad_norm": 0.36023587191613426, "grad_max_sv": 0.1822029523551464, "grad_min_sv": 3.6796007523380705e-21, "grad_condition": 182202951444.53656, "lr": 0.0008918467286629196, "time_sec": 179.0988199710846 }, { "epoch": 33, "train_loss": 4.908818702850342, "train_acc": 0.01182, "test_loss": 4.791287840270996, "test_acc": 0.01, "lyapunov": 1.674632024886968, "grad_norm": 2.355286231583665, "grad_max_sv": 0.1451555678440961, "grad_min_sv": 3.147262321441897e-13, "grad_condition": 145124831420.269, "lr": 0.0008852566213878943, "time_sec": 177.81290411949158 }, { "epoch": 34, "train_loss": 4.966870961761475, "train_acc": 0.00932, "test_loss": 4.691395782470703, "test_acc": 0.01, "lyapunov": 1.7797045579651738, "grad_norm": 0.4484129521918933, "grad_max_sv": 0.14517696127295493, "grad_min_sv": 1.115426717388758e-15, "grad_condition": 144975581810.04208, "lr": 0.000878497527825878, "time_sec": 177.8652102947235 }, { "epoch": 35, "train_loss": 4.915819309997558, "train_acc": 0.01472, "test_loss": 4.624800839996338, "test_acc": 0.01, "lyapunov": 1.721020828122678, "grad_norm": 1.0620945447138674, "grad_max_sv": 0.19911672528833152, "grad_min_sv": 1.9872991955575878e-10, "grad_condition": 95641187798.97682, "lr": 0.000871572412738697, "time_sec": 177.88512420654297 }, { "epoch": 36, "train_loss": 4.9530413731384275, "train_acc": 0.01452, "test_loss": 4.789580516052246, "test_acc": 0.0101, "lyapunov": 1.8076083949764672, "grad_norm": 0.5972631933008199, "grad_max_sv": 0.19924248810857534, "grad_min_sv": 3.440275442940527e-10, "grad_condition": 148843110630.56686, "lr": 0.0008644843137107055, "time_sec": 177.85971999168396 }, { "epoch": 37, "train_loss": 4.963237725219726, "train_acc": 0.01242, "test_loss": 9.607163096618653, "test_acc": 0.01, "lyapunov": 1.7487757071814574, "grad_norm": 0.5178441019436488, "grad_max_sv": 0.2677606202661991, "grad_min_sv": 1.2794001535597794e-09, "grad_condition": 118342772090.25644, "lr": 0.0008572363398164014, "time_sec": 177.87799191474915 }, { "epoch": 38, "train_loss": 4.974736349639892, "train_acc": 0.01056, "test_loss": 4.772847597503662, "test_acc": 0.01, "lyapunov": 1.6420561239847442, "grad_norm": 0.7737397356236614, "grad_max_sv": 0.48621650636196134, "grad_min_sv": 5.431396735144922e-09, "grad_condition": 1130833560.0526097, "lr": 0.0008498316702566826, "time_sec": 177.84695863723755 }, { "epoch": 39, "train_loss": 4.914389076538086, "train_acc": 0.00954, "test_loss": 5.4321878707885745, "test_acc": 0.01, "lyapunov": 1.606756867959981, "grad_norm": 0.6387073953630102, "grad_max_sv": 0.28100625462830064, "grad_min_sv": 1.1923785099299402e-09, "grad_condition": 31042166964.6133, "lr": 0.0008422735529643442, "time_sec": 177.8997838497162 }, { "epoch": 40, "train_loss": 4.907334909515381, "train_acc": 0.00932, "test_loss": 5.197367625427246, "test_acc": 0.01, "lyapunov": 1.6101341015847443, "grad_norm": 0.549617557037775, "grad_max_sv": 0.21684555038809777, "grad_min_sv": 1.6231511646555081e-12, "grad_condition": 115360148938.91074, "lr": 0.0008345653031794289, "time_sec": 177.88523411750793 }, { "epoch": 41, "train_loss": 4.9172815733337405, "train_acc": 0.00966, "test_loss": 5.328871868896484, "test_acc": 0.01, "lyapunov": 1.6233936231154615, "grad_norm": 0.6437990568107412, "grad_max_sv": 0.23363575600087644, "grad_min_sv": 5.030357610936974e-10, "grad_condition": 138575586823.60834, "lr": 0.0008267103019950526, "time_sec": 177.87491416931152 }, { "epoch": 42, "train_loss": 4.910974921875, "train_acc": 0.0094, "test_loss": 5.260343148803711, "test_acc": 0.01, "lyapunov": 1.6119288898185087, "grad_norm": 0.6213630809261163, "grad_max_sv": 0.2208472192287445, "grad_min_sv": 1.6566058977896803e-10, "grad_condition": 142601015959.25623, "lr": 0.0008187119948743447, "time_sec": 177.85157465934753 }, { "epoch": 43, "train_loss": 4.910828229217529, "train_acc": 0.0082, "test_loss": 4.699688921356201, "test_acc": 0.01, "lyapunov": 1.6258944394948232, "grad_norm": 0.4079357024315036, "grad_max_sv": 0.15661620609462262, "grad_min_sv": 1.7684309930750455e-15, "grad_condition": 156350108060.72934, "lr": 0.000810573890139155, "time_sec": 177.86257314682007 }, { "epoch": 44, "train_loss": 4.896916885833741, "train_acc": 0.00922, "test_loss": 4.812428985595703, "test_acc": 0.01, "lyapunov": 1.5950726255431504, "grad_norm": 0.4783756369080321, "grad_max_sv": 0.14141971599310638, "grad_min_sv": 1.3813946661647787e-39, "grad_condition": 141419715993.10638, "lr": 0.0008022995574311873, "time_sec": 177.92987060546875 }, { "epoch": 45, "train_loss": 4.908877978973389, "train_acc": 0.00912, "test_loss": 4.708805274963379, "test_acc": 0.01, "lyapunov": 1.6267534076710186, "grad_norm": 0.7771603049125322, "grad_max_sv": 0.15806035809218882, "grad_min_sv": 1.4034116208559716e-15, "grad_condition": 157762251235.76987, "lr": 0.0007938926261462363, "time_sec": 177.94272303581238 }, { "epoch": 46, "train_loss": 4.90580543838501, "train_acc": 0.00928, "test_loss": 4.734797378540039, "test_acc": 0.01, "lyapunov": 1.6176637389775737, "grad_norm": 0.6942542366402378, "grad_max_sv": 0.15787413250654936, "grad_min_sv": 7.864894789560978e-16, "grad_condition": 157723200668.28387, "lr": 0.0007853567838422158, "time_sec": 177.97623896598816 }, { "epoch": 47, "train_loss": 4.8965187059021, "train_acc": 0.00938, "test_loss": 4.6579503898620604, "test_acc": 0.01, "lyapunov": 1.5973099085985851, "grad_norm": 0.36353228305050295, "grad_max_sv": 0.13088524471968413, "grad_min_sv": 1.2231276530985221e-20, "grad_condition": 130885242907.8948, "lr": 0.0007766957746216719, "time_sec": 177.95993542671204 }, { "epoch": 48, "train_loss": 4.8988071447753905, "train_acc": 0.00944, "test_loss": 4.662165933227539, "test_acc": 0.01, "lyapunov": 1.603416101402029, "grad_norm": 0.3898458431943687, "grad_max_sv": 0.1284548096358776, "grad_min_sv": 1.1576870843401716e-38, "grad_condition": 128454809635.87761, "lr": 0.0007679133974894982, "time_sec": 177.8052430152893 }, { "epoch": 49, "train_loss": 4.913481904144287, "train_acc": 0.00918, "test_loss": 4.763600569915772, "test_acc": 0.01, "lyapunov": 1.6402373295610824, "grad_norm": 0.5994299094599757, "grad_max_sv": 0.1396894573670579, "grad_min_sv": 2.779377619525618e-15, "grad_condition": 139046550095.99487, "lr": 0.000759013504686565, "time_sec": 177.86163926124573 }, { "epoch": 50, "train_loss": 4.906329712219239, "train_acc": 0.00982, "test_loss": 4.609917034912109, "test_acc": 0.01, "lyapunov": 1.6202878165427985, "grad_norm": 0.6143555741962269, "grad_max_sv": 0.15427468828856944, "grad_min_sv": 1.5586657350285492e-15, "grad_condition": 153998022994.1138, "lr": 0.0007499999999999998, "time_sec": 177.81070852279663 }, { "epoch": 51, "train_loss": 4.901778139953613, "train_acc": 0.01, "test_loss": 5.7906026428222654, "test_acc": 0.01, "lyapunov": 1.6095840150438, "grad_norm": 0.4846890301599483, "grad_max_sv": 0.10476460931822658, "grad_min_sv": 6.919555377168684e-15, "grad_condition": 103682757395.60971, "lr": 0.0007408768370508575, "time_sec": 177.827232837677 }, { "epoch": 52, "train_loss": 4.897733354492187, "train_acc": 0.0102, "test_loss": 5.14119333190918, "test_acc": 0.01, "lyapunov": 1.6018984003749954, "grad_norm": 0.45183942591328674, "grad_max_sv": 0.08775242893025278, "grad_min_sv": 1.964503741104032e-16, "grad_condition": 87731321318.76743, "lr": 0.0007316480175599307, "time_sec": 177.8825397491455 }, { "epoch": 53, "train_loss": 4.899286302947998, "train_acc": 0.0105, "test_loss": 5.116060150146485, "test_acc": 0.01, "lyapunov": 1.6068680664462507, "grad_norm": 0.39046803319247386, "grad_max_sv": 0.10442779418081045, "grad_min_sv": 1.8704405143177693e-32, "grad_condition": 104427794180.81046, "lr": 0.0007223175895924635, "time_sec": 177.85691237449646 }, { "epoch": 54, "train_loss": 4.900419689025879, "train_acc": 0.00974, "test_loss": 6.225739611816406, "test_acc": 0.01, "lyapunov": 1.611330489673273, "grad_norm": 0.7830684513344699, "grad_max_sv": 0.08616076316975523, "grad_min_sv": 7.006492321624086e-47, "grad_condition": 86160763169.75522, "lr": 0.0007128896457825361, "time_sec": 177.79533982276917 }, { "epoch": 55, "train_loss": 4.90022905456543, "train_acc": 0.00872, "test_loss": 4.660898509216309, "test_acc": 0.01, "lyapunov": 1.6107879657574626, "grad_norm": 0.3602507862317559, "grad_max_sv": 0.07782914067938691, "grad_min_sv": 0.0, "grad_condition": 77829140679.3869, "lr": 0.0007033683215378998, "time_sec": 177.81696367263794 }, { "epoch": 56, "train_loss": 4.899950318450927, "train_acc": 0.009, "test_loss": 4.8788808166503905, "test_acc": 0.01, "lyapunov": 1.608769400345395, "grad_norm": 0.24016992273295382, "grad_max_sv": 0.07058875868096948, "grad_min_sv": 0.0, "grad_condition": 70588758680.96948, "lr": 0.0006937577932260512, "time_sec": 177.81637740135193 }, { "epoch": 57, "train_loss": 4.904979566650391, "train_acc": 0.01016, "test_loss": 4.727262957763672, "test_acc": 0.01, "lyapunov": 1.6228536108265752, "grad_norm": 0.25668226851580556, "grad_max_sv": 0.08947733379900455, "grad_min_sv": 3.709630814829091e-18, "grad_condition": 89476902167.92735, "lr": 0.0006840622763423388, "time_sec": 177.7847032546997 }, { "epoch": 58, "train_loss": 4.91234857635498, "train_acc": 0.00984, "test_loss": 4.992978315734863, "test_acc": 0.01, "lyapunov": 1.6392204319424641, "grad_norm": 0.2870713508381296, "grad_max_sv": 0.08510738047771156, "grad_min_sv": 5.680980030609821e-34, "grad_condition": 85107380477.71156, "lr": 0.0006742860236609073, "time_sec": 177.93095755577087 }, { "epoch": 59, "train_loss": 4.895672921447754, "train_acc": 0.00956, "test_loss": 4.850344149017334, "test_acc": 0.01, "lyapunov": 1.6016130505315482, "grad_norm": 0.21955395456353394, "grad_max_sv": 0.04376054578460753, "grad_min_sv": 0.0, "grad_condition": 43760545784.60753, "lr": 0.0006644333233692913, "time_sec": 178.03867888450623 }, { "epoch": 60, "train_loss": 4.904327979278564, "train_acc": 0.01052, "test_loss": 5.107528366088867, "test_acc": 0.01, "lyapunov": 1.6214414124598588, "grad_norm": 0.4134573581512024, "grad_max_sv": 0.05148340538144112, "grad_min_sv": 0.0, "grad_condition": 51483405381.44112, "lr": 0.0006545084971874734, "time_sec": 177.95739769935608 }, { "epoch": 61, "train_loss": 4.898002865753174, "train_acc": 0.0092, "test_loss": 5.260837869262695, "test_acc": 0.01, "lyapunov": 1.6072155035975035, "grad_norm": 0.21245422531513092, "grad_max_sv": 0.06225627232342958, "grad_min_sv": 0.0, "grad_condition": 62256272323.42959, "lr": 0.0006445158984722354, "time_sec": 177.8253002166748 }, { "epoch": 62, "train_loss": 4.895106823730469, "train_acc": 0.00882, "test_loss": 4.800835796356202, "test_acc": 0.01, "lyapunov": 1.6004807888089543, "grad_norm": 0.2174674542614135, "grad_max_sv": 0.05514842057600618, "grad_min_sv": 0.0, "grad_condition": 55148420576.00618, "lr": 0.0006344599103076324, "time_sec": 177.72123980522156 }, { "epoch": 63, "train_loss": 4.899956417541504, "train_acc": 0.0105, "test_loss": 4.751542483520508, "test_acc": 0.01, "lyapunov": 1.6128623427637399, "grad_norm": 0.40884851608059564, "grad_max_sv": 0.05529614672996104, "grad_min_sv": 0.0, "grad_condition": 55296146729.96104, "lr": 0.0006243449435824269, "time_sec": 177.73331904411316 }, { "epoch": 64, "train_loss": 4.899741290130615, "train_acc": 0.01012, "test_loss": 4.856732801818848, "test_acc": 0.01, "lyapunov": 1.610243486931257, "grad_norm": 0.2140046037475775, "grad_max_sv": 0.04319468280300498, "grad_min_sv": 1.2200012063541023e-32, "grad_condition": 43194682803.00498, "lr": 0.0006141754350553275, "time_sec": 177.72633337974548 }, { "epoch": 65, "train_loss": 4.901744207763672, "train_acc": 0.00894, "test_loss": 5.05665267791748, "test_acc": 0.01, "lyapunov": 1.612555693482499, "grad_norm": 0.41191406243662826, "grad_max_sv": 0.06249867400620133, "grad_min_sv": 9.569992363469874e-20, "grad_condition": 62498664540.05955, "lr": 0.0006039558454088793, "time_sec": 177.71029257774353 }, { "epoch": 66, "train_loss": 4.905766971282959, "train_acc": 0.00954, "test_loss": 5.186077005767822, "test_acc": 0.01, "lyapunov": 1.6214341486201567, "grad_norm": 0.4859633789458757, "grad_max_sv": 0.0410848444327712, "grad_min_sv": 0.0, "grad_condition": 41084844432.7712, "lr": 0.000593690657292862, "time_sec": 177.8285129070282 }, { "epoch": 67, "train_loss": 4.905345126495361, "train_acc": 0.00986, "test_loss": 4.869504832458496, "test_acc": 0.01, "lyapunov": 1.6231126108437852, "grad_norm": 0.39055695869151713, "grad_max_sv": 0.04164083697833121, "grad_min_sv": 1.4012984643248171e-46, "grad_condition": 41640836978.3312, "lr": 0.0005833843733580507, "time_sec": 177.75302600860596 }, { "epoch": 68, "train_loss": 4.897688937835693, "train_acc": 0.00942, "test_loss": 4.753113725280762, "test_acc": 0.01, "lyapunov": 1.6065946210680715, "grad_norm": 0.20313081565215924, "grad_max_sv": 0.023377659870311616, "grad_min_sv": 0.0, "grad_condition": 23377659870.311615, "lr": 0.0005730415142812054, "time_sec": 177.63269519805908 }, { "epoch": 69, "train_loss": 4.898588792419433, "train_acc": 0.01028, "test_loss": 4.782024855804443, "test_acc": 0.01, "lyapunov": 1.6088185420121683, "grad_norm": 0.17496031637798137, "grad_max_sv": 0.026315743662416936, "grad_min_sv": 0.0, "grad_condition": 26315743662.416935, "lr": 0.0005626666167821517, "time_sec": 177.63309144973755 }, { "epoch": 70, "train_loss": 4.8972829446411135, "train_acc": 0.00906, "test_loss": 5.072041613769532, "test_acc": 0.01, "lyapunov": 1.606105865419978, "grad_norm": 4.752321231571355, "grad_max_sv": 0.01162667127500754, "grad_min_sv": 0.0, "grad_condition": 11626671275.007538, "lr": 0.0005522642316338265, "time_sec": 177.63151264190674 }, { "epoch": 71, "train_loss": 4.903229199066162, "train_acc": 0.00974, "test_loss": 4.996621307373047, "test_acc": 0.01, "lyapunov": 1.618955539315558, "grad_norm": 8.808121966401492, "grad_max_sv": 0.009761298389639706, "grad_min_sv": 0.0, "grad_condition": 9761298389.639706, "lr": 0.0005418389216661573, "time_sec": 177.6599452495575 }, { "epoch": 72, "train_loss": 4.906216805419922, "train_acc": 0.00934, "test_loss": 4.894567427062988, "test_acc": 0.01, "lyapunov": 1.628432136362471, "grad_norm": 8.489795940827486, "grad_max_sv": 0.016040445899125188, "grad_min_sv": 0.0, "grad_condition": 16040445899.125189, "lr": 0.0005313952597646563, "time_sec": 177.6416893005371 }, { "epoch": 73, "train_loss": 4.899343757019043, "train_acc": 0.00984, "test_loss": 4.877998015594482, "test_acc": 0.01, "lyapunov": 1.6116645827012903, "grad_norm": 8.78253510980995, "grad_max_sv": 0.011263658234383911, "grad_min_sv": 0.0, "grad_condition": 11263658234.383911, "lr": 0.0005209378268645994, "time_sec": 177.685124874115 }, { "epoch": 74, "train_loss": 4.909308713531495, "train_acc": 0.0098, "test_loss": 4.906534819030762, "test_acc": 0.01, "lyapunov": 1.6356849475284976, "grad_norm": 8.739719950493322, "grad_max_sv": 0.018200278421863912, "grad_min_sv": 0.0, "grad_condition": 18200278421.863914, "lr": 0.0005104712099416781, "time_sec": 177.67348718643188 }, { "epoch": 75, "train_loss": 4.896382185516358, "train_acc": 0.00988, "test_loss": 4.891489701843262, "test_acc": 0.01, "lyapunov": 1.6029227630561576, "grad_norm": 8.719549027099202, "grad_max_sv": 0.022427358670393006, "grad_min_sv": 0.0, "grad_condition": 22427358670.393005, "lr": 0.0004999999999999996, "time_sec": 177.7534384727478 }, { "epoch": 76, "train_loss": 4.899071414489746, "train_acc": 0.00968, "test_loss": 4.9015754707336425, "test_acc": 0.01, "lyapunov": 1.6096787852094607, "grad_norm": 8.515820970435684, "grad_max_sv": 0.009400015359278768, "grad_min_sv": 0.0, "grad_condition": 9400015359.278769, "lr": 0.0004895287900583212, "time_sec": 177.62656164169312 }, { "epoch": 77, "train_loss": 4.898522388305664, "train_acc": 0.01038, "test_loss": 5.091467515563965, "test_acc": 0.01, "lyapunov": 1.6093772655862677, "grad_norm": 8.114992022856779, "grad_max_sv": 0.018641287484206258, "grad_min_sv": 0.0, "grad_condition": 18641287484.20626, "lr": 0.0004790621731353997, "time_sec": 177.68832445144653 }, { "epoch": 78, "train_loss": 4.898501075897217, "train_acc": 0.00976, "test_loss": 5.021521907043457, "test_acc": 0.01, "lyapunov": 1.609497647761079, "grad_norm": 8.539277939413502, "grad_max_sv": 0.007715003727935254, "grad_min_sv": 0.0, "grad_condition": 7715003727.935254, "lr": 0.000468604740235343, "time_sec": 177.67188620567322 }, { "epoch": 79, "train_loss": 4.89914041229248, "train_acc": 0.00952, "test_loss": 5.091536389160156, "test_acc": 0.01, "lyapunov": 1.6118732392025725, "grad_norm": 8.137454688889077, "grad_max_sv": 0.014247056667227299, "grad_min_sv": 0.0, "grad_condition": 14247056667.227299, "lr": 0.00045816107833384175, "time_sec": 177.66169714927673 }, { "epoch": 80, "train_loss": 4.896471509552002, "train_acc": 0.00904, "test_loss": 5.056171662139892, "test_acc": 0.01, "lyapunov": 1.6047609431664351, "grad_norm": 8.176635016602376, "grad_max_sv": 0.01795925593469292, "grad_min_sv": 0.0, "grad_condition": 17959255934.69292, "lr": 0.0004477357683661729, "time_sec": 177.69231700897217 }, { "epoch": 81, "train_loss": 4.902812586059571, "train_acc": 0.00932, "test_loss": 4.95149069366455, "test_acc": 0.01, "lyapunov": 1.6196627622979987, "grad_norm": 7.929696982355576, "grad_max_sv": 0.0070913337520323695, "grad_min_sv": 0.0, "grad_condition": 7091333752.03237, "lr": 0.00043733338321784746, "time_sec": 177.62628316879272 }, { "epoch": 82, "train_loss": 4.896946704254151, "train_acc": 0.00924, "test_loss": 5.036287983703613, "test_acc": 0.01, "lyapunov": 1.606176169632036, "grad_norm": 7.888136562780922, "grad_max_sv": 0.0152505733538419, "grad_min_sv": 0.0, "grad_condition": 15250573353.8419, "lr": 0.0004269584857187939, "time_sec": 177.6838881969452 }, { "epoch": 83, "train_loss": 4.903535429534912, "train_acc": 0.00942, "test_loss": 4.913862983703614, "test_acc": 0.01, "lyapunov": 1.6229887536114744, "grad_norm": 5.821543829416724, "grad_max_sv": 0.0042757402297866065, "grad_min_sv": 0.0, "grad_condition": 4275740229.786606, "lr": 0.0004166156266419484, "time_sec": 177.63864398002625 }, { "epoch": 84, "train_loss": 4.900573203125, "train_acc": 0.00922, "test_loss": 4.881514458465576, "test_acc": 0.01, "lyapunov": 1.6157215519634354, "grad_norm": 2.3035299291537767, "grad_max_sv": 0.018527308432385325, "grad_min_sv": 0.0, "grad_condition": 18527308432.385326, "lr": 0.0004063093427071373, "time_sec": 177.61864590644836 }, { "epoch": 85, "train_loss": 4.902895740814209, "train_acc": 0.00928, "test_loss": 4.858868844604492, "test_acc": 0.01, "lyapunov": 1.6206753049665095, "grad_norm": 0.12191327008361393, "grad_max_sv": 0.011266671447083354, "grad_min_sv": 0.0, "grad_condition": 11266671447.083355, "lr": 0.0003960441545911199, "time_sec": 177.60221338272095 }, { "epoch": 86, "train_loss": 4.899129556274414, "train_acc": 0.01002, "test_loss": 4.940996123504639, "test_acc": 0.01, "lyapunov": 1.6121560679677198, "grad_norm": 1.7402391187392277, "grad_max_sv": 0.002565371198579669, "grad_min_sv": 0.0, "grad_condition": 2565371198.579669, "lr": 0.0003858245649446718, "time_sec": 177.66662287712097 }, { "epoch": 87, "train_loss": 4.898443488616944, "train_acc": 0.0105, "test_loss": 4.900648780059814, "test_acc": 0.01, "lyapunov": 1.6101132055072833, "grad_norm": 3.9387378230742067, "grad_max_sv": 0.014504804974421859, "grad_min_sv": 0.0, "grad_condition": 14504804974.421856, "lr": 0.00037565505641757235, "time_sec": 177.92060565948486 }, { "epoch": 88, "train_loss": 4.903396017608642, "train_acc": 0.01006, "test_loss": 4.946898637390137, "test_acc": 0.01, "lyapunov": 1.6227889701228617, "grad_norm": 3.523322793117835, "grad_max_sv": 0.010716242669150233, "grad_min_sv": 0.0, "grad_condition": 10716242669.150234, "lr": 0.00036554008969236695, "time_sec": 177.71660375595093 }, { "epoch": 89, "train_loss": 4.898063175964356, "train_acc": 0.00952, "test_loss": 4.944628465270996, "test_acc": 0.01, "lyapunov": 1.6093785500587405, "grad_norm": 3.442066441987714, "grad_max_sv": 0.001931725861504674, "grad_min_sv": 0.0, "grad_condition": 1931725861.5046737, "lr": 0.0003554841015277638, "time_sec": 177.85225415229797 }, { "epoch": 90, "train_loss": 4.897619627685547, "train_acc": 0.00938, "test_loss": 5.051801362609863, "test_acc": 0.01, "lyapunov": 1.608569312583455, "grad_norm": 2.438214274664479, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000345491502812526, "time_sec": 177.65104031562805 }, { "epoch": 91, "train_loss": 4.901775200042724, "train_acc": 0.00952, "test_loss": 4.932051847076416, "test_acc": 0.01, "lyapunov": 1.6196813135195876, "grad_norm": 1.9676599328431443, "grad_max_sv": 0.0042047965805977585, "grad_min_sv": 0.0, "grad_condition": 4204796580.5977583, "lr": 0.0003355666766307081, "time_sec": 177.5405979156494 }, { "epoch": 92, "train_loss": 4.8983032328796385, "train_acc": 0.0092, "test_loss": 4.899715927886963, "test_acc": 0.01, "lyapunov": 1.6106610715846577, "grad_norm": 1.4208199060741078, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00032571397633909225, "time_sec": 177.52678775787354 }, { "epoch": 93, "train_loss": 4.899546262664795, "train_acc": 0.00828, "test_loss": 4.734424713134765, "test_acc": 0.01, "lyapunov": 1.6129982721470202, "grad_norm": 0.7679133474898795, "grad_max_sv": 0.001235782215371728, "grad_min_sv": 0.0, "grad_condition": 1235782215.371728, "lr": 0.00031593772365766094, "time_sec": 177.578599691391 }, { "epoch": 94, "train_loss": 4.897470514221191, "train_acc": 0.00868, "test_loss": 4.861271743774414, "test_acc": 0.01, "lyapunov": 1.6078075801624971, "grad_norm": 0.5114523908732937, "grad_max_sv": 0.010413796734064817, "grad_min_sv": 0.0, "grad_condition": 10413796734.064817, "lr": 0.0003062422067739483, "time_sec": 177.66828536987305 }, { "epoch": 95, "train_loss": 4.896396814422608, "train_acc": 0.00902, "test_loss": 4.879605053710938, "test_acc": 0.01, "lyapunov": 1.6050515763290094, "grad_norm": 0.3961292769391823, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00029663167846209965, "time_sec": 177.51401448249817 }, { "epoch": 96, "train_loss": 4.8946277626037595, "train_acc": 0.00906, "test_loss": 4.8813762161254886, "test_acc": 0.01, "lyapunov": 1.6007561808656854, "grad_norm": 0.3223908585413378, "grad_max_sv": 0.004684461047872901, "grad_min_sv": 0.0, "grad_condition": 4684461047.8729, "lr": 0.00028711035421746345, "time_sec": 177.507954120636 }, { "epoch": 97, "train_loss": 4.898638327026367, "train_acc": 0.0089, "test_loss": 4.8062256309509275, "test_acc": 0.01, "lyapunov": 1.6108122432933134, "grad_norm": 0.26732308458116777, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00027768241040753615, "time_sec": 177.541433095932 }, { "epoch": 98, "train_loss": 4.898670770721435, "train_acc": 0.00952, "test_loss": 4.863480428314209, "test_acc": 0.01, "lyapunov": 1.6111446103781386, "grad_norm": 0.2214969265799768, "grad_max_sv": 0.009903033776208759, "grad_min_sv": 0.0, "grad_condition": 9903033776.20876, "lr": 0.00026835198244006903, "time_sec": 177.60904955863953 }, { "epoch": 99, "train_loss": 4.897254006500244, "train_acc": 0.00834, "test_loss": 4.817773220062256, "test_acc": 0.01, "lyapunov": 1.607484469023507, "grad_norm": 0.19294402621230472, "grad_max_sv": 0.0008362619206309319, "grad_min_sv": 0.0, "grad_condition": 836261920.6309319, "lr": 0.0002591231629491421, "time_sec": 177.57478499412537 }, { "epoch": 100, "train_loss": 4.901547922363282, "train_acc": 0.0089, "test_loss": 4.874810285949707, "test_acc": 0.01, "lyapunov": 1.618047608134082, "grad_norm": 0.48303744135317395, "grad_max_sv": 0.0005853609647601843, "grad_min_sv": 0.0, "grad_condition": 585360964.7601843, "lr": 0.0002499999999999997, "time_sec": 177.57369899749756 }, { "epoch": 101, "train_loss": 4.900225694732666, "train_acc": 0.0088, "test_loss": 4.874546339416504, "test_acc": 0.01, "lyapunov": 1.6143963080842783, "grad_norm": 0.10450627590873329, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00024098649531343477, "time_sec": 177.6406271457672 }, { "epoch": 102, "train_loss": 4.897779517669678, "train_acc": 0.00842, "test_loss": 4.97530121307373, "test_acc": 0.01, "lyapunov": 1.6092621133760419, "grad_norm": 0.11958307306926726, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002320866025105016, "time_sec": 177.58187460899353 }, { "epoch": 103, "train_loss": 4.89978483215332, "train_acc": 0.00836, "test_loss": 4.904860715484619, "test_acc": 0.01, "lyapunov": 1.613416659862489, "grad_norm": 0.11840174924430107, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002233042253783278, "time_sec": 177.59923720359802 }, { "epoch": 104, "train_loss": 4.8979805488586425, "train_acc": 0.0086, "test_loss": 5.0884550689697265, "test_acc": 0.01, "lyapunov": 1.6097813783704167, "grad_norm": 0.119936422604111, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000214643216157784, "time_sec": 177.6080665588379 }, { "epoch": 105, "train_loss": 4.898741788330078, "train_acc": 0.00866, "test_loss": 4.9618072402954105, "test_acc": 0.01, "lyapunov": 1.6113920699604942, "grad_norm": 0.152172750895754, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00020610737385376332, "time_sec": 177.6668050289154 }, { "epoch": 106, "train_loss": 4.899783585510254, "train_acc": 0.00854, "test_loss": 4.853069065856934, "test_acc": 0.01, "lyapunov": 1.6142695355598273, "grad_norm": 0.12651234741385065, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00019770044256881242, "time_sec": 177.65955018997192 }, { "epoch": 107, "train_loss": 4.89967593460083, "train_acc": 0.00888, "test_loss": 4.81962833480835, "test_acc": 0.01, "lyapunov": 1.6138155131083924, "grad_norm": 0.12897917774661904, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001894261098608447, "time_sec": 178.0168354511261 }, { "epoch": 108, "train_loss": 4.898814065093994, "train_acc": 0.00946, "test_loss": 4.862646290588379, "test_acc": 0.01, "lyapunov": 1.6114065183702941, "grad_norm": 0.12441425701414183, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000181288005125655, "time_sec": 177.91981077194214 }, { "epoch": 109, "train_loss": 4.895898725891113, "train_acc": 0.00866, "test_loss": 4.898298935699463, "test_acc": 0.01, "lyapunov": 1.6044228336085444, "grad_norm": 0.12735396729359733, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001732896980049473, "time_sec": 177.5811812877655 }, { "epoch": 110, "train_loss": 4.897967128295899, "train_acc": 0.0088, "test_loss": 4.881989184570313, "test_acc": 0.01, "lyapunov": 1.610074214008458, "grad_norm": 0.12498581799753569, "grad_max_sv": 0.0005899489391595125, "grad_min_sv": 0.0, "grad_condition": 589948939.1595125, "lr": 0.00016543469682057076, "time_sec": 177.58177971839905 }, { "epoch": 111, "train_loss": 4.894624674987793, "train_acc": 0.00892, "test_loss": 4.883820623779297, "test_acc": 0.01, "lyapunov": 1.6010574471310277, "grad_norm": 0.12140577807922988, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015772644703565552, "time_sec": 177.56197333335876 }, { "epoch": 112, "train_loss": 4.895216448974609, "train_acc": 0.00852, "test_loss": 4.954343832397461, "test_acc": 0.01, "lyapunov": 1.602743710093486, "grad_norm": 0.1186981012224881, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015016832974331713, "time_sec": 177.6377820968628 }, { "epoch": 113, "train_loss": 4.89654906173706, "train_acc": 0.00892, "test_loss": 4.86073722076416, "test_acc": 0.01, "lyapunov": 1.6060491681403821, "grad_norm": 0.13508163826012107, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00014276366018359834, "time_sec": 177.58386063575745 }, { "epoch": 114, "train_loss": 4.8961822531127925, "train_acc": 0.00894, "test_loss": 4.85973716430664, "test_acc": 0.01, "lyapunov": 1.605295106578056, "grad_norm": 0.1269661896874639, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00013551568628929425, "time_sec": 177.66930723190308 }, { "epoch": 115, "train_loss": 4.899547542419434, "train_acc": 0.00846, "test_loss": 4.86928017654419, "test_acc": 0.01, "lyapunov": 1.611534357680689, "grad_norm": 0.12942007445088913, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00012842758726130276, "time_sec": 177.5964391231537 }, { "epoch": 116, "train_loss": 4.8983458253479, "train_acc": 0.00896, "test_loss": 4.843299571990967, "test_acc": 0.01, "lyapunov": 1.6105001826420464, "grad_norm": 0.13930842303851845, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001215024721741218, "time_sec": 177.61230850219727 }, { "epoch": 117, "train_loss": 4.896871134490967, "train_acc": 0.00876, "test_loss": 4.854955553436279, "test_acc": 0.01, "lyapunov": 1.6068359040238362, "grad_norm": 0.14085548109201876, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210538, "time_sec": 177.60942769050598 }, { "epoch": 118, "train_loss": 4.895171242523193, "train_acc": 0.00872, "test_loss": 4.848788255310058, "test_acc": 0.01, "lyapunov": 1.6026884250323792, "grad_norm": 0.14154856326059925, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010815327133708009, "time_sec": 177.55690503120422 }, { "epoch": 119, "train_loss": 4.896756847839355, "train_acc": 0.00832, "test_loss": 4.8384888511657715, "test_acc": 0.01, "lyapunov": 1.6064672335944212, "grad_norm": 0.13186296404041234, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010173504098790182, "time_sec": 177.58031153678894 }, { "epoch": 120, "train_loss": 4.898055244140625, "train_acc": 0.00912, "test_loss": 4.863050064086914, "test_acc": 0.01, "lyapunov": 1.608289188131347, "grad_norm": 0.13789827868104076, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252629e-05, "time_sec": 177.57413148880005 }, { "epoch": 121, "train_loss": 4.895827691040039, "train_acc": 0.00928, "test_loss": 4.863882962799072, "test_acc": 0.01, "lyapunov": 1.6041748965792644, "grad_norm": 0.1447753316018149, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.942539543314794e-05, "time_sec": 177.61848878860474 }, { "epoch": 122, "train_loss": 4.894580706329346, "train_acc": 0.0093, "test_loss": 4.832992823791504, "test_acc": 0.01, "lyapunov": 1.6009809287917582, "grad_norm": 0.13403320495860124, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.353937964495024e-05, "time_sec": 177.63413906097412 }, { "epoch": 123, "train_loss": 4.896512101593018, "train_acc": 0.00856, "test_loss": 4.88107511138916, "test_acc": 0.01, "lyapunov": 1.6053285842661358, "grad_norm": 0.1349040405870927, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.783603724899243e-05, "time_sec": 177.86059856414795 }, { "epoch": 124, "train_loss": 4.902536525726318, "train_acc": 0.00916, "test_loss": 4.825576887512207, "test_acc": 0.01, "lyapunov": 1.618482659235025, "grad_norm": 0.15260564991727005, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.231786991974666e-05, "time_sec": 177.59844970703125 }, { "epoch": 125, "train_loss": 4.8969797262573245, "train_acc": 0.00904, "test_loss": 4.842672832489014, "test_acc": 0.01, "lyapunov": 1.607402919198546, "grad_norm": 0.14681033483413716, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.698729810778072e-05, "time_sec": 177.69832468032837 }, { "epoch": 126, "train_loss": 4.896537158660888, "train_acc": 0.00922, "test_loss": 4.80990348739624, "test_acc": 0.01, "lyapunov": 1.6063618071548773, "grad_norm": 0.13507935123670756, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806817e-05, "time_sec": 177.70786309242249 }, { "epoch": 127, "train_loss": 4.894742733154297, "train_acc": 0.00798, "test_loss": 4.8113509506225585, "test_acc": 0.01, "lyapunov": 1.6014454364776611, "grad_norm": 0.1351277333350339, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.6898210384392595e-05, "time_sec": 177.86230516433716 }, { "epoch": 128, "train_loss": 4.897651534729004, "train_acc": 0.0094, "test_loss": 4.849126397705078, "test_acc": 0.01, "lyapunov": 1.6088779442145695, "grad_norm": 0.17636542409245334, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.214411988029363e-05, "time_sec": 177.6271688938141 }, { "epoch": 129, "train_loss": 4.89603802230835, "train_acc": 0.00886, "test_loss": 4.837294686126709, "test_acc": 0.01, "lyapunov": 1.605165058694532, "grad_norm": 0.1801255445906475, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.7586473766990294e-05, "time_sec": 177.71211314201355 }, { "epoch": 130, "train_loss": 4.895125115509034, "train_acc": 0.00866, "test_loss": 4.808775178527832, "test_acc": 0.01, "lyapunov": 1.6025557109462025, "grad_norm": 0.14181669608504024, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.32272711786996e-05, "time_sec": 177.64269709587097 }, { "epoch": 131, "train_loss": 4.902938699340821, "train_acc": 0.008, "test_loss": 4.826445443725586, "test_acc": 0.01, "lyapunov": 1.6225644127487222, "grad_norm": 0.15063649346643543, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.906842420574966e-05, "time_sec": 177.69655632972717 }, { "epoch": 132, "train_loss": 4.895815797271728, "train_acc": 0.00944, "test_loss": 4.808843030548096, "test_acc": 0.01, "lyapunov": 1.6045795020544926, "grad_norm": 0.13954946888706687, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.5111757055874305e-05, "time_sec": 177.6466555595398 }, { "epoch": 133, "train_loss": 4.896005963287354, "train_acc": 0.0088, "test_loss": 4.82414176940918, "test_acc": 0.01, "lyapunov": 1.6050951605867547, "grad_norm": 0.14029597054344972, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.1359005254054254e-05, "time_sec": 177.6260485649109 }, { "epoch": 134, "train_loss": 4.898020515136719, "train_acc": 0.00954, "test_loss": 4.837333515167236, "test_acc": 0.01, "lyapunov": 1.609246312199956, "grad_norm": 0.14357714581869627, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7811814881259484e-05, "time_sec": 177.584956407547 }, { "epoch": 135, "train_loss": 4.895735731048584, "train_acc": 0.0092, "test_loss": 4.8159059692382815, "test_acc": 0.01, "lyapunov": 1.6042115407831528, "grad_norm": 0.14076247756947305, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.4471741852423218e-05, "time_sec": 177.55930995941162 }, { "epoch": 136, "train_loss": 4.899449185333252, "train_acc": 0.01, "test_loss": 4.8122740142822265, "test_acc": 0.01, "lyapunov": 1.61043234645863, "grad_norm": 0.19068368741616817, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.1340251233966362e-05, "time_sec": 177.60587310791016 }, { "epoch": 137, "train_loss": 4.895413861694336, "train_acc": 0.0092, "test_loss": 4.812394242858887, "test_acc": 0.01, "lyapunov": 1.6033874640379415, "grad_norm": 0.5123554678520819, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.8418716601170932e-05, "time_sec": 177.5866892337799 }, { "epoch": 138, "train_loss": 4.897919689941406, "train_acc": 0.01, "test_loss": 4.824399436187744, "test_acc": 0.01, "lyapunov": 1.60939773604693, "grad_norm": 0.42554152230186504, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568445e-05, "time_sec": 177.5575873851776 }, { "epoch": 139, "train_loss": 4.896585512237549, "train_acc": 0.0096, "test_loss": 4.813831822967529, "test_acc": 0.01, "lyapunov": 1.6059378885552096, "grad_norm": 0.40395815580062067, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.3210548563419845e-05, "time_sec": 177.5689401626587 }, { "epoch": 140, "train_loss": 4.896397541656494, "train_acc": 0.01, "test_loss": 4.813830749511719, "test_acc": 0.01, "lyapunov": 1.6058773750539326, "grad_norm": 0.3517546520670756, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.0926199633097203e-05, "time_sec": 177.56592845916748 }, { "epoch": 141, "train_loss": 4.897689798278809, "train_acc": 0.00908, "test_loss": 4.809725570678711, "test_acc": 0.01, "lyapunov": 1.6086021369070653, "grad_norm": 0.34730980637645387, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.856374635655688e-06, "time_sec": 177.57834815979004 }, { "epoch": 142, "train_loss": 4.897065491943359, "train_acc": 0.00946, "test_loss": 4.804353742218018, "test_acc": 0.01, "lyapunov": 1.6070060754371116, "grad_norm": 0.34991199227840564, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.001981464747503e-06, "time_sec": 177.5697898864746 }, { "epoch": 143, "train_loss": 4.895145080566406, "train_acc": 0.00966, "test_loss": 4.821014101409912, "test_acc": 0.01, "lyapunov": 1.6025798217110012, "grad_norm": 0.3468579023438424, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.3638335185058295e-06, "time_sec": 177.62174582481384 }, { "epoch": 144, "train_loss": 4.895165930786133, "train_acc": 0.00984, "test_loss": 4.800519823455811, "test_acc": 0.01, "lyapunov": 1.602697217860795, "grad_norm": 0.34813989460737055, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761114e-06, "time_sec": 177.58397316932678 }, { "epoch": 145, "train_loss": 4.896360063476562, "train_acc": 0.01, "test_loss": 4.800519633483887, "test_acc": 0.01, "lyapunov": 1.605867438913916, "grad_norm": 0.3366340618642584, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7390523158633524e-06, "time_sec": 177.5893211364746 }, { "epoch": 146, "train_loss": 4.894688441314697, "train_acc": 0.01, "test_loss": 4.800520404052734, "test_acc": 0.01, "lyapunov": 1.6013682687374027, "grad_norm": 0.3310266277326936, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.7535703752478133e-06, "time_sec": 177.56866335868835 }, { "epoch": 147, "train_loss": 4.894518559265137, "train_acc": 0.01, "test_loss": 4.8005200927734375, "test_acc": 0.01, "lyapunov": 1.600981123307172, "grad_norm": 0.3451840089468246, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642196e-07, "time_sec": 177.56436419487 }, { "epoch": 148, "train_loss": 4.895737046356201, "train_acc": 0.01, "test_loss": 4.800520344543457, "test_acc": 0.01, "lyapunov": 1.6043054953865383, "grad_norm": 0.3208172451267627, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.38584950570808e-07, "time_sec": 177.5520420074463 }, { "epoch": 149, "train_loss": 4.894163135528564, "train_acc": 0.01, "test_loss": 4.800520320892334, "test_acc": 0.01, "lyapunov": 1.5999351096580097, "grad_norm": 0.32420799089770896, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.096582625772501e-07, "time_sec": 177.6083221435547 }, { "epoch": 150, "train_loss": 4.892976047668457, "train_acc": 0.01, "test_loss": 4.8005203384399415, "test_acc": 0.01, "lyapunov": 1.596442692724945, "grad_norm": 0.32157877988197864, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 177.66009068489075 } ] } }