{ "args": { "ckpt_root": "/home/yurenh2/rrm/hrm/checkpoints/Sudoku-extreme-1k-aug-1000 ACT-torch/HierarchicalReasoningModel_ACTV1 righteous-python", "ckpt_name": "step_26040", "n_steps": 500, "batch_size": 8, "lr": 1e-05, "alpha_rf": 10.0, "lambda_star": -0.05, "k_lyap": 2, "lyap_act_steps": 4, "seed": 42, "eval_every": 100, "eval_n": 512, "eval_batch_size": 32, "out": "/home/yurenh2/rrm/research/flossing/step3_C_rf_26040.json" }, "initial_acc": 0.517578125, "initial_tok_acc": 0.8276668595679012, "steps": [ { "step": 0, "sup_loss": 0.5692806735310538, "rf_loss": 8.730140507395845e-06, "total_loss": 0.5693679749379468, "lyap1_mean": -0.18472686409950256, "lyap1_max": -0.04164290055632591, "frac_above_star": 0.125 }, { "step": 1, "sup_loss": 0.4256530641595496, "rf_loss": 0.0, "total_loss": 0.4256530641595496, "lyap1_mean": -0.18686789274215698, "lyap1_max": -0.0872039645910263, "frac_above_star": 0.0 }, { "step": 2, "sup_loss": 0.7297214513564844, "rf_loss": 0.0, "total_loss": 0.7297214513564844, "lyap1_mean": -0.19814404845237732, "lyap1_max": -0.13654550909996033, "frac_above_star": 0.0 }, { "step": 3, "sup_loss": 0.5305226765501326, "rf_loss": 0.0, "total_loss": 0.5305226765501326, "lyap1_mean": -0.18494391441345215, "lyap1_max": -0.09610007703304291, "frac_above_star": 0.0 }, { "step": 4, "sup_loss": 0.6530737764586068, "rf_loss": 0.0, "total_loss": 0.6530737764586068, "lyap1_mean": -0.14886385202407837, "lyap1_max": -0.051897354423999786, "frac_above_star": 0.0 }, { "step": 5, "sup_loss": 0.8219793628339117, "rf_loss": 4.5718057663179934e-05, "total_loss": 0.8224365434105435, "lyap1_mean": -0.14355605840682983, "lyap1_max": -0.03087555430829525, "frac_above_star": 0.125 }, { "step": 6, "sup_loss": 0.6218899233075229, "rf_loss": 0.0, "total_loss": 0.6218899233075229, "lyap1_mean": -0.1884099841117859, "lyap1_max": -0.1256392002105713, "frac_above_star": 0.0 }, { "step": 7, "sup_loss": 0.6366865559939567, "rf_loss": 0.0, "total_loss": 0.6366865559939567, "lyap1_mean": -0.17351576685905457, "lyap1_max": -0.12977278232574463, "frac_above_star": 0.0 }, { "step": 8, "sup_loss": 0.8273739711801417, "rf_loss": 0.0, "total_loss": 0.8273739711801417, "lyap1_mean": -0.15072572231292725, "lyap1_max": -0.10887785255908966, "frac_above_star": 0.0 }, { "step": 9, "sup_loss": 0.8388152816960708, "rf_loss": 5.7935678341891617e-05, "total_loss": 0.8393946384940416, "lyap1_mean": -0.15443460643291473, "lyap1_max": -0.028471289202570915, "frac_above_star": 0.125 }, { "step": 10, "sup_loss": 0.5884922889641484, "rf_loss": 0.0, "total_loss": 0.5884922889641484, "lyap1_mean": -0.17496049404144287, "lyap1_max": -0.096577487885952, "frac_above_star": 0.0 }, { "step": 11, "sup_loss": 0.5878587874187478, "rf_loss": 0.0, "total_loss": 0.5878587874187478, "lyap1_mean": -0.19995838403701782, "lyap1_max": -0.11154899001121521, "frac_above_star": 0.0 }, { "step": 12, "sup_loss": 0.4732437735449548, "rf_loss": 0.0, "total_loss": 0.4732437735449548, "lyap1_mean": -0.18807215988636017, "lyap1_max": -0.11670893430709839, "frac_above_star": 0.0 }, { "step": 13, "sup_loss": 0.6936183670110372, "rf_loss": 0.0, "total_loss": 0.6936183670110372, "lyap1_mean": -0.15418314933776855, "lyap1_max": -0.07703495770692825, "frac_above_star": 0.0 }, { "step": 14, "sup_loss": 0.634786247230436, "rf_loss": 0.0, "total_loss": 0.634786247230436, "lyap1_mean": -0.18757356703281403, "lyap1_max": -0.09002988785505295, "frac_above_star": 0.0 }, { "step": 15, "sup_loss": 0.7161386334910096, "rf_loss": 0.0, "total_loss": 0.7161386334910096, "lyap1_mean": -0.18413621187210083, "lyap1_max": -0.08889326453208923, "frac_above_star": 0.0 }, { "step": 16, "sup_loss": 0.5688225334782482, "rf_loss": 0.0, "total_loss": 0.5688225334782482, "lyap1_mean": -0.18539652228355408, "lyap1_max": -0.1365247368812561, "frac_above_star": 0.0 }, { "step": 17, "sup_loss": 0.7419275285982696, "rf_loss": 0.0, "total_loss": 0.7419275285982696, "lyap1_mean": -0.14077171683311462, "lyap1_max": -0.10038422793149948, "frac_above_star": 0.0 }, { "step": 18, "sup_loss": 0.6251659308804067, "rf_loss": 0.0, "total_loss": 0.6251659308804067, "lyap1_mean": -0.19977544248104095, "lyap1_max": -0.1411890983581543, "frac_above_star": 0.0 }, { "step": 19, "sup_loss": 0.47931541785969645, "rf_loss": 0.0, "total_loss": 0.47931541785969645, "lyap1_mean": -0.19939261674880981, "lyap1_max": -0.05177782475948334, "frac_above_star": 0.0 }, { "step": 20, "sup_loss": 0.5755442567017433, "rf_loss": 0.0, "total_loss": 0.5755442567017433, "lyap1_mean": -0.17150744795799255, "lyap1_max": -0.0765736848115921, "frac_above_star": 0.0 }, { "step": 21, "sup_loss": 0.6602223300636985, "rf_loss": 0.0, "total_loss": 0.6602223300636985, "lyap1_mean": -0.17469163239002228, "lyap1_max": -0.11657081544399261, "frac_above_star": 0.0 }, { "step": 22, "sup_loss": 0.5494241428120278, "rf_loss": 0.0, "total_loss": 0.5494241428120278, "lyap1_mean": -0.18806186318397522, "lyap1_max": -0.13081824779510498, "frac_above_star": 0.0 }, { "step": 23, "sup_loss": 0.5720102900969967, "rf_loss": 0.0, "total_loss": 0.5720102900969967, "lyap1_mean": -0.189255028963089, "lyap1_max": -0.13640080392360687, "frac_above_star": 0.0 }, { "step": 24, "sup_loss": 0.6200697687914075, "rf_loss": 0.0, "total_loss": 0.6200697687914075, "lyap1_mean": -0.18683704733848572, "lyap1_max": -0.15241771936416626, "frac_above_star": 0.0 }, { "step": 25, "sup_loss": 0.7708447275750623, "rf_loss": 7.396034197881818e-05, "total_loss": 0.7715843309948505, "lyap1_mean": -0.13307297229766846, "lyap1_max": -0.02684459462761879, "frac_above_star": 0.25 }, { "step": 26, "sup_loss": 0.7134329074047788, "rf_loss": 0.0, "total_loss": 0.7134329074047788, "lyap1_mean": -0.16006088256835938, "lyap1_max": -0.11834649741649628, "frac_above_star": 0.0 }, { "step": 27, "sup_loss": 0.4433266649670745, "rf_loss": 0.0, "total_loss": 0.4433266649670745, "lyap1_mean": -0.21617424488067627, "lyap1_max": -0.09347926080226898, "frac_above_star": 0.0 }, { "step": 28, "sup_loss": 0.7546234439622822, "rf_loss": 0.0, "total_loss": 0.7546234439622822, "lyap1_mean": -0.1505395770072937, "lyap1_max": -0.08319316804409027, "frac_above_star": 0.0 }, { "step": 29, "sup_loss": 0.7812489796402995, "rf_loss": 0.0, "total_loss": 0.7812489796402995, "lyap1_mean": -0.16996526718139648, "lyap1_max": -0.09263668954372406, "frac_above_star": 0.0 }, { "step": 30, "sup_loss": 0.6161543732921804, "rf_loss": 0.0, "total_loss": 0.6161543732921804, "lyap1_mean": -0.1655355542898178, "lyap1_max": -0.06628571450710297, "frac_above_star": 0.0 }, { "step": 31, "sup_loss": 0.6526502041454323, "rf_loss": 0.0, "total_loss": 0.6526502041454323, "lyap1_mean": -0.16468918323516846, "lyap1_max": -0.0951920673251152, "frac_above_star": 0.0 }, { "step": 32, "sup_loss": 0.6116748757372479, "rf_loss": 0.0, "total_loss": 0.6116748757372479, "lyap1_mean": -0.14170441031455994, "lyap1_max": -0.07779055833816528, "frac_above_star": 0.0 }, { "step": 33, "sup_loss": 0.5715996718656129, "rf_loss": 0.0, "total_loss": 0.5715996718656129, "lyap1_mean": -0.1859581470489502, "lyap1_max": -0.09928901493549347, "frac_above_star": 0.0 }, { "step": 34, "sup_loss": 0.7155047617114231, "rf_loss": 0.0, "total_loss": 0.7155047617114231, "lyap1_mean": -0.16743279993534088, "lyap1_max": -0.13878943026065826, "frac_above_star": 0.0 }, { "step": 35, "sup_loss": 0.405594918584735, "rf_loss": 0.0, "total_loss": 0.405594918584735, "lyap1_mean": -0.20414918661117554, "lyap1_max": -0.1424926221370697, "frac_above_star": 0.0 }, { "step": 36, "sup_loss": 0.5742962932293634, "rf_loss": 0.0, "total_loss": 0.5742962932293634, "lyap1_mean": -0.19033342599868774, "lyap1_max": -0.1235819086432457, "frac_above_star": 0.0 }, { "step": 37, "sup_loss": 0.779355227864023, "rf_loss": 0.0, "total_loss": 0.779355227864023, "lyap1_mean": -0.16759246587753296, "lyap1_max": -0.1254093497991562, "frac_above_star": 0.0 }, { "step": 38, "sup_loss": 0.5656018805901114, "rf_loss": 0.0, "total_loss": 0.5656018805901114, "lyap1_mean": -0.1866704374551773, "lyap1_max": -0.10992076247930527, "frac_above_star": 0.0 }, { "step": 39, "sup_loss": 0.7040410326101555, "rf_loss": 0.0, "total_loss": 0.7040410326101555, "lyap1_mean": -0.17482686042785645, "lyap1_max": -0.1386720836162567, "frac_above_star": 0.0 }, { "step": 40, "sup_loss": 0.6854342059490072, "rf_loss": 0.0, "total_loss": 0.6854342059490072, "lyap1_mean": -0.18073156476020813, "lyap1_max": -0.1336684226989746, "frac_above_star": 0.0 }, { "step": 41, "sup_loss": 0.4590976153719093, "rf_loss": 0.0, "total_loss": 0.4590976153719093, "lyap1_mean": -0.22070184350013733, "lyap1_max": -0.13353635370731354, "frac_above_star": 0.0 }, { "step": 42, "sup_loss": 0.7326898256298093, "rf_loss": 0.0006855739047750831, "total_loss": 0.7395455649103908, "lyap1_mean": -0.15728053450584412, "lyap1_max": 0.024058029055595398, "frac_above_star": 0.125 }, { "step": 43, "sup_loss": 0.7123319703814748, "rf_loss": 0.0, "total_loss": 0.7123319703814748, "lyap1_mean": -0.18902835249900818, "lyap1_max": -0.11963468790054321, "frac_above_star": 0.0 }, { "step": 44, "sup_loss": 0.9444873795921138, "rf_loss": 0.0, "total_loss": 0.9444873795921138, "lyap1_mean": -0.15437626838684082, "lyap1_max": -0.08420934528112411, "frac_above_star": 0.0 }, { "step": 45, "sup_loss": 0.6105991115340909, "rf_loss": 0.0, "total_loss": 0.6105991115340909, "lyap1_mean": -0.16357484459877014, "lyap1_max": -0.09036712348461151, "frac_above_star": 0.0 }, { "step": 46, "sup_loss": 0.6511733318015783, "rf_loss": 0.0, "total_loss": 0.6511733318015783, "lyap1_mean": -0.17456793785095215, "lyap1_max": -0.09218809008598328, "frac_above_star": 0.0 }, { "step": 47, "sup_loss": 0.6681804216542886, "rf_loss": 0.0, "total_loss": 0.6681804216542886, "lyap1_mean": -0.1810278743505478, "lyap1_max": -0.06158395856618881, "frac_above_star": 0.0 }, { "step": 48, "sup_loss": 0.6536462391944303, "rf_loss": 0.0, "total_loss": 0.6536462391944303, "lyap1_mean": -0.1637968271970749, "lyap1_max": -0.059858888387680054, "frac_above_star": 0.0 }, { "step": 49, "sup_loss": 0.5716275082407425, "rf_loss": 0.0, "total_loss": 0.5716275082407425, "lyap1_mean": -0.1786249727010727, "lyap1_max": -0.14303715527057648, "frac_above_star": 0.0 }, { "step": 50, "sup_loss": 0.603092031769928, "rf_loss": 0.0, "total_loss": 0.603092031769928, "lyap1_mean": -0.19462862610816956, "lyap1_max": -0.1409212201833725, "frac_above_star": 0.0 }, { "step": 51, "sup_loss": 0.8258017276412262, "rf_loss": 0.0, "total_loss": 0.8258017276412262, "lyap1_mean": -0.17781853675842285, "lyap1_max": -0.12817521393299103, "frac_above_star": 0.0 }, { "step": 52, "sup_loss": 0.5143208426588572, "rf_loss": 0.0, "total_loss": 0.5143208426588572, "lyap1_mean": -0.18833813071250916, "lyap1_max": -0.067641481757164, "frac_above_star": 0.0 }, { "step": 53, "sup_loss": 0.6277062174054168, "rf_loss": 0.0, "total_loss": 0.6277062174054168, "lyap1_mean": -0.1856500506401062, "lyap1_max": -0.1020214781165123, "frac_above_star": 0.0 }, { "step": 54, "sup_loss": 0.6103892031023235, "rf_loss": 0.0, "total_loss": 0.6103892031023235, "lyap1_mean": -0.16502267122268677, "lyap1_max": -0.12042690813541412, "frac_above_star": 0.0 }, { "step": 55, "sup_loss": 0.6455055669389037, "rf_loss": 0.0, "total_loss": 0.6455055669389037, "lyap1_mean": -0.19511613249778748, "lyap1_max": -0.1421412229537964, "frac_above_star": 0.0 }, { "step": 56, "sup_loss": 0.6145164240286488, "rf_loss": 0.0, "total_loss": 0.6145164240286488, "lyap1_mean": -0.20549499988555908, "lyap1_max": -0.12187451124191284, "frac_above_star": 0.0 }, { "step": 57, "sup_loss": 0.5940261257955141, "rf_loss": 0.0, "total_loss": 0.5940261257955141, "lyap1_mean": -0.17917832732200623, "lyap1_max": -0.11406894028186798, "frac_above_star": 0.0 }, { "step": 58, "sup_loss": 0.6619334911749458, "rf_loss": 0.0, "total_loss": 0.6619334911749458, "lyap1_mean": -0.164550319314003, "lyap1_max": -0.11046522855758667, "frac_above_star": 0.0 }, { "step": 59, "sup_loss": 0.4150616594111256, "rf_loss": 0.0, "total_loss": 0.4150616594111256, "lyap1_mean": -0.22426193952560425, "lyap1_max": -0.1789734661579132, "frac_above_star": 0.0 }, { "step": 60, "sup_loss": 0.6366023342544679, "rf_loss": 0.0, "total_loss": 0.6366023342544679, "lyap1_mean": -0.1950746476650238, "lyap1_max": -0.1201804131269455, "frac_above_star": 0.0 }, { "step": 61, "sup_loss": 0.5621954120897326, "rf_loss": 0.0, "total_loss": 0.5621954120897326, "lyap1_mean": -0.1846153736114502, "lyap1_max": -0.06914173066616058, "frac_above_star": 0.0 }, { "step": 62, "sup_loss": 0.4090317561733625, "rf_loss": 0.0, "total_loss": 0.4090317561733625, "lyap1_mean": -0.19688698649406433, "lyap1_max": -0.09841044247150421, "frac_above_star": 0.0 }, { "step": 63, "sup_loss": 0.6444829295462823, "rf_loss": 0.0, "total_loss": 0.6444829295462823, "lyap1_mean": -0.15889519453048706, "lyap1_max": -0.058723412454128265, "frac_above_star": 0.0 }, { "step": 64, "sup_loss": 0.6032293179857517, "rf_loss": 2.3355278244707733e-06, "total_loss": 0.6032526732639965, "lyap1_mean": -0.16479796171188354, "lyap1_max": -0.04567747563123703, "frac_above_star": 0.125 }, { "step": 65, "sup_loss": 0.8559884240257292, "rf_loss": 0.0, "total_loss": 0.8559884240257292, "lyap1_mean": -0.1752115786075592, "lyap1_max": -0.12007348239421844, "frac_above_star": 0.0 }, { "step": 66, "sup_loss": 0.6215779601100612, "rf_loss": 0.0, "total_loss": 0.6215779601100612, "lyap1_mean": -0.17921197414398193, "lyap1_max": -0.12914569675922394, "frac_above_star": 0.0 }, { "step": 67, "sup_loss": 0.5663748954082356, "rf_loss": 0.0, "total_loss": 0.5663748954082356, "lyap1_mean": -0.18078398704528809, "lyap1_max": -0.12422117590904236, "frac_above_star": 0.0 }, { "step": 68, "sup_loss": 0.681322342192105, "rf_loss": 0.0, "total_loss": 0.681322342192105, "lyap1_mean": -0.19753026962280273, "lyap1_max": -0.14116621017456055, "frac_above_star": 0.0 }, { "step": 69, "sup_loss": 0.724612880165071, "rf_loss": 0.0, "total_loss": 0.724612880165071, "lyap1_mean": -0.17135238647460938, "lyap1_max": -0.11894424259662628, "frac_above_star": 0.0 }, { "step": 70, "sup_loss": 0.6548271197096364, "rf_loss": 0.0, "total_loss": 0.6548271197096364, "lyap1_mean": -0.2083948403596878, "lyap1_max": -0.12929992377758026, "frac_above_star": 0.0 }, { "step": 71, "sup_loss": 0.7001088288185602, "rf_loss": 0.0, "total_loss": 0.7001088288185602, "lyap1_mean": -0.1846844106912613, "lyap1_max": -0.16559511423110962, "frac_above_star": 0.0 }, { "step": 72, "sup_loss": 0.6152699486939265, "rf_loss": 0.0, "total_loss": 0.6152699486939265, "lyap1_mean": -0.19737334549427032, "lyap1_max": -0.050438061356544495, "frac_above_star": 0.0 }, { "step": 73, "sup_loss": 0.5330825014170364, "rf_loss": 0.0, "total_loss": 0.5330825014170364, "lyap1_mean": -0.2135828584432602, "lyap1_max": -0.15321503579616547, "frac_above_star": 0.0 }, { "step": 74, "sup_loss": 0.7178433843512522, "rf_loss": 0.0, "total_loss": 0.7178433843512522, "lyap1_mean": -0.20191745460033417, "lyap1_max": -0.09855665266513824, "frac_above_star": 0.0 }, { "step": 75, "sup_loss": 0.5494383288488749, "rf_loss": 0.0, "total_loss": 0.5494383288488749, "lyap1_mean": -0.16783832013607025, "lyap1_max": -0.08376707881689072, "frac_above_star": 0.0 }, { "step": 76, "sup_loss": 0.560307411121749, "rf_loss": 0.0, "total_loss": 0.560307411121749, "lyap1_mean": -0.20312337577342987, "lyap1_max": -0.13778817653656006, "frac_above_star": 0.0 }, { "step": 77, "sup_loss": 0.5539597423634346, "rf_loss": 0.0, "total_loss": 0.5539597423634346, "lyap1_mean": -0.18205776810646057, "lyap1_max": -0.139293372631073, "frac_above_star": 0.0 }, { "step": 78, "sup_loss": 0.8142099924852012, "rf_loss": 0.0, "total_loss": 0.8142099924852012, "lyap1_mean": -0.17192959785461426, "lyap1_max": -0.11066693067550659, "frac_above_star": 0.0 }, { "step": 79, "sup_loss": 0.7390341665853719, "rf_loss": 0.0, "total_loss": 0.7390341665853719, "lyap1_mean": -0.17934057116508484, "lyap1_max": -0.14188216626644135, "frac_above_star": 0.0 }, { "step": 80, "sup_loss": 0.6894345472396097, "rf_loss": 0.0, "total_loss": 0.6894345472396097, "lyap1_mean": -0.19345922768115997, "lyap1_max": -0.10066233575344086, "frac_above_star": 0.0 }, { "step": 81, "sup_loss": 0.48982314214698575, "rf_loss": 0.0, "total_loss": 0.48982314214698575, "lyap1_mean": -0.19416800141334534, "lyap1_max": -0.09982820600271225, "frac_above_star": 0.0 }, { "step": 82, "sup_loss": 0.5869300998628438, "rf_loss": 8.435400786765967e-07, "total_loss": 0.5869385352634032, "lyap1_mean": -0.20247265696525574, "lyap1_max": -0.04740224778652191, "frac_above_star": 0.125 }, { "step": 83, "sup_loss": 0.6842885951991206, "rf_loss": 0.0, "total_loss": 0.6842885951991206, "lyap1_mean": -0.18653219938278198, "lyap1_max": -0.13923929631710052, "frac_above_star": 0.0 }, { "step": 84, "sup_loss": 0.6780766391534829, "rf_loss": 0.0, "total_loss": 0.6780766391534829, "lyap1_mean": -0.17154312133789062, "lyap1_max": -0.08502425998449326, "frac_above_star": 0.0 }, { "step": 85, "sup_loss": 0.7446607674675148, "rf_loss": 0.0, "total_loss": 0.7446607674675148, "lyap1_mean": -0.1939150094985962, "lyap1_max": -0.12365493178367615, "frac_above_star": 0.0 }, { "step": 86, "sup_loss": 0.7088483602063388, "rf_loss": 0.0, "total_loss": 0.7088483602063388, "lyap1_mean": -0.21206793189048767, "lyap1_max": -0.1382783204317093, "frac_above_star": 0.0 }, { "step": 87, "sup_loss": 0.6548089941804851, "rf_loss": 0.0, "total_loss": 0.6548089941804851, "lyap1_mean": -0.1882571578025818, "lyap1_max": -0.15231479704380035, "frac_above_star": 0.0 }, { "step": 88, "sup_loss": 0.8375563116736965, "rf_loss": 0.0, "total_loss": 0.8375563116736965, "lyap1_mean": -0.1890907734632492, "lyap1_max": -0.061795737594366074, "frac_above_star": 0.0 }, { "step": 89, "sup_loss": 0.7943912132026928, "rf_loss": 0.0, "total_loss": 0.7943912132026928, "lyap1_mean": -0.17644642293453217, "lyap1_max": -0.1137496829032898, "frac_above_star": 0.0 }, { "step": 90, "sup_loss": 0.4358871156373397, "rf_loss": 0.0, "total_loss": 0.4358871156373397, "lyap1_mean": -0.19933903217315674, "lyap1_max": -0.12500867247581482, "frac_above_star": 0.0 }, { "step": 91, "sup_loss": 0.6397124120544256, "rf_loss": 0.0, "total_loss": 0.6397124120544256, "lyap1_mean": -0.1956581175327301, "lyap1_max": -0.1527823805809021, "frac_above_star": 0.0 }, { "step": 92, "sup_loss": 0.6943673993377347, "rf_loss": 0.0, "total_loss": 0.6943673993377347, "lyap1_mean": -0.19748640060424805, "lyap1_max": -0.12701278924942017, "frac_above_star": 0.0 }, { "step": 93, "sup_loss": 0.5266307041969792, "rf_loss": 0.0, "total_loss": 0.5266307041969792, "lyap1_mean": -0.2056117206811905, "lyap1_max": -0.13870689272880554, "frac_above_star": 0.0 }, { "step": 94, "sup_loss": 0.6972693876216245, "rf_loss": 0.0, "total_loss": 0.6972693876216245, "lyap1_mean": -0.1784152388572693, "lyap1_max": -0.11077430844306946, "frac_above_star": 0.0 }, { "step": 95, "sup_loss": 0.6702732523663966, "rf_loss": 0.0, "total_loss": 0.6702732523663966, "lyap1_mean": -0.19987890124320984, "lyap1_max": -0.1555045247077942, "frac_above_star": 0.0 }, { "step": 96, "sup_loss": 0.7178331592585567, "rf_loss": 0.0, "total_loss": 0.7178331592585567, "lyap1_mean": -0.19023260474205017, "lyap1_max": -0.11993156373500824, "frac_above_star": 0.0 }, { "step": 97, "sup_loss": 0.4032309093915764, "rf_loss": 0.0, "total_loss": 0.4032309093915764, "lyap1_mean": -0.1976034939289093, "lyap1_max": -0.14226825535297394, "frac_above_star": 0.0 }, { "step": 98, "sup_loss": 0.9127691885507438, "rf_loss": 0.0, "total_loss": 0.9127691885507438, "lyap1_mean": -0.20238561928272247, "lyap1_max": -0.14032000303268433, "frac_above_star": 0.0 }, { "step": 99, "sup_loss": 0.6567831590498325, "rf_loss": 0.0, "total_loss": 0.6567831590498325, "lyap1_mean": -0.20472730696201324, "lyap1_max": -0.1166522428393364, "frac_above_star": 0.0 }, { "step": 100, "sup_loss": 0.5994851694257204, "rf_loss": 0.0, "total_loss": 0.5994851694257204, "lyap1_mean": -0.20277434587478638, "lyap1_max": -0.13231883943080902, "frac_above_star": 0.0 }, { "step": 101, "sup_loss": 0.5436927602746822, "rf_loss": 0.00010434372234158218, "total_loss": 0.5447361975563056, "lyap1_mean": -0.1669021099805832, "lyap1_max": -0.02110796421766281, "frac_above_star": 0.125 }, { "step": 102, "sup_loss": 0.6854589286347211, "rf_loss": 0.0, "total_loss": 0.6854589286347211, "lyap1_mean": -0.19036145508289337, "lyap1_max": -0.1197056919336319, "frac_above_star": 0.0 }, { "step": 103, "sup_loss": 0.6398141625252861, "rf_loss": 0.0, "total_loss": 0.6398141625252861, "lyap1_mean": -0.19734860956668854, "lyap1_max": -0.14658886194229126, "frac_above_star": 0.0 }, { "step": 104, "sup_loss": 0.7240415879906443, "rf_loss": 0.0, "total_loss": 0.7240415879906443, "lyap1_mean": -0.1635725200176239, "lyap1_max": -0.08775108307600021, "frac_above_star": 0.0 }, { "step": 105, "sup_loss": 0.7421535566166461, "rf_loss": 0.0, "total_loss": 0.7421535566166461, "lyap1_mean": -0.18113252520561218, "lyap1_max": -0.11357490718364716, "frac_above_star": 0.0 }, { "step": 106, "sup_loss": 0.6658438252352756, "rf_loss": 0.0, "total_loss": 0.6658438252352756, "lyap1_mean": -0.1905079334974289, "lyap1_max": -0.10756576061248779, "frac_above_star": 0.0 }, { "step": 107, "sup_loss": 0.6255287965005226, "rf_loss": 0.0, "total_loss": 0.6255287965005226, "lyap1_mean": -0.18496447801589966, "lyap1_max": -0.11795295774936676, "frac_above_star": 0.0 }, { "step": 108, "sup_loss": 0.6415584925304553, "rf_loss": 2.2425259885494597e-05, "total_loss": 0.6417827451256722, "lyap1_mean": -0.1817285269498825, "lyap1_max": -0.036605894565582275, "frac_above_star": 0.125 }, { "step": 109, "sup_loss": 0.7917047679250432, "rf_loss": 0.0, "total_loss": 0.7917047679250432, "lyap1_mean": -0.17028799653053284, "lyap1_max": -0.11498349159955978, "frac_above_star": 0.0 }, { "step": 110, "sup_loss": 0.5832977131575414, "rf_loss": 0.0, "total_loss": 0.5832977131575414, "lyap1_mean": -0.19843491911888123, "lyap1_max": -0.1628326177597046, "frac_above_star": 0.0 }, { "step": 111, "sup_loss": 0.7156677699012743, "rf_loss": 2.832912105077412e-05, "total_loss": 0.7159510611154201, "lyap1_mean": -0.18722228705883026, "lyap1_max": -0.034945666790008545, "frac_above_star": 0.125 }, { "step": 112, "sup_loss": 0.6814256596508148, "rf_loss": 0.0, "total_loss": 0.6814256596508148, "lyap1_mean": -0.16948023438453674, "lyap1_max": -0.10405611246824265, "frac_above_star": 0.0 }, { "step": 113, "sup_loss": 0.6723503993307438, "rf_loss": 0.0, "total_loss": 0.6723503993307438, "lyap1_mean": -0.17860108613967896, "lyap1_max": -0.08338036388158798, "frac_above_star": 0.0 }, { "step": 114, "sup_loss": 0.5544590957495593, "rf_loss": 0.0, "total_loss": 0.5544590957495593, "lyap1_mean": -0.21950607001781464, "lyap1_max": -0.12801465392112732, "frac_above_star": 0.0 }, { "step": 115, "sup_loss": 0.5981281308295814, "rf_loss": 0.0, "total_loss": 0.5981281308295814, "lyap1_mean": -0.17478057742118835, "lyap1_max": -0.09439365565776825, "frac_above_star": 0.0 }, { "step": 116, "sup_loss": 0.6474670975699613, "rf_loss": 0.0, "total_loss": 0.6474670975699613, "lyap1_mean": -0.18672454357147217, "lyap1_max": -0.12268798053264618, "frac_above_star": 0.0 }, { "step": 117, "sup_loss": 0.8041441807898295, "rf_loss": 0.0, "total_loss": 0.8041441807898295, "lyap1_mean": -0.17857396602630615, "lyap1_max": -0.13994570076465607, "frac_above_star": 0.0 }, { "step": 118, "sup_loss": 0.4998158286401133, "rf_loss": 0.0, "total_loss": 0.4998158286401133, "lyap1_mean": -0.1981722116470337, "lyap1_max": -0.10624043643474579, "frac_above_star": 0.0 }, { "step": 119, "sup_loss": 0.58764011100537, "rf_loss": 0.0, "total_loss": 0.58764011100537, "lyap1_mean": -0.19531869888305664, "lyap1_max": -0.1328994482755661, "frac_above_star": 0.0 }, { "step": 120, "sup_loss": 0.5877959165633464, "rf_loss": 0.0, "total_loss": 0.5877959165633464, "lyap1_mean": -0.2022669017314911, "lyap1_max": -0.15155364573001862, "frac_above_star": 0.0 }, { "step": 121, "sup_loss": 0.7102715727481126, "rf_loss": 4.036358859593747e-06, "total_loss": 0.710311936337618, "lyap1_mean": -0.17315416038036346, "lyap1_max": -0.044317495077848434, "frac_above_star": 0.125 }, { "step": 122, "sup_loss": 0.7486520809548546, "rf_loss": 0.0, "total_loss": 0.7486520809548546, "lyap1_mean": -0.19023016095161438, "lyap1_max": -0.1492830067873001, "frac_above_star": 0.0 }, { "step": 123, "sup_loss": 0.7256768742762878, "rf_loss": 0.0, "total_loss": 0.7256768742762878, "lyap1_mean": -0.2051115185022354, "lyap1_max": -0.13396583497524261, "frac_above_star": 0.0 }, { "step": 124, "sup_loss": 0.8365473740745412, "rf_loss": 0.0, "total_loss": 0.8365473740745412, "lyap1_mean": -0.2048102766275406, "lyap1_max": -0.15678644180297852, "frac_above_star": 0.0 }, { "step": 125, "sup_loss": 0.5929228659299373, "rf_loss": 6.58467479297542e-06, "total_loss": 0.5929887126769575, "lyap1_mean": -0.2139703631401062, "lyap1_max": -0.042742080986499786, "frac_above_star": 0.125 }, { "step": 126, "sup_loss": 0.532579717617711, "rf_loss": 0.0, "total_loss": 0.532579717617711, "lyap1_mean": -0.2120150476694107, "lyap1_max": -0.1323821246623993, "frac_above_star": 0.0 }, { "step": 127, "sup_loss": 0.5116838507358473, "rf_loss": 0.0, "total_loss": 0.5116838507358473, "lyap1_mean": -0.21394801139831543, "lyap1_max": -0.12784112989902496, "frac_above_star": 0.0 }, { "step": 128, "sup_loss": 0.4772271903006805, "rf_loss": 0.0, "total_loss": 0.4772271903006805, "lyap1_mean": -0.1926710456609726, "lyap1_max": -0.08498414605855942, "frac_above_star": 0.0 }, { "step": 129, "sup_loss": 0.4008461127505293, "rf_loss": 0.0, "total_loss": 0.4008461127505293, "lyap1_mean": -0.20454956591129303, "lyap1_max": -0.13309788703918457, "frac_above_star": 0.0 }, { "step": 130, "sup_loss": 0.7495469966120952, "rf_loss": 5.145889645064017e-06, "total_loss": 0.7495984555094554, "lyap1_mean": -0.18169043958187103, "lyap1_max": -0.043583840131759644, "frac_above_star": 0.125 }, { "step": 131, "sup_loss": 0.4312446202546212, "rf_loss": 0.0, "total_loss": 0.4312446202546212, "lyap1_mean": -0.21696242690086365, "lyap1_max": -0.15814265608787537, "frac_above_star": 0.0 }, { "step": 132, "sup_loss": 0.5582560007559362, "rf_loss": 0.0, "total_loss": 0.5582560007559362, "lyap1_mean": -0.20400217175483704, "lyap1_max": -0.13376562297344208, "frac_above_star": 0.0 }, { "step": 133, "sup_loss": 0.7041088457924948, "rf_loss": 0.0, "total_loss": 0.7041088457924948, "lyap1_mean": -0.20680229365825653, "lyap1_max": -0.1754983514547348, "frac_above_star": 0.0 }, { "step": 134, "sup_loss": 0.563875814983224, "rf_loss": 0.0, "total_loss": 0.563875814983224, "lyap1_mean": -0.22375597059726715, "lyap1_max": -0.1756380796432495, "frac_above_star": 0.0 }, { "step": 135, "sup_loss": 0.5877927375513854, "rf_loss": 0.0, "total_loss": 0.5877927375513854, "lyap1_mean": -0.18356719613075256, "lyap1_max": -0.13984067738056183, "frac_above_star": 0.0 }, { "step": 136, "sup_loss": 0.6967049828519027, "rf_loss": 0.0, "total_loss": 0.6967049828519027, "lyap1_mean": -0.20563051104545593, "lyap1_max": -0.13849720358848572, "frac_above_star": 0.0 }, { "step": 137, "sup_loss": 0.7493791300779891, "rf_loss": 0.0, "total_loss": 0.7493791300779891, "lyap1_mean": -0.18854603171348572, "lyap1_max": -0.1198568046092987, "frac_above_star": 0.0 }, { "step": 138, "sup_loss": 0.5831394019311282, "rf_loss": 0.0, "total_loss": 0.5831394019311282, "lyap1_mean": -0.2047521024942398, "lyap1_max": -0.09193161129951477, "frac_above_star": 0.0 }, { "step": 139, "sup_loss": 0.7034274396937668, "rf_loss": 0.0, "total_loss": 0.7034274396937668, "lyap1_mean": -0.2071250081062317, "lyap1_max": -0.1298181712627411, "frac_above_star": 0.0 }, { "step": 140, "sup_loss": 0.8352350575091843, "rf_loss": 0.0, "total_loss": 0.8352350575091843, "lyap1_mean": -0.20648932456970215, "lyap1_max": -0.12333369255065918, "frac_above_star": 0.0 }, { "step": 141, "sup_loss": 0.8202135030534674, "rf_loss": 0.0, "total_loss": 0.8202135030534674, "lyap1_mean": -0.19115962088108063, "lyap1_max": -0.12690258026123047, "frac_above_star": 0.0 }, { "step": 142, "sup_loss": 0.4437849793664359, "rf_loss": 0.0, "total_loss": 0.4437849793664359, "lyap1_mean": -0.21630491316318512, "lyap1_max": -0.07135376334190369, "frac_above_star": 0.0 }, { "step": 143, "sup_loss": 0.5956905084282531, "rf_loss": 0.0, "total_loss": 0.5956905084282531, "lyap1_mean": -0.23176078498363495, "lyap1_max": -0.1232210025191307, "frac_above_star": 0.0 }, { "step": 144, "sup_loss": 0.8676920416610701, "rf_loss": 0.0, "total_loss": 0.8676920416610701, "lyap1_mean": -0.16267666220664978, "lyap1_max": -0.12483109533786774, "frac_above_star": 0.0 }, { "step": 145, "sup_loss": 0.8153725133475355, "rf_loss": 0.0, "total_loss": 0.8153725133475355, "lyap1_mean": -0.17761245369911194, "lyap1_max": -0.11855889856815338, "frac_above_star": 0.0 }, { "step": 146, "sup_loss": 0.5622308373239437, "rf_loss": 0.0, "total_loss": 0.5622308373239437, "lyap1_mean": -0.2352740466594696, "lyap1_max": -0.15084615349769592, "frac_above_star": 0.0 }, { "step": 147, "sup_loss": 0.6061167118306385, "rf_loss": 0.0, "total_loss": 0.6061167118306385, "lyap1_mean": -0.18306130170822144, "lyap1_max": -0.14161424338817596, "frac_above_star": 0.0 }, { "step": 148, "sup_loss": 0.646654928721227, "rf_loss": 0.0, "total_loss": 0.646654928721227, "lyap1_mean": -0.2142477035522461, "lyap1_max": -0.1069549024105072, "frac_above_star": 0.0 }, { "step": 149, "sup_loss": 0.4528785677865034, "rf_loss": 0.0, "total_loss": 0.4528785677865034, "lyap1_mean": -0.23243194818496704, "lyap1_max": -0.18399018049240112, "frac_above_star": 0.0 }, { "step": 150, "sup_loss": 0.6228646929758556, "rf_loss": 0.0, "total_loss": 0.6228646929758556, "lyap1_mean": -0.2326427400112152, "lyap1_max": -0.13410033285617828, "frac_above_star": 0.0 }, { "step": 151, "sup_loss": 0.5784476138471064, "rf_loss": 0.0, "total_loss": 0.5784476138471064, "lyap1_mean": -0.19768209755420685, "lyap1_max": -0.08153486996889114, "frac_above_star": 0.0 }, { "step": 152, "sup_loss": 0.6835010917593224, "rf_loss": 0.0, "total_loss": 0.6835010917593224, "lyap1_mean": -0.20450472831726074, "lyap1_max": -0.1402837634086609, "frac_above_star": 0.0 }, { "step": 153, "sup_loss": 0.6460169724066586, "rf_loss": 0.0, "total_loss": 0.6460169724066586, "lyap1_mean": -0.1713595688343048, "lyap1_max": -0.08505097031593323, "frac_above_star": 0.0 }, { "step": 154, "sup_loss": 0.6073178057823506, "rf_loss": 4.770677332999185e-05, "total_loss": 0.6077948735010986, "lyap1_mean": -0.17077234387397766, "lyap1_max": -0.03046402893960476, "frac_above_star": 0.125 }, { "step": 155, "sup_loss": 0.5707823729647311, "rf_loss": 0.0, "total_loss": 0.5707823729647311, "lyap1_mean": -0.20443472266197205, "lyap1_max": -0.12300200760364532, "frac_above_star": 0.0 }, { "step": 156, "sup_loss": 0.7517248274665449, "rf_loss": 0.0, "total_loss": 0.7517248274665449, "lyap1_mean": -0.21624569594860077, "lyap1_max": -0.15273524820804596, "frac_above_star": 0.0 }, { "step": 157, "sup_loss": 0.7550228256164159, "rf_loss": 0.0, "total_loss": 0.7550228256164159, "lyap1_mean": -0.20119717717170715, "lyap1_max": -0.13842016458511353, "frac_above_star": 0.0 }, { "step": 158, "sup_loss": 0.8257631081075811, "rf_loss": 0.0, "total_loss": 0.8257631081075811, "lyap1_mean": -0.18291744589805603, "lyap1_max": -0.11714653670787811, "frac_above_star": 0.0 }, { "step": 159, "sup_loss": 0.6355959916056814, "rf_loss": 0.0, "total_loss": 0.6355959916056814, "lyap1_mean": -0.2216596007347107, "lyap1_max": -0.12651950120925903, "frac_above_star": 0.0 }, { "step": 160, "sup_loss": 0.8345994522684059, "rf_loss": 0.0, "total_loss": 0.8345994522684059, "lyap1_mean": -0.170243501663208, "lyap1_max": -0.08337725698947906, "frac_above_star": 0.0 }, { "step": 161, "sup_loss": 0.400479856276031, "rf_loss": 0.0, "total_loss": 0.400479856276031, "lyap1_mean": -0.23095226287841797, "lyap1_max": -0.15229277312755585, "frac_above_star": 0.0 }, { "step": 162, "sup_loss": 0.4768457229339521, "rf_loss": 0.0, "total_loss": 0.4768457229339521, "lyap1_mean": -0.23988571763038635, "lyap1_max": -0.13837072253227234, "frac_above_star": 0.0 }, { "step": 163, "sup_loss": 0.6855541955945201, "rf_loss": 0.0, "total_loss": 0.6855541955945201, "lyap1_mean": -0.20827777683734894, "lyap1_max": -0.1385776251554489, "frac_above_star": 0.0 }, { "step": 164, "sup_loss": 0.5615322774888153, "rf_loss": 3.528164961608127e-05, "total_loss": 0.5618850939704242, "lyap1_mean": -0.17946332693099976, "lyap1_max": -0.03319960832595825, "frac_above_star": 0.125 }, { "step": 165, "sup_loss": 0.46664185241567757, "rf_loss": 0.0, "total_loss": 0.46664185241567757, "lyap1_mean": -0.22228142619132996, "lyap1_max": -0.14169782400131226, "frac_above_star": 0.0 }, { "step": 166, "sup_loss": 0.7100832104551925, "rf_loss": 6.677029159618542e-05, "total_loss": 0.7107509133857063, "lyap1_mean": -0.18150594830513, "lyap1_max": -0.0268880482763052, "frac_above_star": 0.125 }, { "step": 167, "sup_loss": 0.8433739255526028, "rf_loss": 0.0, "total_loss": 0.8433739255526028, "lyap1_mean": -0.1936882734298706, "lyap1_max": -0.10591065138578415, "frac_above_star": 0.0 }, { "step": 168, "sup_loss": 0.7218067810208214, "rf_loss": 0.0, "total_loss": 0.7218067810208214, "lyap1_mean": -0.20266053080558777, "lyap1_max": -0.14435790479183197, "frac_above_star": 0.0 }, { "step": 169, "sup_loss": 0.5928926416845838, "rf_loss": 0.0, "total_loss": 0.5928926416845838, "lyap1_mean": -0.20775346457958221, "lyap1_max": -0.13561299443244934, "frac_above_star": 0.0 }, { "step": 170, "sup_loss": 0.4930069609340155, "rf_loss": 0.0, "total_loss": 0.4930069609340155, "lyap1_mean": -0.24277272820472717, "lyap1_max": -0.15739299356937408, "frac_above_star": 0.0 }, { "step": 171, "sup_loss": 0.6495077558904317, "rf_loss": 0.0, "total_loss": 0.6495077558904317, "lyap1_mean": -0.18608960509300232, "lyap1_max": -0.13392075896263123, "frac_above_star": 0.0 }, { "step": 172, "sup_loss": 0.5778910870978861, "rf_loss": 0.0, "total_loss": 0.5778910870978861, "lyap1_mean": -0.1896805763244629, "lyap1_max": -0.12239302694797516, "frac_above_star": 0.0 }, { "step": 173, "sup_loss": 0.5670474070025211, "rf_loss": 0.0, "total_loss": 0.5670474070025211, "lyap1_mean": -0.20000123977661133, "lyap1_max": -0.13916289806365967, "frac_above_star": 0.0 }, { "step": 174, "sup_loss": 0.8113227436469832, "rf_loss": 0.0, "total_loss": 0.8113227436469832, "lyap1_mean": -0.20318841934204102, "lyap1_max": -0.0724237710237503, "frac_above_star": 0.0 }, { "step": 175, "sup_loss": 0.5686242042782321, "rf_loss": 0.0, "total_loss": 0.5686242042782321, "lyap1_mean": -0.20981794595718384, "lyap1_max": -0.12486933171749115, "frac_above_star": 0.0 }, { "step": 176, "sup_loss": 0.6433767881453153, "rf_loss": 0.0, "total_loss": 0.6433767881453153, "lyap1_mean": -0.18674199283123016, "lyap1_max": -0.121048703789711, "frac_above_star": 0.0 }, { "step": 177, "sup_loss": 0.632422996664613, "rf_loss": 0.0, "total_loss": 0.632422996664613, "lyap1_mean": -0.17558817565441132, "lyap1_max": -0.1252283751964569, "frac_above_star": 0.0 }, { "step": 178, "sup_loss": 0.5675086403532894, "rf_loss": 0.0, "total_loss": 0.5675086403532894, "lyap1_mean": -0.2108987271785736, "lyap1_max": -0.15896984934806824, "frac_above_star": 0.0 }, { "step": 179, "sup_loss": 0.6308019669801944, "rf_loss": 0.0, "total_loss": 0.6308019669801944, "lyap1_mean": -0.1990661919116974, "lyap1_max": -0.16533495485782623, "frac_above_star": 0.0 }, { "step": 180, "sup_loss": 0.61015281138549, "rf_loss": 0.0004897950566373765, "total_loss": 0.6150507620682791, "lyap1_mean": -0.16111186146736145, "lyap1_max": 0.0022938873153179884, "frac_above_star": 0.25 }, { "step": 181, "sup_loss": 0.5258386702329458, "rf_loss": 0.0, "total_loss": 0.5258386702329458, "lyap1_mean": -0.21739423274993896, "lyap1_max": -0.15318156778812408, "frac_above_star": 0.0 }, { "step": 182, "sup_loss": 0.6280928429612475, "rf_loss": 0.0, "total_loss": 0.6280928429612475, "lyap1_mean": -0.19950926303863525, "lyap1_max": -0.14998115599155426, "frac_above_star": 0.0 }, { "step": 183, "sup_loss": 0.6073739712056119, "rf_loss": 0.0, "total_loss": 0.6073739712056119, "lyap1_mean": -0.1919657588005066, "lyap1_max": -0.060053758323192596, "frac_above_star": 0.0 }, { "step": 184, "sup_loss": 0.449097527668729, "rf_loss": 0.0, "total_loss": 0.449097527668729, "lyap1_mean": -0.21088320016860962, "lyap1_max": -0.14188550412654877, "frac_above_star": 0.0 }, { "step": 185, "sup_loss": 0.41847866772665626, "rf_loss": 0.0, "total_loss": 0.41847866772665626, "lyap1_mean": -0.2498043030500412, "lyap1_max": -0.15051552653312683, "frac_above_star": 0.0 }, { "step": 186, "sup_loss": 0.5470732300834652, "rf_loss": 0.0, "total_loss": 0.5470732300834652, "lyap1_mean": -0.21463564038276672, "lyap1_max": -0.13305023312568665, "frac_above_star": 0.0 }, { "step": 187, "sup_loss": 0.5928415066305116, "rf_loss": 0.0, "total_loss": 0.5928415066305116, "lyap1_mean": -0.21944648027420044, "lyap1_max": -0.15302401781082153, "frac_above_star": 0.0 }, { "step": 188, "sup_loss": 0.7115969208547334, "rf_loss": 0.0, "total_loss": 0.7115969208547334, "lyap1_mean": -0.19479309022426605, "lyap1_max": -0.10219204425811768, "frac_above_star": 0.0 }, { "step": 189, "sup_loss": 0.8666635708379027, "rf_loss": 0.0, "total_loss": 0.8666635708379027, "lyap1_mean": -0.20331376791000366, "lyap1_max": -0.1257995069026947, "frac_above_star": 0.0 }, { "step": 190, "sup_loss": 0.5491049317698938, "rf_loss": 0.0, "total_loss": 0.5491049317698938, "lyap1_mean": -0.18936565518379211, "lyap1_max": -0.12966521084308624, "frac_above_star": 0.0 }, { "step": 191, "sup_loss": 0.7180045364776377, "rf_loss": 0.0, "total_loss": 0.7180045364776377, "lyap1_mean": -0.19625556468963623, "lyap1_max": -0.13425108790397644, "frac_above_star": 0.0 }, { "step": 192, "sup_loss": 0.6155840207892554, "rf_loss": 0.0, "total_loss": 0.6155840207892554, "lyap1_mean": -0.21135061979293823, "lyap1_max": -0.16226764023303986, "frac_above_star": 0.0 }, { "step": 193, "sup_loss": 0.4395152414453938, "rf_loss": 0.0, "total_loss": 0.4395152414453938, "lyap1_mean": -0.2165890336036682, "lyap1_max": -0.08697529882192612, "frac_above_star": 0.0 }, { "step": 194, "sup_loss": 0.8777933349330381, "rf_loss": 0.0, "total_loss": 0.8777933349330381, "lyap1_mean": -0.17694713175296783, "lyap1_max": -0.13006161153316498, "frac_above_star": 0.0 }, { "step": 195, "sup_loss": 0.4676728214698174, "rf_loss": 0.0, "total_loss": 0.4676728214698174, "lyap1_mean": -0.20978495478630066, "lyap1_max": -0.06491933017969131, "frac_above_star": 0.0 }, { "step": 196, "sup_loss": 0.8157122276216145, "rf_loss": 0.0, "total_loss": 0.8157122276216145, "lyap1_mean": -0.1560392677783966, "lyap1_max": -0.11054389178752899, "frac_above_star": 0.0 }, { "step": 197, "sup_loss": 0.6887069531016712, "rf_loss": 0.0, "total_loss": 0.6887069531016712, "lyap1_mean": -0.22056058049201965, "lyap1_max": -0.1249123364686966, "frac_above_star": 0.0 }, { "step": 198, "sup_loss": 0.6549785822953171, "rf_loss": 0.0, "total_loss": 0.6549785822953171, "lyap1_mean": -0.20498737692832947, "lyap1_max": -0.14473292231559753, "frac_above_star": 0.0 }, { "step": 199, "sup_loss": 0.5931491489256056, "rf_loss": 0.0, "total_loss": 0.5931491489256056, "lyap1_mean": -0.16275423765182495, "lyap1_max": -0.07426565140485764, "frac_above_star": 0.0 }, { "step": 200, "sup_loss": 0.7647836789121369, "rf_loss": 0.0, "total_loss": 0.7647836789121369, "lyap1_mean": -0.1644914448261261, "lyap1_max": -0.08896409720182419, "frac_above_star": 0.0 }, { "step": 201, "sup_loss": 0.6047298083745406, "rf_loss": 0.0, "total_loss": 0.6047298083745406, "lyap1_mean": -0.19607070088386536, "lyap1_max": -0.14765456318855286, "frac_above_star": 0.0 }, { "step": 202, "sup_loss": 0.7179749491431686, "rf_loss": 0.0, "total_loss": 0.7179749491431686, "lyap1_mean": -0.20036940276622772, "lyap1_max": -0.0851418673992157, "frac_above_star": 0.0 }, { "step": 203, "sup_loss": 0.5882547811186345, "rf_loss": 0.0, "total_loss": 0.5882547811186345, "lyap1_mean": -0.19406482577323914, "lyap1_max": -0.11948516219854355, "frac_above_star": 0.0 }, { "step": 204, "sup_loss": 0.8687362271315668, "rf_loss": 0.0, "total_loss": 0.8687362271315668, "lyap1_mean": -0.182657390832901, "lyap1_max": -0.14728671312332153, "frac_above_star": 0.0 }, { "step": 205, "sup_loss": 0.6869394652537703, "rf_loss": 0.0, "total_loss": 0.6869394652537703, "lyap1_mean": -0.19941982626914978, "lyap1_max": -0.14883649349212646, "frac_above_star": 0.0 }, { "step": 206, "sup_loss": 0.6816107273448638, "rf_loss": 0.0, "total_loss": 0.6816107273448638, "lyap1_mean": -0.20716366171836853, "lyap1_max": -0.1337496042251587, "frac_above_star": 0.0 }, { "step": 207, "sup_loss": 0.8990259838657207, "rf_loss": 0.0, "total_loss": 0.8990259838657207, "lyap1_mean": -0.1720457673072815, "lyap1_max": -0.1120566576719284, "frac_above_star": 0.0 }, { "step": 208, "sup_loss": 0.7286642281930277, "rf_loss": 0.0, "total_loss": 0.7286642281930277, "lyap1_mean": -0.2149023413658142, "lyap1_max": -0.0969642847776413, "frac_above_star": 0.0 }, { "step": 209, "sup_loss": 0.7181270902368173, "rf_loss": 0.0, "total_loss": 0.7181270902368173, "lyap1_mean": -0.1789305955171585, "lyap1_max": -0.1318063735961914, "frac_above_star": 0.0 }, { "step": 210, "sup_loss": 0.6880416247341339, "rf_loss": 0.0, "total_loss": 0.6880416247341339, "lyap1_mean": -0.20852741599082947, "lyap1_max": -0.164077490568161, "frac_above_star": 0.0 }, { "step": 211, "sup_loss": 0.46516003244966314, "rf_loss": 0.0, "total_loss": 0.46516003244966314, "lyap1_mean": -0.17923963069915771, "lyap1_max": -0.08775073289871216, "frac_above_star": 0.0 }, { "step": 212, "sup_loss": 0.7747517594275912, "rf_loss": 0.0, "total_loss": 0.7747517594275912, "lyap1_mean": -0.18764923512935638, "lyap1_max": -0.15302231907844543, "frac_above_star": 0.0 }, { "step": 213, "sup_loss": 0.5911512512042719, "rf_loss": 0.0, "total_loss": 0.5911512512042719, "lyap1_mean": -0.1814614236354828, "lyap1_max": -0.10764815658330917, "frac_above_star": 0.0 }, { "step": 214, "sup_loss": 0.8255641091361329, "rf_loss": 0.0, "total_loss": 0.8255641091361329, "lyap1_mean": -0.1938202977180481, "lyap1_max": -0.14749383926391602, "frac_above_star": 0.0 }, { "step": 215, "sup_loss": 0.5355848921372608, "rf_loss": 0.0, "total_loss": 0.5355848921372608, "lyap1_mean": -0.23224031925201416, "lyap1_max": -0.09511595964431763, "frac_above_star": 0.0 }, { "step": 216, "sup_loss": 0.5237713325781176, "rf_loss": 0.0, "total_loss": 0.5237713325781176, "lyap1_mean": -0.20616477727890015, "lyap1_max": -0.13460896909236908, "frac_above_star": 0.0 }, { "step": 217, "sup_loss": 0.6845327307626905, "rf_loss": 0.0, "total_loss": 0.6845327307626905, "lyap1_mean": -0.213209867477417, "lyap1_max": -0.13395428657531738, "frac_above_star": 0.0 }, { "step": 218, "sup_loss": 0.4365561686804773, "rf_loss": 0.0, "total_loss": 0.4365561686804773, "lyap1_mean": -0.2317594438791275, "lyap1_max": -0.1456560492515564, "frac_above_star": 0.0 }, { "step": 219, "sup_loss": 0.7489246906122351, "rf_loss": 0.0, "total_loss": 0.7489246906122351, "lyap1_mean": -0.21497467160224915, "lyap1_max": -0.16153545677661896, "frac_above_star": 0.0 }, { "step": 220, "sup_loss": 0.6226879895609553, "rf_loss": 0.0, "total_loss": 0.6226879895609553, "lyap1_mean": -0.2018626183271408, "lyap1_max": -0.14777329564094543, "frac_above_star": 0.0 }, { "step": 221, "sup_loss": 0.6176710127399485, "rf_loss": 0.0, "total_loss": 0.6176710127399485, "lyap1_mean": -0.18920880556106567, "lyap1_max": -0.11728831380605698, "frac_above_star": 0.0 }, { "step": 222, "sup_loss": 0.7471889065633798, "rf_loss": 0.0, "total_loss": 0.7471889065633798, "lyap1_mean": -0.1934327483177185, "lyap1_max": -0.13927027583122253, "frac_above_star": 0.0 }, { "step": 223, "sup_loss": 0.6652412151660972, "rf_loss": 0.0, "total_loss": 0.6652412151660972, "lyap1_mean": -0.2077174186706543, "lyap1_max": -0.15974101424217224, "frac_above_star": 0.0 }, { "step": 224, "sup_loss": 0.5531021348349586, "rf_loss": 0.0, "total_loss": 0.5531021348349586, "lyap1_mean": -0.24349234998226166, "lyap1_max": -0.14861637353897095, "frac_above_star": 0.0 }, { "step": 225, "sup_loss": 0.6145669473437381, "rf_loss": 0.0, "total_loss": 0.6145669473437381, "lyap1_mean": -0.19002535939216614, "lyap1_max": -0.13535729050636292, "frac_above_star": 0.0 }, { "step": 226, "sup_loss": 0.676204157699914, "rf_loss": 0.0, "total_loss": 0.676204157699914, "lyap1_mean": -0.20304293930530548, "lyap1_max": -0.12886755168437958, "frac_above_star": 0.0 }, { "step": 227, "sup_loss": 0.7270620498335346, "rf_loss": 0.0, "total_loss": 0.7270620498335346, "lyap1_mean": -0.18738427758216858, "lyap1_max": -0.07992863655090332, "frac_above_star": 0.0 }, { "step": 228, "sup_loss": 0.7343344834613565, "rf_loss": 0.0, "total_loss": 0.7343344834613565, "lyap1_mean": -0.19570563733577728, "lyap1_max": -0.14891564846038818, "frac_above_star": 0.0 }, { "step": 229, "sup_loss": 0.6209384827097724, "rf_loss": 0.0, "total_loss": 0.6209384827097724, "lyap1_mean": -0.16853196918964386, "lyap1_max": -0.0954430028796196, "frac_above_star": 0.0 }, { "step": 230, "sup_loss": 0.4965299418140961, "rf_loss": 0.0, "total_loss": 0.4965299418140961, "lyap1_mean": -0.2552441954612732, "lyap1_max": -0.13357387483119965, "frac_above_star": 0.0 }, { "step": 231, "sup_loss": 0.5447527831092208, "rf_loss": 0.0, "total_loss": 0.5447527831092208, "lyap1_mean": -0.2510998845100403, "lyap1_max": -0.14958667755126953, "frac_above_star": 0.0 }, { "step": 232, "sup_loss": 0.44276770684008376, "rf_loss": 0.0, "total_loss": 0.44276770684008376, "lyap1_mean": -0.2295585721731186, "lyap1_max": -0.12558750808238983, "frac_above_star": 0.0 }, { "step": 233, "sup_loss": 0.6638873316193467, "rf_loss": 0.000399629061575979, "total_loss": 0.6678836223515218, "lyap1_mean": -0.16523225605487823, "lyap1_max": 0.006542305462062359, "frac_above_star": 0.125 }, { "step": 234, "sup_loss": 0.7441185268258137, "rf_loss": 0.0, "total_loss": 0.7441185268258137, "lyap1_mean": -0.19292184710502625, "lyap1_max": -0.11682596802711487, "frac_above_star": 0.0 }, { "step": 235, "sup_loss": 0.5188958814875773, "rf_loss": 0.0, "total_loss": 0.5188958814875773, "lyap1_mean": -0.24961619079113007, "lyap1_max": -0.15866920351982117, "frac_above_star": 0.0 }, { "step": 236, "sup_loss": 0.6913494517845652, "rf_loss": 0.0, "total_loss": 0.6913494517845652, "lyap1_mean": -0.2013171911239624, "lyap1_max": -0.15841642022132874, "frac_above_star": 0.0 }, { "step": 237, "sup_loss": 0.749524573409244, "rf_loss": 0.0, "total_loss": 0.749524573409244, "lyap1_mean": -0.198990136384964, "lyap1_max": -0.1388969123363495, "frac_above_star": 0.0 }, { "step": 238, "sup_loss": 0.7025699436115729, "rf_loss": 0.0, "total_loss": 0.7025699436115729, "lyap1_mean": -0.18805401027202606, "lyap1_max": -0.12639333307743073, "frac_above_star": 0.0 }, { "step": 239, "sup_loss": 0.5359770592928145, "rf_loss": 0.0, "total_loss": 0.5359770592928145, "lyap1_mean": -0.217665895819664, "lyap1_max": -0.14082607626914978, "frac_above_star": 0.0 }, { "step": 240, "sup_loss": 0.6430705507342079, "rf_loss": 0.0, "total_loss": 0.6430705507342079, "lyap1_mean": -0.1752490997314453, "lyap1_max": -0.1365225464105606, "frac_above_star": 0.0 }, { "step": 241, "sup_loss": 0.8122379716289592, "rf_loss": 0.0, "total_loss": 0.8122379716289592, "lyap1_mean": -0.18503081798553467, "lyap1_max": -0.08871650695800781, "frac_above_star": 0.0 }, { "step": 242, "sup_loss": 0.5610528171257888, "rf_loss": 0.0, "total_loss": 0.5610528171257888, "lyap1_mean": -0.21184517443180084, "lyap1_max": -0.1401902288198471, "frac_above_star": 0.0 }, { "step": 243, "sup_loss": 0.6268265947911122, "rf_loss": 0.0, "total_loss": 0.6268265947911122, "lyap1_mean": -0.25786492228507996, "lyap1_max": -0.1484510600566864, "frac_above_star": 0.0 }, { "step": 244, "sup_loss": 0.7774390813394559, "rf_loss": 0.0, "total_loss": 0.7774390813394559, "lyap1_mean": -0.20239108800888062, "lyap1_max": -0.13664431869983673, "frac_above_star": 0.0 }, { "step": 245, "sup_loss": 0.6485711538754377, "rf_loss": 0.0, "total_loss": 0.6485711538754377, "lyap1_mean": -0.19165365397930145, "lyap1_max": -0.13562846183776855, "frac_above_star": 0.0 }, { "step": 246, "sup_loss": 0.6340407906616154, "rf_loss": 0.0, "total_loss": 0.6340407906616154, "lyap1_mean": -0.21165643632411957, "lyap1_max": -0.18734601140022278, "frac_above_star": 0.0 }, { "step": 247, "sup_loss": 0.5002010095276697, "rf_loss": 0.0, "total_loss": 0.5002010095276697, "lyap1_mean": -0.22989000380039215, "lyap1_max": -0.09553690254688263, "frac_above_star": 0.0 }, { "step": 248, "sup_loss": 0.5886790596582384, "rf_loss": 0.0, "total_loss": 0.5886790596582384, "lyap1_mean": -0.19525735080242157, "lyap1_max": -0.1284600794315338, "frac_above_star": 0.0 }, { "step": 249, "sup_loss": 0.4677360674858931, "rf_loss": 0.0, "total_loss": 0.4677360674858931, "lyap1_mean": -0.21176673471927643, "lyap1_max": -0.1349661946296692, "frac_above_star": 0.0 }, { "step": 250, "sup_loss": 0.6820351581748441, "rf_loss": 0.0, "total_loss": 0.6820351581748441, "lyap1_mean": -0.22553136944770813, "lyap1_max": -0.15090954303741455, "frac_above_star": 0.0 }, { "step": 251, "sup_loss": 0.5154981679682633, "rf_loss": 0.0, "total_loss": 0.5154981679682633, "lyap1_mean": -0.20461168885231018, "lyap1_max": -0.06962965428829193, "frac_above_star": 0.0 }, { "step": 252, "sup_loss": 0.710339055411171, "rf_loss": 0.0, "total_loss": 0.710339055411171, "lyap1_mean": -0.17916253209114075, "lyap1_max": -0.10785667598247528, "frac_above_star": 0.0 }, { "step": 253, "sup_loss": 0.6532457507034521, "rf_loss": 0.0, "total_loss": 0.6532457507034521, "lyap1_mean": -0.21800638735294342, "lyap1_max": -0.1495962291955948, "frac_above_star": 0.0 }, { "step": 254, "sup_loss": 0.5785991267504845, "rf_loss": 0.0, "total_loss": 0.5785991267504845, "lyap1_mean": -0.20258021354675293, "lyap1_max": -0.09281677007675171, "frac_above_star": 0.0 }, { "step": 255, "sup_loss": 0.735606394313626, "rf_loss": 0.0, "total_loss": 0.735606394313626, "lyap1_mean": -0.22837942838668823, "lyap1_max": -0.14530766010284424, "frac_above_star": 0.0 }, { "step": 256, "sup_loss": 0.40556751801577395, "rf_loss": 0.0, "total_loss": 0.40556751801577395, "lyap1_mean": -0.22732436656951904, "lyap1_max": -0.14934980869293213, "frac_above_star": 0.0 }, { "step": 257, "sup_loss": 0.5212032317219596, "rf_loss": 0.0, "total_loss": 0.5212032317219596, "lyap1_mean": -0.2266208678483963, "lyap1_max": -0.15092498064041138, "frac_above_star": 0.0 }, { "step": 258, "sup_loss": 0.6194087198951125, "rf_loss": 0.0, "total_loss": 0.6194087198951125, "lyap1_mean": -0.23279377818107605, "lyap1_max": -0.15293967723846436, "frac_above_star": 0.0 }, { "step": 259, "sup_loss": 0.7010078821177878, "rf_loss": 0.0, "total_loss": 0.7010078821177878, "lyap1_mean": -0.22671744227409363, "lyap1_max": -0.16852310299873352, "frac_above_star": 0.0 }, { "step": 260, "sup_loss": 0.7873634798714566, "rf_loss": 0.00032050005393102765, "total_loss": 0.7905684802943516, "lyap1_mean": -0.17944949865341187, "lyap1_max": 0.0006359592080116272, "frac_above_star": 0.125 }, { "step": 261, "sup_loss": 0.5677103470000727, "rf_loss": 0.0, "total_loss": 0.5677103470000727, "lyap1_mean": -0.2340777963399887, "lyap1_max": -0.12701141834259033, "frac_above_star": 0.0 }, { "step": 262, "sup_loss": 0.5589603329638633, "rf_loss": 0.0, "total_loss": 0.5589603329638633, "lyap1_mean": -0.19813737273216248, "lyap1_max": -0.06794442236423492, "frac_above_star": 0.0 }, { "step": 263, "sup_loss": 0.5317778684868595, "rf_loss": 0.0, "total_loss": 0.5317778684868595, "lyap1_mean": -0.23329786956310272, "lyap1_max": -0.17043384909629822, "frac_above_star": 0.0 }, { "step": 264, "sup_loss": 0.6016443016344399, "rf_loss": 0.0, "total_loss": 0.6016443016344399, "lyap1_mean": -0.21522793173789978, "lyap1_max": -0.10651891678571701, "frac_above_star": 0.0 }, { "step": 265, "sup_loss": 0.669381043186165, "rf_loss": 0.0, "total_loss": 0.669381043186165, "lyap1_mean": -0.23044681549072266, "lyap1_max": -0.1514340192079544, "frac_above_star": 0.0 }, { "step": 266, "sup_loss": 0.6177230620190153, "rf_loss": 0.0, "total_loss": 0.6177230620190153, "lyap1_mean": -0.24319922924041748, "lyap1_max": -0.16463223099708557, "frac_above_star": 0.0 }, { "step": 267, "sup_loss": 0.6490102827713804, "rf_loss": 0.0, "total_loss": 0.6490102827713804, "lyap1_mean": -0.17153862118721008, "lyap1_max": -0.10556592047214508, "frac_above_star": 0.0 }, { "step": 268, "sup_loss": 0.7209047828811763, "rf_loss": 0.0, "total_loss": 0.7209047828811763, "lyap1_mean": -0.21882590651512146, "lyap1_max": -0.13429629802703857, "frac_above_star": 0.0 }, { "step": 269, "sup_loss": 0.624089753613391, "rf_loss": 0.0, "total_loss": 0.624089753613391, "lyap1_mean": -0.23265042901039124, "lyap1_max": -0.18409639596939087, "frac_above_star": 0.0 }, { "step": 270, "sup_loss": 0.6839350702657916, "rf_loss": 0.0, "total_loss": 0.6839350702657916, "lyap1_mean": -0.19725045561790466, "lyap1_max": -0.1207718700170517, "frac_above_star": 0.0 }, { "step": 271, "sup_loss": 0.5157462367993206, "rf_loss": 0.0, "total_loss": 0.5157462367993206, "lyap1_mean": -0.1985214352607727, "lyap1_max": -0.11036394536495209, "frac_above_star": 0.0 }, { "step": 272, "sup_loss": 0.7071610443847546, "rf_loss": 0.0, "total_loss": 0.7071610443847546, "lyap1_mean": -0.17402000725269318, "lyap1_max": -0.06326930224895477, "frac_above_star": 0.0 }, { "step": 273, "sup_loss": 0.5309942313081077, "rf_loss": 0.0, "total_loss": 0.5309942313081077, "lyap1_mean": -0.2158316969871521, "lyap1_max": -0.08887538313865662, "frac_above_star": 0.0 }, { "step": 274, "sup_loss": 0.7142519553446859, "rf_loss": 6.341738298942801e-06, "total_loss": 0.7143153727294943, "lyap1_mean": -0.17434048652648926, "lyap1_max": -0.04287722706794739, "frac_above_star": 0.125 }, { "step": 275, "sup_loss": 0.7229026322373567, "rf_loss": 0.0, "total_loss": 0.7229026322373567, "lyap1_mean": -0.1955108791589737, "lyap1_max": -0.07400323450565338, "frac_above_star": 0.0 }, { "step": 276, "sup_loss": 0.46284527550457544, "rf_loss": 0.0, "total_loss": 0.46284527550457544, "lyap1_mean": -0.2101568579673767, "lyap1_max": -0.08780448883771896, "frac_above_star": 0.0 }, { "step": 277, "sup_loss": 0.5357066846657672, "rf_loss": 0.0, "total_loss": 0.5357066846657672, "lyap1_mean": -0.1930445432662964, "lyap1_max": -0.1298808604478836, "frac_above_star": 0.0 }, { "step": 278, "sup_loss": 0.6379496581566793, "rf_loss": 0.0, "total_loss": 0.6379496581566793, "lyap1_mean": -0.20854787528514862, "lyap1_max": -0.14570274949073792, "frac_above_star": 0.0 }, { "step": 279, "sup_loss": 0.7509267926053067, "rf_loss": 0.0, "total_loss": 0.7509267926053067, "lyap1_mean": -0.21874669194221497, "lyap1_max": -0.15162450075149536, "frac_above_star": 0.0 }, { "step": 280, "sup_loss": 0.8385968944915521, "rf_loss": 0.0, "total_loss": 0.8385968944915521, "lyap1_mean": -0.22255003452301025, "lyap1_max": -0.1767907589673996, "frac_above_star": 0.0 }, { "step": 281, "sup_loss": 0.6086281122131114, "rf_loss": 0.0, "total_loss": 0.6086281122131114, "lyap1_mean": -0.20129919052124023, "lyap1_max": -0.15607738494873047, "frac_above_star": 0.0 }, { "step": 282, "sup_loss": 0.5286728193228203, "rf_loss": 0.0, "total_loss": 0.5286728193228203, "lyap1_mean": -0.22995124757289886, "lyap1_max": -0.1618523895740509, "frac_above_star": 0.0 }, { "step": 283, "sup_loss": 0.6074324453196915, "rf_loss": 0.0007418236345984042, "total_loss": 0.6148506815492603, "lyap1_mean": -0.18350297212600708, "lyap1_max": 0.027036283165216446, "frac_above_star": 0.125 }, { "step": 284, "sup_loss": 0.7753260279909635, "rf_loss": 0.0, "total_loss": 0.7753260279909635, "lyap1_mean": -0.19298504292964935, "lyap1_max": -0.11830654740333557, "frac_above_star": 0.0 }, { "step": 285, "sup_loss": 0.6649656946704688, "rf_loss": 0.0, "total_loss": 0.6649656946704688, "lyap1_mean": -0.20865383744239807, "lyap1_max": -0.12304385751485825, "frac_above_star": 0.0 }, { "step": 286, "sup_loss": 0.46066301918422503, "rf_loss": 0.0, "total_loss": 0.46066301918422503, "lyap1_mean": -0.20852267742156982, "lyap1_max": -0.12857352197170258, "frac_above_star": 0.0 }, { "step": 287, "sup_loss": 0.7667831053649123, "rf_loss": 0.0, "total_loss": 0.7667831053649123, "lyap1_mean": -0.18527644872665405, "lyap1_max": -0.09752162545919418, "frac_above_star": 0.0 }, { "step": 288, "sup_loss": 0.7025058780975046, "rf_loss": 0.0, "total_loss": 0.7025058780975046, "lyap1_mean": -0.20340809226036072, "lyap1_max": -0.12992212176322937, "frac_above_star": 0.0 }, { "step": 289, "sup_loss": 0.6773697630220173, "rf_loss": 0.0, "total_loss": 0.6773697630220173, "lyap1_mean": -0.2123134285211563, "lyap1_max": -0.15755394101142883, "frac_above_star": 0.0 }, { "step": 290, "sup_loss": 0.6254785050924282, "rf_loss": 0.0, "total_loss": 0.6254785050924282, "lyap1_mean": -0.2014375627040863, "lyap1_max": -0.08749916404485703, "frac_above_star": 0.0 }, { "step": 291, "sup_loss": 0.6830871133516344, "rf_loss": 0.0, "total_loss": 0.6830871133516344, "lyap1_mean": -0.17875906825065613, "lyap1_max": -0.13185003399848938, "frac_above_star": 0.0 }, { "step": 292, "sup_loss": 0.6511363721324225, "rf_loss": 0.0, "total_loss": 0.6511363721324225, "lyap1_mean": -0.20482604205608368, "lyap1_max": -0.14485621452331543, "frac_above_star": 0.0 }, { "step": 293, "sup_loss": 0.4567075364780384, "rf_loss": 0.0, "total_loss": 0.4567075364780384, "lyap1_mean": -0.19366693496704102, "lyap1_max": -0.12563195824623108, "frac_above_star": 0.0 }, { "step": 294, "sup_loss": 0.6109672467315146, "rf_loss": 0.0, "total_loss": 0.6109672467315146, "lyap1_mean": -0.21247343719005585, "lyap1_max": -0.1538855880498886, "frac_above_star": 0.0 }, { "step": 295, "sup_loss": 0.31313102800476356, "rf_loss": 0.0, "total_loss": 0.31313102800476356, "lyap1_mean": -0.23999741673469543, "lyap1_max": -0.15004315972328186, "frac_above_star": 0.0 }, { "step": 296, "sup_loss": 0.7654567861809497, "rf_loss": 0.0, "total_loss": 0.7654567861809497, "lyap1_mean": -0.19834670424461365, "lyap1_max": -0.12276718020439148, "frac_above_star": 0.0 }, { "step": 297, "sup_loss": 0.4674179344473515, "rf_loss": 0.0, "total_loss": 0.4674179344473515, "lyap1_mean": -0.2254909723997116, "lyap1_max": -0.1673107147216797, "frac_above_star": 0.0 }, { "step": 298, "sup_loss": 0.5364962892234902, "rf_loss": 0.0, "total_loss": 0.5364962892234902, "lyap1_mean": -0.23171478509902954, "lyap1_max": -0.15965606272220612, "frac_above_star": 0.0 }, { "step": 299, "sup_loss": 0.40788380888634584, "rf_loss": 0.0, "total_loss": 0.40788380888634584, "lyap1_mean": -0.2391020655632019, "lyap1_max": -0.1688903421163559, "frac_above_star": 0.0 }, { "step": 300, "sup_loss": 0.5915238802992534, "rf_loss": 0.0, "total_loss": 0.5915238802992534, "lyap1_mean": -0.22844335436820984, "lyap1_max": -0.160817950963974, "frac_above_star": 0.0 }, { "step": 301, "sup_loss": 0.6540136573681983, "rf_loss": 0.0, "total_loss": 0.6540136573681983, "lyap1_mean": -0.20998932421207428, "lyap1_max": -0.15383896231651306, "frac_above_star": 0.0 }, { "step": 302, "sup_loss": 0.6808466777318155, "rf_loss": 0.0, "total_loss": 0.6808466777318155, "lyap1_mean": -0.19895756244659424, "lyap1_max": -0.15490186214447021, "frac_above_star": 0.0 }, { "step": 303, "sup_loss": 0.6440083416927299, "rf_loss": 0.0, "total_loss": 0.6440083416927299, "lyap1_mean": -0.18580996990203857, "lyap1_max": -0.1513211578130722, "frac_above_star": 0.0 }, { "step": 304, "sup_loss": 0.629350808973947, "rf_loss": 0.0, "total_loss": 0.629350808973947, "lyap1_mean": -0.19507020711898804, "lyap1_max": -0.12522336840629578, "frac_above_star": 0.0 }, { "step": 305, "sup_loss": 0.5386285429869909, "rf_loss": 0.0, "total_loss": 0.5386285429869909, "lyap1_mean": -0.20694032311439514, "lyap1_max": -0.1612226814031601, "frac_above_star": 0.0 }, { "step": 306, "sup_loss": 0.7132075638167829, "rf_loss": 0.0, "total_loss": 0.7132075638167829, "lyap1_mean": -0.18681934475898743, "lyap1_max": -0.09840725362300873, "frac_above_star": 0.0 }, { "step": 307, "sup_loss": 0.5529240328500811, "rf_loss": 0.0, "total_loss": 0.5529240328500811, "lyap1_mean": -0.20348040759563446, "lyap1_max": -0.15505194664001465, "frac_above_star": 0.0 }, { "step": 308, "sup_loss": 0.4087644268590468, "rf_loss": 0.0, "total_loss": 0.4087644268590468, "lyap1_mean": -0.22185181081295013, "lyap1_max": -0.12267230451107025, "frac_above_star": 0.0 }, { "step": 309, "sup_loss": 0.6790686395338948, "rf_loss": 0.0, "total_loss": 0.6790686395338948, "lyap1_mean": -0.21406623721122742, "lyap1_max": -0.16052374243736267, "frac_above_star": 0.0 }, { "step": 310, "sup_loss": 0.4609579295527928, "rf_loss": 0.0, "total_loss": 0.4609579295527928, "lyap1_mean": -0.2494196593761444, "lyap1_max": -0.1498427391052246, "frac_above_star": 0.0 }, { "step": 311, "sup_loss": 0.707625676306318, "rf_loss": 0.0, "total_loss": 0.707625676306318, "lyap1_mean": -0.21246835589408875, "lyap1_max": -0.08755619823932648, "frac_above_star": 0.0 }, { "step": 312, "sup_loss": 0.44257311694502954, "rf_loss": 0.0, "total_loss": 0.44257311694502954, "lyap1_mean": -0.22885774075984955, "lyap1_max": -0.12664450705051422, "frac_above_star": 0.0 }, { "step": 313, "sup_loss": 0.4470586642982615, "rf_loss": 0.0, "total_loss": 0.4470586642982615, "lyap1_mean": -0.23420727252960205, "lyap1_max": -0.16033044457435608, "frac_above_star": 0.0 }, { "step": 314, "sup_loss": 0.8660470184182062, "rf_loss": 0.0, "total_loss": 0.8660470184182062, "lyap1_mean": -0.20514647662639618, "lyap1_max": -0.16238521039485931, "frac_above_star": 0.0 }, { "step": 315, "sup_loss": 0.6602418428331925, "rf_loss": 0.0, "total_loss": 0.6602418428331925, "lyap1_mean": -0.21938326954841614, "lyap1_max": -0.15006369352340698, "frac_above_star": 0.0 }, { "step": 316, "sup_loss": 0.5694420669476936, "rf_loss": 0.0, "total_loss": 0.5694420669476936, "lyap1_mean": -0.21052849292755127, "lyap1_max": -0.13944149017333984, "frac_above_star": 0.0 }, { "step": 317, "sup_loss": 0.695989903984418, "rf_loss": 0.0, "total_loss": 0.695989903984418, "lyap1_mean": -0.22205331921577454, "lyap1_max": -0.16457606852054596, "frac_above_star": 0.0 }, { "step": 318, "sup_loss": 0.5452148153806283, "rf_loss": 0.0, "total_loss": 0.5452148153806283, "lyap1_mean": -0.24797193706035614, "lyap1_max": -0.1893368661403656, "frac_above_star": 0.0 }, { "step": 319, "sup_loss": 0.4857685998637117, "rf_loss": 0.0, "total_loss": 0.4857685998637117, "lyap1_mean": -0.23541739583015442, "lyap1_max": -0.1908964216709137, "frac_above_star": 0.0 }, { "step": 320, "sup_loss": 0.592646129502498, "rf_loss": 0.0, "total_loss": 0.592646129502498, "lyap1_mean": -0.2227933257818222, "lyap1_max": -0.17848709225654602, "frac_above_star": 0.0 }, { "step": 321, "sup_loss": 0.4855272561632321, "rf_loss": 0.0, "total_loss": 0.4855272561632321, "lyap1_mean": -0.2196572721004486, "lyap1_max": -0.06551793962717056, "frac_above_star": 0.0 }, { "step": 322, "sup_loss": 0.5740623353734476, "rf_loss": 0.0, "total_loss": 0.5740623353734476, "lyap1_mean": -0.1998814195394516, "lyap1_max": -0.09437894076108932, "frac_above_star": 0.0 }, { "step": 323, "sup_loss": 0.8885185202821775, "rf_loss": 0.0, "total_loss": 0.8885185202821775, "lyap1_mean": -0.19435900449752808, "lyap1_max": -0.13477680087089539, "frac_above_star": 0.0 }, { "step": 324, "sup_loss": 0.5705096405135992, "rf_loss": 0.0, "total_loss": 0.5705096405135992, "lyap1_mean": -0.21889877319335938, "lyap1_max": -0.14275586605072021, "frac_above_star": 0.0 }, { "step": 325, "sup_loss": 0.4665195324406845, "rf_loss": 0.0, "total_loss": 0.4665195324406845, "lyap1_mean": -0.2211432307958603, "lyap1_max": -0.16028320789337158, "frac_above_star": 0.0 }, { "step": 326, "sup_loss": 0.779748169210806, "rf_loss": 0.0, "total_loss": 0.779748169210806, "lyap1_mean": -0.19235774874687195, "lyap1_max": -0.13172972202301025, "frac_above_star": 0.0 }, { "step": 327, "sup_loss": 0.585515569129418, "rf_loss": 0.0, "total_loss": 0.585515569129418, "lyap1_mean": -0.2366032898426056, "lyap1_max": -0.17283187806606293, "frac_above_star": 0.0 }, { "step": 328, "sup_loss": 0.511874477686214, "rf_loss": 0.0, "total_loss": 0.511874477686214, "lyap1_mean": -0.22222289443016052, "lyap1_max": -0.1432960331439972, "frac_above_star": 0.0 }, { "step": 329, "sup_loss": 0.5461505621721452, "rf_loss": 0.0, "total_loss": 0.5461505621721452, "lyap1_mean": -0.2037917673587799, "lyap1_max": -0.11324268579483032, "frac_above_star": 0.0 }, { "step": 330, "sup_loss": 0.6486150814675141, "rf_loss": 0.0, "total_loss": 0.6486150814675141, "lyap1_mean": -0.21274591982364655, "lyap1_max": -0.1399303376674652, "frac_above_star": 0.0 }, { "step": 331, "sup_loss": 0.6789002858963946, "rf_loss": 0.0, "total_loss": 0.6789002858963946, "lyap1_mean": -0.20342637598514557, "lyap1_max": -0.1052863746881485, "frac_above_star": 0.0 }, { "step": 332, "sup_loss": 0.6659264329389913, "rf_loss": 0.0, "total_loss": 0.6659264329389913, "lyap1_mean": -0.18696169555187225, "lyap1_max": -0.08391546458005905, "frac_above_star": 0.0 }, { "step": 333, "sup_loss": 0.592778944652384, "rf_loss": 0.0, "total_loss": 0.592778944652384, "lyap1_mean": -0.20941010117530823, "lyap1_max": -0.1030006930232048, "frac_above_star": 0.0 }, { "step": 334, "sup_loss": 0.45449988335519487, "rf_loss": 0.0, "total_loss": 0.45449988335519487, "lyap1_mean": -0.25045883655548096, "lyap1_max": -0.19002722203731537, "frac_above_star": 0.0 }, { "step": 335, "sup_loss": 0.6237568859685305, "rf_loss": 0.0, "total_loss": 0.6237568859685305, "lyap1_mean": -0.18097098171710968, "lyap1_max": -0.10087580978870392, "frac_above_star": 0.0 }, { "step": 336, "sup_loss": 0.44663650673321925, "rf_loss": 0.0, "total_loss": 0.44663650673321925, "lyap1_mean": -0.21681317687034607, "lyap1_max": -0.15622249245643616, "frac_above_star": 0.0 }, { "step": 337, "sup_loss": 0.5752391415951026, "rf_loss": 0.0, "total_loss": 0.5752391415951026, "lyap1_mean": -0.19021475315093994, "lyap1_max": -0.0939602479338646, "frac_above_star": 0.0 }, { "step": 338, "sup_loss": 0.3695605073663505, "rf_loss": 0.0, "total_loss": 0.3695605073663505, "lyap1_mean": -0.2700919210910797, "lyap1_max": -0.1922680139541626, "frac_above_star": 0.0 }, { "step": 339, "sup_loss": 0.5854984983893918, "rf_loss": 0.0, "total_loss": 0.5854984983893918, "lyap1_mean": -0.230684295296669, "lyap1_max": -0.13717587292194366, "frac_above_star": 0.0 }, { "step": 340, "sup_loss": 0.5879843361493751, "rf_loss": 0.0, "total_loss": 0.5879843361493751, "lyap1_mean": -0.22085818648338318, "lyap1_max": -0.1643618941307068, "frac_above_star": 0.0 }, { "step": 341, "sup_loss": 0.6609124146372717, "rf_loss": 0.0, "total_loss": 0.6609124146372717, "lyap1_mean": -0.22820556163787842, "lyap1_max": -0.14310424029827118, "frac_above_star": 0.0 }, { "step": 342, "sup_loss": 0.44449064775871444, "rf_loss": 0.0, "total_loss": 0.44449064775871444, "lyap1_mean": -0.23251499235630035, "lyap1_max": -0.15377113223075867, "frac_above_star": 0.0 }, { "step": 343, "sup_loss": 0.4946391209698592, "rf_loss": 0.0, "total_loss": 0.4946391209698592, "lyap1_mean": -0.23693051934242249, "lyap1_max": -0.15311840176582336, "frac_above_star": 0.0 }, { "step": 344, "sup_loss": 0.46234511295821396, "rf_loss": 0.0, "total_loss": 0.46234511295821396, "lyap1_mean": -0.2535727620124817, "lyap1_max": -0.14363867044448853, "frac_above_star": 0.0 }, { "step": 345, "sup_loss": 0.5869246225486722, "rf_loss": 0.0, "total_loss": 0.5869246225486722, "lyap1_mean": -0.1864006221294403, "lyap1_max": -0.08194048702716827, "frac_above_star": 0.0 }, { "step": 346, "sup_loss": 0.5479690874929435, "rf_loss": 0.0, "total_loss": 0.5479690874929435, "lyap1_mean": -0.22075700759887695, "lyap1_max": -0.12000446021556854, "frac_above_star": 0.0 }, { "step": 347, "sup_loss": 0.724446098598122, "rf_loss": 0.0, "total_loss": 0.724446098598122, "lyap1_mean": -0.1998179852962494, "lyap1_max": -0.12232448160648346, "frac_above_star": 0.0 }, { "step": 348, "sup_loss": 0.6431907279087362, "rf_loss": 0.0, "total_loss": 0.6431907279087362, "lyap1_mean": -0.21460610628128052, "lyap1_max": -0.13227346539497375, "frac_above_star": 0.0 }, { "step": 349, "sup_loss": 0.5805938399347761, "rf_loss": 0.0, "total_loss": 0.5805938399347761, "lyap1_mean": -0.22945956885814667, "lyap1_max": -0.12836483120918274, "frac_above_star": 0.0 }, { "step": 350, "sup_loss": 0.7767255250390784, "rf_loss": 0.0, "total_loss": 0.7767255250390784, "lyap1_mean": -0.17105141282081604, "lyap1_max": -0.07277780771255493, "frac_above_star": 0.0 }, { "step": 351, "sup_loss": 0.6834070983895129, "rf_loss": 0.0, "total_loss": 0.6834070983895129, "lyap1_mean": -0.19405382871627808, "lyap1_max": -0.13347342610359192, "frac_above_star": 0.0 }, { "step": 352, "sup_loss": 0.668352841631971, "rf_loss": 0.0, "total_loss": 0.668352841631971, "lyap1_mean": -0.22689369320869446, "lyap1_max": -0.14872883260250092, "frac_above_star": 0.0 }, { "step": 353, "sup_loss": 0.7209997215575427, "rf_loss": 0.0, "total_loss": 0.7209997215575427, "lyap1_mean": -0.21089453995227814, "lyap1_max": -0.1808469593524933, "frac_above_star": 0.0 }, { "step": 354, "sup_loss": 0.7923669863195466, "rf_loss": 0.0, "total_loss": 0.7923669863195466, "lyap1_mean": -0.20666776597499847, "lyap1_max": -0.1538865864276886, "frac_above_star": 0.0 }, { "step": 355, "sup_loss": 0.7509271830901899, "rf_loss": 0.0, "total_loss": 0.7509271830901899, "lyap1_mean": -0.21455755829811096, "lyap1_max": -0.1760244220495224, "frac_above_star": 0.0 }, { "step": 356, "sup_loss": 0.772157391662404, "rf_loss": 0.0, "total_loss": 0.772157391662404, "lyap1_mean": -0.20755545794963837, "lyap1_max": -0.08903278410434723, "frac_above_star": 0.0 }, { "step": 357, "sup_loss": 0.6100629417569802, "rf_loss": 0.0, "total_loss": 0.6100629417569802, "lyap1_mean": -0.213352233171463, "lyap1_max": -0.14093752205371857, "frac_above_star": 0.0 }, { "step": 358, "sup_loss": 0.5995438494362794, "rf_loss": 0.00011052437184844166, "total_loss": 0.60064909312566, "lyap1_mean": -0.17746403813362122, "lyap1_max": -0.020264584571123123, "frac_above_star": 0.125 }, { "step": 359, "sup_loss": 0.5676877421409371, "rf_loss": 0.0, "total_loss": 0.5676877421409371, "lyap1_mean": -0.22986847162246704, "lyap1_max": -0.14239609241485596, "frac_above_star": 0.0 }, { "step": 360, "sup_loss": 0.5716199612044225, "rf_loss": 0.0, "total_loss": 0.5716199612044225, "lyap1_mean": -0.2023630440235138, "lyap1_max": -0.15584540367126465, "frac_above_star": 0.0 }, { "step": 361, "sup_loss": 0.6918978852360045, "rf_loss": 0.0, "total_loss": 0.6918978852360045, "lyap1_mean": -0.20789708197116852, "lyap1_max": -0.1639281064271927, "frac_above_star": 0.0 }, { "step": 362, "sup_loss": 0.6810905533540892, "rf_loss": 0.0, "total_loss": 0.6810905533540892, "lyap1_mean": -0.1852123737335205, "lyap1_max": -0.1310468316078186, "frac_above_star": 0.0 }, { "step": 363, "sup_loss": 0.827021516236963, "rf_loss": 0.0, "total_loss": 0.827021516236963, "lyap1_mean": -0.17587244510650635, "lyap1_max": -0.13469673693180084, "frac_above_star": 0.0 }, { "step": 364, "sup_loss": 0.6112914244955131, "rf_loss": 0.0, "total_loss": 0.6112914244955131, "lyap1_mean": -0.21683329343795776, "lyap1_max": -0.14571020007133484, "frac_above_star": 0.0 }, { "step": 365, "sup_loss": 0.41170966096907663, "rf_loss": 0.0, "total_loss": 0.41170966096907663, "lyap1_mean": -0.24644891917705536, "lyap1_max": -0.174571692943573, "frac_above_star": 0.0 }, { "step": 366, "sup_loss": 0.5929771856071757, "rf_loss": 0.0, "total_loss": 0.5929771856071757, "lyap1_mean": -0.21925899386405945, "lyap1_max": -0.1593049019575119, "frac_above_star": 0.0 }, { "step": 367, "sup_loss": 0.6977408131933172, "rf_loss": 0.0, "total_loss": 0.6977408131933172, "lyap1_mean": -0.22557860612869263, "lyap1_max": -0.14963893592357635, "frac_above_star": 0.0 }, { "step": 368, "sup_loss": 0.8045605962002531, "rf_loss": 0.0, "total_loss": 0.8045605962002531, "lyap1_mean": -0.19593700766563416, "lyap1_max": -0.13351640105247498, "frac_above_star": 0.0 }, { "step": 369, "sup_loss": 0.5605410580342659, "rf_loss": 0.0, "total_loss": 0.5605410580342659, "lyap1_mean": -0.20284387469291687, "lyap1_max": -0.14832647144794464, "frac_above_star": 0.0 }, { "step": 370, "sup_loss": 0.7055439984778094, "rf_loss": 0.0, "total_loss": 0.7055439984778094, "lyap1_mean": -0.21607887744903564, "lyap1_max": -0.17973560094833374, "frac_above_star": 0.0 }, { "step": 371, "sup_loss": 0.4762201168342183, "rf_loss": 0.0, "total_loss": 0.4762201168342183, "lyap1_mean": -0.24783311784267426, "lyap1_max": -0.17381051182746887, "frac_above_star": 0.0 }, { "step": 372, "sup_loss": 0.762709188065877, "rf_loss": 0.0, "total_loss": 0.762709188065877, "lyap1_mean": -0.17611925303936005, "lyap1_max": -0.14503054320812225, "frac_above_star": 0.0 }, { "step": 373, "sup_loss": 0.4975718653575674, "rf_loss": 0.0, "total_loss": 0.4975718653575674, "lyap1_mean": -0.20971643924713135, "lyap1_max": -0.14238668978214264, "frac_above_star": 0.0 }, { "step": 374, "sup_loss": 0.7006730644120136, "rf_loss": 0.0, "total_loss": 0.7006730644120136, "lyap1_mean": -0.20291917026042938, "lyap1_max": -0.13062244653701782, "frac_above_star": 0.0 }, { "step": 375, "sup_loss": 0.5554011090503748, "rf_loss": 0.0, "total_loss": 0.5554011090503748, "lyap1_mean": -0.21270637214183807, "lyap1_max": -0.09814846515655518, "frac_above_star": 0.0 }, { "step": 376, "sup_loss": 0.5874085146002342, "rf_loss": 0.0, "total_loss": 0.5874085146002342, "lyap1_mean": -0.22418086230754852, "lyap1_max": -0.09906986355781555, "frac_above_star": 0.0 }, { "step": 377, "sup_loss": 0.57646098843119, "rf_loss": 0.0, "total_loss": 0.57646098843119, "lyap1_mean": -0.17926345765590668, "lyap1_max": -0.1295628696680069, "frac_above_star": 0.0 }, { "step": 378, "sup_loss": 0.4866621580888519, "rf_loss": 0.0, "total_loss": 0.4866621580888519, "lyap1_mean": -0.2619060277938843, "lyap1_max": -0.1311393678188324, "frac_above_star": 0.0 }, { "step": 379, "sup_loss": 0.46805725509250135, "rf_loss": 0.0, "total_loss": 0.46805725509250135, "lyap1_mean": -0.21309199929237366, "lyap1_max": -0.12426955997943878, "frac_above_star": 0.0 }, { "step": 380, "sup_loss": 0.5309384717194086, "rf_loss": 0.0, "total_loss": 0.5309384717194086, "lyap1_mean": -0.22918032109737396, "lyap1_max": -0.13180653750896454, "frac_above_star": 0.0 }, { "step": 381, "sup_loss": 0.41827593126934237, "rf_loss": 0.0, "total_loss": 0.41827593126934237, "lyap1_mean": -0.2373732328414917, "lyap1_max": -0.1767939180135727, "frac_above_star": 0.0 }, { "step": 382, "sup_loss": 0.6498874717516949, "rf_loss": 0.0, "total_loss": 0.6498874717516949, "lyap1_mean": -0.2211063951253891, "lyap1_max": -0.1681242436170578, "frac_above_star": 0.0 }, { "step": 383, "sup_loss": 0.4349429443795348, "rf_loss": 0.0, "total_loss": 0.4349429443795348, "lyap1_mean": -0.23977139592170715, "lyap1_max": -0.15850691497325897, "frac_above_star": 0.0 }, { "step": 384, "sup_loss": 0.469866004179881, "rf_loss": 0.0, "total_loss": 0.469866004179881, "lyap1_mean": -0.24687765538692474, "lyap1_max": -0.1496664583683014, "frac_above_star": 0.0 }, { "step": 385, "sup_loss": 0.43359337235130546, "rf_loss": 0.0, "total_loss": 0.43359337235130546, "lyap1_mean": -0.22131499648094177, "lyap1_max": -0.13582707941532135, "frac_above_star": 0.0 }, { "step": 386, "sup_loss": 0.4734871103249728, "rf_loss": 0.0, "total_loss": 0.4734871103249728, "lyap1_mean": -0.23007088899612427, "lyap1_max": -0.17124953866004944, "frac_above_star": 0.0 }, { "step": 387, "sup_loss": 0.6691472553045726, "rf_loss": 0.0, "total_loss": 0.6691472553045726, "lyap1_mean": -0.19179195165634155, "lyap1_max": -0.1319137066602707, "frac_above_star": 0.0 }, { "step": 388, "sup_loss": 0.6979663960549036, "rf_loss": 0.0, "total_loss": 0.6979663960549036, "lyap1_mean": -0.21627482771873474, "lyap1_max": -0.14623385667800903, "frac_above_star": 0.0 }, { "step": 389, "sup_loss": 0.6237416675999153, "rf_loss": 0.0, "total_loss": 0.6237416675999153, "lyap1_mean": -0.21857845783233643, "lyap1_max": -0.10471954196691513, "frac_above_star": 0.0 }, { "step": 390, "sup_loss": 0.592283839738404, "rf_loss": 0.0, "total_loss": 0.592283839738404, "lyap1_mean": -0.22861918807029724, "lyap1_max": -0.13160422444343567, "frac_above_star": 0.0 }, { "step": 391, "sup_loss": 0.5736176372306763, "rf_loss": 0.0, "total_loss": 0.5736176372306763, "lyap1_mean": -0.24211814999580383, "lyap1_max": -0.18566088378429413, "frac_above_star": 0.0 }, { "step": 392, "sup_loss": 0.6444058381097122, "rf_loss": 0.0, "total_loss": 0.6444058381097122, "lyap1_mean": -0.22793933749198914, "lyap1_max": -0.17087076604366302, "frac_above_star": 0.0 }, { "step": 393, "sup_loss": 0.8271271033467851, "rf_loss": 0.0, "total_loss": 0.8271271033467851, "lyap1_mean": -0.2071262001991272, "lyap1_max": -0.13778746128082275, "frac_above_star": 0.0 }, { "step": 394, "sup_loss": 0.7073345279766219, "rf_loss": 0.0, "total_loss": 0.7073345279766219, "lyap1_mean": -0.2169470489025116, "lyap1_max": -0.1730356067419052, "frac_above_star": 0.0 }, { "step": 395, "sup_loss": 0.4800006230765676, "rf_loss": 0.0, "total_loss": 0.4800006230765676, "lyap1_mean": -0.2330458164215088, "lyap1_max": -0.1380104422569275, "frac_above_star": 0.0 }, { "step": 396, "sup_loss": 0.41241350825328316, "rf_loss": 0.0, "total_loss": 0.41241350825328316, "lyap1_mean": -0.2461528480052948, "lyap1_max": -0.15010911226272583, "frac_above_star": 0.0 }, { "step": 397, "sup_loss": 0.46628195857002963, "rf_loss": 0.0, "total_loss": 0.46628195857002963, "lyap1_mean": -0.25954166054725647, "lyap1_max": -0.14834284782409668, "frac_above_star": 0.0 }, { "step": 398, "sup_loss": 0.7680981684316472, "rf_loss": 0.0, "total_loss": 0.7680981684316472, "lyap1_mean": -0.1957109421491623, "lyap1_max": -0.13842631876468658, "frac_above_star": 0.0 }, { "step": 399, "sup_loss": 0.45414655548607197, "rf_loss": 0.0, "total_loss": 0.45414655548607197, "lyap1_mean": -0.23266930878162384, "lyap1_max": -0.16785207390785217, "frac_above_star": 0.0 }, { "step": 400, "sup_loss": 0.5470993818360478, "rf_loss": 0.0, "total_loss": 0.5470993818360478, "lyap1_mean": -0.247371107339859, "lyap1_max": -0.16775265336036682, "frac_above_star": 0.0 }, { "step": 401, "sup_loss": 0.6060890249464561, "rf_loss": 0.0, "total_loss": 0.6060890249464561, "lyap1_mean": -0.23491084575653076, "lyap1_max": -0.13046878576278687, "frac_above_star": 0.0 }, { "step": 402, "sup_loss": 0.6433086862722057, "rf_loss": 0.0, "total_loss": 0.6433086862722057, "lyap1_mean": -0.22624745965003967, "lyap1_max": -0.14554187655448914, "frac_above_star": 0.0 }, { "step": 403, "sup_loss": 0.5770216706921802, "rf_loss": 0.0, "total_loss": 0.5770216706921802, "lyap1_mean": -0.18863479793071747, "lyap1_max": -0.05036577209830284, "frac_above_star": 0.0 }, { "step": 404, "sup_loss": 0.37260353217195485, "rf_loss": 0.0, "total_loss": 0.37260353217195485, "lyap1_mean": -0.25863468647003174, "lyap1_max": -0.17592760920524597, "frac_above_star": 0.0 }, { "step": 405, "sup_loss": 0.7498940344575351, "rf_loss": 0.0, "total_loss": 0.7498940344575351, "lyap1_mean": -0.19469135999679565, "lyap1_max": -0.11755923926830292, "frac_above_star": 0.0 }, { "step": 406, "sup_loss": 0.7474589738389056, "rf_loss": 0.0, "total_loss": 0.7474589738389056, "lyap1_mean": -0.2232781946659088, "lyap1_max": -0.1286342740058899, "frac_above_star": 0.0 }, { "step": 407, "sup_loss": 0.79894796149443, "rf_loss": 0.0, "total_loss": 0.79894796149443, "lyap1_mean": -0.23811206221580505, "lyap1_max": -0.13449008762836456, "frac_above_star": 0.0 }, { "step": 408, "sup_loss": 0.573565627500277, "rf_loss": 0.0, "total_loss": 0.573565627500277, "lyap1_mean": -0.2281595766544342, "lyap1_max": -0.17105528712272644, "frac_above_star": 0.0 }, { "step": 409, "sup_loss": 0.9797702182875103, "rf_loss": 0.0, "total_loss": 0.9797702182875103, "lyap1_mean": -0.19455677270889282, "lyap1_max": -0.16017811000347137, "frac_above_star": 0.0 }, { "step": 410, "sup_loss": 0.5941237637733225, "rf_loss": 0.0, "total_loss": 0.5941237637733225, "lyap1_mean": -0.21421773731708527, "lyap1_max": -0.12659311294555664, "frac_above_star": 0.0 }, { "step": 411, "sup_loss": 0.6828079838237895, "rf_loss": 0.0, "total_loss": 0.6828079838237895, "lyap1_mean": -0.19643931090831757, "lyap1_max": -0.15614956617355347, "frac_above_star": 0.0 }, { "step": 412, "sup_loss": 0.8023839143217346, "rf_loss": 0.0, "total_loss": 0.8023839143217346, "lyap1_mean": -0.19028116762638092, "lyap1_max": -0.1554807722568512, "frac_above_star": 0.0 }, { "step": 413, "sup_loss": 0.6272650259856455, "rf_loss": 0.0, "total_loss": 0.6272650259856455, "lyap1_mean": -0.20130380988121033, "lyap1_max": -0.14557811617851257, "frac_above_star": 0.0 }, { "step": 414, "sup_loss": 0.832685347032309, "rf_loss": 0.0, "total_loss": 0.832685347032309, "lyap1_mean": -0.20160439610481262, "lyap1_max": -0.15023809671401978, "frac_above_star": 0.0 }, { "step": 415, "sup_loss": 0.6041836947260294, "rf_loss": 0.0, "total_loss": 0.6041836947260294, "lyap1_mean": -0.21403717994689941, "lyap1_max": -0.17294955253601074, "frac_above_star": 0.0 }, { "step": 416, "sup_loss": 0.5730397834845384, "rf_loss": 0.0, "total_loss": 0.5730397834845384, "lyap1_mean": -0.15468549728393555, "lyap1_max": -0.0571526363492012, "frac_above_star": 0.0 }, { "step": 417, "sup_loss": 0.6746630578893192, "rf_loss": 0.0, "total_loss": 0.6746630578893192, "lyap1_mean": -0.20595599710941315, "lyap1_max": -0.13853368163108826, "frac_above_star": 0.0 }, { "step": 418, "sup_loss": 0.6149385373678194, "rf_loss": 0.0, "total_loss": 0.6149385373678194, "lyap1_mean": -0.23565509915351868, "lyap1_max": -0.15242862701416016, "frac_above_star": 0.0 }, { "step": 419, "sup_loss": 0.6117796917844956, "rf_loss": 0.0, "total_loss": 0.6117796917844956, "lyap1_mean": -0.21939457952976227, "lyap1_max": -0.11468124389648438, "frac_above_star": 0.0 }, { "step": 420, "sup_loss": 0.546369001468315, "rf_loss": 0.0, "total_loss": 0.546369001468315, "lyap1_mean": -0.2253008782863617, "lyap1_max": -0.1351310908794403, "frac_above_star": 0.0 }, { "step": 421, "sup_loss": 0.5678360193643954, "rf_loss": 0.0, "total_loss": 0.5678360193643954, "lyap1_mean": -0.2235012650489807, "lyap1_max": -0.14428293704986572, "frac_above_star": 0.0 }, { "step": 422, "sup_loss": 0.4621307066297527, "rf_loss": 0.0, "total_loss": 0.4621307066297527, "lyap1_mean": -0.2540198266506195, "lyap1_max": -0.1689125895500183, "frac_above_star": 0.0 }, { "step": 423, "sup_loss": 0.4006336773551642, "rf_loss": 0.00018839319818653166, "total_loss": 0.40251760927882185, "lyap1_mean": -0.17290790379047394, "lyap1_max": -0.011178027838468552, "frac_above_star": 0.125 }, { "step": 424, "sup_loss": 0.5542560673345038, "rf_loss": 0.0, "total_loss": 0.5542560673345038, "lyap1_mean": -0.24215170741081238, "lyap1_max": -0.17764568328857422, "frac_above_star": 0.0 }, { "step": 425, "sup_loss": 0.4613437735594227, "rf_loss": 0.0, "total_loss": 0.4613437735594227, "lyap1_mean": -0.2527486979961395, "lyap1_max": -0.17467980086803436, "frac_above_star": 0.0 }, { "step": 426, "sup_loss": 0.5147426055170997, "rf_loss": 0.0, "total_loss": 0.5147426055170997, "lyap1_mean": -0.2252729833126068, "lyap1_max": -0.09682126343250275, "frac_above_star": 0.0 }, { "step": 427, "sup_loss": 0.5989016739704492, "rf_loss": 0.0, "total_loss": 0.5989016739704492, "lyap1_mean": -0.257686585187912, "lyap1_max": -0.1756468117237091, "frac_above_star": 0.0 }, { "step": 428, "sup_loss": 0.4808609429131941, "rf_loss": 0.0, "total_loss": 0.4808609429131941, "lyap1_mean": -0.23024070262908936, "lyap1_max": -0.1409391313791275, "frac_above_star": 0.0 }, { "step": 429, "sup_loss": 0.822633134213223, "rf_loss": 0.0, "total_loss": 0.822633134213223, "lyap1_mean": -0.19250787794589996, "lyap1_max": -0.15449683368206024, "frac_above_star": 0.0 }, { "step": 430, "sup_loss": 0.6980670798374189, "rf_loss": 0.0, "total_loss": 0.6980670798374189, "lyap1_mean": -0.22877156734466553, "lyap1_max": -0.17860949039459229, "frac_above_star": 0.0 }, { "step": 431, "sup_loss": 0.5913083975718165, "rf_loss": 0.0, "total_loss": 0.5913083975718165, "lyap1_mean": -0.21428176760673523, "lyap1_max": -0.14880067110061646, "frac_above_star": 0.0 }, { "step": 432, "sup_loss": 0.5742548025339517, "rf_loss": 0.0, "total_loss": 0.5742548025339517, "lyap1_mean": -0.19972869753837585, "lyap1_max": -0.14378806948661804, "frac_above_star": 0.0 }, { "step": 433, "sup_loss": 0.622112604269508, "rf_loss": 0.0, "total_loss": 0.622112604269508, "lyap1_mean": -0.20484450459480286, "lyap1_max": -0.10459718108177185, "frac_above_star": 0.0 }, { "step": 434, "sup_loss": 0.6283092626466985, "rf_loss": 0.0, "total_loss": 0.6283092626466985, "lyap1_mean": -0.20850074291229248, "lyap1_max": -0.1568463146686554, "frac_above_star": 0.0 }, { "step": 435, "sup_loss": 0.5279803230739013, "rf_loss": 0.0, "total_loss": 0.5279803230739013, "lyap1_mean": -0.22041699290275574, "lyap1_max": -0.12634703516960144, "frac_above_star": 0.0 }, { "step": 436, "sup_loss": 0.4704183942727489, "rf_loss": 0.0, "total_loss": 0.4704183942727489, "lyap1_mean": -0.22725048661231995, "lyap1_max": -0.15891343355178833, "frac_above_star": 0.0 }, { "step": 437, "sup_loss": 0.6599533321301443, "rf_loss": 0.0, "total_loss": 0.6599533321301443, "lyap1_mean": -0.21564775705337524, "lyap1_max": -0.1603040099143982, "frac_above_star": 0.0 }, { "step": 438, "sup_loss": 0.5377865665047743, "rf_loss": 0.0, "total_loss": 0.5377865665047743, "lyap1_mean": -0.19312168657779694, "lyap1_max": -0.16351372003555298, "frac_above_star": 0.0 }, { "step": 439, "sup_loss": 0.5872892527228014, "rf_loss": 0.0, "total_loss": 0.5872892527228014, "lyap1_mean": -0.21844707429409027, "lyap1_max": -0.16125667095184326, "frac_above_star": 0.0 }, { "step": 440, "sup_loss": 0.8405998383238293, "rf_loss": 0.0, "total_loss": 0.8405998383238293, "lyap1_mean": -0.17636080086231232, "lyap1_max": -0.10924814641475677, "frac_above_star": 0.0 }, { "step": 441, "sup_loss": 0.5349202265220784, "rf_loss": 0.0, "total_loss": 0.5349202265220784, "lyap1_mean": -0.21927517652511597, "lyap1_max": -0.1201939508318901, "frac_above_star": 0.0 }, { "step": 442, "sup_loss": 0.4967888737238917, "rf_loss": 0.0, "total_loss": 0.4967888737238917, "lyap1_mean": -0.22101856768131256, "lyap1_max": -0.1005643755197525, "frac_above_star": 0.0 }, { "step": 443, "sup_loss": 0.6759895032257268, "rf_loss": 0.0, "total_loss": 0.6759895032257268, "lyap1_mean": -0.19441074132919312, "lyap1_max": -0.12647679448127747, "frac_above_star": 0.0 }, { "step": 444, "sup_loss": 0.7682728672484888, "rf_loss": 0.0, "total_loss": 0.7682728672484888, "lyap1_mean": -0.20455695688724518, "lyap1_max": -0.14391641318798065, "frac_above_star": 0.0 }, { "step": 445, "sup_loss": 0.5340596002239556, "rf_loss": 0.0, "total_loss": 0.5340596002239556, "lyap1_mean": -0.1894068866968155, "lyap1_max": -0.13329464197158813, "frac_above_star": 0.0 }, { "step": 446, "sup_loss": 0.6097720622595074, "rf_loss": 0.0, "total_loss": 0.6097720622595074, "lyap1_mean": -0.2007661759853363, "lyap1_max": -0.13857173919677734, "frac_above_star": 0.0 }, { "step": 447, "sup_loss": 0.5704053144381531, "rf_loss": 0.0, "total_loss": 0.5704053144381531, "lyap1_mean": -0.2089853584766388, "lyap1_max": -0.14381247758865356, "frac_above_star": 0.0 }, { "step": 448, "sup_loss": 0.7708318842935611, "rf_loss": 0.0, "total_loss": 0.7708318842935611, "lyap1_mean": -0.18507841229438782, "lyap1_max": -0.10562454164028168, "frac_above_star": 0.0 }, { "step": 449, "sup_loss": 0.7827587676296863, "rf_loss": 0.0, "total_loss": 0.7827587676296863, "lyap1_mean": -0.2189193069934845, "lyap1_max": -0.12284156680107117, "frac_above_star": 0.0 }, { "step": 450, "sup_loss": 0.6689201247995654, "rf_loss": 0.0, "total_loss": 0.6689201247995654, "lyap1_mean": -0.23185619711875916, "lyap1_max": -0.17608337104320526, "frac_above_star": 0.0 }, { "step": 451, "sup_loss": 0.551504014224502, "rf_loss": 0.0, "total_loss": 0.551504014224502, "lyap1_mean": -0.25491681694984436, "lyap1_max": -0.18205681443214417, "frac_above_star": 0.0 }, { "step": 452, "sup_loss": 0.6246585033839481, "rf_loss": 0.0, "total_loss": 0.6246585033839481, "lyap1_mean": -0.22794301807880402, "lyap1_max": -0.13384383916854858, "frac_above_star": 0.0 }, { "step": 453, "sup_loss": 0.8146147253527948, "rf_loss": 0.0, "total_loss": 0.8146147253527948, "lyap1_mean": -0.22990316152572632, "lyap1_max": -0.16613446176052094, "frac_above_star": 0.0 }, { "step": 454, "sup_loss": 0.6524028392458605, "rf_loss": 0.0, "total_loss": 0.6524028392458605, "lyap1_mean": -0.21140530705451965, "lyap1_max": -0.14374259114265442, "frac_above_star": 0.0 }, { "step": 455, "sup_loss": 0.5805174857947933, "rf_loss": 0.0, "total_loss": 0.5805174857947933, "lyap1_mean": -0.20731066167354584, "lyap1_max": -0.12318490445613861, "frac_above_star": 0.0 }, { "step": 456, "sup_loss": 0.4502186005223158, "rf_loss": 0.0, "total_loss": 0.4502186005223158, "lyap1_mean": -0.24037030339241028, "lyap1_max": -0.12203490734100342, "frac_above_star": 0.0 }, { "step": 457, "sup_loss": 0.5549551508442796, "rf_loss": 0.0, "total_loss": 0.5549551508442796, "lyap1_mean": -0.21457484364509583, "lyap1_max": -0.14574328064918518, "frac_above_star": 0.0 }, { "step": 458, "sup_loss": 0.5703739531721798, "rf_loss": 0.0, "total_loss": 0.5703739531721798, "lyap1_mean": -0.2315698266029358, "lyap1_max": -0.13514766097068787, "frac_above_star": 0.0 }, { "step": 459, "sup_loss": 0.5834769831844926, "rf_loss": 0.0, "total_loss": 0.5834769831844926, "lyap1_mean": -0.22849972546100616, "lyap1_max": -0.15692950785160065, "frac_above_star": 0.0 }, { "step": 460, "sup_loss": 0.5677209152087253, "rf_loss": 0.0, "total_loss": 0.5677209152087253, "lyap1_mean": -0.24614152312278748, "lyap1_max": -0.15802611410617828, "frac_above_star": 0.0 }, { "step": 461, "sup_loss": 0.5595694271107275, "rf_loss": 0.0, "total_loss": 0.5595694271107275, "lyap1_mean": -0.24104417860507965, "lyap1_max": -0.17910099029541016, "frac_above_star": 0.0 }, { "step": 462, "sup_loss": 0.4690980258067601, "rf_loss": 0.0, "total_loss": 0.4690980258067601, "lyap1_mean": -0.2452768087387085, "lyap1_max": -0.16175620257854462, "frac_above_star": 0.0 }, { "step": 463, "sup_loss": 0.818847195428604, "rf_loss": 0.0, "total_loss": 0.818847195428604, "lyap1_mean": -0.22236952185630798, "lyap1_max": -0.15004590153694153, "frac_above_star": 0.0 }, { "step": 464, "sup_loss": 0.6151018863736678, "rf_loss": 0.0, "total_loss": 0.6151018863736678, "lyap1_mean": -0.21482911705970764, "lyap1_max": -0.09503337740898132, "frac_above_star": 0.0 }, { "step": 465, "sup_loss": 0.6259128074392135, "rf_loss": 0.0, "total_loss": 0.6259128074392135, "lyap1_mean": -0.19102607667446136, "lyap1_max": -0.1449204534292221, "frac_above_star": 0.0 }, { "step": 466, "sup_loss": 0.5730434710274545, "rf_loss": 0.0, "total_loss": 0.5730434710274545, "lyap1_mean": -0.24374115467071533, "lyap1_max": -0.16072188317775726, "frac_above_star": 0.0 }, { "step": 467, "sup_loss": 0.4797580199735464, "rf_loss": 0.0, "total_loss": 0.4797580199735464, "lyap1_mean": -0.230105921626091, "lyap1_max": -0.1578637957572937, "frac_above_star": 0.0 }, { "step": 468, "sup_loss": 0.8231880235770999, "rf_loss": 0.0, "total_loss": 0.8231880235770999, "lyap1_mean": -0.20298781991004944, "lyap1_max": -0.0805358961224556, "frac_above_star": 0.0 }, { "step": 469, "sup_loss": 0.7107948332991013, "rf_loss": 0.0, "total_loss": 0.7107948332991013, "lyap1_mean": -0.18164268136024475, "lyap1_max": -0.08889242261648178, "frac_above_star": 0.0 }, { "step": 470, "sup_loss": 0.5532651436458066, "rf_loss": 0.0, "total_loss": 0.5532651436458066, "lyap1_mean": -0.2296716272830963, "lyap1_max": -0.17731808125972748, "frac_above_star": 0.0 }, { "step": 471, "sup_loss": 0.7506978985467345, "rf_loss": 0.0, "total_loss": 0.7506978985467345, "lyap1_mean": -0.20572766661643982, "lyap1_max": -0.16034196317195892, "frac_above_star": 0.0 }, { "step": 472, "sup_loss": 0.640069551850923, "rf_loss": 0.0, "total_loss": 0.640069551850923, "lyap1_mean": -0.1999901384115219, "lyap1_max": -0.15610679984092712, "frac_above_star": 0.0 }, { "step": 473, "sup_loss": 0.5611310548035375, "rf_loss": 0.0, "total_loss": 0.5611310548035375, "lyap1_mean": -0.22579239308834076, "lyap1_max": -0.15909507870674133, "frac_above_star": 0.0 }, { "step": 474, "sup_loss": 0.37755203101877316, "rf_loss": 0.0, "total_loss": 0.37755203101877316, "lyap1_mean": -0.22984983026981354, "lyap1_max": -0.1553807556629181, "frac_above_star": 0.0 }, { "step": 475, "sup_loss": 0.788111336470161, "rf_loss": 0.0, "total_loss": 0.788111336470161, "lyap1_mean": -0.17285682260990143, "lyap1_max": -0.12928509712219238, "frac_above_star": 0.0 }, { "step": 476, "sup_loss": 0.5692312890868217, "rf_loss": 0.0, "total_loss": 0.5692312890868217, "lyap1_mean": -0.23381999135017395, "lyap1_max": -0.12067683786153793, "frac_above_star": 0.0 }, { "step": 477, "sup_loss": 0.4842579373264275, "rf_loss": 0.0, "total_loss": 0.4842579373264275, "lyap1_mean": -0.2727886140346527, "lyap1_max": -0.1940649449825287, "frac_above_star": 0.0 }, { "step": 478, "sup_loss": 0.6094397031476663, "rf_loss": 0.0, "total_loss": 0.6094397031476663, "lyap1_mean": -0.22106488049030304, "lyap1_max": -0.16366024315357208, "frac_above_star": 0.0 }, { "step": 479, "sup_loss": 0.5971989900374587, "rf_loss": 0.0, "total_loss": 0.5971989900374587, "lyap1_mean": -0.2181301712989807, "lyap1_max": -0.1530958116054535, "frac_above_star": 0.0 }, { "step": 480, "sup_loss": 0.6713177318919344, "rf_loss": 0.0, "total_loss": 0.6713177318919344, "lyap1_mean": -0.2184915393590927, "lyap1_max": -0.1814681887626648, "frac_above_star": 0.0 }, { "step": 481, "sup_loss": 0.5228367497324832, "rf_loss": 0.0, "total_loss": 0.5228367497324832, "lyap1_mean": -0.22797653079032898, "lyap1_max": -0.14713995158672333, "frac_above_star": 0.0 }, { "step": 482, "sup_loss": 0.8152582095690803, "rf_loss": 0.0, "total_loss": 0.8152582095690803, "lyap1_mean": -0.21665066480636597, "lyap1_max": -0.1391698122024536, "frac_above_star": 0.0 }, { "step": 483, "sup_loss": 0.574700934196167, "rf_loss": 0.0, "total_loss": 0.574700934196167, "lyap1_mean": -0.21301104128360748, "lyap1_max": -0.10645733773708344, "frac_above_star": 0.0 }, { "step": 484, "sup_loss": 0.5598177696274965, "rf_loss": 0.0, "total_loss": 0.5598177696274965, "lyap1_mean": -0.2458435446023941, "lyap1_max": -0.14060968160629272, "frac_above_star": 0.0 }, { "step": 485, "sup_loss": 0.7191556913916637, "rf_loss": 0.0, "total_loss": 0.7191556913916637, "lyap1_mean": -0.23266196250915527, "lyap1_max": -0.1437108814716339, "frac_above_star": 0.0 }, { "step": 486, "sup_loss": 0.6567477350083338, "rf_loss": 0.0, "total_loss": 0.6567477350083338, "lyap1_mean": -0.22213956713676453, "lyap1_max": -0.1710439920425415, "frac_above_star": 0.0 }, { "step": 487, "sup_loss": 0.45876177384092176, "rf_loss": 0.0, "total_loss": 0.45876177384092176, "lyap1_mean": -0.2387300431728363, "lyap1_max": -0.08665876090526581, "frac_above_star": 0.0 }, { "step": 488, "sup_loss": 0.6932138391433285, "rf_loss": 0.0, "total_loss": 0.6932138391433285, "lyap1_mean": -0.2065650224685669, "lyap1_max": -0.13189248740673065, "frac_above_star": 0.0 }, { "step": 489, "sup_loss": 0.48031332835719526, "rf_loss": 0.0, "total_loss": 0.48031332835719526, "lyap1_mean": -0.24465778470039368, "lyap1_max": -0.09884530305862427, "frac_above_star": 0.0 }, { "step": 490, "sup_loss": 0.5642522943112197, "rf_loss": 0.0, "total_loss": 0.5642522943112197, "lyap1_mean": -0.22475336492061615, "lyap1_max": -0.1256757378578186, "frac_above_star": 0.0 }, { "step": 491, "sup_loss": 0.6721265003939094, "rf_loss": 0.0, "total_loss": 0.6721265003939094, "lyap1_mean": -0.2352738082408905, "lyap1_max": -0.16954371333122253, "frac_above_star": 0.0 }, { "step": 492, "sup_loss": 0.7614344393339444, "rf_loss": 0.0, "total_loss": 0.7614344393339444, "lyap1_mean": -0.2063005566596985, "lyap1_max": -0.16296163201332092, "frac_above_star": 0.0 }, { "step": 493, "sup_loss": 0.5751549553515443, "rf_loss": 0.0, "total_loss": 0.5751549553515443, "lyap1_mean": -0.21087966859340668, "lyap1_max": -0.10467313975095749, "frac_above_star": 0.0 }, { "step": 494, "sup_loss": 0.7259734377054724, "rf_loss": 0.0, "total_loss": 0.7259734377054724, "lyap1_mean": -0.2070980817079544, "lyap1_max": -0.10363219678401947, "frac_above_star": 0.0 }, { "step": 495, "sup_loss": 0.7602490716883397, "rf_loss": 0.0, "total_loss": 0.7602490716883397, "lyap1_mean": -0.1845816820859909, "lyap1_max": -0.09565240144729614, "frac_above_star": 0.0 }, { "step": 496, "sup_loss": 0.4906964264759617, "rf_loss": 0.0, "total_loss": 0.4906964264759617, "lyap1_mean": -0.20967888832092285, "lyap1_max": -0.16176092624664307, "frac_above_star": 0.0 }, { "step": 497, "sup_loss": 0.6845335841918382, "rf_loss": 0.0, "total_loss": 0.6845335841918382, "lyap1_mean": -0.18434417247772217, "lyap1_max": -0.09851005673408508, "frac_above_star": 0.0 }, { "step": 498, "sup_loss": 0.7078062872270657, "rf_loss": 0.0, "total_loss": 0.7078062872270657, "lyap1_mean": -0.22571706771850586, "lyap1_max": -0.16094744205474854, "frac_above_star": 0.0 }, { "step": 499, "sup_loss": 0.40959508305204967, "rf_loss": 0.00010468860273249447, "total_loss": 0.41064196902116695, "lyap1_mean": -0.22179558873176575, "lyap1_max": -0.02106025628745556, "frac_above_star": 0.125 } ], "evals": [ { "step": 0, "acc": 0.517578125, "tok_acc": 0.8276668595679012 }, { "step": 100, "acc": 0.583984375, "tok_acc": 0.8514660493827161 }, { "step": 200, "acc": 0.5703125, "tok_acc": 0.8477768132716049 }, { "step": 300, "acc": 0.638671875, "tok_acc": 0.8697193287037037 }, { "step": 400, "acc": 0.607421875, "tok_acc": 0.8614969135802469 }, { "step": 500, "acc": 0.615234375, "tok_acc": 0.8655478395061729 }, { "step": 500, "acc": 0.615234375, "tok_acc": 0.8655478395061729 } ], "final_acc": 0.615234375, "final_tok_acc": 0.8655478395061729 }