{ "args": { "ckpt_root": "/home/yurenh2/rrm/hrm/checkpoints/Sudoku-extreme-1k-aug-1000 ACT-torch/HierarchicalReasoningModel_ACTV1 righteous-python", "ckpt_name": "step_26040", "n_steps": 500, "batch_size": 8, "lr": 1e-05, "alpha_rf": 10.0, "lambda_star": 0.0, "k_lyap": 2, "lyap_act_steps": 4, "seed": 42, "eval_every": 100, "eval_n": 512, "eval_batch_size": 32, "out": "/home/yurenh2/rrm/research/flossing/step3_D_rf_26040_lstar0.json" }, "initial_acc": 0.517578125, "initial_tok_acc": 0.8276668595679012, "steps": [ { "step": 0, "sup_loss": 0.5709326593550843, "rf_loss": 0.0, "total_loss": 0.5709326593550843, "lyap1_mean": -0.18472686409950256, "lyap1_max": -0.04164290055632591, "frac_above_star": 0.0 }, { "step": 1, "sup_loss": 0.4537315985598272, "rf_loss": 0.0, "total_loss": 0.4537315985598272, "lyap1_mean": -0.18278884887695312, "lyap1_max": -0.07852113246917725, "frac_above_star": 0.0 }, { "step": 2, "sup_loss": 0.7113479716905943, "rf_loss": 0.0, "total_loss": 0.7113479716905943, "lyap1_mean": -0.19486622512340546, "lyap1_max": -0.1192842349410057, "frac_above_star": 0.0 }, { "step": 3, "sup_loss": 0.597583092054463, "rf_loss": 0.0, "total_loss": 0.597583092054463, "lyap1_mean": -0.18127819895744324, "lyap1_max": -0.0903722271323204, "frac_above_star": 0.0 }, { "step": 4, "sup_loss": 0.5738701157693367, "rf_loss": 0.0, "total_loss": 0.5738701157693367, "lyap1_mean": -0.1465875506401062, "lyap1_max": -0.0674026608467102, "frac_above_star": 0.0 }, { "step": 5, "sup_loss": 0.8187648733421766, "rf_loss": 0.0, "total_loss": 0.8187648733421766, "lyap1_mean": -0.13810217380523682, "lyap1_max": -0.023307686671614647, "frac_above_star": 0.0 }, { "step": 6, "sup_loss": 0.5935503668105154, "rf_loss": 0.0, "total_loss": 0.5935503668105154, "lyap1_mean": -0.18558409810066223, "lyap1_max": -0.14445218443870544, "frac_above_star": 0.0 }, { "step": 7, "sup_loss": 0.6116007363203012, "rf_loss": 0.0, "total_loss": 0.6116007363203012, "lyap1_mean": -0.17203228175640106, "lyap1_max": -0.13824281096458435, "frac_above_star": 0.0 }, { "step": 8, "sup_loss": 0.7647240980851782, "rf_loss": 0.0, "total_loss": 0.7647240980851782, "lyap1_mean": -0.13947001099586487, "lyap1_max": -0.09547226876020432, "frac_above_star": 0.0 }, { "step": 9, "sup_loss": 0.8396100166154439, "rf_loss": 0.0, "total_loss": 0.8396100166154439, "lyap1_mean": -0.13995055854320526, "lyap1_max": -0.03150452673435211, "frac_above_star": 0.0 }, { "step": 10, "sup_loss": 0.6428039585044509, "rf_loss": 0.0, "total_loss": 0.6428039585044509, "lyap1_mean": -0.15870139002799988, "lyap1_max": -0.09396694600582123, "frac_above_star": 0.0 }, { "step": 11, "sup_loss": 0.5811422490218018, "rf_loss": 0.0, "total_loss": 0.5811422490218018, "lyap1_mean": -0.19246718287467957, "lyap1_max": -0.10694313049316406, "frac_above_star": 0.0 }, { "step": 12, "sup_loss": 0.5142992216071943, "rf_loss": 0.0, "total_loss": 0.5142992216071943, "lyap1_mean": -0.17781132459640503, "lyap1_max": -0.10174864530563354, "frac_above_star": 0.0 }, { "step": 13, "sup_loss": 0.6980310100472148, "rf_loss": 0.0, "total_loss": 0.6980310100472148, "lyap1_mean": -0.1402999758720398, "lyap1_max": -0.0456048846244812, "frac_above_star": 0.0 }, { "step": 14, "sup_loss": 0.5892403047533569, "rf_loss": 0.0, "total_loss": 0.5892403047533569, "lyap1_mean": -0.16698290407657623, "lyap1_max": -0.03724510222673416, "frac_above_star": 0.0 }, { "step": 15, "sup_loss": 0.6831909016860896, "rf_loss": 0.0, "total_loss": 0.6831909016860896, "lyap1_mean": -0.1744181364774704, "lyap1_max": -0.07581361383199692, "frac_above_star": 0.0 }, { "step": 16, "sup_loss": 0.5609518770313622, "rf_loss": 0.0, "total_loss": 0.5609518770313622, "lyap1_mean": -0.15907441079616547, "lyap1_max": -0.03832785412669182, "frac_above_star": 0.0 }, { "step": 17, "sup_loss": 0.7168034194474827, "rf_loss": 0.0, "total_loss": 0.7168034194474827, "lyap1_mean": -0.13614536821842194, "lyap1_max": -0.07818807661533356, "frac_above_star": 0.0 }, { "step": 18, "sup_loss": 0.5966043230778727, "rf_loss": 0.0, "total_loss": 0.5966043230778727, "lyap1_mean": -0.19817839562892914, "lyap1_max": -0.12519890069961548, "frac_above_star": 0.0 }, { "step": 19, "sup_loss": 0.47885175270739827, "rf_loss": 0.0, "total_loss": 0.47885175270739827, "lyap1_mean": -0.18308168649673462, "lyap1_max": -0.014672264456748962, "frac_above_star": 0.0 }, { "step": 20, "sup_loss": 0.5983548755237532, "rf_loss": 0.0, "total_loss": 0.5983548755237532, "lyap1_mean": -0.17639592289924622, "lyap1_max": -0.06831589341163635, "frac_above_star": 0.0 }, { "step": 21, "sup_loss": 0.5746365896558261, "rf_loss": 0.0, "total_loss": 0.5746365896558261, "lyap1_mean": -0.16372406482696533, "lyap1_max": -0.11158832907676697, "frac_above_star": 0.0 }, { "step": 22, "sup_loss": 0.6301474495948247, "rf_loss": 0.0, "total_loss": 0.6301474495948247, "lyap1_mean": -0.16582883894443512, "lyap1_max": -0.06442220509052277, "frac_above_star": 0.0 }, { "step": 23, "sup_loss": 0.5427223688141529, "rf_loss": 0.0, "total_loss": 0.5427223688141529, "lyap1_mean": -0.1792174130678177, "lyap1_max": -0.11282213777303696, "frac_above_star": 0.0 }, { "step": 24, "sup_loss": 0.7867869354688557, "rf_loss": 0.0, "total_loss": 0.7867869354688557, "lyap1_mean": -0.14375832676887512, "lyap1_max": -0.10010765492916107, "frac_above_star": 0.0 }, { "step": 25, "sup_loss": 0.817251779312334, "rf_loss": 4.548199285636656e-06, "total_loss": 0.8172972613051903, "lyap1_mean": -0.12222366780042648, "lyap1_max": 0.00603204732760787, "frac_above_star": 0.125 }, { "step": 26, "sup_loss": 0.8035067499033389, "rf_loss": 0.0, "total_loss": 0.8035067499033389, "lyap1_mean": -0.1318286508321762, "lyap1_max": -0.07215680927038193, "frac_above_star": 0.0 }, { "step": 27, "sup_loss": 0.4270028163263247, "rf_loss": 0.0, "total_loss": 0.4270028163263247, "lyap1_mean": -0.18793411552906036, "lyap1_max": -0.07287189364433289, "frac_above_star": 0.0 }, { "step": 28, "sup_loss": 0.7617109706684106, "rf_loss": 0.0, "total_loss": 0.7617109706684106, "lyap1_mean": -0.13562969863414764, "lyap1_max": -0.05400077626109123, "frac_above_star": 0.0 }, { "step": 29, "sup_loss": 0.7822640095468119, "rf_loss": 0.0, "total_loss": 0.7822640095468119, "lyap1_mean": -0.14778971672058105, "lyap1_max": -0.0919022187590599, "frac_above_star": 0.0 }, { "step": 30, "sup_loss": 0.6729986206898457, "rf_loss": 0.0, "total_loss": 0.6729986206898457, "lyap1_mean": -0.1395232230424881, "lyap1_max": -0.02846486121416092, "frac_above_star": 0.0 }, { "step": 31, "sup_loss": 0.6373579476035567, "rf_loss": 8.829884609440342e-05, "total_loss": 0.6382409360499488, "lyap1_mean": -0.1356256902217865, "lyap1_max": 0.026578012853860855, "frac_above_star": 0.125 }, { "step": 32, "sup_loss": 0.5830916228134961, "rf_loss": 0.0, "total_loss": 0.5830916228134961, "lyap1_mean": -0.14453251659870148, "lyap1_max": -0.08446592092514038, "frac_above_star": 0.0 }, { "step": 33, "sup_loss": 0.521404521173602, "rf_loss": 0.0, "total_loss": 0.521404521173602, "lyap1_mean": -0.17164994776248932, "lyap1_max": -0.09436239302158356, "frac_above_star": 0.0 }, { "step": 34, "sup_loss": 0.7941034261864478, "rf_loss": 0.0, "total_loss": 0.7941034261864478, "lyap1_mean": -0.15527258813381195, "lyap1_max": -0.10340406745672226, "frac_above_star": 0.0 }, { "step": 35, "sup_loss": 0.4363282311965954, "rf_loss": 0.0, "total_loss": 0.4363282311965954, "lyap1_mean": -0.18346171081066132, "lyap1_max": -0.10809855163097382, "frac_above_star": 0.0 }, { "step": 36, "sup_loss": 0.6136871672257647, "rf_loss": 0.0, "total_loss": 0.6136871672257647, "lyap1_mean": -0.17476990818977356, "lyap1_max": -0.11162661761045456, "frac_above_star": 0.0 }, { "step": 37, "sup_loss": 0.8029722518854867, "rf_loss": 0.0, "total_loss": 0.8029722518854867, "lyap1_mean": -0.15289001166820526, "lyap1_max": -0.09114080667495728, "frac_above_star": 0.0 }, { "step": 38, "sup_loss": 0.513709011562989, "rf_loss": 0.0, "total_loss": 0.513709011562989, "lyap1_mean": -0.17961949110031128, "lyap1_max": -0.09186246991157532, "frac_above_star": 0.0 }, { "step": 39, "sup_loss": 0.7502787226987873, "rf_loss": 0.0, "total_loss": 0.7502787226987873, "lyap1_mean": -0.1405312716960907, "lyap1_max": -0.0837816596031189, "frac_above_star": 0.0 }, { "step": 40, "sup_loss": 0.6877028622418593, "rf_loss": 0.0, "total_loss": 0.6877028622418593, "lyap1_mean": -0.17151132225990295, "lyap1_max": -0.13685926795005798, "frac_above_star": 0.0 }, { "step": 41, "sup_loss": 0.4863387269811524, "rf_loss": 0.0, "total_loss": 0.4863387269811524, "lyap1_mean": -0.21138250827789307, "lyap1_max": -0.1175619587302208, "frac_above_star": 0.0 }, { "step": 42, "sup_loss": 0.7514742933668795, "rf_loss": 0.0, "total_loss": 0.7514742933668795, "lyap1_mean": -0.16092783212661743, "lyap1_max": -0.031270831823349, "frac_above_star": 0.0 }, { "step": 43, "sup_loss": 0.7129178077227725, "rf_loss": 0.0, "total_loss": 0.7129178077227725, "lyap1_mean": -0.1851135790348053, "lyap1_max": -0.10778182744979858, "frac_above_star": 0.0 }, { "step": 44, "sup_loss": 0.8868683315345265, "rf_loss": 0.0, "total_loss": 0.8868683315345265, "lyap1_mean": -0.1670822948217392, "lyap1_max": -0.11507737636566162, "frac_above_star": 0.0 }, { "step": 45, "sup_loss": 0.6351602932222572, "rf_loss": 0.0, "total_loss": 0.6351602932222572, "lyap1_mean": -0.1371801495552063, "lyap1_max": -0.061941247433423996, "frac_above_star": 0.0 }, { "step": 46, "sup_loss": 0.6563493031305806, "rf_loss": 0.0, "total_loss": 0.6563493031305806, "lyap1_mean": -0.17162778973579407, "lyap1_max": -0.09708268940448761, "frac_above_star": 0.0 }, { "step": 47, "sup_loss": 0.647606127062305, "rf_loss": 0.0, "total_loss": 0.647606127062305, "lyap1_mean": -0.1585829257965088, "lyap1_max": -0.11212565749883652, "frac_above_star": 0.0 }, { "step": 48, "sup_loss": 0.5985624645375054, "rf_loss": 0.0, "total_loss": 0.5985624645375054, "lyap1_mean": -0.16952288150787354, "lyap1_max": -0.00444550346583128, "frac_above_star": 0.0 }, { "step": 49, "sup_loss": 0.5917569659446742, "rf_loss": 0.0, "total_loss": 0.5917569659446742, "lyap1_mean": -0.16630221903324127, "lyap1_max": -0.10793127119541168, "frac_above_star": 0.0 }, { "step": 50, "sup_loss": 0.6085986407724109, "rf_loss": 0.0, "total_loss": 0.6085986407724109, "lyap1_mean": -0.18211820721626282, "lyap1_max": -0.10828250646591187, "frac_above_star": 0.0 }, { "step": 51, "sup_loss": 0.8413370421486563, "rf_loss": 0.0, "total_loss": 0.8413370421486563, "lyap1_mean": -0.15773043036460876, "lyap1_max": -0.06584006547927856, "frac_above_star": 0.0 }, { "step": 52, "sup_loss": 0.5183901930392883, "rf_loss": 0.0, "total_loss": 0.5183901930392883, "lyap1_mean": -0.16177651286125183, "lyap1_max": -0.049565624445676804, "frac_above_star": 0.0 }, { "step": 53, "sup_loss": 0.6302464230587657, "rf_loss": 0.0, "total_loss": 0.6302464230587657, "lyap1_mean": -0.16698575019836426, "lyap1_max": -0.08847765624523163, "frac_above_star": 0.0 }, { "step": 54, "sup_loss": 0.5887948076394037, "rf_loss": 0.0, "total_loss": 0.5887948076394037, "lyap1_mean": -0.15485382080078125, "lyap1_max": -0.06163830682635307, "frac_above_star": 0.0 }, { "step": 55, "sup_loss": 0.6782536216819343, "rf_loss": 0.0, "total_loss": 0.6782536216819343, "lyap1_mean": -0.1806010901927948, "lyap1_max": -0.13877363502979279, "frac_above_star": 0.0 }, { "step": 56, "sup_loss": 0.5827696306391047, "rf_loss": 0.0, "total_loss": 0.5827696306391047, "lyap1_mean": -0.1872037798166275, "lyap1_max": -0.0712938904762268, "frac_above_star": 0.0 }, { "step": 57, "sup_loss": 0.6474822727773479, "rf_loss": 0.0, "total_loss": 0.6474822727773479, "lyap1_mean": -0.1662570834159851, "lyap1_max": -0.06317443400621414, "frac_above_star": 0.0 }, { "step": 58, "sup_loss": 0.6788763995223821, "rf_loss": 0.0, "total_loss": 0.6788763995223821, "lyap1_mean": -0.1647149920463562, "lyap1_max": -0.09737633913755417, "frac_above_star": 0.0 }, { "step": 59, "sup_loss": 0.47308183679881255, "rf_loss": 0.0, "total_loss": 0.47308183679881255, "lyap1_mean": -0.18589964509010315, "lyap1_max": -0.12766408920288086, "frac_above_star": 0.0 }, { "step": 60, "sup_loss": 0.658854769842467, "rf_loss": 0.0, "total_loss": 0.658854769842467, "lyap1_mean": -0.16994233429431915, "lyap1_max": -0.061627887189388275, "frac_above_star": 0.0 }, { "step": 61, "sup_loss": 0.5568001125947928, "rf_loss": 0.0, "total_loss": 0.5568001125947928, "lyap1_mean": -0.15149489045143127, "lyap1_max": -0.022932160645723343, "frac_above_star": 0.0 }, { "step": 62, "sup_loss": 0.3920446858339084, "rf_loss": 0.0, "total_loss": 0.3920446858339084, "lyap1_mean": -0.19239003956317902, "lyap1_max": -0.10116466134786606, "frac_above_star": 0.0 }, { "step": 63, "sup_loss": 0.721397570023637, "rf_loss": 0.0, "total_loss": 0.721397570023637, "lyap1_mean": -0.11694826185703278, "lyap1_max": -0.0010510149877518415, "frac_above_star": 0.0 }, { "step": 64, "sup_loss": 0.6330102172688891, "rf_loss": 0.0, "total_loss": 0.6330102172688891, "lyap1_mean": -0.1513533890247345, "lyap1_max": -0.017508748918771744, "frac_above_star": 0.0 }, { "step": 65, "sup_loss": 0.8250728506941158, "rf_loss": 0.0, "total_loss": 0.8250728506941158, "lyap1_mean": -0.17732658982276917, "lyap1_max": -0.09383243322372437, "frac_above_star": 0.0 }, { "step": 66, "sup_loss": 0.5940941855190451, "rf_loss": 0.0, "total_loss": 0.5940941855190451, "lyap1_mean": -0.1654309332370758, "lyap1_max": -0.1284300982952118, "frac_above_star": 0.0 }, { "step": 67, "sup_loss": 0.4664364560962616, "rf_loss": 0.0, "total_loss": 0.4664364560962616, "lyap1_mean": -0.1642216444015503, "lyap1_max": -0.06826764345169067, "frac_above_star": 0.0 }, { "step": 68, "sup_loss": 0.6827257766025395, "rf_loss": 0.0, "total_loss": 0.6827257766025395, "lyap1_mean": -0.15604588389396667, "lyap1_max": -0.033950455486774445, "frac_above_star": 0.0 }, { "step": 69, "sup_loss": 0.7690185307512533, "rf_loss": 0.0, "total_loss": 0.7690185307512533, "lyap1_mean": -0.14441591501235962, "lyap1_max": -0.04283683001995087, "frac_above_star": 0.0 }, { "step": 70, "sup_loss": 0.6848736940860772, "rf_loss": 0.0, "total_loss": 0.6848736940860772, "lyap1_mean": -0.1828622668981552, "lyap1_max": -0.1170906275510788, "frac_above_star": 0.0 }, { "step": 71, "sup_loss": 0.7542726315728827, "rf_loss": 0.0, "total_loss": 0.7542726315728827, "lyap1_mean": -0.1594351828098297, "lyap1_max": -0.12077991664409637, "frac_above_star": 0.0 }, { "step": 72, "sup_loss": 0.42682296156124, "rf_loss": 0.0, "total_loss": 0.42682296156124, "lyap1_mean": -0.1843143105506897, "lyap1_max": -0.1570216864347458, "frac_above_star": 0.0 }, { "step": 73, "sup_loss": 0.5746759420306596, "rf_loss": 0.0, "total_loss": 0.5746759420306596, "lyap1_mean": -0.19194787740707397, "lyap1_max": -0.15704798698425293, "frac_above_star": 0.0 }, { "step": 74, "sup_loss": 0.6472347139375125, "rf_loss": 0.0, "total_loss": 0.6472347139375125, "lyap1_mean": -0.18024486303329468, "lyap1_max": -0.08175953477621078, "frac_above_star": 0.0 }, { "step": 75, "sup_loss": 0.6434590189756606, "rf_loss": 0.0, "total_loss": 0.6434590189756606, "lyap1_mean": -0.12922370433807373, "lyap1_max": -0.08600979298353195, "frac_above_star": 0.0 }, { "step": 76, "sup_loss": 0.558842837989357, "rf_loss": 0.0, "total_loss": 0.558842837989357, "lyap1_mean": -0.16661901772022247, "lyap1_max": -0.08575361967086792, "frac_above_star": 0.0 }, { "step": 77, "sup_loss": 0.6260539351643165, "rf_loss": 0.0, "total_loss": 0.6260539351643165, "lyap1_mean": -0.17542681097984314, "lyap1_max": -0.14538516104221344, "frac_above_star": 0.0 }, { "step": 78, "sup_loss": 0.861482869698535, "rf_loss": 0.0, "total_loss": 0.861482869698535, "lyap1_mean": -0.1483696699142456, "lyap1_max": -0.11332204192876816, "frac_above_star": 0.0 }, { "step": 79, "sup_loss": 0.7148390509002194, "rf_loss": 0.0, "total_loss": 0.7148390509002194, "lyap1_mean": -0.15092776715755463, "lyap1_max": -0.1086602658033371, "frac_above_star": 0.0 }, { "step": 80, "sup_loss": 0.6532735136873377, "rf_loss": 0.0, "total_loss": 0.6532735136873377, "lyap1_mean": -0.17219707369804382, "lyap1_max": -0.07662263512611389, "frac_above_star": 0.0 }, { "step": 81, "sup_loss": 0.397951504033647, "rf_loss": 0.0, "total_loss": 0.397951504033647, "lyap1_mean": -0.18101228773593903, "lyap1_max": -0.1068848967552185, "frac_above_star": 0.0 }, { "step": 82, "sup_loss": 0.5690674482673395, "rf_loss": 0.0, "total_loss": 0.5690674482673395, "lyap1_mean": -0.16561073064804077, "lyap1_max": -0.040073543787002563, "frac_above_star": 0.0 }, { "step": 83, "sup_loss": 0.6969073781404801, "rf_loss": 0.0, "total_loss": 0.6969073781404801, "lyap1_mean": -0.15943306684494019, "lyap1_max": -0.08403140306472778, "frac_above_star": 0.0 }, { "step": 84, "sup_loss": 0.718420066845627, "rf_loss": 0.0, "total_loss": 0.718420066845627, "lyap1_mean": -0.1287401020526886, "lyap1_max": -0.05855541676282883, "frac_above_star": 0.0 }, { "step": 85, "sup_loss": 0.7393493357043255, "rf_loss": 0.0, "total_loss": 0.7393493357043255, "lyap1_mean": -0.1613348126411438, "lyap1_max": -0.07303096354007721, "frac_above_star": 0.0 }, { "step": 86, "sup_loss": 0.7361247995323846, "rf_loss": 0.0, "total_loss": 0.7361247995323846, "lyap1_mean": -0.1712632179260254, "lyap1_max": -0.1111355870962143, "frac_above_star": 0.0 }, { "step": 87, "sup_loss": 0.665967349699131, "rf_loss": 0.0, "total_loss": 0.665967349699131, "lyap1_mean": -0.13269855082035065, "lyap1_max": -0.06142164766788483, "frac_above_star": 0.0 }, { "step": 88, "sup_loss": 0.8668512995073326, "rf_loss": 0.0, "total_loss": 0.8668512995073326, "lyap1_mean": -0.1623269021511078, "lyap1_max": -0.06179894506931305, "frac_above_star": 0.0 }, { "step": 89, "sup_loss": 0.7472489198897707, "rf_loss": 0.0, "total_loss": 0.7472489198897707, "lyap1_mean": -0.16679202020168304, "lyap1_max": -0.07163617014884949, "frac_above_star": 0.0 }, { "step": 90, "sup_loss": 0.45785369931819686, "rf_loss": 0.0, "total_loss": 0.45785369931819686, "lyap1_mean": -0.14543414115905762, "lyap1_max": -0.07081221789121628, "frac_above_star": 0.0 }, { "step": 91, "sup_loss": 0.6713364617643696, "rf_loss": 0.0, "total_loss": 0.6713364617643696, "lyap1_mean": -0.16620296239852905, "lyap1_max": -0.1152341216802597, "frac_above_star": 0.0 }, { "step": 92, "sup_loss": 0.6798887309407537, "rf_loss": 0.0, "total_loss": 0.6798887309407537, "lyap1_mean": -0.18379780650138855, "lyap1_max": -0.08940088003873825, "frac_above_star": 0.0 }, { "step": 93, "sup_loss": 0.470993184242424, "rf_loss": 0.0, "total_loss": 0.470993184242424, "lyap1_mean": -0.1753304898738861, "lyap1_max": -0.07410664856433868, "frac_above_star": 0.0 }, { "step": 94, "sup_loss": 0.7099687879292464, "rf_loss": 0.0, "total_loss": 0.7099687879292464, "lyap1_mean": -0.13737663626670837, "lyap1_max": -0.02115902304649353, "frac_above_star": 0.0 }, { "step": 95, "sup_loss": 0.6304236624334681, "rf_loss": 0.0, "total_loss": 0.6304236624334681, "lyap1_mean": -0.16854791343212128, "lyap1_max": -0.13022518157958984, "frac_above_star": 0.0 }, { "step": 96, "sup_loss": 0.7120030864178615, "rf_loss": 0.0, "total_loss": 0.7120030864178615, "lyap1_mean": -0.16556787490844727, "lyap1_max": -0.059217117726802826, "frac_above_star": 0.0 }, { "step": 97, "sup_loss": 0.49628548442866827, "rf_loss": 0.0, "total_loss": 0.49628548442866827, "lyap1_mean": -0.16981056332588196, "lyap1_max": -0.09900077432394028, "frac_above_star": 0.0 }, { "step": 98, "sup_loss": 0.7436049322671723, "rf_loss": 0.0, "total_loss": 0.7436049322671723, "lyap1_mean": -0.18156345188617706, "lyap1_max": -0.08804964274168015, "frac_above_star": 0.0 }, { "step": 99, "sup_loss": 0.5238087801518918, "rf_loss": 0.0, "total_loss": 0.5238087801518918, "lyap1_mean": -0.19207635521888733, "lyap1_max": -0.10540645569562912, "frac_above_star": 0.0 }, { "step": 100, "sup_loss": 0.5774716897504695, "rf_loss": 0.0, "total_loss": 0.5774716897504695, "lyap1_mean": -0.1739678531885147, "lyap1_max": -0.11489246785640717, "frac_above_star": 0.0 }, { "step": 101, "sup_loss": 0.5231556343723287, "rf_loss": 2.1604860194202047e-06, "total_loss": 0.5231772392334324, "lyap1_mean": -0.1403467059135437, "lyap1_max": 0.004157389514148235, "frac_above_star": 0.125 }, { "step": 102, "sup_loss": 0.683954065967664, "rf_loss": 0.0, "total_loss": 0.683954065967664, "lyap1_mean": -0.16159150004386902, "lyap1_max": -0.10724122822284698, "frac_above_star": 0.0 }, { "step": 103, "sup_loss": 0.673855342863094, "rf_loss": 0.0, "total_loss": 0.673855342863094, "lyap1_mean": -0.1392432153224945, "lyap1_max": -0.09444575011730194, "frac_above_star": 0.0 }, { "step": 104, "sup_loss": 0.7308201298778694, "rf_loss": 0.0, "total_loss": 0.7308201298778694, "lyap1_mean": -0.1400500386953354, "lyap1_max": -0.05964689701795578, "frac_above_star": 0.0 }, { "step": 105, "sup_loss": 0.7183844608879186, "rf_loss": 0.0, "total_loss": 0.7183844608879186, "lyap1_mean": -0.16069242358207703, "lyap1_max": -0.10598012059926987, "frac_above_star": 0.0 }, { "step": 106, "sup_loss": 0.703889093445469, "rf_loss": 0.0, "total_loss": 0.703889093445469, "lyap1_mean": -0.16085049510002136, "lyap1_max": -0.09450648725032806, "frac_above_star": 0.0 }, { "step": 107, "sup_loss": 0.7585623041551177, "rf_loss": 0.0, "total_loss": 0.7585623041551177, "lyap1_mean": -0.17502331733703613, "lyap1_max": -0.11126396059989929, "frac_above_star": 0.0 }, { "step": 108, "sup_loss": 0.6285093504506747, "rf_loss": 0.0, "total_loss": 0.6285093504506747, "lyap1_mean": -0.14805707335472107, "lyap1_max": -0.0061344183050096035, "frac_above_star": 0.0 }, { "step": 109, "sup_loss": 0.7506853835027976, "rf_loss": 0.0, "total_loss": 0.7506853835027976, "lyap1_mean": -0.14569415152072906, "lyap1_max": -0.08929413557052612, "frac_above_star": 0.0 }, { "step": 110, "sup_loss": 0.6462080920140123, "rf_loss": 0.0, "total_loss": 0.6462080920140123, "lyap1_mean": -0.18132932484149933, "lyap1_max": -0.10848363488912582, "frac_above_star": 0.0 }, { "step": 111, "sup_loss": 0.7425096371613439, "rf_loss": 0.0, "total_loss": 0.7425096371613439, "lyap1_mean": -0.16515275835990906, "lyap1_max": -0.023672889918088913, "frac_above_star": 0.0 }, { "step": 112, "sup_loss": 0.7617734319468721, "rf_loss": 0.0, "total_loss": 0.7617734319468721, "lyap1_mean": -0.16278308629989624, "lyap1_max": -0.11334371566772461, "frac_above_star": 0.0 }, { "step": 113, "sup_loss": 0.7429994084178121, "rf_loss": 0.0, "total_loss": 0.7429994084178121, "lyap1_mean": -0.14945060014724731, "lyap1_max": -0.03888426721096039, "frac_above_star": 0.0 }, { "step": 114, "sup_loss": 0.5267895653243198, "rf_loss": 0.0, "total_loss": 0.5267895653243198, "lyap1_mean": -0.19663462042808533, "lyap1_max": -0.12710979580879211, "frac_above_star": 0.0 }, { "step": 115, "sup_loss": 0.5565786392899637, "rf_loss": 0.0, "total_loss": 0.5565786392899637, "lyap1_mean": -0.13070335984230042, "lyap1_max": -0.03979885205626488, "frac_above_star": 0.0 }, { "step": 116, "sup_loss": 0.6669617407688825, "rf_loss": 0.0, "total_loss": 0.6669617407688825, "lyap1_mean": -0.14918240904808044, "lyap1_max": -0.10453256219625473, "frac_above_star": 0.0 }, { "step": 117, "sup_loss": 0.8919492397026759, "rf_loss": 0.0, "total_loss": 0.8919492397026759, "lyap1_mean": -0.1505049765110016, "lyap1_max": -0.07825712859630585, "frac_above_star": 0.0 }, { "step": 118, "sup_loss": 0.4710842552117467, "rf_loss": 0.0, "total_loss": 0.4710842552117467, "lyap1_mean": -0.15943017601966858, "lyap1_max": -0.09568998217582703, "frac_above_star": 0.0 }, { "step": 119, "sup_loss": 0.6251381927293124, "rf_loss": 0.0, "total_loss": 0.6251381927293124, "lyap1_mean": -0.14373569190502167, "lyap1_max": -0.06169363856315613, "frac_above_star": 0.0 }, { "step": 120, "sup_loss": 0.5066496812910415, "rf_loss": 0.0, "total_loss": 0.5066496812910415, "lyap1_mean": -0.1958259791135788, "lyap1_max": -0.1477712243795395, "frac_above_star": 0.0 }, { "step": 121, "sup_loss": 0.7547321366686087, "rf_loss": 0.00020556825620587915, "total_loss": 0.756787819143356, "lyap1_mean": -0.12657774984836578, "lyap1_max": 0.040553003549575806, "frac_above_star": 0.125 }, { "step": 122, "sup_loss": 0.7638001595410133, "rf_loss": 0.0, "total_loss": 0.7638001595410133, "lyap1_mean": -0.1522892415523529, "lyap1_max": -0.08786033093929291, "frac_above_star": 0.0 }, { "step": 123, "sup_loss": 0.7328743644942293, "rf_loss": 0.0, "total_loss": 0.7328743644942293, "lyap1_mean": -0.16936597228050232, "lyap1_max": -0.10127531737089157, "frac_above_star": 0.0 }, { "step": 124, "sup_loss": 0.8598762363137328, "rf_loss": 0.0, "total_loss": 0.8598762363137328, "lyap1_mean": -0.16397269070148468, "lyap1_max": -0.12449608743190765, "frac_above_star": 0.0 }, { "step": 125, "sup_loss": 0.6361224805438286, "rf_loss": 0.0, "total_loss": 0.6361224805438286, "lyap1_mean": -0.16441287100315094, "lyap1_max": -0.003912968095391989, "frac_above_star": 0.0 }, { "step": 126, "sup_loss": 0.5353405608963704, "rf_loss": 0.0, "total_loss": 0.5353405608963704, "lyap1_mean": -0.18839746713638306, "lyap1_max": -0.10522984713315964, "frac_above_star": 0.0 }, { "step": 127, "sup_loss": 0.48159890175980585, "rf_loss": 0.0, "total_loss": 0.48159890175980585, "lyap1_mean": -0.1902238428592682, "lyap1_max": -0.09681003540754318, "frac_above_star": 0.0 }, { "step": 128, "sup_loss": 0.4968575787194232, "rf_loss": 0.0, "total_loss": 0.4968575787194232, "lyap1_mean": -0.1681714802980423, "lyap1_max": -0.12721289694309235, "frac_above_star": 0.0 }, { "step": 129, "sup_loss": 0.49441572515794663, "rf_loss": 0.0, "total_loss": 0.49441572515794663, "lyap1_mean": -0.15709425508975983, "lyap1_max": -0.06226184964179993, "frac_above_star": 0.0 }, { "step": 130, "sup_loss": 0.6815041913818336, "rf_loss": 0.0, "total_loss": 0.6815041913818336, "lyap1_mean": -0.16429884731769562, "lyap1_max": -0.043527211993932724, "frac_above_star": 0.0 }, { "step": 131, "sup_loss": 0.4634879950259534, "rf_loss": 0.0, "total_loss": 0.4634879950259534, "lyap1_mean": -0.17791926860809326, "lyap1_max": -0.12318724393844604, "frac_above_star": 0.0 }, { "step": 132, "sup_loss": 0.6064607875869855, "rf_loss": 0.0, "total_loss": 0.6064607875869855, "lyap1_mean": -0.17092099785804749, "lyap1_max": -0.10002817958593369, "frac_above_star": 0.0 }, { "step": 133, "sup_loss": 0.6685585300948974, "rf_loss": 0.0, "total_loss": 0.6685585300948974, "lyap1_mean": -0.1789056658744812, "lyap1_max": -0.12728065252304077, "frac_above_star": 0.0 }, { "step": 134, "sup_loss": 0.5519405556303378, "rf_loss": 0.0, "total_loss": 0.5519405556303378, "lyap1_mean": -0.19462084770202637, "lyap1_max": -0.13060909509658813, "frac_above_star": 0.0 }, { "step": 135, "sup_loss": 0.7045589713840603, "rf_loss": 0.0, "total_loss": 0.7045589713840603, "lyap1_mean": -0.16444037854671478, "lyap1_max": -0.12477811425924301, "frac_above_star": 0.0 }, { "step": 136, "sup_loss": 0.7850105819752746, "rf_loss": 0.0, "total_loss": 0.7850105819752746, "lyap1_mean": -0.1737174093723297, "lyap1_max": -0.10541144013404846, "frac_above_star": 0.0 }, { "step": 137, "sup_loss": 0.7785755139098886, "rf_loss": 0.0, "total_loss": 0.7785755139098886, "lyap1_mean": -0.18544209003448486, "lyap1_max": -0.12326653301715851, "frac_above_star": 0.0 }, { "step": 138, "sup_loss": 0.5597011781455243, "rf_loss": 0.0, "total_loss": 0.5597011781455243, "lyap1_mean": -0.1937633454799652, "lyap1_max": -0.10527308285236359, "frac_above_star": 0.0 }, { "step": 139, "sup_loss": 0.6420759315860217, "rf_loss": 0.0, "total_loss": 0.6420759315860217, "lyap1_mean": -0.15952451527118683, "lyap1_max": -0.1008034199476242, "frac_above_star": 0.0 }, { "step": 140, "sup_loss": 0.8089228618042498, "rf_loss": 0.0, "total_loss": 0.8089228618042498, "lyap1_mean": -0.1759156882762909, "lyap1_max": -0.08576956391334534, "frac_above_star": 0.0 }, { "step": 141, "sup_loss": 0.812003107936831, "rf_loss": 0.0, "total_loss": 0.812003107936831, "lyap1_mean": -0.1607247292995453, "lyap1_max": -0.12249063700437546, "frac_above_star": 0.0 }, { "step": 142, "sup_loss": 0.4479740771091684, "rf_loss": 0.0, "total_loss": 0.4479740771091684, "lyap1_mean": -0.20000380277633667, "lyap1_max": -0.10555298626422882, "frac_above_star": 0.0 }, { "step": 143, "sup_loss": 0.5817672780196375, "rf_loss": 0.0, "total_loss": 0.5817672780196375, "lyap1_mean": -0.21298713982105255, "lyap1_max": -0.12004043906927109, "frac_above_star": 0.0 }, { "step": 144, "sup_loss": 0.8797154348488917, "rf_loss": 0.0, "total_loss": 0.8797154348488917, "lyap1_mean": -0.15399882197380066, "lyap1_max": -0.09458988904953003, "frac_above_star": 0.0 }, { "step": 145, "sup_loss": 0.7232432633885784, "rf_loss": 0.0, "total_loss": 0.7232432633885784, "lyap1_mean": -0.16347497701644897, "lyap1_max": -0.06838824599981308, "frac_above_star": 0.0 }, { "step": 146, "sup_loss": 0.6496779163352263, "rf_loss": 0.0, "total_loss": 0.6496779163352263, "lyap1_mean": -0.21644507348537445, "lyap1_max": -0.17353467643260956, "frac_above_star": 0.0 }, { "step": 147, "sup_loss": 0.5966363329780522, "rf_loss": 0.0, "total_loss": 0.5966363329780522, "lyap1_mean": -0.14191633462905884, "lyap1_max": -0.014518341980874538, "frac_above_star": 0.0 }, { "step": 148, "sup_loss": 0.7682823559945844, "rf_loss": 0.0, "total_loss": 0.7682823559945844, "lyap1_mean": -0.18606597185134888, "lyap1_max": -0.0672815665602684, "frac_above_star": 0.0 }, { "step": 149, "sup_loss": 0.48843997782688237, "rf_loss": 1.5960429664119147e-05, "total_loss": 0.48859958212716154, "lyap1_mean": -0.16264842450618744, "lyap1_max": 0.011299709789454937, "frac_above_star": 0.125 }, { "step": 150, "sup_loss": 0.5459912834235725, "rf_loss": 0.0, "total_loss": 0.5459912834235725, "lyap1_mean": -0.22184190154075623, "lyap1_max": -0.1826731562614441, "frac_above_star": 0.0 }, { "step": 151, "sup_loss": 0.5772671115429909, "rf_loss": 0.0, "total_loss": 0.5772671115429909, "lyap1_mean": -0.19352543354034424, "lyap1_max": -0.14144814014434814, "frac_above_star": 0.0 }, { "step": 152, "sup_loss": 0.6428379037491997, "rf_loss": 0.0, "total_loss": 0.6428379037491997, "lyap1_mean": -0.185125470161438, "lyap1_max": -0.13151797652244568, "frac_above_star": 0.0 }, { "step": 153, "sup_loss": 0.6925685108833266, "rf_loss": 0.0, "total_loss": 0.6925685108833266, "lyap1_mean": -0.16966179013252258, "lyap1_max": -0.10489576309919357, "frac_above_star": 0.0 }, { "step": 154, "sup_loss": 0.5983692706905355, "rf_loss": 0.0, "total_loss": 0.5983692706905355, "lyap1_mean": -0.15205121040344238, "lyap1_max": -0.024969544261693954, "frac_above_star": 0.0 }, { "step": 155, "sup_loss": 0.5316189453574188, "rf_loss": 0.0, "total_loss": 0.5316189453574188, "lyap1_mean": -0.18959608674049377, "lyap1_max": -0.12221087515354156, "frac_above_star": 0.0 }, { "step": 156, "sup_loss": 0.7406186095827086, "rf_loss": 0.0, "total_loss": 0.7406186095827086, "lyap1_mean": -0.1970748007297516, "lyap1_max": -0.1529281586408615, "frac_above_star": 0.0 }, { "step": 157, "sup_loss": 0.740008784172204, "rf_loss": 0.0, "total_loss": 0.740008784172204, "lyap1_mean": -0.1874978244304657, "lyap1_max": -0.14316855370998383, "frac_above_star": 0.0 }, { "step": 158, "sup_loss": 0.8327116138901606, "rf_loss": 0.0, "total_loss": 0.8327116138901606, "lyap1_mean": -0.16397586464881897, "lyap1_max": -0.12425532937049866, "frac_above_star": 0.0 }, { "step": 159, "sup_loss": 0.6326493237895445, "rf_loss": 0.0, "total_loss": 0.6326493237895445, "lyap1_mean": -0.2086288332939148, "lyap1_max": -0.10337858647108078, "frac_above_star": 0.0 }, { "step": 160, "sup_loss": 0.8025968103576084, "rf_loss": 0.0, "total_loss": 0.8025968103576084, "lyap1_mean": -0.15555360913276672, "lyap1_max": -0.11220382153987885, "frac_above_star": 0.0 }, { "step": 161, "sup_loss": 0.5347459026657402, "rf_loss": 0.0, "total_loss": 0.5347459026657402, "lyap1_mean": -0.191791832447052, "lyap1_max": -0.06744301319122314, "frac_above_star": 0.0 }, { "step": 162, "sup_loss": 0.5489169539931192, "rf_loss": 0.0, "total_loss": 0.5489169539931192, "lyap1_mean": -0.21898183226585388, "lyap1_max": -0.10425346344709396, "frac_above_star": 0.0 }, { "step": 163, "sup_loss": 0.6873355043020226, "rf_loss": 0.0, "total_loss": 0.6873355043020226, "lyap1_mean": -0.1897520124912262, "lyap1_max": -0.11232604086399078, "frac_above_star": 0.0 }, { "step": 164, "sup_loss": 0.5877940564883443, "rf_loss": 2.716142807912547e-05, "total_loss": 0.5880656707800495, "lyap1_mean": -0.1529943346977234, "lyap1_max": 0.014740807935595512, "frac_above_star": 0.125 }, { "step": 165, "sup_loss": 0.5680939563641257, "rf_loss": 0.0, "total_loss": 0.5680939563641257, "lyap1_mean": -0.19812071323394775, "lyap1_max": -0.1274873912334442, "frac_above_star": 0.0 }, { "step": 166, "sup_loss": 0.6364573033743302, "rf_loss": 0.0, "total_loss": 0.6364573033743302, "lyap1_mean": -0.17068974673748016, "lyap1_max": -0.08150409907102585, "frac_above_star": 0.0 }, { "step": 167, "sup_loss": 0.8229395469826807, "rf_loss": 0.0, "total_loss": 0.8229395469826807, "lyap1_mean": -0.16639558970928192, "lyap1_max": -0.08304523676633835, "frac_above_star": 0.0 }, { "step": 168, "sup_loss": 0.6654180807504827, "rf_loss": 0.0, "total_loss": 0.6654180807504827, "lyap1_mean": -0.19577012956142426, "lyap1_max": -0.13709217309951782, "frac_above_star": 0.0 }, { "step": 169, "sup_loss": 0.5607177853343124, "rf_loss": 0.0, "total_loss": 0.5607177853343124, "lyap1_mean": -0.20034848153591156, "lyap1_max": -0.12562024593353271, "frac_above_star": 0.0 }, { "step": 170, "sup_loss": 0.5051097297444527, "rf_loss": 0.0, "total_loss": 0.5051097297444527, "lyap1_mean": -0.23387402296066284, "lyap1_max": -0.1652885377407074, "frac_above_star": 0.0 }, { "step": 171, "sup_loss": 0.6527895366933933, "rf_loss": 0.0, "total_loss": 0.6527895366933933, "lyap1_mean": -0.16222573816776276, "lyap1_max": -0.07033611834049225, "frac_above_star": 0.0 }, { "step": 172, "sup_loss": 0.6014942054393526, "rf_loss": 0.0, "total_loss": 0.6014942054393526, "lyap1_mean": -0.17703285813331604, "lyap1_max": -0.12114321440458298, "frac_above_star": 0.0 }, { "step": 173, "sup_loss": 0.4851730399211569, "rf_loss": 0.0, "total_loss": 0.4851730399211569, "lyap1_mean": -0.19343218207359314, "lyap1_max": -0.1578855812549591, "frac_above_star": 0.0 }, { "step": 174, "sup_loss": 0.7279731731996669, "rf_loss": 0.0, "total_loss": 0.7279731731996669, "lyap1_mean": -0.18288783729076385, "lyap1_max": -0.09210478514432907, "frac_above_star": 0.0 }, { "step": 175, "sup_loss": 0.6187028876696454, "rf_loss": 0.0, "total_loss": 0.6187028876696454, "lyap1_mean": -0.18516868352890015, "lyap1_max": -0.12050573527812958, "frac_above_star": 0.0 }, { "step": 176, "sup_loss": 0.6365063295099235, "rf_loss": 0.0, "total_loss": 0.6365063295099235, "lyap1_mean": -0.1625199317932129, "lyap1_max": -0.08603774756193161, "frac_above_star": 0.0 }, { "step": 177, "sup_loss": 0.6256958261469656, "rf_loss": 0.0, "total_loss": 0.6256958261469656, "lyap1_mean": -0.17851519584655762, "lyap1_max": -0.09873935580253601, "frac_above_star": 0.0 }, { "step": 178, "sup_loss": 0.5806311870145986, "rf_loss": 0.0, "total_loss": 0.5806311870145986, "lyap1_mean": -0.1954081952571869, "lyap1_max": -0.1280255764722824, "frac_above_star": 0.0 }, { "step": 179, "sup_loss": 0.5270597892799554, "rf_loss": 0.0, "total_loss": 0.5270597892799554, "lyap1_mean": -0.18695306777954102, "lyap1_max": -0.1367555558681488, "frac_above_star": 0.0 }, { "step": 180, "sup_loss": 0.6557933962968071, "rf_loss": 0.0, "total_loss": 0.6557933962968071, "lyap1_mean": -0.15144571661949158, "lyap1_max": -0.0006251583690755069, "frac_above_star": 0.0 }, { "step": 181, "sup_loss": 0.4872700727079539, "rf_loss": 0.0, "total_loss": 0.4872700727079539, "lyap1_mean": -0.19529838860034943, "lyap1_max": -0.10506512224674225, "frac_above_star": 0.0 }, { "step": 182, "sup_loss": 0.7107089730249458, "rf_loss": 0.0, "total_loss": 0.7107089730249458, "lyap1_mean": -0.1818455308675766, "lyap1_max": -0.0915827751159668, "frac_above_star": 0.0 }, { "step": 183, "sup_loss": 0.6665424230109457, "rf_loss": 0.0, "total_loss": 0.6665424230109457, "lyap1_mean": -0.14988598227500916, "lyap1_max": -0.047298088669776917, "frac_above_star": 0.0 }, { "step": 184, "sup_loss": 0.42477363804588014, "rf_loss": 0.0, "total_loss": 0.42477363804588014, "lyap1_mean": -0.19928254187107086, "lyap1_max": -0.10007524490356445, "frac_above_star": 0.0 }, { "step": 185, "sup_loss": 0.4400530182674368, "rf_loss": 0.0, "total_loss": 0.4400530182674368, "lyap1_mean": -0.24661582708358765, "lyap1_max": -0.13337385654449463, "frac_above_star": 0.0 }, { "step": 186, "sup_loss": 0.5655318222239646, "rf_loss": 0.0, "total_loss": 0.5655318222239646, "lyap1_mean": -0.21137735247612, "lyap1_max": -0.090215764939785, "frac_above_star": 0.0 }, { "step": 187, "sup_loss": 0.5940940517381357, "rf_loss": 0.0, "total_loss": 0.5940940517381357, "lyap1_mean": -0.2127700001001358, "lyap1_max": -0.1477786749601364, "frac_above_star": 0.0 }, { "step": 188, "sup_loss": 0.8349321059445795, "rf_loss": 0.0, "total_loss": 0.8349321059445795, "lyap1_mean": -0.18069881200790405, "lyap1_max": -0.07421427220106125, "frac_above_star": 0.0 }, { "step": 189, "sup_loss": 0.8133786059327817, "rf_loss": 0.0, "total_loss": 0.8133786059327817, "lyap1_mean": -0.17181959748268127, "lyap1_max": -0.08487120270729065, "frac_above_star": 0.0 }, { "step": 190, "sup_loss": 0.7492684792000334, "rf_loss": 0.0, "total_loss": 0.7492684792000334, "lyap1_mean": -0.18165580928325653, "lyap1_max": -0.13193684816360474, "frac_above_star": 0.0 }, { "step": 191, "sup_loss": 0.653471886033279, "rf_loss": 0.0, "total_loss": 0.653471886033279, "lyap1_mean": -0.207014262676239, "lyap1_max": -0.15826547145843506, "frac_above_star": 0.0 }, { "step": 192, "sup_loss": 0.6365917194389581, "rf_loss": 0.0, "total_loss": 0.6365917194389581, "lyap1_mean": -0.1842191368341446, "lyap1_max": -0.1245940625667572, "frac_above_star": 0.0 }, { "step": 193, "sup_loss": 0.3998859013518479, "rf_loss": 0.0, "total_loss": 0.3998859013518479, "lyap1_mean": -0.22119861841201782, "lyap1_max": -0.07545958459377289, "frac_above_star": 0.0 }, { "step": 194, "sup_loss": 0.9082165094710438, "rf_loss": 0.0, "total_loss": 0.9082165094710438, "lyap1_mean": -0.16745831072330475, "lyap1_max": -0.11147600412368774, "frac_above_star": 0.0 }, { "step": 195, "sup_loss": 0.5050288870021935, "rf_loss": 0.0, "total_loss": 0.5050288870021935, "lyap1_mean": -0.19249188899993896, "lyap1_max": -0.1021115630865097, "frac_above_star": 0.0 }, { "step": 196, "sup_loss": 0.7532891542466421, "rf_loss": 0.0, "total_loss": 0.7532891542466421, "lyap1_mean": -0.18400734663009644, "lyap1_max": -0.12134106457233429, "frac_above_star": 0.0 }, { "step": 197, "sup_loss": 0.5423722096756773, "rf_loss": 0.0, "total_loss": 0.5423722096756773, "lyap1_mean": -0.20725812017917633, "lyap1_max": -0.08085224032402039, "frac_above_star": 0.0 }, { "step": 198, "sup_loss": 0.6009423979331727, "rf_loss": 0.0, "total_loss": 0.6009423979331727, "lyap1_mean": -0.20202291011810303, "lyap1_max": -0.1659374088048935, "frac_above_star": 0.0 }, { "step": 199, "sup_loss": 0.6208669925243495, "rf_loss": 0.0, "total_loss": 0.6208669925243495, "lyap1_mean": -0.17080381512641907, "lyap1_max": -0.07606574147939682, "frac_above_star": 0.0 }, { "step": 200, "sup_loss": 0.7711118706752605, "rf_loss": 0.0, "total_loss": 0.7711118706752605, "lyap1_mean": -0.14533007144927979, "lyap1_max": -0.08939565718173981, "frac_above_star": 0.0 }, { "step": 201, "sup_loss": 0.5762177239052891, "rf_loss": 0.0, "total_loss": 0.5762177239052891, "lyap1_mean": -0.17492035031318665, "lyap1_max": -0.12838837504386902, "frac_above_star": 0.0 }, { "step": 202, "sup_loss": 0.6769118850558024, "rf_loss": 0.0, "total_loss": 0.6769118850558024, "lyap1_mean": -0.19990310072898865, "lyap1_max": -0.10189828276634216, "frac_above_star": 0.0 }, { "step": 203, "sup_loss": 0.5895279495276788, "rf_loss": 0.0, "total_loss": 0.5895279495276788, "lyap1_mean": -0.20022916793823242, "lyap1_max": -0.1344572752714157, "frac_above_star": 0.0 }, { "step": 204, "sup_loss": 0.8413389971542649, "rf_loss": 0.0, "total_loss": 0.8413389971542649, "lyap1_mean": -0.17662313580513, "lyap1_max": -0.14446687698364258, "frac_above_star": 0.0 }, { "step": 205, "sup_loss": 0.6971975637493174, "rf_loss": 0.0, "total_loss": 0.6971975637493174, "lyap1_mean": -0.18620674312114716, "lyap1_max": -0.09516873210668564, "frac_above_star": 0.0 }, { "step": 206, "sup_loss": 0.6168185277758008, "rf_loss": 0.0, "total_loss": 0.6168185277758008, "lyap1_mean": -0.1898498833179474, "lyap1_max": -0.13361531496047974, "frac_above_star": 0.0 }, { "step": 207, "sup_loss": 0.8334405972811936, "rf_loss": 0.0, "total_loss": 0.8334405972811936, "lyap1_mean": -0.1740899682044983, "lyap1_max": -0.13845941424369812, "frac_above_star": 0.0 }, { "step": 208, "sup_loss": 0.6794604026457728, "rf_loss": 0.0, "total_loss": 0.6794604026457728, "lyap1_mean": -0.19401413202285767, "lyap1_max": -0.08722114562988281, "frac_above_star": 0.0 }, { "step": 209, "sup_loss": 0.6279444522621701, "rf_loss": 0.0, "total_loss": 0.6279444522621701, "lyap1_mean": -0.18119296431541443, "lyap1_max": -0.13031037151813507, "frac_above_star": 0.0 }, { "step": 210, "sup_loss": 0.6619698307989045, "rf_loss": 0.0, "total_loss": 0.6619698307989045, "lyap1_mean": -0.18808089196681976, "lyap1_max": -0.11215493083000183, "frac_above_star": 0.0 }, { "step": 211, "sup_loss": 0.512477945878355, "rf_loss": 0.0, "total_loss": 0.512477945878355, "lyap1_mean": -0.15431645512580872, "lyap1_max": -0.09080630540847778, "frac_above_star": 0.0 }, { "step": 212, "sup_loss": 0.7928889644907863, "rf_loss": 0.0, "total_loss": 0.7928889644907863, "lyap1_mean": -0.17847202718257904, "lyap1_max": -0.14659258723258972, "frac_above_star": 0.0 }, { "step": 213, "sup_loss": 0.598170388345071, "rf_loss": 0.0, "total_loss": 0.598170388345071, "lyap1_mean": -0.16671538352966309, "lyap1_max": -0.10012146085500717, "frac_above_star": 0.0 }, { "step": 214, "sup_loss": 0.7217380637282729, "rf_loss": 0.0, "total_loss": 0.7217380637282729, "lyap1_mean": -0.18659745156764984, "lyap1_max": -0.1233309656381607, "frac_above_star": 0.0 }, { "step": 215, "sup_loss": 0.5275838028388544, "rf_loss": 0.0, "total_loss": 0.5275838028388544, "lyap1_mean": -0.2107745110988617, "lyap1_max": -0.059159304946660995, "frac_above_star": 0.0 }, { "step": 216, "sup_loss": 0.5180137231573532, "rf_loss": 0.0, "total_loss": 0.5180137231573532, "lyap1_mean": -0.19923685491085052, "lyap1_max": -0.09573506563901901, "frac_above_star": 0.0 }, { "step": 217, "sup_loss": 0.7317760561607882, "rf_loss": 0.0, "total_loss": 0.7317760561607882, "lyap1_mean": -0.20531103014945984, "lyap1_max": -0.09016452729701996, "frac_above_star": 0.0 }, { "step": 218, "sup_loss": 0.3863822380717161, "rf_loss": 0.0, "total_loss": 0.3863822380717161, "lyap1_mean": -0.21770527958869934, "lyap1_max": -0.12124085426330566, "frac_above_star": 0.0 }, { "step": 219, "sup_loss": 0.6413152317866546, "rf_loss": 0.0, "total_loss": 0.6413152317866546, "lyap1_mean": -0.20588578283786774, "lyap1_max": -0.15815992653369904, "frac_above_star": 0.0 }, { "step": 220, "sup_loss": 0.5846004287927397, "rf_loss": 0.0, "total_loss": 0.5846004287927397, "lyap1_mean": -0.20143575966358185, "lyap1_max": -0.1717517375946045, "frac_above_star": 0.0 }, { "step": 221, "sup_loss": 0.5746991259974432, "rf_loss": 0.0, "total_loss": 0.5746991259974432, "lyap1_mean": -0.18192094564437866, "lyap1_max": -0.11587512493133545, "frac_above_star": 0.0 }, { "step": 222, "sup_loss": 0.7416600634919821, "rf_loss": 0.0, "total_loss": 0.7416600634919821, "lyap1_mean": -0.18745210766792297, "lyap1_max": -0.019930556416511536, "frac_above_star": 0.0 }, { "step": 223, "sup_loss": 0.6789613428250972, "rf_loss": 0.0, "total_loss": 0.6789613428250972, "lyap1_mean": -0.18654628098011017, "lyap1_max": -0.13545271754264832, "frac_above_star": 0.0 }, { "step": 224, "sup_loss": 0.4988223204287827, "rf_loss": 0.0, "total_loss": 0.4988223204287827, "lyap1_mean": -0.23297467827796936, "lyap1_max": -0.1591380089521408, "frac_above_star": 0.0 }, { "step": 225, "sup_loss": 0.574541263506592, "rf_loss": 0.0, "total_loss": 0.574541263506592, "lyap1_mean": -0.18594717979431152, "lyap1_max": -0.14040428400039673, "frac_above_star": 0.0 }, { "step": 226, "sup_loss": 0.6748131213675786, "rf_loss": 0.0, "total_loss": 0.6748131213675786, "lyap1_mean": -0.1859448254108429, "lyap1_max": -0.07669638097286224, "frac_above_star": 0.0 }, { "step": 227, "sup_loss": 0.7823256893117815, "rf_loss": 0.0, "total_loss": 0.7823256893117815, "lyap1_mean": -0.14126835763454437, "lyap1_max": -0.09209351241588593, "frac_above_star": 0.0 }, { "step": 228, "sup_loss": 0.7013193251398889, "rf_loss": 0.0, "total_loss": 0.7013193251398889, "lyap1_mean": -0.18973864614963531, "lyap1_max": -0.0867653489112854, "frac_above_star": 0.0 }, { "step": 229, "sup_loss": 0.5615674164555056, "rf_loss": 0.0, "total_loss": 0.5615674164555056, "lyap1_mean": -0.14694306254386902, "lyap1_max": -0.09908362478017807, "frac_above_star": 0.0 }, { "step": 230, "sup_loss": 0.5484360184865077, "rf_loss": 0.0, "total_loss": 0.5484360184865077, "lyap1_mean": -0.21054330468177795, "lyap1_max": -0.12875021994113922, "frac_above_star": 0.0 }, { "step": 231, "sup_loss": 0.5851770889212125, "rf_loss": 0.0, "total_loss": 0.5851770889212125, "lyap1_mean": -0.20899872481822968, "lyap1_max": -0.15053240954875946, "frac_above_star": 0.0 }, { "step": 232, "sup_loss": 0.45230500280638913, "rf_loss": 0.0, "total_loss": 0.45230500280638913, "lyap1_mean": -0.22442898154258728, "lyap1_max": -0.09790579974651337, "frac_above_star": 0.0 }, { "step": 233, "sup_loss": 0.5835474683251404, "rf_loss": 0.0, "total_loss": 0.5835474683251404, "lyap1_mean": -0.1932036131620407, "lyap1_max": -0.14970991015434265, "frac_above_star": 0.0 }, { "step": 234, "sup_loss": 0.8071970599948786, "rf_loss": 0.0, "total_loss": 0.8071970599948786, "lyap1_mean": -0.15869629383087158, "lyap1_max": -0.1133202314376831, "frac_above_star": 0.0 }, { "step": 235, "sup_loss": 0.5737930265636231, "rf_loss": 0.0, "total_loss": 0.5737930265636231, "lyap1_mean": -0.20969268679618835, "lyap1_max": -0.13586506247520447, "frac_above_star": 0.0 }, { "step": 236, "sup_loss": 0.6797859560260143, "rf_loss": 0.0, "total_loss": 0.6797859560260143, "lyap1_mean": -0.1847599446773529, "lyap1_max": -0.10684444010257721, "frac_above_star": 0.0 }, { "step": 237, "sup_loss": 0.7282897959051738, "rf_loss": 0.0, "total_loss": 0.7282897959051738, "lyap1_mean": -0.18843069672584534, "lyap1_max": -0.12965653836727142, "frac_above_star": 0.0 }, { "step": 238, "sup_loss": 0.7000614513045897, "rf_loss": 0.0, "total_loss": 0.7000614513045897, "lyap1_mean": -0.16323968768119812, "lyap1_max": -0.07210776209831238, "frac_above_star": 0.0 }, { "step": 239, "sup_loss": 0.5864120027934195, "rf_loss": 0.0, "total_loss": 0.5864120027934195, "lyap1_mean": -0.22082579135894775, "lyap1_max": -0.12202437222003937, "frac_above_star": 0.0 }, { "step": 240, "sup_loss": 0.6084040924732792, "rf_loss": 0.0, "total_loss": 0.6084040924732792, "lyap1_mean": -0.18410786986351013, "lyap1_max": -0.06253083050251007, "frac_above_star": 0.0 }, { "step": 241, "sup_loss": 0.8345470026973849, "rf_loss": 0.0, "total_loss": 0.8345470026973849, "lyap1_mean": -0.1579337865114212, "lyap1_max": -0.0272408127784729, "frac_above_star": 0.0 }, { "step": 242, "sup_loss": 0.5713998515157955, "rf_loss": 0.0, "total_loss": 0.5713998515157955, "lyap1_mean": -0.20360364019870758, "lyap1_max": -0.1592111438512802, "frac_above_star": 0.0 }, { "step": 243, "sup_loss": 0.6096693606430007, "rf_loss": 0.0, "total_loss": 0.6096693606430007, "lyap1_mean": -0.23549193143844604, "lyap1_max": -0.10957565903663635, "frac_above_star": 0.0 }, { "step": 244, "sup_loss": 0.7045783256782954, "rf_loss": 0.0, "total_loss": 0.7045783256782954, "lyap1_mean": -0.1997494399547577, "lyap1_max": -0.1633760780096054, "frac_above_star": 0.0 }, { "step": 245, "sup_loss": 0.5955321525404883, "rf_loss": 0.0, "total_loss": 0.5955321525404883, "lyap1_mean": -0.19693619012832642, "lyap1_max": -0.1459246575832367, "frac_above_star": 0.0 }, { "step": 246, "sup_loss": 0.6555734113077835, "rf_loss": 0.0, "total_loss": 0.6555734113077835, "lyap1_mean": -0.15803244709968567, "lyap1_max": -0.11777400970458984, "frac_above_star": 0.0 }, { "step": 247, "sup_loss": 0.4212589613938469, "rf_loss": 0.0, "total_loss": 0.4212589613938469, "lyap1_mean": -0.22008013725280762, "lyap1_max": -0.10012718290090561, "frac_above_star": 0.0 }, { "step": 248, "sup_loss": 0.5574121042032574, "rf_loss": 0.0, "total_loss": 0.5574121042032574, "lyap1_mean": -0.205031156539917, "lyap1_max": -0.15290270745754242, "frac_above_star": 0.0 }, { "step": 249, "sup_loss": 0.4552264284790628, "rf_loss": 0.0, "total_loss": 0.4552264284790628, "lyap1_mean": -0.20807483792304993, "lyap1_max": -0.10412444174289703, "frac_above_star": 0.0 }, { "step": 250, "sup_loss": 0.7576068427695233, "rf_loss": 0.0, "total_loss": 0.7576068427695233, "lyap1_mean": -0.21729722619056702, "lyap1_max": -0.12487022578716278, "frac_above_star": 0.0 }, { "step": 251, "sup_loss": 0.532847456197343, "rf_loss": 0.0, "total_loss": 0.532847456197343, "lyap1_mean": -0.2087923139333725, "lyap1_max": -0.11960875242948532, "frac_above_star": 0.0 }, { "step": 252, "sup_loss": 0.6851119009106368, "rf_loss": 0.0, "total_loss": 0.6851119009106368, "lyap1_mean": -0.16274216771125793, "lyap1_max": -0.10698308795690536, "frac_above_star": 0.0 }, { "step": 253, "sup_loss": 0.7244790598951485, "rf_loss": 0.0, "total_loss": 0.7244790598951485, "lyap1_mean": -0.184770405292511, "lyap1_max": -0.1252956986427307, "frac_above_star": 0.0 }, { "step": 254, "sup_loss": 0.5157174592139232, "rf_loss": 0.0, "total_loss": 0.5157174592139232, "lyap1_mean": -0.1887914389371872, "lyap1_max": -0.046691589057445526, "frac_above_star": 0.0 }, { "step": 255, "sup_loss": 0.6431732934645851, "rf_loss": 0.0, "total_loss": 0.6431732934645851, "lyap1_mean": -0.2084350734949112, "lyap1_max": -0.13359272480010986, "frac_above_star": 0.0 }, { "step": 256, "sup_loss": 0.3815739160467118, "rf_loss": 0.0, "total_loss": 0.3815739160467118, "lyap1_mean": -0.23863281309604645, "lyap1_max": -0.19798544049263, "frac_above_star": 0.0 }, { "step": 257, "sup_loss": 0.5269504779699585, "rf_loss": 0.0, "total_loss": 0.5269504779699585, "lyap1_mean": -0.2032645344734192, "lyap1_max": -0.10239192843437195, "frac_above_star": 0.0 }, { "step": 258, "sup_loss": 0.6118227850962039, "rf_loss": 0.0, "total_loss": 0.6118227850962039, "lyap1_mean": -0.19699692726135254, "lyap1_max": -0.10368481278419495, "frac_above_star": 0.0 }, { "step": 259, "sup_loss": 0.7165804062400436, "rf_loss": 0.0, "total_loss": 0.7165804062400436, "lyap1_mean": -0.20380517840385437, "lyap1_max": -0.06294184923171997, "frac_above_star": 0.0 }, { "step": 260, "sup_loss": 0.7420857004943276, "rf_loss": 0.0, "total_loss": 0.7420857004943276, "lyap1_mean": -0.1792520433664322, "lyap1_max": -0.08090441673994064, "frac_above_star": 0.0 }, { "step": 261, "sup_loss": 0.5912472370406531, "rf_loss": 0.0, "total_loss": 0.5912472370406531, "lyap1_mean": -0.2358292043209076, "lyap1_max": -0.1645435094833374, "frac_above_star": 0.0 }, { "step": 262, "sup_loss": 0.6189042462634529, "rf_loss": 0.0, "total_loss": 0.6189042462634529, "lyap1_mean": -0.17791533470153809, "lyap1_max": -0.05249137803912163, "frac_above_star": 0.0 }, { "step": 263, "sup_loss": 0.5000213322221764, "rf_loss": 0.0, "total_loss": 0.5000213322221764, "lyap1_mean": -0.20615559816360474, "lyap1_max": -0.1445314884185791, "frac_above_star": 0.0 }, { "step": 264, "sup_loss": 0.5718912173300827, "rf_loss": 0.0, "total_loss": 0.5718912173300827, "lyap1_mean": -0.18680906295776367, "lyap1_max": -0.0035286422353237867, "frac_above_star": 0.0 }, { "step": 265, "sup_loss": 0.7623782636858654, "rf_loss": 0.0, "total_loss": 0.7623782636858654, "lyap1_mean": -0.20019195973873138, "lyap1_max": -0.12598471343517303, "frac_above_star": 0.0 }, { "step": 266, "sup_loss": 0.5513525667452733, "rf_loss": 0.0, "total_loss": 0.5513525667452733, "lyap1_mean": -0.21320241689682007, "lyap1_max": -0.107155442237854, "frac_above_star": 0.0 }, { "step": 267, "sup_loss": 0.6298618723007406, "rf_loss": 0.0, "total_loss": 0.6298618723007406, "lyap1_mean": -0.15993478894233704, "lyap1_max": -0.05761319398880005, "frac_above_star": 0.0 }, { "step": 268, "sup_loss": 0.6471992436510657, "rf_loss": 0.0, "total_loss": 0.6471992436510657, "lyap1_mean": -0.211825892329216, "lyap1_max": -0.11933913081884384, "frac_above_star": 0.0 }, { "step": 269, "sup_loss": 0.6184704835147438, "rf_loss": 0.0, "total_loss": 0.6184704835147438, "lyap1_mean": -0.21122729778289795, "lyap1_max": -0.13626499474048615, "frac_above_star": 0.0 }, { "step": 270, "sup_loss": 0.7248206950062472, "rf_loss": 0.0, "total_loss": 0.7248206950062472, "lyap1_mean": -0.17642372846603394, "lyap1_max": -0.05269160121679306, "frac_above_star": 0.0 }, { "step": 271, "sup_loss": 0.4948518952343299, "rf_loss": 0.0, "total_loss": 0.4948518952343299, "lyap1_mean": -0.21097183227539062, "lyap1_max": -0.13665908575057983, "frac_above_star": 0.0 }, { "step": 272, "sup_loss": 0.717207941675246, "rf_loss": 0.0, "total_loss": 0.717207941675246, "lyap1_mean": -0.18877747654914856, "lyap1_max": -0.09135892987251282, "frac_above_star": 0.0 }, { "step": 273, "sup_loss": 0.4680622361949261, "rf_loss": 0.0, "total_loss": 0.4680622361949261, "lyap1_mean": -0.23423555493354797, "lyap1_max": -0.1593630164861679, "frac_above_star": 0.0 }, { "step": 274, "sup_loss": 0.7061199682754703, "rf_loss": 0.0, "total_loss": 0.7061199682754703, "lyap1_mean": -0.16886195540428162, "lyap1_max": -0.04170934855937958, "frac_above_star": 0.0 }, { "step": 275, "sup_loss": 0.655936375007585, "rf_loss": 0.0, "total_loss": 0.655936375007585, "lyap1_mean": -0.18335115909576416, "lyap1_max": -0.07446620613336563, "frac_above_star": 0.0 }, { "step": 276, "sup_loss": 0.5528033893323819, "rf_loss": 0.0, "total_loss": 0.5528033893323819, "lyap1_mean": -0.20333799719810486, "lyap1_max": -0.07793614268302917, "frac_above_star": 0.0 }, { "step": 277, "sup_loss": 0.511118571548442, "rf_loss": 0.0, "total_loss": 0.511118571548442, "lyap1_mean": -0.20717228949069977, "lyap1_max": -0.10768254846334457, "frac_above_star": 0.0 }, { "step": 278, "sup_loss": 0.6022763329684696, "rf_loss": 0.0, "total_loss": 0.6022763329684696, "lyap1_mean": -0.20858202874660492, "lyap1_max": -0.15471795201301575, "frac_above_star": 0.0 }, { "step": 279, "sup_loss": 0.6633374422521987, "rf_loss": 0.0, "total_loss": 0.6633374422521987, "lyap1_mean": -0.19902168214321136, "lyap1_max": -0.12896686792373657, "frac_above_star": 0.0 }, { "step": 280, "sup_loss": 0.8485106758972668, "rf_loss": 0.0, "total_loss": 0.8485106758972668, "lyap1_mean": -0.21111896634101868, "lyap1_max": -0.1639191061258316, "frac_above_star": 0.0 }, { "step": 281, "sup_loss": 0.5994228533188966, "rf_loss": 0.0, "total_loss": 0.5994228533188966, "lyap1_mean": -0.18312054872512817, "lyap1_max": -0.08309488743543625, "frac_above_star": 0.0 }, { "step": 282, "sup_loss": 0.4694115031400887, "rf_loss": 0.0, "total_loss": 0.4694115031400887, "lyap1_mean": -0.22399678826332092, "lyap1_max": -0.13577349483966827, "frac_above_star": 0.0 }, { "step": 283, "sup_loss": 0.6489331946807275, "rf_loss": 0.0, "total_loss": 0.6489331946807275, "lyap1_mean": -0.19033457338809967, "lyap1_max": -0.053469449281692505, "frac_above_star": 0.0 }, { "step": 284, "sup_loss": 0.7779979402883872, "rf_loss": 0.0, "total_loss": 0.7779979402883872, "lyap1_mean": -0.1697358638048172, "lyap1_max": -0.04647897928953171, "frac_above_star": 0.0 }, { "step": 285, "sup_loss": 0.5872561791719259, "rf_loss": 0.0, "total_loss": 0.5872561791719259, "lyap1_mean": -0.2095394730567932, "lyap1_max": -0.12189950793981552, "frac_above_star": 0.0 }, { "step": 286, "sup_loss": 0.4596701827103055, "rf_loss": 0.0, "total_loss": 0.4596701827103055, "lyap1_mean": -0.21175679564476013, "lyap1_max": -0.13707782328128815, "frac_above_star": 0.0 }, { "step": 287, "sup_loss": 0.8738979158492989, "rf_loss": 0.0, "total_loss": 0.8738979158492989, "lyap1_mean": -0.17131701111793518, "lyap1_max": -0.09467896819114685, "frac_above_star": 0.0 }, { "step": 288, "sup_loss": 0.7156924309934743, "rf_loss": 0.0, "total_loss": 0.7156924309934743, "lyap1_mean": -0.17758658528327942, "lyap1_max": -0.0936880111694336, "frac_above_star": 0.0 }, { "step": 289, "sup_loss": 0.6791981876851153, "rf_loss": 0.0, "total_loss": 0.6791981876851153, "lyap1_mean": -0.2065422683954239, "lyap1_max": -0.15270066261291504, "frac_above_star": 0.0 }, { "step": 290, "sup_loss": 0.6609259419074645, "rf_loss": 0.0, "total_loss": 0.6609259419074645, "lyap1_mean": -0.1596880555152893, "lyap1_max": -0.10381035506725311, "frac_above_star": 0.0 }, { "step": 291, "sup_loss": 0.6231714585601352, "rf_loss": 0.0, "total_loss": 0.6231714585601352, "lyap1_mean": -0.19707456231117249, "lyap1_max": -0.08881165832281113, "frac_above_star": 0.0 }, { "step": 292, "sup_loss": 0.6311314456054539, "rf_loss": 0.0, "total_loss": 0.6311314456054539, "lyap1_mean": -0.20047904551029205, "lyap1_max": -0.1404634416103363, "frac_above_star": 0.0 }, { "step": 293, "sup_loss": 0.5047424042408466, "rf_loss": 0.0, "total_loss": 0.5047424042408466, "lyap1_mean": -0.18673208355903625, "lyap1_max": -0.061900749802589417, "frac_above_star": 0.0 }, { "step": 294, "sup_loss": 0.5642462522138321, "rf_loss": 0.0, "total_loss": 0.5642462522138321, "lyap1_mean": -0.20698975026607513, "lyap1_max": -0.13737426698207855, "frac_above_star": 0.0 }, { "step": 295, "sup_loss": 0.3357777552347809, "rf_loss": 0.0, "total_loss": 0.3357777552347809, "lyap1_mean": -0.21511167287826538, "lyap1_max": -0.15001313388347626, "frac_above_star": 0.0 }, { "step": 296, "sup_loss": 0.7820351549654857, "rf_loss": 0.0, "total_loss": 0.7820351549654857, "lyap1_mean": -0.18001598119735718, "lyap1_max": -0.10143452882766724, "frac_above_star": 0.0 }, { "step": 297, "sup_loss": 0.5676022553317746, "rf_loss": 0.0, "total_loss": 0.5676022553317746, "lyap1_mean": -0.1430688202381134, "lyap1_max": -0.06571389734745026, "frac_above_star": 0.0 }, { "step": 298, "sup_loss": 0.5164999257245955, "rf_loss": 0.0, "total_loss": 0.5164999257245955, "lyap1_mean": -0.22075599431991577, "lyap1_max": -0.16197937726974487, "frac_above_star": 0.0 }, { "step": 299, "sup_loss": 0.43465535142057543, "rf_loss": 0.0, "total_loss": 0.43465535142057543, "lyap1_mean": -0.21162354946136475, "lyap1_max": -0.14653265476226807, "frac_above_star": 0.0 }, { "step": 300, "sup_loss": 0.4999927892004426, "rf_loss": 0.0, "total_loss": 0.4999927892004426, "lyap1_mean": -0.21222880482673645, "lyap1_max": -0.13471344113349915, "frac_above_star": 0.0 }, { "step": 301, "sup_loss": 0.6419136781051095, "rf_loss": 0.0, "total_loss": 0.6419136781051095, "lyap1_mean": -0.21842646598815918, "lyap1_max": -0.14819541573524475, "frac_above_star": 0.0 }, { "step": 302, "sup_loss": 0.7184835675517953, "rf_loss": 0.0, "total_loss": 0.7184835675517953, "lyap1_mean": -0.19375571608543396, "lyap1_max": -0.14576612412929535, "frac_above_star": 0.0 }, { "step": 303, "sup_loss": 0.6668186092587706, "rf_loss": 0.0, "total_loss": 0.6668186092587706, "lyap1_mean": -0.1563647985458374, "lyap1_max": -0.09767866134643555, "frac_above_star": 0.0 }, { "step": 304, "sup_loss": 0.5886426428198844, "rf_loss": 0.0, "total_loss": 0.5886426428198844, "lyap1_mean": -0.1869887113571167, "lyap1_max": -0.11474504321813583, "frac_above_star": 0.0 }, { "step": 305, "sup_loss": 0.5819470605860133, "rf_loss": 0.0, "total_loss": 0.5819470605860133, "lyap1_mean": -0.18046294152736664, "lyap1_max": -0.10532092303037643, "frac_above_star": 0.0 }, { "step": 306, "sup_loss": 0.6685692275108768, "rf_loss": 0.0, "total_loss": 0.6685692275108768, "lyap1_mean": -0.16952255368232727, "lyap1_max": -0.07361996918916702, "frac_above_star": 0.0 }, { "step": 307, "sup_loss": 0.6560717224491739, "rf_loss": 0.0, "total_loss": 0.6560717224491739, "lyap1_mean": -0.21112211048603058, "lyap1_max": -0.09937465190887451, "frac_above_star": 0.0 }, { "step": 308, "sup_loss": 0.4186001999349876, "rf_loss": 0.0, "total_loss": 0.4186001999349876, "lyap1_mean": -0.22547774016857147, "lyap1_max": -0.14976739883422852, "frac_above_star": 0.0 }, { "step": 309, "sup_loss": 0.6776406281541831, "rf_loss": 0.0, "total_loss": 0.6776406281541831, "lyap1_mean": -0.1833326518535614, "lyap1_max": -0.10521209239959717, "frac_above_star": 0.0 }, { "step": 310, "sup_loss": 0.40551002016333226, "rf_loss": 0.0, "total_loss": 0.40551002016333226, "lyap1_mean": -0.23695823550224304, "lyap1_max": -0.09792619198560715, "frac_above_star": 0.0 }, { "step": 311, "sup_loss": 0.6892406996954383, "rf_loss": 0.0, "total_loss": 0.6892406996954383, "lyap1_mean": -0.2016395926475525, "lyap1_max": -0.09467709064483643, "frac_above_star": 0.0 }, { "step": 312, "sup_loss": 0.5877242276417233, "rf_loss": 0.0, "total_loss": 0.5877242276417233, "lyap1_mean": -0.20739957690238953, "lyap1_max": -0.06636649370193481, "frac_above_star": 0.0 }, { "step": 313, "sup_loss": 0.5430511934957004, "rf_loss": 0.0, "total_loss": 0.5430511934957004, "lyap1_mean": -0.21065844595432281, "lyap1_max": -0.13060283660888672, "frac_above_star": 0.0 }, { "step": 314, "sup_loss": 0.8803535795084014, "rf_loss": 0.0, "total_loss": 0.8803535795084014, "lyap1_mean": -0.1857832968235016, "lyap1_max": -0.1175488755106926, "frac_above_star": 0.0 }, { "step": 315, "sup_loss": 0.6627528378192635, "rf_loss": 0.0, "total_loss": 0.6627528378192635, "lyap1_mean": -0.20149578154087067, "lyap1_max": -0.1099119484424591, "frac_above_star": 0.0 }, { "step": 316, "sup_loss": 0.5789342480232099, "rf_loss": 0.0, "total_loss": 0.5789342480232099, "lyap1_mean": -0.2053331881761551, "lyap1_max": -0.14896173775196075, "frac_above_star": 0.0 }, { "step": 317, "sup_loss": 0.6906240859629285, "rf_loss": 0.0, "total_loss": 0.6906240859629285, "lyap1_mean": -0.20366495847702026, "lyap1_max": -0.16215787827968597, "frac_above_star": 0.0 }, { "step": 318, "sup_loss": 0.577792260096764, "rf_loss": 0.0, "total_loss": 0.577792260096764, "lyap1_mean": -0.21726560592651367, "lyap1_max": -0.10607753694057465, "frac_above_star": 0.0 }, { "step": 319, "sup_loss": 0.5722200480933208, "rf_loss": 0.0, "total_loss": 0.5722200480933208, "lyap1_mean": -0.2302064448595047, "lyap1_max": -0.15408235788345337, "frac_above_star": 0.0 }, { "step": 320, "sup_loss": 0.6508213234899658, "rf_loss": 0.0, "total_loss": 0.6508213234899658, "lyap1_mean": -0.19187375903129578, "lyap1_max": -0.13157692551612854, "frac_above_star": 0.0 }, { "step": 321, "sup_loss": 0.47385235645879986, "rf_loss": 0.0, "total_loss": 0.47385235645879986, "lyap1_mean": -0.18041148781776428, "lyap1_max": -0.04731091856956482, "frac_above_star": 0.0 }, { "step": 322, "sup_loss": 0.5540987578209245, "rf_loss": 0.0, "total_loss": 0.5540987578209245, "lyap1_mean": -0.16657018661499023, "lyap1_max": -0.07768111675977707, "frac_above_star": 0.0 }, { "step": 323, "sup_loss": 0.9011917319108097, "rf_loss": 0.0, "total_loss": 0.9011917319108097, "lyap1_mean": -0.17512476444244385, "lyap1_max": -0.10239966958761215, "frac_above_star": 0.0 }, { "step": 324, "sup_loss": 0.6071310052896857, "rf_loss": 0.0, "total_loss": 0.6071310052896857, "lyap1_mean": -0.20789191126823425, "lyap1_max": -0.09531428664922714, "frac_above_star": 0.0 }, { "step": 325, "sup_loss": 0.582458570647056, "rf_loss": 0.0, "total_loss": 0.582458570647056, "lyap1_mean": -0.17439937591552734, "lyap1_max": -0.08293897658586502, "frac_above_star": 0.0 }, { "step": 326, "sup_loss": 0.8106188970154662, "rf_loss": 0.0, "total_loss": 0.8106188970154662, "lyap1_mean": -0.16168546676635742, "lyap1_max": -0.053428199142217636, "frac_above_star": 0.0 }, { "step": 327, "sup_loss": 0.6312333608267489, "rf_loss": 0.0, "total_loss": 0.6312333608267489, "lyap1_mean": -0.20303195714950562, "lyap1_max": -0.13282987475395203, "frac_above_star": 0.0 }, { "step": 328, "sup_loss": 0.5422648221897417, "rf_loss": 0.0, "total_loss": 0.5422648221897417, "lyap1_mean": -0.19051404297351837, "lyap1_max": -0.07751069217920303, "frac_above_star": 0.0 }, { "step": 329, "sup_loss": 0.5163909029289683, "rf_loss": 0.0, "total_loss": 0.5163909029289683, "lyap1_mean": -0.19445833563804626, "lyap1_max": -0.13371263444423676, "frac_above_star": 0.0 }, { "step": 330, "sup_loss": 0.6181871005718456, "rf_loss": 0.0, "total_loss": 0.6181871005718456, "lyap1_mean": -0.21415221691131592, "lyap1_max": -0.12783290445804596, "frac_above_star": 0.0 }, { "step": 331, "sup_loss": 0.6829852307647862, "rf_loss": 0.0, "total_loss": 0.6829852307647862, "lyap1_mean": -0.15502427518367767, "lyap1_max": -0.07957062125205994, "frac_above_star": 0.0 }, { "step": 332, "sup_loss": 0.6879567782925539, "rf_loss": 0.0, "total_loss": 0.6879567782925539, "lyap1_mean": -0.1819939911365509, "lyap1_max": -0.028732536360621452, "frac_above_star": 0.0 }, { "step": 333, "sup_loss": 0.6029713276998413, "rf_loss": 3.826450483757071e-05, "total_loss": 0.603353972755493, "lyap1_mean": -0.18572357296943665, "lyap1_max": 0.017496172338724136, "frac_above_star": 0.125 }, { "step": 334, "sup_loss": 0.45567067729668537, "rf_loss": 0.0, "total_loss": 0.45567067729668537, "lyap1_mean": -0.2405601590871811, "lyap1_max": -0.07903667539358139, "frac_above_star": 0.0 }, { "step": 335, "sup_loss": 0.6695800862384511, "rf_loss": 0.0, "total_loss": 0.6695800862384511, "lyap1_mean": -0.16050902009010315, "lyap1_max": -0.07255368679761887, "frac_above_star": 0.0 }, { "step": 336, "sup_loss": 0.47959168957172627, "rf_loss": 0.0, "total_loss": 0.47959168957172627, "lyap1_mean": -0.21810755133628845, "lyap1_max": -0.12287141382694244, "frac_above_star": 0.0 }, { "step": 337, "sup_loss": 0.6797811820079066, "rf_loss": 0.0, "total_loss": 0.6797811820079066, "lyap1_mean": -0.15427827835083008, "lyap1_max": -0.06944482028484344, "frac_above_star": 0.0 }, { "step": 338, "sup_loss": 0.45031763710734607, "rf_loss": 0.0, "total_loss": 0.45031763710734607, "lyap1_mean": -0.2577511966228485, "lyap1_max": -0.12987101078033447, "frac_above_star": 0.0 }, { "step": 339, "sup_loss": 0.612827626013735, "rf_loss": 0.0, "total_loss": 0.612827626013735, "lyap1_mean": -0.21244710683822632, "lyap1_max": -0.1695183962583542, "frac_above_star": 0.0 }, { "step": 340, "sup_loss": 0.617710493869964, "rf_loss": 0.0, "total_loss": 0.617710493869964, "lyap1_mean": -0.20625047385692596, "lyap1_max": -0.1609116643667221, "frac_above_star": 0.0 }, { "step": 341, "sup_loss": 0.6152667160237358, "rf_loss": 0.0, "total_loss": 0.6152667160237358, "lyap1_mean": -0.22426238656044006, "lyap1_max": -0.1430836319923401, "frac_above_star": 0.0 }, { "step": 342, "sup_loss": 0.4258543016668707, "rf_loss": 0.0, "total_loss": 0.4258543016668707, "lyap1_mean": -0.20931020379066467, "lyap1_max": -0.11437708139419556, "frac_above_star": 0.0 }, { "step": 343, "sup_loss": 0.5054577904708717, "rf_loss": 0.0, "total_loss": 0.5054577904708717, "lyap1_mean": -0.21300777792930603, "lyap1_max": -0.09619505703449249, "frac_above_star": 0.0 }, { "step": 344, "sup_loss": 0.4650392369019393, "rf_loss": 0.0, "total_loss": 0.4650392369019393, "lyap1_mean": -0.2412421703338623, "lyap1_max": -0.14713002741336823, "frac_above_star": 0.0 }, { "step": 345, "sup_loss": 0.5114353556061555, "rf_loss": 0.0, "total_loss": 0.5114353556061555, "lyap1_mean": -0.17073482275009155, "lyap1_max": -0.04239789396524429, "frac_above_star": 0.0 }, { "step": 346, "sup_loss": 0.530774454967623, "rf_loss": 0.0, "total_loss": 0.530774454967623, "lyap1_mean": -0.1936408430337906, "lyap1_max": -0.1057838723063469, "frac_above_star": 0.0 }, { "step": 347, "sup_loss": 0.7561842376707624, "rf_loss": 0.0, "total_loss": 0.7561842376707624, "lyap1_mean": -0.19192439317703247, "lyap1_max": -0.13412657380104065, "frac_above_star": 0.0 }, { "step": 348, "sup_loss": 0.6017917432870841, "rf_loss": 0.0, "total_loss": 0.6017917432870841, "lyap1_mean": -0.21505501866340637, "lyap1_max": -0.1551818996667862, "frac_above_star": 0.0 }, { "step": 349, "sup_loss": 0.6351538286787377, "rf_loss": 0.0, "total_loss": 0.6351538286787377, "lyap1_mean": -0.20465058088302612, "lyap1_max": -0.04359325021505356, "frac_above_star": 0.0 }, { "step": 350, "sup_loss": 0.782842096319724, "rf_loss": 0.0, "total_loss": 0.782842096319724, "lyap1_mean": -0.13674487173557281, "lyap1_max": -0.061379313468933105, "frac_above_star": 0.0 }, { "step": 351, "sup_loss": 0.5910700662074077, "rf_loss": 0.0, "total_loss": 0.5910700662074077, "lyap1_mean": -0.1918736696243286, "lyap1_max": -0.005033716559410095, "frac_above_star": 0.0 }, { "step": 352, "sup_loss": 0.5966124670342008, "rf_loss": 0.0, "total_loss": 0.5966124670342008, "lyap1_mean": -0.21596181392669678, "lyap1_max": -0.14188343286514282, "frac_above_star": 0.0 }, { "step": 353, "sup_loss": 0.675918530851194, "rf_loss": 0.0, "total_loss": 0.675918530851194, "lyap1_mean": -0.19547432661056519, "lyap1_max": -0.1526150107383728, "frac_above_star": 0.0 }, { "step": 354, "sup_loss": 0.7168136633100655, "rf_loss": 0.0, "total_loss": 0.7168136633100655, "lyap1_mean": -0.18883001804351807, "lyap1_max": -0.06116810068488121, "frac_above_star": 0.0 }, { "step": 355, "sup_loss": 0.678914560936435, "rf_loss": 0.0, "total_loss": 0.678914560936435, "lyap1_mean": -0.204725980758667, "lyap1_max": -0.1210031732916832, "frac_above_star": 0.0 }, { "step": 356, "sup_loss": 0.7881227113058328, "rf_loss": 0.0, "total_loss": 0.7881227113058328, "lyap1_mean": -0.18319512903690338, "lyap1_max": -0.09052859246730804, "frac_above_star": 0.0 }, { "step": 357, "sup_loss": 0.5294555377656751, "rf_loss": 0.0, "total_loss": 0.5294555377656751, "lyap1_mean": -0.21538054943084717, "lyap1_max": -0.16080915927886963, "frac_above_star": 0.0 }, { "step": 358, "sup_loss": 0.5268954028957669, "rf_loss": 0.0, "total_loss": 0.5268954028957669, "lyap1_mean": -0.20286843180656433, "lyap1_max": -0.004223668482154608, "frac_above_star": 0.0 }, { "step": 359, "sup_loss": 0.6616861391966553, "rf_loss": 0.0, "total_loss": 0.6616861391966553, "lyap1_mean": -0.2135724425315857, "lyap1_max": -0.13193802535533905, "frac_above_star": 0.0 }, { "step": 360, "sup_loss": 0.606203764556421, "rf_loss": 0.0, "total_loss": 0.606203764556421, "lyap1_mean": -0.160806804895401, "lyap1_max": -0.09549286961555481, "frac_above_star": 0.0 }, { "step": 361, "sup_loss": 0.8928659020905169, "rf_loss": 0.0, "total_loss": 0.8928659020905169, "lyap1_mean": -0.16604696214199066, "lyap1_max": -0.05280466005206108, "frac_above_star": 0.0 }, { "step": 362, "sup_loss": 0.7083959801570291, "rf_loss": 0.0, "total_loss": 0.7083959801570291, "lyap1_mean": -0.15882061421871185, "lyap1_max": -0.03835834562778473, "frac_above_star": 0.0 }, { "step": 363, "sup_loss": 0.7482588618571201, "rf_loss": 0.0, "total_loss": 0.7482588618571201, "lyap1_mean": -0.15882053971290588, "lyap1_max": -0.09018184244632721, "frac_above_star": 0.0 }, { "step": 364, "sup_loss": 0.6308320943439704, "rf_loss": 0.0, "total_loss": 0.6308320943439704, "lyap1_mean": -0.18016958236694336, "lyap1_max": -0.09750163555145264, "frac_above_star": 0.0 }, { "step": 365, "sup_loss": 0.4164091509955829, "rf_loss": 0.0, "total_loss": 0.4164091509955829, "lyap1_mean": -0.22297818958759308, "lyap1_max": -0.14620640873908997, "frac_above_star": 0.0 }, { "step": 366, "sup_loss": 0.5987280149112422, "rf_loss": 0.0, "total_loss": 0.5987280149112422, "lyap1_mean": -0.20581157505512238, "lyap1_max": -0.13173836469650269, "frac_above_star": 0.0 }, { "step": 367, "sup_loss": 0.6271995162277311, "rf_loss": 0.0, "total_loss": 0.6271995162277311, "lyap1_mean": -0.2065156102180481, "lyap1_max": -0.10696878284215927, "frac_above_star": 0.0 }, { "step": 368, "sup_loss": 0.6818754835047333, "rf_loss": 0.0, "total_loss": 0.6818754835047333, "lyap1_mean": -0.17280782759189606, "lyap1_max": -0.08220875263214111, "frac_above_star": 0.0 }, { "step": 369, "sup_loss": 0.5613284646544792, "rf_loss": 0.0, "total_loss": 0.5613284646544792, "lyap1_mean": -0.15868282318115234, "lyap1_max": -0.040507685393095016, "frac_above_star": 0.0 }, { "step": 370, "sup_loss": 0.7062698803339427, "rf_loss": 0.0, "total_loss": 0.7062698803339427, "lyap1_mean": -0.20176076889038086, "lyap1_max": -0.1737232804298401, "frac_above_star": 0.0 }, { "step": 371, "sup_loss": 0.5138421031993283, "rf_loss": 0.0, "total_loss": 0.5138421031993283, "lyap1_mean": -0.24099764227867126, "lyap1_max": -0.1382274329662323, "frac_above_star": 0.0 }, { "step": 372, "sup_loss": 0.6737039514335528, "rf_loss": 0.0, "total_loss": 0.6737039514335528, "lyap1_mean": -0.1585230529308319, "lyap1_max": -0.10426023602485657, "frac_above_star": 0.0 }, { "step": 373, "sup_loss": 0.4708590665689304, "rf_loss": 0.0, "total_loss": 0.4708590665689304, "lyap1_mean": -0.19795387983322144, "lyap1_max": -0.10054431855678558, "frac_above_star": 0.0 }, { "step": 374, "sup_loss": 0.6915544440031035, "rf_loss": 0.0, "total_loss": 0.6915544440031035, "lyap1_mean": -0.1804148405790329, "lyap1_max": -0.0661967545747757, "frac_above_star": 0.0 }, { "step": 375, "sup_loss": 0.5588678318956251, "rf_loss": 0.0, "total_loss": 0.5588678318956251, "lyap1_mean": -0.18470902740955353, "lyap1_max": -0.06487395614385605, "frac_above_star": 0.0 }, { "step": 376, "sup_loss": 0.5274282106751615, "rf_loss": 0.0, "total_loss": 0.5274282106751615, "lyap1_mean": -0.20193055272102356, "lyap1_max": -0.08201418071985245, "frac_above_star": 0.0 }, { "step": 377, "sup_loss": 0.581763876803729, "rf_loss": 0.0, "total_loss": 0.581763876803729, "lyap1_mean": -0.17592361569404602, "lyap1_max": -0.07936382293701172, "frac_above_star": 0.0 }, { "step": 378, "sup_loss": 0.4597660492247642, "rf_loss": 0.0, "total_loss": 0.4597660492247642, "lyap1_mean": -0.2564019560813904, "lyap1_max": -0.1167556494474411, "frac_above_star": 0.0 }, { "step": 379, "sup_loss": 0.46006944011459255, "rf_loss": 0.0, "total_loss": 0.46006944011459255, "lyap1_mean": -0.20380762219429016, "lyap1_max": -0.13572263717651367, "frac_above_star": 0.0 }, { "step": 380, "sup_loss": 0.5632022352276694, "rf_loss": 0.0, "total_loss": 0.5632022352276694, "lyap1_mean": -0.20880866050720215, "lyap1_max": -0.09361293166875839, "frac_above_star": 0.0 }, { "step": 381, "sup_loss": 0.4364613193999451, "rf_loss": 0.0, "total_loss": 0.4364613193999451, "lyap1_mean": -0.21988144516944885, "lyap1_max": -0.09750216454267502, "frac_above_star": 0.0 }, { "step": 382, "sup_loss": 0.66264301138006, "rf_loss": 0.0, "total_loss": 0.66264301138006, "lyap1_mean": -0.1951894313097, "lyap1_max": -0.12072128057479858, "frac_above_star": 0.0 }, { "step": 383, "sup_loss": 0.4515309581351513, "rf_loss": 0.0, "total_loss": 0.4515309581351513, "lyap1_mean": -0.23244574666023254, "lyap1_max": -0.12313459813594818, "frac_above_star": 0.0 }, { "step": 384, "sup_loss": 0.44204852509041537, "rf_loss": 0.0, "total_loss": 0.44204852509041537, "lyap1_mean": -0.22741319239139557, "lyap1_max": -0.13253024220466614, "frac_above_star": 0.0 }, { "step": 385, "sup_loss": 0.5102926892672601, "rf_loss": 0.0, "total_loss": 0.5102926892672601, "lyap1_mean": -0.19103452563285828, "lyap1_max": -0.08420859277248383, "frac_above_star": 0.0 }, { "step": 386, "sup_loss": 0.45695202603060114, "rf_loss": 0.0, "total_loss": 0.45695202603060114, "lyap1_mean": -0.24187232553958893, "lyap1_max": -0.11189377307891846, "frac_above_star": 0.0 }, { "step": 387, "sup_loss": 0.6926642116318935, "rf_loss": 0.0, "total_loss": 0.6926642116318935, "lyap1_mean": -0.17316362261772156, "lyap1_max": -0.05011987313628197, "frac_above_star": 0.0 }, { "step": 388, "sup_loss": 0.6684021219317057, "rf_loss": 0.0, "total_loss": 0.6684021219317057, "lyap1_mean": -0.2088947892189026, "lyap1_max": -0.16127729415893555, "frac_above_star": 0.0 }, { "step": 389, "sup_loss": 0.5515624315984612, "rf_loss": 0.0, "total_loss": 0.5515624315984612, "lyap1_mean": -0.20058554410934448, "lyap1_max": -0.09298398345708847, "frac_above_star": 0.0 }, { "step": 390, "sup_loss": 0.601766807616978, "rf_loss": 0.0, "total_loss": 0.601766807616978, "lyap1_mean": -0.2196391075849533, "lyap1_max": -0.06671483814716339, "frac_above_star": 0.0 }, { "step": 391, "sup_loss": 0.6718063090991536, "rf_loss": 0.0, "total_loss": 0.6718063090991536, "lyap1_mean": -0.23165051639080048, "lyap1_max": -0.13598200678825378, "frac_above_star": 0.0 }, { "step": 392, "sup_loss": 0.6701925497567233, "rf_loss": 0.0, "total_loss": 0.6701925497567233, "lyap1_mean": -0.19613829255104065, "lyap1_max": -0.154951810836792, "frac_above_star": 0.0 }, { "step": 393, "sup_loss": 0.7559909388765815, "rf_loss": 0.0, "total_loss": 0.7559909388765815, "lyap1_mean": -0.17928481101989746, "lyap1_max": -0.10894026607275009, "frac_above_star": 0.0 }, { "step": 394, "sup_loss": 0.6862059105799613, "rf_loss": 0.0, "total_loss": 0.6862059105799613, "lyap1_mean": -0.20451520383358002, "lyap1_max": -0.13031339645385742, "frac_above_star": 0.0 }, { "step": 395, "sup_loss": 0.6238241736162596, "rf_loss": 0.0, "total_loss": 0.6238241736162596, "lyap1_mean": -0.2125069797039032, "lyap1_max": -0.13419416546821594, "frac_above_star": 0.0 }, { "step": 396, "sup_loss": 0.5543267540897161, "rf_loss": 0.0, "total_loss": 0.5543267540897161, "lyap1_mean": -0.1750076413154602, "lyap1_max": -0.06425385922193527, "frac_above_star": 0.0 }, { "step": 397, "sup_loss": 0.4419858617270676, "rf_loss": 0.0, "total_loss": 0.4419858617270676, "lyap1_mean": -0.2407246083021164, "lyap1_max": -0.16595309972763062, "frac_above_star": 0.0 }, { "step": 398, "sup_loss": 0.7529441848064666, "rf_loss": 0.0, "total_loss": 0.7529441848064666, "lyap1_mean": -0.2003626525402069, "lyap1_max": -0.12171699106693268, "frac_above_star": 0.0 }, { "step": 399, "sup_loss": 0.4274941310651707, "rf_loss": 0.0, "total_loss": 0.4274941310651707, "lyap1_mean": -0.253703773021698, "lyap1_max": -0.12632986903190613, "frac_above_star": 0.0 }, { "step": 400, "sup_loss": 0.541843113607991, "rf_loss": 0.0, "total_loss": 0.541843113607991, "lyap1_mean": -0.23306682705879211, "lyap1_max": -0.13942019641399384, "frac_above_star": 0.0 }, { "step": 401, "sup_loss": 0.6333644034043541, "rf_loss": 0.0, "total_loss": 0.6333644034043541, "lyap1_mean": -0.21318838000297546, "lyap1_max": -0.12276913225650787, "frac_above_star": 0.0 }, { "step": 402, "sup_loss": 0.6134673184430651, "rf_loss": 0.0, "total_loss": 0.6134673184430651, "lyap1_mean": -0.2013246715068817, "lyap1_max": -0.10854886472225189, "frac_above_star": 0.0 }, { "step": 403, "sup_loss": 0.6480385852394712, "rf_loss": 0.0, "total_loss": 0.6480385852394712, "lyap1_mean": -0.1586003452539444, "lyap1_max": -0.06721264123916626, "frac_above_star": 0.0 }, { "step": 404, "sup_loss": 0.44802136543671495, "rf_loss": 0.0, "total_loss": 0.44802136543671495, "lyap1_mean": -0.23569346964359283, "lyap1_max": -0.1620783805847168, "frac_above_star": 0.0 }, { "step": 405, "sup_loss": 0.7822260581145454, "rf_loss": 0.0, "total_loss": 0.7822260581145454, "lyap1_mean": -0.20069602131843567, "lyap1_max": -0.07712525129318237, "frac_above_star": 0.0 }, { "step": 406, "sup_loss": 0.7710663304577412, "rf_loss": 0.0, "total_loss": 0.7710663304577412, "lyap1_mean": -0.22981709241867065, "lyap1_max": -0.12577027082443237, "frac_above_star": 0.0 }, { "step": 407, "sup_loss": 0.5577066597882143, "rf_loss": 0.0, "total_loss": 0.5577066597882143, "lyap1_mean": -0.21974991261959076, "lyap1_max": -0.13262882828712463, "frac_above_star": 0.0 }, { "step": 408, "sup_loss": 0.5472606186887976, "rf_loss": 0.0, "total_loss": 0.5472606186887976, "lyap1_mean": -0.19248127937316895, "lyap1_max": -0.0850316733121872, "frac_above_star": 0.0 }, { "step": 409, "sup_loss": 0.8200874989493157, "rf_loss": 0.0, "total_loss": 0.8200874989493157, "lyap1_mean": -0.18073473870754242, "lyap1_max": -0.08566507697105408, "frac_above_star": 0.0 }, { "step": 410, "sup_loss": 0.6317165754752954, "rf_loss": 0.0, "total_loss": 0.6317165754752954, "lyap1_mean": -0.18964365124702454, "lyap1_max": -0.08450456708669662, "frac_above_star": 0.0 }, { "step": 411, "sup_loss": 0.6428149157862336, "rf_loss": 0.0, "total_loss": 0.6428149157862336, "lyap1_mean": -0.1839533895254135, "lyap1_max": -0.1360056847333908, "frac_above_star": 0.0 }, { "step": 412, "sup_loss": 0.8019578563453434, "rf_loss": 0.0, "total_loss": 0.8019578563453434, "lyap1_mean": -0.17444077134132385, "lyap1_max": -0.09533258527517319, "frac_above_star": 0.0 }, { "step": 413, "sup_loss": 0.6817477327435983, "rf_loss": 0.0, "total_loss": 0.6817477327435983, "lyap1_mean": -0.20133468508720398, "lyap1_max": -0.14374417066574097, "frac_above_star": 0.0 }, { "step": 414, "sup_loss": 0.8517326786046907, "rf_loss": 0.0, "total_loss": 0.8517326786046907, "lyap1_mean": -0.1866406798362732, "lyap1_max": -0.1291995793581009, "frac_above_star": 0.0 }, { "step": 415, "sup_loss": 0.5885188598494874, "rf_loss": 0.0, "total_loss": 0.5885188598494874, "lyap1_mean": -0.2051071673631668, "lyap1_max": -0.11106543987989426, "frac_above_star": 0.0 }, { "step": 416, "sup_loss": 0.6389622126057347, "rf_loss": 0.0, "total_loss": 0.6389622126057347, "lyap1_mean": -0.1401863992214203, "lyap1_max": -0.04137813299894333, "frac_above_star": 0.0 }, { "step": 417, "sup_loss": 0.7242631118632783, "rf_loss": 0.0, "total_loss": 0.7242631118632783, "lyap1_mean": -0.20014476776123047, "lyap1_max": -0.09285998344421387, "frac_above_star": 0.0 }, { "step": 418, "sup_loss": 0.6170678917932148, "rf_loss": 0.0, "total_loss": 0.6170678917932148, "lyap1_mean": -0.20304855704307556, "lyap1_max": -0.07744231075048447, "frac_above_star": 0.0 }, { "step": 419, "sup_loss": 0.5834679257993275, "rf_loss": 0.0, "total_loss": 0.5834679257993275, "lyap1_mean": -0.19520199298858643, "lyap1_max": -0.07508471608161926, "frac_above_star": 0.0 }, { "step": 420, "sup_loss": 0.6184184670481919, "rf_loss": 0.0, "total_loss": 0.6184184670481919, "lyap1_mean": -0.22614485025405884, "lyap1_max": -0.08879595249891281, "frac_above_star": 0.0 }, { "step": 421, "sup_loss": 0.5834496232695248, "rf_loss": 0.0, "total_loss": 0.5834496232695248, "lyap1_mean": -0.21686387062072754, "lyap1_max": -0.11697535216808319, "frac_above_star": 0.0 }, { "step": 422, "sup_loss": 0.46873376242182047, "rf_loss": 0.0, "total_loss": 0.46873376242182047, "lyap1_mean": -0.20978090167045593, "lyap1_max": -0.1583404839038849, "frac_above_star": 0.0 }, { "step": 423, "sup_loss": 0.4277216868881535, "rf_loss": 0.0, "total_loss": 0.4277216868881535, "lyap1_mean": -0.18250460922718048, "lyap1_max": -0.06321868300437927, "frac_above_star": 0.0 }, { "step": 424, "sup_loss": 0.56364931635572, "rf_loss": 0.0, "total_loss": 0.56364931635572, "lyap1_mean": -0.2385718822479248, "lyap1_max": -0.18002289533615112, "frac_above_star": 0.0 }, { "step": 425, "sup_loss": 0.4246765232390541, "rf_loss": 0.0, "total_loss": 0.4246765232390541, "lyap1_mean": -0.23518259823322296, "lyap1_max": -0.0972171276807785, "frac_above_star": 0.0 }, { "step": 426, "sup_loss": 0.5237068134679024, "rf_loss": 0.0, "total_loss": 0.5237068134679024, "lyap1_mean": -0.2115860879421234, "lyap1_max": -0.11454209685325623, "frac_above_star": 0.0 }, { "step": 427, "sup_loss": 0.5997124572467873, "rf_loss": 0.0, "total_loss": 0.5997124572467873, "lyap1_mean": -0.23042023181915283, "lyap1_max": -0.10170955955982208, "frac_above_star": 0.0 }, { "step": 428, "sup_loss": 0.5299713536257804, "rf_loss": 0.0, "total_loss": 0.5299713536257804, "lyap1_mean": -0.22233423590660095, "lyap1_max": -0.146438330411911, "frac_above_star": 0.0 }, { "step": 429, "sup_loss": 0.8505029093063249, "rf_loss": 0.0, "total_loss": 0.8505029093063249, "lyap1_mean": -0.1852549910545349, "lyap1_max": -0.15016363561153412, "frac_above_star": 0.0 }, { "step": 430, "sup_loss": 0.6260532971507008, "rf_loss": 0.0, "total_loss": 0.6260532971507008, "lyap1_mean": -0.22456932067871094, "lyap1_max": -0.19372230768203735, "frac_above_star": 0.0 }, { "step": 431, "sup_loss": 0.6205153009455984, "rf_loss": 0.0, "total_loss": 0.6205153009455984, "lyap1_mean": -0.1905740648508072, "lyap1_max": -0.10736075043678284, "frac_above_star": 0.0 }, { "step": 432, "sup_loss": 0.5522194151031772, "rf_loss": 0.0, "total_loss": 0.5522194151031772, "lyap1_mean": -0.18396684527397156, "lyap1_max": -0.14840683341026306, "frac_above_star": 0.0 }, { "step": 433, "sup_loss": 0.684030551364668, "rf_loss": 0.0, "total_loss": 0.684030551364668, "lyap1_mean": -0.19913317263126373, "lyap1_max": -0.11573466658592224, "frac_above_star": 0.0 }, { "step": 434, "sup_loss": 0.6835258893157763, "rf_loss": 0.0, "total_loss": 0.6835258893157763, "lyap1_mean": -0.2122216671705246, "lyap1_max": -0.1381903737783432, "frac_above_star": 0.0 }, { "step": 435, "sup_loss": 0.4847939587595649, "rf_loss": 0.0, "total_loss": 0.4847939587595649, "lyap1_mean": -0.1715138852596283, "lyap1_max": -0.04178324341773987, "frac_above_star": 0.0 }, { "step": 436, "sup_loss": 0.45466420254999934, "rf_loss": 0.0, "total_loss": 0.45466420254999934, "lyap1_mean": -0.23010817170143127, "lyap1_max": -0.11812260746955872, "frac_above_star": 0.0 }, { "step": 437, "sup_loss": 0.666091944664287, "rf_loss": 0.0, "total_loss": 0.666091944664287, "lyap1_mean": -0.22724004089832306, "lyap1_max": -0.16292116045951843, "frac_above_star": 0.0 }, { "step": 438, "sup_loss": 0.6010085088582172, "rf_loss": 0.0, "total_loss": 0.6010085088582172, "lyap1_mean": -0.18015745282173157, "lyap1_max": -0.12485748529434204, "frac_above_star": 0.0 }, { "step": 439, "sup_loss": 0.6026152472485455, "rf_loss": 0.0, "total_loss": 0.6026152472485455, "lyap1_mean": -0.18596377968788147, "lyap1_max": -0.0804155170917511, "frac_above_star": 0.0 }, { "step": 440, "sup_loss": 0.8088728448626544, "rf_loss": 0.0, "total_loss": 0.8088728448626544, "lyap1_mean": -0.17091886699199677, "lyap1_max": -0.10065191239118576, "frac_above_star": 0.0 }, { "step": 441, "sup_loss": 0.5145146161590706, "rf_loss": 0.0, "total_loss": 0.5145146161590706, "lyap1_mean": -0.19709008932113647, "lyap1_max": -0.0920170471072197, "frac_above_star": 0.0 }, { "step": 442, "sup_loss": 0.5473842973334815, "rf_loss": 0.0, "total_loss": 0.5473842973334815, "lyap1_mean": -0.20682984590530396, "lyap1_max": -0.07919889688491821, "frac_above_star": 0.0 }, { "step": 443, "sup_loss": 0.7171780707521886, "rf_loss": 0.0, "total_loss": 0.7171780707521886, "lyap1_mean": -0.17546863853931427, "lyap1_max": -0.0773872658610344, "frac_above_star": 0.0 }, { "step": 444, "sup_loss": 0.8109926573104049, "rf_loss": 0.0, "total_loss": 0.8109926573104049, "lyap1_mean": -0.17671331763267517, "lyap1_max": -0.10567508637905121, "frac_above_star": 0.0 }, { "step": 445, "sup_loss": 0.5187260248264307, "rf_loss": 0.0, "total_loss": 0.5187260248264307, "lyap1_mean": -0.18257877230644226, "lyap1_max": -0.09571998566389084, "frac_above_star": 0.0 }, { "step": 446, "sup_loss": 0.64499367743222, "rf_loss": 0.0, "total_loss": 0.64499367743222, "lyap1_mean": -0.18543002009391785, "lyap1_max": -0.0919903814792633, "frac_above_star": 0.0 }, { "step": 447, "sup_loss": 0.5922426600876496, "rf_loss": 0.0, "total_loss": 0.5922426600876496, "lyap1_mean": -0.1853993982076645, "lyap1_max": -0.09295933693647385, "frac_above_star": 0.0 }, { "step": 448, "sup_loss": 0.7907148444100979, "rf_loss": 0.0, "total_loss": 0.7907148444100979, "lyap1_mean": -0.19381244480609894, "lyap1_max": -0.11008801311254501, "frac_above_star": 0.0 }, { "step": 449, "sup_loss": 0.769561283686713, "rf_loss": 0.0, "total_loss": 0.769561283686713, "lyap1_mean": -0.20024415850639343, "lyap1_max": -0.13815838098526, "frac_above_star": 0.0 }, { "step": 450, "sup_loss": 0.5945196157979601, "rf_loss": 0.0, "total_loss": 0.5945196157979601, "lyap1_mean": -0.21762865781784058, "lyap1_max": -0.1536758691072464, "frac_above_star": 0.0 }, { "step": 451, "sup_loss": 0.5127424454829249, "rf_loss": 0.0, "total_loss": 0.5127424454829249, "lyap1_mean": -0.21969911456108093, "lyap1_max": -0.09908488392829895, "frac_above_star": 0.0 }, { "step": 452, "sup_loss": 0.568696628716902, "rf_loss": 0.0, "total_loss": 0.568696628716902, "lyap1_mean": -0.2138366550207138, "lyap1_max": -0.09322752803564072, "frac_above_star": 0.0 }, { "step": 453, "sup_loss": 0.7562978214840389, "rf_loss": 0.0, "total_loss": 0.7562978214840389, "lyap1_mean": -0.20691806077957153, "lyap1_max": -0.12872862815856934, "frac_above_star": 0.0 }, { "step": 454, "sup_loss": 0.6551328185418259, "rf_loss": 0.0, "total_loss": 0.6551328185418259, "lyap1_mean": -0.20642487704753876, "lyap1_max": -0.07981183379888535, "frac_above_star": 0.0 }, { "step": 455, "sup_loss": 0.68868814881439, "rf_loss": 0.0, "total_loss": 0.68868814881439, "lyap1_mean": -0.1813572645187378, "lyap1_max": -0.011597412638366222, "frac_above_star": 0.0 }, { "step": 456, "sup_loss": 0.4367098554190726, "rf_loss": 0.0, "total_loss": 0.4367098554190726, "lyap1_mean": -0.24434518814086914, "lyap1_max": -0.14177510142326355, "frac_above_star": 0.0 }, { "step": 457, "sup_loss": 0.45969433008608135, "rf_loss": 0.0, "total_loss": 0.45969433008608135, "lyap1_mean": -0.1993560492992401, "lyap1_max": -0.09999115765094757, "frac_above_star": 0.0 }, { "step": 458, "sup_loss": 0.5287129636895747, "rf_loss": 0.0, "total_loss": 0.5287129636895747, "lyap1_mean": -0.20102721452713013, "lyap1_max": -0.11296612024307251, "frac_above_star": 0.0 }, { "step": 459, "sup_loss": 0.6001089480990052, "rf_loss": 0.0, "total_loss": 0.6001089480990052, "lyap1_mean": -0.2047824263572693, "lyap1_max": -0.16775868833065033, "frac_above_star": 0.0 }, { "step": 460, "sup_loss": 0.49769986376214453, "rf_loss": 0.0, "total_loss": 0.49769986376214453, "lyap1_mean": -0.2387564778327942, "lyap1_max": -0.12966139614582062, "frac_above_star": 0.0 }, { "step": 461, "sup_loss": 0.4930502541504891, "rf_loss": 0.0, "total_loss": 0.4930502541504891, "lyap1_mean": -0.2362280786037445, "lyap1_max": -0.1668357104063034, "frac_above_star": 0.0 }, { "step": 462, "sup_loss": 0.46169493105784926, "rf_loss": 0.0, "total_loss": 0.46169493105784926, "lyap1_mean": -0.22429259121418, "lyap1_max": -0.16607175767421722, "frac_above_star": 0.0 }, { "step": 463, "sup_loss": 0.802166309212678, "rf_loss": 0.0, "total_loss": 0.802166309212678, "lyap1_mean": -0.20674104988574982, "lyap1_max": -0.13305266201496124, "frac_above_star": 0.0 }, { "step": 464, "sup_loss": 0.5747584587530254, "rf_loss": 0.0, "total_loss": 0.5747584587530254, "lyap1_mean": -0.20135027170181274, "lyap1_max": -0.07635249197483063, "frac_above_star": 0.0 }, { "step": 465, "sup_loss": 0.5848124214260316, "rf_loss": 0.0, "total_loss": 0.5848124214260316, "lyap1_mean": -0.1798902153968811, "lyap1_max": -0.13341239094734192, "frac_above_star": 0.0 }, { "step": 466, "sup_loss": 0.5697222687688868, "rf_loss": 0.0, "total_loss": 0.5697222687688868, "lyap1_mean": -0.22785009443759918, "lyap1_max": -0.16904041171073914, "frac_above_star": 0.0 }, { "step": 467, "sup_loss": 0.49221582119529633, "rf_loss": 0.0, "total_loss": 0.49221582119529633, "lyap1_mean": -0.22846445441246033, "lyap1_max": -0.13291165232658386, "frac_above_star": 0.0 }, { "step": 468, "sup_loss": 0.7697801596926565, "rf_loss": 0.0, "total_loss": 0.7697801596926565, "lyap1_mean": -0.1920282542705536, "lyap1_max": -0.10256457328796387, "frac_above_star": 0.0 }, { "step": 469, "sup_loss": 0.6922007454802507, "rf_loss": 0.0, "total_loss": 0.6922007454802507, "lyap1_mean": -0.17902615666389465, "lyap1_max": -0.12225094437599182, "frac_above_star": 0.0 }, { "step": 470, "sup_loss": 0.5505792665285443, "rf_loss": 0.0, "total_loss": 0.5505792665285443, "lyap1_mean": -0.21936741471290588, "lyap1_max": -0.1531541794538498, "frac_above_star": 0.0 }, { "step": 471, "sup_loss": 0.6353451253510249, "rf_loss": 0.0, "total_loss": 0.6353451253510249, "lyap1_mean": -0.20361590385437012, "lyap1_max": -0.14439085125923157, "frac_above_star": 0.0 }, { "step": 472, "sup_loss": 0.6428148542581822, "rf_loss": 0.0, "total_loss": 0.6428148542581822, "lyap1_mean": -0.19642044603824615, "lyap1_max": -0.10523774474859238, "frac_above_star": 0.0 }, { "step": 473, "sup_loss": 0.5288797155319798, "rf_loss": 0.0, "total_loss": 0.5288797155319798, "lyap1_mean": -0.2076386958360672, "lyap1_max": -0.12072043865919113, "frac_above_star": 0.0 }, { "step": 474, "sup_loss": 0.3863632477579415, "rf_loss": 0.0, "total_loss": 0.3863632477579415, "lyap1_mean": -0.23749133944511414, "lyap1_max": -0.16364428400993347, "frac_above_star": 0.0 }, { "step": 475, "sup_loss": 0.8369189233501023, "rf_loss": 0.0, "total_loss": 0.8369189233501023, "lyap1_mean": -0.18644171953201294, "lyap1_max": -0.12330862134695053, "frac_above_star": 0.0 }, { "step": 476, "sup_loss": 0.5872188216009459, "rf_loss": 0.0, "total_loss": 0.5872188216009459, "lyap1_mean": -0.20678067207336426, "lyap1_max": -0.08927386999130249, "frac_above_star": 0.0 }, { "step": 477, "sup_loss": 0.5041393667798287, "rf_loss": 0.0, "total_loss": 0.5041393667798287, "lyap1_mean": -0.26429998874664307, "lyap1_max": -0.18356218934059143, "frac_above_star": 0.0 }, { "step": 478, "sup_loss": 0.5765562308926201, "rf_loss": 0.0, "total_loss": 0.5765562308926201, "lyap1_mean": -0.17559175193309784, "lyap1_max": -0.018731923773884773, "frac_above_star": 0.0 }, { "step": 479, "sup_loss": 0.4974266827365548, "rf_loss": 0.0, "total_loss": 0.4974266827365548, "lyap1_mean": -0.20852211117744446, "lyap1_max": -0.1370886266231537, "frac_above_star": 0.0 }, { "step": 480, "sup_loss": 0.620334603373274, "rf_loss": 0.0, "total_loss": 0.620334603373274, "lyap1_mean": -0.1951858550310135, "lyap1_max": -0.10776694864034653, "frac_above_star": 0.0 }, { "step": 481, "sup_loss": 0.5299444770294112, "rf_loss": 0.0, "total_loss": 0.5299444770294112, "lyap1_mean": -0.2059299498796463, "lyap1_max": -0.1464439481496811, "frac_above_star": 0.0 }, { "step": 482, "sup_loss": 0.8489174008467093, "rf_loss": 0.0, "total_loss": 0.8489174008467093, "lyap1_mean": -0.15450772643089294, "lyap1_max": -0.08675898611545563, "frac_above_star": 0.0 }, { "step": 483, "sup_loss": 0.6135943418403578, "rf_loss": 0.0, "total_loss": 0.6135943418403578, "lyap1_mean": -0.19584394991397858, "lyap1_max": -0.11074253171682358, "frac_above_star": 0.0 }, { "step": 484, "sup_loss": 0.5798082526804116, "rf_loss": 0.0, "total_loss": 0.5798082526804116, "lyap1_mean": -0.21491551399230957, "lyap1_max": -0.12314432114362717, "frac_above_star": 0.0 }, { "step": 485, "sup_loss": 0.7496293059904233, "rf_loss": 0.0, "total_loss": 0.7496293059904233, "lyap1_mean": -0.20109547674655914, "lyap1_max": -0.1007969006896019, "frac_above_star": 0.0 }, { "step": 486, "sup_loss": 0.6538638055579475, "rf_loss": 0.0, "total_loss": 0.6538638055579475, "lyap1_mean": -0.1966100037097931, "lyap1_max": -0.11787473410367966, "frac_above_star": 0.0 }, { "step": 487, "sup_loss": 0.43945334240033507, "rf_loss": 0.0, "total_loss": 0.43945334240033507, "lyap1_mean": -0.2015993744134903, "lyap1_max": -0.10837997496128082, "frac_above_star": 0.0 }, { "step": 488, "sup_loss": 0.625604220847771, "rf_loss": 0.0, "total_loss": 0.625604220847771, "lyap1_mean": -0.18927493691444397, "lyap1_max": -0.13037115335464478, "frac_above_star": 0.0 }, { "step": 489, "sup_loss": 0.4542147766218148, "rf_loss": 0.0, "total_loss": 0.4542147766218148, "lyap1_mean": -0.23917371034622192, "lyap1_max": -0.16002675890922546, "frac_above_star": 0.0 }, { "step": 490, "sup_loss": 0.5484596541851076, "rf_loss": 0.0, "total_loss": 0.5484596541851076, "lyap1_mean": -0.22205352783203125, "lyap1_max": -0.17208266258239746, "frac_above_star": 0.0 }, { "step": 491, "sup_loss": 0.5796549757431813, "rf_loss": 0.0, "total_loss": 0.5796549757431813, "lyap1_mean": -0.19787657260894775, "lyap1_max": -0.08027331531047821, "frac_above_star": 0.0 }, { "step": 492, "sup_loss": 0.7017277310690098, "rf_loss": 0.0, "total_loss": 0.7017277310690098, "lyap1_mean": -0.2054646611213684, "lyap1_max": -0.13146935403347015, "frac_above_star": 0.0 }, { "step": 493, "sup_loss": 0.524999132601167, "rf_loss": 0.0, "total_loss": 0.524999132601167, "lyap1_mean": -0.20288428664207458, "lyap1_max": -0.12655335664749146, "frac_above_star": 0.0 }, { "step": 494, "sup_loss": 0.6519588463532211, "rf_loss": 0.0, "total_loss": 0.6519588463532211, "lyap1_mean": -0.187330961227417, "lyap1_max": -0.0487985759973526, "frac_above_star": 0.0 }, { "step": 495, "sup_loss": 0.7896045312148756, "rf_loss": 0.0, "total_loss": 0.7896045312148756, "lyap1_mean": -0.17342408001422882, "lyap1_max": -0.08557955920696259, "frac_above_star": 0.0 }, { "step": 496, "sup_loss": 0.5254194586683845, "rf_loss": 0.0, "total_loss": 0.5254194586683845, "lyap1_mean": -0.1896812915802002, "lyap1_max": -0.12433528155088425, "frac_above_star": 0.0 }, { "step": 497, "sup_loss": 0.7277837074862891, "rf_loss": 0.0, "total_loss": 0.7277837074862891, "lyap1_mean": -0.20564937591552734, "lyap1_max": -0.15159422159194946, "frac_above_star": 0.0 }, { "step": 498, "sup_loss": 0.7733371556421542, "rf_loss": 0.0, "total_loss": 0.7733371556421542, "lyap1_mean": -0.19215822219848633, "lyap1_max": -0.08312106132507324, "frac_above_star": 0.0 }, { "step": 499, "sup_loss": 0.5344660911309098, "rf_loss": 0.0, "total_loss": 0.5344660911309098, "lyap1_mean": -0.19354604184627533, "lyap1_max": -0.031829528510570526, "frac_above_star": 0.0 } ], "evals": [ { "step": 0, "acc": 0.517578125, "tok_acc": 0.8276668595679012 }, { "step": 100, "acc": 0.572265625, "tok_acc": 0.8473427854938271 }, { "step": 200, "acc": 0.583984375, "tok_acc": 0.8522376543209876 }, { "step": 300, "acc": 0.615234375, "tok_acc": 0.8610869984567902 }, { "step": 400, "acc": 0.58984375, "tok_acc": 0.8527440200617284 }, { "step": 500, "acc": 0.611328125, "tok_acc": 0.8640769675925926 }, { "step": 500, "acc": 0.611328125, "tok_acc": 0.8640769675925926 } ], "final_acc": 0.611328125, "final_tok_acc": 0.8640769675925926 }