{ "args": { "ckpt_root": "/home/yurenh2/rrm/hrm/checkpoints/Sudoku-extreme-1k-aug-1000 ACT-torch/HierarchicalReasoningModel_ACTV1 righteous-python", "ckpt_name": "step_26040", "n_steps": 200, "batch_size": 8, "lr": 5e-06, "alpha_rf": 10.0, "lambda_star": -0.85, "k_lyap": 2, "lyap_act_steps": 4, "rf_mode": "fixed", "rf_eps": 1e-06, "seed": 42, "eval_every": 50, "eval_n": 512, "eval_batch_size": 32, "out": "/home/yurenh2/rrm/research/flossing/ab_rf.json" }, "initial_acc": 0.517578125, "initial_tok_acc": 0.8276668595679012, "steps": [ { "step": 0, "sup_loss": 0.5765840774308245, "rf_loss": 0.0188673734664917, "total_loss": 0.7652578120957415, "mean_lyap": -0.8058679103851318, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 1, "sup_loss": 0.40554469917943053, "rf_loss": 0.0057648103684186935, "total_loss": 0.46319280286361747, "mean_lyap": -0.8606383800506592, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 2, "sup_loss": 0.7296058169551144, "rf_loss": 0.015785561874508858, "total_loss": 0.8874614319749127, "mean_lyap": -0.7925797700881958, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 3, "sup_loss": 0.5326514314440994, "rf_loss": 0.010626970790326595, "total_loss": 0.6389211412100105, "mean_lyap": -0.8121544718742371, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 4, "sup_loss": 0.5782588876956446, "rf_loss": 0.015642518177628517, "total_loss": 0.7346840657466395, "mean_lyap": -0.7712883353233337, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 5, "sup_loss": 0.8227696935048122, "rf_loss": 0.018467212095856667, "total_loss": 1.0074418107380887, "mean_lyap": -0.7421821355819702, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.875 }, { "step": 6, "sup_loss": 0.6188131744701122, "rf_loss": 0.009561344981193542, "total_loss": 0.7144266242820476, "mean_lyap": -0.788561224937439, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 7, "sup_loss": 0.6447263690556088, "rf_loss": 0.016454031690955162, "total_loss": 0.8092666896904507, "mean_lyap": -0.7436193823814392, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.875 }, { "step": 8, "sup_loss": 0.8350695073343292, "rf_loss": 0.01805921457707882, "total_loss": 1.0156616568304075, "mean_lyap": -0.747126579284668, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.875 }, { "step": 9, "sup_loss": 0.8473975550740483, "rf_loss": 0.018726294860243797, "total_loss": 1.0346605074017767, "mean_lyap": -0.7429935932159424, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.875 }, { "step": 10, "sup_loss": 0.6606808108891549, "rf_loss": 0.013587037101387978, "total_loss": 0.7965511781777443, "mean_lyap": -0.7866835594177246, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 11, "sup_loss": 0.63067866316374, "rf_loss": 0.015567373484373093, "total_loss": 0.7863524054580515, "mean_lyap": -0.8150412440299988, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 12, "sup_loss": 0.42009245690532176, "rf_loss": 0.007377433590590954, "total_loss": 0.49386679467387645, "mean_lyap": -0.8051602840423584, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 13, "sup_loss": 0.7549789601332388, "rf_loss": 0.01539212092757225, "total_loss": 0.9089001768595419, "mean_lyap": -0.7535644769668579, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.875 }, { "step": 14, "sup_loss": 0.5930591245881306, "rf_loss": 0.009710620157420635, "total_loss": 0.6901653280249821, "mean_lyap": -0.8298624157905579, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 15, "sup_loss": 0.6888967057957366, "rf_loss": 0.009040959179401398, "total_loss": 0.7793062975897506, "mean_lyap": -0.8225681781768799, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 16, "sup_loss": 0.5512681465998905, "rf_loss": 0.01129273883998394, "total_loss": 0.6641955387250202, "mean_lyap": -0.7970694899559021, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 17, "sup_loss": 0.7051346908681223, "rf_loss": 0.013604645617306232, "total_loss": 0.8411811451785395, "mean_lyap": -0.7470482587814331, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 1.0 }, { "step": 18, "sup_loss": 0.5706506700775847, "rf_loss": 0.010291795246303082, "total_loss": 0.6735686244032607, "mean_lyap": -0.7999143600463867, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 19, "sup_loss": 0.5140771953697019, "rf_loss": 0.009903106838464737, "total_loss": 0.6131082637543492, "mean_lyap": -0.8433663845062256, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 20, "sup_loss": 0.6330896925310444, "rf_loss": 0.01402571052312851, "total_loss": 0.7733467977623295, "mean_lyap": -0.7908270359039307, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 21, "sup_loss": 0.6550339587133366, "rf_loss": 0.006650024093687534, "total_loss": 0.7215341977875668, "mean_lyap": -0.8017191290855408, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 22, "sup_loss": 0.6974606218591559, "rf_loss": 0.004491833969950676, "total_loss": 0.7423789615586627, "mean_lyap": -0.8529043197631836, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 23, "sup_loss": 0.6516045363274935, "rf_loss": 0.008527552708983421, "total_loss": 0.736880067142618, "mean_lyap": -0.7849105000495911, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.875 }, { "step": 24, "sup_loss": 0.7038636713393823, "rf_loss": 0.010556367225944996, "total_loss": 0.8094273417361871, "mean_lyap": -0.7658365964889526, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.875 }, { "step": 25, "sup_loss": 0.7385914636352537, "rf_loss": 0.011378636583685875, "total_loss": 0.8523778331974028, "mean_lyap": -0.7721314430236816, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 26, "sup_loss": 0.9184711394722027, "rf_loss": 0.009672008454799652, "total_loss": 1.0151912240201992, "mean_lyap": -0.7574284672737122, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 1.0 }, { "step": 27, "sup_loss": 0.5379478623015401, "rf_loss": 0.0028337787371128798, "total_loss": 0.5662856501383302, "mean_lyap": -0.9130557775497437, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 28, "sup_loss": 0.8321097197966094, "rf_loss": 0.018430069088935852, "total_loss": 1.016410410685968, "mean_lyap": -0.7524938583374023, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.875 }, { "step": 29, "sup_loss": 0.6580051011166252, "rf_loss": 0.006823045201599598, "total_loss": 0.7262355512699761, "mean_lyap": -0.8172051906585693, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 30, "sup_loss": 0.7026907211304697, "rf_loss": 0.006128185428678989, "total_loss": 0.7639725735546145, "mean_lyap": -0.8284720182418823, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 31, "sup_loss": 0.7111782013007493, "rf_loss": 0.01262273732572794, "total_loss": 0.8374055801459641, "mean_lyap": -0.7845479249954224, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 32, "sup_loss": 0.7769751564526539, "rf_loss": 0.011238861829042435, "total_loss": 0.8893637747430783, "mean_lyap": -0.7726147174835205, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.875 }, { "step": 33, "sup_loss": 0.6691901240099508, "rf_loss": 0.00915505737066269, "total_loss": 0.7607406977165777, "mean_lyap": -0.7760234475135803, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.875 }, { "step": 34, "sup_loss": 0.644363289681166, "rf_loss": 0.002750927349552512, "total_loss": 0.6718725636423524, "mean_lyap": -0.8608823418617249, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 35, "sup_loss": 0.5456849349717176, "rf_loss": 0.005364897195249796, "total_loss": 0.5993339059928929, "mean_lyap": -0.8570781350135803, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 36, "sup_loss": 0.6267922329648362, "rf_loss": 0.003588401945307851, "total_loss": 0.6626762519522534, "mean_lyap": -0.8452996015548706, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 37, "sup_loss": 0.860164007674845, "rf_loss": 0.008395137265324593, "total_loss": 0.9441153766028006, "mean_lyap": -0.77690589427948, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.875 }, { "step": 38, "sup_loss": 0.5987716705341, "rf_loss": 0.0041238958947360516, "total_loss": 0.640010630412783, "mean_lyap": -0.8743618726730347, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 39, "sup_loss": 0.8265189456842287, "rf_loss": 0.003278082702308893, "total_loss": 0.859299771775995, "mean_lyap": -0.8121100664138794, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 40, "sup_loss": 0.8077702268238799, "rf_loss": 0.008977587334811687, "total_loss": 0.8975461020346419, "mean_lyap": -0.7760306000709534, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.875 }, { "step": 41, "sup_loss": 0.5790201635319739, "rf_loss": 0.004197108559310436, "total_loss": 0.6209912509877235, "mean_lyap": -0.8581048250198364, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 42, "sup_loss": 0.7746859350804977, "rf_loss": 0.005175702273845673, "total_loss": 0.8264429578189544, "mean_lyap": -0.842041015625, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 43, "sup_loss": 0.7331061879104849, "rf_loss": 0.007015871815383434, "total_loss": 0.8032649079269644, "mean_lyap": -0.8373122215270996, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 44, "sup_loss": 0.869654493387017, "rf_loss": 0.005932656116783619, "total_loss": 0.928981052692208, "mean_lyap": -0.794861376285553, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 45, "sup_loss": 0.7347313761262009, "rf_loss": 0.002129987347871065, "total_loss": 0.756031248673589, "mean_lyap": -0.8495690226554871, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 46, "sup_loss": 0.7337837421752077, "rf_loss": 0.00745191378518939, "total_loss": 0.8083028772331339, "mean_lyap": -0.7664467096328735, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 1.0 }, { "step": 47, "sup_loss": 0.6650665995203973, "rf_loss": 0.0027223234064877033, "total_loss": 0.6922898326539517, "mean_lyap": -0.8546332120895386, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 48, "sup_loss": 0.6728695801522537, "rf_loss": 0.0034027229994535446, "total_loss": 0.7068968101467892, "mean_lyap": -0.8466753959655762, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 49, "sup_loss": 0.6627326494175514, "rf_loss": 0.0034537501633167267, "total_loss": 0.6972701510507187, "mean_lyap": -0.81462562084198, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75, "eval_acc": 0.501953125, "eval_tok_acc": 0.8258825231481481 }, { "step": 50, "sup_loss": 0.6882688690824927, "rf_loss": 0.004383894149214029, "total_loss": 0.7321078096433105, "mean_lyap": -0.8475438356399536, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 51, "sup_loss": 0.7352788257973389, "rf_loss": 0.004841075744479895, "total_loss": 0.7836895841734605, "mean_lyap": -0.8208181858062744, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 52, "sup_loss": 0.5743374201962224, "rf_loss": 0.0043980712071061134, "total_loss": 0.6183181304046383, "mean_lyap": -0.8833464980125427, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 53, "sup_loss": 0.6902312712113531, "rf_loss": 0.0017992472276091576, "total_loss": 0.7082237434874447, "mean_lyap": -0.8604968786239624, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 54, "sup_loss": 0.6803814939750245, "rf_loss": 0.002090118359774351, "total_loss": 0.7012826785040905, "mean_lyap": -0.854358434677124, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 55, "sup_loss": 0.595873137691564, "rf_loss": 0.0007154205814003944, "total_loss": 0.603027343505568, "mean_lyap": -0.8682422637939453, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 56, "sup_loss": 0.6642178889411797, "rf_loss": 0.0020344697404652834, "total_loss": 0.6845625858801713, "mean_lyap": -0.8675365447998047, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 57, "sup_loss": 0.7082779751524824, "rf_loss": 0.002637912053614855, "total_loss": 0.7346570947573083, "mean_lyap": -0.8571688532829285, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 58, "sup_loss": 0.9503993268684144, "rf_loss": 0.002218063920736313, "total_loss": 0.9725799660757776, "mean_lyap": -0.8307374119758606, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.875 }, { "step": 59, "sup_loss": 0.514957090437054, "rf_loss": 0.004192134365439415, "total_loss": 0.5568784340914481, "mean_lyap": -0.8466053605079651, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 60, "sup_loss": 0.7337269250892405, "rf_loss": 0.0026380610652267933, "total_loss": 0.7601075348101859, "mean_lyap": -0.8249342441558838, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 61, "sup_loss": 0.6457141234391504, "rf_loss": 0.003588218940421939, "total_loss": 0.681596313309031, "mean_lyap": -0.8772332072257996, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 62, "sup_loss": 0.6506520749543354, "rf_loss": 0.0017656260170042515, "total_loss": 0.6683083341930554, "mean_lyap": -0.8678171634674072, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 63, "sup_loss": 0.8176543999352315, "rf_loss": 0.0010715246899053454, "total_loss": 0.8283696470671156, "mean_lyap": -0.856634259223938, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 64, "sup_loss": 0.7193349828825767, "rf_loss": 0.0008531392668373883, "total_loss": 0.7278663754345353, "mean_lyap": -0.8669513463973999, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 65, "sup_loss": 0.890794052989882, "rf_loss": 0.0030753673054277897, "total_loss": 0.9215477251128373, "mean_lyap": -0.8245968818664551, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 66, "sup_loss": 0.669179298339029, "rf_loss": 0.0008702079649083316, "total_loss": 0.6778813781045276, "mean_lyap": -0.8781542778015137, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 67, "sup_loss": 0.7648352138231196, "rf_loss": 0.0006933381664566696, "total_loss": 0.7717685956041016, "mean_lyap": -0.8727739453315735, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 68, "sup_loss": 0.6999706120344925, "rf_loss": 0.0015010021161288023, "total_loss": 0.7149806336614418, "mean_lyap": -0.8707051277160645, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 69, "sup_loss": 0.9418434380324208, "rf_loss": 0.0017435763729736209, "total_loss": 0.959279201063665, "mean_lyap": -0.8469928503036499, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.875 }, { "step": 70, "sup_loss": 0.7006143229115153, "rf_loss": 0.0020230370573699474, "total_loss": 0.7208446944165373, "mean_lyap": -0.8506982922554016, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 71, "sup_loss": 0.8045005220383133, "rf_loss": 0.0029563107527792454, "total_loss": 0.8340636286347832, "mean_lyap": -0.8255416750907898, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.875 }, { "step": 72, "sup_loss": 0.5909958039108959, "rf_loss": 0.000791383848991245, "total_loss": 0.5989096420515624, "mean_lyap": -0.8960390090942383, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 73, "sup_loss": 0.7791527680286758, "rf_loss": 0.0012979984749108553, "total_loss": 0.7921327523121231, "mean_lyap": -0.8992996215820312, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 74, "sup_loss": 0.7237759233288961, "rf_loss": 0.003918964881449938, "total_loss": 0.7629655712120729, "mean_lyap": -0.883576512336731, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 75, "sup_loss": 0.7495548237028731, "rf_loss": 0.003698775079101324, "total_loss": 0.7865425754252089, "mean_lyap": -0.8133399486541748, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.875 }, { "step": 76, "sup_loss": 0.8387171345259399, "rf_loss": 0.000946269603446126, "total_loss": 0.8481798300947399, "mean_lyap": -0.890516996383667, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 77, "sup_loss": 0.6733659814251263, "rf_loss": 0.0012616110034286976, "total_loss": 0.6859820914594132, "mean_lyap": -0.8804075717926025, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 78, "sup_loss": 0.6498098301149544, "rf_loss": 0.0013569702859967947, "total_loss": 0.6633795334405836, "mean_lyap": -0.8641673922538757, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 79, "sup_loss": 0.7837405819809202, "rf_loss": 0.003930794075131416, "total_loss": 0.8230485227322344, "mean_lyap": -0.8169339895248413, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.875 }, { "step": 80, "sup_loss": 0.7228979195130653, "rf_loss": 0.0015914338873699307, "total_loss": 0.7388122590852565, "mean_lyap": -0.8627505302429199, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 81, "sup_loss": 0.512824455845056, "rf_loss": 0.0014878996880725026, "total_loss": 0.5277034524929504, "mean_lyap": -0.892520546913147, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 82, "sup_loss": 0.6486249230331146, "rf_loss": 0.0009839815320447087, "total_loss": 0.658464738120731, "mean_lyap": -0.8969285488128662, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 83, "sup_loss": 0.7256714011449372, "rf_loss": 0.0012018897105008364, "total_loss": 0.7376902977842843, "mean_lyap": -0.8888238668441772, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 84, "sup_loss": 0.7549937936440195, "rf_loss": 0.0016620211536064744, "total_loss": 0.7716140049472536, "mean_lyap": -0.8613144159317017, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 85, "sup_loss": 0.7208673455028051, "rf_loss": 0.003234194591641426, "total_loss": 0.7532092914192193, "mean_lyap": -0.8572639226913452, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 86, "sup_loss": 0.78733164410316, "rf_loss": 0.0003821868449449539, "total_loss": 0.7911535125526096, "mean_lyap": -0.9119746685028076, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 87, "sup_loss": 0.7460947798003501, "rf_loss": 0.0010051638819277287, "total_loss": 0.7561464186196274, "mean_lyap": -0.8535745143890381, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 88, "sup_loss": 0.8429616427629429, "rf_loss": 0.0019365833140909672, "total_loss": 0.86232747497253, "mean_lyap": -0.84560227394104, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 89, "sup_loss": 0.7729191359746813, "rf_loss": 0.0007418215391226113, "total_loss": 0.7803373512494921, "mean_lyap": -0.9108904004096985, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 90, "sup_loss": 0.6472762192297998, "rf_loss": 0.0025497586466372013, "total_loss": 0.6727738047648493, "mean_lyap": -0.8673484325408936, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 91, "sup_loss": 0.7268315836183069, "rf_loss": 0.0027970762457698584, "total_loss": 0.7548023465416668, "mean_lyap": -0.8777827620506287, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 92, "sup_loss": 0.8650996847170713, "rf_loss": 0.0013330209767445922, "total_loss": 0.8784298947173479, "mean_lyap": -0.8683897852897644, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 93, "sup_loss": 0.6219829422071615, "rf_loss": 0.00327981635928154, "total_loss": 0.654781105799977, "mean_lyap": -0.8831396102905273, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 94, "sup_loss": 0.7396657856699419, "rf_loss": 0.0007561829988844693, "total_loss": 0.7472276155423713, "mean_lyap": -0.858811616897583, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 95, "sup_loss": 0.6485665339088734, "rf_loss": 0.0004259114502929151, "total_loss": 0.6528256485282179, "mean_lyap": -0.9049522876739502, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 96, "sup_loss": 0.7588329886284089, "rf_loss": 0.0001585835125297308, "total_loss": 0.7604188237537062, "mean_lyap": -0.8950439691543579, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.5 }, { "step": 97, "sup_loss": 0.5817993282506224, "rf_loss": 0.0007148263975977898, "total_loss": 0.5889475922266003, "mean_lyap": -0.8832213282585144, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 98, "sup_loss": 0.7425204173943035, "rf_loss": 0.0005265326471999288, "total_loss": 0.7477857436334722, "mean_lyap": -0.9243374466896057, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 99, "sup_loss": 0.6873691285748474, "rf_loss": 8.11655081633944e-06, "total_loss": 0.6874502940793729, "mean_lyap": -0.9182790517807007, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25, "eval_acc": 0.49609375, "eval_tok_acc": 0.8252797067901234 }, { "step": 100, "sup_loss": 0.6026084183219523, "rf_loss": 0.0004853458667639643, "total_loss": 0.6074618769313843, "mean_lyap": -0.9124417304992676, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 101, "sup_loss": 0.6220611178877565, "rf_loss": 0.0004740226431749761, "total_loss": 0.6268013444359216, "mean_lyap": -0.8781635761260986, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 102, "sup_loss": 0.6987778955866084, "rf_loss": 0.0006725198472850025, "total_loss": 0.7055030941758738, "mean_lyap": -0.9354679584503174, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 103, "sup_loss": 0.767754078471799, "rf_loss": 0.0006385964807122946, "total_loss": 0.7741400432789219, "mean_lyap": -0.8678494691848755, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.75 }, { "step": 104, "sup_loss": 0.8160985431055674, "rf_loss": 0.0003366229357197881, "total_loss": 0.8194647724627653, "mean_lyap": -0.877155065536499, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 105, "sup_loss": 0.7349091845713341, "rf_loss": 0.003131158882752061, "total_loss": 0.7662207747958386, "mean_lyap": -0.845853328704834, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 106, "sup_loss": 0.74589114177769, "rf_loss": 0.00018192798597738147, "total_loss": 0.7477104216374638, "mean_lyap": -0.901712954044342, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 107, "sup_loss": 0.6818353474665824, "rf_loss": 0.0024454190861433744, "total_loss": 0.7062895387936774, "mean_lyap": -0.8897325992584229, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 108, "sup_loss": 0.6976428133612792, "rf_loss": 0.00034954847069457173, "total_loss": 0.7011382979518096, "mean_lyap": -0.9129797220230103, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 109, "sup_loss": 0.8553529329252825, "rf_loss": 0.0001104350303648971, "total_loss": 0.8564572832434834, "mean_lyap": -0.911565899848938, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 110, "sup_loss": 0.7512660300233496, "rf_loss": 0.00010126684355782345, "total_loss": 0.7522786985025836, "mean_lyap": -0.8916236758232117, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 111, "sup_loss": 0.8306927707564853, "rf_loss": 0.0005017618532292545, "total_loss": 0.8357103894051932, "mean_lyap": -0.8902592658996582, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 112, "sup_loss": 0.8014963296245178, "rf_loss": 0.0018839503172785044, "total_loss": 0.8203358323316415, "mean_lyap": -0.849699854850769, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 113, "sup_loss": 0.6868572114680728, "rf_loss": 0.0007329108193516731, "total_loss": 0.6941863196615895, "mean_lyap": -0.872833251953125, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.625 }, { "step": 114, "sup_loss": 0.5947612592092519, "rf_loss": 0.0003032636595889926, "total_loss": 0.5977938958051419, "mean_lyap": -0.9618325233459473, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 115, "sup_loss": 0.7042847137019506, "rf_loss": 0.0, "total_loss": 0.7042847137019506, "mean_lyap": -0.9470847845077515, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 116, "sup_loss": 0.7489247878014463, "rf_loss": 0.0008320758352056146, "total_loss": 0.7572455459206718, "mean_lyap": -0.898413896560669, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 117, "sup_loss": 0.876237977646276, "rf_loss": 2.0203569874865934e-05, "total_loss": 0.8764400133523006, "mean_lyap": -0.9036564826965332, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 118, "sup_loss": 0.653222449990118, "rf_loss": 9.613390284357592e-05, "total_loss": 0.6541837890331057, "mean_lyap": -0.9079935550689697, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 119, "sup_loss": 0.6358519552300581, "rf_loss": 5.34353603143245e-05, "total_loss": 0.6363863088332014, "mean_lyap": -0.9442797899246216, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 120, "sup_loss": 0.8665854133898904, "rf_loss": 0.0, "total_loss": 0.8665854133898904, "mean_lyap": -0.8926280736923218, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 121, "sup_loss": 0.8598103150897419, "rf_loss": 0.0006828162586316466, "total_loss": 0.866638477908889, "mean_lyap": -0.8766176700592041, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 122, "sup_loss": 0.8078568441048074, "rf_loss": 0.0004030819109175354, "total_loss": 0.8118876631557751, "mean_lyap": -0.8897646069526672, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 123, "sup_loss": 0.9200362731816376, "rf_loss": 0.00048203484038822353, "total_loss": 0.9248566214108969, "mean_lyap": -0.8854799270629883, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 124, "sup_loss": 0.9848050393934372, "rf_loss": 0.00012617840548045933, "total_loss": 0.9860668233900342, "mean_lyap": -0.8772153854370117, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 125, "sup_loss": 0.6607478220181227, "rf_loss": 0.0005259730387479067, "total_loss": 0.6660075524056017, "mean_lyap": -0.9292822480201721, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 126, "sup_loss": 0.6867021993540716, "rf_loss": 7.451939018210396e-05, "total_loss": 0.6874473932704446, "mean_lyap": -0.9073169827461243, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 127, "sup_loss": 0.6364257130573185, "rf_loss": 0.0, "total_loss": 0.6364257130573185, "mean_lyap": -0.9700829982757568, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 128, "sup_loss": 0.6242236350181207, "rf_loss": 0.000526409363374114, "total_loss": 0.6294877286518619, "mean_lyap": -0.8782105445861816, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 129, "sup_loss": 0.7518952417691622, "rf_loss": 5.401653652370442e-06, "total_loss": 0.7519492583038669, "mean_lyap": -0.9081242084503174, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 130, "sup_loss": 0.7010888911268471, "rf_loss": 0.0005437328945845366, "total_loss": 0.7065262200726925, "mean_lyap": -0.9411056041717529, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 131, "sup_loss": 0.6262936821470324, "rf_loss": 5.3317453421186656e-06, "total_loss": 0.6263469996004536, "mean_lyap": -0.9436657428741455, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 132, "sup_loss": 0.6594826955787076, "rf_loss": 0.0, "total_loss": 0.6594826955787076, "mean_lyap": -0.959723949432373, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 133, "sup_loss": 0.7808365199441274, "rf_loss": 0.0001904903765534982, "total_loss": 0.7827414237387662, "mean_lyap": -0.9030304551124573, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 134, "sup_loss": 0.6615815674486567, "rf_loss": 9.443930321140215e-05, "total_loss": 0.6625259604953226, "mean_lyap": -0.9540624618530273, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 135, "sup_loss": 0.9383803996531257, "rf_loss": 5.5584264373464976e-06, "total_loss": 0.9384359839165897, "mean_lyap": -0.895117998123169, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 136, "sup_loss": 0.6256120798884699, "rf_loss": 0.0001487397530581802, "total_loss": 0.6270994774772594, "mean_lyap": -0.9466730356216431, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 137, "sup_loss": 0.7893132553639189, "rf_loss": 8.546098251827061e-05, "total_loss": 0.7901678651891016, "mean_lyap": -0.926414966583252, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 138, "sup_loss": 0.6373277113802505, "rf_loss": 0.0, "total_loss": 0.6373277113802505, "mean_lyap": -0.9512477517127991, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 139, "sup_loss": 0.7214324678174807, "rf_loss": 2.2458484636445064e-06, "total_loss": 0.7214549263012077, "mean_lyap": -0.9204102754592896, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 140, "sup_loss": 0.8744445381065415, "rf_loss": 1.2479569704737514e-05, "total_loss": 0.8745693338035889, "mean_lyap": -0.8943758010864258, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 141, "sup_loss": 0.9106080119595603, "rf_loss": 0.00022716728562954813, "total_loss": 0.9128796849031673, "mean_lyap": -0.8702834844589233, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 142, "sup_loss": 0.6605944012717532, "rf_loss": 5.409423101809807e-05, "total_loss": 0.6611353435746582, "mean_lyap": -0.9433302879333496, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 143, "sup_loss": 0.6644375708800444, "rf_loss": 0.0, "total_loss": 0.6644375708800444, "mean_lyap": -0.9677567481994629, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 144, "sup_loss": 0.8626739651198232, "rf_loss": 0.000472456740681082, "total_loss": 0.8673985324102187, "mean_lyap": -0.8641602993011475, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.375 }, { "step": 145, "sup_loss": 0.82435230048377, "rf_loss": 0.00033521762816235423, "total_loss": 0.8277044768818088, "mean_lyap": -0.8977236747741699, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 146, "sup_loss": 0.5942559147617289, "rf_loss": 0.0, "total_loss": 0.5942559147617289, "mean_lyap": -0.9904095530509949, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 147, "sup_loss": 0.6775069135795322, "rf_loss": 0.0012124822242185473, "total_loss": 0.6896317360545483, "mean_lyap": -0.9161025285720825, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 148, "sup_loss": 0.7089058125671526, "rf_loss": 5.499004487319326e-07, "total_loss": 0.7089113115717536, "mean_lyap": -0.9259845018386841, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 149, "sup_loss": 0.6823098888984611, "rf_loss": 7.607099519191252e-07, "total_loss": 0.682317495998094, "mean_lyap": -0.9467276930809021, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125, "eval_acc": 0.470703125, "eval_tok_acc": 0.8197096836419753 }, { "step": 150, "sup_loss": 0.5880605189294362, "rf_loss": 0.0, "total_loss": 0.5880605189294362, "mean_lyap": -1.0149933099746704, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 151, "sup_loss": 0.5608997467994814, "rf_loss": 0.00025979886413551867, "total_loss": 0.5634977353826289, "mean_lyap": -0.9140228033065796, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 152, "sup_loss": 0.770011182713256, "rf_loss": 0.00036662607453763485, "total_loss": 0.7736774434586323, "mean_lyap": -0.9008445739746094, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 153, "sup_loss": 0.7527060619298268, "rf_loss": 0.0, "total_loss": 0.7527060619298268, "mean_lyap": -0.9543828368186951, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 154, "sup_loss": 0.8604835750154125, "rf_loss": 0.00045156461419537663, "total_loss": 0.864999221040951, "mean_lyap": -0.8754521608352661, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 155, "sup_loss": 0.6627886082106433, "rf_loss": 8.739302575122565e-05, "total_loss": 0.6636625384972594, "mean_lyap": -0.9325603246688843, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 156, "sup_loss": 0.7936160388567672, "rf_loss": 1.1148687917739153e-05, "total_loss": 0.7937275257359446, "mean_lyap": -0.9105346202850342, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 157, "sup_loss": 0.8559562711499866, "rf_loss": 3.2170348276849836e-05, "total_loss": 0.856277974647307, "mean_lyap": -0.9146195650100708, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 158, "sup_loss": 1.1579173010988004, "rf_loss": 0.0, "total_loss": 1.1579173010988004, "mean_lyap": -0.9106019139289856, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 159, "sup_loss": 0.7768453036590028, "rf_loss": 2.2159605578053743e-05, "total_loss": 0.7770668997147834, "mean_lyap": -0.91521155834198, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 160, "sup_loss": 0.8526309708666, "rf_loss": 0.0, "total_loss": 0.8526309708666, "mean_lyap": -0.9097278714179993, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 161, "sup_loss": 0.5008964067830873, "rf_loss": 4.362715480965562e-05, "total_loss": 0.5013326783239079, "mean_lyap": -0.9181713461875916, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 162, "sup_loss": 0.5992556645198497, "rf_loss": 0.0, "total_loss": 0.5992556645198497, "mean_lyap": -0.9893726110458374, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 163, "sup_loss": 0.9138912274150771, "rf_loss": 0.0, "total_loss": 0.9138912274150771, "mean_lyap": -0.9009734392166138, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 164, "sup_loss": 0.5685104715166784, "rf_loss": 7.916953472886235e-05, "total_loss": 0.5693021668348632, "mean_lyap": -0.9717569351196289, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 165, "sup_loss": 0.6171784802888035, "rf_loss": 0.0, "total_loss": 0.6171784802888035, "mean_lyap": -0.9582620859146118, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 166, "sup_loss": 0.8162310645315405, "rf_loss": 0.0004606795555446297, "total_loss": 0.8208378600287791, "mean_lyap": -0.8890138864517212, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 167, "sup_loss": 0.9108215564133297, "rf_loss": 0.0, "total_loss": 0.9108215564133297, "mean_lyap": -0.932681679725647, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 168, "sup_loss": 0.7919173869680999, "rf_loss": 9.947708167601377e-05, "total_loss": 0.7929121577557562, "mean_lyap": -0.8980196714401245, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 169, "sup_loss": 0.7066477397933514, "rf_loss": 1.0202940757153556e-05, "total_loss": 0.7067497692009229, "mean_lyap": -0.9571099281311035, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 170, "sup_loss": 0.7139214627311085, "rf_loss": 0.0, "total_loss": 0.7139214627311085, "mean_lyap": -0.945033848285675, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 171, "sup_loss": 0.7709420698813313, "rf_loss": 0.0, "total_loss": 0.7709420698813313, "mean_lyap": -0.9268935918807983, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 172, "sup_loss": 0.7228295302931781, "rf_loss": 0.0, "total_loss": 0.7228295302931781, "mean_lyap": -0.9544382691383362, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 173, "sup_loss": 0.5613587950956674, "rf_loss": 0.0, "total_loss": 0.5613587950956674, "mean_lyap": -0.9500914216041565, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 174, "sup_loss": 0.8143955457077544, "rf_loss": 0.0, "total_loss": 0.8143955457077544, "mean_lyap": -0.9618834853172302, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 175, "sup_loss": 0.7053880198605798, "rf_loss": 3.6345554690342396e-05, "total_loss": 0.7057514754220351, "mean_lyap": -0.9382758140563965, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 176, "sup_loss": 0.8231483867413522, "rf_loss": 0.0007249140762723982, "total_loss": 0.8303975273876608, "mean_lyap": -0.8953840732574463, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 177, "sup_loss": 0.7462800069585852, "rf_loss": 0.0, "total_loss": 0.7462800069585852, "mean_lyap": -0.9380788803100586, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 178, "sup_loss": 0.679239566645776, "rf_loss": 0.00017107199528254569, "total_loss": 0.6809502865403938, "mean_lyap": -0.9349449872970581, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 179, "sup_loss": 0.7266091879144229, "rf_loss": 6.751439286745153e-06, "total_loss": 0.7266767023109283, "mean_lyap": -0.9303713440895081, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 180, "sup_loss": 0.7539549592732316, "rf_loss": 2.5886556613841094e-05, "total_loss": 0.7542138248357321, "mean_lyap": -0.9419723153114319, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 181, "sup_loss": 0.5703976586739969, "rf_loss": 0.0, "total_loss": 0.5703976586739969, "mean_lyap": -0.9483802318572998, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 182, "sup_loss": 0.7608988161297702, "rf_loss": 2.3554461222374812e-05, "total_loss": 0.761134360734718, "mean_lyap": -0.9507160186767578, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 183, "sup_loss": 0.7900601838013458, "rf_loss": 3.0407780286623165e-05, "total_loss": 0.790364261611488, "mean_lyap": -0.9561895132064819, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 184, "sup_loss": 0.44977169118096466, "rf_loss": 0.0, "total_loss": 0.44977169118096466, "mean_lyap": -0.9784150123596191, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 185, "sup_loss": 0.6665112013097232, "rf_loss": 0.0, "total_loss": 0.6665112013097232, "mean_lyap": -1.0041429996490479, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 186, "sup_loss": 0.6233770500298779, "rf_loss": 0.0, "total_loss": 0.6233770500298779, "mean_lyap": -0.9526543617248535, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 187, "sup_loss": 0.7298426783748505, "rf_loss": 0.0, "total_loss": 0.7298426783748505, "mean_lyap": -0.9848892092704773, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 188, "sup_loss": 0.7994810007461031, "rf_loss": 0.00028055161237716675, "total_loss": 0.8022865168698747, "mean_lyap": -0.9289549589157104, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 189, "sup_loss": 0.9004618817356048, "rf_loss": 0.00013723062875214964, "total_loss": 0.9018341879940225, "mean_lyap": -0.9448005557060242, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 190, "sup_loss": 0.7561349029708767, "rf_loss": 1.4175058993259881e-07, "total_loss": 0.7561363204768045, "mean_lyap": -0.913082480430603, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 191, "sup_loss": 0.8108956146054335, "rf_loss": 0.0, "total_loss": 0.8108956146054335, "mean_lyap": -0.943326473236084, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 192, "sup_loss": 0.7575437858379497, "rf_loss": 0.00023609009804204106, "total_loss": 0.7599046867019548, "mean_lyap": -0.8917972445487976, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 193, "sup_loss": 0.512322704611355, "rf_loss": 0.00016364955808967352, "total_loss": 0.5139592001922517, "mean_lyap": -0.9673264622688293, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 194, "sup_loss": 0.9945017941952325, "rf_loss": 0.0, "total_loss": 0.9945017941952325, "mean_lyap": -0.926647424697876, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 195, "sup_loss": 0.6566390093757337, "rf_loss": 0.0, "total_loss": 0.6566390093757337, "mean_lyap": -0.9722451567649841, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 196, "sup_loss": 0.8823300548771821, "rf_loss": 0.0, "total_loss": 0.8823300548771821, "mean_lyap": -0.9026472568511963, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0 }, { "step": 197, "sup_loss": 0.6761996844994566, "rf_loss": 0.00010285572352586314, "total_loss": 0.6772282416910594, "mean_lyap": -0.9098778963088989, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.25 }, { "step": 198, "sup_loss": 0.6647835467672074, "rf_loss": 1.9416085706325248e-05, "total_loss": 0.6649777076169947, "mean_lyap": -0.9130200147628784, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.125 }, { "step": 199, "sup_loss": 0.8157799126017244, "rf_loss": 0.0, "total_loss": 0.8157799126017244, "mean_lyap": -0.948731541633606, "lam_star": -0.8500000238418579, "excess_frac_nonzero": 0.0, "eval_acc": 0.466796875, "eval_tok_acc": 0.818311149691358 } ], "final_acc": 0.466796875, "final_tok_acc": 0.818311149691358 }