{ "args": { "model": "trm", "ckpt_root": "/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro", "ckpt_name": "__random__", "train_steps": 2, "batch_size": 8, "task_batch_size": 8, "floss_batch_size": 2, "train_lr": 0.0001, "floss_lr": 0.0001, "floss_steps": 1, "interfloss_at": "0", "interfloss_every": 1, "interfloss_start": 1, "interfloss_stop": 1, "floss_mode": "engelken_l2", "lambda_star": 0.0, "k_lyap": 1, "lyap_act_steps": 1, "lyap_start_act": 0, "seed": 42, "eval_every": 1, "eval_n": 8, "eval_batch_size": 8, "floss_log_every": 1, "eval_after_floss": false, "kl_beta": 0.0, "kl_replay_size": 64, "kl_batch_size": 8, "kl_temperature": 1.0, "init_seed": 123, "train_puzzle_emb": true, "puzzle_emb_lr": 0.0001, "puzzle_emb_weight_decay": 1.0, "out": "research/flossing/flossing_suite/results/smoke/trm_step7_decoupled_periodic_smoke.json" }, "initial_acc": 0.0, "initial_tok_acc": 0.07561728395061729, "interfloss_steps": [ 0, 1 ], "task_steps": [ { "train_step": 1, "sup_loss": 2.57209548232992 }, { "train_step": 2, "sup_loss": 2.56865356540629 } ], "floss_episodes": [ { "episode": 0, "train_step": 0, "steps": [ { "step": 0, "loss": 0.04431530460715294, "floss_loss": 0.04431530460715294, "kl_loss": 0.0, "lyap1_mean": 0.21050173044204712, "lyap1_max": 0.2125818431377411, "lyap_mean": 0.21050173044204712, "volume_mean": 0.21050173044204712, "volume_max": 0.2125818431377411, "frac_active": 1.0 } ] }, { "episode": 1, "train_step": 1, "steps": [ { "step": 0, "loss": 0.04459226503968239, "floss_loss": 0.04459226503968239, "kl_loss": 0.0, "lyap1_mean": 0.2111663520336151, "lyap1_max": 0.21218420565128326, "lyap_mean": 0.2111663520336151, "volume_mean": 0.2111663520336151, "volume_max": 0.21218420565128326, "frac_active": 1.0 } ] } ], "evals": [ { "kind": "initial", "train_step": 0, "acc": 0.0, "tok_acc": 0.07561728395061729 }, { "kind": "task", "train_step": 1, "acc": 0.0, "tok_acc": 0.07253086419753087 }, { "kind": "task", "train_step": 2, "acc": 0.0, "tok_acc": 0.08796296296296297 }, { "kind": "final", "train_step": 2, "acc": 0.0, "tok_acc": 0.08796296296296297 } ], "final_acc": 0.0, "final_tok_acc": 0.08796296296296297 }