{ "args": { "model": "trm", "ckpt_root": "/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro", "ckpt_name": "__random__", "train_steps": 1, "batch_size": 32, "task_batch_size": 32, "floss_batch_size": 4, "train_lr": 0.0001, "floss_lr": 0.0001, "floss_steps": 0, "interfloss_at": "", "interfloss_every": 0, "interfloss_start": 0, "interfloss_stop": -1, "floss_mode": "engelken_l2", "lambda_star": 0.0, "k_lyap": 4, "lyap_act_steps": 4, "lyap_start_act": 0, "seed": 43, "eval_every": 1, "eval_n": 8, "eval_batch_size": 8, "floss_log_every": 1, "eval_after_floss": false, "kl_beta": 0.0, "kl_replay_size": 64, "kl_batch_size": 8, "kl_temperature": 1.0, "init_seed": 123, "train_puzzle_emb": true, "puzzle_emb_lr": 0.0001, "puzzle_emb_weight_decay": 1.0, "out": "research/flossing/flossing_suite/results/smoke/trm_task_batch32_smoke.json" }, "initial_acc": 0.0, "initial_tok_acc": 0.07561728395061729, "interfloss_steps": [], "task_steps": [ { "train_step": 1, "sup_loss": 2.581977193130616 } ], "floss_episodes": [], "evals": [ { "kind": "initial", "train_step": 0, "acc": 0.0, "tok_acc": 0.07561728395061729 }, { "kind": "task", "train_step": 1, "acc": 0.0, "tok_acc": 0.09722222222222222 }, { "kind": "final", "train_step": 1, "acc": 0.0, "tok_acc": 0.09722222222222222 } ], "final_acc": 0.0, "final_tok_acc": 0.09722222222222222 }