{ "args": { "model": "trm", "ckpt_root": "/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_singleGPU", "ckpt_name": "step_26041", "mode": "multi_perturbed_ce", "train_steps": 2, "batch_size": 2, "lr": 1e-05, "noise_std": 0.001, "noise_min": null, "noise_max": null, "noise_sampling": "normal", "clean_prob": 0.0, "sigma_start": null, "sigma_ramp_steps": 0, "n_trajectories": 2, "rollout_impl": "parallel_fixed", "perturb": "both", "seed": 777, "eval_every": 1, "eval_n": 8, "eval_batch_size": 8, "out": "smoke_resume_step9_part2.json", "save_dir": null, "save_best": true, "save_final": true, "save_every_eval": false, "save_train_state": true, "resume_state": "smoke_resume_step9_part1_ckpts/latest_state.pt" }, "initial_acc": 0.375, "initial_tok_acc": 0.7577160493827161, "steps": [ { "train_step": 2, "loss": 0.4363347887992859, "clean_loss": 0.4366205930709839, "noisy_loss_mean": 0.4360489547252655, "noise_std_target": 0.001, "noise_std_mean": 0.0010000000474974513, "noise_std_max": 0.0010000000474974513, "effective_batch": 4 } ], "evals": [ { "kind": "initial", "train_step": 0, "acc": 0.375, "tok_acc": 0.7577160493827161 }, { "kind": "task", "train_step": 2, "acc": 0.375, "tok_acc": 0.7777777777777778 }, { "kind": "final", "train_step": 2, "acc": 0.375, "tok_acc": 0.7777777777777778 } ], "checkpoints": [ { "kind": "best", "train_step": 2, "acc": 0.375, "path": "smoke_resume_step9_part2_ckpts/best.pt" }, { "kind": "best_state", "train_step": 2, "acc": 0.375, "path": "smoke_resume_step9_part2_ckpts/best_state.pt" }, { "kind": "latest_state", "train_step": 2, "acc": 0.375, "path": "smoke_resume_step9_part2_ckpts/latest_state.pt" }, { "kind": "final", "train_step": 2, "acc": 0.375, "path": "smoke_resume_step9_part2_ckpts/final.pt" }, { "kind": "final_state", "train_step": 2, "acc": 0.375, "path": "smoke_resume_step9_part2_ckpts/final_state.pt" } ], "resume_state": "smoke_resume_step9_part1_ckpts/latest_state.pt", "resume_step": 1, "best_acc": 0.375, "best_step": 2, "best_checkpoint": "smoke_resume_step9_part2_ckpts/best.pt", "best_state_checkpoint": "smoke_resume_step9_part2_ckpts/best_state.pt", "latest_state_checkpoint": "smoke_resume_step9_part2_ckpts/latest_state.pt", "final_acc": 0.375, "final_tok_acc": 0.7777777777777778, "final_checkpoint": "smoke_resume_step9_part2_ckpts/final.pt", "final_state_checkpoint": "smoke_resume_step9_part2_ckpts/final_state.pt" }