From 66e0d8b9fd4d0f7a2231d689c055e26fdf1cf04a Mon Sep 17 00:00:00 2001 From: YurenHao0426 Date: Sat, 13 Jun 2026 12:35:36 -0500 Subject: rrm workspace: TRM/HRM/SRM code, Maze dataset, dynamical-analysis pipeline Curated export for clone-and-run Maze training (2x A6000) + diagnostics. trm/hrm pretrain.py carry trajectory-augmentation code (backward-compatible). Heavy artifacts (checkpoints/wandb/npz) gitignored; see PROVENANCE.md. Co-Authored-By: Claude Fable 5 --- research/flossing/smoke_resume_step9_part2.json | 109 ++++++++++++++++++++++++ 1 file changed, 109 insertions(+) create mode 100644 research/flossing/smoke_resume_step9_part2.json (limited to 'research/flossing/smoke_resume_step9_part2.json') diff --git a/research/flossing/smoke_resume_step9_part2.json b/research/flossing/smoke_resume_step9_part2.json new file mode 100644 index 0000000..c97bf02 --- /dev/null +++ b/research/flossing/smoke_resume_step9_part2.json @@ -0,0 +1,109 @@ +{ + "args": { + "model": "trm", + "ckpt_root": "/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_singleGPU", + "ckpt_name": "step_26041", + "mode": "multi_perturbed_ce", + "train_steps": 2, + "batch_size": 2, + "lr": 1e-05, + "noise_std": 0.001, + "noise_min": null, + "noise_max": null, + "noise_sampling": "normal", + "clean_prob": 0.0, + "sigma_start": null, + "sigma_ramp_steps": 0, + "n_trajectories": 2, + "rollout_impl": "parallel_fixed", + "perturb": "both", + "seed": 777, + "eval_every": 1, + "eval_n": 8, + "eval_batch_size": 8, + "out": "smoke_resume_step9_part2.json", + "save_dir": null, + "save_best": true, + "save_final": true, + "save_every_eval": false, + "save_train_state": true, + "resume_state": "smoke_resume_step9_part1_ckpts/latest_state.pt" + }, + "initial_acc": 0.375, + "initial_tok_acc": 0.7577160493827161, + "steps": [ + { + "train_step": 2, + "loss": 0.4363347887992859, + "clean_loss": 0.4366205930709839, + "noisy_loss_mean": 0.4360489547252655, + "noise_std_target": 0.001, + "noise_std_mean": 0.0010000000474974513, + "noise_std_max": 0.0010000000474974513, + "effective_batch": 4 + } + ], + "evals": [ + { + "kind": "initial", + "train_step": 0, + "acc": 0.375, + "tok_acc": 0.7577160493827161 + }, + { + "kind": "task", + "train_step": 2, + "acc": 0.375, + "tok_acc": 0.7777777777777778 + }, + { + "kind": "final", + "train_step": 2, + "acc": 0.375, + "tok_acc": 0.7777777777777778 + } + ], + "checkpoints": [ + { + "kind": "best", + "train_step": 2, + "acc": 0.375, + "path": "smoke_resume_step9_part2_ckpts/best.pt" + }, + { + "kind": "best_state", + "train_step": 2, + "acc": 0.375, + "path": "smoke_resume_step9_part2_ckpts/best_state.pt" + }, + { + "kind": "latest_state", + "train_step": 2, + "acc": 0.375, + "path": "smoke_resume_step9_part2_ckpts/latest_state.pt" + }, + { + "kind": "final", + "train_step": 2, + "acc": 0.375, + "path": "smoke_resume_step9_part2_ckpts/final.pt" + }, + { + "kind": "final_state", + "train_step": 2, + "acc": 0.375, + "path": "smoke_resume_step9_part2_ckpts/final_state.pt" + } + ], + "resume_state": "smoke_resume_step9_part1_ckpts/latest_state.pt", + "resume_step": 1, + "best_acc": 0.375, + "best_step": 2, + "best_checkpoint": "smoke_resume_step9_part2_ckpts/best.pt", + "best_state_checkpoint": "smoke_resume_step9_part2_ckpts/best_state.pt", + "latest_state_checkpoint": "smoke_resume_step9_part2_ckpts/latest_state.pt", + "final_acc": 0.375, + "final_tok_acc": 0.7777777777777778, + "final_checkpoint": "smoke_resume_step9_part2_ckpts/final.pt", + "final_state_checkpoint": "smoke_resume_step9_part2_ckpts/final_state.pt" +} \ No newline at end of file -- cgit v1.2.3