summaryrefslogtreecommitdiff
path: root/research/flossing/smoke_resume_step9_part2.json
diff options
context:
space:
mode:
authorYurenHao0426 <blackhao0426@gmail.com>2026-06-13 12:35:36 -0500
committerYurenHao0426 <blackhao0426@gmail.com>2026-06-13 12:35:36 -0500
commit66e0d8b9fd4d0f7a2231d689c055e26fdf1cf04a (patch)
treec29cba61124018755a19b02c9d33e3ad5f2e05cc /research/flossing/smoke_resume_step9_part2.json
rrm workspace: TRM/HRM/SRM code, Maze dataset, dynamical-analysis pipelineHEADmain
Curated export for clone-and-run Maze training (2x A6000) + diagnostics. trm/hrm pretrain.py carry trajectory-augmentation code (backward-compatible). Heavy artifacts (checkpoints/wandb/npz) gitignored; see PROVENANCE.md. Co-Authored-By: Claude Fable 5 <noreply@anthropic.com>
Diffstat (limited to 'research/flossing/smoke_resume_step9_part2.json')
-rw-r--r--research/flossing/smoke_resume_step9_part2.json109
1 files changed, 109 insertions, 0 deletions
diff --git a/research/flossing/smoke_resume_step9_part2.json b/research/flossing/smoke_resume_step9_part2.json
new file mode 100644
index 0000000..c97bf02
--- /dev/null
+++ b/research/flossing/smoke_resume_step9_part2.json
@@ -0,0 +1,109 @@
+{
+ "args": {
+ "model": "trm",
+ "ckpt_root": "/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_singleGPU",
+ "ckpt_name": "step_26041",
+ "mode": "multi_perturbed_ce",
+ "train_steps": 2,
+ "batch_size": 2,
+ "lr": 1e-05,
+ "noise_std": 0.001,
+ "noise_min": null,
+ "noise_max": null,
+ "noise_sampling": "normal",
+ "clean_prob": 0.0,
+ "sigma_start": null,
+ "sigma_ramp_steps": 0,
+ "n_trajectories": 2,
+ "rollout_impl": "parallel_fixed",
+ "perturb": "both",
+ "seed": 777,
+ "eval_every": 1,
+ "eval_n": 8,
+ "eval_batch_size": 8,
+ "out": "smoke_resume_step9_part2.json",
+ "save_dir": null,
+ "save_best": true,
+ "save_final": true,
+ "save_every_eval": false,
+ "save_train_state": true,
+ "resume_state": "smoke_resume_step9_part1_ckpts/latest_state.pt"
+ },
+ "initial_acc": 0.375,
+ "initial_tok_acc": 0.7577160493827161,
+ "steps": [
+ {
+ "train_step": 2,
+ "loss": 0.4363347887992859,
+ "clean_loss": 0.4366205930709839,
+ "noisy_loss_mean": 0.4360489547252655,
+ "noise_std_target": 0.001,
+ "noise_std_mean": 0.0010000000474974513,
+ "noise_std_max": 0.0010000000474974513,
+ "effective_batch": 4
+ }
+ ],
+ "evals": [
+ {
+ "kind": "initial",
+ "train_step": 0,
+ "acc": 0.375,
+ "tok_acc": 0.7577160493827161
+ },
+ {
+ "kind": "task",
+ "train_step": 2,
+ "acc": 0.375,
+ "tok_acc": 0.7777777777777778
+ },
+ {
+ "kind": "final",
+ "train_step": 2,
+ "acc": 0.375,
+ "tok_acc": 0.7777777777777778
+ }
+ ],
+ "checkpoints": [
+ {
+ "kind": "best",
+ "train_step": 2,
+ "acc": 0.375,
+ "path": "smoke_resume_step9_part2_ckpts/best.pt"
+ },
+ {
+ "kind": "best_state",
+ "train_step": 2,
+ "acc": 0.375,
+ "path": "smoke_resume_step9_part2_ckpts/best_state.pt"
+ },
+ {
+ "kind": "latest_state",
+ "train_step": 2,
+ "acc": 0.375,
+ "path": "smoke_resume_step9_part2_ckpts/latest_state.pt"
+ },
+ {
+ "kind": "final",
+ "train_step": 2,
+ "acc": 0.375,
+ "path": "smoke_resume_step9_part2_ckpts/final.pt"
+ },
+ {
+ "kind": "final_state",
+ "train_step": 2,
+ "acc": 0.375,
+ "path": "smoke_resume_step9_part2_ckpts/final_state.pt"
+ }
+ ],
+ "resume_state": "smoke_resume_step9_part1_ckpts/latest_state.pt",
+ "resume_step": 1,
+ "best_acc": 0.375,
+ "best_step": 2,
+ "best_checkpoint": "smoke_resume_step9_part2_ckpts/best.pt",
+ "best_state_checkpoint": "smoke_resume_step9_part2_ckpts/best_state.pt",
+ "latest_state_checkpoint": "smoke_resume_step9_part2_ckpts/latest_state.pt",
+ "final_acc": 0.375,
+ "final_tok_acc": 0.7777777777777778,
+ "final_checkpoint": "smoke_resume_step9_part2_ckpts/final.pt",
+ "final_state_checkpoint": "smoke_resume_step9_part2_ckpts/final_state.pt"
+} \ No newline at end of file