{ "args": { "model": "trm", "ckpt_root": "/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_singleGPU", "ckpt_name": null, "init_from": "random", "mode": "baseline_clean", "train_steps": 1, "batch_size": 2, "lr": 0.0001, "noise_std": 0.001, "noise_min": null, "noise_max": null, "noise_sampling": "normal", "clean_prob": 0.0, "sigma_start": null, "sigma_ramp_steps": 0, "n_trajectories": 4, "rollout_impl": "parallel_fixed", "perturb": "both", "seed": 2027, "eval_every": 1, "eval_n": 64, "eval_batch_size": 16, "out": "smoke_scratch_trm_baseline.json", "save_dir": null, "save_best": false, "save_final": false, "save_every_eval": false, "save_train_state": false, "resume_state": null }, "initial_acc": 0.0, "initial_tok_acc": 0.0933641975308642, "steps": [ { "train_step": 1, "loss": 2.542586088180542, "clean_loss": 2.542586088180542, "noisy_loss_mean": 0.0, "noise_std_target": 0.001, "noise_std_mean": 0.0, "noise_std_max": 0.0, "effective_batch": 2 } ], "evals": [ { "kind": "initial", "train_step": 0, "acc": 0.0, "tok_acc": 0.0933641975308642 }, { "kind": "task", "train_step": 1, "acc": 0.0, "tok_acc": 0.09510030864197531 }, { "kind": "final", "train_step": 1, "acc": 0.0, "tok_acc": 0.09510030864197531 } ], "checkpoints": [], "resume_state": null, "resume_step": 0, "final_acc": 0.0, "final_tok_acc": 0.09510030864197531 }