diff options
Diffstat (limited to 'research/flossing/flossing_suite/results/smoke/trm_step7_decoupled_periodic_smoke.json')
| -rw-r--r-- | research/flossing/flossing_suite/results/smoke/trm_step7_decoupled_periodic_smoke.json | 120 |
1 files changed, 120 insertions, 0 deletions
diff --git a/research/flossing/flossing_suite/results/smoke/trm_step7_decoupled_periodic_smoke.json b/research/flossing/flossing_suite/results/smoke/trm_step7_decoupled_periodic_smoke.json new file mode 100644 index 0000000..927e492 --- /dev/null +++ b/research/flossing/flossing_suite/results/smoke/trm_step7_decoupled_periodic_smoke.json @@ -0,0 +1,120 @@ +{ + "args": { + "model": "trm", + "ckpt_root": "/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro", + "ckpt_name": "__random__", + "train_steps": 2, + "batch_size": 8, + "task_batch_size": 8, + "floss_batch_size": 2, + "train_lr": 0.0001, + "floss_lr": 0.0001, + "floss_steps": 1, + "interfloss_at": "0", + "interfloss_every": 1, + "interfloss_start": 1, + "interfloss_stop": 1, + "floss_mode": "engelken_l2", + "lambda_star": 0.0, + "k_lyap": 1, + "lyap_act_steps": 1, + "lyap_start_act": 0, + "seed": 42, + "eval_every": 1, + "eval_n": 8, + "eval_batch_size": 8, + "floss_log_every": 1, + "eval_after_floss": false, + "kl_beta": 0.0, + "kl_replay_size": 64, + "kl_batch_size": 8, + "kl_temperature": 1.0, + "init_seed": 123, + "train_puzzle_emb": true, + "puzzle_emb_lr": 0.0001, + "puzzle_emb_weight_decay": 1.0, + "out": "research/flossing/flossing_suite/results/smoke/trm_step7_decoupled_periodic_smoke.json" + }, + "initial_acc": 0.0, + "initial_tok_acc": 0.07561728395061729, + "interfloss_steps": [ + 0, + 1 + ], + "task_steps": [ + { + "train_step": 1, + "sup_loss": 2.57209548232992 + }, + { + "train_step": 2, + "sup_loss": 2.56865356540629 + } + ], + "floss_episodes": [ + { + "episode": 0, + "train_step": 0, + "steps": [ + { + "step": 0, + "loss": 0.04431530460715294, + "floss_loss": 0.04431530460715294, + "kl_loss": 0.0, + "lyap1_mean": 0.21050173044204712, + "lyap1_max": 0.2125818431377411, + "lyap_mean": 0.21050173044204712, + "volume_mean": 0.21050173044204712, + "volume_max": 0.2125818431377411, + "frac_active": 1.0 + } + ] + }, + { + "episode": 1, + "train_step": 1, + "steps": [ + { + "step": 0, + "loss": 0.04459226503968239, + "floss_loss": 0.04459226503968239, + "kl_loss": 0.0, + "lyap1_mean": 0.2111663520336151, + "lyap1_max": 0.21218420565128326, + "lyap_mean": 0.2111663520336151, + "volume_mean": 0.2111663520336151, + "volume_max": 0.21218420565128326, + "frac_active": 1.0 + } + ] + } + ], + "evals": [ + { + "kind": "initial", + "train_step": 0, + "acc": 0.0, + "tok_acc": 0.07561728395061729 + }, + { + "kind": "task", + "train_step": 1, + "acc": 0.0, + "tok_acc": 0.07253086419753087 + }, + { + "kind": "task", + "train_step": 2, + "acc": 0.0, + "tok_acc": 0.08796296296296297 + }, + { + "kind": "final", + "train_step": 2, + "acc": 0.0, + "tok_acc": 0.08796296296296297 + } + ], + "final_acc": 0.0, + "final_tok_acc": 0.08796296296296297 +}
\ No newline at end of file |
