diff options
| author | YurenHao0426 <blackhao0426@gmail.com> | 2026-06-29 12:15:51 -0500 |
|---|---|---|
| committer | YurenHao0426 <blackhao0426@gmail.com> | 2026-06-29 12:15:51 -0500 |
| commit | a6ec4288a2232988b130b2f00bb2565f81706966 (patch) | |
| tree | 1bb86e7f0b899b823b9e7fdf383e832d30a181e0 /flossing_suite/archive_failed_oom_b8 | |
Recursive reasoning dynamics: analysis pipeline, paper drafts, toy models
Failure=more-chaotic (task-general under validity labeling) reduces to convergence/completeness
detection; mechanism (transient chaos vs multistability vs input-induced) under investigation.
Co-Authored-By: Claude Fable 5 <noreply@anthropic.com>
Diffstat (limited to 'flossing_suite/archive_failed_oom_b8')
3 files changed, 90 insertions, 0 deletions
```diff
diff --git a/flossing_suite/archive_failed_oom_b8/trm_seed123_baseline_nofloss_b8_10000.cmd.sh b/flossing_suite/archive_failed_oom_b8/trm_seed123_baseline_nofloss_b8_10000.cmd.sh
new file mode 100755
index 0000000..98411d8
--- /dev/null
+++ b/flossing_suite/archive_failed_oom_b8/trm_seed123_baseline_nofloss_b8_10000.cmd.sh
@@ -0,0 +1,30 @@
+#!/usr/bin/env bash
+set -euo pipefail
+cd "/home/yurenh2/rrm"
+export CUDA_VISIBLE_DEVICES="0"
+export PYTHONUNBUFFERED=1
+exec "/home/yurenh2/miniconda3/envs/rrm/bin/python" research/flossing/step7_interfloss.py \
+  --model trm \
+  --ckpt-root "/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro" \
+  --ckpt-name __random__ \
+  --init-seed 123 \
+  --train-steps "10000" \
+  --batch-size 8 \
+  --train-lr 1e-4 \
+  --floss-lr 1e-4 \
+  --floss-mode engelken_l2 \
+  --lambda-star 0 \
+  --k-lyap 4 \
+  --lyap-act-steps 4 \
+  --seed 42 \
+  --eval-every 1000 \
+  --eval-n "1000" \
+  --eval-batch-size 64 \
+  --floss-log-every 10 \
+  --train-puzzle-emb \
+  --puzzle-emb-lr 1e-4 \
+  --puzzle-emb-weight-decay 1.0 \
+  --kl-beta 0 \
+  --floss-steps "0" \
+  --interfloss-at "" \
+  --out "/home/yurenh2/rrm/research/flossing/flossing_suite/results/trm_faithful/trm_seed123_baseline_nofloss_b8_10000.json"
diff --git a/flossing_suite/archive_failed_oom_b8/trm_seed123_pre_inter_0_500_b8_k4_10000.cmd.sh b/flossing_suite/archive_failed_oom_b8/trm_seed123_pre_inter_0_500_b8_k4_10000.cmd.sh
new file mode 100755
index 0000000..e3f25ab
--- /dev/null
+++ b/flossing_suite/archive_failed_oom_b8/trm_seed123_pre_inter_0_500_b8_k4_10000.cmd.sh
@@ -0,0 +1,30 @@
+#!/usr/bin/env bash
+set -euo pipefail
+cd "/home/yurenh2/rrm"
+export CUDA_VISIBLE_DEVICES="3"
+export PYTHONUNBUFFERED=1
+exec "/home/yurenh2/miniconda3/envs/rrm/bin/python" research/flossing/step7_interfloss.py \
+  --model trm \
+  --ckpt-root "/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro" \
+  --ckpt-name __random__ \
+  --init-seed 123 \
+  --train-steps "10000" \
+  --batch-size 8 \
+  --train-lr 1e-4 \
+  --floss-lr 1e-4 \
+  --floss-mode engelken_l2 \
+  --lambda-star 0 \
+  --k-lyap 4 \
+  --lyap-act-steps 4 \
+  --seed 42 \
+  --eval-every 1000 \
+  --eval-n "1000" \
+  --eval-batch-size 64 \
+  --floss-log-every 10 \
+  --train-puzzle-emb \
+  --puzzle-emb-lr 1e-4 \
+  --puzzle-emb-weight-decay 1.0 \
+  --kl-beta 0 \
+  --floss-steps "500" \
+  --interfloss-at "0,500" \
+  --out "/home/yurenh2/rrm/research/flossing/flossing_suite/results/trm_faithful/trm_seed123_pre_inter_0_500_b8_k4_10000.json"
diff --git a/flossing_suite/archive_failed_oom_b8/trm_seed123_prefloss_0_b8_k4_10000.cmd.sh b/flossing_suite/archive_failed_oom_b8/trm_seed123_prefloss_0_b8_k4_10000.cmd.sh
new file mode 100755
index 0000000..86c445d
--- /dev/null
+++ b/flossing_suite/archive_failed_oom_b8/trm_seed123_prefloss_0_b8_k4_10000.cmd.sh
@@ -0,0 +1,30 @@
+#!/usr/bin/env bash
+set -euo pipefail
+cd "/home/yurenh2/rrm"
+export CUDA_VISIBLE_DEVICES="1"
+export PYTHONUNBUFFERED=1
+exec "/home/yurenh2/miniconda3/envs/rrm/bin/python" research/flossing/step7_interfloss.py \
+  --model trm \
+  --ckpt-root "/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro" \
+  --ckpt-name __random__ \
+  --init-seed 123 \
+  --train-steps "10000" \
+  --batch-size 8 \
+  --train-lr 1e-4 \
+  --floss-lr 1e-4 \
+  --floss-mode engelken_l2 \
+  --lambda-star 0 \
+  --k-lyap 4 \
+  --lyap-act-steps 4 \
+  --seed 42 \
+  --eval-every 1000 \
+  --eval-n "1000" \
+  --eval-batch-size 64 \
+  --floss-log-every 10 \
+  --train-puzzle-emb \
+  --puzzle-emb-lr 1e-4 \
+  --puzzle-emb-weight-decay 1.0 \
+  --kl-beta 0 \
+  --floss-steps "500" \
+  --interfloss-at "0" \
+  --out "/home/yurenh2/rrm/research/flossing/flossing_suite/results/trm_faithful/trm_seed123_prefloss_0_b8_k4_10000.json"
```
