summary refs log tree commit diff
path: root/research/flossing/run_H_after_SRM.sh
diff options
context:
space:
mode:
Diffstat (limited to 'research/flossing/run_H_after_SRM.sh')
-rwxr-xr-x research/flossing/run_H_after_SRM.sh 29
1 files changed, 29 insertions, 0 deletions
diff --git a/research/flossing/run_H_after_SRM.sh b/research/flossing/run_H_after_SRM.sh
new file mode 100755
index 0000000..a1750e2
--- /dev/null
+++ b/research/flossing/run_H_after_SRM.sh
@@ -0,0 +1,29 @@
+#!/bin/bash
+# Wait for SRM-runner to finish, then run H: Engelken L2 on converged HRM step_26040.
+# Tests whether Engelken hurts in refinement regime (CF hinge gave +9.8% on this ckpt).
+# Usage: run_H_after_SRM.sh <SRM_RUNNER_PID>   (progress is appended to step4_runner.log)
+set -e
+cd /home/yurenh2/rrm/research/flossing
+source /home/yurenh2/miniconda3/etc/profile.d/conda.sh
+conda activate rrm
+export CUDA_VISIBLE_DEVICES=2
+# Abort if no PID is given: `kill -0 ""` fails, so the loop below would exit at once and H would not wait.
+SRM_RUNNER_PID=${1:?usage: $0 <SRM_RUNNER_PID>}
+echo "[$(date '+%H:%M:%S')] H-runner waiting for SRM-runner PID $SRM_RUNNER_PID..." >> step4_runner.log
+# kill -0 delivers no signal; it only checks that the PID can still be signalled. Poll every 30 s.
+while kill -0 "$SRM_RUNNER_PID" 2>/dev/null; do
+ sleep 30
+done
+echo "[$(date '+%H:%M:%S')] SRM done. Starting Phase H: Engelken L2 (α=10, k=4) on converged step_26040" >> step4_runner.log
+CKPT_ROOT="/home/yurenh2/rrm/hrm/checkpoints/Sudoku-extreme-1k-aug-1000 ACT-torch/HierarchicalReasoningModel_ACTV1 righteous-python"
+python step3_train_with_rf.py \
+ --ckpt-root "$CKPT_ROOT" \
+ --ckpt-name step_26040 \
+ --n-steps 500 --batch-size 8 \
+ --alpha-rf 10.0 --rf-mode engelken_l2 \
+ --k-lyap 4 --lyap-act-steps 4 \
+ --eval-every 100 --eval-n 512 --eval-batch-size 32 \
+ --out step3_H_engelken_l2_26040.json \
+ > step3_H.log 2>&1
+
+echo "[$(date '+%H:%M:%S')] Phase H complete (Engelken on converged HRM)" >> step4_runner.log