#!/bin/bash
# submit_single_job.sh
# Submit a single training job to Slurm by running sbatch on
# scripts/slurm_train.sh from the project directory.
#
# Usage:   ./submit_single_job.sh [precision_mode] [seed]
# Example: ./submit_single_job.sh bf16 1
#
# Arguments:
#   precision_mode  Exported to the job as PRECISION_MODE (default: bf16).
#   seed            Exported to the job as SEED (default: 1).
#
# Exit status:
#   0 if the job was submitted and a job ID was obtained, 1 otherwise.
#
# Provenance: added in commit f1c2cc22d46a6976df3555391e667c7e61592fad
# ("Initial commit: RL floating-point noise project").

# -u: fail on unset variables; pipefail: do not let a pipeline hide a
# failing stage. Critical commands are additionally checked explicitly.
set -uo pipefail

# Print an error message to stderr and abort.
die() {
  printf 'Error: %s\n' "$*" >&2
  exit 1
}

PRECISION_MODE=${1:-"bf16"}
SEED=${2:-1}

PROJECT_DIR="/projects/bfqt/users/yurenh2/ml-projects/rl-floating-noise"
# Everything below uses paths relative to the project root, so a failed cd
# must stop the script instead of submitting from the wrong directory.
cd "$PROJECT_DIR" || die "cannot cd to $PROJECT_DIR"

mkdir -p results/slurm_logs || die "cannot create results/slurm_logs"

JOB_NAME="rlvr_${PRECISION_MODE}_s${SEED}"

echo "Submitting job: $JOB_NAME"
echo "  Precision: $PRECISION_MODE"
echo "  Seed: $SEED"

# --parsable makes sbatch print "jobid[;cluster]" instead of the
# human-readable "Submitted batch job N" banner, and capturing the output
# directly (no pipe) lets us see sbatch's own exit status.
if ! SUBMIT_OUTPUT=$(sbatch \
    --parsable \
    --job-name="$JOB_NAME" \
    --export=ALL,PRECISION_MODE="$PRECISION_MODE",SEED="$SEED" \
    scripts/slurm_train.sh); then
  die "sbatch failed; job $JOB_NAME was not submitted"
fi

# Drop the optional ";cluster" suffix and make sure what is left is an ID.
JOB_ID=${SUBMIT_OUTPUT%%;*}
[[ "$JOB_ID" =~ ^[0-9]+$ ]] || die "unexpected sbatch output: $SUBMIT_OUTPUT"

echo ""
echo "Submitted! Job ID: $JOB_ID"
echo ""
echo "Monitor with: squeue -j $JOB_ID"
# NOTE(review): this log path assumes scripts/slurm_train.sh writes its
# output to results/slurm_logs/<job-name>_<job-id>.out - confirm there.
echo "View output: tail -f results/slurm_logs/${JOB_NAME}_${JOB_ID}.out"
echo "Cancel: scancel $JOB_ID"