#!/bin/bash
#SBATCH --job-name=run_multiturn
#SBATCH --account=bfqt-delta-gpu
#SBATCH --partition=gpuA100x4
#SBATCH --nodes=1
#SBATCH --ntasks=1
#SBATCH --cpus-per-task=16
#SBATCH --gres=gpu:nvidia_a100:4
#SBATCH --mem=200G
#SBATCH --time=48:00:00
#SBATCH --output=logs/run_multiturn_%j.out
#SBATCH --error=logs/run_multiturn_%j.err
#
# Run FIXED experiment with proper multi-turn conversation and user simulation.
# This uses LocalUserAgent for user simulation and proper metrics extraction.
#
# Usage: submit with `sbatch` from the directory that contains `logs/`.
#
# NOTE(review): the --output/--error paths above are relative (`logs/...`),
# while this script creates `collaborativeagents/slurm/logs` under the project
# root. Presumably the job is meant to be submitted from
# `collaborativeagents/slurm`; in any case the directory has to exist before
# submission for the log files to be written there -- confirm.

# Abort on the first failing command. `-u` is intentionally not enabled:
# the sourced conda activation scripts may reference unset variables.
set -e

readonly PROJECT_ROOT=/projects/bfqt/users/yurenh2/ml-projects/personalization-user-model
readonly CONDA_INIT=/u/yurenh2/miniforge3/etc/profile.d/conda.sh

cd "${PROJECT_ROOT}"

# Create logs and results directories
mkdir -p collaborativeagents/slurm/logs
mkdir -p collaborativeagents/results

echo "Starting MULTI-TURN experiment at $(date)"
echo "Job ID: $SLURM_JOB_ID"
echo "Node: $SLURMD_NODENAME"
echo "GPUs: $CUDA_VISIBLE_DEVICES"

# Activate environment
# shellcheck disable=SC1090 -- path lives on the cluster, not resolvable by linting
source "${CONDA_INIT}"
conda activate eval

# Check GPU availability
nvidia-smi

# Redirect HF cache to project space (avoid home quota issues)
export HF_HOME=/projects/bfqt/users/yurenh2/.cache/huggingface
mkdir -p "${HF_HOME}"

# Add project to path. The `:+` expansion appends the previous PYTHONPATH only
# when it is non-empty, so no trailing ':' (which Python treats as "current
# directory") is left behind.
export PYTHONPATH="${PWD}/src:${PWD}/collaborativeagents${PYTHONPATH:+:${PYTHONPATH}}"

# Run experiments
cd collaborativeagents/scripts

# INITIAL TEST: Run with reduced parameters to validate the fix
# - 5 profiles (instead of 20)
# - 3 sessions per profile (instead of 5)
# - All 7 methods
echo "Running MULTI-TURN experiments with user simulation..."

# Timestamp computed once so the output directory name is fixed for this run.
run_stamp="$(date +%Y%m%d_%H%M%S)"

python run_experiments.py \
  --methods vanilla,all_memory,rag,rag_vector,contextual,reflection,reflection_grpo \
  --datasets math-500 \
  --n-profiles 5 \
  --n-sessions 3 \
  --profile-path ../data/complex_profiles_v2/profiles_100.jsonl \
  --output-dir "../results/multiturn_test_${run_stamp}"

echo "Multi-turn experiment completed at $(date)"