diff options
| -rw-r--r-- | Qwen2.5-Eval/evaluation/sh/eval_all_math.sh | 6 |
1 files changed, 3 insertions, 3 deletions
diff --git a/Qwen2.5-Eval/evaluation/sh/eval_all_math.sh b/Qwen2.5-Eval/evaluation/sh/eval_all_math.sh
index ee580e3..8e8067d 100644
--- a/Qwen2.5-Eval/evaluation/sh/eval_all_math.sh
+++ b/Qwen2.5-Eval/evaluation/sh/eval_all_math.sh
@@ -1,7 +1,7 @@
 set -x
 export CUDA_VISIBLE_DEVICES="0,1,2,3,4,5,6,7"
 MODEL_NAME_OR_PATH="/volume/ailab4sci/ztgao/em/checkpoints/qwen25_math_7b_1shot_pi1/step_10"
-OUTPUT_DIR="/volume/ailab4sci/ztgao/em/checkpoints/qwen25_math_7b_1shot_pi1/step_10/temp03/eval"
+OUTPUT_DIR="/volume/ailab4sci/ztgao/em/checkpoints/qwen25_math_7b_1shot_pi1/step_10/temp00/eval"
 mkdir -p $OUTPUT_DIR
 PROMPT_TYPE="qwen25-math-cot"
 MAX_TOKENS_PER_CALL="3072"
@@ -20,7 +20,7 @@ python3 -u math_eval.py \
  --prompt_type ${PROMPT_TYPE} \
  --num_test_sample ${NUM_TEST_SAMPLE} \
  --seed 0 \
- --temperature 0.3 \
+ --temperature 0 \
  --n_sampling 1 \
  --top_p 1 \
  --start 0 \
@@ -28,4 +28,4 @@ python3 -u math_eval.py \
  --use_vllm \
  --save_outputs \
  --max_tokens_per_call ${MAX_TOKENS_PER_CALL} \
- --overwrite
\ No newline at end of file
+ --overwrite
