path: root/code_eval/test-humaneval-ckpt-list.sh
author	Yuren Hao <yurenh2@timan108.cs.illinois.edu>	2025-09-04 22:16:22 -0500
committer	Yuren Hao <yurenh2@timan108.cs.illinois.edu>	2025-09-04 22:16:22 -0500
commit	fc6d57ffb8d5ddb5820fcc00b5491a585c259ebc (patch)
tree	e9841f93a353e2107225cfc721d1ce57c0e594dc	/code_eval/test-humaneval-ckpt-list.sh
Initial commit
Diffstat (limited to 'code_eval/test-humaneval-ckpt-list.sh')
-rw-r--r--	code_eval/test-humaneval-ckpt-list.sh	28
1 file changed, 28 insertions, 0 deletions
diff --git a/code_eval/test-humaneval-ckpt-list.sh b/code_eval/test-humaneval-ckpt-list.sh
new file mode 100644
index 0000000..03514bd
--- /dev/null
+++ b/code_eval/test-humaneval-ckpt-list.sh
@@ -0,0 +1,28 @@
+export VLLM_ENABLE_V1_MULTIPROCESSING=0
+
+# Declare an associative array to store model mappings
+# TODO: Replace with actual model names and paths
+declare -A model_dict=(
+ ["model_name_1"]="/path/to/model1"
+ ["model_name_2"]="/path/to/model2"
+)
+
+# Outer loop: iterate over model_dict
+for exp_name in "${!model_dict[@]}"; do
+ model="${model_dict[$exp_name]}"
+ echo "Evaluating model: $model"
+
+    python OpenCodeEval/main.py --model_name "$model" \
+ --task "HumanEval" \
+ --save "test/output_humaneval_${exp_name}" \
+ --num_gpus 1 \
+ --batch_size 164 \
+ --max_tokens 4096 \
+ --temperature 0.1 \
+ --seed 0 \
+ --prompt_type "Completion" \
+ --model_type "Chat" \
+ --prompt_prefix $'Please provide a self-contained Python script that solves the following problem in a markdown code block:\n```python\n' \
+    --prompt_suffix $'\n```\n'
+
+done
\ No newline at end of file
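
For reference, a minimal hardened sketch of the same loop (not part of this commit). It reuses only the OpenCodeEval flags already present above; the checkpoint-path check, the set -euo pipefail guard, and the per-model log file under test/ are illustrative additions, not features of the committed script.

#!/usr/bin/env bash
# Illustrative variant of the committed script; flags mirror the ones above.
# The path check and per-model log are hypothetical additions.
set -euo pipefail
export VLLM_ENABLE_V1_MULTIPROCESSING=0

declare -A model_dict=(
    ["model_name_1"]="/path/to/model1"   # placeholders, as in the committed script
    ["model_name_2"]="/path/to/model2"
)

for exp_name in "${!model_dict[@]}"; do
    model="${model_dict[$exp_name]}"
    # Skip entries whose checkpoint directory is missing instead of failing mid-run.
    if [[ ! -d "$model" ]]; then
        echo "Skipping ${exp_name}: ${model} does not exist" >&2
        continue
    fi
    echo "Evaluating model: $model"
    python OpenCodeEval/main.py --model_name "$model" \
        --task "HumanEval" \
        --save "test/output_humaneval_${exp_name}" \
        --num_gpus 1 \
        --batch_size 164 \
        --max_tokens 4096 \
        --temperature 0.1 \
        --seed 0 \
        --prompt_type "Completion" \
        --model_type "Chat" \
        --prompt_prefix $'Please provide a self-contained Python script that solves the following problem in a markdown code block:\n```python\n' \
        --prompt_suffix $'\n```\n' \
        2>&1 | tee "test/log_${exp_name}.log"
done

Note that --batch_size 164 matches the number of HumanEval problems, so each checkpoint is presumably evaluated in a single batch.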