update code and kk eval

author: = <=> 2025-06-04 11:49:37 +0800
committer: = <=> 2025-06-04 11:49:37 +0800
commit: 947d9dfdf16ae37109898111a5caacae7377b96d (patch)
tree: ff4e884020fb7d968a6192106f370b215647f569 /code_eval/test-mbpp-ckpt-list.sh
parent: 5e163b529a78d528b745b8b57ba794b7b2bba97a (diff)
1 files changed, 32 insertions, 0 deletions
diff --git a/code_eval/test-mbpp-ckpt-list.sh b/code_eval/test-mbpp-ckpt-list.sh
new file mode 100644
index 0000000..b7bb5fd
--- /dev/null
+++ b/code_eval/test-mbpp-ckpt-list.sh
@@ -0,0 +1,32 @@
+export VLLM_ENABLE_V1_MULTIPROCESSING=0  # NOTE(review): presumably turns off vLLM V1 multiprocessing - confirm
+
+# Associative array (bash 4+): experiment name -> model checkpoint path.
+# TODO: Replace the placeholders with the actual model names and paths.
+declare -A model_dict=(
+    ["model_name_1"]="/path/to/model1"
+    ["model_name_2"]="/path/to/model2"
+)
+
+# Run the MBPP evaluation once for every entry in model_dict.
+for exp_name in "${!model_dict[@]}"; do
+    model="${model_dict[$exp_name]}"
+    echo "Evaluating model: $model"
+
+    python OpenCodeEval/main.py --model_name "$model" \
+                    --task "MBPP" \
+                    --save "test_mbpp/output_mbpp_step_${exp_name}" \
+                    --num_gpus 1 \
+                    --batch_size 378 \
+                    --max_tokens 4096 \
+                    --temperature 0.0 \
+                    --seed 0 \
+                    --time_out 3.0 \
+                    --prompt_type "Instruction" \
+                    --model_type "Chat" \
+                    --prompt_prefix "" \
+                    --prompt_suffix "" \
+                    --trust_remote_code
+
+done
+
+
author	= <=>	2025-06-04 11:49:37 +0800
committer	= <=>	2025-06-04 11:49:37 +0800
commit	947d9dfdf16ae37109898111a5caacae7377b96d (patch)
tree	ff4e884020fb7d968a6192106f370b215647f569 /code_eval/test-mbpp-ckpt-list.sh
parent	5e163b529a78d528b745b8b57ba794b7b2bba97a (diff)