diff options
Diffstat (limited to 'code_eval/OpenCodeEval/data/dataset.sh')
| -rwxr-xr-x | code_eval/OpenCodeEval/data/dataset.sh | 28 |
1 files changed, 28 insertions, 0 deletions
#!/bin/bash
#
# code_eval/OpenCodeEval/data/dataset.sh
#
# Downloads the gzip-compressed JSONL dataset files listed in `urls` into
# the current working directory and decompresses each one in place.
#
# Usage:    ./dataset.sh
# Requires: wget, gunzip
# Exit:     0 when every file was downloaded and decompressed;
#           non-zero as soon as any download or decompression fails.

set -euo pipefail

# URLs of the files to download.
readonly -a urls=(
  "https://github.com/bigcode-project/bigcodebench-annotation/releases/download/v0.1.1/BigCodeBench-Hard.jsonl.gz"
  "https://github.com/bigcode-project/bigcodebench-annotation/releases/download/v0.1.1/BigCodeBench.jsonl.gz"
  "https://github.com/evalplus/humanevalplus_release/releases/download/v0.1.10/HumanEvalPlus.jsonl.gz"
  "https://github.com/evalplus/mbppplus_release/releases/download/v0.2.0/MbppPlus.jsonl.gz"
  "https://github.com/openai/human-eval/raw/master/data/HumanEval.jsonl.gz"
)

# Print a message to stderr and abort the script.
die() {
  printf '%s\n' "$*" >&2
  exit 1
}

# Fail early with a clear message instead of midway through the downloads.
for tool in wget gunzip; do
  command -v "$tool" >/dev/null || die "Error: required tool '$tool' not found in PATH"
done

# Download and decompress each file.
for url in "${urls[@]}"; do
  # File name is the last path component of the URL.
  filename=${url##*/}

  # Remove any existing archive and extracted file so that wget does not
  # save under a numbered name and gunzip does not refuse to overwrite.
  rm -f -- "$filename" "${filename%.gz}"

  echo "Downloading $url..."
  if ! wget -O "$filename" "$url"; then
    # wget -O can leave an empty or partial file behind on failure.
    rm -f -- "$filename"
    die "Error: failed to download $url"
  fi

  echo "Unzipping $filename..."
  gunzip -- "$filename" || die "Error: failed to decompress $filename"
done

# Only reached when every download and decompression succeeded.
echo "All files have been downloaded and unzipped."
