"""Fetch the PersonaMem 32k question and shared-context files.

Running this script downloads each listed file of the dataset repository
from the Hugging Face Hub into ``data/raw_datasets/personamem`` (a path
relative to the current working directory), creating that directory first
when it does not exist yet.
"""
import os

from huggingface_hub import hf_hub_download

# Dataset repository on the Hub and the local directory the files land in.
repo_id = "bowen-upenn/PersonaMem"
local_dir = "data/raw_datasets/personamem"

# Files inside the repository that this script fetches, in download order.
files_to_download = ["questions_32k.csv", "shared_contexts_32k.jsonl"]


def _fetch(name):
    """Announce and download one file of the dataset repo into ``local_dir``."""
    print(f"Downloading {name}...")
    hf_hub_download(
        repo_id=repo_id,
        filename=name,
        repo_type="dataset",  # the repo is a dataset repository, not a model
        local_dir=local_dir,
    )


# Make sure the target directory exists before anything is announced or fetched.
os.makedirs(local_dir, exist_ok=True)
print(f"Downloading files from {repo_id} to {local_dir}...")

for filename in files_to_download:
    _fetch(filename)

print("Download complete.")