summaryrefslogtreecommitdiff
path: root/scripts/debug_context_file.py
diff options
context:
space:
mode:
author: YurenHao0426 <blackhao0426@gmail.com> 2025-12-17 04:29:37 -0600
committer: YurenHao0426 <blackhao0426@gmail.com> 2025-12-17 04:29:37 -0600
commit: e43b3f8aa36c198b95c1e46bea2eaf3893b13dc3 (patch)
tree: 6ce8a00d2f8b9ebd83c894a27ea01ac50cfb2ff5 /scripts/debug_context_file.py
Initial commit (clean history) [HEAD, main]
Diffstat (limited to 'scripts/debug_context_file.py')
-rw-r--r-- scripts/debug_context_file.py 14
1 files changed, 14 insertions, 0 deletions
diff --git a/scripts/debug_context_file.py b/scripts/debug_context_file.py
new file mode 100644
index 0000000..81ac6b9
--- /dev/null
+++ b/scripts/debug_context_file.py
@@ -0,0 +1,14 @@
+import json
+# Debug helper: print the type and top-level layout of the first JSONL record.
+path = "data/raw_datasets/personamem/shared_contexts_32k.jsonl"
+with open(path, 'r', encoding="utf-8") as f:  # do not depend on the locale's default encoding
+    line = f.readline()  # only the first line of the file is inspected
+    data = json.loads(line)  # raises json.JSONDecodeError if the line is empty or not JSON
+    print(f"Type: {type(data)}")
+    if isinstance(data, dict):
+        print(f"Keys: {list(data.keys())}")
+        # Peek into values: report each value's type, plus the length of list values
+        for k, v in data.items():
+            print(f"Key '{k}' type: {type(v)}")
+            if isinstance(v, list):
+                print(f" Length: {len(v)}")