diff options
| author | YurenHao0426 <blackhao0426@gmail.com> | 2025-12-17 04:29:37 -0600 |
|---|---|---|
| committer | YurenHao0426 <blackhao0426@gmail.com> | 2025-12-17 04:29:37 -0600 |
| commit | e43b3f8aa36c198b95c1e46bea2eaf3893b13dc3 (patch) | |
| tree | 6ce8a00d2f8b9ebd83c894a27ea01ac50cfb2ff5 /scripts/debug_context_file.py | |
Diffstat (limited to 'scripts/debug_context_file.py')
| -rw-r--r-- | scripts/debug_context_file.py | 14 |
1 files changed, 14 insertions, 0 deletions
"""Debug helper (scripts/debug_context_file.py): inspect one JSONL record.

Reads only the first line of the file named by ``path``, parses it as JSON
and prints the type of the parsed value.  When that value is a dict, its keys
are listed, followed by the type of every value and the length of any value
that is a list.
"""
import json

path = "data/raw_datasets/personamem/shared_contexts_32k.jsonl"


def describe_record(data):
    """Return the report lines for one parsed JSON value.

    Args:
        data: The object produced by ``json.loads`` for a single line.

    Returns:
        A list of strings, in print order: the type of *data*, and -- only
        when *data* is a dict -- its keys, then one line per key giving the
        value's type, plus a length line after each list value.
    """
    report = [f"Type: {type(data)}"]
    if not isinstance(data, dict):
        return report

    report.append(f"Keys: {list(data.keys())}")
    # Peek into values
    for k, v in data.items():
        report.append(f"Key '{k}' type: {type(v)}")
        if isinstance(v, list):
            report.append(f" Length: {len(v)}")
    return report


def main():
    """Print the structure report for the first line of ``path``.

    Raises:
        SystemExit: If the first line is empty or blank, so there is no
            record to parse.
        json.JSONDecodeError: If the first line is not valid JSON.
        OSError: If the file cannot be opened.
    """
    # Explicit encoding so decoding does not depend on the platform locale.
    with open(path, "r", encoding="utf-8") as f:
        line = f.readline()

    # json.loads("") fails with an unhelpful "Expecting value" error; report
    # the real problem (no record) and still exit with a failure status.
    if not line.strip():
        raise SystemExit(f"No JSON record on the first line of {path}")

    for text in describe_record(json.loads(line)):
        print(text)


if __name__ == "__main__":
    main()
