From 7a4ad471c9026c7882504b1c8b730045b4bb74af Mon Sep 17 00:00:00 2001 From: CHEN SHENGYUAN Date: Thu, 18 Dec 2025 15:35:33 +0800 Subject: enable vectorized retrieval with sparse matrix operations --- src/ner.py | 3 +++ 1 file changed, 3 insertions(+) (limited to 'src/ner.py') diff --git a/src/ner.py b/src/ner.py index 2ca4afb..4ee788e 100644 --- a/src/ner.py +++ b/src/ner.py @@ -1,5 +1,7 @@ import spacy from collections import defaultdict +import pdb + class SpacyNER: def __init__(self,spacy_model): @@ -25,6 +27,7 @@ class SpacyNER: sentence_to_entities = defaultdict(list) unique_entities = set() passage_hash_id_to_entities = {} + pdb.set_trace() for ent in doc.ents: if ent.label_ == "ORDINAL" or ent.label_ == "CARDINAL": continue -- cgit v1.2.3