mgbam committed on
Commit
3354fcc
·
verified ·
1 Parent(s): f16d0f1

Update mcp/nlp.py

Browse files
Files changed (1) hide show
  1. mcp/nlp.py +3 -3
mcp/nlp.py CHANGED
@@ -7,13 +7,13 @@ def load_model():
7
  return spacy.load("en_core_web_sm")
8
  except OSError:
9
  raise RuntimeError(
10
- "spaCy model 'en_core_web_sm' not found. "
11
- "Install it in your Dockerfile or requirements.txt before building the app."
12
  )
13
 
14
  # Load the spaCy pipeline once at module level so extract_keywords() can
  # reuse it; load_model() raises RuntimeError here if the model is missing.
  nlp = load_model()
15
 
16
  def extract_keywords(text: str):
17
- """Extract entities (longer than 2 chars, no duplicates)."""
18
  doc = nlp(text)
19
  return list({ent.text for ent in doc.ents if len(ent.text.strip()) > 2})
 
7
  return spacy.load("en_core_web_sm")
8
  except OSError:
9
  raise RuntimeError(
10
+ "spaCy model 'en_core_web_sm' is not installed. "
11
+ "Ensure Dockerfile downloads it at build time."
12
  )
13
 
14
  # Load the spaCy pipeline once at module level so extract_keywords() can
  # reuse it; load_model() raises RuntimeError here if the model is missing.
  nlp = load_model()
15
 
16
  def extract_keywords(text: str):
17
+ """Extract unique Named Entities longer than 2 characters."""
18
  doc = nlp(text)
19
  return list({ent.text for ent in doc.ents if len(ent.text.strip()) > 2})