Spaces:

Omkar008
/

geo_location_api

Running

Omkar008 committed on Aug 30, 2024

Commit

b748bd2

verified ·

1 Parent(s): 55d5cbb

Update core/init_nlp.py

Files changed (1) hide show

core/init_nlp.py CHANGED Viewed

@@ -3,29 +3,32 @@ import nltk.downloader
 import spacy
 from core.config import settings
 from pathlib import Path
 def initialize_nlp():
     print("Initializing NLP resources...")
-    nltk_data_path = Path("/tmp/nltk_data")
-    nltk_data_path.mkdir(parents=True, exist_ok=True)
-    nltk.data.path.append(str(nltk_data_path))
-    # Download NLTK resources
-    nltk_resources = [
-        'maxent_ne_chunker',
-        'words',
-        'treebank',
-        'maxent_treebank_pos_tagger',
-        'punkt',
-        'averaged_perceptron_tagger'
-    ]
-    for resource in nltk_resources:
-        nltk.downloader.download(resource, download_dir=str(nltk_data_path) ,quiet=True)
     # Load spaCy model
-    spacy.load(settings.SPACY_MODEL)
     print("NLP resources initialized successfully.")

 import spacy
 from core.config import settings
 from pathlib import Path
+import en_core_web_sm
 def initialize_nlp():
     print("Initializing NLP resources...")
+    # nltk_data_path = Path("/tmp/nltk_data")
+    # nltk_data_path.mkdir(parents=True, exist_ok=True)
+    # nltk.data.path.append(str(nltk_data_path))
+    # # Download NLTK resources
+    # nltk_resources = [
+    #     'maxent_ne_chunker',
+    #     'words',
+    #     'treebank',
+    #     'maxent_treebank_pos_tagger',
+    #     'punkt',
+    #     'averaged_perceptron_tagger'
+    # ]
+    # for resource in nltk_resources:
+    #     nltk.downloader.download(resource, download_dir=str(nltk_data_path) ,quiet=True)
     # Load spaCy model
+    # spacy.load(settings.SPACY_MODEL)
+    spacy.load("en_core_web_sm")
+    en_core_web_sm.load()
     print("NLP resources initialized successfully.")