sileod committed on
Commit
a51d9c2
·
verified ·
1 Parent(s): d2e2fb3

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -2
app.py CHANGED
@@ -1,8 +1,12 @@
1
  import gradio as gr
2
  from transformers import pipeline
3
  import nltk
4
- nltk.download('punkt')
5
- from nltk.tokenize import sent_tokenize
 
 
 
 
6
 
7
  # Initialize the classifiers
8
  zero_shot_classifier = pipeline("zero-shot-classification", model="tasksource/ModernBERT-base-nli")
 
1
  import gradio as gr
2
  from transformers import pipeline
3
  import nltk
4
+
5
def sent_tokenize(text):
    """Split *text* into sentences using a lightweight regular expression.

    A sentence boundary is a whitespace character (or the end of the string)
    that immediately follows ``.``, ``?`` or ``!``, unless the punctuation
    belongs to a dotted abbreviation such as ``e.g.`` or to a capitalised
    two-letter title such as ``Dr.``.

    Args:
        text: The string to split. ``None`` or an empty string yields ``[]``.

    Returns:
        A list of sentences with surrounding whitespace stripped; empty
        fragments are dropped.
    """
    # Imported locally because the imports visible alongside this function do
    # not include ``re``; without it the ``re.compile`` call raises NameError.
    import re

    if not text:
        return []

    boundary = re.compile(
        r'(?<!\w\.\w.)'        # not directly after an abbreviation like "e.g."
        r'(?<![A-Z][a-z]\.)'   # not directly after a title like "Dr."
        r'(?<=[.?!])'          # must follow sentence-ending punctuation
        r'(?:\s|$)'            # non-capturing: split() must not return the separator
    )
    stripped = (fragment.strip() for fragment in boundary.split(text))
    return [fragment for fragment in stripped if fragment]
10
 
11
  # Initialize the classifiers
12
  zero_shot_classifier = pipeline("zero-shot-classification", model="tasksource/ModernBERT-base-nli")