edithram23 committed on
Commit
39f0789
·
verified ·
1 Parent(s): 57bcde6

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +19 -10
app.py CHANGED
@@ -182,16 +182,25 @@ if uploaded_file is not None:
182
  sentences = sentence_tokenize(text)
183
  for sent in sentences:
184
  x = mask_generation(sent)
185
-
186
- sent_n_q_c=[]
187
- sent_n = list(set(sent.lower().replace('.',' ').split("\n")))
188
- for i in sent_n:
189
- for j in i.split(" "):
190
- sent_n_q_c+=j.split(',')
191
- x_q = x.lower().replace('.',' ').split(' ')
192
- e=[]
193
- for i in x_q:
194
- e+=i.split(',')
 
 
 
 
 
 
 
 
 
195
  t5_words=set(sent_n_q_c).difference(set(e))
196
  entities,words_out = extract_entities(sent)
197
  # print("\nwords_out:",words_out)
 
182
  sentences = sentence_tokenize(text)
183
  for sent in sentences:
184
  x = mask_generation(sent)
185
+ sent_out = re.sub("\n","|",sent)
186
+ sent_out = re.sub(".","|",sent_out)
187
+ sent_out = re.sub(",","|",sent_out)
188
+ sent_out = re.sub(" ","|",sent_out)
189
+ sent_n_q_c=sent_out.split("|")
190
+ # sent_n_q_c=[]
191
+ # sent_n = list(set(sent.lower().replace('.',' ').split("\n")))
192
+ # for i in sent_n:
193
+ # for j in i.split(" "):
194
+ # sent_n_q_c+=j.split(',')
195
+ # x_q = x.lower().replace('.',' ').split(' ')
196
+ # e=[]
197
+ # for i in x_q:
198
+ # e+=i.split(',')
199
+ sent_out = re.sub("\n","|",x)
200
+ sent_out = re.sub(".","|",sent_out)
201
+ sent_out = re.sub(",","|",sent_out)
202
+ sent_out = re.sub(" ","|",sent_out)
203
+ e = sent_out.split("|")
204
  t5_words=set(sent_n_q_c).difference(set(e))
205
  entities,words_out = extract_entities(sent)
206
  # print("\nwords_out:",words_out)