Spaces:

VGG11
/

armenian_chatbot_bert_multilingual

Runtime error

Mary12 committed on Aug 21, 2023

Commit

6bd0993

1 Parent(s): d9c2c2b

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -38,21 +38,26 @@ def extract_text_from_txt(file_path):
         return txt_file.read()
     # return text
-def extract_text_from_doc(file_path):
-    # text = ""
-    # doc = docx.Document(file_path)
-    # for texts in doc.paragraphs:
-    #     text+= texts.text + "\n"
-    # return texts
     doc = docx.Document(file_path)
-    fullText = []
-    for para in doc.paragraphs:
-        fullText.append(para.text)
-    return '\n'.join(fullText)
 def model(model_name):
   tokenizer = AutoTokenizer.from_pretrained(model_name)
   model = AutoModelForQuestionAnswering.from_pretrained(model_name,return_dict = False)

         return txt_file.read()
     # return text
+# def extract_text_from_doc(file_path):
+#     doc = docx.Document(file_path)
+#     fullText = []
+#     for para in doc.paragraphs:
+#         fullText.append(para.text)
+#     return '\n'.join(fullText)
+def extract_text_from_paragraph(para):
+    return para.text
+def extract_text_from_doc(file_path):
     doc = docx.Document(file_path)
+    with concurrent.futures.ThreadPoolExecutor() as executor:
+        results = list(executor.map(extract_text_from_paragraph, doc.paragraphs))
+    return '\n'.join(results)
 def model(model_name):
   tokenizer = AutoTokenizer.from_pretrained(model_name)
   model = AutoModelForQuestionAnswering.from_pretrained(model_name,return_dict = False)