Spaces:

la04
/

RAG_test_1

Sleeping

la04 committed on Jan 9

Commit

f965a1f

verified ·

1 Parent(s): bb5fea8

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -11,18 +11,14 @@ import os
 class LayoutLMv3OCR:
     def __init__(self):
         self.processor = LayoutLMv3Processor.from_pretrained("microsoft/layoutlmv3-base")
-        # Ändere AutoModelForSeq2SeqLM zu AutoModelForTokenClassification
         self.model = AutoModelForTokenClassification.from_pretrained("microsoft/layoutlmv3-base")
     def extract_text(self, pdf_path):
         images = convert_from_path(pdf_path)
         text_pages = []
         for image in images:
-            # Bilder werden für die OCR-Prozesse vorbereitet
             inputs = self.processor(images=image, return_tensors="pt")
-            # Modell wird zur Textextraktion genutzt
             outputs = self.model(**inputs)
-            # Hier wird der dekodierte Text extrahiert
             text = self.processor.batch_decode(outputs.logits, skip_special_tokens=True)[0]
             text_pages.append(text)
         return text_pages
@@ -52,9 +48,10 @@ def chatbot_response(pdf, question):
     os.remove(pdf_path)
     return answer
-pdf_input = gr.inputs.File(label="PDF-Datei hochladen")
-question_input = gr.inputs.Textbox(label="Frage eingeben")
-response_output = gr.outputs.Textbox(label="Antwort")
 interface = gr.Interface(
     fn=chatbot_response,

 class LayoutLMv3OCR:
     """OCR helper that turns the pages of a PDF into plain text.

     Each page is rendered to an image and passed through the LayoutLMv3
     processor; the page text is recovered by decoding the token ids that
     the processor produces for the image.
     """

     def __init__(self):
         self.processor = LayoutLMv3Processor.from_pretrained("microsoft/layoutlmv3-base")
         # Not needed by extract_text, but still loaded so that code which
         # accesses `.model` on an instance keeps working.
         self.model = AutoModelForTokenClassification.from_pretrained("microsoft/layoutlmv3-base")

     def extract_text(self, pdf_path):
         """Return the recognised text of every page of a PDF.

         Args:
             pdf_path: Path of the PDF file to read.

         Returns:
             A list with one string per page, in page order.
         """
         text_pages = []
         for image in convert_from_path(pdf_path):
             inputs = self.processor(images=image, return_tensors="pt")
             # Decode the token ids built by the processor. The model's
             # token-classification logits are per-token label scores, not
             # token ids, so they cannot be decoded back into text.
             text = self.processor.batch_decode(inputs["input_ids"], skip_special_tokens=True)[0]
             text_pages.append(text)
         return text_pages
     os.remove(pdf_path)
     return answer
+# Ändere 'inputs' und 'outputs' zur neuen Gradio API
+pdf_input = gr.File(label="PDF-Datei hochladen")
+question_input = gr.Textbox(label="Frage eingeben")
+response_output = gr.Textbox(label="Antwort")
 interface = gr.Interface(
     fn=chatbot_response,