Spaces:

amendolajine
/

OPIT

Running

amendolajine committed on Nov 29, 2023

Commit

520e96b

1 Parent(s): 9b3a68b

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -11,10 +11,11 @@ model = BartForConditionalGeneration.from_pretrained('facebook/bart-large-cnn')
 synthesiser = pipeline("text-to-speech", "suno/bark")
 # Function to extract abstract from PDF
-def extract_abstract(pdf_content):
-    # Convert NamedString object to bytes
-    pdf_bytes = pdf_content["content"]
     doc = fitz.open(stream=pdf_bytes, filetype="pdf")
     first_page = doc[0].get_text()
     start_idx = first_page.lower().find("abstract")
@@ -25,8 +26,8 @@ def extract_abstract(pdf_content):
         return "Abstract not found or 'Introduction' not found in the first page."
 # Function to process text (summarize and convert to speech)
-def process_text(pdf_content):
-    abstract_text = extract_abstract(pdf_content)
     # Generate summary
     inputs = tokenizer([abstract_text], max_length=1024, return_tensors='pt', truncation=True)

 synthesiser = pipeline("text-to-speech", "suno/bark")
 # Function to extract abstract from PDF
+def extract_abstract(pdf_file):
+    # Read PDF file
+    pdf_bytes = pdf_file.read()
+    # Open PDF with fitz
     doc = fitz.open(stream=pdf_bytes, filetype="pdf")
     first_page = doc[0].get_text()
     start_idx = first_page.lower().find("abstract")
         return "Abstract not found or 'Introduction' not found in the first page."
 # Function to process text (summarize and convert to speech)
+def process_text(pdf_file):
+    abstract_text = extract_abstract(pdf_file)
     # Generate summary
     inputs = tokenizer([abstract_text], max_length=1024, return_tensors='pt', truncation=True)