Spaces:

amendolajine
/

OPIT

Running

amendolajine committed on Nov 29, 2023

Commit

0cdfeaa

1 Parent(s): 962d09d

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -11,10 +11,7 @@ model = BartForConditionalGeneration.from_pretrained('facebook/bart-large-cnn')
 synthesiser = pipeline("text-to-speech", "suno/bark")
 # Function to extract abstract from PDF
-def extract_abstract(pdf_file):
-    # Access the byte content of the uploaded file
-    pdf_bytes = pdf_file["data"]
     # Open PDF with fitz
     doc = fitz.open(stream=pdf_bytes, filetype="pdf")
     first_page = doc[0].get_text()
@@ -26,8 +23,10 @@ def extract_abstract(pdf_file):
         return "Abstract not found or 'Introduction' not found in the first page."
 # Function to process text (summarize and convert to speech)
-def process_text(pdf_file):
-    abstract_text = extract_abstract(pdf_file)
     # Generate summary
     inputs = tokenizer([abstract_text], max_length=1024, return_tensors='pt', truncation=True)

 synthesiser = pipeline("text-to-speech", "suno/bark")
 # Function to extract abstract from PDF
+def extract_abstract(pdf_bytes):
     # Open PDF with fitz
     doc = fitz.open(stream=pdf_bytes, filetype="pdf")
     first_page = doc[0].get_text()
         return "Abstract not found or 'Introduction' not found in the first page."
 # Function to process text (summarize and convert to speech)
+def process_text(uploaded_file):
+    # Extract the file data (byte content) from the uploaded file
+    pdf_bytes = uploaded_file["data"]
+    abstract_text = extract_abstract(pdf_bytes)
     # Generate summary
     inputs = tokenizer([abstract_text], max_length=1024, return_tensors='pt', truncation=True)