amendolajine commited on
Commit
8328d05
·
1 Parent(s): 2a7b912

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -2
app.py CHANGED
@@ -12,14 +12,19 @@ synthesiser = pipeline("text-to-speech", "suno/bark")
12
 
13
  # Function to extract abstract from PDF
14
  def extract_abstract(pdf_content):
15
- doc = fitz.open("pdf", pdf_content)
 
 
 
 
 
16
  first_page = doc[0].get_text()
17
  start_idx = first_page.lower().find("abstract")
18
  end_idx = first_page.lower().find("introduction")
19
  if start_idx != -1 and end_idx != -1:
20
  return first_page[start_idx:end_idx].strip()
21
  else:
22
- return "Abstract not found or '1 Introduction' not found in the first page."
23
 
24
  # Function to process text (summarize and convert to speech)
25
  def process_text(pdf_content):
 
12
 
13
  # Function to extract abstract from PDF
14
  def extract_abstract(pdf_content):
15
+ # Convert the byte stream to bytes
16
+ pdf_bytes = pdf_content.read()
17
+
18
+ # Open the PDF with PyMuPDF
19
+ doc = fitz.open(stream=pdf_bytes, filetype="pdf")
20
+
21
  first_page = doc[0].get_text()
22
  start_idx = first_page.lower().find("abstract")
23
  end_idx = first_page.lower().find("introduction")
24
  if start_idx != -1 and end_idx != -1:
25
  return first_page[start_idx:end_idx].strip()
26
  else:
27
+ return "Abstract not found or 'Introduction' not found in the first page."
28
 
29
  # Function to process text (summarize and convert to speech)
30
  def process_text(pdf_content):