Redmind committed on
Commit
f081ce4
·
verified ·
1 Parent(s): 117bf92

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -1,6 +1,7 @@
1
  from fastapi import FastAPI
2
  import os
3
  import fitz # PyMuPDF for PDFs
 
4
  from pptx import Presentation # python-pptx for PowerPoint
5
  from sentence_transformers import SentenceTransformer # Text embeddings
6
  import torch
@@ -49,7 +50,7 @@ def search(query: str):
49
  ### Step 1: Extract Text from PDF ###
50
  def extract_text_from_pdf(pdf_path):
51
  text = ""
52
- doc = fitz.open(pdf_path)
53
  for page in doc:
54
  text += page.get_text() + "\n"
55
  return text.strip()
 
1
  from fastapi import FastAPI
2
  import os
3
  import fitz # PyMuPDF for PDFs
4
+ import pymupdf
5
  from pptx import Presentation # python-pptx for PowerPoint
6
  from sentence_transformers import SentenceTransformer # Text embeddings
7
  import torch
 
50
  ### Step 1: Extract Text from PDF ###
51
  def extract_text_from_pdf(pdf_path):
52
  text = ""
53
+ doc = pymupdf.open(pdf_path)
54
  for page in doc:
55
  text += page.get_text() + "\n"
56
  return text.strip()