Update app.py
Browse files
app.py
CHANGED
@@ -7,7 +7,7 @@ import numpy as np
|
|
7 |
from sklearn.feature_extraction.text import TfidfVectorizer
|
8 |
from sklearn.metrics.pairwise import cosine_similarity
|
9 |
from io import StringIO
|
10 |
-
|
11 |
# Function to extract text from a PDF file
|
12 |
def extract_text_from_pdf(pdf_file):
|
13 |
reader = PyPDF2.PdfReader(pdf_file)
|
|
|
7 |
from sklearn.feature_extraction.text import TfidfVectorizer
|
8 |
from sklearn.metrics.pairwise import cosine_similarity
|
9 |
from io import StringIO
|
10 |
+import pytesseract
|
11 |
# Function to extract text from a PDF file
|
12 |
def extract_text_from_pdf(pdf_file):
|
13 |
reader = PyPDF2.PdfReader(pdf_file)
|