# Page header captured along with this file (not part of the program):
# kumar989's picture
# Create app.py
# f575c3b
# raw
# history blame
# 500 Bytes
import os
import PyPDF2
from PIL import Image
import pytesseract
# Working folders used by this script:
#   pdf_directory  - PDF resumes and job applications
#   text_directory - text extracted from the PDFs
#   ocr_directory  - OCR output for scanned PDFs
pdf_directory, text_directory, ocr_directory = (
    '/content/pdf_files',
    '/content/extracted_text',
    '/content/ocr_output',
)

# Make sure every working folder is present; exist_ok=True keeps this
# from raising when a folder was already created by an earlier run.
for _directory in (pdf_directory, text_directory, ocr_directory):
    os.makedirs(_directory, exist_ok=True)
del _directory  # leave only the three path constants in the namespace