Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
import streamlit as st
|
2 |
from transformers import pipeline, VisionEncoderDecoderModel, ViTImageProcessor
|
3 |
from PIL import Image
|
4 |
-
import fitz
|
5 |
import logging
|
6 |
from concurrent.futures import ThreadPoolExecutor
|
7 |
import torch
|
@@ -17,9 +17,9 @@ def setup_logging():
|
|
17 |
@st.cache_resource
|
18 |
def load_models():
|
19 |
logging.info("Loading Hugging Face models...")
|
20 |
-
#
|
21 |
-
processor = ViTImageProcessor.from_pretrained("
|
22 |
-
model = VisionEncoderDecoderModel.from_pretrained("
|
23 |
|
24 |
# Load translation models
|
25 |
translator_hi = pipeline("translation", model="Helsinki-NLP/opus-mt-en-hi")
|
|
|
1 |
import streamlit as st
|
2 |
from transformers import pipeline, VisionEncoderDecoderModel, ViTImageProcessor
|
3 |
from PIL import Image
|
4 |
+
import fitz # PyMuPDF for PDF processing
|
5 |
import logging
|
6 |
from concurrent.futures import ThreadPoolExecutor
|
7 |
import torch
|
|
|
17 |
@st.cache_resource
|
18 |
def load_models():
|
19 |
logging.info("Loading Hugging Face models...")
|
20 |
+
# Use an alternative model from Hugging Face for image captioning
|
21 |
+
processor = ViTImageProcessor.from_pretrained("google/vit-base-patch16-224")
|
22 |
+
model = VisionEncoderDecoderModel.from_pretrained("google/vit-base-patch16-224")
|
23 |
|
24 |
# Load translation models
|
25 |
translator_hi = pipeline("translation", model="Helsinki-NLP/opus-mt-en-hi")
|