mdasad3617 committed on
Commit
ed4ebee
·
verified ·
1 Parent(s): 57cc735

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -1,7 +1,7 @@
1
  import streamlit as st
2
  from transformers import pipeline, VisionEncoderDecoderModel, ViTImageProcessor
3
  from PIL import Image
4
- import fitz
5
  import logging
6
  from concurrent.futures import ThreadPoolExecutor
7
  import torch
@@ -17,9 +17,9 @@ def setup_logging():
17
  @st.cache_resource
18
  def load_models():
19
  logging.info("Loading Hugging Face models...")
20
- # Load image-to-text model from Hugging Face
21
- processor = ViTImageProcessor.from_pretrained("microsoft/vision-transformation-transformer")
22
- model = VisionEncoderDecoderModel.from_pretrained("microsoft/vision-transformation-transformer")
23
 
24
  # Load translation models
25
  translator_hi = pipeline("translation", model="Helsinki-NLP/opus-mt-en-hi")
 
1
  import streamlit as st
2
  from transformers import pipeline, VisionEncoderDecoderModel, ViTImageProcessor
3
  from PIL import Image
4
+ import fitz # PyMuPDF for PDF processing
5
  import logging
6
  from concurrent.futures import ThreadPoolExecutor
7
  import torch
 
17
  @st.cache_resource
18
  def load_models():
19
  logging.info("Loading Hugging Face models...")
20
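+ # Use an alternative model from Hugging Face for image captioning (NOTE(review): google/vit-base-patch16-224 is published as an image-classification ViT checkpoint, not an encoder-decoder captioning model; confirm it loads with VisionEncoderDecoderModel)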
21
+ processor = ViTImageProcessor.from_pretrained("google/vit-base-patch16-224")
22
+ model = VisionEncoderDecoderModel.from_pretrained("google/vit-base-patch16-224")
23
 
24
  # Load translation models
25
  translator_hi = pipeline("translation", model="Helsinki-NLP/opus-mt-en-hi")