Update app.py
app.py CHANGED

@@ -1,7 +1,7 @@
 #!/usr/bin/env python3
 import os
 import glob
-import time
+import time
 import streamlit as st
 from PIL import Image
 import torch
@@ -172,9 +172,8 @@ with tab2:
     if st.button("Run OCR 🚀", key="ocr_run"):
         if ocr_model == "Qwen2-VL-OCR-2B":
             processor, model = load_ocr_qwen2vl()
-            #
-
-            inputs = processor(messages, return_tensors="pt").to("cpu")
+            # Simplified input: pass image and text directly
+            inputs = processor(text=prompt, images=image, return_tensors="pt").to("cpu")
             outputs = model.generate(**inputs, max_new_tokens=1024)
             text = processor.batch_decode(outputs, skip_special_tokens=True)[0]
         else:  # GOT-OCR2_0
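For context, the edited hunk stops passing the raw messages list to the processor and instead hands it the prompt string and the PIL image directly. Below is a minimal, self-contained sketch of how that Qwen2-VL path typically fits together with the Hugging Face transformers API; the checkpoint ID, prompt wording, and image path are assumptions for illustration and are not taken from this repo.

import torch
from PIL import Image
from transformers import AutoProcessor, Qwen2VLForConditionalGeneration

# Assumed checkpoint; the app's load_ocr_qwen2vl() may load a different one.
MODEL_ID = "Qwen/Qwen2-VL-2B-Instruct"
processor = AutoProcessor.from_pretrained(MODEL_ID)
model = Qwen2VLForConditionalGeneration.from_pretrained(MODEL_ID, torch_dtype=torch.float32).to("cpu")

image = Image.open("sample.png").convert("RGB")  # hypothetical input image

# Build the chat-style prompt string the processor expects, then pass text + image
# directly, mirroring the changed line above.
messages = [{"role": "user", "content": [
    {"type": "image"},
    {"type": "text", "text": "Extract all text from this image."},
]}]
prompt = processor.apply_chat_template(messages, add_generation_prompt=True)

inputs = processor(text=prompt, images=image, return_tensors="pt").to("cpu")
outputs = model.generate(**inputs, max_new_tokens=1024)
text = processor.batch_decode(outputs, skip_special_tokens=True)[0]
print(text)

In the app itself, prompt and image would come from the Streamlit widgets in tab2, so only the last three lines correspond to the edited hunk.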