visual / app.py
ravinder012's picture
Create app.py
dd9585a verified
raw
history blame contribute delete
258 Bytes
# Load model directly
from transformers import AutoProcessor, AutoModelForImageTextToText
# Single checkpoint identifier used for both loads below, so the processor
# and the model always come from the same repository.
_CHECKPOINT_ID = "bytedance-research/UI-TARS-2B-SFT"

# Both objects are built at module import time via `from_pretrained`.
# NOTE(review): presumably this fetches and caches files from the Hugging
# Face Hub on first run - confirm before importing this module in an
# environment without network access.
processor = AutoProcessor.from_pretrained(_CHECKPOINT_ID)
model = AutoModelForImageTextToText.from_pretrained(_CHECKPOINT_ID)