prithivMLmods committed on
Commit
f33a64a
·
verified ·
1 Parent(s): 926d2ec

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -8
app.py CHANGED
@@ -21,7 +21,6 @@ from transformers import (
21
  TextIteratorStreamer,
22
  )
23
 
24
- from transformers import Blip2Processor, Blip2ForConditionalGeneration
25
  from transformers.image_utils import load_image
26
 
27
  # Constants for text generation
@@ -49,10 +48,10 @@ model_z = Qwen2_5_VLForConditionalGeneration.from_pretrained(
49
  torch_dtype=torch.float16
50
  ).to(device).eval()
51
 
52
- # Load blip2-opt-2.7b
53
- MODEL_ID_K = "Salesforce/blip2-opt-2.7b"
54
- processor_k = Blip2Processor.from_pretrained(MODEL_ID_K, trust_remote_code=True)
55
- model_k = Blip2ForConditionalGeneration.from_pretrained(
56
  MODEL_ID_K,
57
  trust_remote_code=True,
58
  torch_dtype=torch.float16
@@ -95,7 +94,7 @@ def generate_image(model_name: str, text: str, image: Image.Image,
95
  elif model_name == "SpaceThinker-3B":
96
  processor = processor_z
97
  model = model_z
98
- elif model_name == "blip2-opt-2.7b":
99
  processor = processor_k
100
  model = model_k
101
  else:
@@ -148,7 +147,7 @@ def generate_video(model_name: str, text: str, video_path: str,
148
  elif model_name == "SpaceThinker-3B":
149
  processor = processor_z
150
  model = model_z
151
- elif model_name == "blip2-opt-2.7b":
152
  processor = processor_k
153
  model = model_k
154
  else:
@@ -251,7 +250,7 @@ with gr.Blocks(css=css, theme="bethecloud/storj_theme") as demo:
251
  with gr.Column():
252
  output = gr.Textbox(label="Output", interactive=False, lines=2, scale=2)
253
  model_choice = gr.Radio(
254
- choices=["SkyCaptioner-V1", "SpaceThinker-3B", "blip2-opt-2.7b"],
255
  label="Select Model",
256
  value="SkyCaptioner-V1"
257
  )
 
21
  TextIteratorStreamer,
22
  )
23
 
 
24
  from transformers.image_utils import load_image
25
 
26
  # Constants for text generation
 
48
  torch_dtype=torch.float16
49
  ).to(device).eval()
50
 
51
+ # Load coreOCR-7B-050325-preview
52
+ MODEL_ID_K = "prithivMLmods/coreOCR-7B-050325-preview"
53
+ processor_k = AutoProcessor.from_pretrained(MODEL_ID_K, trust_remote_code=True)
54
+ model_k = Qwen2_5_VLForConditionalGeneration.from_pretrained(
55
  MODEL_ID_K,
56
  trust_remote_code=True,
57
  torch_dtype=torch.float16
 
94
  elif model_name == "SpaceThinker-3B":
95
  processor = processor_z
96
  model = model_z
97
+ elif model_name == "coreOCR-7B-050325-preview":
98
  processor = processor_k
99
  model = model_k
100
  else:
 
147
  elif model_name == "SpaceThinker-3B":
148
  processor = processor_z
149
  model = model_z
150
+ elif model_name == "coreOCR-7B-050325-preview":
151
  processor = processor_k
152
  model = model_k
153
  else:
 
250
  with gr.Column():
251
  output = gr.Textbox(label="Output", interactive=False, lines=2, scale=2)
252
  model_choice = gr.Radio(
253
+ choices=["SkyCaptioner-V1", "SpaceThinker-3B", "coreOCR-7B-050325-preview"],
254
  label="Select Model",
255
  value="SkyCaptioner-V1"
256
  )