Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
@@ -274,11 +274,11 @@ with gr.Blocks(css=css, theme="bethecloud/storj_theme") as demo:
|
|
274 |
value="SkyCaptioner-V1"
|
275 |
)
|
276 |
|
277 |
-
gr.Markdown("**Model Info
|
278 |
-
gr.Markdown("
|
279 |
-
gr.Markdown("
|
280 |
-
gr.Markdown("
|
281 |
-
gr.Markdown("
|
282 |
|
283 |
image_submit.click(
|
284 |
fn=generate_image,
|
|
|
274 |
value="SkyCaptioner-V1"
|
275 |
)
|
276 |
|
277 |
+
gr.Markdown("**Model Info 💻** | [Report Bug](https://huggingface.co/collections/prithivMLmods/multimodal-implementations-67c9982ea04b39f0608badb0)")
|
278 |
+
gr.Markdown("> [SkyCaptioner-V1](https://huggingface.co/Skywork/SkyCaptioner-V1): structural video captioning model designed to generate high-quality, structural descriptions for video data. It integrates specialized sub-expert models.")
|
279 |
+
gr.Markdown("> [SpaceThinker-Qwen2.5VL-3B](https://huggingface.co/remyxai/SpaceThinker-Qwen2.5VL-3B): thinking/reasoning multimodal/vision-language model (VLM) trained to enhance spatial reasoning.")
|
280 |
+
gr.Markdown("> [coreOCR-7B-050325-preview](https://huggingface.co/prithivMLmods/coreOCR-7B-050325-preview): model is a fine-tuned version of qwen/qwen2-vl-7b, optimized for document-level optical character recognition (ocr), long-context vision-language understanding.")
|
281 |
+
gr.Markdown("> [Imgscope-OCR-2B-0527](https://huggingface.co/prithivMLmods/Imgscope-OCR-2B-0527): fine-tuned version of qwen2-vl-2b-instruct, specifically optimized for messy handwriting recognition, document ocr, realistic handwritten ocr, and math problem solving with latex formatting.")
|
282 |
|
283 |
image_submit.click(
|
284 |
fn=generate_image,
|