prithivMLmods committed
Commit 42f9ebc · verified · 1 Parent(s): 0ed1602

Update app.py

Files changed (1)
  1. app.py +3 -3
app.py CHANGED
@@ -1,4 +1,6 @@
 import os
+os.environ["VLLM_ENABLE_CHUNKED_PREFILL"] = "False"  # Disable chunked prefill as a workaround
+
 import re
 import uuid
 import json
@@ -93,9 +95,7 @@ SYSTEM_PROMPT = load_system_prompt(MODEL_ID, "SYSTEM_PROMPT.txt")
 device = "cuda" if torch.cuda.is_available() else "cpu"
 
 # Initialize the Mistral LLM via vllm.
-# Note: Running this model on GPU may require very high VRAM.
-# The 'enforce_eager=True' parameter disables asynchronous output,
-# which avoids the NotImplementedError on platforms that do not support it.
+# The 'enforce_eager=True' parameter disables asynchronous output.
 llm = LLM(model=MODEL_ID, tokenizer_mode="mistral", device=device, enforce_eager=True)
 
 # -----------------------------------------------------------------------------
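For context, a minimal sketch of how the patched initialization fits together end to end. The environment variable and enforce_eager=True come straight from this commit; everything else (the placeholder MODEL_ID, the SamplingParams values, and the generate call) is an illustrative assumption, not part of the diff.

import os

# From the commit: disable chunked prefill before vllm constructs the engine
# (environment variables must be set before the LLM object is created).
os.environ["VLLM_ENABLE_CHUNKED_PREFILL"] = "False"

import torch
from vllm import LLM, SamplingParams

MODEL_ID = "your/model-id"  # hypothetical placeholder; app.py defines the real MODEL_ID

device = "cuda" if torch.cuda.is_available() else "cpu"

# From the commit: enforce_eager=True disables asynchronous output, which
# avoids the NotImplementedError on platforms that do not support it.
llm = LLM(model=MODEL_ID, tokenizer_mode="mistral", device=device, enforce_eager=True)

# Illustrative usage (not in the diff): one blocking generate call.
sampling = SamplingParams(temperature=0.7, max_tokens=128)
outputs = llm.generate(["Hello!"], sampling)
print(outputs[0].outputs[0].text)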