Spaces:
Runtime error
Runtime error
Update inference.py
Browse files
- inference.py +1 -1
inference.py
CHANGED
@@ -36,7 +36,7 @@ from deepseek_vl.utils.conversation import Conversation
|
|
36 |
from transformers import BitsAndBytesConfig
|
37 |
from transformers import QuantoConfig
|
38 |
|
39 |
-
quanto_config = QuantoConfig(weights="
|
40 |
|
41 |
def load_model(model_path):
|
42 |
vl_chat_processor: VLChatProcessor = VLChatProcessor.from_pretrained(model_path)
|
|
|
36 |
from transformers import BitsAndBytesConfig
|
37 |
from transformers import QuantoConfig
|
38 |
|
39 |
+
quanto_config = QuantoConfig(weights="int4")
|
40 |
|
41 |
def load_model(model_path):
|
42 |
vl_chat_processor: VLChatProcessor = VLChatProcessor.from_pretrained(model_path)
|