Spaces:
Running
on
Zero
Running
on
Zero
Load in 4bits
Browse files
app.py
CHANGED
@@ -71,7 +71,8 @@ def get_interface(model_name: str):
         additional_model_config={
             "device_map": "auto" if has_cuda else "cpu",
             "quantization_config": BitsAndBytesConfig(
-
+                load_in_4bit=True,
+                llm_int8_enable_fp32_cpu_offload=True
             ) if has_cuda else None,
         },
         **model_config