Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -205,10 +205,20 @@ def load_model():
205 |       tokenizer.add_special_tokens(special_tokens)
206 |
207 |       print("Loading model from Hugging Face Hub...")
208 |       model = AutoModelForCausalLM.from_pretrained(
209 |           model_id,
210 |           torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
211 | -         trust_remote_code=True
212 |       )
213 |
214 |       # Move model to device manually
205 |       tokenizer.add_special_tokens(special_tokens)
206 |
207 |       print("Loading model from Hugging Face Hub...")
208 | +     # Create config first
209 | +     config = SmolLM2Config(
210 | +         pad_token_id=tokenizer.pad_token_id,
211 | +         bos_token_id=tokenizer.bos_token_id,
212 | +         eos_token_id=tokenizer.eos_token_id
213 | +     )
214 | +
215 | +     # Load model from Hub
216 |       model = AutoModelForCausalLM.from_pretrained(
217 |           model_id,
218 | +         config=config,
219 |           torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
220 | +         trust_remote_code=True,
221 | +         low_cpu_mem_usage=True
222 |       )
223 |
224 |       # Move model to device manually