Spaces:

jatingocodeo
/

SmolLM2

Runtime error

jatingocodeo committed on Jan 25

Commit

bbaff56

verified ·

1 Parent(s): 7276d4c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -51,6 +51,7 @@ class SmolLM2Config(PretrainedConfig):
 class SmolLM2ForCausalLM(PreTrainedModel):
     config_class = SmolLM2Config
     def __init__(self, config):
         super().__init__(config)
@@ -94,12 +95,17 @@ def load_model():
         }
         tokenizer.add_special_tokens(special_tokens)
         model = AutoModelForCausalLM.from_pretrained(
             model_id,
             torch_dtype=torch.float16,
-            device_map="auto",
             pad_token_id=tokenizer.pad_token_id
         )
         # Resize token embeddings to match new tokenizer
         model.resize_token_embeddings(len(tokenizer))
         return model, tokenizer

 class SmolLM2ForCausalLM(PreTrainedModel):
     config_class = SmolLM2Config
+    _no_split_modules = ["LlamaDecoderLayer"]
     def __init__(self, config):
         super().__init__(config)
         }
         tokenizer.add_special_tokens(special_tokens)
+        # Load model without device_map
         model = AutoModelForCausalLM.from_pretrained(
             model_id,
             torch_dtype=torch.float16,
             pad_token_id=tokenizer.pad_token_id
         )
+        # Move model to device manually
+        device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+        model = model.to(device)
         # Resize token embeddings to match new tokenizer
         model.resize_token_embeddings(len(tokenizer))
         return model, tokenizer