Update services/model_service.py
services/model_service.py
CHANGED
@@ -1,4 +1,3 @@
-# services/model_service.py
 from transformers import AutoTokenizer, AutoModelForCausalLM, LlamaConfig
 from sentence_transformers import SentenceTransformer
 import torch
@@ -28,15 +27,13 @@ class ModelService:
         # Load tokenizer
         self.tokenizer = AutoTokenizer.from_pretrained(settings.MODEL_NAME)

-        # Load model configuration
+        # Load model configuration without modifying rope_scaling
         config = LlamaConfig.from_pretrained(settings.MODEL_NAME)

+        # Remove rope_scaling if present
         if hasattr(config, "rope_scaling"):
-            logger.info("
-            config.rope_scaling = {
-                "type": "linear",  # Ensure the type is valid
-                "factor": 32.0  # Ensure factor is a valid float
-            }
+            logger.info("Removing rope_scaling from configuration...")
+            config.rope_scaling = None

         # Load model with the updated configuration
         self.model = AutoModelForCausalLM.from_pretrained(