Tonic committed on
Commit
cb932c7
·
verified ·
1 Parent(s): 07eab17

removes use_cache

Browse files
Files changed (1) hide show
  1. model.py +1 -2
model.py CHANGED
@@ -89,8 +89,7 @@ class SmolLM3Model:
89
  model_kwargs = {
90
  "torch_dtype": self.torch_dtype,
91
  "device_map": self.device_map,
92
- "trust_remote_code": True,
93
- "use_cache": False # Disable KV cache for training
94
  }
95
 
96
  # Only add flash attention if the model supports it
 
89
  model_kwargs = {
90
  "torch_dtype": self.torch_dtype,
91
  "device_map": self.device_map,
92
+ "trust_remote_code": True
 
93
  }
94
 
95
  # Only add flash attention if the model supports it