Spaces:

rawc0der
/

t2i-model-mayhem

Sleeping

rawc0der committed on Jan 19

Commit

96db79f

1 Parent(s): b9620be

change model context

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,4 +1,5 @@
 import spaces
 from fastapi import FastAPI, HTTPException, UploadFile, File
 from typing import Optional, Dict, Any
 import torch
@@ -123,8 +124,8 @@ class ModelManager:
                 if hasattr(self.current_pipeline, 'enable_xformers_memory_efficient_attention'):
                     self.current_pipeline.enable_xformers_memory_efficient_attention()
-                if self._device == "cuda":
-                    self.current_pipeline.enable_model_cpu_offload()
                 self.current_model = model_name
@@ -159,7 +160,8 @@ class ModelContext:
         pipeline = model_manager.load_model(self.model_name)
         if hasattr(pipeline, 'reset_device_map'):
             pipeline.reset_device_map()
-        pipeline.enable_model_cpu_offload()
         return pipeline
     def __exit__(self, exc_type, exc_val, exc_tb):

 import spaces
+from accelerate import dispatch_model
 from fastapi import FastAPI, HTTPException, UploadFile, File
 from typing import Optional, Dict, Any
 import torch
                 if hasattr(self.current_pipeline, 'enable_xformers_memory_efficient_attention'):
                     self.current_pipeline.enable_xformers_memory_efficient_attention()
+                # if self._device == "cuda":
+                #     self.current_pipeline.enable_model_cpu_offload()
                 self.current_model = model_name
         pipeline = model_manager.load_model(self.model_name)
         if hasattr(pipeline, 'reset_device_map'):
             pipeline.reset_device_map()
+        # Enable automatic device mapping strategy
+        dispatch_model(pipeline)
         return pipeline
     def __exit__(self, exc_type, exc_val, exc_tb):