Update app.py
Browse files
app.py
CHANGED
@@ -102,9 +102,9 @@ def loadModel():
|
|
102 |
quantization_config=quantization_config,
|
103 |
max_memory={
|
104 |
0: "20GB", # GPU 0 with 20GB memory
|
105 |
-
1: "
|
106 |
-
2: "
|
107 |
-
|
108 |
#"cpu": "5GB" # CPU with 100GB memory
|
109 |
},
|
110 |
)
|
@@ -117,9 +117,9 @@ def loadModel():
|
|
117 |
torch_dtype=torch.float16,
|
118 |
is_trainable=False,
|
119 |
max_memory={
|
120 |
-
|
121 |
-
|
122 |
-
2: "
|
123 |
3: "40GB", # GPU 3 with 40GB memory
|
124 |
#"cpu": "5GB" # CPU with 100GB memory
|
125 |
},
|
|
|
102 |
quantization_config=quantization_config,
|
103 |
max_memory={
|
104 |
0: "20GB", # GPU 0 with 20GB memory
|
105 |
+
1: "40GB", # GPU 1 with 40GB memory
|
106 |
+
2: "40GB", # GPU 2 with 40GB memory
|
107 |
+
3: "40GB", # GPU 3 with 40GB memory
|
108 |
#"cpu": "5GB" # CPU with 100GB memory
|
109 |
},
|
110 |
)
|
|
|
117 |
torch_dtype=torch.float16,
|
118 |
is_trainable=False,
|
119 |
max_memory={
|
120 |
+
0: "20GB", # GPU 0 with 20GB memory
|
121 |
+
1: "8GB", # GPU 1 with 8GB memory
|
122 |
+
2: "8GB", # GPU 2 with 8GB memory
|
123 |
3: "40GB", # GPU 3 with 40GB memory
|
124 |
#"cpu": "5GB" # CPU with 100GB memory
|
125 |
},
|