Spaces:
Runtime error
Runtime error
Commit
·
20d1f1f
1
Parent(s):
d1340d0
Act
Browse files
app.py
CHANGED
@@ -8,7 +8,7 @@ For more information on `huggingface_hub` Inference API support, please check th
|
|
8 |
"""
|
9 |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
10 |
client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
|
11 |
-
pipe = pipeline("text-generation", model="HiTZ/latxa-7b-v1"
|
12 |
|
13 |
|
14 |
def respond(
|
|
|
8 |
"""
|
9 |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
10 |
client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
|
11 |
+
pipe = pipeline("text-generation", model="HiTZ/latxa-7b-v1", device_map="auto", model_kwargs={"load_in_8bit": True})
|
12 |
|
13 |
|
14 |
def respond(
|