Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
@@ -11,9 +11,9 @@ print(f"CUDA device: {torch.cuda.get_device_name(torch.cuda.current_device())}")
|
|
11 |
For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
|
12 |
"""
|
13 |
# client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
|
14 |
-
client = InferenceClient("deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B")
|
15 |
-
|
16 |
|
|
|
17 |
def respond(
|
18 |
message,
|
19 |
history: list[tuple[str, str]],
|
|
|
11 |
For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
|
12 |
"""
|
13 |
# client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
|
14 |
+
# InferenceClient is a remote HTTP client, not a torch module: it has no
# `.to()` method, so chaining `.to('cuda')` raises AttributeError at import.
# NOTE(review): running the model on the Space's own GPU would need the
# weights loaded locally rather than through this client — confirm intent.
client = InferenceClient("deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B")
|
|
|
15 |
|
16 |
+
@spaces.GPU
|
17 |
def respond(
|
18 |
message,
|
19 |
history: list[tuple[str, str]],
|