Spaces:
Runtime error
Runtime error
Update Dockerfile
Browse files- Dockerfile +2 -5
Dockerfile
CHANGED
@@ -3,8 +3,5 @@ FROM ghcr.io/huggingface/text-generation-inference:latest
|
|
3 |
# Define the model to use
|
4 |
ENV MODEL_ID="adaptiveaiventures/Llama-2-7b-chat-finetune"
|
5 |
|
6 |
-
# Set the number of GPU shards (
|
7 |
-
|
8 |
-
|
9 |
-
# Run the TGI server
|
10 |
-
CMD ["--model-id", "${MODEL_ID}", "--port", "8080", "--num-shard", "${NUM_SHARD}"]
|
|
|
3 |
# Define the model to use
|
4 |
ENV MODEL_ID="adaptiveaiventures/Llama-2-7b-chat-finetune"
|
5 |
|
6 |
+
# Set the number of GPU shards (1 if using CPU, 2+ if using multiple GPUs)
|
7 |
+
CMD ["--model-id", "adaptiveaiventures/Llama-2-7b-chat-finetune", "--port", "8080", "--num-shard", "1"]
|
|
|
|
|
|