Spaces:
Sleeping
Sleeping
vkrishnan569
committed on
Commit
•
415b325
1
Parent(s):
3280898
Server Deployment
Browse files
- Dockerfile +1 -1
- main.py +1 -1
Dockerfile
CHANGED
@@ -8,4 +8,4 @@ RUN pip install --no-cache-dir --upgrade -r /code/requirements.txt
|
|
8 |
|
9 |
COPY . .
|
10 |
|
11 |
-
CMD ["
|
|
|
8 |
|
9 |
COPY . .
|
10 |
|
11 |
+
CMD ["uvicorn", "-b", "0.0.0.0:7860","model:app"]
|
main.py
CHANGED
@@ -3,7 +3,7 @@ from llama_cpp import Llama
|
|
3 |
from huggingface_hub import hf_hub_download
|
4 |
|
5 |
# Initialize the Llama model with chat format set to "llama-2"
|
6 |
-
llm = Llama(model_path="
|
7 |
|
8 |
# Define the system prompt
|
9 |
system_prompt = (
|
|
|
3 |
from huggingface_hub import hf_hub_download
|
4 |
|
5 |
# Initialize the Llama model with chat format set to "llama-2"
|
6 |
+
llm = Llama(model_path="./llama-2-7b-chat.Q2_K.gguf", chat_format="llama-2")
|
7 |
|
8 |
# Define the system prompt
|
9 |
system_prompt = (
|