Spaces:
Paused
Paused
Upload main.py
Browse files
changed to gguf
main.py
CHANGED
@@ -19,8 +19,9 @@ app = FastAPI(docs_url="/")
|
|
19 |
|
20 |
# pipe = pipeline(model="TheBloke/Llama-2-7B-GGML/llama-2-7b.ggmlv3.q4_0.bin")
|
21 |
|
22 |
-
model_name_or_path = "TheBloke/Llama-2-7B-GGML"
|
23 |
-
model_basename = "llama-2-7b.ggmlv3.q4_0.bin"
|
|
|
24 |
model_path = hf_hub_download(repo_id=model_name_or_path, filename=model_basename)
|
25 |
|
26 |
llm = Llama(model_path=model_path)
|
|
|
19 |
|
20 |
# pipe = pipeline(model="TheBloke/Llama-2-7B-GGML/llama-2-7b.ggmlv3.q4_0.bin")
|
21 |
|
22 |
+
model_name_or_path = "TheBloke/Llama-2-7B-GGUF"
|
23 |
+
model_basename = "llama-2-7b.Q4_0.gguf"
|
24 |
+
|
25 |
model_path = hf_hub_download(repo_id=model_name_or_path, filename=model_basename)
|
26 |
|
27 |
llm = Llama(model_path=model_path)
|