Update app.py
Browse files
app.py
CHANGED
@@ -12,6 +12,7 @@ os.system("ulimit -l unlimited")
|
|
12 |
app = FastAPI()
|
13 |
|
14 |
hf_hub_download("TheBloke/deepseek-coder-1.3b-base-GGUF", "deepseek-coder-1.3b-base.Q5_K_M.gguf", local_dir="./")
|
|
|
15 |
model_l = Llama(model_path="./deepseek-coder-1.3b-base.Q5_K_M.gguf", n_ctx=16192, n_gpu_layers=0, n_threads=2, use_mlock=True)
|
16 |
|
17 |
|
@@ -38,7 +39,7 @@ async def completion(request: Request):
|
|
38 |
except:
|
39 |
return {"responses": "Error!"}
|
40 |
|
41 |
-
|
42 |
app = create_app(
|
43 |
Settings(
|
44 |
n_threads=2, # set to number of cpu cores
|
|
|
12 |
app = FastAPI()
|
13 |
|
14 |
hf_hub_download("TheBloke/deepseek-coder-1.3b-base-GGUF", "deepseek-coder-1.3b-base.Q5_K_M.gguf", local_dir="./")
|
15 |
+
'''
|
16 |
model_l = Llama(model_path="./deepseek-coder-1.3b-base.Q5_K_M.gguf", n_ctx=16192, n_gpu_layers=0, n_threads=2, use_mlock=True)
|
17 |
|
18 |
|
|
|
39 |
except:
|
40 |
return {"responses": "Error!"}
|
41 |
|
42 |
+
'''
|
43 |
app = create_app(
|
44 |
Settings(
|
45 |
n_threads=2, # set to number of cpu cores
|