Update main.py
main.py
CHANGED
@@ -8,10 +8,11 @@ app = FastAPI()
 llm = None
 
 def start_llm():
+    global llm  # add this line to modify the global variable
     llm = Llama(model_path="./tinyllama-1.1b-chat.gguf")
 
-
 @app.post("/health")
+def health_check():
     return {"status": "ok"}
 
 @app.post("/deployllm")
@@ -29,5 +30,4 @@ async def stream(item: dict):
 
     return llm(prompt, max_tokens=max_tokens, temperature=temperatura)
 
-
-threading.Thread(target=start_llm).start()
+threading.Thread(target=start_llm).start()
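The key fix in the first hunk is the global statement: in Python, assigning to a name inside a function makes that name local unless it is declared global, so without the added line start_llm() would bind a throwaway local and the module-level llm would stay None. A standalone illustration of that scoping rule (the names here are illustrative, not from the Space):

counter = None

def set_local():
    counter = 1  # assignment creates a new local; the module-level counter is untouched

def set_global():
    global counter  # declare intent to rebind the module-level name
    counter = 1

set_local()
print(counter)  # still None
set_global()
print(counter)  # now 1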
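For reference, a minimal sketch of how the patched main.py could look as a whole, assuming FastAPI and llama-cpp-python. The diff elides the middle of the file, so the imports, the body of stream(), and how prompt, max_tokens, and temperatura are pulled out of item are assumptions reconstructed from the visible context lines, not the Space's actual code:

# Sketch only: the /deployllm body and the imports are assumed, not shown in the diff.
import threading

from fastapi import FastAPI
from llama_cpp import Llama

app = FastAPI()

llm = None

def start_llm():
    global llm  # rebind the module-level llm, not a function-local one
    llm = Llama(model_path="./tinyllama-1.1b-chat.gguf")

@app.post("/health")
def health_check():
    return {"status": "ok"}

@app.post("/deployllm")
async def stream(item: dict):
    # Assumed request handling: the diff only shows the return line.
    if llm is None:
        return {"status": "loading"}  # model is still loading in the background thread
    prompt = item.get("prompt", "")
    max_tokens = item.get("max_tokens", 128)
    temperatura = item.get("temperature", 0.7)
    return llm(prompt, max_tokens=max_tokens, temperature=temperatura)

# Load the model on a background thread so startup is non-blocking:
# the server can answer /health while the .gguf file is still loading.
threading.Thread(target=start_llm).start()

The background-thread load is why the llm is None guard in the sketch matters: requests that arrive before the model finishes loading would otherwise crash on a None call.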