Create app.py
app.py ADDED
from huggingface_hub import InferenceClient
from fastapi import FastAPI
from pydantic import BaseModel
import uvicorn
import os

app = FastAPI()

MODEL = "mistralai/Mistral-7B-Instruct-v0.1"
HF_TOKEN = os.environ["HF_TOKEN"]

client = InferenceClient(model=MODEL, token=HF_TOKEN)

class Prompt(BaseModel):
    message: str

@app.post("/chat")
async def chat(prompt: Prompt):
    system_prompt = (
        "You are a beginner programming student helping a peer. "
        "Offer hints, ask questions, and support understanding—don’t give full solutions."
    )
    # Mistral-7B-Instruct-v0.1 expects a plain [INST] ... [/INST] template; it was
    # not trained with Llama-2's <<SYS>> tags, so the system prompt is folded
    # directly into the instruction block.
    full_prompt = f"<s>[INST] {system_prompt}\n\n{prompt.message} [/INST]"

    output = client.text_generation(
        prompt=full_prompt,
        max_new_tokens=200,
        temperature=0.7,
        top_p=0.95,
        do_sample=True,
    )
    return {"reply": output.strip()}

if __name__ == "__main__":
    # Hugging Face Spaces route traffic to port 7860 by default.
    uvicorn.run(app, host="0.0.0.0", port=7860)
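For reference, a minimal sketch of calling the /chat endpoint once the app is running. The base URL, port 7860 (the usual Spaces default), and the example message are assumptions, and the requests package is not a dependency of app.py itself:

import requests

# Placeholder URL: substitute your Space's public URL, or use
# http://localhost:7860 when running app.py locally with HF_TOKEN set.
BASE_URL = "http://localhost:7860"

resp = requests.post(
    f"{BASE_URL}/chat",
    json={"message": "My for loop in Python never stops. What should I check?"},
    timeout=60,
)
resp.raise_for_status()
print(resp.json()["reply"])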