pvanand commited on
Commit
ed88192
·
verified ·
1 Parent(s): 997768a

Create routers/llm_chat.py

Browse files
Files changed (1) hide show
  1. routers/llm_chat.py +51 -0
routers/llm_chat.py ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # routers/llm_chat.py
2
+ from fastapi import APIRouter, HTTPException, Header
3
+ import requests
4
+ import os
5
+ from pydantic import BaseModel
6
+
7
+ router = APIRouter(
8
+ prefix="/api/v1", # Prefix for all routes in this router
9
+ tags=["LLM Chat"], # Tag for OpenAPI documentation
10
+ )
11
+
12
+ # Load environment variables
13
+ LLM_API_URL = os.getenv("LLM_API_URL", "https://pvanand-audio-chat.hf.space/llm-agent")
14
+ API_KEY = os.getenv("API_KEY", "44d5c")
15
+
16
+ # Pydantic model for request validation
17
+ class LLMChatRequest(BaseModel):
18
+ prompt: str
19
+ system_message: str = ""
20
+ model_id: str = "openai/gpt-4o-mini"
21
+ conversation_id: str = "string"
22
+ user_id: str = "string"
23
+
24
+ @router.post("/llm-chat", summary="Send a prompt to the LLM", description="This endpoint sends a prompt to the LLM and returns the response.")
25
+ async def llm_chat(
26
+ request: LLMChatRequest,
27
+ x_api_key: str = Header(None, description="API Key for authentication")
28
+ ):
29
+ if x_api_key != API_KEY:
30
+ raise HTTPException(status_code=403, detail="Invalid API Key")
31
+
32
+ payload = {
33
+ "prompt": request.prompt,
34
+ "system_message": request.system_message,
35
+ "model_id": request.model_id,
36
+ "conversation_id": request.conversation_id,
37
+ "user_id": request.user_id
38
+ }
39
+
40
+ headers = {
41
+ "accept": "application/json",
42
+ "X-API-Key": x_api_key,
43
+ "Content-Type": "application/json"
44
+ }
45
+
46
+ # Use requests to call the external API
47
+ response = requests.post(LLM_API_URL, json=payload, headers=headers)
48
+ if response.status_code != 200:
49
+ raise HTTPException(status_code=response.status_code, detail="Error from LLM API")
50
+
51
+ return response.json()