# flare/routes/chat_handler.py
# Uploaded by ciyidogan ("Upload chat_handler.py", commit 605e58b, verified)
"""
Flare – Chat Handler (REST API Only - Realtime moved to Event-Driven)
====================================================================
"""
import re, json, sys, httpx, os
from datetime import datetime
from typing import Dict, List, Optional, Any
from fastapi import APIRouter, HTTPException, Header, Request
from pydantic import BaseModel
import requests
from llm.prompt_builder import build_intent_prompt, build_parameter_prompt
from utils.logger import log_info, log_error, log_warning, log_debug
from api.api_executor import call_api as execute_api
from config.config_provider import ConfigProvider
from llm.validation_engine import validate
from chat_session.session import session_store, Session
# Initialize router
# Every endpoint in this module is registered on this router via @router.post.
router = APIRouter()
# ───────────────────────── GLOBAL VARS ───────────────────────── #
# Application configuration, fetched once at import time.
cfg = ConfigProvider.get()
# LLM provider instance used by the handlers below; filled in by
# setup_llm_provider() (or lazily inside start_session).
llm_provider = None
# ───────────────────────── HELPERS ───────────────────────── #
def _trim_response(raw: str) -> str:
"""
Remove everything after the first logical assistant block or intent tag.
Also strips trailing 'assistant' artifacts and prompt injections.
"""
# Stop at our own rules if model leaked them
for stop in ["#DETECTED_INTENT", "⚠️", "\nassistant", "assistant\n", "assistant"]:
idx = raw.find(stop)
if idx != -1:
raw = raw[:idx]
# Normalise selamlama
raw = re.sub(r"Hoş[\s-]?geldin(iz)?", "Hoş geldiniz", raw, flags=re.IGNORECASE)
return raw.strip()
def _safe_intent_parse(raw: str) -> tuple[str, str]:
"""Extract intent name and extra tail."""
m = re.search(r"#DETECTED_INTENT:\s*([A-Za-z0-9_-]+)", raw)
if not m:
return "", raw
name = m.group(1)
# Remove 'assistant' suffix if exists
if name.endswith("assistant"):
name = name[:-9] # Remove last 9 chars ("assistant")
log_info(f"🔧 Removed 'assistant' suffix from intent name")
tail = raw[m.end():]
log_info(f"🎯 Parsed intent: {name}")
return name, tail
# ───────────────────────── LLM SETUP ───────────────────────── #
def setup_llm_provider():
    """
    Create the LLM provider through LLMFactory and store it in the
    module-level ``llm_provider``.

    Any failure is logged and re-raised to the caller.
    """
    global llm_provider
    try:
        # Imported here rather than at module top, as in the rest of this file
        from llm.llm_factory import LLMFactory as provider_factory
        llm_provider = provider_factory.create_provider()
        log_info("✅ LLM provider initialized successfully")
    except Exception as init_error:
        log_error("❌ Failed to initialize LLM provider", init_error)
        raise
# ───────────────────────── LLM GENERATION ───────────────────────── #
async def llm_generate(s: Session, prompt: str, user_msg: str) -> str:
    """Call the configured LLM provider and return its raw reply.

    Args:
        s: Session the request belongs to. Supplies the version config
            check, the chat history and the id used in log lines.
        prompt: System prompt handed to the provider.
        user_msg: User input handed to the provider.

    Returns:
        The provider's response, unmodified.

    Raises:
        HTTPException: 504 when the provider call times out; 500 for any
            other failure, including a missing project or published version.
    """
    global llm_provider
    if llm_provider is None:
        setup_llm_provider()
    try:
        # The version config is only checked for existence here; it is not
        # passed to the provider.
        version = s.get_version_config()
        if not version:
            # Fallback: get from project config
            project = next((p for p in cfg.projects if p.name == s.project_name), None)
            if not project:
                raise ValueError(f"Project not found: {s.project_name}")
            version = next((v for v in project.versions if v.published), None)
            if not version:
                raise ValueError("No published version found")

        log_info(f"🚀 Calling LLM for session {s.session_id[:8]}...")
        log_info(f"📋 Prompt preview (first 200 chars): {prompt[:200]}...")

        history = s.chat_history
        # Only the last 10 history entries are sent as context
        raw = await llm_provider.generate(
            user_input=user_msg,
            system_prompt=prompt,
            context=history[-10:] if history else [],
        )
        # Guard the preview so an empty/None reply cannot break logging
        log_info(f"🪄 LLM raw response: {(raw or '')[:100]}...")
        return raw
    except (requests.exceptions.Timeout, httpx.TimeoutException, TimeoutError):
        # The provider is awaited, so a timeout may surface as an httpx
        # exception or the builtin TimeoutError (raised by asyncio timeouts
        # on Python 3.11+), not only as a requests timeout.
        log_warning(f"⏱️ LLM timeout for session {s.session_id[:8]}")
        raise HTTPException(status_code=504, detail="LLM request timed out")
    except Exception as e:
        log_error("❌ LLM error", e)
        raise HTTPException(status_code=500, detail=f"LLM error: {str(e)}")
# ───────────────────────── PARAMETER EXTRACTION ───────────────────────── #
def _extract_parameters_from_response(raw: str, session: Session, intent_config) -> bool:
    """Pull parameter values out of an LLM reply and store the valid ones.

    The reply is searched first for a ```json fenced block and, failing
    that, for the first brace-delimited span without nested braces. Each
    key of the parsed object is matched against ``intent_config.parameters``
    by name. Values that pass ``validate`` are written, as strings, to
    ``session.variables`` under the parameter's ``variable_name``.

    Args:
        raw: LLM output that may contain a JSON object.
        session: Session whose ``variables`` mapping receives the values.
        intent_config: Intent definition providing ``parameters``.

    Returns:
        True when at least one parameter was stored. False otherwise,
        including when no JSON is found or it cannot be parsed.
    """
    try:
        # Look for JSON block in response
        fenced = re.search(r'```json\s*(.*?)\s*```', raw, re.DOTALL)
        if fenced:
            json_str = fenced.group(1)
        else:
            # Try to find JSON without code block. The text to parse is
            # chosen by which pattern matched, not by whether backticks
            # appear in the reply: the bare pattern has no capture group.
            bare = re.search(r'\{[^}]+\}', raw)
            if not bare:
                log_info("❌ No JSON found in response")
                return False
            json_str = bare.group(0)

        params = json.loads(json_str)
        if not isinstance(params, dict):
            # A fenced block may hold a list or scalar; only objects map
            # parameter names to values.
            log_info("❌ Extracted JSON is not an object")
            return False

        any_valid = False
        for param_name, param_value in params.items():
            # Find parameter config
            param_config = next(
                (p for p in intent_config.parameters if p.name == param_name),
                None
            )
            if not param_config:
                log_info(f"⚠️ Parameter config not found for: {param_name}")
                continue
            # Validate parameter
            if validate(str(param_value), param_config):
                session.variables[param_config.variable_name] = str(param_value)
                any_valid = True
                # Separator added so value and variable name stay readable
                log_info(f"✅ Extracted {param_name}={param_value} → {param_config.variable_name}")
            else:
                log_info(f"❌ Invalid {param_name}={param_value}")
        return any_valid
    except json.JSONDecodeError as e:
        log_error("❌ JSON parsing error", e)
        log_error(f"❌ Failed to parse: {raw[:200]}")
        return False
    except Exception as e:
        log_error("❌ Parameter processing error", e)
        return False
# ───────────────────────── API EXECUTION ───────────────────────── #
async def _execute_api_call(session: Session, intent_config) -> str:
    """Run the API bound to an intent and return the text to show the user.

    The session state is set to "call_api" while the API runs and to
    "humanize" while the LLM rewrites the result. The flow is reset on
    every exit path.

    Args:
        session: Session whose variables feed the API call.
        intent_config: Intent definition; its ``action`` names the API.

    Returns:
        The LLM-humanized response when the API config has a
        ``response_prompt``; otherwise a plain summary of the API JSON.
        A user-friendly error message is returned when the API config is
        missing, the call times out, or anything else fails.
    """
    # Bound before the try block so both exception handlers can use it even
    # if the failure happens before the name is read from intent_config.
    api_name = None
    try:
        session.state = "call_api"
        api_name = intent_config.action
        api_config = cfg.get_api(api_name)
        if not api_config:
            log_info(f"❌ API config not found: {api_name}")
            session.reset_flow()
            return get_user_friendly_error("api_error", {"api_name": api_name})

        log_info(f"📡 Calling API: {api_name}")
        log_info(f"📦 API variables: {session.variables}")

        # Execute API call with session
        response = execute_api(api_config, session)
        api_json = response.json()
        log_info(f"✅ API response: {api_json}")

        # Humanize response
        session.state = "humanize"
        if api_config.response_prompt:
            prompt = api_config.response_prompt.replace(
                "{{api_response}}",
                json.dumps(api_json, ensure_ascii=False)
            )
            human_response = await llm_generate(session, prompt, json.dumps(api_json))
            session.reset_flow()
            return human_response if human_response else f"İşlem sonucu: {api_json}"
        else:
            session.reset_flow()
            return f"İşlem tamamlandı: {api_json}"
    except requests.exceptions.Timeout:
        log_warning(f"⏱️ API timeout: {api_name}")
        session.reset_flow()
        return get_user_friendly_error("api_timeout")
    except Exception as e:
        log_error("❌ API call error", e)
        session.reset_flow()
        # Only mention the service when its name is actually known
        context = {"api_name": api_name} if api_name else None
        return get_user_friendly_error("api_error", context)
# ───────────────────────── REQUEST MODELS ───────────────────────── #
# Request body of POST /chat.
class ChatRequest(BaseModel):
    # Text the user typed; logged and appended to the session history.
    message: str
# Request body of POST /start_session.
class StartRequest(BaseModel):
    # Name of the project to open a session for; must match an enabled project.
    project_name: str
    # Specific version number; when omitted the highest published version is used.
    version_no: Optional[int] = None
    # True for sessions that continue over the event bus instead of POST /chat.
    is_realtime: bool = False
    # Session locale; falls back to the project's default_locale when omitted.
    locale: Optional[str] = None
# Response model of POST /start_session.
class ChatResponse(BaseModel):
    # Identifier of the newly created session.
    session_id: str
    # Greeting text, or a realtime-mode notice for realtime sessions.
    answer: str
# ───────────────────────── API ENDPOINTS ───────────────────────── #
@router.post("/start_session", response_model=ChatResponse)
async def start_session(req: StartRequest, request: Request):
    """
    Open a new chat session for a project (REST or realtime).

    Resolves the project, locale and version, creates the session and then
    either publishes a SESSION_STARTED event (realtime session with an event
    bus on the app state) or generates the welcome greeting through the LLM
    provider.

    Raises HTTPException 404 for an unknown/disabled project or version,
    400 for an unsupported locale and 500 for any unexpected failure.
    """
    global llm_provider
    try:
        # Only enabled projects may host a session
        project = None
        for candidate in cfg.projects:
            if candidate.name == req.project_name and candidate.enabled:
                project = candidate
                break
        if not project:
            raise HTTPException(404, f"Project '{req.project_name}' not found or disabled")

        # Requested locale wins; otherwise use the project's default
        session_locale = req.locale or project.default_locale
        if session_locale not in project.supported_locales:
            raise HTTPException(
                400,
                f"Locale '{session_locale}' not supported by project. Supported: {project.supported_locales}"
            )

        # Explicit version number, or the highest published one
        if req.version_no:
            version = next((v for v in project.versions if v.no == req.version_no), None)
            if not version:
                raise HTTPException(404, f"Version {req.version_no} not found for project '{req.project_name}'")
        else:
            published = [v for v in project.versions if v.published]
            if not published:
                raise HTTPException(404, f"No published version for project '{req.project_name}'")
            version = max(published, key=lambda v: v.no)

        session = session_store.create_session(
            project_name=req.project_name,
            version_no=version.no,
            is_realtime=req.is_realtime,
            locale=session_locale
        )
        session.set_version_config(version)

        # Realtime: hand the session over to the event bus and return early
        if req.is_realtime and hasattr(request.app.state, 'event_bus'):
            from chat_session.event_bus import Event, EventType
            started_payload = {
                "session": session,
                "has_welcome": bool(version.welcome_prompt),
                "welcome_text": version.welcome_prompt or "Hoş geldiniz! Size nasıl yardımcı olabilirim?",
                "locale": session_locale,
                "project_name": req.project_name,
                "version_no": version.no
            }
            await request.app.state.event_bus.publish(Event(
                type=EventType.SESSION_STARTED,
                session_id=session.session_id,
                data=started_payload
            ))
            return ChatResponse(
                session_id=session.session_id,
                answer="[REALTIME_MODE] Connect via WebSocket to continue."
            )

        # REST mode from here on: make sure a provider exists
        if not llm_provider:
            from llm.llm_factory import LLMFactory
            llm_provider = LLMFactory.create_provider()
            log_info(f"🤖 LLM Provider created: {type(llm_provider).__name__}")

        # Default greeting, replaced by the LLM's answer to the welcome prompt
        greeting = "Hoş geldiniz! Size nasıl yardımcı olabilirim?"
        if version.welcome_prompt:
            log_info(f"🎉 Processing welcome prompt for session {session.session_id[:8]}...")
            try:
                welcome_result = await llm_provider.generate(
                    user_input="",
                    system_prompt=version.welcome_prompt,
                    context=[]
                )
                stripped = welcome_result.strip() if welcome_result else ""
                if stripped:
                    greeting = stripped
            except Exception as welcome_error:
                # Best effort: keep the default greeting on failure
                log_error("⚠️ Welcome prompt processing failed", welcome_error)

        session.add_turn("assistant", greeting)
        log_info(f"✅ Session created for project '{req.project_name}' version {version.no}")
        return ChatResponse(session_id=session.session_id, answer=greeting)
    except HTTPException:
        raise
    except Exception as e:
        log_error("❌ Session creation error", e)
        raise HTTPException(500, f"Session creation failed: {str(e)}")
def _missing_required_params(session: Session, intent_config) -> List[str]:
    """Return names of required parameters with no value stored in the session."""
    return [
        p.name for p in intent_config.parameters
        if p.required and p.variable_name not in session.variables
    ]


def _build_extraction_prompt(user_message: str, session: Session, intent_config) -> str:
    """Build the prompt asking the LLM to extract still-uncollected parameters."""
    expected = json.dumps(
        [
            {
                'name': p.name,
                'type': p.type,
                'required': p.required,
                'extraction_prompt': p.extraction_prompt,
            }
            for p in intent_config.parameters
            if p.variable_name not in session.variables
        ],
        ensure_ascii=False,
    )
    return (
        "\n"
        f'Extract parameters from user message: "{user_message}"\n'
        "Expected parameters:\n"
        f"{expected}\n"
        "Return as JSON object with parameter names as keys.\n"
    )


async def _ask_for_missing_params(session: Session, version, project, intent_config,
                                  missing_params: List[str], user_message: str) -> str:
    """Have the LLM phrase a question for the next missing parameters and record it."""
    collection_config = cfg.global_config.llm_provider.settings.get("parameter_collection_config", {})
    max_params = collection_config.get("max_params_per_question", 2)
    # Decide which parameters to ask
    params_to_ask = missing_params[:max_params]
    param_prompt = build_parameter_prompt(
        version=version,
        intent_config=intent_config,
        chat_history=session.chat_history,
        collected_params=session.variables,
        missing_params=missing_params,
        params_to_ask=params_to_ask,
        max_params=max_params,
        project_locale=project.default_locale,
        unanswered_params=session.unanswered_parameters
    )
    param_question = await llm_generate(session, param_prompt, user_message)
    clean_question = _trim_response(param_question)
    session.add_message("assistant", clean_question)
    return clean_question


async def _continue_param_flow(session: Session, version, project, intent_config,
                               intent_name, user_message: str) -> Dict[str, Any]:
    """Execute the API when all required parameters are present, otherwise ask for more."""
    missing_params = _missing_required_params(session, intent_config)
    if not missing_params:
        # All required parameters collected, execute API
        response = await _execute_api_call(session, intent_config)
        session.add_message("assistant", response)
        return {"response": response, "intent": intent_name, "state": "completed"}
    # Need to collect more parameters
    question = await _ask_for_missing_params(
        session, version, project, intent_config, missing_params, user_message
    )
    return {"response": question, "intent": intent_name, "state": "collecting_params"}


@router.post("/chat")
async def chat(req: ChatRequest, x_session_id: str = Header(...)):
    """Process one user message for a REST session (realtime uses WebSocket).

    Behaviour depends on ``session.state``:

    * "idle": ask the LLM to detect an intent. For a known intent, store it
      and either call its API (all required parameters present) or ask for
      the missing ones. Otherwise return the trimmed LLM reply.
    * "collect_params": extract parameters from the message, then call the
      API or keep asking.
    * anything else: reset the flow and return an error payload.

    Args:
        req: Request body carrying the user's message.
        x_session_id: Session id taken from the ``X-Session-Id`` header.

    Returns:
        A dict with "response" and "state", plus "intent" while an intent is
        active and "error": True on handled failures.

    Raises:
        HTTPException: 404 unknown session or project, 400 realtime session
            or missing version config, 401 expired session. HTTPExceptions
            raised further down (e.g. by ``llm_generate``) are re-raised.
    """
    try:
        # Get session
        session = session_store.get_session(x_session_id)
        if not session:
            raise HTTPException(
                status_code=404,
                detail=get_user_friendly_error("session_not_found")
            )
        # Check if this is a realtime session
        if session.is_realtime:
            raise HTTPException(
                status_code=400,
                detail="This is a realtime session. Please use WebSocket connection instead."
            )
        # Session expiry check
        if session.is_expired():
            session_store.delete_session(x_session_id)
            raise HTTPException(
                status_code=401,
                detail=get_user_friendly_error("session_expired")
            )

        # Update last activity
        session.last_activity = datetime.utcnow().isoformat()
        session_store.update_session(session)

        # Add user message to history
        session.add_message("user", req.message)
        log_info(f"💬 User [{session.session_id[:8]}...]: {req.message}")

        # Get project and version config
        project = next((p for p in cfg.projects if p.name == session.project_name), None)
        if not project:
            raise HTTPException(
                status_code=404,
                detail=get_user_friendly_error("project_not_found")
            )
        version = session.get_version_config()
        if not version:
            raise HTTPException(
                status_code=400,
                detail=get_user_friendly_error("version_not_found")
            )

        # Process based on current state
        if session.state == "idle":
            # Build intent detection prompt
            prompt = build_intent_prompt(version, session.chat_history, project.default_locale)
            raw = await llm_generate(session, prompt, req.message)

            # Check for intent
            intent_name, tail = _safe_intent_parse(raw)
            if intent_name:
                intent_config = next((i for i in version.intents if i.name == intent_name), None)
                if intent_config:
                    session.current_intent = intent_name
                    session.set_intent_config(intent_config)
                    session.state = "collect_params"
                    log_info(f"🎯 Intent detected: {intent_name}")
                    # The text after the intent tag may already carry values
                    if tail and _extract_parameters_from_response(tail, session, intent_config):
                        log_info("📦 Some parameters extracted from initial response")
                    return await _continue_param_flow(
                        session, version, project, intent_config, intent_name, req.message
                    )
                log_info(f"⚠️ Unknown intent: {intent_name}")

            # No (known) intent detected, return general response
            clean_response = _trim_response(raw)
            session.add_message("assistant", clean_response)
            return {"response": clean_response, "state": "idle"}

        elif session.state == "collect_params":
            # Continue parameter collection
            intent_config = session.get_intent_config()
            if not intent_config:
                # Without the stored intent config the flow cannot continue.
                # Reset so the next message starts from "idle" instead of
                # failing here again.
                log_warning(f"⚠️ No intent config stored for session {session.session_id[:8]}; resetting flow")
                session.reset_flow()
                return {
                    "response": get_user_friendly_error("internal_error"),
                    "state": "error",
                    "error": True
                }

            # Captured before the API call because _execute_api_call resets
            # the flow (which presumably clears current_intent — confirm).
            intent_name = session.current_intent

            # Try to extract parameters from user message
            param_prompt = _build_extraction_prompt(req.message, session, intent_config)
            raw = await llm_generate(session, param_prompt, req.message)
            _extract_parameters_from_response(raw, session, intent_config)

            return await _continue_param_flow(
                session, version, project, intent_config, intent_name, req.message
            )

        else:
            # Unknown state, reset
            session.reset_flow()
            return {"response": get_user_friendly_error("internal_error"), "state": "error"}
    except HTTPException:
        raise
    except requests.exceptions.Timeout:
        log_error(f"Timeout in chat for session {x_session_id[:8]}")
        return {
            "response": get_user_friendly_error("llm_timeout"),
            "state": "error",
            "error": True
        }
    except Exception as e:
        log_error("❌ Chat error", e)
        import traceback
        traceback.print_exc()
        return {
            "response": get_user_friendly_error("internal_error"),
            "state": "error",
            "error": True
        }
@router.post("/end_session")
async def end_session(x_session_id: str = Header(...), request: Request = None):
    """
    Terminate a session (REST or realtime) and remove it from the store.

    For realtime sessions a SESSION_ENDED event is published first, provided
    a request is available and the app state carries an event bus.
    Raises HTTPException 404 for an unknown session and 500 on other errors.
    """
    try:
        session = session_store.get_session(x_session_id)
        if not session:
            raise HTTPException(404, "Session not found")

        if session.is_realtime:
            # Notify realtime listeners before the session disappears
            if request and hasattr(request.app.state, 'event_bus'):
                from chat_session.event_bus import Event, EventType
                ended_event = Event(
                    type=EventType.SESSION_ENDED,
                    session_id=x_session_id,
                    data={"reason": "user_request"}
                )
                await request.app.state.event_bus.publish(ended_event)

        session_store.delete_session(x_session_id)
        return {"message": "Session ended successfully"}
    except HTTPException:
        raise
    except Exception as end_error:
        log_error("❌ Error ending session", end_error)
        raise HTTPException(500, f"Failed to end session: {str(end_error)}")
# ───────────────────────── HELPER FUNCTIONS ───────────────────────── #
def get_user_friendly_error(error_type: str, context: dict = None) -> str:
    """
    Map an internal error code to the message shown to the user.

    Unknown codes fall back to the "internal_error" message. For
    "parameter_validation" and "api_error" the message is prefixed with the
    field / API name when ``context`` provides "field" / "api_name".
    """
    catalog = {
        "session_not_found": "Oturumunuz bulunamadı. Lütfen yeni bir konuşma başlatın.",
        "project_not_found": "Proje konfigürasyonu bulunamadı. Lütfen yönetici ile iletişime geçin.",
        "version_not_found": "Proje versiyonu bulunamadı. Lütfen geçerli bir versiyon seçin.",
        "intent_not_found": "Üzgünüm, ne yapmak istediğinizi anlayamadım. Lütfen daha açık bir şekilde belirtir misiniz?",
        "api_timeout": "İşlem zaman aşımına uğradı. Lütfen tekrar deneyin.",
        "api_error": "İşlem sırasında bir hata oluştu. Lütfen daha sonra tekrar deneyin.",
        "parameter_validation": "Girdiğiniz bilgide bir hata var. Lütfen kontrol edip tekrar deneyin.",
        "llm_error": "Sistem yanıt veremedi. Lütfen biraz sonra tekrar deneyin.",
        "llm_timeout": "Sistem meşgul. Lütfen birkaç saniye bekleyip tekrar deneyin.",
        "session_expired": "Oturumunuz zaman aşımına uğradı. Lütfen yeni bir konuşma başlatın.",
        "rate_limit": "Çok fazla istek gönderdiniz. Lütfen biraz bekleyin.",
        "internal_error": "Beklenmeyen bir hata oluştu. Lütfen yönetici ile iletişime geçin."
    }
    text = catalog.get(error_type, catalog["internal_error"])

    # Nothing to prepend without context
    if not context:
        return text
    if error_type == "parameter_validation" and "field" in context:
        return f"{context['field']} alanı için {text}"
    if error_type == "api_error" and "api_name" in context:
        return f"{context['api_name']} servisi için {text}"
    return text
def validate_parameter_with_message(param_config, value, locale="tr") -> tuple[bool, str]:
    """Validate a parameter value and return a user-facing message on failure.

    Args:
        param_config: Parameter definition; ``type``, ``validation_regex``
            and ``invalid_prompt`` are read from it.
        value: Candidate value. Usually a string, but non-string values
            (e.g. numbers or booleans decoded from JSON) are accepted and
            converted to text for the string-based checks.
        locale: Locale passed to the date parser for "date" parameters.

    Returns:
        ``(True, "")`` when the value is acceptable, otherwise ``(False,
        message)`` with a Turkish message describing the problem.
    """
    try:
        # String-based checks (.lower(), regex, date parsing) need text; a
        # raw int/bool would otherwise raise and be reported as a generic
        # validation failure.
        text = value if isinstance(value, str) else str(value)

        # Type validation
        if param_config.type == "int":
            try:
                int(value)
            except (TypeError, ValueError):
                # TypeError covers None and other non-numeric objects
                return False, "Lütfen geçerli bir sayı girin."
        elif param_config.type == "float":
            try:
                float(value)
            except (TypeError, ValueError):
                return False, "Lütfen geçerli bir ondalık sayı girin."
        elif param_config.type == "date":
            # Date parsing with locale support
            from config.locale_manager import LocaleManager
            parsed_date = LocaleManager.parse_date_expression(text, locale)
            if not parsed_date:
                return False, "Lütfen geçerli bir tarih girin (örn: yarın, 15 Haziran, 2025-06-15)."
        elif param_config.type == "bool":
            if text.lower() not in ["evet", "hayır", "yes", "no", "true", "false"]:
                return False, "Lütfen 'evet' veya 'hayır' olarak cevaplayın."

        # Regex validation (re.match: anchored at the start only)
        if param_config.validation_regex:
            if not re.match(param_config.validation_regex, text):
                return False, param_config.invalid_prompt or "Girdiğiniz değer geçerli formatta değil."
        return True, ""
    except Exception as e:
        log_error("Parameter validation error", e)
        return False, "Değer kontrol edilirken bir hata oluştu."
# Initialize LLM on module load
# NOTE: setup_llm_provider() logs and re-raises on failure, so importing this
# module fails when the provider cannot be created.
setup_llm_provider()