llm-explain / src /llm_explain /routing /explain_router.py
Kiran5's picture
Add application file
563c5bc
'''
Copyright 2024 Infosys Ltd.
Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"),
to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense,
and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:
The above copyright notice and this permission notice shall be included in all copies
or substantial portions of the Software.
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED,
INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE
AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,
DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
'''
from llm_explain.mappers.mappers import UncertainityResponse, UncertainityRequest, \
TokenImportanceResponse, TokenImportanceRequest, GoTResponse, GoTRequest, \
SafeSearchResponse, SafeSearchRequest, SentimentAnalysisRequest, SentimentAnalysisResponse
from llm_explain.service.service import ExplainService as service
from llm_explain.config.logger import CustomLogger, request_id_var
from fastapi import APIRouter, HTTPException
from datetime import datetime
import concurrent.futures
import requests
import asyncio
import uuid
import os
explanation = APIRouter()
log = CustomLogger()
telemetry_flag = os.getenv("TELEMETRY_FLAG")
tel_error_url = os.getenv("ERROR_LOG_TELEMETRY_URL")
## FUNCTION FOR FAIL_SAFE TELEMETRY
def send_telemetry_request(explainability_telemetry_request, url):
try:
response = requests.post(url, json=explainability_telemetry_request)
response.raise_for_status()
response_data = response.json()
log.info(f"Telemetry response: {response_data}")
except Exception as e:
log.error(str(e))
raise HTTPException(
status_code=500,
detail="Please check with administration!!",
headers={"X-Error": "Please check with administration!!"})
def telemetry_error_logging(cie, request_id_var, api_endpoint):
function_name = None
# Get the traceback of the exception
current_tb = cie.__traceback__
# Traverse to the first traceback not from site-packages
while current_tb:
# Check if the traceback is not from site-packages
if "site-packages" not in current_tb.tb_frame.f_code.co_filename:
# Get the function name and file name
function_name = current_tb.tb_frame.f_code.co_name
# Move to the next traceback
current_tb = current_tb.tb_next
if telemetry_flag== "True":
error_input = {
"tenetName": "Explainability",
"errorCode": function_name +'_'+ request_id_var.get(),
"errorMessage": str(cie),
"apiEndPoint": api_endpoint,
"errorRequestMethod": "POST"
}
with concurrent.futures.ThreadPoolExecutor() as executor:
executor.submit(send_telemetry_request, error_input, tel_error_url)
@explanation.post('/llm-explainability/sentiment-analysis',
response_model = SentimentAnalysisResponse,
summary = "Sentiment analysis of the prompt along with token importance")
def sentiment_analysis(payload: SentimentAnalysisRequest):
id = uuid.uuid4().hex
request_id_var.set(id)
log.info("Entered create usecase routing method")
try:
start_time = datetime.now()
log.info(f"start_time: {start_time}")
log.info("before invoking sentiment_analysis service ")
response = service.sentiment_analysis(payload)
log.info("after invoking sentiment_analysis service ")
log.info("exit create usecase routing method")
end_time = datetime.now()
log.info(f"end_time: {end_time}")
total_time = end_time - start_time
log.info(f"total_time: {total_time}")
return response
except Exception as cie:
log.error(cie)
telemetry_error_logging(cie, request_id_var, "/llm-explainability/sentiment-analysis")
log.info("exit router sentiment_analysis method")
raise HTTPException(status_code=500, detail=str(cie))
@explanation.post('/llm-explainability/uncertainty',
response_model = UncertainityResponse,
summary = "Get uncertainty scores for the given input")
def calculate_uncertainty(payload: UncertainityRequest):
id = uuid.uuid4().hex
request_id_var.set(id)
log.info("Entered create usecase routing method")
try:
start_time = datetime.now()
log.info(f"start_time: {start_time}")
log.info("before invoking local_explanation service ")
response = asyncio.run(service.local_explanation(payload))
log.info("after invoking local_explanation service ")
log.info("exit create usecase routing method")
end_time = datetime.now()
log.info(f"end_time: {end_time}")
total_time = end_time - start_time
log.info(f"total_time: {total_time}")
return response
except Exception as cie:
log.error(cie)
telemetry_error_logging(cie, request_id_var, "/llm-explainability/uncertainty")
log.info("exit router local_explanation method")
raise HTTPException(status_code=500, detail=str(cie))
@explanation.post('/llm-explainability/token-importance',
response_model = TokenImportanceResponse,
summary = "Get importance for each token in the input prompt")
def token_importance(payload: TokenImportanceRequest):
id = uuid.uuid4().hex
request_id_var.set(id)
log.info("Entered create usecase routing method")
try:
start_time = datetime.now()
log.info(f"start_time: {start_time}")
log.info("before invoking token_importance service ")
response = asyncio.run(service.token_importance(payload))
log.info("after invoking token_importance service ")
log.info("exit create usecase routing method")
end_time = datetime.now()
log.info(f"end_time: {end_time}")
total_time = end_time - start_time
log.info(f"total_time: {total_time}")
return response
except Exception as cie:
log.error(cie)
telemetry_error_logging(cie, request_id_var, "/llm-explainability/token-importance")
log.info("exit router token_importance method")
raise HTTPException(status_code=500, detail=str(cie))
@explanation.post('/llm-explainability/got',
response_model = GoTResponse,
summary = "Graph-of-Thoughts Reasoning")
def graph_of_thoughts(payload: GoTRequest):
id = uuid.uuid4().hex
request_id_var.set(id)
log.info("Entered create usecase routing method")
try:
start_time = datetime.now()
log.info(f"start_time: {start_time}")
log.info("before invoking graph_of_thoughts service ")
response = asyncio.run(service.graph_of_thoughts(payload))
log.info("after invoking graph_of_thoughts service ")
log.info("exit create usecase routing method")
end_time = datetime.now()
log.info(f"end_time: {end_time}")
total_time = end_time - start_time
log.info(f"total_time: {total_time}")
return response
except Exception as cie:
log.error(cie)
telemetry_error_logging(cie, request_id_var, "/llm-explainability/got")
log.info("exit router graph_of_thoughts method")
raise HTTPException(status_code=500, detail=str(cie))
@explanation.post('/llm-explainability/serper_response',
response_model = SafeSearchResponse,
summary = "Verify LLM response with Google Search")
def searchAugmentation(payload: SafeSearchRequest):
id = uuid.uuid4().hex
request_id_var.set(id)
log.info("Entered create usecase routing method")
try:
start_time = datetime.now()
log.info(f"start_time: {start_time}")
log.info("before invoking search_augmentation service ")
response = asyncio.run(service.search_augmentation(payload))
log.info("after invoking search_augmentation service ")
log.info("exit create usecase routing method")
end_time = datetime.now()
log.info(f"end_time: {end_time}")
total_time = end_time - start_time
log.info(f"total_time: {total_time}")
return response
except Exception as cie:
log.error(cie)
telemetry_error_logging(cie, request_id_var, "/llm-explainability/serper_response")
log.info("exit router search_augmentation method")
raise HTTPException(status_code=500, detail=str(cie))