Spaces:

bachephysicdun
/

Backend

Sleeping

App Files Files Community

Backend / app /main.py

bachephysicdun

implemented rag and filtered_rag

8dbef5d 9 months ago

raw

history blame contribute delete

8.69 kB

	import sys
	import os
	from datetime import datetime

	from langchain_core.runnables import Runnable
	from langchain_core.callbacks import BaseCallbackHandler
	from fastapi import FastAPI, Request, Depends
	from sse_starlette.sse import EventSourceResponse
	from langserve.serialization import WellKnownLCSerializer
	from typing import List
	from sqlalchemy.orm import Session

	import schemas
	from chains import simple_chain, formatted_chain, history_chain, rag_chain, filtered_rag_chain
	import crud, models, schemas, prompts
	from database import SessionLocal, engine
	from callbacks import LogResponseCallback

	# models.Base comes from SQLAlchemy’s declarative_base() in database.py.
	# It acts as the base class for all ORM models (defined in models.py).
	# .metadata.create_all(): Tells SQLAlchemy to create all the tables defined
	# in the models module if they don’t already exist in the database.
	# -> metadata is a catalog of all the tables and other schema constructs in your database.
	# -> create_all() method creates all the tables that don't exist yet in the database.
	# -> bind=engine specifies which database engine to use for this operation.
	models.Base.metadata.create_all(bind=engine)

	app = FastAPI()

	def get_db():
	"""This is a dependency function used to create and provide a
	database session to various endpoints in the FastAPI app.
	"""
	# A new SQLAlchemy session is created using the SessionLocal session factory.
	# This session will be used for database transactions.
	db = SessionLocal()

	# This pattern ensures that each request gets its own database session and that
	# the session is properly closed when the request is finished, preventing resource leaks.
	try:
	yield db
	finally:
	db.close()

	# ..
	# "async" marks the function as asynchronous, allowing it to pause and resume during operations like streaming or I/O.
	async def generate_stream(input_data: schemas.BaseModel, runnable: Runnable, callbacks: List[BaseCallbackHandler]=[]):
	"""generate_stream is an asynchronous generator that processes input data,
	streams output data from a runnable object, serializes each output, and yields
	it to the client in real-time as part of a server-sent event (SSE) stream.
	It uses callbacks to customize the processing, serializes each piece of output
	using WellKnownLCSerializer, and indicates the end of the stream with a final “end” event.
	"""
	for output in runnable.stream(input_data.dict(), config={"callbacks": callbacks}):
	data = WellKnownLCSerializer().dumps(output).decode("utf-8")
	yield {'data': data, "event": "data"}
	# After all the data has been streamed and the loop is complete, the function yields a final event to signal
	# the end of the stream. This sends an {"event": "end"} message to the client, letting them know that no more
	# data will be sent.
	yield {"event": "end"}

	# This registers the function simple_stream as a handler for HTTP POST requests at the URL endpoint /simple/stream.
	# It means that when a client sends a POST request to this endpoint, this function will be triggered.
	@app.post("/simple/stream")
	async def simple_stream(request: Request):
	"""the function handles a POST request at the /simple/stream endpoint,
	extracts the JSON body, unpacks the "input" field, and then uses it to
	initialize a UserQuestion schema object (which performs validation
	and data transformation) and then initiates a server-sent event response
	to stream data back to the client based on the user’s question.
	"""
	# await is used because parsing the JSON may involve asynchronous I/O operations,
	# especially when handling larger payloads.
	data = await request.json()
	user_question = schemas.UserQuestion(**data['input'])
	# This line returns an EventSourceResponse, which is typically used to handle server-sent events (SSE).
	# It’s a special kind of response that streams data back to the client in real time.
	return EventSourceResponse(generate_stream(user_question, simple_chain))


	@app.post("/formatted/stream")
	async def formatted_stream(request: Request):
	# TODO: use the formatted_chain to implement the "/formatted/stream" endpoint.
	data = await request.json()
	user_question = schemas.UserQuestion(**data['input'])
	return EventSourceResponse(generate_stream(user_question, formatted_chain))


	@app.post("/history/stream")
	async def history_stream(request: Request, db: Session = Depends(get_db)):
	# TODO: Let's implement the "/history/stream" endpoint. The endpoint should follow those steps:
	# - The endpoint receives the request
	data = await request.json()

	# - The request is parsed into a user request
	user_request = schemas.UserRequest(**data['input'])

	# - The user request is used to pull the chat history of the user
	chat_history = crud.get_user_chat_history(db=db, username=user_request.username)

	# - We add as part of the user history the current question by using add_message.
	message = schemas.MessageBase(message=user_request.question, type='User', timestamp=datetime.now())
	crud.add_message(db, message=message, username=user_request.username)

	# - We create an instance of HistoryInput by using format_chat_history.
	history_input = schemas.HistoryInput(
	question=user_request.question,
	chat_history=prompts.format_chat_history(chat_history)
	)

	# - We use the history input within the history chain.
	return EventSourceResponse(generate_stream(
	history_input, history_chain, [LogResponseCallback(user_request, db)]
	))


	@app.post("/rag/stream")
	async def rag_stream(request: Request, db: Session = Depends(get_db)):
	# TODO: Let's implement the "/rag/stream" endpoint. The endpoint should follow those steps:
	# - The endpoint receives the request
	# - The request is parsed into a user request
	# - The user request is used to pull the chat history of the user
	# - We add as part of the user history the current question by using add_message.
	# - We create an instance of HistoryInput by using format_chat_history.
	# - We use the history input within the rag chain.

	data = await request.json()
	user_request = schemas.UserRequest(**data['input'])
	chat_history = crud.get_user_chat_history(db=db, username=user_request.username)
	message = schemas.MessageBase(message=user_request.question, type='User', timestamp=datetime.now())
	crud.add_message(db, message=message, username=user_request.username)
	rag_input = schemas.HistoryInput(
	question=user_request.question,
	chat_history=prompts.format_chat_history(chat_history)
	)

	return EventSourceResponse(generate_stream(
	rag_input, rag_chain, [LogResponseCallback(user_request, db)]
	))


	@app.post("/filtered_rag/stream")
	async def filtered_rag_stream(request: Request, db: Session = Depends(get_db)):
	# TODO: Let's implement the "/filtered_rag/stream" endpoint. The endpoint should follow those steps:
	# - The endpoint receives the request
	# - The request is parsed into a user request
	# - The user request is used to pull the chat history of the user
	# - We add as part of the user history the current question by using add_message.
	# - We create an instance of HistoryInput by using format_chat_history.
	# - We use the history input within the filtered rag chain.

	data = await request.json()
	user_request = schemas.UserRequest(**data['input'])
	chat_history = crud.get_user_chat_history(db=db, username=user_request.username)
	message = schemas.MessageBase(message=user_request.question, type='User', timestamp=datetime.now())
	crud.add_message(db, message=message, username=user_request.username)
	rag_input = schemas.HistoryInput(
	question=user_request.question,
	chat_history=prompts.format_chat_history(chat_history)
	)

	return EventSourceResponse(generate_stream(
	rag_input, filtered_rag_chain, [LogResponseCallback(user_request, db)]
	))


	# Run From the Parent Directory with Script
	# If you want to use uvicorn.run from within a script using "app.main:app",
	# you need to provide the proper path. In this way no matter you run the code
	# locally or on the huggingface space, you will alwazs use "app.main:app" as
	# input argument in the uvicorn.run

	# Add the parent directory to sys.path
	sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))

	if __name__ == "__main__":
	import uvicorn
	uvicorn.run("app.main:app", host="localhost", reload=True, port=8000)