Spaces:

Intel
/

intel-ai-enterprise-inference

Running

Benjamin Consolvo

header chatbot

e7b14e0 3 months ago

3.08 kB

	# Import necessary libraries

	import streamlit as st
	import os
	from openai import OpenAI
	import json

	# Load the model-name -> endpoint mapping from model_info.json, which is
	# expected to sit in the same directory as this script.
	working_dir = os.path.dirname(os.path.abspath(__file__))
	# Open the file in a context manager so the handle is closed as soon as the
	# JSON is parsed, and read it as UTF-8 rather than the locale's default encoding.
	with open(os.path.join(working_dir, "model_info.json"), encoding="utf-8") as model_info_file:
	    endpoint_data = json.load(model_info_file)

	def clear_chat():
	    """Start a new conversation by replacing the stored message history with an empty list.

	    Used as the ``on_click`` callback of the "Start New Chat" button.
	    """
	    st.session_state["messages"] = []

	# Page heading
	st.title("Intel® AI for Enterprise Inference")
	st.header("LLM chatbot")

	# The keys of the endpoint mapping are the model names offered to the user
	model_names = [*endpoint_data.keys()]


	# Sidebar: model picker, "new chat" button, and API-key handling.
	with st.sidebar:
	    modelname = st.selectbox("Select a LLM model (Running on Intel® Gaudi®) ", model_names)
	    st.write(f"You selected: {modelname}")
	    st.button("Start New Chat", on_click=clear_chat)
	    try:
	        # If the API key is provided in the HF settings under "Variables and secrets",
	        # there is no need to enter the OpenAI-compatible API key every time.
	        st.session_state.api_key = st.secrets["openai_apikey"]
	    except (KeyError, FileNotFoundError):
	        # KeyError: the secret is not defined.
	        # FileNotFoundError: no secrets file exists at all (e.g. a local run);
	        # Streamlit's "secret not found" error is expected to derive from it.
	        # Either way, fall back to asking the user for the key.
	        api_key = st.text_input("Enter your API Key", type="password")
	        if api_key:
	            st.session_state.api_key = api_key

	# The chat is only available once a non-empty API key is held in session state
	if "api_key" in st.session_state and st.session_state.api_key:
	    try:
	        # Build a client for the OpenAI-compatible endpoint mapped to the selected model
	        base_url = endpoint_data[modelname]
	        client = OpenAI(api_key=st.session_state.api_key, base_url=base_url)

	        # Requests use the id of the first model the endpoint reports,
	        # replacing the name picked in the sidebar
	        modelname = client.models.list().data[0].id

	        if "messages" not in st.session_state:
	            st.session_state.messages = []

	        # Re-render the conversation so far
	        for past_turn in st.session_state.messages:
	            with st.chat_message(past_turn["role"]):
	                st.markdown(past_turn["content"])

	        prompt = st.chat_input("What is up?")
	        if prompt:
	            # Record and echo the new user message
	            st.session_state.messages.append({"role": "user", "content": prompt})
	            with st.chat_message("user"):
	                st.markdown(prompt)

	            with st.chat_message("assistant"):
	                try:
	                    # Send the whole history, reduced to role/content pairs
	                    history = [
	                        {"role": turn["role"], "content": turn["content"]}
	                        for turn in st.session_state.messages
	                    ]
	                    stream = client.chat.completions.create(
	                        model=modelname,
	                        messages=history,
	                        max_tokens=1024,
	                        stream=True,
	                    )
	                    # Render the streamed reply and keep the value write_stream returns
	                    response = st.write_stream(stream)
	                except Exception as e:
	                    st.error(f"An error occurred while generating the response: {e}")
	                    response = "An error occurred while generating the response."

	            # Store the reply (or the error placeholder) in the history
	            st.session_state.messages.append({"role": "assistant", "content": response})
	    except KeyError as e:
	        st.error(f"Key error: {e}")
	    except Exception as e:
	        st.error(f"An unexpected error occurred: {e}")
	else:
	    st.error("Please enter your API Key in the sidebar.")