Benjamin Consolvo
header chatbot
e7b14e0
raw
history blame
3.08 kB
# Import necessary libraries
import streamlit as st
import os
from openai import OpenAI
import json
# Resolve the configuration file relative to this script so the app works
# regardless of the current working directory.
working_dir = os.path.dirname(os.path.abspath(__file__))

# model_info.json is later indexed by model name to obtain the endpoint URL.
# Open it in a context manager so the handle is closed deterministically, and
# decode it as UTF-8 instead of relying on the platform default encoding.
with open(os.path.join(working_dir, "model_info.json"), encoding="utf-8") as model_info_file:
    endpoint_data = json.load(model_info_file)
def clear_chat() -> None:
    """Reset the stored conversation to an empty list.

    Registered as the ``on_click`` callback of the "Start New Chat" button.
    """
    st.session_state["messages"] = []
# Page heading rendered above the chat area.
st.title("Intel® AI for Enterprise Inference")
st.header("LLM chatbot")

# The keys of the endpoint mapping are the model names offered for selection.
model_names = list(endpoint_data)
# Sidebar: model picker, chat reset button and API-key acquisition.
with st.sidebar:
    modelname = st.selectbox("Select a LLM model (Running on Intel® Gaudi®) ", model_names)
    st.write(f"You selected: {modelname}")
    st.button("Start New Chat", on_click=clear_chat)

    try:
        # A key stored in the HF settings under "Variables and secrets" spares
        # the user from typing an OpenAI-compatible API key every time.
        st.session_state.api_key = st.secrets["openai_apikey"]
    except (KeyError, FileNotFoundError):
        # KeyError: the secret is not defined.
        # FileNotFoundError (or Streamlit's subclass of it): no secrets file
        # exists at all, e.g. on a local run. In both cases fall back to
        # asking the user instead of crashing the app.
        api_key = st.text_input("Enter your API Key", type="password")
        if api_key:
            st.session_state.api_key = api_key
# The chat UI is only rendered once a non-empty API key is held in the session.
if st.session_state.get("api_key"):
    try:
        # The selected model name maps to the base URL of its endpoint.
        base_url = endpoint_data[modelname]
        client = OpenAI(api_key=st.session_state.api_key, base_url=base_url)

        # Replace the display name with the id of the first model the endpoint lists.
        modelname = client.models.list().data[0].id

        if "messages" not in st.session_state:
            st.session_state["messages"] = []

        # Replay the stored conversation.
        for past_turn in st.session_state["messages"]:
            with st.chat_message(past_turn["role"]):
                st.markdown(past_turn["content"])

        prompt = st.chat_input("What is up?")
        if prompt:
            st.session_state["messages"].append({"role": "user", "content": prompt})
            with st.chat_message("user"):
                st.markdown(prompt)

            with st.chat_message("assistant"):
                try:
                    # Send only the role/content pair of every stored turn.
                    history = [
                        {"role": turn["role"], "content": turn["content"]}
                        for turn in st.session_state["messages"]
                    ]
                    stream = client.chat.completions.create(
                        model=modelname,
                        messages=history,
                        max_tokens=1024,
                        stream=True,
                    )
                    response = st.write_stream(stream)
                except Exception as exc:
                    st.error(f"An error occurred while generating the response: {exc}")
                    # A placeholder reply is still recorded below for this turn.
                    response = "An error occurred while generating the response."
            st.session_state["messages"].append({"role": "assistant", "content": response})
    except KeyError as exc:
        st.error(f"Key error: {exc}")
    except Exception as exc:
        st.error(f"An unexpected error occurred: {exc}")
else:
    st.error("Please enter your API Key in the sidebar.")