# Import necessary libraries
import streamlit as st
import os
from openai import OpenAI
import json
def clear_chat():
    """Reset the conversation history so the next rerun starts a fresh chat."""
    st.session_state.messages = []
# --- Page header ---
st.title("Intel® AI for Enterprise Inference")
st.header("LLM chatbot")

with st.sidebar:
    # Credentials: the API key comes from HF Spaces "Secrets", the endpoint
    # base URL from HF Spaces "Variables". Both are mirrored into
    # st.session_state for use elsewhere in the app.
    api_key = st.session_state.api_key = st.secrets["openai_apikey"]  # Enter openai_api key under "Secrets " in HF settings
    base_url = st.session_state.base_url = os.environ.get("base_url")  # Enter base_url under "Variables" in HF settings
    client = OpenAI(api_key=api_key, base_url=base_url)

    # Ask the inference endpoint which models it currently serves.
    models = client.models.list()
    model_names = sorted(model.id for model in models)  # Extract 'id' from each model object

    # Robustness: an endpoint with no served models would otherwise crash
    # below with an IndexError on model_names[0].
    if not model_names:
        st.error("No models are available from the configured endpoint.")
        st.stop()

    default_model_name = "meta-llama/Llama-3.3-70B-Instruct"  # Replace with your desired default model name

    # Use st.session_state to persist the selected model across reruns;
    # fall back to the first available model if the default is not served.
    if "selected_model" not in st.session_state:
        st.session_state.selected_model = (
            default_model_name if default_model_name in model_names else model_names[0]
        )

    # Create the selectbox without the `index` parameter
    modelname = st.selectbox(
        "Select an LLM model (Running on Intel® Gaudi®). Hosted on Denvr Dataworks.",
        model_names,
        key="selected_model",  # This ties the widget to st.session_state["selected_model"]
    )
    st.write(f"You selected: {modelname}")

    st.button("Start New Chat", on_click=clear_chat)
    st.markdown("---")  # Add a horizontal line for separation
    # NOTE: the markdown body stays at column 0 — indenting it 4+ spaces
    # would make Markdown render it as a code block.
    st.markdown(
        """
Check the latest models hosted on [Denvr Dataworks](https://www.denvrdata.com/intel), and get your own OpenAI-compatible API key.
Come and chat with other AI developers on [Intel’s DevHub Discord server](https://discord.gg/kfJ3NKEw5t).
"""
    )
try:
    # Make sure the conversation history exists before anything reads it.
    if "messages" not in st.session_state:
        st.session_state.messages = []

    # Replay the conversation so far into the chat area.
    for msg in st.session_state.messages:
        with st.chat_message(msg["role"]):
            st.markdown(msg["content"])

    # A new user prompt arrived this rerun.
    if prompt := st.chat_input("What is up?"):
        st.session_state.messages.append({"role": "user", "content": prompt})
        with st.chat_message("user"):
            st.markdown(prompt)

        with st.chat_message("assistant"):
            # Build the request payload from the full stored history.
            history_payload = [
                {"role": msg["role"], "content": msg["content"]}
                for msg in st.session_state.messages
            ]
            try:
                stream = client.chat.completions.create(
                    model=modelname,
                    messages=history_payload,
                    max_tokens=4096,
                    stream=True,
                )
                # Render tokens as they arrive; returns the full text.
                response = st.write_stream(stream)
            except Exception as e:
                # Best-effort: surface the error and store a placeholder reply.
                st.error(f"An error occurred while generating the response: {e}")
                response = "An error occurred while generating the response."
            st.session_state.messages.append({"role": "assistant", "content": response})
except KeyError as e:
    st.error(f"Key error: {e}")
except Exception as e:
    # Top-level boundary: report anything unexpected instead of crashing the app.
    st.error(f"An unexpected error occurred: {e}")