Spaces:

drmasad
/

HAH-2024-v0.1

Runtime error

App Files Files

drmasad committed on Apr 26, 2024

Commit

849fdd5

verified ·

1 Parent(s): 2b5d309

Update app.py

Browse files

Files changed (1) hide show

app.py +105 -81

app.py CHANGED Viewed

@@ -1,120 +1,144 @@
-""" HAH 2024 v0.1 Chatbot
-@author: Dr M As'ad
-@email: [email protected]
-"""
 import streamlit as st
 from openai import OpenAI
 import os
-import sys
-from dotenv import load_dotenv, dotenv_values
 load_dotenv()
-# initialize the client
-client = OpenAI(
-  base_url="https://api-inference.huggingface.co/v1",
-  api_key=os.environ.get('HUGGINGFACEHUB_API_TOKEN')
-)
-#Create supported models
-model_links ={
-    "HAH-2024-v0.1":"drmasad/HAH-2024-v0.11",
-    "Mistral":"mistralai/Mistral-7B-Instruct-v0.2",
 }
-model_info ={
-    "HAH-2024-v0.1":
-        {'description':"""The HAH-2024-v0.1 model is a **Large Language Model (LLM)** that's able to have question and answer interactions.\n \
-            \nIt was created by fine tuning Mistra 7b instruct usin 3000 review articles on diabetes** \n""",
-        'logo':'https://www.hmgaihub.com/untitled.png'},
-    "Mistral":
-    {'description':
-        """The Mistral model is a **Large Language Model (LLM)** that's able to have question and answer interactions...""",
-    'logo':
-        'https://mistral.ai/images/logo_hubc88c4ece131b91c7cb753f40e9e1cc5_2589_256x0_resize_q97_h2_lanczos_3.webp'},
-}
-def reset_conversation():
-    '''
-    Resets Conversation
-    '''
-    st.session_state.conversation = []
-    st.session_state.messages = []
-    return None
-# Define the available models
-models =[key for key in model_links.keys()]
-# Create the sidebar with the dropdown for model selection
 selected_model = st.sidebar.selectbox("Select Model", models)
-#Create a temperature slider
-temp_values = st.sidebar.slider('Select a temperature value', 0.0, 1.0, (0.5))
-#Add reset button to clear conversation
-st.sidebar.button('Reset Chat', on_click=reset_conversation) #Reset button
-# Create model description
 st.sidebar.write(f"You're now chatting with **{selected_model}**")
-st.sidebar.markdown(model_info[selected_model]['description'])
-st.sidebar.image(model_info[selected_model]['logo'])
-st.sidebar.markdown("*Generated content may be inaccurate or false.*")
-if "prev_option" not in st.session_state:
-    st.session_state.prev_option = selected_model
-if st.session_state.prev_option != selected_model:
-    st.session_state.messages = []
-    # st.write(f"Changed to {selected_model}")
-    st.session_state.prev_option = selected_model
-    reset_conversation()
-#Pull in the model we want to use
-repo_id = model_links[selected_model]
-st.subheader(f'AI - {selected_model}')
-# st.title(f'ChatBot Using {selected_model}')
-# Set a default model
-if selected_model not in st.session_state:
-    st.session_state[selected_model] = model_links[selected_model]
 # Initialize chat history
 if "messages" not in st.session_state:
     st.session_state.messages = []
-# Display chat messages from history on app rerun
 for message in st.session_state.messages:
     with st.chat_message(message["role"]):
         st.markdown(message["content"])
-# Accept user input
-if prompt := st.chat_input(f"Hi I'm {selected_model}, ask me a question"):
-    # Display user message in chat message container
     with st.chat_message("user"):
         st.markdown(prompt)
-    # Add user message to chat history
-    st.session_state.messages.append({"role": "user", "content": prompt})
-    # Display assistant response in chat message container
     with st.chat_message("assistant"):
-        stream = client.chat.completions.create(
-            model=model_links[selected_model],
-            messages=[
-                {"role": m["role"], "content": m["content"]}
-                for m in st.session_state.messages
-            ],
-            temperature=temp_values,#0.5,
-            stream=True,
-            max_tokens=3000,
         )
-        response = st.write_stream(stream)
-    st.session_state.messages.append({"role": "assistant", "content": response})

+# Import necessary libraries
 import streamlit as st
+from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig, pipeline
 from openai import OpenAI
 import os
+import torch
+from peft import LoraConfig, PeftModel, prepare_model_for_kbit_training, get_peft_model
+from dotenv import load_dotenv
+# Load environment variables
 load_dotenv()
+# Define model links and configurations
+model_links = {
+    "HAH-2024-v0.1": "drmasad/HAH-2024-v0.11",
+    "Mistral": "mistralai/Mistral-7B-Instruct-v0.2",
 }
+# Initialize the OpenAI client (if needed for Hugging Face Inference API)
+client = OpenAI(
+    base_url="https://api-inference.huggingface.co/v1",
+    api_key=os.environ.get("HUGGINGFACEHUB_API_TOKEN"),
+)
+# Define sidebar options
+models = list(model_links.keys())
+# Sidebar model selection
 selected_model = st.sidebar.selectbox("Select Model", models)
+# Sidebar temperature control
+temp_values = st.sidebar.slider("Select a temperature value", 0.0, 1.0, (0.5))
+# Reset conversation functionality
+def reset_conversation():
+    """Empty the chat state kept in ``st.session_state``.
+
+    Both the ``conversation`` and ``messages`` entries are replaced with
+    fresh empty lists.
+    """
+    for state_key in ("conversation", "messages"):
+        st.session_state[state_key] = []
+st.sidebar.button("Reset Chat", on_click=reset_conversation)
+# Display model information on the sidebar
+model_info = {
+    "HAH-2024-v0.1": {
+        "description": "HAH-2024-v0.1 is a fine-tuned model based on Mistral 7B. It's designed for conversations on diabetes.",
+        "logo": "https://www.hmgaihub.com/untitled.png",
+    },
+    "Mistral": {
+        "description": "Mistral is a large language model with multi-task capabilities.",
+        "logo": "https://mistral.ai/images/logo_hubc88c4ece131b91c7cb753f40e9e1cc5_2589_256x0_resize_q97_h2_lanczos_3.webp",
+    },
+}
 st.sidebar.write(f"You're now chatting with **{selected_model}**")
+st.sidebar.markdown(model_info[selected_model]["description"])
+st.sidebar.image(model_info[selected_model]["logo"])
+# Load the appropriate model based on user selection
+@st.cache_resource
+def load_model(selected_model_name):
+    """Load the model and tokenizer for the selected sidebar entry.
+
+    Streamlit re-executes the whole script on every interaction, so the
+    result is cached with ``st.cache_resource`` (keyed on the model name)
+    instead of reloading the weights on each rerun.
+
+    Args:
+        selected_model_name: A key of ``model_links``.
+
+    Returns:
+        A ``(model, tokenizer)`` tuple for use with a text-generation
+        pipeline.
+
+    Raises:
+        ValueError: If ``selected_model_name`` is not a supported model.
+    """
+    if selected_model_name == "HAH-2024-v0.1":
+        # Setup for HAH-2024-v0.1
+        model_name = model_links["HAH-2024-v0.1"]
+        base_model = "mistralai/Mistral-7B-Instruct-v0.2"
+        # Load model with 4-bit NF4 quantization configuration
+        bnb_config = BitsAndBytesConfig(
+            load_in_4bit=True,
+            bnb_4bit_quant_type="nf4",
+            bnb_4bit_compute_dtype=torch.bfloat16,
+            bnb_4bit_use_double_quant=False,
+        )
+        # NOTE(review): trust_remote_code=True lets code shipped in the Hub
+        # repo run locally; it is probably unnecessary for a Mistral-based
+        # checkpoint -- confirm and drop if so.
+        model = AutoModelForCausalLM.from_pretrained(
+            model_name,
+            quantization_config=bnb_config,
+            torch_dtype=torch.bfloat16,
+            device_map="auto",
+            trust_remote_code=True,
+        )
+        # This app only runs inference, so the training-only steps are
+        # intentionally omitted: no prepare_model_for_kbit_training, no new
+        # (untrained) LoRA adapter, and the KV cache stays enabled.
+        # The tokenizer is taken from the base model the checkpoint was
+        # fine-tuned from.
+        tokenizer = AutoTokenizer.from_pretrained(base_model, trust_remote_code=True)
+    elif selected_model_name == "Mistral":
+        # Setup for Mistral 7B
+        # NOTE(review): this loads the checkpoint with default dtype and
+        # device placement; verify the host has enough memory.
+        model = AutoModelForCausalLM.from_pretrained(
+            model_links[selected_model_name]
+        )
+        tokenizer = AutoTokenizer.from_pretrained(model_links[selected_model_name])
+    else:
+        # Fail with a clear message instead of an UnboundLocalError at return.
+        raise ValueError(f"Unsupported model: {selected_model_name!r}")
+    return model, tokenizer
 # Initialize chat history
 if "messages" not in st.session_state:
     st.session_state.messages = []
+# Load the selected model
+model, tokenizer = load_model(selected_model)
+st.subheader(f"AI - {selected_model}")
+# Display previous chat messages
 for message in st.session_state.messages:
     with st.chat_message(message["role"]):
         st.markdown(message["content"])
+# User input for conversation
+if prompt := st.chat_input("Ask a question"):
+    # Display user input
     with st.chat_message("user"):
         st.markdown(prompt)
+    # Store the user message
+    st.session_state.messages.append({"role": "user", "content": prompt})
+    # Generate the assistant's response
     with st.chat_message("assistant"):
+        pipe = pipeline(
+            task="text-generation",
+            model=model,
+            tokenizer=tokenizer,
+            max_length=1024,
+            # Return only the completion, not the prompt echoed back in
+            # front of it.
+            return_full_text=False,
         )
+        # Sampling requires a strictly positive temperature, so the slider
+        # minimum (0.0) falls back to greedy decoding instead of erroring.
+        if temp_values > 0:
+            generation_kwargs = {"do_sample": True, "temperature": temp_values}
+        else:
+            generation_kwargs = {"do_sample": False}
+        # Mistral instruct format: the instruction is closed with [/INST].
+        # No literal <s> or </s> here; the tokenizer is expected to add the
+        # BOS token, and an EOS after the prompt would mark the sequence as
+        # already finished.
+        result = pipe(f"[INST] {prompt} [/INST]", **generation_kwargs)
+        response = result[0]["generated_text"].strip()
+        st.markdown(response)
+    # Store the assistant's response
+    st.session_state.messages.append({"role": "assistant", "content": response})