import base64
import io
import os
import time

import requests
import soundfile as sf
import streamlit as st
import torch
from IPython.display import Audio as IPythonAudio
from PIL import Image
from pydub import AudioSegment

from transformers import load_tool
from transformers import AutoModelForCausalLM, AutoTokenizer, Agent, LocalAgent


def play_audio(audio):
    # Write the waveform tensor to disk, then wrap the file for playback.
    sf.write("speech_converted.wav", audio.numpy(), samplerate=16000)
    return IPythonAudio("speech_converted.wav")

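# Optional local alternative, left commented out below: instead of calling a
# hosted Inference API endpoint, the agent can run a local checkpoint through
# transformers' LocalAgent, as sketched here with the agentlm-7b checkpoint.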
# checkpoint = "THUDM/agentlm-7b"
# model = AutoModelForCausalLM.from_pretrained(checkpoint, device_map="auto", torch_dtype=torch.bfloat16)
# tokenizer = AutoTokenizer.from_pretrained(checkpoint)

# agent = LocalAgent(model, tokenizer)
# agent.run("Draw me a picture of rivers and lakes.")

# print(agent.run("Is the following `text` (in Spanish) positive or negative?", text="¡Este es un API muy agradable!"))

# Load tools from the Hub
random_character_tool = load_tool("Chris4K/random-character-tool")
text_generation_tool = load_tool("Chris4K/text-generation-tool")
#sentiment_tool = load_tool("Chris4K/sentiment-tool")
token_counter_tool = load_tool("Chris4K/token-counter-tool")
most_downloaded_model = load_tool("Chris4K/most-downloaded-model")
#rag_tool = load_tool("Chris4K/rag-tool")
word_counter_tool = load_tool("Chris4K/word-counter-tool")
sentence_counter_tool = load_tool("Chris4K/sentence-counter-tool")
emojify_text_tool = load_tool("Chris4K/EmojifyTextTool")
named_entity_recognition_tool = load_tool("Chris4K/NamedEntityRecognitionTool")
text_download_tool = load_tool("Chris4K/TextDownloadTool")
source_code_retriever_tool = load_tool("Chris4K/source-code-retriever-tool")

text_to_image = load_tool("Chris4K/text-to-image")
text_to_video = load_tool("Chris4K/text-to-video")
image_transformation = load_tool("Chris4K/image-transformation")
latent_upscaler_tool = load_tool("Chris4K/latent-upscaler-tool")

# Tools offered to the agent (note: text_download_tool is loaded but not registered here)
tools = [
    random_character_tool,
    text_generation_tool,
    #sentiment_tool,
    token_counter_tool,
    most_downloaded_model,
    word_counter_tool,
    sentence_counter_tool,
    emojify_text_tool,
    named_entity_recognition_tool,
    source_code_retriever_tool,
    text_to_image,
    text_to_video,
    image_transformation,
    latent_upscaler_tool,
]
 
# Custom Agent subclass that calls a Hugging Face Inference API endpoint and
# accepts extra generation parameters (e.g. max_new_tokens) via input_params.
class CustomHfAgent(Agent):
    def __init__(
        self, url_endpoint, token=None, chat_prompt_template=None, run_prompt_template=None, additional_tools=None, input_params=None
    ):
        super().__init__(
            chat_prompt_template=chat_prompt_template,
            run_prompt_template=run_prompt_template,
            additional_tools=additional_tools,
        )
        self.url_endpoint = url_endpoint
        self.token = token if token is not None else os.environ["HF_token"]
        self.input_params = input_params or {}

    def generate_one(self, prompt, stop):
        # The Inference API expects an "Authorization: Bearer <token>" header.
        auth = self.token if self.token.startswith(("Bearer", "Basic")) else f"Bearer {self.token}"
        headers = {"Authorization": auth}

        # Use the value from input_params, or a default if not provided
        max_new_tokens = self.input_params.get("max_new_tokens", 192)
        parameters = {
            "max_new_tokens": max_new_tokens,
            "return_full_text": False,
            "stop": stop,
            "padding": True,
            "truncation": True,
        }
        inputs = {
            "inputs": prompt,
            "parameters": parameters,
        }

        response = requests.post(self.url_endpoint, json=inputs, headers=headers)

        if response.status_code == 429:
            print("Getting rate-limited, waiting a tiny bit before trying again.")
            time.sleep(1)
            return self.generate_one(prompt, stop)
        elif response.status_code != 200:
            raise ValueError(f"Error {response.status_code}: {response.json()}")

        result = response.json()[0]["generated_text"]
        # The Inference API returns the stop sequence; strip it off
        for stop_seq in stop:
            if result.endswith(stop_seq):
                return result[: -len(stop_seq)]
        return result
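# A minimal smoke test for the agent outside Streamlit, assuming the HF_token
# environment variable is set (the endpoint mirrors the one used in
# handle_submission below):
#
#   agent = CustomHfAgent(
#       url_endpoint="https://api-inference.huggingface.co/models/bigscience/bloom",
#       additional_tools=tools,
#       input_params={"max_new_tokens": 192},
#   )
#   print(agent.run("How many words are in this sentence?"))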

#################
# Callback: build the agent from the selected tools and run the user's message.
def handle_submission(user_message):
    selected_tools = [tools[idx] for idx, checkbox in enumerate(tool_checkboxes) if checkbox]
    print(selected_tools)
    # Initialize the agent with the chosen endpoint and the selected tools
    agent = CustomHfAgent(
        #url_endpoint="https://api-inference.huggingface.co/models/bigcode/starcoder", # mistralai/Mixtral-8x7B-v0.1 # bigscience/bloom
        url_endpoint="https://api-inference.huggingface.co/models/bigscience/bloom",
        token=os.environ['HF_token'],
        additional_tools=selected_tools,
        input_params={"max_new_tokens": 192},
    )

    response = agent.run(user_message)
    print(f"Agent Response\n{response}")
    return response
#################

st.title("Hugging Face Agent and tools")

# Initialize chat history
if "messages" not in st.session_state:
    st.session_state.messages = []

# Display chat messages from history on app rerun
for message in st.session_state.messages:
    with st.chat_message(message["role"]):
        st.markdown(message["content"])
        
# Checkboxes for the tools to be used by the agent
tool_checkboxes = [st.checkbox(f"{tool.name} --- {tool.description}") for tool in tools]

# Display a welcome message
with st.chat_message("assistant"):
    st.markdown("Hello there! How can I assist you today?")
 

# React to user input
if user_message := st.chat_input("Enter message"):
    # Display user message in chat message container
    st.chat_message("user").markdown(user_message)
    # Add user message to chat history
    st.session_state.messages.append({"role": "user", "content": user_message})

    response = handle_submission(user_message)

    # Display the agent's response, dispatching on the response type
    # (see https://docs.streamlit.io/library/cheatsheet)
    with st.chat_message("assistant"):
        if response is None:
            st.warning("The agent's response is None. Please try again.")
        elif isinstance(response, Image.Image):
            st.image(response)
        elif isinstance(response, AudioSegment):
            # Export the pydub segment to WAV bytes, which st.audio can play
            st.audio(response.export(format="wav").read())
        elif isinstance(response, str) and "audio" in response:
            # Assumes a base64-encoded data URL such as "data:audio/wav;base64,<payload>"
            audio_data = base64.b64decode(response.split(",")[1])
            audio = AudioSegment.from_file(io.BytesIO(audio_data))
            st.audio(audio.export(format="wav").read())
        elif isinstance(response, (str, int)):
            st.markdown(str(response))
        else:
            st.warning("Unrecognized response type. Please try again.")

    # Add the assistant's response to chat history
    st.session_state.messages.append({"role": "assistant", "content": response})


# Submit button
#submit_button = st.button("Submit")
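# To try the app locally (assuming this file is saved as app.py and HF_token
# is set in the environment):
#
#   streamlit run app.py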