File size: 728 Bytes
a59bc9c
70bcdad
ffd4434
ee24018
834791f
70bcdad
776a762
ee24018
70bcdad
776a762
70bcdad
 
776a762
70bcdad
776a762
 
 
 
 
 
 
834791f
ee24018
 
776a762
ee24018
 
 
776a762
70bcdad
 
776a762
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
import gradio as gr
from huggingface_hub import InferenceClient

# Module-level inference client created for the "HuggingFaceH4/zephyr-7b-beta"
# model id; respond() below sends its chat-completion requests through it.
client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")

def respond(message, history):
    """Stream a chat reply to *message*, yielding the growing response text.

    Builds a chat message list (a fixed system prompt, the prior turns, then
    the new user message), sends it to the module-level ``client`` with
    streaming enabled, and yields the accumulated reply each time a streamed
    chunk carries text.

    Args:
        message: The user's newest message; sent as the final "user" turn.
        history: Prior conversation turns. When truthy it is appended to the
            message list unchanged. Presumably a list of role/content dicts
            as supplied by ``gr.ChatInterface(type="messages")`` -- confirm
            against the Gradio version in use.

    Yields:
        The response text accumulated so far, once for every streamed chunk
        whose delta content is not ``None``.
    """
    messages = [{"role": "system", "content": "You are a friendly chatbot."}]

    if history:
        messages.extend(history)

    messages.append({"role": "user", "content": message})

    stream = client.chat_completion(
        messages,
        max_tokens=100,
        temperature=1.2,
        stream=True,
    )

    response = ""

    # The loop variable is named ``chunk`` so it does not rebind the
    # ``message`` parameter.
    for chunk in stream:
        # A chunk with an empty ``choices`` list has no delta to read; skip it
        # rather than letting ``choices[0]`` raise IndexError mid-stream.
        if not chunk.choices:
            continue

        token = chunk.choices[0].delta.content

        if token is not None:
            response += token
            yield response

# Build the chat UI with respond() as its handler. type="messages" is
# presumably what makes history arrive as role/content dicts, which respond()
# forwards to the model unchanged -- confirm against the Gradio docs.
chatbot = gr.ChatInterface(respond, type="messages")

# Start the Gradio app; this runs at import time because there is no
# __main__ guard.
chatbot.launch()