ModelChat

Sleeping

wwpop committed on Oct 10, 2024

Commit

9a86ca9

verified ·

1 Parent(s): af90de5

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -4,7 +4,7 @@ from huggingface_hub import InferenceClient
 """
 For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
 """
-client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
 def respond(
@@ -28,6 +28,7 @@ def respond(
     response = ""
     for message in client.chat_completion(
         messages,
         max_tokens=max_tokens,
         stream=True,
@@ -45,8 +46,8 @@ For information on how to customize the ChatInterface, peruse the gradio docs: h
 demo = gr.ChatInterface(
     respond,
     additional_inputs=[
-        gr.Textbox(value="You are a friendly Chatbot and replay in Chinese.", label="System message"),
-        gr.Slider(minimum=1, maximum=4096, value=1024, step=1, label="Max new tokens"),
         gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
         gr.Slider(
             minimum=0.1,

 """
 For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
 """
+client = InferenceClient(api_key="")
 def respond(
     response = ""
     for message in client.chat_completion(
+        model="Qwen/Qwen2.5-72B-Instruct",
         messages,
         max_tokens=max_tokens,
         stream=True,
 demo = gr.ChatInterface(
     respond,
     additional_inputs=[
+        gr.Textbox(value="You are Qwen, created by Alibaba Cloud. You are a helpful assistant.", label="System message"),
+        gr.Slider(minimum=1, maximum=8888, value=2048, step=1, label="Max new tokens"),
         gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
         gr.Slider(
             minimum=0.1,