Spaces:

davnas
/

provaAncora

Runtime error

App Files Files Community

davnas committed on Dec 8, 2024

Commit

c0b7ba2

verified ·

1 Parent(s): b930272

Update app.py

Browse files

Files changed (1) hide show

app.py +35 -23

app.py CHANGED Viewed

@@ -1,30 +1,26 @@
 import gradio as gr
 from huggingface_hub import InferenceClient
 client = InferenceClient("davnas/Italian_Cousine_2.1")
-def respond(
-    message,
-    history: list[tuple[str, str]],
-    system_message,
-    max_tokens,
-    temperature,
-    top_p,
-):
-    # Format the prompt in the way your working Colab example does
-    prompt = f"User: {message}\nAssistant:"
-    # If you want to include history
     for user_msg, assistant_msg in history:
-        prompt = f"User: {user_msg}\nAssistant: {assistant_msg}\n" + prompt
-    # If you want to include system message
-    if system_message:
-        prompt = f"{system_message}\n" + prompt
-    response = ""
-    # Use text_generation instead of chat_completion
     for token in client.text_generation(
         prompt,
         max_new_tokens=max_tokens,
@@ -35,20 +31,36 @@ def respond(
         response += token
         yield response
 demo = gr.ChatInterface(
     respond,
     additional_inputs=[
-        gr.Textbox(value="You are a friendly Chatbot.", label="System message"),
-        gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
-        gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
         gr.Slider(
             minimum=0.1,
             maximum=1.0,
             value=0.95,
             step=0.05,
-            label="Top-p (nucleus sampling)",
         ),
-    ],
 )
 if __name__ == "__main__":

 import gradio as gr
 from huggingface_hub import InferenceClient
+# Initialize the client
 client = InferenceClient("davnas/Italian_Cousine_2.1")
+def respond(message, history: list[tuple[str, str]], system_message, max_tokens, temperature, top_p):
+    # Format the prompt including history and system message
+    prompt = ""
+    # Add system message if provided
+    if system_message:
+        prompt = f"{system_message}\n"
+    # Add conversation history
     for user_msg, assistant_msg in history:
+        prompt += f"User: {user_msg}\nAssistant: {assistant_msg}\n"
+    # Add current message
+    prompt += f"User: {message}\nAssistant:"
+    response = ""
+    # Stream the response
     for token in client.text_generation(
         prompt,
         max_new_tokens=max_tokens,
         response += token
         yield response
+# Create the interface
 demo = gr.ChatInterface(
     respond,
     additional_inputs=[
+        gr.Textbox(
+            value="You are a friendly Chatbot.",
+            label="System message"
+        ),
+        gr.Slider(
+            minimum=1,
+            maximum=2048,
+            value=512,
+            step=1,
+            label="Max new tokens"
+        ),
+        gr.Slider(
+            minimum=0.1,
+            maximum=4.0,
+            value=0.7,
+            step=0.1,
+            label="Temperature"
+        ),
         gr.Slider(
             minimum=0.1,
             maximum=1.0,
             value=0.95,
             step=0.05,
+            label="Top-p (nucleus sampling)"
         ),
+    ]
 )
 if __name__ == "__main__":