Oxy-1-Small-Optimisation-Prompt-Engineering

Running

App Files Files Community

TornadoAI committed on Dec 7, 2024

Commit

2dc42b7

verified ·

1 Parent(s): 19626ed

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -8

app.py CHANGED Viewed

@@ -51,16 +51,17 @@ def predict(
         json_response = response.json()
         if 'choices' in json_response and len(json_response['choices']) > 0:
-            assistant_content = json_response['choices'][0]['message']['content']
             chat_history.append({"role": "assistant", "content": assistant_content})
         else:
             chat_history.append({"role": "assistant", "content": "Error: No response from assistant."})
-        return chat_history
     except Exception as e:
         chat_history.append({"role": "assistant", "content": f"Error: {str(e)}"})
-        return chat_history
 css = """
 .gradio-container {
@@ -126,8 +127,8 @@ footer {
 with gr.Blocks(
     theme=gr.themes.Soft(
         primary_hue="orange",
-        secondary_hue="gray",
-        neutral_hue="slate",
         spacing_size="sm",
         radius_size="lg",
         font=["Inter", "ui-sans-serif", "system-ui"]
@@ -196,6 +197,7 @@ with gr.Blocks(
                 step=0.05,
                 label="Top-p"
             )
     def show_chat():
         return gr.update(visible=False), gr.update(visible=True)
@@ -203,7 +205,7 @@ with gr.Blocks(
     msg.submit(
         predict,
         [msg, chatbot, temperature, top_p],
-        chatbot
     ).then(
         lambda: "",
         None,
@@ -213,7 +215,7 @@ with gr.Blocks(
     submit.click(
         predict,
         [msg, chatbot, temperature, top_p],
-        chatbot
     ).then(
         lambda: "",
         None,
@@ -231,4 +233,4 @@ if __name__ == "__main__":
         server_name="0.0.0.0",
         server_port=7860,
         share=True
-    )

         json_response = response.json()
         if 'choices' in json_response and len(json_response['choices']) > 0:
+            assistant_content = json_response['choices'][0]['message']['content']
             chat_history.append({"role": "assistant", "content": assistant_content})
+            stats_content = f"*Powered by Oxygen, Generation time: {json_response["usage"]["metrics"]["inference_time_ms"]} ms , Tokens per second: {json_response["usage"]["metrics"]["tokens_per_second"]} , Generation cost: {round(json_response["usage"]["cost"]["total"],10)} EUR*"
         else:
             chat_history.append({"role": "assistant", "content": "Error: No response from assistant."})
+        return chat_history, stats_content
     except Exception as e:
         chat_history.append({"role": "assistant", "content": f"Error: {str(e)}"})
+        return chat_history, "*Generation error..*"
 css = """
 .gradio-container {
 with gr.Blocks(
     theme=gr.themes.Soft(
         primary_hue="orange",
+        secondary_hue="zinc",
+        neutral_hue="zinc",
         spacing_size="sm",
         radius_size="lg",
         font=["Inter", "ui-sans-serif", "system-ui"]
                 step=0.05,
                 label="Top-p"
             )
+        stats_display = gr.Markdown()
     def show_chat():
         return gr.update(visible=False), gr.update(visible=True)
     msg.submit(
         predict,
         [msg, chatbot, temperature, top_p],
+       [chatbot, stats_display]
     ).then(
         lambda: "",
         None,
     submit.click(
         predict,
         [msg, chatbot, temperature, top_p],
+        [chatbot, stats_display]
     ).then(
         lambda: "",
         None,
         server_name="0.0.0.0",
         server_port=7860,
         share=True
+    )