Spaces:

mobinln
/

chatbot

Sleeping

mobinln committed on Jun 15, 2024

Commit

9d6f55d

1 Parent(s): 549b996

change to phi3 vision

Files changed (1) hide show

app.py CHANGED Viewed

@@ -4,14 +4,7 @@ from huggingface_hub import InferenceClient
 """
 For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
 """
-choices = [
-    "meta-llama/Meta-Llama-3-8B-Instruct",
-    "microsoft/Phi-3-vision-128k-instruct",
-    "Qwen/Qwen2-0.5B-Instruct",
-]
-client1 = InferenceClient(model=choices[0])
-client2 = InferenceClient(model=choices[1])
-client3 = InferenceClient(model=choices[2])
 def respond(
@@ -21,7 +14,6 @@ def respond(
     max_tokens,
     temperature,
     top_p,
-    model,
 ):
     messages = [{"role": "system", "content": system_message}]
@@ -35,9 +27,6 @@ def respond(
     response = ""
-    client = (
-        client1 if model == choices[0] else client2 if model == choices[1] else client3
-    )
     for message in client.chat_completion(
         messages,
         max_tokens=max_tokens,
@@ -67,7 +56,6 @@ demo = gr.ChatInterface(
             step=0.05,
             label="Top-p (nucleus sampling)",
         ),
-        gr.Dropdown(choices=choices, value=choices[0], label="Model"),
     ],
     multimodal=True,
 )

 """
 For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
 """
+client = InferenceClient(model="microsoft/Phi-3-vision-128k-instruct")
 def respond(
     max_tokens,
     temperature,
     top_p,
 ):
     messages = [{"role": "system", "content": system_message}]
     response = ""
     for message in client.chat_completion(
         messages,
         max_tokens=max_tokens,
             step=0.05,
             label="Top-p (nucleus sampling)",
         ),
     ],
     multimodal=True,
 )