Spaces:

HuggingFaceM4
/

idefics_playground

Runtime error

App Files Files Community

VictorSanh committed on Aug 19, 2023

Commit

69ef035

1 Parent(s): 00346ea

fixes

Browse files

Files changed (1) hide show

app_dialogue.py +6 -7

app_dialogue.py CHANGED Viewed

@@ -15,9 +15,9 @@ from text_generation import Client
 from transformers import AutoProcessor
-MODELS = [  # TODO uncomment
     "HuggingFaceM4/idefics-9b-instruct",
-    # "HuggingFaceM4/idefics-80b-instruct",
 ]
 API_PATHS = {
@@ -326,7 +326,7 @@ with gr.Blocks(title="IDEFICS Playground", theme=gr.themes.Base()) as demo:
                 **EMBARGO UNTIL AUGUST 22ND** This demo showcaes **IDEFICS**, a open-access large visual lanugage model. Like GPT-4, the multimodal model accepts arbitrary sequences of image and text inputs and produces text outputs. IDEFICS can answer questions about images, describe visual content, create stories grounded in multiple images, etc.
                 <br>IDEFICS (which stans for **I**mage-aware **D**ecoder **E**nhanced à la **F**lamingo with **I**nterleaved **C**ross-attention**S**) is an open-access reproduction of [Flamingo](https://huggingface.co/papers/2204.14198), a closed-source visual language model developed by Deepmind. IDEFICS was built solely on publicly available data and models. It is currently the only visual language model of this scale available in open-access.
-                📚 The variants available in this demo were fine-tuned on a mixture of supervised and intruction fine-tuning to make the models more suitable in conversational settings. For more details, we refer to our [blog post](TODO).
                 🅿️ **Intended uses:** This demo along with the [supporting models](https://huggingface.co/models?sort=trending&search=HuggingFaceM4%2Fidefics) are provided as research artefacts to the community. We detail misuses and out-of-scope uses [here](https://huggingface.co/HuggingFaceM4/idefics-80b#misuse-and-out-of-scope-use).
@@ -338,7 +338,7 @@ with gr.Blocks(title="IDEFICS Playground", theme=gr.themes.Base()) as demo:
     with gr.Row(elem_id="model_selector_row"):
         model_selector = gr.Dropdown(
             choices=MODELS,
-            value="HuggingFaceM4/idefics-9b-instruct",
             interactive=True,
             show_label=False,
             container=False,
@@ -555,7 +555,6 @@ with gr.Blocks(title="IDEFICS Playground", theme=gr.themes.Base()) as demo:
         model_selector="HuggingFaceM4/idefics-80b-instruct"
         user_prompt_str=message
         chat_history=[]
-        decoding_strategy="Greedy"
         max_new_tokens=512
         formated_prompt_list, user_prompt_list = format_user_prompt_with_im_history_and_system_conditioning(
@@ -596,7 +595,7 @@ with gr.Blocks(title="IDEFICS Playground", theme=gr.themes.Base()) as demo:
         query = prompt_list_to_tgi_input(formated_prompt_list)
         generated_text = client.generate(prompt=query, **generation_args)
         if generated_text.endswith("\nUser"):
-            generated_text = generate_text[:-5]
         last_turn = chat_history.pop(-1)
         last_turn[-1] += generated_text
@@ -831,7 +830,7 @@ with gr.Blocks(title="IDEFICS Playground", theme=gr.themes.Base()) as demo:
         inputs=[textbox, imagebox],
         outputs=[textbox, imagebox, chatbot],
         fn=process_example,
-        cache_examples=False,
         examples_per_page=6,
         label=(
             "Click on any example below to get started.\nFor convenience, the model generations have been"

 from transformers import AutoProcessor
+MODELS = [
     "HuggingFaceM4/idefics-9b-instruct",
+    "HuggingFaceM4/idefics-80b-instruct",
 ]
 API_PATHS = {
                 **EMBARGO UNTIL AUGUST 22ND** This demo showcaes **IDEFICS**, a open-access large visual lanugage model. Like GPT-4, the multimodal model accepts arbitrary sequences of image and text inputs and produces text outputs. IDEFICS can answer questions about images, describe visual content, create stories grounded in multiple images, etc.
                 <br>IDEFICS (which stans for **I**mage-aware **D**ecoder **E**nhanced à la **F**lamingo with **I**nterleaved **C**ross-attention**S**) is an open-access reproduction of [Flamingo](https://huggingface.co/papers/2204.14198), a closed-source visual language model developed by Deepmind. IDEFICS was built solely on publicly available data and models. It is currently the only visual language model of this scale available in open-access.
+                📚 The variants available in this demo were fine-tuned on a mixture of supervised and intruction fine-tuning to make the models more suitable in conversational settings. For more details, we refer to our [blog post](https://huggingface.co/blog/idefics).
                 🅿️ **Intended uses:** This demo along with the [supporting models](https://huggingface.co/models?sort=trending&search=HuggingFaceM4%2Fidefics) are provided as research artefacts to the community. We detail misuses and out-of-scope uses [here](https://huggingface.co/HuggingFaceM4/idefics-80b#misuse-and-out-of-scope-use).
     with gr.Row(elem_id="model_selector_row"):
         model_selector = gr.Dropdown(
             choices=MODELS,
+            value="HuggingFaceM4/idefics-80b-instruct",
             interactive=True,
             show_label=False,
             container=False,
         model_selector="HuggingFaceM4/idefics-80b-instruct"
         user_prompt_str=message
         chat_history=[]
         max_new_tokens=512
         formated_prompt_list, user_prompt_list = format_user_prompt_with_im_history_and_system_conditioning(
         query = prompt_list_to_tgi_input(formated_prompt_list)
         generated_text = client.generate(prompt=query, **generation_args)
         if generated_text.endswith("\nUser"):
+            generated_text = generated_text[:-5]
         last_turn = chat_history.pop(-1)
         last_turn[-1] += generated_text
         inputs=[textbox, imagebox],
         outputs=[textbox, imagebox, chatbot],
         fn=process_example,
+        cache_examples=True,
         examples_per_page=6,
         label=(
             "Click on any example below to get started.\nFor convenience, the model generations have been"