Spaces:

akhaliq
/

gemini-1.5-flash-8b-exp-0924

Running

App Files Community

akhaliq HF staff committed on Sep 24, 2024

Commit

a15e449

verified ·

1 Parent(s): 3e818ad

Update app.py

Browse files

Files changed (1) hide show

app.py +21 -26

app.py CHANGED Viewed

@@ -1,9 +1,7 @@
 import os
 import google.generativeai as genai
 import gradio as gr
-from gradio_multimodalchatbot import MultimodalChatbot
 from PIL import Image
-import io
 # Configure the API
 genai.configure(api_key=os.environ["GEMINI_API_KEY"])
@@ -17,7 +15,7 @@ generation_config = {
 }
 model = genai.GenerativeModel(
-    model_name="Gemini-1.5-Flash-8B-Exp-0924",
     generation_config=generation_config,
 )
@@ -25,41 +23,38 @@ model = genai.GenerativeModel(
 chat_session = model.start_chat(history=[])
 def process_file(file):
-    if file.type.startswith('image'):
-        return Image.open(file.path)
-    elif file.type.startswith('audio') or file.type.startswith('video'):
-        return file.path
     else:
         return None
-def respond(message, history):
-    files = []
-    for file in message.get('files', []):
-        processed_file = process_file(file['file'])
-        if processed_file:
-            files.append(processed_file)
-    prompt = message['text']
-    if files:
-        response = chat_session.send_message([prompt, *files])
     else:
-        response = chat_session.send_message(prompt)
-    return {"text": response.text, "files": []}
 with gr.Blocks() as demo:
     gr.Markdown("# Gemini Multimodal Chatbot")
     gr.Markdown("Chat with the Gemini 1.5 Pro model. You can send text, images, audio, and video!")
-    chatbot = MultimodalChatbot(
-        height=600,
-        bubble_full_width=False,
-        avatar_images=(None, "https://lh3.googleusercontent.com/d/1pIo02xepBgqt9gMdFkJHSocJfH_A2dqj"),
-        render_markdown=True
-    )
-    chatbot.chat(respond, fill_height=False)
 if __name__ == "__main__":
     demo.launch()

 import os
 import google.generativeai as genai
 import gradio as gr
 from PIL import Image
 # Configure the API
 genai.configure(api_key=os.environ["GEMINI_API_KEY"])
 }
 model = genai.GenerativeModel(
+    model_name="gemini-1.5-pro-latest",
     generation_config=generation_config,
 )
 chat_session = model.start_chat(history=[])
 def process_file(file):
+    if file.name.lower().endswith(('.png', '.jpg', '.jpeg', '.gif', '.bmp')):
+        return Image.open(file.name)
+    elif file.name.lower().endswith(('.mp3', '.wav', '.ogg')):
+        return file.name  # Return the file path for audio
+    elif file.name.lower().endswith(('.mp4', '.avi', '.mov')):
+        return file.name  # Return the file path for video
     else:
         return None
+def respond(message, chat_history, files):
+    processed_files = [process_file(file) for file in files if file is not None]
+    if processed_files:
+        response = chat_session.send_message([message, *processed_files])
     else:
+        response = chat_session.send_message(message)
+    chat_history.append((message, response.text))
+    return "", chat_history
 with gr.Blocks() as demo:
     gr.Markdown("# Gemini Multimodal Chatbot")
     gr.Markdown("Chat with the Gemini 1.5 Pro model. You can send text, images, audio, and video!")
+    chatbot = gr.Chatbot()
+    msg = gr.Textbox()
+    clear = gr.ClearButton([msg, chatbot])
+    file_output = gr.File()
+    upload_button = gr.UploadButton("📁 Upload files", file_types=["image", "audio", "video"], file_count="multiple")
+    msg.submit(respond, [msg, chatbot, upload_button], [msg, chatbot])
 if __name__ == "__main__":
     demo.launch()