|
import streamlit as st |
|
import requests |
|
import os |
|
from transformers import MBartForConditionalGeneration, MBart50TokenizerFast |
|
|
|
|
|
Image_Token = os.getenv('Image_generation').strip() |
|
Content_Token = os.getenv('Content_generation','').strip() |
|
Image_prompt_token = os.getenv('Prompt_generation').strip() |
|
|
|
|
|
Image_generation = {"Authorization": f"Bearer {Image_Token}"} |
|
Content_generation = { |
|
"Authorization": f"Bearer {Content_Token}", |
|
"Content-Type": "application/json" |
|
} |
|
Image_Prompt = { |
|
"Authorization": f"Bearer {Image_prompt_token}", |
|
"Content-Type": "application/json" |
|
} |
|
|
|
|
|
image_generation_urls = { |
|
"black-forest-labs/FLUX.1-schnell": "https://api-inference.huggingface.co/models/black-forest-labs/FLUX.1-schnell", |
|
"CompVis/stable-diffusion-v1-4": "https://api-inference.huggingface.co/models/CompVis/stable-diffusion-v1-4", |
|
"black-forest-labs/FLUX.1-dev": "https://api-inference.huggingface.co/models/black-forest-labs/FLUX.1-dev" |
|
} |
|
|
|
|
|
content_models = { |
|
"llama-3.1-70b-versatile": "llama-3.1-70b-versatile", |
|
"llama3-8b-8192": "llama3-8b-8192", |
|
"gemma2-9b-it": "gemma2-9b-it", |
|
"mixtral-8x7b-32768": "mixtral-8x7b-32768" |
|
} |
|
|
|
|
|
@st.cache_resource |
|
def load_translation_model(): |
|
with st.spinner('Loading translation model... Please wait.If you are here for First Time it takes 2 Mins to Please wait'): |
|
model = MBartForConditionalGeneration.from_pretrained("facebook/mbart-large-50-many-to-one-mmt") |
|
tokenizer = MBart50TokenizerFast.from_pretrained("facebook/mbart-large-50-many-to-one-mmt") |
|
return model, tokenizer |
|
|
|
|
|
def translate_text_local(text): |
|
model, tokenizer = load_translation_model() |
|
with st.spinner('Translation is on progress.If you are here for First Time it takes 2 Mins to Please wait'): |
|
inputs = tokenizer(text, return_tensors="pt", max_length=512, truncation=True) |
|
translated_tokens = model.generate(**inputs, forced_bos_token_id=tokenizer.lang_code_to_id["en_XX"]) |
|
translated_text = tokenizer.batch_decode(translated_tokens, skip_special_tokens=True)[0] |
|
return translated_text |
|
|
|
|
|
def generate_content(english_text, max_tokens, temperature, model): |
|
url = "https://api.groq.com/openai/v1/chat/completions" |
|
payload = { |
|
"model": model, |
|
"messages": [ |
|
{"role": "system", "content": "You are a creative and insightful writer."}, |
|
{"role": "user", "content": f"Write educational content about {english_text} within {max_tokens} tokens."} |
|
], |
|
"max_tokens": max_tokens, |
|
"temperature": temperature |
|
} |
|
response = requests.post(url, json=payload, headers=Content_generation) |
|
if response.status_code == 200: |
|
result = response.json() |
|
return result['choices'][0]['message']['content'] |
|
else: |
|
st.error(f"Content Generation Error: {response.status_code}") |
|
return None |
|
|
|
|
|
def generate_image_prompt(english_text): |
|
payload = { |
|
"model": "mixtral-8x7b-32768", |
|
"messages": [ |
|
{"role": "system", "content": "You are a professional Text to image prompt generator."}, |
|
{"role": "user", "content": f"Create a text to image generation prompt about {english_text} within 150 tokens."} |
|
], |
|
"max_tokens": 150 |
|
} |
|
response = requests.post("https://api.groq.com/openai/v1/chat/completions", json=payload, headers=Image_Prompt) |
|
if response.status_code == 200: |
|
result = response.json() |
|
return result['choices'][0]['message']['content'] |
|
else: |
|
st.error(f"Prompt Generation Error: {response.status_code}") |
|
return None |
|
|
|
|
|
def generate_image(image_prompt, model_url): |
|
data = {"inputs": image_prompt} |
|
response = requests.post(model_url, headers=Image_generation, json=data) |
|
if response.status_code == 200: |
|
return response.content |
|
else: |
|
st.error(f"Image Generation Error {response.status_code}: {response.text}") |
|
return None |
|
|
|
|
|
def show_user_guide(): |
|
st.title("FusionMind User Guide") |
|
st.write(""" |
|
### Welcome to the FusionMind User Guide! |
|
### How to use this app: |
|
1. **Input Tamil Text**: |
|
- You can either select one of the suggested Tamil phrases or input your own text. The app primarily focuses on Tamil inputs, but it supports a wide range of other languages as well (see the list below). |
|
2. **Generate Translations**: |
|
- Once you've input your text, the app will automatically translate it to English. The translation model is a **many-to-one model**, meaning it can take input from various languages and translate it into English. |
|
3. **Generate Educational Content**: |
|
- After translating the text into English, the app will generate **educational content** based on the translated input. You can adjust the creativity of the content generation using the temperature slider, and control the length of the output with the token limit setting. |
|
4. **Generate Images**: |
|
- In addition to generating content, the app can also generate an **image** related to the translated content. You don’t need to worry about creating complex image prompts—FusionMind includes an automatic **image prompt generator** that will convert your input into a well-defined image prompt, ensuring better image generation results. |
|
--- |
|
### Features: |
|
- **Multilingual Translation**: |
|
- FusionMind supports a **many-to-one translation model**, so you can input text in a wide variety of languages, not just Tamil. Below are the supported languages: |
|
- **Arabic (ar_AR)**, **Czech (cs_CZ)**, **German (de_DE)**, **English (en_XX)**, **Spanish (es_XX)**, **Estonian (et_EE)**, **Finnish (fi_FI)**, **French (fr_XX)**, **Gujarati (gu_IN)**, **Hindi (hi_IN)**, **Italian (it_IT)**, **Japanese (ja_XX)**, **Kazakh (kk_KZ)**, **Korean (ko_KR)**, **Lithuanian (lt_LT)**, **Latvian (lv_LV)**, **Burmese (my_MM)**, **Nepali (ne_NP)**, **Dutch (nl_XX)**, **Romanian (ro_RO)**, **Russian (ru_RU)**, **Sinhala (si_LK)**, **Turkish (tr_TR)**, **Vietnamese (vi_VN)**, **Chinese (zh_CN)**, **Afrikaans (af_ZA)**, **Azerbaijani (az_AZ)**, **Bengali (bn_IN)**, **Persian (fa_IR)**, **Hebrew (he_IL)**, **Croatian (hr_HR)**, **Indonesian (id_ID)**, **Georgian (ka_GE)**, **Khmer (km_KH)**, **Macedonian (mk_MK)**, **Malayalam (ml_IN)**, **Mongolian (mn_MN)**, **Marathi (mr_IN)**, **Polish (pl_PL)**, **Pashto (ps_AF)**, **Portuguese (pt_XX)**, **Swedish (sv_SE)**, **Swahili (sw_KE)**, **Tamil (ta_IN)**, **Telugu (te_IN)**, **Thai (th_TH)**, **Tagalog (tl_XX)**, **Ukrainian (uk_UA)**, **Urdu (ur_PK)**, **Xhosa (xh_ZA)**, **Galician (gl_ES)**, **Slovene (sl_SI)**. |
|
- **Temperature Adjustment**: |
|
- You can adjust the **temperature** of the content generation. A **higher temperature** makes the content more creative and varied, while a **lower temperature** generates more focused and deterministic responses. |
|
- **Token Limit**: |
|
- Set the **maximum number of tokens** for content generation. This allows you to control the length of the generated educational content. |
|
- **Auto-Generated Image Prompts**: |
|
- One of the unique features of FusionMind is the **auto-generated image prompts**. Even if you're not experienced in creating detailed prompts for image generation, the app will take care of this for you. It automatically converts the translated text or content into a well-defined prompt that produces more accurate and high-quality images. |
|
--- |
|
Enjoy the multimodal experience with **FusionMind** and explore its powerful translation, content generation, and image generation features! |
|
""") |
|
|
|
|
|
def main(): |
|
|
|
st.sidebar.title("FusionMind Options") |
|
page = st.sidebar.radio("Select a page:", ["Main App", "User Guide"]) |
|
|
|
if page == "User Guide": |
|
show_user_guide() |
|
return |
|
|
|
st.title("🅰️ℹ️ FusionMind ➡️ Multimodal") |
|
|
|
|
|
st.sidebar.header("Settings") |
|
temperature = st.sidebar.slider("Select Temperature", 0.1, 1.0, 0.7) |
|
max_tokens = st.sidebar.slider("Max Tokens for Content Generation", 100, 400, 200) |
|
|
|
|
|
content_model = st.sidebar.selectbox("Select Content Generation Model", list(content_models.keys()), index=0) |
|
|
|
|
|
image_model = st.sidebar.selectbox("Select Image Generation Model", list(image_generation_urls.keys()), index=0) |
|
|
|
|
|
st.write("## Suggested Inputs") |
|
suggestions = ["தரவு அறிவியல்", "உளவியல்", "ராக்கெட் எப்படி வேலை செய்கிறது"] |
|
selected_suggestion = st.selectbox("Select a suggestion or enter your own:", [""] + suggestions) |
|
|
|
|
|
tamil_input = st.text_input("Enter Tamil text (or select a suggestion):", selected_suggestion) |
|
|
|
if st.button("Generate"): |
|
|
|
if tamil_input: |
|
st.write("### Translated English Text:") |
|
english_text = translate_text_local(tamil_input) |
|
if english_text: |
|
st.success(english_text) |
|
|
|
|
|
st.write("### Generated Content:") |
|
with st.spinner('Generating content...'): |
|
content_output = generate_content(english_text, max_tokens, temperature, content_models[content_model]) |
|
if content_output: |
|
st.success(content_output) |
|
|
|
|
|
st.write("### Generated Image:") |
|
with st.spinner('Generating image...'): |
|
image_prompt = generate_image_prompt(english_text) |
|
image_data = generate_image(image_prompt, image_generation_urls[image_model]) |
|
if image_data: |
|
st.image(image_data, caption="Generated Image") |
|
|
|
if __name__ == "__main__": |
|
main() |