Seed-VC-characters

Running

App Files Files Community

soiz1 committed on Mar 11

Commit

a1bbd98

verified ·

1 Parent(s): 3310f9f

Update app.py

Browse files

Files changed (1) hide show

app.py +26 -42

app.py CHANGED Viewed

@@ -733,36 +733,21 @@ if __name__ == "__main__":
     ).launch()
 import gradio as gr
-# ギャラリーの画像と対応するMP3ファイル
-gallery_data = [
-    {
-        "image": "default/sikokumetan.webp",
-        "mp3": "default/sikokumetan.mp3"
-    }
-]
-# ギャラリーの画像が選択された際の処理
-def on_image_select(image_path):
-    for item in gallery_data:
-        if item["image"] == image_path:
-            return item["mp3"]
-    return None
-# 出力の再定義 (重要)
-outputs = [
-    gr.Audio(label="ストリーム出力音声", streaming=True, format='mp3'),
-    gr.Audio(label="完全出力音声", streaming=False, format='wav')
-]
 if __name__ == "__main__":
     description = ("Zero-shot音声変換モデル（学習不要）。ローカルでの利用方法は[GitHubリポジトリ](https://github.com/Plachtaa/seed-vc)をご覧ください。"
                    "参考音声が25秒を超える場合、自動的に25秒にクリップされます。"
                    "また、元音声と参考音声の合計時間が30秒を超える場合、元音声は分割処理されます。")
     inputs = [
         gr.Audio(type="filepath", label="元音声"),
         gr.Audio(type="filepath", label="参考音声"),
@@ -774,25 +759,24 @@ if __name__ == "__main__":
         gr.Slider(label='音程変換', minimum=-24, maximum=24, step=1, value=0, info="半音単位の音程変換。F0条件付きモデル使用時にのみ有効です"),
     ]
-    # ギャラリーコンポーネントの追加
-    gallery = gr.Gallery(
-        value=[item["image"] for item in gallery_data],
-        label="参考音声選択画像",
-        interactive=True,
-        columns=3
-    )
-    # ギャラリー画像が選択されたときにMP3を自動で設定
-    def update_reference_audio(selected_image):
-        return on_image_select(selected_image)
-    # 参考音声を選択するためのインターフェースを更新
-    gr.Interface(
-        fn=voice_conversion,
-        description=description,
-        inputs=[*inputs, gallery],
-        outputs=outputs,  # ここでoutputsを正しく指定
-        title="Seed Voice Conversion",
-        examples=examples,
-        cache_examples=False,
-    ).launch()

     ).launch()
 import gradio as gr
+gallery_data = {"sikokumetan": {"webp": "default/sikokumetan.webp", "mp3": "default/sikokumetan.mp3"}}
+def update_reference(selected_image):
+    for key, value in gallery_data.items():
+        if value["webp"] == selected_image:
+            return value["mp3"]
+    return ""
 if __name__ == "__main__":
     description = ("Zero-shot音声変換モデル（学習不要）。ローカルでの利用方法は[GitHubリポジトリ](https://github.com/Plachtaa/seed-vc)をご覧ください。"
                    "参考音声が25秒を超える場合、自動的に25秒にクリップされます。"
                    "また、元音声と参考音声の合計時間が30秒を超える場合、元音声は分割処理されます。")
     inputs = [
         gr.Audio(type="filepath", label="元音声"),
         gr.Audio(type="filepath", label="参考音声"),
         gr.Slider(label='音程変換', minimum=-24, maximum=24, step=1, value=0, info="半音単位の音程変換。F0条件付きモデル使用時にのみ有効です"),
     ]
+    examples = [["examples/source/yae_0.wav", "examples/reference/dingzhen_0.wav", 25, 1.0, 0.7, False, True, 0],
+                ["examples/source/jay_0.wav", "examples/reference/azuma_0.wav", 25, 1.0, 0.7, True, True, 0],
+                ["examples/source/Wiz Khalifa,Charlie Puth - See You Again [vocals]_[cut_28sec].wav",
+                 "examples/reference/teio_0.wav", 100, 1.0, 0.7, True, False, 0],
+                ["examples/source/TECHNOPOLIS - 2085 [vocals]_[cut_14sec].wav",
+                 "examples/reference/trump_0.wav", 50, 1.0, 0.7, True, False, -12],
+                ]
+    outputs = [gr.Audio(label="ストリーム出力音声", streaming=True, format='mp3'),
+               gr.Audio(label="完全出力音声", streaming=False, format='wav')]
+    with gr.Blocks() as interface:
+        gr.Interface(fn=voice_conversion, description=description, inputs=inputs, outputs=outputs, title="Seed Voice Conversion", examples=examples, cache_examples=False)
+        with gr.Row():
+            gallery = gr.Gallery(label="ギャラリー", show_label=True)
+            gallery.add([gallery_data["sikokumetan"]["webp"]])
+        gallery.select(update_reference, outputs=inputs[1])
+    interface.launch()