Spaces:
Running
Running
Update app.py
Browse files
Added gpt-4o speech generation support, o3/o4 support
app.py
CHANGED
@@ -459,8 +459,11 @@ STANDARD_TEXT_MODELS = [
|
|
459 |
"o1-2024-12-17",
|
460 |
"o1-preview-2024-09-12",
|
461 |
"o1-preview",
|
|
|
462 |
"o3-mini",
|
463 |
"o3-mini-2025-01-31",
|
|
|
|
|
464 |
"gpt-4o-2024-08-06",
|
465 |
"gpt-4o",
|
466 |
"gpt-4o-mini-2024-07-18",
|
@@ -475,6 +478,7 @@ STANDARD_TEXT_MODELS = [
|
|
475 |
STANDARD_AUDIO_MODELS = [
|
476 |
"tts-1",
|
477 |
"tts-1-hd",
|
|
|
478 |
]
|
479 |
|
480 |
STANDARD_VOICES = [
|
@@ -484,6 +488,9 @@ STANDARD_VOICES = [
|
|
484 |
"onyx",
|
485 |
"nova",
|
486 |
"shimmer",
|
|
|
|
|
|
|
487 |
]
|
488 |
|
489 |
class DialogueItem(BaseModel):
|
@@ -735,7 +742,8 @@ with gr.Blocks(title="PDF to Audio", css="""
|
|
735 |
audio_model = gr.Dropdown(
|
736 |
label="Audio Generation Model",
|
737 |
choices=STANDARD_AUDIO_MODELS,
|
738 |
-
value="tts-1",
|
|
|
739 |
info="Select the model to generate the audio.",
|
740 |
)
|
741 |
speaker_1_voice = gr.Dropdown(
|
|
|
459 |
"o1-2024-12-17",
|
460 |
"o1-preview-2024-09-12",
|
461 |
"o1-preview",
|
462 |
+
"o1-pro",
|
463 |
"o3-mini",
|
464 |
"o3-mini-2025-01-31",
|
465 |
+
"o3",
|
466 |
+
"o4-mini",
|
467 |
"gpt-4o-2024-08-06",
|
468 |
"gpt-4o",
|
469 |
"gpt-4o-mini-2024-07-18",
|
|
|
478 |
STANDARD_AUDIO_MODELS = [
|
479 |
"tts-1",
|
480 |
"tts-1-hd",
|
481 |
+
"gpt-4o-mini-tts",
|
482 |
]
|
483 |
|
484 |
STANDARD_VOICES = [
|
|
|
488 |
"onyx",
|
489 |
"nova",
|
490 |
"shimmer",
|
491 |
+
"verse",
|
492 |
+
"sage",
|
493 |
+
"coral",
|
494 |
]
|
495 |
|
496 |
class DialogueItem(BaseModel):
|
|
|
742 |
audio_model = gr.Dropdown(
|
743 |
label="Audio Generation Model",
|
744 |
choices=STANDARD_AUDIO_MODELS,
|
745 |
+
value="gpt-4o-mini-tts",
|
746 |
+
#value="tts-1",
|
747 |
info="Select the model to generate the audio.",
|
748 |
)
|
749 |
speaker_1_voice = gr.Dropdown(
|