mjbuehler committed on
Commit
49ffe9d
·
verified ·
1 Parent(s): 215871a

Update app.py

Browse files

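Added gpt-4o-mini-tts speech generation support (now the default audio model) with the new voices verse, sage, and coral, plus o1-pro, o3, and o4-mini text model support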

Files changed (1) hide show
  1. app.py +9 -1
app.py CHANGED
@@ -459,8 +459,11 @@ STANDARD_TEXT_MODELS = [
459
  "o1-2024-12-17",
460
  "o1-preview-2024-09-12",
461
  "o1-preview",
 
462
  "o3-mini",
463
  "o3-mini-2025-01-31",
 
 
464
  "gpt-4o-2024-08-06",
465
  "gpt-4o",
466
  "gpt-4o-mini-2024-07-18",
@@ -475,6 +478,7 @@ STANDARD_TEXT_MODELS = [
475
  STANDARD_AUDIO_MODELS = [
476
  "tts-1",
477
  "tts-1-hd",
 
478
  ]
479
 
480
  STANDARD_VOICES = [
@@ -484,6 +488,9 @@ STANDARD_VOICES = [
484
  "onyx",
485
  "nova",
486
  "shimmer",
 
 
 
487
  ]
488
 
489
  class DialogueItem(BaseModel):
@@ -735,7 +742,8 @@ with gr.Blocks(title="PDF to Audio", css="""
735
  audio_model = gr.Dropdown(
736
  label="Audio Generation Model",
737
  choices=STANDARD_AUDIO_MODELS,
738
- value="tts-1",
 
739
  info="Select the model to generate the audio.",
740
  )
741
  speaker_1_voice = gr.Dropdown(
 
459
  "o1-2024-12-17",
460
  "o1-preview-2024-09-12",
461
  "o1-preview",
462
+ "o1-pro",
463
  "o3-mini",
464
  "o3-mini-2025-01-31",
465
+ "o3",
466
+ "o4-mini",
467
  "gpt-4o-2024-08-06",
468
  "gpt-4o",
469
  "gpt-4o-mini-2024-07-18",
 
478
  STANDARD_AUDIO_MODELS = [
479
  "tts-1",
480
  "tts-1-hd",
481
+ "gpt-4o-mini-tts",
482
  ]
483
 
484
  STANDARD_VOICES = [
 
488
  "onyx",
489
  "nova",
490
  "shimmer",
491
+ "verse",
492
+ "sage",
493
+ "coral",
494
  ]
495
 
496
  class DialogueItem(BaseModel):
 
742
  audio_model = gr.Dropdown(
743
  label="Audio Generation Model",
744
  choices=STANDARD_AUDIO_MODELS,
745
+ value="gpt-4o-mini-tts",
746
+ #value="tts-1",
747
  info="Select the model to generate the audio.",
748
  )
749
  speaker_1_voice = gr.Dropdown(