Spaces:

AIGC-Audio
/

AudioGPT

Build error

App Files Files Community

lmzjms commited on Apr 4, 2023

Commit

d3ddefb

1 Parent(s): 9382970

Update app.py

Browse files

Files changed (1) hide show

app.py +5 -5

app.py CHANGED Viewed

@@ -164,7 +164,7 @@ class ConversationBot:
         self.tts = TTS(device="cpu")
         # self.t2s = T2S(device="cuda:0")
         # self.i2a = I2A(device="cpu")
-        # self.a2t = A2T(device="cpu")
         # self.asr = ASR(device="cuda:0")
         # self.inpaint = Inpaint(device="cpu")
         #self.tts_ood = TTS_OOD(device="cuda:0")
@@ -191,13 +191,13 @@ class ConversationBot:
             #                  "The input to this tool should be a comma seperated string of three, representing text, note and duration sequence since User Input Text, Note and Duration Sequence are all provided."),
             Tool(name="Synthesize Speech Given the User Input Text", func=self.tts.inference,
                  description="useful for when you want to convert a user input text into speech audio it saved it to a file."
-                             "The input to this tool should be a string, representing the text used to be converted to speech.")]
             # Tool(name="Generate Audio From The Image", func=self.i2a.inference,
             #      description="useful for when you want to generate an audio based on an image."
             #                   "The input to this tool should be a string, representing the image_path. "),
-            # Tool(name="Generate Text From The Audio", func=self.a2t.inference,
-            #      description="useful for when you want to describe an audio in text, receives audio_path as input."
-            #                  "The input to this tool should be a string, representing the audio_path."),
             # Tool(name="Audio Inpainting", func=self.inpaint.show_mel_fn,
             #      description="useful for when you want to inpaint a mel spectrum of an audio and predict this audio, this tool will generate a mel spectrum and you can inpaint it, receives audio_path as input, "
             #                  "The input to this tool should be a string, representing the audio_path.")]

         self.tts = TTS(device="cpu")
         # self.t2s = T2S(device="cuda:0")
         # self.i2a = I2A(device="cpu")
+        self.a2t = A2T(device="cpu")
         # self.asr = ASR(device="cuda:0")
         # self.inpaint = Inpaint(device="cpu")
         #self.tts_ood = TTS_OOD(device="cuda:0")
             #                  "The input to this tool should be a comma seperated string of three, representing text, note and duration sequence since User Input Text, Note and Duration Sequence are all provided."),
             Tool(name="Synthesize Speech Given the User Input Text", func=self.tts.inference,
                  description="useful for when you want to convert a user input text into speech audio it saved it to a file."
+                             "The input to this tool should be a string, representing the text used to be converted to speech."),
             # Tool(name="Generate Audio From The Image", func=self.i2a.inference,
             #      description="useful for when you want to generate an audio based on an image."
             #                   "The input to this tool should be a string, representing the image_path. "),
+            Tool(name="Generate Text From The Audio", func=self.a2t.inference,
+                 description="useful for when you want to describe an audio in text, receives audio_path as input."
+                             "The input to this tool should be a string, representing the audio_path.")]
             # Tool(name="Audio Inpainting", func=self.inpaint.show_mel_fn,
             #      description="useful for when you want to inpaint a mel spectrum of an audio and predict this audio, this tool will generate a mel spectrum and you can inpaint it, receives audio_path as input, "
             #                  "The input to this tool should be a string, representing the audio_path.")]