Spaces:
Runtime error
Runtime error
StormblessedKal
commited on
Commit
•
e13b6d4
1
Parent(s):
5dfe293
add new parameter
Browse files- src/__pycache__/predict.cpython-310.pyc +0 -0
- src/__pycache__/rp_schema.cpython-310.pyc +0 -0
- src/predict.py +31 -34
- src/rp_handler.py +5 -1
- src/rp_schema.py +5 -1
src/__pycache__/predict.cpython-310.pyc
CHANGED
Binary files a/src/__pycache__/predict.cpython-310.pyc and b/src/__pycache__/predict.cpython-310.pyc differ
|
|
src/__pycache__/rp_schema.cpython-310.pyc
CHANGED
Binary files a/src/__pycache__/rp_schema.cpython-310.pyc and b/src/__pycache__/rp_schema.cpython-310.pyc differ
|
|
src/predict.py
CHANGED
@@ -204,7 +204,7 @@ class Predictor:
|
|
204 |
return {"url": file_url}
|
205 |
|
206 |
|
207 |
-
def predict(self,s3_url,passage,process_audio):
|
208 |
output_dir = 'processed'
|
209 |
gen_id = str(uuid.uuid4())
|
210 |
os.makedirs(output_dir,exist_ok=True)
|
@@ -222,41 +222,38 @@ class Predictor:
|
|
222 |
local_file_path = os.path.join(raw_dir,s3_key)
|
223 |
self.download_file_from_s3(self.s3_client,bucket_name,s3_key,local_file_path)
|
224 |
#voice_clone with styletts2
|
225 |
-
|
226 |
-
|
227 |
-
|
228 |
-
|
229 |
-
|
230 |
-
|
231 |
-
|
232 |
-
|
233 |
-
|
234 |
-
|
235 |
-
|
236 |
-
|
237 |
-
|
238 |
-
|
239 |
-
|
240 |
-
|
241 |
-
|
242 |
-
|
243 |
-
|
244 |
-
(
|
245 |
-
|
246 |
-
|
247 |
-
|
248 |
-
|
249 |
-
|
250 |
-
|
251 |
-
|
252 |
-
|
253 |
-
print(mp3_final_output_2)
|
254 |
|
255 |
-
self.upload_file_to_s3(
|
256 |
-
self.upload_file_to_s3(mp3_final_output_2,'demovidelyusergenerations',f"{gen_id}-voice-clone-2.mp3")
|
257 |
shutil.rmtree(os.path.join(output_dir,gen_id))
|
258 |
-
return {"
|
259 |
-
"voice_clone_2":f"https://demovidelyusergenerations.s3.amazonaws.com/{gen_id}-voice-clone-2.mp3"
|
260 |
}
|
261 |
|
262 |
|
|
|
204 |
return {"url": file_url}
|
205 |
|
206 |
|
207 |
+
def predict(self,s3_url,passage,process_audio,run_type='styletts2'):
|
208 |
output_dir = 'processed'
|
209 |
gen_id = str(uuid.uuid4())
|
210 |
os.makedirs(output_dir,exist_ok=True)
|
|
|
222 |
local_file_path = os.path.join(raw_dir,s3_key)
|
223 |
self.download_file_from_s3(self.s3_client,bucket_name,s3_key,local_file_path)
|
224 |
#voice_clone with styletts2
|
225 |
+
if run_type == 'styletts2':
|
226 |
+
model,sampler = self.model,self.sampler
|
227 |
+
result = self.process_audio_file(local_file_path,passage,model,sampler)
|
228 |
+
final_output = os.path.join(results_dir,f"{gen_id}-voice-clone-1.wav")
|
229 |
+
|
230 |
+
sf.write(final_output,result,24000)
|
231 |
+
if process_audio:
|
232 |
+
(new_sr, wav1) = self._fn(final_output,"Midpoint",32,0.5)
|
233 |
+
sf.write(final_output,wav1,new_sr)
|
234 |
+
mp3_final_output = str(final_output).replace('wav','mp3')
|
235 |
+
self.convert_wav_to_mp3(final_output,mp3_final_output)
|
236 |
+
|
237 |
+
if run_type == 'openvoice':
|
238 |
+
s_ref = self.compute_style(local_file_path, self.model)
|
239 |
+
base_speaker_tts,tone_color_converter = self.base_speaker_tts,self.tone_color_converter
|
240 |
+
reference_speaker = local_file_path
|
241 |
+
target_se, audio_name = se_extractor.get_se(reference_speaker, tone_color_converter, target_dir=openvoice_dir, vad=False)
|
242 |
+
src_path = os.path.join(results_dir,f"{gen_id}-tmp.wav")
|
243 |
+
openvoice_output = os.path.join(results_dir,f"{gen_id}-voice-clone-2.wav")
|
244 |
+
base_speaker_tts.tts(passage,src_path,speaker='default',language='English',speed=1.0)
|
245 |
+
|
246 |
+
source_se = torch.load(f'{self.ckpt_base}/en_default_se.pth').to(self.device)
|
247 |
+
tone_color_converter.convert(audio_src_path=src_path,src_se=source_se,tgt_se=target_se,output_path=openvoice_output,message='')
|
248 |
+
if process_audio:
|
249 |
+
(new_sr, wav1) = self._fn(openvoice_output,"Midpoint",32,0.5)
|
250 |
+
sf.write(openvoice_output,wav1,new_sr)
|
251 |
+
mp3_final_output = str(openvoice_output).replace('wav','mp3')
|
252 |
+
self.convert_wav_to_mp3(openvoice_output,mp3_final_output)
|
|
|
253 |
|
254 |
+
self.upload_file_to_s3(mp3_final_output,'demovidelyusergenerations',f"{gen_id}-voice-clone.mp3")
|
|
|
255 |
shutil.rmtree(os.path.join(output_dir,gen_id))
|
256 |
+
return {"voice_clone":f"https://demovidelyusergenerations.s3.amazonaws.com/{gen_id}-voice-clone.mp3"
|
|
|
257 |
}
|
258 |
|
259 |
|
src/rp_handler.py
CHANGED
@@ -50,7 +50,11 @@ def run_voice_clone_job(job):
|
|
50 |
process_audio = False
|
51 |
|
52 |
if method_type == 'voice_clone':
|
53 |
-
|
|
|
|
|
|
|
|
|
54 |
if method_type == 'voice_clone_with_emotions':
|
55 |
result = MODEL.predict_with_emotions(s3_url,passage,process_audio)
|
56 |
if method_type == 'voice_clone_with_multi_lang':
|
|
|
50 |
process_audio = False
|
51 |
|
52 |
if method_type == 'voice_clone':
|
53 |
+
run_type = job_input.get('run_type')
|
54 |
+
if run_type is not None:
|
55 |
+
result = MODEL.predict(s3_url,passage,process_audio,run_type)
|
56 |
+
else:
|
57 |
+
result = MODEL.predict(s3_url,passage,process_audio)
|
58 |
if method_type == 'voice_clone_with_emotions':
|
59 |
result = MODEL.predict_with_emotions(s3_url,passage,process_audio)
|
60 |
if method_type == 'voice_clone_with_multi_lang':
|
src/rp_schema.py
CHANGED
@@ -28,6 +28,10 @@ INPUT_VALIDATIONS = {
|
|
28 |
'type': bool,
|
29 |
'required': False,
|
30 |
'default': False
|
|
|
|
|
|
|
|
|
|
|
31 |
}
|
32 |
-
|
33 |
}
|
|
|
28 |
'type': bool,
|
29 |
'required': False,
|
30 |
'default': False
|
31 |
+
},
|
32 |
+
'run_type': {
|
33 |
+
'type': str,
|
34 |
+
'required': False,
|
35 |
+
'default': False
|
36 |
}
|
|
|
37 |
}
|