Spaces:

undetectable
/

voice-clone

Configuration error

App Files Community

renator committed on Jan 25, 2024

Commit

e0491f4

1 Parent(s): f96db58

checking times

Browse files

Files changed (3) hide show

Dockerfile +2 -1
project.log +0 -0
texttovoice/views.py +26 -13

Dockerfile CHANGED Viewed

@@ -38,7 +38,8 @@ COPY packages/matching.py /usr/local/lib/python3.10/site-packages/librosa/util/m
 COPY packages/spectrum.py /usr/local/lib/python3.10/site-packages/librosa/core/spectrum.py
 COPY packages/pitch.py /usr/local/lib/python3.10/site-packages/librosa/core/pitch.py
 RUN chmod -R 777 /usr/local/lib/python3.10/site-packages/librosa \
-    && chmod 777 /tmp && mkdir /.local && chmod -R 777 /.local  && mkdir /.cache && chmod -R 777 /.cache
 # Set the environment variable for the NUMBA cache directory

 COPY packages/spectrum.py /usr/local/lib/python3.10/site-packages/librosa/core/spectrum.py
 COPY packages/pitch.py /usr/local/lib/python3.10/site-packages/librosa/core/pitch.py
 RUN chmod -R 777 /usr/local/lib/python3.10/site-packages/librosa \
+    && chmod 777 /tmp && mkdir /.local && chmod -R 777 /.local  && mkdir /.cache && chmod -R 777 /.cache && \
+     mkdir /.config && chmod -R 777  /.config
 # Set the environment variable for the NUMBA cache directory

project.log ADDED Viewed

The diff for this file is too large to render. See raw diff

texttovoice/views.py CHANGED Viewed

@@ -1,5 +1,8 @@
 import os
 import uuid
 from django.http import FileResponse
 from rest_framework import status
 from rest_framework.response import Response
@@ -14,6 +17,9 @@ from drf_yasg import openapi
 from drf_yasg.utils import swagger_auto_schema
 class TextToSpeechCreateView(CreateAPIView):
     serializer_class = TextToSpeechSerializer
     authentication_classes = [TokenAuthentication]  # Apply token authentication
@@ -43,19 +49,16 @@ class TextToSpeechCreateView(CreateAPIView):
     def create(self, request, *args, **kwargs):
         serializer = self.get_serializer(data=request.data)
         if serializer.is_valid():
             text = serializer.validated_data.get("text")
             speaker_wav = serializer.validated_data.get("speaker_wav")
             language = serializer.validated_data.get("language")
             output_filename = f"output_{uuid.uuid4()}.wav"
-            # try:
-            # Define the directory path
-            tmp_dir = "/.local"
-            # Check if the directory exists and create it if it doesn't
-            if not os.path.exists(tmp_dir):
-                os.makedirs(tmp_dir)
-            print("before creating the speaker file path", os.path)
             # Save the uploaded speaker file to a temporary location
             speaker_file_path = os.path.join('/tmp', speaker_wav.name)
@@ -63,12 +66,16 @@ class TextToSpeechCreateView(CreateAPIView):
                 for chunk in speaker_wav.chunks():
                     destination.write(chunk)
-            print("after creating the speaker file path",speaker_file_path)
             # Generate speech using tts.tts_to_file
-            tts = TTS("tts_models/multilingual/multi-dataset/xtts_v2", gpu=False)
             tts.tts_to_file(text=text, file_path=output_filename, speaker_wav=speaker_file_path, language=language)
             # Define a function to delete the output file
             def file_iterator(file_name):
                 with open(file_name, 'rb') as f:
@@ -86,10 +93,16 @@ class TextToSpeechCreateView(CreateAPIView):
             # TextToSpeech.objects.create(
             # text=text,
             # speaker_wav=speaker_wav,
             # language=language,
             # created_by=request.user  # Assign the authenticated user here
-            #     )
-            response = FileResponse(file_iterator(output_filename), as_attachment=True, content_type='audio/wav')
             return response
             # except Exception as e:

 import os
 import uuid
+import time
+import logging  # Import the logging module
+import torch
 from django.http import FileResponse
 from rest_framework import status
 from rest_framework.response import Response
 from drf_yasg.utils import swagger_auto_schema
+# Initialize logger at module level
+logger = logging.getLogger(__name__)
 class TextToSpeechCreateView(CreateAPIView):
     serializer_class = TextToSpeechSerializer
     authentication_classes = [TokenAuthentication]  # Apply token authentication
     def create(self, request, *args, **kwargs):
         serializer = self.get_serializer(data=request.data)
         if serializer.is_valid():
+            gpu_available = torch.cuda.is_available()
             text = serializer.validated_data.get("text")
             speaker_wav = serializer.validated_data.get("speaker_wav")
             language = serializer.validated_data.get("language")
             output_filename = f"output_{uuid.uuid4()}.wav"
+            # Log the start time
+            start_time = time.time()
+            print("start", start_time)
+            logger.info(f"start time: {start_time} ")
             # Save the uploaded speaker file to a temporary location
             speaker_file_path = os.path.join('/tmp', speaker_wav.name)
                 for chunk in speaker_wav.chunks():
                     destination.write(chunk)
             # Generate speech using tts.tts_to_file
+            tts = TTS("tts_models/multilingual/multi-dataset/xtts_v2", gpu=gpu_available)
             tts.tts_to_file(text=text, file_path=output_filename, speaker_wav=speaker_file_path, language=language)
+            # Log the end time
+            end_time = time.time()
+            # Calculate the processing time
+            processing_time = end_time - start_time
             # Define a function to delete the output file
             def file_iterator(file_name):
                 with open(file_name, 'rb') as f:
             # TextToSpeech.objects.create(
             # text=text,
             # speaker_wav=speaker_wav,
+            # output_wav=output_filename,
             # language=language,
             # created_by=request.user  # Assign the authenticated user here
+            # )
+            response = FileResponse(output_filename, as_attachment=True, content_type='audio/wav')
+            # Log the processing time using the logger
+            logger.info(f"start time: {start_time} , end time: {end_time} and Processing time: {processing_time} seconds")
+            print(f"start time: {start_time} , end time: {end_time} and Processing time: {processing_time} seconds")
             return response
             # except Exception as e: