Spaces:

ruslanmv
/

Youtube-Video-Translator

Running

App Files Files Community

ruslanmv committed on Feb 4

Commit

b87d15c

verified ·

1 Parent(s): 57f33b1

Update app.py

Browse files

Files changed (1) hide show

app.py +70 -63

app.py CHANGED Viewed

@@ -5,7 +5,7 @@
 # importing all necessary libraries
 import httpcore
-#setattr(httpcore, 'SyncHTTPTransport', 'AsyncHTTPProxy') # This line is problematic and should be removed or corrected based on the intended use.
 import pathlib
 import sys, os
 from gtts import gTTS
@@ -33,13 +33,13 @@ def download_video(url):
 def validate_youtube(url):
     #This creates a youtube object
     try:
-        yt = YouTube(url)
     except Exception:
         print("Hi there URL seems invalid")
         return True
     #This will return the length of the video in sec as an int
     video_length = yt.length
-    if  video_length > 600:
         print("Your video is larger than 10 minutes")
         return True
     else:
@@ -52,7 +52,7 @@ def validate_url(url):
         print("Hi there URL seems invalid ")
         return True
     else:
-        return False
 def cleanup():
@@ -63,16 +63,16 @@ def cleanup():
     junks = []
     for files in types:
         junks.extend(glob.glob(files))
-    try:
         # Deleting those files
         for junk in junks:
             print("Deleting",junk)
             # Setting the path for the file to delete
             file = pathlib.Path(junk)
             # Calling the unlink method on the path
-            file.unlink()
     except Exception:
-        print("I cannot delete the file because it is being used by another process")
 def getSize(filename):
     st = os.stat(filename)
@@ -83,33 +83,33 @@ def clean_transcript(transcript_list):
     script = ""
     for text in transcript_list:
         t = text["text"]
-        if( (t != '[music]')  and \
-            (t != '[Music]')  and \
-            (t != '[музыка]') and \
-            (t != '[Музыка]') and \
-            (t != '[musik]')  and \
-            (t != '[Musik]')  and \
-            (t != '[musica]') and \
-            (t != '[Musica]') and \
-            (t != '[música]') and \
-            (t != '[Música]') and \
             (t != '[音楽]')   and \
-            (t != '[音乐]')
-        ) :
             script += t + " "
     return script
 def get_transcript(url,desired_language):
     id_you= url[url.index("=")+1:]
-    try:
         # retrieve the available transcripts
         transcript_list = YouTubeTranscriptApi.list_transcripts(id_you)
     except Exception:
         print('TranscriptsDisabled:')
         is_translated = False
-        return " ", " ", is_translated
     lista=[]
     transcript_translation_languages=[]
@@ -120,7 +120,7 @@ def get_transcript(url,desired_language):
         transcript.is_generated,
         transcript.is_translatable,
         transcript_translation_languages.append(transcript.translation_languages),
-                    ])
     print(lista)
     n_size=int(len(lista)/4)
     print("There are {} avialable scripts".format(n_size))
@@ -131,12 +131,12 @@ def get_transcript(url,desired_language):
     matrix=matrix.tolist()
     is_manually=False
     is_automatic=False
-    for lista in matrix:
         #print(lista)
         language_code=lista[0]
         is_generated=lista[1]
         is_translatable=lista[2]
-        if not is_generated and is_translatable :
             print("Script found manually generated")
             is_manually=True
             language_code_man=language_code
@@ -144,12 +144,12 @@ def get_transcript(url,desired_language):
             print("Script found automatic generated")
             is_automatic=True
             language_code_au=language_code
     if  is_manually:
         # we try filter for manually created transcripts
         print('We extract manually created transcripts')
-        transcript = transcript_list.find_manually_created_transcript([language_code])
     elif is_automatic:
         print('We  extract generated transcript')
         # or automatically generated ones, but not translated
@@ -169,13 +169,13 @@ def get_transcript(url,desired_language):
                 transcript_translated=transcript_translated.fetch()
                 translated=clean_transcript(transcript_translated)
                 is_translated = True
-    script_translated = ""
     if is_translated :
         script_translated = translated
     transcript=transcript.fetch()
     script = clean_transcript(transcript)
     return script, script_translated, is_translated
 # Set environment variables
@@ -226,7 +226,7 @@ def video_to_translate(url,initial_language,final_language):
     elif final_language == "Vietnamese":
         lang='vi'
     elif final_language == "Japanese":
-        lang='ja'
     # Initial directory
     home_dir= os.getenv('home_dir')
     print('Initial directory:',home_dir)
@@ -272,15 +272,15 @@ def video_to_translate(url,initial_language,final_language):
                     text=text+text_chunk+" "
                 text=str(text)
                 print(type(text))
             else:
                 try:
                         text = r.recognize_google(audio_data, language = lang_in)
                 except Exception:
-                    print("This video cannot be recognized")
-                    cleanup()
-                    return "./demo/tryagain.mp4"
         #print(text)
         print("Destination language ",lang)
@@ -294,20 +294,20 @@ def video_to_translate(url,initial_language,final_language):
             print("This text cannot be translated")
             cleanup()
             return "./demo/tryagain.mp4"
         #translation.text
         trans=translation.text
-    myobj = gTTS(text=trans, lang=lang, slow=False)
-    myobj.save("audio.wav")
     # loading audio file
     audioclip = AudioFileClip("audio.wav")
     # adding audio to the video clip
     new_audioclip = CompositeAudioClip([audioclip])
     videoclip.audio = new_audioclip
     new_video="video_translated_"+lang+".mp4"
     # Return back to main directory
     os.chdir(home_dir)
     print('Final directory',os.getcwd())
@@ -319,24 +319,31 @@ def video_to_translate(url,initial_language,final_language):
     return new_video
-initial_language = gr.Dropdown(["English", "Italian", "Japanese", "Russian", "Spanish", "German"], label="Initial Language")
-final_language = gr.Dropdown(["Russian", "Italian", "Spanish", "German", "English", "Japanese"], label="Final Language")
-url = gr.Textbox(label="Enter the YouTube URL below:")
-gr.Interface(
-    fn=video_to_translate,
-    inputs=[url, initial_language, final_language],
-    outputs='video',
-    #verbose=True, # Removed verbose as it's no longer a valid parameter
-    title='Video Youtube Translator',
-    description='A simple application that translates Youtube small videos from English, Italian, Japanese, Russian, Spanish, and German to Italian, Spanish, Russian, English, and Japanese. Wait one minute to process.',
-    article='''<div>
-        <p style="text-align: center">All you need to do is paste the Youtube link and hit submit, then wait for compiling. After that, click on Play/Pause for listening to the video. The video is saved in an mp4 format.
-        The video length limit is 10 minutes. For more information, visit <a href="https://ruslanmv.com/">ruslanmv.com</a>
-        </p>
-    </div>''',
-    examples=[
-        ["https://www.youtube.com/watch?v=uLVRZE8OAI4", "English", "Spanish"],
-    ]
-).launch()

 # importing all necessary libraries
 import httpcore
+setattr(httpcore, 'SyncHTTPTransport', Any)
 import pathlib
 import sys, os
 from gtts import gTTS
 def validate_youtube(url):
     #This creates a youtube object
     try:
+        yt = YouTube(url)
     except Exception:
         print("Hi there URL seems invalid")
         return True
     #This will return the length of the video in sec as an int
     video_length = yt.length
+    if    video_length > 600:
         print("Your video is larger than 10 minutes")
         return True
     else:
         print("Hi there URL seems invalid ")
         return True
     else:
+        return False
 def cleanup():
     junks = []
     for files in types:
         junks.extend(glob.glob(files))
+    try:
         # Deleting those files
         for junk in junks:
             print("Deleting",junk)
             # Setting the path for the file to delete
             file = pathlib.Path(junk)
             # Calling the unlink method on the path
+            file.unlink()
     except Exception:
+        print("I cannot delete the file because it is being used by another process")
 def getSize(filename):
     st = os.stat(filename)
     script = ""
     for text in transcript_list:
         t = text["text"]
+        if( (t != '[music]')  and  \
+            (t != '[Music]')  and  \
+            (t != '[музыка]') and  \
+            (t != '[Музыка]') and  \
+            (t != '[musik]')  and  \
+            (t != '[Musik]')  and  \
+            (t != '[musica]') and  \
+            (t != '[Musica]') and  \
+            (t != '[música]') and  \
+            (t != '[Música]') and  \
             (t != '[音楽]')   and \
+            (t != '[音乐]')
+          ) :
             script += t + " "
     return script
 def get_transcript(url,desired_language):
     id_you= url[url.index("=")+1:]
+    try:
         # retrieve the available transcripts
         transcript_list = YouTubeTranscriptApi.list_transcripts(id_you)
     except Exception:
         print('TranscriptsDisabled:')
         is_translated = False
+        return " ", " ", is_translated
     lista=[]
     transcript_translation_languages=[]
         transcript.is_generated,
         transcript.is_translatable,
         transcript_translation_languages.append(transcript.translation_languages),
+                     ])
     print(lista)
     n_size=int(len(lista)/4)
     print("There are {} avialable scripts".format(n_size))
     matrix=matrix.tolist()
     is_manually=False
     is_automatic=False
+    for lista in matrix:
         #print(lista)
         language_code=lista[0]
         is_generated=lista[1]
         is_translatable=lista[2]
+        if not is_generated and is_translatable :
             print("Script found manually generated")
             is_manually=True
             language_code_man=language_code
             print("Script found automatic generated")
             is_automatic=True
             language_code_au=language_code
     if  is_manually:
         # we try filter for manually created transcripts
         print('We extract manually created transcripts')
+        transcript = transcript_list.find_manually_created_transcript([language_code])
     elif is_automatic:
         print('We  extract generated transcript')
         # or automatically generated ones, but not translated
                 transcript_translated=transcript_translated.fetch()
                 translated=clean_transcript(transcript_translated)
                 is_translated = True
+    script_translated = ""
     if is_translated :
         script_translated = translated
     transcript=transcript.fetch()
     script = clean_transcript(transcript)
     return script, script_translated, is_translated
 # Set environment variables
     elif final_language == "Vietnamese":
         lang='vi'
     elif final_language == "Japanese":
+        lang='ja'
     # Initial directory
     home_dir= os.getenv('home_dir')
     print('Initial directory:',home_dir)
                     text=text+text_chunk+" "
                 text=str(text)
                 print(type(text))
             else:
                 try:
                         text = r.recognize_google(audio_data, language = lang_in)
                 except Exception:
+                        print("This video cannot be recognized")
+                        cleanup()
+                        return "./demo/tryagain.mp4"
         #print(text)
         print("Destination language ",lang)
             print("This text cannot be translated")
             cleanup()
             return "./demo/tryagain.mp4"
         #translation.text
         trans=translation.text
+    myobj = gTTS(text=trans, lang=lang, slow=False)
+    myobj.save("audio.wav")
     # loading audio file
     audioclip = AudioFileClip("audio.wav")
     # adding audio to the video clip
     new_audioclip = CompositeAudioClip([audioclip])
     videoclip.audio = new_audioclip
     new_video="video_translated_"+lang+".mp4"
     # Return back to main directory
     os.chdir(home_dir)
     print('Final directory',os.getcwd())
     return new_video
+initial_language = gr.inputs.Dropdown(["English","Italian","Japanese","Russian","Spanish","German"])
+final_language = gr.inputs.Dropdown([ "Russian","Italian","Spanish","German","English","Japanese"])
+url =gr.inputs.Textbox(label = "Enter the YouTube URL below:")
+gr.Interface(fn = video_to_translate,
+            inputs = [url,initial_language,final_language],
+            outputs = 'video',
+            verbose = True,
+            title = 'Video Youtube Translator',
+            description = 'A simple application that translates Youtube small videos from English, Italian, Japanese, Russian, Spanish, and German  to  Italian, Spanish, Russian, English and Japanese.  Wait one minute to process.',
+            article =
+                        '''<div>
+                            <p style="text-align: center"> All you need to do is to paste the Youtube link and hit submit,, then wait for compiling. After that click on Play/Pause for listing to the video. The video is saved in an mp4 format.
+                            The lenght video limit is 10 minutes. For more information visit <a href="https://ruslanmv.com/">ruslanmv.com</a>
+                            </p>
+                        </div>''',
+           examples = [
+                        ["https://www.youtube.com/watch?v=uLVRZE8OAI4", "English","Spanish"],
+                        ["https://www.youtube.com/watch?v=fkGCLIQx1MI", "English","Russian"],
+                        ["https://www.youtube.com/watch?v=6Q6hFtitthQ", "Italian","English"],
+                        ["https://www.youtube.com/watch?v=s5XvjAC7ai8", "Russian","English"],
+                        ["https://www.youtube.com/watch?v=qzzweIQoIOU", "Japanese","English"],
+                        ["https://www.youtube.com/watch?v=nOGZvu6tJFE", "German","Spanish"]
+                        ]
+            ).launch()