Spaces:

Artificial-superintelligence
/

Aita

Running

App Files Files Community

Artificial-superintelligence committed on Nov 12, 2024

Commit

cc01dfc

verified ·

1 Parent(s): aaf4dac

Update app.py

Browse files

Files changed (1) hide show

app.py +57 -29

app.py CHANGED Viewed

@@ -12,6 +12,27 @@ from indic_transliteration import sanscript
 from indic_transliteration.sanscript import transliterate
 import azure.cognitiveservices.speech as speechsdk
 import ffmpeg
 # Tamil-specific voice configurations
 TAMIL_VOICES = {
@@ -25,7 +46,6 @@ class TamilTextProcessor:
     @staticmethod
     def normalize_tamil_text(text):
         """Normalize Tamil text for better pronunciation"""
-        # Convert Tamil numerals to English numerals
         tamil_numerals = {'௦': '0', '௧': '1', '௨': '2', '௩': '3', '௪': '4',
                          '௫': '5', '௬': '6', '௭': '7', '௮': '8', '௯': '9'}
         for tamil_num, eng_num in tamil_numerals.items():
@@ -35,9 +55,7 @@ class TamilTextProcessor:
     @staticmethod
     def process_for_tts(text):
         """Process Tamil text for TTS"""
-        # Remove any unsupported characters
         text = ''.join(char for char in text if ord(char) < 65535)
-        # Normalize whitespace
         text = ' '.join(text.split())
         return text
@@ -75,11 +93,8 @@ class TamilDubber:
             video = VideoFileClip(video_path)
             audio_path = self.create_temp_file(".wav")
             video.audio.write_audiofile(audio_path)
-            # Transcribe using Whisper
             result = self.whisper_model.transcribe(audio_path)
             return result["segments"], video.duration
         except Exception as e:
             st.error(f"Error in audio extraction: {e}")
             raise
@@ -103,7 +118,6 @@ class TamilDubber:
                 })
             except Exception as e:
                 st.warning(f"Translation warning for segment: {str(e)}")
-                # Keep original text if translation fails
                 translated_segments.append({
                     "text": segment["text"],
                     "start": segment["start"],
@@ -138,7 +152,27 @@ class TamilDubber:
             st.error(f"Error creating subtitles: {e}")
             raise
 def main():
     st.title("Tamil Movie Dubbing System")
     st.sidebar.header("டப்பிங் அமைப்புகள்")  # Dubbing Settings in Tamil
@@ -182,7 +216,6 @@ def main():
                     status_text.text("Generating Tamil audio...")
                     output_segments = []
                     video = VideoFileClip(temp_video_path)
-                    final_audio_path = dubber.create_temp_file(".mp3")
                     for idx, segment in enumerate(translated_segments):
                         audio_path = dubber.generate_audio(segment["text"])
@@ -193,44 +226,39 @@ def main():
                         })
                         progress_bar.progress(0.50 + (0.25 * (idx + 1) / len(translated_segments)))
-                    # Generate subtitles if requested
-                    if generate_subtitles:
-                        subtitle_path = dubber.create_temp_file(".srt")
-                        dubber.create_subtitles(translated_segments, subtitle_path)
                     # Create final video
                     status_text.text("Creating final video...")
                     output_path = dubber.create_temp_file(".mp4")
                     # Add subtitles if enabled
                     if generate_subtitles:
-                        def create_subtitle_clip(txt):
-                            return TextClip(
-                                txt=txt,
-                                fontsize=subtitle_size,
-                                color=subtitle_color,
-                                stroke_color='black',
-                                stroke_width=1
-                            )
                         subtitle_clips = []
                         for segment in translated_segments:
-                            clip = create_subtitle_clip(segment["text"])
-                            clip = clip.set_position(('center', 'bottom'))
-                            clip = clip.set_start(segment["start"])
-                            clip = clip.set_duration(segment["duration"])
-                            subtitle_clips.append(clip)
                         final_video = CompositeVideoClip([video] + subtitle_clips)
                     else:
                         final_video = video
-                    # Write final video
                     final_video.write_videofile(
                         output_path,
                         codec='libx264',
                         audio_codec='aac',
-                        fps=video.fps
                     )
                     progress_bar.progress(1.0)

 from indic_transliteration.sanscript import transliterate
 import azure.cognitiveservices.speech as speechsdk
 import ffmpeg
+from PIL import Image
+import imageio
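+# Fetch the ffmpeg binary via imageio at import time (NOTE(review): this helper is deprecated in newer imageio releases; confirm against the pinned version)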
+imageio.plugins.ffmpeg.download()
+# Relax the ImageMagick policy entry for the "@*" pattern so text operations are permitted
+def configure_imagemagick():
+    """Configure ImageMagick policy to allow text operations"""
+    policy_file = "/etc/ImageMagick-6/policy.xml"
+    if os.path.exists(policy_file):
+        try:
+            with open(policy_file, 'r') as f:
+                policy_content = f.read()
+            # Switch the "@*" pattern entry from rights="none" to rights="read|write"; text is unchanged if that entry is absent (the file is still rewritten)
+            policy_content = policy_content.replace('rights="none" pattern="@*"', 'rights="read|write" pattern="@*"')
+            with open(policy_file, 'w') as f:
+                f.write(policy_content)
+        except Exception as e:
+            st.warning(f"Unable to configure ImageMagick policy: {e}")
+            st.info("You may need to run this application with sudo privileges to modify ImageMagick policy")
 # Tamil-specific voice configurations
 TAMIL_VOICES = {
     @staticmethod
     def normalize_tamil_text(text):
         """Normalize Tamil text for better pronunciation"""
         tamil_numerals = {'௦': '0', '௧': '1', '௨': '2', '௩': '3', '௪': '4',
                          '௫': '5', '௬': '6', '௭': '7', '௮': '8', '௯': '9'}
         for tamil_num, eng_num in tamil_numerals.items():
     @staticmethod
     def process_for_tts(text):
         """Prepare text for speech synthesis.

         Drops every character whose code point is 65535 or higher, then
         collapses each run of whitespace into a single space and trims
         both ends of the result.
         """
         kept_chars = [ch for ch in text if ord(ch) < 65535]
         words = ''.join(kept_chars).split()
         return ' '.join(words)
             video = VideoFileClip(video_path)
             audio_path = self.create_temp_file(".wav")
             video.audio.write_audiofile(audio_path)
             result = self.whisper_model.transcribe(audio_path)
             return result["segments"], video.duration
         except Exception as e:
             st.error(f"Error in audio extraction: {e}")
             raise
                 })
             except Exception as e:
                 st.warning(f"Translation warning for segment: {str(e)}")
                 translated_segments.append({
                     "text": segment["text"],
                     "start": segment["start"],
             st.error(f"Error creating subtitles: {e}")
             raise
+    def create_subtitle_clip(self, txt, size, color):
+        """Create subtitle clip with proper configuration"""
+        try:
+            return TextClip(
+                txt=txt,
+                font='DejaVu-Sans',  # NOTE(review): confirm this font actually provides Tamil glyphs on the target system
+                fontsize=size,
+                color=color,
+                stroke_color='black',
+                stroke_width=1,
+                method='caption',  # 'caption' instead of 'label'; presumably so text wraps within `size` (verify against MoviePy docs)
+                size=(720, None)  # Width fixed at 720; height passed as None
+            )
+        except Exception as e:
+            st.error(f"Error creating subtitle clip: {e}")
+            raise
 def main():
+    # Configure ImageMagick at startup
+    configure_imagemagick()
     st.title("Tamil Movie Dubbing System")
     st.sidebar.header("டப்பிங் அமைப்புகள்")  # Dubbing Settings in Tamil
                     status_text.text("Generating Tamil audio...")
                     output_segments = []
                     video = VideoFileClip(temp_video_path)
                     for idx, segment in enumerate(translated_segments):
                         audio_path = dubber.generate_audio(segment["text"])
                         })
                         progress_bar.progress(0.50 + (0.25 * (idx + 1) / len(translated_segments)))
                     # Create final video
                     status_text.text("Creating final video...")
                     output_path = dubber.create_temp_file(".mp4")
                     # Add subtitles if enabled
                     if generate_subtitles:
                         subtitle_clips = []
                         for segment in translated_segments:
+                            try:
+                                clip = dubber.create_subtitle_clip(
+                                    segment["text"],
+                                    subtitle_size,
+                                    subtitle_color
+                                )
+                                clip = clip.set_position(('center', 'bottom'))
+                                clip = clip.set_start(segment["start"])
+                                clip = clip.set_duration(segment["duration"])
+                                subtitle_clips.append(clip)
+                            except Exception as e:
+                                st.warning(f"Skipping subtitle for segment due to error: {e}")
                         final_video = CompositeVideoClip([video] + subtitle_clips)
                     else:
                         final_video = video
+                    # Write final video with proper codec settings
                     final_video.write_videofile(
                         output_path,
                         codec='libx264',
                         audio_codec='aac',
+                        fps=video.fps,
+                        threads=4,
+                        preset='medium'
                     )
                     progress_bar.progress(1.0)