Spaces:

Justtalk
/

JusTalk

Running

App Files Files Community

A-yum1 committed on Mar 21

Commit

82c048e

1 Parent(s): f514ea6

Update transcription.py

Browse files

Files changed (1) hide show

transcription.py +48 -2

transcription.py CHANGED Viewed

@@ -1,5 +1,6 @@
 import os
 from faster_whisper import WhisperModel
 class TranscriptionMaker():
     #書き起こしファイルを吐き出すディレクトリを指定
@@ -14,8 +15,10 @@ class TranscriptionMaker():
             raise
     #音声ファイルのディレクトリを受け取り、書き起こしファイルを作成する
-    def create_transcription(self,audio_directory):
         results = []
         #ディレクトリ内のファイルを全て取得
         if not os.path.isdir(audio_directory):
             raise ValueError(f"The specified path is not a valid directory: {audio_directory}")
@@ -44,4 +47,47 @@ class TranscriptionMaker():
         except OSError as e:
             print(f"Error writing transcription file: {e}")
             raise
-        return output_file

 import os
 from faster_whisper import WhisperModel
+from pydub import AudioSegment
 class TranscriptionMaker():
     #書き起こしファイルを吐き出すディレクトリを指定
             raise
     #音声ファイルのディレクトリを受け取り、書き起こしファイルを作成する
+    def create_transcription(self,segments_directory):
         results = []
+        #細切れ音声をくっつける
+        audio_directory = self.merge_segments(segments_directory)
         #ディレクトリ内のファイルを全て取得
         if not os.path.isdir(audio_directory):
             raise ValueError(f"The specified path is not a valid directory: {audio_directory}")
         except OSError as e:
             print(f"Error writing transcription file: {e}")
             raise
+        return output_file
+    #ファイル名が連続しているならくっつける
+    def merge_segments(self,segments_dir,output_dir = "/tmp/data/merged_audio"):
+        if not os.path.exists(output_dir):
+            os.makedirs(output_dir, exist_ok=True)
+        files = sorted([f for f in os.listdir(segments_dir) if f.endswith('.wav')])
+        merged_files = []
+        current_group = []
+        previous_index = None
+        for file in files:
+            # ファイル名から番号を抽出（例: "0.wav" -> 0）
+            file_index = int(file.split('.')[0])
+            # 番号が連続していない場合、新しいグループを作成
+            if previous_index is not None and file_index != previous_index + 1:
+                # 現在のグループを結合して保存
+                if current_group:
+                    merged_files.append(current_group)
+                current_group = []
+            # 現在のファイルをグループに追加
+            current_group.append(file)
+            previous_index = file_index
+        # 最後のグループを追加
+        if current_group:
+            merged_files.append(current_group)
+        # グループごとに結合して保存
+        for i, group in enumerate(merged_files):
+            combined_audio = AudioSegment.empty()
+            for file in group:
+                file_path = os.path.join(segments_dir, file)
+                segment = AudioSegment.from_file(file_path)
+                combined_audio += segment
+            # 出力ファイル名を設定して保存
+            output_file = os.path.join(output_dir, f'merged_{i}.wav')
+            combined_audio.export(output_file, format='wav')
+        return output_dir