Spaces:

Justtalk
/

JusTalk

Running

App Files Community

A-yum1 committed on Mar 29

Commit

64a73ca

1 Parent(s): d8bbfec

Update app.py

Browse files

Files changed (3) hide show

__pycache__/process.cpython-310.pyc +0 -0
app.py +1 -1
process.py +10 -3

__pycache__/process.cpython-310.pyc CHANGED Viewed

Binary files a/__pycache__/process.cpython-310.pyc and b/__pycache__/process.cpython-310.pyc differ

app.py CHANGED Viewed

@@ -335,7 +335,7 @@ def upload_audio():
             user_rates = {users[i]: rates[i] for i in range(len(users))}
             return jsonify({"rates": rates, "user_rates": user_rates}), 200
         else:
-            matched_time, unmatched_time, merged_segments = process.process_audio(reference_paths[0], audio_path, threshold=0.05)
             total_audio = transcripter.save_marged_segments(merged_segments)
             print("単一ユーザーの処理")
             total_time = matched_time + unmatched_time

             user_rates = {users[i]: rates[i] for i in range(len(users))}
             return jsonify({"rates": rates, "user_rates": user_rates}), 200
         else:
+            matched_time, unmatched_time, merged_segments = process.process_audio(reference_paths[0], audio_path, users[0], threshold=0.05)
             total_audio = transcripter.save_marged_segments(merged_segments)
             print("単一ユーザーの処理")
             total_time = matched_time + unmatched_time

process.py CHANGED Viewed

@@ -245,7 +245,7 @@ class AudioProcessor():
             print(f"類似度計算でエラーが発生しました: {e}")
             return None
-    def process_audio(self, reference_path, input_path, output_folder='/tmp/data/matched_segments', seg_duration=1.0, threshold=0.5):
         """
         入力音声からリファレンス音声に類似したセグメントを抽出する
@@ -259,6 +259,7 @@ class AudioProcessor():
         output_folder (str): 類似セグメントを保存するディレクトリ
         seg_duration (float): セグメントの長さ（秒）
         threshold (float): 類似度の閾値
         Returns:
         tuple: (マッチした時間（ミリ秒）, マッチしなかった時間（ミリ秒）, 分類済みのセグメント)
@@ -311,7 +312,10 @@ class AudioProcessor():
                     # 話者が変わった場合、保存
                     if wasSpeaking != isSpeaking:
                         if current_segment:
-                            merged_segments.append((wasSpeaking, current_segment))
                         wasSpeaking = isSpeaking
                         current_segment = [segment_file]
                     # 変わらなかった場合、結合
@@ -322,7 +326,10 @@ class AudioProcessor():
                     print(f"セグメント {file} の類似度計算でエラーが発生しました: {e}")
             # 余りを保存
             if current_segment:
-                merged_segments.append((wasSpeaking, current_segment))
             unmatched_time_ms = total_duration_ms - matched_time_ms
             return matched_time_ms, unmatched_time_ms, merged_segments

             print(f"類似度計算でエラーが発生しました: {e}")
             return None
+    def process_audio(self, reference_path, input_path, user,output_folder='/tmp/data/matched_segments', seg_duration=1.0, threshold=0.5):
         """
         入力音声からリファレンス音声に類似したセグメントを抽出する
         output_folder (str): 類似セグメントを保存するディレクトリ
         seg_duration (float): セグメントの長さ（秒）
         threshold (float): 類似度の閾値
+        user(str): ユーザー名
         Returns:
         tuple: (マッチした時間（ミリ秒）, マッチしなかった時間（ミリ秒）, 分類済みのセグメント)
                     # 話者が変わった場合、保存
                     if wasSpeaking != isSpeaking:
                         if current_segment:
+                            if wasSpeaking:
+                                merged_segments.append((user, current_segment))
+                            else:
+                                merged_segments.append(("other",current_segment))
                         wasSpeaking = isSpeaking
                         current_segment = [segment_file]
                     # 変わらなかった場合、結合
                     print(f"セグメント {file} の類似度計算でエラーが発生しました: {e}")
             # 余りを保存
             if current_segment:
+                if wasSpeaking:
+                    merged_segments.append((user, current_segment))
+                else:
+                    merged_segments.append(("other",current_segment))
             unmatched_time_ms = total_duration_ms - matched_time_ms
             return matched_time_ms, unmatched_time_ms, merged_segments