Update app.py
Browse files
app.py
CHANGED
@@ -50,68 +50,34 @@ pipe = pipeline(
|
|
50 |
def associate_speakers_with_timestamps(transcription_result, diarization):
|
51 |
word_segments = transcription_result['chunks']
|
52 |
diarization_segments = list(diarization.itertracks(yield_label=True))
|
53 |
-
|
54 |
-
# Pré-calcul des chevauchements
|
55 |
-
overlaps = set()
|
56 |
-
for i in range(1, len(diarization_segments)):
|
57 |
-
if diarization_segments[i-1][0].end > diarization_segments[i][0].start:
|
58 |
-
overlaps.add(diarization_segments[i][0].start)
|
59 |
-
|
60 |
speaker_transcription = []
|
61 |
-
|
62 |
-
|
63 |
-
|
64 |
-
diar_iter = iter(diarization_segments)
|
65 |
-
current_segment, _, current_speaker = next(diar_iter)
|
66 |
|
67 |
for word in word_segments:
|
68 |
-
word_start,
|
69 |
-
|
70 |
-
while word_start >= current_segment.end:
|
71 |
-
if current_text:
|
72 |
-
speaker_transcription.append((current_speaker, ' '.join(current_text)))
|
73 |
-
current_text = []
|
74 |
-
current_segment, _, current_speaker = next(diar_iter, (None, None, None))
|
75 |
-
if current_segment is None:
|
76 |
-
break
|
77 |
-
|
78 |
-
if current_segment is None:
|
79 |
-
break
|
80 |
-
|
81 |
-
if word_start in overlaps:
|
82 |
-
current_text.append(f"[{word['text']}]")
|
83 |
-
else:
|
84 |
-
current_text.append(word['text'])
|
85 |
|
86 |
-
|
87 |
-
|
88 |
|
89 |
-
|
90 |
|
91 |
-
|
92 |
-
|
93 |
-
|
94 |
-
|
95 |
-
|
96 |
-
|
97 |
-
|
98 |
-
|
99 |
-
|
100 |
-
|
101 |
-
if
|
102 |
-
|
103 |
-
return [(speaker, text) for text in merged]
|
104 |
-
|
105 |
-
return [item for group in groupby(speaker_transcription, key=lambda x: x[0]) for item in merge_group(group)]
|
106 |
-
|
107 |
-
def merge_short_segments(speaker_transcription, min_words=3):
|
108 |
-
merged = []
|
109 |
-
for speaker, text in speaker_transcription:
|
110 |
-
if not merged or merged[-1][0] != speaker or len(merged[-1][1].split()) >= min_words:
|
111 |
-
merged.append((speaker, text))
|
112 |
else:
|
113 |
-
|
114 |
-
|
|
|
115 |
|
116 |
def simplify_diarization_output(speaker_transcription):
|
117 |
simplified = []
|
|
|
50 |
def associate_speakers_with_timestamps(transcription_result, diarization):
|
51 |
word_segments = transcription_result['chunks']
|
52 |
diarization_segments = list(diarization.itertracks(yield_label=True))
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
53 |
speaker_transcription = []
|
54 |
+
current_segment_index = 0
|
55 |
+
previous_speaker = None
|
|
|
|
|
|
|
56 |
|
57 |
for word in word_segments:
|
58 |
+
word_start, word_end = word['timestamp']
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
59 |
|
60 |
+
while current_segment_index < len(diarization_segments) - 1 and diarization_segments[current_segment_index][0].end <= word_start:
|
61 |
+
current_segment_index += 1
|
62 |
|
63 |
+
current_segment, _, current_speaker = diarization_segments[current_segment_index]
|
64 |
|
65 |
+
# Vérifier s'il y a un chevauchement avec le segment précédent
|
66 |
+
if current_segment_index > 0:
|
67 |
+
previous_segment, _, previous_speaker = diarization_segments[current_segment_index - 1]
|
68 |
+
if previous_segment.end > word_start and previous_speaker != current_speaker:
|
69 |
+
word_text = f"[{word['text']}]"
|
70 |
+
else:
|
71 |
+
word_text = word['text']
|
72 |
+
else:
|
73 |
+
word_text = word['text']
|
74 |
+
|
75 |
+
if not speaker_transcription or speaker_transcription[-1][0] != current_speaker:
|
76 |
+
speaker_transcription.append((current_speaker, word_text))
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
77 |
else:
|
78 |
+
speaker_transcription[-1] = (current_speaker, speaker_transcription[-1][1] + " " + word_text)
|
79 |
+
|
80 |
+
return speaker_transcription
|
81 |
|
82 |
def simplify_diarization_output(speaker_transcription):
|
83 |
simplified = []
|