snyamson committed on
Commit
28bef83
·
1 Parent(s): 8116686

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +18 -2
app.py CHANGED
@@ -21,6 +21,8 @@ if uploaded_file:
21
  segment_duration = 120 # Segment duration in seconds (2 minutes)
22
  num_segments = len(resampled_waveform[0]) // (segment_duration * 16000)
23
  segment_transcriptions = []
 
 
24
 
25
  # Transcribe each segment
26
  for i in range(num_segments):
@@ -41,7 +43,21 @@ if uploaded_file:
41
  # Combine segment transcriptions into the full transcript
42
  full_transcript = " ".join(segment_transcriptions)
43
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
44
  # Display the transcript
45
  st.header("Transcription")
46
- st.write(full_transcript)
47
- st.write('Hello')
 
21
  segment_duration = 120 # Segment duration in seconds (2 minutes)
22
  num_segments = len(resampled_waveform[0]) // (segment_duration * 16000)
23
  segment_transcriptions = []
24
+ current_speaker = None
25
+ current_paragraph = ""
26
 
27
  # Transcribe each segment
28
  for i in range(num_segments):
 
43
  # Combine segment transcriptions into the full transcript
44
  full_transcript = " ".join(segment_transcriptions)
45
 
46
+ # Separate transcript by speakers and apply paragraphs
47
+ for line in full_transcript.split('. '): # You can adjust the separator depending on your audio content
48
+ if line.endswith((':', 'said')):
49
+ if current_paragraph:
50
+ st.write(f"Speaker: {current_speaker}")
51
+ st.write(current_paragraph + ".")
52
+ current_speaker = line
53
+ current_paragraph = ""
54
+ else:
55
+ current_paragraph += line + ". "
56
+ # Adding the last speaker paragraph
57
+ if current_paragraph:
58
+ st.write(f"Speaker: {current_speaker}")
59
+ st.write(current_paragraph + ".")
60
+
61
  # Display the transcript
62
  st.header("Transcription")
63
+ st.write(full_transcript)