Ngoufack committed on
Commit
233782b
·
1 Parent(s): 4bd07f3

update 2.0

Browse files
Files changed (2) hide show
  1. app.py +8 -8
  2. requirements.txt +2 -1
app.py CHANGED
@@ -12,7 +12,7 @@ import os
12
  MODEL_NAME = "openai/whisper-medium"
13
  BATCH_SIZE = 8
14
  FILE_LIMIT_MB = 1000
15
- YT_LENGTH_LIMIT_S = 3600 # limit to 1 hour YouTube files
16
 
17
  device = 0 if torch.cuda.is_available() else "cpu"
18
 
@@ -115,11 +115,11 @@ file_transcribe = gr.Interface(
115
  gr.Radio(["transcribe", "translate"], label="Task", value="transcribe"),
116
  ],
117
  outputs="text",
118
- title="Whisper Large V3: Transcribe Audio",
119
  description=(
120
- "Transcribe long-form microphone or audio inputs with the click of a button! Demo uses the"
121
- f" checkpoint [{MODEL_NAME}](https://huggingface.co/{MODEL_NAME}) and 🤗 Transformers to transcribe audio files"
122
- " of arbitrary length."
123
  ),
124
  allow_flagging="never",
125
  )
@@ -131,10 +131,10 @@ yt_transcribe = gr.Interface(
131
  gr.Radio(["transcribe", "translate"], label="Task", value="transcribe")
132
  ],
133
  outputs=["html", "text"],
134
- title="Whisper Large V3: Transcribe YouTube",
135
  description=(
136
- "Transcribe long-form YouTube videos with the click of a button! Demo uses the checkpoint"
137
- f" [{MODEL_NAME}](https://huggingface.co/{MODEL_NAME}) and 🤗 Transformers to transcribe video files of"
138
  " arbitrary length."
139
  ),
140
  allow_flagging="never",
 
12
  MODEL_NAME = "openai/whisper-medium"
13
  BATCH_SIZE = 8
14
  FILE_LIMIT_MB = 1000
15
+ YT_LENGTH_LIMIT_S = 600 # limit YouTube files to 10 minutes
16
 
17
  device = 0 if torch.cuda.is_available() else "cpu"
18
 
 
115
  gr.Radio(["transcribe", "translate"], label="Task", value="transcribe"),
116
  ],
117
  outputs="text",
118
+ title="Verbalens Project: Demo 1 prototype",
119
  description=(
120
+ "Transcribe long-form videos with the click of a button! Demo uses the checkpoint"
121
+ f" [{MODEL_NAME}](https://huggingface.co/{MODEL_NAME}), Nemo Diarization and Transformers to transcribe video files of"
122
+ " arbitrary length."
123
  ),
124
  allow_flagging="never",
125
  )
 
131
  gr.Radio(["transcribe", "translate"], label="Task", value="transcribe")
132
  ],
133
  outputs=["html", "text"],
134
+ title="Verbalens Project: Demo 1 prototype",
135
  description=(
136
+ "Transcribe long-form videos with the click of a button! Demo uses the checkpoint"
137
+ f" [{MODEL_NAME}](https://huggingface.co/{MODEL_NAME}), Nemo Diarization and Transformers to transcribe video files of"
138
  " arbitrary length."
139
  ),
140
  allow_flagging="never",
requirements.txt CHANGED
@@ -2,4 +2,5 @@ transformers
2
  yt-dlp
3
  torch
4
  torchvision
5
- torchaudio
 
 
2
  yt-dlp
3
  torch
4
  torchvision
5
+ torchaudio
6
+ nemo_toolkit