RamAnanth1 committed on
Commit
c1df16f
·
1 Parent(s): ddfe2b4

Update dataset/transcript_dataset.py

Browse files
Files changed (1) hide show
  1. dataset/transcript_dataset.py +2 -1
dataset/transcript_dataset.py CHANGED
@@ -10,6 +10,7 @@ from dataset.hf_dataset import HFDataset
10
  class TranscriptDataset(HFDataset):
11
 
12
  def __init__(self, name) -> None:
 
13
  super().__init__(name)
14
 
15
  def generate_dataset(self, input, download_path, overwrite, whisper_config):
@@ -25,7 +26,7 @@ class TranscriptDataset(HFDataset):
25
  #emptyDataset=self.dataset["train"].filter(lambda e: e["id"] is None)
26
  emptyDataset=self.dataset["train"]
27
  whisper_config["number_videos"] = 5
28
- whisperPP = WhisperPP(emptyDataset, **whisper_config)
29
  downloader = YoutubeDownloader(download_path)
30
  if not overwrite:
31
  downloader.config["download_archive"] = os.path.join(download_path,"video_record.txt")
 
10
  class TranscriptDataset(HFDataset):
11
 
12
  def __init__(self, name) -> None:
13
+ self.name = name
14
  super().__init__(name)
15
 
16
  def generate_dataset(self, input, download_path, overwrite, whisper_config):
 
26
  #emptyDataset=self.dataset["train"].filter(lambda e: e["id"] is None)
27
  emptyDataset=self.dataset["train"]
28
  whisper_config["number_videos"] = 5
29
+ whisperPP = WhisperPP(emptyDataset, self.name, **whisper_config)
30
  downloader = YoutubeDownloader(download_path)
31
  if not overwrite:
32
  downloader.config["download_archive"] = os.path.join(download_path,"video_record.txt")