Spaces:
Runtime error
Runtime error
Commit
·
c1df16f
1
Parent(s):
ddfe2b4
Update dataset/transcript_dataset.py
Browse files
dataset/transcript_dataset.py
CHANGED
@@ -10,6 +10,7 @@ from dataset.hf_dataset import HFDataset
|
|
10 |
class TranscriptDataset(HFDataset):
|
11 |
|
12 |
def __init__(self, name) -> None:
|
|
|
13 |
super().__init__(name)
|
14 |
|
15 |
def generate_dataset(self, input, download_path, overwrite, whisper_config):
|
@@ -25,7 +26,7 @@ class TranscriptDataset(HFDataset):
|
|
25 |
#emptyDataset=self.dataset["train"].filter(lambda e: e["id"] is None)
|
26 |
emptyDataset=self.dataset["train"]
|
27 |
whisper_config["number_videos"] = 5
|
28 |
-
whisperPP = WhisperPP(emptyDataset, **whisper_config)
|
29 |
downloader = YoutubeDownloader(download_path)
|
30 |
if not overwrite:
|
31 |
downloader.config["download_archive"] = os.path.join(download_path,"video_record.txt")
|
|
|
10 |
class TranscriptDataset(HFDataset):
|
11 |
|
12 |
def __init__(self, name) -> None:
|
13 |
+
self.name = name
|
14 |
super().__init__(name)
|
15 |
|
16 |
def generate_dataset(self, input, download_path, overwrite, whisper_config):
|
|
|
26 |
#emptyDataset=self.dataset["train"].filter(lambda e: e["id"] is None)
|
27 |
emptyDataset=self.dataset["train"]
|
28 |
whisper_config["number_videos"] = 5
|
29 |
+
whisperPP = WhisperPP(emptyDataset, self.name, **whisper_config)
|
30 |
downloader = YoutubeDownloader(download_path)
|
31 |
if not overwrite:
|
32 |
downloader.config["download_archive"] = os.path.join(download_path,"video_record.txt")
|