Spaces:

StarPigeon
/

ViDove

Sleeping

Eason Lu committed on Mar 21, 2023

Commit

97dba4f

1 Parent(s): 164a372

modify script split

Former-commit-id: 799cf8f91e4b3e0bac38800b8ef89760b5630cf4

Files changed (2) hide show

.gitignore CHANGED Viewed

@@ -1,3 +1,4 @@
 /downloads
 /results
-.DS_Store

 /downloads
 /results
+.DS_Store
+/__pycache__

pipeline.py CHANGED Viewed

@@ -2,9 +2,7 @@ import openai
 from pytube import YouTube
 import argparse
 import os
-import io
 import whisper
-import ffmpeg
 from tqdm import tqdm
 parser = argparse.ArgumentParser()
@@ -66,14 +64,12 @@ if args.link is not None and args.video_file is None:
         exit()
     video_path = f'{DOWNLOAD_PATH}/video/{video.default_filename}'
-    # video_file = open(video_path, "rb")
     audio_path = '{}/audio/{}'.format(DOWNLOAD_PATH, audio.default_filename)
     audio_file = open(audio_path, "rb")
     if VIDEO_NAME == 'placeholder':
         VIDEO_NAME = audio.default_filename.split('.')[0]
 elif args.video_file is not None:
     # Read from local
-    # video_file = open(args.video_file, "rb")
     video_path = args.video_file
     if args.audio_file is not None:
         audio_file= open(args.audio_file, "rb")
@@ -120,8 +116,8 @@ if not args.only_srt:
     print('ASS subtitle saved as: ' + assSub_en)
 # Split the video script by sentences and create chunks within the token limit
-n_threshold = 1500  # Token limit for the GPT-3 model
-script_split = script_input.split('.')
 script_arr = []
 script = ""

 from pytube import YouTube
 import argparse
 import os
 import whisper
 from tqdm import tqdm
 parser = argparse.ArgumentParser()
         exit()
     video_path = f'{DOWNLOAD_PATH}/video/{video.default_filename}'
     audio_path = '{}/audio/{}'.format(DOWNLOAD_PATH, audio.default_filename)
     audio_file = open(audio_path, "rb")
     if VIDEO_NAME == 'placeholder':
         VIDEO_NAME = audio.default_filename.split('.')[0]
 elif args.video_file is not None:
     # Read from local
     video_path = args.video_file
     if args.audio_file is not None:
         audio_file= open(args.audio_file, "rb")
     print('ASS subtitle saved as: ' + assSub_en)
 # Split the video script by sentences and create chunks within the token limit
+n_threshold = 1000  # Token limit for the GPT-3 model
+script_split = script_input.split('\n')
 script_arr = []
 script = ""