torch and chunk settings
app.py CHANGED

@@ -5,7 +5,6 @@ from datetime import datetime
 from pathlib import Path
 import tempfile
 import pandas as pd
-import accelerate

 import gradio as gr
 import yt_dlp as youtube_dl
@@ -34,7 +33,8 @@ model = AutoModelForSpeechSeq2Seq.from_pretrained(
     MODEL_NAME,
     use_cache=False,
     device_map="auto",
-    low_cpu_mem_usage=
+    low_cpu_mem_usage=True,
+    attn_implementation="flash_attention_2"
 )

 # Flash Attention setup for memory and speed optimization if supported
@@ -56,7 +56,7 @@ pipe = pipeline(
     model=model,
     tokenizer=tokenizer,
     feature_extractor=feature_extractor,
-    chunk_length_s=
+    chunk_length_s=900,  # Increased to 15 minutes
 )

 def reset_and_update_dataset(new_data):
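For reference, here is a minimal sketch of the model-loading and pipeline setup these hunks produce. The checkpoint name, torch_dtype, the "automatic-speech-recognition" task string, and the separate tokenizer/feature-extractor loading are illustrative assumptions and are not taken from this diff.

import torch
from transformers import (
    AutoFeatureExtractor,
    AutoModelForSpeechSeq2Seq,
    AutoTokenizer,
    pipeline,
)

MODEL_NAME = "openai/whisper-large-v3"  # placeholder checkpoint, not from this diff

# Load the speech seq2seq model with the settings introduced in this commit.
model = AutoModelForSpeechSeq2Seq.from_pretrained(
    MODEL_NAME,
    use_cache=False,
    device_map="auto",
    low_cpu_mem_usage=True,                   # stream weights in instead of a full CPU copy
    attn_implementation="flash_attention_2",  # requires the flash-attn package and a supported GPU
    torch_dtype=torch.float16,                # assumed dtype; FlashAttention-2 needs fp16/bf16
)

tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
feature_extractor = AutoFeatureExtractor.from_pretrained(MODEL_NAME)

pipe = pipeline(
    "automatic-speech-recognition",  # assumed task; the task argument is outside the shown hunks
    model=model,
    tokenizer=tokenizer,
    feature_extractor=feature_extractor,
    chunk_length_s=900,  # 15-minute chunks, per the commit
)

Note that dropping the explicit "import accelerate" does not remove the dependency: device_map="auto" and low_cpu_mem_usage=True still require the accelerate package to be installed; transformers simply imports it internally.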