nb-whisper-demo

Running on T4

versae committed on Oct 1, 2024

Commit

1c4706b

verified ·

1 Parent(s): 5aa1892

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -23,18 +23,18 @@ auth_token = os.environ.get("AUTH_TOKEN") or True
 device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
 print(f"Using device: {device}")
-@spaces.GPU(duration=60)
 def pipe(file, return_timestamps=False):
-    model = WhisperForConditionalGeneration.from_pretrained(MODEL_NAME, torch_dtype=torch.float16, low_cpu_mem_usage=True)
-    model.to(device)
-    processor = WhisperProcessor.from_pretrained(MODEL_NAME)
-    model.forward = torch.compile(model.forward, mode="reduce-overhead", fullgraph=True)
-    model.generation_config.cache_implementation = "static"
     asr = pipeline(
         task="automatic-speech-recognition",
-        model=model,
-        tokenizer=AutoTokenizer.from_pretrained(MODEL_NAME),
-        feature_extractor=AutoFeatureExtractor.from_pretrained(MODEL_NAME),
         chunk_length_s=30,
         device=device,
         token=auth_token,

 device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
 print(f"Using device: {device}")
+@spaces.GPU(duration=60 * 2)
 def pipe(file, return_timestamps=False):
+    # model = WhisperForConditionalGeneration.from_pretrained(MODEL_NAME, torch_dtype=torch.float16, low_cpu_mem_usage=True)
+    # model.to(device)
+    # processor = WhisperProcessor.from_pretrained(MODEL_NAME)
+    # model.forward = torch.compile(model.forward, mode="reduce-overhead", fullgraph=True)
+    # model.generation_config.cache_implementation = "static"
     asr = pipeline(
         task="automatic-speech-recognition",
+        model=MODEL_NAME,
+        # tokenizer=AutoTokenizer.from_pretrained(MODEL_NAME),
+        # feature_extractor=AutoFeatureExtractor.from_pretrained(MODEL_NAME),
         chunk_length_s=30,
         device=device,
         token=auth_token,