ynhe commited on
Commit
969c18f
·
verified ·
1 Parent(s): 0b3873a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -7
app.py CHANGED
@@ -12,24 +12,24 @@ import torch
12
  import gradio as gr
13
  from gradio.themes.utils import colors, fonts, sizes
14
 
15
- from faster_whisper import WhisperModel
16
  from moviepy.editor import VideoFileClip
17
  from transformers import AutoTokenizer, AutoModel
18
 
19
  import subprocess
20
- subprocess.run('pip install flash-attn --no-build-isolation', env={'FLASH_ATTENTION_SKIP_CUDA_BUILD': "TRUE"}, shell=True)
21
 
22
  # ========================================
23
  # Model Initialization
24
  # ========================================
25
 
26
  if gr.NO_RELOAD:
27
- if torch.cuda.is_available():
28
- speech_model = WhisperModel("large-v3", device="cuda", compute_type="float16")
29
- else:
30
- speech_model = WhisperModel("large-v3", device="cpu")
31
 
32
- model_path = 'OpenGVLab/VideoChat-Flash-Qwen2-7B_res448'
33
 
34
  tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True)
35
  model = AutoModel.from_pretrained(model_path, trust_remote_code=True).half().cuda()
 
12
  import gradio as gr
13
  from gradio.themes.utils import colors, fonts, sizes
14
 
15
+ # from faster_whisper import WhisperModel
16
  from moviepy.editor import VideoFileClip
17
  from transformers import AutoTokenizer, AutoModel
18
 
19
  import subprocess
20
+ # subprocess.run('pip install flash-attn --no-build-isolation', env={'FLASH_ATTENTION_SKIP_CUDA_BUILD': "TRUE"}, shell=True)
21
 
22
  # ========================================
23
  # Model Initialization
24
  # ========================================
25
 
26
  if gr.NO_RELOAD:
27
+ # if torch.cuda.is_available():
28
+ # speech_model = WhisperModel("large-v3", device="cuda", compute_type="float16")
29
+ # else:
30
+ # speech_model = WhisperModel("large-v3", device="cpu")
31
 
32
+ model_path = 'OpenGVLab/InternVideo2_5_Chat_8B'
33
 
34
  tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True)
35
  model = AutoModel.from_pretrained(model_path, trust_remote_code=True).half().cuda()