lym0302 committed on
Commit
3577d8a
·
1 Parent(s): dcf3642

mm_audio_tower

Browse files
third_party/VideoLLaMA2/videollama2/model/__init__.py CHANGED
@@ -52,6 +52,10 @@ VLLMConfigs = {
52
 
53
 
54
  def load_pretrained_model(model_path, model_base, model_name, load_8bit=False, load_4bit=False, device_map="auto", device="cuda", use_flash_attn=False, **kwargs):
 
 
 
 
55
  if 'token' in kwargs:
56
  token = kwargs['token']
57
  else:
@@ -205,4 +209,8 @@ def load_pretrained_model(model_path, model_base, model_name, load_8bit=False, l
205
  else:
206
  context_len = 2048
207
 
 
 
 
 
208
  return tokenizer, model, processor, context_len
 
52
 
53
 
54
  def load_pretrained_model(model_path, model_base, model_name, load_8bit=False, load_4bit=False, device_map="auto", device="cuda", use_flash_attn=False, **kwargs):
55
+ if hasattr(model.config, "mm_audio_tower"):
56
+ nname = model.config.mm_audio_tower.split("/")[-1]
57
+ model.config.mm_audio_tower = os.path.join(model_path, nname)
58
+
59
  if 'token' in kwargs:
60
  token = kwargs['token']
61
  else:
 
209
  else:
210
  context_len = 2048
211
 
212
+
213
+
214
+
215
+
216
  return tokenizer, model, processor, context_len