Update modeling_internvideo2.py
Browse files - modeling_internvideo2.py +3 -3
modeling_internvideo2.py
CHANGED
@@ -1066,10 +1066,10 @@ def pretrain_internvideo2_6b_patch14_224(config):
|
|
1066 |
embed_dim=3200, depth=48, num_heads=25, mlp_ratio=4,
|
1067 |
clip_embed_dim=config.vision_encoder.clip_embed_dim,
|
1068 |
attn_pool_num_heads=16, qkv_bias=False,
|
1069 |
-
# drop_path_rate=0.3,
|
1070 |
-
# init_values=0.00001,
|
1071 |
drop_path_rate=0,
|
1072 |
-
init_values=None,
|
|
|
|
|
1073 |
qk_normalization=True,
|
1074 |
use_flash_attn=config.vision_encoder.use_flash_attn,
|
1075 |
use_fused_rmsnorm=config.vision_encoder.use_fused_rmsnorm,
|
|
|
1066 |
embed_dim=3200, depth=48, num_heads=25, mlp_ratio=4,
|
1067 |
clip_embed_dim=config.vision_encoder.clip_embed_dim,
|
1068 |
attn_pool_num_heads=16, qkv_bias=False,
|
|
|
|
|
1069 |
drop_path_rate=0,
|
1070 |
+
init_values=0.00001,
|
1071 |
+
# drop_path_rate=0,
|
1072 |
+
# init_values=None,
|
1073 |
qk_normalization=True,
|
1074 |
use_flash_attn=config.vision_encoder.use_flash_attn,
|
1075 |
use_fused_rmsnorm=config.vision_encoder.use_fused_rmsnorm,
|