9f7215ccd7cb4c185eb4fac86e4d56da03631027e58e2bf4ed1b9ebafab18c8e
Browse files
- config.json +5 -4
- generation_config.json +2 -1
- trainer_state.json +0 -0
- training_args.bin +2 -2
config.json
CHANGED
@@ -9,7 +9,7 @@
|
|
9 |
"eos_token_id": 2,
|
10 |
"hidden_act": "silu",
|
11 |
"hidden_size": 4096,
|
12 |
-
"image_aspect_ratio": "
|
13 |
"image_crop_resolution": null,
|
14 |
"image_grid_pinpoints": null,
|
15 |
"image_split_resolution": null,
|
@@ -28,7 +28,7 @@
|
|
28 |
"mm_vision_select_layer": -2,
|
29 |
"mm_vision_tower": "openai/clip-vit-large-patch14-336",
|
30 |
"mm_vision_tower_lr": 2e-06,
|
31 |
-
"model_type": "
|
32 |
"num_attention_heads": 32,
|
33 |
"num_hidden_layers": 32,
|
34 |
"num_key_value_heads": 32,
|
@@ -41,9 +41,10 @@
|
|
41 |
"tokenizer_model_max_length": 4096,
|
42 |
"tokenizer_padding_side": "right",
|
43 |
"torch_dtype": "bfloat16",
|
44 |
-
"transformers_version": "4.
|
45 |
"use_cache": true,
|
46 |
"use_mm_proj": true,
|
47 |
"vision_tower_pretrained": null,
|
48 |
-
"vocab_size": 32000
|
|
|
49 |
}
|
|
|
9 |
"eos_token_id": 2,
|
10 |
"hidden_act": "silu",
|
11 |
"hidden_size": 4096,
|
12 |
+
"image_aspect_ratio": "resize",
|
13 |
"image_crop_resolution": null,
|
14 |
"image_grid_pinpoints": null,
|
15 |
"image_split_resolution": null,
|
|
|
28 |
"mm_vision_select_layer": -2,
|
29 |
"mm_vision_tower": "openai/clip-vit-large-patch14-336",
|
30 |
"mm_vision_tower_lr": 2e-06,
|
31 |
+
"model_type": "llava_llama",
|
32 |
"num_attention_heads": 32,
|
33 |
"num_hidden_layers": 32,
|
34 |
"num_key_value_heads": 32,
|
|
|
41 |
"tokenizer_model_max_length": 4096,
|
42 |
"tokenizer_padding_side": "right",
|
43 |
"torch_dtype": "bfloat16",
|
44 |
+
"transformers_version": "4.40.0.dev0",
|
45 |
"use_cache": true,
|
46 |
"use_mm_proj": true,
|
47 |
"vision_tower_pretrained": null,
|
48 |
+
"vocab_size": 32000,
|
49 |
+
"s2": true
|
50 |
}
|
generation_config.json
CHANGED
@@ -1,9 +1,10 @@
|
|
1 |
{
|
|
|
2 |
"bos_token_id": 1,
|
3 |
"eos_token_id": 2,
|
4 |
"max_length": 4096,
|
5 |
"pad_token_id": 0,
|
6 |
"temperature": 0.9,
|
7 |
"top_p": 0.6,
|
8 |
-
"transformers_version": "4.
|
9 |
}
|
|
|
1 |
{
|
2 |
+
"attn_implementation": "flash_attention_2",
|
3 |
"bos_token_id": 1,
|
4 |
"eos_token_id": 2,
|
5 |
"max_length": 4096,
|
6 |
"pad_token_id": 0,
|
7 |
"temperature": 0.9,
|
8 |
"top_p": 0.6,
|
9 |
+
"transformers_version": "4.40.0.dev0"
|
10 |
}
|
trainer_state.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c98a00b5dd88431b27304126692f44fcac408310ecc11cea928cd126156b36f
|
3 |
+
size 7544
|