czczup committed on
Commit
370186d
·
verified ·
1 Parent(s): 3ec5736

Update README.md

Browse files
Files changed (2) hide show
  1. README.md +5 -9
  2. config.json +1 -59
README.md CHANGED
@@ -2,10 +2,8 @@
2
  license: mit
3
  pipeline_tag: image-text-to-text
4
  library_name: transformers
5
- base_model:
6
- - OpenGVLab/InternViT-6B-448px-V2_5
7
- - internlm/internlm2_5-20b-chat
8
- base_model_relation: merge
9
  language:
10
  - multilingual
11
  tags:
@@ -82,8 +80,6 @@ If `ImportError` occurs while executing this case, please install the required d
82
 
83
  When dealing with multiple images, you can put them all in one list. Keep in mind that multiple images will lead to a higher number of input tokens, and as a result, the size of the context window typically needs to be increased.
84
 
85
- question = 'Describe this video in detail.'
86
-
87
  ```python
88
  from lmdeploy import pipeline, TurbomindEngineConfig
89
  from lmdeploy.vl import load_image
@@ -147,7 +143,7 @@ print(sess.response.text)
147
  LMDeploy's `api_server` enables models to be easily packed into services with a single command. The provided RESTful APIs are compatible with OpenAI's interfaces. Below is an example of service startup:
148
 
149
  ```shell
150
- lmdeploy serve api_server OpenGVLab/InternVL2_5-26B-AWQ --backend turbomind --server-port 23333 --tp 2
151
  ```
152
 
153
  To use the OpenAI-style interface, you need to install OpenAI:
@@ -186,7 +182,7 @@ print(response)
186
 
187
  ## License
188
 
189
- This project is released under the MIT License. This project uses the pre-trained Qwen2.5-72B-Instruct as a component, which is licensed under the Qwen License.
190
 
191
  ## Citation
192
 
@@ -218,4 +214,4 @@ If you find this project useful in your research, please consider citing:
218
  pages={24185--24198},
219
  year={2024}
220
  }
221
- ```
 
2
  license: mit
3
  pipeline_tag: image-text-to-text
4
  library_name: transformers
5
+ base_model: OpenGVLab/InternVL2_5-26B
6
+ base_model_relation: quantized
 
 
7
  language:
8
  - multilingual
9
  tags:
 
80
 
81
  When dealing with multiple images, you can put them all in one list. Keep in mind that multiple images will lead to a higher number of input tokens, and as a result, the size of the context window typically needs to be increased.
82
 
 
 
83
  ```python
84
  from lmdeploy import pipeline, TurbomindEngineConfig
85
  from lmdeploy.vl import load_image
 
143
  LMDeploy's `api_server` enables models to be easily packed into services with a single command. The provided RESTful APIs are compatible with OpenAI's interfaces. Below is an example of service startup:
144
 
145
  ```shell
146
+ lmdeploy serve api_server OpenGVLab/InternVL2_5-26B-AWQ --server-port 23333 --tp 2
147
  ```
148
 
149
  To use the OpenAI-style interface, you need to install OpenAI:
 
182
 
183
  ## License
184
 
185
+ This project is released under the MIT License. This project uses the pre-trained internlm2_5-20b-chat as a component, which is licensed under the Apache License 2.0.
186
 
187
  ## Citation
188
 
 
214
  pages={24185--24198},
215
  year={2024}
216
  }
217
+ ```
config.json CHANGED
@@ -1,6 +1,5 @@
1
  {
2
- "_commit_hash": "a5d2234c494a87fee81ac05a45e79ef9c8a6b505",
3
- "_name_or_path": "/models/141/huggingface_hub/hub/models--OpenGVLab--InternVL2_5-26B/snapshots/a5d2234c494a87fee81ac05a45e79ef9c8a6b505/",
4
  "architectures": [
5
  "InternVLChatModel"
6
  ],
@@ -119,93 +118,36 @@
119
  "select_layer": -1,
120
  "template": "internvl2_5",
121
  "torch_dtype": "float16",
122
- "transformers_version": null,
123
  "use_backbone_lora": 0,
124
- "use_cache": false,
125
  "use_llm_lora": 0,
126
  "use_thumbnail": true,
127
  "vision_config": {
128
- "_attn_implementation_autoset": true,
129
- "_name_or_path": "",
130
- "add_cross_attention": false,
131
  "architectures": [
132
  "InternVisionModel"
133
  ],
134
  "attention_dropout": 0.0,
135
- "bad_words_ids": null,
136
- "begin_suppress_tokens": null,
137
- "bos_token_id": null,
138
- "chunk_size_feed_forward": 0,
139
- "cross_attention_hidden_size": null,
140
- "decoder_start_token_id": null,
141
- "diversity_penalty": 0.0,
142
- "do_sample": false,
143
  "drop_path_rate": 0.0,
144
  "dropout": 0.0,
145
- "early_stopping": false,
146
- "encoder_no_repeat_ngram_size": 0,
147
- "eos_token_id": null,
148
- "exponential_decay_length_penalty": null,
149
- "finetuning_task": null,
150
- "forced_bos_token_id": null,
151
- "forced_eos_token_id": null,
152
  "hidden_act": "gelu",
153
  "hidden_size": 3200,
154
- "id2label": {
155
- "0": "LABEL_0",
156
- "1": "LABEL_1"
157
- },
158
  "image_size": 448,
159
  "initializer_factor": 0.1,
160
  "initializer_range": 1e-10,
161
  "intermediate_size": 12800,
162
- "is_decoder": false,
163
- "is_encoder_decoder": false,
164
- "label2id": {
165
- "LABEL_0": 0,
166
- "LABEL_1": 1
167
- },
168
  "layer_norm_eps": 1e-06,
169
- "length_penalty": 1.0,
170
- "max_length": 20,
171
- "min_length": 0,
172
  "model_type": "intern_vit_6b",
173
- "no_repeat_ngram_size": 0,
174
  "norm_type": "rms_norm",
175
  "num_attention_heads": 25,
176
- "num_beam_groups": 1,
177
- "num_beams": 1,
178
  "num_channels": 3,
179
  "num_hidden_layers": 45,
180
- "num_return_sequences": 1,
181
  "output_attentions": false,
182
  "output_hidden_states": false,
183
- "output_scores": false,
184
- "pad_token_id": null,
185
  "patch_size": 14,
186
- "prefix": null,
187
- "problem_type": null,
188
- "pruned_heads": {},
189
  "qk_normalization": true,
190
  "qkv_bias": false,
191
- "remove_invalid_values": false,
192
- "repetition_penalty": 1.0,
193
  "return_dict": true,
194
- "return_dict_in_generate": false,
195
- "sep_token_id": null,
196
- "suppress_tokens": null,
197
- "task_specific_params": null,
198
- "temperature": 1.0,
199
- "tf_legacy_loss": false,
200
- "tie_encoder_decoder": false,
201
- "tie_word_embeddings": true,
202
- "tokenizer_class": null,
203
- "top_k": 50,
204
- "top_p": 1.0,
205
  "torch_dtype": "bfloat16",
206
- "torchscript": false,
207
  "transformers_version": "4.47.0",
208
- "typical_p": 1.0,
209
  "use_bfloat16": true,
210
  "use_flash_attn": false
211
  }
 
1
  {
2
+ "_commit_hash": null,
 
3
  "architectures": [
4
  "InternVLChatModel"
5
  ],
 
118
  "select_layer": -1,
119
  "template": "internvl2_5",
120
  "torch_dtype": "float16",
 
121
  "use_backbone_lora": 0,
 
122
  "use_llm_lora": 0,
123
  "use_thumbnail": true,
124
  "vision_config": {
 
 
 
125
  "architectures": [
126
  "InternVisionModel"
127
  ],
128
  "attention_dropout": 0.0,
 
 
 
 
 
 
 
 
129
  "drop_path_rate": 0.0,
130
  "dropout": 0.0,
 
 
 
 
 
 
 
131
  "hidden_act": "gelu",
132
  "hidden_size": 3200,
 
 
 
 
133
  "image_size": 448,
134
  "initializer_factor": 0.1,
135
  "initializer_range": 1e-10,
136
  "intermediate_size": 12800,
 
 
 
 
 
 
137
  "layer_norm_eps": 1e-06,
 
 
 
138
  "model_type": "intern_vit_6b",
 
139
  "norm_type": "rms_norm",
140
  "num_attention_heads": 25,
 
 
141
  "num_channels": 3,
142
  "num_hidden_layers": 45,
 
143
  "output_attentions": false,
144
  "output_hidden_states": false,
 
 
145
  "patch_size": 14,
 
 
 
146
  "qk_normalization": true,
147
  "qkv_bias": false,
 
 
148
  "return_dict": true,
 
 
 
 
 
 
 
 
 
 
 
149
  "torch_dtype": "bfloat16",
 
150
  "transformers_version": "4.47.0",
 
151
  "use_bfloat16": true,
152
  "use_flash_attn": false
153
  }