adityarajkishan committed on
Commit
e92118f
·
verified ·
1 Parent(s): f73020b

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +9 -16
config.json CHANGED
@@ -1,9 +1,11 @@
1
  {
 
2
  "architectures": [
3
  "VisionEncoderDecoderModel"
4
  ],
 
5
  "decoder": {
6
- "_name_or_path": "gpt2",
7
  "activation_function": "gelu_new",
8
  "add_cross_attention": true,
9
  "architectures": [
@@ -11,18 +13,16 @@
11
  ],
12
  "attn_pdrop": 0.1,
13
  "bad_words_ids": null,
14
- "begin_suppress_tokens": null,
15
  "bos_token_id": 50256,
16
  "chunk_size_feed_forward": 0,
17
  "cross_attention_hidden_size": null,
18
- "decoder_start_token_id": null,
19
  "diversity_penalty": 0.0,
20
  "do_sample": false,
21
  "early_stopping": false,
22
  "embd_pdrop": 0.1,
23
  "encoder_no_repeat_ngram_size": 0,
24
  "eos_token_id": 50256,
25
- "exponential_decay_length_penalty": null,
26
  "finetuning_task": null,
27
  "forced_bos_token_id": null,
28
  "forced_eos_token_id": null,
@@ -55,7 +55,7 @@
55
  "output_attentions": false,
56
  "output_hidden_states": false,
57
  "output_scores": false,
58
- "pad_token_id": null,
59
  "prefix": null,
60
  "problem_type": null,
61
  "pruned_heads": {},
@@ -73,7 +73,6 @@
73
  "summary_proj_to_labels": true,
74
  "summary_type": "cls_index",
75
  "summary_use_proj": true,
76
- "suppress_tokens": null,
77
  "task_specific_params": {
78
  "text-generation": {
79
  "do_sample": true,
@@ -81,7 +80,6 @@
81
  }
82
  },
83
  "temperature": 1.0,
84
- "tf_legacy_loss": false,
85
  "tie_encoder_decoder": false,
86
  "tie_word_embeddings": true,
87
  "tokenizer_class": null,
@@ -89,21 +87,20 @@
89
  "top_p": 1.0,
90
  "torch_dtype": null,
91
  "torchscript": false,
92
- "typical_p": 1.0,
93
  "use_bfloat16": false,
94
  "use_cache": true,
95
  "vocab_size": 50257
96
  },
97
  "decoder_start_token_id": 50256,
98
  "encoder": {
99
- "_name_or_path": "google/vit-base-patch16-224-in21k",
100
  "add_cross_attention": false,
101
  "architectures": [
102
  "ViTModel"
103
  ],
104
  "attention_probs_dropout_prob": 0.0,
105
  "bad_words_ids": null,
106
- "begin_suppress_tokens": null,
107
  "bos_token_id": null,
108
  "chunk_size_feed_forward": 0,
109
  "cross_attention_hidden_size": null,
@@ -112,9 +109,7 @@
112
  "do_sample": false,
113
  "early_stopping": false,
114
  "encoder_no_repeat_ngram_size": 0,
115
- "encoder_stride": 16,
116
  "eos_token_id": null,
117
- "exponential_decay_length_penalty": null,
118
  "finetuning_task": null,
119
  "forced_bos_token_id": null,
120
  "forced_eos_token_id": null,
@@ -160,10 +155,8 @@
160
  "return_dict": true,
161
  "return_dict_in_generate": false,
162
  "sep_token_id": null,
163
- "suppress_tokens": null,
164
  "task_specific_params": null,
165
  "temperature": 1.0,
166
- "tf_legacy_loss": false,
167
  "tie_encoder_decoder": false,
168
  "tie_word_embeddings": true,
169
  "tokenizer_class": null,
@@ -171,7 +164,7 @@
171
  "top_p": 1.0,
172
  "torch_dtype": null,
173
  "torchscript": false,
174
- "typical_p": 1.0,
175
  "use_bfloat16": false
176
  },
177
  "eos_token_id": 50256,
@@ -180,5 +173,5 @@
180
  "pad_token_id": 50256,
181
  "tie_word_embeddings": false,
182
  "torch_dtype": "float32",
183
- "transformers_version": "4.35.2"
184
  }
 
1
  {
2
+ "_name_or_path": "vit-gpt-pt",
3
  "architectures": [
4
  "VisionEncoderDecoderModel"
5
  ],
6
+ "bos_token_id": 50256,
7
  "decoder": {
8
+ "_name_or_path": "",
9
  "activation_function": "gelu_new",
10
  "add_cross_attention": true,
11
  "architectures": [
 
13
  ],
14
  "attn_pdrop": 0.1,
15
  "bad_words_ids": null,
 
16
  "bos_token_id": 50256,
17
  "chunk_size_feed_forward": 0,
18
  "cross_attention_hidden_size": null,
19
+ "decoder_start_token_id": 50256,
20
  "diversity_penalty": 0.0,
21
  "do_sample": false,
22
  "early_stopping": false,
23
  "embd_pdrop": 0.1,
24
  "encoder_no_repeat_ngram_size": 0,
25
  "eos_token_id": 50256,
 
26
  "finetuning_task": null,
27
  "forced_bos_token_id": null,
28
  "forced_eos_token_id": null,
 
55
  "output_attentions": false,
56
  "output_hidden_states": false,
57
  "output_scores": false,
58
+ "pad_token_id": 50256,
59
  "prefix": null,
60
  "problem_type": null,
61
  "pruned_heads": {},
 
73
  "summary_proj_to_labels": true,
74
  "summary_type": "cls_index",
75
  "summary_use_proj": true,
 
76
  "task_specific_params": {
77
  "text-generation": {
78
  "do_sample": true,
 
80
  }
81
  },
82
  "temperature": 1.0,
 
83
  "tie_encoder_decoder": false,
84
  "tie_word_embeddings": true,
85
  "tokenizer_class": null,
 
87
  "top_p": 1.0,
88
  "torch_dtype": null,
89
  "torchscript": false,
90
+ "transformers_version": "4.15.0",
91
  "use_bfloat16": false,
92
  "use_cache": true,
93
  "vocab_size": 50257
94
  },
95
  "decoder_start_token_id": 50256,
96
  "encoder": {
97
+ "_name_or_path": "",
98
  "add_cross_attention": false,
99
  "architectures": [
100
  "ViTModel"
101
  ],
102
  "attention_probs_dropout_prob": 0.0,
103
  "bad_words_ids": null,
 
104
  "bos_token_id": null,
105
  "chunk_size_feed_forward": 0,
106
  "cross_attention_hidden_size": null,
 
109
  "do_sample": false,
110
  "early_stopping": false,
111
  "encoder_no_repeat_ngram_size": 0,
 
112
  "eos_token_id": null,
 
113
  "finetuning_task": null,
114
  "forced_bos_token_id": null,
115
  "forced_eos_token_id": null,
 
155
  "return_dict": true,
156
  "return_dict_in_generate": false,
157
  "sep_token_id": null,
 
158
  "task_specific_params": null,
159
  "temperature": 1.0,
 
160
  "tie_encoder_decoder": false,
161
  "tie_word_embeddings": true,
162
  "tokenizer_class": null,
 
164
  "top_p": 1.0,
165
  "torch_dtype": null,
166
  "torchscript": false,
167
+ "transformers_version": "4.15.0",
168
  "use_bfloat16": false
169
  },
170
  "eos_token_id": 50256,
 
173
  "pad_token_id": 50256,
174
  "tie_word_embeddings": false,
175
  "torch_dtype": "float32",
176
+ "transformers_version": null
177
  }