Update config.json
Browse files- config.json +27 -17
config.json
CHANGED
@@ -102,20 +102,12 @@
|
|
102 |
},
|
103 |
"max_position_embeddings": 1024,
|
104 |
"model_type": "bart",
|
105 |
-
"
|
106 |
-
"
|
107 |
-
"
|
108 |
-
"
|
109 |
-
"
|
110 |
-
"
|
111 |
-
"no_repeat_ngram_size": 2,
|
112 |
-
"num_beams": 5,
|
113 |
-
"num_embeddings": 50257,
|
114 |
-
"num_heads": 64,
|
115 |
-
"num_layers": 24,
|
116 |
-
"output_attentions": true,
|
117 |
-
"output_hidden_states": true,
|
118 |
-
"pad_token_id": 50267,
|
119 |
"reorder_and_upcast_attn": false,
|
120 |
"resid_pdrop": 0.1,
|
121 |
"scale_attn_by_inverse_layer_idx": false,
|
@@ -157,10 +149,28 @@
|
|
157 |
"temperature": 0.9,
|
158 |
"top_k": 50,
|
159 |
"top_p": 0.95
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
160 |
}
|
161 |
},
|
162 |
"torch_dtype": "float32",
|
163 |
-
"transformers_version": "4.
|
164 |
"use_cache": true,
|
165 |
-
"vocab_size":
|
166 |
-
}
|
|
|
102 |
},
|
103 |
"max_position_embeddings": 1024,
|
104 |
"model_type": "bart",
|
105 |
+
"no_repeat_ngram_size": 3,
|
106 |
+
"normalize_before": false,
|
107 |
+
"num_beams": 4,
|
108 |
+
"num_hidden_layers": 12,
|
109 |
+
"pad_token_id": 1,
|
110 |
+
"scale_embedding": false,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
111 |
"reorder_and_upcast_attn": false,
|
112 |
"resid_pdrop": 0.1,
|
113 |
"scale_attn_by_inverse_layer_idx": false,
|
|
|
149 |
"temperature": 0.9,
|
150 |
"top_k": 50,
|
151 |
"top_p": 0.95
|
152 |
+
},
|
153 |
+
"summarization": {
|
154 |
+
"length_penalty": 1.0,
|
155 |
+
"max_length": 128,
|
156 |
+
"min_length": 12,
|
157 |
+
"num_beams": 4
|
158 |
+
},
|
159 |
+
"summarization_cnn": {
|
160 |
+
"length_penalty": 2.0,
|
161 |
+
"max_length": 142,
|
162 |
+
"min_length": 56,
|
163 |
+
"num_beams": 4
|
164 |
+
},
|
165 |
+
"summarization_xsum": {
|
166 |
+
"length_penalty": 1.0,
|
167 |
+
"max_length": 62,
|
168 |
+
"min_length": 11,
|
169 |
+
"num_beams": 6
|
170 |
}
|
171 |
},
|
172 |
"torch_dtype": "float32",
|
173 |
+
"transformers_version": "4.7.0.dev0",
|
174 |
"use_cache": true,
|
175 |
+
"vocab_size": 50265
|
176 |
+
}
|