transformers-4.49 (#1)
Browse files
- update modeling for transformers 4.49 (a922276c6075dfe39fe468a556ea1afcfe34989c)
Co-authored-by: Ella Charlaix <[email protected]>
- config.json +1 -1
- modeling_maira2.py +3 -3
config.json
CHANGED
@@ -36,7 +36,7 @@
|
|
36 |
"vocab_size": 32207
|
37 |
},
|
38 |
"torch_dtype": "float32",
|
39 |
-
"transformers_version": "4.
|
40 |
"vision_config": {
|
41 |
"apply_layernorm": true,
|
42 |
"architectures": [
|
|
|
36 |
"vocab_size": 32207
|
37 |
},
|
38 |
"torch_dtype": "float32",
|
39 |
+
"transformers_version": "4.49.0",
|
40 |
"vision_config": {
|
41 |
"apply_layernorm": true,
|
42 |
"architectures": [
|
modeling_maira2.py
CHANGED
@@ -105,7 +105,7 @@ class Maira2ForConditionalGeneration(LlavaForConditionalGeneration):
|
|
105 |
output_hidden_states: Optional[bool] = None,
|
106 |
return_dict: Optional[bool] = None,
|
107 |
cache_position: Optional[torch.LongTensor] = None,
|
108 |
-
|
109 |
) -> Union[Tuple, LlavaCausalLMOutputWithPast]:
|
110 |
r"""
|
111 |
Args:
|
@@ -246,7 +246,7 @@ class Maira2ForConditionalGeneration(LlavaForConditionalGeneration):
|
|
246 |
output_hidden_states=output_hidden_states,
|
247 |
return_dict=return_dict,
|
248 |
cache_position=cache_position,
|
249 |
-
|
250 |
)
|
251 |
|
252 |
logits = outputs[0]
|
@@ -356,4 +356,4 @@ class Maira2ForConditionalGeneration(LlavaForConditionalGeneration):
|
|
356 |
if labels is None:
|
357 |
final_labels = None
|
358 |
|
359 |
-
return final_embedding, final_attention_mask, final_labels, position_ids
|
|
|
105 |
output_hidden_states: Optional[bool] = None,
|
106 |
return_dict: Optional[bool] = None,
|
107 |
cache_position: Optional[torch.LongTensor] = None,
|
108 |
+
logits_to_keep: int = 0,
|
109 |
) -> Union[Tuple, LlavaCausalLMOutputWithPast]:
|
110 |
r"""
|
111 |
Args:
|
|
|
246 |
output_hidden_states=output_hidden_states,
|
247 |
return_dict=return_dict,
|
248 |
cache_position=cache_position,
|
249 |
+
logits_to_keep=logits_to_keep,
|
250 |
)
|
251 |
|
252 |
logits = outputs[0]
|
|
|
356 |
if labels is None:
|
357 |
final_labels = None
|
358 |
|
359 |
+
return final_embedding, final_attention_mask, final_labels, position_ids
|