katuni4ka echarlaix HF staff committed on
Commit
62bc4bb
·
verified ·
1 Parent(s): da3a669

transformers-4.49 (#1)

Browse files

- update modeling for transformers 4.49 (a922276c6075dfe39fe468a556ea1afcfe34989c)


Co-authored-by: Ella Charlaix <[email protected]>

Files changed (2) hide show
  1. config.json +1 -1
  2. modeling_maira2.py +3 -3
config.json CHANGED
@@ -36,7 +36,7 @@
36
  "vocab_size": 32207
37
  },
38
  "torch_dtype": "float32",
39
- "transformers_version": "4.48.3",
40
  "vision_config": {
41
  "apply_layernorm": true,
42
  "architectures": [
 
36
  "vocab_size": 32207
37
  },
38
  "torch_dtype": "float32",
39
+ "transformers_version": "4.49.0",
40
  "vision_config": {
41
  "apply_layernorm": true,
42
  "architectures": [
modeling_maira2.py CHANGED
@@ -105,7 +105,7 @@ class Maira2ForConditionalGeneration(LlavaForConditionalGeneration):
105
  output_hidden_states: Optional[bool] = None,
106
  return_dict: Optional[bool] = None,
107
  cache_position: Optional[torch.LongTensor] = None,
108
- num_logits_to_keep: int = 0,
109
  ) -> Union[Tuple, LlavaCausalLMOutputWithPast]:
110
  r"""
111
  Args:
@@ -246,7 +246,7 @@ class Maira2ForConditionalGeneration(LlavaForConditionalGeneration):
246
  output_hidden_states=output_hidden_states,
247
  return_dict=return_dict,
248
  cache_position=cache_position,
249
- num_logits_to_keep=num_logits_to_keep,
250
  )
251
 
252
  logits = outputs[0]
@@ -356,4 +356,4 @@ class Maira2ForConditionalGeneration(LlavaForConditionalGeneration):
356
  if labels is None:
357
  final_labels = None
358
 
359
- return final_embedding, final_attention_mask, final_labels, position_ids
 
105
  output_hidden_states: Optional[bool] = None,
106
  return_dict: Optional[bool] = None,
107
  cache_position: Optional[torch.LongTensor] = None,
108
+ logits_to_keep: int = 0,
109
  ) -> Union[Tuple, LlavaCausalLMOutputWithPast]:
110
  r"""
111
  Args:
 
246
  output_hidden_states=output_hidden_states,
247
  return_dict=return_dict,
248
  cache_position=cache_position,
249
+ logits_to_keep=logits_to_keep,
250
  )
251
 
252
  logits = outputs[0]
 
356
  if labels is None:
357
  final_labels = None
358
 
359
+ return final_embedding, final_attention_mask, final_labels, position_ids