haijunlv committed
Commit 28c9941 · verified · 1 Parent(s): 011ff6d

Update modeling_internlm3.py (#18)


- Update modeling_internlm3.py (94cd46f35e87e1b3b2b82df73230bdb5275cd652)
- Update tokenization_internlm3.py (0f3d7019880c0b6f7a9d35b392d21cbfca07478b)

modeling_internlm3.py CHANGED

@@ -793,7 +793,7 @@ class InternLM3Model(InternLM3PreTrainedModel):
     Args:
         config: InternLM3Config
     """
-
+    _auto_class = "AutoModel"
     def __init__(self, config: InternLM3Config):
         super().__init__(config)
         self.padding_idx = config.pad_token_id

@@ -1070,6 +1070,7 @@ class KwargsForCausalLM(FlashAttentionKwargs, LossKwargs): ...


 class InternLM3ForCausalLM(InternLM3PreTrainedModel, GenerationMixin):
+    _auto_class = "AutoModelForCausalLM"
     _tied_weights_keys = ["lm_head.weight"]
     _tp_plan = {"lm_head": "colwise_rep"}

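For context, setting `_auto_class` on the class has the same effect as registering the custom model through the public API: when the attribute is set, `save_pretrained` records an `auto_map` entry so the `Auto*` factories can resolve the remote-code class. A minimal sketch of the equivalent call (the import path assumes the file ships alongside the checkpoint):

from modeling_internlm3 import InternLM3ForCausalLM

# Equivalent to the class attribute added in the diff above: makes
# save_pretrained() write an auto_map entry into config.json so that
# AutoModelForCausalLM.from_pretrained(..., trust_remote_code=True)
# can locate this custom class.
InternLM3ForCausalLM.register_for_auto_class("AutoModelForCausalLM")
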
tokenization_internlm3.py CHANGED

@@ -67,7 +67,7 @@ class InternLM3Tokenizer(PreTrainedTokenizer):
             Whether or not to add an initial space to the input. This allows to treat the leading word just as any
             other word. Again, this should be set with `from_slow=True` to make sure it's taken into account.
     """
-
+    _auto_class = "AutoTokenizer"
     vocab_files_names = VOCAB_FILES_NAMES
     model_input_names = ["input_ids", "attention_mask"]
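
With both `_auto_class` attributes in place, the checkpoint should load through the standard `Auto*` entry points. A minimal usage sketch, assuming a hypothetical repo id that is not part of this commit:

from transformers import AutoModelForCausalLM, AutoTokenizer

repo = "internlm/internlm3-8b-instruct"  # hypothetical repo id, for illustration only

# trust_remote_code=True lets the Auto* classes follow the auto_map entries
# to the custom InternLM3 tokenizer and model classes shipped with the repo.
tokenizer = AutoTokenizer.from_pretrained(repo, trust_remote_code=True)
model = AutoModelForCausalLM.from_pretrained(repo, trust_remote_code=True)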