baichuan-inc
/

Baichuan-13B-Base

Text Generation

text-generation-inference

Model card Files Files and versions Community

GradientGuru committed on Jul 11, 2023

Commit

63cd6bd

·

1 Parent(s): 54e47f6

Update modeling_baichuan.py

Files changed (1) hide show

modeling_baichuan.py +8 -1

modeling_baichuan.py CHANGED Viewed

@@ -4,6 +4,7 @@ import math
 from typing import List, Optional, Tuple, Union
 import torch
 from torch.nn import CrossEntropyLoss
 from transformers import PreTrainedModel
 from transformers.activations import ACT2FN
@@ -235,7 +236,13 @@ class BaichuanModel(BaichuanPreTrainedModel):
         self.post_init()
         self.max_cache_pos = config.model_max_length
         self.first_run = True
     def get_alibi_mask(self, tensor, seq_length_with_past):
         if self.first_run:
             self.first_run = False

 from typing import List, Optional, Tuple, Union
 import torch
+import torch.utils.checkpoint
 from torch.nn import CrossEntropyLoss
 from transformers import PreTrainedModel
 from transformers.activations import ACT2FN
         self.post_init()
         self.max_cache_pos = config.model_max_length
         self.first_run = True
+    def get_input_embeddings(self):
+        return self.embed_tokens
+    def set_input_embeddings(self, value):
+        self.embed_tokens = value
     def get_alibi_mask(self, tensor, seq_length_with_past):
         if self.first_run:
             self.first_run = False