Ontocord.AI
committed on
Commit
·
3a6a19a
1
Parent(s):
c5e4b95
Upload modeling_mpt.py with huggingface_hub
Browse files
- modeling_mpt.py +2 -0
modeling_mpt.py
CHANGED
@@ -1,4 +1,5 @@
|
|
1 |
"""A simple, flexible implementation of a GPT model.
|
|
|
2 |
Inspired by https://github.com/karpathy/minGPT/blob/master/mingpt/model.py
|
3 |
"""
|
4 |
import math
|
@@ -307,6 +308,7 @@ class MPTForCausalLM(MPTPreTrainedModel):
|
|
307 |
@staticmethod
|
308 |
def _reorder_cache(past_key_values, beam_idx):
|
309 |
"""Used by HuggingFace generate when using beam search with kv-caching.
|
|
|
310 |
See https://github.com/huggingface/transformers/blob/3ec7a47664ebe40c40f4b722f6bb1cd30c3821ec/src/transformers/models/gpt2/modeling_gpt2.py#L1122-L1133
|
311 |
for an example in transformers.
|
312 |
"""
|
|
|
1 |
"""A simple, flexible implementation of a GPT model.
|
2 |
+
|
3 |
Inspired by https://github.com/karpathy/minGPT/blob/master/mingpt/model.py
|
4 |
"""
|
5 |
import math
|
|
|
308 |
@staticmethod
|
309 |
def _reorder_cache(past_key_values, beam_idx):
|
310 |
"""Used by HuggingFace generate when using beam search with kv-caching.
|
311 |
+
|
312 |
See https://github.com/huggingface/transformers/blob/3ec7a47664ebe40c40f4b722f6bb1cd30c3821ec/src/transformers/models/gpt2/modeling_gpt2.py#L1122-L1133
|
313 |
for an example in transformers.
|
314 |
"""
|