Upload BD3LM
Browse files
- modeling_bd3lm.py +1 -1
modeling_bd3lm.py
CHANGED
@@ -341,7 +341,7 @@ class DDiTBlock(nn.Module):
|
|
341 |
qkv = self.attn_qkv(x)
|
342 |
# store kv cache in a sliding window (can't exceed context len)
|
343 |
if store_kv:
|
344 |
-
self.kv_cache = qkv[:, -(self.… [removed line truncated in the extracted diff; original expression not recoverable here]
|
345 |
|
346 |
qkv = einops.rearrange(
|
347 |
qkv,
|
|
|
341 |
qkv = self.attn_qkv(x)
|
342 |
# store kv cache in a sliding window (can't exceed context len)
|
343 |
if store_kv:
|
344 |
+
self.kv_cache = qkv[:, -(self.max_seqlen-self.block_size):]
|
345 |
|
346 |
qkv = einops.rearrange(
|
347 |
qkv,
|