marriola committed on
Commit
d5ecd4b
·
verified ·
1 Parent(s): 95c0f16

Upload BD3LM

Browse files
Files changed (1) hide show
  1. modeling_bd3lm.py +1 -1
modeling_bd3lm.py CHANGED
@@ -341,7 +341,7 @@ class DDiTBlock(nn.Module):
341
  qkv = self.attn_qkv(x)
342
  # store kv cache in a sliding window (can't exceed context len)
343
  if store_kv:
344
- self.kv_cache = qkv[:, -(self.n-self.block_size):]
345
 
346
  qkv = einops.rearrange(
347
  qkv,
 
341
  qkv = self.attn_qkv(x)
342
  # store kv cache in a sliding window (can't exceed context len)
343
  if store_kv:
344
+ self.kv_cache = qkv[:, -(self.max_seqlen-self.block_size):]
345
 
346
  qkv = einops.rearrange(
347
  qkv,