damerajee committed on
Commit
606f075
·
verified ·
1 Parent(s): 1d82b40

Update modeling_Llamoe.py

Browse files
Files changed (1) hide show
  1. modeling_Llamoe.py +1 -1
modeling_Llamoe.py CHANGED
@@ -745,7 +745,7 @@ class LlamoeDecoderLayer(nn.Module):
745
 
746
  self.self_attn = LLAMOE_ATTENTION_CLASSES[config._attn_implementation](config, layer_idx)
747
 
748
- self.block_sparse_moe = LlamoeBlockSparseTop2MLPSparseMoeBlock(config)
749
  self.input_layernorm = LlamoeRMSNorm(config.hidden_size, eps=config.rms_norm_eps)
750
  self.post_attention_layernorm = LlamoeRMSNorm(config.hidden_size, eps=config.rms_norm_eps)
751
 
 
745
 
746
  self.self_attn = LLAMOE_ATTENTION_CLASSES[config._attn_implementation](config, layer_idx)
747
 
748
+ self.block_sparse_moe = LlamoeBlockSparseTop2MLP(config)
749
  self.input_layernorm = LlamoeRMSNorm(config.hidden_size, eps=config.rms_norm_eps)
750
  self.post_attention_layernorm = LlamoeRMSNorm(config.hidden_size, eps=config.rms_norm_eps)
751