Update modeling_Llamoe.py
Browse files
- modeling_Llamoe.py +1 -1
modeling_Llamoe.py
CHANGED
@@ -745,7 +745,7 @@ class LlamoeDecoderLayer(nn.Module):
|
|
745 |
|
746 |
self.self_attn = LLAMOE_ATTENTION_CLASSES[config._attn_implementation](config, layer_idx)
|
747 |
|
748 |
-
self.block_sparse_moe =
|
749 |
self.input_layernorm = LlamoeRMSNorm(config.hidden_size, eps=config.rms_norm_eps)
|
750 |
self.post_attention_layernorm = LlamoeRMSNorm(config.hidden_size, eps=config.rms_norm_eps)
|
751 |
|
|
|
745 |
|
746 |
self.self_attn = LLAMOE_ATTENTION_CLASSES[config._attn_implementation](config, layer_idx)
|
747 |
|
748 |
+
self.block_sparse_moe = LlamoeBlockSparseTop2MLP(config)
|
749 |
self.input_layernorm = LlamoeRMSNorm(config.hidden_size, eps=config.rms_norm_eps)
|
750 |
self.post_attention_layernorm = LlamoeRMSNorm(config.hidden_size, eps=config.rms_norm_eps)
|
751 |
|