Update modeling_Llamoe.py
Browse files
- modeling_Llamoe.py +1 -1
modeling_Llamoe.py
CHANGED
@@ -678,7 +678,7 @@ class LlamoeDecoderLayer(nn.Module):
678 |   super().__init__()
679 |   self.hidden_size = config.hidden_size
680 |
681 | - self.self_attn =
682 |
683 |   self.block_sparse_moe = LlamoeSparseMoeBlock(config)
684 |   self.input_layernorm = LlamoeRMSNorm(config.hidden_size, eps=config.rms_norm_eps)

678 |   super().__init__()
679 |   self.hidden_size = config.hidden_size
680 |
681 | + self.self_attn = LLAMOE_ATTENTION_CLASSES[config._attn_implementation](config, layer_idx)
682 |
683 |   self.block_sparse_moe = LlamoeSparseMoeBlock(config)
684 |   self.input_layernorm = LlamoeRMSNorm(config.hidden_size, eps=config.rms_norm_eps)