Update modeling_Llamoe.py
Browse files
- modeling_Llamoe.py +1 -1
modeling_Llamoe.py
CHANGED
@@ -320,7 +320,7 @@ def repeat_kv(hidden_states: torch.Tensor, n_rep: int) -> torch.Tensor:
|
|
320 |
class LlamoeAttention(nn.Module):
|
321 |
"""Multi-headed attention from 'Attention Is All You Need' paper"""
|
322 |
|
323 |
-
def __init__(self, config:
|
324 |
super().__init__()
|
325 |
self.config = config
|
326 |
self.layer_idx = layer_idx
|
|
|
320 |
class LlamoeAttention(nn.Module):
|
321 |
"""Multi-headed attention from 'Attention Is All You Need' paper"""
|
322 |
|
323 |
+
def __init__(self, config: LlamoeConfig, layer_idx: Optional[int] = None):
|
324 |
super().__init__()
|
325 |
self.config = config
|
326 |
self.layer_idx = layer_idx
|