damerajee committed on
Commit
28eb841
1 Parent(s): bdfe503

Update modeling_Llamoe.py

Browse files
Files changed (1) hide show
  1. modeling_Llamoe.py +1 -1
modeling_Llamoe.py CHANGED
@@ -320,7 +320,7 @@ def repeat_kv(hidden_states: torch.Tensor, n_rep: int) -> torch.Tensor:
320
  class LlamoeAttention(nn.Module):
321
  """Multi-headed attention from 'Attention Is All You Need' paper"""
322
 
323
- def __init__(self, config: LlamaConfig, layer_idx: Optional[int] = None):
324
  super().__init__()
325
  self.config = config
326
  self.layer_idx = layer_idx
 
320
  class LlamoeAttention(nn.Module):
321
  """Multi-headed attention from 'Attention Is All You Need' paper"""
322
 
323
+ def __init__(self, config: LlamoeConfig, layer_idx: Optional[int] = None):
324
  super().__init__()
325
  self.config = config
326
  self.layer_idx = layer_idx