zwt123home123
committed on
Commit
•
e2e3643
1
Parent(s):
af7dbc6
Update modeling_llama_attncut_window.py
Browse files
modeling_llama_attncut_window.py
CHANGED
@@ -821,7 +821,7 @@ class LlamaDecoderLayer(nn.Module):
|
|
821 |
|
822 |
offset=35
|
823 |
#import pdb; pdb.set_trace()
|
824 |
-
if attention_mask.shape[2]
|
825 |
attention_mask[:,:,offset:offset+576,offset:offset+576]=self.attention_mask_local
|
826 |
|
827 |
# import pdb; pdb.set_trace()
|
|
|
821 |
|
822 |
offset=35
|
823 |
#import pdb; pdb.set_trace()
|
824 |
+
if attention_mask.shape[2]>576:
|
825 |
attention_mask[:,:,offset:offset+576,offset:offset+576]=self.attention_mask_local
|
826 |
|
827 |
# import pdb; pdb.set_trace()
|