Update modeling_afmoe_scm_liger.py
Browse files
modeling_afmoe_scm_liger.py
CHANGED
|
@@ -301,6 +301,7 @@ class AfmoeSCMAttention(nn.Module):
|
|
| 301 |
|
| 302 |
self.scaling = self.head_dim**-0.5
|
| 303 |
self.attention_dropout = config.attention_dropout
|
|
|
|
| 304 |
self.is_local_attention = config.layer_types[layer_idx] == "sliding_attention"
|
| 305 |
self.sliding_window = config.sliding_window if self.is_local_attention else None
|
| 306 |
|
|
|
|
| 301 |
|
| 302 |
self.scaling = self.head_dim**-0.5
|
| 303 |
self.attention_dropout = config.attention_dropout
|
| 304 |
+
self.is_causal = True
|
| 305 |
self.is_local_attention = config.layer_types[layer_idx] == "sliding_attention"
|
| 306 |
self.sliding_window = config.sliding_window if self.is_local_attention else None
|
| 307 |
|