Update modeling_afmoe_scm.py
Browse files
- modeling_afmoe_scm.py +1 -0
modeling_afmoe_scm.py
CHANGED
|
@@ -299,6 +299,7 @@ class AfmoeSCMAttention(nn.Module):
|
|
| 299 |
|
| 300 |
self.scaling = self.head_dim**-0.5
|
| 301 |
self.attention_dropout = config.attention_dropout
|
|
|
|
| 302 |
self.is_local_attention = config.layer_types[layer_idx] == "sliding_attention"
|
| 303 |
self.sliding_window = config.sliding_window if self.is_local_attention else None
|
| 304 |
|
|
|
|
| 299 |
|
| 300 |
self.scaling = self.head_dim**-0.5
|
| 301 |
self.attention_dropout = config.attention_dropout
|
| 302 |
+
self.is_causal = True
|
| 303 |
self.is_local_attention = config.layer_types[layer_idx] == "sliding_attention"
|
| 304 |
self.sliding_window = config.sliding_window if self.is_local_attention else None
|
| 305 |
|