Update modeling_nort5.py
Browse files- modeling_nort5.py +2 -2
modeling_nort5.py
CHANGED
|
@@ -134,7 +134,7 @@ class DecoderLayer(nn.Module):
|
|
| 134 |
if past_key_value is not None:
|
| 135 |
self_attn_past_key_value = past_key_value[:2]
|
| 136 |
cross_attn_past_key_value = past_key_value[2:]
|
| 137 |
-
query_offset = self_attn_past_key_value[0].size(
|
| 138 |
else:
|
| 139 |
self_attn_past_key_value, cross_attn_past_key_value = None, None
|
| 140 |
|
|
@@ -570,7 +570,7 @@ class NorT5ForConditionalGeneration(NorT5Model):
|
|
| 570 |
output_hidden_states: Optional[bool] = None,
|
| 571 |
return_dict: Optional[bool] = None,
|
| 572 |
):
|
| 573 |
-
use_cache = use_cache if use_cache is not None else self.config
|
| 574 |
return_dict = return_dict if return_dict is not None else self.config.use_return_dict
|
| 575 |
|
| 576 |
if encoder_outputs is None:
|
|
|
|
| 134 |
if past_key_value is not None:
|
| 135 |
self_attn_past_key_value = past_key_value[:2]
|
| 136 |
cross_attn_past_key_value = past_key_value[2:]
|
| 137 |
+
query_offset = self_attn_past_key_value[0].size(2)
|
| 138 |
else:
|
| 139 |
self_attn_past_key_value, cross_attn_past_key_value = None, None
|
| 140 |
|
|
|
|
| 570 |
output_hidden_states: Optional[bool] = None,
|
| 571 |
return_dict: Optional[bool] = None,
|
| 572 |
):
|
| 573 |
+
use_cache = use_cache if use_cache is not None else getattr(self.config, "use_cache", False)
|
| 574 |
return_dict = return_dict if return_dict is not None else self.config.use_return_dict
|
| 575 |
|
| 576 |
if encoder_outputs is None:
|