Update modernberg_model.py
Browse files- modernberg_model.py +1 -0
modernberg_model.py
CHANGED
|
@@ -413,6 +413,7 @@ class GriffinRecurrentblock(nn.Module):
|
|
| 413 |
attention_mask: torch.Tensor,
|
| 414 |
cache_position: torch.Tensor,
|
| 415 |
use_cache: bool = True,
|
|
|
|
| 416 |
) -> Tuple[torch.Tensor, Dict[str, torch.Tensor]]:
|
| 417 |
_, seq_len, _ = input_states.shape
|
| 418 |
|
|
|
|
| 413 |
attention_mask: torch.Tensor,
|
| 414 |
cache_position: torch.Tensor,
|
| 415 |
use_cache: bool = True,
|
| 416 |
+ **kwargs
|
| 417 |
) -> Tuple[torch.Tensor, Dict[str, torch.Tensor]]:
|
| 418 |
_, seq_len, _ = input_states.shape
|
| 419 |
|