Update modernberg_model.py
Browse files
- modernberg_model.py +1 -0
modernberg_model.py
CHANGED
@@ -413,6 +413,7 @@ class GriffinRecurrentblock(nn.Module):
|
|
413 |
attention_mask: torch.Tensor,
|
414 |
cache_position: torch.Tensor,
|
415 |
use_cache: bool = True,
|
|
|
416 |
) -> Tuple[torch.Tensor, Dict[str, torch.Tensor]]:
|
417 |
_, seq_len, _ = input_states.shape
|
418 |
|
|
|
413 |
attention_mask: torch.Tensor,
|
414 |
cache_position: torch.Tensor,
|
415 |
use_cache: bool = True,
|
416 |
+
**kwargs
|
417 |
) -> Tuple[torch.Tensor, Dict[str, torch.Tensor]]:
|
418 |
_, seq_len, _ = input_states.shape
|
419 |
|