Respect sliding_window=None (#1214)
This commit is contained in:
@@ -94,7 +94,7 @@ def _prepare_decoder_attention_mask(
|
|||||||
sliding_window,
|
sliding_window,
|
||||||
): # pylint: disable=unused-argument
|
): # pylint: disable=unused-argument
|
||||||
# [bsz, seq_len]
|
# [bsz, seq_len]
|
||||||
if attention_mask is None:
|
if attention_mask is None or sliding_window is None:
|
||||||
return attention_mask
|
return attention_mask
|
||||||
|
|
||||||
# NOTE: attention mask and sliding masks are only broadcastable in certain scenarios.
|
# NOTE: attention mask and sliding masks are only broadcastable in certain scenarios.
|
||||||
@@ -151,7 +151,7 @@ def flashattn_forward(
|
|||||||
)
|
)
|
||||||
|
|
||||||
use_sliding_windows = (
|
use_sliding_windows = (
|
||||||
hasattr(self.config, "sliding_window") is not None
|
getattr(self.config, "sliding_window") is not None
|
||||||
and kv_seq_len > self.config.sliding_window
|
and kv_seq_len > self.config.sliding_window
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user