Fix eval regression introduced in 13f7efaf74
This commit is contained in:
@@ -155,12 +155,10 @@ def flashattn_forward(
|
|||||||
# during training q,k,v always have same seqlen
|
# during training q,k,v always have same seqlen
|
||||||
assert key_states.shape == query_states.shape
|
assert key_states.shape == query_states.shape
|
||||||
is_causal = True
|
is_causal = True
|
||||||
elif past_key_value is None:
|
|
||||||
is_causal = True
|
|
||||||
else:
|
else:
|
||||||
# turn off FA causal mask after first inference autoregressive iteration
|
# turn off FA causal mask after first inference autoregressive iteration
|
||||||
# only on first autoregressive step q,k,v have same seqlen
|
# only on first autoregressive step q,k,v have same seqlen
|
||||||
is_causal = past_key_value is not None
|
is_causal = key_states.shape == query_states.shape
|
||||||
|
|
||||||
if cu_seqlens is not None and max_seqlen is not None:
|
if cu_seqlens is not None and max_seqlen is not None:
|
||||||
# special handling using sample packing
|
# special handling using sample packing
|
||||||
|
|||||||
Reference in New Issue
Block a user