Merge pull request #451 from OpenAccess-AI-Collective/eval-is-causal
is_causal fix for evals?
This commit is contained in:
@@ -158,7 +158,7 @@ def flashattn_forward(
|
||||
else:
|
||||
# turn off FA causal mask after first inference autoregressive iteration
|
||||
# only on first autoregressive step q,k,v have same seqlen
|
||||
- is_causal = past_key_value is not None
+ is_causal = key_states.shape == query_states.shape
|
||||
|
||||
if cu_seqlens is not None and max_seqlen is not None:
|
||||
# special handling using sample packing
|
||||
|
||||
Reference in New Issue
Block a user