diff --git a/flash_attn/flash_attn_interface.py b/flash_attn/flash_attn_interface.py index 167a534..74bbe8e 100644 --- a/flash_attn/flash_attn_interface.py +++ b/flash_attn/flash_attn_interface.py @@ -721,7 +721,7 @@ def flash_attn_qkvpacked_func( softmax_scale, causal, window_size, - softcapping, + softcap, alibi_slopes, deterministic, return_attn_probs, @@ -1270,4 +1270,4 @@ def flash_attn_with_kvcache( rotary_interleaved, num_splits, ) - return (out, softmax_lse) if return_softmax_lse else out \ No newline at end of file + return (out, softmax_lse) if return_softmax_lse else out