diff --git a/vllm_flash_attn/flash_attn_interface.py b/vllm_flash_attn/flash_attn_interface.py index 6a5f16cf7..3a81a3027 100644 --- a/vllm_flash_attn/flash_attn_interface.py +++ b/vllm_flash_attn/flash_attn_interface.py @@ -709,7 +709,7 @@ def flash_attn_qkvpacked_func( alibi_slopes, deterministic, return_attn_probs, - out=out, + out, ) @@ -786,7 +786,7 @@ def flash_attn_kvpacked_func( alibi_slopes, deterministic, return_attn_probs, - out=out, + out, ) @@ -863,7 +863,7 @@ def flash_attn_func( alibi_slopes, deterministic, return_attn_probs, - out=out, + out, ) @@ -928,7 +928,7 @@ def flash_attn_varlen_qkvpacked_func( alibi_slopes, deterministic, return_attn_probs, - out=out, + out, ) @@ -1019,7 +1019,7 @@ def flash_attn_varlen_kvpacked_func( alibi_slopes, deterministic, return_attn_probs, - out=out, + out, ) @@ -1112,7 +1112,7 @@ def flash_attn_varlen_func( deterministic, return_attn_probs, block_table, - out=out, + out, )