diff --git a/csrc/attention/paged_attention_v2.cu b/csrc/attention/paged_attention_v2.cu index 13e070f30f643..0c9caeb687ecb 100644 --- a/csrc/attention/paged_attention_v2.cu +++ b/csrc/attention/paged_attention_v2.cu @@ -145,7 +145,7 @@ void paged_attention_v2_launcher( #define CALL_V2_LAUNCHER(T, CACHE_T, BLOCK_SIZE, KV_DTYPE, IS_BLOCK_SPARSE, \ NUM_THREADS, PARTITION_SIZE) \ paged_attention_v2_launcher( \ + IS_BLOCK_SPARSE, NUM_THREADS, PARTITION_SIZE>( \ out, exp_sums, max_logits, tmp_out, query, key_cache, value_cache, \ num_kv_heads, scale, block_tables, seq_lens, max_seq_len, alibi_slopes, \ k_scale, v_scale, tp_rank, blocksparse_local_blocks, \