From ca9562bf65d34c7b4e59027a57e50c65ac9ad3b0 Mon Sep 17 00:00:00 2001 From: NickLucche Date: Wed, 15 Jan 2025 14:28:52 +0000 Subject: [PATCH] fix blocksparse tests Signed-off-by: NickLucche --- tests/kernels/test_blocksparse_attention.py | 2 ++ vllm/attention/ops/ipex_attn.py | 1 + 2 files changed, 3 insertions(+) diff --git a/tests/kernels/test_blocksparse_attention.py b/tests/kernels/test_blocksparse_attention.py index fad342d1b5923..1cfba68483338 100644 --- a/tests/kernels/test_blocksparse_attention.py +++ b/tests/kernels/test_blocksparse_attention.py @@ -228,6 +228,7 @@ def test_paged_attention( block_size, max_seq_len, alibi_slopes, + None, # TODO add custom bias kv_cache_dtype, k_scale, v_scale, @@ -265,6 +266,7 @@ def test_paged_attention( block_size, max_seq_len, alibi_slopes, + None, kv_cache_dtype, k_scale, v_scale, diff --git a/vllm/attention/ops/ipex_attn.py b/vllm/attention/ops/ipex_attn.py index cbc6c74acf09a..5e4b1c8bc29e2 100644 --- a/vllm/attention/ops/ipex_attn.py +++ b/vllm/attention/ops/ipex_attn.py @@ -103,6 +103,7 @@ def forward_decode( block_size, max_context_len, alibi_slopes, + None, # TODO add custom bias kv_cache_dtype, k_scale, v_scale,