From a28664f532844cddea8be99cfde45a3af5554b03 Mon Sep 17 00:00:00 2001 From: Tian Zheng <29906817+Tom-Zheng@users.noreply.github.com> Date: Wed, 29 Oct 2025 12:51:37 +0000 Subject: [PATCH] Fix trtllm-gen attention illegal memory access --- flashinfer/decode.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/flashinfer/decode.py b/flashinfer/decode.py index 467152af38..45bc2c58ad 100644 --- a/flashinfer/decode.py +++ b/flashinfer/decode.py @@ -1988,7 +1988,7 @@ def paged_run( q.contiguous(), # NOTE(Siyuan): without contiguous, the result is incorrect paged_k_cache, paged_v_cache, - int_workspace_buffer, + float_workspace_buffer, block_tables, kv_lens_buffer, max_kv_len,