diff --git a/vllm/lora/ops/triton_ops/kernel_utils.py b/vllm/lora/ops/triton_ops/kernel_utils.py index 3572d3018622..5b8c19376106 100644 --- a/vllm/lora/ops/triton_ops/kernel_utils.py +++ b/vllm/lora/ops/triton_ops/kernel_utils.py @@ -130,7 +130,7 @@ def do_expand_kernel( # Identify A and B block pointers offset_k = tl.arange(0, BLOCK_K) a_ptr = (cur_input_ptr + ram[:, None] * input_d1_stride + - offset_k[None, :] * input_d2_stride, ) + offset_k[None, :] * input_d2_stride) b_ptr = (cur_lora_ptr + cur_lora_d0_stride * lora_index + offset_k[:, None] * cur_lora_d2_stride + rbn[None, :] * cur_lora_d1_stride)