diff --git a/vllm/_custom_ops.py b/vllm/_custom_ops.py index 92de39418054..70605d3c5f52 100644 --- a/vllm/_custom_ops.py +++ b/vllm/_custom_ops.py @@ -311,7 +311,7 @@ def apply_repetition_penalties(logits: torch.Tensor, prompt_mask: torch.Tensor, output_mask: A boolean tensor indicating which tokens appear in the output. repetition_penalties: The repetition penalties of shape (num_seqs, ). """ - if current_platform.is_cuda() and logits.is_contiguous(): + if logits.is_cuda and logits.is_contiguous(): apply_repetition_penalties_cuda(logits, prompt_mask, output_mask, repetition_penalties) else: