diff --git a/vllm/model_executor/guided_decoding/outlines_logits_processors.py b/vllm/model_executor/guided_decoding/outlines_logits_processors.py index 1c8f6cccb3e9a..5382f0f655264 100644 --- a/vllm/model_executor/guided_decoding/outlines_logits_processors.py +++ b/vllm/model_executor/guided_decoding/outlines_logits_processors.py @@ -61,7 +61,7 @@ def __call__(self, input_ids: List[int], -math.inf, device=scores.device) mask[allowed_tokens] = 0 - scores.add_(mask) + scores = scores.add(mask) return scores