We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 5ba2396 commit 85b1d42 (Copy full SHA for 85b1d42)
vllm_ascend/worker/model_runner_v1.py
@@ -2000,7 +2000,7 @@ def execute_model(
2000
logits = model_output_broadcast_data["logits"]
2001
2002
# Apply structured output bitmasks if present
2003
- if scheduler_output.grammar_bitmask is not None:
+ if scheduler_output.structured_output_request_ids:
2004
logits = self.apply_grammar_bitmask(scheduler_output, logits)
2005
2006
# Sample the next token and get logprobs if needed.
0 commit comments