Skip to content

Commit b53d3ef

Browse files
committed
support vllm==0.4.2
1 parent 1650d36 commit b53d3ef

File tree

3 files changed

+4
-0
lines changed

3 files changed

+4
-0
lines changed

api/utils/protocol.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -236,6 +236,8 @@ class ChatCompletionCreateParams(BaseModel):
236 236

237 237
guided_grammar: Optional[str] = None
238 238

239+
guided_decoding_backend: Optional[str] = "lm-format-enforcer"
240+
239 241

240 242
class CompletionCreateParams(BaseModel):
241 243
model: str

api/vllm_routes/chat.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -106,6 +106,7 @@ async def create_chat_completion(
106 106
from vllm.model_executor.guided_decoding import get_guided_decoding_logits_processor
107 107
guided_decode_logits_processor = (
108 108
await get_guided_decoding_logits_processor(
109+
request.guided_decoding_backend,
109 110
request,
110 111
engine.tokenizer,
111 112
)

api/vllm_routes/completion.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -145,6 +145,7 @@ async def create_completion(
145 145
from vllm.model_executor.guided_decoding import get_guided_decoding_logits_processor
146 146
guided_decode_logits_processor = (
147 147
await get_guided_decoding_logits_processor(
148+
request.guided_decoding_backend,
148 149
request,
149 150
engine.tokenizer,
150 151
)

0 commit comments

Comments
 (0)