Skip to content

Commit c01b133

Browse files
Saumya Gandhi authored and committed
default art to vllm default generation config, instead of model
1 parent 25677a3 commit c01b133

File tree

2 files changed

+2
-0
lines changed

2 files changed

+2
-0
lines changed

src/art/dev/model.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -43,6 +43,7 @@ def get_model_config(
         # which is the fallback for devices with compute capability < 8.0
         num_scheduler_steps=16 if torch.cuda.get_device_capability()[0] >= 8 else 1,
         enable_sleep_mode=enable_sleep_mode,
+        generation_config="vllm",
     )
     engine_args.update(config.get("engine_args", {}))
     init_args.update(config.get("init_args", {}))

src/art/dev/openai_server.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -27,6 +27,7 @@ def get_openai_server_config(
         num_scheduler_steps=16,
         served_model_name=base_model,
         disable_log_requests=True,
+        generation_config="vllm",
     )
     engine_args.update(config.get("engine_args", {}))
     return OpenAIServerConfig(

0 commit comments

Comments
 (0)