We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 25677a3, commit c01b133 (Copy full SHA for c01b133)
src/art/dev/model.py
@@ -43,6 +43,7 @@ def get_model_config(
43
# which is the fallback for devices with compute capability < 8.0
44
num_scheduler_steps=16 if torch.cuda.get_device_capability()[0] >= 8 else 1,
45
enable_sleep_mode=enable_sleep_mode,
46
+ generation_config="vllm",
47
)
48
engine_args.update(config.get("engine_args", {}))
49
init_args.update(config.get("init_args", {}))
src/art/dev/openai_server.py
@@ -27,6 +27,7 @@ def get_openai_server_config(
27
num_scheduler_steps=16,
28
served_model_name=base_model,
29
disable_log_requests=True,
30
31
32
33
return OpenAIServerConfig(
0 commit comments