Skip to content

Commit a21076e

Browse files
authored
[Misc] Ensure out-of-tree quantization method is recognized by cli args (#14328)
Signed-off-by: liuyanyi <wolfsonliu@163.com>
1 parent 212007b commit a21076e

File tree

1 file changed

+4
-4
lines changed

1 file changed

+4
-4
lines changed

vllm/engine/arg_utils.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1478,15 +1478,15 @@ class AsyncEngineArgs(EngineArgs):
14781478
@staticmethod
14791479
def add_cli_args(parser: FlexibleArgumentParser,
14801480
async_args_only: bool = False) -> FlexibleArgumentParser:
1481+
# Initialize plugins to update the parser. For example, a plugin may
1482+
# add a new kind of quantization method to the --quantization argument or
1483+
# a new device to the --device argument.
1484+
load_general_plugins()
14811485
if not async_args_only:
14821486
parser = EngineArgs.add_cli_args(parser)
14831487
parser.add_argument('--disable-log-requests',
14841488
action='store_true',
14851489
help='Disable logging requests.')
1486-
# Initialize plugins to update the parser. For example, a plugin may
1487-
# add a new kind of quantization method to the --quantization argument or
1488-
# a new device to the --device argument.
1489-
load_general_plugins()
14901490
from vllm.platforms import current_platform
14911491
current_platform.pre_register_and_update(parser)
14921492
return parser

0 commit comments

Comments
 (0)