Skip to content
This repository was archived by the owner on Oct 11, 2024. It is now read-only.

Commit d72246c

Browse files
AllenDou authored and Robert Shaw committed
[Misc] Fix arg names in quantizer script (vllm-project#5507)
1 parent 61a038e commit d72246c

File tree

1 file changed

+8
-8
lines changed

1 file changed

+8
-8
lines changed

examples/fp8/quantizer/quantize.py

Lines changed: 8 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -332,7 +332,7 @@ def main(args):
332332

333333
if __name__ == "__main__":
334334
parser = argparse.ArgumentParser(description=__doc__)
335-
parser.add_argument("--model_dir",
335+
parser.add_argument("--model-dir",
336336
help="Specify where the HuggingFace model is",
337337
required=True)
338338
parser.add_argument("--device", default="cuda")
@@ -346,19 +346,19 @@ def main(args):
346346
"full_prec"
347347
],
348348
)
349-
parser.add_argument("--batch_size",
349+
parser.add_argument("--batch-size",
350350
help="Batch size for calibration.",
351351
type=int,
352352
default=1)
353-
parser.add_argument("--calib_size",
353+
parser.add_argument("--calib-size",
354354
help="Number of samples for calibration.",
355355
type=int,
356356
default=512)
357-
parser.add_argument("--output_dir", default="exported_model")
358-
parser.add_argument("--tp_size", type=int, default=1)
359-
parser.add_argument("--pp_size", type=int, default=1)
360-
parser.add_argument("--awq_block_size", type=int, default=128)
361-
parser.add_argument("--kv_cache_dtype",
357+
parser.add_argument("--output-dir", default="exported_model")
358+
parser.add_argument("--tp-size", type=int, default=1)
359+
parser.add_argument("--pp-size", type=int, default=1)
360+
parser.add_argument("--awq-block-size", type=int, default=128)
361+
parser.add_argument("--kv-cache-dtype",
362362
help="KV Cache dtype.",
363363
default=None,
364364
choices=["int8", "fp8", None])

0 commit comments

Comments
 (0)