@@ -332,7 +332,7 @@ def main(args):
332332
333333if __name__ == "__main__" :
334334 parser = argparse .ArgumentParser (description = __doc__ )
335- parser .add_argument ("--model_dir " ,
335+ parser .add_argument ("--model-dir " ,
336336 help = "Specify where the HuggingFace model is" ,
337337 required = True )
338338 parser .add_argument ("--device" , default = "cuda" )
@@ -346,19 +346,19 @@ def main(args):
346346 "full_prec"
347347 ],
348348 )
349- parser .add_argument ("--batch_size " ,
349+ parser .add_argument ("--batch-size " ,
350350 help = "Batch size for calibration." ,
351351 type = int ,
352352 default = 1 )
353- parser .add_argument ("--calib_size " ,
353+ parser .add_argument ("--calib-size " ,
354354 help = "Number of samples for calibration." ,
355355 type = int ,
356356 default = 512 )
357- parser .add_argument ("--output_dir " , default = "exported_model" )
358- parser .add_argument ("--tp_size " , type = int , default = 1 )
359- parser .add_argument ("--pp_size " , type = int , default = 1 )
360- parser .add_argument ("--awq_block_size " , type = int , default = 128 )
361- parser .add_argument ("--kv_cache_dtype " ,
357+ parser .add_argument ("--output-dir " , default = "exported_model" )
358+ parser .add_argument ("--tp-size " , type = int , default = 1 )
359+ parser .add_argument ("--pp-size " , type = int , default = 1 )
360+ parser .add_argument ("--awq-block-size " , type = int , default = 128 )
361+ parser .add_argument ("--kv-cache-dtype " ,
362362 help = "KV Cache dtype." ,
363363 default = None ,
364364 choices = ["int8" , "fp8" , None ])
0 commit comments