@@ -332,7 +332,7 @@ def main(args):
332
332
333
333
if __name__ == "__main__" :
334
334
parser = argparse .ArgumentParser (description = __doc__ )
335
- parser .add_argument ("--model_dir " ,
335
+ parser .add_argument ("--model-dir " ,
336
336
help = "Specify where the HuggingFace model is" ,
337
337
required = True )
338
338
parser .add_argument ("--device" , default = "cuda" )
@@ -346,19 +346,19 @@ def main(args):
346
346
"full_prec"
347
347
],
348
348
)
349
- parser .add_argument ("--batch_size " ,
349
+ parser .add_argument ("--batch-size " ,
350
350
help = "Batch size for calibration." ,
351
351
type = int ,
352
352
default = 1 )
353
- parser .add_argument ("--calib_size " ,
353
+ parser .add_argument ("--calib-size " ,
354
354
help = "Number of samples for calibration." ,
355
355
type = int ,
356
356
default = 512 )
357
- parser .add_argument ("--output_dir " , default = "exported_model" )
358
- parser .add_argument ("--tp_size " , type = int , default = 1 )
359
- parser .add_argument ("--pp_size " , type = int , default = 1 )
360
- parser .add_argument ("--awq_block_size " , type = int , default = 128 )
361
- parser .add_argument ("--kv_cache_dtype " ,
357
+ parser .add_argument ("--output-dir " , default = "exported_model" )
358
+ parser .add_argument ("--tp-size " , type = int , default = 1 )
359
+ parser .add_argument ("--pp-size " , type = int , default = 1 )
360
+ parser .add_argument ("--awq-block-size " , type = int , default = 128 )
361
+ parser .add_argument ("--kv-cache-dtype " ,
362
362
help = "KV Cache dtype." ,
363
363
default = None ,
364
364
choices = ["int8" , "fp8" , None ])
0 commit comments