1 file changed: +1 -8 lines changed
Original file line number | Diff line number | Diff line change
55# 默认参数配置
66DEFAULT_PORT=8000
77DEFAULT_HOST=" localhost"
8- DEFAULT_GPU_UTIL=0.8
8+ DEFAULT_GPU_UTIL=0.9
99DEFAULT_TP_SIZE=1
10- DEFAULT_MODEL_LEN=4096
1110DEFAULT_TRUST_REMOTE_CODE=true
1211DEFUALT_SERVED_MODEL_NAME=" "
1312
@@ -71,10 +70,6 @@ parse_arguments() {
7170 DEFAULT_TP_SIZE=" $2 "
7271 shift 2
7372 ;;
74- --max-model-len)
75- DEFAULT_MODEL_LEN=" $2 "
76- shift 2
77- ;;
7873 --trust-remote-code)
7974 DEFAULT_TRUST_REMOTE_CODE=true
8075 shift
@@ -121,7 +116,6 @@ build_final_args() {
121116 " --host" " $DEFAULT_HOST "
122117 " --gpu-memory-utilization" " $DEFAULT_GPU_UTIL "
123118 " --tensor-parallel-size" " $DEFAULT_TP_SIZE "
124- " --max-model-len" " $DEFAULT_MODEL_LEN "
125119 " --served-model-name" " ${DEFUALT_SERVED_MODEL_NAME:- $(basename " $MODEL " )} "
126120 )
127121
@@ -213,7 +207,6 @@ start_vllm() {
213207 echo " Port : $DEFAULT_PORT "
214208 echo " GPU Utilization : $DEFAULT_GPU_UTIL "
215209 echo " Tensor Parallel : $DEFAULT_TP_SIZE "
216- echo " Max Model Length : $DEFAULT_MODEL_LEN "
217210 echo " Trust Remote Code : $DEFAULT_TRUST_REMOTE_CODE "
218211 echo " Extra Arguments : ${USER_ARGS[*]} "
219212 echo " Full Command : vllm serve ${FINAL_ARGS[*]} "
You can’t perform that action at this time.
0 commit comments