Skip to content

Commit 9f66019

Browse files
committed
update start vllm server script
1 parent ec361e5 commit 9f66019

File tree

1 file changed

+1
-8
lines changed

1 file changed

+1
-8
lines changed

vllm_musa/start_vllm_server.sh

Lines changed: 1 addition & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -5,9 +5,8 @@ set -e
55
# 默认参数配置
66
DEFAULT_PORT=8000
77
DEFAULT_HOST="localhost"
8-
DEFAULT_GPU_UTIL=0.8
8+
DEFAULT_GPU_UTIL=0.9
99
DEFAULT_TP_SIZE=1
10-
DEFAULT_MODEL_LEN=4096
1110
DEFAULT_TRUST_REMOTE_CODE=true
1211
DEFUALT_SERVED_MODEL_NAME=""
1312

@@ -71,10 +70,6 @@ parse_arguments() {
7170
DEFAULT_TP_SIZE="$2"
7271
shift 2
7372
;;
74-
--max-model-len)
75-
DEFAULT_MODEL_LEN="$2"
76-
shift 2
77-
;;
7873
--trust-remote-code)
7974
DEFAULT_TRUST_REMOTE_CODE=true
8075
shift
@@ -121,7 +116,6 @@ build_final_args() {
121116
"--host" "$DEFAULT_HOST"
122117
"--gpu-memory-utilization" "$DEFAULT_GPU_UTIL"
123118
"--tensor-parallel-size" "$DEFAULT_TP_SIZE"
124-
"--max-model-len" "$DEFAULT_MODEL_LEN"
125119
"--served-model-name" "${DEFUALT_SERVED_MODEL_NAME:-$(basename "$MODEL")}"
126120
)
127121

@@ -213,7 +207,6 @@ start_vllm() {
213207
echo "Port : $DEFAULT_PORT"
214208
echo "GPU Utilization : $DEFAULT_GPU_UTIL"
215209
echo "Tensor Parallel : $DEFAULT_TP_SIZE"
216-
echo "Max Model Length : $DEFAULT_MODEL_LEN"
217210
echo "Trust Remote Code : $DEFAULT_TRUST_REMOTE_CODE"
218211
echo "Extra Arguments : ${USER_ARGS[*]}"
219212
echo "Full Command : vllm serve ${FINAL_ARGS[*]}"

0 commit comments

Comments
 (0)