@@ -54,89 +54,89 @@ import (
54
54
55
55
var (
56
56
grpcPort = flag .Int (
57
- "grpcPort " ,
57
+ "grpc-port " ,
58
58
runserver .DefaultGrpcPort ,
59
59
"The gRPC port used for communicating with Envoy proxy" )
60
60
grpcHealthPort = flag .Int (
61
- "grpcHealthPort " ,
61
+ "grpc-health-port " ,
62
62
runserver .DefaultGrpcHealthPort ,
63
63
"The port used for gRPC liveness and readiness probes" )
64
64
metricsPort = flag .Int (
65
- "metricsPort " ,
65
+ "metrics-port " ,
66
66
runserver .DefaultMetricsPort ,
67
67
"The metrics port" )
68
68
enablePprof = flag .Bool (
69
- "enablePprof " ,
69
+ "enable-pprof " ,
70
70
runserver .DefaultEnablePprof ,
71
71
"Enables pprof handlers. Defaults to true. Set to false to disable pprof handlers." )
72
72
destinationEndpointHintKey = flag .String (
73
- "destinationEndpointHintKey " ,
73
+ "destination-endpoint-hint-key " ,
74
74
runserver .DefaultDestinationEndpointHintKey ,
75
75
"Header and response metadata key used by Envoy to route to the appropriate pod. This must match Envoy configuration." )
76
76
destinationEndpointHintMetadataNamespace = flag .String (
77
- "DestinationEndpointHintMetadataNamespace " ,
77
+ "destination-endpoint-hint-metadata-namespace " ,
78
78
runserver .DefaultDestinationEndpointHintMetadataNamespace ,
79
79
"The key for the outer namespace struct in the metadata field of the extproc response that is used to wrap the" +
80
80
"target endpoint. If not set, then an outer namespace struct should not be created." )
81
81
poolName = flag .String (
82
- "poolName " ,
82
+ "pool-name " ,
83
83
runserver .DefaultPoolName ,
84
84
"Name of the InferencePool this Endpoint Picker is associated with." )
85
85
poolNamespace = flag .String (
86
- "poolNamespace " ,
86
+ "pool-namespace " ,
87
87
runserver .DefaultPoolNamespace ,
88
88
"Namespace of the InferencePool this Endpoint Picker is associated with." )
89
89
refreshMetricsInterval = flag .Duration (
90
- "refreshMetricsInterval " ,
90
+ "refresh-metrics-interval " ,
91
91
runserver .DefaultRefreshMetricsInterval ,
92
92
"interval to refresh metrics" )
93
93
refreshPrometheusMetricsInterval = flag .Duration (
94
- "refreshPrometheusMetricsInterval " ,
94
+ "refresh-prometheus-metrics-interval " ,
95
95
runserver .DefaultRefreshPrometheusMetricsInterval ,
96
96
"interval to flush prometheus metrics" )
97
97
logVerbosity = flag .Int (
98
98
"v" ,
99
99
logging .DEFAULT ,
100
100
"number for the log level verbosity" )
101
101
secureServing = flag .Bool (
102
- "secureServing " ,
102
+ "secure-serving " ,
103
103
runserver .DefaultSecureServing ,
104
104
"Enables secure serving. Defaults to true." )
105
105
healthChecking = flag .Bool (
106
- "healthChecking " ,
106
+ "health-checking " ,
107
107
runserver .DefaultHealthChecking ,
108
108
"Enables health checking" )
109
109
certPath = flag .String (
110
- "certPath " ,
110
+ "cert-path " ,
111
111
runserver .DefaultCertPath ,
112
112
"The path to the certificate for secure serving. The certificate and private key files " +
113
113
"are assumed to be named tls.crt and tls.key, respectively. If not set, and secureServing is enabled, " +
114
114
"then a self-signed certificate is used." )
115
115
// metric flags
116
116
totalQueuedRequestsMetric = flag .String (
117
- "totalQueuedRequestsMetric " ,
117
+ "total-queued-requests-metric " ,
118
118
runserver .DefaultTotalQueuedRequestsMetric ,
119
119
"Prometheus metric for the number of queued requests." )
120
120
kvCacheUsagePercentageMetric = flag .String (
121
- "kvCacheUsagePercentageMetric " ,
121
+ "kv-cache-usage-percentage-metric " ,
122
122
runserver .DefaultKvCacheUsagePercentageMetric ,
123
123
"Prometheus metric for the fraction of KV-cache blocks currently in use (from 0 to 1)." )
124
124
// LoRA metrics
125
125
loraInfoMetric = flag .String (
126
- "loraInfoMetric " ,
126
+ "lora-info-metric " ,
127
127
runserver .DefaultLoraInfoMetric ,
128
128
"Prometheus metric for the LoRA info metrics (must be in vLLM label format)." )
129
129
// configuration flags
130
130
configFile = flag .String (
131
- "configFile " ,
131
+ "config-file " ,
132
132
runserver .DefaultConfigFile ,
133
133
"The path to the configuration file" )
134
134
configText = flag .String (
135
- "configText " ,
135
+ "config-text " ,
136
136
runserver .DefaultConfigText ,
137
137
"The configuration specified as text, in lieu of a file" )
138
138
139
- modelServerMetricsPort = flag .Int ("modelServerMetricsPort " , 0 , "Port to scrape metrics from pods. " +
139
+ modelServerMetricsPort = flag .Int ("model-server-metrics-port " , 0 , "Port to scrape metrics from pods. " +
140
140
"Default value will be set to InferencePool.Spec.TargetPortNumber if not set." )
141
141
modelServerMetricsPath = flag .String ("modelServerMetricsPath" , "/metrics" , "Path to scrape metrics from pods" )
142
142
modelServerMetricsScheme = flag .String ("modelServerMetricsScheme" , "http" , "Scheme to scrape metrics from pods" )
@@ -181,8 +181,8 @@ func bindEnvToFlags() {
181
181
"POOL_NAME" : "poolName" ,
182
182
"POOL_NAMESPACE" : "poolNamespace" ,
183
183
// durations & bools work too; flag.Set expects the *string* form
184
- "REFRESH_METRICS_INTERVAL" : "refreshMetricsInterval " ,
185
- "SECURE_SERVING" : "secureServing " ,
184
+ "REFRESH_METRICS_INTERVAL" : "refresh-metrics-interval " ,
185
+ "SECURE_SERVING" : "secure-serving " ,
186
186
} {
187
187
if v := os .Getenv (env ); v != "" {
188
188
// ignore error; Parse() will catch invalid values later
0 commit comments