File tree Expand file tree Collapse file tree 2 files changed +19
-2
lines changed Expand file tree Collapse file tree 2 files changed +19
-2
lines changed Original file line number Diff line number Diff line change @@ -170,6 +170,14 @@ data:
170
170
max_pending_requests: 40000
171
171
max_requests: 40000
172
172
max_retries: 1024
173
+ health_checks:
174
+ - timeout: 1s
175
+ interval: 5s
176
+ unhealthy_threshold: 3
177
+ healthy_threshold: 1
178
+ grpc_health_check:
179
+ service_name: "inference-extension"
180
+ authority: vllm-llama3-8b-instruct-epp.$E2E_NS:9003
173
181
# This ensures that envoy accepts untrusted certificates. We tried to explicitly
174
182
# set TrustChainVerification to ACCEPT_UNTRUSTED, but that actually didn't work
175
183
# and what worked is setting the common_tls_context to empty.
@@ -193,6 +201,8 @@ data:
193
201
region: ext_proc/e2e/0
194
202
lb_endpoints:
195
203
- endpoint:
204
+ health_check_config:
205
+ port_value: 9003
196
206
address:
197
207
socket_address:
198
208
address: vllm-llama3-8b-instruct-epp.$E2E_NS
Original file line number Diff line number Diff line change @@ -20,10 +20,15 @@ spec:
20
20
selector :
21
21
app : vllm-llama3-8b-instruct-epp
22
22
ports :
23
- - protocol : TCP
23
+ - name : http2-por
24
+ protocol : TCP
24
25
port : 9002
25
26
targetPort : 9002
26
27
appProtocol : http2
28
+ - name : health-check-port
29
+ protocol : TCP
30
+ port : 9003
31
+ targetPort : 9003
27
32
type : ClusterIP
28
33
---
29
34
apiVersion : apps/v1
62
67
- " 9002"
63
68
- -grpcHealthPort
64
69
- " 9003"
70
+ - -secureServing
71
+ - " false"
65
72
env :
66
73
- name : USE_STREAMING
67
74
value : " true"
@@ -109,7 +116,7 @@ rules:
109
116
- subjectaccessreviews
110
117
verbs :
111
118
- create
112
- ---
119
+ ---
113
120
kind : ClusterRoleBinding
114
121
apiVersion : rbac.authorization.k8s.io/v1
115
122
metadata :
You can’t perform that action at this time.
0 commit comments