Skip to content

Commit 33217a6

Browse files
committed
feat: add health check for epp cluster
Signed-off-by: zhengkezhou1 <madzhou1@gmail.com>
1 parent 3368422 commit 33217a6

File tree

2 files changed

+19
-2
lines changed

2 files changed

+19
-2
lines changed

test/testdata/envoy.yaml

Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -170,6 +170,14 @@ data:
170170
max_pending_requests: 40000
171171
max_requests: 40000
172172
max_retries: 1024
173+
health_checks:
174+
- timeout: 1s
175+
interval: 5s
176+
unhealthy_threshold: 3
177+
healthy_threshold: 1
178+
grpc_health_check:
179+
service_name: "inference-extension"
180+
authority: vllm-llama3-8b-instruct-epp.$E2E_NS:9003
173181
# This ensures that envoy accepts untrusted certificates. We tried to explicitly
174182
# set TrustChainVerification to ACCEPT_UNTRUSTED, but that actually didn't work
175183
# and what worked is setting the common_tls_context to empty.
@@ -193,6 +201,8 @@ data:
193201
region: ext_proc/e2e/0
194202
lb_endpoints:
195203
- endpoint:
204+
health_check_config:
205+
port_value: 9003
196206
address:
197207
socket_address:
198208
address: vllm-llama3-8b-instruct-epp.$E2E_NS

test/testdata/inferencepool-e2e.yaml

Lines changed: 9 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -20,10 +20,15 @@ spec:
2020
selector:
2121
app: vllm-llama3-8b-instruct-epp
2222
ports:
23-
- protocol: TCP
23+
- name: http2-por
24+
protocol: TCP
2425
port: 9002
2526
targetPort: 9002
2627
appProtocol: http2
28+
- name: health-check-port
29+
protocol: TCP
30+
port: 9003
31+
targetPort: 9003
2732
type: ClusterIP
2833
---
2934
apiVersion: apps/v1
@@ -62,6 +67,8 @@ spec:
6267
- "9002"
6368
- -grpcHealthPort
6469
- "9003"
70+
- -secureServing
71+
- "false"
6572
env:
6673
- name: USE_STREAMING
6774
value: "true"
@@ -109,7 +116,7 @@ rules:
109116
- subjectaccessreviews
110117
verbs:
111118
- create
112-
---
119+
---
113120
kind: ClusterRoleBinding
114121
apiVersion: rbac.authorization.k8s.io/v1
115122
metadata:

0 commit comments

Comments
 (0)