1
- {{ include "gateway-api-inference-extension.validations.inferencepool.common" $ }}
1
+ {{ if eq .Values.inferencePool.apiVersion "inference.networking.x-k8s.io/v1alpha2" }}
2
2
apiVersion : {{ .Values.inferencePool.apiVersion }}
3
3
kind : InferencePool
4
4
metadata :
@@ -7,17 +7,31 @@ metadata:
7
7
labels :
8
8
{{- include "gateway-api-inference-extension.labels" . | nindent 4 }}
9
9
spec :
10
- {{ if eq .Values.inferencePool.apiVersion "inference.networking.x-k8s.io/v1alpha2"}}
11
- targetPortNumber :
12
- {{- range .Values.inferencePool.targetPorts }}
13
- - number : {{ .number }}
10
+ targetPortNumber : {{ .Values.inferencePool.targetPortNumber | default 8000 }}
11
+ selector :
12
+ {{- if .Values.inferencePool.modelServers.matchLabels }}
13
+ {{- range $key, $value := .Values.inferencePool.modelServers.matchLabels }}
14
+ {{ $key }}: {{ quote $value }}
14
15
{{- end }}
15
- {{ else }}
16
+ {{- end }}
17
+ extensionRef :
18
+ name : {{ include "gateway-api-inference-extension.name" . }}
19
+ portNumber : {{ .Values.inferenceExtension.extProcPort | default 9002 }}
20
+ failureMode : {{ .Values.inferenceExtension.failureMode | default "FailClose" }}
21
+ {{ else }}
22
+ {{ include "gateway-api-inference-extension.validations.inferencepool.common" $ }}
23
+ apiVersion : "inference.networking.k8s.io/v1"
24
+ kind : InferencePool
25
+ metadata :
26
+ name : {{ .Release.Name }}
27
+ namespace : {{ .Release.Namespace }}
28
+ labels :
29
+ {{- include "gateway-api-inference-extension.labels" . | nindent 4 }}
30
+ spec :
16
31
targetPorts :
17
32
{{- range .Values.inferencePool.targetPorts }}
18
33
- number : {{ .number }}
19
34
{{- end }}
20
- {{- end}}
21
35
selector :
22
36
matchLabels :
23
37
{{- if .Values.inferencePool.modelServers.matchLabels }}
29
43
name : {{ include "gateway-api-inference-extension.name" . }}
30
44
port :
31
45
number : {{ .Values.inferenceExtension.extProcPort | default 9002 }}
46
+ {{- end }}
32
47
33
48
0 commit comments