Skip to content
Merged
Show file tree
Hide file tree
Changes from 2 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
9 changes: 8 additions & 1 deletion config/charts/inferencepool/templates/inferencepool.yaml
Original file line number Diff line number Diff line change
@@ -1,16 +1,23 @@
{{- /*
InferencePool manifest header.
The first action runs the chart's common validation template. The resource's
apiVersion is taken from .Values.inferencePool.apiVersion, so it is declared
exactly once here (a second, hard-coded apiVersion key would be a duplicate
mapping key).
*/ -}}
{{ include "gateway-api-inference-extension.validations.inferencepool.common" $ }}
apiVersion: {{ .Values.inferencePool.apiVersion }}
kind: InferencePool
metadata:
  name: {{ .Release.Name }}
  namespace: {{ .Release.Namespace }}
  labels:
    {{- include "gateway-api-inference-extension.labels" . | nindent 4 }}
spec:
{{- /*
Target port(s) of the pool, shaped per API version:
  - inference.networking.x-k8s.io/v1alpha2 takes one integer in
    `targetPortNumber`, so only the first entry of
    .Values.inferencePool.targetPorts is used (rendering fails if the list
    is empty, because `index` errors on an out-of-range position).
  - any other apiVersion gets the `targetPorts` list, one `number` per entry.
*/ -}}
{{- if eq .Values.inferencePool.apiVersion "inference.networking.x-k8s.io/v1alpha2" }}
  targetPortNumber: {{ (index .Values.inferencePool.targetPorts 0).number }}
{{- else }}
  targetPorts:
  {{- range .Values.inferencePool.targetPorts }}
    - number: {{ .number }}
  {{- end }}
{{- end }}
selector:
matchLabels:
{{- if .Values.inferencePool.modelServers.matchLabels }}
Expand Down
1 change: 1 addition & 0 deletions config/charts/inferencepool/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -44,6 +44,7 @@ inferencePool:
targetPorts:
- number: 8000
modelServerType: vllm # vllm, triton-tensorrt-llm
apiVersion: inference.networking.k8s.io/v1  # inference.networking.k8s.io/v1 (renders targetPorts) or inference.networking.x-k8s.io/v1alpha2 (renders targetPortNumber)
# modelServers: # REQUIRED
# matchLabels:
# app: vllm-llama3-8b-instruct
Expand Down