We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent b9891d2 commit a655bdaCopy full SHA for a655bda
config/charts/inferencepool/templates/inferencepool.yaml
@@ -1,5 +1,5 @@
1
{{ include "gateway-api-inference-extension.validations.inferencepool.common" $ }}
2
-apiVersion: inference.networking.k8s.io/v1
+apiVersion: {{ .Values.inferencePool.apiVersion }}
3
kind: InferencePool
4
metadata:
5
name: {{ .Release.Name }}
config/charts/inferencepool/values.yaml
@@ -44,6 +44,7 @@ inferencePool:
44
targetPorts:
45
- number: 8000
46
modelServerType: vllm # vllm, triton-tensorrt-llm
47
+ apiVersion: inference.networking.k8s.io/v1
48
# modelServers: # REQUIRED
49
# matchLabels:
50
# app: vllm-llama3-8b-instruct
0 commit comments