Skip to content

Commit 8fe1262

Browse files
committed
multi-provider monitoring charts (prometheus, gke)
Signed-off-by: sallyom <somalley@redhat.com>
1 parent bba0547 commit 8fe1262

File tree

5 files changed

+41
-34
lines changed

5 files changed

+41
-34
lines changed

config/charts/inferencepool/templates/epp-sa-token-secret.yaml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,9 +1,9 @@
1-
{{- if .Values.inferenceExtension.monitoring.servicemonitor.enabled }}
1+
{{- if or .Values.inferenceExtension.monitoring.prometheus.enabled .Values.inferenceExtension.monitoring.gke.enabled }}
22
apiVersion: v1
33
kind: Secret
44
metadata:
5-
name: {{ include "gateway-api-inference-extension.name" . }}-token
6-
namespace: {{ .Release.Namespace }}
5+
name: {{ .Values.inferenceExtension.monitoring.secret.name }}
6+
namespace: {{ .Values.inferenceExtension.monitoring.secret.namespace }}
77
labels:
88
{{- include "gateway-api-inference-extension.labels" . | nindent 4 }}
99
annotations:
Lines changed: 12 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
{{- if .Values.inferenceExtension.monitoring.servicemonitor.enabled }}
1+
{{- if .Values.inferenceExtension.monitoring.prometheus.enabled }}
22
apiVersion: monitoring.coreos.com/v1
33
kind: ServiceMonitor
44
metadata:
@@ -8,41 +8,41 @@ metadata:
88
{{- include "gateway-api-inference-extension.labels" . | nindent 4 }}
99
spec:
1010
endpoints:
11-
- interval: {{ .Values.inferenceExtension.monitoring.servicemonitor.interval }}
12-
port: {{ .Values.inferenceExtension.monitoring.servicemonitor.port }}
13-
path: {{ .Values.inferenceExtension.monitoring.servicemonitor.path }}
11+
- interval: {{ .Values.inferenceExtension.monitoring.interval }}
12+
port: {{ .Values.inferenceExtension.monitoring.port }}
13+
path: {{ .Values.inferenceExtension.monitoring.path }}
1414
authorization:
1515
credentials:
1616
key: token
17-
name: {{ include "gateway-api-inference-extension.name" . }}-token
18-
{{- with .Values.inferenceExtension.monitoring.servicemonitor.scrapeTimeout }}
17+
name: {{ .Values.inferenceExtension.monitoring.secret.name }}
18+
{{- with .Values.inferenceExtension.monitoring.prometheus.scrapeTimeout }}
1919
scrapeTimeout: {{ . }}
2020
{{- end }}
21-
{{- with .Values.inferenceExtension.monitoring.servicemonitor.relabelings }}
21+
{{- with .Values.inferenceExtension.monitoring.prometheus.relabelings }}
2222
relabelings:
2323
{{- toYaml . | nindent 6 }}
2424
{{- end }}
25-
{{- with .Values.inferenceExtension.monitoring.servicemonitor.metricRelabelings }}
25+
{{- with .Values.inferenceExtension.monitoring.prometheus.metricRelabelings }}
2626
metricRelabelings:
2727
{{- toYaml . | nindent 6 }}
2828
{{- end }}
2929
jobLabel: {{ include "gateway-api-inference-extension.name" . }}
3030
namespaceSelector:
31-
{{- if .Values.inferenceExtension.monitoring.servicemonitor.namespaceSelector.any }}
31+
{{- if .Values.inferenceExtension.monitoring.prometheus.namespaceSelector.any }}
3232
any: true
3333
{{- else }}
3434
matchNames:
3535
- {{ .Release.Namespace }}
36-
{{- if .Values.inferenceExtension.monitoring.servicemonitor.namespaceSelector.matchNames }}
37-
{{- range .Values.inferenceExtension.monitoring.servicemonitor.namespaceSelector.matchNames }}
36+
{{- if .Values.inferenceExtension.monitoring.prometheus.namespaceSelector.matchNames }}
37+
{{- range .Values.inferenceExtension.monitoring.prometheus.namespaceSelector.matchNames }}
3838
- {{ . }}
3939
{{- end }}
4040
{{- end }}
4141
{{- end }}
4242
selector:
4343
matchLabels:
4444
{{- include "gateway-api-inference-extension.labels" . | nindent 6 }}
45-
{{- with .Values.inferenceExtension.monitoring.servicemonitor.selector.matchLabels }}
45+
{{- with .Values.inferenceExtension.monitoring.prometheus.selector.matchLabels }}
4646
{{- toYaml . | nindent 6 }}
4747
{{- end }}
4848
{{- end }}

config/charts/inferencepool/templates/gke.yaml

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
{{- if eq .Values.provider.name "gke" }}
1+
{{- if and (eq .Values.provider.name "gke") .Values.inferenceExtension.monitoring.gke.enabled }}
22
---
33
kind: HealthCheckPolicy
44
apiVersion: networking.gke.io/v1
@@ -44,17 +44,17 @@ metadata:
4444
{{- include "gateway-api-inference-extension.labels" . | nindent 4 }}
4545
spec:
4646
endpoints:
47-
- port: metrics
48-
scheme: http
49-
interval: 5s
50-
path: /metrics
47+
- port: {{ .Values.inferenceExtension.monitoring.port }}
48+
scheme: {{ .Values.inferenceExtension.monitoring.scheme }}
49+
interval: {{ .Values.inferenceExtension.monitoring.interval }}
50+
path: {{ .Values.inferenceExtension.monitoring.path }}
5151
authorization:
5252
type: Bearer
5353
credentials:
5454
secret:
55-
name: {{ .Values.gke.monitoringSecret.name }}
55+
name: {{ .Values.inferenceExtension.monitoring.secret.name }}
5656
key: token
57-
namespace: {{ .Values.gke.monitoringSecret.namespace }}
57+
namespace: {{ .Values.inferenceExtension.monitoring.secret.namespace }}
5858
selector:
5959
matchLabels:
6060
{{- include "gateway-api-inference-extension.selectorLabels" . | nindent 8 }}

config/charts/inferencepool/templates/rbac.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -17,9 +17,9 @@ rules:
1717
- subjectaccessreviews
1818
verbs:
1919
- create
20-
{{- if .Values.inferenceExtension.monitoring.servicemonitor.enabled }}
20+
{{- if or .Values.inferenceExtension.monitoring.prometheus.enabled .Values.inferenceExtension.monitoring.gke.enabled }}
2121
- nonResourceURLs:
22-
- {{ .Values.inferenceExtension.monitoring.servicemonitor.path }}
22+
- {{ .Values.inferenceExtension.monitoring.path }}
2323
verbs:
2424
- get
2525
{{- end }}

config/charts/inferencepool/values.yaml

Lines changed: 17 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -38,13 +38,20 @@ inferenceExtension:
3838

3939
# Monitoring configuration for EPP
4040
monitoring:
41-
# ServiceMonitor configuration for EPP metrics collection with Prometheus Operator
42-
servicemonitor:
41+
# Common monitoring parameters
42+
path: "/metrics"
43+
interval: "10s"
44+
scheme: "http"
45+
# port -- Port name to scrape metrics from (must match service port name)
46+
port: "http-metrics"
47+
# secret -- Service account token secret for authentication
48+
secret:
49+
name: inference-gateway-sa-metrics-reader-secret
50+
namespace: default
51+
52+
# Prometheus ServiceMonitor configuration for EPP metrics collection with Prometheus Operator
53+
prometheus:
4354
enabled: false
44-
# port -- Port name to scrape metrics from (must match service port name)
45-
port: "http-metrics"
46-
path: "/metrics"
47-
interval: "10s"
4855
# scrapeTimeout: "10s"
4956
# relabelings -- RelabelConfigs to apply to samples before scraping
5057
relabelings: []
@@ -57,6 +64,10 @@ inferenceExtension:
5764
# matchLabels in template match the EPP service by default
5865
matchLabels: {}
5966

67+
# GKE monitoring configuration (ClusterPodMonitoring)
68+
gke:
69+
enabled: false
70+
6071
inferencePool:
6172
targetPorts:
6273
- number: 8000
@@ -68,7 +79,3 @@ inferencePool:
6879
provider:
6980
name: none
7081

71-
gke:
72-
monitoringSecret:
73-
name: inference-gateway-sa-metrics-reader-secret
74-
namespace: default

0 commit comments

Comments
 (0)