-
Notifications
You must be signed in to change notification settings - Fork 440
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Fix labels for Service Monitors #2878
Changes from 23 commits
1625097
78f1315
9ccd87f
5f55a01
e3174b6
edfb463
82fefa2
28baa37
7dcaadb
2e143ee
cc96402
978dfa0
f5b29d8
fff9870
6432371
2469162
0b2a439
3712c43
743247b
552cb3e
720c6b1
d1889d0
cc84a10
e5b251c
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,20 @@ | ||
# One of 'breaking', 'deprecation', 'new_component', 'enhancement', 'bug_fix' | ||
change_type: bug_fix | ||
|
||
# The name of the component, or a single word describing the area of concern, (e.g. collector, target allocator, auto-instrumentation, opamp, github action) | ||
component: collector | ||
|
||
# A brief description of the change. Surround your text with quotes ("") if it needs to start with a backtick (`). | ||
note: Create a Service Monitor for the monitoring service and another one for the collector service when the Prometheus exporter is used. | ||
|
||
# One or more tracking issues related to the change | ||
issues: [2877] | ||
|
||
# (Optional) One or more lines of additional information to render under the primary note. | ||
# These lines will be padded with 2 spaces and then inserted directly into the document. | ||
# Use pipe (|) for multiline entries. | ||
subtext: | | ||
Create a Service Monitor for the collector Service when Prometheus exporter is used. A different Service Monitor is created for the monitoring service. | ||
This helps excluding the headless service (duplicating the metrics collection) and splits responsibilities between the two Service Monitors. | ||
Now, the operator.opentelemetry.io/collector-service-type label is used to differentiate the services. | ||
operator.opentelemetry.io/collector-monitoring-service and operator.opentelemetry.io/collector-headless-service are deprecated now. |
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -29,13 +29,26 @@ import ( | |
"github.com/open-telemetry/opentelemetry-operator/internal/naming" | ||
) | ||
|
||
// headless and monitoring labels are to differentiate the headless/monitoring services from the clusterIP service. | ||
// headless and monitoring labels are to differentiate the base/headless/monitoring services from the clusterIP service. | ||
const ( | ||
headlessLabel = "operator.opentelemetry.io/collector-headless-service" | ||
iblancasa marked this conversation as resolved.
Show resolved
Hide resolved
|
||
monitoringLabel = "operator.opentelemetry.io/collector-monitoring-service" | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. @iblancasa i think we should keep these around for now, mark them as deprecated and remove them in two+ versions rather than deleting them outright which would constitute a breaking change. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Done |
||
valueExists = "Exists" | ||
headlessLabel = "operator.opentelemetry.io/collector-headless-service" | ||
monitoringLabel = "operator.opentelemetry.io/collector-monitoring-service" | ||
serviceTypeLabel = "operator.opentelemetry.io/collector-service-type" | ||
valueExists = "Exists" | ||
) | ||
|
||
type ServiceType int | ||
|
||
const ( | ||
BaseServiceType ServiceType = iota | ||
HeadlessServiceType | ||
MonitoringServiceType | ||
) | ||
|
||
func (s ServiceType) String() string { | ||
return [...]string{"base", "headless", "monitoring"}[s] | ||
} | ||
|
||
func HeadlessService(params manifests.Params) (*corev1.Service, error) { | ||
h, err := Service(params) | ||
if h == nil || err != nil { | ||
|
@@ -44,6 +57,7 @@ func HeadlessService(params manifests.Params) (*corev1.Service, error) { | |
|
||
h.Name = naming.HeadlessService(params.OtelCol.Name) | ||
h.Labels[headlessLabel] = valueExists | ||
h.Labels[serviceTypeLabel] = HeadlessServiceType.String() | ||
|
||
// copy to avoid modifying params.OtelCol.Annotations | ||
annotations := map[string]string{ | ||
|
@@ -63,6 +77,7 @@ func MonitoringService(params manifests.Params) (*corev1.Service, error) { | |
name := naming.MonitoringService(params.OtelCol.Name) | ||
labels := manifestutils.Labels(params.OtelCol.ObjectMeta, name, params.OtelCol.Spec.Image, ComponentOpenTelemetryCollector, []string{}) | ||
labels[monitoringLabel] = valueExists | ||
labels[serviceTypeLabel] = MonitoringServiceType.String() | ||
|
||
metricsPort, err := params.OtelCol.Spec.Config.Service.MetricsPort() | ||
if err != nil { | ||
|
@@ -90,6 +105,7 @@ func MonitoringService(params manifests.Params) (*corev1.Service, error) { | |
func Service(params manifests.Params) (*corev1.Service, error) { | ||
name := naming.Service(params.OtelCol.Name) | ||
labels := manifestutils.Labels(params.OtelCol.ObjectMeta, name, params.OtelCol.Spec.Image, ComponentOpenTelemetryCollector, []string{}) | ||
labels[serviceTypeLabel] = BaseServiceType.String() | ||
|
||
out, err := params.OtelCol.Spec.Config.Yaml() | ||
if err != nil { | ||
|
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -15,6 +15,7 @@ | |
package collector | ||
|
||
import ( | ||
"fmt" | ||
"strings" | ||
|
||
"github.com/go-logr/logr" | ||
|
@@ -29,30 +30,40 @@ import ( | |
"github.com/open-telemetry/opentelemetry-operator/internal/naming" | ||
) | ||
|
||
// ServiceMonitor returns the service monitor for the given instance. | ||
// ServiceMonitor returns the service monitor for the collector. | ||
func ServiceMonitor(params manifests.Params) (*monitoringv1.ServiceMonitor, error) { | ||
if !params.OtelCol.Spec.Observability.Metrics.EnableMetrics { | ||
params.Log.V(2).Info("Metrics disabled for this OTEL Collector", | ||
"params.OtelCol.name", params.OtelCol.Name, | ||
"params.OtelCol.namespace", params.OtelCol.Namespace, | ||
) | ||
return nil, nil | ||
} else if params.Config.PrometheusCRAvailability() == prometheus.NotAvailable { | ||
params.Log.V(1).Info("Cannot enable ServiceMonitor when prometheus CRDs are unavailable", | ||
"params.OtelCol.name", params.OtelCol.Name, | ||
"params.OtelCol.namespace", params.OtelCol.Namespace, | ||
) | ||
return nil, nil | ||
name := naming.ServiceMonitor(params.OtelCol.Name) | ||
endpoints := endpointsFromConfig(params.Log, params.OtelCol) | ||
if len(endpoints) > 0 { | ||
return createServiceMonitor(name, params, BaseServiceType, endpoints) | ||
} | ||
var sm monitoringv1.ServiceMonitor | ||
return nil, nil | ||
} | ||
|
||
// ServiceMonitor returns the service monitor for the monitoring service of the collector. | ||
func ServiceMonitorMonitoring(params manifests.Params) (*monitoringv1.ServiceMonitor, error) { | ||
name := naming.ServiceMonitor(fmt.Sprintf("%s-monitoring", params.OtelCol.Name)) | ||
endpoints := []monitoringv1.Endpoint{ | ||
{ | ||
Port: "monitoring", | ||
}, | ||
} | ||
return createServiceMonitor(name, params, MonitoringServiceType, endpoints) | ||
} | ||
|
||
if params.OtelCol.Spec.Mode == v1beta1.ModeSidecar { | ||
// createServiceMonitor creates a Service Monitor using the provided name, the params from the instance, a label to identify the service | ||
// to target (like the monitoring or the collector services) and the endpoints to scrape. | ||
func createServiceMonitor(name string, params manifests.Params, serviceType ServiceType, endpoints []monitoringv1.Endpoint) (*monitoringv1.ServiceMonitor, error) { | ||
if !shouldCreateServiceMonitor(params) { | ||
return nil, nil | ||
} | ||
name := naming.ServiceMonitor(params.OtelCol.Name) | ||
|
||
var sm monitoringv1.ServiceMonitor | ||
|
||
labels := manifestutils.Labels(params.OtelCol.ObjectMeta, name, params.OtelCol.Spec.Image, ComponentOpenTelemetryCollector, []string{}) | ||
selectorLabels := manifestutils.SelectorLabels(params.OtelCol.ObjectMeta, ComponentOpenTelemetryCollector) | ||
selectorLabels[monitoringLabel] = valueExists | ||
// This label is the one which differentiates the services | ||
selectorLabels[serviceTypeLabel] = serviceType.String() | ||
|
||
sm = monitoringv1.ServiceMonitor{ | ||
ObjectMeta: metav1.ObjectMeta{ | ||
|
@@ -61,11 +72,7 @@ func ServiceMonitor(params manifests.Params) (*monitoringv1.ServiceMonitor, erro | |
Labels: labels, | ||
}, | ||
Spec: monitoringv1.ServiceMonitorSpec{ | ||
Endpoints: append([]monitoringv1.Endpoint{ | ||
{ | ||
Port: "monitoring", | ||
}, | ||
}, endpointsFromConfig(params.Log, params.OtelCol)...), | ||
Endpoints: endpoints, | ||
NamespaceSelector: monitoringv1.NamespaceSelector{ | ||
MatchNames: []string{params.OtelCol.Namespace}, | ||
}, | ||
|
@@ -78,6 +85,25 @@ func ServiceMonitor(params manifests.Params) (*monitoringv1.ServiceMonitor, erro | |
return &sm, nil | ||
} | ||
|
||
func shouldCreateServiceMonitor(params manifests.Params) bool { | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. personal opinion but this statement can be written in a more readable way See the previous comment |
||
l := params.Log.WithValues( | ||
"params.OtelCol.name", params.OtelCol.Name, | ||
"params.OtelCol.namespace", params.OtelCol.Namespace, | ||
) | ||
|
||
if !params.OtelCol.Spec.Observability.Metrics.EnableMetrics { | ||
l.V(2).Info("Metrics disabled for this OTEL Collector. ServiceMonitor will not ve created") | ||
return false | ||
} else if params.Config.PrometheusCRAvailability() == prometheus.NotAvailable { | ||
l.V(2).Info("Cannot enable ServiceMonitor when prometheus CRDs are unavailable") | ||
return false | ||
} else if params.OtelCol.Spec.Mode == v1beta1.ModeSidecar { | ||
l.V(2).Info("Using sidecar mode. ServiceMonitor will not be created") | ||
return false | ||
} | ||
return true | ||
} | ||
|
||
func endpointsFromConfig(logger logr.Logger, otelcol v1beta1.OpenTelemetryCollector) []monitoringv1.Endpoint { | ||
// TODO: https://github.com/open-telemetry/opentelemetry-operator/issues/2603 | ||
cfgStr, err := otelcol.Spec.Config.Yaml() | ||
|
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
personal opinion but this statement can be written in a more readable way
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
and I would move the logger creation close to returning
false
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Why a double condition + no log message is easier to read than the current approach?
The current is easy to follow and understand why the method returns
false
.There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
A single log message with all parameters makes it clear to understand the overall state.
The function has 2 states (
true
andfalse
), aligning the condition to it makes it easier to understand