From fee17af3ae57a3d6fdab0daaaafe9921dddec8e7 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Miko=C5=82aj=20=C5=9Awi=C4=85tek?= Date: Mon, 18 Sep 2023 17:22:04 +0200 Subject: [PATCH] feat(metrics)!: use otel by default --- .changelog/3284.breaking.txt | 1 + deploy/helm/sumologic/Chart.yaml | 2 +- deploy/helm/sumologic/README.md | 6 +- deploy/helm/sumologic/values.yaml | 9 +-- docs/v4-migration-doc.md | 44 ++++++++++++++- tests/helm/prometheus_test.go | 2 + .../metrics_collector_otc/basic.input.yaml | 6 -- .../metrics_collector_otc/custom.input.yaml | 2 - tests/helm/utils.go | 6 ++ .../helm_ot_default_namespaceoverride_test.go | 13 +++-- tests/integration/helm_ot_default_test.go | 6 +- tests/integration/helm_ot_metrics_test.go | 55 ------------------- ...elm_otc_fips_metadata_installation_test.go | 8 ++- tests/integration/helm_otlp_test.go | 15 +++-- .../helm_prometheus_metrics_test.go | 35 ++++++++++++ tests/integration/internal/constants.go | 3 +- tests/integration/values/values_common.yaml | 8 +++ .../values/values_helm_default_ot.yaml | 2 - ...ues_helm_default_ot_namespaceoverride.yaml | 12 ++++ .../values/values_helm_ot_metrics.yaml | 31 ----------- .../values_helm_prometheus_metrics.yaml | 18 ++++++ 21 files changed, 162 insertions(+), 122 deletions(-) create mode 100644 .changelog/3284.breaking.txt delete mode 100644 tests/integration/helm_ot_metrics_test.go create mode 100644 tests/integration/helm_prometheus_metrics_test.go delete mode 100644 tests/integration/values/values_helm_ot_metrics.yaml create mode 100644 tests/integration/values/values_helm_prometheus_metrics.yaml diff --git a/.changelog/3284.breaking.txt b/.changelog/3284.breaking.txt new file mode 100644 index 0000000000..2546cce43e --- /dev/null +++ b/.changelog/3284.breaking.txt @@ -0,0 +1 @@ +feat(metrics)!: use otel by default \ No newline at end of file diff --git a/deploy/helm/sumologic/Chart.yaml b/deploy/helm/sumologic/Chart.yaml index e53d5c7418..c23a010783 100644 --- a/deploy/helm/sumologic/Chart.yaml +++ b/deploy/helm/sumologic/Chart.yaml @@ -35,4 +35,4 @@ dependencies: - name: opentelemetry-operator version: 0.35.0 repository: https://open-telemetry.github.io/opentelemetry-helm-charts - condition: opentelemetry-operator.enabled + condition: opentelemetry-operator.enabled,sumologic.metrics.collector.otelcol.enabled diff --git a/deploy/helm/sumologic/README.md b/deploy/helm/sumologic/README.md index 53c7753d87..3014983940 100644 --- a/deploy/helm/sumologic/README.md +++ b/deploy/helm/sumologic/README.md @@ -87,7 +87,7 @@ The following table lists the configurable parameters of the Sumo Logic chart an | `sumologic.logs.sourceType` | The type of the Sumo Logic source being used for logs ingestion. Can be `http` for [HTTP Source](https://help.sumologic.com/docs/send-data/hosted-collectors/http-source/logs-metrics/) or `otlp` for [OTLP/HTTP Source](https://help.sumologic.com/docs/send-data/hosted-collectors/http-source/otlp/). | `http` | | `sumologic.metrics.enabled` | Set the enabled flag to false for disabling metrics ingestion altogether. | `true` | | `sumologic.metrics.otelcol.extraProcessors` | Extra processors configuration for metrics pipeline. See [/docs/collecting-application-metrics.md#metrics-modifications](/docs/collecting-application-metrics.md#metrics-modifications) for more information. | `[]` | -| `sumologic.metrics.remoteWriteProxy.enabled` | Enable a load balancing proxy for Prometheus remote writes. [See docs for more information.](/docs/prometheus.md#using-a-load-balancing-proxy-for-prometheus-remote-write) | `true` | +| `sumologic.metrics.remoteWriteProxy.enabled` | Enable a load balancing proxy for Prometheus remote writes. [See docs for more information.](/docs/prometheus.md#using-a-load-balancing-proxy-for-prometheus-remote-write) | `false` | | `sumologic.metrics.remoteWriteProxy.config.clientBodyBufferSize` | See the [nginx documentation](http://nginx.org/en/docs/http/ngx_http_core_module.html#client_body_buffer_size). Increase if you've also increased samples per send in Prometheus remote write. | `64k` | | `sumologic.metrics.remoteWriteProxy.config.workerCountAutotune` | This feature autodetects how much CPU is assigned to the nginx instance and setsthe right amount of workers based on that. Disable to use the default of 8 workers. | `true` | | `sumologic.metrics.remoteWriteProxy.config.enableAccessLogs` | Enable nginx access logs. | `false` | @@ -182,6 +182,7 @@ The following table lists the configurable parameters of the Sumo Logic chart an | `kube-prometheus-stack.alertmanager.enabled` | Deploy alertmanager. | `false` | | `kube-prometheus-stack.grafana.enabled` | If true, deploy the grafana sub-chart. | `false` | | `kube-prometheus-stack.grafana.defaultDashboardsEnabled` | Deploy default dashboards. These are loaded using the sidecar. | `false` | +| `kube-prometheus-stack.prometheusOperator.enabled` | Enable prometheus-operator | `false` | | `kube-prometheus-stack.prometheusOperator.podLabels` | Additional labels for prometheus operator pods. | `{}` | | `kube-prometheus-stack.prometheusOperator.podAnnotations` | Additional annotations for prometheus operator pods. | `{}` | | `kube-prometheus-stack.prometheusOperator.resources` | Resource limits for prometheus operator. Uses sub-chart defaults. | `{"limits": {"cpu": "200m", "memory": "200Mi"}, "requests": {"cpu": "100m", "memory": "100Mi"}}` | @@ -192,6 +193,7 @@ The following table lists the configurable parameters of the Sumo Logic chart an | `kube-prometheus-stack.kube-state-metrics.resources` | Resource limits for kube state metrics. Uses sub-chart defaults. | `{"limits": {"cpu": "100m", "memory": "64Mi"}, "requests": {"cpu": "10m", "memory": "32Mi"}}` | | `kube-prometheus-stack.kube-state-metrics.customLabels` | Custom labels to apply to service, deployment and pods. Uses sub-chart defaults. | `{}` | | `kube-prometheus-stack.kube-state-metrics.podAnnotations` | Additional annotations for pods in the DaemonSet. Uses sub-chart defaults. | `{}` | +| `kube-prometheus-stack.prometheus.enabled` | Enable Prometheus | `false` | | `kube-prometheus-stack.prometheus.additionalServiceMonitors` | List of ServiceMonitor objects to create. | See [values.yaml] | | `kube-prometheus-stack.prometheus.prometheusSpec.resources` | Resource limits for prometheus. Uses sub-chart defaults. | `{"limits": {"cpu": "2000m", "memory": "8Gi"}, "requests": {"cpu": "500m", "memory": "1Gi"}}` | | `kube-prometheus-stack.prometheus.prometheusSpec.containers` | Containers allows injecting additional containers. This is meant to allow adding an authentication proxy to a Prometheus pod. | See [values.yaml] | @@ -254,7 +256,7 @@ The following table lists the configurable parameters of the Sumo Logic chart an | `telegraf-operator.classes.default` | Name of the default output configuration. | `sumologic-prometheus` | | `telegraf-operator.image.sidecarImage` | Telegraf Operator sidecar image. | `public.ecr.aws/sumologic/telegraf:1.21.2` | | `telegraf-operator.imagePullSecrets` | Pull secrets for Telegraf Operator images. For more information on using Kubernetes secrets with container registries please refer to [Creating a Secret with a Docker config at kubernetes.io](https://kubernetes.io/docs/concepts/containers/images/#creating-a-secret-with-a-docker-config). | `[]` | -| `opentelemetry-operator.enabled` | Flag to control deploying OpenTelemetry Operator Helm sub-chart. | `false` | +| `opentelemetry-operator.enabled` | Flag to control deploying OpenTelemetry Operator Helm sub-chart. | `true` | | `opentelemetry-operator.createDefaultInstrumentation` | Flag to control creation of default Instrumentation object | `false` | | `opentelemetry-operator.instrumentation.dotnet.metrics.enabled` | Flag to control metrics export from DotNet instrumentation in `Instrumentation` resource. | `true` | | `opentelemetry-operator.instrumentation.dotnet.traces.enabled` | Flag to control traces export from DotNet instrumentation in `Instrumentation` resource. | `true` | diff --git a/deploy/helm/sumologic/values.yaml b/deploy/helm/sumologic/values.yaml index bad6d7286c..a1c6db792e 100644 --- a/deploy/helm/sumologic/values.yaml +++ b/deploy/helm/sumologic/values.yaml @@ -445,9 +445,8 @@ sumologic: collector: ### Otel metrics collector. Replaces Prometheus. ## To enable, you need opentelemetry-operator enabled as well. - ## Stability: Beta. otelcol: - enabled: false + enabled: true ## Default scrape interval scrapeInterval: 30s @@ -543,7 +542,7 @@ sumologic: ## This is an advanced feature, enable only if you're experiencing performance ## issues with metrics metadata enrichment. remoteWriteProxy: - enabled: true + enabled: false config: ## Increase this if you've increased samples_per_send in Prometheus to prevent nginx ## from spilling proxied request bodies to disk @@ -950,6 +949,7 @@ kube-prometheus-stack: enabled: false defaultDashboardsEnabled: false prometheusOperator: + enabled: false ## Labels to add to the operator pod podLabels: {} ## Annotations to add to the operator pod @@ -1105,6 +1105,7 @@ kube-prometheus-stack: regex: (?:node_load1|node_load5|node_load15|node_cpu_seconds_total|node_disk_io_time_weighted_seconds_total|node_disk_io_time_seconds_total|node_vmstat_pgpgin|node_vmstat_pgpgout|node_memory_MemFree_bytes|node_memory_Cached_bytes|node_memory_Buffers_bytes|node_memory_MemTotal_bytes|node_network_receive_drop_total|node_network_transmit_drop_total|node_network_receive_bytes_total|node_network_transmit_bytes_total|node_filesystem_avail_bytes|node_filesystem_size_bytes) sourceLabels: [__name__] prometheus: + enabled: false additionalServiceMonitors: [] prometheusSpec: ## Prometheus default scrape interval, default from upstream Kube Prometheus Stack Helm chart @@ -2377,7 +2378,7 @@ tailing-sidecar-operator: ## Configure OpenTelemetry Operator - Instrumentation ## ref: https://github.com/open-telemetry/opentelemetry-helm-charts/tree/main/charts/opentelemetry-operator opentelemetry-operator: - enabled: false + enabled: true ## Specific for Sumo Logic chart - Instrumentation resource creation instrumentationJobImage: diff --git a/docs/v4-migration-doc.md b/docs/v4-migration-doc.md index edcfbc96b4..b8b1718a3e 100644 --- a/docs/v4-migration-doc.md +++ b/docs/v4-migration-doc.md @@ -6,9 +6,11 @@ - [Important changes](#important-changes) - [OpenTelemetry Collector](#opentelemetry-collector) - [Drop Prometheus recording rule metrics](#drop-prometheus-recording-rule-metrics) + - [OpenTelemetry Collector for metrics collection](#opentelemetry-collector-for-metrics-collection) - [How to upgrade](#how-to-upgrade) - [Requirements](#requirements) - [Metrics migration](#metrics-migration) + - [Convert Prometheus remote writes to otel metrics filters](#convert-prometheus-remote-writes-to-otel-metrics-filters) - [Removing support for Fluent Bit and Fluentd](#removing-support-for-fluent-bit-and-fluentd) - [Configuration Migration](#configuration-migration) - [Switch to OTLP sources](#switch-to-otlp-sources) @@ -37,6 +39,13 @@ format. Please check [Solution Overview][solution-overview] and see below for de OpenTelemetry can't collect Prometheus recording rule metrics. The new version therefore stops collecting recording rule metrics and updates will be made to the Kubernetes App to remove these metrics. +### OpenTelemetry Collector for metrics collection + +By default, the OpenTelemetry Collector is now used for metrics collection instead of Prometheus. For the majority of use cases, this will +be a transparent change without any need for manual configuration changes. OpenTelemetry Collector will continue to collect the same default +metrics as Prometheus did previously, and will support the same mechanisms for collecting custom application metrics. Any exceptions will be +called out in the migration guide below. + ## How to upgrade ### Requirements @@ -53,7 +62,35 @@ export HELM_RELEASE_NAME=... ### Metrics migration -:construction: +If you don't have metrics collection enabled, skip straight to the [next major section](#switch-to-otlp-sources). + +#### Convert Prometheus remote writes to otel metrics filters + +**When?**: If you have custom remote writes defined in `kube-prometheus-stack.prometheus.additionalServiceMonitors` + +When using Prometheus for metrics collection in v3, we relied on remote writes for filtering forwarded metrics. Otel, which is the default +in v4, does not support remote writes, so we've moved this functionality to Otel processors, or ServiceMonitors if it can be done there. + +There are several scenarios here, depending on the exact use case: + +1. You're collecting different [Kubernetes metrics][kubernetes_metrics_v3] than what the Chart provides by default. You've modified the + existing ServiceMonitor for these metrics, and added a remote write as instructed by the documentation. + +You can safely delete the added remote write definition. No further action is required. + +1. As above, but you're also doing some additional data transformation via relabelling rules in the remote write definition. + +You'll need to either move the relabelling rules into the ServiceMonitor itself, or [add an equivalent filter +processor][otel_metrics_filter] rule to Otel. + +1. You're collecting custom application metrics by adding a [`prometheus.io/scrape` annotation][application_metrics_annotation]. You don't + need to filter these metrics. + +No action is needed. + +1. As above, but you also have a remote write definition to filter these metrics. + +You'll need to delete the remote write definition and [add an equivalent filter processor][otel_metrics_filter] rule to Otel. ### Removing support for Fluent Bit and Fluentd @@ -162,3 +199,8 @@ require additional action. Some Kubernetes objects, for example statefulsets, have a tight (63 characters) limit for their names. Because of that, we truncate the prefix that is attached to the names. In particular, the value under key `fullnameOverride` will be truncated to 22 characters. + +[application_metrics_annotation]: ./collecting-application-metrics.md#application-metrics-are-exposed-one-endpoint-scenario +[kubernetes_metrics_v3]: + https://github.com/SumoLogic/sumologic-kubernetes-collection/blob/release-v3/docs/collecting-kubernetes-metrics.md#collecting-kubernetes-metrics +[otel_metrics_filter]: ./collecting-application-metrics.md#filtering-metrics diff --git a/tests/helm/prometheus_test.go b/tests/helm/prometheus_test.go index 7c5d4ce14a..31f30ecc57 100644 --- a/tests/helm/prometheus_test.go +++ b/tests/helm/prometheus_test.go @@ -24,6 +24,7 @@ func TestServiceMonitors(t *testing.T) { ValuesYaml: ` kube-prometheus-stack: prometheus: + enabled: true additionalServiceMonitors: - name: collection-sumologic-fluentd-logs-test additionalLabels: @@ -55,6 +56,7 @@ kube-prometheus-stack: ValuesYaml: ` kube-prometheus-stack: prometheus: + enabled: true additionalServiceMonitors: - name: collection-sumologic-fluentd-logs-test additionalLabels: diff --git a/tests/helm/testdata/goldenfile/metrics_collector_otc/basic.input.yaml b/tests/helm/testdata/goldenfile/metrics_collector_otc/basic.input.yaml index f9797ab4e4..e69de29bb2 100644 --- a/tests/helm/testdata/goldenfile/metrics_collector_otc/basic.input.yaml +++ b/tests/helm/testdata/goldenfile/metrics_collector_otc/basic.input.yaml @@ -1,6 +0,0 @@ -sumologic: - metrics: - enabled: true - collector: - otelcol: - enabled: true diff --git a/tests/helm/testdata/goldenfile/metrics_collector_otc/custom.input.yaml b/tests/helm/testdata/goldenfile/metrics_collector_otc/custom.input.yaml index 9f55595179..d16eae3a30 100644 --- a/tests/helm/testdata/goldenfile/metrics_collector_otc/custom.input.yaml +++ b/tests/helm/testdata/goldenfile/metrics_collector_otc/custom.input.yaml @@ -1,9 +1,7 @@ sumologic: metrics: - enabled: true collector: otelcol: - enabled: true scrapeInterval: 60s autoscaling: enabled: true diff --git a/tests/helm/utils.go b/tests/helm/utils.go index df81b37bde..2b7baf0ec9 100644 --- a/tests/helm/utils.go +++ b/tests/helm/utils.go @@ -17,6 +17,7 @@ import ( "github.com/gruntwork-io/go-commons/files" "github.com/gruntwork-io/terratest/modules/helm" "github.com/gruntwork-io/terratest/modules/logger" + otoperator "github.com/open-telemetry/opentelemetry-operator/apis/v1alpha1" prometheus "github.com/prometheus-operator/prometheus-operator/pkg/apis/monitoring/v1" "github.com/stretchr/testify/require" "gopkg.in/yaml.v3" @@ -123,6 +124,11 @@ func UnmarshalMultipleK8sObjectsFromYaml(yamlDocs string) (objects []runtime.Obj return objects, err } + err = otoperator.AddToScheme(scheme) + if err != nil { + return objects, err + } + decoder := serializer.NewCodecFactory(scheme).UniversalDeserializer() multidocReader := utilyaml.NewYAMLReader(bufio.NewReader(bytes.NewReader([]byte(yamlDocs)))) diff --git a/tests/integration/helm_ot_default_namespaceoverride_test.go b/tests/integration/helm_ot_default_namespaceoverride_test.go index a4cc210cda..291b98ac4c 100644 --- a/tests/integration/helm_ot_default_namespaceoverride_test.go +++ b/tests/integration/helm_ot_default_namespaceoverride_test.go @@ -17,16 +17,21 @@ type ctxKey string func Test_Helm_Default_OT_NamespaceOverride(t *testing.T) { - expectedMetrics := internal.DefaultExpectedMetrics - // we have tracing enabled, so check tracing-specific metrics - expectedMetrics = append(expectedMetrics, internal.TracingOtelcolMetrics...) + expectedMetrics := []string{} + // defaults without otel metrics collector metrics, but with Prometheus metrics + expectedMetricsGroups := make([][]string, len(internal.DefaultExpectedMetricsGroups)) + copy(expectedMetricsGroups, internal.DefaultExpectedMetricsGroups) + expectedMetricsGroups = append(expectedMetricsGroups, internal.PrometheusMetrics, internal.DefaultOtelcolMetrics, internal.LogsOtelcolMetrics, internal.TracingOtelcolMetrics) + for _, metrics := range expectedMetricsGroups { + expectedMetrics = append(expectedMetrics, metrics...) + } installChecks := []featureCheck{ CheckSumologicSecret(15), CheckOtelcolMetadataLogsInstall, CheckOtelcolMetadataMetricsInstall, CheckOtelcolEventsInstall, - CheckPrometheusInstall, + CheckOtelcolMetricsCollectorInstall, CheckOtelcolLogsCollectorInstall, CheckTracesInstall, } diff --git a/tests/integration/helm_ot_default_test.go b/tests/integration/helm_ot_default_test.go index 79b83b5f60..64428b1765 100644 --- a/tests/integration/helm_ot_default_test.go +++ b/tests/integration/helm_ot_default_test.go @@ -20,16 +20,16 @@ func Test_Helm_Default_OT(t *testing.T) { CheckOtelcolMetadataLogsInstall, CheckOtelcolMetadataMetricsInstall, CheckOtelcolEventsInstall, - CheckPrometheusInstall, + CheckOtelcolMetricsCollectorInstall, CheckOtelcolLogsCollectorInstall, CheckTracesInstall, } featInstall := GetInstallFeature(installChecks) - featMetrics := GetMetricsFeature(expectedMetrics, Prometheus) + featMetrics := GetMetricsFeature(expectedMetrics, Otelcol) - featTelegrafMetrics := GetTelegrafMetricsFeature(internal.DefaultExpectedNginxAnnotatedMetrics, Prometheus, true) + featTelegrafMetrics := GetTelegrafMetricsFeature(internal.DefaultExpectedNginxAnnotatedMetrics, Otelcol, true) featLogs := GetLogsFeature() diff --git a/tests/integration/helm_ot_metrics_test.go b/tests/integration/helm_ot_metrics_test.go deleted file mode 100644 index 5809b210a0..0000000000 --- a/tests/integration/helm_ot_metrics_test.go +++ /dev/null @@ -1,55 +0,0 @@ -//go:build onlylatest -// +build onlylatest - -package integration - -import ( - "testing" - - "github.com/SumoLogic/sumologic-kubernetes-collection/tests/integration/internal" -) - -func Test_Helm_OT_Metrics(t *testing.T) { - expectedMetrics := []string{} - - // don't check recording rule metrics, not supported - expectedMetricsGroups := [][]string{ - internal.KubeStateMetrics, - internal.KubeDaemonSetMetrics, - internal.KubeDeploymentMetrics, - internal.KubeNodeMetrics, - internal.KubePodMetrics, - internal.KubeServiceMetrics, - internal.KubeletMetrics, - internal.KubeSchedulerMetrics, - internal.KubeApiServerMetrics, - internal.KubeEtcdMetrics, - internal.KubeControllerManagerMetrics, - internal.CoreDNSMetrics, - internal.CAdvisorMetrics, - internal.NodeExporterMetrics, - internal.AdditionalNodeExporterMetrics, - internal.DefaultOtelcolMetrics, - internal.MetricsCollectorOtelcolMetrics, - internal.OtherMetrics, - } - for _, metrics := range expectedMetricsGroups { - for _, metric := range metrics { - expectedMetrics = append(expectedMetrics, metric) - } - } - - installChecks := []featureCheck{ - CheckSumologicSecret(9), - CheckOtelcolMetadataMetricsInstall, - CheckOtelcolMetricsCollectorInstall, - } - - featInstall := GetInstallFeature(installChecks) - - featMetrics := GetMetricsFeature(expectedMetrics, Otelcol) - - featTelegrafMetrics := GetTelegrafMetricsFeature(internal.DefaultExpectedNginxAnnotatedMetrics, Otelcol, true) - - testenv.Test(t, featInstall, featMetrics, featTelegrafMetrics) -} diff --git a/tests/integration/helm_otc_fips_metadata_installation_test.go b/tests/integration/helm_otc_fips_metadata_installation_test.go index 7f8abe13d3..e1e903d3df 100644 --- a/tests/integration/helm_otc_fips_metadata_installation_test.go +++ b/tests/integration/helm_otc_fips_metadata_installation_test.go @@ -20,14 +20,16 @@ func Test_Helm_Default_OT_FIPS(t *testing.T) { CheckOtelcolMetadataLogsInstall, CheckOtelcolMetadataMetricsInstall, CheckOtelcolEventsInstall, - CheckPrometheusInstall, + CheckOtelcolMetricsCollectorInstall, CheckOtelcolLogsCollectorInstall, CheckTracesInstall, } featInstall := GetInstallFeature(installChecks) - featMetrics := GetMetricsFeature(expectedMetrics, Prometheus) + featMetrics := GetMetricsFeature(expectedMetrics, Otelcol) + + featTelegrafMetrics := GetTelegrafMetricsFeature(internal.DefaultExpectedNginxAnnotatedMetrics, Otelcol, true) featLogs := GetLogsFeature() @@ -37,5 +39,5 @@ func Test_Helm_Default_OT_FIPS(t *testing.T) { featTraces := GetTracesFeature() - testenv.Test(t, featInstall, featMetrics, featLogs, featMultilineLogs, featEvents, featTraces) + testenv.Test(t, featInstall, featMetrics, featTelegrafMetrics, featLogs, featMultilineLogs, featEvents, featTraces) } diff --git a/tests/integration/helm_otlp_test.go b/tests/integration/helm_otlp_test.go index efcba74906..3394915fd2 100644 --- a/tests/integration/helm_otlp_test.go +++ b/tests/integration/helm_otlp_test.go @@ -10,7 +10,6 @@ import ( ) func Test_Helm_OTLP(t *testing.T) { - expectedMetrics := internal.DefaultExpectedMetrics // we have tracing enabled, so check tracing-specific metrics expectedMetrics = append(expectedMetrics, internal.TracingOtelcolMetrics...) @@ -20,20 +19,24 @@ func Test_Helm_OTLP(t *testing.T) { CheckOtelcolMetadataLogsInstall, CheckOtelcolMetadataMetricsInstall, CheckOtelcolEventsInstall, - CheckPrometheusInstall, + CheckOtelcolMetricsCollectorInstall, CheckOtelcolLogsCollectorInstall, CheckTracesInstall, } featInstall := GetInstallFeature(installChecks) - featLogs := GetLogsFeature() + featMetrics := GetMetricsFeature(expectedMetrics, Otelcol) - featMetrics := GetMetricsFeature(expectedMetrics, Prometheus) + featTelegrafMetrics := GetTelegrafMetricsFeature(internal.DefaultExpectedNginxAnnotatedMetrics, Otelcol, true) - featTraces := GetTracesFeature() + featLogs := GetLogsFeature() + + featMultilineLogs := GetMultipleMultilineLogsFeature() featEvents := GetEventsFeature() - testenv.Test(t, featInstall, featLogs, featMetrics, featEvents, featTraces) + featTraces := GetTracesFeature() + + testenv.Test(t, featInstall, featMetrics, featTelegrafMetrics, featLogs, featMultilineLogs, featEvents, featTraces) } diff --git a/tests/integration/helm_prometheus_metrics_test.go b/tests/integration/helm_prometheus_metrics_test.go new file mode 100644 index 0000000000..b9d2cb9560 --- /dev/null +++ b/tests/integration/helm_prometheus_metrics_test.go @@ -0,0 +1,35 @@ +//go:build onlylatest +// +build onlylatest + +package integration + +import ( + "testing" + + "github.com/SumoLogic/sumologic-kubernetes-collection/tests/integration/internal" +) + +func Test_Helm_Prometheus_Metrics(t *testing.T) { + expectedMetrics := []string{} + // defaults without otel metrics collector metrics, but with Prometheus metrics + expectedMetricsGroups := make([][]string, len(internal.DefaultExpectedMetricsGroups)) + copy(expectedMetricsGroups, internal.DefaultExpectedMetricsGroups) + expectedMetricsGroups = append(expectedMetricsGroups, internal.PrometheusMetrics, internal.DefaultOtelcolMetrics) + for _, metrics := range expectedMetricsGroups { + expectedMetrics = append(expectedMetrics, metrics...) + } + + installChecks := []featureCheck{ + CheckSumologicSecret(9), + CheckOtelcolMetadataMetricsInstall, + CheckPrometheusInstall, + } + + featInstall := GetInstallFeature(installChecks) + + featMetrics := GetMetricsFeature(expectedMetrics, Prometheus) + + featTelegrafMetrics := GetTelegrafMetricsFeature(internal.DefaultExpectedNginxAnnotatedMetrics, Prometheus, true) + + testenv.Test(t, featInstall, featMetrics, featTelegrafMetrics) +} diff --git a/tests/integration/internal/constants.go b/tests/integration/internal/constants.go index e03c1b7b20..6943a05726 100644 --- a/tests/integration/internal/constants.go +++ b/tests/integration/internal/constants.go @@ -380,7 +380,6 @@ var ( CoreDNSMetrics, CAdvisorMetrics, NodeExporterMetrics, - PrometheusMetrics, OtherMetrics, AdditionalNodeExporterMetrics, } @@ -414,7 +413,7 @@ func InitializeConstants() error { } DefaultExpectedMetrics = []string{} - metricsGroupsWithOtelcol := append(DefaultExpectedMetricsGroups, DefaultOtelcolMetrics, LogsOtelcolMetrics) + metricsGroupsWithOtelcol := append(DefaultExpectedMetricsGroups, DefaultOtelcolMetrics, LogsOtelcolMetrics, MetricsCollectorOtelcolMetrics) for _, metrics := range metricsGroupsWithOtelcol { DefaultExpectedMetrics = append(DefaultExpectedMetrics, metrics...) } diff --git a/tests/integration/values/values_common.yaml b/tests/integration/values/values_common.yaml index daae630f19..ba04b0c48e 100644 --- a/tests/integration/values/values_common.yaml +++ b/tests/integration/values/values_common.yaml @@ -12,6 +12,13 @@ sumologic: endpoint: http://receiver-mock.receiver-mock:3000/terraform/api/ metrics: + collector: + otelcol: + scrapeInterval: 15s + resources: + requests: + memory: 128Mi + cpu: 50m remoteWriteProxy: resources: requests: @@ -132,6 +139,7 @@ otellogs: name: run-log-journal telegraf-operator: + enabled: true resources: requests: cpu: 5m diff --git a/tests/integration/values/values_helm_default_ot.yaml b/tests/integration/values/values_helm_default_ot.yaml index 4046d77150..580878f1a2 100644 --- a/tests/integration/values/values_helm_default_ot.yaml +++ b/tests/integration/values/values_helm_default_ot.yaml @@ -1,5 +1,3 @@ -telegraf-operator: - enabled: true metadata: logs: multiline: diff --git a/tests/integration/values/values_helm_default_ot_namespaceoverride.yaml b/tests/integration/values/values_helm_default_ot_namespaceoverride.yaml index c88c735d8d..22c6c662d5 100644 --- a/tests/integration/values/values_helm_default_ot_namespaceoverride.yaml +++ b/tests/integration/values/values_helm_default_ot_namespaceoverride.yaml @@ -1,3 +1,4 @@ +# This file uses Prometheus metrics, as the opentelemetry-operator Helm Chart doesn't support namespaceOverride namespaceOverride: "test-override" kube-prometheus-stack: @@ -8,3 +9,14 @@ kube-prometheus-stack: prometheus-node-exporter: namespaceOverride: "test-override" + + prometheus: + enabled: true + prometheusOperator: + enabled: true + +sumologic: + metrics: + collector: + otelcol: + enabled: false diff --git a/tests/integration/values/values_helm_ot_metrics.yaml b/tests/integration/values/values_helm_ot_metrics.yaml deleted file mode 100644 index fb4306e098..0000000000 --- a/tests/integration/values/values_helm_ot_metrics.yaml +++ /dev/null @@ -1,31 +0,0 @@ -sumologic: - logs: - enabled: false - traces: - enabled: false - events: - enabled: false - metrics: - enabled: true - remoteWriteProxy: - enabled: false - collector: - otelcol: - enabled: true - scrapeInterval: 15s - resources: - requests: - memory: 128Mi - cpu: 50m - -kube-prometheus-stack: - prometheus: - enabled: false - prometheusOperator: - enabled: false - -opentelemetry-operator: - enabled: true - -telegraf-operator: - enabled: true diff --git a/tests/integration/values/values_helm_prometheus_metrics.yaml b/tests/integration/values/values_helm_prometheus_metrics.yaml new file mode 100644 index 0000000000..c2ad721ee7 --- /dev/null +++ b/tests/integration/values/values_helm_prometheus_metrics.yaml @@ -0,0 +1,18 @@ +sumologic: + logs: + enabled: false + traces: + enabled: false + events: + enabled: false + metrics: + enabled: true + collector: + otelcol: + enabled: false + +kube-prometheus-stack: + prometheus: + enabled: true + prometheusOperator: + enabled: true