diff --git a/kubernetes/common/alloy/manifests/k8s-all-in-one.yaml b/kubernetes/common/alloy/manifests/k8s-all-in-one.yaml index a19d2b65..7ae9ff1e 100644 --- a/kubernetes/common/alloy/manifests/k8s-all-in-one.yaml +++ b/kubernetes/common/alloy/manifests/k8s-all-in-one.yaml @@ -7,8 +7,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system --- @@ -21,8 +21,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy rules: - apiGroups: @@ -125,8 +125,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy roleRef: apiGroup: rbac.authorization.k8s.io @@ -4435,8 +4435,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -4476,8 +4476,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy-cluster namespace: monitoring-system spec: @@ -4517,8 +4517,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -4571,7 +4571,7 @@ spec: - secretRef: name: alloy-env optional: true - image: docker.io/grafana/alloy:v1.5.0 + image: docker.io/grafana/alloy:v1.5.1 imagePullPolicy: IfNotPresent name: alloy ports: @@ -4746,10 +4746,16 @@ spec: description: The receiver could not push some spans to the pipeline under job {{ $labels.job }}. This could be due to reaching a limit such as the ones imposed by otelcol.processor.memory_limiter. - summary: The receiver could not push some spans to the pipeline. - expr: sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) - > 0 - for: 5m + summary: The receiver pushing spans to the pipeline success rate is below + 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m]) + rate(otelcol_receiver_accepted_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning - alert: OtelcolExporterFailedSpans @@ -4757,10 +4763,15 @@ spec: description: The exporter failed to send spans to their destination under job {{ $labels.job }}. There could be an issue with the payload or with the destination endpoint. - summary: The exporter failed to send spans to their destination. - expr: sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) - > 0 - for: 5m + summary: The exporter sending spans success rate is below 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m]) + rate(otelcol_exporter_sent_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning --- @@ -4773,8 +4784,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -4796,8 +4807,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: diff --git a/kubernetes/common/grafana/manifests/k8s-all-in-one.yaml b/kubernetes/common/grafana/manifests/k8s-all-in-one.yaml index 463be7fa..0b929d71 100644 --- a/kubernetes/common/grafana/manifests/k8s-all-in-one.yaml +++ b/kubernetes/common/grafana/manifests/k8s-all-in-one.yaml @@ -11,7 +11,7 @@ metadata: app.kubernetes.io/instance: grafana app.kubernetes.io/name: grafana app.kubernetes.io/version: 11.3.1 - helm.sh/chart: grafana-8.6.3 + helm.sh/chart: grafana-8.6.4 name: grafana namespace: monitoring-system --- @@ -22,7 +22,7 @@ metadata: app.kubernetes.io/instance: grafana app.kubernetes.io/name: grafana app.kubernetes.io/version: 11.3.1 - helm.sh/chart: grafana-8.6.3 + helm.sh/chart: grafana-8.6.4 name: grafana namespace: monitoring-system rules: [] @@ -34,7 +34,7 @@ metadata: app.kubernetes.io/instance: grafana app.kubernetes.io/name: grafana app.kubernetes.io/version: 11.3.1 - helm.sh/chart: grafana-8.6.3 + helm.sh/chart: grafana-8.6.4 name: grafana-clusterrole rules: - apiGroups: @@ -54,7 +54,7 @@ metadata: app.kubernetes.io/instance: grafana app.kubernetes.io/name: grafana app.kubernetes.io/version: 11.3.1 - helm.sh/chart: grafana-8.6.3 + helm.sh/chart: grafana-8.6.4 name: grafana namespace: monitoring-system roleRef: @@ -73,7 +73,7 @@ metadata: app.kubernetes.io/instance: grafana app.kubernetes.io/name: grafana app.kubernetes.io/version: 11.3.1 - helm.sh/chart: grafana-8.6.3 + helm.sh/chart: grafana-8.6.4 name: grafana-clusterrolebinding roleRef: apiGroup: rbac.authorization.k8s.io @@ -151,7 +151,7 @@ metadata: app.kubernetes.io/instance: grafana app.kubernetes.io/name: grafana app.kubernetes.io/version: 11.3.1 - helm.sh/chart: grafana-8.6.3 + helm.sh/chart: grafana-8.6.4 name: grafana-config-dashboards namespace: monitoring-system --- @@ -4219,7 +4219,7 @@ metadata: app.kubernetes.io/instance: grafana app.kubernetes.io/name: grafana app.kubernetes.io/version: 11.3.1 - helm.sh/chart: grafana-8.6.3 + helm.sh/chart: grafana-8.6.4 name: grafana namespace: monitoring-system spec: @@ -4240,7 +4240,7 @@ metadata: app.kubernetes.io/instance: grafana app.kubernetes.io/name: grafana app.kubernetes.io/version: 11.3.1 - helm.sh/chart: grafana-8.6.3 + helm.sh/chart: grafana-8.6.4 name: grafana namespace: monitoring-system spec: @@ -4264,7 +4264,7 @@ spec: app.kubernetes.io/instance: grafana app.kubernetes.io/name: grafana app.kubernetes.io/version: 11.3.1 - helm.sh/chart: grafana-8.6.3 + helm.sh/chart: grafana-8.6.4 spec: automountServiceAccountToken: true containers: @@ -4456,7 +4456,7 @@ metadata: app.kubernetes.io/instance: grafana app.kubernetes.io/name: grafana app.kubernetes.io/version: 11.3.1 - helm.sh/chart: grafana-8.6.3 + helm.sh/chart: grafana-8.6.4 name: grafana namespace: monitoring-system spec: @@ -4483,7 +4483,7 @@ metadata: app.kubernetes.io/instance: grafana app.kubernetes.io/name: grafana app.kubernetes.io/version: 11.3.1 - helm.sh/chart: grafana-8.6.3 + helm.sh/chart: grafana-8.6.4 name: grafana namespace: monitoring-system spec: diff --git a/kubernetes/common/grafana/values.yaml b/kubernetes/common/grafana/values.yaml index 21ff94d3..95696c12 100644 --- a/kubernetes/common/grafana/values.yaml +++ b/kubernetes/common/grafana/values.yaml @@ -982,6 +982,23 @@ sidecar: # defaults to 66sec (sic!) # watchClientTimeout: 60 # + # maxTotalRetries: Total number of retries to allow for any http request. + # Takes precedence over other counts. Applies to all requests to reloadURL and k8s api requests. + # Set to 0 to fail on the first retry. + # maxTotalRetries: 5 + # + # maxConnectRetries: How many connection-related errors to retry on for any http request. + # These are errors raised before the request is sent to the remote server, which we assume has not triggered the server to process the request. + # Applies to all requests to reloadURL and k8s api requests. + # Set to 0 to fail on the first retry of this type. + # maxConnectRetries: 10 + # + # maxReadRetries: How many times to retry on read errors for any http request + # These errors are raised after the request was sent to the server, so the request may have side-effects. + # Applies to all requests to reloadURL and k8s api requests. + # Set to 0 to fail on the first retry of this type. + # maxReadRetries: 5 + # # Endpoint to send request to reload alerts reloadURL: "http://localhost:3000/api/admin/provisioning/alerting/reload" # Absolute path to shell script to execute after a alert got reloaded @@ -1035,6 +1052,24 @@ sidecar: # If specified, the sidecar will look for annotation with this name to create folder and put graph here. # You can use this parameter together with `provider.foldersFromFilesStructure`to annotate configmaps and create folder structure. folderAnnotation: null + # + # maxTotalRetries: Total number of retries to allow for any http request. + # Takes precedence over other counts. Applies to all requests to reloadURL and k8s api requests. + # Set to 0 to fail on the first retry. + # maxTotalRetries: 5 + # + # maxConnectRetries: How many connection-related errors to retry on for any http request. + # These are errors raised before the request is sent to the remote server, which we assume has not triggered the server to process the request. + # Applies to all requests to reloadURL and k8s api requests. + # Set to 0 to fail on the first retry of this type. + # maxConnectRetries: 10 + # + # maxReadRetries: How many times to retry on read errors for any http request + # These errors are raised after the request was sent to the server, so the request may have side-effects. + # Applies to all requests to reloadURL and k8s api requests. + # Set to 0 to fail on the first retry of this type. + # maxReadRetries: 5 + # # Endpoint to send request to reload alerts reloadURL: "http://localhost:3000/api/admin/provisioning/dashboards/reload" # Absolute path to shell script to execute after a configmap got reloaded @@ -1115,6 +1150,23 @@ sidecar: # defaults to 66sec (sic!) # watchClientTimeout: 60 # + # maxTotalRetries: Total number of retries to allow for any http request. + # Takes precedence over other counts. Applies to all requests to reloadURL and k8s api requests. + # Set to 0 to fail on the first retry. + # maxTotalRetries: 5 + # + # maxConnectRetries: How many connection-related errors to retry on for any http request. + # These are errors raised before the request is sent to the remote server, which we assume has not triggered the server to process the request. + # Applies to all requests to reloadURL and k8s api requests. + # Set to 0 to fail on the first retry of this type. + # maxConnectRetries: 10 + # + # maxReadRetries: How many times to retry on read errors for any http request + # These errors are raised after the request was sent to the server, so the request may have side-effects. + # Applies to all requests to reloadURL and k8s api requests. + # Set to 0 to fail on the first retry of this type. + # maxReadRetries: 5 + # # Endpoint to send request to reload datasources reloadURL: "http://localhost:3000/api/admin/provisioning/datasources/reload" # Absolute path to shell script to execute after a datasource got reloaded @@ -1157,6 +1209,23 @@ sidecar: # defaults to 66sec (sic!) # watchClientTimeout: 60 # + # maxTotalRetries: Total number of retries to allow for any http request. + # Takes precedence over other counts. Applies to all requests to reloadURL and k8s api requests. + # Set to 0 to fail on the first retry. + # maxTotalRetries: 5 + # + # maxConnectRetries: How many connection-related errors to retry on for any http request. + # These are errors raised before the request is sent to the remote server, which we assume has not triggered the server to process the request. + # Applies to all requests to reloadURL and k8s api requests. + # Set to 0 to fail on the first retry of this type. + # maxConnectRetries: 10 + # + # maxReadRetries: How many times to retry on read errors for any http request + # These errors are raised after the request was sent to the server, so the request may have side-effects. + # Applies to all requests to reloadURL and k8s api requests. + # Set to 0 to fail on the first retry of this type. + # maxReadRetries: 5 + # # Endpoint to send request to reload plugins reloadURL: "http://localhost:3000/api/admin/provisioning/plugins/reload" # Absolute path to shell script to execute after a plugin got reloaded @@ -1199,6 +1268,23 @@ sidecar: # defaults to 66sec (sic!) # watchClientTimeout: 60 # + # maxTotalRetries: Total number of retries to allow for any http request. + # Takes precedence over other counts. Applies to all requests to reloadURL and k8s api requests. + # Set to 0 to fail on the first retry. + # maxTotalRetries: 5 + # + # maxConnectRetries: How many connection-related errors to retry on for any http request. + # These are errors raised before the request is sent to the remote server, which we assume has not triggered the server to process the request. + # Applies to all requests to reloadURL and k8s api requests. + # Set to 0 to fail on the first retry of this type. + # maxConnectRetries: 10 + # + # maxReadRetries: How many times to retry on read errors for any http request + # These errors are raised after the request was sent to the server, so the request may have side-effects. + # Applies to all requests to reloadURL and k8s api requests. + # Set to 0 to fail on the first retry of this type. + # maxReadRetries: 5 + # # Endpoint to send request to reload notifiers reloadURL: "http://localhost:3000/api/admin/provisioning/notifications/reload" # Absolute path to shell script to execute after a notifier got reloaded diff --git a/kubernetes/common/kube-prometheus-stack/manifests/k8s-all-in-one.yaml b/kubernetes/common/kube-prometheus-stack/manifests/k8s-all-in-one.yaml index 19d488bd..c6c25209 100644 --- a/kubernetes/common/kube-prometheus-stack/manifests/k8s-all-in-one.yaml +++ b/kubernetes/common/kube-prometheus-stack/manifests/k8s-all-in-one.yaml @@ -304,8 +304,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -389,8 +389,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -508,8 +508,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -567,8 +567,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -634,8 +634,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -676,8 +676,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -767,8 +767,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -942,8 +942,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -1016,8 +1016,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -1193,8 +1193,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -1258,8 +1258,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -1422,8 +1422,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -1600,8 +1600,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -1785,8 +1785,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -1901,8 +1901,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -1993,8 +1993,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -2117,8 +2117,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -2180,8 +2180,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -2231,8 +2231,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -2315,8 +2315,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -2393,8 +2393,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -2449,8 +2449,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -2498,8 +2498,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -2584,8 +2584,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -2645,8 +2645,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -2715,8 +2715,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -2791,8 +2791,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 grafana_dashboard: "1" heritage: Helm release: kube-prometheus-stack @@ -3066,8 +3066,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-alertmanager.rules @@ -3225,8 +3225,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-config-reloaders @@ -3256,8 +3256,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-etcd @@ -3457,8 +3457,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-general.rules @@ -3517,8 +3517,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-k8s.rules.container-cpu-usage-seconds-tot @@ -3543,8 +3543,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-k8s.rules.container-memory-cache @@ -3568,8 +3568,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-k8s.rules.container-memory-rss @@ -3593,8 +3593,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-k8s.rules.container-memory-swap @@ -3618,8 +3618,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-k8s.rules.container-memory-working-set-by @@ -3643,8 +3643,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-k8s.rules.container-resource @@ -3730,8 +3730,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-k8s.rules.pod-owner @@ -3796,8 +3796,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kube-apiserver-availability.rules @@ -3927,8 +3927,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kube-apiserver-burnrate.rules @@ -4247,8 +4247,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kube-apiserver-histogram.rules @@ -4278,8 +4278,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kube-apiserver-slos @@ -4353,8 +4353,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kube-prometheus-general.rules @@ -4376,8 +4376,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kube-prometheus-node-recording.rules @@ -4411,8 +4411,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kube-scheduler.rules @@ -4475,8 +4475,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kube-state-metrics @@ -4550,8 +4550,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kubelet.rules @@ -4587,8 +4587,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kubernetes-apps @@ -4866,8 +4866,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kubernetes-resources @@ -4997,8 +4997,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kubernetes-storage @@ -5123,8 +5123,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kubernetes-system @@ -5167,8 +5167,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kubernetes-system-apiserver @@ -5257,8 +5257,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kubernetes-system-controller-manager @@ -5286,8 +5286,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kubernetes-system-kube-proxy @@ -5314,8 +5314,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kubernetes-system-kubelet @@ -5473,8 +5473,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-kubernetes-system-scheduler @@ -5501,8 +5501,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-node-exporter @@ -5857,8 +5857,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-node-exporter.rules @@ -5938,8 +5938,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-node-network @@ -5967,8 +5967,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-node.rules @@ -6022,8 +6022,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-prometheus @@ -6365,8 +6365,8 @@ metadata: app.kubernetes.io/instance: kube-prometheus-stack app.kubernetes.io/managed-by: Helm app.kubernetes.io/part-of: kube-prometheus-stack - app.kubernetes.io/version: 66.3.0 - chart: kube-prometheus-stack-66.3.0 + app.kubernetes.io/version: 66.3.1 + chart: kube-prometheus-stack-66.3.1 heritage: Helm release: kube-prometheus-stack name: kube-prometheus-stack-prometheus-operator diff --git a/kubernetes/common/kube-prometheus-stack/values.yaml b/kubernetes/common/kube-prometheus-stack/values.yaml index 4b152ff2..fc06729e 100644 --- a/kubernetes/common/kube-prometheus-stack/values.yaml +++ b/kubernetes/common/kube-prometheus-stack/values.yaml @@ -2271,6 +2271,12 @@ prometheus-node-exporter: # targetLabel: nodename # replacement: $1 # action: replace + + ## Attach node metadata to discovered targets. Requires Prometheus v2.35.0 and above. + ## + # attachMetadata: + # node: false + rbac: ## If true, create PSPs for node-exporter ## diff --git a/kubernetes/microservices-mode/logs/k8s-all-in-one.yaml b/kubernetes/microservices-mode/logs/k8s-all-in-one.yaml index b8fb0b20..da932d82 100644 --- a/kubernetes/microservices-mode/logs/k8s-all-in-one.yaml +++ b/kubernetes/microservices-mode/logs/k8s-all-in-one.yaml @@ -10,8 +10,8 @@ metadata: labels: app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki namespace: logging-system --- @@ -24,8 +24,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system --- @@ -50,8 +50,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy rules: - apiGroups: @@ -151,8 +151,8 @@ metadata: labels: app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-clusterrole rules: - apiGroups: @@ -174,8 +174,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy roleRef: apiGroup: rbac.authorization.k8s.io @@ -192,8 +192,8 @@ metadata: labels: app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-clusterrolebinding roleRef: apiGroup: rbac.authorization.k8s.io @@ -369,8 +369,8 @@ metadata: labels: app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-runtime namespace: logging-system --- @@ -4864,8 +4864,8 @@ metadata: app.kubernetes.io/component: bloom-builder app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-bloom-builder namespace: logging-system spec: @@ -4948,8 +4948,8 @@ metadata: app.kubernetes.io/component: compactor app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-compactor namespace: logging-system spec: @@ -4975,8 +4975,8 @@ metadata: app.kubernetes.io/component: distributor app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-distributor namespace: logging-system spec: @@ -5030,8 +5030,8 @@ metadata: app.kubernetes.io/component: index-gateway app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-index-gateway namespace: logging-system spec: @@ -5084,8 +5084,8 @@ metadata: app.kubernetes.io/component: ingester app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-ingester namespace: logging-system spec: @@ -5138,8 +5138,8 @@ metadata: app.kubernetes.io/component: querier app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-querier namespace: logging-system spec: @@ -5165,8 +5165,8 @@ metadata: app.kubernetes.io/component: query-frontend app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-query-frontend namespace: logging-system spec: @@ -5197,8 +5197,8 @@ metadata: app.kubernetes.io/component: query-frontend app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 prometheus.io/service-monitor: "false" name: loki-distributed-query-frontend-headless namespace: logging-system @@ -5231,8 +5231,8 @@ metadata: app.kubernetes.io/component: query-scheduler app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-query-scheduler namespace: logging-system spec: @@ -5285,8 +5285,8 @@ metadata: labels: app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-memberlist namespace: logging-system spec: @@ -5311,8 +5311,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -5352,8 +5352,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy-cluster namespace: monitoring-system spec: @@ -5441,8 +5441,8 @@ metadata: app.kubernetes.io/component: bloom-builder app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-bloom-builder namespace: logging-system spec: @@ -5460,7 +5460,7 @@ spec: template: metadata: annotations: - checksum/config: 01ba4719c80b6fe911b091a7c05124b64eeece964e09c058ef8f9805daca546b + checksum/config: 12ae32cb1ec02d01eda3581b127c1fee3b0dc53572ed6baf239721a03d82e126 labels: app.kubernetes.io/component: bloom-builder app.kubernetes.io/instance: loki-distributed @@ -5482,7 +5482,7 @@ spec: envFrom: - secretRef: name: loki-env-58m52b99kc - image: docker.io/grafana/loki:3.3.0 + image: docker.io/grafana/loki:3.3.1 imagePullPolicy: IfNotPresent name: bloom-builder ports: @@ -5547,8 +5547,8 @@ metadata: app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki app.kubernetes.io/part-of: memberlist - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-distributor namespace: logging-system spec: @@ -5566,7 +5566,7 @@ spec: template: metadata: annotations: - checksum/config: 01ba4719c80b6fe911b091a7c05124b64eeece964e09c058ef8f9805daca546b + checksum/config: 12ae32cb1ec02d01eda3581b127c1fee3b0dc53572ed6baf239721a03d82e126 labels: app.kubernetes.io/component: distributor app.kubernetes.io/instance: loki-distributed @@ -5588,7 +5588,7 @@ spec: envFrom: - secretRef: name: loki-env-58m52b99kc - image: docker.io/grafana/loki:3.3.0 + image: docker.io/grafana/loki:3.3.1 imagePullPolicy: IfNotPresent livenessProbe: null name: distributor @@ -5646,8 +5646,8 @@ metadata: app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki app.kubernetes.io/part-of: memberlist - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-querier namespace: logging-system spec: @@ -5665,7 +5665,7 @@ spec: template: metadata: annotations: - checksum/config: 01ba4719c80b6fe911b091a7c05124b64eeece964e09c058ef8f9805daca546b + checksum/config: 12ae32cb1ec02d01eda3581b127c1fee3b0dc53572ed6baf239721a03d82e126 labels: app.kubernetes.io/component: querier app.kubernetes.io/instance: loki-distributed @@ -5687,7 +5687,7 @@ spec: envFrom: - secretRef: name: loki-env-58m52b99kc - image: docker.io/grafana/loki:3.3.0 + image: docker.io/grafana/loki:3.3.1 imagePullPolicy: IfNotPresent livenessProbe: null name: querier @@ -5755,8 +5755,8 @@ metadata: app.kubernetes.io/component: query-frontend app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-query-frontend namespace: logging-system spec: @@ -5774,7 +5774,7 @@ spec: template: metadata: annotations: - checksum/config: 01ba4719c80b6fe911b091a7c05124b64eeece964e09c058ef8f9805daca546b + checksum/config: 12ae32cb1ec02d01eda3581b127c1fee3b0dc53572ed6baf239721a03d82e126 labels: app.kubernetes.io/component: query-frontend app.kubernetes.io/instance: loki-distributed @@ -5796,7 +5796,7 @@ spec: envFrom: - secretRef: name: loki-env-58m52b99kc - image: docker.io/grafana/loki:3.3.0 + image: docker.io/grafana/loki:3.3.1 imagePullPolicy: IfNotPresent name: query-frontend ports: @@ -5852,8 +5852,8 @@ metadata: app.kubernetes.io/component: query-scheduler app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-query-scheduler namespace: logging-system spec: @@ -5871,7 +5871,7 @@ spec: template: metadata: annotations: - checksum/config: 01ba4719c80b6fe911b091a7c05124b64eeece964e09c058ef8f9805daca546b + checksum/config: 12ae32cb1ec02d01eda3581b127c1fee3b0dc53572ed6baf239721a03d82e126 labels: app.kubernetes.io/component: query-scheduler app.kubernetes.io/instance: loki-distributed @@ -5893,7 +5893,7 @@ spec: envFrom: - secretRef: name: loki-env-58m52b99kc - image: docker.io/grafana/loki:3.3.0 + image: docker.io/grafana/loki:3.3.1 imagePullPolicy: IfNotPresent livenessProbe: null name: query-scheduler @@ -6034,8 +6034,8 @@ metadata: app.kubernetes.io/component: bloom-gateway app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-bloom-gateway namespace: logging-system spec: @@ -6051,7 +6051,7 @@ spec: template: metadata: annotations: - checksum/config: 01ba4719c80b6fe911b091a7c05124b64eeece964e09c058ef8f9805daca546b + checksum/config: 12ae32cb1ec02d01eda3581b127c1fee3b0dc53572ed6baf239721a03d82e126 labels: app.kubernetes.io/component: bloom-gateway app.kubernetes.io/instance: loki-distributed @@ -6073,7 +6073,7 @@ spec: envFrom: - secretRef: name: loki-env-58m52b99kc - image: docker.io/grafana/loki:3.3.0 + image: docker.io/grafana/loki:3.3.1 imagePullPolicy: IfNotPresent name: bloom-gateway ports: @@ -6139,8 +6139,8 @@ metadata: app.kubernetes.io/component: bloom-planner app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-bloom-planner namespace: logging-system spec: @@ -6156,7 +6156,7 @@ spec: template: metadata: annotations: - checksum/config: 01ba4719c80b6fe911b091a7c05124b64eeece964e09c058ef8f9805daca546b + checksum/config: 12ae32cb1ec02d01eda3581b127c1fee3b0dc53572ed6baf239721a03d82e126 labels: app.kubernetes.io/component: bloom-planner app.kubernetes.io/instance: loki-distributed @@ -6178,7 +6178,7 @@ spec: envFrom: - secretRef: name: loki-env-58m52b99kc - image: docker.io/grafana/loki:3.3.0 + image: docker.io/grafana/loki:3.3.1 imagePullPolicy: IfNotPresent name: bloom-planner ports: @@ -6245,8 +6245,8 @@ metadata: app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki app.kubernetes.io/part-of: memberlist - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-compactor namespace: logging-system spec: @@ -6262,7 +6262,7 @@ spec: template: metadata: annotations: - checksum/config: 01ba4719c80b6fe911b091a7c05124b64eeece964e09c058ef8f9805daca546b + checksum/config: 12ae32cb1ec02d01eda3581b127c1fee3b0dc53572ed6baf239721a03d82e126 labels: app.kubernetes.io/component: compactor app.kubernetes.io/instance: loki-distributed @@ -6284,7 +6284,7 @@ spec: envFrom: - secretRef: name: loki-env-58m52b99kc - image: docker.io/grafana/loki:3.3.0 + image: docker.io/grafana/loki:3.3.1 imagePullPolicy: IfNotPresent name: compactor ports: @@ -6350,8 +6350,8 @@ metadata: app.kubernetes.io/component: index-gateway app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-index-gateway namespace: logging-system spec: @@ -6366,7 +6366,7 @@ spec: template: metadata: annotations: - checksum/config: 01ba4719c80b6fe911b091a7c05124b64eeece964e09c058ef8f9805daca546b + checksum/config: 12ae32cb1ec02d01eda3581b127c1fee3b0dc53572ed6baf239721a03d82e126 labels: app.kubernetes.io/component: index-gateway app.kubernetes.io/instance: loki-distributed @@ -6388,7 +6388,7 @@ spec: envFrom: - secretRef: name: loki-env-58m52b99kc - image: docker.io/grafana/loki:3.3.0 + image: docker.io/grafana/loki:3.3.1 imagePullPolicy: IfNotPresent livenessProbe: null name: index-gateway @@ -6452,8 +6452,8 @@ metadata: app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki app.kubernetes.io/part-of: memberlist - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-ingester namespace: logging-system spec: @@ -6469,7 +6469,7 @@ spec: template: metadata: annotations: - checksum/config: 01ba4719c80b6fe911b091a7c05124b64eeece964e09c058ef8f9805daca546b + checksum/config: 12ae32cb1ec02d01eda3581b127c1fee3b0dc53572ed6baf239721a03d82e126 labels: app.kubernetes.io/component: ingester app.kubernetes.io/instance: loki-distributed @@ -6491,7 +6491,7 @@ spec: envFrom: - secretRef: name: loki-env-58m52b99kc - image: docker.io/grafana/loki:3.3.0 + image: docker.io/grafana/loki:3.3.1 imagePullPolicy: IfNotPresent name: ingester ports: @@ -6559,8 +6559,8 @@ metadata: app.kubernetes.io/component: pattern-ingester app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-pattern-ingester namespace: logging-system spec: @@ -6576,7 +6576,7 @@ spec: template: metadata: annotations: - checksum/config: 01ba4719c80b6fe911b091a7c05124b64eeece964e09c058ef8f9805daca546b + checksum/config: 12ae32cb1ec02d01eda3581b127c1fee3b0dc53572ed6baf239721a03d82e126 labels: app.kubernetes.io/component: pattern-ingester app.kubernetes.io/instance: loki-distributed @@ -6598,7 +6598,7 @@ spec: envFrom: - secretRef: name: loki-env-58m52b99kc - image: docker.io/grafana/loki:3.3.0 + image: docker.io/grafana/loki:3.3.1 imagePullPolicy: IfNotPresent name: pattern-ingester ports: @@ -6665,8 +6665,8 @@ metadata: app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki app.kubernetes.io/part-of: memberlist - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-ruler namespace: logging-system spec: @@ -6681,7 +6681,7 @@ spec: template: metadata: annotations: - checksum/config: 01ba4719c80b6fe911b091a7c05124b64eeece964e09c058ef8f9805daca546b + checksum/config: 12ae32cb1ec02d01eda3581b127c1fee3b0dc53572ed6baf239721a03d82e126 labels: app.kubernetes.io/component: ruler app.kubernetes.io/instance: loki-distributed @@ -6703,7 +6703,7 @@ spec: envFrom: - secretRef: name: loki-env-58m52b99kc - image: docker.io/grafana/loki:3.3.0 + image: docker.io/grafana/loki:3.3.1 imagePullPolicy: IfNotPresent name: ruler ports: @@ -6768,8 +6768,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -6822,7 +6822,7 @@ spec: - secretRef: name: alloy-env optional: true - image: docker.io/grafana/alloy:v1.5.0 + image: docker.io/grafana/alloy:v1.5.1 imagePullPolicy: IfNotPresent name: alloy ports: @@ -6900,8 +6900,8 @@ metadata: app.kubernetes.io/component: distributor app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-distributor namespace: logging-system spec: @@ -6919,8 +6919,8 @@ metadata: app.kubernetes.io/component: ingester app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-ingester namespace: logging-system spec: @@ -6943,8 +6943,8 @@ metadata: app.kubernetes.io/component: querier app.kubernetes.io/instance: loki-distributed app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-distributed-querier namespace: logging-system spec: @@ -7059,10 +7059,16 @@ spec: description: The receiver could not push some spans to the pipeline under job {{ $labels.job }}. This could be due to reaching a limit such as the ones imposed by otelcol.processor.memory_limiter. - summary: The receiver could not push some spans to the pipeline. - expr: sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) - > 0 - for: 5m + summary: The receiver pushing spans to the pipeline success rate is below + 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m]) + rate(otelcol_receiver_accepted_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning - alert: OtelcolExporterFailedSpans @@ -7070,10 +7076,15 @@ spec: description: The exporter failed to send spans to their destination under job {{ $labels.job }}. There could be an issue with the payload or with the destination endpoint. - summary: The exporter failed to send spans to their destination. - expr: sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) - > 0 - for: 5m + summary: The exporter sending spans success rate is below 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m]) + rate(otelcol_exporter_sent_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning --- @@ -7086,8 +7097,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -7143,8 +7154,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: diff --git a/kubernetes/microservices-mode/logs/loki/values.yaml b/kubernetes/microservices-mode/logs/loki/values.yaml index 78961a72..855e589a 100644 --- a/kubernetes/microservices-mode/logs/loki/values.yaml +++ b/kubernetes/microservices-mode/logs/loki/values.yaml @@ -56,7 +56,7 @@ loki: # -- Docker image repository repository: grafana/loki # -- Overrides the image tag whose default is the chart's appVersion - tag: 3.3.0 + tag: 3.3.1 # -- Overrides the image tag with an image digest digest: null # -- Docker image pull policy @@ -412,7 +412,9 @@ loki: prefix: index_ period: 24h # -- Check https://grafana.com/docs/loki/latest/configuration/#ruler for more info on configuring ruler - rulerConfig: {} + rulerConfig: + wal: + dir: /var/loki/ruler-wal # -- Structured loki configuration, takes precedence over `loki.config`, `loki.schemaConfig`, `loki.storageConfig` structuredConfig: {} # -- Additional query scheduler config @@ -518,7 +520,7 @@ enterprise: # -- Docker image repository repository: grafana/enterprise-logs # -- Docker image tag - tag: 3.3.0 + tag: 3.3.1 # -- Overrides the image tag with an image digest digest: null # -- Docker image pull policy diff --git a/kubernetes/microservices-mode/metrics/k8s-all-in-one.yaml b/kubernetes/microservices-mode/metrics/k8s-all-in-one.yaml index 1dc28649..8b406b54 100644 --- a/kubernetes/microservices-mode/metrics/k8s-all-in-one.yaml +++ b/kubernetes/microservices-mode/metrics/k8s-all-in-one.yaml @@ -7,8 +7,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system --- @@ -33,8 +33,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy rules: - apiGroups: @@ -137,8 +137,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy roleRef: apiGroup: rbac.authorization.k8s.io @@ -4702,8 +4702,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -4743,8 +4743,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy-cluster namespace: monitoring-system spec: @@ -5962,8 +5962,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -6016,7 +6016,7 @@ spec: - secretRef: name: alloy-env optional: true - image: docker.io/grafana/alloy:v1.5.0 + image: docker.io/grafana/alloy:v1.5.1 imagePullPolicy: IfNotPresent name: alloy ports: @@ -6917,10 +6917,16 @@ spec: description: The receiver could not push some spans to the pipeline under job {{ $labels.job }}. This could be due to reaching a limit such as the ones imposed by otelcol.processor.memory_limiter. - summary: The receiver could not push some spans to the pipeline. - expr: sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) - > 0 - for: 5m + summary: The receiver pushing spans to the pipeline success rate is below + 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m]) + rate(otelcol_receiver_accepted_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning - alert: OtelcolExporterFailedSpans @@ -6928,10 +6934,15 @@ spec: description: The exporter failed to send spans to their destination under job {{ $labels.job }}. There could be an issue with the payload or with the destination endpoint. - summary: The exporter failed to send spans to their destination. - expr: sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) - > 0 - for: 5m + summary: The exporter sending spans success rate is below 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m]) + rate(otelcol_exporter_sent_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning --- @@ -6944,8 +6955,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -7364,8 +7375,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: diff --git a/kubernetes/microservices-mode/profiles/k8s-all-in-one.yaml b/kubernetes/microservices-mode/profiles/k8s-all-in-one.yaml index f3066766..686e18db 100644 --- a/kubernetes/microservices-mode/profiles/k8s-all-in-one.yaml +++ b/kubernetes/microservices-mode/profiles/k8s-all-in-one.yaml @@ -12,8 +12,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system --- @@ -36,8 +36,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope namespace: profiles-system --- @@ -48,8 +48,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: profiles-system-pyroscope namespace: profiles-system rules: @@ -79,8 +79,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy rules: - apiGroups: @@ -181,8 +181,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: profiles-system-pyroscope namespace: profiles-system roleRef: @@ -203,8 +203,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy roleRef: apiGroup: rbac.authorization.k8s.io @@ -4675,8 +4675,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-config namespace: profiles-system --- @@ -4693,8 +4693,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-overrides-config namespace: profiles-system --- @@ -4765,8 +4765,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -4806,8 +4806,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy-cluster namespace: monitoring-system spec: @@ -4896,8 +4896,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-compactor namespace: profiles-system spec: @@ -4920,8 +4920,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-compactor-headless namespace: profiles-system spec: @@ -4945,8 +4945,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-distributor namespace: profiles-system spec: @@ -4969,8 +4969,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-distributor-headless namespace: profiles-system spec: @@ -4994,8 +4994,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-ingester namespace: profiles-system spec: @@ -5018,8 +5018,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-ingester-headless namespace: profiles-system spec: @@ -5042,8 +5042,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-memberlist namespace: profiles-system spec: @@ -5067,8 +5067,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-querier namespace: profiles-system spec: @@ -5091,8 +5091,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-querier-headless namespace: profiles-system spec: @@ -5116,8 +5116,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-query-frontend namespace: profiles-system spec: @@ -5140,8 +5140,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-query-frontend-headless namespace: profiles-system spec: @@ -5165,8 +5165,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-query-scheduler namespace: profiles-system spec: @@ -5189,8 +5189,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-query-scheduler-headless namespace: profiles-system spec: @@ -5214,8 +5214,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-store-gateway namespace: profiles-system spec: @@ -5238,8 +5238,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-store-gateway-headless namespace: profiles-system spec: @@ -5348,8 +5348,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-distributor namespace: profiles-system spec: @@ -5362,7 +5362,7 @@ spec: template: metadata: annotations: - checksum/config: b52110aa8e2312a57a09c43bbe0f090d8bcca6b4706f46cf39e75a8754edb11f + checksum/config: 55cee8d67e200c2894c7dd872e09e32b80c79d72e3fdd0abf801701c042a98bc profiles.grafana.com/cpu.port_name: http2 profiles.grafana.com/cpu.scrape: "true" profiles.grafana.com/goroutine.port_name: http2 @@ -5397,7 +5397,7 @@ spec: envFrom: - secretRef: name: pyroscope-env-h982fgc652 - image: grafana/pyroscope:1.9.1 + image: grafana/pyroscope:1.10.0 imagePullPolicy: IfNotPresent name: distributor ports: @@ -5446,8 +5446,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-querier namespace: profiles-system spec: @@ -5460,7 +5460,7 @@ spec: template: metadata: annotations: - checksum/config: b52110aa8e2312a57a09c43bbe0f090d8bcca6b4706f46cf39e75a8754edb11f + checksum/config: 55cee8d67e200c2894c7dd872e09e32b80c79d72e3fdd0abf801701c042a98bc profiles.grafana.com/cpu.port_name: http2 profiles.grafana.com/cpu.scrape: "true" profiles.grafana.com/goroutine.port_name: http2 @@ -5495,7 +5495,7 @@ spec: envFrom: - secretRef: name: pyroscope-env-h982fgc652 - image: grafana/pyroscope:1.9.1 + image: grafana/pyroscope:1.10.0 imagePullPolicy: IfNotPresent name: querier ports: @@ -5544,8 +5544,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-query-frontend namespace: profiles-system spec: @@ -5558,7 +5558,7 @@ spec: template: metadata: annotations: - checksum/config: b52110aa8e2312a57a09c43bbe0f090d8bcca6b4706f46cf39e75a8754edb11f + checksum/config: 55cee8d67e200c2894c7dd872e09e32b80c79d72e3fdd0abf801701c042a98bc profiles.grafana.com/cpu.port_name: http2 profiles.grafana.com/cpu.scrape: "true" profiles.grafana.com/goroutine.port_name: http2 @@ -5593,7 +5593,7 @@ spec: envFrom: - secretRef: name: pyroscope-env-h982fgc652 - image: grafana/pyroscope:1.9.1 + image: grafana/pyroscope:1.10.0 imagePullPolicy: IfNotPresent name: query-frontend ports: @@ -5642,8 +5642,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-query-scheduler namespace: profiles-system spec: @@ -5656,7 +5656,7 @@ spec: template: metadata: annotations: - checksum/config: b52110aa8e2312a57a09c43bbe0f090d8bcca6b4706f46cf39e75a8754edb11f + checksum/config: 55cee8d67e200c2894c7dd872e09e32b80c79d72e3fdd0abf801701c042a98bc profiles.grafana.com/cpu.port_name: http2 profiles.grafana.com/cpu.scrape: "true" profiles.grafana.com/goroutine.port_name: http2 @@ -5691,7 +5691,7 @@ spec: envFrom: - secretRef: name: pyroscope-env-h982fgc652 - image: grafana/pyroscope:1.9.1 + image: grafana/pyroscope:1.10.0 imagePullPolicy: IfNotPresent name: query-scheduler ports: @@ -5740,8 +5740,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -5794,7 +5794,7 @@ spec: - secretRef: name: alloy-env optional: true - image: docker.io/grafana/alloy:v1.5.0 + image: docker.io/grafana/alloy:v1.5.1 imagePullPolicy: IfNotPresent name: alloy ports: @@ -5873,8 +5873,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-compactor namespace: profiles-system spec: @@ -5889,7 +5889,7 @@ spec: template: metadata: annotations: - checksum/config: b52110aa8e2312a57a09c43bbe0f090d8bcca6b4706f46cf39e75a8754edb11f + checksum/config: 55cee8d67e200c2894c7dd872e09e32b80c79d72e3fdd0abf801701c042a98bc profiles.grafana.com/cpu.port_name: http2 profiles.grafana.com/cpu.scrape: "true" profiles.grafana.com/goroutine.port_name: http2 @@ -5924,7 +5924,7 @@ spec: envFrom: - secretRef: name: pyroscope-env-h982fgc652 - image: grafana/pyroscope:1.9.1 + image: grafana/pyroscope:1.10.0 imagePullPolicy: IfNotPresent name: compactor ports: @@ -5977,8 +5977,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-ingester namespace: profiles-system spec: @@ -5993,7 +5993,7 @@ spec: template: metadata: annotations: - checksum/config: b52110aa8e2312a57a09c43bbe0f090d8bcca6b4706f46cf39e75a8754edb11f + checksum/config: 55cee8d67e200c2894c7dd872e09e32b80c79d72e3fdd0abf801701c042a98bc profiles.grafana.com/cpu.port_name: http2 profiles.grafana.com/cpu.scrape: "true" profiles.grafana.com/goroutine.port_name: http2 @@ -6028,7 +6028,7 @@ spec: envFrom: - secretRef: name: pyroscope-env-h982fgc652 - image: grafana/pyroscope:1.9.1 + image: grafana/pyroscope:1.10.0 imagePullPolicy: IfNotPresent name: ingester ports: @@ -6078,8 +6078,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-store-gateway namespace: profiles-system spec: @@ -6094,7 +6094,7 @@ spec: template: metadata: annotations: - checksum/config: b52110aa8e2312a57a09c43bbe0f090d8bcca6b4706f46cf39e75a8754edb11f + checksum/config: 55cee8d67e200c2894c7dd872e09e32b80c79d72e3fdd0abf801701c042a98bc profiles.grafana.com/cpu.port_name: http2 profiles.grafana.com/cpu.scrape: "true" profiles.grafana.com/goroutine.port_name: http2 @@ -6129,7 +6129,7 @@ spec: envFrom: - secretRef: name: pyroscope-env-h982fgc652 - image: grafana/pyroscope:1.9.1 + image: grafana/pyroscope:1.10.0 imagePullPolicy: IfNotPresent name: store-gateway ports: @@ -6274,10 +6274,16 @@ spec: description: The receiver could not push some spans to the pipeline under job {{ $labels.job }}. This could be due to reaching a limit such as the ones imposed by otelcol.processor.memory_limiter. - summary: The receiver could not push some spans to the pipeline. - expr: sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) - > 0 - for: 5m + summary: The receiver pushing spans to the pipeline success rate is below + 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m]) + rate(otelcol_receiver_accepted_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning - alert: OtelcolExporterFailedSpans @@ -6285,10 +6291,15 @@ spec: description: The exporter failed to send spans to their destination under job {{ $labels.job }}. There could be an issue with the payload or with the destination endpoint. - summary: The exporter failed to send spans to their destination. - expr: sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) - > 0 - for: 5m + summary: The exporter sending spans success rate is below 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m]) + rate(otelcol_exporter_sent_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning --- @@ -6301,8 +6312,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -6358,8 +6369,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: diff --git a/kubernetes/microservices-mode/traces/k8s-all-in-one.yaml b/kubernetes/microservices-mode/traces/k8s-all-in-one.yaml index 207601ee..db23e36a 100644 --- a/kubernetes/microservices-mode/traces/k8s-all-in-one.yaml +++ b/kubernetes/microservices-mode/traces/k8s-all-in-one.yaml @@ -36,8 +36,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system --- @@ -62,7 +62,7 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: tempo app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed namespace: tracing-system --- @@ -75,8 +75,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy rules: - apiGroups: @@ -200,8 +200,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy roleRef: apiGroup: rbac.authorization.k8s.io @@ -5113,7 +5113,7 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: tempo app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed-config namespace: tracing-system --- @@ -5129,7 +5129,7 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: tempo app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed-runtime namespace: tracing-system --- @@ -5289,8 +5289,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -5330,8 +5330,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy-cluster namespace: monitoring-system spec: @@ -5421,7 +5421,7 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: tempo app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed-compactor namespace: tracing-system spec: @@ -5445,7 +5445,7 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: tempo app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed-distributor namespace: tracing-system spec: @@ -5485,7 +5485,7 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: tempo app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 prometheus.io/service-monitor: "false" name: tempo-distributed-distributor-discovery namespace: tracing-system @@ -5522,7 +5522,7 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: tempo app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed-gossip-ring namespace: tracing-system spec: @@ -5548,7 +5548,7 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: tempo app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed-ingester namespace: tracing-system spec: @@ -5577,7 +5577,7 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: tempo app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 prometheus.io/service-monitor: "false" name: tempo-distributed-ingester-discovery namespace: tracing-system @@ -5608,7 +5608,7 @@ metadata: app.kubernetes.io/name: tempo app.kubernetes.io/part-of: memberlist app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed-metrics-generator namespace: tracing-system spec: @@ -5636,7 +5636,7 @@ metadata: app.kubernetes.io/name: tempo app.kubernetes.io/part-of: memberlist app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 prometheus.io/service-monitor: "false" name: tempo-distributed-metrics-generator-discovery namespace: tracing-system @@ -5666,7 +5666,7 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: tempo app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed-querier namespace: tracing-system spec: @@ -5693,7 +5693,7 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: tempo app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed-query-frontend namespace: tracing-system spec: @@ -5720,7 +5720,7 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: tempo app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed-query-frontend-discovery namespace: tracing-system spec: @@ -5839,7 +5839,7 @@ metadata: app.kubernetes.io/name: tempo app.kubernetes.io/part-of: memberlist app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed-compactor namespace: tracing-system spec: @@ -5858,7 +5858,7 @@ spec: template: metadata: annotations: - checksum/config: e82c35c24307dc55df92ad18fa2cee7d69ca492dbd81d1b1c9abb55b5c18a73d + checksum/config: cd10af2b40e4d6f55ac91e28648759d093ee6b206e2fff729f7319eb45a9cda6 logs.grafana.com/scrape: "true" profiles.grafana.com/cpu.port_name: http-metrics profiles.grafana.com/cpu.scrape: "true" @@ -5873,7 +5873,7 @@ spec: app.kubernetes.io/name: tempo app.kubernetes.io/part-of: memberlist app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 spec: containers: - args: @@ -5940,7 +5940,7 @@ metadata: app.kubernetes.io/name: tempo app.kubernetes.io/part-of: memberlist app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed-distributor namespace: tracing-system spec: @@ -5955,7 +5955,7 @@ spec: template: metadata: annotations: - checksum/config: e82c35c24307dc55df92ad18fa2cee7d69ca492dbd81d1b1c9abb55b5c18a73d + checksum/config: cd10af2b40e4d6f55ac91e28648759d093ee6b206e2fff729f7319eb45a9cda6 logs.grafana.com/scrape: "true" profiles.grafana.com/cpu.port_name: http-metrics profiles.grafana.com/cpu.scrape: "true" @@ -5970,7 +5970,7 @@ spec: app.kubernetes.io/name: tempo app.kubernetes.io/part-of: memberlist app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 spec: affinity: podAntiAffinity: @@ -6077,7 +6077,7 @@ metadata: app.kubernetes.io/name: tempo app.kubernetes.io/part-of: memberlist app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed-metrics-generator namespace: tracing-system spec: @@ -6092,7 +6092,7 @@ spec: template: metadata: annotations: - checksum/config: e82c35c24307dc55df92ad18fa2cee7d69ca492dbd81d1b1c9abb55b5c18a73d + checksum/config: cd10af2b40e4d6f55ac91e28648759d093ee6b206e2fff729f7319eb45a9cda6 logs.grafana.com/scrape: "true" profiles.grafana.com/cpu.port_name: http-metrics profiles.grafana.com/cpu.scrape: "true" @@ -6107,7 +6107,7 @@ spec: app.kubernetes.io/name: tempo app.kubernetes.io/part-of: memberlist app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 spec: affinity: podAntiAffinity: @@ -6205,7 +6205,7 @@ metadata: app.kubernetes.io/name: tempo app.kubernetes.io/part-of: memberlist app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed-querier namespace: tracing-system spec: @@ -6224,7 +6224,7 @@ spec: template: metadata: annotations: - checksum/config: e82c35c24307dc55df92ad18fa2cee7d69ca492dbd81d1b1c9abb55b5c18a73d + checksum/config: cd10af2b40e4d6f55ac91e28648759d093ee6b206e2fff729f7319eb45a9cda6 logs.grafana.com/scrape: "true" profiles.grafana.com/cpu.port_name: http-metrics profiles.grafana.com/cpu.scrape: "true" @@ -6239,7 +6239,7 @@ spec: app.kubernetes.io/name: tempo app.kubernetes.io/part-of: memberlist app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 spec: affinity: podAntiAffinity: @@ -6339,7 +6339,7 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: tempo app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed-query-frontend namespace: tracing-system spec: @@ -6358,7 +6358,7 @@ spec: template: metadata: annotations: - checksum/config: e82c35c24307dc55df92ad18fa2cee7d69ca492dbd81d1b1c9abb55b5c18a73d + checksum/config: cd10af2b40e4d6f55ac91e28648759d093ee6b206e2fff729f7319eb45a9cda6 logs.grafana.com/scrape: "true" profiles.grafana.com/cpu.port_name: http-metrics profiles.grafana.com/cpu.scrape: "true" @@ -6372,7 +6372,7 @@ spec: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: tempo app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 spec: affinity: podAntiAffinity: @@ -6592,8 +6592,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -6646,7 +6646,7 @@ spec: - secretRef: name: alloy-env optional: true - image: docker.io/grafana/alloy:v1.5.0 + image: docker.io/grafana/alloy:v1.5.1 imagePullPolicy: IfNotPresent name: alloy ports: @@ -6727,7 +6727,7 @@ metadata: app.kubernetes.io/name: tempo app.kubernetes.io/part-of: memberlist app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed-ingester namespace: tracing-system spec: @@ -6742,7 +6742,7 @@ spec: template: metadata: annotations: - checksum/config: e82c35c24307dc55df92ad18fa2cee7d69ca492dbd81d1b1c9abb55b5c18a73d + checksum/config: cd10af2b40e4d6f55ac91e28648759d093ee6b206e2fff729f7319eb45a9cda6 logs.grafana.com/scrape: "true" profiles.grafana.com/cpu.port_name: http-metrics profiles.grafana.com/cpu.scrape: "true" @@ -6757,7 +6757,7 @@ spec: app.kubernetes.io/name: tempo app.kubernetes.io/part-of: memberlist app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 spec: affinity: podAntiAffinity: @@ -6864,7 +6864,7 @@ metadata: app.kubernetes.io/name: tempo app.kubernetes.io/part-of: memberlist app.kubernetes.io/version: 2.6.0 - helm.sh/chart: tempo-distributed-1.23.1 + helm.sh/chart: tempo-distributed-1.24.0 name: tempo-distributed-ingester namespace: tracing-system spec: @@ -6979,10 +6979,16 @@ spec: description: The receiver could not push some spans to the pipeline under job {{ $labels.job }}. This could be due to reaching a limit such as the ones imposed by otelcol.processor.memory_limiter. - summary: The receiver could not push some spans to the pipeline. - expr: sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) - > 0 - for: 5m + summary: The receiver pushing spans to the pipeline success rate is below + 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m]) + rate(otelcol_receiver_accepted_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning - alert: OtelcolExporterFailedSpans @@ -6990,10 +6996,15 @@ spec: description: The exporter failed to send spans to their destination under job {{ $labels.job }}. There could be an issue with the payload or with the destination endpoint. - summary: The exporter failed to send spans to their destination. - expr: sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) - > 0 - for: 5m + summary: The exporter sending spans success rate is below 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m]) + rate(otelcol_exporter_sent_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning --- @@ -7041,8 +7052,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -7098,8 +7109,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: diff --git a/kubernetes/monolithic-mode/all-in-one/k8s-all-in-one.yaml b/kubernetes/monolithic-mode/all-in-one/k8s-all-in-one.yaml index 2e3a80a9..a049426f 100644 --- a/kubernetes/monolithic-mode/all-in-one/k8s-all-in-one.yaml +++ b/kubernetes/monolithic-mode/all-in-one/k8s-all-in-one.yaml @@ -41,8 +41,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system --- @@ -95,8 +95,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope namespace: profiles-system --- @@ -120,8 +120,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: profiles-system-pyroscope namespace: profiles-system rules: @@ -151,8 +151,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy rules: - apiGroups: @@ -488,8 +488,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: profiles-system-pyroscope namespace: profiles-system roleRef: @@ -510,8 +510,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy roleRef: apiGroup: rbac.authorization.k8s.io @@ -5364,8 +5364,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-config namespace: profiles-system --- @@ -5380,8 +5380,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-overrides-config namespace: profiles-system --- @@ -5684,8 +5684,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -5725,8 +5725,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy-cluster namespace: monitoring-system spec: @@ -5865,8 +5865,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope namespace: profiles-system spec: @@ -5889,8 +5889,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 prometheus.io/service-monitor: "false" name: pyroscope-headless namespace: profiles-system @@ -5914,8 +5914,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-memberlist namespace: profiles-system spec: @@ -6299,8 +6299,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -6353,7 +6353,7 @@ spec: - secretRef: name: alloy-env optional: true - image: docker.io/grafana/alloy:v1.5.0 + image: docker.io/grafana/alloy:v1.5.1 imagePullPolicy: IfNotPresent name: alloy ports: @@ -6432,8 +6432,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope namespace: profiles-system spec: @@ -6448,7 +6448,7 @@ spec: template: metadata: annotations: - checksum/config: b52110aa8e2312a57a09c43bbe0f090d8bcca6b4706f46cf39e75a8754edb11f + checksum/config: 55cee8d67e200c2894c7dd872e09e32b80c79d72e3fdd0abf801701c042a98bc profiles.grafana.com/cpu.port_name: http2 profiles.grafana.com/cpu.scrape: "true" profiles.grafana.com/goroutine.port_name: http2 @@ -6483,7 +6483,7 @@ spec: envFrom: - secretRef: name: pyroscope-env-h982fgc652 - image: grafana/pyroscope:1.9.1 + image: grafana/pyroscope:1.10.0 imagePullPolicy: IfNotPresent name: pyroscope ports: @@ -6639,8 +6639,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope namespace: profiles-system spec: @@ -6869,10 +6869,16 @@ spec: description: The receiver could not push some spans to the pipeline under job {{ $labels.job }}. This could be due to reaching a limit such as the ones imposed by otelcol.processor.memory_limiter. - summary: The receiver could not push some spans to the pipeline. - expr: sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) - > 0 - for: 5m + summary: The receiver pushing spans to the pipeline success rate is below + 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m]) + rate(otelcol_receiver_accepted_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning - alert: OtelcolExporterFailedSpans @@ -6880,10 +6886,15 @@ spec: description: The exporter failed to send spans to their destination under job {{ $labels.job }}. There could be an issue with the payload or with the destination endpoint. - summary: The exporter failed to send spans to their destination. - expr: sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) - > 0 - for: 5m + summary: The exporter sending spans success rate is below 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m]) + rate(otelcol_exporter_sent_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning --- @@ -6931,8 +6942,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -6987,8 +6998,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope namespace: profiles-system spec: @@ -7053,8 +7064,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: diff --git a/kubernetes/monolithic-mode/logs/k8s-all-in-one.yaml b/kubernetes/monolithic-mode/logs/k8s-all-in-one.yaml index ce941e1f..f67c39e4 100644 --- a/kubernetes/monolithic-mode/logs/k8s-all-in-one.yaml +++ b/kubernetes/monolithic-mode/logs/k8s-all-in-one.yaml @@ -31,8 +31,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system --- @@ -57,8 +57,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy rules: - apiGroups: @@ -182,8 +182,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy roleRef: apiGroup: rbac.authorization.k8s.io @@ -4924,8 +4924,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -4965,8 +4965,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy-cluster namespace: monitoring-system spec: @@ -5268,8 +5268,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -5322,7 +5322,7 @@ spec: - secretRef: name: alloy-env optional: true - image: docker.io/grafana/alloy:v1.5.0 + image: docker.io/grafana/alloy:v1.5.1 imagePullPolicy: IfNotPresent name: alloy ports: @@ -5497,10 +5497,16 @@ spec: description: The receiver could not push some spans to the pipeline under job {{ $labels.job }}. This could be due to reaching a limit such as the ones imposed by otelcol.processor.memory_limiter. - summary: The receiver could not push some spans to the pipeline. - expr: sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) - > 0 - for: 5m + summary: The receiver pushing spans to the pipeline success rate is below + 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m]) + rate(otelcol_receiver_accepted_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning - alert: OtelcolExporterFailedSpans @@ -5508,10 +5514,15 @@ spec: description: The exporter failed to send spans to their destination under job {{ $labels.job }}. There could be an issue with the payload or with the destination endpoint. - summary: The exporter failed to send spans to their destination. - expr: sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) - > 0 - for: 5m + summary: The exporter sending spans success rate is below 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m]) + rate(otelcol_exporter_sent_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning --- @@ -5559,8 +5570,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -5616,8 +5627,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: diff --git a/kubernetes/monolithic-mode/metrics/k8s-all-in-one.yaml b/kubernetes/monolithic-mode/metrics/k8s-all-in-one.yaml index bf38497f..428bfd05 100644 --- a/kubernetes/monolithic-mode/metrics/k8s-all-in-one.yaml +++ b/kubernetes/monolithic-mode/metrics/k8s-all-in-one.yaml @@ -7,8 +7,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system --- @@ -33,8 +33,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy rules: - apiGroups: @@ -137,8 +137,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy roleRef: apiGroup: rbac.authorization.k8s.io @@ -4624,8 +4624,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -4665,8 +4665,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy-cluster namespace: monitoring-system spec: @@ -4840,8 +4840,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -4894,7 +4894,7 @@ spec: - secretRef: name: alloy-env optional: true - image: docker.io/grafana/alloy:v1.5.0 + image: docker.io/grafana/alloy:v1.5.1 imagePullPolicy: IfNotPresent name: alloy ports: @@ -5069,10 +5069,16 @@ spec: description: The receiver could not push some spans to the pipeline under job {{ $labels.job }}. This could be due to reaching a limit such as the ones imposed by otelcol.processor.memory_limiter. - summary: The receiver could not push some spans to the pipeline. - expr: sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) - > 0 - for: 5m + summary: The receiver pushing spans to the pipeline success rate is below + 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m]) + rate(otelcol_receiver_accepted_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning - alert: OtelcolExporterFailedSpans @@ -5080,10 +5086,15 @@ spec: description: The exporter failed to send spans to their destination under job {{ $labels.job }}. There could be an issue with the payload or with the destination endpoint. - summary: The exporter failed to send spans to their destination. - expr: sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) - > 0 - for: 5m + summary: The exporter sending spans success rate is below 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m]) + rate(otelcol_exporter_sent_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning --- @@ -5096,8 +5107,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -5153,8 +5164,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: diff --git a/kubernetes/monolithic-mode/profiles/k8s-all-in-one.yaml b/kubernetes/monolithic-mode/profiles/k8s-all-in-one.yaml index b11c6c69..6d673f5b 100644 --- a/kubernetes/monolithic-mode/profiles/k8s-all-in-one.yaml +++ b/kubernetes/monolithic-mode/profiles/k8s-all-in-one.yaml @@ -12,8 +12,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system --- @@ -36,8 +36,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope namespace: profiles-system --- @@ -48,8 +48,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: profiles-system-pyroscope namespace: profiles-system rules: @@ -79,8 +79,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy rules: - apiGroups: @@ -181,8 +181,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: profiles-system-pyroscope namespace: profiles-system roleRef: @@ -203,8 +203,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy roleRef: apiGroup: rbac.authorization.k8s.io @@ -4667,8 +4667,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-config namespace: profiles-system --- @@ -4683,8 +4683,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-overrides-config namespace: profiles-system --- @@ -4755,8 +4755,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -4796,8 +4796,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy-cluster namespace: monitoring-system spec: @@ -4886,8 +4886,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope namespace: profiles-system spec: @@ -4910,8 +4910,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 prometheus.io/service-monitor: "false" name: pyroscope-headless namespace: profiles-system @@ -4935,8 +4935,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope-memberlist namespace: profiles-system spec: @@ -5045,8 +5045,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -5099,7 +5099,7 @@ spec: - secretRef: name: alloy-env optional: true - image: docker.io/grafana/alloy:v1.5.0 + image: docker.io/grafana/alloy:v1.5.1 imagePullPolicy: IfNotPresent name: alloy ports: @@ -5178,8 +5178,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope namespace: profiles-system spec: @@ -5194,7 +5194,7 @@ spec: template: metadata: annotations: - checksum/config: b52110aa8e2312a57a09c43bbe0f090d8bcca6b4706f46cf39e75a8754edb11f + checksum/config: 55cee8d67e200c2894c7dd872e09e32b80c79d72e3fdd0abf801701c042a98bc profiles.grafana.com/cpu.port_name: http2 profiles.grafana.com/cpu.scrape: "true" profiles.grafana.com/goroutine.port_name: http2 @@ -5229,7 +5229,7 @@ spec: envFrom: - secretRef: name: pyroscope-env-h982fgc652 - image: grafana/pyroscope:1.9.1 + image: grafana/pyroscope:1.10.0 imagePullPolicy: IfNotPresent name: pyroscope ports: @@ -5284,8 +5284,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope namespace: profiles-system spec: @@ -5400,10 +5400,16 @@ spec: description: The receiver could not push some spans to the pipeline under job {{ $labels.job }}. This could be due to reaching a limit such as the ones imposed by otelcol.processor.memory_limiter. - summary: The receiver could not push some spans to the pipeline. - expr: sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) - > 0 - for: 5m + summary: The receiver pushing spans to the pipeline success rate is below + 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m]) + rate(otelcol_receiver_accepted_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning - alert: OtelcolExporterFailedSpans @@ -5411,10 +5417,15 @@ spec: description: The exporter failed to send spans to their destination under job {{ $labels.job }}. There could be an issue with the payload or with the destination endpoint. - summary: The exporter failed to send spans to their destination. - expr: sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) - > 0 - for: 5m + summary: The exporter sending spans success rate is below 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m]) + rate(otelcol_exporter_sent_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning --- @@ -5427,8 +5438,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -5483,8 +5494,8 @@ metadata: app.kubernetes.io/instance: pyroscope app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: pyroscope - app.kubernetes.io/version: 1.9.1 - helm.sh/chart: pyroscope-1.9.1 + app.kubernetes.io/version: 1.10.0 + helm.sh/chart: pyroscope-1.10.0 name: pyroscope namespace: profiles-system spec: @@ -5520,8 +5531,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: diff --git a/kubernetes/monolithic-mode/traces/k8s-all-in-one.yaml b/kubernetes/monolithic-mode/traces/k8s-all-in-one.yaml index a9e0af5d..1091a35c 100644 --- a/kubernetes/monolithic-mode/traces/k8s-all-in-one.yaml +++ b/kubernetes/monolithic-mode/traces/k8s-all-in-one.yaml @@ -36,8 +36,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system --- @@ -75,8 +75,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy rules: - apiGroups: @@ -200,8 +200,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy roleRef: apiGroup: rbac.authorization.k8s.io @@ -5286,8 +5286,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -5327,8 +5327,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy-cluster namespace: monitoring-system spec: @@ -5694,8 +5694,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -5748,7 +5748,7 @@ spec: - secretRef: name: alloy-env-7hg2fmmgdb optional: true - image: docker.io/grafana/alloy:v1.5.0 + image: docker.io/grafana/alloy:v1.5.1 imagePullPolicy: IfNotPresent name: alloy ports: @@ -6024,10 +6024,16 @@ spec: description: The receiver could not push some spans to the pipeline under job {{ $labels.job }}. This could be due to reaching a limit such as the ones imposed by otelcol.processor.memory_limiter. - summary: The receiver could not push some spans to the pipeline. - expr: sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) - > 0 - for: 5m + summary: The receiver pushing spans to the pipeline success rate is below + 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m]) + rate(otelcol_receiver_accepted_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning - alert: OtelcolExporterFailedSpans @@ -6035,10 +6041,15 @@ spec: description: The exporter failed to send spans to their destination under job {{ $labels.job }}. There could be an issue with the payload or with the destination endpoint. - summary: The exporter failed to send spans to their destination. - expr: sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) - > 0 - for: 5m + summary: The exporter sending spans success rate is below 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m]) + rate(otelcol_exporter_sent_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning --- @@ -6086,8 +6097,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -6172,8 +6183,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: diff --git a/kubernetes/read-write-mode/logs/k8s-all-in-one.yaml b/kubernetes/read-write-mode/logs/k8s-all-in-one.yaml index e7caba90..1ae3dc21 100644 --- a/kubernetes/read-write-mode/logs/k8s-all-in-one.yaml +++ b/kubernetes/read-write-mode/logs/k8s-all-in-one.yaml @@ -10,8 +10,8 @@ metadata: labels: app.kubernetes.io/instance: loki app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki namespace: logging-system --- @@ -24,8 +24,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system --- @@ -50,8 +50,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy rules: - apiGroups: @@ -151,8 +151,8 @@ metadata: labels: app.kubernetes.io/instance: loki app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-clusterrole rules: - apiGroups: @@ -174,8 +174,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy roleRef: apiGroup: rbac.authorization.k8s.io @@ -192,8 +192,8 @@ metadata: labels: app.kubernetes.io/instance: loki app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-clusterrolebinding roleRef: apiGroup: rbac.authorization.k8s.io @@ -357,8 +357,8 @@ metadata: labels: app.kubernetes.io/instance: loki app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-runtime namespace: logging-system --- @@ -4852,8 +4852,8 @@ metadata: app.kubernetes.io/component: backend app.kubernetes.io/instance: loki app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-backend namespace: logging-system spec: @@ -4906,8 +4906,8 @@ metadata: labels: app.kubernetes.io/instance: loki app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-memberlist namespace: logging-system spec: @@ -4958,8 +4958,8 @@ metadata: app.kubernetes.io/component: read app.kubernetes.io/instance: loki app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-read namespace: logging-system spec: @@ -5014,8 +5014,8 @@ metadata: app.kubernetes.io/component: write app.kubernetes.io/instance: loki app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-write namespace: logging-system spec: @@ -5072,8 +5072,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -5113,8 +5113,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy-cluster namespace: monitoring-system spec: @@ -5203,8 +5203,8 @@ metadata: app.kubernetes.io/instance: loki app.kubernetes.io/name: loki app.kubernetes.io/part-of: memberlist - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-read namespace: logging-system spec: @@ -5222,7 +5222,7 @@ spec: template: metadata: annotations: - checksum/config: 01ba4719c80b6fe911b091a7c05124b64eeece964e09c058ef8f9805daca546b + checksum/config: 12ae32cb1ec02d01eda3581b127c1fee3b0dc53572ed6baf239721a03d82e126 labels: app.kubernetes.io/component: read app.kubernetes.io/instance: loki @@ -5247,7 +5247,7 @@ spec: envFrom: - secretRef: name: loki-env-58m52b99kc - image: docker.io/grafana/loki:3.3.0 + image: docker.io/grafana/loki:3.3.1 imagePullPolicy: IfNotPresent name: loki ports: @@ -5397,8 +5397,8 @@ metadata: app.kubernetes.io/instance: loki app.kubernetes.io/name: loki app.kubernetes.io/part-of: memberlist - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-backend namespace: logging-system spec: @@ -5414,7 +5414,7 @@ spec: template: metadata: annotations: - checksum/config: 01ba4719c80b6fe911b091a7c05124b64eeece964e09c058ef8f9805daca546b + checksum/config: 12ae32cb1ec02d01eda3581b127c1fee3b0dc53572ed6baf239721a03d82e126 labels: app.kubernetes.io/component: backend app.kubernetes.io/instance: loki @@ -5459,7 +5459,7 @@ spec: envFrom: - secretRef: name: loki-env-58m52b99kc - image: docker.io/grafana/loki:3.3.0 + image: docker.io/grafana/loki:3.3.1 imagePullPolicy: IfNotPresent name: loki ports: @@ -5531,8 +5531,8 @@ metadata: app.kubernetes.io/instance: loki app.kubernetes.io/name: loki app.kubernetes.io/part-of: memberlist - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-write namespace: logging-system spec: @@ -5548,7 +5548,7 @@ spec: template: metadata: annotations: - checksum/config: 01ba4719c80b6fe911b091a7c05124b64eeece964e09c058ef8f9805daca546b + checksum/config: 12ae32cb1ec02d01eda3581b127c1fee3b0dc53572ed6baf239721a03d82e126 labels: app.kubernetes.io/component: write app.kubernetes.io/instance: loki @@ -5571,7 +5571,7 @@ spec: envFrom: - secretRef: name: loki-env-58m52b99kc - image: docker.io/grafana/loki:3.3.0 + image: docker.io/grafana/loki:3.3.1 imagePullPolicy: IfNotPresent name: loki ports: @@ -5636,8 +5636,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -5690,7 +5690,7 @@ spec: - secretRef: name: alloy-env optional: true - image: docker.io/grafana/alloy:v1.5.0 + image: docker.io/grafana/alloy:v1.5.1 imagePullPolicy: IfNotPresent name: alloy ports: @@ -5768,8 +5768,8 @@ metadata: app.kubernetes.io/component: backend app.kubernetes.io/instance: loki app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-backend namespace: logging-system spec: @@ -5787,8 +5787,8 @@ metadata: app.kubernetes.io/component: read app.kubernetes.io/instance: loki app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-read namespace: logging-system spec: @@ -5806,8 +5806,8 @@ metadata: app.kubernetes.io/component: write app.kubernetes.io/instance: loki app.kubernetes.io/name: loki - app.kubernetes.io/version: 3.3.0 - helm.sh/chart: loki-6.22.0 + app.kubernetes.io/version: 3.3.1 + helm.sh/chart: loki-6.23.0 name: loki-write namespace: logging-system spec: @@ -5922,10 +5922,16 @@ spec: description: The receiver could not push some spans to the pipeline under job {{ $labels.job }}. This could be due to reaching a limit such as the ones imposed by otelcol.processor.memory_limiter. - summary: The receiver could not push some spans to the pipeline. - expr: sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) - > 0 - for: 5m + summary: The receiver pushing spans to the pipeline success rate is below + 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m]) + rate(otelcol_receiver_accepted_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning - alert: OtelcolExporterFailedSpans @@ -5933,10 +5939,15 @@ spec: description: The exporter failed to send spans to their destination under job {{ $labels.job }}. There could be an issue with the payload or with the destination endpoint. - summary: The exporter failed to send spans to their destination. - expr: sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) - > 0 - for: 5m + summary: The exporter sending spans success rate is below 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m]) + rate(otelcol_exporter_sent_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning --- @@ -5949,8 +5960,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -6006,8 +6017,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: diff --git a/kubernetes/read-write-mode/logs/loki/values.yaml b/kubernetes/read-write-mode/logs/loki/values.yaml index 78961a72..855e589a 100644 --- a/kubernetes/read-write-mode/logs/loki/values.yaml +++ b/kubernetes/read-write-mode/logs/loki/values.yaml @@ -56,7 +56,7 @@ loki: # -- Docker image repository repository: grafana/loki # -- Overrides the image tag whose default is the chart's appVersion - tag: 3.3.0 + tag: 3.3.1 # -- Overrides the image tag with an image digest digest: null # -- Docker image pull policy @@ -412,7 +412,9 @@ loki: prefix: index_ period: 24h # -- Check https://grafana.com/docs/loki/latest/configuration/#ruler for more info on configuring ruler - rulerConfig: {} + rulerConfig: + wal: + dir: /var/loki/ruler-wal # -- Structured loki configuration, takes precedence over `loki.config`, `loki.schemaConfig`, `loki.storageConfig` structuredConfig: {} # -- Additional query scheduler config @@ -518,7 +520,7 @@ enterprise: # -- Docker image repository repository: grafana/enterprise-logs # -- Docker image tag - tag: 3.3.0 + tag: 3.3.1 # -- Overrides the image tag with an image digest digest: null # -- Docker image pull policy diff --git a/kubernetes/read-write-mode/metrics/k8s-all-in-one.yaml b/kubernetes/read-write-mode/metrics/k8s-all-in-one.yaml index 10b737f4..4900e8ff 100644 --- a/kubernetes/read-write-mode/metrics/k8s-all-in-one.yaml +++ b/kubernetes/read-write-mode/metrics/k8s-all-in-one.yaml @@ -7,8 +7,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system --- @@ -21,8 +21,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy rules: - apiGroups: @@ -125,8 +125,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy roleRef: apiGroup: rbac.authorization.k8s.io @@ -4624,8 +4624,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -4665,8 +4665,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy-cluster namespace: monitoring-system spec: @@ -5019,8 +5019,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -5073,7 +5073,7 @@ spec: - secretRef: name: alloy-env optional: true - image: docker.io/grafana/alloy:v1.5.0 + image: docker.io/grafana/alloy:v1.5.1 imagePullPolicy: IfNotPresent name: alloy ports: @@ -5248,10 +5248,16 @@ spec: description: The receiver could not push some spans to the pipeline under job {{ $labels.job }}. This could be due to reaching a limit such as the ones imposed by otelcol.processor.memory_limiter. - summary: The receiver could not push some spans to the pipeline. - expr: sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) - > 0 - for: 5m + summary: The receiver pushing spans to the pipeline success rate is below + 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_receiver_refused_spans_total{}[1m]) + rate(otelcol_receiver_accepted_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning - alert: OtelcolExporterFailedSpans @@ -5259,10 +5265,15 @@ spec: description: The exporter failed to send spans to their destination under job {{ $labels.job }}. There could be an issue with the payload or with the destination endpoint. - summary: The exporter failed to send spans to their destination. - expr: sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) - > 0 - for: 5m + summary: The exporter sending spans success rate is below 95%. + expr: | + (1 - ( + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m])) + / + sum by (cluster, namespace, job) (rate(otelcol_exporter_send_failed_spans_total{}[1m]) + rate(otelcol_exporter_sent_spans_total{}[1m])) + ) + ) < 0.95 + for: 10m labels: severity: warning --- @@ -5275,8 +5286,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: @@ -5397,8 +5408,8 @@ metadata: app.kubernetes.io/managed-by: Helm app.kubernetes.io/name: alloy app.kubernetes.io/part-of: alloy - app.kubernetes.io/version: v1.5.0 - helm.sh/chart: alloy-0.10.0 + app.kubernetes.io/version: v1.5.1 + helm.sh/chart: alloy-0.10.1 name: alloy namespace: monitoring-system spec: diff --git a/monitoring-mixins/k8s-all-in-one.yaml b/monitoring-mixins/k8s-all-in-one.yaml index c53e4185..e16b8190 100644 --- a/monitoring-mixins/k8s-all-in-one.yaml +++ b/monitoring-mixins/k8s-all-in-one.yaml @@ -3,6 +3,20 @@ data: apiserver.json: |- { "editable": false, + "links": [ + { + "asDropdown": true, + "includeVars": true, + "keepTime": true, + "tags": [ + "kubernetes-mixin", + "infrastucture" + ], + "targetBlank": false, + "title": "Kubernetes", + "type": "dashboards" + } + ], "panels": [ { "datasource": { @@ -20,7 +34,7 @@ data: "options": { "content": "The SLO (service level objective) and other metrics displayed on this dashboard are for informational purposes only." }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "title": "Notice", "type": "text" }, @@ -44,7 +58,7 @@ data: }, "id": 2, "interval": "1m", - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -90,7 +104,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -124,7 +138,7 @@ data: }, "id": 4, "interval": "1m", - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -222,7 +236,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -266,7 +280,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -309,7 +323,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -343,7 +357,7 @@ data: }, "id": 8, "interval": "1m", - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -441,7 +455,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -485,7 +499,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -528,7 +542,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -571,7 +585,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -614,7 +628,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -660,7 +674,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -702,7 +716,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -745,7 +759,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -787,7 +801,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -803,7 +817,7 @@ data: } ], "refresh": "10s", - "schemaVersion": 36, + "schemaVersion": 39, "tags": [ "kubernetes-mixin", "infrastucture" @@ -873,6 +887,20 @@ data: cluster-total.json: |- { "editable": false, + "links": [ + { + "asDropdown": true, + "includeVars": true, + "keepTime": true, + "tags": [ + "kubernetes-mixin", + "infrastucture" + ], + "targetBlank": false, + "title": "Kubernetes", + "type": "dashboards" + } + ], "panels": [ { "datasource": { @@ -906,14 +934,14 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { "type": "prometheus", "uid": "${datasource}" }, - "expr": "sum by (namespace) (rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "sum by (namespace) (\n rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "legendFormat": "__auto" } ], @@ -952,14 +980,14 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { "type": "prometheus", "uid": "${datasource}" }, - "expr": "sum by (namespace) (rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "sum by (namespace) (\n rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "legendFormat": "__auto" } ], @@ -1023,14 +1051,14 @@ data: "y": 9 }, "id": 3, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { "type": "prometheus", "uid": "${datasource}" }, - "expr": "sum by (namespace) (rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "sum by (namespace) (\n rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "format": "table", "instant": true }, @@ -1039,7 +1067,7 @@ data: "type": "prometheus", "uid": "${datasource}" }, - "expr": "sum by (namespace) (rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "sum by (namespace) (\n rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "format": "table", "instant": true }, @@ -1048,7 +1076,7 @@ data: "type": "prometheus", "uid": "${datasource}" }, - "expr": "avg by (namespace) (rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "avg by (namespace) (\n rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "format": "table", "instant": true }, @@ -1057,7 +1085,7 @@ data: "type": "prometheus", "uid": "${datasource}" }, - "expr": "avg by (namespace) (rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "avg by (namespace) (\n rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "format": "table", "instant": true }, @@ -1066,7 +1094,7 @@ data: "type": "prometheus", "uid": "${datasource}" }, - "expr": "sum by (namespace) (rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "sum by (namespace) (\n rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "format": "table", "instant": true }, @@ -1075,7 +1103,7 @@ data: "type": "prometheus", "uid": "${datasource}" }, - "expr": "sum by (namespace) (rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "sum by (namespace) (\n rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "format": "table", "instant": true }, @@ -1084,7 +1112,7 @@ data: "type": "prometheus", "uid": "${datasource}" }, - "expr": "sum by (namespace) (rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "sum by (namespace) (\n rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "format": "table", "instant": true }, @@ -1093,7 +1121,7 @@ data: "type": "prometheus", "uid": "${datasource}" }, - "expr": "sum by (namespace) (rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "sum by (namespace) (\n rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "format": "table", "instant": true } @@ -1188,14 +1216,14 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { "type": "prometheus", "uid": "${datasource}" }, - "expr": "avg by (namespace) (rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "avg by (namespace) (\n rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "legendFormat": "__auto" } ], @@ -1234,14 +1262,14 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { "type": "prometheus", "uid": "${datasource}" }, - "expr": "avg by (namespace) (rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "avg by (namespace) (\n rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "legendFormat": "__auto" } ], @@ -1280,14 +1308,14 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { "type": "prometheus", "uid": "${datasource}" }, - "expr": "sum by (namespace) (rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "sum by (namespace) (\n rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "legendFormat": "__auto" } ], @@ -1326,14 +1354,14 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { "type": "prometheus", "uid": "${datasource}" }, - "expr": "sum by (namespace) (rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "sum by (namespace) (\n rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "legendFormat": "__auto" } ], @@ -1372,14 +1400,14 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { "type": "prometheus", "uid": "${datasource}" }, - "expr": "sum by (namespace) (rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "sum by (namespace) (\n rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "legendFormat": "__auto" } ], @@ -1418,14 +1446,14 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { "type": "prometheus", "uid": "${datasource}" }, - "expr": "sum by (namespace) (rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "sum by (namespace) (\n rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "legendFormat": "__auto" } ], @@ -1464,14 +1492,14 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { "type": "prometheus", "uid": "${datasource}" }, - "expr": "sum by (namespace) (rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "sum by (namespace) (\n rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "legendFormat": "__auto" } ], @@ -1510,14 +1538,14 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { "type": "prometheus", "uid": "${datasource}" }, - "expr": "sum by (namespace) (rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))", + "expr": "sum by (namespace) (\n rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "legendFormat": "__auto" } ], @@ -1556,14 +1584,14 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { "type": "prometheus", "uid": "${datasource}" }, - "expr": "sum by (instance) (rate(node_netstat_Tcp_RetransSegs{cluster=\"$cluster\"}[$__rate_interval]) / rate(node_netstat_Tcp_OutSegs{cluster=\"$cluster\"}[$__rate_interval]))", + "expr": "sum by (instance) (\n rate(node_netstat_Tcp_RetransSegs{cluster=\"$cluster\"}[$__rate_interval]) / rate(node_netstat_Tcp_OutSegs{cluster=\"$cluster\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "legendFormat": "__auto" } ], @@ -1602,14 +1630,14 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { "type": "prometheus", "uid": "${datasource}" }, - "expr": "sum by (instance) (rate(node_netstat_TcpExt_TCPSynRetrans{cluster=\"$cluster\"}[$__rate_interval]) / rate(node_netstat_Tcp_RetransSegs{cluster=\"$cluster\"}[$__rate_interval]))", + "expr": "sum by (instance) (\n rate(node_netstat_TcpExt_TCPSynRetrans{cluster=\"$cluster\"}[$__rate_interval]) / rate(node_netstat_Tcp_RetransSegs{cluster=\"$cluster\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "legendFormat": "__auto" } ], @@ -1618,7 +1646,7 @@ data: } ], "refresh": "10s", - "schemaVersion": 36, + "schemaVersion": 39, "tags": [ "kubernetes-mixin", "infrastucture" @@ -1675,6 +1703,20 @@ data: controller-manager.json: |- { "editable": false, + "links": [ + { + "asDropdown": true, + "includeVars": true, + "keepTime": true, + "tags": [ + "kubernetes-mixin", + "infrastucture" + ], + "targetBlank": false, + "title": "Kubernetes", + "type": "dashboards" + } + ], "panels": [ { "datasource": { @@ -1697,7 +1739,7 @@ data: "options": { "colorMode": "none" }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -1748,7 +1790,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -1799,7 +1841,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -1850,7 +1892,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -1901,7 +1943,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -1976,7 +2018,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -2027,7 +2069,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -2078,7 +2120,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -2129,7 +2171,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -2180,7 +2222,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -2196,7 +2238,7 @@ data: } ], "refresh": "10s", - "schemaVersion": 36, + "schemaVersion": 39, "tags": [ "kubernetes-mixin", "infrastucture" @@ -3447,6 +3489,20 @@ data: k8s-resources-cluster.json: |- { "editable": false, + "links": [ + { + "asDropdown": true, + "includeVars": true, + "keepTime": true, + "tags": [ + "kubernetes-mixin", + "infrastucture" + ], + "targetBlank": false, + "title": "Kubernetes", + "type": "dashboards" + } + ], "panels": [ { "datasource": { @@ -3455,7 +3511,7 @@ data: }, "fieldConfig": { "defaults": { - "unit": "none" + "unit": "percentunit" } }, "gridPos": { @@ -3469,7 +3525,7 @@ data: "options": { "colorMode": "none" }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -3504,7 +3560,7 @@ data: "options": { "colorMode": "none" }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -3539,7 +3595,7 @@ data: "options": { "colorMode": "none" }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -3574,7 +3630,7 @@ data: "options": { "colorMode": "none" }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -3609,7 +3665,7 @@ data: "options": { "colorMode": "none" }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -3644,7 +3700,7 @@ data: "options": { "colorMode": "none" }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -3694,7 +3750,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -3753,7 +3809,7 @@ data: "y": 12 }, "id": 8, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -3910,7 +3966,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -4005,7 +4061,7 @@ data: "y": 24 }, "id": 10, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -4182,7 +4238,7 @@ data: "y": 30 }, "id": 11, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -4326,7 +4382,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -4377,7 +4433,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -4428,7 +4484,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -4479,7 +4535,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -4530,7 +4586,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -4581,7 +4637,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -4632,7 +4688,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -4683,7 +4739,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -4734,7 +4790,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -4785,7 +4841,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -4856,7 +4912,7 @@ data: "y": 96 }, "id": 22, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -4965,7 +5021,7 @@ data: } ], "refresh": "10s", - "schemaVersion": 36, + "schemaVersion": 39, "tags": [ "kubernetes-mixin", "infrastucture" @@ -5022,6 +5078,20 @@ data: k8s-resources-namespace.json: |- { "editable": false, + "links": [ + { + "asDropdown": true, + "includeVars": true, + "keepTime": true, + "tags": [ + "kubernetes-mixin", + "infrastucture" + ], + "targetBlank": false, + "title": "Kubernetes", + "type": "dashboards" + } + ], "panels": [ { "datasource": { @@ -5044,7 +5114,7 @@ data: "options": { "colorMode": "none" }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -5079,7 +5149,7 @@ data: "options": { "colorMode": "none" }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -5114,7 +5184,7 @@ data: "options": { "colorMode": "none" }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -5149,7 +5219,7 @@ data: "options": { "colorMode": "none" }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -5251,7 +5321,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -5266,7 +5336,7 @@ data: "type": "prometheus", "uid": "${datasource}" }, - "expr": "scalar(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"requests.cpu\"})", + "expr": "scalar(max(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"requests.cpu\"}))", "legendFormat": "quota - requests" }, { @@ -5274,7 +5344,7 @@ data: "type": "prometheus", "uid": "${datasource}" }, - "expr": "scalar(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"limits.cpu\"})", + "expr": "scalar(max(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"limits.cpu\"}))", "legendFormat": "quota - limits" } ], @@ -5326,7 +5396,7 @@ data: "y": 14 }, "id": 6, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -5509,7 +5579,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -5524,7 +5594,7 @@ data: "type": "prometheus", "uid": "${datasource}" }, - "expr": "scalar(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"requests.memory\"})", + "expr": "scalar(max(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"requests.memory\"}))", "legendFormat": "quota - requests" }, { @@ -5532,7 +5602,7 @@ data: "type": "prometheus", "uid": "${datasource}" }, - "expr": "scalar(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"limits.memory\"})", + "expr": "scalar(max(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"limits.memory\"}))", "legendFormat": "quota - limits" } ], @@ -5587,7 +5657,7 @@ data: "y": 28 }, "id": 8, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -5777,7 +5847,7 @@ data: "y": 35 }, "id": 9, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -5921,7 +5991,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -5972,7 +6042,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -6023,7 +6093,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -6074,7 +6144,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -6125,7 +6195,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -6176,7 +6246,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -6227,7 +6297,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -6278,7 +6348,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -6349,7 +6419,7 @@ data: "y": 70 }, "id": 18, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -6458,7 +6528,7 @@ data: } ], "refresh": "10s", - "schemaVersion": 36, + "schemaVersion": 39, "tags": [ "kubernetes-mixin", "infrastucture" @@ -6527,743 +6597,518 @@ apiVersion: v1 data: k8s-resources-node.json: |- { - "annotations": { - "list": [ ] - }, - "editable": true, - "gnetId": null, - "graphTooltip": 0, - "hideControls": false, - "links": [ ], - "refresh": "10s", - "rows": [ + "editable": false, + "links": [ { - "collapse": false, - "height": "250px", - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 10, - "id": 1, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 0, - "links": [ ], - "nullPointMode": "null as zero", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "seriesOverrides": [ - { - "alias": "max capacity", - "color": "#F2495C", - "dashes": true, - "fill": 0, - "hiddenSeries": true, - "hideTooltip": true, - "legend": true, - "linewidth": 2, - "stack": false + "asDropdown": true, + "includeVars": true, + "keepTime": true, + "tags": [ + "kubernetes-mixin", + "infrastucture" + ], + "targetBlank": false, + "title": "Kubernetes", + "type": "dashboards" + } + ], + "panels": [ + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true, + "stacking": { + "mode": "normal" } - ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sum(kube_node_status_capacity{cluster=\"$cluster\", node=~\"$node\", resource=\"cpu\"})", - "format": "time_series", - "legendFormat": "max capacity", - "legendLink": null + } + }, + "overrides": [ + { + "matcher": { + "id": "byName", + "options": "max capacity" }, - { - "expr": "sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", - "format": "time_series", - "legendFormat": "{{pod}}", - "legendLink": null - } + "properties": [ + { + "id": "color", + "value": { + "fixedColor": "red", + "mode": "fixed" + } + }, + { + "id": "custom.stacking", + "value": { + "mode": "none" + } + }, + { + "id": "custom.hideFrom", + "value": { + "legend": false, + "tooltip": true, + "viz": false + } + }, + { + "id": "custom.lineStyle", + "value": { + "dash": [ + 10, + 10 + ], + "fill": "dash" + } + } + ] + } + ] + }, + "gridPos": { + "h": 6, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 1, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "CPU Usage", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "sum(kube_node_status_capacity{cluster=\"$cluster\", job=\"integrations/kubernetes/kube-state-metrics\", node=~\"$node\", resource=\"cpu\"})", + "legendFormat": "max capacity" + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false - } - ] + "expr": "sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", + "legendFormat": "{{pod}}" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, "title": "CPU Usage", - "titleSize": "h6" + "type": "timeseries" }, { - "collapse": false, - "height": "250px", - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "id": 2, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null as zero", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": false, - "steppedLine": false, - "styles": [ - { - "alias": "Time", - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "pattern": "Time", - "type": "hidden" - }, - { - "alias": "CPU Usage", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #A", - "thresholds": [ ], - "type": "number", - "unit": "short" - }, - { - "alias": "CPU Requests", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #B", - "thresholds": [ ], - "type": "number", - "unit": "short" - }, - { - "alias": "CPU Requests %", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #C", - "thresholds": [ ], - "type": "number", - "unit": "percentunit" - }, - { - "alias": "CPU Limits", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #D", - "thresholds": [ ], - "type": "number", - "unit": "short" - }, - { - "alias": "CPU Limits %", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #E", - "thresholds": [ ], - "type": "number", - "unit": "percentunit" - }, - { - "alias": "Pod", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "pod", - "thresholds": [ ], - "type": "number", - "unit": "short" - }, - { - "alias": "", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "pattern": "/.*/", - "thresholds": [ ], - "type": "string", - "unit": "short" - } - ], - "targets": [ - { - "expr": "sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "A" - }, - { - "expr": "sum(cluster:namespace:pod_cpu:active:kube_pod_container_resource_requests{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "B" - }, - { - "expr": "sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=\"$cluster\", node=~\"$node\"}) by (pod) / sum(cluster:namespace:pod_cpu:active:kube_pod_container_resource_requests{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "C" + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "overrides": [ + { + "matcher": { + "id": "byRegexp", + "options": "/%/" }, - { - "expr": "sum(cluster:namespace:pod_cpu:active:kube_pod_container_resource_limits{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "D" + "properties": [ + { + "id": "unit", + "value": "percentunit" + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Pod" }, - { - "expr": "sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=\"$cluster\", node=~\"$node\"}) by (pod) / sum(cluster:namespace:pod_cpu:active:kube_pod_container_resource_limits{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "E" - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "CPU Quota", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "properties": [ + { + "id": "links", + "value": [ + { + "title": "Drill down to pods", + "url": "/d/6581e46e4e5c7ba40a07646395ef7b23/k8s-resources-pod?${datasource:queryparam}&var-cluster=$cluster&var-namespace=$namespace&var-pod=${__data.fields.Pod}" + } + ] + } + ] + } + ] + }, + "gridPos": { + "h": 6, + "w": 24, + "x": 0, + "y": 6 + }, + "id": 2, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "transform": "table", - "type": "table", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true + "expr": "sum(cluster:namespace:pod_cpu:active:kube_pod_container_resource_requests{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=\"$cluster\", node=~\"$node\"}) by (pod) / sum(cluster:namespace:pod_cpu:active:kube_pod_container_resource_requests{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(cluster:namespace:pod_cpu:active:kube_pod_container_resource_limits{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=\"$cluster\", node=~\"$node\"}) by (pod) / sum(cluster:namespace:pod_cpu:active:kube_pod_container_resource_limits{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", + "format": "table", + "instant": true + } + ], + "title": "CPU Quota", + "transformations": [ + { + "id": "joinByField", + "options": { + "byField": "pod", + "mode": "outer" + } + }, + { + "id": "organize", + "options": { + "excludeByName": { + "Time": true, + "Time 1": true, + "Time 2": true, + "Time 3": true, + "Time 4": true, + "Time 5": true }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false + "renameByName": { + "Value #A": "CPU Usage", + "Value #B": "CPU Requests", + "Value #C": "CPU Requests %", + "Value #D": "CPU Limits", + "Value #E": "CPU Limits %", + "pod": "Pod" } - ] + } } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "CPU Quota", - "titleSize": "h6" + "type": "table" }, { - "collapse": false, - "height": "250px", - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 10, - "id": 3, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 0, - "links": [ ], - "nullPointMode": "null as zero", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "seriesOverrides": [ - { - "alias": "max capacity", - "color": "#F2495C", - "dashes": true, - "fill": 0, - "hiddenSeries": true, - "hideTooltip": true, - "legend": true, - "linewidth": 2, - "stack": false - } - ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sum(kube_node_status_capacity{cluster=\"$cluster\", node=~\"$node\", resource=\"memory\"})", - "format": "time_series", - "legendFormat": "max capacity", - "legendLink": null - }, - { - "expr": "sum(node_namespace_pod_container:container_memory_working_set_bytes{cluster=\"$cluster\", node=~\"$node\", container!=\"\"}) by (pod)", - "format": "time_series", - "legendFormat": "{{pod}}", - "legendLink": null + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true, + "stacking": { + "mode": "normal" } + }, + "unit": "bytes" + }, + "overrides": [ + { + "matcher": { + "id": "byName", + "options": "max capacity" + }, + "properties": [ + { + "id": "color", + "value": { + "fixedColor": "red", + "mode": "fixed" + } + }, + { + "id": "custom.stacking", + "value": { + "mode": "none" + } + }, + { + "id": "custom.hideFrom", + "value": { + "legend": false, + "tooltip": true, + "viz": false + } + }, + { + "id": "custom.lineStyle", + "value": { + "dash": [ + 10, + 10 + ], + "fill": "dash" + } + } + ] + } + ] + }, + "gridPos": { + "h": 6, + "w": 24, + "x": 0, + "y": 12 + }, + "id": 3, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Memory Usage (w/o cache)", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "sum(kube_node_status_capacity{cluster=\"$cluster\", job=\"integrations/kubernetes/kube-state-metrics\", node=~\"$node\", resource=\"memory\"})", + "legendFormat": "max capacity" + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "bytes", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false - } - ] + "expr": "sum(node_namespace_pod_container:container_memory_working_set_bytes{cluster=\"$cluster\", node=~\"$node\", container!=\"\"}) by (pod)", + "legendFormat": "{{pod}}" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Memory Usage", - "titleSize": "h6" + "title": "Memory Usage (w/o cache)", + "type": "timeseries" }, { - "collapse": false, - "height": "250px", - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "id": 4, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null as zero", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": false, - "steppedLine": false, - "styles": [ - { - "alias": "Time", - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "pattern": "Time", - "type": "hidden" - }, - { - "alias": "Memory Usage", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #A", - "thresholds": [ ], - "type": "number", - "unit": "bytes" - }, - { - "alias": "Memory Requests", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #B", - "thresholds": [ ], - "type": "number", - "unit": "bytes" - }, - { - "alias": "Memory Requests %", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #C", - "thresholds": [ ], - "type": "number", - "unit": "percentunit" - }, - { - "alias": "Memory Limits", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #D", - "thresholds": [ ], - "type": "number", - "unit": "bytes" - }, - { - "alias": "Memory Limits %", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #E", - "thresholds": [ ], - "type": "number", - "unit": "percentunit" - }, - { - "alias": "Memory Usage (RSS)", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #F", - "thresholds": [ ], - "type": "number", - "unit": "bytes" - }, - { - "alias": "Memory Usage (Cache)", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #G", - "thresholds": [ ], - "type": "number", - "unit": "bytes" - }, - { - "alias": "Memory Usage (Swap)", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #H", - "thresholds": [ ], - "type": "number", - "unit": "bytes" - }, - { - "alias": "Pod", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "pod", - "thresholds": [ ], - "type": "number", - "unit": "short" - }, - { - "alias": "", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "pattern": "/.*/", - "thresholds": [ ], - "type": "string", - "unit": "short" - } - ], - "targets": [ - { - "expr": "sum(node_namespace_pod_container:container_memory_working_set_bytes{cluster=\"$cluster\", node=~\"$node\",container!=\"\"}) by (pod)", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "A" - }, - { - "expr": "sum(cluster:namespace:pod_memory:active:kube_pod_container_resource_requests{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "B" - }, - { - "expr": "sum(node_namespace_pod_container:container_memory_working_set_bytes{cluster=\"$cluster\", node=~\"$node\",container!=\"\"}) by (pod) / sum(cluster:namespace:pod_memory:active:kube_pod_container_resource_requests{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "C" - }, - { - "expr": "sum(cluster:namespace:pod_memory:active:kube_pod_container_resource_limits{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "D" - }, - { - "expr": "sum(node_namespace_pod_container:container_memory_working_set_bytes{cluster=\"$cluster\", node=~\"$node\",container!=\"\"}) by (pod) / sum(cluster:namespace:pod_memory:active:kube_pod_container_resource_limits{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "E" - }, - { - "expr": "sum(node_namespace_pod_container:container_memory_rss{cluster=\"$cluster\", node=~\"$node\",container!=\"\"}) by (pod)", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "F" + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "unit": "bytes" + }, + "overrides": [ + { + "matcher": { + "id": "byRegexp", + "options": "/%/" }, - { - "expr": "sum(node_namespace_pod_container:container_memory_cache{cluster=\"$cluster\", node=~\"$node\",container!=\"\"}) by (pod)", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "G" + "properties": [ + { + "id": "unit", + "value": "percentunit" + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Pod" }, - { - "expr": "sum(node_namespace_pod_container:container_memory_swap{cluster=\"$cluster\", node=~\"$node\",container!=\"\"}) by (pod)", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "H" - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Memory Quota", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "properties": [ + { + "id": "links", + "value": [ + { + "title": "Drill down to pods", + "url": "/d/6581e46e4e5c7ba40a07646395ef7b23/k8s-resources-pod?${datasource:queryparam}&var-cluster=$cluster&var-namespace=$namespace&var-pod=${__data.fields.Pod}" + } + ] + } + ] + } + ] + }, + "gridPos": { + "h": 6, + "w": 24, + "x": 0, + "y": 18 + }, + "id": 4, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "transform": "table", - "type": "table", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "sum(node_namespace_pod_container:container_memory_working_set_bytes{cluster=\"$cluster\", node=~\"$node\",container!=\"\"}) by (pod)", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true + "expr": "sum(cluster:namespace:pod_memory:active:kube_pod_container_resource_requests{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(node_namespace_pod_container:container_memory_working_set_bytes{cluster=\"$cluster\", node=~\"$node\",container!=\"\"}) by (pod) / sum(cluster:namespace:pod_memory:active:kube_pod_container_resource_requests{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(cluster:namespace:pod_memory:active:kube_pod_container_resource_limits{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(node_namespace_pod_container:container_memory_working_set_bytes{cluster=\"$cluster\", node=~\"$node\",container!=\"\"}) by (pod) / sum(cluster:namespace:pod_memory:active:kube_pod_container_resource_limits{cluster=\"$cluster\", node=~\"$node\"}) by (pod)", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(node_namespace_pod_container:container_memory_rss{cluster=\"$cluster\", node=~\"$node\",container!=\"\"}) by (pod)", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(node_namespace_pod_container:container_memory_cache{cluster=\"$cluster\", node=~\"$node\",container!=\"\"}) by (pod)", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(node_namespace_pod_container:container_memory_swap{cluster=\"$cluster\", node=~\"$node\",container!=\"\"}) by (pod)", + "format": "table", + "instant": true + } + ], + "title": "Memory Quota", + "transformations": [ + { + "id": "joinByField", + "options": { + "byField": "pod", + "mode": "outer" + } + }, + { + "id": "organize", + "options": { + "excludeByName": { + "Time": true, + "Time 1": true, + "Time 2": true, + "Time 3": true, + "Time 4": true, + "Time 5": true, + "Time 6": true, + "Time 7": true, + "Time 8": true }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false + "renameByName": { + "Value #A": "Memory Usage", + "Value #B": "Memory Requests", + "Value #C": "Memory Requests %", + "Value #D": "Memory Limits", + "Value #E": "Memory Limits %", + "Value #F": "Memory Usage (RSS)", + "Value #G": "Memory Usage (Cache)", + "Value #H": "Memory Usage (Swap)", + "pod": "Pod" } - ] + } } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Memory Quota", - "titleSize": "h6" + "type": "table" } ], - "schemaVersion": 14, - "style": "dark", + "refresh": "10s", + "schemaVersion": 39, "tags": [ "kubernetes-mixin", "infrastucture" @@ -7272,63 +7117,42 @@ data: "list": [ { "current": { + "selected": true, "text": "Metrics", "value": "Metrics" }, "hide": 0, "label": "Data source", "name": "datasource", - "options": [ ], "query": "prometheus", - "refresh": 1, "regex": "", "type": "datasource" }, { - "allValue": null, - "current": { - "text": "", - "value": "" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "datasource": "$datasource", "hide": 0, - "includeAll": false, - "label": null, - "multi": false, + "label": "cluster", "name": "cluster", - "options": [ ], "query": "label_values(up{job=\"integrations/kubernetes/kube-state-metrics\"}, cluster)", "refresh": 2, - "regex": "", "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "type": "query" }, { - "allValue": null, - "current": { - "text": "", - "value": "" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "datasource": "$datasource", "hide": 0, - "includeAll": false, - "label": null, + "label": "node", "multi": true, "name": "node", - "options": [ ], "query": "label_values(kube_node_info{cluster=\"$cluster\"}, node)", "refresh": 2, - "regex": "", - "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "type": "query" } ] }, @@ -7336,35 +7160,9 @@ data: "from": "now-1h", "to": "now" }, - "timepicker": { - "refresh_intervals": [ - "5s", - "10s", - "30s", - "1m", - "5m", - "15m", - "30m", - "1h", - "2h", - "1d" - ], - "time_options": [ - "5m", - "15m", - "1h", - "6h", - "12h", - "24h", - "2d", - "7d", - "30d" - ] - }, "timezone": "browser", "title": "Kubernetes / Compute Resources / Node (Pods)", - "uid": "200ac8fdbfbb74b39aff88118e4d1c2c", - "version": 0 + "uid": "200ac8fdbfbb74b39aff88118e4d1c2c" } kind: ConfigMap metadata: @@ -7380,6 +7178,20 @@ data: k8s-resources-pod.json: |- { "editable": false, + "links": [ + { + "asDropdown": true, + "includeVars": true, + "keepTime": true, + "tags": [ + "kubernetes-mixin", + "infrastucture" + ], + "targetBlank": false, + "title": "Kubernetes", + "type": "dashboards" + } + ], "panels": [ { "datasource": { @@ -7469,7 +7281,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -7575,7 +7387,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -7617,7 +7429,7 @@ data: "y": 14 }, "id": 3, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -7800,7 +7612,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -7861,7 +7673,7 @@ data: "y": 28 }, "id": 5, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -8031,7 +7843,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -8082,7 +7894,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -8133,7 +7945,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -8184,7 +7996,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -8235,7 +8047,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -8286,7 +8098,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -8337,7 +8149,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -8396,7 +8208,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -8455,7 +8267,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -8506,7 +8318,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -8560,7 +8372,7 @@ data: "y": 70 }, "id": 16, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -8669,7 +8481,7 @@ data: } ], "refresh": "10s", - "schemaVersion": 36, + "schemaVersion": 39, "tags": [ "kubernetes-mixin", "infrastucture" @@ -8752,6 +8564,20 @@ data: k8s-resources-workload.json: |- { "editable": false, + "links": [ + { + "asDropdown": true, + "includeVars": true, + "keepTime": true, + "tags": [ + "kubernetes-mixin", + "infrastucture" + ], + "targetBlank": false, + "title": "Kubernetes", + "type": "dashboards" + } + ], "panels": [ { "datasource": { @@ -8789,7 +8615,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -8848,7 +8674,7 @@ data: "y": 7 }, "id": 2, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -8979,7 +8805,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -9041,7 +8867,7 @@ data: "y": 21 }, "id": 4, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -9192,7 +9018,7 @@ data: "y": 28 }, "id": 5, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -9336,7 +9162,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -9387,7 +9213,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -9438,7 +9264,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -9489,7 +9315,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -9540,7 +9366,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -9591,7 +9417,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -9642,7 +9468,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -9693,7 +9519,7 @@ data: "mode": "single" } }, - "pluginVersion": "v10.4.0", + "pluginVersion": "v11.1.0", "targets": [ { "datasource": { @@ -9709,7 +9535,7 @@ data: } ], "refresh": "10s", - "schemaVersion": 36, + "schemaVersion": 39, "tags": [ "kubernetes-mixin", "infrastucture" @@ -9805,1687 +9631,1189 @@ apiVersion: v1 data: k8s-resources-workloads-namespace.json: |- { - "annotations": { - "list": [ ] - }, - "editable": true, - "gnetId": null, - "graphTooltip": 0, - "hideControls": false, - "links": [ ], - "refresh": "10s", - "rows": [ + "editable": false, + "links": [ { - "collapse": false, - "height": "250px", - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 10, - "id": 1, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 0, - "links": [ ], - "nullPointMode": "null as zero", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "seriesOverrides": [ - { - "alias": "quota - requests", - "color": "#F2495C", - "dashes": true, - "fill": 0, - "hiddenSeries": true, - "hideTooltip": true, - "legend": true, - "linewidth": 2, - "stack": false - }, - { - "alias": "quota - limits", - "color": "#FF9830", - "dashes": true, - "fill": 0, - "hiddenSeries": true, - "hideTooltip": true, - "legend": true, - "linewidth": 2, - "stack": false - } - ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sum(\n node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=\"$cluster\", namespace=\"$namespace\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", - "format": "time_series", - "legendFormat": "{{workload}} - {{workload_type}}", - "legendLink": null + "asDropdown": true, + "includeVars": true, + "keepTime": true, + "tags": [ + "kubernetes-mixin", + "infrastucture" + ], + "targetBlank": false, + "title": "Kubernetes", + "type": "dashboards" + } + ], + "panels": [ + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + } + }, + "overrides": [ + { + "matcher": { + "id": "byFrameRefID", + "options": "B" }, - { - "expr": "scalar(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"requests.cpu\"})", - "format": "time_series", - "legendFormat": "quota - requests", - "legendLink": null + "properties": [ + { + "id": "custom.lineStyle", + "value": { + "fill": "dash" + } + }, + { + "id": "custom.lineWidth", + "value": 2 + }, + { + "id": "color", + "value": { + "fixedColor": "red", + "mode": "fixed" + } + } + ] + }, + { + "matcher": { + "id": "byFrameRefID", + "options": "C" }, - { - "expr": "scalar(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"limits.cpu\"})", - "format": "time_series", - "legendFormat": "quota - limits", - "legendLink": null - } + "properties": [ + { + "id": "custom.lineStyle", + "value": { + "fill": "dash" + } + }, + { + "id": "custom.lineWidth", + "value": 2 + }, + { + "id": "color", + "value": { + "fixedColor": "orange", + "mode": "fixed" + } + } + ] + } + ] + }, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 0 + }, + "id": 1, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "CPU Usage", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "sum(\n node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=\"$cluster\", namespace=\"$namespace\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", + "legendFormat": "{{workload}} - {{workload_type}}" + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false - } - ] + "expr": "scalar(max(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=~\"requests.cpu|cpu\"}))", + "legendFormat": "quota - requests" + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "scalar(max(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=~\"limits.cpu\"}))", + "legendFormat": "quota - limits" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, "title": "CPU Usage", - "titleSize": "h6" + "type": "timeseries" }, { - "collapse": false, - "height": "250px", - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "id": 2, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null as zero", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": false, - "steppedLine": false, - "styles": [ - { - "alias": "Time", - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "pattern": "Time", - "type": "hidden" - }, - { - "alias": "Running Pods", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 0, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #A", - "thresholds": [ ], - "type": "number", - "unit": "short" - }, - { - "alias": "CPU Usage", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #B", - "thresholds": [ ], - "type": "number", - "unit": "short" - }, - { - "alias": "CPU Requests", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #C", - "thresholds": [ ], - "type": "number", - "unit": "short" - }, - { - "alias": "CPU Requests %", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #D", - "thresholds": [ ], - "type": "number", - "unit": "percentunit" - }, - { - "alias": "CPU Limits", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #E", - "thresholds": [ ], - "type": "number", - "unit": "short" - }, - { - "alias": "CPU Limits %", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #F", - "thresholds": [ ], - "type": "number", - "unit": "percentunit" - }, - { - "alias": "Workload", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": true, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "/d/a164a7f0339f99e89cea5cb47e9be617/k8s-resources-workload?var-datasource=$datasource&var-cluster=$cluster&var-namespace=$namespace&var-workload=$__cell&var-type=$__cell_2", - "pattern": "workload", - "thresholds": [ ], - "type": "number", - "unit": "short" - }, - { - "alias": "Workload Type", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "workload_type", - "thresholds": [ ], - "type": "number", - "unit": "short" - }, - { - "alias": "", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "pattern": "/.*/", - "thresholds": [ ], - "type": "string", - "unit": "short" - } - ], - "targets": [ - { - "expr": "count(namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}) by (workload, workload_type)", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "A" - }, - { - "expr": "sum(\n node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=\"$cluster\", namespace=\"$namespace\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "B" - }, - { - "expr": "sum(\n kube_pod_container_resource_requests{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\", namespace=\"$namespace\", resource=\"cpu\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "C" + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "overrides": [ + { + "matcher": { + "id": "byRegexp", + "options": "/%/" }, - { - "expr": "sum(\n node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=\"$cluster\", namespace=\"$namespace\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n/sum(\n kube_pod_container_resource_requests{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\", namespace=\"$namespace\", resource=\"cpu\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "D" + "properties": [ + { + "id": "unit", + "value": "percentunit" + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Workload" }, - { - "expr": "sum(\n kube_pod_container_resource_limits{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\", namespace=\"$namespace\", resource=\"cpu\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "E" + "properties": [ + { + "id": "links", + "value": [ + { + "title": "Drill down to workloads", + "url": "/d/a164a7f0339f99e89cea5cb47e9be617/k8s-resources-workload?${datasource:queryparam}&var-cluster=$cluster&var-namespace=$namespace&var-type=${__data.fields.Type}&var-workload=${__data.fields.Workload}" + } + ] + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Running Pods" }, - { - "expr": "sum(\n node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=\"$cluster\", namespace=\"$namespace\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n/sum(\n kube_pod_container_resource_limits{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\", namespace=\"$namespace\", resource=\"cpu\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "F" - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "CPU Quota", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "properties": [ + { + "id": "unit", + "value": "none" + } + ] + } + ] + }, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 7 + }, + "id": 2, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "transform": "table", - "type": "table", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "count(namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}) by (workload, workload_type)", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true + "expr": "sum(\n node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=\"$cluster\", namespace=\"$namespace\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(\n kube_pod_container_resource_requests{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\", namespace=\"$namespace\", resource=\"cpu\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(\n node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=\"$cluster\", namespace=\"$namespace\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n/sum(\n kube_pod_container_resource_requests{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\", namespace=\"$namespace\", resource=\"cpu\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(\n kube_pod_container_resource_limits{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\", namespace=\"$namespace\", resource=\"cpu\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(\n node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=\"$cluster\", namespace=\"$namespace\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n/sum(\n kube_pod_container_resource_limits{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\", namespace=\"$namespace\", resource=\"cpu\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true + } + ], + "title": "CPU Quota", + "transformations": [ + { + "id": "joinByField", + "options": { + "byField": "workload", + "mode": "outer" + } + }, + { + "id": "organize", + "options": { + "excludeByName": { + "Time": true, + "Time 1": true, + "Time 2": true, + "Time 3": true, + "Time 4": true, + "Time 5": true, + "Time 6": true, + "workload_type 2": true, + "workload_type 3": true, + "workload_type 4": true, + "workload_type 5": true, + "workload_type 6": true }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false + "indexByName": { + "Time 1": 0, + "Time 2": 1, + "Time 3": 2, + "Time 4": 3, + "Time 5": 4, + "Time 6": 5, + "Value #A": 8, + "Value #B": 9, + "Value #C": 10, + "Value #D": 11, + "Value #E": 12, + "Value #F": 13, + "workload": 6, + "workload_type 1": 7, + "workload_type 2": 14, + "workload_type 3": 15, + "workload_type 4": 16, + "workload_type 5": 17, + "workload_type 6": 18 + }, + "renameByName": { + "Value #A": "Running Pods", + "Value #B": "CPU Usage", + "Value #C": "CPU Requests", + "Value #D": "CPU Requests %", + "Value #E": "CPU Limits", + "Value #F": "CPU Limits %", + "workload": "Workload", + "workload_type 1": "Type" } - ] + } } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "CPU Quota", - "titleSize": "h6" + "type": "table" }, { - "collapse": false, - "height": "250px", - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 10, - "id": 3, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": true, - "linewidth": 0, - "links": [ ], - "nullPointMode": "null as zero", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "seriesOverrides": [ - { - "alias": "quota - requests", - "color": "#F2495C", - "dashes": true, - "fill": 0, - "hiddenSeries": true, - "hideTooltip": true, - "legend": true, - "linewidth": 2, - "stack": false - }, - { - "alias": "quota - limits", - "color": "#FF9830", - "dashes": true, - "fill": 0, - "hiddenSeries": true, - "hideTooltip": true, - "legend": true, - "linewidth": 2, - "stack": false - } - ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sum(\n container_memory_working_set_bytes{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\", container!=\"\", image!=\"\"}\n * on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", - "format": "time_series", - "legendFormat": "{{workload}} - {{workload_type}}", - "legendLink": null + "unit": "bytes" + }, + "overrides": [ + { + "matcher": { + "id": "byFrameRefID", + "options": "B" }, - { - "expr": "scalar(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"requests.memory\"})", - "format": "time_series", - "legendFormat": "quota - requests", - "legendLink": null + "properties": [ + { + "id": "custom.lineStyle", + "value": { + "fill": "dash" + } + }, + { + "id": "custom.lineWidth", + "value": 2 + }, + { + "id": "color", + "value": { + "fixedColor": "red", + "mode": "fixed" + } + } + ] + }, + { + "matcher": { + "id": "byFrameRefID", + "options": "C" }, - { - "expr": "scalar(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"limits.memory\"})", - "format": "time_series", - "legendFormat": "quota - limits", - "legendLink": null - } + "properties": [ + { + "id": "custom.lineStyle", + "value": { + "fill": "dash" + } + }, + { + "id": "custom.lineWidth", + "value": 2 + }, + { + "id": "color", + "value": { + "fixedColor": "orange", + "mode": "fixed" + } + } + ] + } + ] + }, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 14 + }, + "id": 3, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Memory Usage", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "sum(\n container_memory_working_set_bytes{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\", container!=\"\", image!=\"\"}\n * on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", + "legendFormat": "{{workload}} - {{workload_type}}" + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "bytes", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false - } - ] + "expr": "scalar(max(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=~\"requests.memory|memory\"}))", + "legendFormat": "quota - requests" + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "scalar(max(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=~\"limits.memory\"}))", + "legendFormat": "quota - limits" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, "title": "Memory Usage", - "titleSize": "h6" + "type": "timeseries" }, { - "collapse": false, - "height": "250px", - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "id": 4, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null as zero", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": false, - "steppedLine": false, - "styles": [ - { - "alias": "Time", - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "pattern": "Time", - "type": "hidden" - }, - { - "alias": "Running Pods", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 0, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #A", - "thresholds": [ ], - "type": "number", - "unit": "short" - }, - { - "alias": "Memory Usage", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #B", - "thresholds": [ ], - "type": "number", - "unit": "bytes" - }, - { - "alias": "Memory Requests", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #C", - "thresholds": [ ], - "type": "number", - "unit": "bytes" - }, - { - "alias": "Memory Requests %", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #D", - "thresholds": [ ], - "type": "number", - "unit": "percentunit" - }, - { - "alias": "Memory Limits", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #E", - "thresholds": [ ], - "type": "number", - "unit": "bytes" - }, - { - "alias": "Memory Limits %", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #F", - "thresholds": [ ], - "type": "number", - "unit": "percentunit" - }, - { - "alias": "Workload", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": true, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "/d/a164a7f0339f99e89cea5cb47e9be617/k8s-resources-workload?var-datasource=$datasource&var-cluster=$cluster&var-namespace=$namespace&var-workload=$__cell&var-type=$__cell_2", - "pattern": "workload", - "thresholds": [ ], - "type": "number", - "unit": "short" - }, - { - "alias": "Workload Type", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "workload_type", - "thresholds": [ ], - "type": "number", - "unit": "short" - }, - { - "alias": "", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "pattern": "/.*/", - "thresholds": [ ], - "type": "string", - "unit": "short" - } - ], - "targets": [ - { - "expr": "count(namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}) by (workload, workload_type)", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "A" - }, - { - "expr": "sum(\n container_memory_working_set_bytes{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\", container!=\"\", image!=\"\"}\n * on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "B" - }, - { - "expr": "sum(\n kube_pod_container_resource_requests{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\", namespace=\"$namespace\", resource=\"memory\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "C" + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "unit": "bytes" + }, + "overrides": [ + { + "matcher": { + "id": "byRegexp", + "options": "/%/" }, - { - "expr": "sum(\n container_memory_working_set_bytes{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\", container!=\"\", image!=\"\"}\n * on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n/sum(\n kube_pod_container_resource_requests{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\", namespace=\"$namespace\", resource=\"memory\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "D" + "properties": [ + { + "id": "unit", + "value": "percentunit" + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Workload" }, - { - "expr": "sum(\n kube_pod_container_resource_limits{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\", namespace=\"$namespace\", resource=\"memory\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "E" + "properties": [ + { + "id": "links", + "value": [ + { + "title": "Drill down to workloads", + "url": "/d/a164a7f0339f99e89cea5cb47e9be617/k8s-resources-workload?${datasource:queryparam}&var-cluster=$cluster&var-namespace=$namespace&var-type=${__data.fields.Type}&var-workload=${__data.fields.Workload}" + } + ] + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Running Pods" }, - { - "expr": "sum(\n container_memory_working_set_bytes{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\", container!=\"\", image!=\"\"}\n * on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n/sum(\n kube_pod_container_resource_limits{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\", namespace=\"$namespace\", resource=\"memory\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "F" - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Memory Quota", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "properties": [ + { + "id": "unit", + "value": "none" + } + ] + } + ] + }, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 21 + }, + "id": 4, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "transform": "table", - "type": "table", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "count(namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}) by (workload, workload_type)", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false - } - ] + "expr": "sum(\n container_memory_working_set_bytes{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\", container!=\"\", image!=\"\"}\n * on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(\n kube_pod_container_resource_requests{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\", namespace=\"$namespace\", resource=\"memory\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(\n container_memory_working_set_bytes{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\", container!=\"\", image!=\"\"}\n * on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n/sum(\n kube_pod_container_resource_requests{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\", namespace=\"$namespace\", resource=\"memory\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(\n kube_pod_container_resource_limits{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\", namespace=\"$namespace\", resource=\"memory\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(\n container_memory_working_set_bytes{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\", container!=\"\", image!=\"\"}\n * on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n/sum(\n kube_pod_container_resource_limits{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\", namespace=\"$namespace\", resource=\"memory\"}\n* on(namespace,pod)\n group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}\n) by (workload, workload_type)\n", + "format": "table", + "instant": true } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, "title": "Memory Quota", - "titleSize": "h6" - }, - { - "collapse": false, - "height": "250px", - "panels": [ + "transformations": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "id": 5, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null as zero", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": false, - "steppedLine": false, - "styles": [ - { - "alias": "Time", - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "pattern": "Time", - "type": "hidden" - }, - { - "alias": "Current Receive Bandwidth", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #A", - "thresholds": [ ], - "type": "number", - "unit": "Bps" - }, - { - "alias": "Current Transmit Bandwidth", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #B", - "thresholds": [ ], - "type": "number", - "unit": "Bps" - }, - { - "alias": "Rate of Received Packets", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #C", - "thresholds": [ ], - "type": "number", - "unit": "pps" - }, - { - "alias": "Rate of Transmitted Packets", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #D", - "thresholds": [ ], - "type": "number", - "unit": "pps" - }, - { - "alias": "Rate of Received Packets Dropped", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #E", - "thresholds": [ ], - "type": "number", - "unit": "pps" - }, - { - "alias": "Rate of Transmitted Packets Dropped", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #F", - "thresholds": [ ], - "type": "number", - "unit": "pps" - }, - { - "alias": "Workload", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": true, - "linkTargetBlank": false, - "linkTooltip": "Drill down to pods", - "linkUrl": "/d/a164a7f0339f99e89cea5cb47e9be617/k8s-resources-workload?var-datasource=$datasource&var-cluster=$cluster&var-namespace=$namespace&var-workload=$__cell&var-type=$type", - "pattern": "workload", - "thresholds": [ ], - "type": "number", - "unit": "short" + "id": "joinByField", + "options": { + "byField": "workload", + "mode": "outer" + } + }, + { + "id": "organize", + "options": { + "excludeByName": { + "Time": true, + "Time 1": true, + "Time 2": true, + "Time 3": true, + "Time 4": true, + "Time 5": true, + "Time 6": true, + "workload_type 2": true, + "workload_type 3": true, + "workload_type 4": true, + "workload_type 5": true, + "workload_type 6": true }, - { - "alias": "Workload Type", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTargetBlank": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "workload_type", - "thresholds": [ ], - "type": "number", - "unit": "short" + "indexByName": { + "Time 1": 0, + "Time 2": 1, + "Time 3": 2, + "Time 4": 3, + "Time 5": 4, + "Time 6": 5, + "Value #A": 8, + "Value #B": 9, + "Value #C": 10, + "Value #D": 11, + "Value #E": 12, + "Value #F": 13, + "workload": 6, + "workload_type 1": 7, + "workload_type 2": 14, + "workload_type 3": 15, + "workload_type 4": 16, + "workload_type 5": 17, + "workload_type 6": 18 }, - { - "alias": "", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "pattern": "/.*/", - "thresholds": [ ], - "type": "string", - "unit": "short" + "renameByName": { + "Value #A": "Running Pods", + "Value #B": "Memory Usage", + "Value #C": "Memory Requests", + "Value #D": "Memory Requests %", + "Value #E": "Memory Limits", + "Value #F": "Memory Limits %", + "workload": "Workload", + "workload_type 1": "Type" } - ], - "targets": [ - { - "expr": "(sum(irate(container_network_receive_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}) by (workload))\n", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "A" - }, - { - "expr": "(sum(irate(container_network_transmit_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}) by (workload))\n", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "B" - }, - { - "expr": "(sum(irate(container_network_receive_packets_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}) by (workload))\n", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "C" + } + } + ], + "type": "table" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "overrides": [ + { + "matcher": { + "id": "byRegexp", + "options": "/Bandwidth/" }, - { - "expr": "(sum(irate(container_network_transmit_packets_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}) by (workload))\n", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "D" + "properties": [ + { + "id": "unit", + "value": "Bps" + } + ] + }, + { + "matcher": { + "id": "byRegexp", + "options": "/Packets/" }, - { - "expr": "(sum(irate(container_network_receive_packets_dropped_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}) by (workload))\n", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "E" + "properties": [ + { + "id": "unit", + "value": "pps" + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Workload" }, - { - "expr": "(sum(irate(container_network_transmit_packets_dropped_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}) by (workload))\n", - "format": "table", - "instant": true, - "legendFormat": "", - "refId": "F" - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Current Network Usage", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "properties": [ + { + "id": "links", + "value": [ + { + "title": "Drill down to workloads", + "url": "/d/a164a7f0339f99e89cea5cb47e9be617/k8s-resources-workload?${datasource:queryparam}&var-cluster=$cluster&var-namespace=$namespace&var-type=${__data.fields.Type}&var-workload=${__data.fields.Workload}" + } + ] + } + ] + } + ] + }, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 28 + }, + "id": 5, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "transform": "table", - "type": "table", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "(sum(rate(container_network_receive_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}) by (workload))\n", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "(sum(rate(container_network_transmit_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}) by (workload))\n", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "(sum(rate(container_network_receive_packets_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}) by (workload))\n", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "(sum(rate(container_network_transmit_packets_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}) by (workload))\n", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "(sum(rate(container_network_receive_packets_dropped_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}) by (workload))\n", + "format": "table", + "instant": true + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true + "expr": "(sum(rate(container_network_transmit_packets_dropped_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload_type=~\"$type\"}) by (workload))\n", + "format": "table", + "instant": true + } + ], + "title": "Current Network Usage", + "transformations": [ + { + "id": "joinByField", + "options": { + "byField": "workload", + "mode": "outer" + } + }, + { + "id": "organize", + "options": { + "excludeByName": { + "Time": true, + "Time 1": true, + "Time 2": true, + "Time 3": true, + "Time 4": true, + "Time 5": true, + "Time 6": true }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false + "indexByName": { + "Time 1": 0, + "Time 2": 1, + "Time 3": 2, + "Time 4": 3, + "Time 5": 4, + "Time 6": 5, + "Value #A": 7, + "Value #B": 8, + "Value #C": 9, + "Value #D": 10, + "Value #E": 11, + "Value #F": 12, + "workload": 6 + }, + "renameByName": { + "Value #A": "Current Receive Bandwidth", + "Value #B": "Current Transmit Bandwidth", + "Value #C": "Rate of Received Packets", + "Value #D": "Rate of Transmitted Packets", + "Value #E": "Rate of Received Packets Dropped", + "Value #F": "Rate of Transmitted Packets Dropped", + "workload": "Workload" } - ] + } } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Current Network Usage", - "titleSize": "h6" + "type": "table" }, { - "collapse": false, - "height": "250px", - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 10, - "id": 6, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": true, - "linewidth": 0, - "links": [ ], - "nullPointMode": "null as zero", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 6, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "(sum(irate(container_network_receive_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "legendFormat": "{{workload}}", - "legendLink": null - } + "unit": "Bps" + } + }, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 35 + }, + "id": 6, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Receive Bandwidth", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false - } - ] + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 10, - "id": 7, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "lines": true, - "linewidth": 0, - "links": [ ], - "nullPointMode": "null as zero", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 6, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "(sum(irate(container_network_transmit_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "legendFormat": "{{workload}}", - "legendLink": null - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Transmit Bandwidth", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "expr": "(sum(rate(container_network_receive_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" + } + ], + "title": "Receive Bandwidth", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "unit": "Bps" + } + }, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 35 + }, + "id": 7, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false - } - ] + "expr": "(sum(rate(container_network_transmit_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Bandwidth", - "titleSize": "h6" + "title": "Transmit Bandwidth", + "type": "timeseries" }, { - "collapse": false, - "height": "250px", - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 10, - "id": 8, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": true, - "linewidth": 0, - "links": [ ], - "nullPointMode": "null as zero", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 6, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "(avg(irate(container_network_receive_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "legendFormat": "{{workload}}", - "legendLink": null - } + "unit": "Bps" + } + }, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 42 + }, + "id": 8, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Average Container Bandwidth by Workload: Received", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "(avg(rate(container_network_receive_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" + } + ], + "title": "Average Container Bandwidth by Workload: Received", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false - } - ] + "unit": "Bps" + } + }, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 42 + }, + "id": 9, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 10, - "id": 9, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "lines": true, - "linewidth": 0, - "links": [ ], - "nullPointMode": "null as zero", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 6, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "(avg(irate(container_network_transmit_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "legendFormat": "{{workload}}", - "legendLink": null - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Average Container Bandwidth by Workload: Transmitted", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "expr": "(avg(rate(container_network_transmit_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" + } + ], + "title": "Average Container Bandwidth by Workload: Transmitted", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "unit": "pps" + } + }, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 49 + }, + "id": 10, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false - } - ] + "expr": "(sum(rate(container_network_receive_packets_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Average Container Bandwidth by Workload", - "titleSize": "h6" + "title": "Rate of Received Packets", + "type": "timeseries" }, { - "collapse": false, - "height": "250px", - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 10, - "id": 10, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": true, - "linewidth": 0, - "links": [ ], - "nullPointMode": "null as zero", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 6, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "(sum(irate(container_network_receive_packets_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "legendFormat": "{{workload}}", - "legendLink": null - } + "unit": "pps" + } + }, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 49 + }, + "id": 11, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Received Packets", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false - } - ] + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 10, - "id": 11, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 0, - "links": [ ], - "nullPointMode": "null as zero", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 6, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "(sum(irate(container_network_transmit_packets_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "legendFormat": "{{workload}}", - "legendLink": null - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Transmitted Packets", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false - } - ] + "expr": "(sum(rate(container_network_transmit_packets_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Rate of Packets", - "titleSize": "h6" + "title": "Rate of Transmitted Packets", + "type": "timeseries" }, { - "collapse": false, - "height": "250px", - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 10, - "id": 12, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": true, - "linewidth": 0, - "links": [ ], - "nullPointMode": "null as zero", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 6, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "(sum(irate(container_network_receive_packets_dropped_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "legendFormat": "{{workload}}", - "legendLink": null - } + "unit": "pps" + } + }, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 56 + }, + "id": 12, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Received Packets Dropped", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false - } - ] + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 10, - "id": 13, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "lines": true, - "linewidth": 0, - "links": [ ], - "nullPointMode": "null as zero", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 6, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "(sum(irate(container_network_transmit_packets_dropped_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "legendFormat": "{{workload}}", - "legendLink": null - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Transmitted Packets Dropped", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "expr": "(sum(rate(container_network_receive_packets_dropped_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" + } + ], + "title": "Rate of Received Packets Dropped", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "unit": "pps" + } + }, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 56 + }, + "id": 13, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false - } - ] + "expr": "(sum(rate(container_network_transmit_packets_dropped_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\", namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Rate of Packets Dropped", - "titleSize": "h6" + "title": "Rate of Transmitted Packets Dropped", + "type": "timeseries" } ], - "schemaVersion": 14, - "style": "dark", + "refresh": "10s", + "schemaVersion": 39, "tags": [ "kubernetes-mixin", "infrastucture" @@ -11494,127 +10822,66 @@ data: "list": [ { "current": { + "selected": true, "text": "Metrics", "value": "Metrics" }, "hide": 0, "label": "Data source", "name": "datasource", - "options": [ ], "query": "prometheus", - "refresh": 1, "regex": "", "type": "datasource" }, { - "allValue": null, - "current": { - "text": "", - "value": "" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "datasource": "$datasource", "hide": 0, - "includeAll": false, - "label": null, - "multi": false, + "label": "cluster", "name": "cluster", - "options": [ ], "query": "label_values(up{job=\"integrations/kubernetes/kube-state-metrics\"}, cluster)", "refresh": 2, - "regex": "", "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "type": "query" }, { - "allValue": null, - "current": { - "text": "", - "value": "" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "datasource": "$datasource", "hide": 0, - "includeAll": false, - "label": null, - "multi": false, + "label": "namespace", "name": "namespace", - "options": [ ], - "query": "label_values(kube_pod_info{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\"}, namespace)", + "query": "label_values(kube_namespace_status_phase{job=\"integrations/kubernetes/kube-state-metrics\", cluster=\"$cluster\"}, namespace)", "refresh": 2, - "regex": "", "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "type": "query" }, { - "allValue": null, - "auto": false, - "auto_count": 30, - "auto_min": "10s", - "current": { - "text": "", - "value": "" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "datasource": "$datasource", - "definition": "label_values(namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\"}, workload_type)", "hide": 0, "includeAll": true, - "label": null, - "multi": false, - "name": "type", - "options": [ ], - "query": "label_values(namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\"}, workload_type)", - "refresh": 2, - "regex": "", - "skipUrlSync": false, - "sort": 0, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false - } - ] - }, - "time": { - "from": "now-1h", - "to": "now" - }, - "timepicker": { - "refresh_intervals": [ - "5s", - "10s", - "30s", - "1m", - "5m", - "15m", - "30m", - "1h", - "2h", - "1d" - ], - "time_options": [ - "5m", - "15m", - "1h", - "6h", - "12h", - "24h", - "2d", - "7d", - "30d" + "label": "workload_type", + "name": "type", + "query": "label_values(namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\"}, workload_type)", + "refresh": 2, + "sort": 1, + "type": "query" + } ] }, + "time": { + "from": "now-1h", + "to": "now" + }, "timezone": "browser", "title": "Kubernetes / Compute Resources / Namespace (Workloads)", - "uid": "a87fb0d919ec0ea5f6543124e16c42a5", - "version": 0 + "uid": "a87fb0d919ec0ea5f6543124e16c42a5" } kind: ConfigMap metadata: @@ -11629,28 +10896,29 @@ apiVersion: v1 data: kubelet.json: |- { - "__inputs": [ ], - "__requires": [ ], - "annotations": { - "list": [ ] - }, "editable": false, - "gnetId": null, - "graphTooltip": 0, - "hideControls": false, - "id": null, - "links": [ ], + "links": [ + { + "asDropdown": true, + "includeVars": true, + "keepTime": true, + "tags": [ + "kubernetes-mixin", + "infrastucture" + ], + "targetBlank": false, + "title": "Kubernetes", + "type": "dashboards" + } + ], "panels": [ { - "datasource": "$datasource", + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, "fieldConfig": { "defaults": { - "links": [ ], - "mappings": [ ], - "thresholds": { - "mode": "absolute", - "steps": [ ] - }, "unit": "none" } }, @@ -11660,46 +10928,32 @@ data: "x": 0, "y": 0 }, - "id": 2, - "links": [ ], + "id": 1, + "interval": "1m", "options": { - "colorMode": "value", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "auto", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "textMode": "auto" + "colorMode": "none" }, - "pluginVersion": "7", + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "sum(kubelet_node_name{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\"})", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "", - "refId": "A" + "instant": true } ], "title": "Running Kubelets", - "transparent": false, "type": "stat" }, { - "datasource": "$datasource", + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, "fieldConfig": { "defaults": { - "links": [ ], - "mappings": [ ], - "thresholds": { - "mode": "absolute", - "steps": [ ] - }, "unit": "none" } }, @@ -11709,46 +10963,32 @@ data: "x": 4, "y": 0 }, - "id": 3, - "links": [ ], + "id": 2, + "interval": "1m", "options": { - "colorMode": "value", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "auto", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "textMode": "auto" + "colorMode": "none" }, - "pluginVersion": "7", + "pluginVersion": "v11.1.0", "targets": [ { - "expr": "sum(kubelet_running_pods{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\"}) OR sum(kubelet_running_pod_count{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\"})", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(kubelet_running_pods{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\"})", + "instant": true } ], "title": "Running Pods", - "transparent": false, "type": "stat" }, { - "datasource": "$datasource", + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, "fieldConfig": { "defaults": { - "links": [ ], - "mappings": [ ], - "thresholds": { - "mode": "absolute", - "steps": [ ] - }, "unit": "none" } }, @@ -11758,46 +10998,32 @@ data: "x": 8, "y": 0 }, - "id": 4, - "links": [ ], + "id": 3, + "interval": "1m", "options": { - "colorMode": "value", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "auto", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "textMode": "auto" + "colorMode": "none" }, - "pluginVersion": "7", + "pluginVersion": "v11.1.0", "targets": [ { - "expr": "sum(kubelet_running_containers{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\"}) OR sum(kubelet_running_container_count{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\"})", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(kubelet_running_containers{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\"})", + "instant": true } ], "title": "Running Containers", - "transparent": false, "type": "stat" }, { - "datasource": "$datasource", + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, "fieldConfig": { "defaults": { - "links": [ ], - "mappings": [ ], - "thresholds": { - "mode": "absolute", - "steps": [ ] - }, "unit": "none" } }, @@ -11807,46 +11033,32 @@ data: "x": 12, "y": 0 }, - "id": 5, - "links": [ ], + "id": 4, + "interval": "1m", "options": { - "colorMode": "value", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "auto", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "textMode": "auto" + "colorMode": "none" }, - "pluginVersion": "7", + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "sum(volume_manager_total_volumes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\", state=\"actual_state_of_world\"})", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" + "instant": true } ], "title": "Actual Volume Count", - "transparent": false, "type": "stat" }, { - "datasource": "$datasource", + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, "fieldConfig": { "defaults": { - "links": [ ], - "mappings": [ ], - "thresholds": { - "mode": "absolute", - "steps": [ ] - }, "unit": "none" } }, @@ -11856,46 +11068,32 @@ data: "x": 16, "y": 0 }, - "id": 6, - "links": [ ], + "id": 5, + "interval": "1m", "options": { - "colorMode": "value", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "auto", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "textMode": "auto" + "colorMode": "none" }, - "pluginVersion": "7", + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "sum(volume_manager_total_volumes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\",state=\"desired_state_of_world\"})", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" + "instant": true } ], "title": "Desired Volume Count", - "transparent": false, "type": "stat" }, { - "datasource": "$datasource", + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, "fieldConfig": { "defaults": { - "links": [ ], - "mappings": [ ], - "thresholds": { - "mode": "absolute", - "steps": [ ] - }, "unit": "none" } }, @@ -11905,1613 +11103,986 @@ data: "x": 20, "y": 0 }, - "id": 7, - "links": [ ], + "id": 6, + "interval": "1m", "options": { - "colorMode": "value", - "graphMode": "area", - "justifyMode": "auto", - "orientation": "auto", - "reduceOptions": { - "calcs": [ - "lastNotNull" - ], - "fields": "", - "values": false - }, - "textMode": "auto" + "colorMode": "none" }, - "pluginVersion": "7", + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "sum(rate(kubelet_node_config_error{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\"}[$__rate_interval]))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" + "instant": true } ], "title": "Config Error Count", - "transparent": false, "type": "stat" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "ops" + } + }, "gridPos": { "h": 7, "w": 12, "x": 0, "y": 7 }, - "id": 8, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "id": 7, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "sum(rate(kubelet_runtime_operations_total{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\",instance=~\"$instance\"}[$__rate_interval])) by (operation_type, instance)", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}} {{operation_type}}", - "refId": "A" + "legendFormat": "{{instance}} {{operation_type}}" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "Operation Rate", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "ops" + } + }, "gridPos": { "h": 7, "w": 12, "x": 12, "y": 7 }, - "id": 9, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "id": 8, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "sum(rate(kubelet_runtime_operations_errors_total{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\",instance=~\"$instance\"}[$__rate_interval])) by (instance, operation_type)", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}} {{operation_type}}", - "refId": "A" + "legendFormat": "{{instance}} {{operation_type}}" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "Operation Error Rate", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "s" + } + }, "gridPos": { "h": 7, "w": 24, "x": 0, "y": 14 }, - "id": 10, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "id": 9, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "histogram_quantile(0.99, sum(rate(kubelet_runtime_operations_duration_seconds_bucket{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\",instance=~\"$instance\"}[$__rate_interval])) by (instance, operation_type, le))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}} {{operation_type}}", - "refId": "A" + "legendFormat": "{{instance}} {{operation_type}}" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Operation duration 99th quantile", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "title": "Operation Duration 99th quantile", + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { - "h": 7, - "w": 12, - "x": 0, - "y": 21 + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" }, - "id": 11, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "ops" + } + }, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 21 }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "id": 10, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "sum(rate(kubelet_pod_start_duration_seconds_count{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\",instance=~\"$instance\"}[$__rate_interval])) by (instance)", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}} pod", - "refId": "A" + "legendFormat": "{{instance}} pod" }, { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "sum(rate(kubelet_pod_worker_duration_seconds_count{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\",instance=~\"$instance\"}[$__rate_interval])) by (instance)", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}} worker", - "refId": "B" + "legendFormat": "{{instance}} worker" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "Pod Start Rate", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "s" + } + }, "gridPos": { "h": 7, "w": 12, "x": 12, "y": 21 }, - "id": 12, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "id": 11, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "histogram_quantile(0.99, sum(rate(kubelet_pod_start_duration_seconds_bucket{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\",instance=~\"$instance\"}[$__rate_interval])) by (instance, le))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}} pod", - "refId": "A" + "legendFormat": "{{instance}} pod" }, { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "histogram_quantile(0.99, sum(rate(kubelet_pod_worker_duration_seconds_bucket{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\",instance=~\"$instance\"}[$__rate_interval])) by (instance, le))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}} worker", - "refId": "B" + "legendFormat": "{{instance}} worker" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "Pod Start Duration", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "ops" + } + }, "gridPos": { "h": 7, "w": 12, "x": 0, "y": 28 }, - "id": 13, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "id": 12, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "sum(rate(storage_operation_duration_seconds_count{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\",instance=~\"$instance\"}[$__rate_interval])) by (instance, operation_name, volume_plugin)", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}} {{operation_name}} {{volume_plugin}}", - "refId": "A" + "legendFormat": "{{instance}} {{operation_name}} {{volume_plugin}}" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "Storage Operation Rate", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "ops" + } + }, "gridPos": { "h": 7, "w": 12, "x": 12, "y": 28 }, - "id": 14, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "id": 13, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "sum(rate(storage_operation_errors_total{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\",instance=~\"$instance\"}[$__rate_interval])) by (instance, operation_name, volume_plugin)", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}} {{operation_name}} {{volume_plugin}}", - "refId": "A" + "legendFormat": "{{instance}} {{operation_name}} {{volume_plugin}}" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "Storage Operation Error Rate", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "s" + } + }, "gridPos": { "h": 7, "w": 24, "x": 0, "y": 35 }, - "id": 15, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "id": 14, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "histogram_quantile(0.99, sum(rate(storage_operation_duration_seconds_bucket{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\"}[$__rate_interval])) by (instance, operation_name, volume_plugin, le))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}} {{operation_name}} {{volume_plugin}}", - "refId": "A" + "legendFormat": "{{instance}} {{operation_name}} {{volume_plugin}}" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "Storage Operation Duration 99th quantile", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "ops" + } + }, "gridPos": { "h": 7, "w": 12, "x": 0, "y": 42 }, - "id": 16, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "id": 15, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "sum(rate(kubelet_cgroup_manager_duration_seconds_count{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\"}[$__rate_interval])) by (instance, operation_type)", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{operation_type}}", - "refId": "A" + "legendFormat": "{{operation_type}}" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "Cgroup manager operation rate", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "s" + } + }, "gridPos": { "h": 7, "w": 12, "x": 12, "y": 42 }, - "id": 17, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "id": 16, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "histogram_quantile(0.99, sum(rate(kubelet_cgroup_manager_duration_seconds_bucket{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\"}[$__rate_interval])) by (instance, operation_type, le))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}} {{operation_type}}", - "refId": "A" + "legendFormat": "{{instance}} {{operation_type}}" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "Cgroup manager 99th quantile", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "description": "Pod lifecycle event generator", - "fill": 1, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "ops" + } + }, "gridPos": { "h": 7, "w": 12, "x": 0, "y": 49 }, - "id": 18, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "id": 17, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "sum(rate(kubelet_pleg_relist_duration_seconds_count{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\"}[$__rate_interval])) by (instance)", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" + "legendFormat": "{{instance}}" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "PLEG relist rate", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "s" + } + }, "gridPos": { "h": 7, "w": 12, "x": 12, "y": 49 }, - "id": 19, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "id": 18, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "histogram_quantile(0.99, sum(rate(kubelet_pleg_relist_interval_seconds_bucket{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\",instance=~\"$instance\"}[$__rate_interval])) by (instance, le))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" + "legendFormat": "{{instance}}" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "PLEG relist interval", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "s" + } + }, "gridPos": { "h": 7, "w": 24, "x": 0, "y": 56 }, - "id": 20, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "id": 19, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "histogram_quantile(0.99, sum(rate(kubelet_pleg_relist_duration_seconds_bucket{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\",instance=~\"$instance\"}[$__rate_interval])) by (instance, le))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" + "legendFormat": "{{instance}}" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "PLEG relist duration", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "ops" + } + }, "gridPos": { "h": 7, "w": 24, "x": 0, "y": 63 }, - "id": 21, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "id": 20, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\",code=~\"2..\"}[$__rate_interval]))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "2xx", - "refId": "A" + "legendFormat": "2xx" }, { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\",code=~\"3..\"}[$__rate_interval]))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "3xx", - "refId": "B" + "legendFormat": "3xx" }, { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\",code=~\"4..\"}[$__rate_interval]))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "4xx", - "refId": "C" + "legendFormat": "4xx" }, { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\",code=~\"5..\"}[$__rate_interval]))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "5xx", - "refId": "D" + "legendFormat": "5xx" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "RPC Rate", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "title": "RPC rate", + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "s" + } + }, "gridPos": { "h": 7, "w": 24, "x": 0, "y": 70 }, - "id": 22, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "id": 21, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "histogram_quantile(0.99, sum(rate(rest_client_request_duration_seconds_bucket{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\", instance=~\"$instance\"}[$__rate_interval])) by (instance, verb, url, le))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}} {{verb}} {{url}}", - "refId": "A" + "legendFormat": "{{instance}} {{verb}} {{url}}" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "Request duration 99th quantile", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "bytes" + } + }, "gridPos": { "h": 7, "w": 8, "x": 0, "y": 77 }, - "id": 23, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "id": 22, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "process_resident_memory_bytes{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\",instance=~\"$instance\"}", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" + "legendFormat": "{{instance}}" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "Memory", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "bytes", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "bytes", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "short" + } + }, "gridPos": { "h": 7, "w": 8, "x": 8, "y": 77 }, - "id": 24, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "id": 23, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "rate(process_cpu_seconds_total{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\",instance=~\"$instance\"}[$__rate_interval])", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" + "legendFormat": "{{instance}}" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "CPU usage", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "short" + } + }, "gridPos": { "h": 7, "w": 8, "x": 16, "y": 77 }, - "id": 25, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "id": 24, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "expr": "go_goroutines{cluster=\"$cluster\",job=\"integrations/kubernetes/kubelet\",instance=~\"$instance\"}", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" + "legendFormat": "{{instance}}" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "Goroutines", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "type": "timeseries" } ], "refresh": "10s", - "rows": [ ], - "schemaVersion": 14, - "style": "dark", + "schemaVersion": 39, "tags": [ "kubernetes-mixin", "infrastucture" @@ -13527,51 +12098,35 @@ data: "hide": 0, "label": "Data source", "name": "datasource", - "options": [ ], "query": "prometheus", - "refresh": 1, "regex": "", "type": "datasource" }, { - "allValue": null, - "current": { }, - "datasource": "$datasource", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "hide": 0, - "includeAll": false, "label": "cluster", - "multi": false, "name": "cluster", - "options": [ ], "query": "label_values(up{job=\"integrations/kubernetes/kubelet\"}, cluster)", "refresh": 2, - "regex": "", "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "type": "query" }, { - "allValue": null, - "current": { }, - "datasource": "$datasource", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "hide": 0, "includeAll": true, "label": "instance", - "multi": false, "name": "instance", - "options": [ ], "query": "label_values(up{job=\"integrations/kubernetes/kubelet\",cluster=\"$cluster\"}, instance)", "refresh": 2, - "regex": "", - "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "type": "query" } ] }, @@ -13579,35 +12134,9 @@ data: "from": "now-1h", "to": "now" }, - "timepicker": { - "refresh_intervals": [ - "5s", - "10s", - "30s", - "1m", - "5m", - "15m", - "30m", - "1h", - "2h", - "1d" - ], - "time_options": [ - "5m", - "15m", - "1h", - "6h", - "12h", - "24h", - "2d", - "7d", - "30d" - ] - }, "timezone": "browser", "title": "Kubernetes / Kubelet", - "uid": "3138fa155d5915769fbded898ac09fd9", - "version": 0 + "uid": "3138fa155d5915769fbded898ac09fd9" } kind: ConfigMap metadata: @@ -18283,7 +16812,7 @@ data: "sort": "none" } }, - "span": 4, + "span": 3, "targets": [ { "expr": "sum(cortex_bucket_index_estimated_compaction_jobs{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|compactor.*|cortex|mimir-backend.*))\"}) and (sum(rate(cortex_bucket_index_estimated_compaction_jobs_errors_total{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|compactor.*|cortex|mimir-backend.*))\"}[$__rate_interval])) == 0)", @@ -18295,6 +16824,86 @@ data: "title": "Estimated Compaction Jobs", "type": "timeseries" }, + { + "datasource": "$datasource", + "description": "### Source blocks age\nThe difference between the maximum timestamp of the block being compacted and the current time.\nA steadily increasing value indicates that the compactor cannot keep up with the produced blocks by the ingesters.\nIncrease the number of compactors when this value is consistently increasing.\n\n", + "fieldConfig": { + "defaults": { + "custom": { + "drawStyle": "line", + "fillOpacity": 1, + "lineWidth": 1, + "pointSize": 5, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + } + }, + "min": 0, + "thresholds": { + "mode": "absolute", + "steps": [ ] + }, + "unit": "ms" + }, + "overrides": [ ] + }, + "id": 6, + "links": [ ], + "nullPointMode": "null as zero", + "options": { + "legend": { + "showLegend": true + }, + "tooltip": { + "mode": "multi", + "sort": "none" + } + }, + "span": 3, + "targets": [ + { + "expr": "histogram_quantile(0.99, sum(rate(cortex_compactor_block_max_time_delta_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|compactor.*|cortex|mimir-backend.*))\"}[$__rate_interval])) by (le)) * 1e3", + "format": "time_series", + "legendFormat": "99th Percentile", + "refId": "A" + }, + { + "expr": "histogram_quantile(0.50, sum(rate(cortex_compactor_block_max_time_delta_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|compactor.*|cortex|mimir-backend.*))\"}[$__rate_interval])) by (le)) * 1e3", + "format": "time_series", + "legendFormat": "50th Percentile", + "refId": "B" + }, + { + "expr": "sum(rate(cortex_compactor_block_max_time_delta_seconds_sum{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|compactor.*|cortex|mimir-backend.*))\"}[$__rate_interval])) * 1e3 / sum(rate(cortex_compactor_block_max_time_delta_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|compactor.*|cortex|mimir-backend.*))\"}[$__rate_interval]))", + "format": "time_series", + "legendFormat": "Average", + "refId": "C" + } + ], + "title": "Source blocks age", + "type": "timeseries", + "yaxes": [ + { + "format": "ms", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + }, { "datasource": "$datasource", "description": "### TSDB compactions / sec\nRate of TSDB compactions. Single TSDB compaction takes one or more input blocks and produces one or more (during \"split\" phase) output blocks.\n\n", @@ -18321,7 +16930,7 @@ data: }, "overrides": [ ] }, - "id": 6, + "id": 7, "links": [ ], "options": { "legend": { @@ -18332,7 +16941,7 @@ data: "sort": "none" } }, - "span": 4, + "span": 3, "targets": [ { "expr": "sum(rate(prometheus_tsdb_compactions_total{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|compactor.*|cortex|mimir-backend.*))\"}[$__rate_interval]))", @@ -18370,7 +16979,7 @@ data: }, "overrides": [ ] }, - "id": 7, + "id": 8, "links": [ ], "nullPointMode": "null as zero", "options": { @@ -18382,7 +16991,7 @@ data: "sort": "none" } }, - "span": 4, + "span": 3, "targets": [ { "expr": "histogram_quantile(0.99, sum(rate(prometheus_tsdb_compaction_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|compactor.*|cortex|mimir-backend.*))\"}[$__rate_interval])) by (le)) * 1e3", @@ -18461,7 +17070,7 @@ data: }, "overrides": [ ] }, - "id": 8, + "id": 9, "links": [ ], "options": { "legend": { @@ -18510,7 +17119,7 @@ data: }, "overrides": [ ] }, - "id": 9, + "id": 10, "links": [ ], "options": { "legend": { @@ -18570,7 +17179,7 @@ data: }, "overrides": [ ] }, - "id": 10, + "id": 11, "links": [ ], "options": { "legend": { @@ -18649,7 +17258,7 @@ data: } ] }, - "id": 11, + "id": 12, "links": [ ], "options": { "legend": { @@ -18746,7 +17355,7 @@ data: } ] }, - "id": 12, + "id": 13, "links": [ ], "options": { "legend": { @@ -18800,180 +17409,180 @@ data: }, "overrides": [ ] }, - "id": 13, - "links": [ ], - "nullPointMode": "null as zero", - "options": { - "legend": { - "showLegend": true - }, - "tooltip": { - "mode": "multi", - "sort": "none" - } - }, - "span": 6, - "targets": [ - { - "expr": "histogram_quantile(0.99, sum(rate(cortex_compactor_meta_sync_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|compactor.*|cortex|mimir-backend.*))\"}[$__rate_interval])) by (le)) * 1e3", - "format": "time_series", - "legendFormat": "99th Percentile", - "refId": "A" - }, - { - "expr": "histogram_quantile(0.50, sum(rate(cortex_compactor_meta_sync_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|compactor.*|cortex|mimir-backend.*))\"}[$__rate_interval])) by (le)) * 1e3", - "format": "time_series", - "legendFormat": "50th Percentile", - "refId": "B" - }, - { - "expr": "sum(rate(cortex_compactor_meta_sync_duration_seconds_sum{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|compactor.*|cortex|mimir-backend.*))\"}[$__rate_interval])) * 1e3 / sum(rate(cortex_compactor_meta_sync_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|compactor.*|cortex|mimir-backend.*))\"}[$__rate_interval]))", - "format": "time_series", - "legendFormat": "Average", - "refId": "C" - } - ], - "title": "Metadata sync duration", - "type": "timeseries", - "yaxes": [ - { - "format": "ms", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false - } - ] - } - ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Metadata sync", - "titleSize": "h6" - }, - { - "collapse": false, - "height": "250px", - "panels": [ - { - "datasource": "$datasource", - "fieldConfig": { - "defaults": { - "custom": { - "drawStyle": "line", - "fillOpacity": 100, - "lineWidth": 0, - "pointSize": 5, - "showPoints": "never", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "normal" - } - }, - "min": 0, - "thresholds": { - "mode": "absolute", - "steps": [ ] - }, - "unit": "reqps" - }, - "overrides": [ ] - }, - "id": 14, - "links": [ ], - "options": { - "legend": { - "showLegend": true - }, - "tooltip": { - "mode": "multi", - "sort": "none" - } - }, - "span": 3, - "targets": [ - { - "expr": "sum by(operation) (rate(thanos_objstore_bucket_operations_total{cluster=~\"$cluster\", namespace=~\"$namespace\",component=\"compactor\"}[$__rate_interval]))", - "format": "time_series", - "legendFormat": "{{operation}}", - "legendLink": null - } - ], - "title": "Operations / sec", - "type": "timeseries" - }, - { - "datasource": "$datasource", - "fieldConfig": { - "defaults": { - "max": 1, - "min": 0, - "noValue": "0", - "unit": "percentunit" - } - }, - "id": 15, - "links": [ ], - "options": { - "legend": { - "showLegend": true - }, - "tooltip": { - "mode": "multi", - "sort": "none" - } - }, - "span": 3, - "targets": [ - { - "expr": "sum by(operation) (rate(thanos_objstore_bucket_operation_failures_total{cluster=~\"$cluster\", namespace=~\"$namespace\",component=\"compactor\"}[$__rate_interval])) / sum by(operation) (rate(thanos_objstore_bucket_operations_total{cluster=~\"$cluster\", namespace=~\"$namespace\",component=\"compactor\"}[$__rate_interval])) >= 0", - "format": "time_series", - "legendFormat": "{{operation}}", - "legendLink": null - } - ], - "title": "Error rate", - "type": "timeseries" - }, - { - "datasource": "$datasource", - "fieldConfig": { - "defaults": { - "custom": { - "drawStyle": "line", - "fillOpacity": 1, - "lineWidth": 1, - "pointSize": 5, - "showPoints": "never", - "spanNulls": false, - "stacking": { - "group": "A", - "mode": "none" - } - }, - "min": 0, - "thresholds": { - "mode": "absolute", - "steps": [ ] - }, - "unit": "ms" - }, - "overrides": [ ] - }, + "id": 14, + "links": [ ], + "nullPointMode": "null as zero", + "options": { + "legend": { + "showLegend": true + }, + "tooltip": { + "mode": "multi", + "sort": "none" + } + }, + "span": 6, + "targets": [ + { + "expr": "histogram_quantile(0.99, sum(rate(cortex_compactor_meta_sync_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|compactor.*|cortex|mimir-backend.*))\"}[$__rate_interval])) by (le)) * 1e3", + "format": "time_series", + "legendFormat": "99th Percentile", + "refId": "A" + }, + { + "expr": "histogram_quantile(0.50, sum(rate(cortex_compactor_meta_sync_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|compactor.*|cortex|mimir-backend.*))\"}[$__rate_interval])) by (le)) * 1e3", + "format": "time_series", + "legendFormat": "50th Percentile", + "refId": "B" + }, + { + "expr": "sum(rate(cortex_compactor_meta_sync_duration_seconds_sum{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|compactor.*|cortex|mimir-backend.*))\"}[$__rate_interval])) * 1e3 / sum(rate(cortex_compactor_meta_sync_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|compactor.*|cortex|mimir-backend.*))\"}[$__rate_interval]))", + "format": "time_series", + "legendFormat": "Average", + "refId": "C" + } + ], + "title": "Metadata sync duration", + "type": "timeseries", + "yaxes": [ + { + "format": "ms", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] + } + ], + "repeat": null, + "repeatIteration": null, + "repeatRowId": null, + "showTitle": true, + "title": "Metadata sync", + "titleSize": "h6" + }, + { + "collapse": false, + "height": "250px", + "panels": [ + { + "datasource": "$datasource", + "fieldConfig": { + "defaults": { + "custom": { + "drawStyle": "line", + "fillOpacity": 100, + "lineWidth": 0, + "pointSize": 5, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "normal" + } + }, + "min": 0, + "thresholds": { + "mode": "absolute", + "steps": [ ] + }, + "unit": "reqps" + }, + "overrides": [ ] + }, + "id": 15, + "links": [ ], + "options": { + "legend": { + "showLegend": true + }, + "tooltip": { + "mode": "multi", + "sort": "none" + } + }, + "span": 3, + "targets": [ + { + "expr": "sum by(operation) (rate(thanos_objstore_bucket_operations_total{cluster=~\"$cluster\", namespace=~\"$namespace\",component=\"compactor\"}[$__rate_interval]))", + "format": "time_series", + "legendFormat": "{{operation}}", + "legendLink": null + } + ], + "title": "Operations / sec", + "type": "timeseries" + }, + { + "datasource": "$datasource", + "fieldConfig": { + "defaults": { + "max": 1, + "min": 0, + "noValue": "0", + "unit": "percentunit" + } + }, "id": 16, "links": [ ], + "options": { + "legend": { + "showLegend": true + }, + "tooltip": { + "mode": "multi", + "sort": "none" + } + }, + "span": 3, + "targets": [ + { + "expr": "sum by(operation) (rate(thanos_objstore_bucket_operation_failures_total{cluster=~\"$cluster\", namespace=~\"$namespace\",component=\"compactor\"}[$__rate_interval])) / sum by(operation) (rate(thanos_objstore_bucket_operations_total{cluster=~\"$cluster\", namespace=~\"$namespace\",component=\"compactor\"}[$__rate_interval])) >= 0", + "format": "time_series", + "legendFormat": "{{operation}}", + "legendLink": null + } + ], + "title": "Error rate", + "type": "timeseries" + }, + { + "datasource": "$datasource", + "fieldConfig": { + "defaults": { + "custom": { + "drawStyle": "line", + "fillOpacity": 1, + "lineWidth": 1, + "pointSize": 5, + "showPoints": "never", + "spanNulls": false, + "stacking": { + "group": "A", + "mode": "none" + } + }, + "min": 0, + "thresholds": { + "mode": "absolute", + "steps": [ ] + }, + "unit": "ms" + }, + "overrides": [ ] + }, + "id": 17, + "links": [ ], "nullPointMode": "null as zero", "options": { "legend": { @@ -19051,7 +17660,7 @@ data: }, "overrides": [ ] }, - "id": 17, + "id": 18, "links": [ ], "nullPointMode": "null as zero", "options": { @@ -19142,7 +17751,7 @@ data: }, "overrides": [ ] }, - "id": 18, + "id": 19, "links": [ ], "nullPointMode": "null as zero", "options": { @@ -19221,7 +17830,7 @@ data: }, "overrides": [ ] }, - "id": 19, + "id": 20, "links": [ ], "nullPointMode": "null as zero", "options": { @@ -19300,7 +17909,7 @@ data: }, "overrides": [ ] }, - "id": 20, + "id": 21, "links": [ ], "nullPointMode": "null as zero", "options": { @@ -19379,7 +17988,7 @@ data: }, "overrides": [ ] }, - "id": 21, + "id": 22, "links": [ ], "nullPointMode": "null as zero", "options": { @@ -19606,7 +18215,7 @@ data: } ] }, - "id": 22, + "id": 23, "links": [ ], "options": { "legend": { @@ -19654,7 +18263,7 @@ data: }, "overrides": [ ] }, - "id": 23, + "id": 24, "links": [ ], "nullPointMode": "null as zero", "options": { @@ -25285,7 +23894,7 @@ data: "span": 4, "targets": [ { - "expr": "# Query the new metric introduced in Mimir 2.10.\n(\n sum by(request_type) (rate(cortex_frontend_query_result_cache_hits_total{$read_path_matcher}[$__rate_interval]))\n /\n sum by(request_type) (rate(cortex_frontend_query_result_cache_requests_total{$read_path_matcher}[$__rate_interval]))\n)\n# Otherwise fallback to the previous general-purpose metrics.\nor\n(\n label_replace(\n # Query metrics before and after dskit cache refactor.\n sum (\n rate(thanos_cache_memcached_hits_total{name=\"frontend-cache\", $read_path_matcher}[$__rate_interval])\n or ignoring(backend)\n rate(thanos_cache_hits_total{name=\"frontend-cache\", $read_path_matcher}[$__rate_interval])\n )\n /\n sum (\n rate(thanos_cache_memcached_requests_total{name=~\"frontend-cache\", $read_path_matcher}[$__rate_interval])\n or ignoring(backend)\n rate(thanos_cache_requests_total{name=~\"frontend-cache\", $read_path_matcher}[$__rate_interval])\n ),\n \"request_type\", \"query_range\", \"\", \"\")\n)\n", + "expr": "# Query the new metric introduced in Mimir 2.10.\n(\n sum by(request_type) (rate(cortex_frontend_query_result_cache_hits_total{$read_path_matcher}[$__rate_interval]))\n /\n sum by(request_type) (rate(cortex_frontend_query_result_cache_requests_total{$read_path_matcher}[$__rate_interval]))\n)\n# Otherwise fallback to the previous general-purpose metrics.\nor\n(\n label_replace(\n sum (\n rate(thanos_cache_hits_total{name=\"frontend-cache\", $read_path_matcher}[$__rate_interval])\n )\n /\n sum (\n rate(thanos_cache_requests_total{name=~\"frontend-cache\", $read_path_matcher}[$__rate_interval])\n ),\n \"request_type\", \"query_range\", \"\", \"\")\n)\n", "format": "time_series", "legendFormat": "{{request_type}}", "legendLink": null @@ -26217,18 +24826,19 @@ data: "panels": [ { "datasource": "$datasource", + "description": "### Blocks queried / sec by compaction level\nIncreased volume of lower levels (for example levels 1 and 2) can indicate that the compactor is not keeping up.\nIn that case the store-gateway will start serving more blocks which aren't that well compacted.\n\n", "fieldConfig": { "defaults": { "custom": { "drawStyle": "line", - "fillOpacity": 1, - "lineWidth": 1, + "fillOpacity": 100, + "lineWidth": 0, "pointSize": 5, "showPoints": "never", "spanNulls": false, "stacking": { "group": "A", - "mode": "none" + "mode": "normal" } }, "min": 0, @@ -26254,13 +24864,19 @@ data: "span": 4, "targets": [ { - "expr": "sum(rate(cortex_bucket_store_series_blocks_queried_sum{component=\"store-gateway\",cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\"}[$__rate_interval]))", + "expr": "sum by (level) (rate(cortex_bucket_store_series_blocks_queried_sum{component=\"store-gateway\",level=~\"[0-4]\",cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\"}[$__rate_interval]))", "format": "time_series", - "legendFormat": "blocks", + "legendFormat": "{{level}}", + "legendLink": null + }, + { + "expr": "sum(rate(cortex_bucket_store_series_blocks_queried_sum{component=\"store-gateway\",level!~\"[0-4]\",cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\"}[$__rate_interval]))", + "format": "time_series", + "legendFormat": "5+", "legendLink": null } ], - "title": "Blocks queried / sec", + "title": "Blocks queried / sec by compaction level", "type": "timeseries" }, { @@ -32645,7 +31261,7 @@ data: "span": 6, "targets": [ { - "expr": "sum (\n rate(thanos_memcached_operations_total{name=\"frontend-cache\", cluster=~\"$cluster\", job=~\"($namespace)/((mimir|query-frontend.*|cortex|mimir-read.*))\"}[$__rate_interval])\n or ignoring(backend)\n rate(thanos_cache_operations_total{name=\"frontend-cache\", cluster=~\"$cluster\", job=~\"($namespace)/((mimir|query-frontend.*|cortex|mimir-read.*))\"}[$__rate_interval])\n)\n", + "expr": "sum (\n rate(thanos_cache_operations_total{name=\"frontend-cache\", cluster=~\"$cluster\", job=~\"($namespace)/((mimir|query-frontend.*|cortex|mimir-read.*))\"}[$__rate_interval])\n)\n", "format": "time_series", "legendFormat": "Requests/s", "legendLink": null @@ -32671,7 +31287,6 @@ data: } }, "min": 0, - "noValue": 0, "thresholds": { "mode": "absolute", "steps": [ ] @@ -32682,6 +31297,7 @@ data: }, "id": 17, "links": [ ], + "nullPointMode": "null as zero", "options": { "legend": { "showLegend": true @@ -32694,29 +31310,44 @@ data: "span": 6, "targets": [ { - "expr": "histogram_quantile(0.99, sum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|query-frontend.*|cortex|mimir-read.*))\", name=\"frontend-cache\"}[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|query-frontend.*|cortex|mimir-read.*))\", name=\"frontend-cache\"}[$__rate_interval])\n) by (le)) * 1e3\n", + "expr": "histogram_quantile(0.99, sum(rate(thanos_cache_operation_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|query-frontend.*|cortex|mimir-read.*))\", name=\"frontend-cache\"}[$__rate_interval])) by (le)) * 1e3", "format": "time_series", - "intervalFactor": 2, "legendFormat": "99th Percentile", "refId": "A" }, { - "expr": "histogram_quantile(0.50, sum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|query-frontend.*|cortex|mimir-read.*))\", name=\"frontend-cache\"}[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|query-frontend.*|cortex|mimir-read.*))\", name=\"frontend-cache\"}[$__rate_interval])\n) by (le)) * 1e3\n", + "expr": "histogram_quantile(0.50, sum(rate(thanos_cache_operation_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|query-frontend.*|cortex|mimir-read.*))\", name=\"frontend-cache\"}[$__rate_interval])) by (le)) * 1e3", "format": "time_series", - "intervalFactor": 2, "legendFormat": "50th Percentile", "refId": "B" }, { - "expr": "sum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_sum{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|query-frontend.*|cortex|mimir-read.*))\", name=\"frontend-cache\"}[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_sum{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|query-frontend.*|cortex|mimir-read.*))\", name=\"frontend-cache\"}[$__rate_interval])\n) * 1e3\n/\nsum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|query-frontend.*|cortex|mimir-read.*))\", name=\"frontend-cache\"}[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|query-frontend.*|cortex|mimir-read.*))\", name=\"frontend-cache\"}[$__rate_interval])\n)\n", + "expr": "sum(rate(thanos_cache_operation_duration_seconds_sum{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|query-frontend.*|cortex|mimir-read.*))\", name=\"frontend-cache\"}[$__rate_interval])) * 1e3 / sum(rate(thanos_cache_operation_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((mimir|query-frontend.*|cortex|mimir-read.*))\", name=\"frontend-cache\"}[$__rate_interval]))", "format": "time_series", - "intervalFactor": 2, "legendFormat": "Average", "refId": "C" } ], "title": "Latency", - "type": "timeseries" + "type": "timeseries", + "yaxes": [ + { + "format": "ms", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] } ], "repeat": null, @@ -34027,7 +32658,7 @@ data: "span": 4, "targets": [ { - "expr": "sum by(operation) (\n # Backwards compatibility\n rate(\n thanos_memcached_operations_total{\n component=\"store-gateway\",\n name=\"index-cache\",\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\"\n }[$__rate_interval]\n )\n or ignoring(backend)\n rate(\n thanos_cache_operations_total{\n component=\"store-gateway\",\n name=\"index-cache\",\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\"\n }[$__rate_interval]\n )\n)\n", + "expr": "sum by(operation) (\n rate(\n thanos_cache_operations_total{\n component=\"store-gateway\",\n name=\"index-cache\",\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\"\n }[$__rate_interval]\n )\n)\n", "format": "time_series", "legendFormat": "{{operation}}", "legendLink": null @@ -34053,7 +32684,6 @@ data: } }, "min": 0, - "noValue": 0, "thresholds": { "mode": "absolute", "steps": [ ] @@ -34064,6 +32694,7 @@ data: }, "id": 30, "links": [ ], + "nullPointMode": "null as zero", "options": { "legend": { "showLegend": true @@ -34076,29 +32707,44 @@ data: "span": 4, "targets": [ { - "expr": "histogram_quantile(0.99, sum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"index-cache\"\n}\n[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"index-cache\"\n}\n[$__rate_interval])\n) by (le)) * 1e3\n", + "expr": "histogram_quantile(0.99, sum(rate(thanos_cache_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"index-cache\"\n}\n[$__rate_interval])) by (le)) * 1e3", "format": "time_series", - "intervalFactor": 2, "legendFormat": "99th Percentile", "refId": "A" }, { - "expr": "histogram_quantile(0.50, sum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"index-cache\"\n}\n[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"index-cache\"\n}\n[$__rate_interval])\n) by (le)) * 1e3\n", + "expr": "histogram_quantile(0.50, sum(rate(thanos_cache_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"index-cache\"\n}\n[$__rate_interval])) by (le)) * 1e3", "format": "time_series", - "intervalFactor": 2, "legendFormat": "50th Percentile", "refId": "B" }, { - "expr": "sum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_sum{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"index-cache\"\n}\n[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_sum{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"index-cache\"\n}\n[$__rate_interval])\n) * 1e3\n/\nsum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_count{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"index-cache\"\n}\n[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_count{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"index-cache\"\n}\n[$__rate_interval])\n)\n", + "expr": "sum(rate(thanos_cache_operation_duration_seconds_sum{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"index-cache\"\n}\n[$__rate_interval])) * 1e3 / sum(rate(thanos_cache_operation_duration_seconds_count{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"index-cache\"\n}\n[$__rate_interval]))", "format": "time_series", - "intervalFactor": 2, "legendFormat": "Average", "refId": "C" } ], "title": "Latency (getmulti)", - "type": "timeseries" + "type": "timeseries", + "yaxes": [ + { + "format": "ms", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] }, { "datasource": "$datasource", @@ -34200,7 +32846,7 @@ data: "span": 4, "targets": [ { - "expr": "sum by(operation) (\n # Backwards compatibility\n rate(thanos_memcached_operations_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n }[$__rate_interval])\n or ignoring(backend)\n rate(thanos_cache_operations_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n }[$__rate_interval])\n)\n", + "expr": "sum by(operation) (\n rate(thanos_cache_operations_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n }[$__rate_interval])\n)\n", "format": "time_series", "legendFormat": "{{operation}}", "legendLink": null @@ -34226,7 +32872,6 @@ data: } }, "min": 0, - "noValue": 0, "thresholds": { "mode": "absolute", "steps": [ ] @@ -34237,6 +32882,7 @@ data: }, "id": 33, "links": [ ], + "nullPointMode": "null as zero", "options": { "legend": { "showLegend": true @@ -34249,29 +32895,44 @@ data: "span": 4, "targets": [ { - "expr": "histogram_quantile(0.99, sum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n}\n[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n}\n[$__rate_interval])\n) by (le)) * 1e3\n", + "expr": "histogram_quantile(0.99, sum(rate(thanos_cache_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n}\n[$__rate_interval])) by (le)) * 1e3", "format": "time_series", - "intervalFactor": 2, "legendFormat": "99th Percentile", "refId": "A" }, { - "expr": "histogram_quantile(0.50, sum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n}\n[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n}\n[$__rate_interval])\n) by (le)) * 1e3\n", + "expr": "histogram_quantile(0.50, sum(rate(thanos_cache_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n}\n[$__rate_interval])) by (le)) * 1e3", "format": "time_series", - "intervalFactor": 2, "legendFormat": "50th Percentile", "refId": "B" }, { - "expr": "sum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_sum{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n}\n[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_sum{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n}\n[$__rate_interval])\n) * 1e3\n/\nsum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_count{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n}\n[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_count{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n}\n[$__rate_interval])\n)\n", + "expr": "sum(rate(thanos_cache_operation_duration_seconds_sum{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n}\n[$__rate_interval])) * 1e3 / sum(rate(thanos_cache_operation_duration_seconds_count{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n}\n[$__rate_interval]))", "format": "time_series", - "intervalFactor": 2, "legendFormat": "Average", "refId": "C" } ], "title": "Latency (getmulti)", - "type": "timeseries" + "type": "timeseries", + "yaxes": [ + { + "format": "ms", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] }, { "datasource": "$datasource", @@ -34312,7 +32973,7 @@ data: "span": 4, "targets": [ { - "expr": "sum(\n # Backwards compatibility\n rate(thanos_cache_memcached_hits_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n }[$__rate_interval])\n or\n rate(thanos_cache_hits_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n }[$__rate_interval])\n)\n/\nsum(\n # Backwards compatibility\n rate(thanos_cache_memcached_requests_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n }[$__rate_interval])\n or\n rate(thanos_cache_requests_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n }[$__rate_interval])\n)\n", + "expr": "sum(\n rate(thanos_cache_hits_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n }[$__rate_interval])\n)\n/\nsum(\n rate(thanos_cache_requests_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"chunks-cache\"\n }[$__rate_interval])\n)\n", "format": "time_series", "legendFormat": "items", "legendLink": null @@ -34372,7 +33033,7 @@ data: "span": 4, "targets": [ { - "expr": "sum by(operation) (\n # Backwards compatibility\n rate(thanos_memcached_operations_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n or ignoring(backend)\n rate(thanos_cache_operations_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n)\n", + "expr": "sum by(operation) (\n rate(thanos_cache_operations_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n)\n", "format": "time_series", "legendFormat": "{{operation}}", "legendLink": null @@ -34398,7 +33059,6 @@ data: } }, "min": 0, - "noValue": 0, "thresholds": { "mode": "absolute", "steps": [ ] @@ -34409,6 +33069,7 @@ data: }, "id": 36, "links": [ ], + "nullPointMode": "null as zero", "options": { "legend": { "showLegend": true @@ -34421,29 +33082,44 @@ data: "span": 4, "targets": [ { - "expr": "histogram_quantile(0.99, sum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])\n) by (le)) * 1e3\n", + "expr": "histogram_quantile(0.99, sum(rate(thanos_cache_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])) by (le)) * 1e3", "format": "time_series", - "intervalFactor": 2, "legendFormat": "99th Percentile", "refId": "A" }, { - "expr": "histogram_quantile(0.50, sum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])\n) by (le)) * 1e3\n", + "expr": "histogram_quantile(0.50, sum(rate(thanos_cache_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])) by (le)) * 1e3", "format": "time_series", - "intervalFactor": 2, "legendFormat": "50th Percentile", "refId": "B" }, { - "expr": "sum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_sum{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_sum{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])\n) * 1e3\n/\nsum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_count{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_count{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])\n)\n", + "expr": "sum(rate(thanos_cache_operation_duration_seconds_sum{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])) * 1e3 / sum(rate(thanos_cache_operation_duration_seconds_count{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n operation=\"getmulti\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n}\n[$__rate_interval]))", "format": "time_series", - "intervalFactor": 2, "legendFormat": "Average", "refId": "C" } ], "title": "Latency (getmulti)", - "type": "timeseries" + "type": "timeseries", + "yaxes": [ + { + "format": "ms", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] }, { "datasource": "$datasource", @@ -34484,7 +33160,7 @@ data: "span": 4, "targets": [ { - "expr": "sum(\n # Backwards compatibility\n rate(thanos_cache_memcached_hits_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n or\n rate(thanos_cache_hits_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n)\n/\nsum(\n # Backwards compatibility\n rate(thanos_cache_memcached_requests_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n or\n rate(thanos_cache_requests_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n)\n", + "expr": "sum(\n rate(thanos_cache_hits_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n)\n/\nsum(\n rate(thanos_cache_requests_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|store-gateway.*|cortex|mimir-backend.*))\",\n component=\"store-gateway\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n)\n", "format": "time_series", "legendFormat": "items", "legendLink": null @@ -34544,7 +33220,7 @@ data: "span": 4, "targets": [ { - "expr": "sum by(operation) (\n # Backwards compatibility\n rate(thanos_memcached_operations_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n component=\"querier\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n or ignoring(backend)\n rate(thanos_cache_operations_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n component=\"querier\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n)\n", + "expr": "sum by(operation) (\n rate(thanos_cache_operations_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n component=\"querier\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n)\n", "format": "time_series", "legendFormat": "{{operation}}", "legendLink": null @@ -34570,7 +33246,6 @@ data: } }, "min": 0, - "noValue": 0, "thresholds": { "mode": "absolute", "steps": [ ] @@ -34581,6 +33256,7 @@ data: }, "id": 39, "links": [ ], + "nullPointMode": "null as zero", "options": { "legend": { "showLegend": true @@ -34593,29 +33269,44 @@ data: "span": 4, "targets": [ { - "expr": "histogram_quantile(0.99, sum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n operation=\"getmulti\",\n component=\"querier\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n operation=\"getmulti\",\n component=\"querier\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])\n) by (le)) * 1e3\n", + "expr": "histogram_quantile(0.99, sum(rate(thanos_cache_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n operation=\"getmulti\",\n component=\"querier\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])) by (le)) * 1e3", "format": "time_series", - "intervalFactor": 2, "legendFormat": "99th Percentile", "refId": "A" }, { - "expr": "histogram_quantile(0.50, sum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n operation=\"getmulti\",\n component=\"querier\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n operation=\"getmulti\",\n component=\"querier\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])\n) by (le)) * 1e3\n", + "expr": "histogram_quantile(0.50, sum(rate(thanos_cache_operation_duration_seconds_bucket{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n operation=\"getmulti\",\n component=\"querier\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])) by (le)) * 1e3", "format": "time_series", - "intervalFactor": 2, "legendFormat": "50th Percentile", "refId": "B" }, { - "expr": "sum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_sum{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n operation=\"getmulti\",\n component=\"querier\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_sum{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n operation=\"getmulti\",\n component=\"querier\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])\n) * 1e3\n/\nsum(\n # Backwards compatibility\n rate(thanos_memcached_operation_duration_seconds_count{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n operation=\"getmulti\",\n component=\"querier\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])\n or\n rate(thanos_cache_operation_duration_seconds_count{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n operation=\"getmulti\",\n component=\"querier\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])\n)\n", + "expr": "sum(rate(thanos_cache_operation_duration_seconds_sum{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n operation=\"getmulti\",\n component=\"querier\",\n name=\"metadata-cache\"\n}\n[$__rate_interval])) * 1e3 / sum(rate(thanos_cache_operation_duration_seconds_count{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n operation=\"getmulti\",\n component=\"querier\",\n name=\"metadata-cache\"\n}\n[$__rate_interval]))", "format": "time_series", - "intervalFactor": 2, "legendFormat": "Average", "refId": "C" } ], "title": "Latency (getmulti)", - "type": "timeseries" + "type": "timeseries", + "yaxes": [ + { + "format": "ms", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "short", + "label": null, + "logBase": 1, + "max": null, + "min": null, + "show": false + } + ] }, { "datasource": "$datasource", @@ -34656,7 +33347,7 @@ data: "span": 4, "targets": [ { - "expr": "sum(\n # Backwards compatibility\n rate(thanos_cache_memcached_hits_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n component=\"querier\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n or\n rate(thanos_cache_hits_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n component=\"querier\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n)\n/\nsum(\n # Backwards compatibility\n rate(thanos_cache_memcached_requests_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n component=\"querier\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n or\n rate(thanos_cache_requests_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n component=\"querier\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n)\n", + "expr": "sum(\n rate(thanos_cache_hits_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n component=\"querier\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n)\n/\nsum(\n rate(thanos_cache_requests_total{\n cluster=~\"$cluster\", job=~\"($namespace)/((mimir|querier.*|cortex|mimir-read.*))\",\n component=\"querier\",\n name=\"metadata-cache\"\n }[$__rate_interval])\n)\n", "format": "time_series", "legendFormat": "items", "legendLink": null @@ -55196,1133 +53887,571 @@ apiVersion: v1 data: namespace-by-pod.json: |- { - "__inputs": [ ], - "__requires": [ ], - "annotations": { - "list": [ - { - "builtIn": 1, - "datasource": "-- Grafana --", - "enable": true, - "hide": true, - "iconColor": "rgba(0, 211, 255, 1)", - "name": "Annotations & Alerts", - "type": "dashboard" - } - ] - }, - "editable": true, - "gnetId": null, - "graphTooltip": 0, - "hideControls": false, - "id": null, - "links": [ ], + "editable": false, + "links": [ + { + "asDropdown": true, + "includeVars": true, + "keepTime": true, + "tags": [ + "kubernetes-mixin", + "infrastucture" + ], + "targetBlank": false, + "title": "Kubernetes", + "type": "dashboards" + } + ], "panels": [ { - "collapse": false, - "collapsed": false, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 0 + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" }, - "id": 2, - "panels": [ ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Current Bandwidth", - "titleSize": "h6", - "type": "row" - }, - { - "cacheTimeout": null, - "colorBackground": false, - "colorValue": false, - "colors": [ - "#299c46", - "rgba(237, 129, 40, 0.89)", - "#d44a3a" - ], - "datasource": "$datasource", - "decimals": 0, - "format": "time_series", - "gauge": { - "maxValue": 100, - "minValue": 0, - "show": false, - "thresholdLabels": false, - "thresholdMarkers": true + "fieldConfig": { + "defaults": { + "displayName": "$namespace", + "max": 10000000000, + "min": 0, + "thresholds": { + "steps": [ + { + "color": "dark-green", + "index": 0, + "value": null + }, + { + "color": "dark-yellow", + "index": 1, + "value": 5000000000 + }, + { + "color": "dark-red", + "index": 2, + "value": 7000000000 + } + ] + }, + "unit": "Bps" + } }, "gridPos": { "h": 9, "w": 12, "x": 0, - "y": 1 - }, - "height": 9, - "id": 3, - "interval": null, - "links": [ ], - "mappingType": 1, - "mappingTypes": [ - { - "name": "value to text", - "value": 1 - }, - { - "name": "range to text", - "value": 2 - } - ], - "maxDataPoints": 100, - "minSpan": 12, - "nullPointMode": "connected", - "nullText": null, - "options": { - "fieldOptions": { - "calcs": [ - "last" - ], - "defaults": { - "max": 10000000000, - "min": 0, - "title": "$namespace", - "unit": "Bps" - }, - "mappings": [ ], - "override": { }, - "thresholds": [ - { - "color": "dark-green", - "index": 0, - "value": null - }, - { - "color": "dark-yellow", - "index": 1, - "value": 5000000000 - }, - { - "color": "dark-red", - "index": 2, - "value": 7000000000 - } - ], - "values": false - } + "y": 0 }, - "postfix": "", - "postfixFontSize": "50%", - "prefix": "", - "prefixFontSize": "50%", - "rangeMaps": [ - { - "from": "null", - "text": "N/A", - "to": "null" - } - ], - "span": 12, - "sparkline": { - "fillColor": "rgba(31, 118, 189, 0.18)", - "full": false, - "lineColor": "rgb(31, 120, 193)", - "show": false - }, - "tableColumn": "", + "id": 1, + "pluginVersion": "v11.1.0", "targets": [ { - "expr": "sum(irate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution]))", - "format": "time_series", - "instant": null, - "intervalFactor": 1, - "legendFormat": "", - "refId": "A" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum (\n rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", + "legendFormat": "__auto" } ], - "thresholds": "", - "timeFrom": null, - "timeShift": null, "title": "Current Rate of Bytes Received", - "type": "gauge", - "valueFontSize": "80%", - "valueMaps": [ - { - "op": "=", - "text": "N/A", - "value": "null" - } - ], - "valueName": "current" + "type": "gauge" }, { - "cacheTimeout": null, - "colorBackground": false, - "colorValue": false, - "colors": [ - "#299c46", - "rgba(237, 129, 40, 0.89)", - "#d44a3a" - ], - "datasource": "$datasource", - "decimals": 0, - "format": "time_series", - "gauge": { - "maxValue": 100, - "minValue": 0, - "show": false, - "thresholdLabels": false, - "thresholdMarkers": true + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "displayName": "$namespace", + "max": 10000000000, + "min": 0, + "thresholds": { + "steps": [ + { + "color": "dark-green", + "index": 0, + "value": null + }, + { + "color": "dark-yellow", + "index": 1, + "value": 5000000000 + }, + { + "color": "dark-red", + "index": 2, + "value": 7000000000 + } + ] + }, + "unit": "Bps" + } }, "gridPos": { "h": 9, "w": 12, "x": 12, - "y": 1 - }, - "height": 9, - "id": 4, - "interval": null, - "links": [ ], - "mappingType": 1, - "mappingTypes": [ - { - "name": "value to text", - "value": 1 - }, - { - "name": "range to text", - "value": 2 - } - ], - "maxDataPoints": 100, - "minSpan": 12, - "nullPointMode": "connected", - "nullText": null, - "options": { - "fieldOptions": { - "calcs": [ - "last" - ], - "defaults": { - "max": 10000000000, - "min": 0, - "title": "$namespace", - "unit": "Bps" - }, - "mappings": [ ], - "override": { }, - "thresholds": [ - { - "color": "dark-green", - "index": 0, - "value": null - }, - { - "color": "dark-yellow", - "index": 1, - "value": 5000000000 - }, - { - "color": "dark-red", - "index": 2, - "value": 7000000000 - } - ], - "values": false - } + "y": 0 }, - "postfix": "", - "postfixFontSize": "50%", - "prefix": "", - "prefixFontSize": "50%", - "rangeMaps": [ - { - "from": "null", - "text": "N/A", - "to": "null" - } - ], - "span": 12, - "sparkline": { - "fillColor": "rgba(31, 118, 189, 0.18)", - "full": false, - "lineColor": "rgb(31, 120, 193)", - "show": false - }, - "tableColumn": "", + "id": 2, + "pluginVersion": "v11.1.0", "targets": [ { - "expr": "sum(irate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution]))", - "format": "time_series", - "instant": null, - "intervalFactor": 1, - "legendFormat": "", - "refId": "A" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum (\n rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", + "legendFormat": "__auto" } ], - "thresholds": "", - "timeFrom": null, - "timeShift": null, "title": "Current Rate of Bytes Transmitted", - "type": "gauge", - "valueFontSize": "80%", - "valueMaps": [ - { - "op": "=", - "text": "N/A", - "value": "null" - } - ], - "valueName": "current" + "type": "gauge" }, { - "columns": [ - { - "text": "Time", - "value": "Time" - }, - { - "text": "Value #A", - "value": "Value #A" - }, - { - "text": "Value #B", - "value": "Value #B" - }, - { - "text": "Value #C", - "value": "Value #C" - }, - { - "text": "Value #D", - "value": "Value #D" - }, - { - "text": "Value #E", - "value": "Value #E" - }, - { - "text": "Value #F", - "value": "Value #F" - }, - { - "text": "pod", - "value": "pod" - } - ], - "datasource": "$datasource", - "fill": 1, - "fontSize": "100%", + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "overrides": [ + { + "matcher": { + "id": "byRegexp", + "options": "/Bandwidth/" + }, + "properties": [ + { + "id": "unit", + "value": "Bps" + } + ] + }, + { + "matcher": { + "id": "byRegexp", + "options": "/Packets/" + }, + "properties": [ + { + "id": "unit", + "value": "pps" + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Pod" + }, + "properties": [ + { + "id": "links", + "value": [ + { + "title": "Drill down", + "url": "/d/7a18067ce943a40ae25454675c19ff5c/kubernetes-networking-pod?${datasource:queryparam}&var-cluster=${cluster}&var-namespace=${namespace}&var-pod=${__data.fields.Pod}" + } + ] + } + ] + } + ] + }, "gridPos": { "h": 9, "w": 24, - "x": 0, - "y": 10 - }, - "id": 5, - "lines": true, - "linewidth": 1, - "links": [ ], - "minSpan": 24, - "nullPointMode": "null as zero", - "renderer": "flot", - "scroll": true, - "showHeader": true, - "sort": { - "col": 0, - "desc": false - }, - "spaceLength": 10, - "span": 24, - "styles": [ - { - "alias": "Time", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Time", - "thresholds": [ ], - "type": "hidden", - "unit": "short" - }, - { - "alias": "Bandwidth Received", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #A", - "thresholds": [ ], - "type": "number", - "unit": "Bps" - }, - { - "alias": "Bandwidth Transmitted", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #B", - "thresholds": [ ], - "type": "number", - "unit": "Bps" - }, - { - "alias": "Rate of Received Packets", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #C", - "thresholds": [ ], - "type": "number", - "unit": "pps" - }, - { - "alias": "Rate of Transmitted Packets", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #D", - "thresholds": [ ], - "type": "number", - "unit": "pps" - }, - { - "alias": "Rate of Received Packets Dropped", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #E", - "thresholds": [ ], - "type": "number", - "unit": "pps" - }, - { - "alias": "Rate of Transmitted Packets Dropped", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #F", - "thresholds": [ ], - "type": "number", - "unit": "pps" - }, - { - "alias": "Pod", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": true, - "linkTooltip": "Drill down", - "linkUrl": "d/7a18067ce943a40ae25454675c19ff5c/kubernetes-networking-pod?orgId=1&refresh=30s&var-namespace=$namespace&var-pod=$__cell", - "pattern": "pod", - "thresholds": [ ], - "type": "number", - "unit": "short" - } - ], + "x": 0, + "y": 9 + }, + "id": 3, + "pluginVersion": "v11.1.0", "targets": [ { - "expr": "sum(irate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])) by (pod)", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum by (pod) (\n rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "A", - "step": 10 + "instant": true }, { - "expr": "sum(irate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])) by (pod)", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum by (pod) (\n rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "B", - "step": 10 + "instant": true }, { - "expr": "sum(irate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])) by (pod)", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum by (pod) (\n rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "C", - "step": 10 + "instant": true }, { - "expr": "sum(irate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])) by (pod)", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum by (pod) (\n rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "D", - "step": 10 + "instant": true }, { - "expr": "sum(irate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])) by (pod)", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum by (pod) (\n rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "E", - "step": 10 + "instant": true }, { - "expr": "sum(irate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])) by (pod)", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum by (pod) (\n rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "F", - "step": 10 + "instant": true + } + ], + "title": "Current Network Usage", + "transformations": [ + { + "id": "joinByField", + "options": { + "byField": "pod", + "mode": "outer" + } + }, + { + "id": "organize", + "options": { + "excludeByName": { + "Time": true, + "Time 1": true, + "Time 2": true, + "Time 3": true, + "Time 4": true, + "Time 5": true, + "Time 6": true + }, + "indexByName": { + "Time 1": 0, + "Time 2": 1, + "Time 3": 2, + "Time 4": 3, + "Time 5": 4, + "Time 6": 5, + "Value #A": 7, + "Value #B": 8, + "Value #C": 9, + "Value #D": 10, + "Value #E": 11, + "Value #F": 12, + "pod": 6 + }, + "renameByName": { + "Value #A": "Current Receive Bandwidth", + "Value #B": "Current Transmit Bandwidth", + "Value #C": "Rate of Received Packets", + "Value #D": "Rate of Transmitted Packets", + "Value #E": "Rate of Received Packets Dropped", + "Value #F": "Rate of Transmitted Packets Dropped", + "pod": "Pod" + } + } } ], - "timeFrom": null, - "timeShift": null, - "title": "Current Status", "type": "table" }, { - "collapse": false, - "collapsed": false, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 19 + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "showPoints": "never" + }, + "unit": "binBps" + } }, - "id": 6, - "panels": [ ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Bandwidth", - "titleSize": "h6", - "type": "row" - }, - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, "gridPos": { "h": 9, "w": 12, "x": 0, - "y": 20 + "y": 18 }, - "id": 7, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "id": 4, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { - "expr": "sum(irate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])) by (pod)", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum by (pod) (\n rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", + "legendFormat": "__auto" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "Receive Bandwidth", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "showPoints": "never" + }, + "unit": "binBps" + } + }, "gridPos": { "h": 9, "w": 12, "x": 12, - "y": 20 + "y": 18 }, - "id": 8, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "id": 5, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { - "expr": "sum(irate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])) by (pod)", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum by (pod) (\n rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", + "legendFormat": "__auto" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "Transmit Bandwidth", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "fieldConfig": { + "defaults": { + "custom": { + "showPoints": "never" + }, + "unit": "pps" + } }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true + "gridPos": { + "h": 9, + "w": 12, + "x": 0, + "y": 27 + }, + "id": 6, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum by (pod) (\n rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", + "legendFormat": "__auto" } - ] + ], + "title": "Rate of Received Packets", + "type": "timeseries" }, { - "collapse": true, - "collapsed": true, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 29 + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" }, - "id": 9, - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 10, - "w": 12, - "x": 0, - "y": 30 - }, - "id": 10, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sum(irate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])) by (pod)", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Received Packets", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "fieldConfig": { + "defaults": { + "custom": { + "showPoints": "never" }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "unit": "pps" + } + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 27 + }, + "id": 7, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 10, - "w": 12, - "x": 12, - "y": 30 - }, - "id": 11, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sum(irate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])) by (pod)", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Transmitted Packets", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "sum by (pod) (\n rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", + "legendFormat": "__auto" + } + ], + "title": "Rate of Transmitted Packets", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "showPoints": "never" }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "unit": "pps" + } + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 0, + "y": 36 + }, + "id": 8, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum by (pod) (\n rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", + "legendFormat": "__auto" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Packets", - "titleSize": "h6", - "type": "row" + "title": "Rate of Received Packets Dropped", + "type": "timeseries" }, { - "collapse": true, - "collapsed": true, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 30 + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" }, - "id": 12, - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 10, - "w": 12, - "x": 0, - "y": 40 - }, - "id": 13, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sum(irate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])) by (pod)", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Received Packets Dropped", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "fieldConfig": { + "defaults": { + "custom": { + "showPoints": "never" }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "unit": "pps" + } + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 36 + }, + "id": 9, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 10, - "w": 12, - "x": 12, - "y": 40 - }, - "id": 14, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sum(irate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])) by (pod)", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Transmitted Packets Dropped", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "expr": "sum by (pod) (\n rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n", + "legendFormat": "__auto" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Errors", - "titleSize": "h6", - "type": "row" + "title": "Rate of Transmitted Packets Dropped", + "type": "timeseries" } ], "refresh": "10s", - "rows": [ ], - "schemaVersion": 18, - "style": "dark", + "schemaVersion": 39, "tags": [ "kubernetes-mixin", "infrastucture" @@ -56338,135 +54467,42 @@ data: "hide": 0, "label": "Data source", "name": "datasource", - "options": [ ], "query": "prometheus", - "refresh": 1, "regex": "", "type": "datasource" }, { - "allValue": null, - "current": { }, - "datasource": "$datasource", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "hide": 0, - "includeAll": false, - "label": null, - "multi": false, + "label": "cluster", "name": "cluster", - "options": [ ], "query": "label_values(up{job=\"integrations/kubernetes/cadvisor\"}, cluster)", "refresh": 2, - "regex": "", - "sort": 0, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "sort": 1, + "type": "query" }, { "allValue": ".+", - "auto": false, - "auto_count": 30, - "auto_min": "10s", "current": { + "selected": false, "text": "kube-system", "value": "kube-system" }, - "datasource": "$datasource", - "definition": "label_values(container_network_receive_packets_total{cluster=\"$cluster\"}, namespace)", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "hide": 0, "includeAll": true, - "label": null, - "multi": false, + "label": "namespace", "name": "namespace", - "options": [ ], "query": "label_values(container_network_receive_packets_total{cluster=\"$cluster\"}, namespace)", "refresh": 2, - "regex": "", - "skipUrlSync": false, - "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false - }, - { - "allValue": null, - "auto": false, - "auto_count": 30, - "auto_min": "10s", - "current": { - "text": "5m", - "value": "5m" - }, - "datasource": "$datasource", - "hide": 0, - "includeAll": false, - "label": null, - "multi": false, - "name": "resolution", - "options": [ - { - "selected": false, - "text": "30s", - "value": "30s" - }, - { - "selected": true, - "text": "5m", - "value": "5m" - }, - { - "selected": false, - "text": "1h", - "value": "1h" - } - ], - "query": "30s,5m,1h", - "refresh": 2, - "regex": "", - "skipUrlSync": false, - "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "interval", - "useTags": false - }, - { - "allValue": null, - "auto": false, - "auto_count": 30, - "auto_min": "10s", - "current": { - "text": "5m", - "value": "5m" - }, - "datasource": "$datasource", - "hide": 2, - "includeAll": false, - "label": null, - "multi": false, - "name": "interval", - "options": [ - { - "selected": true, - "text": "4h", - "value": "4h" - } - ], - "query": "4h", - "refresh": 2, - "regex": "", - "skipUrlSync": false, "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "interval", - "useTags": false + "type": "query" } ] }, @@ -56474,35 +54510,9 @@ data: "from": "now-1h", "to": "now" }, - "timepicker": { - "refresh_intervals": [ - "5s", - "10s", - "30s", - "1m", - "5m", - "15m", - "30m", - "1h", - "2h", - "1d" - ], - "time_options": [ - "5m", - "15m", - "1h", - "6h", - "12h", - "24h", - "2d", - "7d", - "30d" - ] - }, "timezone": "browser", "title": "Kubernetes / Networking / Namespace (Pods)", - "uid": "8b7a8b326d7a6f1f04244066368c67af", - "version": 0 + "uid": "8b7a8b326d7a6f1f04244066368c67af" } kind: ConfigMap metadata: @@ -56517,1345 +54527,717 @@ apiVersion: v1 data: namespace-by-workload.json: |- { - "__inputs": [ ], - "__requires": [ ], - "annotations": { - "list": [ - { - "builtIn": 1, - "datasource": "-- Grafana --", - "enable": true, - "hide": true, - "iconColor": "rgba(0, 211, 255, 1)", - "name": "Annotations & Alerts", - "type": "dashboard" - } - ] - }, - "editable": true, - "gnetId": null, - "graphTooltip": 0, - "hideControls": false, - "id": null, - "links": [ ], - "panels": [ + "editable": false, + "links": [ { - "collapse": false, - "collapsed": false, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 0 - }, - "id": 2, - "panels": [ ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Current Bandwidth", - "titleSize": "h6", - "type": "row" - }, + "asDropdown": true, + "includeVars": true, + "keepTime": true, + "tags": [ + "kubernetes-mixin", + "infrastucture" + ], + "targetBlank": false, + "title": "Kubernetes", + "type": "dashboards" + } + ], + "panels": [ { - "aliasColors": { }, - "bars": true, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 9, - "w": 12, - "x": 0, - "y": 1 - }, - "id": 3, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "sort": "current", - "sortDesc": true, - "total": false, - "values": true + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" }, - "lines": false, - "linewidth": 1, - "links": [ ], - "minSpan": 24, - "nullPointMode": "null", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 24, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "sort_desc(sum(irate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{ workload }}", - "refId": "A", - "step": 10 + "fieldConfig": { + "defaults": { + "color": { + "fixedColor": "green", + "mode": "fixed" + }, + "unit": "Bps" } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Current Rate of Bytes Received", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "series", - "name": null, - "show": false, - "values": [ - "current" - ] }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] - }, - { - "aliasColors": { }, - "bars": true, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, "gridPos": { "h": 9, "w": 12, - "x": 12, - "y": 1 + "x": 0, + "y": 0 }, - "id": 4, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "sort": "current", - "sortDesc": true, - "total": false, - "values": true + "id": 1, + "options": { + "displayMode": "basic", + "showUnfilled": false }, - "lines": false, - "linewidth": 1, - "links": [ ], - "minSpan": 24, - "nullPointMode": "null", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 24, - "stack": false, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { - "expr": "sort_desc(sum(irate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{ workload }}", - "refId": "A", - "step": 10 - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Current Rate of Bytes Transmitted", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "series", - "name": null, - "show": false, - "values": [ - "current" - ] - }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] - }, - { - "columns": [ - { - "text": "Time", - "value": "Time" - }, - { - "text": "Value #A", - "value": "Value #A" - }, - { - "text": "Value #B", - "value": "Value #B" - }, - { - "text": "Value #C", - "value": "Value #C" - }, - { - "text": "Value #D", - "value": "Value #D" - }, - { - "text": "Value #E", - "value": "Value #E" - }, - { - "text": "Value #F", - "value": "Value #F" - }, - { - "text": "Value #G", - "value": "Value #G" - }, - { - "text": "Value #H", - "value": "Value #H" - }, - { - "text": "workload", - "value": "workload" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sort_desc(sum(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" } ], - "datasource": "$datasource", - "fill": 1, - "fontSize": "90%", + "title": "Current Rate of Bytes Received", + "type": "bargauge" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "color": { + "fixedColor": "green", + "mode": "fixed" + }, + "unit": "Bps" + } + }, "gridPos": { "h": 9, - "w": 24, - "x": 0, - "y": 10 + "w": 12, + "x": 12, + "y": 0 }, - "id": 5, - "lines": true, - "linewidth": 1, - "links": [ ], - "minSpan": 24, - "nullPointMode": "null as zero", - "renderer": "flot", - "scroll": true, - "showHeader": true, - "sort": { - "col": 0, - "desc": false + "id": 2, + "options": { + "displayMode": "basic", + "showUnfilled": false }, - "spaceLength": 10, - "span": 24, - "styles": [ - { - "alias": "Time", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Time", - "thresholds": [ ], - "type": "hidden", - "unit": "short" - }, - { - "alias": "Current Bandwidth Received", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #A", - "thresholds": [ ], - "type": "number", - "unit": "Bps" - }, - { - "alias": "Current Bandwidth Transmitted", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #B", - "thresholds": [ ], - "type": "number", - "unit": "Bps" - }, - { - "alias": "Average Bandwidth Received", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #C", - "thresholds": [ ], - "type": "number", - "unit": "Bps" - }, - { - "alias": "Average Bandwidth Transmitted", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #D", - "thresholds": [ ], - "type": "number", - "unit": "Bps" - }, - { - "alias": "Rate of Received Packets", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #E", - "thresholds": [ ], - "type": "number", - "unit": "pps" - }, - { - "alias": "Rate of Transmitted Packets", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #F", - "thresholds": [ ], - "type": "number", - "unit": "pps" - }, - { - "alias": "Rate of Received Packets Dropped", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #G", - "thresholds": [ ], - "type": "number", - "unit": "pps" - }, - { - "alias": "Rate of Transmitted Packets Dropped", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": false, - "linkTooltip": "Drill down", - "linkUrl": "", - "pattern": "Value #H", - "thresholds": [ ], - "type": "number", - "unit": "pps" - }, + "pluginVersion": "v11.1.0", + "targets": [ { - "alias": "Workload", - "colorMode": null, - "colors": [ ], - "dateFormat": "YYYY-MM-DD HH:mm:ss", - "decimals": 2, - "link": true, - "linkTooltip": "Drill down", - "linkUrl": "d/728bf77cc1166d2f3133bf25846876cc/kubernetes-networking-workload?orgId=1&refresh=30s&var-namespace=$namespace&var-type=$type&var-workload=$__cell", - "pattern": "workload", - "thresholds": [ ], - "type": "number", - "unit": "short" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sort_desc(sum(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" } ], + "title": "Current Rate of Bytes Transmitted", + "type": "bargauge" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "overrides": [ + { + "matcher": { + "id": "byRegexp", + "options": "/Bytes/" + }, + "properties": [ + { + "id": "unit", + "value": "binBps" + } + ] + }, + { + "matcher": { + "id": "byRegexp", + "options": "/Packets/" + }, + "properties": [ + { + "id": "unit", + "value": "pps" + } + ] + }, + { + "matcher": { + "id": "byName", + "options": "Workload" + }, + "properties": [ + { + "id": "links", + "value": [ + { + "title": "Drill down", + "url": "/d/728bf77cc1166d2f3133bf25846876cc/kubernetes-networking-workload?${datasource:queryparam}&var-cluster=${cluster}&var-namespace=${namespace}&var-type=${__data.fields.Type}&var-workload=${__data.fields.Workload}" + } + ] + } + ] + } + ] + }, + "gridPos": { + "h": 9, + "w": 24, + "x": 0, + "y": 9 + }, + "id": 3, + "pluginVersion": "v11.1.0", "targets": [ { - "expr": "sort_desc(sum(irate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sort_desc(sum(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod) kube_pod_info{cluster=\"$cluster\",namespace=\"$namespace\",host_network=\"false\"}\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n", "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "A", - "step": 10 + "instant": true }, { - "expr": "sort_desc(sum(irate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sort_desc(sum(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod) kube_pod_info{cluster=\"$cluster\",namespace=\"$namespace\",host_network=\"false\"}\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n", "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "B", - "step": 10 + "instant": true }, { - "expr": "sort_desc(avg(irate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sort_desc(avg(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod) kube_pod_info{cluster=\"$cluster\",namespace=\"$namespace\",host_network=\"false\"}\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n", "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "C", - "step": 10 + "instant": true }, { - "expr": "sort_desc(avg(irate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sort_desc(avg(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod) kube_pod_info{cluster=\"$cluster\",namespace=\"$namespace\",host_network=\"false\"}\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n", "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "D", - "step": 10 + "instant": true }, { - "expr": "sort_desc(sum(irate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sort_desc(sum(rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod) kube_pod_info{cluster=\"$cluster\",namespace=\"$namespace\",host_network=\"false\"}\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n", "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "E", - "step": 10 + "instant": true }, { - "expr": "sort_desc(sum(irate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sort_desc(sum(rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod) kube_pod_info{cluster=\"$cluster\",namespace=\"$namespace\",host_network=\"false\"}\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n", "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "F", - "step": 10 + "instant": true }, { - "expr": "sort_desc(sum(irate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sort_desc(sum(rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod) kube_pod_info{cluster=\"$cluster\",namespace=\"$namespace\",host_network=\"false\"}\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n", "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "G", - "step": 10 + "instant": true }, { - "expr": "sort_desc(sum(irate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sort_desc(sum(rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod) kube_pod_info{cluster=\"$cluster\",namespace=\"$namespace\",host_network=\"false\"}\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n", "format": "table", - "instant": true, - "intervalFactor": 2, - "legendFormat": "", - "refId": "H", - "step": 10 + "instant": true } ], - "timeFrom": null, - "timeShift": null, "title": "Current Status", + "transformations": [ + { + "id": "joinByField", + "options": { + "byField": "workload", + "mode": "outer" + } + }, + { + "id": "organize", + "options": { + "excludeByName": { + "Time": true, + "Time 1": true, + "Time 2": true, + "Time 3": true, + "Time 4": true, + "Time 5": true, + "Time 6": true, + "Time 7": true, + "Time 8": true, + "workload_type 2": true, + "workload_type 3": true, + "workload_type 4": true, + "workload_type 5": true, + "workload_type 6": true, + "workload_type 7": true, + "workload_type 8": true + }, + "indexByName": { + "Time 1": 0, + "Time 2": 1, + "Time 3": 2, + "Time 4": 3, + "Time 5": 4, + "Time 6": 5, + "Time 7": 6, + "Time 8": 7, + "Value #A": 10, + "Value #B": 11, + "Value #C": 12, + "Value #D": 13, + "Value #E": 14, + "Value #F": 15, + "Value #G": 16, + "Value #H": 17, + "workload": 8, + "workload_type 1": 9, + "workload_type 2": 18, + "workload_type 3": 19, + "workload_type 4": 20, + "workload_type 5": 21, + "workload_type 6": 22, + "workload_type 7": 23, + "workload_type 8": 24 + }, + "renameByName": { + "Value #A": "Rx Bytes", + "Value #B": "Tx Bytes", + "Value #C": "Rx Bytes (Avg)", + "Value #D": "Tx Bytes (Avg)", + "Value #E": "Rx Packets", + "Value #F": "Tx Packets", + "Value #G": "Rx Packets Dropped", + "Value #H": "Tx Packets Dropped", + "workload": "Workload", + "workload_type 1": "Type" + } + } + } + ], "type": "table" }, { - "collapse": true, - "collapsed": true, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "Bps" + } + }, "gridPos": { - "h": 1, - "w": 24, + "h": 9, + "w": 12, "x": 0, - "y": 19 + "y": 18 }, - "id": 6, - "panels": [ + "id": 4, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": true, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 9, - "w": 12, - "x": 0, - "y": 20 + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "id": 7, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "sort": "current", - "sortDesc": true, - "total": false, - "values": true + "expr": "sort_desc(sum(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" + } + ], + "title": "Receive Bandwidth", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": false, - "linewidth": 1, - "links": [ ], - "minSpan": 24, - "nullPointMode": "null", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 24, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "sort_desc(avg(irate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{ workload }}", - "refId": "A", - "step": 10 - } + "unit": "Bps" + } + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 18 + }, + "id": 5, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Average Rate of Bytes Received", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "series", - "name": null, - "show": false, - "values": [ - "current" - ] - }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": true, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 9, - "w": 12, - "x": 12, - "y": 20 + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "id": 8, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "sort": "current", - "sortDesc": true, - "total": false, - "values": true + "expr": "sort_desc(sum(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" + } + ], + "title": "Transmit Bandwidth", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": false, - "linewidth": 1, - "links": [ ], - "minSpan": 24, - "nullPointMode": "null", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 24, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "sort_desc(avg(irate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{ workload }}", - "refId": "A", - "step": 10 - } + "unit": "Bps" + } + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 0, + "y": 27 + }, + "id": 6, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Average Rate of Bytes Transmitted", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "series", - "name": null, - "show": false, - "values": [ - "current" - ] + "expr": "sort_desc(avg(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" + } + ], + "title": "Average Container Bandwidth by Workload: Received", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "unit": "Bps" + } + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 27 + }, + "id": 7, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sort_desc(avg(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Average Bandwidth", - "titleSize": "h6", - "type": "row" + "title": "Average Container Bandwidth by Workload: Transmitted", + "type": "timeseries" }, { - "collapse": false, - "collapsed": false, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 29 + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "pps" + } }, - "id": 9, - "panels": [ ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Bandwidth HIstory", - "titleSize": "h6", - "type": "row" - }, - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, "gridPos": { "h": 9, "w": 12, "x": 0, - "y": 38 + "y": 36 }, - "id": 10, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "id": 8, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { - "expr": "sort_desc(sum(irate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{workload}}", - "refId": "A", - "step": 10 + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sort_desc(sum(rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Receive Bandwidth", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "title": "Rate of Received Packets", + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "pps" + } + }, "gridPos": { "h": 9, "w": 12, "x": 12, - "y": 38 + "y": 36 }, - "id": 11, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "id": 9, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { - "expr": "sort_desc(sum(irate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{workload}}", - "refId": "A", - "step": 10 + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sort_desc(sum(rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Transmit Bandwidth", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "title": "Rate of Transmitted Packets", + "type": "timeseries" }, { - "collapse": true, - "collapsed": true, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "pps" + } + }, "gridPos": { - "h": 1, - "w": 24, + "h": 9, + "w": 12, "x": 0, - "y": 39 + "y": 45 }, - "id": 12, - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 9, - "w": 12, - "x": 0, - "y": 40 - }, - "id": 13, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sort_desc(sum(irate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{workload}}", - "refId": "A", - "step": 10 - } + "id": 10, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Received Packets", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 9, - "w": 12, - "x": 12, - "y": 40 - }, - "id": 14, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sort_desc(sum(irate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{workload}}", - "refId": "A", - "step": 10 - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Transmitted Packets", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "expr": "sort_desc(sum(rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Packets", - "titleSize": "h6", - "type": "row" + "title": "Rate of Received Packets Dropped", + "type": "timeseries" }, { - "collapse": true, - "collapsed": true, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 40 + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" }, - "id": 15, - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 9, - "w": 12, - "x": 0, - "y": 41 - }, - "id": 16, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sort_desc(sum(irate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{workload}}", - "refId": "A", - "step": 10 - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Received Packets Dropped", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] - }, - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 9, - "w": 12, - "x": 12, - "y": 41 - }, - "id": 17, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sort_desc(sum(irate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{workload}}", - "refId": "A", - "step": 10 - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Transmitted Packets Dropped", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "unit": "pps" + } + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 45 + }, + "id": 11, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "expr": "sort_desc(sum(rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n", + "legendFormat": "__auto" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Errors", - "titleSize": "h6", - "type": "row" + "title": "Rate of Transmitted Packets Dropped", + "type": "timeseries" } ], "refresh": "10s", - "rows": [ ], - "schemaVersion": 18, - "style": "dark", + "schemaVersion": 39, "tags": [ "kubernetes-mixin", "infrastucture" @@ -57871,163 +55253,54 @@ data: "hide": 0, "label": "Data source", "name": "datasource", - "options": [ ], "query": "prometheus", - "refresh": 1, "regex": "", "type": "datasource" }, { - "allValue": null, - "current": { }, - "datasource": "$datasource", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "hide": 0, - "includeAll": false, - "label": null, - "multi": false, + "label": "cluster", "name": "cluster", - "options": [ ], "query": "label_values(up{job=\"integrations/kubernetes/cadvisor\"}, cluster)", "refresh": 2, - "regex": "", - "sort": 0, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "sort": 1, + "type": "query" }, { - "allValue": null, - "auto": false, - "auto_count": 30, - "auto_min": "10s", "current": { + "selected": false, "text": "kube-system", "value": "kube-system" }, - "datasource": "$datasource", - "definition": "label_values(container_network_receive_packets_total{cluster=\"$cluster\"}, namespace)", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "hide": 0, - "includeAll": false, - "label": null, - "multi": false, + "label": "namespace", "name": "namespace", - "options": [ ], "query": "label_values(container_network_receive_packets_total{cluster=\"$cluster\"}, namespace)", "refresh": 2, - "regex": "", - "skipUrlSync": false, "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "type": "query" }, { - "allValue": null, - "auto": false, - "auto_count": 30, - "auto_min": "10s", - "current": { - "text": "", - "value": "" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "datasource": "$datasource", - "definition": "label_values(namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\"}, workload_type)", "hide": 0, "includeAll": true, - "label": null, - "multi": false, + "label": "workload_type", "name": "type", - "options": [ ], - "query": "label_values(namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\"}, workload_type)", - "refresh": 2, - "regex": "", - "skipUrlSync": false, - "sort": 0, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false - }, - { - "allValue": null, - "auto": false, - "auto_count": 30, - "auto_min": "10s", - "current": { - "text": "5m", - "value": "5m" - }, - "datasource": "$datasource", - "hide": 0, - "includeAll": false, - "label": null, - "multi": false, - "name": "resolution", - "options": [ - { - "selected": false, - "text": "30s", - "value": "30s" - }, - { - "selected": true, - "text": "5m", - "value": "5m" - }, - { - "selected": false, - "text": "1h", - "value": "1h" - } - ], - "query": "30s,5m,1h", - "refresh": 2, - "regex": "", - "skipUrlSync": false, - "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "interval", - "useTags": false - }, - { - "allValue": null, - "auto": false, - "auto_count": 30, - "auto_min": "10s", - "current": { - "text": "5m", - "value": "5m" - }, - "datasource": "$datasource", - "hide": 2, - "includeAll": false, - "label": null, - "multi": false, - "name": "interval", - "options": [ - { - "selected": true, - "text": "4h", - "value": "4h" - } - ], - "query": "4h", + "query": "label_values(namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=\"$namespace\", workload=~\".+\"}, workload_type)", "refresh": 2, - "regex": "", - "skipUrlSync": false, "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "interval", - "useTags": false + "type": "query" } ] }, @@ -58035,35 +55308,9 @@ data: "from": "now-1h", "to": "now" }, - "timepicker": { - "refresh_intervals": [ - "5s", - "10s", - "30s", - "1m", - "5m", - "15m", - "30m", - "1h", - "2h", - "1d" - ], - "time_options": [ - "5m", - "15m", - "1h", - "6h", - "12h", - "24h", - "2d", - "7d", - "30d" - ] - }, "timezone": "browser", "title": "Kubernetes / Networking / Namespace (Workload)", - "uid": "bbb2a765a623ae38130206c7d94a160f", - "version": 0 + "uid": "bbb2a765a623ae38130206c7d94a160f" } kind: ConfigMap metadata: @@ -58078,378 +55325,249 @@ apiVersion: v1 data: persistentvolumesusage.json: |- { - "__inputs": [ ], - "__requires": [ ], - "annotations": { - "list": [ ] - }, "editable": false, - "gnetId": null, - "graphTooltip": 0, - "hideControls": false, - "id": null, - "links": [ ], - "refresh": "10s", - "rows": [ + "links": [ { - "collapse": false, - "collapsed": false, - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 2, - "legend": { - "alignAsTable": true, - "avg": true, - "current": true, - "max": true, - "min": true, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "asDropdown": true, + "includeVars": true, + "keepTime": true, + "tags": [ + "kubernetes-mixin", + "infrastucture" + ], + "targetBlank": false, + "title": "Kubernetes", + "type": "dashboards" + } + ], + "panels": [ + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 9, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "(\n sum without(instance, node) (topk(1, (kubelet_volume_stats_capacity_bytes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})))\n -\n sum without(instance, node) (topk(1, (kubelet_volume_stats_available_bytes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})))\n)\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "Used Space", - "refId": "A" - }, - { - "expr": "sum without(instance, node) (topk(1, (kubelet_volume_stats_available_bytes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "Free Space", - "refId": "B" - } + "unit": "bytes" + } + }, + "gridPos": { + "h": 7, + "w": 18, + "y": 0 + }, + "id": 1, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Volume Space Usage", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "bytes", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "bytes", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "cacheTimeout": null, - "colorBackground": false, - "colorValue": false, - "colors": [ - "rgba(50, 172, 45, 0.97)", - "rgba(237, 129, 40, 0.89)", - "rgba(245, 54, 54, 0.9)" - ], - "datasource": "$datasource", - "format": "percent", - "gauge": { - "maxValue": 100, - "minValue": 0, - "show": true, - "thresholdLabels": false, - "thresholdMarkers": true + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "gridPos": { }, - "id": 3, - "interval": null, - "links": [ ], - "mappingType": 1, - "mappingTypes": [ - { - "name": "value to text", - "value": 1 - }, - { - "name": "range to text", - "value": 2 - } - ], - "maxDataPoints": 100, - "nullPointMode": "connected", - "nullText": null, - "postfix": "", - "postfixFontSize": "50%", - "prefix": "", - "prefixFontSize": "50%", - "rangeMaps": [ - { - "from": "null", - "text": "N/A", - "to": "null" - } - ], - "span": 3, - "sparkline": { - "fillColor": "rgba(31, 118, 189, 0.18)", - "full": false, - "lineColor": "rgb(31, 120, 193)", - "show": false + "expr": "(\n sum without(instance, node) (topk(1, (kubelet_volume_stats_capacity_bytes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})))\n -\n sum without(instance, node) (topk(1, (kubelet_volume_stats_available_bytes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})))\n)\n", + "legendFormat": "Used Space" + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "tableColumn": "", - "targets": [ - { - "expr": "max without(instance,node) (\n(\n topk(1, kubelet_volume_stats_capacity_bytes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n -\n topk(1, kubelet_volume_stats_available_bytes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n)\n/\ntopk(1, kubelet_volume_stats_capacity_bytes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n* 100)\n", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "", - "refId": "A" - } - ], - "thresholds": "80, 90", - "title": "Volume Space Usage", - "type": "singlestat", - "valueFontSize": "80%", - "valueMaps": [ - { - "op": "=", - "text": "N/A", - "value": "null" - } - ], - "valueName": "current" + "expr": "sum without(instance, node) (topk(1, (kubelet_volume_stats_available_bytes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})))\n", + "legendFormat": "Free Space" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": false, - "title": "Dashboard Row", - "titleSize": "h6", - "type": "row" + "title": "Volume Space Usage", + "type": "timeseries" }, { - "collapse": false, - "collapsed": false, - "panels": [ + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "max": 100, + "min": 0, + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "orange", + "value": 80 + }, + { + "color": "red", + "value": 90 + } + ] + }, + "unit": "percent" + } + }, + "gridPos": { + "h": 7, + "w": 6, + "x": 18, + "y": 0 + }, + "id": 2, + "interval": "1m", + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 4, - "legend": { - "alignAsTable": true, - "avg": true, - "current": true, - "max": true, - "min": true, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 9, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sum without(instance, node) (topk(1, (kubelet_volume_stats_inodes_used{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "Used inodes", - "refId": "A" - }, - { - "expr": "(\n sum without(instance, node) (topk(1, (kubelet_volume_stats_inodes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})))\n -\n sum without(instance, node) (topk(1, (kubelet_volume_stats_inodes_used{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})))\n)\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": " Free inodes", - "refId": "B" - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Volume inodes Usage", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" + "expr": "max without(instance,node) (\n(\n topk(1, kubelet_volume_stats_capacity_bytes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n -\n topk(1, kubelet_volume_stats_available_bytes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n)\n/\ntopk(1, kubelet_volume_stats_capacity_bytes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n* 100)\n", + "instant": true + } + ], + "title": "Volume Space Usage", + "type": "gauge" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "unit": "none" + } + }, + "gridPos": { + "h": 7, + "w": 18, + "y": 7 + }, + "id": 3, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "none", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "none", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "expr": "sum without(instance, node) (topk(1, (kubelet_volume_stats_inodes_used{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})))", + "legendFormat": "Used inodes" }, { - "cacheTimeout": null, - "colorBackground": false, - "colorValue": false, - "colors": [ - "rgba(50, 172, 45, 0.97)", - "rgba(237, 129, 40, 0.89)", - "rgba(245, 54, 54, 0.9)" - ], - "datasource": "$datasource", - "format": "percent", - "gauge": { - "maxValue": 100, - "minValue": 0, - "show": true, - "thresholdLabels": false, - "thresholdMarkers": true - }, - "gridPos": { }, - "id": 5, - "interval": null, - "links": [ ], - "mappingType": 1, - "mappingTypes": [ - { - "name": "value to text", - "value": 1 - }, - { - "name": "range to text", - "value": 2 - } - ], - "maxDataPoints": 100, - "nullPointMode": "connected", - "nullText": null, - "postfix": "", - "postfixFontSize": "50%", - "prefix": "", - "prefixFontSize": "50%", - "rangeMaps": [ - { - "from": "null", - "text": "N/A", - "to": "null" - } - ], - "span": 3, - "sparkline": { - "fillColor": "rgba(31, 118, 189, 0.18)", - "full": false, - "lineColor": "rgb(31, 120, 193)", - "show": false + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "(\n sum without(instance, node) (topk(1, (kubelet_volume_stats_inodes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})))\n -\n sum without(instance, node) (topk(1, (kubelet_volume_stats_inodes_used{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})))\n)\n", + "legendFormat": "Free inodes" + } + ], + "title": "Volume inodes Usage", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "color": { + "mode": "thresholds" + }, + "max": 100, + "min": 0, + "thresholds": { + "mode": "absolute", + "steps": [ + { + "color": "green", + "value": 0 + }, + { + "color": "orange", + "value": 80 + }, + { + "color": "red", + "value": 90 + } + ] + }, + "unit": "percent" + } + }, + "gridPos": { + "h": 7, + "w": 6, + "x": 18, + "y": 7 + }, + "id": 4, + "interval": "1m", + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "tableColumn": "", - "targets": [ - { - "expr": "max without(instance,node) (\ntopk(1, kubelet_volume_stats_inodes_used{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n/\ntopk(1, kubelet_volume_stats_inodes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n* 100)\n", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "", - "refId": "A" - } - ], - "thresholds": "80, 90", - "title": "Volume inodes Usage", - "type": "singlestat", - "valueFontSize": "80%", - "valueMaps": [ - { - "op": "=", - "text": "N/A", - "value": "null" - } - ], - "valueName": "current" + "expr": "max without(instance,node) (\ntopk(1, kubelet_volume_stats_inodes_used{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n/\ntopk(1, kubelet_volume_stats_inodes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n* 100)\n", + "instant": true } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": false, - "title": "Dashboard Row", - "titleSize": "h6", - "type": "row" + "title": "Volume inodes Usage", + "type": "gauge" } ], - "schemaVersion": 14, - "style": "dark", + "refresh": "10s", + "schemaVersion": 39, "tags": [ "kubernetes-mixin", "infrastucture" @@ -58465,107 +55583,58 @@ data: "hide": 0, "label": "Data source", "name": "datasource", - "options": [ ], "query": "prometheus", - "refresh": 1, "regex": "", "type": "datasource" }, { - "allValue": null, - "current": { }, - "datasource": "$datasource", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "hide": 0, - "includeAll": false, "label": "cluster", - "multi": false, "name": "cluster", - "options": [ ], "query": "label_values(kubelet_volume_stats_capacity_bytes{job=\"integrations/kubernetes/kubelet\"}, cluster)", "refresh": 2, - "regex": "", "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "type": "query" }, { - "allValue": null, - "current": { }, - "datasource": "$datasource", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "hide": 0, - "includeAll": false, "label": "Namespace", - "multi": false, "name": "namespace", - "options": [ ], "query": "label_values(kubelet_volume_stats_capacity_bytes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\"}, namespace)", "refresh": 2, - "regex": "", "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "type": "query" }, { - "allValue": null, - "current": { }, - "datasource": "$datasource", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "hide": 0, - "includeAll": false, "label": "PersistentVolumeClaim", - "multi": false, "name": "volume", - "options": [ ], "query": "label_values(kubelet_volume_stats_capacity_bytes{cluster=\"$cluster\", job=\"integrations/kubernetes/kubelet\", namespace=\"$namespace\"}, persistentvolumeclaim)", "refresh": 2, - "regex": "", "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "type": "query" } ] }, "time": { - "from": "now-7d", + "from": "now-1h", "to": "now" }, - "timepicker": { - "refresh_intervals": [ - "5s", - "10s", - "30s", - "1m", - "5m", - "15m", - "30m", - "1h", - "2h", - "1d" - ], - "time_options": [ - "5m", - "15m", - "1h", - "6h", - "12h", - "24h", - "2d", - "7d", - "30d" - ] - }, "timezone": "browser", "title": "Kubernetes / Persistent Volumes", - "uid": "919b92a8e8041bd567af9edab12c840c", - "version": 0 + "uid": "919b92a8e8041bd567af9edab12c840c" } kind: ConfigMap metadata: @@ -58580,899 +55649,407 @@ apiVersion: v1 data: pod-total.json: |- { - "__inputs": [ ], - "__requires": [ ], - "annotations": { - "list": [ - { - "builtIn": 1, - "datasource": "-- Grafana --", - "enable": true, - "hide": true, - "iconColor": "rgba(0, 211, 255, 1)", - "name": "Annotations & Alerts", - "type": "dashboard" - } - ] - }, - "editable": true, - "gnetId": null, - "graphTooltip": 0, - "hideControls": false, - "id": null, - "links": [ ], + "editable": false, + "links": [ + { + "asDropdown": true, + "includeVars": true, + "keepTime": true, + "tags": [ + "kubernetes-mixin", + "infrastucture" + ], + "targetBlank": false, + "title": "Kubernetes", + "type": "dashboards" + } + ], "panels": [ { - "collapse": false, - "collapsed": false, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 0 + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" }, - "id": 2, - "panels": [ ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Current Bandwidth", - "titleSize": "h6", - "type": "row" - }, - { - "cacheTimeout": null, - "colorBackground": false, - "colorValue": false, - "colors": [ - "#299c46", - "rgba(237, 129, 40, 0.89)", - "#d44a3a" - ], - "datasource": "$datasource", - "decimals": 0, - "format": "time_series", - "gauge": { - "maxValue": 100, - "minValue": 0, - "show": false, - "thresholdLabels": false, - "thresholdMarkers": true + "fieldConfig": { + "defaults": { + "displayName": "$pod", + "max": 10000000000, + "min": 0, + "thresholds": { + "steps": [ + { + "color": "dark-green", + "index": 0, + "value": null + }, + { + "color": "dark-yellow", + "index": 1, + "value": 5000000000 + }, + { + "color": "dark-red", + "index": 2, + "value": 7000000000 + } + ] + }, + "unit": "Bps" + } }, "gridPos": { "h": 9, "w": 12, "x": 0, - "y": 1 - }, - "height": 9, - "id": 3, - "interval": null, - "links": [ ], - "mappingType": 1, - "mappingTypes": [ - { - "name": "value to text", - "value": 1 - }, - { - "name": "range to text", - "value": 2 - } - ], - "maxDataPoints": 100, - "minSpan": 12, - "nullPointMode": "connected", - "nullText": null, - "options": { - "fieldOptions": { - "calcs": [ - "last" - ], - "defaults": { - "max": 10000000000, - "min": 0, - "title": "$namespace: $pod", - "unit": "Bps" - }, - "mappings": [ ], - "override": { }, - "thresholds": [ - { - "color": "dark-green", - "index": 0, - "value": null - }, - { - "color": "dark-yellow", - "index": 1, - "value": 5000000000 - }, - { - "color": "dark-red", - "index": 2, - "value": 7000000000 - } - ], - "values": false - } + "y": 0 }, - "postfix": "", - "postfixFontSize": "50%", - "prefix": "", - "prefixFontSize": "50%", - "rangeMaps": [ - { - "from": "null", - "text": "N/A", - "to": "null" - } - ], - "span": 12, - "sparkline": { - "fillColor": "rgba(31, 118, 189, 0.18)", - "full": false, - "lineColor": "rgb(31, 120, 193)", - "show": false - }, - "tableColumn": "", + "id": 1, + "pluginVersion": "v11.1.0", "targets": [ { - "expr": "sum(irate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\", pod=~\"$pod\"}[$interval:$resolution]))", - "format": "time_series", - "instant": null, - "intervalFactor": 1, - "legendFormat": "", - "refId": "A" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\", pod=~\"$pod\"}[$__rate_interval]))", + "legendFormat": "__auto" } ], - "thresholds": "", - "timeFrom": null, - "timeShift": null, "title": "Current Rate of Bytes Received", - "type": "gauge", - "valueFontSize": "80%", - "valueMaps": [ - { - "op": "=", - "text": "N/A", - "value": "null" - } - ], - "valueName": "current" + "type": "gauge" }, { - "cacheTimeout": null, - "colorBackground": false, - "colorValue": false, - "colors": [ - "#299c46", - "rgba(237, 129, 40, 0.89)", - "#d44a3a" - ], - "datasource": "$datasource", - "decimals": 0, - "format": "time_series", - "gauge": { - "maxValue": 100, - "minValue": 0, - "show": false, - "thresholdLabels": false, - "thresholdMarkers": true + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "displayName": "$pod", + "max": 10000000000, + "min": 0, + "thresholds": { + "steps": [ + { + "color": "dark-green", + "index": 0, + "value": null + }, + { + "color": "dark-yellow", + "index": 1, + "value": 5000000000 + }, + { + "color": "dark-red", + "index": 2, + "value": 7000000000 + } + ] + }, + "unit": "Bps" + } }, "gridPos": { "h": 9, "w": 12, "x": 12, - "y": 1 - }, - "height": 9, - "id": 4, - "interval": null, - "links": [ ], - "mappingType": 1, - "mappingTypes": [ - { - "name": "value to text", - "value": 1 - }, - { - "name": "range to text", - "value": 2 - } - ], - "maxDataPoints": 100, - "minSpan": 12, - "nullPointMode": "connected", - "nullText": null, - "options": { - "fieldOptions": { - "calcs": [ - "last" - ], - "defaults": { - "max": 10000000000, - "min": 0, - "title": "$namespace: $pod", - "unit": "Bps" - }, - "mappings": [ ], - "override": { }, - "thresholds": [ - { - "color": "dark-green", - "index": 0, - "value": null - }, - { - "color": "dark-yellow", - "index": 1, - "value": 5000000000 - }, - { - "color": "dark-red", - "index": 2, - "value": 7000000000 - } - ], - "values": false - } + "y": 0 }, - "postfix": "", - "postfixFontSize": "50%", - "prefix": "", - "prefixFontSize": "50%", - "rangeMaps": [ - { - "from": "null", - "text": "N/A", - "to": "null" - } - ], - "span": 12, - "sparkline": { - "fillColor": "rgba(31, 118, 189, 0.18)", - "full": false, - "lineColor": "rgb(31, 120, 193)", - "show": false - }, - "tableColumn": "", + "id": 2, + "pluginVersion": "v11.1.0", "targets": [ { - "expr": "sum(irate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\", pod=~\"$pod\"}[$interval:$resolution]))", - "format": "time_series", - "instant": null, - "intervalFactor": 1, - "legendFormat": "", - "refId": "A" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\", pod=~\"$pod\"}[$__rate_interval]))", + "legendFormat": "__auto" } ], - "thresholds": "", - "timeFrom": null, - "timeShift": null, "title": "Current Rate of Bytes Transmitted", - "type": "gauge", - "valueFontSize": "80%", - "valueMaps": [ - { - "op": "=", - "text": "N/A", - "value": "null" - } - ], - "valueName": "current" + "type": "gauge" }, { - "collapse": false, - "collapsed": false, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 10 + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "showPoints": "never" + }, + "unit": "binBps" + } }, - "id": 5, - "panels": [ ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Bandwidth", - "titleSize": "h6", - "type": "row" - }, - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, "gridPos": { "h": 9, "w": 12, "x": 0, - "y": 11 + "y": 9 }, - "id": 6, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "id": 3, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { - "expr": "sum(irate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\", pod=~\"$pod\"}[$interval:$resolution])) by (pod)", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\", pod=~\"$pod\"}[$__rate_interval])) by (pod)", + "legendFormat": "__auto" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, "title": "Receive Bandwidth", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "fieldConfig": { + "defaults": { + "custom": { + "showPoints": "never" + }, + "unit": "binBps" + } }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 9 + }, + "id": 4, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\", pod=~\"$pod\"}[$__rate_interval])) by (pod)", + "legendFormat": "__auto" } - ] + ], + "title": "Transmit Bandwidth", + "type": "timeseries" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "showPoints": "never" + }, + "unit": "pps" + } + }, "gridPos": { "h": 9, "w": 12, - "x": 12, - "y": 11 + "x": 0, + "y": 18 }, - "id": 7, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "id": 5, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { - "expr": "sum(irate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\", pod=~\"$pod\"}[$interval:$resolution])) by (pod)", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\", pod=~\"$pod\"}[$__rate_interval])) by (pod)", + "legendFormat": "__auto" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Transmit Bandwidth", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "title": "Rate of Received Packets", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "fieldConfig": { + "defaults": { + "custom": { + "showPoints": "never" + }, + "unit": "pps" + } + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 18 }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true + "id": 6, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sum(rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\", pod=~\"$pod\"}[$__rate_interval])) by (pod)", + "legendFormat": "__auto" } - ] + ], + "title": "Rate of Transmitted Packets", + "type": "timeseries" }, { - "collapse": true, - "collapsed": true, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "showPoints": "never" + }, + "unit": "pps" + } + }, "gridPos": { - "h": 1, - "w": 24, + "h": 9, + "w": 12, "x": 0, - "y": 20 + "y": 27 }, - "id": 8, - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 10, - "w": 12, - "x": 0, - "y": 21 - }, - "id": 9, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sum(irate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\", pod=~\"$pod\"}[$interval:$resolution])) by (pod)", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Received Packets", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "id": 7, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 10, - "w": 12, - "x": 12, - "y": 21 - }, - "id": 10, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sum(irate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\", pod=~\"$pod\"}[$interval:$resolution])) by (pod)", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Transmitted Packets", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "expr": "sum(rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace=~\"$namespace\", pod=~\"$pod\"}[$__rate_interval])) by (pod)", + "legendFormat": "__auto" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Packets", - "titleSize": "h6", - "type": "row" + "title": "Rate of Received Packets Dropped", + "type": "timeseries" }, { - "collapse": true, - "collapsed": true, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 21 + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" }, - "id": 11, - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 10, - "w": 12, - "x": 0, - "y": 32 - }, - "id": 12, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sum(irate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace=~\"$namespace\", pod=~\"$pod\"}[$interval:$resolution])) by (pod)", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Received Packets Dropped", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "fieldConfig": { + "defaults": { + "custom": { + "showPoints": "never" }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "unit": "pps" + } + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 27 + }, + "id": 8, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 10, - "w": 12, - "x": 12, - "y": 32 - }, - "id": 13, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sum(irate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=~\"$namespace\", pod=~\"$pod\"}[$interval:$resolution])) by (pod)", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Transmitted Packets Dropped", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "expr": "sum(rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=~\"$namespace\", pod=~\"$pod\"}[$__rate_interval])) by (pod)", + "legendFormat": "__auto" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Errors", - "titleSize": "h6", - "type": "row" + "title": "Rate of Transmitted Packets Dropped", + "type": "timeseries" } ], "refresh": "10s", - "rows": [ ], - "schemaVersion": 18, - "style": "dark", + "schemaVersion": 39, "tags": [ "kubernetes-mixin", "infrastucture" @@ -59488,199 +56065,70 @@ data: "hide": 0, "label": "Data source", "name": "datasource", - "options": [ ], "query": "prometheus", - "refresh": 1, "regex": "", "type": "datasource" }, { - "allValue": null, - "current": { }, - "datasource": "$datasource", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "hide": 0, - "includeAll": false, - "label": null, - "multi": false, + "label": "cluster", "name": "cluster", - "options": [ ], "query": "label_values(up{job=\"integrations/kubernetes/cadvisor\"}, cluster)", "refresh": 2, - "regex": "", - "sort": 0, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "sort": 1, + "type": "query" }, { "allValue": ".+", - "auto": false, - "auto_count": 30, - "auto_min": "10s", "current": { + "selected": false, "text": "kube-system", "value": "kube-system" }, - "datasource": "$datasource", - "definition": "label_values(container_network_receive_packets_total{cluster=\"$cluster\"}, namespace)", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "hide": 0, "includeAll": true, - "label": null, - "multi": false, + "label": "namespace", "name": "namespace", - "options": [ ], "query": "label_values(container_network_receive_packets_total{cluster=\"$cluster\"}, namespace)", "refresh": 2, - "regex": "", - "skipUrlSync": false, - "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false - }, - { - "allValue": ".+", - "auto": false, - "auto_count": 30, - "auto_min": "10s", - "current": { - "text": "", - "value": "" - }, - "datasource": "$datasource", - "definition": "label_values(container_network_receive_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}, pod)", - "hide": 0, - "includeAll": false, - "label": null, - "multi": false, - "name": "pod", - "options": [ ], - "query": "label_values(container_network_receive_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}, pod)", - "refresh": 2, - "regex": "", - "skipUrlSync": false, - "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false - }, - { - "allValue": null, - "auto": false, - "auto_count": 30, - "auto_min": "10s", - "current": { - "text": "5m", - "value": "5m" - }, - "datasource": "$datasource", - "hide": 0, - "includeAll": false, - "label": null, - "multi": false, - "name": "resolution", - "options": [ - { - "selected": false, - "text": "30s", - "value": "30s" - }, - { - "selected": true, - "text": "5m", - "value": "5m" - }, - { - "selected": false, - "text": "1h", - "value": "1h" - } - ], - "query": "30s,5m,1h", - "refresh": 2, - "regex": "", - "skipUrlSync": false, "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "interval", - "useTags": false + "type": "query" }, { - "allValue": null, - "auto": false, - "auto_count": 30, - "auto_min": "10s", "current": { - "text": "5m", - "value": "5m" - }, - "datasource": "$datasource", - "hide": 2, - "includeAll": false, - "label": null, - "multi": false, - "name": "interval", - "options": [ - { - "selected": true, - "text": "4h", - "value": "4h" - } - ], - "query": "4h", - "refresh": 2, - "regex": "", - "skipUrlSync": false, - "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "interval", - "useTags": false - } - ] - }, - "time": { - "from": "now-1h", - "to": "now" - }, - "timepicker": { - "refresh_intervals": [ - "5s", - "10s", - "30s", - "1m", - "5m", - "15m", - "30m", - "1h", - "2h", - "1d" - ], - "time_options": [ - "5m", - "15m", - "1h", - "6h", - "12h", - "24h", - "2d", - "7d", - "30d" + "selected": false, + "text": "kube-system", + "value": "kube-system" + }, + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "hide": 0, + "label": "pod", + "name": "pod", + "query": "label_values(container_network_receive_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}, pod)", + "refresh": 2, + "sort": 1, + "type": "query" + } ] }, + "time": { + "from": "now-1h", + "to": "now" + }, "timezone": "browser", "title": "Kubernetes / Networking / Pod", - "uid": "7a18067ce943a40ae25454675c19ff5c", - "version": 0 + "uid": "7a18067ce943a40ae25454675c19ff5c" } kind: ConfigMap metadata: @@ -59695,995 +56143,594 @@ apiVersion: v1 data: proxy.json: |- { - "__inputs": [ ], - "__requires": [ ], - "annotations": { - "list": [ ] - }, "editable": false, - "gnetId": null, - "graphTooltip": 0, - "hideControls": false, - "id": null, - "links": [ ], - "refresh": "10s", - "rows": [ + "links": [ { - "collapse": false, - "collapsed": false, - "panels": [ + "asDropdown": true, + "includeVars": true, + "keepTime": true, + "tags": [ + "kubernetes-mixin", + "infrastucture" + ], + "targetBlank": false, + "title": "Kubernetes", + "type": "dashboards" + } + ], + "panels": [ + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "unit": "none" + } + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 0, + "y": 0 + }, + "id": 1, + "interval": "1m", + "options": { + "colorMode": "none" + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "cacheTimeout": null, - "colorBackground": false, - "colorValue": false, - "colors": [ - "#299c46", - "rgba(237, 129, 40, 0.89)", - "#d44a3a" - ], - "datasource": "$datasource", - "format": "none", - "gauge": { - "maxValue": 100, - "minValue": 0, - "show": false, - "thresholdLabels": false, - "thresholdMarkers": true - }, - "gridPos": { }, - "id": 2, - "interval": null, - "links": [ ], - "mappingType": 1, - "mappingTypes": [ - { - "name": "value to text", - "value": 1 - }, - { - "name": "range to text", - "value": 2 - } - ], - "maxDataPoints": 100, - "nullPointMode": "connected", - "nullText": null, - "postfix": "", - "postfixFontSize": "50%", - "prefix": "", - "prefixFontSize": "50%", - "rangeMaps": [ - { - "from": "null", - "text": "N/A", - "to": "null" - } - ], - "span": 2, - "sparkline": { - "fillColor": "rgba(31, 118, 189, 0.18)", - "full": false, - "lineColor": "rgb(31, 120, 193)", - "show": false + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "tableColumn": "", - "targets": [ - { - "expr": "sum(up{cluster=\"$cluster\", job=\"kube-proxy\"})", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "", - "refId": "A" - } - ], - "thresholds": "", - "title": "Up", - "type": "singlestat", - "valueFontSize": "80%", - "valueMaps": [ - { - "op": "=", - "text": "N/A", - "value": "null" - } + "expr": "sum(up{cluster=\"$cluster\", job=\"kube-proxy\"})", + "instant": true + } + ], + "title": "Up", + "type": "stat" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "ops" + } + }, + "gridPos": { + "h": 7, + "w": 10, + "x": 4, + "y": 0 + }, + "id": 2, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "valueName": "min" + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 3, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 5, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "sum(rate(kubeproxy_sync_proxy_rules_duration_seconds_count{cluster=\"$cluster\", job=\"kube-proxy\", instance=~\"$instance\"}[$__rate_interval]))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "rate", - "refId": "A" - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rules Sync Rate", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "sum(rate(kubeproxy_sync_proxy_rules_duration_seconds_count{cluster=\"$cluster\", job=\"kube-proxy\", instance=~\"$instance\"}[$__rate_interval]))", + "legendFormat": "rate" + } + ], + "title": "Rules Sync Rate", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "yaxes": [ - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "unit": "s" + } + }, + "gridPos": { + "h": 7, + "w": 10, + "x": 14, + "y": 0 + }, + "id": 3, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 4, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true - }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 5, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "histogram_quantile(0.99,rate(kubeproxy_sync_proxy_rules_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-proxy\", instance=~\"$instance\"}[$__rate_interval]))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rule Sync Latency 99th Quantile", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "expr": "histogram_quantile(0.99,rate(kubeproxy_sync_proxy_rules_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-proxy\", instance=~\"$instance\"}[$__rate_interval]))", + "legendFormat": "{{instance}}" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": false, - "title": "Dashboard Row", - "titleSize": "h6", - "type": "row" + "title": "Rules Sync Latency 99th Quantile", + "type": "timeseries" }, { - "collapse": false, - "collapsed": false, - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 5, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 6, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "sum(rate(kubeproxy_network_programming_duration_seconds_count{cluster=\"$cluster\", job=\"kube-proxy\", instance=~\"$instance\"}[$__rate_interval]))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "rate", - "refId": "A" - } + "unit": "ops" + } + }, + "gridPos": { + "h": 7, + "w": 12, + "x": 0, + "y": 7 + }, + "id": 4, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Network Programming Rate", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 6, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 6, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "histogram_quantile(0.99, sum(rate(kubeproxy_network_programming_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-proxy\", instance=~\"$instance\"}[$__rate_interval])) by (instance, le))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Network Programming Latency 99th Quantile", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" + "expr": "sum(rate(kubeproxy_network_programming_duration_seconds_count{cluster=\"$cluster\", job=\"kube-proxy\", instance=~\"$instance\"}[$__rate_interval]))", + "legendFormat": "rate" + } + ], + "title": "Network Programming Rate", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "unit": "s" + } + }, + "gridPos": { + "h": 7, + "w": 12, + "x": 12, + "y": 7 + }, + "id": 5, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "expr": "histogram_quantile(0.99, sum(rate(kubeproxy_network_programming_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-proxy\", instance=~\"$instance\"}[$__rate_interval])) by (instance, le))", + "legendFormat": "{{instance}}" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": false, - "title": "Dashboard Row", - "titleSize": "h6", - "type": "row" + "title": "Network Programming Latency 99th Quantile", + "type": "timeseries" }, { - "collapse": false, - "collapsed": false, - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 7, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 4, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\", job=\"kube-proxy\", instance=~\"$instance\",code=~\"2..\"}[$__rate_interval]))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "2xx", - "refId": "A" - }, - { - "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\", job=\"kube-proxy\", instance=~\"$instance\",code=~\"3..\"}[$__rate_interval]))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "3xx", - "refId": "B" - }, - { - "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\", job=\"kube-proxy\", instance=~\"$instance\",code=~\"4..\"}[$__rate_interval]))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "4xx", - "refId": "C" - }, - { - "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\", job=\"kube-proxy\", instance=~\"$instance\",code=~\"5..\"}[$__rate_interval]))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "5xx", - "refId": "D" - } + "unit": "ops" + } + }, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 14 + }, + "id": 6, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Kube API Request Rate", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"kube-proxy\", instance=~\"$instance\",code=~\"2..\"}[$__rate_interval]))", + "legendFormat": "2xx" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 8, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 8, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "histogram_quantile(0.99, sum(rate(rest_client_request_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-proxy\",instance=~\"$instance\",verb=\"POST\"}[$__rate_interval])) by (verb, url, le))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{verb}} {{url}}", - "refId": "A" - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Post Request Latency 99th Quantile", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" + "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"kube-proxy\", instance=~\"$instance\",code=~\"3..\"}[$__rate_interval]))", + "legendFormat": "3xx" + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"kube-proxy\", instance=~\"$instance\",code=~\"4..\"}[$__rate_interval]))", + "legendFormat": "4xx" + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"kube-proxy\", instance=~\"$instance\",code=~\"5..\"}[$__rate_interval]))", + "legendFormat": "5xx" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": false, - "title": "Dashboard Row", - "titleSize": "h6", - "type": "row" + "title": "Kube API Request Rate", + "type": "timeseries" }, { - "collapse": false, - "collapsed": false, - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 9, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "histogram_quantile(0.99, sum(rate(rest_client_request_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-proxy\", instance=~\"$instance\", verb=\"GET\"}[$__rate_interval])) by (verb, url, le))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{verb}} {{url}}", - "refId": "A" - } + "unit": "ops" + } + }, + "gridPos": { + "h": 7, + "w": 16, + "x": 8, + "y": 14 + }, + "id": 7, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Get Request Latency 99th Quantile", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "expr": "histogram_quantile(0.99, sum(rate(rest_client_request_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-proxy\",instance=~\"$instance\",verb=\"POST\"}[$__rate_interval])) by (verb, url, le))", + "legendFormat": "{{verb}} {{url}}" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": false, - "title": "Dashboard Row", - "titleSize": "h6", - "type": "row" + "title": "Post Request Latency 99th Quantile", + "type": "timeseries" }, { - "collapse": false, - "collapsed": false, - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 10, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 4, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "process_resident_memory_bytes{cluster=\"$cluster\", job=\"kube-proxy\",instance=~\"$instance\"}", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" - } + "unit": "s" + } + }, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 21 + }, + "id": 8, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Memory", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "bytes", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "bytes", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 11, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 4, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "rate(process_cpu_seconds_total{cluster=\"$cluster\", job=\"kube-proxy\",instance=~\"$instance\"}[$__rate_interval])", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "CPU usage", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "histogram_quantile(0.99, sum(rate(rest_client_request_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-proxy\", instance=~\"$instance\", verb=\"GET\"}[$__rate_interval])) by (verb, url, le))", + "legendFormat": "{{verb}} {{url}}" + } + ], + "title": "Get Request Latency 99th Quantile", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "yaxes": [ - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "unit": "bytes" + } + }, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 28 + }, + "id": 9, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 12, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 4, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "go_goroutines{cluster=\"$cluster\", job=\"kube-proxy\",instance=~\"$instance\"}", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" - } + "expr": "process_resident_memory_bytes{cluster=\"$cluster\", job=\"kube-proxy\",instance=~\"$instance\"}", + "legendFormat": "{{instance}}" + } + ], + "title": "Memory", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "short" + } + }, + "gridPos": { + "h": 7, + "w": 8, + "x": 8, + "y": 28 + }, + "id": 10, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Goroutines", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "rate(process_cpu_seconds_total{cluster=\"$cluster\", job=\"kube-proxy\",instance=~\"$instance\"}[$__rate_interval])", + "legendFormat": "{{instance}}" + } + ], + "title": "CPU usage", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "yaxes": [ - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "unit": "short" + } + }, + "gridPos": { + "h": 7, + "w": 8, + "x": 16, + "y": 28 + }, + "id": 11, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "go_goroutines{cluster=\"$cluster\", job=\"kube-proxy\",instance=~\"$instance\"}", + "legendFormat": "{{instance}}" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": false, - "title": "Dashboard Row", - "titleSize": "h6", - "type": "row" + "title": "Goroutines", + "type": "timeseries" } ], - "schemaVersion": 14, - "style": "dark", + "refresh": "10s", + "schemaVersion": 39, "tags": [ "kubernetes-mixin", "infrastucture" @@ -60699,51 +56746,36 @@ data: "hide": 0, "label": "Data source", "name": "datasource", - "options": [ ], "query": "prometheus", - "refresh": 1, "regex": "", "type": "datasource" }, { - "allValue": null, - "current": { }, - "datasource": "$datasource", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "hide": 0, - "includeAll": false, "label": "cluster", - "multi": false, "name": "cluster", - "options": [ ], "query": "label_values(up{job=\"kube-proxy\"}, cluster)", "refresh": 2, - "regex": "", "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "type": "query" }, { - "allValue": null, - "current": { }, - "datasource": "$datasource", + "allValue": ".+", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "hide": 0, "includeAll": true, - "label": null, - "multi": false, + "label": "instance", "name": "instance", - "options": [ ], "query": "label_values(up{job=\"kube-proxy\", cluster=\"$cluster\", job=\"kube-proxy\"}, instance)", "refresh": 2, - "regex": "", - "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "type": "query" } ] }, @@ -60751,35 +56783,9 @@ data: "from": "now-1h", "to": "now" }, - "timepicker": { - "refresh_intervals": [ - "5s", - "10s", - "30s", - "1m", - "5m", - "15m", - "30m", - "1h", - "2h", - "1d" - ], - "time_options": [ - "5m", - "15m", - "1h", - "6h", - "12h", - "24h", - "2d", - "7d", - "30d" - ] - }, "timezone": "browser", "title": "Kubernetes / Proxy", - "uid": "632e265de029684c40b21cb76bca4f94", - "version": 0 + "uid": "632e265de029684c40b21cb76bca4f94" } kind: ConfigMap metadata: @@ -60794,862 +56800,540 @@ apiVersion: v1 data: scheduler.json: |- { - "__inputs": [ ], - "__requires": [ ], - "annotations": { - "list": [ ] - }, "editable": false, - "gnetId": null, - "graphTooltip": 0, - "hideControls": false, - "id": null, - "links": [ ], - "refresh": "10s", - "rows": [ + "links": [ { - "collapse": false, - "collapsed": false, - "panels": [ + "asDropdown": true, + "includeVars": true, + "keepTime": true, + "tags": [ + "kubernetes-mixin", + "infrastucture" + ], + "targetBlank": false, + "title": "Kubernetes", + "type": "dashboards" + } + ], + "panels": [ + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "unit": "none" + } + }, + "gridPos": { + "h": 7, + "w": 4, + "x": 0, + "y": 0 + }, + "id": 1, + "interval": "1m", + "options": { + "colorMode": "none" + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "cacheTimeout": null, - "colorBackground": false, - "colorValue": false, - "colors": [ - "#299c46", - "rgba(237, 129, 40, 0.89)", - "#d44a3a" - ], - "datasource": "$datasource", - "format": "none", - "gauge": { - "maxValue": 100, - "minValue": 0, - "show": false, - "thresholdLabels": false, - "thresholdMarkers": true - }, - "gridPos": { }, - "id": 2, - "interval": null, - "links": [ ], - "mappingType": 1, - "mappingTypes": [ - { - "name": "value to text", - "value": 1 - }, - { - "name": "range to text", - "value": 2 - } - ], - "maxDataPoints": 100, - "nullPointMode": "connected", - "nullText": null, - "postfix": "", - "postfixFontSize": "50%", - "prefix": "", - "prefixFontSize": "50%", - "rangeMaps": [ - { - "from": "null", - "text": "N/A", - "to": "null" - } - ], - "span": 2, - "sparkline": { - "fillColor": "rgba(31, 118, 189, 0.18)", - "full": false, - "lineColor": "rgb(31, 120, 193)", - "show": false + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "tableColumn": "", - "targets": [ - { - "expr": "sum(up{cluster=\"$cluster\", job=\"kube-scheduler\"})", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "", - "refId": "A" - } - ], - "thresholds": "", - "title": "Up", - "type": "singlestat", - "valueFontSize": "80%", - "valueMaps": [ - { - "op": "=", - "text": "N/A", - "value": "null" - } + "expr": "sum(up{cluster=\"$cluster\", job=\"kube-scheduler\"})", + "instant": true + } + ], + "title": "Up", + "type": "stat" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "ops" + } + }, + "gridPos": { + "h": 7, + "w": 10, + "x": 4, + "y": 0 + }, + "id": 2, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "valueName": "min" + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 3, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 5, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "sum(rate(scheduler_e2e_scheduling_duration_seconds_count{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\"}[$__rate_interval])) by (cluster, instance)", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{cluster}} {{instance}} e2e", - "refId": "A" - }, - { - "expr": "sum(rate(scheduler_binding_duration_seconds_count{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\"}[$__rate_interval])) by (cluster, instance)", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{cluster}} {{instance}} binding", - "refId": "B" - }, - { - "expr": "sum(rate(scheduler_scheduling_algorithm_duration_seconds_count{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\"}[$__rate_interval])) by (cluster, instance)", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{cluster}} {{instance}} scheduling algorithm", - "refId": "C" - }, - { - "expr": "sum(rate(scheduler_volume_scheduling_duration_seconds_count{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\"}[$__rate_interval])) by (cluster, instance)", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{cluster}} {{instance}} volume", - "refId": "D" - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Scheduling Rate", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" + "expr": "sum(rate(scheduler_e2e_scheduling_duration_seconds_count{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\"}[$__rate_interval])) by (cluster, instance)", + "legendFormat": "{{cluster}} {{instance}} e2e" + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "sum(rate(scheduler_binding_duration_seconds_count{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\"}[$__rate_interval])) by (cluster, instance)", + "legendFormat": "{{cluster}} {{instance}} binding" + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "expr": "sum(rate(scheduler_scheduling_algorithm_duration_seconds_count{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\"}[$__rate_interval])) by (cluster, instance)", + "legendFormat": "{{cluster}} {{instance}} scheduling algorithm" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 4, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 5, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "histogram_quantile(0.99, sum(rate(scheduler_e2e_scheduling_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-scheduler\",instance=~\"$instance\"}[$__rate_interval])) by (cluster, instance, le))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{cluster}} {{instance}} e2e", - "refId": "A" - }, - { - "expr": "histogram_quantile(0.99, sum(rate(scheduler_binding_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-scheduler\",instance=~\"$instance\"}[$__rate_interval])) by (cluster, instance, le))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{cluster}} {{instance}} binding", - "refId": "B" - }, - { - "expr": "histogram_quantile(0.99, sum(rate(scheduler_scheduling_algorithm_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-scheduler\",instance=~\"$instance\"}[$__rate_interval])) by (cluster, instance, le))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{cluster}} {{instance}} scheduling algorithm", - "refId": "C" - }, - { - "expr": "histogram_quantile(0.99, sum(rate(scheduler_volume_scheduling_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-scheduler\",instance=~\"$instance\"}[$__rate_interval])) by (cluster, instance, le))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{cluster}} {{instance}} volume", - "refId": "D" - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Scheduling latency 99th Quantile", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" + "expr": "sum(rate(scheduler_volume_scheduling_duration_seconds_count{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\"}[$__rate_interval])) by (cluster, instance)", + "legendFormat": "{{cluster}} {{instance}} volume" + } + ], + "title": "Scheduling Rate", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "s" + } + }, + "gridPos": { + "h": 7, + "w": 10, + "x": 14, + "y": 0 + }, + "id": 3, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "histogram_quantile(0.99, sum(rate(scheduler_e2e_scheduling_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-scheduler\",instance=~\"$instance\"}[$__rate_interval])) by (cluster, instance, le))", + "legendFormat": "{{cluster}} {{instance}} e2e" + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "expr": "histogram_quantile(0.99, sum(rate(scheduler_binding_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-scheduler\",instance=~\"$instance\"}[$__rate_interval])) by (cluster, instance, le))", + "legendFormat": "{{cluster}} {{instance}} binding" + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "histogram_quantile(0.99, sum(rate(scheduler_scheduling_algorithm_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-scheduler\",instance=~\"$instance\"}[$__rate_interval])) by (cluster, instance, le))", + "legendFormat": "{{cluster}} {{instance}} scheduling algorithm" + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "histogram_quantile(0.99, sum(rate(scheduler_volume_scheduling_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-scheduler\",instance=~\"$instance\"}[$__rate_interval])) by (cluster, instance, le))", + "legendFormat": "{{cluster}} {{instance}} volume" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": false, - "title": "Dashboard Row", - "titleSize": "h6", - "type": "row" + "title": "Scheduling latency 99th Quantile", + "type": "timeseries" }, { - "collapse": false, - "collapsed": false, - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 5, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 4, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\",code=~\"2..\"}[$__rate_interval]))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "2xx", - "refId": "A" - }, - { - "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\",code=~\"3..\"}[$__rate_interval]))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "3xx", - "refId": "B" - }, - { - "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\",code=~\"4..\"}[$__rate_interval]))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "4xx", - "refId": "C" - }, - { - "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\",code=~\"5..\"}[$__rate_interval]))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "5xx", - "refId": "D" - } + "unit": "ops" + } + }, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 7 + }, + "id": 4, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Kube API Request Rate", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "ops", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\",code=~\"2..\"}[$__rate_interval]))", + "legendFormat": "2xx" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 6, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 8, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "histogram_quantile(0.99, sum(rate(rest_client_request_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\", verb=\"POST\"}[$__rate_interval])) by (verb, url, le))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{verb}} {{url}}", - "refId": "A" - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Post Request Latency 99th Quantile", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" + "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\",code=~\"3..\"}[$__rate_interval]))", + "legendFormat": "3xx" + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\",code=~\"4..\"}[$__rate_interval]))", + "legendFormat": "4xx" + }, + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\",code=~\"5..\"}[$__rate_interval]))", + "legendFormat": "5xx" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": false, - "title": "Dashboard Row", - "titleSize": "h6", - "type": "row" + "title": "Kube API Request Rate", + "type": "timeseries" }, { - "collapse": false, - "collapsed": false, - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 7, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "total": false, - "values": true + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "histogram_quantile(0.99, sum(rate(rest_client_request_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\", verb=\"GET\"}[$__rate_interval])) by (verb, url, le))", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{verb}} {{url}}", - "refId": "A" - } + "unit": "ops" + } + }, + "gridPos": { + "h": 7, + "w": 16, + "x": 8, + "y": 7 + }, + "id": 5, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Get Request Latency 99th Quantile", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "s", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "expr": "histogram_quantile(0.99, sum(rate(rest_client_request_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\", verb=\"POST\"}[$__rate_interval])) by (verb, url, le))", + "legendFormat": "{{verb}} {{url}}" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": false, - "title": "Dashboard Row", - "titleSize": "h6", - "type": "row" + "title": "Post Request Latency 99th Quantile", + "type": "timeseries" }, { - "collapse": false, - "collapsed": false, - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 8, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 4, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "process_resident_memory_bytes{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\"}", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" - } + "unit": "s" + } + }, + "gridPos": { + "h": 7, + "w": 24, + "x": 0, + "y": 14 + }, + "id": 6, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Memory", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "bytes", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "bytes", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 9, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 4, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "rate(process_cpu_seconds_total{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\"}[$__rate_interval])", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" - } + "expr": "histogram_quantile(0.99, sum(rate(rest_client_request_duration_seconds_bucket{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\", verb=\"GET\"}[$__rate_interval])) by (verb, url, le))", + "legendFormat": "{{verb}} {{url}}" + } + ], + "title": "Get Request Latency 99th Quantile", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "bytes" + } + }, + "gridPos": { + "h": 7, + "w": 8, + "x": 0, + "y": 21 + }, + "id": 7, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "CPU usage", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "process_resident_memory_bytes{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\"}", + "legendFormat": "{{instance}}" + } + ], + "title": "Memory", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "yaxes": [ - { - "format": "bytes", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "bytes", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "unit": "short" + } + }, + "gridPos": { + "h": 7, + "w": 8, + "x": 8, + "y": 21 + }, + "id": 8, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 1, - "fillGradient": 0, - "gridPos": { }, - "id": 10, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "lines": true, - "linewidth": 1, - "links": [ ], - "nullPointMode": "null", - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 4, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "go_goroutines{cluster=\"$cluster\", job=\"kube-scheduler\",instance=~\"$instance\"}", - "format": "time_series", - "intervalFactor": 2, - "legendFormat": "{{instance}}", - "refId": "A" - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Goroutines", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" + "expr": "rate(process_cpu_seconds_total{cluster=\"$cluster\", job=\"kube-scheduler\", instance=~\"$instance\"}[$__rate_interval])", + "legendFormat": "{{instance}}" + } + ], + "title": "CPU usage", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "unit": "short" + } + }, + "gridPos": { + "h": 7, + "w": 8, + "x": 16, + "y": 21 + }, + "id": 9, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": true - } - ] + "expr": "go_goroutines{cluster=\"$cluster\", job=\"kube-scheduler\",instance=~\"$instance\"}", + "legendFormat": "{{instance}}" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": false, - "title": "Dashboard Row", - "titleSize": "h6", - "type": "row" + "title": "Goroutines", + "type": "timeseries" } ], - "schemaVersion": 14, - "style": "dark", + "refresh": "10s", + "schemaVersion": 39, "tags": [ "kubernetes-mixin", "infrastucture" @@ -61665,51 +57349,36 @@ data: "hide": 0, "label": "Data source", "name": "datasource", - "options": [ ], "query": "prometheus", - "refresh": 1, "regex": "", "type": "datasource" }, { - "allValue": null, - "current": { }, - "datasource": "$datasource", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "hide": 0, - "includeAll": false, "label": "cluster", - "multi": false, "name": "cluster", - "options": [ ], "query": "label_values(up{job=\"kube-scheduler\"}, cluster)", "refresh": 2, - "regex": "", "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "type": "query" }, { - "allValue": null, - "current": { }, - "datasource": "$datasource", + "allValue": ".+", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "hide": 0, "includeAll": true, - "label": null, - "multi": false, + "label": "instance", "name": "instance", - "options": [ ], "query": "label_values(up{job=\"kube-scheduler\", cluster=\"$cluster\"}, instance)", "refresh": 2, - "regex": "", - "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "type": "query" } ] }, @@ -61717,35 +57386,9 @@ data: "from": "now-1h", "to": "now" }, - "timepicker": { - "refresh_intervals": [ - "5s", - "10s", - "30s", - "1m", - "5m", - "15m", - "30m", - "1h", - "2h", - "1d" - ], - "time_options": [ - "5m", - "15m", - "1h", - "6h", - "12h", - "24h", - "2d", - "7d", - "30d" - ] - }, "timezone": "browser", "title": "Kubernetes / Scheduler", - "uid": "2e6b6a3b4bddf1427b3a55aa1311c656", - "version": 0 + "uid": "2e6b6a3b4bddf1427b3a55aa1311c656" } kind: ConfigMap metadata: @@ -61760,1057 +57403,487 @@ apiVersion: v1 data: workload-total.json: |- { - "__inputs": [ ], - "__requires": [ ], - "annotations": { - "list": [ - { - "builtIn": 1, - "datasource": "-- Grafana --", - "enable": true, - "hide": true, - "iconColor": "rgba(0, 211, 255, 1)", - "name": "Annotations & Alerts", - "type": "dashboard" - } - ] - }, - "editable": true, - "gnetId": null, - "graphTooltip": 0, - "hideControls": false, - "id": null, - "links": [ ], - "panels": [ - { - "collapse": false, - "collapsed": false, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 0 - }, - "id": 2, - "panels": [ ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Current Bandwidth", - "titleSize": "h6", - "type": "row" - }, - { - "aliasColors": { }, - "bars": true, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 9, - "w": 12, - "x": 0, - "y": 1 - }, - "id": 3, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "sort": "current", - "sortDesc": true, - "total": false, - "values": true - }, - "lines": false, - "linewidth": 1, - "links": [ ], - "minSpan": 24, - "nullPointMode": "null", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 24, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "sort_desc(sum(irate(container_network_receive_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{ pod }}", - "refId": "A", - "step": 10 - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Current Rate of Bytes Received", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "series", - "name": null, - "show": false, - "values": [ - "current" - ] - }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] - }, - { - "aliasColors": { }, - "bars": true, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 9, - "w": 12, - "x": 12, - "y": 1 - }, - "id": 4, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "sort": "current", - "sortDesc": true, - "total": false, - "values": true - }, - "lines": false, - "linewidth": 1, - "links": [ ], - "minSpan": 24, - "nullPointMode": "null", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 24, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "sort_desc(sum(irate(container_network_transmit_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{ pod }}", - "refId": "A", - "step": 10 - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Current Rate of Bytes Transmitted", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "series", - "name": null, - "show": false, - "values": [ - "current" - ] - }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] - }, + "editable": false, + "links": [ { - "collapse": true, - "collapsed": true, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 10 - }, - "id": 5, - "panels": [ - { - "aliasColors": { }, - "bars": true, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 9, - "w": 12, - "x": 0, - "y": 11 - }, - "id": 6, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "sort": "current", - "sortDesc": true, - "total": false, - "values": true - }, - "lines": false, - "linewidth": 1, - "links": [ ], - "minSpan": 24, - "nullPointMode": "null", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 24, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "sort_desc(avg(irate(container_network_receive_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{ pod }}", - "refId": "A", - "step": 10 - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Average Rate of Bytes Received", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "series", - "name": null, - "show": false, - "values": [ - "current" - ] + "asDropdown": true, + "includeVars": true, + "keepTime": true, + "tags": [ + "kubernetes-mixin", + "infrastucture" + ], + "targetBlank": false, + "title": "Kubernetes", + "type": "dashboards" + } + ], + "panels": [ + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "color": { + "fixedColor": "green", + "mode": "fixed" }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] - }, + "unit": "Bps" + } + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 0, + "y": 0 + }, + "id": 1, + "options": { + "displayMode": "basic", + "showUnfilled": false + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": true, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 9, - "w": 12, - "x": 12, - "y": 11 - }, - "id": 7, - "legend": { - "alignAsTable": true, - "avg": false, - "current": true, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": true, - "show": true, - "sideWidth": null, - "sort": "current", - "sortDesc": true, - "total": false, - "values": true - }, - "lines": false, - "linewidth": 1, - "links": [ ], - "minSpan": 24, - "nullPointMode": "null", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 24, - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "sort_desc(avg(irate(container_network_transmit_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{ pod }}", - "refId": "A", - "step": 10 - } - ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Average Rate of Bytes Transmitted", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "series", - "name": null, - "show": false, - "values": [ - "current" - ] + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "expr": "sort_desc(sum(rate(container_network_receive_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", + "legendFormat": "__auto" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Average Bandwidth", - "titleSize": "h6", - "type": "row" + "title": "Current Rate of Bytes Received", + "type": "bargauge" }, { - "collapse": false, - "collapsed": false, - "gridPos": { - "h": 1, - "w": 24, - "x": 0, - "y": 11 + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "color": { + "fixedColor": "green", + "mode": "fixed" + }, + "unit": "Bps" + } }, - "id": 8, - "panels": [ ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Bandwidth HIstory", - "titleSize": "h6", - "type": "row" - }, - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, "gridPos": { "h": 9, "w": 12, - "x": 0, - "y": 12 + "x": 12, + "y": 0 }, - "id": 9, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "id": 2, + "options": { + "displayMode": "basic", + "showUnfilled": false }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { - "expr": "sort_desc(sum(irate(container_network_receive_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sort_desc(sum(rate(container_network_transmit_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", + "legendFormat": "__auto" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Receive Bandwidth", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "title": "Current Rate of Bytes Transmitted", + "type": "bargauge" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "fieldConfig": { + "defaults": { + "color": { + "fixedColor": "green", + "mode": "fixed" + }, + "unit": "Bps" + } }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, + "gridPos": { + "h": 9, + "w": 12, + "x": 0, + "y": 9 + }, + "id": 3, + "options": { + "displayMode": "basic", + "showUnfilled": false + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sort_desc(avg(rate(container_network_receive_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", + "legendFormat": "__auto" } - ] + ], + "title": "Average Rate of Bytes Received", + "type": "bargauge" }, { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "color": { + "fixedColor": "green", + "mode": "fixed" + }, + "unit": "Bps" + } + }, "gridPos": { "h": 9, "w": 12, "x": 12, - "y": 12 + "y": 9 }, - "id": 10, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "id": 4, + "options": { + "displayMode": "basic", + "showUnfilled": false }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, + "pluginVersion": "v11.1.0", "targets": [ { - "expr": "sort_desc(sum(irate(container_network_transmit_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sort_desc(avg(rate(container_network_transmit_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", + "legendFormat": "__auto" } ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Transmit Bandwidth", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "Bps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "title": "Average Rate of Bytes Transmitted", + "type": "bargauge" }, { - "collapse": true, - "collapsed": true, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "binBps" + } + }, "gridPos": { - "h": 1, - "w": 24, + "h": 9, + "w": 12, "x": 0, - "y": 21 + "y": 18 }, - "id": 11, - "panels": [ - { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 9, - "w": 12, - "x": 0, - "y": 22 - }, - "id": 12, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sort_desc(sum(irate(container_network_receive_packets_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 - } + "id": 5, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Received Packets", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 9, - "w": 12, - "x": 12, - "y": 22 + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "id": 13, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "expr": "sort_desc(sum(rate(container_network_receive_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", + "legendFormat": "__auto" + } + ], + "title": "Receive Bandwidth", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sort_desc(sum(irate(container_network_transmit_packets_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 - } + "unit": "binBps" + } + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 18 + }, + "id": 6, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Transmitted Packets", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] - }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, + "expr": "sort_desc(sum(rate(container_network_transmit_bytes_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", + "legendFormat": "__auto" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Packets", - "titleSize": "h6", - "type": "row" + "title": "Transmit Bandwidth", + "type": "timeseries" }, { - "collapse": true, - "collapsed": true, + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true + }, + "unit": "pps" + } + }, "gridPos": { - "h": 1, - "w": 24, + "h": 9, + "w": 12, "x": 0, - "y": 22 + "y": 27 }, - "id": 14, - "panels": [ + "id": 7, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 9, - "w": 12, - "x": 0, - "y": 23 + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "id": 15, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "expr": "sort_desc(sum(rate(container_network_receive_packets_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", + "legendFormat": "__auto" + } + ], + "title": "Rate of Received Packets", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sort_desc(sum(irate(container_network_receive_packets_dropped_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 - } + "unit": "pps" + } + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 27 + }, + "id": 8, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Received Packets Dropped", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "expr": "sort_desc(sum(rate(container_network_transmit_packets_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", + "legendFormat": "__auto" + } + ], + "title": "Rate of Transmitted Packets", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "unit": "pps" + } + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 0, + "y": 36 + }, + "id": 9, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" + ], + "displayMode": "table", + "placement": "right", + "showLegend": true }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ { - "aliasColors": { }, - "bars": false, - "dashLength": 10, - "dashes": false, - "datasource": "$datasource", - "fill": 2, - "fillGradient": 0, - "gridPos": { - "h": 9, - "w": 12, - "x": 12, - "y": 23 + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "id": 16, - "legend": { - "alignAsTable": false, - "avg": false, - "current": false, - "hideEmpty": true, - "hideZero": true, - "max": false, - "min": false, - "rightSide": false, - "show": true, - "sideWidth": null, - "total": false, - "values": false + "expr": "sort_desc(sum(rate(container_network_receive_packets_dropped_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", + "legendFormat": "__auto" + } + ], + "title": "Rate of Received Packets Dropped", + "type": "timeseries" + }, + { + "datasource": { + "type": "datasource", + "uid": "-- Mixed --" + }, + "fieldConfig": { + "defaults": { + "custom": { + "fillOpacity": 10, + "showPoints": "never", + "spanNulls": true }, - "lines": true, - "linewidth": 2, - "links": [ ], - "minSpan": 12, - "nullPointMode": "connected", - "paceLength": 10, - "percentage": false, - "pointradius": 5, - "points": false, - "renderer": "flot", - "repeat": null, - "seriesOverrides": [ ], - "spaceLength": 10, - "span": 12, - "stack": true, - "steppedLine": false, - "targets": [ - { - "expr": "sort_desc(sum(irate(container_network_transmit_packets_dropped_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$interval:$resolution])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", - "format": "time_series", - "intervalFactor": 1, - "legendFormat": "{{pod}}", - "refId": "A", - "step": 10 - } + "unit": "pps" + } + }, + "gridPos": { + "h": 9, + "w": 12, + "x": 12, + "y": 36 + }, + "id": 10, + "interval": "1m", + "options": { + "legend": { + "asTable": true, + "calcs": [ + "lastNotNull" ], - "thresholds": [ ], - "timeFrom": null, - "timeShift": null, - "title": "Rate of Transmitted Packets Dropped", - "tooltip": { - "shared": true, - "sort": 2, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [ ] + "displayMode": "table", + "placement": "right", + "showLegend": true + }, + "tooltip": { + "mode": "single" + } + }, + "pluginVersion": "v11.1.0", + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "yaxes": [ - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - }, - { - "format": "pps", - "label": null, - "logBase": 1, - "max": null, - "min": 0, - "show": true - } - ] + "expr": "sort_desc(sum(rate(container_network_transmit_packets_dropped_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\", workload_type=~\"$type\"}) by (pod))\n", + "legendFormat": "__auto" } ], - "repeat": null, - "repeatIteration": null, - "repeatRowId": null, - "showTitle": true, - "title": "Errors", - "titleSize": "h6", - "type": "row" + "title": "Rate of Transmitted Packets Dropped", + "type": "timeseries" } ], "refresh": "10s", - "rows": [ ], - "schemaVersion": 18, - "style": "dark", + "schemaVersion": 39, "tags": [ "kubernetes-mixin", "infrastucture" @@ -62826,191 +57899,70 @@ data: "hide": 0, "label": "Data source", "name": "datasource", - "options": [ ], "query": "prometheus", - "refresh": 1, "regex": "", "type": "datasource" }, { - "allValue": null, - "current": { }, - "datasource": "$datasource", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "hide": 0, - "includeAll": false, - "label": null, - "multi": false, + "label": "cluster", "name": "cluster", - "options": [ ], "query": "label_values(kube_pod_info{job=\"integrations/kubernetes/kube-state-metrics\"}, cluster)", "refresh": 2, - "regex": "", - "sort": 0, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "sort": 1, + "type": "query" }, { "allValue": ".+", - "auto": false, - "auto_count": 30, - "auto_min": "10s", "current": { + "selected": false, "text": "kube-system", "value": "kube-system" }, - "datasource": "$datasource", - "definition": "label_values(container_network_receive_packets_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\"}, namespace)", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" + }, "hide": 0, "includeAll": true, - "label": null, - "multi": false, + "label": "namespace", "name": "namespace", - "options": [ ], - "query": "label_values(container_network_receive_packets_total{job=\"integrations/kubernetes/cadvisor\", cluster=\"$cluster\"}, namespace)", + "query": "label_values(container_network_receive_packets_total{cluster=\"$cluster\"}, namespace)", "refresh": 2, - "regex": "", - "skipUrlSync": false, "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "type": "query" }, { - "allValue": null, - "auto": false, - "auto_count": 30, - "auto_min": "10s", - "current": { - "text": "", - "value": "" + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "datasource": "$datasource", - "definition": "label_values(namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\"}, workload)", "hide": 0, - "includeAll": false, - "label": null, - "multi": false, + "label": "workload", "name": "workload", - "options": [ ], - "query": "label_values(namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\"}, workload)", + "query": "label_values(namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=~\"$namespace\", workload=~\".+\"}, workload)", "refresh": 2, - "regex": "", - "skipUrlSync": false, "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false + "type": "query" }, { - "allValue": null, - "auto": false, - "auto_count": 30, - "auto_min": "10s", - "current": { - "text": "", - "value": "" + "allValue": ".+", + "datasource": { + "type": "prometheus", + "uid": "${datasource}" }, - "datasource": "$datasource", - "definition": "label_values(namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\"}, workload_type)", "hide": 0, "includeAll": true, - "label": null, - "multi": false, + "label": "workload_type", "name": "type", - "options": [ ], - "query": "label_values(namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=~\"$namespace\", workload=~\"$workload\"}, workload_type)", - "refresh": 2, - "regex": "", - "skipUrlSync": false, - "sort": 0, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "query", - "useTags": false - }, - { - "allValue": null, - "auto": false, - "auto_count": 30, - "auto_min": "10s", - "current": { - "text": "5m", - "value": "5m" - }, - "datasource": "$datasource", - "hide": 0, - "includeAll": false, - "label": null, - "multi": false, - "name": "resolution", - "options": [ - { - "selected": false, - "text": "30s", - "value": "30s" - }, - { - "selected": true, - "text": "5m", - "value": "5m" - }, - { - "selected": false, - "text": "1h", - "value": "1h" - } - ], - "query": "30s,5m,1h", - "refresh": 2, - "regex": "", - "skipUrlSync": false, - "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "interval", - "useTags": false - }, - { - "allValue": null, - "auto": false, - "auto_count": 30, - "auto_min": "10s", - "current": { - "text": "5m", - "value": "5m" - }, - "datasource": "$datasource", - "hide": 2, - "includeAll": false, - "label": null, - "multi": false, - "name": "interval", - "options": [ - { - "selected": true, - "text": "4h", - "value": "4h" - } - ], - "query": "4h", + "query": "label_values(namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\", namespace=~\"$namespace\", workload=~\"$workload\"}, workload_type)", "refresh": 2, - "regex": "", - "skipUrlSync": false, "sort": 1, - "tagValuesQuery": "", - "tags": [ ], - "tagsQuery": "", - "type": "interval", - "useTags": false + "type": "query" } ] }, @@ -63018,35 +57970,9 @@ data: "from": "now-1h", "to": "now" }, - "timepicker": { - "refresh_intervals": [ - "5s", - "10s", - "30s", - "1m", - "5m", - "15m", - "30m", - "1h", - "2h", - "1d" - ], - "time_options": [ - "5m", - "15m", - "1h", - "6h", - "12h", - "24h", - "2d", - "7d", - "30d" - ] - }, "timezone": "browser", "title": "Kubernetes / Networking / Workload", - "uid": "728bf77cc1166d2f3133bf25846876cc", - "version": 0 + "uid": "728bf77cc1166d2f3133bf25846876cc" } kind: ConfigMap metadata: @@ -63180,7 +58106,7 @@ spec: summary: StatefulSet update has not been rolled out. expr: | ( - max without (revision) ( + max by(namespace, statefulset, job, cluster) ( kube_statefulset_status_current_revision{job="integrations/kubernetes/kube-state-metrics"} unless kube_statefulset_status_update_revision{job="integrations/kubernetes/kube-state-metrics"} @@ -63202,7 +58128,7 @@ spec: - alert: KubeDaemonSetRolloutStuck annotations: description: DaemonSet {{ $labels.namespace }}/{{ $labels.daemonset }} has - not finished or progressed for at least 15 minutes. + not finished or progressed for at least 15m. runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubedaemonsetrolloutstuck summary: DaemonSet rollout is stuck. expr: | @@ -63234,13 +58160,13 @@ spec: severity: warning - alert: KubeContainerWaiting annotations: - description: pod/{{ $labels.pod }} in namespace {{ $labels.namespace }} on + description: 'pod/{{ $labels.pod }} in namespace {{ $labels.namespace }} on container {{ $labels.container}} has been in waiting state for longer than - 1 hour. + 1 hour. (reason: "{{ $labels.reason }}").' runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubecontainerwaiting summary: Pod container waiting longer than 1 hour expr: | - sum by (namespace, pod, container, cluster) (kube_pod_container_status_waiting_reason{job="integrations/kubernetes/kube-state-metrics"}) > 0 + kube_pod_container_status_waiting_reason{reason!="CrashLoopBackOff", job="integrations/kubernetes/kube-state-metrics"} > 0 for: 1h labels: severity: warning @@ -63336,7 +58262,7 @@ spec: runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubecpuovercommit summary: Cluster has overcommitted CPU resource requests. expr: | - sum(namespace_cpu:kube_pod_container_resource_requests:sum{job="integrations/kubernetes/kube-state-metrics",}) by (cluster) - (sum(kube_node_status_allocatable{job="integrations/kubernetes/kube-state-metrics",resource="cpu"}) by (cluster) - max(kube_node_status_allocatable{job="integrations/kubernetes/kube-state-metrics",resource="cpu"}) by (cluster)) > 0 + sum(namespace_cpu:kube_pod_container_resource_requests:sum{}) by (cluster) - (sum(kube_node_status_allocatable{job="integrations/kubernetes/kube-state-metrics",resource="cpu"}) by (cluster) - max(kube_node_status_allocatable{job="integrations/kubernetes/kube-state-metrics",resource="cpu"}) by (cluster)) > 0 and (sum(kube_node_status_allocatable{job="integrations/kubernetes/kube-state-metrics",resource="cpu"}) by (cluster) - max(kube_node_status_allocatable{job="integrations/kubernetes/kube-state-metrics",resource="cpu"}) by (cluster)) > 0 for: 10m @@ -63434,9 +58360,9 @@ spec: runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-cputhrottlinghigh summary: Processes experience elevated CPU throttling. expr: | - sum(increase(container_cpu_cfs_throttled_periods_total{container!="", }[5m])) by (cluster, container, pod, namespace) + sum(increase(container_cpu_cfs_throttled_periods_total{container!="", job="integrations/kubernetes/cadvisor", }[5m])) without (id, metrics_path, name, image, endpoint, job, node) / - sum(increase(container_cpu_cfs_periods_total{}[5m])) by (cluster, container, pod, namespace) + sum(increase(container_cpu_cfs_periods_total{job="integrations/kubernetes/cadvisor", }[5m])) without (id, metrics_path, name, image, endpoint, job, node) > ( 25 / 100 ) for: 15m labels: @@ -63585,9 +58511,9 @@ spec: runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubeapierrorbudgetburn summary: The API server is burning too much error budget. expr: | - sum(apiserver_request:burnrate1h) > (14.40 * 0.01000) - and - sum(apiserver_request:burnrate5m) > (14.40 * 0.01000) + sum by(cluster) (apiserver_request:burnrate1h) > (14.40 * 0.01000) + and on(cluster) + sum by(cluster) (apiserver_request:burnrate5m) > (14.40 * 0.01000) for: 2m labels: long: 1h @@ -63599,9 +58525,9 @@ spec: runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubeapierrorbudgetburn summary: The API server is burning too much error budget. expr: | - sum(apiserver_request:burnrate6h) > (6.00 * 0.01000) - and - sum(apiserver_request:burnrate30m) > (6.00 * 0.01000) + sum by(cluster) (apiserver_request:burnrate6h) > (6.00 * 0.01000) + and on(cluster) + sum by(cluster) (apiserver_request:burnrate30m) > (6.00 * 0.01000) for: 15m labels: long: 6h @@ -63613,9 +58539,9 @@ spec: runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubeapierrorbudgetburn summary: The API server is burning too much error budget. expr: | - sum(apiserver_request:burnrate1d) > (3.00 * 0.01000) - and - sum(apiserver_request:burnrate2h) > (3.00 * 0.01000) + sum by(cluster) (apiserver_request:burnrate1d) > (3.00 * 0.01000) + and on(cluster) + sum by(cluster) (apiserver_request:burnrate2h) > (3.00 * 0.01000) for: 1h labels: long: 1d @@ -63627,9 +58553,9 @@ spec: runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubeapierrorbudgetburn summary: The API server is burning too much error budget. expr: | - sum(apiserver_request:burnrate3d) > (1.00 * 0.01000) - and - sum(apiserver_request:burnrate6h) > (1.00 * 0.01000) + sum by(cluster) (apiserver_request:burnrate3d) > (1.00 * 0.01000) + and on(cluster) + sum by(cluster) (apiserver_request:burnrate6h) > (1.00 * 0.01000) for: 3h labels: long: 3d @@ -63640,22 +58566,26 @@ spec: - alert: KubeClientCertificateExpiration annotations: description: A client certificate used to authenticate to kubernetes apiserver - is expiring in less than 7.0 days. + is expiring in less than 7.0 days on cluster {{ $labels.cluster }}. runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubeclientcertificateexpiration summary: Client certificate is about to expire. expr: | - apiserver_client_certificate_expiration_seconds_count{job="integrations/kubernetes/apiserver"} > 0 and on(job) histogram_quantile(0.01, sum by (job, le) (rate(apiserver_client_certificate_expiration_seconds_bucket{job="integrations/kubernetes/apiserver"}[5m]))) < 604800 + histogram_quantile(0.01, sum without (namespace, service, endpoint) (rate(apiserver_client_certificate_expiration_seconds_bucket{job="integrations/kubernetes/apiserver"}[5m]))) < 604800 + and + on(job, cluster, instance) apiserver_client_certificate_expiration_seconds_count{job="integrations/kubernetes/apiserver"} > 0 for: 5m labels: severity: warning - alert: KubeClientCertificateExpiration annotations: description: A client certificate used to authenticate to kubernetes apiserver - is expiring in less than 24.0 hours. + is expiring in less than 24.0 hours on cluster {{ $labels.cluster }}. runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubeclientcertificateexpiration summary: Client certificate is about to expire. expr: | - apiserver_client_certificate_expiration_seconds_count{job="integrations/kubernetes/apiserver"} > 0 and on(job) histogram_quantile(0.01, sum by (job, le) (rate(apiserver_client_certificate_expiration_seconds_bucket{job="integrations/kubernetes/apiserver"}[5m]))) < 86400 + histogram_quantile(0.01, sum without (namespace, service, endpoint) (rate(apiserver_client_certificate_expiration_seconds_bucket{job="integrations/kubernetes/apiserver"}[5m]))) < 86400 + and + on(job, cluster, instance) apiserver_client_certificate_expiration_seconds_count{job="integrations/kubernetes/apiserver"} > 0 for: 5m labels: severity: critical @@ -63699,7 +58629,7 @@ spec: summary: The kubernetes apiserver has terminated {{ $value | humanizePercentage }} of its incoming requests. expr: | - sum(rate(apiserver_request_terminations_total{job="integrations/kubernetes/apiserver"}[10m])) / ( sum(rate(apiserver_request_total{job="integrations/kubernetes/apiserver"}[10m])) + sum(rate(apiserver_request_terminations_total{job="integrations/kubernetes/apiserver"}[10m])) ) > 0.20 + sum by(cluster) (rate(apiserver_request_terminations_total{job="integrations/kubernetes/apiserver"}[10m])) / ( sum by(cluster) (rate(apiserver_request_total{job="integrations/kubernetes/apiserver"}[10m])) + sum by(cluster) (rate(apiserver_request_terminations_total{job="integrations/kubernetes/apiserver"}[10m])) ) > 0.20 for: 5m labels: severity: warning @@ -63909,18 +58839,18 @@ spec: labels: verb: write record: code:apiserver_request_total:increase30d - - expr: | - sum by (cluster, verb, scope) (increase(apiserver_request_sli_duration_seconds_count{job="integrations/kubernetes/apiserver"}[1h])) - record: cluster_verb_scope:apiserver_request_sli_duration_seconds_count:increase1h - - expr: | - sum by (cluster, verb, scope) (avg_over_time(cluster_verb_scope:apiserver_request_sli_duration_seconds_count:increase1h[30d]) * 24 * 30) - record: cluster_verb_scope:apiserver_request_sli_duration_seconds_count:increase30d - expr: | sum by (cluster, verb, scope, le) (increase(apiserver_request_sli_duration_seconds_bucket[1h])) record: cluster_verb_scope_le:apiserver_request_sli_duration_seconds_bucket:increase1h - expr: | sum by (cluster, verb, scope, le) (avg_over_time(cluster_verb_scope_le:apiserver_request_sli_duration_seconds_bucket:increase1h[30d]) * 24 * 30) record: cluster_verb_scope_le:apiserver_request_sli_duration_seconds_bucket:increase30d + - expr: | + sum by (cluster, verb, scope) (cluster_verb_scope_le:apiserver_request_sli_duration_seconds_bucket:increase1h{le="+Inf"}) + record: cluster_verb_scope:apiserver_request_sli_duration_seconds_count:increase1h + - expr: | + sum by (cluster, verb, scope) (cluster_verb_scope_le:apiserver_request_sli_duration_seconds_bucket:increase30d{le="+Inf"} * 24 * 30) + record: cluster_verb_scope:apiserver_request_sli_duration_seconds_count:increase30d - expr: | 1 - ( ( @@ -64375,7 +59305,7 @@ spec: max by(cluster, namespace, pod, node) (kube_pod_info{node!=""}) ) record: node_namespace_pod_container:container_memory_swap - - name: k8s.rules.container_resource + - name: k8s.rules.container_memory_requests rules: - expr: | kube_pod_container_resource_requests{resource="memory",job="integrations/kubernetes/kube-state-metrics"} * on (namespace, pod, cluster) @@ -64394,6 +59324,8 @@ spec: ) ) record: namespace_memory:kube_pod_container_resource_requests:sum + - name: k8s.rules.container_cpu_requests + rules: - expr: | kube_pod_container_resource_requests{resource="cpu",job="integrations/kubernetes/kube-state-metrics"} * on (namespace, pod, cluster) group_left() max by (namespace, pod, cluster) ( @@ -64411,6 +59343,8 @@ spec: ) ) record: namespace_cpu:kube_pod_container_resource_requests:sum + - name: k8s.rules.container_memory_limits + rules: - expr: | kube_pod_container_resource_limits{resource="memory",job="integrations/kubernetes/kube-state-metrics"} * on (namespace, pod, cluster) group_left() max by (namespace, pod, cluster) ( @@ -64428,6 +59362,8 @@ spec: ) ) record: namespace_memory:kube_pod_container_resource_limits:sum + - name: k8s.rules.container_cpu_limits + rules: - expr: | kube_pod_container_resource_limits{resource="cpu",job="integrations/kubernetes/kube-state-metrics"} * on (namespace, pod, cluster) group_left() max by (namespace, pod, cluster) ( @@ -64713,15 +59649,11 @@ spec: expr: | ( sum by(cluster, namespace, name, operation) ( - rate(thanos_memcached_operation_failures_total[1m]) - or - rate(thanos_cache_operation_failures_total[1m]) + rate(thanos_cache_operation_failures_total{operation!="add"}[1m]) ) / sum by(cluster, namespace, name, operation) ( - rate(thanos_memcached_operations_total[1m]) - or - rate(thanos_cache_operations_total[1m]) + rate(thanos_cache_operations_total{operation!="add"}[1m]) ) ) * 100 > 5 for: 5m @@ -64777,7 +59709,11 @@ spec: }} has no tenants assigned. runbook_url: https://grafana.com/docs/mimir/latest/operators-guide/mimir-runbooks/#mimiringesterinstancehasnotenants expr: | - (min by(cluster, namespace, pod) (cortex_ingester_memory_users) == 0) + ( + (min by(cluster, namespace, pod) (cortex_ingester_memory_users) == 0) + unless + (max by(cluster, namespace, pod) (cortex_lifecycler_read_only) > 0) + ) and on (cluster, namespace) # Only if there are more timeseries than would be expected due to continuous testing load ( @@ -65139,7 +60075,7 @@ spec: expr: | max by (cluster, namespace) (memberlist_client_cluster_members_count) > - (sum by (cluster, namespace) (up{job=~".+/(mimir|admin-api|alertmanager|compactor.*|distributor.*|ingester.*|querier.*|ruler|ruler-querier.*|store-gateway.*|cortex|mimir-write.*|mimir-read.*|mimir-backend.*)"}) + 10) + (sum by (cluster, namespace) (up{job=~".*/(mimir|admin-api|alertmanager|compactor.*|distributor.*|ingester.*|querier.*|ruler|ruler-querier.*|store-gateway.*|cortex|mimir-write.*|mimir-read.*|mimir-backend.*)"}) + 10) for: 20m labels: severity: warning @@ -65210,7 +60146,7 @@ spec: runbook_url: https://grafana.com/docs/mimir/latest/operators-guide/mimir-runbooks/#etcdallocatingtoomuchmemory expr: | ( - container_memory_working_set_bytes{container="etcd"} + container_memory_rss{container="etcd"} / ( container_spec_memory_limit_bytes{container="etcd"} > 0 ) ) > 0.65 @@ -65224,7 +60160,7 @@ spec: runbook_url: https://grafana.com/docs/mimir/latest/operators-guide/mimir-runbooks/#etcdallocatingtoomuchmemory expr: | ( - container_memory_working_set_bytes{container="etcd"} + container_memory_rss{container="etcd"} / ( container_spec_memory_limit_bytes{container="etcd"} > 0 ) ) > 0.8 @@ -65751,7 +60687,12 @@ spec: }} fails to consume write requests read from Kafka due to internal errors. runbook_url: https://grafana.com/docs/mimir/latest/operators-guide/mimir-runbooks/#mimiringesterfailstoprocessrecordsfromkafka expr: | - sum by (cluster, namespace, pod) (rate(cortex_ingest_storage_reader_records_failed_total{cause="server"}[1m])) > 0 + sum by (cluster, namespace, pod) ( + # This is the old metric name. We're keeping support for backward compatibility. + rate(cortex_ingest_storage_reader_records_failed_total{cause="server"}[1m]) + or + rate(cortex_ingest_storage_reader_requests_failed_total{cause="server"}[1m]) + ) > 0 for: 5m labels: severity: critical @@ -65762,13 +60703,27 @@ spec: runbook_url: https://grafana.com/docs/mimir/latest/operators-guide/mimir-runbooks/#mimiringesterstuckprocessingrecordsfromkafka expr: | # Alert if the reader is not processing any records, but there buffered records to process in the Kafka client. - (sum by (cluster, namespace, pod) (rate(cortex_ingest_storage_reader_records_total[5m])) == 0) + (sum by (cluster, namespace, pod) ( + # This is the old metric name. We're keeping support for backward compatibility. + rate(cortex_ingest_storage_reader_records_total[5m]) + or + rate(cortex_ingest_storage_reader_requests_total[5m]) + ) == 0) and - # NOTE: the cortex_ingest_storage_reader_buffered_fetch_records_total metric is a gauge showing the current number of buffered records. - (sum by (cluster, namespace, pod) (cortex_ingest_storage_reader_buffered_fetch_records_total) > 0) + (sum by (cluster, namespace, pod) (cortex_ingest_storage_reader_buffered_fetched_records) > 0) for: 5m labels: severity: critical + - alert: MimirIngesterMissedRecordsFromKafka + annotations: + message: Mimir {{ $labels.pod }} in {{ $labels.cluster }}/{{ $labels.namespace + }} missed processing records from Kafka. There may be data loss. + runbook_url: https://grafana.com/docs/mimir/latest/operators-guide/mimir-runbooks/#mimiringestermissedrecordsfromkafka + expr: | + # Alert if the ingester missed some records from Kafka. + increase(cortex_ingest_storage_reader_missed_records_total[10m]) > 0 + labels: + severity: critical - alert: MimirStrongConsistencyEnforcementFailed annotations: message: Mimir {{ $labels.pod }} in {{ $labels.cluster }}/{{ $labels.namespace @@ -65806,6 +60761,36 @@ spec: for: 5m labels: severity: critical + - alert: MimirBlockBuilderNoCycleProcessing + annotations: + message: Mimir {{ $labels.pod }} in {{ $labels.cluster }}/{{ $labels.namespace + }} has not processed cycles in the past hour. + runbook_url: https://grafana.com/docs/mimir/latest/operators-guide/mimir-runbooks/#mimirblockbuildernocycleprocessing + expr: | + max by(cluster, namespace, pod) (histogram_count(increase(cortex_blockbuilder_consume_cycle_duration_seconds[60m]))) == 0 + for: 5m + labels: + severity: warning + - alert: MimirBlockBuilderLagging + annotations: + message: Mimir {{ $labels.pod }} in {{ $labels.cluster }}/{{ $labels.namespace + }} reports partition lag of {{ printf "%.2f" $value }}%. + runbook_url: https://grafana.com/docs/mimir/latest/operators-guide/mimir-runbooks/#mimirblockbuilderlagging + expr: | + max by(cluster, namespace, pod) (max_over_time(cortex_blockbuilder_consumer_lag_records[10m])) > 4e6 + for: 75m + labels: + severity: warning + - alert: MimirBlockBuilderCompactAndUploadFailed + annotations: + message: Mimir {{ $labels.pod }} in {{ $labels.cluster }}/{{ $labels.namespace + }} fails to compact and upload blocks. + runbook_url: https://grafana.com/docs/mimir/latest/operators-guide/mimir-runbooks/#mimirblockbuildercompactanduploadfailed + expr: | + sum by (cluster, namespace, pod) (rate(cortex_blockbuilder_tsdb_compact_and_upload_failed_total[1m])) > 0 + for: 5m + labels: + severity: warning - name: mimir_continuous_test rules: - alert: MimirContinuousTestNotRunningOnWrites