From 871d9b04368c7abb1ce79129865299a869157e5c Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?S=C3=A9bastien=20Huss?= Date: Mon, 22 Jan 2024 17:02:02 +0100 Subject: [PATCH] fix --- monitor/prometheus/index.yaml | 46 +++++++++---------- ...ometheus-community-kube-kubelet.rules.yaml | 32 +++++++++++++ ...ity-kube-kubernetes-system-kube-proxy.yaml | 29 ++++++++++++ 3 files changed, 84 insertions(+), 23 deletions(-) create mode 100644 monitor/prometheus/monitoring.coreos.com_v1_PrometheusRule_prometheus-community-kube-kubelet.rules.yaml create mode 100644 monitor/prometheus/monitoring.coreos.com_v1_PrometheusRule_prometheus-community-kube-kubernetes-system-kube-proxy.yaml diff --git a/monitor/prometheus/index.yaml b/monitor/prometheus/index.yaml index 6cad951..568c17d 100644 --- a/monitor/prometheus/index.yaml +++ b/monitor/prometheus/index.yaml @@ -6,6 +6,21 @@ metadata: name: prometheus description: null options: + listenLocal: + default: false + examples: + - false + type: boolean + retention: + default: 10d + examples: + - 10d + type: string + enableAdminAPI: + default: false + examples: + - false + type: boolean issuer: default: letsencrypt-prod examples: @@ -21,31 +36,26 @@ options: examples: - info type: string - enableAdminAPI: - default: false - examples: - - false - type: boolean replicas: default: 1 examples: - 1 type: integer - listenLocal: - default: false + sub-domain: + default: prometheus examples: - - false - type: boolean - domain-name: - default: your_company.com - examples: - - your_company.com + - prometheus type: string ingress-class: default: traefik examples: - traefik type: string + domain-name: + default: your_company.com + examples: + - your_company.com + type: string shards: default: 1 examples: @@ -95,16 +105,6 @@ options: examples: - your-company type: string - retention: - default: 10d - examples: - - 10d - type: string - sub-domain: - default: prometheus - examples: - - prometheus - type: string dependencies: - dist: null category: share diff --git a/monitor/prometheus/monitoring.coreos.com_v1_PrometheusRule_prometheus-community-kube-kubelet.rules.yaml b/monitor/prometheus/monitoring.coreos.com_v1_PrometheusRule_prometheus-community-kube-kubelet.rules.yaml new file mode 100644 index 0000000..e8bdb8c --- /dev/null +++ b/monitor/prometheus/monitoring.coreos.com_v1_PrometheusRule_prometheus-community-kube-kubelet.rules.yaml @@ -0,0 +1,32 @@ +# Source: kube-prometheus-stack/templates/prometheus/rules-1.14/kubelet.rules.yaml +apiVersion: monitoring.coreos.com/v1 +kind: PrometheusRule +metadata: + name: prometheus-community-kube-kubelet.rules + namespace: vynil-monitor + labels: + app: kube-prometheus-stack + + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/instance: prometheus-community + app.kubernetes.io/version: "56.0.2" + app.kubernetes.io/part-of: kube-prometheus-stack + chart: kube-prometheus-stack-56.0.2 + release: "prometheus-community" + heritage: "Helm" +spec: + groups: + - name: kubelet.rules + rules: + - expr: histogram_quantile(0.99, sum(rate(kubelet_pleg_relist_duration_seconds_bucket{job="kubelet", metrics_path="/metrics"}[5m])) by (cluster, instance, le) * on (cluster, instance) group_left(node) kubelet_node_name{job="kubelet", metrics_path="/metrics"}) + labels: + quantile: '0.99' + record: node_quantile:kubelet_pleg_relist_duration_seconds:histogram_quantile + - expr: histogram_quantile(0.9, sum(rate(kubelet_pleg_relist_duration_seconds_bucket{job="kubelet", metrics_path="/metrics"}[5m])) by (cluster, instance, le) * on (cluster, instance) group_left(node) kubelet_node_name{job="kubelet", metrics_path="/metrics"}) + labels: + quantile: '0.9' + record: node_quantile:kubelet_pleg_relist_duration_seconds:histogram_quantile + - expr: histogram_quantile(0.5, sum(rate(kubelet_pleg_relist_duration_seconds_bucket{job="kubelet", metrics_path="/metrics"}[5m])) by (cluster, instance, le) * on (cluster, instance) group_left(node) kubelet_node_name{job="kubelet", metrics_path="/metrics"}) + labels: + quantile: '0.5' + record: node_quantile:kubelet_pleg_relist_duration_seconds:histogram_quantile \ No newline at end of file diff --git a/monitor/prometheus/monitoring.coreos.com_v1_PrometheusRule_prometheus-community-kube-kubernetes-system-kube-proxy.yaml b/monitor/prometheus/monitoring.coreos.com_v1_PrometheusRule_prometheus-community-kube-kubernetes-system-kube-proxy.yaml new file mode 100644 index 0000000..60cf44d --- /dev/null +++ b/monitor/prometheus/monitoring.coreos.com_v1_PrometheusRule_prometheus-community-kube-kubernetes-system-kube-proxy.yaml @@ -0,0 +1,29 @@ +# Source: kube-prometheus-stack/templates/prometheus/rules-1.14/kubernetes-system-kube-proxy.yaml +apiVersion: monitoring.coreos.com/v1 +kind: PrometheusRule +metadata: + name: prometheus-community-kube-kubernetes-system-kube-proxy + namespace: vynil-monitor + labels: + app: kube-prometheus-stack + + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/instance: prometheus-community + app.kubernetes.io/version: "56.0.2" + app.kubernetes.io/part-of: kube-prometheus-stack + chart: kube-prometheus-stack-56.0.2 + release: "prometheus-community" + heritage: "Helm" +spec: + groups: + - name: kubernetes-system-kube-proxy + rules: + - alert: KubeProxyDown + annotations: + description: KubeProxy has disappeared from Prometheus target discovery. + runbook_url: https://runbooks.prometheus-operator.dev/runbooks/kubernetes/kubeproxydown + summary: Target disappeared from Prometheus target discovery. + expr: absent(up{job="kube-proxy"} == 1) + for: 15m + labels: + severity: critical \ No newline at end of file