{{- /*
Generated from 'kube-apiserver-availability.rules' group from https://raw.githubusercontent.com/prometheus-operator/kube-prometheus/main/manifests/kubernetes-prometheusRule.yaml
Do not change in-place! In order to change this file first read following link:
https://github.com/prometheus-community/helm-charts/tree/main/charts/kube-prometheus-stack/hack
*/ -}}
{{- /*
The target Kubernetes version is .Values.kubeTargetVersionOverride when set,
otherwise the GitVersion reported by .Capabilities.
*/ -}}
{{- $kubeTargetVersion := default .Capabilities.KubeVersion.GitVersion .Values.kubeTargetVersionOverride }}
{{- /*
The PrometheusRule is rendered only when the target version is within
[1.14.0-0, 9.9.9-9) and defaultRules.create, kubeApiServer.enabled and
defaultRules.rules.kubeApiserverAvailability are all truthy.
*/ -}}
{{- if and (semverCompare ">=1.14.0-0" $kubeTargetVersion) (semverCompare "<9.9.9-9" $kubeTargetVersion) .Values.defaultRules.create .Values.kubeApiServer.enabled .Values.defaultRules.rules.kubeApiserverAvailability }}
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
metadata:
  name: {{ printf "%s-%s" (include "kube-prometheus-stack.fullname" .) "kube-apiserver-availability.rules" | trunc 63 | trimSuffix "-" }}
  namespace: {{ template "kube-prometheus-stack.namespace" . }}
  labels:
    app: {{ template "kube-prometheus-stack.name" . }}
{{ include "kube-prometheus-stack.labels" . | indent 4 }}
{{- if .Values.defaultRules.labels }}
{{ toYaml .Values.defaultRules.labels | indent 4 }}
{{- end }}
{{- if .Values.defaultRules.annotations }}
  annotations:
{{ toYaml .Values.defaultRules.annotations | indent 4 }}
{{- end }}
spec:
  groups:
  - interval: 3m
    name: kube-apiserver-availability.rules
    rules:
    # 30-day request totals per code/verb, extrapolated from the average
    # hourly increase (x 24 hours x 30 days).
    - expr: avg_over_time(code_verb:apiserver_request_total:increase1h[30d]) * 24 * 30
      record: code_verb:apiserver_request_total:increase30d
    # Roll the 30-day totals up per cluster/code into verb="read" (LIST|GET)
    # and verb="write" (POST|PUT|PATCH|DELETE).
    - expr: sum by (cluster, code) (code_verb:apiserver_request_total:increase30d{verb=~"LIST|GET"})
      labels:
        verb: read
      record: code:apiserver_request_total:increase30d
    - expr: sum by (cluster, code) (code_verb:apiserver_request_total:increase30d{verb=~"POST|PUT|PATCH|DELETE"})
      labels:
        verb: write
      record: code:apiserver_request_total:increase30d
    # 30-day availability across all verbs:
    # 1 - (too-slow writes + too-slow reads + 5xx responses) / all requests.
    # "Too slow" is the request count minus the requests that landed in the
    # latency bucket for their verb/scope (le="1", "5" or "40").
    - expr: |-
        1 - (
          (
            # write too slow
            sum by (cluster) (increase(apiserver_request_duration_seconds_count{verb=~"POST|PUT|PATCH|DELETE"}[30d]))
            -
            sum by (cluster) (increase(apiserver_request_duration_seconds_bucket{verb=~"POST|PUT|PATCH|DELETE",le="1"}[30d]))
          ) +
          (
            # read too slow
            sum by (cluster) (increase(apiserver_request_duration_seconds_count{verb=~"LIST|GET"}[30d]))
            -
            (
              (
                sum by (cluster) (increase(apiserver_request_duration_seconds_bucket{verb=~"LIST|GET",scope=~"resource|",le="1"}[30d]))
                or
                vector(0)
              )
              +
              sum by (cluster) (increase(apiserver_request_duration_seconds_bucket{verb=~"LIST|GET",scope="namespace",le="5"}[30d]))
              +
              sum by (cluster) (increase(apiserver_request_duration_seconds_bucket{verb=~"LIST|GET",scope="cluster",le="40"}[30d]))
            )
          ) +
          # errors
          sum by (cluster) (code:apiserver_request_total:increase30d{code=~"5.."} or vector(0))
        )
        /
        sum by (cluster) (code:apiserver_request_total:increase30d)
      labels:
        verb: all
      record: apiserver_request:availability30d
    # 30-day availability for read requests (LIST|GET) only.
    - expr: |-
        1 - (
          sum by (cluster) (increase(apiserver_request_duration_seconds_count{job="apiserver",verb=~"LIST|GET"}[30d]))
          -
          (
            # too slow
            (
              sum by (cluster) (increase(apiserver_request_duration_seconds_bucket{job="apiserver",verb=~"LIST|GET",scope=~"resource|",le="1"}[30d]))
              or
              vector(0)
            )
            +
            sum by (cluster) (increase(apiserver_request_duration_seconds_bucket{job="apiserver",verb=~"LIST|GET",scope="namespace",le="5"}[30d]))
            +
            sum by (cluster) (increase(apiserver_request_duration_seconds_bucket{job="apiserver",verb=~"LIST|GET",scope="cluster",le="40"}[30d]))
          )
          +
          # errors
          sum by (cluster) (code:apiserver_request_total:increase30d{verb="read",code=~"5.."} or vector(0))
        )
        /
        sum by (cluster) (code:apiserver_request_total:increase30d{verb="read"})
      labels:
        verb: read
      record: apiserver_request:availability30d
    # 30-day availability for write requests (POST|PUT|PATCH|DELETE) only.
    - expr: |-
        1 - (
          (
            # too slow
            sum by (cluster) (increase(apiserver_request_duration_seconds_count{verb=~"POST|PUT|PATCH|DELETE"}[30d]))
            -
            sum by (cluster) (increase(apiserver_request_duration_seconds_bucket{verb=~"POST|PUT|PATCH|DELETE",le="1"}[30d]))
          )
          +
          # errors
          sum by (cluster) (code:apiserver_request_total:increase30d{verb="write",code=~"5.."} or vector(0))
        )
        /
        sum by (cluster) (code:apiserver_request_total:increase30d{verb="write"})
      labels:
        verb: write
      record: apiserver_request:availability30d
    # 5-minute request rate per cluster/code/resource, recorded separately for
    # verb="read" and verb="write".
    - expr: sum by (cluster,code,resource) (rate(apiserver_request_total{job="apiserver",verb=~"LIST|GET"}[5m]))
      labels:
        verb: read
      record: code_resource:apiserver_request_total:rate5m
    - expr: sum by (cluster,code,resource) (rate(apiserver_request_total{job="apiserver",verb=~"POST|PUT|PATCH|DELETE"}[5m]))
      labels:
        verb: write
      record: code_resource:apiserver_request_total:rate5m
    # Hourly request increase per cluster/code/verb, one rule per status-code
    # class (2xx, 3xx, 4xx, 5xx), all recorded under the same series name.
    - expr: sum by (cluster, code, verb) (increase(apiserver_request_total{job="apiserver",verb=~"LIST|GET|POST|PUT|PATCH|DELETE",code=~"2.."}[1h]))
      record: code_verb:apiserver_request_total:increase1h
    - expr: sum by (cluster, code, verb) (increase(apiserver_request_total{job="apiserver",verb=~"LIST|GET|POST|PUT|PATCH|DELETE",code=~"3.."}[1h]))
      record: code_verb:apiserver_request_total:increase1h
    - expr: sum by (cluster, code, verb) (increase(apiserver_request_total{job="apiserver",verb=~"LIST|GET|POST|PUT|PATCH|DELETE",code=~"4.."}[1h]))
      record: code_verb:apiserver_request_total:increase1h
    - expr: sum by (cluster, code, verb) (increase(apiserver_request_total{job="apiserver",verb=~"LIST|GET|POST|PUT|PATCH|DELETE",code=~"5.."}[1h]))
      record: code_verb:apiserver_request_total:increase1h
{{- end }}