fix kubelet alarms (#14414)
This commit is contained in:
parent
161f51132d
commit
bd106ed984
|
@ -9,7 +9,7 @@
|
||||||
class: Errors
|
class: Errors
|
||||||
type: Kubernetes
|
type: Kubernetes
|
||||||
component: Kubelet
|
component: Kubelet
|
||||||
calc: $kubelet_node_config_error
|
calc: $experiencing_error
|
||||||
units: bool
|
units: bool
|
||||||
every: 10s
|
every: 10s
|
||||||
warn: $this == 1
|
warn: $this == 1
|
||||||
|
@ -20,12 +20,12 @@ component: Kubelet
|
||||||
# Failed Token() requests to the alternate token source
|
# Failed Token() requests to the alternate token source
|
||||||
|
|
||||||
template: kubelet_token_requests
|
template: kubelet_token_requests
|
||||||
lookup: sum -10s of token_fail_count
|
|
||||||
on: k8s_kubelet.kubelet_token_requests
|
on: k8s_kubelet.kubelet_token_requests
|
||||||
class: Errors
|
class: Errors
|
||||||
type: Kubernetes
|
type: Kubernetes
|
||||||
component: Kubelet
|
component: Kubelet
|
||||||
units: failed requests
|
lookup: sum -10s of failed
|
||||||
|
units: requests
|
||||||
every: 10s
|
every: 10s
|
||||||
warn: $this > 0
|
warn: $this > 0
|
||||||
delay: down 1m multiplier 1.5 max 2h
|
delay: down 1m multiplier 1.5 max 2h
|
||||||
|
@ -35,11 +35,11 @@ component: Kubelet
|
||||||
# Docker and runtime operation errors
|
# Docker and runtime operation errors
|
||||||
|
|
||||||
template: kubelet_operations_error
|
template: kubelet_operations_error
|
||||||
lookup: sum -1m
|
|
||||||
on: k8s_kubelet.kubelet_operations_errors
|
on: k8s_kubelet.kubelet_operations_errors
|
||||||
class: Errors
|
class: Errors
|
||||||
type: Kubernetes
|
type: Kubernetes
|
||||||
component: Kubelet
|
component: Kubelet
|
||||||
|
lookup: sum -1m
|
||||||
units: errors
|
units: errors
|
||||||
every: 10s
|
every: 10s
|
||||||
warn: $this > (($status >= $WARNING) ? (0) : (20))
|
warn: $this > (($status >= $WARNING) ? (0) : (20))
|
||||||
|
@ -67,7 +67,7 @@ component: Kubelet
|
||||||
class: Latency
|
class: Latency
|
||||||
type: Kubernetes
|
type: Kubernetes
|
||||||
component: Kubelet
|
component: Kubelet
|
||||||
lookup: average -1m unaligned of kubelet_pleg_relist_latency_05
|
lookup: average -1m unaligned of 0.5
|
||||||
units: microseconds
|
units: microseconds
|
||||||
every: 10s
|
every: 10s
|
||||||
info: average Pod Lifecycle Event Generator relisting latency over the last minute (quantile 0.5)
|
info: average Pod Lifecycle Event Generator relisting latency over the last minute (quantile 0.5)
|
||||||
|
@ -77,7 +77,7 @@ component: Kubelet
|
||||||
class: Latency
|
class: Latency
|
||||||
type: Kubernetes
|
type: Kubernetes
|
||||||
component: Kubelet
|
component: Kubelet
|
||||||
lookup: average -10s unaligned of kubelet_pleg_relist_latency_05
|
lookup: average -10s unaligned of 0.5
|
||||||
calc: $this * 100 / (($kubelet_1m_pleg_relist_latency_quantile_05 < 1000)?(1000):($kubelet_1m_pleg_relist_latency_quantile_05))
|
calc: $this * 100 / (($kubelet_1m_pleg_relist_latency_quantile_05 < 1000)?(1000):($kubelet_1m_pleg_relist_latency_quantile_05))
|
||||||
every: 10s
|
every: 10s
|
||||||
units: %
|
units: %
|
||||||
|
@ -95,7 +95,7 @@ component: Kubelet
|
||||||
class: Latency
|
class: Latency
|
||||||
type: Kubernetes
|
type: Kubernetes
|
||||||
component: Kubelet
|
component: Kubelet
|
||||||
lookup: average -1m unaligned of kubelet_pleg_relist_latency_09
|
lookup: average -1m unaligned of 0.9
|
||||||
units: microseconds
|
units: microseconds
|
||||||
every: 10s
|
every: 10s
|
||||||
info: average Pod Lifecycle Event Generator relisting latency over the last minute (quantile 0.9)
|
info: average Pod Lifecycle Event Generator relisting latency over the last minute (quantile 0.9)
|
||||||
|
@ -105,7 +105,7 @@ component: Kubelet
|
||||||
class: Latency
|
class: Latency
|
||||||
type: Kubernetes
|
type: Kubernetes
|
||||||
component: Kubelet
|
component: Kubelet
|
||||||
lookup: average -10s unaligned of kubelet_pleg_relist_latency_09
|
lookup: average -10s unaligned of 0.9
|
||||||
calc: $this * 100 / (($kubelet_1m_pleg_relist_latency_quantile_09 < 1000)?(1000):($kubelet_1m_pleg_relist_latency_quantile_09))
|
calc: $this * 100 / (($kubelet_1m_pleg_relist_latency_quantile_09 < 1000)?(1000):($kubelet_1m_pleg_relist_latency_quantile_09))
|
||||||
every: 10s
|
every: 10s
|
||||||
units: %
|
units: %
|
||||||
|
@ -123,7 +123,7 @@ component: Kubelet
|
||||||
class: Latency
|
class: Latency
|
||||||
type: Kubernetes
|
type: Kubernetes
|
||||||
component: Kubelet
|
component: Kubelet
|
||||||
lookup: average -1m unaligned of kubelet_pleg_relist_latency_099
|
lookup: average -1m unaligned of 0.99
|
||||||
units: microseconds
|
units: microseconds
|
||||||
every: 10s
|
every: 10s
|
||||||
info: average Pod Lifecycle Event Generator relisting latency over the last minute (quantile 0.99)
|
info: average Pod Lifecycle Event Generator relisting latency over the last minute (quantile 0.99)
|
||||||
|
@ -133,7 +133,7 @@ component: Kubelet
|
||||||
class: Latency
|
class: Latency
|
||||||
type: Kubernetes
|
type: Kubernetes
|
||||||
component: Kubelet
|
component: Kubelet
|
||||||
lookup: average -10s unaligned of kubelet_pleg_relist_latency_099
|
lookup: average -10s unaligned of 0.99
|
||||||
calc: $this * 100 / (($kubelet_1m_pleg_relist_latency_quantile_099 < 1000)?(1000):($kubelet_1m_pleg_relist_latency_quantile_099))
|
calc: $this * 100 / (($kubelet_1m_pleg_relist_latency_quantile_099 < 1000)?(1000):($kubelet_1m_pleg_relist_latency_quantile_099))
|
||||||
every: 10s
|
every: 10s
|
||||||
units: %
|
units: %
|
||||||
|
|
Loading…
Reference in New Issue