Compare commits
2 Commits
c55cbcdefa
...
c3e3714e4d
Author | SHA1 | Date |
---|---|---|
SeanOMik | c3e3714e4d | |
SeanOMik | 52b51c3966 |
|
@ -129,6 +129,11 @@ spec:
|
||||||
cert-manager:
|
cert-manager:
|
||||||
url: https://raw.githubusercontent.com/monitoring-mixins/website/master/assets/cert-manager/dashboards/cert-manager.json
|
url: https://raw.githubusercontent.com/monitoring-mixins/website/master/assets/cert-manager/dashboards/cert-manager.json
|
||||||
datasource: Victoria
|
datasource: Victoria
|
||||||
|
longhorn:
|
||||||
|
# renovate: depName="Longhorn"
|
||||||
|
gnetId: 16888
|
||||||
|
revision: 8
|
||||||
|
datasource: Victoria
|
||||||
spegel:
|
spegel:
|
||||||
# renovate: depName="Spegel"
|
# renovate: depName="Spegel"
|
||||||
gnetId: 18089
|
gnetId: 18089
|
||||||
|
|
|
@ -25,4 +25,9 @@ spec:
|
||||||
podDnsConfig:
|
podDnsConfig:
|
||||||
nameservers:
|
nameservers:
|
||||||
- "1.1.1.1"
|
- "1.1.1.1"
|
||||||
- "9.9.9.9"
|
- "9.9.9.9"
|
||||||
|
prometheus:
|
||||||
|
servicemonitor:
|
||||||
|
enabled: true
|
||||||
|
labels:
|
||||||
|
release: kube-prometheus-stack
|
|
@ -0,0 +1,21 @@
|
||||||
|
apiVersion: monitoring.coreos.com/v1
|
||||||
|
kind: PrometheusRule
|
||||||
|
metadata:
|
||||||
|
name: prometheus-longhorn-rules
|
||||||
|
namespace: longhorn-system
|
||||||
|
labels:
|
||||||
|
release: kube-prometheus-stack
|
||||||
|
spec:
|
||||||
|
groups:
|
||||||
|
- name: longhorn.rules
|
||||||
|
rules:
|
||||||
|
- alert: LonghornVolumeUsageCritical
|
||||||
|
annotations:
|
||||||
|
description: Longhorn volume {{$labels.volume}} on {{$labels.node}} is at {{$value}}% used for
|
||||||
|
more than 5 minutes.
|
||||||
|
summary: Longhorn volume capacity is over 90% used.
|
||||||
|
expr: 100 * (longhorn_volume_usage_bytes / longhorn_volume_capacity_bytes) > 90
|
||||||
|
for: 5m
|
||||||
|
labels:
|
||||||
|
issue: Longhorn volume {{$labels.volume}} usage on {{$labels.node}} is critical.
|
||||||
|
severity: critical
|
|
@ -3,4 +3,6 @@ kind: Kustomization
|
||||||
resources:
|
resources:
|
||||||
- ./namespace.yaml
|
- ./namespace.yaml
|
||||||
- ./helm-repository.yaml
|
- ./helm-repository.yaml
|
||||||
- ./helm-release.yaml
|
- ./helm-release.yaml
|
||||||
|
- ./alerts.yaml
|
||||||
|
- ./service-monitor.yaml
|
|
@ -0,0 +1,13 @@
|
||||||
|
apiVersion: monitoring.coreos.com/v1
|
||||||
|
kind: ServiceMonitor
|
||||||
|
metadata:
|
||||||
|
name: longhorn
|
||||||
|
namespace: longhorn-system
|
||||||
|
labels:
|
||||||
|
release: kube-prometheus-stack
|
||||||
|
spec:
|
||||||
|
selector:
|
||||||
|
matchLabels:
|
||||||
|
app: longhorn-manager
|
||||||
|
endpoints:
|
||||||
|
- port: manager
|
Loading…
Reference in New Issue