Add job to monitor the PVE host using node exporter and add an alert for high SSD writes [ci skip]
This commit is contained in:
parent
d07c625064
commit
6c1ae20448
1 changed file with 17 additions and 1 deletion
|
|
@ -187,7 +187,7 @@ serverFiles:
|
||||||
annotations:
|
annotations:
|
||||||
summary: Node {{$labels.instance}} down.
|
summary: Node {{$labels.instance}} down.
|
||||||
- alert: NodeHighCPUUsage
|
- alert: NodeHighCPUUsage
|
||||||
expr: node_load1 > 2
|
expr: node_load1{instance!="pve-node-r730"} > 2
|
||||||
for: 20m
|
for: 20m
|
||||||
labels:
|
labels:
|
||||||
severity: page
|
severity: page
|
||||||
|
|
@ -200,6 +200,13 @@ serverFiles:
|
||||||
severity: page
|
severity: page
|
||||||
annotations:
|
annotations:
|
||||||
summary: "Low free memory on {{ $labels.node }} - {{ $value }}"
|
summary: "Low free memory on {{ $labels.node }} - {{ $value }}"
|
||||||
|
- alert: SSDHighWriteRate
|
||||||
|
expr: rate(node_disk_written_bytes_total{job="proxmox-host", device="sdb"}[2m]) / 1024 / 1024 > 2  # sdb is the SSD; bytes/s converted to MiB/s, threshold is 2 MiB/s
|
||||||
|
for: 10m  # the write rate must stay above the threshold for 10 minutes before the alert fires
|
||||||
|
labels:
|
||||||
|
severity: page
|
||||||
|
annotations:
|
||||||
|
summary: 'High write rate on SSD - {{ printf "%.2f" $value }} MiB/s'
|
||||||
# - name: PodStuckNotReady
|
# - name: PodStuckNotReady
|
||||||
# rules:
|
# rules:
|
||||||
# - alert: PodStuckNotReady
|
# - alert: PodStuckNotReady
|
||||||
|
|
@ -344,6 +351,15 @@ serverFiles:
|
||||||
summary: New tailscale client registered
|
summary: New tailscale client registered
|
||||||
|
|
||||||
extraScrapeConfigs: |
|
extraScrapeConfigs: |
|
||||||
|
- job_name: 'proxmox-host'  # Scrapes the node exporter on the PVE host; alert rules select this job via job="proxmox-host"
|
||||||
|
static_configs:
|
||||||
|
- targets:
|
||||||
|
- "192.168.1.127:9100"  # Fixed host:port of the exporter endpoint (static target, no service discovery)
|
||||||
|
metrics_path: '/metrics'
|
||||||
|
relabel_configs:
|
||||||
|
- source_labels: [__address__]
|
||||||
|
target_label: instance
|
||||||
|
replacement: 'pve-node-r730'  # Constant friendly name written to the instance label; the NodeHighCPUUsage rule matches on this value
|
||||||
- job_name: 'istiod'
|
- job_name: 'istiod'
|
||||||
kubernetes_sd_configs:
|
kubernetes_sd_configs:
|
||||||
- role: endpoints
|
- role: endpoints
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue