[ci skip] Fix Prometheus storage alert and Grafana quota exhaustion
- Enable size-based TSDB retention (45GB) to clean up old blocks (including 2021-era blocks with failed compaction) - Increase monitoring namespace quota from 64/128Gi to 80/160Gi CPU/memory limits to allow Grafana rolling updates
This commit is contained in:
parent
dcce738641
commit
26ba9ea371
2 changed files with 3 additions and 3 deletions
|
|
@ -194,8 +194,8 @@ resource "kubernetes_resource_quota" "monitoring" {
|
||||||
hard = {
|
hard = {
|
||||||
"requests.cpu" = "16"
|
"requests.cpu" = "16"
|
||||||
"requests.memory" = "16Gi"
|
"requests.memory" = "16Gi"
|
||||||
"limits.cpu" = "64"
|
"limits.cpu" = "80"
|
||||||
"limits.memory" = "128Gi"
|
"limits.memory" = "160Gi"
|
||||||
pods = "100"
|
pods = "100"
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
||||||
|
|
@ -109,7 +109,7 @@ server:
|
||||||
# - "web.enable-admin-api"
|
# - "web.enable-admin-api"
|
||||||
- "web.enable-lifecycle"
|
- "web.enable-lifecycle"
|
||||||
- "storage.tsdb.allow-overlapping-blocks"
|
- "storage.tsdb.allow-overlapping-blocks"
|
||||||
# - "storage.tsdb.retention.size=1GB"
|
- "storage.tsdb.retention.size=45GB"
|
||||||
- "storage.tsdb.wal-compression"
|
- "storage.tsdb.wal-compression"
|
||||||
persistentVolume:
|
persistentVolume:
|
||||||
# enabled: false
|
# enabled: false
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue