Memory right-sizing based on VPA upperBound analysis: - Increases: stirling-pdf 1200→1536Mi, claude-memory 64→128Mi, dawarich 512→768Mi, kyverno-cleanup 128→192Mi, linkwarden 768→1Gi, navidrome 64→128Mi, listenarr 768→896Mi, privatebin 64→128Mi, ntfy 64→128Mi, health 128→256Mi, dbaas quota 16→20Gi, mysql-operator 384→512Mi - Decreases: rybbit 768→384Mi, nvidia-exporter added explicit 192Mi, dcgm-exporter 2560→1536Mi - Scale to 0: ebook2audiobook/audiblez-web, whisper (GPU node pressure) Net effect: -496Mi cluster-wide, 13 ContainerNearOOM alerts resolved, all ResourceQuota pressures cleared, GPU health green.
440 lines
9.8 KiB
HCL
440 lines
9.8 KiB
HCL
variable "tls_secret_name" {
|
|
type = string
|
|
sensitive = true
|
|
}
|
|
variable "nfs_server" { type = string }
|
|
|
|
|
|
module "tls_secret" {
|
|
source = "../../modules/kubernetes/setup_tls_secret"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
tls_secret_name = var.tls_secret_name
|
|
}
|
|
|
|
resource "kubernetes_namespace" "ebook2audiobook" {
|
|
metadata {
|
|
name = "ebook2audiobook"
|
|
labels = {
|
|
"istio-injection" : "disabled"
|
|
tier = local.tiers.gpu
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
module "nfs_data" {
|
|
source = "../../modules/kubernetes/nfs_volume"
|
|
name = "ebook2audiobook-data"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
nfs_server = var.nfs_server
|
|
nfs_path = "/mnt/main/ebook2audiobook"
|
|
}
|
|
|
|
module "nfs_audiblez_data" {
|
|
source = "../../modules/kubernetes/nfs_volume"
|
|
name = "ebook2audiobook-audiblez-data"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
nfs_server = var.nfs_server
|
|
nfs_path = "/mnt/main/audiblez"
|
|
}
|
|
|
|
resource "kubernetes_deployment" "ebook2audiobook" {
|
|
metadata {
|
|
name = "ebook2audiobook"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
labels = {
|
|
app = "ebook2audiobook"
|
|
tier = local.tiers.gpu
|
|
}
|
|
}
|
|
spec {
|
|
replicas = 0 # Disabled - using audiblez instead
|
|
strategy {
|
|
type = "Recreate"
|
|
}
|
|
|
|
selector {
|
|
match_labels = {
|
|
app = "ebook2audiobook"
|
|
}
|
|
}
|
|
|
|
template {
|
|
metadata {
|
|
labels = {
|
|
app = "ebook2audiobook"
|
|
}
|
|
}
|
|
|
|
spec {
|
|
node_selector = {
|
|
"gpu" : "true"
|
|
}
|
|
toleration {
|
|
key = "nvidia.com/gpu"
|
|
operator = "Equal"
|
|
value = "true"
|
|
effect = "NoSchedule"
|
|
}
|
|
|
|
container {
|
|
name = "ebook2audiobook"
|
|
image = "docker.io/athomasson2/ebook2audiobook:v25.12.30-cu128"
|
|
|
|
tty = true
|
|
stdin = true
|
|
|
|
port {
|
|
container_port = 7860
|
|
}
|
|
|
|
# LD_LIBRARY_PATH needed for CUDA detection - libcudart.so is in non-standard location
|
|
env {
|
|
name = "LD_LIBRARY_PATH"
|
|
value = "/usr/local/lib/python3.12/site-packages/nvidia/cuda_runtime/lib:/usr/local/lib/python3.12/site-packages/nvidia/cudnn/lib"
|
|
}
|
|
|
|
volume_mount {
|
|
mount_path = "/home/user"
|
|
name = "data"
|
|
}
|
|
|
|
resources {
|
|
limits = {
|
|
"nvidia.com/gpu" = "1"
|
|
}
|
|
}
|
|
}
|
|
|
|
volume {
|
|
name = "data"
|
|
persistent_volume_claim {
|
|
claim_name = module.nfs_data.claim_name
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
resource "kubernetes_service" "ebook2audiobook" {
|
|
metadata {
|
|
name = "ebook2audiobook"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
labels = {
|
|
"app" = "ebook2audiobook"
|
|
}
|
|
}
|
|
|
|
spec {
|
|
selector = {
|
|
app = "ebook2audiobook"
|
|
}
|
|
port {
|
|
name = "http"
|
|
port = 80
|
|
target_port = 7860
|
|
}
|
|
}
|
|
}
|
|
|
|
# resource "kubernetes_deployment" "piper" {
|
|
# metadata {
|
|
# name = "piper"
|
|
# namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
# labels = {
|
|
# app = "piper"
|
|
# }
|
|
# }
|
|
# spec {
|
|
# replicas = 1
|
|
# strategy {
|
|
# type = "Recreate"
|
|
# }
|
|
|
|
# selector {
|
|
# match_labels = {
|
|
# app = "piper"
|
|
# }
|
|
# }
|
|
|
|
# template {
|
|
# metadata {
|
|
# labels = {
|
|
# app = "piper"
|
|
# }
|
|
# }
|
|
|
|
# spec {
|
|
# container {
|
|
# name = "piper"
|
|
# # image = "lscr.io/linuxserver/piper:gpu"
|
|
# # image = "piper-tts-wyoming:latest"
|
|
# image = "viktorbarzin/piper"
|
|
# # image = "nvidia/cuda:12.8.1-cudnn-devel-ubuntu24.04"
|
|
|
|
# # working_dir = "/app"
|
|
# command = ["sleep", "3600"]
|
|
|
|
# volume_mount {
|
|
# mount_path = "/config"
|
|
# name = "data"
|
|
# }
|
|
|
|
# resources {
|
|
# limits = {
|
|
# "nvidia.com/gpu" = "1"
|
|
# }
|
|
# }
|
|
# # env {
|
|
# # name = "PIPER_VOICE"
|
|
# # value = "en_US-lessac-medium"
|
|
# # }
|
|
|
|
# env {
|
|
# name = "VOICE_MODEL"
|
|
# value = "en_US-lessac-medium"
|
|
# }
|
|
# env {
|
|
# name = "LOG_LEVEL"
|
|
# value = "DEBUG"
|
|
# }
|
|
# port {
|
|
# name = "web"
|
|
# container_port = 10200
|
|
# }
|
|
# }
|
|
|
|
# volume {
|
|
# name = "data"
|
|
# nfs {
|
|
# server = var.nfs_server
|
|
# path = "/mnt/main/piper"
|
|
# }
|
|
# }
|
|
# }
|
|
# }
|
|
# }
|
|
# }
|
|
|
|
# resource "kubernetes_service" "piper" {
|
|
# metadata {
|
|
# name = "piper"
|
|
# namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
# labels = {
|
|
# "app" = "piper"
|
|
# }
|
|
# }
|
|
|
|
# spec {
|
|
# selector = {
|
|
# app = "piper"
|
|
# }
|
|
# port {
|
|
# name = "http"
|
|
# port = 80
|
|
# target_port = 10200
|
|
# }
|
|
# }
|
|
# }
|
|
|
|
|
|
module "ingress" {
|
|
source = "../../modules/kubernetes/ingress_factory"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
name = "ebook2audiobook"
|
|
tls_secret_name = var.tls_secret_name
|
|
protected = true
|
|
extra_annotations = {
|
|
"gethomepage.dev/enabled" = "true"
|
|
"gethomepage.dev/name" = "Ebook2Audiobook"
|
|
"gethomepage.dev/description" = "Book to audio converter"
|
|
"gethomepage.dev/icon" = "audiobookshelf.png"
|
|
"gethomepage.dev/group" = "AI & Data"
|
|
"gethomepage.dev/pod-selector" = ""
|
|
}
|
|
}
|
|
|
|
|
|
resource "kubernetes_deployment" "audiblez" {
|
|
metadata {
|
|
name = "audiblez"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
labels = {
|
|
app = "audiblez"
|
|
tier = local.tiers.gpu
|
|
}
|
|
}
|
|
spec {
|
|
replicas = 0 # Disabled - using audiblez-web instead
|
|
selector {
|
|
match_labels = {
|
|
app = "audiblez"
|
|
}
|
|
}
|
|
template {
|
|
metadata {
|
|
labels = {
|
|
app = "audiblez"
|
|
}
|
|
}
|
|
spec {
|
|
node_selector = {
|
|
"gpu" : "true"
|
|
}
|
|
toleration {
|
|
key = "nvidia.com/gpu"
|
|
operator = "Equal"
|
|
value = "true"
|
|
effect = "NoSchedule"
|
|
}
|
|
container {
|
|
image = "viktorbarzin/audiblez:latest"
|
|
name = "audiblez"
|
|
command = ["/usr/bin/sleep", "infinity"]
|
|
volume_mount {
|
|
name = "data"
|
|
mount_path = "/mnt"
|
|
}
|
|
resources {
|
|
limits = {
|
|
"nvidia.com/gpu" = "1"
|
|
}
|
|
}
|
|
}
|
|
volume {
|
|
name = "data"
|
|
persistent_volume_claim {
|
|
claim_name = module.nfs_audiblez_data.claim_name
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
# Audiblez Web UI
|
|
resource "kubernetes_deployment" "audiblez-web" {
|
|
metadata {
|
|
name = "audiblez-web"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
labels = {
|
|
app = "audiblez-web"
|
|
tier = local.tiers.gpu
|
|
}
|
|
}
|
|
spec {
|
|
replicas = 0 # Scaled down - GPU node memory pressure
|
|
strategy {
|
|
type = "Recreate"
|
|
}
|
|
selector {
|
|
match_labels = {
|
|
app = "audiblez-web"
|
|
}
|
|
}
|
|
template {
|
|
metadata {
|
|
labels = {
|
|
app = "audiblez-web"
|
|
}
|
|
}
|
|
spec {
|
|
node_selector = {
|
|
"gpu" : "true"
|
|
}
|
|
toleration {
|
|
key = "nvidia.com/gpu"
|
|
operator = "Equal"
|
|
value = "true"
|
|
effect = "NoSchedule"
|
|
}
|
|
container {
|
|
image = "docker.io/viktorbarzin/audiblez-web:latest"
|
|
image_pull_policy = "Always"
|
|
name = "audiblez-web"
|
|
|
|
port {
|
|
container_port = 8000
|
|
}
|
|
|
|
volume_mount {
|
|
name = "data"
|
|
mount_path = "/mnt"
|
|
}
|
|
|
|
resources {
|
|
limits = {
|
|
"nvidia.com/gpu" = "1"
|
|
}
|
|
}
|
|
|
|
# liveness_probe {
|
|
# http_get {
|
|
# path = "/health"
|
|
# port = 8000
|
|
# }
|
|
# initial_delay_seconds = 10
|
|
# period_seconds = 30
|
|
# }
|
|
|
|
# readiness_probe {
|
|
# http_get {
|
|
# path = "/health"
|
|
# port = 8000
|
|
# }
|
|
# initial_delay_seconds = 5
|
|
# period_seconds = 10
|
|
# }
|
|
}
|
|
volume {
|
|
name = "data"
|
|
persistent_volume_claim {
|
|
claim_name = module.nfs_audiblez_data.claim_name
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
resource "kubernetes_service" "audiblez-web" {
|
|
metadata {
|
|
name = "audiblez-web"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
labels = {
|
|
"app" = "audiblez-web"
|
|
}
|
|
}
|
|
|
|
spec {
|
|
selector = {
|
|
app = "audiblez-web"
|
|
}
|
|
port {
|
|
name = "http"
|
|
port = 80
|
|
target_port = 8000
|
|
}
|
|
}
|
|
}
|
|
|
|
module "audiblez-web-ingress" {
|
|
source = "../../modules/kubernetes/ingress_factory"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
name = "audiblez-web"
|
|
host = "audiblez"
|
|
tls_secret_name = var.tls_secret_name
|
|
protected = true
|
|
max_body_size = "500m" # Allow large EPUB uploads
|
|
extra_annotations = {
|
|
"gethomepage.dev/enabled" = "true"
|
|
"gethomepage.dev/name" = "Audiblez"
|
|
"gethomepage.dev/description" = "Book to audio converter"
|
|
"gethomepage.dev/icon" = "audiobookshelf.png"
|
|
"gethomepage.dev/group" = "AI & Data"
|
|
"gethomepage.dev/pod-selector" = ""
|
|
}
|
|
}
|