Remove every hardcoded reference to k8s-node1 that pinned GPU scheduling to a specific host: - GPU workload nodeSelectors: gpu=true -> nvidia.com/gpu.present=true (frigate, immich, whisper, piper, ytdlp, ebook2audiobook, audiblez, audiblez-web, nvidia-exporter, gpu-pod-exporter). The NFD label is auto-applied by gpu-feature-discovery on any node carrying an NVIDIA PCI device, so the selector follows the card. - null_resource.gpu_node_config: rewrite to enumerate NFD-labeled nodes (feature.node.kubernetes.io/pci-10de.present=true) and taint each with nvidia.com/gpu=true:PreferNoSchedule. Drop the manual 'kubectl label gpu=true' since NFD handles labeling. - MySQL anti-affinity: kubernetes.io/hostname NotIn [k8s-node1] -> nvidia.com/gpu.present NotIn [true]. Same intent (keep MySQL off the GPU node) but portable when the card relocates. Net effect: moving the GPU card between nodes no longer requires any Terraform edit. Verified no-op for current scheduling — both old and new labels resolve to node1 today. Docs updated to match: AGENTS.md, compute.md, overview.md, proxmox-inventory.md, k8s-portal agent-guidance string.
458 lines
11 KiB
HCL
458 lines
11 KiB
HCL
variable "tls_secret_name" {
|
|
type = string
|
|
sensitive = true
|
|
}
|
|
variable "nfs_server" { type = string }
|
|
|
|
|
|
module "tls_secret" {
|
|
source = "../../modules/kubernetes/setup_tls_secret"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
tls_secret_name = var.tls_secret_name
|
|
}
|
|
|
|
resource "kubernetes_namespace" "ebook2audiobook" {
|
|
metadata {
|
|
name = "ebook2audiobook"
|
|
labels = {
|
|
"istio-injection" : "disabled"
|
|
tier = local.tiers.gpu
|
|
}
|
|
}
|
|
lifecycle {
|
|
# KYVERNO_LIFECYCLE_V1: goldilocks-vpa-auto-mode ClusterPolicy stamps this label on every namespace
|
|
ignore_changes = [metadata[0].labels["goldilocks.fairwinds.com/vpa-update-mode"]]
|
|
}
|
|
}
|
|
|
|
|
|
module "nfs_data_host" {
|
|
source = "../../modules/kubernetes/nfs_volume"
|
|
name = "ebook2audiobook-data-host"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
nfs_server = "192.168.1.127"
|
|
nfs_path = "/srv/nfs/ebook2audiobook"
|
|
}
|
|
|
|
module "nfs_audiblez_data_host" {
|
|
source = "../../modules/kubernetes/nfs_volume"
|
|
name = "ebook2audiobook-audiblez-data-host"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
nfs_server = "192.168.1.127"
|
|
nfs_path = "/srv/nfs/audiblez"
|
|
}
|
|
|
|
resource "kubernetes_deployment" "ebook2audiobook" {
|
|
metadata {
|
|
name = "ebook2audiobook"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
labels = {
|
|
app = "ebook2audiobook"
|
|
tier = local.tiers.gpu
|
|
}
|
|
}
|
|
spec {
|
|
replicas = 0 # Disabled - using audiblez instead
|
|
strategy {
|
|
type = "Recreate"
|
|
}
|
|
|
|
selector {
|
|
match_labels = {
|
|
app = "ebook2audiobook"
|
|
}
|
|
}
|
|
|
|
template {
|
|
metadata {
|
|
labels = {
|
|
app = "ebook2audiobook"
|
|
}
|
|
}
|
|
|
|
spec {
|
|
node_selector = {
|
|
"nvidia.com/gpu.present" : "true"
|
|
}
|
|
toleration {
|
|
key = "nvidia.com/gpu"
|
|
operator = "Equal"
|
|
value = "true"
|
|
effect = "NoSchedule"
|
|
}
|
|
|
|
container {
|
|
name = "ebook2audiobook"
|
|
image = "docker.io/athomasson2/ebook2audiobook:v25.12.30-cu128"
|
|
|
|
tty = true
|
|
stdin = true
|
|
|
|
port {
|
|
container_port = 7860
|
|
}
|
|
|
|
# LD_LIBRARY_PATH needed for CUDA detection - libcudart.so is in non-standard location
|
|
env {
|
|
name = "LD_LIBRARY_PATH"
|
|
value = "/usr/local/lib/python3.12/site-packages/nvidia/cuda_runtime/lib:/usr/local/lib/python3.12/site-packages/nvidia/cudnn/lib"
|
|
}
|
|
|
|
volume_mount {
|
|
mount_path = "/home/user"
|
|
name = "data"
|
|
}
|
|
|
|
resources {
|
|
limits = {
|
|
"nvidia.com/gpu" = "1"
|
|
}
|
|
}
|
|
}
|
|
|
|
volume {
|
|
name = "data"
|
|
persistent_volume_claim {
|
|
claim_name = module.nfs_data_host.claim_name
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
lifecycle {
|
|
# KYVERNO_LIFECYCLE_V1: Kyverno admission webhook mutates dns_config with ndots=2
|
|
ignore_changes = [spec[0].template[0].spec[0].dns_config]
|
|
}
|
|
}
|
|
|
|
|
|
resource "kubernetes_service" "ebook2audiobook" {
|
|
metadata {
|
|
name = "ebook2audiobook"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
labels = {
|
|
"app" = "ebook2audiobook"
|
|
}
|
|
}
|
|
|
|
spec {
|
|
selector = {
|
|
app = "ebook2audiobook"
|
|
}
|
|
port {
|
|
name = "http"
|
|
port = 80
|
|
target_port = 7860
|
|
}
|
|
}
|
|
}
|
|
|
|
# resource "kubernetes_deployment" "piper" {
|
|
# metadata {
|
|
# name = "piper"
|
|
# namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
# labels = {
|
|
# app = "piper"
|
|
# }
|
|
# }
|
|
# spec {
|
|
# replicas = 1
|
|
# strategy {
|
|
# type = "Recreate"
|
|
# }
|
|
|
|
# selector {
|
|
# match_labels = {
|
|
# app = "piper"
|
|
# }
|
|
# }
|
|
|
|
# template {
|
|
# metadata {
|
|
# labels = {
|
|
# app = "piper"
|
|
# }
|
|
# }
|
|
|
|
# spec {
|
|
# container {
|
|
# name = "piper"
|
|
# # image = "lscr.io/linuxserver/piper:gpu"
|
|
# # image = "piper-tts-wyoming:latest"
|
|
# image = "viktorbarzin/piper"
|
|
# # image = "nvidia/cuda:12.8.1-cudnn-devel-ubuntu24.04"
|
|
|
|
# # working_dir = "/app"
|
|
# command = ["sleep", "3600"]
|
|
|
|
# volume_mount {
|
|
# mount_path = "/config"
|
|
# name = "data"
|
|
# }
|
|
|
|
# resources {
|
|
# limits = {
|
|
# "nvidia.com/gpu" = "1"
|
|
# }
|
|
# }
|
|
# # env {
|
|
# # name = "PIPER_VOICE"
|
|
# # value = "en_US-lessac-medium"
|
|
# # }
|
|
|
|
# env {
|
|
# name = "VOICE_MODEL"
|
|
# value = "en_US-lessac-medium"
|
|
# }
|
|
# env {
|
|
# name = "LOG_LEVEL"
|
|
# value = "DEBUG"
|
|
# }
|
|
# port {
|
|
# name = "web"
|
|
# container_port = 10200
|
|
# }
|
|
# }
|
|
|
|
# volume {
|
|
# name = "data"
|
|
# nfs {
|
|
# server = var.nfs_server
|
|
# path = "/mnt/main/piper"
|
|
# }
|
|
# }
|
|
# }
|
|
# }
|
|
# }
|
|
# }
|
|
|
|
# resource "kubernetes_service" "piper" {
|
|
# metadata {
|
|
# name = "piper"
|
|
# namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
# labels = {
|
|
# "app" = "piper"
|
|
# }
|
|
# }
|
|
|
|
# spec {
|
|
# selector = {
|
|
# app = "piper"
|
|
# }
|
|
# port {
|
|
# name = "http"
|
|
# port = 80
|
|
# target_port = 10200
|
|
# }
|
|
# }
|
|
# }
|
|
|
|
|
|
module "ingress" {
|
|
source = "../../modules/kubernetes/ingress_factory"
|
|
dns_type = "non-proxied"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
name = "ebook2audiobook"
|
|
tls_secret_name = var.tls_secret_name
|
|
protected = true
|
|
extra_annotations = {
|
|
"gethomepage.dev/enabled" = "true"
|
|
"gethomepage.dev/name" = "Ebook2Audiobook"
|
|
"gethomepage.dev/description" = "Book to audio converter"
|
|
"gethomepage.dev/icon" = "audiobookshelf.png"
|
|
"gethomepage.dev/group" = "AI & Data"
|
|
"gethomepage.dev/pod-selector" = ""
|
|
}
|
|
}
|
|
|
|
|
|
resource "kubernetes_deployment" "audiblez" {
|
|
metadata {
|
|
name = "audiblez"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
labels = {
|
|
app = "audiblez"
|
|
tier = local.tiers.gpu
|
|
}
|
|
}
|
|
spec {
|
|
replicas = 0 # Disabled - using audiblez-web instead
|
|
selector {
|
|
match_labels = {
|
|
app = "audiblez"
|
|
}
|
|
}
|
|
template {
|
|
metadata {
|
|
labels = {
|
|
app = "audiblez"
|
|
}
|
|
}
|
|
spec {
|
|
node_selector = {
|
|
"nvidia.com/gpu.present" : "true"
|
|
}
|
|
toleration {
|
|
key = "nvidia.com/gpu"
|
|
operator = "Equal"
|
|
value = "true"
|
|
effect = "NoSchedule"
|
|
}
|
|
container {
|
|
image = "viktorbarzin/audiblez:latest"
|
|
name = "audiblez"
|
|
command = ["/usr/bin/sleep", "infinity"]
|
|
volume_mount {
|
|
name = "data"
|
|
mount_path = "/mnt"
|
|
}
|
|
resources {
|
|
limits = {
|
|
"nvidia.com/gpu" = "1"
|
|
}
|
|
}
|
|
}
|
|
volume {
|
|
name = "data"
|
|
persistent_volume_claim {
|
|
claim_name = module.nfs_audiblez_data_host.claim_name
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
lifecycle {
|
|
# KYVERNO_LIFECYCLE_V1: Kyverno admission webhook mutates dns_config with ndots=2
|
|
ignore_changes = [spec[0].template[0].spec[0].dns_config]
|
|
}
|
|
}
|
|
|
|
|
|
# Audiblez Web UI
|
|
resource "kubernetes_deployment" "audiblez-web" {
|
|
metadata {
|
|
name = "audiblez-web"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
labels = {
|
|
app = "audiblez-web"
|
|
tier = local.tiers.gpu
|
|
}
|
|
}
|
|
spec {
|
|
replicas = 0 # Scaled down - GPU node memory pressure
|
|
strategy {
|
|
type = "Recreate"
|
|
}
|
|
selector {
|
|
match_labels = {
|
|
app = "audiblez-web"
|
|
}
|
|
}
|
|
template {
|
|
metadata {
|
|
labels = {
|
|
app = "audiblez-web"
|
|
}
|
|
}
|
|
spec {
|
|
node_selector = {
|
|
"nvidia.com/gpu.present" : "true"
|
|
}
|
|
toleration {
|
|
key = "nvidia.com/gpu"
|
|
operator = "Equal"
|
|
value = "true"
|
|
effect = "NoSchedule"
|
|
}
|
|
container {
|
|
image = "docker.io/viktorbarzin/audiblez-web:latest"
|
|
image_pull_policy = "Always"
|
|
name = "audiblez-web"
|
|
|
|
port {
|
|
container_port = 8000
|
|
}
|
|
|
|
volume_mount {
|
|
name = "data"
|
|
mount_path = "/mnt"
|
|
}
|
|
|
|
resources {
|
|
limits = {
|
|
"nvidia.com/gpu" = "1"
|
|
}
|
|
}
|
|
|
|
# liveness_probe {
|
|
# http_get {
|
|
# path = "/health"
|
|
# port = 8000
|
|
# }
|
|
# initial_delay_seconds = 10
|
|
# period_seconds = 30
|
|
# }
|
|
|
|
# readiness_probe {
|
|
# http_get {
|
|
# path = "/health"
|
|
# port = 8000
|
|
# }
|
|
# initial_delay_seconds = 5
|
|
# period_seconds = 10
|
|
# }
|
|
}
|
|
volume {
|
|
name = "data"
|
|
persistent_volume_claim {
|
|
claim_name = module.nfs_audiblez_data_host.claim_name
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
lifecycle {
|
|
# KYVERNO_LIFECYCLE_V1: Kyverno admission webhook mutates dns_config with ndots=2
|
|
ignore_changes = [spec[0].template[0].spec[0].dns_config]
|
|
}
|
|
}
|
|
|
|
resource "kubernetes_service" "audiblez-web" {
|
|
metadata {
|
|
name = "audiblez-web"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
labels = {
|
|
"app" = "audiblez-web"
|
|
}
|
|
}
|
|
|
|
spec {
|
|
selector = {
|
|
app = "audiblez-web"
|
|
}
|
|
port {
|
|
name = "http"
|
|
port = 80
|
|
target_port = 8000
|
|
}
|
|
}
|
|
}
|
|
|
|
module "audiblez-web-ingress" {
|
|
source = "../../modules/kubernetes/ingress_factory"
|
|
namespace = kubernetes_namespace.ebook2audiobook.metadata[0].name
|
|
name = "audiblez-web"
|
|
host = "audiblez"
|
|
dns_type = "non-proxied"
|
|
tls_secret_name = var.tls_secret_name
|
|
protected = true
|
|
max_body_size = "500m" # Allow large EPUB uploads
|
|
extra_annotations = {
|
|
"gethomepage.dev/enabled" = "true"
|
|
"gethomepage.dev/name" = "Audiblez"
|
|
"gethomepage.dev/description" = "Book to audio converter"
|
|
"gethomepage.dev/icon" = "audiobookshelf.png"
|
|
"gethomepage.dev/group" = "AI & Data"
|
|
"gethomepage.dev/pod-selector" = ""
|
|
}
|
|
}
|