From 8af9e6b5bd644d144e398c44539b00dee1ece6af Mon Sep 17 00:00:00 2001 From: Viktor Barzin Date: Sun, 28 Dec 2025 08:35:36 +0000 Subject: [PATCH] set the time slicing config in the nvidia chart values[ci skip] --- modules/kubernetes/authentik/pgbouncer.tf | 1 + modules/kubernetes/nvidia/main.tf | 10 +++++----- modules/kubernetes/nvidia/values.yaml | 4 ++++ 3 files changed, 10 insertions(+), 5 deletions(-) diff --git a/modules/kubernetes/authentik/pgbouncer.tf b/modules/kubernetes/authentik/pgbouncer.tf index 24620f6d..f9c83fd9 100644 --- a/modules/kubernetes/authentik/pgbouncer.tf +++ b/modules/kubernetes/authentik/pgbouncer.tf @@ -93,6 +93,7 @@ resource "kubernetes_deployment" "pgbouncer" { } } } + depends_on = [kubernetes_secret.pgbouncer_auth] } # --- 4️⃣ Service --- diff --git a/modules/kubernetes/nvidia/main.tf b/modules/kubernetes/nvidia/main.tf index e1c6d425..1bd3f4b2 100644 --- a/modules/kubernetes/nvidia/main.tf +++ b/modules/kubernetes/nvidia/main.tf @@ -15,7 +15,7 @@ resource "kubernetes_namespace" "nvidia" { } } -# Apply to operator with: +# [not needed anymore; part of the chart values] Apply to operator with: # kubectl patch clusterpolicies.nvidia.com/cluster-policy -n gpu-operator --type merge -p '{"spec": {"devicePlugin": {"config": {"name": "time-slicing-config", "default": "any"}}}}' resource "kubernetes_config_map" "time_slicing_config" { @@ -37,6 +37,7 @@ resource "kubernetes_config_map" "time_slicing_config" { replicas: 10 EOF } + depends_on = [kubernetes_namespace.nvidia] } resource "helm_release" "nvidia-gpu-operator" { @@ -49,7 +50,8 @@ resource "helm_release" "nvidia-gpu-operator" { # version = "0.9.3" timeout = 6000 - values = [templatefile("${path.module}/values.yaml", {})] + values = [templatefile("${path.module}/values.yaml", {})] + depends_on = [kubernetes_config_map.time_slicing_config] } resource "kubernetes_deployment" "nvidia-exporter" { @@ -83,9 +85,6 @@ resource "kubernetes_deployment" "nvidia-exporter" { port { container_port = 9400 } - port { - container_port = 9400 - } security_context { privileged = true capabilities { @@ -101,6 +100,7 @@ resource "kubernetes_deployment" "nvidia-exporter" { } } } + depends_on = [helm_release.nvidia-gpu-operator] } resource "kubernetes_service" "nvidia-exporter" { diff --git a/modules/kubernetes/nvidia/values.yaml b/modules/kubernetes/nvidia/values.yaml index f2611ea0..9049068c 100644 --- a/modules/kubernetes/nvidia/values.yaml +++ b/modules/kubernetes/nvidia/values.yaml @@ -13,3 +13,7 @@ driver: version: "570.195.03" # CUDA 12.8 upgradePolicy: autoUpgrade: false + + devicePlugin: + config: + name: time-slicing-config