# infra/modules/kubernetes/ollama/values.yaml

# Ollama application settings (GPU integration and models pulled at startup).
ollama:
  gpu:
    # -- Enable GPU integration
    enabled: true
    # -- GPU type: 'nvidia' or 'amd'
    type: "nvidia"
    # -- Number of GPUs to request
    number: 1
  models:
    # -- List of models to pull at container startup
    pull:
      - llama3
# Persistent storage settings.
persistentVolume:
  # -- Enable persistence
  enabled: true
  # -- Name of the claim to use; presumably a PVC that already exists in the
  # release namespace (confirm against the chart's documentation).
  existingClaim: "ollama-pvc"
# Restrict scheduling to nodes carrying the label gpu=true.
nodeSelector:
  # Quoted on purpose: Kubernetes label values are strings, not booleans.
  gpu: "true"
# Allow scheduling onto nodes tainted nvidia.com/gpu=true:NoSchedule.
tolerations:
  - key: "nvidia.com/gpu"
    operator: "Equal"
    # Quoted on purpose: taint values are strings, not booleans.
    value: "true"
    effect: "NoSchedule"