# Values for an Ollama deployment on an NVIDIA GPU node.
# NOTE(review): nesting was reconstructed from a flattened copy of this file;
# confirm the key paths against the consuming chart's values schema.
ollama:
  gpu:
    # -- Enable GPU integration
    enabled: true

    # -- GPU type: 'nvidia' or 'amd'
    type: "nvidia"

    # -- Number of GPUs to use
    number: 1

  # -- List of models to pull at container startup
  models:
    pull:
      - llama3

persistentVolume:
  enabled: true
  # Name of an existing claim to use; presumably the PVC must already exist
  # in the release namespace — TODO confirm.
  existingClaim: "ollama-pvc"

# Label value is quoted so it stays the string "true" rather than a boolean.
nodeSelector:
  gpu: "true"

# Tolerates the taint nvidia.com/gpu=true with effect NoSchedule.
tolerations:
  - key: "nvidia.com/gpu"
    operator: "Equal"
    value: "true"
    effect: "NoSchedule"