Review notes (patch preamble; text before the "diff --git" line is not part of the change):
  * Purpose: enable NVIDIA GPU access for the ollama container by adding the
    NVIDIA_* environment variables and an nvidia.com/gpu limit of 1.
  * The image hunk (ollama/ollama:0.20.7 -> ollama/ollama:latest) was dropped on
    purpose: a floating tag makes rollouts non-reproducible. To upgrade, bump to
    an explicit version tag in a separate change. The "index" line is omitted
    because the resulting blob no longer matches the original hash.
  * NOTE(review): NVIDIA_VISIBLE_DEVICES=all is set explicitly alongside the
    nvidia.com/gpu limit; confirm it does not override the device plugin's
    per-container GPU assignment on this cluster.
  * NOTE(review): the indentation of context lines below was reconstructed from
    conventional Deployment nesting (the original whitespace was lost); regenerate
    with `git diff` or apply with --ignore-whitespace if it does not match.

diff --git a/ollama/ollama.yaml b/ollama/ollama.yaml
--- a/ollama/ollama.yaml
+++ b/ollama/ollama.yaml
@@ -66,12 +66,17 @@ spec:
               value: "8192"
             - name: OLLAMA_KEEP_ALIVE
               value: "-1"
+            - name: NVIDIA_VISIBLE_DEVICES
+              value: all
+            - name: NVIDIA_DRIVER_CAPABILITIES
+              value: compute,utility
           resources:
             requests:
               memory: 8Gi
               cpu: "500m"
             limits:
               memory: 20Gi
+              nvidia.com/gpu: "1"
           volumeMounts:
             - name: ollama-data
               mountPath: /root/.ollama