feat(ollama): migrate GPU from AMD ROCm to NVIDIA CUDA (RTX 3060 via OCuLink)

Switch from the ollama/ollama:rocm image with amd.com/gpu to the standard CUDA image with nvidia.com/gpu. The RTX 3060 (GA106, 12GB) is now used via the NVIDIA GPU Operator on chemavx-k8.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
2026-04-17 17:13:07 +00:00
parent b805c2c9e5
commit 8b7d3c0659
1 changed file with 6 additions and 1 deletion
@@ -40,7 +40,7 @@ spec:
        kubernetes.io/hostname: chemavx-k8
      containers:
        - name: ollama
-          image: ollama/ollama:0.20.7
+          image: ollama/ollama:latest
          command: ["/usr/bin/bash", "-c"]
          args:
            - |
@@ -66,12 +66,17 @@ spec:
              value: "8192"
            - name: OLLAMA_KEEP_ALIVE
              value: "-1"
+            - name: NVIDIA_VISIBLE_DEVICES
+              value: all
+            - name: NVIDIA_DRIVER_CAPABILITIES
+              value: compute,utility
          resources:
            requests:
              memory: 8Gi
              cpu: "500m"
            limits:
              memory: 20Gi
+              nvidia.com/gpu: "1"
          volumeMounts:
            - name: ollama-data
              mountPath: /root/.ollama