feat(ollama): migrate GPU from AMD ROCm to NVIDIA CUDA (RTX 3060 via OCuLink)

Switch from the ollama/ollama:rocm image with the amd.com/gpu resource to the standard CUDA image with the nvidia.com/gpu resource.
The RTX 3060 (GA106, 12 GB) is now used via the NVIDIA GPU Operator on node chemavx-k8.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
This commit is contained in:
2026-04-17 17:12:50 +00:00
parent b805c2c9e5
commit 8b7d3c0659
+6 -1
View File
@@ -40,7 +40,7 @@ spec:
kubernetes.io/hostname: chemavx-k8 kubernetes.io/hostname: chemavx-k8
containers: containers:
- name: ollama - name: ollama
image: ollama/ollama:0.20.7 image: ollama/ollama:latest
command: ["/usr/bin/bash", "-c"] command: ["/usr/bin/bash", "-c"]
args: args:
- | - |
@@ -66,12 +66,17 @@ spec:
value: "8192" value: "8192"
- name: OLLAMA_KEEP_ALIVE - name: OLLAMA_KEEP_ALIVE
value: "-1" value: "-1"
- name: NVIDIA_VISIBLE_DEVICES
value: all
- name: NVIDIA_DRIVER_CAPABILITIES
value: compute,utility
resources: resources:
requests: requests:
memory: 8Gi memory: 8Gi
cpu: "500m" cpu: "500m"
limits: limits:
memory: 20Gi memory: 20Gi
nvidia.com/gpu: "1"
volumeMounts: volumeMounts:
- name: ollama-data - name: ollama-data
mountPath: /root/.ollama mountPath: /root/.ollama