ai(ollama): recover onto live jetson gpu pool

This commit is contained in:
jenkins 2026-05-05 06:42:15 -03:00
parent 9e659b790b
commit b81053aaec
2 changed files with 7 additions and 7 deletions

View File

@ -21,7 +21,7 @@ spec:
app: ollama
annotations:
ai.bstein.dev/model: qwen2.5:14b-instruct-q4_0
ai.bstein.dev/gpu: GPU pool (titan-22/24)
ai.bstein.dev/gpu: GPU pool (titan-20/21)
ai.bstein.dev/restartedAt: "2026-01-26T12:00:00Z"
spec:
affinity:
@ -32,13 +32,13 @@ spec:
- key: kubernetes.io/hostname
operator: In
values:
- titan-22
- titan-24
- titan-20
- titan-21
runtimeClassName: nvidia
volumes:
- name: models
persistentVolumeClaim:
claimName: ollama-models
claimName: ollama-models-asteria
initContainers:
- name: warm-model
image: ollama/ollama@sha256:2c9595c555fd70a28363489ac03bd5bf9e7c5bdf2890373c3a830ffd7252ce6d

View File

@ -2,12 +2,12 @@
apiVersion: v1
kind: PersistentVolumeClaim
metadata:
name: ollama-models
name: ollama-models-asteria
namespace: ai
spec:
accessModes:
- ReadWriteOnce
- ReadWriteMany
resources:
requests:
storage: 30Gi
storageClassName: astreae
storageClassName: asteria