openclaw: move mvp inference to titan-24

This commit is contained in:
jenkins 2026-05-19 20:14:44 -03:00
parent dd4aff8861
commit aadc93e681
2 changed files with 10 additions and 10 deletions

View File

@ -20,7 +20,7 @@ spec:
app: openclaw app: openclaw
annotations: annotations:
ai.bstein.dev/role: testing-triage ai.bstein.dev/role: testing-triage
ai.bstein.dev/placement: Jetson MVP lane (titan-21) ai.bstein.dev/placement: accelerator MVP lane (titan-24)
spec: spec:
serviceAccountName: openclaw-triage serviceAccountName: openclaw-triage
automountServiceAccountToken: true automountServiceAccountToken: true
@ -36,7 +36,7 @@ spec:
- key: kubernetes.io/hostname - key: kubernetes.io/hostname
operator: In operator: In
values: values:
- titan-21 - titan-24
initContainers: initContainers:
- name: init-config - name: init-config
image: busybox:1.37 image: busybox:1.37
@ -86,7 +86,7 @@ spec:
memory: 64Mi memory: 64Mi
containers: containers:
- name: gateway - name: gateway
image: ghcr.io/openclaw/openclaw:slim@sha256:ca134367c291b982ec301038af4602f397c7f90cc6c6d263c12a78a5fe1bde57 image: ghcr.io/openclaw/openclaw:slim@sha256:5ea30d02a706c49795ed0a3c1526dec51ed90107a6859e93bf27a663105d1c28
imagePullPolicy: IfNotPresent imagePullPolicy: IfNotPresent
command: command:
- node - node

View File

@ -20,7 +20,7 @@ spec:
app: openclaw-ollama app: openclaw-ollama
annotations: annotations:
ai.bstein.dev/model: qwen2.5:1.5b-instruct-q4_0 ai.bstein.dev/model: qwen2.5:1.5b-instruct-q4_0
ai.bstein.dev/gpu: Jetson MVP lane (titan-21) ai.bstein.dev/gpu: accelerator MVP lane (titan-24)
spec: spec:
runtimeClassName: nvidia runtimeClassName: nvidia
affinity: affinity:
@ -31,7 +31,7 @@ spec:
- key: kubernetes.io/hostname - key: kubernetes.io/hostname
operator: In operator: In
values: values:
- titan-21 - titan-24
volumes: volumes:
- name: models - name: models
emptyDir: {} emptyDir: {}
@ -68,8 +68,8 @@ spec:
memory: 4Gi memory: 4Gi
nvidia.com/gpu.shared: 1 nvidia.com/gpu.shared: 1
limits: limits:
cpu: "3" cpu: "4"
memory: 8Gi memory: 10Gi
nvidia.com/gpu.shared: 1 nvidia.com/gpu.shared: 1
containers: containers:
- name: ollama - name: ollama
@ -101,10 +101,10 @@ spec:
timeoutSeconds: 5 timeoutSeconds: 5
resources: resources:
requests: requests:
cpu: "1" cpu: "2"
memory: 8Gi memory: 8Gi
nvidia.com/gpu.shared: 1 nvidia.com/gpu.shared: 1
limits: limits:
cpu: "3" cpu: "6"
memory: 10Gi memory: 12Gi
nvidia.com/gpu.shared: 1 nvidia.com/gpu.shared: 1