openclaw: pin mvp model lane to titan-21
This commit is contained in:
parent
887023eaeb
commit
3142d35403
@ -20,7 +20,7 @@ spec:
|
|||||||
app: openclaw
|
app: openclaw
|
||||||
annotations:
|
annotations:
|
||||||
ai.bstein.dev/role: testing-triage
|
ai.bstein.dev/role: testing-triage
|
||||||
ai.bstein.dev/placement: Jetson pool (titan-20/21)
|
ai.bstein.dev/placement: Jetson MVP lane (titan-21)
|
||||||
spec:
|
spec:
|
||||||
serviceAccountName: openclaw-triage
|
serviceAccountName: openclaw-triage
|
||||||
automountServiceAccountToken: true
|
automountServiceAccountToken: true
|
||||||
@ -36,7 +36,6 @@ spec:
|
|||||||
- key: kubernetes.io/hostname
|
- key: kubernetes.io/hostname
|
||||||
operator: In
|
operator: In
|
||||||
values:
|
values:
|
||||||
- titan-20
|
|
||||||
- titan-21
|
- titan-21
|
||||||
initContainers:
|
initContainers:
|
||||||
- name: init-config
|
- name: init-config
|
||||||
|
|||||||
@ -20,7 +20,7 @@ spec:
|
|||||||
app: openclaw-ollama
|
app: openclaw-ollama
|
||||||
annotations:
|
annotations:
|
||||||
ai.bstein.dev/model: qwen2.5:1.5b-instruct-q4_0
|
ai.bstein.dev/model: qwen2.5:1.5b-instruct-q4_0
|
||||||
ai.bstein.dev/gpu: Jetson pool (titan-20/21)
|
ai.bstein.dev/gpu: Jetson MVP lane (titan-21)
|
||||||
spec:
|
spec:
|
||||||
runtimeClassName: nvidia
|
runtimeClassName: nvidia
|
||||||
affinity:
|
affinity:
|
||||||
@ -31,7 +31,6 @@ spec:
|
|||||||
- key: kubernetes.io/hostname
|
- key: kubernetes.io/hostname
|
||||||
operator: In
|
operator: In
|
||||||
values:
|
values:
|
||||||
- titan-20
|
|
||||||
- titan-21
|
- titan-21
|
||||||
volumes:
|
volumes:
|
||||||
- name: models
|
- name: models
|
||||||
@ -69,8 +68,8 @@ spec:
|
|||||||
memory: 4Gi
|
memory: 4Gi
|
||||||
nvidia.com/gpu.shared: 1
|
nvidia.com/gpu.shared: 1
|
||||||
limits:
|
limits:
|
||||||
cpu: "4"
|
cpu: "3"
|
||||||
memory: 10Gi
|
memory: 8Gi
|
||||||
nvidia.com/gpu.shared: 1
|
nvidia.com/gpu.shared: 1
|
||||||
containers:
|
containers:
|
||||||
- name: ollama
|
- name: ollama
|
||||||
@ -102,10 +101,10 @@ spec:
|
|||||||
timeoutSeconds: 5
|
timeoutSeconds: 5
|
||||||
resources:
|
resources:
|
||||||
requests:
|
requests:
|
||||||
cpu: "2"
|
cpu: "1"
|
||||||
memory: 8Gi
|
memory: 8Gi
|
||||||
nvidia.com/gpu.shared: 1
|
nvidia.com/gpu.shared: 1
|
||||||
limits:
|
limits:
|
||||||
cpu: "6"
|
cpu: "3"
|
||||||
memory: 12Gi
|
memory: 10Gi
|
||||||
nvidia.com/gpu.shared: 1
|
nvidia.com/gpu.shared: 1
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user