openclaw: move mvp inference to titan-24
This commit is contained in:
parent
dd4aff8861
commit
aadc93e681
@ -20,7 +20,7 @@ spec:
|
|||||||
app: openclaw
|
app: openclaw
|
||||||
annotations:
|
annotations:
|
||||||
ai.bstein.dev/role: testing-triage
|
ai.bstein.dev/role: testing-triage
|
||||||
ai.bstein.dev/placement: Jetson MVP lane (titan-21)
|
ai.bstein.dev/placement: accelerator MVP lane (titan-24)
|
||||||
spec:
|
spec:
|
||||||
serviceAccountName: openclaw-triage
|
serviceAccountName: openclaw-triage
|
||||||
automountServiceAccountToken: true
|
automountServiceAccountToken: true
|
||||||
@ -36,7 +36,7 @@ spec:
|
|||||||
- key: kubernetes.io/hostname
|
- key: kubernetes.io/hostname
|
||||||
operator: In
|
operator: In
|
||||||
values:
|
values:
|
||||||
- titan-21
|
- titan-24
|
||||||
initContainers:
|
initContainers:
|
||||||
- name: init-config
|
- name: init-config
|
||||||
image: busybox:1.37
|
image: busybox:1.37
|
||||||
@ -86,7 +86,7 @@ spec:
|
|||||||
memory: 64Mi
|
memory: 64Mi
|
||||||
containers:
|
containers:
|
||||||
- name: gateway
|
- name: gateway
|
||||||
image: ghcr.io/openclaw/openclaw:slim@sha256:ca134367c291b982ec301038af4602f397c7f90cc6c6d263c12a78a5fe1bde57
|
image: ghcr.io/openclaw/openclaw:slim@sha256:5ea30d02a706c49795ed0a3c1526dec51ed90107a6859e93bf27a663105d1c28
|
||||||
imagePullPolicy: IfNotPresent
|
imagePullPolicy: IfNotPresent
|
||||||
command:
|
command:
|
||||||
- node
|
- node
|
||||||
|
|||||||
@ -20,7 +20,7 @@ spec:
|
|||||||
app: openclaw-ollama
|
app: openclaw-ollama
|
||||||
annotations:
|
annotations:
|
||||||
ai.bstein.dev/model: qwen2.5:1.5b-instruct-q4_0
|
ai.bstein.dev/model: qwen2.5:1.5b-instruct-q4_0
|
||||||
ai.bstein.dev/gpu: Jetson MVP lane (titan-21)
|
ai.bstein.dev/gpu: accelerator MVP lane (titan-24)
|
||||||
spec:
|
spec:
|
||||||
runtimeClassName: nvidia
|
runtimeClassName: nvidia
|
||||||
affinity:
|
affinity:
|
||||||
@ -31,7 +31,7 @@ spec:
|
|||||||
- key: kubernetes.io/hostname
|
- key: kubernetes.io/hostname
|
||||||
operator: In
|
operator: In
|
||||||
values:
|
values:
|
||||||
- titan-21
|
- titan-24
|
||||||
volumes:
|
volumes:
|
||||||
- name: models
|
- name: models
|
||||||
emptyDir: {}
|
emptyDir: {}
|
||||||
@ -68,8 +68,8 @@ spec:
|
|||||||
memory: 4Gi
|
memory: 4Gi
|
||||||
nvidia.com/gpu.shared: 1
|
nvidia.com/gpu.shared: 1
|
||||||
limits:
|
limits:
|
||||||
cpu: "3"
|
cpu: "4"
|
||||||
memory: 8Gi
|
memory: 10Gi
|
||||||
nvidia.com/gpu.shared: 1
|
nvidia.com/gpu.shared: 1
|
||||||
containers:
|
containers:
|
||||||
- name: ollama
|
- name: ollama
|
||||||
@ -101,10 +101,10 @@ spec:
|
|||||||
timeoutSeconds: 5
|
timeoutSeconds: 5
|
||||||
resources:
|
resources:
|
||||||
requests:
|
requests:
|
||||||
cpu: "1"
|
cpu: "2"
|
||||||
memory: 8Gi
|
memory: 8Gi
|
||||||
nvidia.com/gpu.shared: 1
|
nvidia.com/gpu.shared: 1
|
||||||
limits:
|
limits:
|
||||||
cpu: "3"
|
cpu: "6"
|
||||||
memory: 10Gi
|
memory: 12Gi
|
||||||
nvidia.com/gpu.shared: 1
|
nvidia.com/gpu.shared: 1
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user