openclaw: use gpu-sized triage model
This commit is contained in:
parent
44bfb5a68e
commit
c667c97089
@ -13,10 +13,10 @@ data:
|
||||
"defaults": {
|
||||
"workspace": "/home/node/.openclaw/workspace",
|
||||
"model": {
|
||||
"primary": "ollama-cluster/qwen2.5:1.5b-instruct-q4_0"
|
||||
"primary": "ollama-cluster/qwen2.5:7b-instruct-q4_0"
|
||||
},
|
||||
"models": {
|
||||
"ollama-cluster/qwen2.5:1.5b-instruct-q4_0": {}
|
||||
"ollama-cluster/qwen2.5:7b-instruct-q4_0": {}
|
||||
}
|
||||
},
|
||||
"list": [
|
||||
@ -62,8 +62,8 @@ data:
|
||||
"apiKey": "ollama",
|
||||
"models": [
|
||||
{
|
||||
"id": "qwen2.5:1.5b-instruct-q4_0",
|
||||
"name": "qwen2.5:1.5b-instruct-q4_0 (Titan local)",
|
||||
"id": "qwen2.5:7b-instruct-q4_0",
|
||||
"name": "qwen2.5:7b-instruct-q4_0 (Titan local)",
|
||||
"contextWindow": 32768,
|
||||
"maxTokens": 4096,
|
||||
"input": ["text"],
|
||||
|
||||
@ -19,7 +19,7 @@ spec:
|
||||
labels:
|
||||
app: openclaw-ollama
|
||||
annotations:
|
||||
ai.bstein.dev/model: qwen2.5:1.5b-instruct-q4_0
|
||||
ai.bstein.dev/model: qwen2.5:7b-instruct-q4_0
|
||||
ai.bstein.dev/gpu: accelerator MVP lane (titan-24)
|
||||
spec:
|
||||
runtimeClassName: nvidia
|
||||
@ -45,7 +45,7 @@ spec:
|
||||
- name: OLLAMA_MODELS
|
||||
value: /root/.ollama
|
||||
- name: OLLAMA_MODEL
|
||||
value: qwen2.5:1.5b-instruct-q4_0
|
||||
value: qwen2.5:7b-instruct-q4_0
|
||||
- name: NVIDIA_VISIBLE_DEVICES
|
||||
value: all
|
||||
- name: NVIDIA_DRIVER_CAPABILITIES
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user