openclaw: use gpu-sized triage model

2026-05-19 20:28:26 -03:00 · 2026-05-19 20:28:26 -03:00 · c667c97089
commit c667c97089
parent 44bfb5a68e
2 changed files with 6 additions and 6 deletions
--- a/services/openclaw/configmap.yaml
+++ b/services/openclaw/configmap.yaml
@@ -13,10 +13,10 @@ data:
        "defaults": {
          "workspace": "/home/node/.openclaw/workspace",
          "model": {
-            "primary": "ollama-cluster/qwen2.5:1.5b-instruct-q4_0"
+            "primary": "ollama-cluster/qwen2.5:7b-instruct-q4_0"
          },
          "models": {
-            "ollama-cluster/qwen2.5:1.5b-instruct-q4_0": {}
+            "ollama-cluster/qwen2.5:7b-instruct-q4_0": {}
          }
        },
        "list": [
@@ -62,8 +62,8 @@ data:
            "apiKey": "ollama",
            "models": [
              {
-                "id": "qwen2.5:1.5b-instruct-q4_0",
-                "name": "qwen2.5:1.5b-instruct-q4_0 (Titan local)",
+                "id": "qwen2.5:7b-instruct-q4_0",
+                "name": "qwen2.5:7b-instruct-q4_0 (Titan local)",
                "contextWindow": 32768,
                "maxTokens": 4096,
                "input": ["text"],
--- a/services/openclaw/ollama-deployment.yaml
+++ b/services/openclaw/ollama-deployment.yaml
@@ -19,7 +19,7 @@ spec:
      labels:
        app: openclaw-ollama
      annotations:
-        ai.bstein.dev/model: qwen2.5:1.5b-instruct-q4_0
+        ai.bstein.dev/model: qwen2.5:7b-instruct-q4_0
        ai.bstein.dev/gpu: accelerator MVP lane (titan-24)
    spec:
      runtimeClassName: nvidia
@@ -45,7 +45,7 @@ spec:
            - name: OLLAMA_MODELS
              value: /root/.ollama
            - name: OLLAMA_MODEL
-              value: qwen2.5:1.5b-instruct-q4_0
+              value: qwen2.5:7b-instruct-q4_0
            - name: NVIDIA_VISIBLE_DEVICES
              value: all
            - name: NVIDIA_DRIVER_CAPABILITIES