atlasbot: improve fact parsing and fallback answers

2026-01-28 11:02:10 -03:00 · 2026-01-28 11:02:10 -03:00 · aa608fbf0f
commit aa608fbf0f
parent 436e56c5de
2 changed files with 210 additions and 19 deletions
--- a/services/comms/atlasbot-deployment.yaml
+++ b/services/comms/atlasbot-deployment.yaml
@ -16,7 +16,7 @@ spec:
      labels:
        app: atlasbot
      annotations:
-        checksum/atlasbot-configmap: manual-atlasbot-98
+        checksum/atlasbot-configmap: manual-atlasbot-101
        vault.hashicorp.com/agent-inject: "true"
        vault.hashicorp.com/role: "comms"
        vault.hashicorp.com/agent-inject-secret-turn-secret: "kv/data/atlas/comms/turn-shared-secret"
--- a/services/comms/scripts/atlasbot/bot.py
+++ b/services/comms/scripts/atlasbot/bot.py
@ -260,7 +260,24 @@ def normalize_query(text: str) -> str:
 def _tokens(text: str) -> list[str]:
    cleaned = re.sub(r"[\\_/]", " ", text or "")
    toks = [t.lower() for t in TOKEN_RE.findall(cleaned)]
-    return [t for t in toks if t not in STOPWORDS and len(t) >= 2]
+    expanded: list[str] = []
+    synonyms = {
+        "network": "net",
+        "net": "network",
+        "memory": "ram",
+        "ram": "memory",
+        "i/o": "io",
+    }
+    for token in toks:
+        expanded.append(token)
+        if "-" in token:
+            expanded.extend(part for part in token.split("-") if part)
+    for token in list(expanded):
+        if token in synonyms:
+            expanded.append(synonyms[token])
+        if token.endswith("s") and len(token) > 3:
+            expanded.append(token.rstrip("s"))
+    return [t for t in expanded if t not in STOPWORDS and len(t) >= 2]


 def _ensure_confidence(text: str) -> str:
@ -1077,10 +1094,16 @@ def facts_context(
            lines.append(f"- expected_workers_missing: {', '.join(missing)}")

    hottest = metrics.get("hottest_nodes") if isinstance(metrics.get("hottest_nodes"), dict) else {}
+    usage_metrics = metrics.get("node_usage") if isinstance(metrics.get("node_usage"), dict) else {}
    for key in ("cpu", "ram", "net", "io"):
        entry = hottest.get(key) if isinstance(hottest.get(key), dict) else {}
        node = entry.get("node")
        value = entry.get("value")
+        if not node or value is None:
+            usage = usage_metrics.get(key) if isinstance(usage_metrics.get(key), list) else []
+            pick = _node_usage_top(usage, allowed_nodes=None)
+            if pick:
+                node, value = pick
        if node and value is not None:
            value_fmt = _format_metric_value(
                str(value),
@ -3001,6 +3024,7 @@ def _ensure_scores(answer: str) -> str:
    def _record_score(key: str, value: str):
        if not value:
            return
+        value = value.strip().rstrip("%")
        score_map.setdefault(key, value)

    for line in lines:
@ -3010,10 +3034,10 @@ def _ensure_scores(answer: str) -> str:
            "confidence" in lowered and "relevance" in lowered and "satisfaction" in lowered
        ):
            for key in ("confidence", "relevance", "satisfaction"):
-                match = re.search(rf"{key}\\s*[:=]?\\s*(\\d{{1,3}}|high|medium|low)", lowered)
+                match = re.search(rf"{key}\s*[:=]?\s*(\d{{1,3}}|high|medium|low)", lowered)
                if match:
                    _record_score(key, match.group(1))
-            risk_match = re.search(r"hallucination\\s*risk\\s*[:=]?\\s*(low|medium|high)", lowered)
+            risk_match = re.search(r"hallucination\s*risk\s*[:=]?\s*(low|medium|high)", lowered)
            if risk_match:
                _record_score("hallucinationrisk", risk_match.group(1))
            continue
@ -3032,11 +3056,18 @@ def _ensure_scores(answer: str) -> str:
            _record_score("hallucinationrisk", _extract_value(cleaned))
            continue
        cleaned_body = re.sub(
-            r"\\bconfidence\\s*:\\s*(high|medium|low)\\b\\.?\\s*",
+            r"\bconfidence\s*:\s*(high|medium|low)\b\.?\s*",
            "",
            line,
            flags=re.IGNORECASE,
        ).strip()
+        cleaned_body = re.sub(
+            r"\bconfident\s*level\s*:\s*(high|medium|low)\b\.?\s*",
+            "",
+            cleaned_body,
+            flags=re.IGNORECASE,
+        ).strip()
+        cleaned_body = re.sub(r"\bF\d+\b", "", cleaned_body).strip()
        if cleaned_body:
            body_lines.append(cleaned_body)

@ -3860,41 +3891,195 @@ def _has_body_lines(answer: str) -> bool:

 def _fallback_fact_answer(prompt: str, context: str) -> str:
    facts: list[str] = []
+    parsed_facts: list[tuple[str, str | None, str | None]] = []
+    q = normalize_query(prompt)
+    tokens = set(_tokens(prompt))
    for line in (context or "").splitlines():
        trimmed = line.strip()
-        if not trimmed.startswith("F"):
+        if not trimmed:
            continue
-        match = re.match(r"^F\\d+.*?\\]:\\s*(.*)$", trimmed)
+        if trimmed.startswith("F"):
+            match = re.match(r"^F\d+.*?\]:\s*(.*)$", trimmed)
            if not match:
-            match = re.match(r"^F\\d+:\\s*(.*)$", trimmed)
+                match = re.match(r"^F\d+:\s*(.*)$", trimmed)
            if not match:
                continue
            fact = match.group(1).strip()
+        else:
+            if trimmed.lower().startswith("fact pack") or trimmed.lower().startswith("facts"):
+                continue
+            if trimmed.startswith("-"):
+                fact = trimmed.lstrip("-").strip()
+            else:
+                fact = trimmed
        if fact.startswith("-"):
            fact = fact.lstrip("-").strip()
-        if fact:
+        if fact and (":" in fact or "=" in fact):
            facts.append(fact)
+            key_match = re.match(r"^([\w\s/.-]+):\s*(.+)$", fact)
+            if not key_match:
+                key_match = re.match(r"^([\w\s/.-]+)=\s*(.+)$", fact)
+            if key_match:
+                parsed_facts.append((fact, key_match.group(1).strip(), key_match.group(2).strip()))
+            else:
+                parsed_facts.append((fact, None, None))
    if not facts:
        return ""
-    tokens = set(_tokens(prompt))
+
+    def _norm_key(text: str) -> str:
+        return normalize_query(text).replace(" ", "_")
+
+    def _find_value(target: str) -> str | None:
+        for _fact, key, val in parsed_facts:
+            if key and _norm_key(key) == target:
+                return val
+        return None
+
+    def _parse_counts(text: str) -> dict[str, int]:
+        counts: dict[str, int] = {}
+        for part in (text or "").split(","):
+            if "=" not in part:
+                continue
+            k, v = part.split("=", 1)
+            k = k.strip()
+            v = v.strip()
+            if not k or not v:
+                continue
+            try:
+                counts[k] = int(float(v))
+            except ValueError:
+                continue
+        return counts
+
+    def _parse_map(text: str) -> dict[str, str]:
+        mapping: dict[str, str] = {}
+        pattern = re.compile(r"(\w+)\s*=\s*([^=]+?)(?=(?:\s*,\s*\w+\s*=)|$)")
+        for match in pattern.finditer(text or ""):
+            mapping[match.group(1).strip()] = match.group(2).strip().strip(",")
+        return mapping
+
+    list_intent = _is_list_prompt(prompt) or "name" in tokens
+    count_intent = _is_quantitative_prompt(prompt) and ("how many" in q or "count" in tokens or "number" in tokens)
+    hottest_intent = any(word in q for word in ("hottest", "highest", "most", "top", "busiest"))
+    metric = _detect_metric(q)
+    include_hw, _exclude_hw = _detect_hardware_filters(q)
+
+    if hottest_intent and metric in {"cpu", "ram", "net", "io"}:
+        hottest_val = _find_value(f"hottest_{metric}")
+        if hottest_val:
+            return f"Hottest {metric} is {hottest_val}."
+    if hottest_intent and tokens & {"postgres", "database", "db", "connections"}:
+        hottest_db = _find_value("postgres_hottest_db")
+        if hottest_db:
+            return f"Hottest database is {hottest_db}."
+
+    if count_intent and tokens & {"pods", "pod"}:
+        pending = _find_value("pods_pending")
+        failed = _find_value("pods_failed")
+        running = _find_value("pods_running")
+        succeeded = _find_value("pods_succeeded")
+        if "pending" in q and "failed" in q:
+            try:
+                total = float(pending or 0) + float(failed or 0)
+                return f"Pods pending or failed: {total:.0f}."
+            except ValueError:
+                pass
+        if "pending" in q and pending is not None:
+            return f"Pods pending is {pending}."
+        if "failed" in q and failed is not None:
+            return f"Pods failed is {failed}."
+        if "succeeded" in q and succeeded is not None:
+            return f"Pods succeeded is {succeeded}."
+        if "running" in q and running is not None:
+            return f"Pods running is {running}."
+
+    if count_intent and tokens & {"nodes", "node"} and "not ready" in q:
+        nodes_total = _find_value("nodes_total")
+        if nodes_total and "not_ready" in nodes_total:
+            match = re.search(r"not_ready=([0-9.]+)", nodes_total)
+            if match:
+                return f"Not ready nodes: {match.group(1)}."
+
+    if count_intent and include_hw:
+        counts_line = _find_value("nodes_by_hardware_count")
+        if counts_line:
+            counts = _parse_counts(counts_line)
+            for hw in include_hw:
+                if hw in counts:
+                    return f"{hw} nodes: {counts[hw]}."
+        for hw in include_hw:
+            hw_line = _find_value(hw)
+            if hw_line:
+                items = [item.strip() for item in hw_line.split(",") if item.strip()]
+                return f"{hw} nodes: {len(items)}."
+
+    if list_intent and include_hw:
+        if "control" in q:
+            cp_by_hw = _find_value("control_plane_by_hardware")
+            if cp_by_hw:
+                mapping = _parse_map(cp_by_hw)
+                for hw in include_hw:
+                    if hw in mapping:
+                        return f"{hw} control-plane nodes: {mapping[hw]}."
+            cp_nodes = _find_value("control_plane_nodes")
+            if cp_nodes:
+                return f"Control-plane nodes: {cp_nodes}."
+        for hw in include_hw:
+            hw_line = _find_value(hw)
+            if hw_line:
+                return f"{hw} nodes: {hw_line}."
+
+    if list_intent and "control" in q:
+        cp_nodes = _find_value("control_plane_nodes")
+        if cp_nodes:
+            return f"Control-plane nodes: {cp_nodes}."
+
+    preferred = tokens & {
+        "node",
+        "nodes",
+        "pod",
+        "pods",
+        "postgres",
+        "db",
+        "database",
+        "namespace",
+        "workload",
+        "worker",
+        "workers",
+        "cpu",
+        "ram",
+        "memory",
+        "net",
+        "network",
+        "io",
+        "disk",
+        "connection",
+        "connections",
+    }
    best_fact = ""
    best_score = -1
    for fact in facts:
-        key_match = re.match(r"^([A-Za-z0-9_\\-/ ]+):\\s*(.+)$", fact)
+        key_match = re.match(r"^([\w\s/.-]+):\s*(.+)$", fact)
        if not key_match:
-            key_match = re.match(r"^([A-Za-z0-9_\\-/ ]+)=\\s*(.+)$", fact)
+            key_match = re.match(r"^([\w\s/.-]+)=\s*(.+)$", fact)
        key_tokens: set[str] = set()
        if key_match:
            key_tokens = set(_tokens(key_match.group(1)))
        score = len(tokens & set(_tokens(fact))) + 2 * len(tokens & key_tokens)
+        if preferred:
+            score += 3 * len(preferred & key_tokens)
+            if not (preferred & key_tokens):
+                score -= 1
+        if list_intent and key_match and "count" in key_tokens:
+            score -= 3
        if score > best_score:
            best_score = score
            best_fact = fact
    if best_score <= 0:
        return ""
-    key_match = re.match(r"^([A-Za-z0-9_\\-/ ]+):\\s*(.+)$", best_fact)
+    key_match = re.match(r"^([\w\s/.-]+):\s*(.+)$", best_fact)
    if not key_match:
-        key_match = re.match(r"^([A-Za-z0-9_\\-/ ]+)=\\s*(.+)$", best_fact)
+        key_match = re.match(r"^([\w\s/.-]+)=\s*(.+)$", best_fact)
    if key_match:
        key = key_match.group(1).strip().replace("_", " ")
        val = key_match.group(2).strip()
@ -3936,6 +4121,10 @@ def _needs_full_fact_pack(prompt: str) -> bool:
        return True
    if tokens & {"workload", "pods", "namespace", "worker", "workers"}:
        return True
+    if tokens & {"arch", "architecture", "hardware"}:
+        return True
+    if tokens & METRIC_HINT_WORDS:
+        return True
    if _NAME_INDEX and tokens & _NAME_INDEX:
        return True
    if any(phrase in q for phrase in ("where does", "where is", "where are", "running", "run on", "hosted on", "primary node")):
@ -4104,7 +4293,7 @@ def _non_cluster_reply(prompt: str, *, history_lines: list[str], mode: str) -> s
        system_override=system,
        model=model,
    )
-    reply = re.sub(r"\\bconfidence\\s*:\\s*(high|medium|low)\\b\\.?\\s*", "", reply, flags=re.IGNORECASE).strip()
+    reply = re.sub(r"\bconfidence\s*:\s*(high|medium|low)\b\.?\s*", "", reply, flags=re.IGNORECASE).strip()
    return _ensure_scores(reply)


@ -4405,6 +4594,8 @@ def _is_cluster_query(
        return True
    if any(word in q for word in CLUSTER_HINT_WORDS):
        return True
+    if any(word in q for word in METRIC_HINT_WORDS):
+        return True
    for host_match in HOST_RE.finditer(q):
        host = host_match.group(1).lower()
        if host.endswith("bstein.dev"):