atlasbot: reinforce metric facts

This commit is contained in:
Brad Stein 2026-02-01 11:47:21 -03:00
parent 889e814b59
commit bb51321404
2 changed files with 98 additions and 0 deletions

View File

@ -117,6 +117,7 @@ class AnswerEngine:
"route", "route",
"decompose", "decompose",
"chunk_score", "chunk_score",
"fact_select",
"synth", "synth",
"subanswer", "subanswer",
"tool", "tool",
@ -261,6 +262,11 @@ class AnswerEngine:
selected = _select_chunks(chunks, scored, plan, keyword_tokens) selected = _select_chunks(chunks, scored, plan, keyword_tokens)
key_facts = _key_fact_lines(summary_lines, keyword_tokens) key_facts = _key_fact_lines(summary_lines, keyword_tokens)
metric_facts = [line for line in key_facts if re.search(r"\d", line)] metric_facts = [line for line in key_facts if re.search(r"\d", line)]
if classify.get("question_type") in {"metric", "diagnostic"} and not metric_facts:
metric_candidates = _metric_candidate_lines(summary_lines, keyword_tokens)
metric_facts = await _select_metric_facts(call_llm, normalized, metric_candidates, plan)
if metric_facts:
key_facts = _merge_fact_lines(metric_facts, key_facts)
if self._settings.debug_pipeline: if self._settings.debug_pipeline:
scored_preview = sorted( scored_preview = sorted(
[{"id": c["id"], "score": scored.get(c["id"], 0.0), "summary": c["summary"]} for c in chunks], [{"id": c["id"], "score": scored.get(c["id"], 0.0), "summary": c["summary"]} for c in chunks],
@ -394,6 +400,7 @@ class AnswerEngine:
model=plan.model, model=plan.model,
tag="runbook_enforce", tag="runbook_enforce",
) )
reply = _strip_unknown_entities(reply, unknown_nodes, unknown_namespaces)
if _needs_focus_fix(normalized, reply, classify): if _needs_focus_fix(normalized, reply, classify):
if observer: if observer:
@ -960,6 +967,64 @@ def _key_fact_lines(lines: list[str], keywords: list[str] | None, limit: int = 6
return matches return matches
def _merge_fact_lines(primary: list[str], fallback: list[str]) -> list[str]:
seen = set()
merged: list[str] = []
for line in primary + fallback:
if line in seen:
continue
seen.add(line)
merged.append(line)
return merged
def _metric_candidate_lines(lines: list[str], keywords: list[str] | None, limit: int = 40) -> list[str]:
if not lines:
return []
lowered = [kw.lower() for kw in (keywords or []) if kw]
candidates: list[str] = []
for line in lines:
line_lower = line.lower()
if lowered and any(kw in line_lower for kw in lowered):
candidates.append(line)
elif re.search(r"\d", line):
candidates.append(line)
if len(candidates) >= limit:
break
return candidates
async def _select_metric_facts(
    call_llm: Callable[..., Any],
    question: str,
    candidates: list[str],
    plan: ModePlan,
    max_lines: int = 2,
) -> list[str]:
    """Ask the fast model to pick up to *max_lines* candidate fact lines.

    Builds a bullet list of candidates, issues a fact_select call, and keeps
    only returned strings that exactly match a candidate, de-duplicated and
    capped at *max_lines*. Returns [] on empty input or malformed output.
    """
    if not candidates:
        return []
    bullet_list = "\n".join(f"- {line}" for line in candidates)
    prompt = (
        prompts.FACT_SELECT_PROMPT.format(max_lines=max_lines)
        + "\nQuestion: "
        + question
        + "\nCandidates:\n"
        + bullet_list
    )
    raw = await call_llm(prompts.FACT_SELECT_SYSTEM, prompt, model=plan.fast_model, tag="fact_select")
    parsed = _parse_json_block(raw, fallback={})
    proposed = parsed.get("lines") if isinstance(parsed, dict) else None
    if not isinstance(proposed, list):
        return []
    # Only accept verbatim candidate lines so the model cannot inject new facts.
    permitted = set(candidates)
    chosen: list[str] = []
    for entry in proposed:
        if not isinstance(entry, str) or entry not in permitted or entry in chosen:
            continue
        chosen.append(entry)
        if len(chosen) >= max_lines:
            break
    return chosen
def _metric_fact_guard(reply: str, metric_facts: list[str], keywords: list[str]) -> str: def _metric_fact_guard(reply: str, metric_facts: list[str], keywords: list[str]) -> str:
if not metric_facts: if not metric_facts:
return reply return reply
@ -978,6 +1043,28 @@ def _metric_fact_guard(reply: str, metric_facts: list[str], keywords: list[str])
return reply return reply
def _strip_unknown_entities(reply: str, unknown_nodes: list[str], unknown_namespaces: list[str]) -> str:
if not reply:
return reply
if not unknown_nodes and not unknown_namespaces:
return reply
sentences = [s.strip() for s in re.split(r"(?<=[.!?])\\s+", reply) if s.strip()]
if not sentences:
return reply
lowered_nodes = [node.lower() for node in unknown_nodes]
lowered_namespaces = [ns.lower() for ns in unknown_namespaces]
kept: list[str] = []
for sent in sentences:
lower = sent.lower()
if lowered_nodes and any(node in lower for node in lowered_nodes):
continue
if lowered_namespaces and any(f"namespace {ns}" in lower for ns in lowered_namespaces):
continue
kept.append(sent)
cleaned = " ".join(kept).strip()
return cleaned or reply
def _lexicon_context(summary: dict[str, Any]) -> str: def _lexicon_context(summary: dict[str, Any]) -> str:
if not isinstance(summary, dict): if not isinstance(summary, dict):
return "" return ""

View File

@ -207,6 +207,17 @@ DEDUP_PROMPT = (
"Return only the cleaned answer." "Return only the cleaned answer."
) )
# System prompt for the "fact_select" LLM call: extends the shared cluster
# persona (CLUSTER_SYSTEM) with an instruction to pick question-relevant fact
# lines and to answer with JSON only.
FACT_SELECT_SYSTEM = (
    CLUSTER_SYSTEM
    + " Select the most relevant fact lines for the question. "
    + "Return JSON only."
)
# User prompt template for fact selection. `{max_lines}` is filled via
# str.format by the caller; the model must answer with a JSON object of the
# form {"lines": [...]} drawn verbatim from the supplied candidates.
FACT_SELECT_PROMPT = (
    "Pick up to {max_lines} lines from Candidates that best answer the question. "
    "Return JSON with field: lines (list of strings). If none apply, return {\"lines\": []}."
)
SELECT_CLAIMS_PROMPT = ( SELECT_CLAIMS_PROMPT = (
"Select relevant claim ids for the follow-up. " "Select relevant claim ids for the follow-up. "
"Return JSON with field: claim_ids (list)." "Return JSON with field: claim_ids (list)."