atlasbot: add conversation state
parent 0e471ecc37
commit 0476edae6a
@@ -20,6 +20,7 @@ class AnswerRequest(BaseModel):
     content: str | None = None
     mode: str | None = None
     history: list[dict[str, str]] | None = None
+    conversation_id: str | None = None


 class AnswerResponse(BaseModel):
@@ -30,7 +31,7 @@ class Api:
     def __init__(
         self,
         settings: Settings,
-        answer_handler: Callable[[str, str, list[dict[str, str]] | None], Awaitable[AnswerResult]],
+        answer_handler: Callable[[str, str, list[dict[str, str]] | None, str | None], Awaitable[AnswerResult]],
     ) -> None:
         self._settings = settings
         self._answer_handler = answer_handler
@@ -53,7 +54,8 @@ class Api:
         if not question:
             raise HTTPException(status_code=400, detail="missing question")
         mode = (payload.mode or "quick").strip().lower()
-        result = await self._answer_handler(question, mode, payload.history)
+        conversation_id = payload.conversation_id
+        result = await self._answer_handler(question, mode, payload.history, conversation_id)
         log.info(
             "answer",
             extra={
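The request model now carries an optional conversation_id, which the API threads through to the answer handler. A minimal sketch of a client call follows; the URL and route are assumptions, as is the idea that the question travels in the content field — only the field names in AnswerRequest are confirmed by the diff:

# Hypothetical client call; endpoint URL and payload values are invented.
import requests

resp = requests.post(
    "http://localhost:8080/answer",
    json={
        "content": "why is node3 under load?",
        "mode": "quick",
        "conversation_id": "room-42",  # reuse the same id so follow-ups hit stored claims
    },
    timeout=60,
)
print(resp.json())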
@@ -53,6 +53,8 @@ class Settings:

     snapshot_ttl_sec: int
     thinking_interval_sec: int
+    conversation_ttl_sec: int
+    snapshot_pin_enabled: bool

     queue_enabled: bool
     nats_url: str
@@ -141,6 +143,8 @@ def load_settings() -> Settings:
         ariadne_state_token=os.getenv("ARIADNE_STATE_TOKEN", ""),
         snapshot_ttl_sec=_env_int("ATLASBOT_SNAPSHOT_TTL_SEC", "30"),
         thinking_interval_sec=_env_int("ATLASBOT_THINKING_INTERVAL_SEC", "30"),
+        conversation_ttl_sec=_env_int("ATLASBOT_CONVERSATION_TTL_SEC", "900"),
+        snapshot_pin_enabled=_env_bool("ATLASBOT_SNAPSHOT_PIN_ENABLED", "false"),
         queue_enabled=_env_bool("ATLASBOT_QUEUE_ENABLED", "false"),
         nats_url=os.getenv("ATLASBOT_NATS_URL", "nats://nats.nats.svc.cluster.local:4222"),
         nats_stream=os.getenv("ATLASBOT_NATS_STREAM", "atlasbot"),
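Both new settings are read from the environment with the defaults shown above. A quick sketch of overriding them locally, assuming _env_bool accepts "true"/"false" as its string values the way the defaults suggest (load_settings and atlasbot.config are confirmed by the diff):

# Hypothetical local override of the two new knobs; values are illustrative.
import os

from atlasbot.config import load_settings

os.environ["ATLASBOT_CONVERSATION_TTL_SEC"] = "1800"   # keep claim state for 30 minutes
os.environ["ATLASBOT_SNAPSHOT_PIN_ENABLED"] = "true"   # pin each conversation to its first snapshot

settings = load_settings()
assert settings.conversation_ttl_sec == 1800
assert settings.snapshot_pin_enabled is True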
@@ -1,4 +1,5 @@
 import asyncio
+import json
 import logging
 import re
 import time
@@ -9,7 +10,7 @@ from atlasbot.config import Settings
 from atlasbot.knowledge.loader import KnowledgeBase
 from atlasbot.llm.client import LLMClient, build_messages, parse_json
 from atlasbot.llm import prompts
-from atlasbot.snapshot.builder import SnapshotProvider, summary_text
+from atlasbot.snapshot.builder import SnapshotProvider, build_summary, summary_text

 log = logging.getLogger(__name__)

@@ -29,6 +30,29 @@ class AnswerResult:
     meta: dict[str, Any]


+@dataclass
+class EvidenceItem:
+    path: str
+    reason: str
+    value: Any | None = None
+    value_at_claim: Any | None = None
+
+
+@dataclass
+class ClaimItem:
+    id: str
+    claim: str
+    evidence: list[EvidenceItem]
+
+
+@dataclass
+class ConversationState:
+    updated_at: float
+    claims: list[ClaimItem]
+    snapshot_id: str | None = None
+    snapshot: dict[str, Any] | None = None
+
+
 class AnswerEngine:
     def __init__(
         self,
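For orientation, one stored entry in the new per-conversation state might look like this; all values are invented, and the dot path mirrors the example given in CLAIM_MAP_PROMPT below:

# Illustrative ConversationState instance, assuming the dataclasses defined above.
import time

state = ConversationState(
    updated_at=time.monotonic(),
    claims=[
        ClaimItem(
            id="c1",
            claim="node3 carries the highest load",
            evidence=[
                EvidenceItem(
                    path="metrics.node_load[0].node",  # dot path into the snapshot summary
                    reason="top entry of node_load",
                    value="node3",
                    value_at_claim="node3",  # frozen at claim time for later delta checks
                )
            ],
        )
    ],
    snapshot_id="2024-05-01T12:00:00Z",
    snapshot=None,  # only populated when snapshot pinning is enabled
)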
@@ -41,6 +65,7 @@ class AnswerEngine:
         self._llm = llm
         self._kb = kb
         self._snapshot = snapshot
+        self._state: dict[str, ConversationState] = {}

     async def answer(
         self,
@@ -49,6 +74,7 @@ class AnswerEngine:
         mode: str,
         history: list[dict[str, str]] | None = None,
         observer: Callable[[str, str], None] | None = None,
+        conversation_id: str | None = None,
     ) -> AnswerResult:
         question = (question or "").strip()
         if not question:
@@ -56,10 +82,15 @@ class AnswerEngine:
         if mode == "stock":
             return await self._answer_stock(question)

+        state = self._get_state(conversation_id)
         snapshot = self._snapshot.get()
+        snapshot_used = snapshot
+        if self._settings.snapshot_pin_enabled and state and state.snapshot:
+            snapshot_used = state.snapshot
+        summary = build_summary(snapshot_used)
         kb_summary = self._kb.summary()
         runbooks = self._kb.runbook_titles(limit=4)
-        snapshot_ctx = summary_text(snapshot)
+        snapshot_ctx = summary_text(snapshot_used)
         history_ctx = _format_history(history)
         base_context = _join_context([
             kb_summary,
@@ -97,15 +128,30 @@ class AnswerEngine:
             "atlasbot_selection",
             extra={"extra": {"mode": mode, "selected": len(best), "scores": scores.__dict__}},
         )
+        if classify.get("follow_up") and state and state.claims:
+            if observer:
+                observer("followup", "answering follow-up")
+            reply = await self._answer_followup(question, state, summary, classify, mode)
+            meta = {
+                "mode": mode,
+                "follow_up": True,
+                "classify": classify,
+            }
+            return AnswerResult(reply, scores, meta)
+
         if observer:
             observer("synthesize", "synthesizing reply")
         reply = await self._synthesize(question, best, base_context, classify, mode)
+        claims = await self._extract_claims(question, reply, summary)
+        if conversation_id and claims:
+            self._store_state(conversation_id, claims, summary, snapshot_used)
         meta = {
             "mode": mode,
             "angles": angles,
             "scores": scores.__dict__,
             "classify": classify,
             "candidates": len(candidates),
+            "claims": len(claims),
         }
         return AnswerResult(reply, scores, meta)

@@ -121,6 +167,8 @@ class AnswerEngine:
         data = _parse_json_block(raw, fallback={"needs_snapshot": True})
         if "answer_style" not in data:
             data["answer_style"] = "direct"
+        if "follow_up_kind" not in data:
+            data["follow_up_kind"] = "other"
         return data

     async def _angles(self, question: str, classify: dict[str, Any], mode: str) -> list[dict[str, Any]]:
@@ -216,6 +264,114 @@ class AnswerEngine:
         refine_messages = build_messages(prompts.CLUSTER_SYSTEM, refine_prompt, context=context)
         return await self._llm.chat(refine_messages, model=model)

+    async def _extract_claims(
+        self,
+        question: str,
+        reply: str,
+        summary: dict[str, Any],
+    ) -> list[ClaimItem]:
+        if not reply or not summary:
+            return []
+        summary_json = _json_excerpt(summary)
+        prompt = prompts.CLAIM_MAP_PROMPT + "\nQuestion: " + question + "\nAnswer: " + reply
+        messages = build_messages(prompts.CLUSTER_SYSTEM, prompt, context=f"SnapshotSummaryJson:{summary_json}")
+        raw = await self._llm.chat(messages, model=self._settings.ollama_model_fast)
+        data = _parse_json_block(raw, fallback={})
+        claims_raw = data.get("claims") if isinstance(data, dict) else None
+        claims: list[ClaimItem] = []
+        if isinstance(claims_raw, list):
+            for entry in claims_raw:
+                if not isinstance(entry, dict):
+                    continue
+                claim_text = str(entry.get("claim") or "").strip()
+                claim_id = str(entry.get("id") or "").strip() or f"c{len(claims)+1}"
+                evidence_items: list[EvidenceItem] = []
+                for ev in entry.get("evidence") or []:
+                    if not isinstance(ev, dict):
+                        continue
+                    path = str(ev.get("path") or "").strip()
+                    if not path:
+                        continue
+                    reason = str(ev.get("reason") or "").strip()
+                    value = _resolve_path(summary, path)
+                    evidence_items.append(EvidenceItem(path=path, reason=reason, value=value, value_at_claim=value))
+                if claim_text and evidence_items:
+                    claims.append(ClaimItem(id=claim_id, claim=claim_text, evidence=evidence_items))
+        return claims
+
+    async def _answer_followup(
+        self,
+        question: str,
+        state: ConversationState,
+        summary: dict[str, Any],
+        classify: dict[str, Any],
+        mode: str,
+    ) -> str:
+        follow_kind = classify.get("follow_up_kind") if isinstance(classify, dict) else "other"
+        claim_ids = await self._select_claims(question, state.claims)
+        selected = [claim for claim in state.claims if claim.id in claim_ids] if claim_ids else state.claims[:2]
+        evidence_lines = []
+        for claim in selected:
+            evidence_lines.append(f"Claim: {claim.claim}")
+            for ev in claim.evidence:
+                current = _resolve_path(summary, ev.path)
+                ev.value = current
+                delta_note = ""
+                if ev.value_at_claim is not None and current is not None and current != ev.value_at_claim:
+                    delta_note = f" (now {current})"
+                evidence_lines.append(f"- {ev.path}: {ev.value_at_claim}{delta_note} {('- ' + ev.reason) if ev.reason else ''}")
+        evidence_ctx = "\n".join(evidence_lines)
+        prompt = prompts.FOLLOWUP_EVIDENCE_PROMPT
+        if follow_kind in {"next_steps", "change"}:
+            prompt = prompts.FOLLOWUP_ACTION_PROMPT
+        prompt = prompt + "\nFollow-up: " + question + "\nEvidence:\n" + evidence_ctx
+        messages = build_messages(prompts.CLUSTER_SYSTEM, prompt)
+        model = _synthesis_model(self._settings, mode)
+        return await self._llm.chat(messages, model=model)
+
+    async def _select_claims(self, question: str, claims: list[ClaimItem]) -> list[str]:
+        if not claims:
+            return []
+        claims_brief = [{"id": claim.id, "claim": claim.claim} for claim in claims]
+        prompt = prompts.SELECT_CLAIMS_PROMPT + "\nFollow-up: " + question + "\nClaims: " + json.dumps(claims_brief)
+        messages = build_messages(prompts.CLUSTER_SYSTEM, prompt)
+        raw = await self._llm.chat(messages, model=self._settings.ollama_model_fast)
+        data = _parse_json_block(raw, fallback={})
+        ids = data.get("claim_ids") if isinstance(data, dict) else []
+        if isinstance(ids, list):
+            return [str(item) for item in ids if item]
+        return []
+
+    def _get_state(self, conversation_id: str | None) -> ConversationState | None:
+        if not conversation_id:
+            return None
+        self._cleanup_state()
+        return self._state.get(conversation_id)
+
+    def _store_state(
+        self,
+        conversation_id: str,
+        claims: list[ClaimItem],
+        summary: dict[str, Any],
+        snapshot: dict[str, Any] | None,
+    ) -> None:
+        snapshot_id = _snapshot_id(summary)
+        pinned_snapshot = snapshot if self._settings.snapshot_pin_enabled else None
+        self._state[conversation_id] = ConversationState(
+            updated_at=time.monotonic(),
+            claims=claims,
+            snapshot_id=snapshot_id,
+            snapshot=pinned_snapshot,
+        )
+        self._cleanup_state()
+
+    def _cleanup_state(self) -> None:
+        ttl = max(60, self._settings.conversation_ttl_sec)
+        now = time.monotonic()
+        expired = [key for key, state in self._state.items() if now - state.updated_at > ttl]
+        for key in expired:
+            self._state.pop(key, None)
+

 def _join_context(parts: list[str]) -> str:
     text = "\n".join([p for p in parts if p])
@@ -227,12 +383,19 @@ def _format_history(history: list[dict[str, str]] | None) -> str:
         return ""
     lines = ["Recent conversation:"]
     for entry in history[-4:]:
-        question = entry.get("q") if isinstance(entry, dict) else None
-        answer = entry.get("a") if isinstance(entry, dict) else None
+        if not isinstance(entry, dict):
+            continue
+        question = entry.get("q")
+        answer = entry.get("a")
+        role = entry.get("role")
+        content = entry.get("content")
         if question:
             lines.append(f"Q: {question}")
         if answer:
             lines.append(f"A: {answer}")
+        if role and content:
+            prefix = "Q" if role == "user" else "A"
+            lines.append(f"{prefix}: {content}")
     return "\n".join(lines)


@@ -312,3 +475,44 @@ def _coerce_int(value: Any, default: int) -> int:

 def _default_scores() -> AnswerScores:
     return AnswerScores(confidence=60, relevance=60, satisfaction=60, hallucination_risk="medium")
+
+
+def _resolve_path(data: Any, path: str) -> Any | None:
+    cursor = data
+    for part in re.split(r"\.(?![^\[]*\])", path):
+        if not part:
+            continue
+        match = re.match(r"^(\w+)(?:\[(\d+)\])?$", part)
+        if not match:
+            return None
+        key = match.group(1)
+        index = match.group(2)
+        if isinstance(cursor, dict):
+            cursor = cursor.get(key)
+        else:
+            return None
+        if index is not None:
+            try:
+                idx = int(index)
+                if isinstance(cursor, list) and 0 <= idx < len(cursor):
+                    cursor = cursor[idx]
+                else:
+                    return None
+            except ValueError:
+                return None
+    return cursor
+
+
+def _snapshot_id(summary: dict[str, Any]) -> str | None:
+    if not summary:
+        return None
+    for key in ("generated_at", "snapshot_ts", "snapshot_id"):
+        value = summary.get(key)
+        if isinstance(value, str) and value:
+            return value
+    return None
+
+
+def _json_excerpt(summary: dict[str, Any], max_chars: int = 12000) -> str:
+    raw = json.dumps(summary, ensure_ascii=False)
+    return raw[:max_chars]
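_resolve_path walks dot-notation paths with optional bracketed list indexes, the same notation CLAIM_MAP_PROMPT asks the model to emit. A quick illustration against an invented summary dict:

# Invented summary; shows how evidence paths resolve and how misses return None.
summary = {"metrics": {"node_load": [{"node": "node3", "load": 7.2}]}}

assert _resolve_path(summary, "metrics.node_load[0].node") == "node3"
assert _resolve_path(summary, "metrics.node_load[0].load") == 7.2
assert _resolve_path(summary, "metrics.node_load[1].node") is None  # index out of range
assert _resolve_path(summary, "metrics.missing") is None            # absent key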
@@ -16,7 +16,8 @@ CLASSIFY_PROMPT = (
     "needs_snapshot (bool), needs_kb (bool), needs_metrics (bool), "
     "needs_general (bool), intent (short string), ambiguity (0-1), "
     "answer_style (direct|insightful), topic_summary (short string), "
-    "follow_up (bool), question_type (metric|diagnostic|planning|open_ended)."
+    "follow_up (bool), follow_up_kind (evidence|why|clarify|next_steps|change|other), "
+    "question_type (metric|diagnostic|planning|open_ended)."
 )

 ANGLE_PROMPT = (
@@ -54,6 +55,37 @@ REFINE_PROMPT = (
     "Keep it grounded in the context. If you cannot add insight, say so explicitly."
 )
+
+CLAIM_MAP_PROMPT = (
+    "Extract a claim map from the answer. "
+    "Return JSON with fields: claims (list). "
+    "Each claim object: id (short string), claim (short sentence), "
+    "evidence (list of objects with path and reason). "
+    "Paths must point into the provided SnapshotSummary JSON using dot notation, "
+    "with list indexes in brackets, e.g. metrics.node_load[0].node. "
+    "Do not invent evidence; if no evidence exists, omit the claim."
+)
+
+SELECT_CLAIMS_PROMPT = (
+    "Pick which prior claim(s) the follow-up refers to. "
+    "Return JSON with fields: claim_ids (list of ids), follow_up_kind "
+    "(evidence|why|clarify|next_steps|change|other). "
+    "If none apply, return an empty list."
+)
+
+FOLLOWUP_EVIDENCE_PROMPT = (
+    "Answer the follow-up using only the provided claims and evidence. "
+    "Be conversational, not bullet-heavy. "
+    "If evidence does not support a claim, say so plainly. "
+    "Do not add new claims."
+)
+
+FOLLOWUP_ACTION_PROMPT = (
+    "Answer the follow-up using the provided claims and evidence. "
+    "You may suggest next steps or changes, but keep them tightly tied "
+    "to the evidence list. "
+    "Be conversational and concise."
+)
+
 STOCK_SYSTEM = (
     "You are Atlas, a helpful assistant. "
     "Be concise and truthful. "
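For context, CLAIM_MAP_PROMPT is written to elicit JSON of the shape below, which _extract_claims then validates entry by entry, keeping only claims that carry at least one evidence path (example values invented):

# Invented example of a well-formed claim-map response; only the field names
# (claims, id, claim, evidence, path, reason) come from the prompt itself.
claim_map = {
    "claims": [
        {
            "id": "c1",
            "claim": "node3 carries the highest load",
            "evidence": [
                {"path": "metrics.node_load[0].node", "reason": "top entry of node_load"}
            ],
        }
    ]
}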
@@ -31,22 +31,24 @@ async def main() -> None:

     async def handler(payload: dict[str, object]) -> dict[str, object]:
         history = payload.get("history") if isinstance(payload, dict) else None
+        conversation_id = payload.get("conversation_id") if isinstance(payload, dict) else None
         result = await engine.answer(
             str(payload.get("question", "") or ""),
             mode=str(payload.get("mode", "quick") or "quick"),
             history=history if isinstance(history, list) else None,
+            conversation_id=str(conversation_id) if isinstance(conversation_id, str) else None,
         )
         return {"reply": result.reply, "scores": result.scores.__dict__}

     queue = QueueManager(settings, handler)
     await queue.start()

-    async def answer_handler(question: str, mode: str, history=None, observer=None) -> AnswerResult:
+    async def answer_handler(question: str, mode: str, history=None, conversation_id=None, observer=None) -> AnswerResult:
         if settings.queue_enabled:
-            payload = await queue.submit({"question": question, "mode": mode, "history": history or []})
+            payload = await queue.submit({"question": question, "mode": mode, "history": history or [], "conversation_id": conversation_id})
             reply = payload.get("reply", "") if isinstance(payload, dict) else ""
             return AnswerResult(reply=reply or "", scores=result_scores(payload), meta={"mode": mode})
-        return await engine.answer(question, mode=mode, history=history, observer=observer)
+        return await engine.answer(question, mode=mode, history=history, observer=observer, conversation_id=conversation_id)

     api = Api(settings, answer_handler)
     server = uvicorn.Server(uvicorn.Config(api.app, host="0.0.0.0", port=settings.http_port, log_level="info"))
@@ -80,7 +80,10 @@ class MatrixBot:
         settings: Settings,
         bot: MatrixBotConfig,
         engine: AnswerEngine,
-        answer_handler: Callable[[str, str, list[dict[str, str]] | None, Callable[[str, str], None] | None], Awaitable[AnswerResult]]
+        answer_handler: Callable[
+            [str, str, list[dict[str, str]] | None, str | None, Callable[[str, str], None] | None],
+            Awaitable[AnswerResult],
+        ]
         | None = None,
     ) -> None:
         self._settings = settings
@@ -155,9 +158,11 @@ class MatrixBot:
         task = asyncio.create_task(heartbeat())
         started = time.monotonic()
         try:
-            handler = self._answer_handler or (lambda q, m, h, obs: self._engine.answer(q, mode=m, history=h, observer=obs))
+            handler = self._answer_handler or (
+                lambda q, m, h, cid, obs: self._engine.answer(q, mode=m, history=h, observer=obs, conversation_id=cid)
+            )
             history = self._history.get(room_id, [])
-            result = await handler(question, mode, history, observer)
+            result = await handler(question, mode, history, room_id, observer)
             elapsed = time.monotonic() - started
             await self._client.send_message(token, room_id, result.reply)
             log.info(
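Design note: the Matrix path passes room_id as the conversation id, so claim state is shared by everyone in a room and expires on the same ATLASBOT_CONVERSATION_TTL_SEC clock as API conversations.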