Source code for sqldbagent.dashboard.service

"""Dashboard chat service built on top of the persisted LangGraph agent."""

from __future__ import annotations

import asyncio
from collections.abc import Callable, Iterator
from contextlib import contextmanager, nullcontext
from datetime import UTC, datetime
from pathlib import Path
from typing import Any
from uuid import uuid4

import orjson

from sqldbagent.adapters.langgraph.agent import create_sqldbagent_agent
from sqldbagent.adapters.langgraph.checkpoint import (
    create_memory_checkpointer,
    create_sync_postgres_checkpointer,
)
from sqldbagent.adapters.langgraph.memory import remember_database_context
from sqldbagent.adapters.langgraph.model import create_runtime_chat_model
from sqldbagent.adapters.langgraph.observability import (
    build_langsmith_metadata,
    is_langsmith_tracing_enabled,
    langsmith_tracing_context,
)
from sqldbagent.adapters.langgraph.store import (
    create_memory_store,
    create_sync_postgres_store,
)
from sqldbagent.core.bootstrap import build_service_container
from sqldbagent.core.config import AppSettings, load_settings
from sqldbagent.core.enums import Dialect
from sqldbagent.core.models.query import QueryExecutionResult
from sqldbagent.dashboard.models import (
    ChatMessageModel,
    ChatSessionModel,
    DashboardThreadEntryModel,
    DashboardTurnProgressModel,
)
from sqldbagent.diagrams.models import DiagramBundleModel
from sqldbagent.prompts.exploration import PromptExplorationService
from sqldbagent.prompts.models import PromptBundleModel
from sqldbagent.retrieval.models import RetrievalIndexManifestModel
from sqldbagent.snapshot.models import SnapshotBundleModel
from sqldbagent.snapshot.service import SnapshotService

_MAX_EXAMPLE_QUESTIONS = 5



[docs]
class DashboardChatService:
    """Run persisted chat turns over the shared sqldbagent agent stack."""


[docs]
    def __init__(
        self,
        *,
        settings: AppSettings | None = None,
        model: Any | None = None,
        checkpointer: Any | None = None,
        store: Any | None = None,
    ) -> None:
        """Initialize the dashboard chat service.

        Args:
            settings: Optional application settings.
            model: Optional prebuilt LangChain-compatible model for tests.
            checkpointer: Optional externally managed checkpointer for tests.
            store: Optional externally managed long-term memory store for tests
                or dashboard-session reuse.
        """

        self._settings = settings or load_settings()
        self._model = model
        self._checkpointer = checkpointer
        self._store = store



[docs]
    @staticmethod
    def new_thread_id() -> str:
        """Return a new stable thread identifier."""

        return uuid4().hex



[docs]
    def run_turn(
        self,
        *,
        thread_id: str,
        user_message: str,
        datasource_name: str,
        schema_name: str | None = None,
        progress_callback: Callable[[DashboardTurnProgressModel], None] | None = None,
    ) -> ChatSessionModel:
        """Run one user turn through the persisted agent session.

        Args:
            thread_id: LangGraph thread identifier.
            user_message: User message content.
            datasource_name: Datasource identifier.
            schema_name: Optional schema focus.
            progress_callback: Optional callback used to surface progress events
                while the agent turn is running.

        Returns:
            ChatSessionModel: Dashboard-ready state after the turn.
        """

        resolved_datasource = self._settings.resolve_datasource_name(datasource_name)
        config = {"configurable": {"thread_id": thread_id}}
        self._emit_progress(
            progress_callback,
            phase="bootstrap",
            label="Loading persisted agent context.",
            detail=(
                f"Datasource `{resolved_datasource}`"
                + (
                    f" schema `{schema_name}`."
                    if schema_name is not None
                    else " across visible schemas."
                )
            ),
        )
        with self._agent_session(
            datasource_name=resolved_datasource,
            schema_name=schema_name,
        ) as agent:
            with langsmith_tracing_context(
                settings=self._settings,
                tags=["dashboard", resolved_datasource],
                metadata=build_langsmith_metadata(
                    surface="dashboard",
                    datasource_name=resolved_datasource,
                    schema_name=schema_name,
                    thread_id=thread_id,
                    operation="run_turn",
                ),
            ):
                try:
                    for update in agent.stream(
                        {"messages": [{"role": "user", "content": user_message}]},
                        config=config,
                        stream_mode="updates",
                    ):
                        for event in self._progress_events_from_update(update):
                            self._emit_progress(progress_callback, event=event)
                except Exception as exc:
                    self._emit_progress(
                        progress_callback,
                        phase="error",
                        label="Agent turn failed.",
                        detail=str(exc),
                    )
                    raise
                state = agent.get_state(config)
                result = getattr(state, "values", {}) or {}
            session = self._session_from_values(
                thread_id=thread_id,
                datasource_name=resolved_datasource,
                schema_name=schema_name,
                values=result,
                diagram_bundle=self._load_or_create_diagram_bundle(
                    datasource_name=resolved_datasource,
                    schema_name=schema_name,
                    values=result,
                ),
                prompt_bundle=self._load_or_create_prompt_bundle(
                    datasource_name=resolved_datasource,
                    schema_name=schema_name,
                    values=result,
                ),
            )
            self._upsert_thread_entry(session)
            self._emit_progress(
                progress_callback,
                phase="complete",
                label="Agent turn complete.",
                detail=(
                    session.latest_snapshot_summary
                    or f"Rendered {len(session.messages)} transcript messages."
                ),
            )
            return session.model_copy(
                update={
                    "available_threads": self.list_threads(
                        datasource_name=resolved_datasource,
                        schema_name=schema_name,
                    )
                }
            )



[docs]
    def load_thread(
        self,
        *,
        thread_id: str,
        datasource_name: str,
        schema_name: str | None = None,
    ) -> ChatSessionModel:
        """Load the current persisted state for one thread.

        Args:
            thread_id: LangGraph thread identifier.
            datasource_name: Datasource identifier.
            schema_name: Optional schema focus.

        Returns:
            ChatSessionModel: Dashboard-ready state snapshot for the thread.
        """

        resolved_datasource = self._settings.resolve_datasource_name(datasource_name)
        config = {"configurable": {"thread_id": thread_id}}
        with self._agent_session(
            datasource_name=resolved_datasource,
            schema_name=schema_name,
        ) as agent:
            try:
                state = agent.get_state(config)
            except Exception:  # noqa: BLE001
                return ChatSessionModel(
                    thread_id=thread_id,
                    datasource_name=resolved_datasource,
                    schema_name=schema_name,
                    available_threads=self.list_threads(
                        datasource_name=resolved_datasource,
                        schema_name=schema_name,
                    ),
                )
            session = self._session_from_values(
                thread_id=thread_id,
                datasource_name=resolved_datasource,
                schema_name=schema_name,
                values=getattr(state, "values", {}) or {},
                diagram_bundle=self._load_or_create_diagram_bundle(
                    datasource_name=resolved_datasource,
                    schema_name=schema_name,
                    values=getattr(state, "values", {}) or {},
                ),
                prompt_bundle=self._load_or_create_prompt_bundle(
                    datasource_name=resolved_datasource,
                    schema_name=schema_name,
                    values=getattr(state, "values", {}) or {},
                ),
            )
            if session.messages or session.latest_snapshot_id:
                self._upsert_thread_entry(session)
            return session.model_copy(
                update={
                    "available_threads": self.list_threads(
                        datasource_name=resolved_datasource,
                        schema_name=schema_name,
                    )
                }
            )



[docs]
    def list_threads(
        self,
        *,
        datasource_name: str | None = None,
        schema_name: str | None = None,
    ) -> list[DashboardThreadEntryModel]:
        """List persisted dashboard thread summaries.

        Args:
            datasource_name: Optional datasource filter.
            schema_name: Optional schema filter.

        Returns:
            list[DashboardThreadEntryModel]: Matching thread summaries ordered by
            most recently updated first.
        """

        entries = self._read_thread_entries()
        filtered = [
            entry
            for entry in entries
            if (datasource_name is None or entry.datasource_name == datasource_name)
            and (schema_name is None or entry.schema_name == schema_name)
        ]
        return sorted(filtered, key=lambda entry: entry.updated_at, reverse=True)



[docs]
    def update_thread_display_name(
        self,
        *,
        thread_id: str,
        datasource_name: str,
        schema_name: str | None,
        display_name: str | None,
    ) -> DashboardThreadEntryModel | None:
        """Persist an optional user-friendly display name for one thread."""

        normalized_name = None if display_name is None else display_name.strip() or None
        entries = self._read_thread_entries()
        for index, entry in enumerate(entries):
            if (
                entry.thread_id == thread_id
                and entry.datasource_name == datasource_name
                and entry.schema_name == schema_name
            ):
                updated = entry.model_copy(
                    update={
                        "display_name": normalized_name,
                        "updated_at": datetime.now(UTC),
                    }
                )
                entries[index] = updated
                self._write_thread_entries(entries)
                return updated
        return None



[docs]
    def supports_async_queries(self, *, datasource_name: str) -> bool:
        """Return whether the datasource has a supported async query path."""

        datasource = self._settings.get_datasource(datasource_name)
        url = datasource.url
        return any(
            [
                url.startswith("sqlite+pysqlite://"),
                url.startswith("mssql+pyodbc://"),
                url.startswith("postgresql+psycopg://"),
            ]
        )



[docs]
    def run_safe_query(
        self,
        *,
        datasource_name: str,
        sql: str,
        max_rows: int | None = None,
        mode: str = "sync",
        access_mode: str = "read_only",
    ) -> QueryExecutionResult:
        """Run one guarded query through the shared query service.

        Args:
            datasource_name: Datasource identifier.
            sql: SQL text to lint, guard, and execute.
            max_rows: Optional row-limit override.
            mode: Execution mode, either `sync` or `async`.
            access_mode: Requested execution mode, either `read_only` or `writable`.

        Returns:
            QueryExecutionResult: Guard and execution result.
        """

        resolved_datasource = self._settings.resolve_datasource_name(datasource_name)
        if mode == "async":
            return asyncio.run(
                self._run_safe_query_async(
                    datasource_name=resolved_datasource,
                    sql=sql,
                    max_rows=max_rows,
                    access_mode=access_mode,
                )
            )

        container = build_service_container(
            resolved_datasource,
            settings=self._settings,
        )
        try:
            return container.query_service.run(
                sql,
                max_rows=max_rows,
                access_mode=access_mode,
            )
        finally:
            container.close()


    async def _run_safe_query_async(
        self,
        *,
        datasource_name: str,
        sql: str,
        max_rows: int | None = None,
        access_mode: str,
    ) -> QueryExecutionResult:
        """Run the async guarded query path inside an event loop."""

        container = build_service_container(
            datasource_name,
            settings=self._settings,
            include_async_engine=True,
        )
        try:
            return await container.query_service.run_async(
                sql,
                max_rows=max_rows,
                access_mode=access_mode,
            )
        finally:
            await container.aclose()


[docs]
    def render_prompt_markdown(self, bundle: PromptBundleModel) -> str:
        """Render one stored prompt bundle as Markdown for dashboard downloads.

        Args:
            bundle: Prompt bundle to render.

        Returns:
            str: Human-readable Markdown prompt artifact.
        """

        container = build_service_container(
            bundle.datasource_name,
            settings=self._settings,
        )
        try:
            prompt_service = container.prompt_service
            if prompt_service is None:
                return bundle.model_dump_json(indent=2)
            return prompt_service.render_markdown(bundle)
        finally:
            container.close()



[docs]
    def update_prompt_bundle_enhancement(
        self,
        *,
        datasource_name: str,
        schema_name: str,
        active: bool,
        user_context: str | None,
        business_rules: str | None,
        additional_effective_context: str | None,
        answer_style: str | None,
        refresh_generated: bool = False,
    ) -> PromptBundleModel | None:
        """Update prompt-enhancement state and regenerate the prompt bundle.

        Args:
            datasource_name: Datasource identifier.
            schema_name: Schema name.
            active: Whether the enhancement should be active.
            user_context: Freeform user context or domain notes.
            business_rules: Business rules and caveats.
            additional_effective_context: Extra instructions that should be
                injected directly into the effective prompt.
            answer_style: Preferred answer style for downstream outputs.
            refresh_generated: Whether DB-aware guidance should be regenerated.

        Returns:
            PromptBundleModel | None: Updated prompt bundle or `None` when no
            snapshot exists yet for the schema.
        """

        resolved_datasource = self._settings.resolve_datasource_name(datasource_name)
        snapshot = self._resolve_session_snapshot(
            datasource_name=resolved_datasource,
            schema_name=schema_name,
            values={},
        )
        if snapshot is None:
            return None
        container = build_service_container(
            resolved_datasource, settings=self._settings
        )
        try:
            prompt_service = container.prompt_service
            if prompt_service is None:
                return None
            enhancement = prompt_service.update_prompt_enhancement(
                snapshot,
                active=active,
                user_context=user_context,
                business_rules=business_rules,
                additional_effective_context=additional_effective_context,
                answer_style=answer_style,
                refresh_generated=refresh_generated,
            )
            bundle = prompt_service.create_prompt_bundle(
                snapshot,
                enhancement=enhancement,
            )
            prompt_service.save_prompt_bundle(bundle)
            return bundle
        finally:
            container.close()



[docs]
    def refresh_prompt_bundle_context(
        self,
        *,
        datasource_name: str,
        schema_name: str,
    ) -> PromptBundleModel | None:
        """Regenerate schema-aware prompt context from the latest stored snapshot.

        Args:
            datasource_name: Datasource identifier.
            schema_name: Schema name.

        Returns:
            PromptBundleModel | None: Refreshed prompt bundle, or `None` when no
            stored snapshot exists for the schema.
        """

        resolved_datasource = self._settings.resolve_datasource_name(datasource_name)
        snapshot = self._resolve_session_snapshot(
            datasource_name=resolved_datasource,
            schema_name=schema_name,
            values={},
        )
        if snapshot is None:
            return None
        container = build_service_container(
            resolved_datasource,
            settings=self._settings,
        )
        try:
            prompt_service = container.prompt_service
            if prompt_service is None:
                return None
            enhancement = prompt_service.load_or_create_enhancement(
                snapshot,
                refresh_generated=True,
            )
            bundle = prompt_service.create_prompt_bundle(
                snapshot,
                enhancement=enhancement,
            )
            prompt_service.save_prompt_bundle(bundle)
            return bundle
        finally:
            container.close()



[docs]
    def explore_prompt_bundle_context(
        self,
        *,
        datasource_name: str,
        schema_name: str,
        table_names: list[str] | None = None,
        max_tables: int = 4,
        unique_value_limit: int = 8,
        sync_memory: bool = True,
        create_snapshot_if_missing: bool = True,
    ) -> PromptBundleModel | None:
        """Generate live prompt context and persist it into the prompt bundle.

        Args:
            datasource_name: Datasource identifier.
            schema_name: Schema name.
            table_names: Optional explicit focus tables.
            max_tables: Maximum number of tables to explore live.
            unique_value_limit: Maximum number of distinct values per column.
            sync_memory: Whether to sync a concise summary into long-term memory.
            create_snapshot_if_missing: Whether to bootstrap a new snapshot first.

        Returns:
            PromptBundleModel | None: Updated prompt bundle, or `None` when no
            stored snapshot exists for the schema.
        """

        resolved_datasource = self._settings.resolve_datasource_name(datasource_name)
        container = build_service_container(
            resolved_datasource,
            settings=self._settings,
        )
        try:
            if container.prompt_service is None or container.profiler is None:
                return None
            snapshot = self._resolve_session_snapshot(
                datasource_name=resolved_datasource,
                schema_name=schema_name,
                values={},
            )
            if snapshot is None:
                if not create_snapshot_if_missing or container.snapshotter is None:
                    return None
                snapshot = container.snapshotter.create_schema_snapshot(
                    schema_name=schema_name,
                    sample_size=self._settings.profiling.default_sample_size,
                )
                container.snapshotter.save_snapshot(snapshot)
            exploration = PromptExplorationService().create_exploration(
                snapshot,
                profiler=container.profiler,
                table_names=table_names,
                max_tables=max_tables,
                unique_value_limit=unique_value_limit,
            )
            enhancement = container.prompt_service.save_prompt_exploration(
                snapshot,
                exploration=exploration,
            )
            if sync_memory:
                with self._resolved_store() as store:
                    remember_database_context(
                        store,
                        settings=self._settings,
                        datasource_name=resolved_datasource,
                        schema_name=schema_name,
                        notes=[exploration.summary or "Saved live prompt exploration."],
                        preferred_tables=exploration.focus_tables,
                        merge=True,
                    )
            bundle = container.prompt_service.create_prompt_bundle(
                snapshot,
                enhancement=enhancement,
            )
            container.prompt_service.save_prompt_bundle(bundle)
            return bundle
        finally:
            container.close()



[docs]
    def ensure_retrieval_index(
        self,
        *,
        datasource_name: str,
        schema_name: str,
        recreate_collection: bool = False,
    ) -> RetrievalIndexManifestModel | None:
        """Ensure a retrieval index exists for the latest stored schema snapshot.

        Args:
            datasource_name: Datasource identifier.
            schema_name: Schema name.
            recreate_collection: Whether to rebuild the vector collection.

        Returns:
            RetrievalIndexManifestModel | None: Saved retrieval manifest, or
            `None` when no stored snapshot exists for the schema.
        """

        resolved_datasource = self._settings.resolve_datasource_name(datasource_name)
        snapshot = self._resolve_session_snapshot(
            datasource_name=resolved_datasource,
            schema_name=schema_name,
            values={},
        )
        if snapshot is None:
            return None
        container = build_service_container(
            resolved_datasource,
            settings=self._settings,
        )
        try:
            retrieval_service = container.retrieval_service
            if retrieval_service is None:
                return None
            return retrieval_service.index_snapshot_bundle(
                snapshot,
                recreate_collection=recreate_collection,
            )
        finally:
            container.close()


    @contextmanager
    def _agent_session(
        self,
        *,
        datasource_name: str,
        schema_name: str | None,
    ) -> Iterator[Any]:
        """Build a short-lived agent session over shared repo services."""

        container = build_service_container(datasource_name, settings=self._settings)
        try:
            model = self._model or create_runtime_chat_model(self._settings)
            if self._checkpointer is not None:
                with nullcontext(self._checkpointer) as checkpointer:
                    with self._resolved_store() as store:
                        yield create_sqldbagent_agent(
                            services=container,
                            model=model,
                            datasource_name=datasource_name,
                            settings=self._settings,
                            schema_name=schema_name,
                            checkpointer=checkpointer,
                            store=store,
                        )
                return

            if (
                self._settings.agent.checkpoint.backend == "postgres"
                and self._settings.agent.checkpoint.postgres_url is not None
            ):
                with create_sync_postgres_checkpointer(
                    settings=self._settings
                ) as checkpointer:
                    with self._resolved_store() as store:
                        yield create_sqldbagent_agent(
                            services=container,
                            model=model,
                            datasource_name=datasource_name,
                            settings=self._settings,
                            schema_name=schema_name,
                            checkpointer=checkpointer,
                            store=store,
                        )
                return

            with self._resolved_store() as store:
                yield create_sqldbagent_agent(
                    services=container,
                    model=model,
                    datasource_name=datasource_name,
                    settings=self._settings,
                    schema_name=schema_name,
                    checkpointer=create_memory_checkpointer(),
                    store=store,
                )
        finally:
            container.close()

    def _session_from_values(
        self,
        *,
        thread_id: str,
        datasource_name: str,
        schema_name: str | None,
        values: dict[str, Any],
        diagram_bundle: DiagramBundleModel | None = None,
        prompt_bundle: PromptBundleModel | None = None,
    ) -> ChatSessionModel:
        """Build a dashboard chat session snapshot from agent state values."""

        snapshot = self._resolve_session_snapshot(
            datasource_name=datasource_name,
            schema_name=schema_name,
            values=values,
        )
        latest_snapshot_id = values.get("latest_snapshot_id")
        latest_snapshot_summary = values.get("latest_snapshot_summary")
        if snapshot is not None:
            if latest_snapshot_id is None:
                latest_snapshot_id = snapshot.snapshot_id
            if latest_snapshot_summary is None:
                latest_snapshot_summary = snapshot.summary
        return ChatSessionModel(
            thread_id=thread_id,
            datasource_name=datasource_name,
            schema_name=schema_name,
            messages=self._render_messages(values.get("messages", [])),
            dashboard_payload=dict(values.get("dashboard_payload") or {}),
            observability=self._build_observability_payload(
                datasource_name=datasource_name
            ),
            latest_snapshot_id=latest_snapshot_id,
            latest_snapshot_summary=latest_snapshot_summary,
            tool_call_digest=list(values.get("tool_call_digest") or []),
            diagram_bundle=diagram_bundle,
            prompt_bundle=prompt_bundle,
            retrieval_manifest=self._load_retrieval_manifest(
                datasource_name=datasource_name,
                schema_name=schema_name,
                values=values,
            ),
            example_questions=self._build_example_questions(
                snapshot=snapshot,
                schema_name=schema_name,
            ),
        )

    def _build_observability_payload(
        self,
        *,
        datasource_name: str,
    ) -> dict[str, object]:
        """Build UI-friendly observability details for the active session.

        Args:
            datasource_name: Datasource name for dialect-aware status text.

        Returns:
            dict[str, object]: Checkpoint and LangSmith status details.
        """

        langsmith_settings = self._settings.langsmith
        checkpoint_payload = self._build_checkpoint_observability()
        memory_payload = self._build_memory_observability()
        return {
            **checkpoint_payload,
            **memory_payload,
            "database_access_mode": "guarded_read_only",
            "database_access_summary": self._build_database_access_summary(
                datasource_name=datasource_name
            ),
            "langsmith_tracing": is_langsmith_tracing_enabled(self._settings),
            "langsmith_project": langsmith_settings.project,
            "langsmith_endpoint": langsmith_settings.endpoint,
            "langsmith_workspace_id": langsmith_settings.workspace_id,
            "langsmith_tags": list(langsmith_settings.tags),
        }

    def _build_checkpoint_observability(self) -> dict[str, object]:
        """Build checkpoint runtime details for dashboard observability."""

        requested_backend = self._settings.agent.checkpoint.backend
        checkpoint_url = self._settings.agent.checkpoint.postgres_url

        if self._checkpointer is not None:
            active_backend = (
                self._detect_checkpointer_backend(self._checkpointer) or "memory"
            )
            is_durable = active_backend == "postgres"
            is_fallback = requested_backend == "postgres" and not is_durable
            return {
                "checkpoint_backend": active_backend,
                "checkpoint_requested_backend": requested_backend,
                "checkpoint_is_durable": is_durable,
                "checkpoint_status": (
                    "durable"
                    if is_durable
                    else "fallback" if is_fallback else "session"
                ),
                "checkpoint_summary": (
                    "Durable thread persistence is active through a Postgres checkpoint saver."
                    if is_durable
                    else (
                        "Postgres checkpointing was requested, but the dashboard is currently using a session-only saver."
                        if is_fallback
                        else "Thread persistence is scoped to the current dashboard session."
                    )
                ),
                "checkpoint_recommendation": (
                    "Restart the dashboard with Postgres checkpointing enabled to make threads durable."
                    if is_fallback
                    else None
                ),
            }

        if requested_backend == "postgres" and checkpoint_url is not None:
            return {
                "checkpoint_backend": "postgres",
                "checkpoint_requested_backend": requested_backend,
                "checkpoint_is_durable": True,
                "checkpoint_status": "durable",
                "checkpoint_summary": (
                    "Durable thread persistence is active through the configured Postgres checkpoint database."
                ),
                "checkpoint_recommendation": None,
            }

        if requested_backend == "postgres":
            return {
                "checkpoint_backend": "memory",
                "checkpoint_requested_backend": requested_backend,
                "checkpoint_is_durable": False,
                "checkpoint_status": "fallback",
                "checkpoint_summary": (
                    "Postgres checkpointing was requested, but no checkpoint database URL is configured, so the dashboard fell back to a session-only memory saver."
                ),
                "checkpoint_recommendation": (
                    "Set `POSTGRES_*` or `SQLDBAGENT_AGENT_CHECKPOINT_POSTGRES_URL`, then restart the dashboard to make threads durable."
                ),
            }

        return {
            "checkpoint_backend": "memory",
            "checkpoint_requested_backend": requested_backend,
            "checkpoint_is_durable": False,
            "checkpoint_status": "session",
            "checkpoint_summary": (
                "Thread persistence is scoped to the current dashboard session."
            ),
            "checkpoint_recommendation": (
                None
                if requested_backend == "memory"
                else "Enable Postgres checkpointing to make threads durable."
            ),
        }

    def _build_memory_observability(self) -> dict[str, object]:
        """Build long-term memory runtime details for dashboard observability."""

        requested_backend = self._settings.agent.memory.backend
        memory_url = self._settings.agent.memory.postgres_url

        if self._store is not None:
            active_backend = self._detect_store_backend(self._store) or "memory"
            is_durable = active_backend == "postgres"
            is_fallback = requested_backend == "postgres" and not is_durable
            return {
                "memory_backend": active_backend,
                "memory_requested_backend": requested_backend,
                "memory_is_durable": is_durable,
                "memory_status": (
                    "durable"
                    if is_durable
                    else "fallback" if is_fallback else "session"
                ),
                "memory_summary": (
                    "Long-term database memory is durable through a Postgres store."
                    if is_durable
                    else (
                        "Postgres long-term memory was requested, but the dashboard is currently using a session store."
                        if is_fallback
                        else "Long-term database memory is scoped to the current dashboard session."
                    )
                ),
            }

        if requested_backend == "disabled":
            return {
                "memory_backend": "disabled",
                "memory_requested_backend": requested_backend,
                "memory_is_durable": False,
                "memory_status": "disabled",
                "memory_summary": (
                    "Long-term database memory is disabled for this dashboard run."
                ),
            }

        if requested_backend == "postgres" and memory_url is not None:
            return {
                "memory_backend": "postgres",
                "memory_requested_backend": requested_backend,
                "memory_is_durable": True,
                "memory_status": "durable",
                "memory_summary": (
                    "Long-term database memory is durable through the configured Postgres store."
                ),
            }

        if requested_backend == "postgres":
            return {
                "memory_backend": "memory",
                "memory_requested_backend": requested_backend,
                "memory_is_durable": False,
                "memory_status": "fallback",
                "memory_summary": (
                    "Postgres long-term memory was requested, but no store database URL is configured, so the dashboard fell back to a session store."
                ),
            }

        return {
            "memory_backend": "memory",
            "memory_requested_backend": requested_backend,
            "memory_is_durable": False,
            "memory_status": "session",
            "memory_summary": (
                "Long-term database memory is scoped to the current dashboard session."
            ),
        }

    @staticmethod
    def _detect_checkpointer_backend(checkpointer: object) -> str | None:
        """Infer the backend type for an externally supplied checkpointer."""

        identity = (
            f"{checkpointer.__class__.__module__}.{checkpointer.__class__.__name__}"
        ).lower()
        if "postgres" in identity:
            return "postgres"
        if "memory" in identity or "inmemory" in identity:
            return "memory"
        return None

    @staticmethod
    def _detect_store_backend(store: object) -> str | None:
        """Infer the backend type for an externally supplied long-term store."""

        identity = f"{store.__class__.__module__}.{store.__class__.__name__}".lower()
        if "postgres" in identity:
            return "postgres"
        if "memory" in identity or "inmemory" in identity:
            return "memory"
        return None

    def _build_database_access_summary(self, *, datasource_name: str) -> str:
        """Build dialect-aware read-only access guidance for the dashboard."""

        try:
            datasource = self._settings.get_datasource(datasource_name)
        except Exception:  # noqa: BLE001
            return "All dashboard SQL stays on the central guarded read-only execution path."

        if datasource.dialect == Dialect.POSTGRES:
            return "Guarded SQL uses Postgres read-only transactions with the configured statement timeout."
        if datasource.dialect == Dialect.SQLITE:
            return "Guarded SQL uses a SQLite engine with `PRAGMA query_only` enabled."
        if datasource.dialect == Dialect.MSSQL:
            return "Guarded SQL uses the central safety layer and requests `ApplicationIntent=ReadOnly` on MSSQL connections."
        return (
            "All dashboard SQL stays on the central guarded read-only execution path."
        )

    @contextmanager
    def _resolved_store(self) -> Iterator[Any | None]:
        """Resolve the effective long-term store for the current dashboard session."""

        if self._store is not None:
            with nullcontext(self._store) as store:
                yield store
            return

        if (
            self._settings.agent.memory.backend == "postgres"
            and self._settings.agent.memory.postgres_url is not None
        ):
            with create_sync_postgres_store(settings=self._settings) as store:
                yield store
            return

        if self._settings.agent.memory.backend == "disabled":
            yield None
            return

        yield create_memory_store()

    @staticmethod
    def _emit_progress(
        callback: Callable[[DashboardTurnProgressModel], None] | None,
        *,
        phase: str | None = None,
        label: str | None = None,
        detail: str | None = None,
        event: DashboardTurnProgressModel | None = None,
    ) -> None:
        """Emit one progress event when a callback is available."""

        if callback is None:
            return
        callback(
            event
            or DashboardTurnProgressModel(
                phase=phase or "progress",
                label=label or "Working",
                detail=detail,
            )
        )

    def _progress_events_from_update(
        self,
        update: dict[str, Any],
    ) -> list[DashboardTurnProgressModel]:
        """Convert one LangGraph stream update into dashboard progress events."""

        events: list[DashboardTurnProgressModel] = []
        for node_name, payload in update.items():
            if node_name == "sqldbagent_state_seed.before_agent":
                snapshot_id = (
                    payload.get("latest_snapshot_id")
                    if isinstance(payload, dict)
                    else None
                )
                detail = None
                if snapshot_id is not None:
                    detail = f"Using stored snapshot `{snapshot_id}`."
                events.append(
                    DashboardTurnProgressModel(
                        phase="bootstrap",
                        label="Loaded datasource context.",
                        detail=detail,
                    )
                )
                continue
            if node_name == "model":
                events.extend(self._model_progress_events(payload))
                continue
            if node_name == "tools":
                events.extend(self._tool_progress_events(payload))
                continue
            if node_name == "sqldbagent_tool_digest.after_agent":
                events.append(
                    DashboardTurnProgressModel(
                        phase="complete",
                        label="Summarizing tool activity.",
                    )
                )
        return events

    def _model_progress_events(self, payload: Any) -> list[DashboardTurnProgressModel]:
        """Build progress events from one model step payload."""

        if not isinstance(payload, dict):
            return []
        events: list[DashboardTurnProgressModel] = []
        for message in payload.get("messages", []):
            tool_calls = getattr(message, "tool_calls", None) or []
            if tool_calls:
                tool_names = ", ".join(
                    str(call.get("name", "tool")) for call in tool_calls
                )
                events.append(
                    DashboardTurnProgressModel(
                        phase="planning",
                        label=f"Planning tool calls: {tool_names}",
                        detail=(
                            f"{len(tool_calls)} tool call(s) prepared for this step."
                        ),
                    )
                )
                continue
            content = self._render_content(getattr(message, "content", ""))
            if content:
                events.append(
                    DashboardTurnProgressModel(
                        phase="response",
                        label="Drafting assistant response.",
                        detail=self._summarize_preview(content, limit=180),
                    )
                )
        return events

    def _tool_progress_events(self, payload: Any) -> list[DashboardTurnProgressModel]:
        """Build progress events from one tool step payload."""

        if not isinstance(payload, dict):
            return []
        events: list[DashboardTurnProgressModel] = []
        for message in payload.get("messages", []):
            tool_name = getattr(message, "name", None) or "tool"
            detail = self._summarize_tool_output(
                tool_name=tool_name,
                content=self._render_content(getattr(message, "content", "")),
            )
            events.append(
                DashboardTurnProgressModel(
                    phase="tool",
                    label=f"Completed tool: {tool_name}",
                    detail=detail,
                )
            )
        return events

    def _render_messages(self, messages: list[Any]) -> list[ChatMessageModel]:
        """Convert LangChain/LangGraph messages into dashboard transcript rows."""

        rendered: list[ChatMessageModel] = []
        for message in messages:
            message_type = getattr(message, "type", None) or "unknown"
            if message_type == "system":
                continue
            role = {
                "human": "user",
                "ai": "assistant",
                "tool": "tool",
            }.get(message_type, "assistant")
            content = self._render_content(getattr(message, "content", ""))
            if not content and message_type == "ai":
                tool_calls = getattr(message, "tool_calls", None) or []
                if tool_calls:
                    content = "Calling tools: " + ", ".join(
                        str(call.get("name", "tool")) for call in tool_calls
                    )
            if not content:
                continue
            rendered.append(
                ChatMessageModel(
                    role=role,
                    content=content,
                    kind=message_type,
                    name=getattr(message, "name", None),
                    status=getattr(message, "status", None),
                )
            )
        return rendered

    def _summarize_tool_output(self, *, tool_name: str, content: str) -> str:
        """Build a compact summary for one tool output payload."""

        normalized = content.strip()
        if not normalized:
            return f"{tool_name} finished."
        try:
            payload = orjson.loads(normalized)
        except orjson.JSONDecodeError:
            return self._summarize_preview(normalized, limit=220)

        if isinstance(payload, dict):
            summary = payload.get("summary")
            if isinstance(summary, str) and summary.strip():
                return summary.strip()
            if "row_count" in payload and "columns" in payload:
                return (
                    f"Returned {payload.get('row_count', 0)} row(s) across "
                    f"{len(payload.get('columns') or [])} column(s)."
                )
            if "rows" in payload and isinstance(payload.get("rows"), list):
                return f"Returned {len(payload.get('rows') or [])} row(s)."
            keys = ", ".join(sorted(str(key) for key in payload.keys())[:6])
            return f"{tool_name} returned fields: {keys}."
        if isinstance(payload, list):
            return f"Returned {len(payload)} item(s)."
        return self._summarize_preview(str(payload), limit=220)

    def _render_content(self, content: Any) -> str:
        """Render a LangChain message content payload into readable text."""

        if content is None:
            return ""
        if isinstance(content, str):
            return content.strip()
        if isinstance(content, dict):
            return orjson.dumps(content, option=orjson.OPT_INDENT_2).decode()
        if isinstance(content, list):
            parts: list[str] = []
            for item in content:
                if isinstance(item, str):
                    parts.append(item)
                    continue
                if isinstance(item, dict):
                    text_payload = item.get("text")
                    if text_payload is not None:
                        parts.append(str(text_payload))
                    else:
                        parts.append(
                            orjson.dumps(item, option=orjson.OPT_INDENT_2).decode()
                        )
                    continue
                parts.append(str(item))
            return "\n".join(part.strip() for part in parts if part).strip()
        return str(content).strip()

    def _load_or_create_diagram_bundle(
        self,
        *,
        datasource_name: str,
        schema_name: str | None,
        values: dict[str, Any],
    ) -> DiagramBundleModel | None:
        """Load or create the latest diagram bundle for one dashboard session."""

        snapshot = self._resolve_session_snapshot(
            datasource_name=datasource_name,
            schema_name=schema_name,
            values=values,
        )
        if snapshot is None:
            return None
        container = build_service_container(datasource_name, settings=self._settings)
        try:
            diagram_service = container.diagram_service
            if diagram_service is None:
                return None
            bundle_path = diagram_service.bundle_path(
                datasource_name=datasource_name,
                schema_name=snapshot.regenerate.schema_name,
                snapshot_id=snapshot.snapshot_id,
            )
            bundle = diagram_service.create_diagram_bundle(snapshot)
            if bundle_path.exists():
                existing_bundle = diagram_service.load_diagram_bundle(bundle_path)
                if existing_bundle.content_hash == bundle.content_hash:
                    return existing_bundle
            diagram_service.save_diagram_bundle(bundle)
            return bundle
        finally:
            container.close()

    def _load_or_create_prompt_bundle(
        self,
        *,
        datasource_name: str,
        schema_name: str | None,
        values: dict[str, Any],
    ) -> PromptBundleModel | None:
        """Load or create the latest prompt bundle for one dashboard session."""

        snapshot = self._resolve_session_snapshot(
            datasource_name=datasource_name,
            schema_name=schema_name,
            values=values,
        )
        if snapshot is None:
            return None
        container = build_service_container(datasource_name, settings=self._settings)
        try:
            prompt_service = container.prompt_service
            if prompt_service is None:
                return None
            enhancement = prompt_service.load_or_create_enhancement(snapshot)
            bundle = prompt_service.create_prompt_bundle(
                snapshot,
                enhancement=enhancement,
            )
            prompt_service.save_prompt_bundle(bundle)
            return bundle
        finally:
            container.close()

    def _load_retrieval_manifest(
        self,
        *,
        datasource_name: str,
        schema_name: str | None,
        values: dict[str, Any],
    ) -> RetrievalIndexManifestModel | None:
        """Load the retrieval manifest for the current schema snapshot."""

        snapshot = self._resolve_session_snapshot(
            datasource_name=datasource_name,
            schema_name=schema_name,
            values=values,
        )
        if snapshot is None:
            return None
        container = build_service_container(datasource_name, settings=self._settings)
        try:
            retrieval_service = container.retrieval_service
            if retrieval_service is None:
                return None
            return retrieval_service.load_saved_manifest(
                schema_name=snapshot.regenerate.schema_name,
                snapshot_id=snapshot.snapshot_id,
            )
        finally:
            container.close()

    def _resolve_session_snapshot(
        self,
        *,
        datasource_name: str,
        schema_name: str | None,
        values: dict[str, Any],
    ) -> SnapshotBundleModel | None:
        """Resolve the most relevant snapshot bundle for dashboard artifacts."""

        requested_snapshot_id = values.get("latest_snapshot_id")
        entries = SnapshotService.list_saved_snapshots(
            self._settings.artifacts,
            datasource_name=datasource_name,
            schema_name=schema_name,
        )
        root = SnapshotService._snapshot_dir_from_artifacts(self._settings.artifacts)
        if requested_snapshot_id is not None:
            for entry in entries:
                if entry.snapshot_id == requested_snapshot_id:
                    return SnapshotService.load_snapshot(root / entry.path)
        if entries:
            return SnapshotService.load_snapshot(root / entries[0].path)
        return None

    def _build_example_questions(
        self,
        *,
        snapshot: SnapshotBundleModel | None,
        schema_name: str | None,
    ) -> list[str]:
        """Build snapshot-aware starter questions for the dashboard chat.

        Args:
            snapshot: Relevant stored snapshot for the active session.
            schema_name: Optional schema focus.

        Returns:
            list[str]: Ordered starter questions for the dashboard UI.
        """

        resolved_schema = schema_name or "default"
        questions = [
            f"Summarize the main entities and relationships in the {resolved_schema} schema.",
            f"Which tables in the {resolved_schema} schema are largest by row count or storage?",
            f"What data quality, uniqueness, or identifier signals stand out in the {resolved_schema} schema?",
        ]
        if snapshot is None:
            return questions[:_MAX_EXAMPLE_QUESTIONS]

        demo_questions = self._build_demo_example_questions(snapshot)
        if demo_questions:
            questions = [*demo_questions, *questions]

        profiles_by_table = {
            profile.table_name: profile
            for profile in snapshot.profiles
            if profile.schema_name == snapshot.regenerate.schema_name
        }
        ranked_tables = sorted(
            snapshot.schema_metadata.tables,
            key=lambda table: (
                (
                    (profiles_by_table.get(table.name).storage_bytes or 0)
                    if profiles_by_table.get(table.name) is not None
                    else 0
                ),
                (
                    (profiles_by_table.get(table.name).row_count or 0)
                    if profiles_by_table.get(table.name) is not None
                    else 0
                ),
                (
                    (profiles_by_table.get(table.name).relationship_count or 0)
                    if profiles_by_table.get(table.name) is not None
                    else 0
                ),
            ),
            reverse=True,
        )
        if ranked_tables:
            top_table = ranked_tables[0]
            qualified_name = ".".join(
                part for part in [top_table.schema_name, top_table.name] if part
            )
            questions.append(
                f"Profile {qualified_name} and explain its key columns, sample rows, and likely business meaning."
            )

        if snapshot.relationship_edges:
            edge = snapshot.relationship_edges[0]
            source_name = ".".join(
                part for part in [edge.source_schema, edge.source_table] if part
            )
            target_name = ".".join(
                part for part in [edge.target_schema, edge.target_table] if part
            )
            questions.append(
                f"How do {source_name} and {target_name} relate, and what is the safest join path between them?"
            )

        if snapshot.schema_metadata.views:
            questions.append(
                f"Which views in the {resolved_schema} schema are most useful, and what does each one represent?"
            )

        seen: set[str] = set()
        unique_questions: list[str] = []
        for question in questions:
            if question in seen:
                continue
            seen.add(question)
            unique_questions.append(question)
            if len(unique_questions) == _MAX_EXAMPLE_QUESTIONS:
                break
        return unique_questions

    @staticmethod
    def _build_demo_example_questions(snapshot: SnapshotBundleModel) -> list[str]:
        """Build tailored starter questions for the bundled demo schema.

        Args:
            snapshot: Relevant stored snapshot for the active session.

        Returns:
            list[str]: Demo-specific starter questions when the known demo
            tables are present; otherwise an empty list.
        """

        table_names = {table.name for table in snapshot.schema_metadata.tables}
        required_tables = {
            "customers",
            "orders",
            "order_items",
            "products",
            "support_tickets",
        }
        if not required_tables.issubset(table_names):
            return []

        schema_name = snapshot.regenerate.schema_name
        return [
            (
                f"Summarize the customer lifecycle in {schema_name}: how customers, "
                "orders, order_items, products, and support_tickets connect."
            ),
            (
                "Which customers look most commercially important based on order "
                "activity, and what evidence supports that?"
            ),
            (
                "Explain the safest join path to analyze revenue by customer "
                "segment and product category."
            ),
            (
                "What support-ticket patterns stand out by customer segment, "
                "priority, and order activity?"
            ),
            (
                "Profile the most important business identifiers in the demo "
                "schema, including customer_code, order_number, sku, and ticket_number."
            ),
        ]

    @property
    def _thread_registry_path(self) -> Path:
        """Return the persisted dashboard thread-registry path."""

        return (
            Path(self._settings.artifacts.root_dir)
            / "dashboard"
            / "thread-registry.json"
        )

    def _read_thread_entries(self) -> list[DashboardThreadEntryModel]:
        """Read the persisted dashboard thread registry from disk."""

        path = self._thread_registry_path
        if not path.exists():
            return []
        raw_entries = orjson.loads(path.read_bytes())
        return [DashboardThreadEntryModel.model_validate(item) for item in raw_entries]

    def _write_thread_entries(self, entries: list[DashboardThreadEntryModel]) -> None:
        """Persist the dashboard thread registry to disk."""

        path = self._thread_registry_path
        path.parent.mkdir(parents=True, exist_ok=True)
        path.write_bytes(
            orjson.dumps(
                [entry.model_dump(mode="json") for entry in entries],
                option=orjson.OPT_INDENT_2,
            )
        )

    def _upsert_thread_entry(self, session: ChatSessionModel) -> None:
        """Create or update one persisted dashboard thread summary."""

        now = datetime.now(UTC)
        last_user_message = next(
            (
                self._summarize_preview(message.content)
                for message in reversed(session.messages)
                if message.role == "user"
            ),
            None,
        )
        last_assistant_message = next(
            (
                self._summarize_preview(message.content)
                for message in reversed(session.messages)
                if message.role == "assistant"
            ),
            None,
        )
        entries = self._read_thread_entries()
        entry_key = (
            session.thread_id,
            session.datasource_name,
            session.schema_name,
        )
        for index, entry in enumerate(entries):
            if (
                entry.thread_id,
                entry.datasource_name,
                entry.schema_name,
            ) == entry_key:
                entries[index] = entry.model_copy(
                    update={
                        "display_name": entry.display_name,
                        "updated_at": now,
                        "message_count": len(session.messages),
                        "latest_snapshot_id": session.latest_snapshot_id,
                        "last_user_message": last_user_message,
                        "last_assistant_message": last_assistant_message,
                    }
                )
                self._write_thread_entries(entries)
                return
        entries.append(
            DashboardThreadEntryModel(
                thread_id=session.thread_id,
                datasource_name=session.datasource_name,
                schema_name=session.schema_name,
                display_name=None,
                created_at=now,
                updated_at=now,
                message_count=len(session.messages),
                latest_snapshot_id=session.latest_snapshot_id,
                last_user_message=last_user_message,
                last_assistant_message=last_assistant_message,
            )
        )
        self._write_thread_entries(entries)

    @staticmethod
    def _summarize_preview(content: str, *, limit: int = 96) -> str:
        """Collapse one message into a compact preview line."""

        normalized = " ".join(content.split())
        if len(normalized) <= limit:
            return normalized
        return normalized[: limit - 1].rstrip() + "…"