"""MCP server for jcodemunch-mcp."""

import argparse
import asyncio
import atexit
import functools
import hmac
import json
import jsonschema
import logging
import os
import sys
from pathlib import Path
from typing import Any, Optional

from mcp.server import Server
from mcp.types import Tool, TextContent, Resource, Prompt, PromptMessage, GetPromptResult

from . import __version__
from . import config as config_module
# Tool modules are imported lazily inside each call_tool() dispatch branch.
# This defers loading heavy dependencies (tree-sitter, httpx, pathspec) until
# the first actual call to a tool that needs them, reducing cold-start latency
# for sessions that only use query tools and never trigger indexing.
from .parser.symbols import VALID_KINDS
from .summarizer import get_provider_name
from .reindex_state import await_freshness_if_strict
from .path_map import ENV_VAR as _PATH_MAP_ENV_VAR
from .storage import result_cache_invalidate as _result_cache_invalidate
from .storage import write_pulse as _write_pulse

try:
    from .watcher import watch_folders, WatcherError
except ImportError:
    watch_folders = None  # type: ignore[assignment, misc]
    WatcherError = type("WatcherError", (Exception,), {})  # type: ignore[assignment, misc]


# Canonical list of all registered tool names (unfiltered).
# Keep in sync with _build_tools_list(). Used by `config --check` and
# `claude-md --generate` to detect CLAUDE.md / hook-script drift.
_CANONICAL_TOOL_NAMES: tuple[str, ...] = (
    # Indexing
    "index_repo", "index_folder", "summarize_repo", "index_file",
    # Discovery
    "list_repos", "resolve_repo", "suggest_queries",
    "get_repo_outline", "get_file_tree", "get_file_outline",
    # Search & Retrieval
    "search_symbols", "get_symbol_source", "get_context_bundle",
    "get_file_content", "search_text", "search_columns", "get_ranked_context",
    # Relationships
    "find_importers", "find_references", "check_references",
    "get_dependency_graph", "get_class_hierarchy", "get_related_symbols",
    "get_call_hierarchy",
    # Impact & Safety
    "get_blast_radius", "check_rename_safe", "get_impact_preview",
    "get_changed_symbols",
    # Architecture
    "get_dependency_cycles", "get_coupling_metrics", "get_layer_violations",
    "get_extraction_candidates", "get_cross_repo_map",
    # Quality & Metrics
    "get_symbol_complexity", "get_churn_rate", "get_hotspots",
    "get_repo_health", "get_symbol_importance", "find_dead_code",
    "get_dead_code_v2", "get_untested_symbols",
    # Diffs & Embeddings
    "get_symbol_diff", "embed_repo",
    # Utilities
    "get_session_stats", "get_session_context", "get_session_snapshot", "plan_turn", "register_edit", "invalidate_cache", "test_summarizer",
    "audit_agent_config",
)

# Tools eligible for Agent Selector complexity scoring
_AGENT_SELECTOR_TOOLS = frozenset({
    "get_ranked_context", "get_context_bundle", "search_symbols",
    "search_text", "get_symbol_source", "plan_turn",
    "get_blast_radius", "get_impact_preview", "get_dependency_graph",
})

# Tools excluded from strict freshness mode (don't wait for reindex)
_EXCLUDED_FROM_STRICT = frozenset({
    "list_repos",
    "resolve_repo",
    "get_session_stats",
    "get_session_context",
    "get_session_snapshot",
    "test_summarizer",
    "index_repo",
    "index_folder",
    "index_file",
    "invalidate_cache",
})


logger = logging.getLogger(__name__)


def _default_use_ai_summaries() -> bool:
    """Return whether AI summarization is enabled, as a bool.

    Collapses the tri-state config value ("auto", True, "true" → True;
    "false", False, "0", "no", "off" → False) into a simple gate.
    Note: _create_summarizer() reads the config directly to resolve
    the "auto" vs. explicit-provider distinction at summarization time.
    """
    raw = config_module.get("use_ai_summaries", "auto")
    if isinstance(raw, bool):
        return raw
    return str(raw).strip().lower() not in ("false", "0", "no", "off")


# ---------------------------------------------------------------------------
# Session state persistence (Feature 10: Session-Aware Routing)
# ---------------------------------------------------------------------------

_session_state_restored = False


def _restore_session_state() -> None:
    """Load and restore session state on server startup.
    
    Called from run_stdio_server / run_sse_server / run_streamable_http_server.
    Restores journal entries and search cache from previous session.
    """
    global _session_state_restored
    if _session_state_restored:
        return
    
    if not config_module.get("session_resume", False):
        return
    
    try:
        from .tools.session_state import get_session_state
        from .tools.session_journal import get_journal
        from .tools.search_symbols import _result_cache, _result_cache_lock
        from .storage import SQLiteIndexStore
        
        state = get_session_state()
        max_age = config_module.get("session_max_age_minutes", 30)
        
        loaded = state.load(max_age_minutes=max_age)
        if not loaded:
            logger.debug("No session state to restore")
            return
        
        # Restore journal
        journal = get_journal()
        count = state.restore_journal(journal, loaded)
        logger.info("Restored %d session journal entries", count)
        
        # Build current_indexes for cache restoration
        storage_path = os.environ.get("CODE_INDEX_PATH", "")
        store = SQLiteIndexStore(base_path=storage_path)
        current_indexes = {}
        try:
            repos = store.list_repos()
            for r in repos:
                # list_repos already returns indexed_at — no need to load full index
                repo_id = r.get("repo", f"{r.get('owner', '')}/{r.get('name', '')}")
                indexed_at = r.get("indexed_at", "")
                if indexed_at:
                    current_indexes[repo_id] = indexed_at
        except Exception:
            pass
        
        # Restore search cache
        with _result_cache_lock:
            count = state.restore_search_cache(_result_cache, loaded, current_indexes)
        logger.info("Restored %d search cache entries", count)
        
        _session_state_restored = True
        
    except Exception as e:
        logger.warning("Failed to restore session state: %s", e)


def _save_session_state() -> None:
    """Save session state on server shutdown.
    
    Registered with atexit for clean shutdown.
    """
    if not config_module.get("session_resume", False):
        return
    
    try:
        from .tools.session_state import get_session_state
        from .tools.session_journal import get_journal
        from .tools.search_symbols import _result_cache, _result_cache_lock
        
        state = get_session_state()
        journal = get_journal()
        max_queries = config_module.get("session_max_queries", 50)
        
        neg_log = journal.get_negative_evidence_log()
        with _result_cache_lock:
            state.save(journal, _result_cache, max_queries=max_queries,
                       negative_evidence_log=neg_log)
        
        logger.info("Saved session state")
        
    except Exception as e:
        logger.warning("Failed to save session state: %s", e)


# Register atexit handler for session state persistence
atexit.register(_save_session_state)


def _parse_watcher_flag(value: Optional[str]) -> bool:
    """Parse the --watcher flag value.

    None = not provided (disabled).
    'true'/'1'/'yes' = enabled (const from nargs='?').
    'false'/'0'/'no' = explicitly disabled.
    """
    if value is None:
        return False
    return value.lower() not in ("0", "no", "false")


def _get_watcher_enabled(args) -> bool:
    """Determine if the watcher should be enabled for the serve subcommand.

    Precedence (highest to lowest):
      1. --watcher CLI flag
      2. config file "watch" key  (JCODEMUNCH_WATCH env var is a fallback for this key
         when it is absent from config.jsonc — handled by config._apply_env_var_fallback)
    """
    flag = getattr(args, "watcher", None)
    if flag is not None:
        return _parse_watcher_flag(flag)
    return config_module.get("watch", False)


_BOOL_TRUE = frozenset(("true", "1", "yes", "on"))
_BOOL_FALSE = frozenset(("false", "0", "no", "off"))


def _coerce_arguments(arguments: dict, schema: dict) -> dict:
    """Coerce stringified values to their expected types per JSON schema.

    Handles boolean ("true"/"false"), integer ("5"), and number ("3.14")
    without eval. Unknown or already-correct types are passed through unchanged.
    """
    props = schema.get("properties", {})
    if not props:
        return arguments
    result = {}
    for k, v in arguments.items():
        if k in props and isinstance(v, str):
            expected = props[k].get("type")
            if expected == "boolean":
                if v.lower() in _BOOL_TRUE:
                    v = True
                elif v.lower() in _BOOL_FALSE:
                    v = False
            elif expected == "integer":
                try:
                    v = int(v)
                except (ValueError, TypeError):
                    pass
            elif expected == "number":
                try:
                    v = float(v)
                except (ValueError, TypeError):
                    pass
        result[k] = v
    return result


_TOOL_SCHEMAS: dict[str, dict] | None = None


def _build_language_enum() -> list[str]:
    """Build language enum from config, falling back to all registry languages."""
    languages = config_module.get("languages")
    if languages is None:
        from .parser.languages import LANGUAGE_REGISTRY
        return sorted(LANGUAGE_REGISTRY.keys())
    return languages


async def _ensure_tool_schemas() -> dict[str, dict]:
    """Lazy-initialize the tool name → inputSchema lookup for type coercion.

    Uses our own list_tools() — no coupling to private MCP SDK internals.
    Populated once on the first tool call, then cached for the process lifetime.
    """
    global _TOOL_SCHEMAS
    if _TOOL_SCHEMAS is None:
        tools = await list_tools()
        _TOOL_SCHEMAS = {t.name: t.inputSchema for t in tools if t.inputSchema}
    return _TOOL_SCHEMAS


# Create server
server = Server("jcodemunch-mcp")


@server.list_tools()
async def list_tools() -> list[Tool]:
    """List all available tools."""
    return _build_tools_list()


def _build_tools_list() -> list[Tool]:
    """Build the full tool list, applying config-driven filtering and overrides."""
    tools = [
        Tool(
            name="index_repo",
            description="Index a GitHub repository's source code. Fetches files, parses ASTs, extracts symbols, and saves to local storage. Set JCODEMUNCH_USE_AI_SUMMARIES=false to disable AI summaries globally.",
            inputSchema={
                "type": "object",
                "properties": {
                    "url": {
                        "type": "string",
                        "description": "GitHub repository URL or owner/repo string"
                    },
                    "use_ai_summaries": {
                        "type": "boolean",
                        "description": "Use AI to generate symbol summaries. Supports Anthropic, Gemini, OpenAI-compatible endpoints, MiniMax, and GLM-5 via env vars. When false, uses docstrings or signature fallback.",
                        "default": True
                    },
                    "extra_ignore_patterns": {
                        "type": "array",
                        "items": {"type": "string"},
                        "description": "Additional gitignore-style patterns to exclude from indexing (merged with JCODEMUNCH_EXTRA_IGNORE_PATTERNS env var)"
                    },
                    "incremental": {
                        "type": "boolean",
                        "description": "When true and an existing index exists, only re-index changed files.",
                        "default": True
                    }
                },
                "required": ["url"]
            }
        ),
        Tool(
            name="index_folder",
            description="Index a local folder containing source code. Response includes `discovery_skip_counts` (files filtered per reason), `no_symbols_count`/`no_symbols_files` (files with no extractable symbols) for diagnosing missing files. Set JCODEMUNCH_USE_AI_SUMMARIES=false to disable AI summaries globally.",
            inputSchema={
                "type": "object",
                "properties": {
                    "path": {
                        "type": "string",
                        "description": "Path to local folder (absolute or relative, supports ~ for home directory)"
                    },
                    "use_ai_summaries": {
                        "type": "boolean",
                        "description": "Use AI to generate symbol summaries. Supports Anthropic, Gemini, OpenAI-compatible endpoints, MiniMax, and GLM-5 via env vars. When false, uses docstrings or signature fallback.",
                        "default": True
                    },
                    "extra_ignore_patterns": {
                        "type": "array",
                        "items": {"type": "string"},
                        "description": "Additional gitignore-style patterns to exclude from indexing (merged with JCODEMUNCH_EXTRA_IGNORE_PATTERNS env var)"
                    },
                    "follow_symlinks": {
                        "type": "boolean",
                        "description": "Whether to include symlinked files in indexing. Symlinked directories are never followed (prevents infinite loops from circular symlinks). Default false for security.",
                        "default": False
                    },
                    "incremental": {
                        "type": "boolean",
                        "description": "When true and an existing index exists, only re-index changed files.",
                        "default": True
                    }
                },
                "required": ["path"]
            }
        ),
        Tool(
            name="summarize_repo",
            description=(
                "Re-run AI summarization on all symbols in an existing index. "
                "Use this when index_folder completed but AI summaries are missing — "
                "e.g., the background summarization thread was interrupted, AI was disabled "
                "at index time, or the summarizer provider wasn't configured yet. "
                "With force=true (recommended), clears all existing summaries and re-runs "
                "the full 3-tier pipeline (docstring → AI → signature fallback)."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or local/hash)"
                    },
                    "force": {
                        "type": "boolean",
                        "description": (
                            "If true, clear all existing summaries and re-summarize every symbol. "
                            "Required when index_folder already applied signature fallbacks. "
                            "If false, only process symbols with no summary at all."
                        ),
                        "default": False
                    }
                },
                "required": ["repo"]
            }
        ),
        Tool(
            name="index_file",
            description="Index a single file within an existing index. Faster than index_folder for surgical updates after editing a file. The file must be within an already-indexed folder's source_root. Can also add new files not yet in the index.",
            inputSchema={
                "type": "object",
                "properties": {
                    "path": {
                        "type": "string",
                        "description": "Absolute path to the file to index"
                    },
                    "use_ai_summaries": {
                        "type": "boolean",
                        "description": "Use AI to generate symbol summaries. Supports Anthropic, Gemini, OpenAI-compatible endpoints, MiniMax, and GLM-5 via env vars. When false, uses docstrings or signature fallback.",
                        "default": True
                    },
                    "context_providers": {
                        "type": "boolean",
                        "description": "Whether to run context providers",
                        "default": True
                    }
                },
                "required": ["path"]
            }
        ),
        Tool(
            name="list_repos",
            description=(
                "List all indexed repositories. "
                "START HERE before using Grep/Read/search tools — check if the project is "
                "already indexed, then use search_symbols / get_symbol_source instead of "
                "native file reads. If jcodemunch tools appear as deferred in your tool list, "
                "call ToolSearch to load their schemas first."
                if config_module.get("discovery_hint", True)
                else "List all indexed repositories."
            ),
            inputSchema={
                "type": "object",
                "properties": {}
            }
        ),
        Tool(
            name="resolve_repo",
            description="Resolve a filesystem path to its indexed repo identifier. O(1) lookup — faster than list_repos for finding a single repo. Accepts repo root, worktree, subdirectory, or file path.",
            inputSchema={
                "type": "object",
                "properties": {
                    "path": {
                        "type": "string",
                        "description": "Absolute filesystem path (repo root, worktree, subdirectory, or file)"
                    }
                },
                "required": ["path"]
            }
        ),
        Tool(
            name="get_file_tree",
            description="Get the file tree of an indexed repository, optionally filtered by path prefix. Results are capped at max_files (default 500) to prevent token overflow; use path_prefix to scope large trees.",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)"
                    },
                    "path_prefix": {
                        "type": "string",
                        "description": "Optional path prefix to filter (e.g., 'src/utils')",
                        "default": ""
                    },
                    "include_summaries": {
                        "type": "boolean",
                        "description": "Include file-level summaries in the tree nodes",
                        "default": False
                    },
                    "max_files": {
                        "type": "integer",
                        "description": "Maximum number of files to return (default 500). When truncated, response includes total_file_count and a hint to use path_prefix.",
                        "default": 500
                    }
                },
                "required": ["repo"]
            }
        ),
        Tool(
            name="get_file_outline",
            description="Get all symbols (functions, classes, methods) in a file with full signatures (including parameter names) and summaries. Use signatures to review naming at parameter granularity without reading the full file. Pass repo and file_path (e.g. 'src/main.py').",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)"
                    },
                    "file_path": {
                        "type": "string",
                        "description": "Path to the file within the repository (e.g., 'src/main.py')"
                    },
                    "file_paths": {
                        "type": "array",
                        "items": {"type": "string"},
                        "description": "List of file paths to query in batch mode. Returns a grouped results array."
                    }
                },
                "required": ["repo"]
            }
        ),
        Tool(
            name="get_symbol_source",
            description="Get full source of one symbol (symbol_id → flat object) or many (symbol_ids[] → {symbols, errors}). Supports verify, context_lines, and fqn (PHP FQN via PSR-4).",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)"
                    },
                    "symbol_id": {
                        "type": "string",
                        "description": "Single symbol ID — returns flat symbol object"
                    },
                    "symbol_ids": {
                        "type": "array",
                        "items": {"type": "string"},
                        "description": "Multiple symbol IDs — returns {symbols, errors}"
                    },
                    "verify": {
                        "type": "boolean",
                        "description": "Verify content hash matches stored hash (detects source drift)",
                        "default": False
                    },
                    "context_lines": {
                        "type": "integer",
                        "description": "Number of lines before/after symbol to include for context",
                        "default": 0
                    },
                    "fqn": {
                        "type": "string",
                        "description": "PHP fully-qualified class name (e.g. 'App\\Models\\User'). Resolves to symbol_id via PSR-4. Alternative to symbol_id."
                    }
                },
                "required": ["repo"]
            }
        ),
        Tool(
            name="get_file_content",
            description="Get cached source for a file, optionally sliced to a line range.",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)"
                    },
                    "file_path": {
                        "type": "string",
                        "description": "Path to the file within the repository (e.g., 'src/main.py')"
                    },
                    "start_line": {
                        "type": "integer",
                        "description": "Optional 1-based start line (inclusive)"
                    },
                    "end_line": {
                        "type": "integer",
                        "description": "Optional 1-based end line (inclusive)"
                    }
                },
                "required": ["repo", "file_path"]
            }
        ),
        Tool(
            name="search_symbols",
            description="Search for symbols matching a query across the entire indexed repository. Returns matches with signatures and summaries.",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)"
                    },
                    "query": {
                        "type": "string",
                        "description": "Search query (matches symbol names, signatures, summaries, docstrings)"
                    },
                    "kind": {
                        "type": "string",
                        "description": "Optional filter by symbol kind",
                        "enum": ["function", "class", "method", "constant", "type", "template", "import"]
                    },
                    "file_pattern": {
                        "type": "string",
                        "description": "Optional glob pattern to filter files (e.g., 'src/**/*.py')"
                    },
                    "language": {
                        "type": "string",
                        "description": "Optional filter by language",
                        "enum": _build_language_enum()
                    },
                    "decorator": {
                        "type": "string",
                        "description": "Optional filter: only return symbols with this decorator (case-insensitive substring match, e.g. 'route', 'property', 'Deprecated')"
                    },
                    "max_results": {
                        "type": "integer",
                        "description": "Maximum number of results to return (ignored when token_budget is set)",
                        "default": 10
                    },
                    "token_budget": {
                        "type": "integer",
                        "description": "Token budget cap. When set, results are sorted by score and greedily packed until the budget is exhausted. Overrides max_results. Reports token_budget, tokens_used, and tokens_remaining in _meta."
                    },
                    "detail_level": {
                        "type": "string",
                        "description": "Controls result verbosity. 'compact' returns id/name/kind/file/line only (~15 tokens each, best for broad discovery). 'standard' returns signatures and summaries (default). 'full' inlines source code, docstring, and end_line — equivalent to search + get_symbol in one call.",
                        "enum": ["compact", "standard", "full"],
                        "default": "standard"
                    },
                    "debug": {
                        "type": "boolean",
                        "description": "When true, each result includes a score_breakdown showing per-field scoring contributions (name_exact, name_contains, name_word_overlap, signature_phrase, signature_word_overlap, summary_phrase, summary_word_overlap, keywords, docstring_word_overlap). Also adds candidates_scored to _meta.",
                        "default": False
                    },
                    "fuzzy": {
                        "type": "boolean",
                        "description": "Enable fuzzy matching. When true, uses trigram overlap + Levenshtein distance as fallback when BM25 scores are low. Fuzzy results include match_type, fuzzy_similarity, and edit_distance fields.",
                        "default": False
                    },
                    "fuzzy_threshold": {
                        "type": "number",
                        "description": "Minimum Jaccard trigram similarity (0.0–1.0) for fuzzy candidates. Lower values surface more candidates. Default 0.4.",
                        "default": 0.4
                    },
                    "max_edit_distance": {
                        "type": "integer",
                        "description": "Maximum Levenshtein distance for direct name matching (catches typos). Default 2.",
                        "default": 2
                    },
                    "sort_by": {
                        "type": "string",
                        "enum": ["relevance", "centrality", "combined"],
                        "description": "Ranking strategy. 'relevance' (default) = BM25 text match. 'centrality' = filter by query, rank by PageRank. 'combined' = BM25 + PageRank weighted.",
                        "default": "relevance"
                    },
                    "semantic": {
                        "type": "boolean",
                        "description": "Enable semantic (embedding-based) search. Requires an embedding provider: JCODEMUNCH_EMBED_MODEL (sentence-transformers), GOOGLE_API_KEY+GOOGLE_EMBED_MODEL (Gemini), or OPENAI_API_KEY+OPENAI_EMBED_MODEL (OpenAI). When false (default) there is zero performance impact.",
                        "default": False
                    },
                    "semantic_weight": {
                        "type": "number",
                        "description": "Weight for semantic score in hybrid BM25+embedding ranking (0.0–1.0). BM25 receives 1-weight. Default 0.5. Set to 0.0 for identical results to pure BM25; set to 1.0 for pure semantic.",
                        "default": 0.5
                    },
                    "semantic_only": {
                        "type": "boolean",
                        "description": "Skip BM25 entirely and rank solely by embedding cosine similarity. Implies semantic=true.",
                        "default": False
                    },
                    "fqn": {
                        "type": "string",
                        "description": "PHP fully-qualified class name (e.g. 'App\\Models\\User'). Resolves via PSR-4 and uses the class name as query. Alternative to query."
                    }
                },
                "required": ["repo", "query"]
            }
        ),
        Tool(
            name="invalidate_cache",
            description="Delete the index and cached files for a repository. Forces a full re-index on next index_repo or index_folder call.",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)"
                    }
                },
                "required": ["repo"]
            }
        ),
        Tool(
            name="search_text",
            description="Full-text search across indexed file contents. Useful when symbol search misses (e.g., string literals, comments, config values). Supports regex (is_regex=true) and context lines around matches (context_lines=N, like grep -C).",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)"
                    },
                    "query": {
                        "type": "string",
                        "description": "Text to search for. Case-insensitive substring by default. Set is_regex=true for full regex (e.g. 'estimateToken|tokenEstimat|\\.length.*0\\.25')."
                    },
                    "is_regex": {
                        "type": "boolean",
                        "description": "When true, treat query as a Python regex (re.search, case-insensitive). Supports alternation (|), character classes, lookaheads, etc.",
                        "default": False
                    },
                    "file_pattern": {
                        "type": "string",
                        "description": "Optional glob pattern to filter files (e.g., '*.py')"
                    },
                    "max_results": {
                        "type": "integer",
                        "description": "Maximum number of matching lines to return",
                        "default": 20
                    },
                    "context_lines": {
                        "type": "integer",
                        "description": "Lines of context to include before and after each match (like grep -C N). Essential for understanding code around matches.",
                        "default": 0
                    }
                },
                "required": ["repo", "query"]
            }
        ),
        Tool(
            name="get_repo_outline",
            description="Get a high-level overview of an indexed repository: directories, file counts, language breakdown, symbol counts. Lighter than get_file_tree.",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)"
                    }
                },
                "required": ["repo"]
            }
        ),
        Tool(
            name="find_importers",
            description="Find all files that import a given file. Answers 'what uses this file?'. has_importers=false on a result means that importer is itself unreachable (dead code chain). Supports dbt {{ ref() }} edges. Use file_paths for batch queries. Set cross_repo=true to also find importers in other indexed repos.",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {"type": "string", "description": "Repository identifier"},
                    "file_path": {"type": "string", "description": "Target file path within the repo (e.g. 'src/features/intake/IntakeService.js'). Use for single-file queries. Cannot be used together with file_paths."},
                    "file_paths": {"type": "array", "items": {"type": "string"}, "description": "List of target file paths for batch queries. Returns a results array. Cannot be used together with file_path."},
                    "max_results": {"type": "integer", "default": 50, "description": "Maximum results per file"},
                    "cross_repo": {"type": "boolean", "default": False, "description": "When true, also search other indexed repos for cross-repo importers. Default: false (or JCODEMUNCH_CROSS_REPO_DEFAULT env var)."},
                },
                "required": ["repo"],
            },
        ),
        Tool(
            name="find_references",
            description="Find all files that import or reference an identifier. Answers 'where is this used?'. Supports dbt {{ ref() }} edges. Use identifiers for batch queries. Set include_call_chain=true to also see which symbols in each file call the identifier.",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {"type": "string", "description": "Repository identifier"},
                    "identifier": {"type": "string", "description": "Symbol or module name to search for (e.g. 'bulkImport', 'IntakeService'). Use for single-identifier queries. Cannot be used together with identifiers."},
                    "identifiers": {"type": "array", "items": {"type": "string"}, "description": "List of symbol or module names to search for (batch mode). Returns a results array. Cannot be used together with identifier."},
                    "max_results": {"type": "integer", "default": 50, "description": "Maximum results"},
                    "include_call_chain": {
                        "type": "boolean",
                        "default": False,
                        "description": "When true (singular mode only), each reference entry includes calling_symbols: symbols in that file whose bodies mention the identifier. Default false.",
                    },
                },
                "required": ["repo"],
            },
        ),
        Tool(
            name="check_references",
            description="Check if an identifier is referenced anywhere: imports + file content. Combines find_references and search_text into one call. Returns is_referenced (bool) for quick dead-code detection. Accepts multiple identifiers in one call via identifiers param.",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {"type": "string", "description": "Repository identifier"},
                    "identifier": {"type": "string", "description": "Single identifier to check"},
                    "identifiers": {
                        "type": "array", "items": {"type": "string"},
                        "description": "Multiple identifiers to check in one call. Returns grouped results.",
                    },
                    "search_content": {
                        "type": "boolean", "default": True,
                        "description": "Also search file contents (not just imports). Set false for fast import-only check.",
                    },
                    "max_content_results": {
                        "type": "integer", "default": 20,
                        "description": "Max files to return per identifier for content search.",
                    },
                },
                "required": ["repo"],
            },
        ),
        Tool(
            name="search_columns",
            description="Search column metadata across indexed models. Works with any ecosystem provider that emits column data (dbt, SQLMesh, database catalogs, etc.). Returns model name, file path, column name, and description. Use instead of grep/search_text for column discovery — 77% fewer tokens.",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)"
                    },
                    "query": {
                        "type": "string",
                        "description": "Search query (matches column names and descriptions)"
                    },
                    "model_pattern": {
                        "type": "string",
                        "description": "Optional glob to filter by model name (e.g., 'fact_*', 'dim_provider')"
                    },
                    "max_results": {
                        "type": "integer",
                        "description": "Maximum number of results to return",
                        "default": 20
                    }
                },
                "required": ["repo", "query"]
            }
        ),
        Tool(
            name="get_context_bundle",
            description=(
                "Get full source + imports for one or more symbols in one call. "
                "Multi-symbol bundles deduplicate shared imports. "
                "Set token_budget to cap response size; use budget_strategy to control what's kept. "
                "Supports fqn (PHP FQN via PSR-4) as alternative to symbol_id."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)"
                    },
                    "symbol_id": {
                        "type": "string",
                        "description": "Single symbol ID (backward-compatible). Use symbol_ids for multi-symbol bundles."
                    },
                    "symbol_ids": {
                        "type": "array",
                        "items": {"type": "string"},
                        "description": "List of symbol IDs for a multi-symbol bundle. Imports are deduplicated across symbols that share a file."
                    },
                    "include_callers": {
                        "type": "boolean",
                        "description": "When true, each symbol entry includes a 'callers' list of files that directly import its defining file.",
                        "default": False
                    },
                    "output_format": {
                        "type": "string",
                        "description": "'json' (default) or 'markdown' — markdown renders a paste-ready document with imports, docstrings, and source blocks.",
                        "enum": ["json", "markdown"],
                        "default": "json"
                    },
                    "token_budget": {
                        "type": "integer",
                        "description": "Max tokens to return. When set, symbols are ranked and trimmed to fit. Uses budget_strategy to prioritize."
                    },
                    "budget_strategy": {
                        "type": "string",
                        "enum": ["most_relevant", "core_first", "compact"],
                        "description": (
                            "'most_relevant' (default) ranks by file centrality (import in-degree). "
                            "'core_first' keeps the primary symbol first, ranks rest by centrality. "
                            "'compact' strips source bodies — returns signatures only."
                        ),
                        "default": "most_relevant"
                    },
                    "include_budget_report": {
                        "type": "boolean",
                        "description": "When true, include a 'budget_report' field showing tokens used, symbols included/excluded, and strategy applied.",
                        "default": False
                    },
                    "fqn": {
                        "type": "string",
                        "description": "PHP fully-qualified class name (e.g. 'App\\Models\\User'). Resolves to symbol_id via PSR-4. Alternative to symbol_id."
                    }
                },
                "required": ["repo"]
            }
        ),
        Tool(
            name="get_session_stats",
            description="Get token savings stats for the current MCP session. Returns tokens saved and cost avoided (this session and all-time), per-tool breakdown, session duration, and cumulative totals. Use to see how much jCodeMunch has saved you.",
            inputSchema={
                "type": "object",
                "properties": {},
            }
        ),
        Tool(
            name="get_session_context",
            description="Get the current session context — files accessed, searches performed, and edits registered during this MCP session. Use to avoid re-reading the same files.",
            inputSchema={
                "type": "object",
                "properties": {
                    "max_files": {
                        "type": "integer",
                        "description": "Maximum number of files to return in files_accessed.",
                        "default": 50,
                    },
                    "max_queries": {
                        "type": "integer",
                        "description": "Maximum number of queries to return in recent_searches.",
                        "default": 20,
                    },
                },
            }
        ),
        Tool(
            name="get_session_snapshot",
            description="Get a compact session snapshot for context continuity. Returns a ~200 token markdown summary of files explored, edits made, searches performed, and dead ends. Designed for injection after context compaction to restore session orientation.",
            inputSchema={
                "type": "object",
                "properties": {
                    "max_files": {
                        "type": "integer",
                        "default": 10,
                        "description": "Maximum focus files to include.",
                    },
                    "max_searches": {
                        "type": "integer",
                        "default": 5,
                        "description": "Maximum key searches to include.",
                    },
                    "max_edits": {
                        "type": "integer",
                        "default": 10,
                        "description": "Maximum edited files to include.",
                    },
                    "include_negative_evidence": {
                        "type": "boolean",
                        "default": True,
                        "description": "Include dead-end searches (negative evidence) in snapshot.",
                    },
                },
            },
        ),
        Tool(
            name="plan_turn",
            description="Plan the next turn by analyzing query against the codebase. Returns confidence level (high/medium/low), recommended symbols/files, and guidance. Use as opening move for any task.",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier.",
                    },
                    "query": {
                        "type": "string",
                        "description": "What you're looking for (task description or symbol name).",
                    },
                    "max_recommended": {
                        "type": "integer",
                        "description": "Maximum number of symbols to recommend.",
                        "default": 5,
                    },
                },
                "required": ["repo", "query"],
            }
        ),
        Tool(
            name="register_edit",
            description="Register file edits to invalidate caches. Call after editing files to clear BM25 cache and search result cache for the repo.",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier.",
                    },
                    "file_paths": {
                        "type": "array",
                        "items": {"type": "string"},
                        "description": "List of file paths that were edited.",
                    },
                    "reindex": {
                        "type": "boolean",
                        "description": "If True, also reindex the files.",
                        "default": False,
                    },
                },
                "required": ["repo", "file_paths"],
            }
        ),
        Tool(
            name="test_summarizer",
            description="Verify AI summarizer config and connectivity.",
            inputSchema={
                "type": "object",
                "properties": {
                    "timeout_ms": {
                        "type": "integer",
                        "description": "Slow-response threshold in ms.",
                        "default": 15000,
                    },
                },
            },
        ),
        Tool(
            name="audit_agent_config",
            description=(
                "Audit agent configuration files (CLAUDE.md, .cursorrules, copilot-instructions.md, etc.) "
                "for token waste. Reports per-file token cost, stale symbol references, dead file paths, "
                "redundancy between global and project configs, bloat patterns, and scope leaks. "
                "Cross-references against the jcodemunch index to catch references to renamed or deleted "
                "symbols and files that no other linter can detect."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": (
                            "Repository identifier for cross-referencing symbols and files. "
                            "If omitted, skips stale-reference and dead-path checks."
                        ),
                    },
                    "project_path": {
                        "type": "string",
                        "description": "Project directory to scan for config files. Defaults to cwd.",
                    },
                },
            },
        ),
        Tool(
            name="get_dependency_graph",
            description="Get the file-level dependency graph for a given file. Traverses import relationships up to 3 hops. Use to understand what a file depends on ('imports'), what depends on it ('importers'), or both. Prerequisite for blast radius analysis. Set cross_repo=true to include cross-repository edges.",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)"
                    },
                    "file": {
                        "type": "string",
                        "description": "File path within the repo (e.g. 'src/server.py')"
                    },
                    "direction": {
                        "type": "string",
                        "description": "'imports' (files this file depends on), 'importers' (files that depend on this file), or 'both'",
                        "enum": ["imports", "importers", "both"],
                        "default": "imports"
                    },
                    "depth": {
                        "type": "integer",
                        "description": "Number of hops to traverse (1–3)",
                        "default": 1
                    },
                    "cross_repo": {
                        "type": "boolean",
                        "description": "When true, include cross-repo edges (imports that resolve to packages in other indexed repos). Default: false.",
                        "default": False,
                    },
                },
                "required": ["repo", "file"]
            }
        ),
        Tool(
            name="get_symbol_diff",
            description="Diff symbol sets between two indexed snapshots. Shows added, removed, and changed symbols. Branch workflow: index branch A as repo-main, index branch B as repo-feature, then diff.",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo_a": {"type": "string", "description": "First repo identifier (the 'before' snapshot)"},
                    "repo_b": {"type": "string", "description": "Second repo identifier (the 'after' snapshot)"},
                },
                "required": ["repo_a", "repo_b"],
            },
        ),
        Tool(
            name="get_class_hierarchy",
            description="Get the full inheritance hierarchy for a class: ancestors (base classes via extends/implements) and descendants (subclasses/implementors). Works across Python, Java, TypeScript, C#, and any language where class signatures contain 'extends' or 'implements'.",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {"type": "string", "description": "Repository identifier (owner/repo or just repo name)"},
                    "class_name": {"type": "string", "description": "Name of the class to analyse"},
                },
                "required": ["repo", "class_name"],
            },
        ),
        Tool(
            name="get_related_symbols",
            description="Find symbols related to a given symbol using heuristic clustering: same-file co-location (weight 3), shared importers (weight 1.5), and name-token overlap (weight 0.5/token). Useful for discovering what else to read when exploring an unfamiliar codebase.",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {"type": "string", "description": "Repository identifier (owner/repo or just repo name)"},
                    "symbol_id": {"type": "string", "description": "ID of the symbol to find relatives for"},
                    "max_results": {"type": "integer", "description": "Maximum results (default 10, max 50)", "default": 10},
                },
                "required": ["repo", "symbol_id"],
            },
        ),
        Tool(
            name="suggest_queries",
            description="Suggest search queries, entry-point files, and index stats. Good first call on an unfamiliar repo — surfaces most-imported files, top keywords, and ready-to-run example queries.",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {"type": "string", "description": "Repository identifier (owner/repo or just repo name)"},
                },
                "required": ["repo"],
            },
        ),
        Tool(
            name="get_blast_radius",
            description="Find all files affected by changing a symbol. Returns confirmed files (import + name match) and potential files (import only, e.g. wildcard). Use before renaming or deleting a symbol. Set cross_repo=true to also find consumers in other indexed repos. Set include_source=true to get source snippets at each reference site (fix-ready context in one call).",
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)"
                    },
                    "symbol": {
                        "type": "string",
                        "description": "Symbol name or ID to analyse (e.g. 'calculateScore' or a full symbol ID)"
                    },
                    "depth": {
                        "type": "integer",
                        "description": "Import hops to traverse (1 = direct importers only, max 3). Default 1.",
                        "default": 1
                    },
                    "include_depth_scores": {
                        "type": "boolean",
                        "description": "When true, adds impact_by_depth (files grouped by hop distance) and per-depth risk scores. overall_risk_score and direct_dependents_count are always included. Default false.",
                        "default": False
                    },
                    "cross_repo": {
                        "type": "boolean",
                        "description": "When true, also find files in other indexed repos that consume this repo's package. Default: false.",
                        "default": False,
                    },
                    "call_depth": {
                        "type": "integer",
                        "description": "When > 0, also find symbols that *call* this symbol (call-level analysis). Returns a callers list alongside the import-level confirmed/potential. Max 3. Default 0 (disabled).",
                        "default": 0,
                    },
                    "fqn": {
                        "type": "string",
                        "description": "PHP fully-qualified class name (e.g. 'App\\Models\\User'). Resolves to symbol via PSR-4. Alternative to symbol."
                    },
                    "decorator_filter": {
                        "type": "string",
                        "description": "Optional: filter confirmed results to only those containing symbols with this decorator (case-insensitive substring match)"
                    },
                    "include_source": {
                        "type": "boolean",
                        "description": "When true, each confirmed file includes source_snippets (lines referencing the symbol) and symbols_in_file (nearby symbol signatures). Use for fix-ready context without extra tool calls. Default false.",
                        "default": False,
                    },
                    "source_budget": {
                        "type": "integer",
                        "description": "Max tokens for source snippets across all files (default 8000). Files are prioritized by reference count.",
                        "default": 8000,
                    },
                },
                "required": ["repo", "symbol"]
            }
        ),
        Tool(
            name="get_call_hierarchy",
            description=(
                "Return incoming callers and outgoing callees for a symbol, N levels deep. "
                "Uses AST-derived call detection: callers = symbols in importing files that "
                "mention this name; callees = imported symbols mentioned in this symbol's body. "
                "Useful for understanding how a symbol fits into the call graph before refactoring. "
                "For a 'what breaks if I delete this?' answer, use get_impact_preview instead."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)"
                    },
                    "symbol_id": {
                        "type": "string",
                        "description": "Symbol name or full ID to analyse. Use search_symbols to find IDs."
                    },
                    "direction": {
                        "type": "string",
                        "enum": ["callers", "callees", "both"],
                        "description": "'callers' = who calls this symbol; 'callees' = what this symbol calls; 'both' (default).",
                        "default": "both",
                    },
                    "depth": {
                        "type": "integer",
                        "description": "Maximum hops to traverse (1–5). Default 3.",
                        "default": 3,
                    },
                },
                "required": ["repo", "symbol_id"],
            },
        ),
        Tool(
            name="get_impact_preview",
            description=(
                "Show what breaks if a symbol is removed or renamed. "
                "Walks the call graph transitively to find every symbol that calls this one, "
                "returning affected symbols grouped by file with call-chain paths. "
                "Use this before deleting or renaming a symbol to understand full impact. "
                "For a structured caller/callee tree, use get_call_hierarchy instead."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)"
                    },
                    "symbol_id": {
                        "type": "string",
                        "description": "Symbol name or full ID to analyse. Use search_symbols to find IDs."
                    },
                },
                "required": ["repo", "symbol_id"],
            },
        ),
        Tool(
            name="get_dependency_cycles",
            description=(
                "Detect circular import chains in a repository. "
                "Returns every strongly-connected component (set of files that mutually import "
                "each other, directly or transitively). Run this to identify architectural "
                "problems before a refactor, or to understand why a module is hard to test in isolation."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)"
                    },
                },
                "required": ["repo"],
            },
        ),
        Tool(
            name="get_coupling_metrics",
            description=(
                "Return afferent coupling (Ca), efferent coupling (Ce), and instability score "
                "for a file/module. Ca = files that import this module (dependents). "
                "Ce = files this module imports (dependencies). "
                "Instability I = Ce/(Ca+Ce): 0 = stable, 1 = unstable. "
                "Use to identify fragile modules and guide refactoring priorities."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)"
                    },
                    "module_path": {
                        "type": "string",
                        "description": "File path within the repo (e.g. 'src/utils.py')"
                    },
                },
                "required": ["repo", "module_path"],
            },
        ),
        Tool(
            name="get_layer_violations",
            description=(
                "Check whether imports respect declared architectural layer boundaries. "
                "Reports every import that crosses a forbidden layer boundary. "
                "Layer rules can be passed directly or defined in .jcodemunch.jsonc under "
                "'architecture.layers'. Use to enforce clean architecture and detect "
                "dependency-direction violations (e.g. API layer importing DB layer directly)."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)"
                    },
                    "rules": {
                        "type": "array",
                        "description": (
                            "Layer definitions. Each entry: {name, paths: [...], may_not_import: [...]}. "
                            "If omitted, reads from .jcodemunch.jsonc architecture.layers."
                        ),
                        "items": {"type": "object"},
                    },
                },
                "required": ["repo"],
            },
        ),
        Tool(
            name="check_rename_safe",
            description=(
                "Check whether renaming a symbol to a new name would cause name collisions. "
                "Scans the symbol's own file and every file that imports it, "
                "looking for an existing symbol with the proposed new name. "
                "Returns safe=true when no collisions are found. "
                "Run this before any rename/refactor to avoid silent breakage."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)",
                    },
                    "symbol_id": {
                        "type": "string",
                        "description": (
                            "Symbol ID to rename (e.g. 'src/utils.py::helper#function'). "
                            "Bare name accepted when unambiguous."
                        ),
                    },
                    "new_name": {
                        "type": "string",
                        "description": "Proposed new symbol name (not a full ID, just the name).",
                    },
                },
                "required": ["repo", "symbol_id", "new_name"],
            },
        ),
        Tool(
            name="get_dead_code_v2",
            description=(
                "Find likely-dead functions and methods using three independent evidence signals: "
                "(1) the symbol's file is not reachable from any entry point via the import graph, "
                "(2) no indexed symbol calls this symbol in the call graph, "
                "(3) the symbol name is not re-exported from any __init__ or barrel file. "
                "Each result includes a confidence score (0.33 = 1 signal, 0.67 = 2 signals, 1.0 = all 3). "
                "More reliable than single-signal dead-code detection. "
                "Use min_confidence=0.67 for high-confidence results only."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)",
                    },
                    "min_confidence": {
                        "type": "number",
                        "description": "Minimum confidence threshold 0.0–1.0 (default 0.5 = at least 2/3 signals).",
                        "default": 0.5,
                    },
                    "include_tests": {
                        "type": "boolean",
                        "description": "Include test files in analysis (default false).",
                        "default": False,
                    },
                },
                "required": ["repo"],
            },
        ),
        Tool(
            name="get_extraction_candidates",
            description=(
                "Identify functions in a file that are good candidates for extraction to a shared module. "
                "A candidate must have high cyclomatic complexity (doing a lot) AND "
                "be called from multiple other files (already implicitly shared). "
                "Results are ranked by score = complexity × caller_file_count. "
                "Requires re-indexing with jcodemunch-mcp >= 1.16 to populate complexity data."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)",
                    },
                    "file_path": {
                        "type": "string",
                        "description": "Relative file path within the repo (e.g. 'src/utils.py').",
                    },
                    "min_complexity": {
                        "type": "integer",
                        "description": "Minimum cyclomatic complexity threshold (default 5).",
                        "default": 5,
                    },
                    "min_callers": {
                        "type": "integer",
                        "description": "Minimum number of distinct caller files (default 2).",
                        "default": 2,
                    },
                },
                "required": ["repo", "file_path"],
            },
        ),
        Tool(
            name="get_symbol_complexity",
            description=(
                "Return cyclomatic complexity, nesting depth, and parameter count for a single symbol. "
                "Complexity data is stored at index time (requires jcodemunch-mcp >= 1.16 / INDEX_VERSION 7). "
                "assessment field: 'low' (1-4), 'medium' (5-10), 'high' (11+). "
                "Re-index the repo if all metrics show 0 (pre-1.16 index)."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)",
                    },
                    "symbol_id": {
                        "type": "string",
                        "description": "Full symbol ID as returned by search_symbols or get_file_outline.",
                    },
                },
                "required": ["repo", "symbol_id"],
            },
        ),
        Tool(
            name="get_churn_rate",
            description=(
                "Return git churn metrics for a file or symbol: commit count, unique authors, "
                "first_seen date, last_modified date, and churn_per_week over a configurable window. "
                "assessment: 'stable' (<=1/week), 'active' (<=3/week), 'volatile' (>3/week). "
                "Requires a locally indexed repo (index_folder); GitHub-indexed repos are not supported."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)",
                    },
                    "target": {
                        "type": "string",
                        "description": "Relative file path (e.g. 'src/utils.py') or a full symbol ID.",
                    },
                    "days": {
                        "type": "integer",
                        "description": "Look-back window in days (default 90).",
                        "default": 90,
                    },
                },
                "required": ["repo", "target"],
            },
        ),
        Tool(
            name="get_hotspots",
            description=(
                "Return the top-N highest-risk symbols ranked by hotspot score = "
                "cyclomatic_complexity x log(1 + commits_last_N_days). "
                "Identifies code that is both complex and frequently changed — the highest "
                "bug-introduction risk in the codebase. Methodology matches CodeScene/Adam Tornhill. "
                "Requires jcodemunch-mcp >= 1.16 for complexity data and a locally indexed repo for churn."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)",
                    },
                    "top_n": {
                        "type": "integer",
                        "description": "Number of results to return (default 20).",
                        "default": 20,
                    },
                    "days": {
                        "type": "integer",
                        "description": "Churn look-back window in days (default 90).",
                        "default": 90,
                    },
                    "min_complexity": {
                        "type": "integer",
                        "description": "Minimum cyclomatic complexity to include (default 2).",
                        "default": 2,
                    },
                },
                "required": ["repo"],
            },
        ),
        Tool(
            name="get_repo_health",
            description=(
                "Return a one-call triage snapshot of the entire repository: symbol counts, "
                "dead code %, average cyclomatic complexity, top 5 hotspots, dependency cycle count, "
                "and unstable module count. "
                "Designed to be the first tool called in any new session — one call gives a complete "
                "picture to guide follow-up analysis."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)",
                    },
                    "days": {
                        "type": "integer",
                        "description": "Churn look-back window for hotspot calculation (default 90).",
                        "default": 90,
                    },
                },
                "required": ["repo"],
            },
        ),
        Tool(
            name="get_untested_symbols",
            description=(
                "Find functions and methods with no evidence of being exercised by any test file. "
                "Uses import-graph reachability + name matching (AST call_references when available, "
                "word-boundary text heuristic as fallback). Returns symbols classified as 'unreached' "
                "(no test file imports the source file) or 'imported_not_called' (test imports the "
                "module but no test references this specific function). "
                "This is heuristic reachability, NOT runtime coverage — it answers 'does any test "
                "reference this symbol?' rather than 'what % of lines are covered.' "
                "Use after get_repo_health for a deeper quality picture."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)",
                    },
                    "file_pattern": {
                        "type": "string",
                        "description": "Optional glob to narrow which source files are analysed (e.g. 'src/**/*.py').",
                    },
                    "min_confidence": {
                        "type": "number",
                        "description": "Minimum confidence to include (0.0–1.0, default 0.5).",
                        "default": 0.5,
                    },
                    "max_results": {
                        "type": "integer",
                        "description": "Cap on returned symbols (default 100).",
                        "default": 100,
                    },
                },
                "required": ["repo"],
            },
        ),
        Tool(
            name="get_symbol_importance",
            description=(
                "Return the most architecturally important symbols in a repo, ranked by "
                "PageRank or in-degree centrality on the import graph. Useful for "
                "orientation: surfaces the symbols that most of the codebase depends on. "
                "New tool: use after indexing to understand repo architecture at a glance."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {"type": "string", "description": "Repository identifier (owner/repo or just repo name)"},
                    "top_n": {"type": "integer", "description": "Number of top symbols to return (default 20, max 200)", "default": 20},
                    "algorithm": {
                        "type": "string",
                        "enum": ["pagerank", "degree"],
                        "description": "'pagerank' (default) = full PageRank on import graph; 'degree' = simple in-degree count (faster).",
                        "default": "pagerank",
                    },
                    "scope": {"type": "string", "description": "Limit to a subdirectory prefix (e.g. 'src/core')"},
                },
                "required": ["repo"],
            },
        ),
        Tool(
            name="find_dead_code",
            description=(
                "Find dead code — files and symbols with zero importers and no entry-point role. "
                "Uses the import graph to identify unreachable code. Returns confidence scores "
                "(1.0 = provably unreachable, 0.7 = all importers are themselves dead). "
                "Set granularity='file' for file-level results only."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {"type": "string", "description": "Repository identifier (owner/repo or just repo name)"},
                    "granularity": {
                        "type": "string",
                        "enum": ["symbol", "file"],
                        "description": "'symbol' (default) returns dead symbols; 'file' returns dead files only.",
                        "default": "symbol",
                    },
                    "min_confidence": {
                        "type": "number",
                        "description": "Minimum confidence threshold 0.0–1.0. Default 0.8. Use 1.0 for provably unreachable only.",
                        "default": 0.8,
                    },
                    "include_tests": {
                        "type": "boolean",
                        "description": "Treat test files as live roots (default false — test files are excluded from dead code candidates).",
                        "default": False,
                    },
                    "entry_point_patterns": {
                        "type": "array",
                        "items": {"type": "string"},
                        "description": "Additional glob patterns to treat as live roots (e.g. 'cli/*.py', 'scripts/*').",
                    },
                },
                "required": ["repo"],
            },
        ),
        Tool(
            name="get_ranked_context",
            description=(
                "Assemble the best-fit context for a query within a token budget. "
                "Ranks all symbols by relevance (BM25) and/or centrality (PageRank), "
                "loads source for the top candidates, and packs greedily until token_budget is exhausted. "
                "Use when you want 'the best N tokens of context for this task' without specifying exact symbols."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {"type": "string", "description": "Repository identifier (owner/repo or just repo name)"},
                    "query": {"type": "string", "description": "Natural language or identifier describing the task (max 500 chars)"},
                    "token_budget": {
                        "type": "integer",
                        "description": "Hard cap on returned tokens (default 4000).",
                        "default": 4000,
                    },
                    "strategy": {
                        "type": "string",
                        "enum": ["combined", "bm25", "centrality"],
                        "description": (
                            "'combined' (default) = BM25 + PageRank weighted sum. "
                            "'bm25' = pure text relevance. "
                            "'centrality' = PageRank only, filtered to query-matching symbols."
                        ),
                        "default": "combined",
                    },
                    "include_kinds": {
                        "type": "array",
                        "items": {"type": "string"},
                        "description": "Optional list of symbol kinds to restrict results (e.g. ['class', 'function']).",
                    },
                    "scope": {
                        "type": "string",
                        "description": "Optional glob pattern to limit search to a subdirectory (e.g. 'src/core/*').",
                    },
                },
                "required": ["repo", "query"],
            },
        ),
        Tool(
            name="get_changed_symbols",
            description=(
                "Map a git diff to affected symbols: given two commits, returns which symbols "
                "were added, removed, modified, or renamed. Useful after merging a PR to answer "
                "'what actually changed?' for code review or regression triage. "
                "Requires a locally indexed repo (index_folder). "
                "Defaults to comparing current HEAD against the SHA stored at index time."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {"type": "string", "description": "Repository identifier — must be locally indexed with index_folder"},
                    "since_sha": {
                        "type": "string",
                        "description": "Compare from this git SHA or ref. Defaults to the SHA stored at index time.",
                    },
                    "until_sha": {
                        "type": "string",
                        "description": "Compare to this git SHA or ref (default 'HEAD').",
                        "default": "HEAD",
                    },
                    "include_blast_radius": {
                        "type": "boolean",
                        "description": "Also return downstream importers (blast radius) for each changed symbol (default false).",
                        "default": False,
                    },
                    "max_blast_depth": {
                        "type": "integer",
                        "description": "Hop limit when include_blast_radius=true (default 3, max 5).",
                        "default": 3,
                    },
                },
                "required": ["repo"],
            },
        ),
        Tool(
            name="embed_repo",
            description=(
                "Precompute and cache symbol embeddings for semantic search. "
                "Optional warm-up: search_symbols with semantic=true lazily embeds missing "
                "symbols on first use, but embed_repo warms the cache upfront so the first "
                "semantic query returns immediately. "
                "Requires an embedding provider (JCODEMUNCH_EMBED_MODEL, "
                "GOOGLE_API_KEY+GOOGLE_EMBED_MODEL, or OPENAI_API_KEY+OPENAI_EMBED_MODEL)."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Repository identifier (owner/repo or just repo name)",
                    },
                    "batch_size": {
                        "type": "integer",
                        "description": "Symbols per embedding batch (default 50).",
                        "default": 50,
                    },
                    "force": {
                        "type": "boolean",
                        "description": "Recompute all embeddings even if they already exist (default false).",
                        "default": False,
                    },
                },
                "required": ["repo"],
            },
        ),
        Tool(
            name="get_cross_repo_map",
            description=(
                "Return which indexed repos depend on which other indexed repos at the package level. "
                "Shows the full cross-repository dependency map based on package names extracted from "
                "manifest files (pyproject.toml, package.json, go.mod, Cargo.toml, etc.). "
                "Use to visualize how your indexed repos are interconnected. "
                "Pass repo to filter to a single repo's perspective."
            ),
            inputSchema={
                "type": "object",
                "properties": {
                    "repo": {
                        "type": "string",
                        "description": "Optional repo ID to filter. If omitted, returns the full cross-repo map.",
                    },
                },
            },
        ),
    ]
    # Filter out disabled tools
    disabled = config_module.get("disabled_tools", [])
    if disabled:
        tools = [t for t in tools if t.name not in disabled]

    # SQL gating: auto-disable search_columns when SQL not in languages
    languages = config_module.get("languages")
    if languages is not None and "sql" not in languages:
        tools = [t for t in tools if t.name != "search_columns"]

    # Merge descriptions from config (runs after disabled_tools filter)
    _apply_description_overrides(tools)

    return tools


def _apply_description_overrides(tools: list) -> None:
    """Apply description overrides from config to tool schemas."""
    descriptions = config_module.get_descriptions()
    if not descriptions:
        return

    shared = descriptions.get("_shared", {})

    for tool in tools:
        raw = descriptions.get(tool.name)
        if raw is None:
            tool_desc: dict = {}
        elif isinstance(raw, str):
            # Flat format: "tool_name": "description" → override tool description only
            tool.description = raw
            tool_desc = {}
        else:
            tool_desc = raw

        # Nested format: override tool-level description via "_tool" key
        # "_tool": "" means "use hardcoded minimal base only" (empty string override)
        if "_tool" in tool_desc:
            tool.description = tool_desc["_tool"]

        # Override parameter descriptions (applies even if only _shared is set)
        if isinstance(tool.inputSchema, dict):
            props = tool.inputSchema.get("properties", {})
            for param_name, param_schema in props.items():
                if not isinstance(param_schema, dict):
                    continue
                # Tool-specific override takes precedence over _shared
                # Empty string means "use hardcoded minimal base only"
                desc_override = tool_desc.get(param_name)
                if desc_override is None:
                    desc_override = shared.get(param_name)
                if desc_override is not None:
                    props[param_name] = {**param_schema, "description": desc_override}


@server.list_resources()
async def list_resources() -> list[Resource]:
    """Return empty resource list for client compatibility (e.g. Windsurf)."""
    return []


_WORKFLOW_PROMPT_TEXT = """\
# jcodemunch-mcp — Workflow Guide

Use these tools instead of Grep/Read/search for any indexed repository.

## Step-by-step

1. **list_repos** — check if the project is already indexed.
   - If not found, run **index_folder** (local) or **index_repo** (GitHub URL).

2. **search_symbols** — find functions, classes, methods by name or description.
   - Use `detail_level: "full"` to get source inline, or follow up with **get_symbol_source**.

3. **get_context_bundle** — get symbol source + its imports in one call.

4. **search_text** — fall back to full-text / regex search for string literals or comments.

5. **get_file_outline** — list all symbols in a file without reading the whole thing.

## Claude Code deferred-tool note

jcodemunch tools may appear as *deferred* in your system-reminder. Call **ToolSearch** with
a query like `"list repos"` or `"search symbols"` to load the full schema before use.
Set `discovery_hint: false` in config.jsonc to suppress the reminder in tool descriptions.
"""

_EXPLORE_PROMPT_TEXT = """\
# Explore — Build a mental model of an unfamiliar repo

Goal: Onboard to a repo you've never seen before.

1. **list_repos** → check if indexed. If not, run **index_folder** (local) or **index_repo** (GitHub).
2. **get_repo_outline** → directory structure, languages, most-imported files, most-central symbols (PageRank).
3. **get_repo_health** → dead code %, avg complexity, hotspots, dependency cycles, unstable modules.
4. **get_file_outline** on the 2–3 most-central files → understand the core.
5. **get_class_hierarchy** → inheritance structure (if OOP codebase).
6. **get_dependency_graph** on the entry point file (`direction="importers"`, `depth=2`) → what depends on the core.
7. **search_symbols** with `sort_by="centrality"` → find the most important symbols across the repo.
"""

_ASSESS_PROMPT_TEXT = """\
# Assess — Pre-merge impact analysis

Goal: Understand the blast radius of a change before merging.

1. **get_changed_symbols** → map the git diff to added/removed/modified/renamed symbols.
2. **get_blast_radius** on each changed file → depth-scored transitive impact + `has_test_reach` per file.
3. **get_impact_preview** on key changed symbols → "what breaks?" analysis.
4. **check_rename_safe** if any symbols were renamed → verify no broken refs.
5. **get_untested_symbols** on affected files → flag unreached symbols in the blast radius.
6. **get_coupling_metrics** on changed files → check if the change increases coupling.
7. **get_dependency_cycles** → check if the change introduces new cycles.
"""

_TRIAGE_PROMPT_TEXT = """\
# Triage — Diagnose a repo's code quality

Goal: Get a complete health picture in one guided session.

1. **get_repo_health** → one-call snapshot (dead code %, complexity, hotspots, cycles, unstable modules).
2. **find_dead_code** with `min_confidence=0.8` → high-confidence dead code candidates for removal.
3. **get_untested_symbols** → functions with no test-file reachability.
4. **get_dependency_cycles** → full cycle list with file paths.
5. **get_hotspots** with `top_n=10`, `days=90` → highest-risk symbols by complexity × churn.
6. **get_layer_violations** → architectural boundary violations.
7. **get_extraction_candidates** → functions that should be refactored out.
8. **get_coupling_metrics** on hotspot files → instability analysis.
"""

_TRACE_PROMPT_TEXT = """\
# Trace — Investigate a bug through the call graph

Goal: Follow a suspected bug from symptom to root cause.

1. **search_symbols** for the function name or error message keyword.
2. **get_symbol_source** on the suspect symbol → read the implementation.
3. **get_call_hierarchy** with `direction="callers"`, `depth=3` → who calls this?
4. **get_call_hierarchy** with `direction="callees"`, `depth=2` → what does it call?
5. **get_context_bundle** on the suspect symbol → full source + imports in one call.
6. **find_references** for the symbol name → all files that reference it.
7. **get_blast_radius** on the suspect file → what else could be affected?
8. **get_symbol_diff** if a recent change is suspected → compare current vs. previous version.
"""


@server.list_prompts()
async def list_prompts() -> list[Prompt]:
    """Return available workflow guidance prompts."""
    return [
        Prompt(
            name="workflow",
            description="Step-by-step guide for using jcodemunch-mcp tools in Claude Code.",
        ),
        Prompt(
            name="explore",
            description="Build a mental model of an unfamiliar repo.",
        ),
        Prompt(
            name="assess",
            description="Pre-merge impact analysis — blast radius, reachability, coupling.",
        ),
        Prompt(
            name="triage",
            description="Diagnose a repo's code quality — dead code, hotspots, cycles.",
        ),
        Prompt(
            name="trace",
            description="Investigate a bug through the call graph from symptom to root cause.",
        ),
    ]


_PROMPT_MAP: dict[str, tuple[str, str]] = {
    "workflow": (_WORKFLOW_PROMPT_TEXT, "jcodemunch-mcp workflow guide for Claude Code."),
    "explore": (_EXPLORE_PROMPT_TEXT, "Explore — build a mental model of an unfamiliar repo."),
    "assess": (_ASSESS_PROMPT_TEXT, "Assess — pre-merge impact analysis."),
    "triage": (_TRIAGE_PROMPT_TEXT, "Triage — diagnose a repo's code quality."),
    "trace": (_TRACE_PROMPT_TEXT, "Trace — investigate a bug through the call graph."),
}


@server.get_prompt()
async def get_prompt(name: str, arguments: dict | None = None) -> GetPromptResult:
    """Return the requested prompt content."""
    entry = _PROMPT_MAP.get(name)
    if entry is None:
        raise ValueError(f"Unknown prompt: {name}")
    text, description = entry
    return GetPromptResult(
        description=description,
        messages=[
            PromptMessage(
                role="user",
                content=TextContent(type="text", text=text),
            )
        ],
    )


@server.call_tool(validate_input=False)
async def call_tool(name: str, arguments: dict) -> list[TextContent]:
    """Handle tool calls."""
    storage_path = os.environ.get("CODE_INDEX_PATH")
    logger.info("tool_call: %s args=%s", name, {k: v for k, v in arguments.items() if k != "content"})

    try:   # main handler try starts here, before coerce
        # Coerce stringified booleans/integers/numbers before routing
        schema = (await _ensure_tool_schemas()).get(name)
        if schema:
            arguments = _coerce_arguments(arguments, schema)
            try:
                jsonschema.validate(instance=arguments, schema=schema)
            except jsonschema.ValidationError as e:
                return [TextContent(type="text", text=json.dumps(
                    {"error": f"Input validation error: {e.message}"}, indent=2
                ))]

        # Strict freshness mode: wait for any in-progress reindex to complete
        # before serving query results (except for write/index tools).
        # MUST use asyncio.to_thread — threading.Event.wait() cannot run on the event loop.
        repo_arg = arguments.get("repo")
        if (name not in _EXCLUDED_FROM_STRICT and repo_arg):
            strict_ms = config_module.get("strict_timeout_ms", 500)
            await asyncio.to_thread(await_freshness_if_strict, repo_arg, timeout_ms=strict_ms)

        # Project-level tool disabling: check if tool is disabled for this project
        # Global disabled tools are filtered out in list_tools() schema; project-level
        # rejection happens here since schema is global (can't be changed per-project).
        if config_module.is_tool_disabled(name, repo=repo_arg):
            return [TextContent(type="text", text=json.dumps({
                "error": (
                    f"Tool '{name}' is disabled in this project's configuration. "
                    f"Project-level tool disabling is set via the 'disabled_tools' key "
                    f"in the .jcodemunch.jsonc file. Remove '{name}' from 'disabled_tools' to re-enable."
                )
            }, indent=2))]

        if name == "index_repo":
            from .tools.index_repo import index_repo
            result = await index_repo(
                url=arguments["url"],
                use_ai_summaries=arguments.get("use_ai_summaries", _default_use_ai_summaries()),
                storage_path=storage_path,
                incremental=arguments.get("incremental", True),
                extra_ignore_patterns=arguments.get("extra_ignore_patterns"),
            )
            _result_cache_invalidate()
        elif name == "index_folder":
            from .tools.index_folder import index_folder
            _ai = arguments.get("use_ai_summaries", _default_use_ai_summaries())
            result = await asyncio.to_thread(
                functools.partial(
                    index_folder,
                    path=arguments["path"],
                    use_ai_summaries=_ai,
                    storage_path=storage_path,
                    extra_ignore_patterns=arguments.get("extra_ignore_patterns"),
                    follow_symlinks=arguments.get("follow_symlinks", False),
                    incremental=arguments.get("incremental", True),
                )
            )
            _result_cache_invalidate()
        elif name == "summarize_repo":
            from .tools.summarize_repo import summarize_repo
            result = await asyncio.to_thread(
                functools.partial(
                    summarize_repo,
                    repo=arguments["repo"],
                    force=arguments.get("force", False),
                    storage_path=storage_path,
                )
            )
        elif name == "index_file":
            from .tools.index_file import index_file
            _ai = arguments.get("use_ai_summaries", _default_use_ai_summaries())
            result = await asyncio.to_thread(
                functools.partial(
                    index_file,
                    path=arguments["path"],
                    use_ai_summaries=_ai,
                    storage_path=storage_path,
                    context_providers=arguments.get("context_providers", True),
                )
            )
            _result_cache_invalidate()
        elif name == "list_repos":
            from .tools.list_repos import list_repos
            result = await asyncio.to_thread(
                functools.partial(list_repos, storage_path=storage_path)
            )
        elif name == "resolve_repo":
            from .tools.resolve_repo import resolve_repo
            result = await asyncio.to_thread(
                functools.partial(
                    resolve_repo,
                    path=arguments["path"],
                    storage_path=storage_path,
                )
            )
        elif name == "get_file_tree":
            from .tools.get_file_tree import get_file_tree
            result = await asyncio.to_thread(
                functools.partial(
                    get_file_tree,
                    repo=arguments["repo"],
                    path_prefix=arguments.get("path_prefix", ""),
                    include_summaries=arguments.get("include_summaries", False),
                    max_files=arguments.get("max_files"),
                    storage_path=storage_path,
                )
            )
        elif name == "get_file_outline":
            from .tools.get_file_outline import get_file_outline
            result = await asyncio.to_thread(
                functools.partial(
                    get_file_outline,
                    repo=arguments["repo"],
                    file_path=arguments.get("file_path") or arguments.get("file"),
                    file_paths=arguments.get("file_paths"),
                    storage_path=storage_path,
                )
            )
        elif name == "get_file_content":
            from .tools.get_file_content import get_file_content
            result = await asyncio.to_thread(
                functools.partial(
                    get_file_content,
                    repo=arguments["repo"],
                    file_path=arguments["file_path"],
                    start_line=arguments.get("start_line"),
                    end_line=arguments.get("end_line"),
                    storage_path=storage_path,
                )
            )
        elif name == "get_symbol_source":
            from .tools.get_symbol import get_symbol_source
            result = await asyncio.to_thread(
                functools.partial(
                    get_symbol_source,
                    repo=arguments["repo"],
                    symbol_id=arguments.get("symbol_id"),
                    symbol_ids=arguments.get("symbol_ids"),
                    verify=arguments.get("verify", False),
                    context_lines=arguments.get("context_lines", 0),
                    storage_path=storage_path,
                    fqn=arguments.get("fqn"),
                )
            )
        elif name == "search_symbols":
            from .tools.search_symbols import search_symbols
            kind_filter = arguments.get("kind")
            if kind_filter and kind_filter not in VALID_KINDS:
                result = {"error": f"Unknown kind '{kind_filter}'. Valid values: {sorted(VALID_KINDS)}"}
            else:
                result = await asyncio.to_thread(
                    functools.partial(
                        search_symbols,
                        repo=arguments["repo"],
                        query=arguments["query"],
                        kind=kind_filter,
                        file_pattern=arguments.get("file_pattern"),
                        language=arguments.get("language"),
                        decorator=arguments.get("decorator"),
                        max_results=arguments.get("max_results", 10),
                        token_budget=arguments.get("token_budget"),
                        detail_level=arguments.get("detail_level", "standard"),
                        debug=arguments.get("debug", False),
                        fuzzy=arguments.get("fuzzy", False),
                        fuzzy_threshold=arguments.get("fuzzy_threshold", 0.4),
                        max_edit_distance=arguments.get("max_edit_distance", 2),
                        sort_by=arguments.get("sort_by", "relevance"),
                        semantic=arguments.get("semantic", False),
                        semantic_weight=arguments.get("semantic_weight", 0.5),
                        semantic_only=arguments.get("semantic_only", False),
                        storage_path=storage_path,
                        fqn=arguments.get("fqn"),
                    )
                )
        elif name == "invalidate_cache":
            from .tools.invalidate_cache import invalidate_cache
            result = await asyncio.to_thread(
                functools.partial(
                    invalidate_cache,
                    repo=arguments["repo"],
                    storage_path=storage_path,
                )
            )
            _result_cache_invalidate()
        elif name == "search_text":
            from .tools.search_text import search_text
            result = await asyncio.to_thread(
                functools.partial(
                    search_text,
                    repo=arguments["repo"],
                    query=arguments["query"],
                    file_pattern=arguments.get("file_pattern"),
                    max_results=arguments.get("max_results", 20),
                    context_lines=arguments.get("context_lines", 0),
                    is_regex=arguments.get("is_regex", False),
                    storage_path=storage_path,
                )
            )
        elif name == "get_repo_outline":
            from .tools.get_repo_outline import get_repo_outline
            result = await asyncio.to_thread(
                functools.partial(
                    get_repo_outline,
                    repo=arguments["repo"],
                    storage_path=storage_path,
                )
            )
        elif name == "find_importers":
            from .tools.find_importers import find_importers
            result = await asyncio.to_thread(
                functools.partial(
                    find_importers,
                    repo=arguments["repo"],
                    file_path=arguments.get("file_path"),
                    file_paths=arguments.get("file_paths"),
                    max_results=arguments.get("max_results", 50),
                    storage_path=storage_path,
                    cross_repo=arguments.get("cross_repo"),
                )
            )
        elif name == "find_references":
            from .tools.find_references import find_references
            result = await asyncio.to_thread(
                functools.partial(
                    find_references,
                    repo=arguments["repo"],
                    identifier=arguments.get("identifier"),
                    identifiers=arguments.get("identifiers"),
                    max_results=arguments.get("max_results", 50),
                    storage_path=storage_path,
                    include_call_chain=arguments.get("include_call_chain", False),
                )
            )
        elif name == "check_references":
            from .tools.check_references import check_references
            result = await asyncio.to_thread(
                functools.partial(
                    check_references,
                    repo=arguments["repo"],
                    identifier=arguments.get("identifier"),
                    identifiers=arguments.get("identifiers"),
                    search_content=arguments.get("search_content", True),
                    max_content_results=arguments.get("max_content_results", 20),
                    storage_path=storage_path,
                )
            )
        elif name == "search_columns":
            from .tools.search_columns import search_columns
            result = await asyncio.to_thread(
                functools.partial(
                    search_columns,
                    repo=arguments["repo"],
                    query=arguments["query"],
                    model_pattern=arguments.get("model_pattern"),
                    max_results=arguments.get("max_results", 20),
                    storage_path=storage_path,
                )
            )
        elif name == "get_context_bundle":
            from .tools.get_context_bundle import get_context_bundle
            result = await asyncio.to_thread(
                functools.partial(
                    get_context_bundle,
                    repo=arguments["repo"],
                    symbol_id=arguments.get("symbol_id"),
                    symbol_ids=arguments.get("symbol_ids"),
                    include_callers=arguments.get("include_callers", False),
                    output_format=arguments.get("output_format", "json"),
                    token_budget=arguments.get("token_budget"),
                    budget_strategy=arguments.get("budget_strategy", "most_relevant"),
                    include_budget_report=arguments.get("include_budget_report", False),
                    storage_path=storage_path,
                    fqn=arguments.get("fqn"),
                )
            )
        elif name == "get_ranked_context":
            from .tools.get_ranked_context import get_ranked_context
            result = await asyncio.to_thread(
                functools.partial(
                    get_ranked_context,
                    repo=arguments["repo"],
                    query=arguments["query"],
                    token_budget=arguments.get("token_budget", 4000),
                    strategy=arguments.get("strategy", "combined"),
                    include_kinds=arguments.get("include_kinds"),
                    scope=arguments.get("scope"),
                    storage_path=storage_path,
                )
            )
        elif name == "get_session_stats":
            from .tools.get_session_stats import get_session_stats
            result = await asyncio.to_thread(
                functools.partial(
                    get_session_stats,
                    storage_path=storage_path,
                )
            )
        elif name == "get_session_context":
            from .tools.get_session_context import get_session_context
            result = await asyncio.to_thread(
                functools.partial(
                    get_session_context,
                    max_files=arguments.get("max_files", 50),
                    max_queries=arguments.get("max_queries", 20),
                    storage_path=storage_path,
                )
            )
        elif name == "get_session_snapshot":
            from .tools.get_session_snapshot import get_session_snapshot
            result = await asyncio.to_thread(
                functools.partial(
                    get_session_snapshot,
                    max_files=arguments.get("max_files", 10),
                    max_searches=arguments.get("max_searches", 5),
                    max_edits=arguments.get("max_edits", 10),
                    include_negative_evidence=arguments.get("include_negative_evidence", True),
                    storage_path=storage_path,
                )
            )
        elif name == "plan_turn":
            from .tools.plan_turn import plan_turn
            result = await asyncio.to_thread(
                functools.partial(
                    plan_turn,
                    repo=arguments["repo"],
                    query=arguments["query"],
                    max_recommended=arguments.get("max_recommended", 5),
                    storage_path=storage_path,
                )
            )
        elif name == "register_edit":
            from .tools.register_edit import register_edit
            result = await asyncio.to_thread(
                functools.partial(
                    register_edit,
                    repo=arguments["repo"],
                    file_paths=arguments["file_paths"],
                    reindex=arguments.get("reindex", False),
                    storage_path=storage_path,
                )
            )
        elif name == "test_summarizer":
            from .tools.test_summarizer import test_summarizer
            result = await asyncio.to_thread(
                functools.partial(
                    test_summarizer,
                    timeout_ms=arguments.get("timeout_ms", 15000),
                )
            )
        elif name == "audit_agent_config":
            from .tools.audit_agent_config import audit_agent_config
            result = await asyncio.to_thread(
                functools.partial(
                    audit_agent_config,
                    repo=arguments.get("repo"),
                    project_path=arguments.get("project_path"),
                    storage_path=storage_path,
                )
            )
        elif name == "get_dependency_graph":
            from .tools.get_dependency_graph import get_dependency_graph
            result = await asyncio.to_thread(
                functools.partial(
                    get_dependency_graph,
                    repo=arguments["repo"],
                    file=arguments["file"],
                    direction=arguments.get("direction", "imports"),
                    depth=arguments.get("depth", 1),
                    storage_path=storage_path,
                    cross_repo=arguments.get("cross_repo"),
                )
            )
        elif name == "get_blast_radius":
            from .tools.get_blast_radius import get_blast_radius
            result = await asyncio.to_thread(
                functools.partial(
                    get_blast_radius,
                    repo=arguments["repo"],
                    symbol=arguments["symbol"],
                    depth=arguments.get("depth", 1),
                    include_depth_scores=arguments.get("include_depth_scores", False),
                    storage_path=storage_path,
                    cross_repo=arguments.get("cross_repo"),
                    call_depth=arguments.get("call_depth", 0),
                    fqn=arguments.get("fqn"),
                    decorator_filter=arguments.get("decorator_filter"),
                    include_source=arguments.get("include_source", False),
                    source_budget=arguments.get("source_budget", 8000),
                )
            )
        elif name == "get_call_hierarchy":
            from .tools.get_call_hierarchy import get_call_hierarchy
            result = await asyncio.to_thread(
                functools.partial(
                    get_call_hierarchy,
                    repo=arguments["repo"],
                    symbol_id=arguments["symbol_id"],
                    direction=arguments.get("direction", "both"),
                    depth=arguments.get("depth", 3),
                    storage_path=storage_path,
                )
            )
        elif name == "get_impact_preview":
            from .tools.get_impact_preview import get_impact_preview
            result = await asyncio.to_thread(
                functools.partial(
                    get_impact_preview,
                    repo=arguments["repo"],
                    symbol_id=arguments["symbol_id"],
                    storage_path=storage_path,
                )
            )
        elif name == "get_dependency_cycles":
            from .tools.get_dependency_cycles import get_dependency_cycles
            result = await asyncio.to_thread(
                functools.partial(
                    get_dependency_cycles,
                    repo=arguments["repo"],
                    storage_path=storage_path,
                )
            )
        elif name == "get_coupling_metrics":
            from .tools.get_coupling_metrics import get_coupling_metrics
            result = await asyncio.to_thread(
                functools.partial(
                    get_coupling_metrics,
                    repo=arguments["repo"],
                    module_path=arguments["module_path"],
                    storage_path=storage_path,
                )
            )
        elif name == "get_layer_violations":
            from .tools.get_layer_violations import get_layer_violations
            result = await asyncio.to_thread(
                functools.partial(
                    get_layer_violations,
                    repo=arguments["repo"],
                    rules=arguments.get("rules"),
                    storage_path=storage_path,
                )
            )
        elif name == "check_rename_safe":
            from .tools.check_rename_safe import check_rename_safe
            result = await asyncio.to_thread(
                functools.partial(
                    check_rename_safe,
                    repo=arguments["repo"],
                    symbol_id=arguments["symbol_id"],
                    new_name=arguments["new_name"],
                    storage_path=storage_path,
                )
            )
        elif name == "get_dead_code_v2":
            from .tools.get_dead_code_v2 import get_dead_code_v2
            result = await asyncio.to_thread(
                functools.partial(
                    get_dead_code_v2,
                    repo=arguments["repo"],
                    min_confidence=arguments.get("min_confidence", 0.5),
                    include_tests=arguments.get("include_tests", False),
                    storage_path=storage_path,
                )
            )
        elif name == "get_extraction_candidates":
            from .tools.get_extraction_candidates import get_extraction_candidates
            result = await asyncio.to_thread(
                functools.partial(
                    get_extraction_candidates,
                    repo=arguments["repo"],
                    file_path=arguments["file_path"],
                    min_complexity=arguments.get("min_complexity", 5),
                    min_callers=arguments.get("min_callers", 2),
                    storage_path=storage_path,
                )
            )
        elif name == "get_symbol_complexity":
            from .tools.get_symbol_complexity import get_symbol_complexity
            result = await asyncio.to_thread(
                functools.partial(
                    get_symbol_complexity,
                    repo=arguments["repo"],
                    symbol_id=arguments["symbol_id"],
                    storage_path=storage_path,
                )
            )
        elif name == "get_churn_rate":
            from .tools.get_churn_rate import get_churn_rate
            result = await asyncio.to_thread(
                functools.partial(
                    get_churn_rate,
                    repo=arguments["repo"],
                    target=arguments["target"],
                    days=arguments.get("days", 90),
                    storage_path=storage_path,
                )
            )
        elif name == "get_hotspots":
            from .tools.get_hotspots import get_hotspots
            result = await asyncio.to_thread(
                functools.partial(
                    get_hotspots,
                    repo=arguments["repo"],
                    top_n=arguments.get("top_n", 20),
                    days=arguments.get("days", 90),
                    min_complexity=arguments.get("min_complexity", 2),
                    storage_path=storage_path,
                )
            )
        elif name == "get_repo_health":
            from .tools.get_repo_health import get_repo_health
            result = await asyncio.to_thread(
                functools.partial(
                    get_repo_health,
                    repo=arguments["repo"],
                    days=arguments.get("days", 90),
                    storage_path=storage_path,
                )
            )
        elif name == "get_symbol_diff":
            from .tools.get_symbol_diff import get_symbol_diff
            result = await asyncio.to_thread(
                functools.partial(
                    get_symbol_diff,
                    repo_a=arguments["repo_a"],
                    repo_b=arguments["repo_b"],
                    storage_path=storage_path,
                )
            )
        elif name == "get_class_hierarchy":
            from .tools.get_class_hierarchy import get_class_hierarchy
            result = await asyncio.to_thread(
                functools.partial(
                    get_class_hierarchy,
                    repo=arguments["repo"],
                    class_name=arguments["class_name"],
                    storage_path=storage_path,
                )
            )
        elif name == "get_related_symbols":
            from .tools.get_related_symbols import get_related_symbols
            result = await asyncio.to_thread(
                functools.partial(
                    get_related_symbols,
                    repo=arguments["repo"],
                    symbol_id=arguments["symbol_id"],
                    max_results=arguments.get("max_results", 10),
                    storage_path=storage_path,
                )
            )
        elif name == "suggest_queries":
            from .tools.suggest_queries import suggest_queries
            result = await asyncio.to_thread(
                functools.partial(
                    suggest_queries,
                    repo=arguments["repo"],
                    storage_path=storage_path,
                )
            )
        elif name == "get_symbol_importance":
            from .tools.get_symbol_importance import get_symbol_importance
            result = await asyncio.to_thread(
                functools.partial(
                    get_symbol_importance,
                    repo=arguments["repo"],
                    top_n=arguments.get("top_n", 20),
                    algorithm=arguments.get("algorithm", "pagerank"),
                    scope=arguments.get("scope"),
                    storage_path=storage_path,
                )
            )
        elif name == "find_dead_code":
            from .tools.find_dead_code import find_dead_code
            result = await asyncio.to_thread(
                functools.partial(
                    find_dead_code,
                    repo=arguments["repo"],
                    granularity=arguments.get("granularity", "symbol"),
                    min_confidence=arguments.get("min_confidence", 0.8),
                    include_tests=arguments.get("include_tests", False),
                    entry_point_patterns=arguments.get("entry_point_patterns"),
                    storage_path=storage_path,
                )
            )
        elif name == "get_untested_symbols":
            from .tools.get_untested_symbols import get_untested_symbols
            result = await asyncio.to_thread(
                functools.partial(
                    get_untested_symbols,
                    repo=arguments["repo"],
                    file_pattern=arguments.get("file_pattern"),
                    min_confidence=arguments.get("min_confidence", 0.5),
                    max_results=arguments.get("max_results", 100),
                    storage_path=storage_path,
                )
            )
        elif name == "get_changed_symbols":
            from .tools.get_changed_symbols import get_changed_symbols
            result = await asyncio.to_thread(
                functools.partial(
                    get_changed_symbols,
                    repo=arguments["repo"],
                    since_sha=arguments.get("since_sha"),
                    until_sha=arguments.get("until_sha", "HEAD"),
                    include_blast_radius=arguments.get("include_blast_radius", False),
                    max_blast_depth=arguments.get("max_blast_depth", 3),
                    storage_path=storage_path,
                )
            )
        elif name == "embed_repo":
            from .tools.embed_repo import embed_repo
            result = await asyncio.to_thread(
                functools.partial(
                    embed_repo,
                    repo=arguments["repo"],
                    batch_size=arguments.get("batch_size", 50),
                    force=arguments.get("force", False),
                    storage_path=storage_path,
                )
            )
        elif name == "get_cross_repo_map":
            from .tools.get_cross_repo_map import get_cross_repo_map
            result = await asyncio.to_thread(
                functools.partial(
                    get_cross_repo_map,
                    repo=arguments.get("repo"),
                    storage_path=storage_path,
                )
            )
        else:
            result = {"error": f"Unknown tool: {name}"}

        # Feature 2: Session journal recording
        if config_module.get("session_journal", True):
            try:
                from .tools.session_journal import get_journal
                journal = get_journal()
                journal.record_tool_call(name)
                # Record file reads for relevant tools
                if name in {"get_file_content", "get_file_outline", "get_symbol_source", "get_context_bundle"}:
                    if isinstance(result, dict):
                        # Extract file paths from result
                        if name == "get_file_content" and "content" in result:
                            journal.record_read(arguments.get("file_path", ""), name)
                        elif name == "get_file_outline" and "symbols" in result:
                            journal.record_read(arguments.get("file_path", ""), name)
                        elif name == "get_symbol_source":
                            # Single symbol_id → flat result with "source"
                            sym_id = arguments.get("symbol_id", "")
                            if sym_id and "::" in sym_id:
                                journal.record_read(sym_id.split("::")[0], name)
                            # Batch symbol_ids → result has "symbols" list
                            for sym in result.get("symbols", []):
                                if "file" in sym:
                                    journal.record_read(sym["file"], name)
                        elif name == "get_context_bundle" and "symbols" in result:
                            # Record all files from the bundle
                            for sym in result.get("symbols", []):
                                if "file" in sym:
                                    journal.record_read(sym["file"], name)
                # Record searches
                elif name in {"search_symbols", "search_text"}:
                    if isinstance(result, dict):
                        result_count = result.get("result_count", 0)
                        query = arguments.get("query", "")
                        if query:
                            journal.record_search(query, result_count)
                        # Collect negative evidence for session state persistence
                        ne = result.get("negative_evidence")
                        if ne and isinstance(ne, dict):
                            import time as _t
                            journal.record_negative_evidence({
                                "query": query,
                                "repo": arguments.get("repo", ""),
                                "verdict": ne.get("verdict", ""),
                                "scanned_symbols": ne.get("scanned_symbols", 0),
                                "timestamp": _t.time(),
                            })
                elif name == "get_ranked_context":
                    if isinstance(result, dict):
                        query = arguments.get("query", "")
                        if query:
                            items_included = result.get("items_included", 0)
                            journal.record_search(query, items_included)
                        ne = result.get("negative_evidence")
                        if ne and isinstance(ne, dict):
                            import time as _t
                            journal.record_negative_evidence({
                                "query": query,
                                "repo": arguments.get("repo", ""),
                                "verdict": ne.get("verdict", ""),
                                "scanned_symbols": ne.get("scanned_symbols", 0),
                                "timestamp": _t.time(),
                            })
            except Exception:
                logger.debug("Journal recording failed", exc_info=True)

        # Feature 7: Turn budget — record output and inject warnings
        try:
            budget_tokens = config_module.get("turn_budget_tokens", 20000)
            if budget_tokens > 0 and isinstance(result, dict):
                from .tools.turn_budget import get_turn_budget
                tb = get_turn_budget()
                # Reconfigure if config changed (thread-safe)
                tb.configure(budget_tokens, config_module.get("turn_gap_seconds", 30.0))
                # Auto-compact: downgrade detail_level before dispatch would be ideal,
                # but result is already computed. Inject warning + flag instead.
                result_bytes = len(json.dumps(result, default=str))
                token_count = result_bytes // 4  # ~4 bytes per token
                budget_info = tb.record_output(token_count)
                if budget_info.get("budget_warning"):
                    meta = result.setdefault("_meta", {})
                    meta["budget_warning"] = budget_info["budget_warning"]
                    meta["turn_tokens_used"] = budget_info["turn_tokens_used"]
                    meta["turn_budget_remaining"] = budget_info["turn_budget_remaining"]
                    if tb.should_compact():
                        meta["auto_compacted"] = True
                    # Also promote to top-level for visibility
                    result["budget_warning"] = budget_info["budget_warning"]
            elif budget_tokens > 0:
                # Still record token count for non-dict results (errors, etc.)
                from .tools.turn_budget import get_turn_budget
                tb = get_turn_budget()
                tb.configure(budget_tokens, config_module.get("turn_gap_seconds", 30.0))
                # Approximate token count for non-dict results
                tb.record_output(len(json.dumps(result, default=str)) // 4)
        except Exception:
            logger.debug("Turn budget recording failed", exc_info=True)

        # Agent Selector: score complexity and annotate result
        try:
            agent_selector_cfg = config_module.get("agent_selector", {})
            if isinstance(agent_selector_cfg, dict) and agent_selector_cfg.get("mode", "off") != "off":
                if isinstance(result, dict) and "error" not in result and name in _AGENT_SELECTOR_TOOLS:
                    from .agent_selector import (
                        AgentSelectorConfig, ComplexitySignals, score_complexity, route,
                    )
                    as_config = AgentSelectorConfig.from_config(agent_selector_cfg)
                    # Build signals from result metadata
                    signals = ComplexitySignals(
                        retrievalSetSize=result.get("items_included", result.get("symbol_count", 0)),
                        symbolCount=result.get("symbol_count", len(result.get("symbols", result.get("context_items", [])))),
                        crossFileReferences=result.get("cross_file_refs", 0),
                        crossProjectReferences=result.get("cross_project", False),
                        languageComplexity=result.get("language_complexity", "standard"),
                        requestTokenEstimate=result.get("used_tokens", result.get("total_tokens", 0)),
                    )
                    assessment = score_complexity(signals, as_config)
                    current_model = arguments.get("_current_model")
                    decision = route(assessment, as_config, current_model)
                    # Annotate result
                    meta = result.setdefault("_meta", {})
                    meta["agent_selector"] = {
                        "score": assessment.score,
                        "tier": assessment.tier,
                        "recommendedModel": assessment.recommendedModel,
                    }
                    if decision.prompt_text:
                        result["agent_selector_prompt"] = decision.prompt_text
                    if decision.metadata_text:
                        result["agent_selector"] = decision.metadata_text
        except Exception:
            logger.debug("Agent selector scoring failed", exc_info=True)

        if isinstance(result, dict):
            meta_fields = config_module.get("meta_fields")
            if meta_fields == [] or arguments.get("suppress_meta"):
                result.pop("_meta", None)
            elif isinstance(meta_fields, list):
                # Partial field inclusion — keep only the fields listed in meta_fields,
                # preserving tool-generated fields (timing_ms, tokens_saved, etc.)
                existing_meta = result.pop("_meta", {})
                _meta: dict[str, Any] = {}
                if "powered_by" in meta_fields:
                    _meta["powered_by"] = "jcodemunch-mcp by jgravelle · https://github.com/jgravelle/jcodemunch-mcp"
                for field in meta_fields:
                    if field in existing_meta:
                        _meta[field] = existing_meta[field]
                if _meta:
                    result["_meta"] = _meta
        # Per-call pulse for downstream consumers (dashboards, monitors)
        _saved = result.get("_meta", {}).get("tokens_saved", 0) if isinstance(result, dict) else 0
        _write_pulse(name, tokens_saved=_saved, base_path=storage_path)

        return [TextContent(type="text", text=json.dumps(result, separators=(',', ':')))]

    except KeyError as e:
        return [TextContent(type="text", text=json.dumps({"error": f"Missing required argument: {e}. Check the tool schema for correct parameter names."}, separators=(',', ':')))]
    except Exception:
        logger.error("call_tool %s failed", name, exc_info=True)
        return [TextContent(type="text", text=json.dumps({"error": f"Internal error processing {name}"}, separators=(',', ':')))]


async def _run_server_with_watcher(
    server_coro_func,
    server_args: tuple,
    watcher_kwargs: dict,
    log_path: Optional[str] = None,
) -> None:
    """Run MCP server with a background watcher in the same event loop.

    Watcher runs in quiet mode (no stderr output). If log_path is provided,
    watcher output and errors go to that file. If log_path is "auto", a temp
    file is created in the system temp directory.
    """
    if watch_folders is None:
        raise ImportError(
            "watchfiles is required for --watcher. "
            "Install with: pip install 'jcodemunch-mcp[watch]'"
        )

    import sys
    import tempfile

    # Resolve log file path
    if log_path == "auto":
        log_path = os.path.join(
            tempfile.gettempdir(),
            f"jcw_{os.getpid()}.log",
        )

    stop_event = asyncio.Event()
    watcher_task = asyncio.create_task(
        watch_folders(
            **watcher_kwargs,
            stop_event=stop_event,
            quiet=True,
            log_file=log_path,
        ),
        name="embedded-watcher",
    )

    # Give watcher a moment to start; detect early failures before blocking on server
    await asyncio.sleep(0.1)
    if watcher_task.done() and not watcher_task.cancelled():
        exc = watcher_task.exception()
        if exc is not None:
            logger.warning("Embedded watcher failed to start: %s", exc)

    try:
        await server_coro_func(*server_args)
    except asyncio.CancelledError:
        pass  # Clean shutdown via Ctrl+C
    finally:
        stop_event.set()
        from .storage import IndexStore
        IndexStore(base_path=watcher_kwargs.get("storage_path") or os.environ.get("CODE_INDEX_PATH")).close()
        try:
            await asyncio.wait_for(watcher_task, timeout=5.0)
        except (asyncio.TimeoutError, asyncio.CancelledError):
            watcher_task.cancel()
            try:
                await watcher_task
            except asyncio.CancelledError:
                pass
        except (WatcherError, Exception) as exc:
            logger.warning("Watcher stopped with error: %s", exc)


async def run_stdio_server():
    """Run the MCP server over stdio (default)."""
    import sys
    from mcp.server.stdio import stdio_server
    print(f"jcodemunch-mcp {__version__} by jgravelle · https://github.com/jgravelle/jcodemunch-mcp", file=sys.stderr)
    logger.info(
        "startup version=%s transport=stdio storage=%s ai_summaries=%s",
        __version__,
        os.path.expanduser(os.environ.get("CODE_INDEX_PATH", "~/.code-index/")),
        _default_use_ai_summaries(),
    )
    # Feature 10: Restore session state on startup
    _restore_session_state()
    try:
        async with stdio_server() as (read_stream, write_stream):
            await server.run(
                read_stream,
                write_stream,
                server.create_initialization_options(),
            )
    finally:
        from .storage import IndexStore
        IndexStore(base_path=os.environ.get("CODE_INDEX_PATH")).close()


def _make_auth_middleware():
    """Return a Starlette middleware class that checks JCODEMUNCH_HTTP_TOKEN if set."""
    token = os.environ.get("JCODEMUNCH_HTTP_TOKEN")
    if not token:
        return None

    from starlette.middleware import Middleware
    from starlette.middleware.base import BaseHTTPMiddleware
    from starlette.responses import JSONResponse

    class BearerAuthMiddleware(BaseHTTPMiddleware):
        async def dispatch(self, request, call_next):
            auth = request.headers.get("authorization", "")
            if not hmac.compare_digest(auth, f"Bearer {token}"):
                return JSONResponse(
                    {"error": "Unauthorized. Set Authorization: Bearer <JCODEMUNCH_HTTP_TOKEN> header."},
                    status_code=401,
                )
            return await call_next(request)

    return Middleware(BearerAuthMiddleware)


def _make_rate_limit_middleware():
    """Return a Starlette middleware that rate-limits by IP (optional, opt-in).

    Reads JCODEMUNCH_RATE_LIMIT env var.  Value is max requests per minute per
    client IP.  0 or unset disables rate limiting (default — no behaviour change
    for existing deployments).

    Returns a Middleware instance, or None when rate limiting is disabled.
    """
    try:
        limit = int(os.environ.get("JCODEMUNCH_RATE_LIMIT", "0"))
    except (ValueError, TypeError):
        limit = 0
    if limit <= 0:
        return None

    import collections
    import time as _time

    from starlette.middleware import Middleware
    from starlette.middleware.base import BaseHTTPMiddleware
    from starlette.responses import JSONResponse

    _WINDOW = 60.0  # seconds
    _buckets: dict[str, collections.deque] = {}

    class RateLimitMiddleware(BaseHTTPMiddleware):
        async def dispatch(self, request, call_next):
            ip = request.client.host if request.client else "unknown"
            now = _time.monotonic()
            bucket = _buckets.setdefault(ip, collections.deque())
            # Evict timestamps outside the sliding window
            while bucket and now - bucket[0] >= _WINDOW:
                bucket.popleft()
            if len(bucket) >= limit:
                retry_after = int(_WINDOW - (now - bucket[0])) + 1
                return JSONResponse(
                    {"error": f"Rate limit exceeded. Max {limit} requests per minute per IP."},
                    status_code=429,
                    headers={"Retry-After": str(retry_after)},
                )
            bucket.append(now)
            return await call_next(request)

    return Middleware(RateLimitMiddleware)


async def run_sse_server(host: str, port: int):
    """Run the MCP server with SSE transport (persistent HTTP mode)."""
    import sys
    try:
        import uvicorn
        from starlette.applications import Starlette
        from starlette.requests import Request
        from starlette.routing import Mount, Route
    except ImportError as e:
        raise ImportError(
            f"SSE transport requires additional packages: {e}. "
            'Install them with: pip install "jcodemunch-mcp[http]"'
        ) from e
    from mcp.server.sse import SseServerTransport

    sse_transport = SseServerTransport("/messages/")

    async def handle_sse(request: Request):
        async with sse_transport.connect_sse(
            request.scope, request.receive, request._send
        ) as (read_stream, write_stream):
            await server.run(
                read_stream,
                write_stream,
                server.create_initialization_options(),
            )

    middleware = []
    auth_mw = _make_auth_middleware()
    if auth_mw:
        middleware.append(auth_mw)
    rate_mw = _make_rate_limit_middleware()
    if rate_mw:
        middleware.append(rate_mw)

    starlette_app = Starlette(
        routes=[
            Route("/sse", endpoint=handle_sse),
            Mount("/messages/", app=sse_transport.handle_post_message),
        ],
        middleware=middleware,
    )

    print(
        f"jcodemunch-mcp {__version__} by jgravelle · SSE server at http://{host}:{port}/sse",
        file=sys.stderr,
    )
    logger.info(
        "startup version=%s transport=sse host=%s port=%d storage=%s",
        __version__, host, port,
        os.path.expanduser(os.environ.get("CODE_INDEX_PATH", "~/.code-index/")),
    )
    # Feature 10: Restore session state on startup
    _restore_session_state()
    config = uvicorn.Config(starlette_app, host=host, port=port, log_level="warning")
    await uvicorn.Server(config).serve()


async def run_streamable_http_server(host: str, port: int):
    """Run the MCP server with streamable-http transport (persistent HTTP mode)."""
    import sys
    import uuid
    try:
        import uvicorn
        from starlette.applications import Starlette
        from starlette.requests import Request
        from starlette.routing import Route
    except ImportError as e:
        raise ImportError(
            f"Streamable-http transport requires additional packages: {e}. "
            'Install them with: pip install "jcodemunch-mcp[http]"'
        ) from e
    from mcp.server.streamable_http import StreamableHTTPServerTransport, MCP_SESSION_ID_HEADER

    # Session registry: session_id -> (transport, background_task)
    # Keeps server.run() alive across multiple HTTP requests from the same client.
    _sessions: dict[str, StreamableHTTPServerTransport] = {}
    _session_tasks: dict[str, asyncio.Task] = {}  # type: ignore[type-arg]

    async def handle_mcp(request: Request):
        session_id = request.headers.get(MCP_SESSION_ID_HEADER)

        # Route to existing session if client sent a session ID we recognise.
        if session_id and session_id in _sessions:
            transport = _sessions[session_id]
            await transport.handle_request(request.scope, request.receive, request._send)
            # Clean up terminated sessions (e.g. after DELETE).
            if transport._terminated:
                _sessions.pop(session_id, None)
                task = _session_tasks.pop(session_id, None)
                if task and not task.done():
                    task.cancel()
            return

        # New session — generate a unique ID so the transport enforces it on
        # all subsequent requests, preventing cross-session pollution.
        new_id = uuid.uuid4().hex
        transport = StreamableHTTPServerTransport(mcp_session_id=new_id)
        _sessions[new_id] = transport

        # streams_ready is set once transport.connect() has initialised its
        # internal memory streams.  We must wait for it before calling
        # handle_request(), which writes to those streams.
        streams_ready: asyncio.Event = asyncio.Event()

        async def _session_runner() -> None:
            try:
                async with transport.connect() as (read_stream, write_stream):
                    streams_ready.set()
                    await server.run(
                        read_stream,
                        write_stream,
                        server.create_initialization_options(),
                    )
            except asyncio.CancelledError:
                pass
            finally:
                _sessions.pop(new_id, None)
                _session_tasks.pop(new_id, None)

        task = asyncio.create_task(_session_runner())
        _session_tasks[new_id] = task

        try:
            # Wait up to 10 s for the transport to be ready.
            await asyncio.wait_for(streams_ready.wait(), timeout=10.0)
        except asyncio.TimeoutError:
            task.cancel()
            _sessions.pop(new_id, None)
            _session_tasks.pop(new_id, None)
            from starlette.responses import Response as StarletteResponse
            err = StarletteResponse("Session setup timed out", status_code=500)
            await err(request.scope, request.receive, request._send)
            return

        try:
            await transport.handle_request(request.scope, request.receive, request._send)
        except Exception:
            task.cancel()
            raise

    middleware = []
    auth_mw = _make_auth_middleware()
    if auth_mw:
        middleware.append(auth_mw)
    rate_mw = _make_rate_limit_middleware()
    if rate_mw:
        middleware.append(rate_mw)

    starlette_app = Starlette(
        routes=[
            Route("/mcp", endpoint=handle_mcp, methods=["GET", "POST", "DELETE"]),
        ],
        middleware=middleware,
    )

    print(
        f"jcodemunch-mcp {__version__} by jgravelle · streamable-http server at http://{host}:{port}/mcp",
        file=sys.stderr,
    )
    logger.info(
        "startup version=%s transport=streamable-http host=%s port=%d storage=%s",
        __version__, host, port,
        os.path.expanduser(os.environ.get("CODE_INDEX_PATH", "~/.code-index/")),
    )
    # Feature 10: Restore session state on startup
    _restore_session_state()
    config = uvicorn.Config(starlette_app, host=host, port=port, log_level="warning")
    await uvicorn.Server(config).serve()


def _setup_logging(args) -> None:
    """Configure logging from parsed args."""
    log_level = getattr(logging, args.log_level)
    handlers: list[logging.Handler] = []
    if args.log_file:
        log_path = Path(args.log_file).expanduser()
        log_path.parent.mkdir(parents=True, exist_ok=True)
        handlers.append(logging.FileHandler(log_path))
    else:
        handlers.append(logging.StreamHandler())

    logging.basicConfig(
        level=log_level,
        format="%(asctime)s %(name)s %(levelname)s %(message)s",
        handlers=handlers,
    )

    extra_ext = os.environ.get("JCODEMUNCH_EXTRA_EXTENSIONS", "")
    if extra_ext:
        logging.getLogger(__name__).info("JCODEMUNCH_EXTRA_EXTENSIONS: %s", extra_ext)


def _add_common_args(parser: argparse.ArgumentParser) -> None:
    """Add logging args shared by all subcommands."""
    parser.add_argument(
        "--log-level",
        default=os.environ.get("JCODEMUNCH_LOG_LEVEL", "WARNING"),
        choices=["DEBUG", "INFO", "WARNING", "ERROR"],
        help="Log level (also via JCODEMUNCH_LOG_LEVEL env var)",
    )
    parser.add_argument(
        "--log-file",
        default=os.environ.get("JCODEMUNCH_LOG_FILE"),
        help="Log file path (also via JCODEMUNCH_LOG_FILE env var). Defaults to stderr.",
    )


def _generate_claude_md_snippet(missing_only: bool = False) -> str:
    """Return the recommended CLAUDE.md prompt-policy snippet.

    When *missing_only* is True, reads ~/.claude/CLAUDE.md and returns only
    the tools not yet mentioned in it (as a minimal addendum block).
    Returns an empty string when the file is already fully up to date.
    """
    all_tools = list(_CANONICAL_TOOL_NAMES)

    if missing_only:
        claude_md = Path.home() / ".claude" / "CLAUDE.md"
        if claude_md.exists():
            content = claude_md.read_text(encoding="utf-8", errors="replace")
            missing = [t for t in all_tools if t not in content]
            if not missing:
                return ""
            tool_lines = "\n".join(f"- {t}" for t in missing)
            return (
                f"<!-- jcodemunch-mcp: add these new tools to your existing snippet -->\n"
                f"{tool_lines}\n"
            )
        # Fall through to full generation if CLAUDE.md doesn't exist yet

    # Group tools by category for readability
    categories = [
        ("Indexing", ["index_repo", "index_folder", "summarize_repo", "index_file"]),
        ("Discovery", ["list_repos", "resolve_repo", "suggest_queries",
                       "get_repo_outline", "get_file_tree", "get_file_outline"]),
        ("Search & Retrieval", ["search_symbols", "get_symbol_source", "get_context_bundle",
                                 "get_file_content", "search_text", "search_columns",
                                 "get_ranked_context"]),
        ("Relationships", ["find_importers", "find_references", "check_references",
                           "get_dependency_graph", "get_class_hierarchy",
                           "get_related_symbols", "get_call_hierarchy"]),
        ("Impact & Safety", ["get_blast_radius", "check_rename_safe",
                              "get_impact_preview", "get_changed_symbols"]),
        ("Architecture", ["get_dependency_cycles", "get_coupling_metrics",
                          "get_layer_violations", "get_extraction_candidates",
                          "get_cross_repo_map"]),
        ("Quality & Metrics", ["get_symbol_complexity", "get_churn_rate", "get_hotspots",
                                "get_repo_health", "get_symbol_importance",
                                "find_dead_code", "get_dead_code_v2",
                                "get_untested_symbols"]),
        ("Diffs & Embeddings", ["get_symbol_diff", "embed_repo"]),
        ("Session-Aware Routing", ["plan_turn", "get_session_context", "get_session_snapshot", "register_edit"]),
        ("Utilities", ["get_session_stats", "invalidate_cache", "test_summarizer",
                        "audit_agent_config"]),
    ]
    from . import __version__ as _ver
    lines = [
        f"## jcodemunch-mcp (v{_ver})",
        "",
        "Use jcodemunch-mcp tools instead of Grep/Read/Glob for any indexed repository.",
        "",
        "### Quick start",
        "1. `list_repos` — check if the project is indexed.",
        "   If not: `index_folder` (local) or `index_repo` (GitHub URL).",
        "2. `search_symbols` — find functions/classes by name or description.",
        "3. `get_context_bundle` — symbol source + imports in one call.",
        "4. `search_text` — full-text/regex search for literals and comments.",
        "",
        "### All tools",
    ]
    for cat, tools in categories:
        lines.append(f"**{cat}:** " + ", ".join(f"`{t}`" for t in tools))
    lines.append("")
    lines.append("Never fall back to Grep, Read, or Glob for indexed repos.")
    lines.append("")
    return "\n".join(lines)


def _run_claude_md(generate: bool = False, fmt: str = "full") -> None:
    """Output the recommended CLAUDE.md snippet for the current tool set."""
    missing_only = fmt == "append"
    snippet = _generate_claude_md_snippet(missing_only=missing_only)
    if missing_only and not snippet:
        import sys as _sys
        print("CLAUDE.md is already up to date — no new tools to add.", file=_sys.stderr)
        return
    print(snippet, end="")


def _run_config(check: bool = False, init: bool = False, upgrade: bool = False) -> None:
    """Print the current effective configuration to stdout, or initialize config file."""
    from . import config as _cfg
    from . import __version__

    # Handle --upgrade
    if upgrade:
        storage_path = os.environ.get("CODE_INDEX_PATH", str(Path.home() / ".code-index"))
        config_path = Path(storage_path) / "config.jsonc"

        if not config_path.exists():
            print(f"No config file found at: {config_path}")
            print("Run `config --init` first to create one.")
            return

        added, warnings = _cfg.upgrade_config(config_path)
        if not added:
            print(f"Config is already up to date (version bumped to {__version__}).")
        else:
            print(f"Upgraded config to {__version__}. Added {len(added)} missing key(s):")
            for key in added:
                print(f"  + {key}")
        for w in warnings:
            print(f"  warning: {w}")
        return

    # Handle --init
    if init:
        storage_path = os.environ.get("CODE_INDEX_PATH", str(Path.home() / ".code-index"))
        config_path = Path(storage_path) / "config.jsonc"

        if config_path.exists():
            print(f"Config file already exists: {config_path}")
            print("Refusing to overwrite. Remove it first or use --check to validate it.")
            return

        config_path.parent.mkdir(parents=True, exist_ok=True)
        template = _cfg.generate_template()
        config_path.write_text(template, encoding="utf-8")
        print(f"Created config template: {config_path}")
        print("Edit it to customize jcodemunch-mcp settings.")
        return

    # Load config to get effective values
    _cfg.load_config()

    tty = hasattr(sys.stdout, "isatty") and sys.stdout.isatty()
    enc = getattr(sys.stdout, "encoding", "ascii") or "ascii"

    def _safe(s, fallback):
        try:
            s.encode(enc)
            return s
        except (UnicodeEncodeError, LookupError):
            return fallback

    CHECK = _safe("✓", "OK")
    CROSS = _safe("✗", "!!")
    WARN  = _safe("!", "!")

    def dim(s):   return f"\033[2m{s}\033[0m" if tty else s
    def bold(s):  return f"\033[1m{s}\033[0m" if tty else s
    def green(s): return f"\033[32m{s}\033[0m" if tty else s
    def yellow(s): return f"\033[33m{s}\033[0m" if tty else s
    def red(s):   return f"\033[31m{s}\033[0m" if tty else s

    COL = 36

    def row(name, value, source="default"):
        tag = dim(f" [{source}]") if source != "default" else dim(" (default)")
        print(f"  {name:<{COL}} {value}{tag}")

    def env(var, default=""):
        val = os.environ.get(var)
        return (val if val is not None else default), (val is None)

    def section(title):
        print(f"\n{bold(title)}")

    def cfg_row(name, key, default, source=None, fmt=None):
        """Display a config value with source indicator."""
        val = _cfg.get(key, default)
        if fmt:
            val = fmt(val)
        effective_source = source or "default"
        print(f"  {name:<{COL}} {val}{dim(f' [{effective_source}]')}")

    print(bold(f"jcodemunch-mcp {__version__} — configuration"))

    # ── Config File ───────────────────────────────────────────────────────
    section("Config File")
    storage_path = os.environ.get("CODE_INDEX_PATH", str(Path.home() / ".code-index"))
    config_path = Path(storage_path) / "config.jsonc"
    if config_path.exists():
        print(f"  {green(CHECK)} config.jsonc found: {config_path}")
    else:
        print(f"  {yellow(WARN)} config.jsonc not found: {config_path}")
        print(f"  {dim('  Using defaults + env var fallbacks. Run `config --init` to create a config file.')}")

    # ── Indexing ──────────────────────────────────────────────────────────
    section("Indexing")
    # Detect source for each config key
    # Check the actual config file content (if exists) to determine if a key was
    # explicitly set in config vs defaulted
    _loaded_keys: set = set()
    if config_path.exists():
        try:
            content = config_path.read_text(encoding="utf-8")
            stripped = _cfg._strip_jsonc(content)
            import json as _json
            _loaded_keys = set(_json.loads(stripped).keys())
        except Exception:
            pass

    def _detect_source(key, default):
        if key in _loaded_keys:
            return "config"
        env_var = next((e for e, c in _cfg.ENV_VAR_MAPPING.items() if c == key), None)
        if env_var and os.environ.get(env_var) is not None:
            return "env"
        return "default"

    def _fmt_list(v):
        if isinstance(v, list):
            return f"[{len(v)} items]" if len(v) > 3 else str(v)
        return str(v)

    row("max_folder_files", _cfg.get("max_folder_files", 2000), _detect_source("max_folder_files", 2000))
    row("max_index_files", _cfg.get("max_index_files", 10000), _detect_source("max_index_files", 10000))
    row("staleness_days", _cfg.get("staleness_days", 7), _detect_source("staleness_days", 7))
    row("max_results", _cfg.get("max_results", 500), _detect_source("max_results", 500))
    patterns = _cfg.get("extra_ignore_patterns", [])
    row("extra_ignore_patterns", _fmt_list(patterns) if patterns else dim("(none)"), _detect_source("extra_ignore_patterns", []))
    exts = _cfg.get("extra_extensions", {})
    row("extra_extensions", _fmt_list(exts) if exts else dim("(none)"), _detect_source("extra_extensions", {}))
    row("context_providers", str(_cfg.get("context_providers", True)).lower(), _detect_source("context_providers", True))
    path_map_val = _cfg.get("path_map", "")
    row("path_map", path_map_val if path_map_val else dim("(none)"), _detect_source("path_map", ""))

    # ── Meta Response Control ─────────────────────────────────────────────
    section("Meta Response Control")
    meta_fields = _cfg.get("meta_fields")
    if meta_fields is None:
        row("meta_fields", dim("(all fields)"), "config")
    elif meta_fields == []:
        row("meta_fields", dim("(none)"), _detect_source("meta_fields", []))
    else:
        row("meta_fields", _fmt_list(meta_fields), _detect_source("meta_fields", None))

    # ── Languages ─────────────────────────────────────────────────────────
    section("Languages")
    languages = _cfg.get("languages")
    if languages is None:
        row("languages", dim("(all languages)"), "default")
    else:
        row("languages", _fmt_list(languages), _detect_source("languages", None))

    # ── Disabled Tools ────────────────────────────────────────────────────
    section("Disabled Tools")
    disabled = _cfg.get("disabled_tools", [])
    row("disabled_tools", _fmt_list(disabled) if disabled else dim("(none)"), _detect_source("disabled_tools", []))

    # ── Descriptions ──────────────────────────────────────────────────────
    section("Descriptions")
    descs = _cfg.get("descriptions", {})
    row("descriptions", _fmt_list(descs) if descs else dim("(none)"), _detect_source("descriptions", {}))

    # ── AI Summarizer ─────────────────────────────────────────────────────
    section("AI Summarizer")
    use_ai_raw, use_ai_d = env("JCODEMUNCH_USE_AI_SUMMARIES", "true")
    use_ai = use_ai_raw.lower() not in ("false", "0", "no", "off")
    row("use_ai_summaries", str(use_ai).lower(), "env" if not use_ai_d else _detect_source("use_ai_summaries", True))
    provider, provider_d = env("JCODEMUNCH_SUMMARIZER_PROVIDER", "")
    row(
        "summarizer_provider",
        provider if provider else dim("(auto-detect)"),
        "env" if not provider_d else "default",
    )

    anthropic_key = os.environ.get("ANTHROPIC_API_KEY", "")
    google_key = os.environ.get("GOOGLE_API_KEY", "")
    openai_base = os.environ.get("OPENAI_API_BASE", "")
    provider_name = get_provider_name()

    if not use_ai:
        print(f"  {yellow('AI summaries disabled')} — signature fallback active")
    elif provider_name == "anthropic":
        suffix = "JCODEMUNCH_SUMMARIZER_PROVIDER=anthropic" if provider == "anthropic" else "ANTHROPIC_API_KEY set"
        print(f"  Active provider:  {green('Anthropic')}  ({suffix})")
        model, d = env("ANTHROPIC_MODEL", "claude-haiku-*")
        row("  ANTHROPIC_MODEL", model, "env" if not d else "default")
    elif provider_name == "gemini":
        suffix = "JCODEMUNCH_SUMMARIZER_PROVIDER=gemini" if provider == "gemini" else "GOOGLE_API_KEY set"
        print(f"  Active provider:  {green('Google Gemini')}  ({suffix})")
        model, d = env("GOOGLE_MODEL", "gemini-flash-*")
        row("  GOOGLE_MODEL", model, "env" if not d else "default")
    elif provider_name == "openai":
        base_label = openai_base or "https://api.openai.com/v1"
        suffix = "JCODEMUNCH_SUMMARIZER_PROVIDER=openai" if provider == "openai" else "OPENAI_API_BASE set"
        print(f"  Active provider:  {green('OpenAI-compatible')}  ({suffix})")
        row("  OPENAI_API_BASE", base_label, "env" if openai_base else "default")
        model_default = "gpt-4o-mini" if provider == "openai" and not openai_base else "qwen3-coder"
        model, d = env("OPENAI_MODEL", model_default)
        row("  OPENAI_MODEL", model, "env" if not d else "default")
        v, d = env("OPENAI_TIMEOUT", "60.0")
        row("  OPENAI_TIMEOUT", v, "env" if not d else "default")
        v, d = env("OPENAI_BATCH_SIZE", "10")
        row("  OPENAI_BATCH_SIZE", v, "env" if not d else "default")
        v, d = env("OPENAI_CONCURRENCY", str(_cfg.get("summarizer_concurrency", 4)))
        row("  OPENAI_CONCURRENCY", v, "env" if not d else "config")
        v, d = env("OPENAI_MAX_TOKENS", "500")
        row("  OPENAI_MAX_TOKENS", v, "env" if not d else "default")
    elif provider_name == "minimax":
        suffix = "JCODEMUNCH_SUMMARIZER_PROVIDER=minimax" if provider == "minimax" else "MINIMAX_API_KEY set"
        print(f"  Active provider:  {green('MiniMax')}  ({suffix})")
        row("  OPENAI_API_BASE", "https://api.minimax.io/v1", "default")
        row("  OPENAI_MODEL", "minimax-m2.7", "default")
    elif provider_name == "glm":
        suffix = "JCODEMUNCH_SUMMARIZER_PROVIDER=glm" if provider == "glm" else "ZHIPUAI_API_KEY set"
        print(f"  Active provider:  {green('GLM-5')}  ({suffix})")
        row("  OPENAI_API_BASE", "https://api.z.ai/api/paas/v4/", "default")
        row("  OPENAI_MODEL", "glm-5", "default")
    elif provider_name == "openrouter":
        suffix = "JCODEMUNCH_SUMMARIZER_PROVIDER=openrouter" if provider == "openrouter" else "OPENROUTER_API_KEY set"
        print(f"  Active provider:  {green('OpenRouter')}  ({suffix})")
        row("  OPENAI_API_BASE", "https://openrouter.ai/api/v1", "default")
        row("  OPENAI_MODEL", "meta-llama/llama-3.3-70b-instruct:free", "default")
    elif provider == "none":
        print(f"  Active provider:  {yellow('none')} — explicitly disabled, signature fallback active")
    else:
        print(f"  Active provider:  {yellow('none')} — no API key set, signature fallback active")
        print(f"  {dim('Set ANTHROPIC_API_KEY, GOOGLE_API_KEY, OPENAI_API_BASE, MINIMAX_API_KEY, ZHIPUAI_API_KEY, or OPENROUTER_API_KEY to enable')}")

    allow_remote = _cfg.get("allow_remote_summarizer", False)
    allow_label = str(allow_remote).lower()
    if not allow_remote and provider_name:
        allow_label += f" {dim('(only affects custom base URLs, not standard API endpoints)')}"
    row("allow_remote_summarizer", allow_label, _detect_source("allow_remote_summarizer", False))

    # ── Transport ──────────────────────────────────────────────────────────
    section("Transport")
    transport = _cfg.get("transport", "stdio")
    row("transport", transport, _detect_source("transport", "stdio"))
    if transport != "stdio":
        row("host", _cfg.get("host", "127.0.0.1"), _detect_source("host", "127.0.0.1"))
        row("port", _cfg.get("port", 8901), _detect_source("port", 8901))
        token = os.environ.get("JCODEMUNCH_HTTP_TOKEN", "")
        row("JCODEMUNCH_HTTP_TOKEN", green("set") if token else yellow("not set"), "env")
        rate = _cfg.get("rate_limit", 0)
        rate_label = f"{rate}/min per IP" if rate != 0 else "disabled"
        row("rate_limit", rate_label, _detect_source("rate_limit", 0))
    else:
        print(f"  {dim('stdio mode — HTTP transport vars ignored')}")

    # ── Watcher ───────────────────────────────────────────────────────────
    section("Watcher")
    row("watch", str(_cfg.get("watch", False)).lower(), _detect_source("watch", False))
    row("watch_debounce_ms", _cfg.get("watch_debounce_ms", 2000), _detect_source("watch_debounce_ms", 2000))
    row("freshness_mode", _cfg.get("freshness_mode", "relaxed"), _detect_source("freshness_mode", "relaxed"))
    row("claude_poll_interval", _cfg.get("claude_poll_interval", 5.0), _detect_source("claude_poll_interval", 5.0))

    # ── Logging ──────────────────────────────────────────────────────────
    section("Logging")
    row("log_level", _cfg.get("log_level", "WARNING"), _detect_source("log_level", "WARNING"))
    log_file = _cfg.get("log_file")
    row("log_file", log_file if log_file else dim("(stderr)"), _detect_source("log_file", None))

    # ── Privacy & Telemetry ───────────────────────────────────────────────
    section("Privacy & Telemetry")
    row("redact_source_root", str(_cfg.get("redact_source_root", False)).lower(), _detect_source("redact_source_root", False))
    stats_int = _cfg.get("stats_file_interval", 3)
    row("stats_file_interval", "disabled" if stats_int == 0 else f"every {stats_int} calls", _detect_source("stats_file_interval", 3))
    share = _cfg.get("share_savings", True)
    row("share_savings", green("enabled") if share else yellow("disabled"), _detect_source("share_savings", True))
    row("summarizer_concurrency", _cfg.get("summarizer_concurrency", 4), _detect_source("summarizer_concurrency", 4))

    # ── --check ───────────────────────────────────────────────────────────
    if check:
        section("Checks")
        issues: list[str] = []

        # Validate config.jsonc
        config_issues = _cfg.validate_config(str(config_path))
        if config_issues:
            for issue in config_issues:
                print(f"  {red(CROSS)} config.jsonc: {issue}")
            issues.append("config")
        else:
            print(f"  {green(CHECK)} config.jsonc valid: {config_path}")

        # Storage writable?
        storage = Path(storage_path)
        try:
            storage.mkdir(parents=True, exist_ok=True)
            probe = storage / ".jcm_probe"
            probe.write_text("ok")
            probe.unlink()
            print(f"  {green(CHECK)} index storage writable: {storage}")
        except Exception as e:
            print(f"  {red(CROSS)} index storage not writable: {storage} — {e}")
            issues.append("storage")

        # AI provider package installed?
        if use_ai:
            if provider_name == "anthropic":
                try:
                    import anthropic as _a
                    print(f"  {green(CHECK)} anthropic package installed (v{_a.__version__})")
                except ImportError:
                    print(f"  {red(CROSS)} anthropic not installed — run: pip install \"jcodemunch-mcp[anthropic]\"")
                    issues.append("anthropic")
            elif provider_name == "gemini":
                try:
                    import google.generativeai  # noqa: F401
                    print(f"  {green(CHECK)} google-generativeai package installed")
                except ImportError:
                    print(f"  {red(CROSS)} google-generativeai not installed — run: pip install \"jcodemunch-mcp[gemini]\"")
                    issues.append("gemini")
            elif provider_name in {"openai", "minimax", "glm"}:
                try:
                    import httpx  # noqa: F401
                    print(f"  {green(CHECK)} httpx available for OpenAI-compatible requests")
                except ImportError:
                    print(f"  {red(CROSS)} httpx not installed (required for OpenAI-compatible summarizer)")
                    issues.append("httpx")
            else:
                print(f"  {yellow(WARN)} no AI provider configured — signature fallback will be used")

        # HTTP transport packages installed?
        if transport != "stdio":
            missing = [pkg for pkg in ("uvicorn", "starlette", "anyio") if not _can_import(pkg)]
            if missing:
                print(f"  {red(CROSS)} HTTP packages missing: {', '.join(missing)} — run: pip install \"jcodemunch-mcp[http]\"")
                issues.append("http")
            else:
                print(f"  {green(CHECK)} HTTP transport packages installed (uvicorn, starlette, anyio)")

        # ── CLAUDE.md drift check ────────────────────────────────────────────
        section("CLAUDE.md check")
        claude_md_path = Path.home() / ".claude" / "CLAUDE.md"
        canonical_tools = list(_CANONICAL_TOOL_NAMES)
        if claude_md_path.exists():
            try:
                cm_content = claude_md_path.read_text(encoding="utf-8", errors="replace")
                missing_in_cm = [t for t in canonical_tools if t not in cm_content]
                if missing_in_cm:
                    # Wrap into ~60-char lines for readability
                    _wrapped = _wrap_names(missing_in_cm)
                    print(f"  {yellow(WARN)} {len(missing_in_cm)} tool(s) not mentioned in CLAUDE.md:")
                    for _line in _wrapped:
                        print(f"       {dim(_line)}")
                    print(f"  {dim('  Run: jcodemunch-mcp claude-md --generate  (or --format=append for delta only)')}")
                    issues.append("claude_md")
                else:
                    print(f"  {green(CHECK)} All {len(canonical_tools)} tools mentioned in CLAUDE.md")
            except Exception as _e:
                print(f"  {yellow(WARN)} Could not read CLAUDE.md: {_e}")
        else:
            print(f"  {yellow(WARN)} CLAUDE.md not found: {claude_md_path}")
            print(f"  {dim('  Run: jcodemunch-mcp claude-md --generate > /path/to/CLAUDE.md')}")

        # ── Hook check ─────────────────────────────────────────────────────────
        section("Hooks check")
        _settings_path = Path.home() / ".claude" / "settings.json"
        _expected_hooks = {
            "hook-pretooluse": ("PreToolUse", "Read"),
            "hook-posttooluse": ("PostToolUse", "Edit|Write"),
            "hook-precompact": ("PreCompact", ""),
        }
        if _settings_path.exists():
            try:
                _settings = json.loads(_settings_path.read_text(encoding="utf-8"))
            except (json.JSONDecodeError, OSError):
                _settings = {}
            _installed_hooks = _settings.get("hooks", {})
            _found_any = False
            for _hook_cmd, (_event, _matcher) in _expected_hooks.items():
                _marker = f"jcodemunch-mcp {_hook_cmd}"
                _present = False
                for _rule in _installed_hooks.get(_event, []):
                    for _h in _rule.get("hooks", []):
                        if _marker in _h.get("command", ""):
                            _present = True
                            break
                if _present:
                    _label = f"{_event}({_matcher})" if _matcher else _event
                    print(f"  {green(CHECK)} {_hook_cmd} installed [{_label}]")
                    _found_any = True
                else:
                    print(f"  {dim(f'  {_hook_cmd} not installed')}")
            if not _found_any:
                print(f"  {dim('  Run: jcodemunch-mcp init --hooks')}")
            # Warn about legacy shell scripts
            _hooks_dir = Path.home() / ".claude" / "hooks"
            if _hooks_dir.exists():
                _legacy = (
                    list(_hooks_dir.glob("jcodemunch_read_guard.*"))
                    + list(_hooks_dir.glob("jcodemunch_edit_guard.*"))
                    + list(_hooks_dir.glob("jcodemunch_index_hook.*"))
                )
                if _legacy:
                    print(f"  {yellow(WARN)} Legacy shell scripts detected (replaced by Python hooks):")
                    for _script in sorted(_legacy):
                        print(f"       {dim(_script.name)}")
                    print(f"       {dim('These can be removed. Run: jcodemunch-mcp init --hooks')}")
        else:
            print(f"  {dim('(~/.claude/settings.json not found — hooks not installed)')}")
            print(f"  {dim('  Run: jcodemunch-mcp init --hooks')}")

        print()
        if issues:
            print(yellow(f"  {len(issues)} issue(s) found — see above."))
            sys.exit(1)
        else:
            print(green("  All checks passed."))
    print()


def _wrap_names(names: list[str], width: int = 72) -> list[str]:
    """Wrap a flat list of names into lines no longer than *width* chars."""
    lines: list[str] = []
    current = ""
    for name in names:
        piece = (", " if current else "") + name
        if current and len(current) + len(piece) > width:
            lines.append(current)
            current = name
        else:
            current += piece
    if current:
        lines.append(current)
    return lines


def _can_import(module: str) -> bool:
    """Return True if module is importable without side effects."""
    import importlib.util
    return importlib.util.find_spec(module) is not None


def main(argv: Optional[list[str]] = None):
    """Main entry point."""
    from .security import verify_package_integrity
    verify_package_integrity()

    parser = argparse.ArgumentParser(
        prog="jcodemunch-mcp",
        description="jCodeMunch MCP server and tools.",
    )
    parser.add_argument(
        "-V",
        "--version",
        action="version",
        version=f"%(prog)s {__version__}",
    )

    subparsers = parser.add_subparsers(dest="command")

    # --- serve (default when no subcommand given) ---
    serve_parser = subparsers.add_parser("serve", help="Run the MCP server (default)")
    serve_parser.add_argument(
        "--transport",
        default=os.environ.get("JCODEMUNCH_TRANSPORT", "stdio"),
        choices=["stdio", "sse", "streamable-http"],
        help="Transport mode: stdio (default), sse, or streamable-http (also via JCODEMUNCH_TRANSPORT env var)",
    )
    serve_parser.add_argument(
        "--host",
        default=os.environ.get("JCODEMUNCH_HOST", "127.0.0.1"),
        help="Host to bind to in HTTP transport mode (also via JCODEMUNCH_HOST env var, default: 127.0.0.1)",
    )
    serve_parser.add_argument(
        "--port",
        type=int,
        default=int(os.environ.get("JCODEMUNCH_PORT", "8901")),
        help="Port to listen on in HTTP transport mode (also via JCODEMUNCH_PORT env var, default: 8901)",
    )
    _add_common_args(serve_parser)

    # --- Watcher options for serve ---
    serve_parser.add_argument(
        "--watcher",
        nargs="?",
        const="true",
        default=None,
        metavar="BOOL",
        help="Enable background file watcher alongside the server. "
             "Use --watcher or --watcher=true to enable, --watcher=false to disable.",
    )
    serve_parser.add_argument(
        "--watcher-path",
        nargs="*",
        default=None,
        metavar="PATH",
        help="Folder(s) to watch (default: current working directory)",
    )
    serve_parser.add_argument(
        "--watcher-debounce",
        type=int,
        default=None,
        metavar="MS",
        help="Watcher debounce interval in ms (default: from config, also via JCODEMUNCH_WATCH_DEBOUNCE_MS)",
    )
    serve_parser.add_argument(
        "--watcher-idle-timeout",
        type=int,
        default=None,
        metavar="MINUTES",
        help="Auto-stop watcher after N minutes with no re-indexing (default: disabled)",
    )
    serve_parser.add_argument(
        "--watcher-no-ai-summaries",
        action="store_true",
        help="Disable AI-generated summaries for watcher re-indexing",
    )
    serve_parser.add_argument(
        "--watcher-extra-ignore",
        nargs="*",
        help="Additional gitignore-style patterns to exclude from watching",
    )
    serve_parser.add_argument(
        "--watcher-follow-symlinks",
        action="store_true",
        help="Include symlinked files in watcher indexing",
    )
    serve_parser.add_argument(
        "--watcher-log",
        nargs="?",
        const="auto",
        default=None,
        metavar="PATH",
        help="Log watcher output to file instead of stderr. "
             "Use --watcher-log for auto temp file, or --watcher-log=<path> for a specific file.",
    )
    serve_parser.add_argument(
        "--freshness-mode",
        default=None,
        choices=["relaxed", "strict"],
        help="Freshness mode: 'relaxed' (default) or 'strict' (block queries until watcher reindex finishes)",
    )

    # --- watch ---
    watch_parser = subparsers.add_parser(
        "watch",
        help="Watch folders for changes and auto-reindex",
    )
    watch_parser.add_argument(
        "paths",
        nargs="+",
        help="One or more folder paths to watch",
    )
    watch_parser.add_argument(
        "--debounce",
        type=int,
        default=None,
        metavar="MS",
        help="Debounce interval in ms (default: from config, also via JCODEMUNCH_WATCH_DEBOUNCE_MS)",
    )
    watch_parser.add_argument(
        "--no-ai-summaries",
        action="store_true",
        help="Disable AI-generated summaries during re-indexing",
    )
    watch_parser.add_argument(
        "--follow-symlinks",
        action="store_true",
        help="Include symlinked files in indexing",
    )
    watch_parser.add_argument(
        "--extra-ignore",
        nargs="*",
        help="Additional gitignore-style patterns to exclude",
    )
    watch_parser.add_argument(
        "--idle-timeout",
        type=int,
        default=None,
        metavar="MINUTES",
        help="Auto-shutdown after N minutes with no re-indexing (default: disabled)",
    )
    watch_parser.add_argument(
        "--once",
        action="store_true",
        help="Index all paths once (incremental) and exit immediately — no file watching",
    )
    _add_common_args(watch_parser)

    # --- config ---
    config_parser = subparsers.add_parser(
        "config",
        help="Show current effective configuration",
    )
    config_parser.add_argument(
        "--check",
        action="store_true",
        help="Also verify prerequisites (storage writable, AI packages installed, HTTP packages present)",
    )
    config_parser.add_argument(
        "--init",
        action="store_true",
        help="Generate a template config.jsonc file in CODE_INDEX_PATH",
    )
    config_parser.add_argument(
        "--upgrade",
        action="store_true",
        help="Add missing keys from the current template to an existing config.jsonc, preserving user values",
    )

    # --- claude-md ---
    claude_md_parser = subparsers.add_parser(
        "claude-md",
        help="Generate a CLAUDE.md prompt-policy snippet for the current tool set",
    )
    claude_md_parser.add_argument(
        "--generate",
        action="store_true",
        help="Output the recommended CLAUDE.md snippet to stdout",
    )
    claude_md_parser.add_argument(
        "--format",
        choices=["full", "append"],
        default="full",
        dest="fmt",
        help="'full' (default) — complete snippet; 'append' — only tools not yet in your CLAUDE.md",
    )

    # --- index-file ---
    index_file_parser = subparsers.add_parser(
        "index-file",
        help="Re-index a single file within an existing indexed folder",
    )
    index_file_parser.add_argument(
        "path",
        help="Absolute path to the file to index",
    )
    index_file_parser.add_argument(
        "--no-ai-summaries",
        action="store_true",
        help="Disable AI-generated summaries for this file",
    )
    _add_common_args(index_file_parser)

    # --- init ---
    init_parser = subparsers.add_parser(
        "init",
        help="One-command setup: register with MCP clients, install CLAUDE.md policy, hooks, and index",
    )
    init_parser.add_argument(
        "--client",
        nargs="*",
        default=None,
        metavar="CLIENT",
        help="MCP clients to configure (auto, claude-code, claude-desktop, cursor, windsurf, continue, none)",
    )
    init_parser.add_argument(
        "--claude-md",
        choices=["global", "project"],
        default=None,
        dest="claude_md",
        help="Install Code Exploration Policy to CLAUDE.md (global = ~/.claude/CLAUDE.md, project = ./CLAUDE.md)",
    )
    init_parser.add_argument(
        "--hooks",
        action="store_true",
        help="Install worktree lifecycle hooks into ~/.claude/settings.json",
    )
    init_parser.add_argument(
        "--index",
        action="store_true",
        help="Index the current working directory after setup",
    )
    init_parser.add_argument(
        "--audit",
        action="store_true",
        help="Audit agent config files for token waste, stale references, and bloat",
    )
    init_parser.add_argument(
        "--dry-run",
        action="store_true",
        dest="dry_run",
        help="Show what would be done without making changes",
    )
    init_parser.add_argument(
        "--demo",
        action="store_true",
        help=(
            "Walk through the full init process without making any changes, "
            "then summarise what would have been done and the benefit of each action"
        ),
    )
    init_parser.add_argument(
        "--yes", "-y",
        action="store_true",
        help="Accept all defaults non-interactively",
    )
    init_parser.add_argument(
        "--no-backup",
        action="store_true",
        dest="no_backup",
        help="Skip creating .bak backups of modified files",
    )

    # --- hook-event ---
    hook_parser = subparsers.add_parser(
        "hook-event",
        help="Record a Claude Code worktree lifecycle event (used by hooks)",
    )
    hook_parser.add_argument(
        "event_type",
        choices=["create", "remove"],
        help="Event type: 'create' when a worktree is created, 'remove' when deleted",
    )
    _add_common_args(hook_parser)

    # --- hook-pretooluse ---
    subparsers.add_parser(
        "hook-pretooluse",
        help="PreToolUse hook: intercept Read on large code files, suggest jCodemunch (reads stdin)",
    )

    # --- hook-posttooluse ---
    subparsers.add_parser(
        "hook-posttooluse",
        help="PostToolUse hook: auto-reindex files after Edit/Write (reads stdin)",
    )

    # --- hook-precompact ---
    subparsers.add_parser(
        "hook-precompact",
        help="PreCompact hook: generate session snapshot before context compaction (reads stdin)",
    )

    # --- watch-claude ---
    wc_parser = subparsers.add_parser(
        "watch-claude",
        help="Auto-discover and watch Claude Code worktrees",
    )
    wc_parser.add_argument(
        "--repos",
        nargs="+",
        help="One or more git repository paths to poll for worktrees via `git worktree list`",
    )
    wc_parser.add_argument(
        "--poll-interval",
        type=float,
        default=None,
        metavar="SECONDS",
        help="Poll interval in seconds (default: from config, also via JCODEMUNCH_CLAUDE_POLL_INTERVAL)",
    )
    wc_parser.add_argument(
        "--debounce",
        type=int,
        default=None,
        metavar="MS",
        help="Debounce interval in ms for file watching (default: from config, also via JCODEMUNCH_WATCH_DEBOUNCE_MS)",
    )
    wc_parser.add_argument(
        "--no-ai-summaries",
        action="store_true",
        help="Disable AI-generated summaries during re-indexing",
    )
    wc_parser.add_argument(
        "--follow-symlinks",
        action="store_true",
        help="Include symlinked files in indexing",
    )
    wc_parser.add_argument(
        "--extra-ignore",
        nargs="*",
        help="Additional gitignore-style patterns to exclude",
    )
    _add_common_args(wc_parser)

    # --- install-pack ---
    ip_parser = subparsers.add_parser(
        "install-pack",
        help="Download and install a Starter Pack pre-built index",
    )
    ip_parser.add_argument(
        "pack_id",
        nargs="?",
        default=None,
        help="Pack identifier to install (e.g. nodejs, fastapi)",
    )
    ip_parser.add_argument(
        "--license",
        default=None,
        dest="license_key",
        metavar="KEY",
        help="jCodeMunch license key (required for premium packs)",
    )
    ip_parser.add_argument(
        "--list",
        action="store_true",
        dest="list_packs",
        help="List all available starter packs",
    )
    ip_parser.add_argument(
        "--force",
        action="store_true",
        help="Re-download and overwrite an already-installed pack",
    )

    # Backwards compat: if first non-flag arg isn't a known subcommand,
    # prepend "serve" so legacy invocations like `jcodemunch-mcp --transport sse` still work.
    # But let --help and -V be handled by the top-level parser first.
    raw_argv = argv if argv is not None else sys.argv[1:]
    top_level_flags = {"-h", "--help", "-V", "--version"}
    if any(arg in top_level_flags for arg in raw_argv):
        args = parser.parse_args(raw_argv)
    else:
        known_commands = {"serve", "watch", "hook-event", "hook-pretooluse", "hook-posttooluse", "hook-precompact", "watch-claude", "config", "index-file", "claude-md", "init", "install-pack"}
        has_subcommand = any(arg in known_commands for arg in raw_argv if not arg.startswith("-"))
        if not has_subcommand:
            raw_argv = ["serve"] + list(raw_argv)
        args = parser.parse_args(raw_argv)

    if args.command == "config":
        _run_config(
            check=getattr(args, "check", False),
            init=getattr(args, "init", False),
            upgrade=getattr(args, "upgrade", False),
        )
        return

    if args.command == "claude-md":
        _run_claude_md(
            generate=getattr(args, "generate", False),
            fmt=getattr(args, "fmt", "full"),
        )
        return

    if args.command == "init":
        from .cli.init import run_init
        sys.exit(run_init(
            clients=args.client,
            claude_md=args.claude_md,
            hooks=args.hooks,
            index=args.index,
            audit=args.audit,
            dry_run=args.dry_run,
            demo=args.demo,
            yes=args.yes,
            no_backup=args.no_backup,
        ))

    if args.command == "install-pack":
        from .cli.install_pack import run_install_pack
        sys.exit(run_install_pack(
            pack_id=args.pack_id,
            license_key=args.license_key,
            list_packs=args.list_packs,
            force=args.force,
        ))

    if args.command == "hook-pretooluse":
        from .cli.hooks import run_pretooluse
        sys.exit(run_pretooluse())

    if args.command == "hook-posttooluse":
        from .cli.hooks import run_posttooluse
        sys.exit(run_posttooluse())

    if args.command == "hook-precompact":
        from .cli.hooks import run_precompact
        sys.exit(run_precompact())

    # Apply config defaults for watcher keys: CLI args > config > env vars.
    # config.load_config() is called inside each subcommand handler, but we need
    # the values here to fill in None defaults from argparse.
    # load_config() is idempotent so calling it early is safe.
    config_module.load_config()

    # --watcher-debounce (serve subcommand) / --debounce (watch, watch-claude)
    # Only set if the attr exists on args and is None (not explicitly provided on CLI)
    _debounce = config_module.get("watch_debounce_ms", 2000)
    if getattr(args, "watcher_debounce", None) is None:
        args.watcher_debounce = _debounce
    if getattr(args, "debounce", None) is None:
        args.debounce = _debounce

    # --poll-interval (watch-claude subcommand)
    if getattr(args, "poll_interval", None) is None:
        args.poll_interval = config_module.get("claude_poll_interval", 5.0)

    # --freshness-mode is only relevant for serve subcommand; handled there

    _setup_logging(args)

    if args.command == "watch":
        use_ai = not args.no_ai_summaries and _default_use_ai_summaries()
        if args.once:
            from .watcher import sync_folders

            asyncio.run(
                sync_folders(
                    paths=args.paths,
                    use_ai_summaries=use_ai,
                    storage_path=os.environ.get("CODE_INDEX_PATH"),
                    extra_ignore_patterns=args.extra_ignore,
                    follow_symlinks=args.follow_symlinks,
                )
            )
        else:
            from .watcher import watch_folders

            asyncio.run(
                watch_folders(
                    paths=args.paths,
                    debounce_ms=args.debounce,
                    use_ai_summaries=use_ai,
                    storage_path=os.environ.get("CODE_INDEX_PATH"),
                    extra_ignore_patterns=args.extra_ignore,
                    follow_symlinks=args.follow_symlinks,
                    idle_timeout_minutes=args.idle_timeout,
                )
            )
    elif args.command == "hook-event":
        from .hook_event import handle_hook_event

        handle_hook_event(event_type=args.event_type)
    elif args.command == "watch-claude":
        from .watcher import watch_claude_worktrees

        use_ai = not args.no_ai_summaries and _default_use_ai_summaries()
        asyncio.run(
            watch_claude_worktrees(
                repos=args.repos,
                poll_interval=args.poll_interval,
                debounce_ms=args.debounce,
                use_ai_summaries=use_ai,
                storage_path=os.environ.get("CODE_INDEX_PATH"),
                extra_ignore_patterns=args.extra_ignore,
                follow_symlinks=args.follow_symlinks,
            )
        )
    elif args.command == "index-file":
        from .tools.index_file import index_file as _index_file
        import json as _json

        use_ai = not args.no_ai_summaries and _default_use_ai_summaries()
        result = _index_file(
            path=args.path,
            use_ai_summaries=use_ai,
            storage_path=os.environ.get("CODE_INDEX_PATH"),
        )
        print(_json.dumps(result, indent=2))
        if not result.get("success"):
            sys.exit(1)
    else:
        # serve (default)
        # Re-run load_config() after _setup_logging() so config warnings/errors
        # go to the configured log destination (the early call at startup ran before logging was set up)
        config_module.load_config()
        config_module.load_all_project_configs()
        from .reindex_state import set_freshness_mode
        # Apply config default if --freshness-mode was not explicitly provided
        if args.freshness_mode is None:
            args.freshness_mode = config_module.get("freshness_mode", "relaxed")
        set_freshness_mode(args.freshness_mode)
        watcher_enabled = _get_watcher_enabled(args)

        if watcher_enabled:
            try:
                import watchfiles  # noqa: F401
            except ImportError:
                print(
                    "ERROR: --watcher requires watchfiles. "
                    "Install with: pip install 'jcodemunch-mcp[watch]'",
                    file=sys.stderr,
                )
                sys.exit(1)

            # Watcher params: CLI flag > config > default
            cfg_paths = config_module.get("watch_paths", [])
            if args.watcher_path is not None:
                watcher_paths = args.watcher_path
            elif cfg_paths:
                watcher_paths = cfg_paths
            else:
                watcher_paths = [os.getcwd()]

            use_ai = not args.watcher_no_ai_summaries and _default_use_ai_summaries()

            watcher_kwargs = dict(
                paths=watcher_paths,
                debounce_ms=(
                    args.watcher_debounce
                    if args.watcher_debounce is not None
                    else config_module.get("watch_debounce_ms", 2000)
                ),
                use_ai_summaries=use_ai,
                storage_path=os.environ.get("CODE_INDEX_PATH"),
                extra_ignore_patterns=(
                    args.watcher_extra_ignore
                    if args.watcher_extra_ignore is not None
                    else config_module.get("watch_extra_ignore", []) or None
                ),
                follow_symlinks=(
                    args.watcher_follow_symlinks
                    or config_module.get("watch_follow_symlinks", False)
                ),
                idle_timeout_minutes=(
                    args.watcher_idle_timeout
                    if args.watcher_idle_timeout is not None
                    else config_module.get("watch_idle_timeout", None)
                ),
            )

            log_path = (
                getattr(args, "watcher_log", None)
                or config_module.get("watch_log", None)
            )

            try:
                if args.transport == "sse":
                    asyncio.run(_run_server_with_watcher(
                        run_sse_server, (args.host, args.port), watcher_kwargs, log_path,
                    ))
                elif args.transport == "streamable-http":
                    asyncio.run(_run_server_with_watcher(
                        run_streamable_http_server, (args.host, args.port), watcher_kwargs, log_path,
                    ))
                else:
                    asyncio.run(_run_server_with_watcher(
                        run_stdio_server, (), watcher_kwargs, log_path,
                    ))
            except KeyboardInterrupt:
                pass
        else:
            if args.transport == "sse":
                asyncio.run(run_sse_server(args.host, args.port))
            elif args.transport == "streamable-http":
                asyncio.run(run_streamable_http_server(args.host, args.port))
            else:
                asyncio.run(run_stdio_server())


if __name__ == "__main__":
    main()