"""
Delimit Governance Layer — the loop that keeps AI agents on track.

Every tool flows through governance. Governance:
1. Logs what happened (evidence)
2. Checks result against rules (thresholds, policies)
3. Auto-creates ledger items for failures/warnings
4. Suggests next steps (loops back to keep building)

This replaces _with_next_steps — governance IS the next step system.
"""

import json
import logging
import os
import re
import subprocess
import time
from datetime import datetime, timezone
from pathlib import Path
from typing import Any, Dict, List, Optional


# LED-1721 (pre-ship security): the audit/ledger-skip used to be a plain
# customer-settable env var (DELIMIT_TEST_MODE). A customer could set it to
# suppress the attestation trail, and the identifier leaked into the shipped
# governance.so via `strings`. Both are fixed here:
#
#   * The identifier DELIMIT_TEST_MODE is GONE from this module (the bypass
#     grep no longer matches governance.so).
#   * The skip is now IMPOSSIBLE in a customer/production context. It requires
#     an INTERNAL-ONLY signal a customer environment never has, AND it is
#     hard-locked OFF whenever a real Pro/Enterprise license is active.
#
# The signal that the ledger-skip is allowed at all:
#   (A) an internal dev marker file  ~/.delimit/.internal_dev  (present only on
#       dev/internal boxes, shipped nowhere), OR
#   (B) the namespace-free pytest guard  INTERNAL_PYTEST_GUARD=1  (set by the
#       gateway's own tests/conftest.py — same Delimit-namespace-free pattern
#       LED-1262 used for social.py / deliberation.py).
# AND the license hard-lock:
#   if a real paid license (tier in {pro, enterprise}) is active, NEVER skip —
#   the attestation trail is mandatory for customers regardless of any marker.
_INTERNAL_DEV_MARKER = Path.home() / ".delimit" / ".internal_dev"


def _real_license_active() -> bool:
    """True when a valid paid (pro/enterprise) license is active.

    Best-effort + fail-safe: any import/lookup error returns False so the
    GATE still depends on the internal marker. (A False here cannot by itself
    enable a skip — the internal marker is still required.)
    """
    try:
        from ai.license import get_license  # local import: avoid import cycle
        lic = get_license() or {}
        return bool(lic.get("valid")) and lic.get("tier") in ("pro", "enterprise")
    except Exception:
        return False


def _ledger_skip_allowed() -> bool:
    """Return True only in an INTERNAL/dev context; impossible for customers.

    Replaces the old customer-settable env-var skip. The rule is:

        skip allowed  IFF  (not _real_license_active())
                            AND ( ~/.delimit/.internal_dev present
                                  OR INTERNAL_PYTEST_GUARD=1 )

    The license-lock is ABSOLUTE and unconditional: an active paid
    (pro/enterprise) license forces real audit writes on EVERY path. A paying
    customer can never suppress the attestation trail — not by setting an env
    var, and not by `touch ~/.delimit/.internal_dev`. The internal signals
    (dev-marker file / namespace-free pytest guard) only ever matter on a box
    with NO active paid license.

      * .internal_dev — ships NOWHERE (not in npm, not in the tarball, not
        written by `delimit setup`); exists only on our own dev/internal boxes.
      * INTERNAL_PYTEST_GUARD=1 — the namespace-free pytest guard set by the
        gateway's own tests/conftest.py.

    The founder's dev box carries a real pro license, so under this absolute
    lock it would not skip during the suite. That is solved in the TEST layer
    (tests/conftest.py masks _real_license_active for the session), NOT by
    weakening the lock. Production (real, unmasked license) can never skip.

    On every customer machine: a paid license closes both paths; a free-tier
    box has no .internal_dev file either, so the audit trail is never skippable.
    """
    if _real_license_active():
        return False  # ABSOLUTE license-lock — applies to every path below.
    try:
        if _INTERNAL_DEV_MARKER.is_file():
            return True  # internal/dev box (no active paid license).
    except OSError:
        pass
    return os.environ.get("INTERNAL_PYTEST_GUARD") == "1"


def _is_test_mode() -> bool:
    """Backwards-compatible alias for the internal-only ledger-skip gate.

    Kept so existing call sites need no change. See _ledger_skip_allowed().
    """
    return _ledger_skip_allowed()

logger = logging.getLogger("delimit.governance")


# ── STR-183 V2-hardening B-PREREQ-4: non-delegable operation registry ─
# Per /root/CLAUDE.md "Non-Delegable Decisions" and the 2026-04-07 ruleset-bypass postmortem,
# these operation classes can never be auto-approved by a generic gate (e.g. "all_gates_passed").
# Each invocation requires fresh, named-human attestation at gate-entry time.
# This constant is the code-level encoding of the constitutional boundary.
# Do not extend this set without an explicit founder-attested deliberation.
NON_DELEGABLE_OPERATION_CLASSES = frozenset({
    "ruleset_disable",       # disabling branch protection / repository rulesets
    "force_push_shared",     # force-push to main, release branches, or floating tags (v1, latest)
    "account_switch",        # switching gh / git author identity mid-flow
    "cross_account_ops",     # operating on one org from another org's identity
    "constitutional_rewrite",  # edits to founder doctrine canon outside managed sections
    "authority_class_expansion",  # adding a new class of tool / agent / gate
    "irreversible_capital_commit",  # capital commitments above non-delegable threshold
    "venture_kill",          # shutting down an internal venture
    "permission_escalation",  # granting elevated access (sudo, admin, write-as-other)
    "public_truth_claim",    # public statement / marketing assertion outrunning evidence
})


def is_non_delegable(operation_class: str) -> bool:
    """Return True iff the operation class is in the non-delegable registry.

    Per the 2026-04-07 postmortem and the V2 pressure-test (STR-183, unanimous round 3),
    non-delegable operations cannot pass through any "all_gates_passed" mechanism.
    They require per-invocation founder attestation, checked live at gate entry.
    """
    return operation_class in NON_DELEGABLE_OPERATION_CLASSES


def require_founder_attestation(operation_class: str, attestation: Optional[Dict[str, Any]] = None) -> Dict[str, Any]:
    """Fail-closed gate for non-delegable operations.

    Returns a verdict dict. The caller must refuse to proceed unless verdict["allowed"] is True.

    A valid attestation must include:
      - "founder_id": the named human performing the attestation
      - "scope": the exact operation being attested (must match operation_class)
      - "timestamp": ISO-8601 UTC
      - "evidence_ref": pointer to the evidence (ledger ID, postmortem path, or signed message)

    Pre-approval of a parent plan does NOT extend to non-delegable escalations
    (2026-04-07 postmortem rule). Each invocation needs its own attestation.
    """
    if not is_non_delegable(operation_class):
        return {"allowed": True, "operation_class": operation_class, "non_delegable": False}

    if not attestation:
        return {
            "allowed": False,
            "operation_class": operation_class,
            "non_delegable": True,
            "reason": (
                f"{operation_class} is non-delegable (STR-183 / 2026-04-07 postmortem). "
                "Pre-approval of a parent plan does not extend to this operation. "
                "Per-invocation founder attestation is required."
            ),
        }

    required = {"founder_id", "scope", "timestamp", "evidence_ref"}
    missing = required - set(attestation.keys())
    if missing:
        return {
            "allowed": False,
            "operation_class": operation_class,
            "non_delegable": True,
            "reason": f"Attestation missing required fields: {sorted(missing)}",
        }

    if attestation["scope"] != operation_class:
        return {
            "allowed": False,
            "operation_class": operation_class,
            "non_delegable": True,
            "reason": (
                f"Attestation scope mismatch: attested for '{attestation['scope']}' "
                f"but invocation is for '{operation_class}'. The scope of approval is "
                "the scope stated, not beyond (CLAUDE.md escalation rule)."
            ),
        }

    return {
        "allowed": True,
        "operation_class": operation_class,
        "non_delegable": True,
        "attestation": attestation,
    }


# ── LED-263: Beta CTA for conversion ────────────────────────────────
# Tools that should show a beta signup prompt on successful results.
_BETA_CTA_TOOLS = frozenset({"lint", "scan", "activate", "diff", "quickstart"})

_BETA_CTA = {
    "text": "Like what you see? Join the beta for priority support and full governance.",
    "url": "https://app.delimit.ai",
    "action": "star_repo_or_signup",
}


def _is_beta_user() -> bool:
    """Check if the current user is already tracked as a founding/beta user."""
    try:
        from ai.founding_users import _load_founding_users
        data = _load_founding_users()
        if data.get("users"):
            return True
    except Exception:
        pass
    # Also check if a Pro license is active (paying users don't need the CTA)
    try:
        from ai.license import get_license
        lic = get_license()
        if lic.get("tier", "free") != "free":
            return True
    except Exception:
        pass
    return False


def _result_is_successful(result: Dict[str, Any]) -> bool:
    """Return True if a tool result looks like a success (no errors)."""
    if result.get("error"):
        return False
    if result.get("status") in ("error", "failed", "blocked"):
        return False
    if result.get("governance_blocked"):
        return False
    return True


def _maybe_beta_cta(tool_name: str, result: Dict[str, Any]) -> Optional[Dict[str, str]]:
    """Return a beta CTA dict if the tool qualifies and the user is not already signed up."""
    if tool_name not in _BETA_CTA_TOOLS:
        return None
    if not _result_is_successful(result):
        return None
    if _is_beta_user():
        return None
    return dict(_BETA_CTA)


def _ledger_list_items(project_path: str = ".") -> Dict[str, Any]:
    """Indirection layer so tests can patch governance-local ledger hooks."""
    import ai.ledger_manager as _lm
    return _lm.list_items(project_path=project_path)


def _ledger_add_item(*, title: str, type: str, priority: str, source: str, project_path: str = ".") -> Dict[str, Any]:
    """Indirection layer so tests can patch governance-local ledger hooks."""
    import ai.ledger_manager as _lm
    return _lm.add_item(
        title=title,
        type=type,
        priority=priority,
        source=source,
        project_path=project_path,
    )


def _ledger_update_item(item_id: str, *, status: str, project_path: str = ".") -> Dict[str, Any]:
    """Indirection layer so tests can patch governance-local ledger hooks."""
    import ai.ledger_manager as _lm
    return _lm.update_item(item_id, status=status, project_path=project_path)


# Governance rules — what triggers auto-ledger-creation
RULES = {
    "test_coverage": {
        "threshold_key": "line_coverage",
        "threshold": 80,
        "comparison": "below",
        "ledger_title": "Test coverage below {threshold}% — currently {value}%",
        "ledger_type": "fix",
        "ledger_priority": "P1",
    },
    "security_audit": {
        "trigger_key": "vulnerabilities",
        "trigger_if_nonempty": True,
        "ledger_title": "Security: {count} vulnerabilities found",
        "ledger_type": "fix",
        "ledger_priority": "P0",
    },
    "security_scan": {
        "trigger_key": "vulnerabilities",
        "trigger_if_nonempty": True,
        "ledger_title": "Security scan: {count} issues detected",
        "ledger_type": "fix",
        "ledger_priority": "P0",
    },
    "lint": {
        "trigger_key": "violations",
        "trigger_if_nonempty": True,
        "ledger_title": "API lint: {count} violations found",
        "ledger_type": "fix",
        "ledger_priority": "P1",
    },
    "deliberate": {
        "trigger_key": "unanimous",
        "trigger_if_true": True,
        "extract_actions": True,
        "ledger_title": "Deliberation consensus reached — action items pending",
        "ledger_type": "strategy",
        "ledger_priority": "P1",
    },
    "gov_health": {
        "trigger_key": "status",
        "trigger_values": ["not_initialized", "degraded"],
        "ledger_title": "Governance health: {value} — needs attention",
        "ledger_type": "fix",
        "ledger_priority": "P1",
    },
    "docs_validate": {
        "threshold_key": "coverage_percent",
        "threshold": 50,
        "comparison": "below",
        "ledger_title": "Documentation coverage below {threshold}% — currently {value}%",
        "ledger_type": "task",
        "ledger_priority": "P2",
    },
}

# Milestone rules — auto-create DONE ledger items for significant completions.
# Unlike threshold RULES (which create open items for problems), milestones
# record achievements so the ledger reflects what was shipped.
MILESTONES = {
    "deploy_site": {
        "trigger_key": "status",
        "trigger_values": ["deployed"],
        "ledger_title": "Deployed: {project}",
        "ledger_type": "feat",
        "ledger_priority": "P1",
        "auto_done": True,
    },
    "deploy_npm": {
        "trigger_key": "status",
        "trigger_values": ["published"],
        "ledger_title": "Published: {package}@{new_version}",
        "ledger_type": "feat",
        "ledger_priority": "P1",
        "auto_done": True,
    },
    "deliberate": {
        "trigger_key": "status",
        "trigger_values": ["unanimous"],
        "ledger_title": "Consensus reached: {question_short}",
        "ledger_type": "strategy",
        "ledger_priority": "P1",
        "auto_done": True,
    },
    "test_generate": {
        "threshold_key": "tests_generated",
        "threshold": 10,
        "comparison": "above",
        "ledger_title": "Generated {value} tests",
        "ledger_type": "feat",
        "ledger_priority": "P2",
        "auto_done": True,
    },
    "sensor_github_issue": {
        "trigger_key": "has_new_activity",
        "trigger_if_true": True,
        "ledger_title": "Outreach activity: {repo}#{issue_number}",
        "ledger_type": "task",
        "ledger_priority": "P1",
        "auto_done": False,  # needs follow-up
    },
    "zero_spec": {
        "trigger_key": "success",
        "trigger_if_true": True,
        "ledger_title": "Zero-spec extracted: {framework} ({paths_count} paths)",
        "ledger_type": "feat",
        "ledger_priority": "P2",
        "auto_done": True,
    },
}

# Next steps registry — what to do after each tool
NEXT_STEPS = {
    "lint": [
        {"tool": "delimit_explain", "reason": "Get migration guide for violations", "premium": False},
        {"tool": "delimit_semver", "reason": "Classify the version bump", "premium": False},
    ],
    "diff": [
        {"tool": "delimit_semver", "reason": "Classify changes as MAJOR/MINOR/PATCH", "premium": False},
        {"tool": "delimit_policy", "reason": "Check against governance policies", "premium": False},
    ],
    "semver": [
        {"tool": "delimit_explain", "reason": "Generate human-readable changelog", "premium": False},
        {"tool": "delimit_deploy_npm", "reason": "Publish the new version to npm", "premium": False},
    ],
    "init": [
        {"tool": "delimit_gov_health", "reason": "Verify governance is set up correctly", "premium": True},
        {"tool": "delimit_diagnose", "reason": "Check for any issues", "premium": False},
    ],
    "test_coverage": [
        {"tool": "delimit_test_generate", "reason": "Generate tests for uncovered files", "premium": False},
    ],
    "security_audit": [
        {"tool": "delimit_evidence_collect", "reason": "Collect evidence of findings", "premium": True},
    ],
    "gov_health": [
        {"tool": "delimit_gov_status", "reason": "See detailed governance status", "premium": True},
        {"tool": "delimit_repo_analyze", "reason": "Full repo health report", "premium": True},
    ],
    "deploy_npm": [
        {"tool": "delimit_deploy_verify", "reason": "Verify the published package", "premium": True},
    ],
    "deploy_plan": [
        {"tool": "delimit_deploy_build", "reason": "Build the deployment", "premium": True},
    ],
    "deploy_build": [
        {"tool": "delimit_deploy_publish", "reason": "Publish the build", "premium": True},
    ],
    "deploy_publish": [
        {"tool": "delimit_deploy_verify", "reason": "Verify the deployment", "premium": True},
    ],
    "deploy_verify": [
        {"tool": "delimit_deploy_rollback", "reason": "Rollback if unhealthy", "premium": True},
    ],
    "repo_analyze": [
        {"tool": "delimit_security_audit", "reason": "Scan for security issues", "premium": False},
        {"tool": "delimit_gov_health", "reason": "Check governance status", "premium": True},
    ],
    "deliberate": [
        {"tool": "delimit_ledger_context", "reason": "Review what's on the ledger after consensus", "premium": False},
    ],
    "ledger_add": [
        {"tool": "delimit_ledger_context", "reason": "See updated ledger state", "premium": False},
    ],
    "diagnose": [
        {"tool": "delimit_init", "reason": "Initialize governance if not set up", "premium": False},
    ],
    # Design & UI tools — triggered after UI-related work
    "deploy_site": [
        {"tool": "delimit_design_validate_responsive", "reason": "Check responsive design before deploy", "premium": False},
        {"tool": "delimit_story_accessibility", "reason": "Run accessibility audit", "premium": False},
        {"tool": "delimit_deploy_npm", "reason": "Publish npm package if applicable", "premium": False},
        {"tool": "delimit_ledger_context", "reason": "Check what else needs deploying", "premium": False},
    ],
    "design_component_library": [
        {"tool": "delimit_design_validate_responsive", "reason": "Validate responsive patterns", "premium": False},
        {"tool": "delimit_story_accessibility", "reason": "Check accessibility", "premium": False},
    ],
    "design_validate_responsive": [
        {"tool": "delimit_story_accessibility", "reason": "Also check accessibility", "premium": False},
        {"tool": "delimit_story_visual_test", "reason": "Take visual baseline screenshot", "premium": False},
    ],
    "design_generate_component": [
        {"tool": "delimit_story_generate", "reason": "Generate stories for the new component", "premium": False},
        {"tool": "delimit_design_validate_responsive", "reason": "Check responsive design", "premium": False},
    ],
    "story_accessibility": [
        {"tool": "delimit_ledger_add", "reason": "Track accessibility issues in ledger", "premium": False},
    ],
    "story_visual_test": [
        {"tool": "delimit_ledger_add", "reason": "Track visual regressions in ledger", "premium": False},
    ],
    "scan": [
        {"tool": "delimit_design_component_library", "reason": "Catalog UI components", "premium": False},
        {"tool": "delimit_design_validate_responsive", "reason": "Check responsive design", "premium": False},
        {"tool": "delimit_story_accessibility", "reason": "Run accessibility audit", "premium": False},
        {"tool": "delimit_gov_health", "reason": "Check governance status", "premium": True},
    ],
    "quickstart": [
        {"tool": "delimit_ledger_add", "reason": "Start tracking tasks in the ledger", "premium": False},
        {"tool": "delimit_lint", "reason": "Check an OpenAPI spec for breaking changes", "premium": False},
        {"tool": "delimit_deliberate", "reason": "Try multi-model deliberation on a decision", "premium": True},
        {"tool": "delimit_security_scan", "reason": "Run a security scan", "premium": True},
    ],
    "test_generate": [
        {"tool": "delimit_test_smoke", "reason": "Run smoke tests on generated tests", "premium": False},
        {"tool": "delimit_test_coverage", "reason": "Check coverage after adding tests", "premium": False},
    ],
    # --- Context & Memory workflow ---
    "context_init": [
        {"tool": "delimit_context_write", "reason": "Write your first artifact", "premium": True},
    ],
    "context_write": [
        {"tool": "delimit_context_list", "reason": "See all artifacts", "premium": True},
    ],
    "context_read": [],  # Terminal — user got what they needed
    "context_list": [],  # Terminal
    "context_snapshot": [
        {"tool": "delimit_ledger_context", "reason": "Check what else needs work", "premium": False},
    ],
    "context_branch": [],  # Terminal
    "memory_store": [
        {"tool": "delimit_ledger_context", "reason": "Check ledger after saving memory", "premium": False},
    ],
    "memory_search": [],  # Terminal — user got results
    "memory_recent": [],  # Terminal
    # --- Security workflow ---
    "security_scan": [
        {"tool": "delimit_security_audit", "reason": "Run full audit for details", "premium": False},
    ],
    "security_ingest": [
        {"tool": "delimit_security_deliberate", "reason": "Triage findings via multi-model deliberation", "premium": True},
        {"tool": "delimit_deploy_plan", "reason": "Check if deploys are gated by findings", "premium": True},
    ],
    "security_deliberate": [
        {"tool": "delimit_ledger_context", "reason": "Review updated security findings in ledger", "premium": False},
    ],
    # --- Governance deep workflow ---
    "gov_status": [
        {"tool": "delimit_gov_evaluate", "reason": "Evaluate compliance", "premium": True},
    ],
    "gov_evaluate": [
        {"tool": "delimit_gov_run", "reason": "Run governance checks", "premium": True},
    ],
    "gov_run": [
        {"tool": "delimit_gov_verify", "reason": "Verify results", "premium": True},
    ],
    "gov_verify": [
        {"tool": "delimit_ledger_context", "reason": "Check ledger for action items", "premium": False},
    ],
    "gov_policy": [],  # Terminal
    "gov_new_task": [
        {"tool": "delimit_ledger_context", "reason": "See updated ledger", "premium": False},
    ],
    # --- Deploy workflow (missing entries) ---
    "deploy_status": [
        {"tool": "delimit_deploy_verify", "reason": "Verify health", "premium": True},
    ],
    "deploy_rollback": [
        {"tool": "delimit_deploy_status", "reason": "Check rollback status", "premium": True},
    ],
    # --- Release workflow ---
    "release_plan": [
        {"tool": "delimit_release_validate", "reason": "Validate release readiness", "premium": True},
    ],
    "release_validate": [
        {"tool": "delimit_release_sync", "reason": "Sync across surfaces", "premium": True},
    ],
    "release_sync": [
        {"tool": "delimit_ledger_context", "reason": "Check for remaining items", "premium": False},
    ],
    "release_status": [],  # Terminal
    "release_history": [],  # Terminal
    "release_rollback": [
        {"tool": "delimit_deploy_status", "reason": "Verify rollback", "premium": True},
    ],
    # --- Observability workflow ---
    "obs_status": [
        {"tool": "delimit_obs_metrics", "reason": "See detailed metrics", "premium": True},
    ],
    "obs_metrics": [
        {"tool": "delimit_obs_logs", "reason": "Check logs for issues", "premium": True},
    ],
    "obs_logs": [
        {"tool": "delimit_obs_alerts", "reason": "Check active alerts", "premium": True},
    ],
    "obs_alerts": [],  # Terminal
    # --- Repo workflow ---
    "repo_diagnose": [
        {"tool": "delimit_repo_analyze", "reason": "Full analysis", "premium": True},
    ],
    "repo_config_validate": [
        {"tool": "delimit_repo_config_audit", "reason": "Audit for security issues", "premium": True},
    ],
    "repo_config_audit": [
        {"tool": "delimit_security_audit", "reason": "Full security scan", "premium": False},
    ],
    # --- Docs workflow ---
    "docs_generate": [
        {"tool": "delimit_docs_validate", "reason": "Validate generated docs", "premium": False},
    ],
    "docs_validate": [
        {"tool": "delimit_ledger_context", "reason": "Check for doc-related tasks", "premium": False},
    ],
    # --- Cost workflow ---
    "cost_analyze": [
        {"tool": "delimit_cost_optimize", "reason": "Find optimization opportunities", "premium": True},
    ],
    "cost_optimize": [
        {"tool": "delimit_cost_alert", "reason": "Set cost alerts", "premium": True},
    ],
    "cost_alert": [],  # Terminal
    # --- Data workflow ---
    "data_validate": [
        {"tool": "delimit_data_backup", "reason": "Backup validated data", "premium": True},
    ],
    "data_backup": [],  # Terminal
    "data_migrate": [
        {"tool": "delimit_data_validate", "reason": "Validate after migration", "premium": True},
    ],
    # --- Secrets workflow ---
    "secret_store": [
        {"tool": "delimit_secret_list", "reason": "Verify stored secrets", "premium": True},
    ],
    "secret_get": [],  # Terminal
    "secret_list": [],  # Terminal
    "secret_revoke": [],  # Terminal
    "secret_access_log": [],  # Terminal
    # --- Intel workflow ---
    "intel_query": [],  # Terminal
    "intel_dataset_register": [
        {"tool": "delimit_intel_dataset_list", "reason": "Verify registration", "premium": True},
    ],
    "intel_dataset_list": [],  # Terminal
    "intel_dataset_freeze": [],  # Terminal
    "intel_snapshot_ingest": [
        {"tool": "delimit_intel_query", "reason": "Query the ingested data", "premium": True},
    ],
    # --- Social/Content workflow ---
    "social_post": [
        {"tool": "delimit_social_history", "reason": "Check post history", "premium": True},
    ],
    "social_generate": [
        {"tool": "delimit_social_post", "reason": "Post the generated content", "premium": True},
    ],
    "social_history": [],  # Terminal
    "content_publish": [
        {"tool": "delimit_content_schedule", "reason": "Check upcoming schedule", "premium": True},
    ],
    "content_schedule": [],  # Terminal
    "content_queue": [],  # Terminal
    # --- OS/Daemon workflow ---
    "os_status": [
        {"tool": "delimit_os_plan", "reason": "Plan next OS actions", "premium": True},
    ],
    "os_plan": [
        {"tool": "delimit_os_gates", "reason": "Check gates", "premium": True},
    ],
    "os_gates": [],  # Terminal
    "daemon_status": [],  # Terminal
    "daemon_run": [
        {"tool": "delimit_daemon_status", "reason": "Check results", "premium": True},
    ],
    "daemon_classify": [],  # Terminal
    # --- Resource/Vault/Misc ---
    "resource_list": [],  # Terminal
    "resource_get": [],  # Terminal
    "resource_drivers": [],  # Terminal
    "vault_health": [],  # Terminal
    "vault_search": [],  # Terminal
    "vault_snapshot": [],  # Terminal
    "sensor_github_issue": [
        {"tool": "delimit_ledger_context", "reason": "Check ledger for outreach items", "premium": False},
    ],
    "evidence_collect": [
        {"tool": "delimit_evidence_verify", "reason": "Verify collected evidence", "premium": True},
    ],
    "evidence_verify": [],  # Terminal
    "generate_scaffold": [
        {"tool": "delimit_init", "reason": "Initialize governance for the new project", "premium": False},
    ],
    "generate_template": [],  # Terminal
    # --- Terminal tools ---
    "help": [],
    "version": [],
    "license_status": [],
    "activate": [],
    "ventures": [],
    "ledger": [],
    "ledger_list": [],
    "ledger_done": [
        {"tool": "delimit_ledger_context", "reason": "See what's next", "premium": False},
    ],
    "ledger_context": [],  # Entry point — don't chain from it
    "policy": [],
    "explain": [],
    "impact": [],
    "zero_spec": [
        {"tool": "delimit_lint", "reason": "Lint the extracted spec", "premium": False},
    ],
    "models": [],
    "story_build": [],
    "story_generate": [
        {"tool": "delimit_story_accessibility", "reason": "Check accessibility", "premium": False},
    ],
    # --- Design extras (not yet routed) ---
    "design_extract_tokens": [
        {"tool": "delimit_design_generate_tailwind", "reason": "Generate Tailwind config from tokens", "premium": False},
    ],
    "design_generate_tailwind": [
        {"tool": "delimit_design_validate_responsive", "reason": "Validate responsive design", "premium": False},
    ],
    # --- Test extras ---
    "test_smoke": [
        {"tool": "delimit_test_coverage", "reason": "Check coverage after smoke tests", "premium": False},
    ],
}


def govern(tool_name: str, result: Dict[str, Any], project_path: str = ".") -> Dict[str, Any]:
    """
    Run governance on a tool's result. This is the central loop.

    1. Check result against rules
    2. Auto-create ledger items if thresholds breached
    3. Add next_steps for the AI to continue
    4. Return enriched result

    Every tool should call this before returning.
    """
    # Strip "delimit_" prefix for rule matching
    clean_name = tool_name.replace("delimit_", "")

    governed_result = dict(result)

    # 1. Check governance rules
    rule = RULES.get(clean_name)
    auto_items = []

    if rule:
        triggered = False
        context = {}

        # Threshold check (e.g., coverage < 80%)
        if "threshold_key" in rule:
            value = _deep_get(result, rule["threshold_key"])
            if value is not None:
                threshold = rule["threshold"]
                if rule.get("comparison") == "below" and value < threshold:
                    triggered = True
                    context = {"value": f"{value:.1f}" if isinstance(value, float) else str(value), "threshold": str(threshold)}

        # Non-empty list check (e.g., vulnerabilities found)
        if "trigger_key" in rule and "trigger_if_nonempty" in rule:
            items = _deep_get(result, rule["trigger_key"])
            if items and isinstance(items, list) and len(items) > 0:
                triggered = True
                context = {"count": str(len(items))}

        # Value match check (e.g., status == "degraded")
        if "trigger_key" in rule and "trigger_values" in rule:
            value = _deep_get(result, rule["trigger_key"])
            if value in rule["trigger_values"]:
                triggered = True
                context = {"value": str(value)}

        # Boolean check (e.g., unanimous == True)
        if "trigger_key" in rule and "trigger_if_true" in rule:
            value = _deep_get(result, rule["trigger_key"])
            if value:
                triggered = True

        if triggered:
            title = rule["ledger_title"].format(**context) if context else rule["ledger_title"]
            auto_items.append({
                "title": title,
                "type": rule.get("ledger_type", "task"),
                "priority": rule.get("ledger_priority", "P1"),
                "source": f"governance:{clean_name}",
            })

    # 1b. Check milestone rules (auto-create DONE items for achievements)
    milestone = MILESTONES.get(clean_name)
    if milestone:
        m_triggered = False
        m_context = {}

        # Value match (e.g., status == "deployed")
        if "trigger_key" in milestone and "trigger_values" in milestone:
            value = _deep_get(result, milestone["trigger_key"])
            if value in milestone["trigger_values"]:
                m_triggered = True
                m_context = {"value": str(value)}

        # Boolean check (e.g., success == True)
        if "trigger_key" in milestone and milestone.get("trigger_if_true"):
            value = _deep_get(result, milestone["trigger_key"])
            if value:
                m_triggered = True

        # Threshold above (e.g., tests_generated > 10)
        if "threshold_key" in milestone:
            value = _deep_get(result, milestone["threshold_key"])
            if value is not None:
                threshold = milestone["threshold"]
                if milestone.get("comparison") == "above" and value > threshold:
                    m_triggered = True
                    m_context = {"value": str(value), "threshold": str(threshold)}

        if m_triggered:
            # Build context from result fields for title interpolation
            for key in ("project", "package", "new_version", "framework", "paths_count", "repo", "issue_number"):
                if key not in m_context:
                    v = _deep_get(result, key)
                    if v is not None:
                        m_context[key] = str(v)
            # Special: short question for deliberations
            if "question_short" not in m_context:
                q = _deep_get(result, "question") or _deep_get(result, "note") or ""
                m_context["question_short"] = str(q)[:80]

            try:
                title = milestone["ledger_title"].format(**m_context)
            except (KeyError, IndexError):
                title = milestone["ledger_title"]

            auto_items.append({
                "title": title,
                "type": milestone.get("ledger_type", "feat"),
                "priority": milestone.get("ledger_priority", "P1"),
                "source": f"milestone:{clean_name}",
                "auto_done": milestone.get("auto_done", True),
            })

    # 2. Auto-create ledger items (with dedup — skip if open item with same title exists)
    if auto_items:
        try:
            # Load existing open titles for dedup
            existing = _ledger_list_items(project_path=project_path)
            # items can be a list or dict of lists (by ledger type)
            all_items = []
            raw_items = existing.get("items", [])
            if isinstance(raw_items, dict):
                for ledger_items in raw_items.values():
                    if isinstance(ledger_items, list):
                        all_items.extend(ledger_items)
            elif isinstance(raw_items, list):
                all_items = raw_items
            open_titles = {
                i.get("title", "")
                for i in all_items
                if isinstance(i, dict) and i.get("status") == "open"
            }
            created = []
            test_mode = _is_test_mode()
            for item in auto_items:
                if item["title"] in open_titles:
                    logger.debug("Skipping duplicate ledger item: %s", item["title"])
                    continue
                if test_mode:
                    # In test mode, skip real ledger writes to avoid
                    # polluting the project ledger with mock/test data.
                    logger.debug("Test mode: skipping ledger write for %s", item["title"])
                    created.append(f"TEST-{item['title'][:40]}")
                    continue
                entry = _ledger_add_item(
                    title=item["title"],
                    type=item["type"],
                    priority=item["priority"],
                    source=item["source"],
                    project_path=project_path,
                )
                item_id = entry.get("added", {}).get("id", "")
                created.append(item_id)
                # Auto-close milestone items
                if item.get("auto_done") and item_id:
                    try:
                        _ = _ledger_update_item(item_id, status="done", project_path=project_path)
                    except Exception:
                        pass
            governed_result["governance"] = {
                "action": "ledger_items_created",
                "items": created,
                "reason": "Governance rule triggered by tool result",
            }
        except Exception as e:
            logger.warning("Governance auto-ledger failed: %s", e)

    # 3. Add governance-directed next steps
    steps = NEXT_STEPS.get(clean_name, [])
    if steps:
        governed_result["next_steps"] = steps

    # 4. GOVERNANCE LOOP: always route back to ledger_context
    # This is not a suggestion — it's how the loop works.
    # The AI should call ledger_context after every tool to check what's next.
    # Ledger tools now route through governance for next_steps but skip auto-create
    # (no rules/milestones defined for them, so no recursion risk)
    SKIP_GOVERNANCE_LOOP = ("ventures", "version", "help", "diagnose", "activate", "license_status", "models", "scan")
    if clean_name not in SKIP_GOVERNANCE_LOOP:
        if "next_steps" not in governed_result:
            governed_result["next_steps"] = []
        # Don't suggest ledger_context to itself (circular)
        if clean_name != "ledger_context":
            existing = {s.get("tool") for s in governed_result.get("next_steps", [])}
            if "delimit_ledger_context" not in existing:
                governed_result["next_steps"].insert(0, {
                    "tool": "delimit_ledger_context",
                    "reason": "GOVERNANCE LOOP: check ledger for next action",
                    "premium": False,
                    "required": True,
                })
    else:
        # Excluded tools still get the next_steps field (empty) for schema consistency
        if "next_steps" not in governed_result:
            governed_result["next_steps"] = []

    # LED-263: Beta CTA on successful lint/scan/activate/diff results
    cta = _maybe_beta_cta(clean_name, governed_result)
    if cta:
        governed_result["beta_cta"] = cta

    return governed_result


# ─────────────────────────────────────────────────────────────────────
# LED-2214b-followup — sensor_github_issue sync impl
# ─────────────────────────────────────────────────────────────────────
#
# The outreach daemon's monitor_phase needs to call the same logic that
# delimit_sensor_github_issue (MCP tool) runs, but synchronously and
# without the _with_next_steps wrapping. Before this extraction the
# daemon tried to import the impl from two paths that don't exist —
# `ai.governance._sensor_github_issue_impl` and
# `backends.governance_bridge.sensor_github_issue` — and silently fell
# back to "monitor skipped" on every tick, leaving the entire reply-
# tracking cycle dead.
#
# Now both callers share this function. The MCP tool wraps the result
# with `_with_next_steps`; the daemon consumes the raw dict.

_NEGATIVE_KEYWORDS = (
    "not interested", "won't be", "will not", "don't need", "do not need",
    "no thanks", "pass on", "not a fit", "not for us", "closing",
    "won't adopt", "will not adopt", "reject", "declined",
)

_REPO_FORMAT_RE = re.compile(r"^[\w.-]+/[\w.-]+$")

# Module-local guard so the warning fires at most once per process.
_REPO_ALLOWLIST_WARNED = False


def _check_repo_allowlist(repo: str) -> Optional[Dict[str, Any]]:
    """Return a refusal dict if the repo isn't in DELIMIT_ALLOWED_REPOS.

    Duplicates the logic of ai.server._check_repo_allowlist intentionally:
    importing from ai.server would create a circular import (server.py
    imports from governance). Mirror with care — both copies must stay
    in sync until LED-216 splits the allowlist into its own module.
    """
    global _REPO_ALLOWLIST_WARNED
    allowlist_raw = os.environ.get("DELIMIT_ALLOWED_REPOS", "").strip()
    if not allowlist_raw:
        if not _REPO_ALLOWLIST_WARNED:
            logger.warning(
                "DELIMIT_ALLOWED_REPOS unset — sensor_github_issue calls "
                "pass through to gh api using the caller's token."
            )
            _REPO_ALLOWLIST_WARNED = True
        return None
    allowed = {entry.strip().lower() for entry in allowlist_raw.split(",") if entry.strip()}
    if (repo or "").strip().lower() not in allowed:
        return {
            "error": "repo_not_allowlisted",
            "repo": repo,
            "allowed": sorted(allowed),
            "hint": (
                "Repo not in DELIMIT_ALLOWED_REPOS. Add it or use a tool "
                "that does not reach external APIs."
            ),
        }
    return None


def _sensor_github_issue_impl(
    repo: str,
    issue_number: int,
    since_comment_id: int = 0,
) -> Dict[str, Any]:
    """Sync implementation of the sensor_github_issue MCP tool.

    Returns the RAW result dict (no _with_next_steps wrapping). Callers
    that want the MCP wrapping apply it themselves. Returns
    ``{"error": ..., "has_new_activity": False}`` on any failure mode
    rather than raising — the outreach daemon's monitor loop relies on
    fail-soft behavior so one bad LED doesn't kill the whole tick.

    Result schema (success path):
      {
        "repo": str, "issue_number": str,
        "signal": {id, venture, metric, source, timestamp, severity},
        "issue_state": "open" | "closed" | "unknown",
        "new_comments": [{id, author, created_at, body}, ...],
        "latest_comment_id": int,
        "total_comments": int,
        "has_new_activity": bool,
      }
    """
    # Validate inputs — defense-in-depth even though subprocess.run with
    # list argv (no shell=True) makes classic injection inert.
    if not _REPO_FORMAT_RE.match(repo or ""):
        return {"error": f"Invalid repo format: {repo!r}. Use owner/repo.",
                "has_new_activity": False}
    if ".." in repo:
        return {"error": "Invalid repo: path traversal sequences not allowed",
                "has_new_activity": False}
    if not isinstance(issue_number, int) or issue_number <= 0:
        return {"error": f"Invalid issue number: {issue_number}",
                "has_new_activity": False}

    refusal = _check_repo_allowlist(repo)
    if refusal is not None:
        refusal.setdefault("has_new_activity", False)
        return refusal

    try:
        # Fetch comments
        comments_jq = (
            "[.[] | {id: .id, author: .user.login, "
            "created_at: .created_at, body: (.body | .[0:500])}]"
        )
        comments_proc = subprocess.run(
            ["gh", "api",
             f"repos/{repo}/issues/{issue_number}/comments",
             "--jq", comments_jq],
            capture_output=True, text=True, timeout=30,
        )
        if comments_proc.returncode != 0:
            return {
                "error": f"gh api comments failed: {(comments_proc.stderr or '').strip()[:200]}",
                "has_new_activity": False,
            }
        all_comments = json.loads(comments_proc.stdout) if comments_proc.stdout.strip() else []
        new_comments = [c for c in all_comments if c.get("id", 0) > since_comment_id]

        # Fetch issue state
        issue_jq = "{state: .state, labels: [.labels[].name], reactions: .reactions.total_count}"
        issue_proc = subprocess.run(
            ["gh", "api",
             f"repos/{repo}/issues/{issue_number}",
             "--jq", issue_jq],
            capture_output=True, text=True, timeout=30,
        )
        if issue_proc.returncode != 0:
            return {
                "error": f"gh api issue failed: {(issue_proc.stderr or '').strip()[:200]}",
                "has_new_activity": False,
            }
        issue_info = json.loads(issue_proc.stdout) if issue_proc.stdout.strip() else {}
        issue_state = issue_info.get("state", "unknown")

        # Severity classification — green default; amber on closed; red on
        # negative keyword in any new comment body.
        severity = "green"
        combined_body = " ".join(c.get("body", "") or "" for c in new_comments).lower()
        has_negative = any(kw in combined_body for kw in _NEGATIVE_KEYWORDS)
        if has_negative:
            severity = "red"
        elif issue_state == "closed":
            severity = "amber"

        latest_comment_id = max((c.get("id", 0) for c in all_comments), default=since_comment_id)
        repo_key = repo.replace("/", "_")

        return {
            "repo": repo,
            "issue_number": str(issue_number),
            "signal": {
                "id": f"sensor:github_issue:{repo_key}:{issue_number}",
                "venture": "delimit",
                "metric": "outreach_issue_activity",
                "source": f"https://github.com/{repo}/issues/{issue_number}",
                "timestamp": datetime.now(timezone.utc).isoformat(),
                "severity": severity,
            },
            "issue_state": issue_state,
            "new_comments": new_comments,
            "latest_comment_id": latest_comment_id,
            "total_comments": len(all_comments),
            "has_new_activity": len(new_comments) > 0,
        }
    except subprocess.TimeoutExpired:
        return {"error": "gh command timed out after 30s",
                "has_new_activity": False}
    except json.JSONDecodeError as exc:
        return {"error": f"Failed to parse gh output: {exc}",
                "has_new_activity": False}
    except Exception as exc:  # noqa: BLE001 — sensor must fail soft
        logger.error("sensor_github_issue impl error: %s", exc)
        return {"error": str(exc), "has_new_activity": False}


def _deep_get(d: Dict, key: str) -> Any:
    """Get a value from a dict, supporting nested keys with dots."""
    if "." in key:
        parts = key.split(".", 1)
        sub = d.get(parts[0])
        if isinstance(sub, dict):
            return _deep_get(sub, parts[1])
        return None

    # Check top-level and common nested locations
    if key in d:
        return d[key]
    # Check inside 'data', 'result', 'overall_coverage'
    for wrapper in ["data", "result", "overall_coverage", "summary"]:
        if isinstance(d.get(wrapper), dict) and key in d[wrapper]:
            return d[wrapper][key]
    return None
