#!/usr/bin/env node
/**
 * budget-enforcer.ts — PreToolUse hook (matcher: Agent)
 *
 * Phase 20 Plan 20-13 rewrite: the original budget-enforcer.js is ported
 * to TypeScript verbatim in behavior and additionally wires up the event
 * stream as a hook.fired emitter. No policy changes; the enforcement
 * branches (enforce / warn / log) and telemetry row shape (OPT-09) are
 * preserved byte-for-byte against the .js source.
 *
 * Intercepts every Agent tool spawn. Consults:
 *   (a) router decision (from tool_input.context.router_decision if supplied)
 *   (b) .design/cache-manifest.json for short-circuit cached answers (D-05)
 *   (c) .design/budget.json for tier_overrides + caps (D-01, D-04, D-10)
 *
 * Enforcement (D-02, D-03, D-11):
 *   - enforcement_mode: "enforce" + 100% cap → block with actionable error
 *   - enforcement_mode: "enforce" + 80% soft-threshold + auto_downgrade_on_cap → rewrite tier to haiku
 *   - enforcement_mode: "warn" → log warning, allow spawn
 *   - enforcement_mode: "log" → advisory only
 *
 * Logs every decision to .design/telemetry/costs.jsonl (OPT-09 schema).
 * Every telemetry write fires a detached child aggregator
 * (scripts/aggregate-agent-metrics.ts) that rebuilds
 * .design/agent-metrics.json incrementally.
 *
 * Every decision also fires a hook.fired event to
 * .design/telemetry/events.jsonl via appendEvent() (Plan 20-06). The
 * event payload uses the pre-registered HookFiredEvent shape with
 * hook="budget-enforcer" and decision in
 * {block|downgrade|warn|log|cache|allow|lazy|rate-limited}.
 *
 * Plan 20-14 note: Plan 20-14 patches this hook with a rate-guard check
 * before spawn (surfaced as the `rate-limited` decision). The file exposes
 * a `main()` entrypoint and keeps policy pure-ish so that insertion is an
 * additive change.
 *
 * Hook type: PreToolUse
 * Input:  JSON on stdin { tool_name, tool_input }
 * Output: JSON on stdout { continue, suppressOutput, message, modified_tool_input? }
 */

import { existsSync, mkdirSync, readFileSync, appendFileSync } from 'node:fs';
import { join, dirname, isAbsolute, resolve } from 'node:path';
import { spawn } from 'node:child_process';
import { createInterface } from 'node:readline';
import { createRequire } from 'node:module';

import { appendEvent } from '../sdk/event-stream/index.ts';
import type { HookFiredEvent } from '../sdk/event-stream/index.ts';
// Consume the generated BudgetSchema so this hook participates in the
// Plan 20-00 codegen graph. We treat parsed JSON as BudgetSchema after
// the structural merge with defaults — the schema permits every field
// to be optional so defaults-merged objects are always valid.
import type { BudgetSchema } from '../reference/schemas/generated.js';

// Plan 20-14 resilience primitives. These are `.cjs` modules so that
// `.cjs`-only call sites (future CLIs) can consume them without
// --experimental-strip-types. From this file — which runs as an ES
// module under strip-types — we reach them via `createRequire`
// anchored on an absolute filesystem path derived from `process.argv[1]`
// (identical pattern to `hooks/gdd-read-injection-scanner.ts`'s
// loadPatterns). We deliberately avoid `import.meta.url` so this
// module stays compatible with the `Node16` tsconfig module setting
// without forcing `"type":"module"` in package.json (which would
// break the Tier-2 .cjs tests per Plan 20-00).
/**
 * Absolute path of the running hook script; used as the anchor for
 * `createRequire` and for other lookups relative to the hook file.
 *
 * Prefers `process.argv[1]` (made absolute against the cwd when it is
 * relative). When that entry is missing or empty, falls back to
 * `hooks/budget-enforcer.ts` resolved against the cwd.
 */
function resolveHookPath(): string {
  const scriptArg: unknown = process.argv[1];
  if (typeof scriptArg !== 'string' || scriptArg === '') {
    return resolve('hooks/budget-enforcer.ts');
  }
  if (isAbsolute(scriptArg)) return scriptArg;
  return resolve(scriptArg);
}
// CommonJS `require` anchored on the path returned by resolveHookPath(), so
// the relative `.cjs` specifiers below resolve against that file's directory.
const nodeRequire = createRequire(resolveHookPath());
// Both modules are loaded eagerly while this module is evaluated; the casts
// borrow each module's own declared type via `typeof import(...)`.
const rateGuard = nodeRequire('../scripts/lib/rate-guard.cjs') as typeof import('../scripts/lib/rate-guard.cjs');
const iterationBudget = nodeRequire('../sdk/primitives/iteration-budget.cjs') as typeof import('../sdk/primitives/iteration-budget.cjs');
// Plan 26-05: shared cost-computation backend for the resolved_models
// consumer path. Pure module — takes (model_id, runtime, token_counts) →
// cost_usd by reading per-runtime price tables under reference/prices/.
// See scripts/lib/budget-enforcer.cjs for the lookup chain.
/**
 * Hand-written type surface for scripts/lib/budget-enforcer.cjs. Only the
 * members declared here are visible to this hook; the implementations live
 * in the .cjs module.
 */
interface BudgetEnforcerBackend {
  /**
   * Compute the cost of one spawn from its model/tier, runtime and token
   * counts. `cost_usd` may be null in the result. NOTE(review): the exact
   * meaning of `fallback` / `reason` is defined by the .cjs backend, not
   * visible here.
   */
  computeCost(args: {
    model_id?: string | null;
    tier?: string | null;
    runtime: string;
    tokens_in: number;
    tokens_out: number;
    cache_hit?: boolean;
  }): {
    cost_usd: number | null;
    model: string | null;
    tier: string | null;
    runtime_used: string | null;
    fallback: boolean;
    reason: string | null;
    // Phase 59-9: true when the cost is a CONSERVATIVE ESTIMATE (opus ceiling)
    // for an unknown/new model rather than a table-matched figure. Additive +
    // optional — absent on the table-matched (branches 1-4) paths.
    cost_estimated?: boolean;
  };
  /**
   * Returns a model id string or null for `agent` given an untyped
   * `resolved` value — presumably the router's `resolved_models` map;
   * verify against the .cjs implementation.
   */
  modelFromResolved(resolved: unknown, agent: string): string | null;
  // Plan 33.6-03 (SC#6): the canonical cost-row payload builder (the
  // types.ts:237-designated emit site). Threads the optional `provider` tag
  // ("openrouter" when the OpenRouter adapter resolved the model), omitting it
  // when absent (back-compat).
  buildCostEventPayload(args: {
    runtime: string;
    agent: string;
    model_id: string | null;
    tier: string | null;
    tokens_in: number;
    tokens_out: number;
    cost_usd: number | null;
    runtime_role?: 'host' | 'peer';
    peer_id?: string | null;
    provider?: string;
  }): Record<string, unknown>;
}
// Loaded eagerly through the hook-anchored require; the cast is unchecked, so
// the interface above must be kept in step with the .cjs module by hand.
const budgetBackend = nodeRequire('../scripts/lib/budget-enforcer.cjs') as BudgetEnforcerBackend;
// Plan 26-05: runtime detection for the cost-event runtime tag. Returns
// 'claude' for the CC hook context (CLAUDE_CONFIG_DIR is set when CC is
// the host), null when running outside any of the 14 runtime envs (e.g.
// CI matrix). The hook defaults the null case to 'claude' since the .ts
// hook only runs inside CC anyway.
/** Type surface for scripts/lib/runtime-detect.cjs as consumed by this hook. */
interface RuntimeDetectModule {
  /** Runtime id of the current host, or null when no runtime is detected. */
  detect(): string | null;
}
// Loaded eagerly through the hook-anchored require (unchecked cast).
const runtimeDetect = nodeRequire('../scripts/lib/runtime-detect.cjs') as RuntimeDetectModule;

// Plan 27.5-01: bandit production-integration shim. Hides pull /
// pullWithDelegate choice from the hook; reads adaptive_mode + frontmatter
// tier_override under the same gating discipline as Phase 23.5 D-07 and
// Phase 27.5 D-05.
/** Type surface for scripts/lib/bandit-router/integration.cjs. */
interface BanditIntegrationModule {
  /**
   * Ask the shim for a tier for one (agent, bin, delegate) triple. The
   * result carries the chosen tier plus a `decision_log` whose `source`
   * names which path produced it (frontmatter, tier-override bypass, or one
   * of the two bandit pulls).
   */
  consultBandit(args: {
    agent: string;
    bin: string;
    delegate: string;
    agentFrontmatter: { tier_override?: string; default_tier?: string };
    adaptiveMode?: 'static' | 'hedge' | 'full';
    baseDir?: string;
    posteriorPath?: string;
  }): {
    tier: 'haiku' | 'sonnet' | 'opus';
    decision_log: {
      source:
        | 'frontmatter'
        | 'tier_override_bypass'
        | 'bandit_pull'
        | 'bandit_pull_with_delegate';
      samples?: Record<string, number> | Record<string, Record<string, number>>;
      delegate?: string;
      adaptive_mode: 'static' | 'hedge' | 'full';
      reason?: string;
    };
  };
  /** Outcome feedback hook; the argument shape is left untyped here. */
  recordOutcome(args: unknown): void;
  /** Sentinel delegate value; its literal type is the string 'none'. */
  DELEGATE_NONE: 'none';
}
// Loaded eagerly through the hook-anchored require (unchecked cast).
const banditIntegration = nodeRequire(
  '../scripts/lib/bandit-router/integration.cjs',
) as BanditIntegrationModule;

// Plan 27.5-02: adaptive-mode module surfaces the single gating predicate.
/** Type surface for scripts/lib/adaptive-mode.cjs. */
interface AdaptiveModeModule {
  /** Current adaptive mode; every option is optional. */
  getMode(opts?: {
    baseDir?: string;
    budgetPath?: string;
    quiet?: boolean;
  }): 'static' | 'hedge' | 'full';
  /**
   * Boolean gate for bandit use. NOTE(review): how it maps onto the three
   * modes is decided in the .cjs module — confirm there.
   */
  isBanditEnabled(opts?: { baseDir?: string; budgetPath?: string }): boolean;
}
// Loaded eagerly through the hook-anchored require (unchecked cast).
const adaptiveMode = nodeRequire(
  '../scripts/lib/adaptive-mode.cjs',
) as AdaptiveModeModule;

// Plan 27.5-02: bin selection helper for bandit (agent, bin) addressing.
// budget-enforcer doesn't currently surface glob_count; default to 'medium'
// as a safe per-agent partition until a future plan wires the real count.
/** Type surface for scripts/lib/bandit-router.cjs (bin helper + delegate list). */
interface BanditRouterCoreModule {
  /** Maps a glob count onto one of the four named size bins. */
  binForGlobCount(n: number): 'tiny' | 'small' | 'medium' | 'large';
  /** Read-only list of delegate names exported by the router core. */
  DEFAULT_DELEGATES: readonly string[];
}
// Loaded eagerly through the hook-anchored require (unchecked cast).
const banditRouterCore = nodeRequire(
  '../scripts/lib/bandit-router.cjs',
) as BanditRouterCoreModule;

// Plan 27.5-02: tier-resolver translates bandit tier → concrete model.
/** Type surface for scripts/lib/tier-resolver.cjs. */
interface TierResolverModule {
  /**
   * Translate a (runtime, tier) pair into a concrete model name; null is a
   * possible result and must be handled by the caller.
   */
  resolve(
    runtime: string,
    tier: string,
    opts?: { silent?: boolean },
  ): string | null;
}
// Loaded eagerly through the hook-anchored require (unchecked cast).
const tierResolver = nodeRequire(
  '../scripts/lib/tier-resolver.cjs',
) as TierResolverModule;

// Phase 59.5 P1: runtime-models parser for the BYOK/unverified provenance
// guard. We read the parsed runtime rows to learn a runtime's `status`
// ("verified" | "byok" | "unverified"). The parser is pure + never invoked
// for its model-resolution side here; only to classify the runtime so an
// unverified row never drives a HARD budget cap. Soft-imported defensively:
// any parser failure degrades to the built-in verified allowlist below.
/** Type surface for scripts/lib/install/parse-runtime-models.cjs. */
interface RuntimeModelsParserModule {
  /**
   * Parse the runtime-models doc. Only each row's `id` and optional `status`
   * are typed because that is all runtimeStatus() reads.
   */
  parseRuntimeModels(opts?: { cwd?: string }): {
    runtimes: Array<{ id: string; status?: string }>;
  };
}
// The module itself is required eagerly; the "soft" handling mentioned above
// is the try/catch around parseRuntimeModels() inside runtimeStatus().
const runtimeModelsParser = nodeRequire(
  '../scripts/lib/install/parse-runtime-models.cjs',
) as RuntimeModelsParserModule;

// Plan 33.6-03 (SC#6, D-08, D-12): OpenRouter tier-resolver adapter. When the
// user opts in (`.design/config.json#openrouter_enabled: true` OR
// `OPENROUTER_API_KEY` present), the hook consults this adapter FIRST for a
// resolved model; a non-null result routes to OpenRouter and tags the cost row
// `provider: "openrouter"`, a null result falls back to the native resolution
// path (unchanged default behavior). `resolve(tier, opts)` never throws.
/** Type surface for scripts/lib/tier-resolver-openrouter.cjs. */
interface TierResolverOpenRouterModule {
  /**
   * Resolve a tier to a model id, or null when there is no resolution. All
   * options are optional; `catalog`, `models` and `overrides` are untyped
   * here.
   */
  resolve(
    tier: string,
    opts?: { catalog?: unknown; models?: unknown; overrides?: unknown; cachePath?: string; configPath?: string; cwd?: string },
  ): string | null;
}
// Loaded eagerly through the hook-anchored require (unchecked cast).
const tierResolverOpenRouter = nodeRequire(
  '../scripts/lib/tier-resolver-openrouter.cjs',
) as TierResolverOpenRouterModule;

// Phase 39.2 D-04: project-level cap classifier (pure). Keeping the threshold
// math in scripts/lib/budget/project-cap.cjs (out of this hook) mirrors how the
// hook already delegates cost computation to scripts/lib/budget-enforcer.cjs,
// and makes the 50/80/100 thresholds unit-testable. The hook only reads the
// running project spend and asks this module what to do.
/**
 * Result of classifying project spend against the project cap.
 * NOTE(review): the scale of `pct` (0–1 vs 0–100) and the meaning of
 * `enabled` are set by project-cap.cjs — confirm there before using them.
 */
interface ProjectCapClassification {
  enabled: boolean;
  pct: number;
  // Named threshold bucket; the names mirror the 50/80/100 thresholds.
  level: 'ok' | 'warn-50' | 'warn-80' | 'halt';
  cap: number;
  spend: number;
}
/** Type surface for scripts/lib/budget/project-cap.cjs. */
interface ProjectCapModule {
  /** Classify a running spend against a cap (both in USD per the names). */
  classifyProjectBudget(spendUsd: number, capUsd: number): ProjectCapClassification;
  /** Whether the spawn should be halted for this classification and mode. */
  shouldHalt(c: ProjectCapClassification | null, enforcementMode: string): boolean;
  /** Message for the classification, or null when there is none. */
  capMessage(c: ProjectCapClassification | null): string | null;
}
// Loaded eagerly through the hook-anchored require (unchecked cast).
const projectCap = nodeRequire(
  '../scripts/lib/budget/project-cap.cjs',
) as ProjectCapModule;

/**
 * Plan 33.6-03 (SC#6 opt-in): decide whether the OpenRouter adapter may be
 * consulted. Opt-in is signalled by either of:
 *   - a non-empty `OPENROUTER_API_KEY` environment variable, or
 *   - `.design/config.json` containing `openrouter_enabled: true` (the
 *     boolean literal; any other value, including the string "true", does
 *     not count).
 *
 * Best-effort and never throws: a missing, unreadable or corrupt config is
 * treated as "not enabled", leaving the env var as the only opt-in. Users
 * who do neither keep the default (no OpenRouter) behavior (D-08, D-12).
 *
 * @param cwd base dir containing `.design/config.json` (default process.cwd())
 * @returns true when OpenRouter resolution is opted in
 */
function isOpenRouterEnabled(cwd?: string): boolean {
  const apiKey = process.env.OPENROUTER_API_KEY;
  if (typeof apiKey === 'string' && apiKey.length > 0) return true;

  try {
    const baseDir = cwd ?? process.cwd();
    const configFile = join(baseDir, '.design', 'config.json');
    if (!existsSync(configFile)) return false;
    const config = JSON.parse(readFileSync(configFile, 'utf8')) as {
      openrouter_enabled?: unknown;
    } | null;
    // Strict identity check: only the JSON boolean `true` opts in.
    return config?.openrouter_enabled === true;
  } catch {
    return false;
  }
}

// ── Types ───────────────────────────────────────────────────────────────────

/**
 * PreToolUse stdin envelope (typed as `HookStdin` / `ToolInput`, declared
 * further down in this section). Claude Code injects tool_name + tool_input
 * for every hook invocation. The tool_input shape is tool-specific;
 * this hook only consumes Agent-shaped tool_input so we narrow here.
 */
/**
 * Phase 25 / D-04, D-05: router complexity-class enum. Arrives on
 * `RouterDecision.complexity_class` and keys the optional `class_caps_usd`
 * map read by readClassCaps().
 */
export type ComplexityClass = 'S' | 'M' | 'L' | 'XL';

/**
 * Phase 25 / D-05: router decision payload as surfaced on
 * tool_input.context.router_decision. Only the fields this hook reads
 * are typed; the router emits more (model_tier_overrides,
 * estimated_cost_usd, cache_hits) but they are not consumed here.
 * The index signature admits any additional router fields as `unknown`.
 */
interface RouterDecision {
  /** Router path selection. NOTE(review): not read anywhere in this section. */
  path?: 'fast' | 'quick' | 'full';
  /**
   * Complexity class of the task; when present it can select a per-class cap
   * via resolvePerSpawnCap().
   */
  complexity_class?: ComplexityClass;
  /**
   * Phase 26 / D-07: per-agent concrete model name resolved by the
   * router via `scripts/lib/tier-resolver.cjs`. Strict superset of
   * `model_tier_overrides` — existing consumers still read tier names
   * from `model_tier_overrides`; new consumers read `resolved_models`
   * for runtime-correct cost lookup.
   */
  resolved_models?: Record<string, string>;
  /**
   * Phase 26 / D-08: runtime ID the router computed `resolved_models`
   * against. Optional; the hook falls back to `runtime-detect.cjs`
   * when absent.
   */
  runtime?: string;
  /**
   * Phase 25 back-compat: tier-name overrides per agent. Phase 26 keeps
   * this as the legacy fallback path when `resolved_models` is absent.
   */
  model_tier_overrides?: Record<string, string>;
  [key: string]: unknown;
}

/**
 * `tool_input.context`: carries the optional router decision; any other
 * keys are admitted as `unknown`.
 */
interface ToolInputContext {
  router_decision?: RouterDecision;
  [key: string]: unknown;
}

/**
 * Agent-shaped `tool_input`. Every field is optional and the index signature
 * admits extra keys. The underscore-prefixed fields look like estimates and
 * hints supplied alongside the spawn (input hash, estimated cost/tokens,
 * tier hints) — NOTE(review): their producers and consumers are outside this
 * section; confirm before relying on them.
 */
interface ToolInput {
  // Two alternative agent-name fields. NOTE(review): precedence between them
  // is decided by the caller, not visible here.
  subagent_type?: string;
  agent?: string;
  _input_hash?: string;
  _est_cost_usd?: number;
  _tokens_in_est?: number;
  _tokens_out_est?: number;
  _tier_override?: string;
  _default_tier?: string;
  _tier_downgraded?: boolean;
  lazy_skipped?: boolean;
  context?: ToolInputContext;
  [key: string]: unknown;
}

/**
 * JSON object read from stdin for each hook invocation: the tool name plus
 * its tool-specific input. Both are optional at the type level, so callers
 * must guard against their absence.
 */
interface HookStdin {
  tool_name?: string;
  tool_input?: ToolInput;
  [key: string]: unknown;
}

/**
 * PreToolUse stdout envelope (this hook is registered as PreToolUse, and
 * `hookSpecificOutput.hookEventName` below is fixed to 'PreToolUse'). The
 * `continue` field is the primary dispatch knob; `modified_tool_input` is
 * the legacy channel for injecting tier overrides — see the note on
 * `hookSpecificOutput` for the channel current Claude Code honors.
 */
interface ToolOutput {
  continue: boolean;
  suppressOutput?: boolean;
  message?: string;
  stopReason?: string;
  modified_tool_input?: ToolInput;
  cached_result?: unknown;
  /**
   * Claude Code PreToolUse hook-specific envelope. This is the ONLY
   * supported mechanism on current Claude Code for mutating a tool's
   * input (`updatedInput`) or blocking a call (`permissionDecision`).
   * The top-level `modified_tool_input` / `cached_result` fields are
   * retained for backward-compat but are silently ignored by the harness.
   */
  hookSpecificOutput?: {
    hookEventName: 'PreToolUse';
    permissionDecision?: 'allow' | 'deny' | 'ask';
    permissionDecisionReason?: string;
    updatedInput?: ToolInput;
  };
}

/**
 * Shape of .design/cache-manifest.json — D-05 cache short-circuit.
 * One entry per cached answer; cacheLookup() compares `ts_unix` (seconds,
 * since it is subtracted from `Date.now() / 1000`) against the TTL.
 */
interface CacheManifestEntry {
  ts_unix: number;
  result: unknown;
}
/**
 * Manifest root. `entries` is keyed by `${agent}:${inputHash}` (the key
 * cacheLookup() builds); `ttl_seconds` falls back to 3600 there when absent.
 */
interface CacheManifest {
  ttl_seconds?: number;
  entries?: Record<string, CacheManifestEntry>;
}

/**
 * Shape of .design/telemetry/phase-totals.json — WR-02 fast path.
 * `totals` maps a phase name to its accumulated spend; currentPhaseSpend()
 * treats a missing phase key as 0.
 */
interface PhaseTotals {
  totals?: Record<string, number>;
}

/**
 * OPT-09 telemetry row (partial — aggregator enforces required fields).
 * Input to buildTelemetryRow(), which fills every missing required field
 * with a default and copies the optional flags only when they are set.
 */
interface TelemetryRowPartial {
  ts?: string;
  agent?: string;
  tier?: string;
  tokens_in?: number;
  tokens_out?: number;
  cache_hit?: boolean;
  est_cost_usd?: number;
  cycle?: string;
  phase?: string;
  tier_downgraded?: boolean;
  enforcement_mode?: string;
  lazy_skipped?: boolean;
  block_reason?: string;
  // Pre-read cycle/phase pair. When supplied, buildTelemetryRow() uses it
  // instead of re-reading STATE.md; it is never written to the row itself.
  _cyclePhase?: { cycle: string; phase: string };
}

/**
 * The hook's terminal decision — also the event payload `decision` field
 * passed to emitHookFired().
 * `'rate-limited'` was added in Plan 20-14 to signal that rate-guard
 * saw an upstream provider hit its limit and the hook short-circuited
 * before the budget cap check.
 * `'block'`, `'downgrade'`, `'warn'` and `'log'` correspond to the
 * enforcement branches listed in the file header (D-02, D-03, D-11).
 */
export type HookDecision =
  | 'lazy'
  | 'cache'
  | 'rate-limited'
  | 'block'
  | 'downgrade'
  | 'warn'
  | 'log'
  | 'allow';

// ── Constants ───────────────────────────────────────────────────────────────

// All paths below are resolved once, at module load, against process.cwd().

// Budget config read by loadBudget().
const BUDGET_PATH = join(process.cwd(), '.design', 'budget.json');
// Cache manifest read by cacheLookup().
const MANIFEST_PATH = join(process.cwd(), '.design', 'cache-manifest.json');
// Append-only cost ledger: written by writeTelemetry(), replayed by the
// spend readers when no totals file is available.
const TELEMETRY_PATH = join(
  process.cwd(),
  '.design',
  'telemetry',
  'costs.jsonl',
);
// Per-phase rollup read by currentPhaseSpend() as its fast path.
const PHASE_TOTALS_PATH = join(
  process.cwd(),
  '.design',
  'telemetry',
  'phase-totals.json',
);
// Phase 39.2 D-04: optional fast-path for the running project spend, mirroring
// PHASE_TOTALS_PATH. When absent the hook replays costs.jsonl (the project cap
// is opt-in, so this replay only happens for users who set project_cap_usd).
const PROJECT_TOTALS_PATH = join(
  process.cwd(),
  '.design',
  'telemetry',
  'project-totals.json',
);
// STATE.md whose frontmatter supplies `cycle:` / `phase:` (readCycleAndPhase()).
const STATE_PATH = join(process.cwd(), '.design', 'STATE.md');

/**
 * Defaults per D-12 — mirror scripts/bootstrap.sh budget.json bootstrap.
 * loadBudget() spreads these first and the parsed budget.json on top, so a
 * key present in the file replaces the default here.
 */
const BUDGET_DEFAULTS: Required<
  Pick<
    BudgetSchema,
    | 'per_task_cap_usd'
    | 'per_phase_cap_usd'
    | 'tier_overrides'
    | 'auto_downgrade_on_cap'
    | 'cache_ttl_seconds'
    | 'enforcement_mode'
    | 'project_cap_usd'
  >
> = {
  // Per-spawn cap used by resolvePerSpawnCap() when no class cap applies.
  per_task_cap_usd: 2.0,
  per_phase_cap_usd: 20.0,
  // No per-agent tier overrides by default (see resolveTier()).
  tier_overrides: {},
  auto_downgrade_on_cap: true,
  // NOTE(review): cacheLookup() reads the manifest's own `ttl_seconds`, not
  // this value; where this default is consumed is not visible in this section.
  cache_ttl_seconds: 3600,
  enforcement_mode: 'enforce',
  // Phase 39.2 D-04: project-level cap is DISABLED by default (0). Existing
  // users — who have no project_cap_usd in budget.json — see zero behavior
  // change. project_cap_enforcement_mode stays optional and falls back to
  // enforcement_mode at the use-site.
  project_cap_usd: 0,
};

/**
 * Phase 25 / D-05: optional per-class cap map on .design/budget.json.
 * Documented in reference/config-schema.md as `class_caps_usd?: { S?: number; M?: number; L?: number; XL?: number }`.
 * Read through a cast rather than a schema field so the generated schema
 * does not have to be regenerated for an additive optional key.
 */
type ClassCapsUsd = Partial<Record<ComplexityClass, number>>;

/**
 * Extract the usable per-class caps from a budget object.
 *
 * @returns undefined when `class_caps_usd` is absent, null or not an object;
 *          otherwise a map holding only the classes whose cap is a finite,
 *          strictly positive number (the map may be empty).
 */
function readClassCaps(budget: BudgetSchema): ClassCapsUsd | undefined {
  const candidate = (budget as { class_caps_usd?: unknown }).class_caps_usd;
  if (typeof candidate !== 'object' || candidate === null) return undefined;

  const table = candidate as Record<string, unknown>;
  const caps: ClassCapsUsd = {};
  (['S', 'M', 'L', 'XL'] as const).forEach((cls) => {
    const value = table[cls];
    if (typeof value !== 'number') return;
    if (!Number.isFinite(value) || value <= 0) return;
    caps[cls] = value;
  });
  return caps;
}

/**
 * Phase 25 / D-05: pick the cap that applies to a single spawn.
 *
 * A class-specific cap wins when the router supplied a `complexity_class`
 * AND `.design/budget.json#class_caps_usd[class]` holds a usable value;
 * in every other case the flat `per_task_cap_usd` applies.
 *
 * @param budget          defaults-merged budget
 * @param complexityClass class from the router decision, if any
 * @returns the cap in USD for this spawn
 */
function resolvePerSpawnCap(
  budget: ResolvedBudget,
  complexityClass: ComplexityClass | undefined,
): number {
  if (complexityClass === undefined) return budget.per_task_cap_usd;
  const override = readClassCaps(budget)?.[complexityClass];
  return override === undefined ? budget.per_task_cap_usd : override;
}

/**
 * Concrete budget shape after defaults-merge. Every field listed in
 * BUDGET_DEFAULTS becomes non-optional so downstream branches don't have to
 * null-guard. Defined as an intersection of BudgetSchema (to keep the
 * generated-type graph edge alive) and the type of BUDGET_DEFAULTS. This is
 * the return type of loadBudget().
 */
type ResolvedBudget = BudgetSchema & typeof BUDGET_DEFAULTS;

// ── budget.json loader ──────────────────────────────────────────────────────

/**
 * Load .design/budget.json with defaults-merge. Returns the defaults
 * when the file is missing, unparseable, or does not contain a JSON object —
 * fail-open is the documented D-12 behavior so a missing budget file never
 * blocks agent spawns.
 *
 * Keys whose value is an explicit JSON `null` are ignored, so they fall back
 * to the default instead of replacing it. Without this, `"per_task_cap_usd":
 * null` would reach the cap comparisons as `null` even though ResolvedBudget
 * promises a number there.
 *
 * @returns a fresh object; BUDGET_DEFAULTS itself is never handed out.
 */
export function loadBudget(): ResolvedBudget {
  if (!existsSync(BUDGET_PATH)) {
    return { ...BUDGET_DEFAULTS };
  }
  try {
    const parsed: unknown = JSON.parse(readFileSync(BUDGET_PATH, 'utf8'));
    // Only a plain JSON object can carry budget keys; arrays and primitives
    // are treated like an unparseable file.
    if (parsed === null || typeof parsed !== 'object' || Array.isArray(parsed)) {
      return { ...BUDGET_DEFAULTS };
    }
    const overrides: Record<string, unknown> = {};
    for (const [key, value] of Object.entries(parsed)) {
      if (value !== null && value !== undefined) overrides[key] = value;
    }
    return { ...BUDGET_DEFAULTS, ...(overrides as Partial<BudgetSchema>) };
  } catch {
    return { ...BUDGET_DEFAULTS };
  }
}

// ── runtime provenance status (Phase 59.5 P1) ───────────────────────────────

/**
 * Phase 59.5 P1: provenance confidence of a runtime's tier→model row, as
 * documented in reference/runtime-models.md and enumerated by
 * reference/schemas/runtime-models.schema.json#status.
 * isUnverifiedRuntime() treats both 'byok' and 'unverified' as not
 * eligible to drive a hard cap.
 */
export type RuntimeStatus = 'verified' | 'byok' | 'unverified';

/**
 * Built-in verified allowlist: the 4 runtimes whose tier maps are confirmed
 * against runtime-author docs (the runtime-models.md banner: "4 of 14 ...
 * verified (claude, codex, gemini, qwen)"). Used as the fallback classifier
 * when the parsed row carries no structured `status` field yet (the markdown
 * JSON blocks do not emit `status` at the time of this plan; the schema is
 * ready, the parser wiring is a deferred follow-up). Once a row DOES carry
 * `status`, the parsed value takes precedence over this allowlist.
 * Membership is an exact string match on the runtime id.
 */
const VERIFIED_RUNTIME_IDS: ReadonlySet<string> = new Set([
  'claude',
  'codex',
  'gemini',
  'qwen',
]);

/**
 * Per-process memo of runtime-id → parsed `status` (null until first read).
 * Filled lazily by runtimeStatus(); only rows with a string id and a valid
 * status are stored, so a lookup miss means "no structured status".
 */
let _runtimeStatusMap: Map<string, RuntimeStatus> | null = null;

/** Type guard: true only for the three literal status strings. */
function isRuntimeStatus(v: unknown): v is RuntimeStatus {
  switch (v) {
    case 'verified':
    case 'byok':
    case 'unverified':
      return true;
    default:
      return false;
  }
}

/**
 * Classify a runtime by provenance status.
 *
 * The runtime-models doc is parsed at most once per process and memoized in
 * `_runtimeStatusMap`. A row that carries a valid structured `status` wins;
 * otherwise the built-in allowlist decides between 'verified' and
 * 'unverified'. Fail-open: if the parser throws, whatever was collected so
 * far is kept and the allowlist covers the rest. Never throws.
 *
 * @param runtimeId runtime id (e.g. 'claude', 'cline'); falsy → 'unverified'.
 * @returns the runtime's status
 */
export function runtimeStatus(runtimeId: string | null | undefined): RuntimeStatus {
  if (typeof runtimeId !== 'string' || runtimeId.length === 0) return 'unverified';

  let statusById = _runtimeStatusMap;
  if (statusById === null) {
    // Publish the memo before parsing so a parser failure is not retried.
    statusById = new Map<string, RuntimeStatus>();
    _runtimeStatusMap = statusById;
    try {
      const doc = runtimeModelsParser.parseRuntimeModels({ cwd: process.cwd() });
      const rows = Array.isArray(doc?.runtimes) ? doc.runtimes : [];
      for (const row of rows) {
        if (!row || typeof row.id !== 'string') continue;
        if (isRuntimeStatus(row.status)) statusById.set(row.id, row.status);
      }
    } catch {
      // Fail open: parser error degrades to the verified allowlist below.
    }
  }

  const fromDoc = statusById.get(runtimeId);
  if (fromDoc !== undefined) return fromDoc;
  if (VERIFIED_RUNTIME_IDS.has(runtimeId)) return 'verified';
  return 'unverified';
}

/**
 * P1 guard: true when the runtime's row must NOT drive a HARD budget cap,
 * i.e. its status is 'byok' or 'unverified'.
 */
export function isUnverifiedRuntime(runtimeId: string | null | undefined): boolean {
  switch (runtimeStatus(runtimeId)) {
    case 'byok':
    case 'unverified':
      return true;
    default:
      return false;
  }
}

// ── cumulative phase spend (WR-02) ──────────────────────────────────────────

/**
 * Cumulative estimated spend for one phase (WR-02).
 *
 * Fast path: read phase-totals.json (written by
 * scripts/aggregate-agent-metrics.ts). A phase that is simply absent from
 * that file counts as 0. When the file is missing, unreadable, or holds a
 * non-numeric total for the phase, the costs.jsonl ledger is replayed
 * instead.
 *
 * Returns 0 on any error and never returns NaN: a NaN spend would make every
 * later `spend >= cap` comparison false and silently disable the cap.
 *
 * @param phase phase name as stored in the `phase` field of each ledger row
 * @returns summed est_cost_usd for the phase (0 when nothing is recorded)
 */
export function currentPhaseSpend(phase: string): number {
  if (existsSync(PHASE_TOTALS_PATH)) {
    try {
      const data = JSON.parse(
        readFileSync(PHASE_TOTALS_PATH, 'utf8'),
      ) as PhaseTotals;
      const total = Number(data.totals?.[phase] ?? 0);
      if (Number.isFinite(total)) return total;
      // Non-numeric total: treat the rollup as corrupt and replay the ledger.
    } catch {
      // fall through to replay
    }
  }
  try {
    if (!existsSync(TELEMETRY_PATH)) return 0;
    let sum = 0;
    for (const line of readFileSync(TELEMETRY_PATH, 'utf8').split(/\r?\n/)) {
      if (line === '') continue;
      try {
        const row = JSON.parse(line) as { phase?: string; est_cost_usd?: number };
        if (row.phase !== phase) continue;
        const cost = Number(row.est_cost_usd ?? 0);
        // One malformed row must not poison the whole sum.
        if (Number.isFinite(cost)) sum += cost;
      } catch {
        // tolerant — skip malformed lines
      }
    }
    return sum;
  } catch {
    // The ledger vanished or became unreadable between the check and the read.
    return 0;
  }
}

// ── cumulative project spend (Phase 39.2 D-04) ───────────────────────────────

/**
 * Total project spend = sum of est_cost_usd across the WHOLE costs.jsonl ledger.
 *
 * Fast path: a `project-totals.json` (`{ total: number }`, written by the
 * aggregator) mirrors the WR-02 phase-totals optimization. When that file is
 * missing, unreadable, or holds a non-numeric `total`, the full ledger is
 * replayed instead. Only ever consulted when project_cap_usd > 0, so the
 * replay cost is paid only by opt-in users.
 *
 * Returns 0 on any error and never returns NaN: a NaN spend would make every
 * later comparison against the cap false.
 *
 * @returns summed est_cost_usd for the project (0 when nothing is recorded)
 */
export function currentProjectSpend(): number {
  if (existsSync(PROJECT_TOTALS_PATH)) {
    try {
      const data = JSON.parse(readFileSync(PROJECT_TOTALS_PATH, 'utf8')) as { total?: number };
      const total = Number(data.total ?? 0);
      if (Number.isFinite(total)) return total;
      // Non-numeric total: treat the rollup as corrupt and replay the ledger.
    } catch {
      // fall through to replay
    }
  }
  try {
    if (!existsSync(TELEMETRY_PATH)) return 0;
    let sum = 0;
    for (const line of readFileSync(TELEMETRY_PATH, 'utf8').split(/\r?\n/)) {
      if (line === '') continue;
      try {
        const row = JSON.parse(line) as { est_cost_usd?: number };
        const cost = Number(row.est_cost_usd ?? 0);
        // One malformed row must not poison the whole sum.
        if (Number.isFinite(cost)) sum += cost;
      } catch {
        // tolerant — skip malformed lines
      }
    }
    return sum;
  } catch {
    // The ledger vanished or became unreadable between the check and the read.
    return 0;
  }
}

// ── cycle + phase reader (STATE.md frontmatter) ─────────────────────────────

/**
 * Parse `cycle:` and `phase:` from the STATE.md leading frontmatter
 * block. Regex-based rather than YAML-parsed — STATE.md frontmatter is
 * always flat `key: value` per reference/STATE-TEMPLATE.md. When no
 * frontmatter fence is found, the whole file is searched instead.
 *
 * Each value is read from the key's own line only: the separator after the
 * colon matches spaces/tabs, not newlines, so an empty `cycle:` can no
 * longer swallow the following line as its value. Optional double quotes are
 * stripped and the value is trimmed; a missing or empty value yields
 * 'unknown'.
 *
 * @returns `{ cycle, phase }`, each 'unknown' when absent, empty, or when
 *          STATE.md is missing or unreadable. Never throws.
 */
export function readCycleAndPhase(): { cycle: string; phase: string } {
  const defaults = { cycle: 'unknown', phase: 'unknown' };
  if (!existsSync(STATE_PATH)) return defaults;
  try {
    const content = readFileSync(STATE_PATH, 'utf8');
    const fm = content.match(/^---\s*\n([\s\S]*?)\n---/);
    const body = fm?.[1] ?? content;
    const readValue = (pattern: RegExp): string => {
      const value = body.match(pattern)?.[1]?.trim() ?? '';
      return value.length > 0 ? value : 'unknown';
    };
    return {
      cycle: readValue(/^cycle:[ \t]*"?([^"\r\n]*)"?/m),
      phase: readValue(/^phase:[ \t]*"?([^"\r\n]*)"?/m),
    };
  } catch {
    return defaults;
  }
}

/**
 * Deprecated alias kept for plan-01 callers that imported the
 * phase-only function from the .js source. Returns just the `phase`
 * half of readCycleAndPhase().
 */
export function currentPhase(): string {
  const { phase } = readCycleAndPhase();
  return phase;
}

// ── cache short-circuit (D-05) ──────────────────────────────────────────────

/**
 * Look up a cached result for `agent:inputHash` in the cache manifest.
 *
 * Returns null on miss, stale (past TTL), malformed entry, or any
 * read/parse error. An entry is malformed when its `ts_unix` is not a finite
 * number or it has no `result`. Such entries used to produce a NaN age,
 * which compares false against the TTL and was therefore served as fresh.
 *
 * @param agent     agent name (first half of the manifest key)
 * @param inputHash input hash (second half of the manifest key)
 * @returns the cached `result`, or null when there is no usable entry
 */
export function cacheLookup(agent: string, inputHash: string): unknown {
  if (!existsSync(MANIFEST_PATH)) return null;
  try {
    const manifest = JSON.parse(
      readFileSync(MANIFEST_PATH, 'utf8'),
    ) as CacheManifest;
    const entry = manifest.entries?.[`${agent}:${inputHash}`];
    if (entry === undefined || entry === null) return null;
    const writtenAt = entry.ts_unix;
    if (typeof writtenAt !== 'number' || !Number.isFinite(writtenAt)) return null;
    const ttl = manifest.ttl_seconds ?? 3600;
    const age = Date.now() / 1000 - writtenAt;
    // Written as a negated `<=` so a NaN TTL also counts as "not fresh".
    if (!(age <= ttl)) return null;
    return entry.result ?? null;
  } catch {
    return null;
  }
}

// ── tier resolution (D-04) ──────────────────────────────────────────────────

/**
 * Resolve the tier for an agent (D-04). Precedence: a per-agent override,
 * then the agent's own default tier, then 'sonnet'.
 *
 * The override is honored only when it is an OWN property of `overrides`
 * and a string. A bare index lookup would also return inherited
 * `Object.prototype` members (e.g. for an agent named "constructor") and
 * non-string JSON values, neither of which is a tier.
 *
 * @param agent            agent name used as the override key
 * @param agentDefaultTier the agent's declared default tier, if any
 * @param overrides        per-agent tier overrides, if any
 * @returns the tier name to use
 */
export function resolveTier(
  agent: string,
  agentDefaultTier: string | undefined,
  overrides: Record<string, string> | undefined,
): string {
  if (
    overrides !== undefined &&
    overrides !== null &&
    Object.prototype.hasOwnProperty.call(overrides, agent)
  ) {
    const override: unknown = overrides[agent];
    if (typeof override === 'string') return override;
  }
  return agentDefaultTier ?? 'sonnet';
}

// ── detached aggregator ─────────────────────────────────────────────────────

/**
 * Fire-and-forget: spawn the aggregator as a detached child. Failures
 * here MUST NOT break the hook — silently swallow everything. Uses the
 * .ts entrypoint via --experimental-strip-types since Plan 20-00.
 *
 * Two failure channels are covered: synchronous throws (the try/catch) and
 * asynchronous launch failures, which Node reports through the child's
 * 'error' event rather than by throwing.
 */
function spawnAggregator(): void {
  try {
    // Opt-out: when GDD_NO_AGGREGATOR is set (truthy), skip the detached
    // child entirely. Production leaves this unset so the rollups stay
    // current; tests that scaffold a throwaway temp cwd set it so the
    // fire-and-forget child doesn't hold a handle on the dir they delete
    // immediately after (a Windows rmSync EPERM race surfaced once the C3
    // fix made this spawn actually resolve the script). No effect on the
    // production code path.
    const optOut = process.env['GDD_NO_AGGREGATOR'];
    if (typeof optOut === 'string' && optOut !== '' && optOut !== '0' && optOut !== 'false') {
      return;
    }
    // C3 fix: resolve the aggregator script relative to THIS hook file's
    // location (the plugin's own tree), not process.cwd(). When an installed
    // user runs from their project root, cwd is NOT the plugin repo, so
    // `join(process.cwd(), 'scripts', ...)` never exists and the aggregator
    // silently never runs — leaving phase-totals.json unbuilt and forcing a
    // full costs.jsonl re-parse on every spawn. Anchor on the hook file via
    // the same resolveHookPath() idiom used for createRequire above
    // (hooks/budget-enforcer.ts → ../scripts/aggregate-agent-metrics.ts).
    const aggregatorPath = resolve(
      dirname(resolveHookPath()),
      '..',
      'scripts',
      'aggregate-agent-metrics.ts',
    );
    if (!existsSync(aggregatorPath)) return;
    // IN-02: minimal env; aggregator reads only filesystem artifacts.
    const childEnv: NodeJS.ProcessEnv = {};
    if (typeof process.env['PATH'] === 'string') {
      childEnv['PATH'] = process.env['PATH'];
    }
    const child = spawn(
      'node',
      ['--experimental-strip-types', aggregatorPath],
      {
        cwd: process.cwd(),
        detached: true,
        stdio: 'ignore',
        env: childEnv,
      },
    );
    // A failed launch (e.g. ENOENT because `node` is not on the minimal PATH)
    // is delivered later as an 'error' event, outside this try/catch. With no
    // listener that event is rethrown as an uncaught exception and would take
    // the hook process down, so install a no-op handler.
    child.on('error', () => {
      // Aggregator failures are non-fatal.
    });
    child.unref();
  } catch {
    // Aggregator failures are non-fatal.
  }
}

// ── OPT-09 locked-schema telemetry row builder ──────────────────────────────

/**
 * One fully-populated OPT-09 row as written to costs.jsonl. The first nine
 * fields are always present; the trailing four are emitted only when the
 * caller set them.
 */
interface TelemetryRow {
  ts: string;
  agent: string;
  tier: string;
  tokens_in: number;
  tokens_out: number;
  cache_hit: boolean;
  est_cost_usd: number;
  cycle: string;
  phase: string;
  tier_downgraded?: boolean;
  enforcement_mode?: string;
  lazy_skipped?: boolean;
  block_reason?: string;
}

/**
 * Expand a partial row into a complete one.
 *
 * Missing required fields get defaults ('unknown' / 0 / false / now), and
 * values are coerced to the row's declared primitive types. Cycle and phase
 * come from the partial itself, else from the pre-read `_cyclePhase` pair,
 * else from STATE.md. Property order is fixed, so serialized rows keep a
 * stable key order.
 */
function buildTelemetryRow(partial: TelemetryRowPartial): TelemetryRow {
  const fromState = partial._cyclePhase ?? readCycleAndPhase();
  const base: TelemetryRow = {
    ts: partial.ts ?? new Date().toISOString(),
    agent: String(partial.agent ?? 'unknown'),
    tier: String(partial.tier ?? 'unknown'),
    tokens_in: Number(partial.tokens_in ?? 0),
    tokens_out: Number(partial.tokens_out ?? 0),
    cache_hit: Boolean(partial.cache_hit),
    est_cost_usd: Number(partial.est_cost_usd ?? 0),
    cycle: partial.cycle ?? fromState.cycle,
    phase: partial.phase ?? fromState.phase,
  };
  // Optional flags are appended in a fixed order, and only when provided.
  return {
    ...base,
    ...(partial.tier_downgraded !== undefined
      ? { tier_downgraded: Boolean(partial.tier_downgraded) }
      : {}),
    ...(partial.enforcement_mode !== undefined
      ? { enforcement_mode: String(partial.enforcement_mode) }
      : {}),
    ...(partial.lazy_skipped !== undefined
      ? { lazy_skipped: Boolean(partial.lazy_skipped) }
      : {}),
    ...(partial.block_reason !== undefined
      ? { block_reason: String(partial.block_reason) }
      : {}),
  };
}

/**
 * Append one OPT-09 row to costs.jsonl, creating the telemetry directory
 * first when it does not exist. After a successful append, a detached
 * aggregator child is fired so the per-agent + per-phase rollups stay
 * current. Fail-open — telemetry write errors MUST NEVER block the hook,
 * so every error is swallowed.
 */
export function writeTelemetry(partial: TelemetryRowPartial): void {
  try {
    const telemetryDir = dirname(TELEMETRY_PATH);
    if (!existsSync(telemetryDir)) {
      mkdirSync(telemetryDir, { recursive: true });
    }
    const line = `${JSON.stringify(buildTelemetryRow(partial))}\n`;
    appendFileSync(TELEMETRY_PATH, line, 'utf8');
    spawnAggregator();
  } catch {
    // Fail open.
  }
}

// ── event-stream decision emitter ───────────────────────────────────────────

/**
 * Emit one hook.fired event per hook decision. Uses the pre-registered
 * HookFiredEvent subtype from sdk/event-stream/types.ts and
 * stamps sessionId from the process PID + boot time — same scheme as
 * sdk/mcp/gdd-state/tools/shared.ts but inlined here so the
 * hook stays dependency-light.
 */
// Session id memo: computed on first use, then reused for the process lifetime.
let CACHED_SESSION_ID: string | null = null;
/**
 * Session id stamped on every event this process emits. Built once as
 * `gdd-hook-<ISO timestamp with ':' and '.' replaced by '-'>-<pid>`.
 */
function getSessionId(): string {
  if (CACHED_SESSION_ID !== null) return CACHED_SESSION_ID;
  const stamp = new Date().toISOString().replace(/[:.]/g, '-');
  CACHED_SESSION_ID = `gdd-hook-${stamp}-${process.pid}`;
  return CACHED_SESSION_ID;
}

/**
 * Append one `hook.fired` event for this hook to the event stream.
 *
 * @param decision - the decision tag recorded in the event payload.
 * @param cycle - optional cycle id; left off the envelope when it is
 *   undefined or the literal 'unknown'.
 */
function emitHookFired(decision: HookDecision, cycle?: string): void {
  // Only carry a cycle key when there is a real cycle to report.
  const cycleField: { cycle?: string } = {};
  if (cycle !== undefined && cycle !== 'unknown') {
    cycleField.cycle = cycle;
  }
  const hookEvent: HookFiredEvent = {
    type: 'hook.fired',
    timestamp: new Date().toISOString(),
    sessionId: getSessionId(),
    ...cycleField,
    payload: { hook: 'budget-enforcer', decision },
  };
  try {
    appendEvent(hookEvent);
  } catch {
    // Fail open — event-stream errors must never block the hook.
  }
}

/**
 * Plan 26-05 / D-08: append a `cost_recorded` event carrying the runtime
 * tag, concrete model, tier, token counts, and computed cost, so the
 * downstream cost-aggregator can roll spend up per-runtime AND per-tier
 * (reflector class-specific cost analysis, Phase 26-06).
 *
 * The envelope follows the BaseEvent shape with a free-form `type`
 * (Phase 22 events.jsonl contract). Like every other emit in this hook
 * it is fail-open — a telemetry failure never blocks the spawn.
 *
 * @param payload - cost fields copied one by one into the event payload.
 * @param cycle - optional cycle id; omitted from the envelope when it is
 *   undefined or 'unknown'.
 */
function emitCostRecorded(
  payload: {
    runtime: string;
    agent: string;
    model_id: string | null;
    tier: string | null;
    tokens_in: number;
    tokens_out: number;
    cost_usd: number | null;
    // Plan 33.6-03 SC#6 — optional resolution provider ("openrouter" when the
    // OpenRouter adapter resolved the model). Additive/back-compat: omitted
    // from the on-disk row when absent, so the legacy cost_recorded shape is
    // preserved for every native-resolution + pre-33.6 spawn.
    provider?: string;
  },
  cycle?: string,
): void {
  const cycleField: { cycle?: string } = {};
  if (cycle !== undefined && cycle !== 'unknown') {
    cycleField.cycle = cycle;
  }

  // Omit-when-absent (mirrors the .cjs buildCostEventPayload discipline):
  // the provider key only appears for a non-empty string.
  const providerField: { provider?: string } = {};
  if (typeof payload.provider === 'string' && payload.provider.length > 0) {
    providerField.provider = payload.provider;
  }

  const { runtime, agent, model_id, tier, tokens_in, tokens_out, cost_usd } = payload;
  const costEvent = {
    type: 'cost_recorded',
    timestamp: new Date().toISOString(),
    sessionId: getSessionId(),
    ...cycleField,
    payload: {
      runtime,
      agent,
      model_id,
      tier,
      tokens_in,
      tokens_out,
      cost_usd,
      ...providerField,
    },
  };

  try {
    // BaseEvent shape; cost_recorded is a free-form subtype (the
    // Phase 22 events stream is structurally validated, not enum-locked).
    appendEvent(costEvent as unknown as HookFiredEvent);
  } catch {
    // Fail open.
  }
}

/**
 * Phase 59-9: append a `cost_lookup_fallback` event. Called when the cost
 * backend could not table-match a model and priced it at the CONSERVATIVE
 * OPUS CEILING (or, more rarely, returned an unpriced fallback), so an
 * unknown/new model is OBSERVABLE in telemetry instead of being silently
 * mis-billed (or billed as $0).
 *
 * Shares the BaseEvent envelope + appendEvent path with the other
 * emitters. Fail-open — never throws, never blocks the spawn.
 *
 * @param payload - fallback details; forwarded unchanged as the event payload.
 * @param cycle - optional cycle id; omitted from the envelope when it is
 *   undefined or 'unknown'.
 */
function emitCostLookupFallback(
  payload: {
    runtime: string;
    agent: string;
    model_id: string | null;
    tier: string | null;
    reason: string | null;
    cost_usd: number | null;
    cost_estimated: boolean;
  },
  cycle?: string,
): void {
  const cycleField: { cycle?: string } = {};
  if (cycle !== undefined && cycle !== 'unknown') {
    cycleField.cycle = cycle;
  }
  const fallbackEvent = {
    type: 'cost_lookup_fallback',
    timestamp: new Date().toISOString(),
    sessionId: getSessionId(),
    ...cycleField,
    payload,
  };
  try {
    appendEvent(fallbackEvent as unknown as HookFiredEvent);
  } catch {
    // Fail open.
  }
}

/**
 * Plan 27.5-02 / D-03: append a `bandit.tier_selected` event whenever the
 * bandit was consulted, whether or not its pick replaced the prior tier.
 * The payload records the prior tier, the bandit's pick, the sampled
 * posterior (when applicable), the delegate dimension, and the runtime
 * tag, so Phase 11 reflector (27.5-04) and `/gdd:bandit-status` (27.5-05)
 * can reconstruct decision history without re-reading the posterior file.
 *
 * Fail-open like every other emit in this hook.
 *
 * @param payload - bandit decision details; forwarded unchanged as the
 *   event payload.
 * @param cycle - optional cycle id; omitted from the envelope when it is
 *   undefined or 'unknown'.
 */
function emitBanditTierSelected(
  payload: {
    agent: string;
    bin: string;
    prior_tier: string;
    selected_tier: 'haiku' | 'sonnet' | 'opus';
    source:
      | 'frontmatter'
      | 'tier_override_bypass'
      | 'bandit_pull'
      | 'bandit_pull_with_delegate';
    delegate: string;
    adaptive_mode: 'static' | 'hedge' | 'full';
    samples?: unknown;
    runtime: string;
    model_id: string | null;
    reason?: string;
  },
  cycle?: string,
): void {
  const cycleField: { cycle?: string } = {};
  if (cycle !== undefined && cycle !== 'unknown') {
    cycleField.cycle = cycle;
  }
  const banditEvent = {
    type: 'bandit.tier_selected',
    timestamp: new Date().toISOString(),
    sessionId: getSessionId(),
    ...cycleField,
    payload,
  };
  try {
    appendEvent(banditEvent as unknown as HookFiredEvent);
  } catch {
    // Fail open.
  }
}

// ── main ────────────────────────────────────────────────────────────────────

/**
 * Drain process.stdin line by line and return everything read, with each
 * line terminated by a single '\n'.
 */
async function readStdin(): Promise<string> {
  const lineReader = createInterface({ input: process.stdin });
  const terminatedLines: string[] = [];
  for await (const line of lineReader) {
    terminatedLines.push(line + '\n');
  }
  return terminatedLines.join('');
}

/**
 * Hook entrypoint: reads one PreToolUse JSON payload from stdin, decides
 * whether the Agent/Task spawn may proceed, and writes exactly one JSON
 * response to stdout for every payload it handles.
 *
 * Exits the process with code 0 and no output when stdin is not valid
 * JSON, is valid JSON but not an object, or names a tool other than
 * 'Agent' / 'Task'.
 *
 * Decision order (first match wins for the short-circuit branches):
 *   A. `lazy_skipped === true`      → allow, decision 'lazy'
 *      `complexity_class === 'S'`   → allow without enforcement, 'allow'
 *   B. cache hit for `_input_hash`  → deny with the cached answer, 'cache'
 *      rate-guard exhausted         → stop, 'rate-limited'
 *      project cap                  → warn on stderr, or stop ('block')
 *   C. per-spawn cap (enforce mode) → stop, 'block'
 *   D. per-phase cap (enforce mode) → stop, 'block'
 *   E. otherwise allow, after applying the 80% downgrade, tier_overrides,
 *      bandit and OpenRouter resolution; decision is one of
 *      'downgrade' | 'warn' | 'log' | 'allow'.
 *
 * Each branch writes one costs.jsonl telemetry row and emits one
 * hook.fired event before responding.
 *
 * @returns a promise that resolves once the response has been written.
 */
export async function main(): Promise<void> {
  const inputData = await readStdin();

  let parsed: HookStdin;
  try {
    parsed = JSON.parse(inputData) as HookStdin;
  } catch {
    process.exit(0);
  }
  // Valid JSON that is not an object (`null`, a number, a string) carries no
  // tool_name. Treat it like unparseable input rather than letting the
  // property read below throw a TypeError.
  if (parsed === null || typeof parsed !== 'object') process.exit(0);

  if (parsed.tool_name !== 'Agent' && parsed.tool_name !== 'Task') process.exit(0);

  const toolInput: ToolInput = parsed.tool_input ?? {};
  const agent =
    typeof toolInput.subagent_type === 'string' && toolInput.subagent_type.length > 0
      ? toolInput.subagent_type
      : typeof toolInput.agent === 'string' && toolInput.agent.length > 0
        ? toolInput.agent
        : 'unknown';
  const inputHash =
    typeof toolInput._input_hash === 'string' ? toolInput._input_hash : null;

  // Phase 25 / D-05: extract complexity_class from router decision.
  // Absent payload → legacy per_task_cap behavior (no regression).
  // Present payload with class === 'S' → skip enforcement entirely
  // (defensive: the typical S path is upstream short-circuit where
  // router never ran and this hook still applies legacy caps; an
  // explicit S signal here means a caller bypassed the upstream skip
  // and is asking us to honor the class).
  const routerDecision: RouterDecision | undefined =
    toolInput.context?.router_decision !== undefined &&
    typeof toolInput.context.router_decision === 'object' &&
    toolInput.context.router_decision !== null
      ? toolInput.context.router_decision
      : undefined;
  const complexityClass: ComplexityClass | undefined =
    routerDecision?.complexity_class !== undefined &&
    (['S', 'M', 'L', 'XL'] as const).includes(
      routerDecision.complexity_class as ComplexityClass,
    )
      ? (routerDecision.complexity_class as ComplexityClass)
      : undefined;

  const { cycle, phase } = readCycleAndPhase();
  const cyclePhase = { cycle, phase };

  // Branch A: lazy-gate passthrough.
  if (toolInput.lazy_skipped === true) {
    writeTelemetry({
      agent,
      tier: 'gate',
      tokens_in: 0,
      tokens_out: 0,
      cache_hit: false,
      est_cost_usd: 0,
      lazy_skipped: true,
      _cyclePhase: cyclePhase,
    });
    emitHookFired('lazy', cycle);
    const response: ToolOutput = { continue: true, suppressOutput: true };
    process.stdout.write(JSON.stringify(response));
    return;
  }

  const budget = loadBudget();

  // Phase 25 / D-05: explicit S-class short-circuit. The typical S path
  // skips the router entirely and this hook never runs at all (the
  // command's SKILL.md does the deterministic skip upstream). When we
  // DO see complexity_class === 'S' in the payload it means a caller
  // routed an S-class command through the hook anyway — honor the
  // class by skipping enforcement (no cap check, no downgrade) but
  // still write a zero-cost telemetry row + emit an 'allow' event so
  // observability stays consistent.
  if (complexityClass === 'S') {
    writeTelemetry({
      agent,
      tier:
        toolInput._tier_override ??
        toolInput._default_tier ??
        'haiku',
      tokens_in: Number(toolInput._tokens_in_est ?? 0),
      tokens_out: Number(toolInput._tokens_out_est ?? 0),
      cache_hit: false,
      est_cost_usd: Number(toolInput._est_cost_usd ?? 0),
      enforcement_mode: budget.enforcement_mode,
      _cyclePhase: cyclePhase,
    });
    emitHookFired('allow', cycle);
    const response: ToolOutput = {
      continue: true,
      suppressOutput: true,
      modified_tool_input: toolInput,
      hookSpecificOutput: { hookEventName: 'PreToolUse', updatedInput: toolInput },
    };
    process.stdout.write(JSON.stringify(response));
    return;
  }

  // Branch B: cache short-circuit (D-05).
  if (inputHash !== null) {
    const cached = cacheLookup(agent, inputHash);
    if (cached !== null) {
      // Plan 20-14: refund one iteration-budget unit — cached answers did
      // no real work and shouldn't count against the fix-loop ceiling.
      // The refund call is fire-and-forget; failures are swallowed so
      // telemetry/iteration-budget errors never block the hook. We also
      // silence the auto-init path (refund on a fresh state file is a
      // no-op at full budget, which is what we want).
      try {
        void iterationBudget.refund(1).catch(() => { /* fail open */ });
      } catch {
        // fail open
      }
      writeTelemetry({
        agent,
        tier: 'cache',
        tokens_in: 0,
        tokens_out: 0,
        cache_hit: true,
        est_cost_usd: 0,
        _cyclePhase: cyclePhase,
      });
      emitHookFired('cache', cycle);
      const response: ToolOutput = {
        continue: true,
        suppressOutput: false,
        message: `gdd-budget-enforcer: SkippedCached — returning cached result for ${agent}:${inputHash}`,
        hookSpecificOutput: {
          hookEventName: 'PreToolUse',
          permissionDecision: 'deny',
          permissionDecisionReason: `SkippedCached — a prior identical spawn already produced a result. Reuse it instead of re-spawning. Cached: ${JSON.stringify(cached).slice(0, 2000)}`,
        },
      };
      process.stdout.write(JSON.stringify(response));
      return;
    }
  }

  // Plan 20-14: rate-guard short-circuit. Inserted AFTER the cache
  // check (cached answers bypass every network call so rate-limits are
  // irrelevant for them) and BEFORE the budget cap so a rate-limited
  // provider surfaces a clean "wait N seconds" message instead of a
  // "cap reached" one. rate-guard state is per-provider — we key on
  // 'anthropic' because every Agent spawn in this project goes through
  // the Anthropic API; future multi-provider routing would branch here
  // on toolInput._provider.
  const rateState = rateGuard.remaining('anthropic');
  if (rateState !== null && rateState.remaining <= 0) {
    // Date.parse yields NaN for an unparseable resetAt, and Math.max(0, NaN)
    // is NaN, which would surface as "retry in NaNs". Fall back to 0 seconds
    // when the reset timestamp cannot be parsed.
    const resetAtMs = Date.parse(rateState.resetAt);
    const waitSeconds = Number.isFinite(resetAtMs)
      ? Math.max(0, Math.ceil((resetAtMs - Date.now()) / 1000))
      : 0;
    writeTelemetry({
      agent,
      tier:
        toolInput._tier_override ??
        toolInput._default_tier ??
        'sonnet',
      tokens_in: Number(toolInput._tokens_in_est ?? 0),
      tokens_out: Number(toolInput._tokens_out_est ?? 0),
      cache_hit: false,
      est_cost_usd: Number(toolInput._est_cost_usd ?? 0),
      block_reason: 'rate_limited',
      _cyclePhase: cyclePhase,
    });
    emitHookFired('rate-limited', cycle);
    const response: ToolOutput = {
      continue: false,
      suppressOutput: false,
      stopReason: `gdd-budget-enforcer: rate-limited on anthropic, retry in ${waitSeconds}s (resetAt=${rateState.resetAt})`,
    };
    process.stdout.write(JSON.stringify(response));
    return;
  }

  const estCost = Number(toolInput._est_cost_usd ?? 0);
  const phaseSpend = currentPhaseSpend(phase);

  // ── Phase 39.2 D-04: project-level cap ─────────────────────────────────────
  //
  // Independent of enforcement_mode: the 50%/80% warnings + the 100% halt are
  // governed by project_cap_enforcement_mode (falling back to enforcement_mode).
  // No-op when project_cap_usd <= 0 (the opt-in default), so existing users see
  // zero change. Checked here, before the per-task/per-phase branches, so a
  // project-level breach halts the NEXT spawn regardless of the per-scope caps —
  // the graceful halt (the current stage's in-flight spawns already ran).
  if (budget.project_cap_usd > 0) {
    const projectSpend = currentProjectSpend();
    const projClass = projectCap.classifyProjectBudget(
      projectSpend + estCost,
      budget.project_cap_usd,
    );
    const projMode = budget.project_cap_enforcement_mode ?? budget.enforcement_mode;
    if (projClass.level === 'warn-50' || projClass.level === 'warn-80') {
      try {
        appendEvent({
          type: 'project_cap_warning',
          timestamp: new Date().toISOString(),
          sessionId: getSessionId(),
          ...(cycle !== undefined && cycle !== 'unknown' ? { cycle } : {}),
          payload: {
            pct: projClass.pct,
            spend: projClass.spend,
            cap: projClass.cap,
            level: projClass.level,
          },
        } as unknown as HookFiredEvent);
      } catch {
        // fail-open — event-stream errors never block the hook.
      }
      process.stderr.write(`gdd-budget-enforcer WARN: ${projectCap.capMessage(projClass)}\n`);
    } else if (projClass.level === 'halt') {
      try {
        appendEvent({
          type: 'project_cap_halt',
          timestamp: new Date().toISOString(),
          sessionId: getSessionId(),
          ...(cycle !== undefined && cycle !== 'unknown' ? { cycle } : {}),
          payload: {
            pct: projClass.pct,
            spend: projClass.spend,
            cap: projClass.cap,
            enforcementMode: projMode,
          },
        } as unknown as HookFiredEvent);
      } catch {
        // fail-open.
      }
      if (projectCap.shouldHalt(projClass, projMode)) {
        writeTelemetry({
          agent,
          tier: toolInput._tier_override ?? toolInput._default_tier ?? 'sonnet',
          tokens_in: Number(toolInput._tokens_in_est ?? 0),
          tokens_out: Number(toolInput._tokens_out_est ?? 0),
          cache_hit: false,
          est_cost_usd: estCost,
          enforcement_mode: projMode,
          block_reason: 'project_cap',
          _cyclePhase: cyclePhase,
        });
        emitHookFired('block', cycle);
        const response: ToolOutput = {
          continue: false,
          suppressOutput: false,
          stopReason: `Project budget cap reached: $${projClass.spend.toFixed(2)} of $${budget.project_cap_usd.toFixed(2)} (${projClass.pct.toFixed(0)}%). Raise project_cap_usd in .design/budget.json, or set project_cap_enforcement_mode to "warn" to keep going. (Graceful halt — the current stage's earlier spawns already completed; this blocks the next one.)`,
        };
        process.stdout.write(JSON.stringify(response));
        return;
      }
      // warn / log mode: surface the 100% breach but allow the spawn.
      process.stderr.write(`gdd-budget-enforcer WARN: ${projectCap.capMessage(projClass)}\n`);
    }
  }

  // Phase 25 / D-05: per-spawn cap is class-specific when
  // complexity_class is present and class_caps_usd[class] is defined.
  // Falls back to per_task_cap_usd for backwards compatibility — when
  // no router decision is supplied, behavior is identical to pre-25.
  const perSpawnCap = resolvePerSpawnCap(budget, complexityClass);

  // ── Phase 59.5 P1: BYOK/unverified provenance guard ────────────────────────
  //
  // Resolve the runtime id (router-supplied `runtime`, else env detection,
  // else 'claude', same precedence the cost-recording block uses below) so we
  // can consult its runtime-models provenance `status` BEFORE the hard-cap
  // branches. When the runtime row is byok/unverified the resolved per-runtime
  // model is best-effort (the user's actual provider may diverge from the
  // Anthropic-default fill), so an estimated cost computed against it must NOT
  // hard-block the user. We degrade enforce-mode to advisory ('warn') for THIS
  // spawn only: the per-spawn + per-phase 100% caps stop blocking and surface a
  // stderr warning instead, while the 80% auto-downgrade still applies (a tier
  // downgrade is non-blocking and strictly cheaper, so it is safe to keep).
  // Verified runtimes (claude/codex/gemini/qwen) are unaffected (full hard
  // enforcement). The project-level cap above is intentionally NOT degraded: it
  // is governed by total ledger spend, not a per-runtime resolved model.
  //
  // NOTE(review): as written, the 80% auto-downgrade sits inside the
  // `effectiveEnforcementMode === 'enforce'` branch below, so a spawn that was
  // degraded to 'warn' does not reach it. That contradicts the "still applies"
  // statement above — confirm which one is intended before changing policy.
  const guardRuntimeId =
    (typeof routerDecision?.runtime === 'string' && routerDecision.runtime.length > 0
      ? routerDecision.runtime
      : runtimeDetect.detect()) ?? 'claude';
  const runtimeIsUnverified = isUnverifiedRuntime(guardRuntimeId);
  const effectiveEnforcementMode: ResolvedBudget['enforcement_mode'] =
    budget.enforcement_mode === 'enforce' && runtimeIsUnverified
      ? 'warn'
      : budget.enforcement_mode;
  if (budget.enforcement_mode === 'enforce' && runtimeIsUnverified) {
    process.stderr.write(
      `gdd-budget-enforcer WARN: runtime '${guardRuntimeId}' has provenance status ` +
        `'${runtimeStatus(guardRuntimeId)}' (BYOK/unverified tier→model row); ` +
        `hard budget caps degraded to advisory for this spawn so an unverified ` +
        `cost estimate never hard-blocks you.\n`,
    );
  }

  if (effectiveEnforcementMode === 'enforce') {
    // Branch C: 100% per-spawn cap hard block (class-specific or per_task).
    if (estCost >= perSpawnCap) {
      writeTelemetry({
        agent,
        tier:
          toolInput._tier_override ??
          toolInput._default_tier ??
          'sonnet',
        tokens_in: Number(toolInput._tokens_in_est ?? 0),
        tokens_out: Number(toolInput._tokens_out_est ?? 0),
        cache_hit: false,
        est_cost_usd: estCost,
        enforcement_mode: budget.enforcement_mode,
        block_reason: 'per_task_cap',
        _cyclePhase: cyclePhase,
      });
      emitHookFired('block', cycle);
      const capLabel =
        complexityClass !== undefined && perSpawnCap !== budget.per_task_cap_usd
          ? `class_caps_usd.${complexityClass}`
          : 'per-task';
      const response: ToolOutput = {
        continue: false,
        suppressOutput: false,
        stopReason: `Budget cap reached for ${capLabel}. Estimated: $${estCost.toFixed(4)}, cap: $${perSpawnCap.toFixed(2)}. Raise cap in .design/budget.json or retry after next task.`,
      };
      process.stdout.write(JSON.stringify(response));
      return;
    }
    // Branch D: 100% per_phase cap hard block.
    if (phaseSpend + estCost >= budget.per_phase_cap_usd) {
      writeTelemetry({
        agent,
        tier:
          toolInput._tier_override ??
          toolInput._default_tier ??
          'sonnet',
        tokens_in: Number(toolInput._tokens_in_est ?? 0),
        tokens_out: Number(toolInput._tokens_out_est ?? 0),
        cache_hit: false,
        est_cost_usd: estCost,
        enforcement_mode: budget.enforcement_mode,
        block_reason: 'per_phase_cap',
        _cyclePhase: cyclePhase,
      });
      emitHookFired('block', cycle);
      const response: ToolOutput = {
        continue: false,
        suppressOutput: false,
        stopReason: `Budget cap reached for per-phase (${phase}). Cumulative: $${(phaseSpend + estCost).toFixed(4)}, cap: $${budget.per_phase_cap_usd.toFixed(2)}. Raise cap in .design/budget.json or retry after next phase.`,
      };
      process.stdout.write(JSON.stringify(response));
      return;
    }
    // 80% soft-threshold downgrade (D-03): task-scoped, against the
    // resolved per-spawn cap so class-specific caps participate.
    if (
      budget.auto_downgrade_on_cap &&
      estCost >= 0.8 * perSpawnCap
    ) {
      toolInput._tier_override = 'haiku';
      toolInput._tier_downgraded = true;
    }
  } else if (effectiveEnforcementMode === 'warn') {
    if (estCost >= perSpawnCap) {
      process.stderr.write(
        `gdd-budget-enforcer WARN: per-spawn cap will be exceeded ($${estCost.toFixed(4)} >= $${perSpawnCap})\n`,
      );
    }
    // Phase 59.5 P1: when enforce was degraded to advisory for a byok/unverified
    // runtime, also surface the per-phase breach that the hard branch above
    // would otherwise have reported (it is skipped for unverified runtimes).
    if (
      budget.enforcement_mode === 'enforce' &&
      phaseSpend + estCost >= budget.per_phase_cap_usd
    ) {
      process.stderr.write(
        `gdd-budget-enforcer WARN: per-phase cap will be exceeded for ${phase} ` +
          `($${(phaseSpend + estCost).toFixed(4)} >= $${budget.per_phase_cap_usd.toFixed(2)})\n`,
      );
    }
  }
  // enforcement_mode === 'log': telemetry only.

  // D-04: tier_overrides rewrite.
  if (budget.tier_overrides[agent] !== undefined) {
    toolInput._tier_override = budget.tier_overrides[agent];
  }

  // Plan 26-05 / D-07 + D-08: resolved_models consumer path. When the
  // router decision payload carries a concrete model ID for this agent
  // under `resolved_models`, look up the cost in the per-runtime price
  // table by model ID. Otherwise fall back to the legacy tier-name
  // lookup (which still resolves through claude.md as the default
  // runtime — back-compat with v1.25.x callers).
  const resolvedModelId = budgetBackend.modelFromResolved(
    routerDecision?.resolved_models,
    agent,
  );
  const resolvedTier =
    toolInput._tier_override ?? toolInput._default_tier ?? 'sonnet';
  // Runtime tag: prefer the router's explicit `runtime` (D-08) field;
  // fall back to env-var detection; default to 'claude' since the .ts
  // hook itself only runs inside Claude Code. Reuse the id already resolved
  // for the Phase 59.5 P1 provenance guard above (single resolution source).
  const runtimeId = guardRuntimeId;

  // ── Plan 27.5-02 — bandit consultation ────────────────────────────────────
  //
  // D-01 / D-02 / D-03 / D-07: per-spawn after `resolved_models` is computed,
  // before the SDK call. Skip conditions (all silent — no event, no override):
  //   - adaptive_mode !== 'full' (D-07)
  //   - toolInput._tier_downgraded === true (80% downgrade fired upstream —
  //     bandit must not undo budget)
  //
  // When bandit fires, override resolved_models[agent] through tier-resolver
  // so downstream consumers see the bandit's pick as the actual model.
  // model_tier_overrides[agent] is preserved (D-03 back-compat).
  const currentMode = adaptiveMode.getMode({ quiet: true });
  const priorTier = resolvedTier; // captured before bandit override
  // Mutable references for the cost/telemetry path; bandit may rewrite.
  let effectiveTier: string = resolvedTier;
  let effectiveModelId: string | null = resolvedModelId;

  if (currentMode === 'full' && toolInput._tier_downgraded !== true) {
    // Bin defaults to 'medium' — budget-enforcer doesn't currently surface
    // glob_count; future plan can wire it. Per-agent bandit arms still
    // converge correctly under a fixed bin (Phase 23.5 D-08). The function
    // call below makes the integration point explicit for future plans.
    void banditRouterCore.binForGlobCount(0);
    const bin = 'medium';

    // Source the frontmatter view from the in-flight toolInput. The hook
    // reads frontmatter indirectly: _default_tier carries the agent's
    // declared default-tier, _tier_override (if any) carries an explicit
    // override the router emitted. For bandit purposes, _tier_override
    // means "operator has already taken control" — the shim returns
    // source='tier_override_bypass' (no posterior side effect).
    const agentFrontmatter: {
      tier_override?: string;
      default_tier?: string;
    } = {};
    if (
      typeof toolInput._tier_override === 'string' &&
      toolInput._tier_override.length > 0
    ) {
      agentFrontmatter.tier_override = toolInput._tier_override;
    }
    if (
      typeof toolInput._default_tier === 'string' &&
      toolInput._default_tier.length > 0
    ) {
      agentFrontmatter.default_tier = toolInput._default_tier;
    }

    // Delegate dimension: budget-enforcer doesn't currently see the
    // agent's delegate_to: frontmatter (session-runner does). For 27.5-02
    // we always consult the local-call slice (delegate='none'); 27.5-03
    // wires delegate=<peer> for the recordOutcome side.
    const banditDelegate = banditIntegration.DELEGATE_NONE;

    let banditResult: ReturnType<
      BanditIntegrationModule['consultBandit']
    > | null = null;
    try {
      banditResult = banditIntegration.consultBandit({
        agent,
        bin,
        delegate: banditDelegate,
        agentFrontmatter,
        adaptiveMode: currentMode,
      });
    } catch {
      // Fail open — never let a bandit error block a spawn.
    }

    if (banditResult !== null) {
      // Translate the bandit tier into a concrete model. The tier-resolver
      // emits its own fallback events (tier_resolution_fallback /
      // tier_resolution_failed) when the runtime row is incomplete, so we
      // don't need to re-emit those here.
      const banditModel = tierResolver.resolve(
        runtimeId,
        banditResult.tier,
        { silent: true },
      );

      // Apply override only when:
      //   1. bandit actually picked a different tier than priorTier
      //      (no-op write avoided)
      //   2. tier-resolver returned a non-null model (fall back to
      //      existing resolvedModelId on null)
      //   3. source is 'bandit_pull' or 'bandit_pull_with_delegate'
      //      (frontmatter/bypass paths don't override resolved_models)
      if (
        banditResult.tier !== priorTier &&
        banditModel !== null &&
        (banditResult.decision_log.source === 'bandit_pull' ||
          banditResult.decision_log.source === 'bandit_pull_with_delegate')
      ) {
        // Override resolved_models[agent] without touching
        // model_tier_overrides[agent] (D-03 back-compat).
        if (routerDecision !== undefined) {
          const rm = routerDecision.resolved_models ?? {};
          rm[agent] = banditModel;
          routerDecision.resolved_models = rm;
        }
        // Also stamp _tier_override on toolInput so downstream readers
        // see the bandit's pick.
        toolInput._tier_override = banditResult.tier;
        effectiveTier = banditResult.tier;
        effectiveModelId = banditModel;
      }

      // Emit one bandit.tier_selected event regardless of override outcome
      // (the event captures the decision, not the override side effect).
      emitBanditTierSelected(
        {
          agent,
          bin,
          prior_tier: priorTier,
          selected_tier: banditResult.tier,
          source: banditResult.decision_log.source,
          delegate: banditResult.decision_log.delegate ?? banditDelegate,
          adaptive_mode: banditResult.decision_log.adaptive_mode,
          samples: banditResult.decision_log.samples,
          runtime: runtimeId,
          model_id: effectiveModelId ?? resolvedModelId,
          ...(banditResult.decision_log.reason !== undefined
            ? { reason: banditResult.decision_log.reason }
            : {}),
        },
        cycle,
      );
    }
  }

  // ── Plan 33.6-03 — OpenRouter resolution consultation (SC#6, D-08, D-12) ────
  //
  // When the user opts in (`.design/config.json#openrouter_enabled: true` OR
  // `OPENROUTER_API_KEY` present), consult the OpenRouter adapter for the
  // effective tier FIRST. A non-null result routes this spawn to OpenRouter:
  // we override the model id and tag the cost row `provider: "openrouter"`. A
  // null result (no key / catalog missing-or-stale / no match) falls through to
  // the native resolution that's already in `effectiveModelId` — so the default
  // (OpenRouter disabled) path is byte-identical to pre-33.6 behavior (D-08).
  // The adapter never throws; this whole branch is also wrapped defensively.
  let costProvider: string | undefined;
  if (isOpenRouterEnabled()) {
    try {
      const openrouterModel = tierResolverOpenRouter.resolve(effectiveTier);
      if (typeof openrouterModel === 'string' && openrouterModel.length > 0) {
        effectiveModelId = openrouterModel;
        costProvider = 'openrouter';
        // Reflect the OpenRouter pick into resolved_models so downstream
        // consumers see the actual model (mirrors the bandit override above).
        if (routerDecision !== undefined) {
          const rm = routerDecision.resolved_models ?? {};
          rm[agent] = openrouterModel;
          routerDecision.resolved_models = rm;
        }
      }
    } catch {
      // Fail open — never let OpenRouter resolution block a spawn (D-08).
    }
  }

  // Compute runtime-aware cost via the shared backend. Failures return
  // null cost; we emit the event regardless so the cost-aggregator sees
  // the lookup attempt (Phase 22 events.jsonl tagging).
  const costLookup = budgetBackend.computeCost({
    model_id: effectiveModelId,
    tier: effectiveTier,
    runtime: runtimeId,
    tokens_in: Number(toolInput._tokens_in_est ?? 0),
    tokens_out: Number(toolInput._tokens_out_est ?? 0),
    cache_hit: false,
  });
  emitCostRecorded(
    {
      runtime: runtimeId,
      agent,
      model_id: effectiveModelId ?? costLookup.model,
      tier: costLookup.tier ?? effectiveTier,
      tokens_in: Number(toolInput._tokens_in_est ?? 0),
      tokens_out: Number(toolInput._tokens_out_est ?? 0),
      cost_usd: costLookup.cost_usd,
      // Plan 33.6-03 SC#6 — tag the row when OpenRouter resolved the model.
      // Omitted (undefined) on the native path → buildCostEventPayload drops it.
      ...(costProvider !== undefined ? { provider: costProvider } : {}),
    },
    cycle,
  );

  // Phase 59-9: when the cost was a CONSERVATIVE ESTIMATE (unknown/new model
  // priced at the opus ceiling) rather than a table-matched figure, emit a
  // distinct telemetry signal so an unrecognized model is OBSERVABLE rather
  // than silently mis-billed. Best-effort, never throws (fail-open).
  if (
    costLookup.cost_estimated === true ||
    (costLookup.fallback === true && costLookup.reason === 'model_not_found')
  ) {
    emitCostLookupFallback(
      {
        runtime: runtimeId,
        agent,
        model_id: effectiveModelId ?? costLookup.model,
        tier: costLookup.tier ?? effectiveTier,
        reason: costLookup.reason,
        cost_usd: costLookup.cost_usd,
        cost_estimated: costLookup.cost_estimated === true,
      },
      cycle,
    );
  }

  // Branch E: standard spawn-allowed (includes tier-downgraded path).
  writeTelemetry({
    agent,
    tier: effectiveTier,
    tokens_in: Number(toolInput._tokens_in_est ?? 0),
    tokens_out: Number(toolInput._tokens_out_est ?? 0),
    cache_hit: false,
    est_cost_usd: estCost,
    tier_downgraded: Boolean(toolInput._tier_downgraded),
    enforcement_mode: budget.enforcement_mode,
    _cyclePhase: cyclePhase,
  });

  // Decision tag for the event stream. downgrade takes precedence over
  // allow/warn/log since it's a user-visible rewrite.
  let decision: HookDecision;
  if (toolInput._tier_downgraded === true) {
    decision = 'downgrade';
  } else if (budget.enforcement_mode === 'warn') {
    decision = 'warn';
  } else if (budget.enforcement_mode === 'log') {
    decision = 'log';
  } else {
    decision = 'allow';
  }
  emitHookFired(decision, cycle);

  const response: ToolOutput = {
    continue: true,
    suppressOutput: true,
    modified_tool_input: toolInput,
    hookSpecificOutput: { hookEventName: 'PreToolUse', updatedInput: toolInput },
  };
  process.stdout.write(JSON.stringify(response));
}

// Entrypoint guard: main() is started only when this file is the script
// node was launched with (argv[1] ends in "budget-enforcer.ts"). Modules
// that merely import from this file — e.g. tests calling loadBudget()
// directly — do not trigger a hook run.
const isDirectInvocation = ((): boolean => {
  const entryScript = process.argv[1];
  if (entryScript === undefined) return false;
  return /budget-enforcer\.ts$/.test(entryScript);
})();

if (isDirectInvocation) {
  void (async (): Promise<void> => {
    try {
      await main();
    } catch (err: unknown) {
      // Report the failure on stderr but still exit 0.
      const detail = err instanceof Error ? err.message : String(err);
      process.stderr.write(`budget-enforcer hook error: ${detail}\n`);
      process.exit(0);
    }
  })();
}