"""Plan the next turn — recommend symbols/files based on query."""

import heapq
import time
from typing import Optional

from ..storage.sqlite_store import SQLiteIndexStore
from ._utils import resolve_repo
from .search_symbols import (
    _tokenize,
    _compute_bm25,
    _bm25_score,
    _compute_centrality,
)

# Confidence thresholds
_HIGH_THRESHOLD = 2.0
_MEDIUM_THRESHOLD = 0.5


def plan_turn(
    repo: str,
    query: str,
    max_recommended: int = 5,
    storage_path: Optional[str] = None,
) -> dict:
    """Plan the next turn by analyzing query against the codebase.

    Returns confidence level, recommended symbols/files, and guidance.

    Args:
        repo: Repository identifier.
        query: What the AI is looking for (task description or symbol name).
        max_recommended: Maximum number of symbols to recommend.
        storage_path: Custom storage path.

    Returns:
        Dict with:
            - confidence: "high", "medium", or "low"
            - recommended_symbols: List of {id, name, file, line, score}
            - recommended_files: List of unique file paths
            - gap_analysis: String explaining what's missing
            - max_supplementary_reads: Suggested read limit based on confidence
            - session_overlap: Files from journal that appear in recommended_files
            - _meta: {timing_ms}
    """
    start = time.perf_counter()

    # Validate query length
    if len(query) > 500:
        return {"error": f"Query too long ({len(query)} chars, max 500)"}

    try:
        owner, name = resolve_repo(repo, storage_path)
    except ValueError as e:
        return {"error": str(e)}

    store = SQLiteIndexStore(base_path=storage_path)
    index = store.load_index(owner, name)
    if not index:
        return {"error": f"Repository not indexed: {owner}/{name}"}

    # Get BM25 cache
    cache = index._bm25_cache
    if "idf" not in cache:
        cache["idf"], cache["avgdl"], cache["inverted"] = _compute_bm25(index.symbols)
        cache["centrality"] = _compute_centrality(
            index.symbols, index.imports, index.alias_map, getattr(index, "psr4_map", None)
        )
    idf = cache["idf"]
    avgdl = cache["avgdl"]
    centrality = cache["centrality"]
    inverted = cache["inverted"]

    # Tokenize query
    query_terms = _tokenize(query) or [query.lower()]
    # Guard: empty string in query_terms causes "" to match every filename
    query_terms = [t for t in query_terms if t]

    # Score symbols using inverted index
    candidate_indices: set = set()
    for term in query_terms:
        posting = inverted.get(term)
        if posting:
            candidate_indices.update(posting)

    if candidate_indices:
        candidates = [index.symbols[i] for i in sorted(candidate_indices)]
    else:
        candidates = index.symbols

    # Score and rank
    heap: list[tuple[float, dict]] = []
    max_score = 0.0
    hits = 0

    for sym in candidates:
        score = _bm25_score(sym, query_terms, idf, avgdl, centrality)
        if score <= 0:
            continue
        hits += 1
        if score > max_score:
            max_score = score

        entry = {
            "id": sym["id"],
            "name": sym["name"],
            "file": sym["file"],
            "line": sym["line"],
            "score": round(score, 3),
        }

        if len(heap) < max_recommended:
            heapq.heappush(heap, (score, entry))
        elif score > heap[0][0]:
            heapq.heapreplace(heap, (score, entry))

    # Sort by score descending
    recommended_symbols = [entry for score, entry in sorted(heap, key=lambda x: x[0], reverse=True)]

    # Determine confidence (config-driven thresholds)
    try:
        from .. import config as _cfg
        high_t = _cfg.get("plan_turn_high_threshold", _HIGH_THRESHOLD)
        med_t = _cfg.get("plan_turn_medium_threshold", _MEDIUM_THRESHOLD)
    except Exception:
        high_t, med_t = _HIGH_THRESHOLD, _MEDIUM_THRESHOLD
    if max_score >= high_t and hits >= 3:
        confidence = "high"
    elif max_score >= med_t and hits >= 1:
        confidence = "medium"
    else:
        confidence = "low"

    # Deduplicate files
    recommended_files = list({sym["file"] for sym in recommended_symbols})

    # Build gap analysis
    if confidence == "low":
        gap_analysis = (
            f"No symbols matching '{query}' found in {len(index.symbols)} indexed symbols. "
            f"This feature likely needs to be created from scratch."
        )
    elif confidence == "medium":
        gap_analysis = (
            f"Partial matches found. Related code exists but may not directly implement '{query}'."
        )
    else:
        gap_analysis = (
            f"Strong matches found. Existing implementation likely covers '{query}'."
        )

    # Max supplementary reads based on confidence
    max_supplementary_reads = {"high": 2, "medium": 5, "low": 10}[confidence]

    # Check session overlap + load journal context for sub-features
    session_overlap: list[str] = []
    journal_ctx: Optional[dict] = None
    accessed_files: set = set()
    try:
        from .session_journal import get_journal
        journal = get_journal()
        journal_ctx = journal.get_context()
        accessed_files = {f["file"] for f in journal_ctx.get("files_accessed", [])}
        session_overlap = [f for f in recommended_files if f in accessed_files]
    except Exception:
        pass

    # --- Sub-feature: Prior negative evidence check ---
    # If the journal already has a zero-result search for this exact query,
    # escalate to confidence="none" to stop the AI from re-searching.
    prior_evidence = None
    try:
        if journal_ctx is not None:
            for search in journal_ctx.get("recent_searches", []):
                if search["query"] == query and search.get("result_count", -1) == 0:
                    times = search.get("count", search.get("times_run", 1))
                    prior_evidence = {
                        "previously_searched": True,
                        "times_searched": times,
                        "recommendation": (
                            f"This exact query was already searched {times} time(s) "
                            f"with 0 results. The feature does not exist in the indexed codebase. "
                            f"Do NOT search again."
                        ),
                    }
                    confidence = "none"
                    max_supplementary_reads = 0
                    break
    except Exception:
        pass

    # --- Sub-feature: Insertion point recommendation (when confidence is low/none) ---
    insertion_candidates = None
    if confidence in ("low", "none"):
        try:
            from .pagerank import compute_pagerank
            if "pagerank" not in cache:
                pr_scores, _ = compute_pagerank(
                    index.imports or {}, index.source_files, index.alias_map
                )
                cache["pagerank"] = pr_scores
            pr_scores = cache["pagerank"]

            # Find files whose names partially match query terms
            name_matches = []
            for f in index.source_files:
                fname = f.rsplit("/", 1)[-1].lower() if "/" in f else f.lower()
                if any(t in fname for t in query_terms):
                    name_matches.append((f, pr_scores.get(f, 0.0)))

            # Fall back to top PageRank files if no name match
            candidates_for_insert = name_matches if name_matches else [
                (f, s) for f, s in sorted(pr_scores.items(), key=lambda x: x[1], reverse=True)[:20]
            ]
            candidates_for_insert.sort(key=lambda x: x[1], reverse=True)

            insertion_candidates = [
                {"file": f, "centrality_score": round(s, 4)}
                for f, s in candidates_for_insert[:3]
            ]

            if insertion_candidates:
                locations = ", ".join(
                    f"{c['file']} (centrality {c['centrality_score']})"
                    for c in insertion_candidates
                )
                gap_analysis += f" Suggested location(s): {locations}."
        except Exception:
            pass

    # --- Sub-feature: Smart budget advisor (when turn budget >60% used) ---
    budget_advisor = None
    try:
        from .turn_budget import get_turn_budget
        tb = get_turn_budget()
        if tb.is_enabled():
            pct = tb.percent_used()
            if pct > 0.6:
                if "pagerank" not in cache:
                    from .pagerank import compute_pagerank
                    pr_scores, _ = compute_pagerank(
                        index.imports or {}, index.source_files, index.alias_map
                    )
                    cache["pagerank"] = pr_scores
                pr_scores = cache.get("pagerank", {})
                already_read = accessed_files if accessed_files else set()
                unexplored = sorted(
                    [(f, pr_scores.get(f, 0.0)) for f in index.source_files if f not in already_read],
                    key=lambda x: x[1], reverse=True,
                )[:5]
                budget_advisor = {
                    "turn_budget_percent_used": round(pct * 100, 1),
                    "highest_value_unexplored": [
                        {"file": f, "centrality_score": round(s, 4)} for f, s in unexplored
                    ],
                    "recommendation": (
                        f"Budget {round(pct * 100)}% used. "
                        f"Top unexplored files by architectural importance listed above. "
                        f"Focus remaining reads on these."
                    ),
                }
    except Exception:
        pass

    elapsed = (time.perf_counter() - start) * 1000

    result: dict = {
        "confidence": confidence,
        "recommended_symbols": recommended_symbols,
        "recommended_files": recommended_files,
        "gap_analysis": gap_analysis,
        "max_supplementary_reads": max_supplementary_reads,
        "session_overlap": session_overlap,
        "_meta": {
            "timing_ms": round(elapsed, 1),
            "total_symbols": len(index.symbols),
            "candidates_scored": hits,
        },
    }
    if prior_evidence is not None:
        result["prior_evidence"] = prior_evidence
    if insertion_candidates:
        result["insertion_candidates"] = insertion_candidates
    if budget_advisor is not None:
        result["budget_advisor"] = budget_advisor
    if confidence in ("low", "none"):
        result["action"] = "STOP_AND_REPORT_GAP"
    return result