import type { PdfChunk, PdfIndex } from "./types.js";

/**
 * Value resolved by {@link loadPdfs}: the built index plus counters
 * describing the run.
 */
export type LoadResult = {
    /** Index built over the chunks of the requested PDFs. */
    index: PdfIndex;
    /**
     * Counters for the load run.
     * NOTE(review): the per-field meanings below are inferred from the field
     * names only — confirm against the implementation.
     */
    stats: {
        /** Presumably the number of PDFs served from the on-disk cache. */
        cached: number;
        /** Presumably the number of PDFs that had to be freshly extracted. */
        extracted: number;
        /** Presumably the total number of chunks placed in the index. */
        chunks: number;
    };
};

/**
 * Extract → chunk → BM25-index a set of PDF paths. Cached on disk by content
 * hash so re-runs skip re-extraction. Returns an empty-but-valid index when
 * `paths` is empty.
 *
 * @param paths - Paths of the PDF files to load; may be empty.
 * @param cacheDir - Directory for the on-disk cache (presumably where the
 *   content-hash-keyed extraction results are stored — confirm).
 * @returns A promise resolving to the index and the run statistics.
 */
export declare function loadPdfs(paths: string[], cacheDir: string): Promise<LoadResult>;

/**
 * Section-aware sliding-window chunker. Splits text on blank-line paragraphs,
 * tags each paragraph with the most recent heading line, then packs into
 * ~CHUNK_SIZE-char chunks with CHUNK_OVERLAP. Headings stay attached so
 * retrieved excerpts carry their context.
 *
 * @param text - Text to split into chunks.
 * @param source - Identifier of the document the text came from (presumably
 *   the PDF path — confirm against callers).
 * @param hash - Hash associated with the document (presumably the content
 *   hash used for caching — confirm).
 * @returns The chunks produced from `text`.
 */
export declare function chunkText(text: string, source: string, hash: string): PdfChunk[];

/**
 * Creates a `PdfIndex` with no content.
 * NOTE(review): presumably this is the "empty-but-valid" index that
 * `loadPdfs` yields for an empty `paths` array — confirm.
 */
export declare function emptyIndex(): PdfIndex;
//# sourceMappingURL=load.d.ts.map