/** Name under which the text-extraction tool is exposed. */
export declare const EXTRACT_TEXT_NAME = "extract_text";

/**
 * JSON-Schema-style description of the `extract_text` input object.
 *
 * `pdfBase64` is the only required property; `pages` optionally restricts
 * extraction to specific 0-based page indices (at most 1000 entries).
 */
export declare const EXTRACT_TEXT_INPUT_SCHEMA: {
  readonly type: "object";
  readonly additionalProperties: false;
  readonly required: readonly ["pdfBase64"];
  readonly properties: {
    readonly pdfBase64: {
      readonly type: "string";
      readonly minLength: 4;
      readonly description: "Base64-encoded PDF bytes.";
    };
    readonly pages: {
      readonly type: "array";
      readonly description: "Optional 0-based page indices to extract. When omitted, every page is extracted.";
      readonly maxItems: 1000;
      readonly items: {
        readonly type: "integer";
        readonly minimum: 0;
      };
    };
  };
};

/**
 * JSON-Schema-style description of the `extract_text` output object.
 *
 * Every property except `extractableReason` is listed as required. The shape
 * mirrors {@link ExtractTextResult}.
 */
export declare const EXTRACT_TEXT_OUTPUT_SCHEMA: {
  readonly type: "object";
  readonly additionalProperties: false;
  readonly required: readonly [
    "pageCount",
    "extractedPageCount",
    "extractable",
    "pages",
    "fullText",
  ];
  readonly properties: {
    readonly pageCount: {
      readonly type: "integer";
      readonly minimum: 0;
    };
    readonly extractedPageCount: {
      readonly type: "integer";
      readonly minimum: 0;
    };
    readonly extractable: {
      readonly type: "boolean";
      readonly description: "False when one or more requested pages had a non-empty content stream but yielded no extractable text (likely subset fonts without /ToUnicode).";
    };
    readonly extractableReason: {
      readonly type: "string";
      // NOTE(review): this literal contained a raw line break, which is not
      // valid inside a double-quoted string. It is kept as an escaped "\n" so
      // the characters are unchanged; confirm against the implementation's
      // schema whether the break belongs to the actual value.
      readonly description: "Human-readable explanation when extractable=false. \nAbsent when extractable=true.";
    };
    readonly pages: {
      readonly type: "array";
      readonly items: {
        readonly type: "object";
        readonly additionalProperties: false;
        readonly required: readonly ["index", "text"];
        readonly properties: {
          readonly index: {
            readonly type: "integer";
            readonly minimum: 0;
          };
          readonly text: {
            readonly type: "string";
          };
        };
      };
    };
    readonly fullText: {
      readonly type: "string";
    };
  };
};

/** Text extracted from a single page. */
export interface ExtractedPage {
  /** Page index (the schema constrains it to an integer >= 0). */
  readonly index: number;
  /** Text extracted from that page. */
  readonly text: string;
}

/** Result object of {@link extractText}; mirrors `EXTRACT_TEXT_OUTPUT_SCHEMA`. */
export interface ExtractTextResult {
  readonly pageCount: number;
  readonly extractedPageCount: number;
  /**
   * Per the output schema: false when one or more requested pages had a
   * non-empty content stream but yielded no extractable text.
   */
  readonly extractable: boolean;
  /** Per the output schema: explanation present when `extractable` is false. */
  readonly extractableReason?: string;
  readonly pages: readonly ExtractedPage[];
  readonly fullText: string;
}

/**
 * Tokenise a single page's content stream and concatenate the operand strings
 * of every text-showing operator. Strings are emitted in the order they appear;
 * paragraph breaks are inferred from BT/ET blocks (one newline per text object).
 *
 * @internal — exported for unit-testing only.
 *
 * @param latin1 - The page content stream as a string (presumably Latin-1
 *   decoded, going by the parameter name — confirm against the implementation).
 * @returns The concatenated text of the page.
 */
export declare function _extractPageTextForTesting(latin1: string): string;

/**
 * Entry point of the `extract_text` tool.
 *
 * @param rawInput - Untyped caller input; presumably validated against
 *   `EXTRACT_TEXT_INPUT_SCHEMA` by the implementation (not visible here).
 * @returns A promise resolving to the extraction result.
 */
export declare function extractText(rawInput: unknown): Promise<ExtractTextResult>;
//# sourceMappingURL=extract-text.d.ts.map