/**
 * Type declarations for the text-to-speech (TTS) Zod schemas and the
 * TypeScript types and interfaces that accompany them.
 *
 * NOTE(review): many declarations below have lost their generic type
 * arguments (bare `z.infer`, `z.input`, `z.output`, `Promise`, and unbalanced
 * angle/square brackets inside several `z.ZodUnion` / `z.ZodOptional` types),
 * so this text does not parse as written. This looks like extraction damage.
 * The trailing sourceMappingURL suggests the file is compiler output, so it
 * should presumably be regenerated from the originating module rather than
 * repaired by hand — TODO confirm.
 */
import { z } from "zod";

/**
 * Readonly tuple of 18 language-code literals. The same 18 codes make up the
 * `language` enum of the chatterbox schemas declared in this file.
 */
export declare const TTS_CHATTERBOX_LANGUAGES: readonly ["en", "es", "fr", "de", "it", "pt", "nl", "pl", "tr", "sv", "da", "fi", "no", "el", "ms", "sw", "ar", "ko"];

/**
 * Readonly tuple of 5 language-code literals. The same 5 codes make up the
 * `language` enum of the supertonic schemas declared in this file.
 */
export declare const TTS_SUPERTONIC_LANGUAGES: readonly ["en", "es", "fr", "pt", "ko"];

/**
 * Readonly tuple declared with the same 18 literals, in the same order, as
 * {@link TTS_CHATTERBOX_LANGUAGES}.
 */
export declare const TTS_LANGUAGES: readonly ["en", "es", "fr", "de", "it", "pt", "nl", "pl", "tr", "sv", "da", "fi", "no", "el", "ms", "sw", "ar", "ko"];

/**
 * Object schema tagged with `ttsEngine: "chatterbox"`. `language` is a
 * non-optional enum of 18 codes; `voice` and `useGPU` are optional.
 *
 * NOTE(review): the inner types of the `z.ZodOptional` fields are not visible
 * here.
 */
export declare const ttsChatterboxRuntimeConfigSchema: z.ZodObject<{ ttsEngine: z.ZodLiteral<"chatterbox">; language: z.ZodEnum<{ en: "en"; ar: "ar"; de: "de"; es: "es"; fi: "fi"; fr: "fr"; it: "it"; ko: "ko"; nl: "nl"; pl: "pl"; pt: "pt"; da: "da"; el: "el"; ms: "ms"; no: "no"; sv: "sv"; tr: "tr"; sw: "sw"; }>; voice: z.ZodOptional; useGPU: z.ZodOptional; }, z.core.$strip>;

/**
 * Object schema tagged with `ttsEngine: "supertonic"`. `language` is a
 * non-optional enum of 5 codes; `voice`, `ttsSpeed`, `ttsNumInferenceSteps`
 * and `useGPU` are optional.
 *
 * NOTE(review): the inner types of the `z.ZodOptional` fields are not visible
 * here.
 */
export declare const ttsSupertonicRuntimeConfigSchema: z.ZodObject<{ ttsEngine: z.ZodLiteral<"supertonic">; language: z.ZodEnum<{ en: "en"; es: "es"; fr: "fr"; ko: "ko"; pt: "pt"; }>; voice: z.ZodOptional; ttsSpeed: z.ZodOptional; ttsNumInferenceSteps: z.ZodOptional; useGPU: z.ZodOptional; }, z.core.$strip>;

/**
 * Union schema for runtime configuration. The visible remainder shows an
 * 18-language member followed by a `ttsEngine: "supertonic"` member.
 *
 * NOTE(review): the opening of the union's type-argument list is missing
 * (`z.ZodUnion;` is followed directly by object fields). The first member is
 * presumably the chatterbox runtime object — TODO confirm and regenerate.
 */
export declare const ttsRuntimeConfigSchema: z.ZodUnion; language: z.ZodEnum<{ en: "en"; ar: "ar"; de: "de"; es: "es"; fi: "fi"; fr: "fr"; it: "it"; ko: "ko"; nl: "nl"; pl: "pl"; pt: "pt"; da: "da"; el: "el"; ms: "ms"; no: "no"; sv: "sv"; tr: "tr"; sw: "sw"; }>; voice: z.ZodOptional; useGPU: z.ZodOptional; }, z.core.$strip>, z.ZodObject<{ ttsEngine: z.ZodLiteral<"supertonic">; language: z.ZodEnum<{ en: "en"; es: "es"; fr: "fr"; ko: "ko"; pt: "pt"; }>; voice: z.ZodOptional; ttsSpeed: z.ZodOptional; ttsNumInferenceSteps: z.ZodOptional; useGPU: z.ZodOptional; }, z.core.$strip>]>;

/**
 * Load-time object schema tagged with `ttsEngine: "chatterbox"`. It carries
 * the same `language`, `voice` and `useGPU` fields as the chatterbox runtime
 * schema, plus optional `s3genModelSrc` and `referenceAudioSrc`.
 *
 * NOTE(review): the types of `s3genModelSrc` and `referenceAudioSrc` are
 * truncated. The field run that follows each of them (`modelId`,
 * `registryPath`, `registrySource`, `blobCoreKey`, `blobIndex`, `engine`,
 * `expectedSize`, `sha256Checksum`, `addon`) presumably belongs to a nested
 * object inside those types, not to this top-level object — TODO confirm.
 */
export declare const ttsChatterboxLoadConfigSchema: z.ZodObject<{ ttsEngine: z.ZodLiteral<"chatterbox">; language: z.ZodEnum<{ en: "en"; ar: "ar"; de: "de"; es: "es"; fi: "fi"; fr: "fr"; it: "it"; ko: "ko"; nl: "nl"; pl: "pl"; pt: "pt"; da: "da"; el: "el"; ms: "ms"; no: "no"; sv: "sv"; tr: "tr"; sw: "sw"; }>; voice: z.ZodOptional; useGPU: z.ZodOptional; s3genModelSrc: z.ZodOptional; modelId: z.ZodOptional; registryPath: z.ZodOptional; registrySource: z.ZodOptional; blobCoreKey: z.ZodOptional; blobIndex: z.ZodOptional; engine: z.ZodOptional; expectedSize: z.ZodOptional; sha256Checksum: z.ZodOptional; addon: z.ZodOptional, z.ZodLiteral<"vad">]>>; }, z.core.$strip>]>>; referenceAudioSrc: z.ZodOptional; modelId: z.ZodOptional; registryPath: z.ZodOptional; registrySource: z.ZodOptional; blobCoreKey: z.ZodOptional; blobIndex: z.ZodOptional; engine: z.ZodOptional; expectedSize: z.ZodOptional; sha256Checksum: z.ZodOptional; addon: z.ZodOptional, z.ZodLiteral<"vad">]>>; }, z.core.$strip>]>>; }, z.core.$strip>;

/**
 * Load-time object schema tagged with `ttsEngine: "supertonic"`. As written
 * here it lists the same fields as {@link ttsSupertonicRuntimeConfigSchema}.
 */
export declare const ttsSupertonicLoadConfigSchema: z.ZodObject<{ ttsEngine: z.ZodLiteral<"supertonic">; language: z.ZodEnum<{ en: "en"; es: "es"; fr: "fr"; ko: "ko"; pt: "pt"; }>; voice: z.ZodOptional; ttsSpeed: z.ZodOptional; ttsNumInferenceSteps: z.ZodOptional; useGPU: z.ZodOptional; }, z.core.$strip>;

/**
 * Union schema for load-time configuration. The visible remainder shows a
 * member with the chatterbox load fields followed by a
 * `ttsEngine: "supertonic"` member.
 *
 * NOTE(review): the opening of the union's type-argument list is missing and
 * the nested source types are truncated, as in
 * `ttsChatterboxLoadConfigSchema` — regenerate rather than edit.
 */
export declare const ttsLoadConfigSchema: z.ZodUnion; language: z.ZodEnum<{ en: "en"; ar: "ar"; de: "de"; es: "es"; fi: "fi"; fr: "fr"; it: "it"; ko: "ko"; nl: "nl"; pl: "pl"; pt: "pt"; da: "da"; el: "el"; ms: "ms"; no: "no"; sv: "sv"; tr: "tr"; sw: "sw"; }>; voice: z.ZodOptional; useGPU: z.ZodOptional; s3genModelSrc: z.ZodOptional; modelId: z.ZodOptional; registryPath: z.ZodOptional; registrySource: z.ZodOptional; blobCoreKey: z.ZodOptional; blobIndex: z.ZodOptional; engine: z.ZodOptional; expectedSize: z.ZodOptional; sha256Checksum: z.ZodOptional; addon: z.ZodOptional, z.ZodLiteral<"vad">]>>; }, z.core.$strip>]>>; referenceAudioSrc: z.ZodOptional; modelId: z.ZodOptional; registryPath: z.ZodOptional; registrySource: z.ZodOptional; blobCoreKey: z.ZodOptional; blobIndex: z.ZodOptional; engine: z.ZodOptional; expectedSize: z.ZodOptional; sha256Checksum: z.ZodOptional; addon: z.ZodOptional, z.ZodLiteral<"vad">]>>; }, z.core.$strip>]>>; }, z.core.$strip>, z.ZodObject<{ ttsEngine: z.ZodLiteral<"supertonic">; language: z.ZodEnum<{ en: "en"; es: "es"; fr: "fr"; ko: "ko"; pt: "pt"; }>; voice: z.ZodOptional; ttsSpeed: z.ZodOptional; ttsNumInferenceSteps: z.ZodOptional; useGPU: z.ZodOptional; }, z.core.$strip>]>;

/**
 * Readonly tuple of 13 configuration field-name literals.
 *
 * NOTE(review): how these names are consumed is not visible in this file.
 * From the identifier they are presumably legacy per-model-file config keys —
 * verify against the implementation.
 */
export declare const LEGACY_TTS_ONNX_MODEL_CONFIG_FIELDS: readonly ["ttsSupertonicMultilingual", "ttsTokenizerSrc", "ttsSpeechEncoderSrc", "ttsEmbedTokensSrc", "ttsConditionalDecoderSrc", "ttsLanguageModelSrc", "ttsTextEncoderSrc", "ttsDurationPredictorSrc", "ttsVectorEstimatorSrc", "ttsVocoderSrc", "ttsUnicodeIndexerSrc", "ttsTtsConfigSrc", "ttsVoiceStyleSrc"];

/**
 * Union schema whose visible members are `z.core.$strict` object schemas. The
 * last one has a string index signature of optional values.
 *
 * NOTE(review): the leading members of the union are truncated
 * (`z.ZodUnion;` is followed directly by `}`), so the full member list cannot
 * be read from this declaration.
 */
export declare const ttsConfigSchema: z.ZodUnion; }, z.core.$strict>, z.ZodObject<{ [x: string]: z.ZodOptional; }, z.core.$strict>]>;

/**
 * Object schema for client-supplied TTS parameters. `modelId` and `text` are
 * strings; `inputType`, `stream` and `sentenceStream` carry defaults
 * (`z.ZodDefault`); `sentenceStreamLocale` and
 * `sentenceStreamMaxChunkScalars` are optional.
 *
 * NOTE(review): the wrapped types and default values are not visible here.
 */
export declare const ttsClientParamsSchema: z.ZodObject<{ modelId: z.ZodString; inputType: z.ZodDefault; text: z.ZodString; stream: z.ZodDefault; sentenceStream: z.ZodDefault; sentenceStreamLocale: z.ZodOptional; sentenceStreamMaxChunkScalars: z.ZodOptional; }, z.core.$strip>;

/**
 * Request schema listing the same fields as {@link ttsClientParamsSchema},
 * plus the tag `type: "textToSpeech"`.
 */
export declare const ttsRequestSchema: z.ZodObject<{ modelId: z.ZodString; inputType: z.ZodDefault; text: z.ZodString; stream: z.ZodDefault; sentenceStream: z.ZodDefault; sentenceStreamLocale: z.ZodOptional; sentenceStreamMaxChunkScalars: z.ZodOptional; type: z.ZodLiteral<"textToSpeech">; }, z.core.$strip>;

/**
 * Object schema with two optional fields, `audioDuration` and `totalSamples`.
 *
 * NOTE(review): their inner types and units are not visible here.
 */
export declare const ttsStatsSchema: z.ZodObject<{ audioDuration: z.ZodOptional; totalSamples: z.ZodOptional; }, z.core.$strip>;

/**
 * Response schema tagged with `type: "textToSpeech"`. It has a `buffer`
 * array, a defaulted `done`, and optional `stats`, `chunkIndex` and
 * `sentenceChunk`.
 *
 * NOTE(review): the `stats` type is truncated. The `totalSamples` field and
 * the extra `}, z.core.$strip>>` after it presumably belong to a nested stats
 * object — TODO confirm. The element type of `buffer` is also missing.
 */
export declare const ttsResponseSchema: z.ZodObject<{ type: z.ZodLiteral<"textToSpeech">; buffer: z.ZodArray; done: z.ZodDefault; stats: z.ZodOptional; totalSamples: z.ZodOptional; }, z.core.$strip>>; chunkIndex: z.ZodOptional; sentenceChunk: z.ZodOptional; }, z.core.$strip>;

/**
 * Non-exported base object schema for streaming requests. It has a `modelId`
 * string, a defaulted `inputType`, and optional `accumulateSentences`,
 * `sentenceDelimiterPreset`, `maxBufferScalars` and `flushAfterMs`.
 *
 * NOTE(review): the type of `sentenceDelimiterPreset` is truncated (stray
 * `>` after `z.ZodOptional`).
 */
declare const textToSpeechStreamRequestBaseSchema: z.ZodObject<{ modelId: z.ZodString; inputType: z.ZodDefault; accumulateSentences: z.ZodOptional; sentenceDelimiterPreset: z.ZodOptional>; maxBufferScalars: z.ZodOptional; flushAfterMs: z.ZodOptional; }, z.core.$strip>;

/**
 * Streaming request schema listing the same fields as
 * `textToSpeechStreamRequestBaseSchema`, plus the tag
 * `type: "textToSpeechStream"`.
 */
export declare const textToSpeechStreamRequestSchema: z.ZodObject<{ modelId: z.ZodString; inputType: z.ZodDefault; accumulateSentences: z.ZodOptional; sentenceDelimiterPreset: z.ZodOptional>; maxBufferScalars: z.ZodOptional; flushAfterMs: z.ZodOptional; type: z.ZodLiteral<"textToSpeechStream">; }, z.core.$strip>;

/**
 * Streaming response schema tagged with `type: "textToSpeechStream"`. Apart
 * from the tag it lists the same fields as {@link ttsResponseSchema}, with
 * the same truncation in `stats` and `buffer`.
 */
export declare const textToSpeechStreamResponseSchema: z.ZodObject<{ type: z.ZodLiteral<"textToSpeechStream">; buffer: z.ZodArray; done: z.ZodDefault; stats: z.ZodOptional; totalSamples: z.ZodOptional; }, z.core.$strip>>; chunkIndex: z.ZodOptional; sentenceChunk: z.ZodOptional; }, z.core.$strip>;

/** Union of the element literals of {@link TTS_LANGUAGES}. */
export type TtsLanguage = (typeof TTS_LANGUAGES)[number];
/** Union of the element literals of {@link TTS_CHATTERBOX_LANGUAGES}. */
export type TtsChatterboxLanguage = (typeof TTS_CHATTERBOX_LANGUAGES)[number];
/** Union of the element literals of {@link TTS_SUPERTONIC_LANGUAGES}. */
export type TtsSupertonicLanguage = (typeof TTS_SUPERTONIC_LANGUAGES)[number];

// NOTE(review): every `z.infer` / `z.input` / `z.output` alias below is
// missing its type argument. Each presumably referred to the `typeof` of the
// correspondingly named schema above — TODO confirm against the source module.
export type TtsChatterboxLoadConfig = z.infer;
export type TtsSupertonicLoadConfig = z.infer;
export type TtsLoadConfig = z.infer;
/** @deprecated Use {@link TtsChatterboxLoadConfig} */
export type TtsChatterboxConfig = TtsChatterboxLoadConfig;
/** @deprecated Use {@link TtsSupertonicLoadConfig} */
export type TtsSupertonicConfig = TtsSupertonicLoadConfig;
export type TtsChatterboxRuntimeConfig = z.infer;
export type TtsSupertonicRuntimeConfig = z.infer;
export type TtsRuntimeConfig = z.infer;
export type TtsConfig = z.infer;
/** Declared via `z.input`, i.e. the pre-parse shape of a schema. */
export type TtsClientParamsInput = z.input;
/** Declared via `z.output`, i.e. the post-parse shape of a schema. */
export type TtsClientParams = z.output;
export type TtsRequest = z.infer;
export type TtsResponse = z.infer;
export type TtsStats = z.infer;

/**
 * Plain object type with a required numeric `buffer` array and optional
 * `chunkIndex` and `sentenceChunk`.
 */
export type TtsSentenceChunkUpdate = {
    buffer: number[];
    chunkIndex?: number;
    sentenceChunk?: string;
};

export type TextToSpeechStreamRequest = z.infer;
export type TextToSpeechStreamResponse = z.infer;
export type TextToSpeechStreamClientParams = z.infer;

/**
 * Result handle exposing generator-based and promise-based views: a required
 * `bufferStream`, an optional `chunkUpdates` generator, and `buffer` / `done`
 * promises.
 *
 * NOTE(review): the type arguments of `AsyncGenerator` and `Promise` are
 * missing, so the yielded and resolved types cannot be read from here.
 */
export interface TextToSpeechStreamResult {
    bufferStream: AsyncGenerator;
    chunkUpdates?: AsyncGenerator;
    buffer: Promise;
    done: Promise;
}

/**
 * Session object that accepts text fragments through `write` (string or
 * `Buffer`), has `end` and `destroy` methods, and is async-iterable via
 * `Symbol.asyncIterator`.
 *
 * NOTE(review): the iterated element type is missing. The exact semantics of
 * `end` versus `destroy` are not visible in this file — presumably graceful
 * finish versus abort; verify against the implementation.
 */
export interface TextToSpeechStreamSession {
    write(textFragment: string | Buffer): void;
    end(): void;
    destroy(): void;
    [Symbol.asyncIterator](): AsyncIterator;
}

export {};
//# sourceMappingURL=text-to-speech.d.ts.map