/**
 * Alignment information for the generated audio given the input text sequence.
 */
export interface Alignment {
    /**
     * A list of starting times (in milliseconds) for each character in the text as it
     * corresponds to the audio. For instance, the character 'H' starts at time 0 ms in the audio.
     * Note these times are relative to the returned chunk from the model, and not the
     * full audio response.
     */
    charStartTimesMs?: number[];
    /**
     * A list of durations (in milliseconds) for each character in the text as it
     * corresponds to the audio. For instance, the character 'H' lasts for 3 ms in the audio.
     * Note these times are relative to the returned chunk from the model, and not the
     * full audio response.
     */
    charDurationsMs?: number[];
    /**
     * A list of characters in the text sequence. For instance, the first character is 'H'.
     * Note that this list may contain spaces, punctuation, and other special characters.
     * The length of this list should be the same as the lengths of `charStartTimesMs` and `charDurationsMs`.
     */
    chars?: string[];
}