/**
 * Character-level timing data that maps the normalized input text onto the
 * generated audio.
 *
 * The three arrays are parallel: index `i` of each one describes the same
 * character of the normalized text. Every field is optional.
 */
export interface NormalizedAlignment {
  /**
   * Start time, in milliseconds, of each character of the normalized text
   * within the audio (e.g. the character 'H' begins at 0 ms).
   *
   * Times are measured relative to the chunk returned by the model, not to
   * the full audio response.
   */
  charStartTimesMs?: number[];

  /**
   * Duration, in milliseconds, of each character of the normalized text
   * within the audio (e.g. the character 'H' lasts 3 ms).
   *
   * As with the start times, these values refer to the chunk returned by the
   * model, not to the full audio response.
   */
  charDurationsMs?: number[];

  /**
   * The characters of the normalized text sequence, in order (e.g. the first
   * character is 'H'). Entries may be spaces, punctuation, or other special
   * characters.
   *
   * This list is expected to have the same length as `charStartTimesMs` and
   * `charDurationsMs`.
   */
  chars?: string[];
}