@d-id/client-sdk
Version:
d-id client sdk
154 lines (153 loc) • 4.9 kB
TypeScript
/**
 * Identifiers of the text-to-speech providers known to this module.
 *
 * Each member's string value is what the matching `*_tts_provider`
 * interface carries in its `type` field.
 */
export declare enum Providers {
  Afflorithmics = "afflorithmics",
  Amazon = "amazon",
  AzureOpenAi = "azure-openai",
  Elevenlabs = "elevenlabs",
  Microsoft = "microsoft",
}
/**
 * Access level attached to a voice (see the `access` field of `IVoice`).
 */
export declare enum VoiceAccess {
  Premium = "premium",
  Private = "private",
  Public = "public",
}
/**
 * Describes a single voice entry.
 */
export interface IVoice {
  /** Identifier of the voice. */
  id: string;
  /** Name of the voice. */
  name: string;
  /** Provider the voice belongs to; one of the `Providers` values. */
  provider: Providers;
  /** Access level of the voice; one of the `VoiceAccess` values. */
  access: VoiceAccess;
  /** Gender label of the voice (plain string; allowed values are not defined here). */
  gender: string;
  /** Locale of the voice (plain string; format is not defined here). */
  locale: string;
  /** Language of the voice (plain string; format is not defined here). */
  language: string;
  /** Styles listed for the voice, as plain strings. */
  styles: string[];
}
/**
 * Text-to-speech settings for the Elevenlabs provider: the provider type,
 * the requested voice id and optional voice tuning.
 * Available for premium users.
 */
export interface Elevenlabs_tts_provider {
  /** Provider discriminator; always `Providers.Elevenlabs`. */
  type: Providers.Elevenlabs;
  /**
   * Id of the requested voice, taken from the list of available voices:
   * https://api.elevenlabs.io/v1/voices.
   * @example "21m00Tcm4TlvDq8ikWAM"
   * @default 21m00Tcm4TlvDq8ikWAM
   */
  voice_id: string;
  /**
   * Optional voice customization.
   * Read more here: https://docs.elevenlabs.io/speech-synthesis/voice-settings
   */
  voice_config?: VoiceConfigElevenlabs;
}
/**
 * Text-to-speech settings for the Afflorithmics provider: the provider type,
 * the requested voice id and optional voice tuning.
 * Available for enterprise users.
 */
export interface Afflorithmics_tts_provider {
  /** Provider discriminator; always `Providers.Afflorithmics`. */
  type: Providers.Afflorithmics;
  /**
   * Id of the requested voice, taken from the list of available voices.
   * @example "abc123DEF456"
   * @default abc123DEF456
   */
  voice_id: string;
  /**
   * Optional voice customization.
   * Read more here: https://docs.audiostack.ai/reference/postspeech
   */
  voice_config?: VoiceConfigAfflorithmics;
}
/**
 * Text-to-speech settings for the Microsoft (Azure) provider: the provider
 * type, the requested voice id and optional style/voice details.
 */
export interface Microsoft_tts_provider {
  /** Provider discriminator; always `Providers.Microsoft`. */
  type: Providers.Microsoft;
  /**
   * Id of the requested voice, taken from the list of available voices.
   * Full list of voice ids: https://docs.d-id.com/reference/microsoft-azure
   * @example "en-US-JennyNeural"
   * @default en-US-JennyNeural
   */
  voice_id: string;
  /** Optional voice customization (style, rate, pitch). */
  voice_config?: VoiceConfigMicrosoft;
  /** Optional name of the voice. */
  voice_name?: string;
  /** Optional language of the voice. */
  voice_language?: string;
}
/**
 * Text-to-speech settings for the AzureOpenAi provider.
 *
 * Carries every field of `Microsoft_tts_provider` except `type`, which is
 * redeclared here as `Providers.AzureOpenAi`.
 */
export interface AzureOpenAi_tts_provider
  extends Omit<Microsoft_tts_provider, "type"> {
  /** Provider discriminator; always `Providers.AzureOpenAi`. */
  type: Providers.AzureOpenAi;
}
/**
 * Text-to-speech settings for the Amazon provider: the provider type and
 * the requested voice id.
 */
export interface Amazon_tts_provider {
  /** Provider discriminator; always `Providers.Amazon`. */
  type: Providers.Amazon;
  /**
   * Id of the requested voice, taken from the list of available voices.
   * Full list of voice ids: https://docs.d-id.com/reference/text-to-speech-providers
   * @example "Joanna"
   */
  voice_id: string;
}
/**
 * Optional voice tuning for the Microsoft provider. Every field may be omitted.
 */
export interface VoiceConfigMicrosoft {
  /**
   * Voice style. The set of available styles differs from voice to voice.
   */
  style?: string;
  /**
   * Voice speed, given as a string.
   * Either a number relative to 1 (0.5 is half speed, 2 is twice as fast, etc.)
   * or one of the constants x-slow/slow/medium/fast/x-fast.
   * @example "0.5"
   */
  rate?: string;
  /**
   * Voice pitch, given as a string.
   * Either an absolute value in Hz (including units), a relative value in Hz
   * or st (semitones), or one of the constants x-low/low/medium/high/x-high.
   * @example "+2st"
   */
  pitch?: string;
}
/**
 * Optional voice tuning for the Elevenlabs provider. Every field may be omitted.
 */
export interface VoiceConfigElevenlabs {
  /**
   * Controls how stable the voice is and how much randomness each new
   * generation has.
   * @example 0
   */
  stability?: number;
  /**
   * Similarity slider: how closely the AI should adhere to the original voice
   * when attempting to replicate it.
   * @example 0
   */
  similarity_boost?: number;
}
/**
 * Optional voice tuning for the Afflorithmics provider. Every field may be omitted.
 */
export interface VoiceConfigAfflorithmics {
  /**
   * Voice speed, given as a string.
   * Either a number relative to 1 (0.5 is half speed, 2 is twice as fast, etc.)
   * or one of the constants x-slow/slow/medium/fast/x-fast.
   * @example "1.2"
   * @min 0.5
   * @max 1.5
   * @default 1
   */
  rate?: string;
  /**
   * Amount of microseconds for silence padding. Half of that amount is
   * inserted as silence at the beginning and half at the end of each Speech file.
   */
  silencePadding?: number;
  /**
   * Flag that turns on lexicographical text corrections.
   */
  voiceIntelligence?: boolean;
}
/**
 * Union of the provider settings for Microsoft, AzureOpenAi, Afflorithmics
 * and Elevenlabs. Members are told apart by their `type` field.
 */
export type TextToSpeechProviders =
  | Microsoft_tts_provider
  | AzureOpenAi_tts_provider
  | Afflorithmics_tts_provider
  | Elevenlabs_tts_provider;
/**
 * `TextToSpeechProviders` plus the Amazon provider settings.
 */
export type ExtendedTextToSpeechProviders =
  | TextToSpeechProviders
  | Amazon_tts_provider;
/**
 * Provider settings for Microsoft, AzureOpenAi, Afflorithmics, Elevenlabs and
 * Amazon — the same member set as `ExtendedTextToSpeechProviders`.
 */
export type StreamTextToSpeechProviders =
  | TextToSpeechProviders
  | Amazon_tts_provider;