/*
 * echogarden
 * Version: (not specified)
 * An easy-to-use speech toolset. Includes tools for synthesis, recognition, alignment, speech translation, language detection, source separation and more.
 * 21 lines • 800 B
 * TypeScript
 */
import { RawAudio } from '../audio/AudioUtilities.js';
import { Timeline } from '../utilities/Timeline.js';
/**
 * Runs speech recognition on the supplied audio using the OpenAI cloud
 * speech-to-text engine.
 *
 * @param rawAudio - Audio to process.
 * @param languageCode - Language code for the audio.
 *   NOTE(review): the expected code format is not visible in this declaration — confirm.
 * @param options - Engine options; see `OpenAICloudSTTOptions`.
 * @param task - Optional; either `'transcribe'` or `'translate'`.
 *   The value used when omitted is not visible in this declaration.
 * @returns A promise resolving to the recognized `transcript` text and a
 *   `timeline`, which may be `undefined`.
 *   NOTE(review): presumably the timeline is only present when timestamps
 *   are available — confirm against the implementation.
 */
export declare function recognize(
    rawAudio: RawAudio,
    languageCode: string,
    options: OpenAICloudSTTOptions,
    task?: Task
): Promise<{
    transcript: string;
    timeline: Timeline | undefined;
}>;
/** Operation mode accepted by the optional `task` parameter of `recognize`. */
type Task =
    | 'transcribe'
    | 'translate';
/**
 * Options accepted by `recognize` for the OpenAI cloud speech-to-text engine.
 *
 * Every field is optional.
 * NOTE(review): the field names mirror OpenAI client / transcription request
 * settings, but this declaration does not show how each one is consumed —
 * confirm details against the implementation.
 */
export interface OpenAICloudSTTOptions {
    /**
     * Model identifier. The listed literals are the known model names; any
     * other string is accepted as well.
     *
     * `(string & {})` is used instead of a bare `string` so the literal
     * members are not absorbed into `string`, which keeps them available to
     * editor completion while leaving the type open.
     */
    model?: 'whisper-1' | 'gpt-4o-mini-transcribe' | 'gpt-4o-transcribe' | (string & {});

    /** API key. NOTE(review): fallback behavior when omitted is not visible here. */
    apiKey?: string;

    /** Organization identifier — presumably passed to the OpenAI client; confirm. */
    organization?: string;

    /** Base URL — presumably overrides the default API endpoint; confirm. */
    baseURL?: string;

    /** Temperature setting — presumably the request's sampling temperature; confirm. */
    temperature?: number;

    /** Prompt text — presumably sent with the request to guide recognition; confirm. */
    prompt?: string;

    /** Request timeout. NOTE(review): units are not stated in this declaration — confirm. */
    timeout?: number;

    /** Maximum number of retries — presumably for failed requests; confirm. */
    maxRetries?: number;

    /** Whether to request word-level timestamps. */
    requestWordTimestamps?: boolean;
}
/**
 * Default options object for the OpenAI cloud speech-to-text engine (per its name).
 * Only the type is declared here; the concrete values are defined in the
 * implementation module and are not visible in this declaration file.
 */
export declare const defaultOpenAICloudSTTOptions: OpenAICloudSTTOptions;
export {};
//# sourceMappingURL=OpenAICloudSTT.d.ts.map