UNPKG

echogarden

Version:

An easy-to-use speech toolset. Includes tools for synthesis, recognition, alignment, speech translation, language detection, source separation and more.

21 lines 800 B
import { RawAudio } from '../audio/AudioUtilities.js';
import { Timeline } from '../utilities/Timeline.js';

/**
 * Operation selector accepted by {@link recognize}.
 * Module-private: this alias is not exported.
 */
type Task =
  | 'transcribe'
  | 'translate';

/**
 * Settings accepted by {@link recognize}. Every field is optional.
 *
 * NOTE(review): the per-field notes below are inferred from the field names
 * only; the implementation is not visible from this declaration file, so
 * confirm them against the source module before relying on them.
 */
export interface OpenAICloudSTTOptions {
  /**
   * Model identifier. Three names are spelled out as literals, but the
   * trailing `string` member means any string type-checks here.
   */
  model?:
    | 'whisper-1'
    | 'gpt-4o-mini-transcribe'
    | 'gpt-4o-transcribe'
    | string;

  /** Presumably the API key used to authenticate requests — confirm. */
  apiKey?: string;

  /** Presumably an organization identifier sent with requests — confirm. */
  organization?: string;

  /** Presumably overrides the service endpoint base URL — confirm. */
  baseURL?: string;

  /** Presumably the sampling temperature; valid range not shown here — confirm. */
  temperature?: number;

  /** Presumably a text prompt passed along with the audio — confirm. */
  prompt?: string;

  /** Presumably a request timeout; units are not shown here — confirm. */
  timeout?: number;

  /** Presumably the maximum number of request retries — confirm. */
  maxRetries?: number;

  /** Presumably toggles requesting word-level timestamps — confirm. */
  requestWordTimestamps?: boolean;
}

/**
 * Default option set for this module. The concrete values live in the
 * implementation and are not visible in this declaration.
 */
export declare const defaultOpenAICloudSTTOptions: OpenAICloudSTTOptions;

/**
 * Runs speech-to-text on the given audio.
 *
 * @param rawAudio - Audio input to process.
 * @param languageCode - Language code for the request.
 * @param options - Request settings; see {@link OpenAICloudSTTOptions}.
 * @param task - Optional operation selector, `'transcribe'` or `'translate'`.
 *   The behavior when omitted is decided by the implementation, which is not
 *   visible here.
 * @returns A promise resolving to an object holding the `transcript` string
 *   and a `timeline`, which may be `undefined`.
 */
export declare function recognize(
  rawAudio: RawAudio,
  languageCode: string,
  options: OpenAICloudSTTOptions,
  task?: Task
): Promise<{
  transcript: string;
  timeline: Timeline | undefined;
}>;

export {};
//# sourceMappingURL=OpenAICloudSTT.d.ts.map