echogarden
Version:
An easy-to-use speech toolset. Includes tools for synthesis, recognition, alignment, speech translation, language detection, source separation and more.
26 lines (25 loc) • 1.07 kB
TypeScript
import { type PreTrainedModel, type PreTrainedTokenizer } from '@echogarden/transformers-nodejs-lite';
import { Timeline } from '../utilities/Timeline.js';
export declare function alignTimelineToTextSemantically(timeline: Timeline, text: string, textLangCode: string): Promise<Timeline>;
export declare function alignWordsToWordsSemantically(wordsGroups1: string[][], wordsGroups2: string[][], windowTokenCount?: number): Promise<WordMapping[]>;
export declare class E5TextEmbedding {
readonly modelPath: string;
tokenizer?: PreTrainedTokenizer;
model?: PreTrainedModel;
constructor(modelPath: string);
tokenizeToModelInputs(text: string): Promise<any>;
inferTokenEmbeddings(inputs: any): Promise<TokenEmbeddingData[]>;
initializeIfNeeded(): Promise<void>;
}
export interface TokenEmbeddingData {
id: number;
text: string;
embeddingVector: Float32Array;
}
export interface WordMapping {
wordIndex1: number;
word1: string;
wordIndex2: number;
word2: string;
}
export declare const e5SupportedLanguages: string[];