@huggingface/inference

Version:

Typescript client for the Hugging Face Inference Providers and Inference Endpoints

24 lines (22 loc) • 1.01 kB

text/typescript

import type { TextToSpeechInput } from "@huggingface/tasks"; import { resolveProvider } from "../../lib/getInferenceProviderMapping"; import { getProviderHelper } from "../../lib/getProviderHelper"; import type { BaseArgs, Options } from "../../types"; import { innerRequest } from "../../utils/request"; type TextToSpeechArgs = BaseArgs & TextToSpeechInput; interface OutputUrlTextToSpeechGeneration { output: string | string[]; } /** * This task synthesize an audio of a voice pronouncing a given text. * Recommended model: espnet/kan-bayashi_ljspeech_vits */ export async function textToSpeech(args: TextToSpeechArgs, options?: Options): Promise<Blob> { const provider = await resolveProvider(args.provider, args.model, args.endpointUrl); const providerHelper = getProviderHelper(provider, "text-to-speech"); const { data: res } = await innerRequest<Blob | OutputUrlTextToSpeechGeneration>(args, providerHelper, { ...options, task: "text-to-speech", }); return providerHelper.getResponse(res); }