@huggingface/inference
Version:
Typescript client for the Hugging Face Inference Providers and Inference Endpoints
24 lines (22 loc) • 1.01 kB
text/typescript
import type { TextToSpeechInput } from "@huggingface/tasks";
import { resolveProvider } from "../../lib/getInferenceProviderMapping";
import { getProviderHelper } from "../../lib/getProviderHelper";
import type { BaseArgs, Options } from "../../types";
import { innerRequest } from "../../utils/request";
type TextToSpeechArgs = BaseArgs & TextToSpeechInput;
interface OutputUrlTextToSpeechGeneration {
output: string | string[];
}
/**
* This task synthesize an audio of a voice pronouncing a given text.
* Recommended model: espnet/kan-bayashi_ljspeech_vits
*/
export async function textToSpeech(args: TextToSpeechArgs, options?: Options): Promise<Blob> {
const provider = await resolveProvider(args.provider, args.model, args.endpointUrl);
const providerHelper = getProviderHelper(provider, "text-to-speech");
const { data: res } = await innerRequest<Blob | OutputUrlTextToSpeechGeneration>(args, providerHelper, {
...options,
task: "text-to-speech",
});
return providerHelper.getResponse(res);
}