@huggingface/inference
Version:
Typescript client for the Hugging Face Inference Providers and Inference Endpoints
25 lines (24 loc) • 1.05 kB
JavaScript
import { resolveProvider } from "../../lib/getInferenceProviderMapping.js";
import { getProviderHelper } from "../../lib/getProviderHelper.js";
import { base64FromBytes } from "../../utils/base64FromBytes.js";
import { innerRequest } from "../../utils/request.js";
/**
* Answers a question on an image. Recommended model: dandelin/vilt-b32-finetuned-vqa.
*/
export async function visualQuestionAnswering(args, options) {
const provider = await resolveProvider(args.provider, args.model, args.endpointUrl);
const providerHelper = getProviderHelper(provider, "visual-question-answering");
const reqArgs = {
...args,
inputs: {
question: args.inputs.question,
// convert Blob or ArrayBuffer to base64
image: base64FromBytes(new Uint8Array(await args.inputs.image.arrayBuffer())),
},
};
const { data: res } = await innerRequest(reqArgs, providerHelper, {
...options,
task: "visual-question-answering",
});
return providerHelper.getResponse(res);
}