@langchain/community
Version:
Third-party integrations for LangChain.js
39 lines (38 loc) • 1.27 kB
JavaScript
import { OpenAIClient, toFile } from "@langchain/openai";
import { Document } from "@langchain/core/documents";
import { BufferLoader } from "langchain/document_loaders/fs/buffer";
const MODEL_NAME = "whisper-1";
/**
* @example
* ```typescript
* const loader = new OpenAIWhisperAudio(
* "./src/document_loaders/example_data/test.mp3",
* );
* const docs = await loader.load();
* console.log(docs);
* ```
*/
export class OpenAIWhisperAudio extends BufferLoader {
constructor(filePathOrBlob, fields) {
super(filePathOrBlob);
Object.defineProperty(this, "openAIClient", {
enumerable: true,
configurable: true,
writable: true,
value: void 0
});
this.openAIClient = new OpenAIClient(fields?.clientOptions);
}
async parse(raw, metadata) {
const fileName = metadata.source === "blob" ? metadata.blobType : metadata.source;
const transcriptionResponse = await this.openAIClient.audio.transcriptions.create({
file: await toFile(raw, fileName),
model: MODEL_NAME,
});
const document = new Document({
pageContent: transcriptionResponse.text,
metadata,
});
return [document];
}
}