@langchain/community
Version:
Third-party integrations for LangChain.js
37 lines (36 loc) • 1.69 kB
TypeScript
import { Document } from "@langchain/core/documents";
import { BufferLoader } from "@langchain/classic/document_loaders/fs/buffer";
//#region src/document_loaders/fs/docx.d.ts
type DocxLoaderOptions = {
type: "docx" | "doc";
};
/**
* A class that extends the `BufferLoader` class. It represents a document
* loader that loads documents from DOCX files.
* It has a constructor that takes a `filePathOrBlob` parameter representing the path to the word
* file or a Blob object, and an optional `options` parameter of type
* `DocxLoaderOptions`
*/
declare class DocxLoader extends BufferLoader {
protected options: DocxLoaderOptions;
constructor(filePathOrBlob: string | Blob, options?: DocxLoaderOptions);
/**
* A method that takes a `raw` buffer and `metadata` as parameters and
* returns a promise that resolves to an array of `Document` instances. It
* uses the `extractRawText` function from the `mammoth` module or
* `extract` method from the `word-extractor` module to extract
* the raw text content from the buffer. If the extracted text content is
* empty, it returns an empty array. Otherwise, it creates a new
* `Document` instance with the extracted text content and the provided
* metadata, and returns it as an array.
* @param raw The raw buffer from which to extract text content.
* @param metadata The metadata to be associated with the created `Document` instance.
* @returns A promise that resolves to an array of `Document` instances.
*/
parse(raw: Buffer, metadata: Document["metadata"]): Promise<Document[]>;
private parseDocx;
private parseDoc;
}
//#endregion
export { DocxLoader };
//# sourceMappingURL=docx.d.ts.map