mindee
Version:
Mindee Client Library for Node.js
31 lines (30 loc) • 855 B
TypeScript
/**
* Text information for a single page, as exposed through `ExtractedPdfInfo.pages`.
*/
export interface PageTextInfo {
/** Number identifying the page. NOTE(review): whether this is 0- or 1-based is not visible here; confirm. */
pageNumber: number;
/** Text items belonging to this page. */
content: Array<{
/** Presumably the text of the item; confirm against the implementation. */
str: string;
/** Presumably the horizontal position of the item. NOTE(review): units and origin are not visible here; confirm. */
x: number;
/** Presumably the vertical position of the item. NOTE(review): units and origin are not visible here; confirm. */
y: number;
/** Presumably the width of the item, in the same units as `x`/`y`; confirm. */
width: number;
/** Presumably the height of the item, in the same units as `x`/`y`; confirm. */
height: number;
/** Presumably the name of the font used to render the item; confirm. */
fontName: string;
}>;
}
/**
* Result type resolved by `extractTextFromPdf`.
*/
export interface ExtractedPdfInfo {
/** Per-page text information. */
pages: PageTextInfo[];
/**
* Returns a single string.
* NOTE(review): presumably the text of all pages joined together; the joining
* order and separator are not visible here, so confirm against the implementation.
*/
getConcatenatedText: () => string;
}
/**
* Extracts text from a full PDF document.
*
* @param pdfBuffer The PDF document, as a buffer.
* @returns A Promise resolving to an `ExtractedPdfInfo`: the per-page text
* information (`pages`) plus a `getConcatenatedText()` function that returns
* a string. Note that the promise does not resolve to a plain string.
*/
export declare function extractTextFromPdf(pdfBuffer: Buffer): Promise<ExtractedPdfInfo>;
/**
* Checks whether a PDF contains source text.
*
* NOTE(review): "source text" is not defined in this file; presumably it means
* text embedded in the PDF, as opposed to text only visible in images. Confirm.
*
* @param pdfData Buffer representing the content of the PDF file.
*
* @returns A Promise resolving to a boolean indicating whether the PDF has source text.
*/
export declare function hasSourceText(pdfData: Buffer): Promise<boolean>;