ppu-pdf
Version:
Easily extract text from digital PDF files, with coordinates and font sizes included, and optionally group text by lines or render scanned PDFs to canvas/PNG.
19 lines (18 loc) • 777 B
TypeScript
import type { PdfReaderOptions } from "./pdf.interface";
/**
* A collection of threshold constants used for PDF processing.
*
* This is an ambient (`declare`) declaration: it describes only the shape of
* the object (four `number` properties). The concrete values are defined
* elsewhere and are not visible in this declaration.
*
* NOTE(review): the properties are not marked `readonly`, so the type permits
* reassignment even though the name suggests fixed values — confirm intent.
*/
export declare const CONSTANT: {
/**
* Minimum number of words per page to consider a page as containing text.
* NOTE(review): whether the comparison is inclusive is not visible here — confirm.
*/
WORDS_PER_PAGE_THRESHOLD: number;
/**
* Minimum text length per page to consider it as containing content.
* NOTE(review): the unit (presumably characters) is not stated here — confirm.
*/
TEXT_LENGTH_THRESHOLD: number;
/**
* Height percentage, measured from the top of the page, used to detect headers.
* NOTE(review): the scale (fraction 0–1 vs. 0–100) is not visible here — confirm.
*/
HEADER_FROM_HEIGHT_PERCENTAGE: number;
/**
* Height percentage, measured from the bottom of the page, used to detect footers.
* NOTE(review): the scale (fraction 0–1 vs. 0–100) is not visible here — confirm.
*/
FOOTER_FROM_HEIGHT_PERCENTAGE: number;
};
/**
* Default options for configuring the PDF reader.
*
* The shape is given by `PdfReaderOptions`, imported as a type from
* `./pdf.interface`. This is an ambient (`declare`) declaration, so the
* concrete default values are defined elsewhere and are not visible here.
*
* NOTE(review): presumably applied when a caller supplies no options (or only
* some of them) — confirm against the reader implementation.
*/
export declare const PDF_READER_DEFAULT_OPTIONS: PdfReaderOptions;