UNPKG

node-poppler

Version:

Asynchronous node.js wrapper for the Poppler PDF rendering library

776 lines (775 loc) 49.8 kB
export default Poppler; export class Poppler { /** * @param {string} [binPath] - Path of poppler-utils binaries. * If not provided, the constructor will attempt to find the Poppler `pdfinfo` binary * in the PATH environment variable and use that as the path for all binaries. * For `win32` the binaries are bundled with the package and will be used * if a local installation is not found. */ constructor(binPath?: string); popplerPath: string; /** * @author Frazer Smith * @description Embeds files (attachments) into a PDF file. * @param {string} file - Filepath of the PDF file to read. * @param {string} fileToAttach - Filepath of the attachment to be embedded into the PDF file. * @param {string} outputFile - Filepath of the file to output the results to. * @param {object} [options] - Object containing options to pass to binary. * @param {boolean} [options.printVersionInfo] - Print copyright and version info. * @param {boolean} [options.replace] - Replace embedded file with same name (if it exists). * @returns {Promise<string>} A promise that resolves with a stdout string, or rejects with an `Error` object. */ pdfAttach(file: string, fileToAttach: string, outputFile: string, options?: { printVersionInfo?: boolean; replace?: boolean; }): Promise<string>; /** * @author Frazer Smith * @description Lists or extracts embedded files (attachments) from a PDF file. * @param {string} file - Filepath of the PDF file to read. * @param {object} [options] - Object containing options to pass to binary. * @param {boolean} [options.listEmbedded] - List all of the embedded files in the PDF file. * File names are converted to the text encoding specified by `options.outputEncoding`. * @param {string} [options.outputEncoding] - Sets the encoding to use for text output. * This defaults to `UTF-8`. * @param {string} [options.ownerPassword] - Owner password (for encrypted files). 
* @param {string} [options.outputPath] - Set the file name used when saving an embedded file with * the save option enabled, or the directory if `options.saveall` is used. * @param {boolean} [options.printVersionInfo] - Print copyright and version info. * @param {boolean} [options.saveAllFiles] - Save all of the embedded files. This uses the file * names associated with the embedded files (as printed by `options.listEmbedded`). * By default, the files are saved in the current directory; this can be changed * with `options.outputPath`. * @param {string} [options.saveFile] - Save the specified embedded file. * By default, this uses the file name associated with the embedded file (as printed by * `options.listEmbedded`); the file name can be changed with `options.outputPath`. * @param {number} [options.saveSpecificFile] - Save the specified embedded file. * By default, this uses the file name associated with the embedded file (as printed by * `options.listEmbedded`); the file name can be changed with `options.outputPath`. * @param {string} [options.userPassword] - User password (for encrypted files). * @returns {Promise<string>} A promise that resolves with a stdout string, or rejects with an `Error` object. */ pdfDetach(file: string, options?: { listEmbedded?: boolean; outputEncoding?: string; ownerPassword?: string; outputPath?: string; printVersionInfo?: boolean; saveAllFiles?: boolean; saveFile?: string; saveSpecificFile?: number; userPassword?: string; }): Promise<string>; /** * @author Frazer Smith * @description Lists the fonts used in a PDF file along with various information for each font. * @param {Buffer|string} file - PDF file as Buffer, or filepath of the PDF file to read. * @param {object} [options] - Object containing options to pass to binary. * @param {number} [options.firstPageToExamine] - Specifies the first page to examine. * @param {number} [options.lastPageToExamine] - Specifies the last page to examine. 
* @param {boolean} [options.listSubstitutes] - List the substitute fonts that poppler * will use for non-embedded fonts. * @param {string} [options.ownerPassword] - Owner password (for encrypted files). * @param {boolean} [options.printVersionInfo] - Print copyright and version info. * @param {string} [options.userPassword] - User password (for encrypted files). * @returns {Promise<string>} A promise that resolves with a stdout string, or rejects with an `Error` object. */ pdfFonts(file: Buffer | string, options?: { firstPageToExamine?: number; lastPageToExamine?: number; listSubstitutes?: boolean; ownerPassword?: string; printVersionInfo?: boolean; userPassword?: string; }): Promise<string>; /** * @author Frazer Smith * @description Saves images from a PDF file as PPM, PBM, PNG, TIFF, JPEG, JPEG2000, or JBIG2 files. * @param {Buffer|string} file - PDF file as Buffer, or filepath of the PDF file to read. * @param {string} [outputPrefix] - Filename prefix of output files. * @param {object} [options] - Object containing options to pass to binary. * @param {boolean} [options.allFiles] - Write JPEG, JPEG2000, JBIG2, and CCITT images in their native format. * CMYK files are written as TIFF files. All other images are written as PNG files. * @param {boolean} [options.ccittFile] - Generate CCITT images as CCITT files. * @param {number} [options.firstPageToConvert] - Specifies the first page to convert. * @param {number} [options.lastPageToConvert] - Specifies the last page to convert. * @param {boolean} [options.jbig2File] - Generate JBIG2 images as JBIG2 files. * @param {boolean} [options.jpeg2000File] - Generate JPEG2000 images at JP2 files. * @param {boolean} [options.jpegFile] - Generate JPEG images as JPEG files. * @param {boolean} [options.list] - Instead of writing the images, list the * images along with various information for each image. * NOTE: Do not specify the outputPrefix with this option. 
* @param {string} [options.ownerPassword] - Owner password (for encrypted files). * @param {boolean} [options.pngFile] - Change the default output format to PNG. * @param {boolean} [options.printVersionInfo] - Print copyright and version info. * @param {boolean} [options.tiffFile] - Change the default output format to TIFF. * @param {string} [options.userPassword] - Specify the user password for the PDF file. * @returns {Promise<string>} A promise that resolves with a stdout string, or rejects with an `Error` object. */ pdfImages(file: Buffer | string, outputPrefix?: string, options?: { allFiles?: boolean; ccittFile?: boolean; firstPageToConvert?: number; lastPageToConvert?: number; jbig2File?: boolean; jpeg2000File?: boolean; jpegFile?: boolean; list?: boolean; ownerPassword?: string; pngFile?: boolean; printVersionInfo?: boolean; tiffFile?: boolean; userPassword?: string; }): Promise<string>; /** * @author Frazer Smith * @description Prints the contents of the `Info` dictionary from a PDF file. * @param {Buffer|string} file - PDF file as Buffer, or filepath of the PDF file to read. * @param {object} [options] - Object containing options to pass to binary. * @param {number} [options.firstPageToConvert] - First page to print. * @param {number} [options.lastPageToConvert] - Last page to print. * @param {boolean} [options.listEncodingOptions] - List the available encodings. * @param {string} [options.outputEncoding] - Sets the encoding to use for text output. * This defaults to `UTF-8`. * @param {string} [options.ownerPassword] - Owner password (for encrypted files). * @param {boolean} [options.printAsJson] - Print result as a JSON object. * @param {boolean} [options.printBoundingBoxes] - Prints the page box bounding boxes: * MediaBox, CropBox, BleedBox, TrimBox, and ArtBox. * @param {boolean} [options.printDocStruct] - Prints the logical document structure * of a Tagged-PDF file. 
* @param {boolean} [options.printDocStructText] - Print the textual content along with the * document structure of a Tagged-PDF file. Note that extracting text this way might be slow * for big PDF files. * @param {boolean} [options.printIsoDates] - Prints dates in ISO-8601 format (including the time zone). * @param {boolean} [options.printJS] - Prints all JavaScript in the PDF file. * @param {boolean} [options.printMetadata] - Prints document-level metadata. (This is the `Metadata` * stream from the PDF file's Catalog object). * @param {boolean} [options.printNamedDests] - Print a list of all named destinations. If a page range * is specified using the `options.firstPageToConvert` and `options.lastPageToConvert` options, only destinations * in the page range are listed. * @param {boolean} [options.printRawDates] - Prints the raw (undecoded) date strings, directly from the PDF file. * @param {boolean} [options.printUrls] - Print all URLs in the PDF; only URLs referenced by PDF objects * such as Link Annotations are listed, not URL strings in the text content. * @param {boolean} [options.printVersionInfo] - Print copyright and version info. * @param {string} [options.userPassword] - User password (for encrypted files). * @returns {Promise<object|string>} A promise that resolves with a stdout string or JSON object if * `options.printAsJson` is `true`, or rejects with an `Error` object. 
*/ pdfInfo(file: Buffer | string, options?: { firstPageToConvert?: number; lastPageToConvert?: number; listEncodingOptions?: boolean; outputEncoding?: string; ownerPassword?: string; printAsJson?: boolean; printBoundingBoxes?: boolean; printDocStruct?: boolean; printDocStructText?: boolean; printIsoDates?: boolean; printJS?: boolean; printMetadata?: boolean; printNamedDests?: boolean; printRawDates?: boolean; printUrls?: boolean; printVersionInfo?: boolean; userPassword?: string; }): Promise<object | string>; /** * @author Frazer Smith * @description Extracts single pages from a PDF file, * and writes one PDF file for each page to outputPattern. * This will not work if the file is encrypted. * @param {string} file - Filepath of the PDF file to read. * @param {string} outputPattern - Should contain %d (or any variant respecting printf format), * since %d is replaced by the page number. * As an example, `sample-%d.pdf` will produce `sample-1.pdf` for a single page document. * @param {object} [options] - Object containing options to pass to binary. * @param {number} [options.firstPageToExtract] - Specifies the first page to extract. * This defaults to page 1. * @param {number} [options.lastPageToExtract] - Specifies the last page to extract. * This defaults to the last page of the PDF file. * @param {boolean} [options.printVersionInfo] - Print copyright and version info. * @returns {Promise<string>} A promise that resolves with a stdout string, or rejects with an `Error` object. */ pdfSeparate(file: string, outputPattern: string, options?: { firstPageToExtract?: number; lastPageToExtract?: number; printVersionInfo?: boolean; }): Promise<string>; /** * @author Frazer Smith * @description Converts a PDF file to EPS/JPEG/PDF/PNG/PS/SVG/TIFF. * @param {Buffer|string} file - PDF file as Buffer, or filepath of the PDF file to read. * @param {string} [outputFile] - Filepath of the file to output the results to. * * If `undefined` then will write output to stdout. 
Using stdout is not valid with image formats * (jpeg, png, and tiff) unless `options.singleFile` is set to `true`. * Encoding is set to `binary` if used with `options.singleFile` or `options.pdfFile`. * * If not set then the output filename will be derived from the PDF file name. * @param {object} [options] - Object containing options to pass to binary. * @param {('best'|'default'|'fast'|'good'|'gray'|'none'|'subpixel')} [options.antialias] - Set the cairo * antialias option used for text and drawing in image files (or rasterized regions in vector output). * @param {boolean} [options.cropBox] - Uses the crop box rather than media box when * generating the files (PNG/JPEG/TIFF only). * @param {number} [options.cropHeight] - Specifies the height of crop area in pixels * (image output) or points (vector output). * @param {number} [options.cropSize] - Specifies the size of crop square in pixels * (image output) or points (vector output). * @param {number} [options.cropWidth] - Specifies the width of crop area in pixels * (image output) or points (vector output). * @param {number} [options.cropXAxis] - Specifies the x-coordinate of the crop area top left * corner in pixels (image output) or points (vector output). * @param {number} [options.cropYAxis] - Specifies the y-coordinate of the crop area top left * corner in pixels (image output) or points (vector output). * @param {boolean} [options.duplex] - Adds the %%IncludeFeature: *Duplex DuplexNoTumble DSC * comment to the PostScript file (PS only). This tells the print manager to enable duplexing. * @param {boolean} [options.epsFile] - Generate an EPS file. An EPS file contains a single image, * so if you use this option with a multi-page PDF file, you must use `options.firstPageToConvert` and * `options.lastPageToConvert` to specify a single page. * The page size options (originalPageSizes, paperSize, paperWidth, paperHeight) can not be used * with this option. 
* @param {boolean} [options.evenPagesOnly] - Generates only the even numbered pages. * @param {boolean} [options.fillPage] - Expand PDF pages smaller than the paper to fill the * paper (PS,PDF,SVG only). By default, these pages are not scaled. * @param {number} [options.firstPageToConvert] - Specifies the first page to convert. * @param {boolean} [options.grayscaleFile] - Generate grayscale file (PNG, JPEG, and TIFF only). * @param {string} [options.iccFile] - Use the specified ICC file as the output profile * (PNG only). The profile will be embedded in the PNG file. * @param {boolean} [options.jpegFile] - Generate JPEG file(s). * @param {string} [options.jpegOptions] - When used with `options.jpegFile`, this option can * be used to control the JPEG compression parameters. It takes a string of the form * `"<opt>=<val>[,<opt>=<val>]"`. Currently available options are: * - `quality` Selects the JPEG quality value. The value must be an integer between 0 and 100. * - `progressive` Select progressive JPEG output. The possible values are "y", "n", indicating * progressive (yes) or non-progressive (no), respectively. * - `optimize` Sets whether to compute optimal Huffman coding tables for the JPEG output, which * will create smaller files but make an extra pass over the data. The value must be "y" or "n", * with "y" performing optimization, otherwise the default Huffman tables are used. * * Example: `"quality=95,optimize=y"`. * @param {number} [options.lastPageToConvert] - Specifies the last page to convert. * @param {boolean} [options.monochromeFile] - Generate monochrome file (PNG and TIFF only). * @param {boolean} [options.noCenter] - By default, PDF pages smaller than the paper * (after any scaling) are centered on the paper. This option causes them to be aligned to * the lower-left corner of the paper instead (PS,PDF,SVG only). * @param {boolean} [options.noCrop] - By default, printing output is cropped to the CropBox * specified in the PDF file. 
This option disables cropping (PS, PDF, SVG only). * @param {boolean} [options.noShrink] - Do not scale PDF pages which are larger than the paper * (PS,PDF,SVG only). By default, pages larger than the paper are shrunk to fit. * @param {boolean} [options.oddPagesOnly] - Generates only the odd numbered pages. * @param {boolean} [options.originalPageSizes] - Set the paper size of each page to match * the size specified in the PDF file. * @param {string} [options.ownerPassword] - Specify the owner password for the PDF file. * Providing this will bypass all security restrictions. * @param {number} [options.paperHeight] - Set the paper height, in points (PS, PDF, SVG only). * @param {('A3'|'A4'|'legal'|'letter'|'match')} [options.paperSize] - Set the paper size to one of `A3`, `A4`, * `legal`, or `letter` (PS,PDF,SVG only). This can also be set to `match`, which will set the paper size * of each page to match the size specified in the PDF file. If none of the paperSize, * paperWidth, or paperHeight options are specified the default is to match the paper size. * @param {number} [options.paperWidth] - Set the paper width, in points (PS,PDF,SVG only). * @param {boolean} [options.pdfFile] - Generate PDF file. * @param {boolean} [options.pngFile] - Generate PNG file(s). * @param {boolean} [options.printVersionInfo] - Print copyright and version information. * @param {boolean} [options.printDocStruct] - If the input file contains structural information * about the document's content, write this information to the output file (PDF only). * @param {boolean} [options.psFile] - Generate PS file. * @param {boolean} [options.psLevel2] - Generate Level 2 PostScript (PS only). * @param {boolean} [options.psLevel3] - Generate Level 3 PostScript (PS only). This enables all * Level 2 features plus shading patterns and masked images. This is the default setting. * @param {boolean} [options.quiet] - Do not print any messages or errors. 
* @param {number} [options.resolutionXAxis] - Specifies the X resolution, in pixels per inch of * image files (or rasterized regions in vector output). The default is 150 PPI. * @param {number} [options.resolutionXYAxis] - Specifies the X and Y resolution, in pixels per * inch of image files (or rasterized regions in vector output). The default is 150 PPI. * @param {number} [options.resolutionYAxis] - Specifies the Y resolution, in pixels per inch of * image files (or rasterized regions in vector output). The default is 150 PPI. * @param {number} [options.scalePageTo] - Scales the long side of each page (width for landscape * pages, height for portrait pages) to fit in scale-to pixels. The size of the short side will * be determined by the aspect ratio of the page (PNG/JPEG/TIFF only). * @param {number} [options.scalePageToXAxis] - Scales each page horizontally to fit in scale-to-x * pixels. If scale-to-y is set to -1, the vertical size will be determined by the aspect ratio of * the page (PNG/JPEG/TIFF only). * @param {number} [options.scalePageToYAxis] - Scales each page vertically to fit in scale-to-y * pixels. If scale-to-x is set to -1, the horizontal size will be determined by the aspect ratio of * the page (PNG/JPEG/TIFF only). * @param {boolean} [options.singleFile] - Writes only the first page and does not add digits. * Can only be used with `options.jpegFile`, `options.pngFile`, and `options.tiffFile`. * @param {boolean} [options.svgFile] - Generate SVG (Scalable Vector Graphics) file. * @param {('deflate'|'jpeg'|'lzw'|'none'|'packbits')} [options.tiffCompression] - Set TIFF compression. * @param {boolean} [options.tiffFile] - Generate TIFF file(s). * @param {boolean} [options.transparentPageColor] - Use a transparent page color * instead of white (PNG and TIFF only). * @param {string} [options.userPassword] - Specify the user password for the PDF file. * @returns {Promise<string>} A promise that resolves with a stdout string, or rejects with an `Error` object. 
*/ pdfToCairo(file: Buffer | string, outputFile?: string, options?: { antialias?: ("best" | "default" | "fast" | "good" | "gray" | "none" | "subpixel"); cropBox?: boolean; cropHeight?: number; cropSize?: number; cropWidth?: number; cropXAxis?: number; cropYAxis?: number; duplex?: boolean; epsFile?: boolean; evenPagesOnly?: boolean; fillPage?: boolean; firstPageToConvert?: number; grayscaleFile?: boolean; iccFile?: string; jpegFile?: boolean; jpegOptions?: string; lastPageToConvert?: number; monochromeFile?: boolean; noCenter?: boolean; noCrop?: boolean; noShrink?: boolean; oddPagesOnly?: boolean; originalPageSizes?: boolean; ownerPassword?: string; paperHeight?: number; paperSize?: ("A3" | "A4" | "legal" | "letter" | "match"); paperWidth?: number; pdfFile?: boolean; pngFile?: boolean; printVersionInfo?: boolean; printDocStruct?: boolean; psFile?: boolean; psLevel2?: boolean; psLevel3?: boolean; quiet?: boolean; resolutionXAxis?: number; resolutionXYAxis?: number; resolutionYAxis?: number; scalePageTo?: number; scalePageToXAxis?: number; scalePageToYAxis?: number; singleFile?: boolean; svgFile?: boolean; tiffCompression?: ("deflate" | "jpeg" | "lzw" | "none" | "packbits"); tiffFile?: boolean; transparentPageColor?: boolean; userPassword?: string; }): Promise<string>; /** * @author Frazer Smith * @description Converts a PDF file to HTML. * @param {Buffer|string} file - PDF file as Buffer, or filepath of the PDF file to read. * @param {string} [outputFile] - Filepath of the file to output the results to. * If `undefined` then Poppler will use the directory and name of the original file * and create a new file, with `-html` appended to the end of the filename. * * Required if `file` is a Buffer. * @param {object} [options] - Object containing options to pass to binary. * @param {boolean} [options.complexOutput] - Generate complex output. * @param {boolean} [options.dataUrls] - Use data URLs instead of external images in HTML. 
* @param {boolean} [options.exchangePdfLinks] - Exchange .pdf links with .html. * @param {boolean} [options.extractHidden] - Force hidden text extraction. * @param {number} [options.firstPageToConvert] - First page to print. * @param {boolean} [options.fontFullName] - Outputs the font name without any substitutions. * @param {boolean} [options.ignoreImages] - Ignore images. * @param {('JPG'|'PNG')} [options.imageFormat] - Image file format for Splash output (JPG or PNG). * If complexOutput is selected, but imageFormat is not specified, PNG will be assumed. * @param {number} [options.lastPageToConvert] - Last page to print. * @param {boolean} [options.noDrm] - Override document DRM settings. * @param {boolean} [options.noFrames] - Generate no frames. Not supported in complex output mode. * @param {boolean} [options.noMergeParagraph] - Do not merge paragraphs. * @param {boolean} [options.noRoundedCoordinates] - Do not round coordinates * (with XML output only). * @param {string} [options.outputEncoding] - Sets the encoding to use for text output. * This defaults to `UTF-8`. * @param {string} [options.ownerPassword] - Owner password (for encrypted files). * @param {boolean} [options.printVersionInfo] - Print copyright and version info. * @param {boolean} [options.quiet] - Do not print any messages or errors. * @param {boolean} [options.singlePage] - Generate single HTML that includes all pages. * @param {boolean} [options.stdout] - Use standard output. * @param {string} [options.userPassword] - User password (for encrypted files). * @param {number} [options.wordBreakThreshold] - Adjust the word break threshold percent. * Default is 10. Word break occurs when distance between two adjacent characters is greater * than this percent of character height. * @param {boolean} [options.xmlOutput] - Output for XML post-processing. * @param {number} [options.zoom] - Zoom the PDF document (default 1.5). 
* @returns {Promise<string>} A promise that resolves with a stdout string, or rejects with an `Error` object. */ pdfToHtml(file: Buffer | string, outputFile?: string, options?: { complexOutput?: boolean; dataUrls?: boolean; exchangePdfLinks?: boolean; extractHidden?: boolean; firstPageToConvert?: number; fontFullName?: boolean; ignoreImages?: boolean; imageFormat?: ("JPG" | "PNG"); lastPageToConvert?: number; noDrm?: boolean; noFrames?: boolean; noMergeParagraph?: boolean; noRoundedCoordinates?: boolean; outputEncoding?: string; ownerPassword?: string; printVersionInfo?: boolean; quiet?: boolean; singlePage?: boolean; stdout?: boolean; userPassword?: string; wordBreakThreshold?: number; xmlOutput?: boolean; zoom?: number; }): Promise<string>; /** * @author Frazer Smith * @description Converts a PDF file to colour image files in Portable Pixmap (PPM) format, * grayscale image files in Portable Graymap (PGM) format, or monochrome image files * in Portable Bitmap (PBM) format. * @param {Buffer|string} file - PDF file as Buffer, or filepath of the PDF file to read. * @param {string} outputPath - Filepath to output the results to. * @param {object} [options] - Object containing options to pass to binary. * @param {('no'|'yes')} [options.antialiasFonts] - Enable or disable font anti-aliasing. * This defaults to `yes`. * @param {('no'|'yes')} [options.antialiasVectors] - Enable or disable vector anti-aliasing. * This defaults to `yes`. * @param {boolean} [options.cropBox] - Uses the crop box rather than media box when * generating the files (PNG/JPEG/TIFF only). * @param {number} [options.cropHeight] - Specifies the height of crop area in pixels * (image output) or points (vector output). * @param {number} [options.cropSize] - Specifies the size of crop square in pixels * (image output) or points (vector output). * @param {number} [options.cropWidth] - Specifies the width of crop area in pixels * (image output) or points (vector output). 
* @param {number} [options.cropXAxis] - Specifies the x-coordinate of the crop area top left * corner in pixels (image output) or points (vector output). * @param {number} [options.cropYAxis] - Specifies the y-coordinate of the crop area top left * corner in pixels (image output) or points (vector output). * @param {string} [options.defaultCmykProfile] - If Poppler is compiled with colour management support, this option * sets the DefaultCMYK color space to the ICC profile stored in the display profile file passed. * @param {string} [options.defaultGrayProfile] - If Poppler is compiled with colour management support, this option * sets the DefaultGray color space to the ICC profile stored in the display profile file passed. * @param {string} [options.defaultRgbProfile] - If Poppler is compiled with colour management support, this option * sets the DefaultRGB color space to the ICC profile stored in the display profile file passed. * @param {string} [options.displayProfile] - If Poppler is compiled with colour management support, this option * sets the display profile to the ICC profile stored in the display profile file passed. * @param {boolean} [options.evenPagesOnly] - Generates only the even numbered pages. * @param {number} [options.firstPageToConvert] - Specifies the first page to convert. * @param {('no'|'yes')} [options.freetype] - Enable or disable FreeType (a TrueType / Type 1 font rasterizer). * This defaults to `yes`. * @param {boolean} [options.forcePageNumber] - Force page number even if there is only one page. * @param {boolean} [options.grayscaleFile] - Generate grayscale PGM file (instead of a color PPM file). * @param {boolean} [options.hideAnnotations] - Hide annotations. * @param {boolean} [options.jpegFile] - Generate JPEG file instead of a PPM file. * @param {number} [options.lastPageToConvert] - Specifies the last page to convert. * @param {boolean} [options.monochromeFile] - Generate monochrome PBM file (instead of a color PPM file). 
* @param {boolean} [options.oddPagesOnly] - Generates only the odd numbered pages. * @param {string} [options.ownerPassword] - Specify the owner password for the PDF file. * Providing this will bypass all security restrictions. * @param {boolean} [options.pngFile] - Generate PNG file instead of a PPM file. * @param {boolean} [options.printProgress] - Print progress info as each page is generated. * Three space-separated fields are printed to STDERR: the number of the current page, the number * of the last page that will be generated, and the path to the file written to. * @param {boolean} [options.printVersionInfo] - Print copyright and version information. * @param {boolean} [options.quiet] - Do not print any messages or errors. * @param {number} [options.resolutionXAxis] - Specifies the X resolution, in pixels per inch of * image files (or rasterized regions in vector output). The default is 150 PPI. * @param {number} [options.resolutionXYAxis] - Specifies the X and Y resolution, in pixels per * inch of image files (or rasterized regions in vector output). The default is 150 PPI. * @param {number} [options.resolutionYAxis] - Specifies the Y resolution, in pixels per inch of * image files (or rasterized regions in vector output). The default is 150 PPI. * @param {number} [options.scalePageTo] - Scales the long side of each page (width for landscape * pages, height for portrait pages) to fit in scale-to pixels. The size of the short side will * be determined by the aspect ratio of the page. * @param {number} [options.scalePageToXAxis] - Scales each page horizontally to fit in scale-to-x * pixels. If scale-to-y is set to -1, the vertical size will be determined by the aspect ratio of * the page. * @param {number} [options.scalePageToYAxis] - Scales each page vertically to fit in scale-to-y * pixels. If scale-to-x is set to -1, the horizontal size will be determined by the aspect ratio of * the page. 
* @param {string} [options.separator] - Specify single character separator between name and page number.
     * @param {boolean} [options.singleFile] - Writes only the first page and does not add digits.
     * @param {('none'|'shape'|'solid')} [options.thinLineMode] - Specifies the thin line mode. This defaults to `none`.
     * @param {('deflate'|'jpeg'|'lzw'|'none'|'packbits')} [options.tiffCompression] - Set TIFF compression.
     * @param {boolean} [options.tiffFile] - Generate TIFF file instead a PPM file.
     * @param {string} [options.userPassword] - Specify the user password for the PDF file.
     * @returns {Promise<string>} A promise that resolves with a stdout string, or rejects with an `Error` object.
     */
    pdfToPpm(file: Buffer | string, outputPath: string, options?: {
        antialiasFonts?: ("no" | "yes");
        antialiasVectors?: ("no" | "yes");
        cropBox?: boolean;
        cropHeight?: number;
        cropSize?: number;
        cropWidth?: number;
        cropXAxis?: number;
        cropYAxis?: number;
        defaultCmykProfile?: string;
        defaultGrayProfile?: string;
        defaultRgbProfile?: string;
        displayProfile?: string;
        evenPagesOnly?: boolean;
        firstPageToConvert?: number;
        freetype?: ("no" | "yes");
        forcePageNumber?: boolean;
        grayscaleFile?: boolean;
        hideAnnotations?: boolean;
        jpegFile?: boolean;
        lastPageToConvert?: number;
        monochromeFile?: boolean;
        oddPagesOnly?: boolean;
        ownerPassword?: string;
        pngFile?: boolean;
        printProgress?: boolean;
        printVersionInfo?: boolean;
        quiet?: boolean;
        resolutionXAxis?: number;
        resolutionXYAxis?: number;
        resolutionYAxis?: number;
        scalePageTo?: number;
        scalePageToXAxis?: number;
        scalePageToYAxis?: number;
        separator?: string;
        singleFile?: boolean;
        thinLineMode?: ("none" | "shape" | "solid");
        tiffCompression?: ("deflate" | "jpeg" | "lzw" | "none" | "packbits");
        tiffFile?: boolean;
        userPassword?: string;
    }): Promise<string>;
    /**
     * @author Frazer Smith
     * @description Converts a PDF file to PostScript (PS).
     * @param {Buffer|string} file - PDF file as Buffer, or filepath of the PDF file to read.
     * @param {string} [outputFile] - Filepath of the file to output the results to.
     * If `undefined` then will write output to stdout.
     * @param {object} [options] - Object containing options to pass to binary.
     * @param {('no'|'yes')} [options.antialias] - Enable anti-aliasing on rasterization, accepts `no` or `yes`.
     * @param {boolean} [options.binary] - Write binary data in Level 1 PostScript. By default,
     * pdftops writes hex-encoded data in Level 1 PostScript. Binary data is non-standard in Level 1
     * PostScript but reduces the file size and can be useful when Level 1 PostScript is required
     * only for its restricted use of PostScript operators.
     * @param {string} [options.defaultCmykProfile] - If Poppler is compiled with colour management support, this option
     * sets the DefaultCMYK color space to the ICC profile stored in the display profile file passed.
     * @param {string} [options.defaultGrayProfile] - If Poppler is compiled with colour management support, this option
     * sets the DefaultGray color space to the ICC profile stored in the display profile file passed.
     * @param {string} [options.defaultRgbProfile] - If Poppler is compiled with colour management support, this option
     * sets the DefaultRGB color space to the ICC profile stored in the display profile file passed.
     * @param {boolean} [options.duplex] - Set the Duplex pagedevice entry in the PostScript file.
     * This tells duplex-capable printers to enable duplexing.
     * @param {boolean} [options.epsFile] - Generate an EPS file. An EPS file contains a single image,
     * so if you use this option with a multi-page PDF file, you must use `options.firstPageToConvert` and
     * `options.lastPageToConvert` to specify a single page.
     * The page size options (originalPageSizes, paperSize, paperWidth, paperHeight) cannot be used
     * with this option.
     * @param {boolean} [options.fillPage] - Expand PDF pages smaller than the paper to fill the
     * paper. By default, these pages are not scaled.
     * @param {number} [options.firstPageToConvert] - Specifies the first page to convert.
     * @param {number} [options.form] - Generate PostScript form which can be imported by software
     * that understands forms.
     * A form contains a single page, so if you use this option with a multi-page PDF file,
     * you must use `options.firstPageToConvert` and `options.lastPageToConvert` to specify a single page.
     * The `options.level1` option cannot be used with `options.form`.
     * No more than one of the mode options (`options.epsFile`, `options.form`) may be given.
     * NOTE(review): this is documented as a mode switch alongside the boolean `options.epsFile`,
     * yet it is typed as `number` here; confirm the intended type against the implementation.
     * @param {number} [options.lastPageToConvert] - Specifies the last page to convert.
     * @param {boolean} [options.level1] - Generate Level 1 PostScript. The resulting PostScript
     * files will be significantly larger (if they contain images), but will print on Level 1 printers.
     * This also converts all images to black and white.
     * @param {boolean} [options.level1Sep] - Generate Level 1 separable PostScript.
     * All colors are converted to CMYK. Images are written with separate stream data for the four components.
     * @param {boolean} [options.level2] - Generate Level 2 PostScript.
     * Level 2 supports color images and image compression. This is the default setting.
     * @param {boolean} [options.level2Sep] - Generate Level 2 separable PostScript. All colors are
     * converted to CMYK. The PostScript separation convention operators are used to handle custom (spot) colors.
     * @param {boolean} [options.level3] - Generate Level 3 PostScript.
     * This enables all Level 2 features plus CID font embedding.
     * @param {boolean} [options.level3Sep] - Generate Level 3 separable PostScript.
     * The separation handling is the same as for `options.level2Sep`.
     * @param {boolean} [options.noCenter] - By default, PDF pages smaller than the paper
     * (after any scaling) are centered on the paper. This option causes them to be aligned to
     * the lower-left corner of the paper instead.
     * @param {boolean} [options.noCrop] - By default, printing output is cropped to the CropBox
     * specified in the PDF file. This option disables cropping.
     * @param {boolean} [options.noEmbedCIDFonts] - By default, any CID PostScript fonts which are
     * embedded in the PDF file are copied into the PostScript file. This option disables that embedding.
     * No attempt is made to substitute for non-embedded CID PostScript fonts.
     * @param {boolean} [options.noEmbedCIDTrueTypeFonts] - By default, any CID TrueType fonts which are
     * embedded in the PDF file are copied into the PostScript file. This option disables that embedding.
     * No attempt is made to substitute for non-embedded CID TrueType fonts.
     * @param {boolean} [options.noEmbedTrueTypeFonts] - By default, any TrueType fonts which are embedded
     * in the PDF file are copied into the PostScript file. This option causes pdfToPs to substitute base fonts instead.
     * Embedded fonts make PostScript files larger, but may be necessary for readable output.
     * Also, some PostScript interpreters do not have TrueType rasterizers.
     * @param {boolean} [options.noEmbedType1Fonts] - By default, any Type 1 fonts which are embedded in the PDF file
     * are copied into the PostScript file. This option causes pdfToPs to substitute base fonts instead.
     * Embedded fonts make PostScript files larger, but may be necessary for readable output.
     * @param {boolean} [options.noShrink] - Do not scale PDF pages which are larger than the paper.
     * By default, pages larger than the paper are shrunk to fit.
     * @param {boolean} [options.opi] - Generate OPI comments for all images and forms which have OPI information.
     * @param {boolean} [options.optimizecolorspace] - By default, bitmap images in the PDF pass through to the
     * output PostScript in their original color space, which produces predictable results.
     * This option converts RGB and CMYK images into Gray images if every pixel of the image has equal components.
     * This can fix problems when doing color separations of PDFs that contain embedded black and
     * white images encoded as RGB.
     * @param {boolean} [options.originalPageSizes] - Set the paper size of each page to match
     * the size specified in the PDF file.
     * @param {boolean} [options.overprint] - Enable overprinting.
     * @param {string} [options.ownerPassword] - Owner password (for encrypted files).
     * @param {number} [options.paperHeight] - Set the paper height, in points.
     * @param {('A3'|'A4'|'legal'|'letter'|'match')} [options.paperSize] - Set the paper size to one of `A3`, `A4`,
     * `legal`, or `letter`. This can also be set to `match`, which will set the paper size
     * of each page to match the size specified in the PDF file. If none of the paperSize,
     * paperWidth, or paperHeight options are specified the default is to match the paper size.
     * @param {number} [options.paperWidth] - Set the paper width, in points.
     * @param {boolean} [options.passfonts] - By default, references to non-embedded 8-bit fonts
     * in the PDF file are substituted with the closest `Helvetica`, `Times-Roman`, or `Courier` font.
     * This option passes references to non-embedded fonts through to the PostScript file.
     * @param {boolean} [options.preload] - Preload images and forms.
     * @param {boolean} [options.printVersionInfo] - Print copyright and version information.
     * @param {('CMYK8'|'MONO8'|'RGB8')} [options.processColorFormat] - Sets the process color format as it is used
     * during rasterization and transparency reduction.
     *
     * The default depends on the other settings: For `options.level1` the default is MONO8; for `options.level1Sep`,
     * `options.level2Sep`, `options.level3Sep`, or `options.overprint` the default is CMYK8; in all other
     * cases RGB8 is the default.
     * If `options.processColorProfile` is set then `options.processColorFormat` is inferred from the specified ICC profile.
     * @param {string} [options.processColorProfile] - Sets the ICC profile that is assumed during
     * rasterization and transparency reduction.
     * @param {boolean} [options.quiet] - Do not print any messages or errors.
     * @param {('always'|'never'|'whenneeded')} [options.rasterize] - By default, pdfToPs rasterizes pages as needed,
     * for example, if they contain transparencies. To force rasterization, set `rasterize` to `always`.
     * Use this to eliminate fonts.
     * To prevent rasterization, set `rasterize` to `never`.
     * This may produce files that display incorrectly.
     * @param {number} [options.resolutionXYAxis] - Specifies the X and Y resolution, in pixels per
     * inch of image files (or rasterized regions in vector output). The default is 300 PPI.
     * @param {string} [options.userPassword] - User password (for encrypted files).
     * @returns {Promise<string>} A promise that resolves with a stdout string, or rejects with an `Error` object.
     */
    pdfToPs(file: Buffer | string, outputFile?: string, options?: {
        antialias?: ("no" | "yes");
        binary?: boolean;
        defaultCmykProfile?: string;
        defaultGrayProfile?: string;
        defaultRgbProfile?: string;
        duplex?: boolean;
        epsFile?: boolean;
        fillPage?: boolean;
        firstPageToConvert?: number;
        form?: number;
        lastPageToConvert?: number;
        level1?: boolean;
        level1Sep?: boolean;
        level2?: boolean;
        level2Sep?: boolean;
        level3?: boolean;
        level3Sep?: boolean;
        noCenter?: boolean;
        noCrop?: boolean;
        noEmbedCIDFonts?: boolean;
        noEmbedCIDTrueTypeFonts?: boolean;
        noEmbedTrueTypeFonts?: boolean;
        noEmbedType1Fonts?: boolean;
        noShrink?: boolean;
        opi?: boolean;
        optimizecolorspace?: boolean;
        originalPageSizes?: boolean;
        overprint?: boolean;
        ownerPassword?: string;
        paperHeight?: number;
        paperSize?: ("A3" | "A4" | "legal" | "letter" | "match");
        paperWidth?: number;
        passfonts?: boolean;
        preload?: boolean;
        printVersionInfo?: boolean;
        processColorFormat?: ("CMYK8" | "MONO8" | "RGB8");
        processColorProfile?: string;
        quiet?: boolean;
        rasterize?: ("always" | "never" | "whenneeded");
        resolutionXYAxis?: number;
        userPassword?: string;
    }): Promise<string>;
    /**
     * @author Frazer Smith
     * @description Converts a PDF file to TXT.
     * @param {Buffer|string} file - PDF file as Buffer, or filepath of the PDF file to read.
     * @param {string} [outputFile] - Filepath of the file to output the results to.
     * If `undefined` then will write output to stdout.
     * @param {object} [options] - Object containing options to pass to binary.
     * @param {boolean} [options.boundingBoxXhtml] - Generate an XHTML file containing bounding
     * box information for each word in the file.
     * @param {boolean} [options.boundingBoxXhtmlLayout] - Generate an XHTML file containing
     * bounding box information for each block, line, and word in the file.
     * @param {boolean} [options.cropBox] - Use the crop box rather than the media box with
     * `options.boundingBoxXhtml` and `options.boundingBoxXhtmlLayout`.
     * @param {number} [options.cropHeight] - Specifies the height of crop area in pixels
     * (image output) or points (vector output).
     * @param {number} [options.cropWidth] - Specifies the width of crop area in pixels
     * (image output) or points (vector output).
     * @param {number} [options.cropXAxis] - Specifies the x-coordinate of the crop area top left
     * corner in pixels (image output) or points (vector output).
     * @param {number} [options.cropYAxis] - Specifies the y-coordinate of the crop area top left
     * corner in pixels (image output) or points (vector output).
     * @param {('dos'|'mac'|'unix')} [options.eolConvention] - Sets the end-of-line convention to use for
     * text output: dos; mac; unix.
     * @param {number} [options.firstPageToConvert] - Specifies the first page to convert.
     * @param {number} [options.fixedWidthLayout] - Assume fixed-pitch (or tabular) text, with the
     * specified character width (in points). This forces physical layout mode.
     * @param {boolean} [options.generateHtmlMetaFile] - Generate simple HTML file, including the
     * meta information. This simply wraps the text in `<pre>` and `</pre>` and prepends the meta headers.
     * @param {boolean} [options.generateTsvFile] - Generate a TSV file containing the bounding box
     * information for each block, line, and word in the file.
     * @param {number} [options.lastPageToConvert] - Specifies the last page to convert.
     * @param {boolean} [options.listEncodingOptions] - List the available encodings.
     * @param {boolean} [options.maintainLayout] - Maintain (as best as possible) the original physical
     * layout of the text. The default is to undo physical layout (columns, hyphenation, etc.) and
     * output the text in reading order.
     * @param {boolean} [options.noDiagonalText] - Discard diagonal text.
     * @param {boolean} [options.noPageBreaks] - Do not insert page breaks (form feed characters)
     * between pages.
     * @param {string} [options.outputEncoding] - Sets the encoding to use for text output.
     * This defaults to `UTF-8`.
     * @param {string} [options.ownerPassword] - Owner password (for encrypted files).
     * @param {boolean} [options.printVersionInfo] - Print copyright and version information.
     * @param {boolean} [options.quiet] - Do not print any messages or errors.
     * @param {boolean} [options.rawLayout] - Keep the text in content stream order. This is a
     * hack which often undoes column formatting, etc. Use of raw mode is no longer recommended.
     * @param {string} [options.userPassword] - User password (for encrypted files).
     * @returns {Promise<string>} A promise that resolves with a stdout string, or rejects with an `Error` object.
     */
    pdfToText(file: Buffer | string, outputFile?: string, options?: {
        boundingBoxXhtml?: boolean;
        boundingBoxXhtmlLayout?: boolean;
        cropBox?: boolean;
        cropHeight?: number;
        cropWidth?: number;
        cropXAxis?: number;
        cropYAxis?: number;
        eolConvention?: ("dos" | "mac" | "unix");
        firstPageToConvert?: number;
        fixedWidthLayout?: number;
        generateHtmlMetaFile?: boolean;
        generateTsvFile?: boolean;
        lastPageToConvert?: number;
        listEncodingOptions?: boolean;
        maintainLayout?: boolean;
        noDiagonalText?: boolean;
        noPageBreaks?: boolean;
        outputEncoding?: string;
        ownerPassword?: string;
        printVersionInfo?: boolean;
        quiet?: boolean;
        rawLayout?: boolean;
        userPassword?: string;
    }): Promise<string>;
    /**
     * @author Frazer Smith
     * @description Merges several PDF files in order of their occurrence in the files array to
     * one PDF result file.
     * @param {string[]} files - Filepaths of the PDF files to merge.
     * An entire directory of PDF files can be merged like so: `path/to/directory/*.pdf`.
     * @param {string} outputFile - Filepath of the file to output the resulting merged PDF to.
     * @param {object} [options] - Object containing options to pass to binary.
     * @param {boolean} [options.printVersionInfo] - Print copyright and version information.
     * @returns {Promise<string>} A promise that resolves with a stdout string, or rejects with an `Error` object.
     */
    pdfUnite(files: string[], outputFile: string, options?: {
        printVersionInfo?: boolean;
    }): Promise<string>;
}