UNPKG

pdfreader

Version:

Read text and parse tables from PDF files. Supports tabular data with automatic column detection, and rule-based parsing.

35 lines (31 loc) 909 B
import { toggle } from "./lib/LOG.js";
import { PdfReader } from "./index.js";

// NOTE(review): presumably switches the library's own logging off so it does
// not interleave with the rows printed below — confirm in ./lib/LOG.js.
toggle(false);

/**
 * Prints every item that `PdfReader#parseFileItems` emits for a file.
 *
 * Output per item:
 *  - `item.file` -> `file = <item.file.path>` on stdout
 *  - `item.page` -> `page = <item.page>` on stdout
 *  - item with an `x` value -> one tab-separated row on stdout:
 *    x, y, oc, A, floor(w), text
 *  - anything else -> the raw item on stderr
 *
 * @param {string} filename - Passed unchanged to `parseFileItems`.
 * @param {function(*=): void} callback - Called with the error when the
 *   parser reports one, and with no arguments when the parser delivers a
 *   falsy item (presumably the end-of-input signal — confirm against
 *   PdfReader).
 */
function printRawItems(filename, callback) {
  new PdfReader().parseFileItems(filename, (err, item) => {
    if (err) {
      callback(err);
      return;
    }
    if (!item) {
      callback();
      return;
    }
    if (item.file) {
      console.log("file =", item.file.path);
      return;
    }
    if (item.page) {
      console.log("page =", item.page);
      return;
    }
    // Presence check rather than truthiness: an item located at x === 0 is
    // still a positioned item and must be printed as a row, not reported as
    // an unknown item.
    if (item.x != null) {
      const row = [
        item.x,
        item.y,
        item.oc,
        item.A,
        Math.floor(item.w),
        item.text,
      ];
      console.log(row.join("\t"));
      return;
    }
    console.warn(item);
  });
}

const filename = process.argv[2];
if (!filename) {
  console.error("please provide the name of a PDF file");
  // Report the usage error to the calling shell, consistent with the
  // non-zero exit used below when parsing fails.
  process.exitCode = 1;
} else {
  // Progress messages go to stderr so stdout carries only the item rows.
  console.warn("printing raw items from file:", filename, "...");
  printRawItems(filename, (err) => {
    if (err) {
      console.error(err);
      process.exit(1);
    }
    console.warn("done.");
  });
}