parse-pdf
Version:
Get text content and metadata about pdf
24 lines (17 loc) • 603 B
JavaScript
import path from 'path'
import fs from 'fs'
import should from 'should'
import { parsePdf } from '../index.mjs'
import { fileURLToPath } from 'url';
const __filename = fileURLToPath(import.meta.url);
const __dirname = path.dirname(__filename);
const invoicePdfPath = path.join(__dirname, 'Invoice.pdf')
describe('parse-pdf', () => {
it('should parse pdf', async () => {
const f = fs.readFileSync(invoicePdfPath)
const parsed = await parsePdf(f)
should(parsed.pages[0].text).containEql('Invoice #: 123')
should(parsed.pages[0].text).containEql('Total: $300')
})
})