textract
Version:
Extract text from files of various types, including html, pdf, doc, docx, xls, xlsx, csv, pptx, png, jpg, gif, rtf, text/*, and various OpenOffice formats.
87 lines (86 loc) • 1.74 kB
JSON
{
"name": "textract",
"version": "2.5.0",
"homepage": "https://github.com/dbashford/textract",
"author": "David Bashford",
"description": "Extracting text from files of various type including html, pdf, doc, docx, xls, xlsx, csv, pptx, png, jpg, gif, rtf, text/*, and various open office.",
"contributors": [
{
"name": "David Bashford",
"email": "dbashford@hotmail.com"
}
],
"repository": {
"type": "git",
"url": "https://github.com/dbashford/textract"
},
"keywords": [
"textract",
"extract",
"html",
"csv",
"text",
"pdf",
"docx",
"doc",
"xls",
"xlsx",
"png",
"jpg",
"gif",
"rtf",
"dxf",
"pptx",
"html",
"markdown",
"xml",
"odt",
"ott",
"xlsb",
"xlsm",
"xltx",
"ods",
"ots",
"potx",
"odg",
"otg",
"epub"
],
"dependencies": {
"mime": "2.2.0",
"pdf-text-extract": "1.3.1",
"xpath": "0.0.23",
"xmldom": "0.1.27",
"j": "0.4.3",
"cheerio": "1.0.0-rc.2",
"marked": "0.6.2",
"meow": "3.7.0",
"got": "5.7.1",
"html-entities": "1.2.0",
"iconv-lite": "0.4.15",
"jschardet": "1.4.1",
"yauzl": "2.7.0",
"epub2": "1.3.4"
},
"devDependencies": {
"chai": "1.5.0",
"eslint": "2.11.1",
"eslint-config-airbnb": "^9.0.1",
"eslint-plugin-react": "^5.1.1",
"eslint-plugin-jsx-a11y": "^1.2.0",
"eslint-plugin-import": "^1.7.0 ",
"mocha": "1.9.0"
},
"scripts": {
"test": "node_modules/.bin/mocha",
"lint": "node_modules/.bin/eslint -c .eslintrc.json lib"
},
"license": "MIT",
"engines": {
"node": ">=0.8"
},
"bin": {
"textract": "./bin/textract"
},
"main": "./lib/index"
}