UNPKG

article-parser

Version:

Extracts the main article from a given URL

32 lines (25 loc) 781 B
/**
 * Article parser
 * @ndaidong
 **/

import { isString } from 'bellajs'

import retrieve from './utils/retrieve.js'
import parseFromHtml from './utils/parseFromHtml.js'
import { isValid as isValidUrl } from './utils/linker.js'

/**
 * Entry point of the parser: accepts either a URL or a non-URL string and
 * hands the content to `parseFromHtml`.
 *
 * - When `input` passes `isValidUrl`, its content is fetched with `retrieve`
 *   and the fetched result is parsed with `input` as the second argument.
 * - Otherwise `input` itself is passed to `parseFromHtml` with `null` as the
 *   second argument (presumably it is treated as raw HTML - confirm against
 *   `parseFromHtml`).
 *
 * @param {string} input - a URL, or any other string to be parsed directly
 * @param {object} [parserOptions={}] - forwarded unchanged to `parseFromHtml`
 * @param {object} [fetchOptions={}] - forwarded unchanged to `retrieve`
 * @returns {Promise<*>} whatever `parseFromHtml` produces, or `null` when
 *   `retrieve` yields a falsy value for a URL input
 * @throws {Error} when `input` is not a string
 */
export const extract = async (input, parserOptions = {}, fetchOptions = {}) => {
  if (!isString(input)) {
    throw new Error('Input must be a string')
  }

  if (isValidUrl(input)) {
    // URL input: download first, and give up with null when nothing came back.
    const fetched = await retrieve(input, fetchOptions)
    return fetched ? parseFromHtml(fetched, input, parserOptions) : null
  }

  // Non-URL input: parse the string as given, with no source URL attached.
  return parseFromHtml(input, null, parserOptions)
}

export { addTransformations, removeTransformations } from './utils/transformation.js'

export { setSanitizeHtmlOptions, getSanitizeHtmlOptions } from './config.js'