defuddle
Version:
Extract article content and metadata from web pages.
10 lines (9 loc) • 347 B
TypeScript
import { ExtractorResult } from '../types/extractors';
/**
 * Ambient declaration of the abstract base class for extractors.
 *
 * The class exposes three protected members (`document`, `url` and the
 * optional `schemaOrgData`), a constructor that accepts the same three
 * values, and two abstract methods that every concrete subclass must
 * implement: `canExtract()` and `extract()`.
 *
 * NOTE(review): only the type surface is visible in this declaration.
 * The constructor presumably stores its arguments on the same-named
 * fields — confirm against the implementation.
 */
export declare abstract class BaseExtractor {
    /** DOM `Document` made available to subclasses. */
    protected document: Document;

    /**
     * URL string made available to subclasses.
     * NOTE(review): presumably the address `document` was loaded from — confirm.
     */
    protected url: string;

    /**
     * Optional, untyped (`any`) payload.
     * NOTE(review): judging by the name this is schema.org structured data
     * for the page; its shape is not declared here, so narrow before use.
     */
    protected schemaOrgData?: any;

    /**
     * @param document - DOM document handed to the extractor.
     * @param url - URL string handed to the extractor.
     * @param schemaOrgData - Optional untyped data; may be omitted.
     */
    constructor(
        document: Document,
        url: string,
        schemaOrgData?: any,
    );

    /**
     * Must be implemented by subclasses.
     *
     * @returns A boolean. NOTE(review): presumably `true` when this extractor
     * is applicable to the current document/URL — inferred from the name.
     */
    abstract canExtract(): boolean;

    /**
     * Must be implemented by subclasses.
     *
     * @returns An `ExtractorResult` (type imported from `../types/extractors`).
     */
    abstract extract(): ExtractorResult;
}