website-to-markdown-mcp
Version:
Advanced MCP server for fetching websites and converting to markdown with AI-powered features and stealth capabilities
48 lines • 1.35 kB
TypeScript
/**
 * Optional settings accepted as the third argument of
 * `ContentProcessor.processContent`.
 *
 * Every field is optional. This is a declaration file, so the defaults and the
 * exact effect of each flag are NOT visible here; the per-field notes below are
 * inferred from the field names only and should be confirmed against the
 * implementation.
 */
export interface ProcessingOptions {
/** Presumably toggles stripping of advertising elements - TODO confirm. */
removeAds?: boolean;
/** Presumably toggles stripping of navigation elements - TODO confirm. */
removeNavigation?: boolean;
/** Presumably toggles stripping of page footers - TODO confirm. */
removeFooter?: boolean;
/** Presumably toggles stripping of sidebars - TODO confirm. */
removeSidebar?: boolean;
/** Presumably toggles isolating the main article body from the page - TODO confirm. */
extractMainContent?: boolean;
/** Presumably controls whether images are kept in the output - TODO confirm. */
preserveImages?: boolean;
/** Presumably controls whether hyperlinks are kept in the output - TODO confirm. */
preserveLinks?: boolean;
/** Lower text-length bound; unit (characters vs. words) and what it applies to are not shown here - TODO confirm. */
minTextLength?: number;
/** Upper text-length bound; unit and truncate-vs-reject behavior are not shown here - TODO confirm. */
maxTextLength?: number;
/** Language hint; expected format (e.g. ISO 639-1 code) is not shown here - TODO confirm. */
language?: string;
}
/**
 * Result shape that `ContentProcessor.processContent` resolves to.
 *
 * `title`, `content`, `markdown` and `wordCount` are always present; every
 * other field is optional and may be absent. This is a declaration file, so
 * how each value is produced is not visible here; notes below that go beyond
 * the declared types are inferred from names and should be confirmed.
 */
export interface ProcessedContent {
/** Title string; presumably the page title - TODO confirm source (e.g. <title> vs. heading). */
title: string;
/** Content string; NOTE(review): unclear from here whether this is HTML or plain text - confirm. */
content: string;
/** Presumably the Markdown rendering of the page content - TODO confirm. */
markdown: string;
/** Optional summary text; how it is generated is not shown here. */
summary?: string;
/** Optional reading-time estimate; unit (minutes vs. seconds) is not shown here - TODO confirm. */
readingTime?: number;
/** Word count; which text it is computed over is not shown here. */
wordCount: number;
/** Optional language string; NOTE(review): may be detected or echoed from the options - confirm. */
language?: string;
/** Optional list of strings; presumably image URLs - TODO confirm (absolute vs. relative). */
extractedImages?: string[];
/** Optional list of link records, each pairing a `text` string with a `url` string. */
extractedLinks?: Array<{
text: string;
url: string;
}>;
/**
 * Optional free-form metadata keyed by string. Values are typed `any`, so the
 * compiler performs no checking on them; callers should narrow before use.
 */
metadata?: Record<string, any>;
}
/**
 * Ambient declaration of the content-processing class.
 *
 * The public surface declared here is a no-argument constructor and the async
 * `processContent` method. All other members are private and appear without
 * types or signatures, which is how TypeScript emits private members in
 * declaration output; their behavior cannot be determined from this file.
 */
export declare class ContentProcessor {
// NOTE(review): the name suggests an HTML-to-Markdown converter instance
// (possibly the `turndown` library) - confirm against the implementation.
private turndownService;
/** Creates a processor; takes no arguments. */
constructor();
// Presumably configures conversion rules on `turndownService` - TODO confirm.
private setupTurndownRules;
/**
 * Processes an HTML document and resolves to a `ProcessedContent` record.
 *
 * @param html - HTML source as a string.
 * @param url - URL string associated with the document; how it is used
 *   (e.g. resolving relative links) is not visible here - TODO confirm.
 * @param options - Optional `ProcessingOptions`; defaults applied when
 *   omitted are not visible here.
 * @returns A promise of the processed result. Rejection conditions are not
 *   visible in this declaration.
 */
processContent(html: string, url: string, options?: ProcessingOptions): Promise<ProcessedContent>;
// Private helpers below: names only, no signatures are emitted for them.
// The groupings are inferred from the names and should be verified.
// Presumably HTML cleanup / main-content selection:
private cleanHTML;
private removeAds;
private extractMainContent;
private heuristicContentExtraction;
private calculateLinkDensity;
// Presumably extraction of individual ProcessedContent fields:
private extractTitle;
private extractMetadata;
private extractImages;
private extractLinks;
// Presumably Markdown post-processing and derived statistics:
private postProcessMarkdown;
private countWords;
private calculateReadingTime;
private generateSummary;
private detectLanguage;
}
//# sourceMappingURL=content-processor.d.ts.map