UNPKG

@oevortex/ddg_search

Version:

A Model Context Protocol server for web search using DuckDuckGo and Felo AI

119 lines (111 loc) • 3.2 kB

JavaScript

import { fetchUrlContent } from '../utils/search.js';

/** Character limit applied when the caller gives no usable `maxLength`. */
const DEFAULT_MAX_LENGTH = 10000;

/** Tags passed as `excludeTags` when the caller does not supply any. */
const DEFAULT_EXCLUDE_TAGS = Object.freeze([
  'script',
  'style',
  'noscript',
  'iframe',
  'svg',
  'nav',
  'footer',
  'header',
  'aside',
]);

/**
 * Fetch URL tool definition
 *
 * Describes the `fetch-url` tool: its name, human-readable description,
 * the JSON schema of its arguments, and its annotations. Only `url` is
 * required; every other argument has a default.
 */
export const fetchUrlToolDefinition = {
  name: 'fetch-url',
  description: 'Fetch the content of a URL and return it as text, with options to control extraction',
  inputSchema: {
    type: 'object',
    properties: {
      url: {
        type: 'string',
        description: 'The URL to fetch',
      },
      maxLength: {
        type: 'integer',
        description: 'Maximum length of content to return (default: 10000)',
        default: DEFAULT_MAX_LENGTH,
        minimum: 1000,
        maximum: 50000,
      },
      extractMainContent: {
        type: 'boolean',
        description: 'Whether to attempt to extract main content (default: true)',
        default: true,
      },
      includeLinks: {
        type: 'boolean',
        description: 'Whether to include link text (default: true)',
        default: true,
      },
      includeImages: {
        type: 'boolean',
        description: 'Whether to include image alt text (default: true)',
        default: true,
      },
      excludeTags: {
        type: 'array',
        description: 'Tags to exclude from extraction (default: script, style, etc.)',
        items: {
          type: 'string',
        },
      },
    },
    required: ['url'],
  },
  annotations: {
    title: 'Fetch URL Content',
    readOnlyHint: true,
    openWorldHint: true,
  },
};

/**
 * Turn a caller-supplied `maxLength` into a usable positive integer.
 * Anything that is not a finite number greater than zero (NaN, null,
 * negative values, non-numeric strings) falls back to the default, so a
 * bad value can neither disable truncation nor produce an empty body.
 * @param {*} value - Raw `maxLength` argument
 * @returns {number} Positive integer character limit
 */
function resolveMaxLength(value) {
  const limit = Math.floor(Number(value));
  return Number.isFinite(limit) && limit > 0 ? limit : DEFAULT_MAX_LENGTH;
}

/**
 * Cut `text` down to at most `limit` UTF-16 code units and append the
 * truncation notice. Text that already fits is returned unchanged.
 * @param {string} text - Extracted page text
 * @param {number} limit - Positive integer limit
 * @returns {string} Possibly truncated text
 */
function truncateContent(text, limit) {
  if (text.length <= limit) {
    return text;
  }

  let end = limit;
  const lastUnit = text.charCodeAt(end - 1);
  // Do not end on a lone high surrogate: that would emit half of an
  // astral character (e.g. an emoji) as an invalid code unit.
  if (lastUnit >= 0xd800 && lastUnit <= 0xdbff) {
    end -= 1;
  }

  return `${text.substring(0, end)}... \n[Content truncated due to length]`;
}

/**
 * Build the footer that reports which extraction settings were used.
 * Each setting is placed on its own line between `---` delimiters.
 * @param {Object} info
 * @param {string} info.url - URL that was fetched
 * @param {boolean} info.extractMainContent
 * @param {boolean} info.includeLinks
 * @param {boolean} info.includeImages
 * @param {number} info.contentLength - Length of the untruncated text
 * @param {number} info.limit - Effective character limit
 * @returns {string} Footer text, beginning and ending with a newline
 */
function buildMetadata({ url, extractMainContent, includeLinks, includeImages, contentLength, limit }) {
  const truncationNote = contentLength > limit ? ` (truncated to ${limit})` : '';

  return [
    '',
    '---',
    'Extraction settings:',
    `- URL: ${url}`,
    `- Main content extraction: ${extractMainContent ? 'Enabled' : 'Disabled'}`,
    `- Links included: ${includeLinks ? 'Yes' : 'No'}`,
    `- Images included: ${includeImages ? 'Yes (as alt text)' : 'No'}`,
    `- Content length: ${contentLength} characters${truncationNote}`,
    '---',
    '',
  ].join('\n');
}

/**
 * Wrap a message in the error-result shape this handler returns.
 * @param {string} message - Text shown to the caller
 * @returns {Object} Result object with `isError: true`
 */
function errorResult(message) {
  return {
    isError: true,
    content: [
      {
        type: 'text',
        text: message,
      },
    ],
  };
}

/**
 * Fetch URL tool handler
 *
 * Fetches `url` through `fetchUrlContent`, truncates the text to
 * `maxLength`, and appends a footer describing the extraction settings.
 * Failures (including a missing `url`) are reported as a result object
 * with `isError: true` rather than by throwing.
 *
 * @param {Object} params - The tool parameters
 * @param {string} params.url - The URL to fetch (required)
 * @param {number} [params.maxLength=10000] - Maximum characters of content to return
 * @param {boolean} [params.extractMainContent=true] - Forwarded to `fetchUrlContent`
 * @param {boolean} [params.includeLinks=true] - Forwarded to `fetchUrlContent`
 * @param {boolean} [params.includeImages=true] - Forwarded to `fetchUrlContent`
 * @param {string[]} [params.excludeTags] - Forwarded to `fetchUrlContent`
 * @returns {Promise<Object>} - The tool result
 */
export async function fetchUrlToolHandler(params) {
  const {
    url,
    maxLength = DEFAULT_MAX_LENGTH,
    extractMainContent = true,
    includeLinks = true,
    includeImages = true,
    // Fresh copy per call so the callee never sees the frozen shared list.
    excludeTags = [...DEFAULT_EXCLUDE_TAGS],
  } = params || {};

  if (typeof url !== 'string' || url.trim() === '') {
    return errorResult('Error fetching URL: a non-empty "url" string is required');
  }

  const limit = resolveMaxLength(maxLength);

  // Logged on stderr rather than stdout.
  // NOTE(review): if this server runs over a stdio MCP transport, stdout
  // carries protocol messages and must stay free of log output — confirm.
  console.error(`Fetching content from URL: ${url} (maxLength: ${limit})`);

  try {
    // Fetch content with specified options.
    // NOTE(review): assumes fetchUrlContent resolves to a string — confirm.
    const content = await fetchUrlContent(url, {
      extractMainContent,
      includeLinks,
      includeImages,
      excludeTags,
    });

    const metadata = buildMetadata({
      url,
      extractMainContent,
      includeLinks,
      includeImages,
      contentLength: content.length,
      limit,
    });

    return {
      content: [
        {
          type: 'text',
          text: truncateContent(content, limit) + metadata,
        },
      ],
    };
  } catch (error) {
    console.error(`Error fetching URL ${url}:`, error);
    // Thrown values are not guaranteed to carry a `message`.
    const reason = error && error.message ? error.message : String(error);
    return errorResult(`Error fetching URL: ${reason}`);
  }
}