markov-exa-mcp-server
Version:
A Model Context Protocol server with Exa for web search, academic paper search, and Twitter/X.com search. Provides real-time web searches with configurable tool selection, allowing users to enable or disable specific search capabilities. Supports customiz
79 lines (78 loc) • 3.52 kB
JavaScript
import { z } from "zod";
import axios from "axios";
import { API_CONFIG } from "./config.js";
import { createRequestLogger } from "../utils/logger.js";
export function registerCrawlingTool(server, config) {
server.tool("crawling_exa", "Extract and crawl content from specific URLs using Exa AI - retrieves full text content, metadata, and structured information from web pages. Ideal for extracting detailed content from known URLs.", {
url: z.string().describe("URL to crawl and extract content from"),
maxCharacters: z.number().optional().describe("Maximum characters to extract (default: 3000)")
}, async ({ url, maxCharacters }) => {
const requestId = `crawling_exa-${Date.now()}-${Math.random().toString(36).substring(2, 7)}`;
const logger = createRequestLogger(requestId, 'crawling_exa');
logger.start(url);
try {
// Create a fresh axios instance for each request
const axiosInstance = axios.create({
baseURL: API_CONFIG.BASE_URL,
headers: {
'accept': 'application/json',
'content-type': 'application/json',
'x-api-key': config?.exaApiKey || process.env.EXA_API_KEY || ''
},
timeout: 25000
});
const crawlRequest = {
urls: [url],
text: {
maxCharacters: maxCharacters || API_CONFIG.DEFAULT_MAX_CHARACTERS
},
livecrawl: 'preferred'
};
logger.log("Sending crawl request to Exa API");
const response = await axiosInstance.post('/contents', crawlRequest, { timeout: 25000 });
logger.log("Received response from Exa API");
if (!response.data || !response.data.results || response.data.results.length === 0) {
logger.log("Warning: Empty or invalid response from Exa API");
return {
content: [{
type: "text",
text: "No content found for the provided URL."
}]
};
}
logger.log(`Successfully crawled content from URL`);
const result = {
content: [{
type: "text",
text: JSON.stringify(response.data, null, 2)
}]
};
logger.complete();
return result;
}
catch (error) {
logger.error(error);
if (axios.isAxiosError(error)) {
// Handle Axios errors specifically
const statusCode = error.response?.status || 'unknown';
const errorMessage = error.response?.data?.message || error.message;
logger.log(`Axios error (${statusCode}): ${errorMessage}`);
return {
content: [{
type: "text",
text: `Crawling error (${statusCode}): ${errorMessage}`
}],
isError: true,
};
}
// Handle generic errors
return {
content: [{
type: "text",
text: `Crawling error: ${error instanceof Error ? error.message : String(error)}`
}],
isError: true,
};
}
});
}