@lobehub/chat
Version:
Lobe Chat - an open-source, high-performance chatbot framework that supports speech synthesis, multimodal input, and an extensible Function Call plugin system. Supports one-click free deployment of your private ChatGPT/LLM web application.
129 lines (111 loc) • 3.98 kB
text/typescript
import { TRPCError } from '@trpc/server';
import debug from 'debug';
import urlJoin from 'url-join';
import { SearchParams, UniformSearchResponse, UniformSearchResult } from '@/types/tool/search';
import { SearchServiceImpl } from '../type';
import { FirecrawlSearchParameters, FirecrawlResponse } from './type';
// Debug logger for this module, created under the 'lobe-search:Firecrawl' namespace.
const log = debug('lobe-search:Firecrawl');
// Lookup from a `searchTimeRange` value to the string that `query` sends as the
// request's `tbs` field. 'anytime' has no entry here; `query` leaves `tbs`
// undefined for it.
// NOTE(review): the 'qdr:*' strings look like the time-filter codes accepted by the
// Firecrawl search API — confirm against the Firecrawl documentation.
const timeRangeMapping = {
day: 'qdr:d',
month: 'qdr:m',
week: 'qdr:w',
year: 'qdr:y',
};
/**
 * Firecrawl implementation of the search service.
 *
 * Posts the query to the `/search` endpoint under the configured Firecrawl base URL
 * and converts the returned items into the uniform search result shape.
 */
export class FirecrawlImpl implements SearchServiceImpl {
  /** API key read from `FIRECRAWL_API_KEY`; `undefined` when the variable is not set. */
  private get apiKey(): string | undefined {
    return process.env.FIRECRAWL_API_KEY;
  }

  /** Base URL read from `FIRECRAWL_URL`, falling back to `https://api.firecrawl.dev/v1`. */
  private get baseUrl(): string {
    // Assuming the base URL is consistent with the crawl endpoint
    return process.env.FIRECRAWL_URL || 'https://api.firecrawl.dev/v1';
  }

  /**
   * Extracts the hostname from a result URL without throwing.
   *
   * `new URL()` throws a `TypeError` for malformed or relative URLs. A single bad
   * item must not make the whole search fail, so such URLs yield an empty hostname.
   *
   * @param url - URL reported for a search result; may be missing.
   * @returns The hostname, or `''` when the URL is absent or cannot be parsed.
   */
  private getHostname(url?: string | null): string {
    if (!url) return '';

    try {
      return new URL(url).hostname;
    } catch {
      log.extend('error')('Unable to parse result URL, leaving parsedUrl empty: %s', url);
      return '';
    }
  }

  /**
   * Runs a search against Firecrawl.
   *
   * @param query - Search text sent to Firecrawl.
   * @param params - Optional search parameters; only `searchTimeRange` is used here,
   *   and it is translated to the request's `tbs` field ('anytime' sends no `tbs`).
   * @returns The mapped results together with the time spent on the HTTP request.
   * @throws TRPCError with code `SERVICE_UNAVAILABLE` when the request cannot be sent
   *   or Firecrawl answers with a non-2xx status.
   * @throws TRPCError with code `INTERNAL_SERVER_ERROR` when the response body cannot
   *   be parsed or mapped.
   */
  async query(query: string, params: SearchParams = {}): Promise<UniformSearchResponse> {
    log('Starting Firecrawl query with query: "%s", params: %o', query, params);

    const logError = log.extend('error');
    const endpoint = urlJoin(this.baseUrl, '/search');

    const timeRange = params?.searchTimeRange;
    const body: FirecrawlSearchParameters = {
      limit: 15,
      query,
      /*
      scrapeOptions: {
        formats: ["markdown"]
      },
      */
      // An `undefined` value is dropped by JSON.stringify, so no `tbs` is sent
      // when there is no time range, it is 'anytime', or it has no mapping.
      tbs:
        timeRange && timeRange !== 'anytime'
          ? timeRangeMapping[timeRange as keyof typeof timeRangeMapping]
          : undefined,
    };

    log('Constructed request body: %o', body);

    let response: Response;
    let costTime = 0;
    const startAt = Date.now();

    try {
      log('Sending request to endpoint: %s', endpoint);
      response = await fetch(endpoint, {
        body: JSON.stringify(body),
        headers: {
          'Authorization': this.apiKey ? `Bearer ${this.apiKey}` : '',
          'Content-Type': 'application/json',
        },
        method: 'POST',
      });
      // Measure right after the request settles so logging is not part of the cost.
      costTime = Date.now() - startAt;
      log('Received response with status: %d', response.status);
    } catch (error) {
      logError('Firecrawl fetch error: %o', error);
      throw new TRPCError({
        cause: error,
        code: 'SERVICE_UNAVAILABLE',
        message: 'Failed to connect to Firecrawl.',
      });
    }

    if (!response.ok) {
      const errorBody = await response.text();
      // Only the first 200 characters are logged; the full body travels in `cause`.
      logError(
        'Firecrawl request failed with status %d: %s',
        response.status,
        errorBody.length > 200 ? `${errorBody.slice(0, 200)}...` : errorBody,
      );
      throw new TRPCError({
        cause: errorBody,
        code: 'SERVICE_UNAVAILABLE',
        message: `Firecrawl request failed: ${response.statusText}`,
      });
    }

    try {
      const firecrawlResponse = (await response.json()) as FirecrawlResponse;
      log('Parsed Firecrawl response: %o', firecrawlResponse);

      const mappedResults = (firecrawlResponse.data || []).map(
        (result): UniformSearchResult => ({
          category: 'general', // Default category
          content: result.description || '', // Use the item's description; empty when absent
          engines: ['firecrawl'], // Use 'firecrawl' as the engine name
          parsedUrl: this.getHostname(result.url), // Hostname only; '' for unparsable URLs
          score: 1, // Default score to 1
          title: result.title || '',
          url: result.url,
        }),
      );

      log('Mapped %d results to SearchResult format', mappedResults.length);

      return {
        costTime,
        query,
        resultNumbers: mappedResults.length,
        results: mappedResults,
      };
    } catch (error) {
      logError('Error parsing Firecrawl response: %o', error);
      throw new TRPCError({
        cause: error,
        code: 'INTERNAL_SERVER_ERROR',
        message: 'Failed to parse Firecrawl response.',
      });
    }
  }
}