webcrawlerapi-js
Version:
JS client for WecrawlerAPI
63 lines (62 loc) • 1.44 kB
TypeScript
export interface ScrapeRequest {
input: any;
crawler_id: string;
max_retries?: number;
debug?: boolean;
omit_cache?: boolean;
}
export interface JobId {
id: string;
}
export interface ScrapeResponse {
id: string;
url: string;
status: any;
page_status_code: number;
created_at: string;
structured_data: any;
recommended_pull_delay_ms: number;
}
export interface CrawlRequest {
url: string;
items_limit?: number;
scrape_type?: string;
whitelist_regexp?: string;
blacklist_regexp?: string;
allow_subdomains?: boolean;
webhook_url?: string;
}
export interface Job {
id: string;
org_id: string;
url: string;
status: string;
scrape_type: string;
whitelist_regexp: string;
blacklist_regexp: string;
allow_subdomains: boolean;
items_limit: number;
created_at: string;
finished_at: string;
updated_at: string;
webhook_url: string;
recommended_pull_delay_ms: number;
job_items: JobItem[];
}
export interface JobItem {
id: string;
job_id: string;
original_url: string;
page_status_code: number;
markdown_content_url: string;
status: string;
title: string;
last_error: string;
created_at: string;
updated_at: string;
cost: number;
referred_url: string;
raw_content_url?: string;
cleaned_content_url?: string;
getContent(): Promise<string | null>;
}