mcp-server-firecrawl

fire_crawl_crawl

Start an asynchronous crawl of multiple pages from a starting URL. Supports depth control, path filtering, and webhook notifications.

Input Schema

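| Name | Required | Description | Default |
| --- | --- | --- | --- |
| allowBackwardLinks | No | Allow crawling links that point to parent directories | |
| allowExternalLinks | No | Allow crawling links to external domains | |
| deduplicateSimilarURLs | No | Remove similar URLs during crawl | |
| excludePaths | No | URL paths to exclude from crawling | |
| ignoreQueryParameters | No | Ignore query parameters when comparing URLs | |
| ignoreSitemap | No | Skip sitemap.xml discovery | |
| includePaths | No | Only crawl these URL paths | |
| limit | No | Maximum number of pages to crawl | |
| maxDepth | No | Maximum link depth to crawl | |
| scrapeOptions | No | Options for scraping each page | |
| url | Yes | Starting URL for the crawl | |
| webhook | No | Webhook to notify when the crawl is complete: either a URL string, or an object with a required `url` and optional custom `headers` | |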

Input Schema (JSON Schema)

{
  "type": "object",
  "required": [
    "url"
  ],
  "properties": {
    "allowBackwardLinks": {
      "type": "boolean",
      "description": "Allow crawling links that point to parent directories"
    },
    "allowExternalLinks": {
      "type": "boolean",
      "description": "Allow crawling links to external domains"
    },
    "deduplicateSimilarURLs": {
      "type": "boolean",
      "description": "Remove similar URLs during crawl"
    },
    "excludePaths": {
      "type": "array",
      "description": "URL paths to exclude from crawling",
      "items": {
        "type": "string"
      }
    },
    "ignoreQueryParameters": {
      "type": "boolean",
      "description": "Ignore query parameters when comparing URLs"
    },
    "ignoreSitemap": {
      "type": "boolean",
      "description": "Skip sitemap.xml discovery"
    },
    "includePaths": {
      "type": "array",
      "description": "Only crawl these URL paths",
      "items": {
        "type": "string"
      }
    },
    "limit": {
      "type": "number",
      "description": "Maximum number of pages to crawl"
    },
    "maxDepth": {
      "type": "number",
      "description": "Maximum link depth to crawl"
    },
    "scrapeOptions": {
      "type": "object",
      "description": "Options for scraping each page",
      "properties": {
        "excludeTags": {
          "type": "array",
          "items": {
            "type": "string"
          }
        },
        "formats": {
          "type": "array",
          "items": {
            "type": "string",
            "enum": [
              "markdown",
              "html",
              "rawHtml",
              "screenshot",
              "links",
              "screenshot@fullPage",
              "extract"
            ]
          }
        },
        "includeTags": {
          "type": "array",
          "items": {
            "type": "string"
          }
        },
        "onlyMainContent": {
          "type": "boolean"
        },
        "waitFor": {
          "type": "number"
        }
      }
    },
    "url": {
      "type": "string",
      "description": "Starting URL for the crawl"
    },
    "webhook": {
      "oneOf": [
        {
          "type": "string",
          "description": "Webhook URL to notify when crawl is complete"
        },
        {
          "type": "object",
          "required": [
            "url"
          ],
          "properties": {
            "headers": {
              "type": "object",
              "description": "Custom headers for webhook requests"
            },
            "url": {
              "type": "string",
              "description": "Webhook URL"
            }
          }
        }
      ]
    }
  }
}