v1.0.0

LLMCrawl API Documentation

Download OpenAPI Document

API documentation for LLMCrawl

Servers

https://api.llmcrawl.dev — Production server

Scraping

Operations

POST /v1/scrape

POST /v1/scrape

POST

/v1/scrape

Scrape a single webpage

Authorizations

bearerAuth

Type: HTTP (bearer)

Request Body

application/json

JSON

{
  "formats": ["markdown", "html"],
  "headers": {
    "additionalProperties": "string"
  },
  "includeTags": ["h1", "h2", "p", "article"],
  "excludeTags": ["nav", "footer", "script", "style"],
  "timeout": 30000,
  "waitFor": 3000,
  "extract": {
    "mode": "string",
    "schema": {
      "type": "object",
      "properties": {
        "title": {
          "type": "string"
        },
        "price": {
          "type": "number"
        },
        "description": {
          "type": "string"
        }
      },
      "required": ["title", "price"]
    },
    "systemPrompt": "Based on the information on the page, extract all the information from the schema. Try to extract all the fields even those that might not be marked as required.",
    "prompt": "Extract the main article title and author from this page"
  },
  "url": "string",
  "origin": "api",
  "webhookUrls": ["https://your-webhook.com/endpoint"],
  "metadata": {
    "userId": "12345",
    "source": "api"
  }
}

Responses

Successful response

Content-Type

application/json

JSON

{
  "success": true,
  "warning": "string",
  "data": {
    "markdown": "string",
    "extract": "string",
    "html": "string",
    "rawHtml": "string",
    "links": ["string"],
    "screenshot": "string",
    "metadata": {
      "additionalProperties": {}
    }
  },
  "scrape_id": "string"
}

POST

/v1/scrape

Playground

Authorization

bearerAuth

Body

Samples

Crawling

Operations

POST /v1/crawl, GET /v1/crawl/{id}, DELETE /v1/crawl/{id}/cancel

POST /v1/crawl

POST

/v1/crawl

Crawl a website

Authorizations

bearerAuth

Type: HTTP (bearer)

Request Body

application/json

JSON

{
  "includePaths": ["/blog/*", "/articles/*", "/docs/*"],
  "excludePaths": ["/admin/*", "/private/*", "/api/*"],
  "maxDepth": 3,
  "limit": 500,
  "allowBackwardLinks": false,
  "allowExternalLinks": false,
  "ignoreSitemap": true,
  "url": "string",
  "origin": "api",
  "scrapeOptions": {
    "formats": ["markdown", "rawHtml"],
    "headers": {
      "additionalProperties": "string"
    },
    "includeTags": ["h1", "h2", "p", "article"],
    "excludeTags": ["nav", "footer", "script", "style"],
    "waitFor": 3000,
    "extract": {
      "mode": "string",
      "schema": {
        "type": "object",
        "properties": {
          "title": {
            "type": "string"
          },
          "price": {
            "type": "number"
          },
          "description": {
            "type": "string"
          }
        },
        "required": ["title", "price"]
      },
      "systemPrompt": "Based on the information on the page, extract all the information from the schema. Try to extract all the fields even those that might not be marked as required.",
      "prompt": "Extract the main article title and author from this page"
    }
  },
  "webhookUrls": ["https://your-webhook.com/crawl-status"],
  "webhookMetadata": {
    "crawlId": "crawl_123",
    "userId": "user_456"
  }
}

Responses

Successful response

Content-Type

application/json

JSON

{

"success": true,

"id": "crawl_123e4567-e89b-12d3-a456-426614174000",

"url": "https://firecrawl.dev"

}

POST

/v1/crawl

Playground

Authorization

bearerAuth

Body

Samples

GET /v1/crawl/{id}

GET

/v1/crawl/{id}

Get crawl job status

Authorizations

bearerAuth

Type: HTTP (bearer)

Parameters

Path Parameters

id*

Type: string

Required

Responses

Successful response

Content-Type

application/json

JSON

{
  "success": true,
  "status": "string",
  "completed": 0,
  "total": 0,
  "expiresAt": "string",
  "next": "string",
  "data": [
    {
      "markdown": "string",
      "extract": "string",
      "html": "string",
      "rawHtml": "string",
      "links": ["string"],
      "screenshot": "string",
      "metadata": {
        "additionalProperties": {}
      }
    }
  ]
}

GET

/v1/crawl/{id}

Playground

Authorization

bearerAuth

Variables

Key

Value

id*

Samples

DELETE /v1/crawl/{id}/cancel

DELETE

/v1/crawl/{id}/cancel

Cancel a crawl job

Authorizations

bearerAuth

Type: HTTP (bearer)

Parameters

Path Parameters

id*

Type: string

Required

Responses

Successful response

Content-Type

application/json

JSON

{

"success": true,

"message": "string"

}

DELETE

/v1/crawl/{id}/cancel

Playground

Authorization

bearerAuth

Variables

Key

Value

id*

Samples

Mapping

Operations

POST /v1/map

POST /v1/map

POST

/v1/map

Map a website to get all URLs

Authorizations

bearerAuth

Type: HTTP (bearer)

Request Body

application/json

JSON

{
  "includePaths": ["/blog/*", "/articles/*", "/docs/*"],
  "excludePaths": ["/admin/*", "/private/*", "/api/*"],
  "maxDepth": 3,
  "limit": 1000,
  "allowBackwardLinks": false,
  "allowExternalLinks": false,
  "ignoreSitemap": true,
  "url": "string",
  "origin": "api",
  "includeSubdomains": true,
  "search": "documentation"
}

Responses

Successful response

Content-Type

application/json

JSON

{
  "success": true,
  "links": [
    "https://firecrawl.dev/pricing",
    "https://firecrawl.dev/docs",
    "https://firecrawl.dev/blog",
    "https://firecrawl.dev/contact"
  ],
  "scrape_id": "map_987fcdeb-51a2-4bc3-8765-fedcba098765"
}

POST

/v1/map

Playground

Authorization

bearerAuth

Body

/{id}

/cancel

LLMCrawl API Documentation​

Servers​

Scraping​

Operations​

POST /v1/scrape​

Authorizations​

Request Body​

Responses​

Playground​

Samples​

Crawling​

Operations​

POST /v1/crawl​

Authorizations​

Request Body​

Responses​

Playground​

Samples​

GET /v1/crawl/{id}​

Authorizations​

Parameters​

Path Parameters

Responses​

Playground​

Samples​

DELETE /v1/crawl/{id}/cancel​

Authorizations​

Parameters​

Path Parameters

Responses​

Playground​

Samples​

Mapping​

Operations​

POST /v1/map​

Authorizations​

Request Body​

Responses​

Playground​

Samples​

LLMCrawl API Documentation

Servers

Scraping

Operations

POST /v1/scrape

Authorizations

Request Body

Responses

Playground

Samples

Crawling

Operations

POST /v1/crawl

Authorizations

Request Body

Responses

Playground

Samples

GET /v1/crawl/{id}

Authorizations

Parameters

Responses

Playground

Samples

DELETE /v1/crawl/{id}/cancel

Authorizations

Parameters

Responses

Playground

Samples

Mapping

Operations

POST /v1/map

Authorizations

Request Body

Responses

Playground

Samples