Screaming Frog · Schema
Screaming Frog Crawl Result
Schema for a URL crawl result from the Screaming Frog SEO Spider
SEO, Search Engine Optimization, Website Crawler, Technical Audit, Marketing, Analytics
Properties
| Name | Type | Description |
|---|---|---|
| url | string | The crawled URL |
| status_code | integer | HTTP response status code (e.g., 200, 301, 404) |
| status | string | Human-readable HTTP status description |
| title | string | HTML page title content |
| title_length | integer | Length of the page title in characters |
| meta_description | string | Meta description content |
| meta_description_length | integer | Length of meta description in characters |
| h1 | string | First H1 heading content |
| h2 | string | First H2 heading content |
| word_count | integer | Total word count on the page |
| content_type | string | HTTP Content-Type response header value |
| size | integer | Page size in bytes |
| indexability | string | Whether the page is indexable by search engines |
| indexability_status | string | Reason for non-indexability (e.g., noindex, canonical, blocked by robots) |
| canonical_url | string | Canonical URL specified via rel=canonical |
| redirect_url | string | URL that this page redirects to (for 3xx status codes) |
| inlinks | integer | Number of internal links pointing to this URL |
| outlinks | integer | Number of links on this page pointing to other URLs |
| crawl_depth | integer | Click depth from the start URL |
| response_time | number | Server response time in seconds |
JSON Schema
{
  "$schema": "http://json-schema.org/draft-07/schema#",
  "$id": "https://raw.githubusercontent.com/api-evangelist/screaming-frog/main/json-schema/screaming-frog-crawl-result-schema.json",
  "title": "Screaming Frog Crawl Result",
  "description": "Schema for a URL crawl result from the Screaming Frog SEO Spider",
  "type": "object",
  "properties": {
    "url": {
      "type": "string",
      "format": "uri",
      "description": "The crawled URL"
    },
    "status_code": {
      "$comment": "Lower bound is 0, not 100: the crawler reports 0 when no HTTP response was received (e.g. blocked by robots.txt, DNS failure, timeout). No upper bound, because servers may return non-standard codes.",
      "type": "integer",
      "minimum": 0,
      "description": "HTTP response status code (e.g., 200, 301, 404)"
    },
    "status": {
      "type": "string",
      "description": "Human-readable HTTP status description"
    },
    "title": {
      "type": "string",
      "description": "HTML page title content"
    },
    "title_length": {
      "type": "integer",
      "minimum": 0,
      "description": "Length of the page title in characters"
    },
    "meta_description": {
      "type": "string",
      "description": "Meta description content"
    },
    "meta_description_length": {
      "type": "integer",
      "minimum": 0,
      "description": "Length of meta description in characters"
    },
    "h1": {
      "type": "string",
      "description": "First H1 heading content"
    },
    "h2": {
      "type": "string",
      "description": "First H2 heading content"
    },
    "word_count": {
      "type": "integer",
      "minimum": 0,
      "description": "Total word count on the page"
    },
    "content_type": {
      "type": "string",
      "description": "HTTP Content-Type response header value"
    },
    "size": {
      "type": "integer",
      "minimum": 0,
      "description": "Page size in bytes"
    },
    "indexability": {
      "type": "string",
      "enum": ["Indexable", "Non-Indexable"],
      "description": "Whether the page is indexable by search engines"
    },
    "indexability_status": {
      "type": "string",
      "description": "Reason for non-indexability (e.g., noindex, canonical, blocked by robots)"
    },
    "canonical_url": {
      "type": "string",
      "format": "uri",
      "description": "Canonical URL specified via rel=canonical"
    },
    "redirect_url": {
      "type": "string",
      "format": "uri",
      "description": "URL that this page redirects to (for 3xx status codes)"
    },
    "inlinks": {
      "type": "integer",
      "minimum": 0,
      "description": "Number of internal links pointing to this URL"
    },
    "outlinks": {
      "type": "integer",
      "minimum": 0,
      "description": "Number of links on this page pointing to other URLs"
    },
    "crawl_depth": {
      "type": "integer",
      "minimum": 0,
      "description": "Click depth from the start URL"
    },
    "response_time": {
      "type": "number",
      "minimum": 0,
      "description": "Server response time in seconds"
    }
  },
  "required": ["url", "status_code"]
}