Mistral AI · Schema

OcrRequest

Properties

Name	Type	Description
model	string	The OCR model to use
document	object	The document to process (see the DocumentInput schema)
pages	array	Specific page numbers to process (0-indexed)
include_image_base64	boolean	Whether to include extracted images as base64
image_limit	integer	Maximum number of images to extract
image_min_size	integer	Minimum image dimension in pixels to extract

View JSON Schema on GitHub

JSON Schema

{
  "$schema": "https://json-schema.org/draft/2020-12/schema",
  "$id": "#/components/schemas/OcrRequest",
  "title": "OcrRequest",
  "description": "Request payload for running OCR on a document",
  "type": "object",
  "required": [
    "model",
    "document"
  ],
  "properties": {
    "model": {
      "type": "string",
      "description": "The OCR model to use",
      "examples": [
        "mistral-ocr-latest"
      ]
    },
    "document": {
      "$ref": "#/components/schemas/DocumentInput",
      "description": "The document to process"
    },
    "pages": {
      "type": "array",
      "items": {
        "type": "integer",
        "minimum": 0
      },
      "description": "Specific page numbers to process (0-indexed)"
    },
    "include_image_base64": {
      "type": "boolean",
      "default": false,
      "description": "Whether to include extracted images as base64"
    },
    "image_limit": {
      "type": "integer",
      "minimum": 0,
      "description": "Maximum number of images to extract"
    },
    "image_min_size": {
      "type": "integer",
      "minimum": 0,
      "description": "Minimum image dimension in pixels to extract"
    }
  }
}