Databricks · Schema

TaskSettings

AI · Analytics · Apache Spark · Big Data · Clean Rooms · Cloud Computing · Data · Data Analytics · Data Engineering · Data Governance · Delta Lake · Delta Sharing · ETL · Identity Management · Lakehouse · Machine Learning · MLflow · Model Serving · Security · SQL · Unity Catalog · Vector Search · Visualize

Properties

Name Type Description
task_key string A unique key for the task within the job. Used to reference the task in dependencies and logging.
description string A description of the task.
depends_on array An array of objects specifying the task dependencies. Each dependency is identified by its task_key.
existing_cluster_id string An existing cluster to run the task on.
job_cluster_key string Reference to a job_clusters entry.
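notebook_task object Settings for a task that runs a notebook.
spark_jar_task object Settings for a task that runs a JAR.
spark_python_task object Settings for a task that runs a Python file.
spark_submit_task object Settings for a task that is launched through spark-submit.
pipeline_task object Settings for a task that runs a pipeline.
python_wheel_task object Settings for a task that runs a Python wheel.
sql_task object Settings for a task that runs SQL.
dbt_task object Settings for a task that runs dbt commands.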
run_if string Condition to run this task.
timeout_seconds integer Timeout for this individual task.
max_retries integer Maximum number of retries for a failed task.
min_retry_interval_millis integer Minimum interval between retry attempts.
retry_on_timeout boolean Whether to retry when the task times out.
libraries array Libraries to install on the cluster running this task.
View JSON Schema on GitHub

JSON Schema

databricks-task-settings-schema.json Raw ↑
{
  "$schema": "https://json-schema.org/draft/2020-12/schema",
  "title": "TaskSettings",
  "description": "Settings for a single task within a Databricks job: its identity, dependencies, compute, task type, and retry/timeout behavior.",
  "type": "object",
  "properties": {
    "task_key": {
      "type": "string",
      "description": "A unique key for the task within the job. Used to reference the task in dependencies and logging."
    },
    "description": {
      "type": "string",
      "description": "A description of the task."
    },
    "depends_on": {
      "type": "array",
      "description": "An array of objects specifying the task dependencies. Each dependency is identified by its task_key.",
      "items": {
        "type": "object",
        "properties": {
          "task_key": {
            "type": "string",
            "description": "The task_key of the task this task depends on."
          }
        },
        "required": ["task_key"]
      }
    },
    "existing_cluster_id": {
      "type": "string",
      "description": "An existing cluster to run the task on."
    },
    "job_cluster_key": {
      "type": "string",
      "description": "Reference to a job_clusters entry."
    },
    "notebook_task": {
      "type": "object",
      "description": "Settings for a task that runs a notebook."
    },
    "spark_jar_task": {
      "type": "object",
      "description": "Settings for a task that runs a JAR."
    },
    "spark_python_task": {
      "type": "object",
      "description": "Settings for a task that runs a Python file."
    },
    "spark_submit_task": {
      "type": "object",
      "description": "Settings for a task that is launched through spark-submit."
    },
    "pipeline_task": {
      "type": "object",
      "description": "Settings for a task that runs a pipeline."
    },
    "python_wheel_task": {
      "type": "object",
      "description": "Settings for a task that runs a Python wheel."
    },
    "sql_task": {
      "type": "object",
      "description": "Settings for a task that runs SQL."
    },
    "dbt_task": {
      "type": "object",
      "description": "Settings for a task that runs dbt commands."
    },
    "run_if": {
      "type": "string",
      "description": "Condition to run this task, evaluated against the outcome of its dependencies (for example ALL_SUCCESS or ALL_DONE)."
    },
    "timeout_seconds": {
      "type": "integer",
      "minimum": 0,
      "description": "Timeout for this individual task, in seconds. A value of 0 means no timeout."
    },
    "max_retries": {
      "type": "integer",
      "minimum": -1,
      "description": "Maximum number of retries for a failed task. A value of -1 means retry indefinitely; 0 means never retry."
    },
    "min_retry_interval_millis": {
      "type": "integer",
      "minimum": 0,
      "description": "Minimum interval between retry attempts, in milliseconds."
    },
    "retry_on_timeout": {
      "type": "boolean",
      "description": "Whether to retry when the task times out."
    },
    "libraries": {
      "type": "array",
      "description": "Libraries to install on the cluster running this task.",
      "items": {
        "type": "object"
      }
    }
  }
}