Databricks · Schema
CreateClusterRequest
AIAnalyticsApache SparkBig DataClean RoomsCloud ComputingDataData AnalyticsData EngineeringData GovernanceDelta LakeDelta SharingETLIdentity ManagementLakehouseMachine LearningMLflowModel ServingSecuritySQLUnity CatalogVector SearchVisualize
Properties
| Name | Type | Description |
|---|---|---|
| cluster_name | string | A human-readable name for the cluster. This does not need to be unique. |
| spark_version | string | The runtime version of the cluster. You can retrieve a list of available runtime versions using the Runtime Versions API. |
| node_type_id | string | The node type for worker nodes. This field determines the cloud provider instance type. |
| driver_node_type_id | string | The node type for the Spark driver. If not specified, defaults to the same value as node_type_id. |
| num_workers | integer | Number of worker nodes for a fixed-size cluster. A cluster has one Spark driver and num_workers executors. Set to 0 for a single-node cluster. |
| autoscale | object | |
| spark_conf | object | A map of Spark configuration key-value pairs. These override the default Spark configuration values. |
| aws_attributes | object | |
| azure_attributes | object | |
| gcp_attributes | object | |
| custom_tags | object | Additional tags for cluster resources. Tags are propagated to the cloud provider for cost tracking. |
| spark_env_vars | object | Environment variables for all Spark processes. Use {{secrets/scope/key}} to reference secrets. |
| autotermination_minutes | integer | Minutes of inactivity after which the cluster is automatically terminated. 0 disables auto-termination. |
| enable_elastic_disk | boolean | Whether to autoscale local storage. When enabled, Databricks monitors disk usage and attaches additional disks as needed. |
| instance_pool_id | string | The optional ID of the instance pool to use for cluster nodes. |
| policy_id | string | The ID of the cluster policy to apply. Cluster policies constrain the configuration settings. |
| enable_local_disk_encryption | boolean | Whether to encrypt data on local disks. |
| runtime_engine | string | The runtime engine. PHOTON enables the Photon vectorized query engine for faster performance. |
| data_security_mode | string | Data security mode for the cluster. |
| single_user_name | string | The user name (email) of the single user for SINGLE_USER access mode. |
| init_scripts | array | Init scripts to run when the cluster starts. |
| ssh_public_keys | array | SSH public keys to add to each Spark node. |
JSON Schema
{
"$schema": "https://json-schema.org/draft/2020-12/schema",
"$id": "#/components/schemas/CreateClusterRequest",
"title": "CreateClusterRequest",
"type": "object",
"required": [
"cluster_name",
"spark_version",
"node_type_id"
],
"properties": {
"cluster_name": {
"type": "string",
"description": "A human-readable name for the cluster. This does not need to be unique.",
"examples": [
"my-data-cluster"
]
},
"spark_version": {
"type": "string",
"description": "The runtime version of the cluster. You can retrieve a list of available runtime versions using the Runtime Versions API.",
"examples": [
"14.3.x-scala2.12"
]
},
"node_type_id": {
"type": "string",
"description": "The node type for worker nodes. This field determines the cloud provider instance type.",
"examples": [
"i3.xlarge"
]
},
"driver_node_type_id": {
"type": "string",
"description": "The node type for the Spark driver. If not specified, defaults to the same value as node_type_id.",
"example": "500123"
},
"num_workers": {
"type": "integer",
"description": "Number of worker nodes for a fixed-size cluster. A cluster has one Spark driver and num_workers executors. Set to 0 for a single-node cluster.",
"examples": [
2
]
},
"autoscale": {
"$ref": "#/components/schemas/AutoScale"
},
"spark_conf": {
"type": "object",
"additionalProperties": {
"type": "string"
},
"description": "A map of Spark configuration key-value pairs. These override the default Spark configuration values.",
"example": "example_value"
},
"aws_attributes": {
"$ref": "#/components/schemas/AwsAttributes"
},
"azure_attributes": {
"$ref": "#/components/schemas/AzureAttributes"
},
"gcp_attributes": {
"$ref": "#/components/schemas/GcpAttributes"
},
"custom_tags": {
"type": "object",
"additionalProperties": {
"type": "string"
},
"description": "Additional tags for cluster resources. Tags are propagated to the cloud provider for cost tracking.",
"example": "example_value"
},
"spark_env_vars": {
"type": "object",
"additionalProperties": {
"type": "string"
},
"description": "Environment variables for all Spark processes. Use {{secrets/scope/key}} to reference secrets.",
"example": "example_value"
},
"autotermination_minutes": {
"type": "integer",
"description": "Minutes of inactivity after which the cluster is automatically terminated. 0 disables auto-termination.",
"default": 120,
"example": 10
},
"enable_elastic_disk": {
"type": "boolean",
"description": "Whether to autoscale local storage. When enabled, Databricks monitors disk usage and attaches additional disks as needed.",
"example": true
},
"instance_pool_id": {
"type": "string",
"description": "The optional ID of the instance pool to use for cluster nodes.",
"example": "500123"
},
"policy_id": {
"type": "string",
"description": "The ID of the cluster policy to apply. Cluster policies constrain the configuration settings.",
"example": "500123"
},
"enable_local_disk_encryption": {
"type": "boolean",
"description": "Whether to encrypt data on local disks.",
"example": true
},
"runtime_engine": {
"type": "string",
"enum": [
"STANDARD",
"PHOTON"
],
"description": "The runtime engine. PHOTON enables the Photon vectorized query engine for faster performance.",
"example": "STANDARD"
},
"data_security_mode": {
"type": "string",
"enum": [
"NONE",
"SINGLE_USER",
"USER_ISOLATION",
"LEGACY_TABLE_ACL",
"LEGACY_PASSTHROUGH",
"LEGACY_SINGLE_USER",
"LEGACY_SINGLE_USER_STANDARD"
],
"description": "Data security mode for the cluster.",
"example": "NONE"
},
"single_user_name": {
"type": "string",
"description": "The user name (email) of the single user for SINGLE_USER access mode.",
"example": "example_value"
},
"init_scripts": {
"type": "array",
"items": {
"$ref": "#/components/schemas/InitScriptInfo"
},
"description": "Init scripts to run when the cluster starts.",
"example": []
},
"ssh_public_keys": {
"type": "array",
"items": {
"type": "string"
},
"description": "SSH public keys to add to each Spark node.",
"example": []
}
}
}