Amazon Glue DataBrew · Schema
Dataset
Represents a dataset that can be processed by DataBrew.
Data AnalyticsData PreparationETLMachine Learning
Properties
| Name | Type | Description |
|---|---|---|
| AccountId | object | |
| CreatedBy | object | |
| CreateDate | object | |
| Name | object | |
| Format | object | |
| FormatOptions | object | |
| Input | object | |
| LastModifiedDate | object | |
| LastModifiedBy | object | |
| Source | object | |
| PathOptions | object | |
| Tags | object | |
| ResourceArn | object |
JSON Schema
{
"$schema": "https://json-schema.org/draft/2020-12/schema",
"$id": "https://raw.githubusercontent.com/api-evangelist/amazon-glue-databrew/refs/heads/main/json-schema/glue-databrew-dataset-schema.json",
"title": "Dataset",
"description": "Represents a dataset that can be processed by DataBrew.",
"type": "object",
"properties": {
"AccountId": {
"allOf": [
{
"$ref": "#/components/schemas/AccountId"
},
{
"description": "The ID of the Amazon Web Services account that owns the dataset."
}
]
},
"CreatedBy": {
"allOf": [
{
"$ref": "#/components/schemas/CreatedBy"
},
{
"description": "The Amazon Resource Name (ARN) of the user who created the dataset."
}
]
},
"CreateDate": {
"allOf": [
{
"$ref": "#/components/schemas/Date"
},
{
"description": "The date and time that the dataset was created."
}
]
},
"Name": {
"allOf": [
{
"$ref": "#/components/schemas/DatasetName"
},
{
"description": "The unique name of the dataset."
}
]
},
"Format": {
"allOf": [
{
"$ref": "#/components/schemas/InputFormat"
},
{
"description": "The file format of a dataset that is created from an Amazon S3 file or folder."
}
]
},
"FormatOptions": {
"allOf": [
{
"$ref": "#/components/schemas/FormatOptions"
},
{
"description": "A set of options that define how DataBrew interprets the data in the dataset."
}
]
},
"Input": {
"allOf": [
{
"$ref": "#/components/schemas/Input"
},
{
"description": "Information on how DataBrew can find the dataset, in either the Glue Data Catalog or Amazon S3."
}
]
},
"LastModifiedDate": {
"allOf": [
{
"$ref": "#/components/schemas/Date"
},
{
"description": "The last modification date and time of the dataset."
}
]
},
"LastModifiedBy": {
"allOf": [
{
"$ref": "#/components/schemas/LastModifiedBy"
},
{
"description": "The Amazon Resource Name (ARN) of the user who last modified the dataset."
}
]
},
"Source": {
"allOf": [
{
"$ref": "#/components/schemas/Source"
},
{
"description": "The location of the data for the dataset, either Amazon S3 or the Glue Data Catalog."
}
]
},
"PathOptions": {
"allOf": [
{
"$ref": "#/components/schemas/PathOptions"
},
{
"description": "A set of options that defines how DataBrew interprets an Amazon S3 path of the dataset."
}
]
},
"Tags": {
"allOf": [
{
"$ref": "#/components/schemas/TagMap"
},
{
"description": "Metadata tags that have been applied to the dataset."
}
]
},
"ResourceArn": {
"allOf": [
{
"$ref": "#/components/schemas/Arn"
},
{
"description": "The unique Amazon Resource Name (ARN) for the dataset."
}
]
}
},
"required": [
"Name",
"Input"
]
}