Amazon Glue DataBrew · JSON Structure

Glue DataBrew Output Structure

Represents options that specify how and where in Amazon S3 DataBrew writes the output generated by recipe jobs or profile jobs.

Type: object · Properties: 7 · Required: 1
Data Analytics · Data Preparation · ETL · Machine Learning

Output is a JSON Structure definition published by Amazon Glue DataBrew, describing 7 properties, of which 1 is required. It conforms to the https://json-structure.org/meta/core/v0/# meta-schema.

Properties

CompressionFormat · Format · PartitionColumns · Location · Overwrite · FormatOptions · MaxOutputFiles

Meta-schema: https://json-structure.org/meta/core/v0/#

JSON Structure

Raw ↑
{
  "$schema": "https://json-structure.org/meta/core/v0/#",
  "$id": "https://raw.githubusercontent.com/api-evangelist/amazon-glue-databrew/refs/heads/main/json-structure/glue-databrew-output-structure.json",
  "name": "Output",
  "description": "Represents options that specify how and where in Amazon S3 DataBrew writes the output generated by recipe jobs or profile jobs.",
  "type": "object",
  "properties": {
    "CompressionFormat": {
      "allOf": [
        {
          "$ref": "#/components/schemas/CompressionFormat"
        },
        {
          "description": "The compression algorithm used to compress the output text of the job."
        }
      ]
    },
    "Format": {
      "allOf": [
        {
          "$ref": "#/components/schemas/OutputFormat"
        },
        {
          "description": "The data format of the output of the job."
        }
      ]
    },
    "PartitionColumns": {
      "allOf": [
        {
          "$ref": "#/components/schemas/ColumnNameList"
        },
        {
          "description": "The names of one or more partition columns for the output of the job."
        }
      ]
    },
    "Location": {
      "allOf": [
        {
          "$ref": "#/components/schemas/S3Location"
        },
        {
          "description": "The location in Amazon S3 where the job writes its output."
        }
      ]
    },
    "Overwrite": {
      "allOf": [
        {
          "$ref": "#/components/schemas/OverwriteOutput"
        },
        {
          "description": "A value that, if true, means that any data in the location specified for output is overwritten with new output."
        }
      ]
    },
    "FormatOptions": {
      "allOf": [
        {
          "$ref": "#/components/schemas/OutputFormatOptions"
        },
        {
          "description": "Represents options that define how DataBrew formats job output files."
        }
      ]
    },
    "MaxOutputFiles": {
      "allOf": [
        {
          "$ref": "#/components/schemas/MaxOutputFiles"
        },
        {
          "description": "Maximum number of files to be generated by the job and written to the output folder. For output partitioned by column(s), the MaxOutputFiles value is the maximum number of files per partition."
        }
      ]
    }
  },
  "required": [
    "Location"
  ]
}