REMOVE_COMBINED - AWS Glue DataBrew

REMOVE_COMBINED

Removes one or more characters from a column, according to what a user specifies.

Parameters
  • sourceColumn – The name of an existing column.

  • collapseConsecutiveWhitespace – If true, replaces two or more white-space characters with exactly one white-space character.

  • removeAllPunctuation – If true, removes all of the following characters: . ! , ?

  • removeAllQuotes – If true, removes all single quotation marks and double quotation marks.

  • removeAllWhitespace – If true, removes all white-space characters.

  • customCharacters – One or more characters to remove when removeCustomCharacters is true.

  • customValue – A value to remove when removeCustomValue is true.

  • removeCustomCharacters – If true, removes all characters specified by the customCharacters parameter.

  • removeCustomValue – If true, removes all occurrences of the value specified by the customValue parameter.

  • removeLeadingAndTrailingPunctuation – If true, removes the following characters if they occur at the start or end of the value: . ! , ?

  • removeLeadingAndTrailingQuotes – If true, removes single quotation marks and double quotation marks from the beginning and end of the value.

  • removeLeadingAndTrailingWhitespace – If true, removes all white spaces from the beginning and end of the value.

  • removeLetters – If true, removes all uppercase and lowercase alphabetic characters (A through Z; a through z).

  • removeNumbers – If true, removes all numeric characters (0 through 9).

  • removeSpecialCharacters – If true, removes all of the following characters: ! " # $ % & ' ( ) * + , - . / : ; < = > ? @ [ \ ] ^ _ ` { | } ~

Examples

{ "RecipeAction": { "Operation": "REMOVE_COMBINED", "Parameters": { "collapseConsecutiveWhitespace": "false", "removeAllPunctuation": "false", "removeAllQuotes": "false", "removeAllWhitespace": "false", "removeCustomCharacters": "false", "removeCustomValue": "false", "removeLeadingAndTrailingPunctuation": "false", "removeLeadingAndTrailingQuotes": "false", "removeLeadingAndTrailingWhitespace": "false", "removeLetters": "false", "removeNumbers": "false", "removeSpecialCharacters": "true", "sourceColumn": "info_url" } } }
{ "RecipeAction": { "Operation": "REMOVE_COMBINED", "Parameters": { "collapseConsecutiveWhitespace": "false", "customCharacters": "¶", "removeAllPunctuation": "false", "removeAllQuotes": "false", "removeAllWhitespace": "false", "removeCustomCharacters": "true", "removeCustomValue": "false", "removeLeadingAndTrailingPunctuation": "false", "removeLeadingAndTrailingQuotes": "false", "removeLeadingAndTrailingWhitespace": "false", "removeLetters": "false", "removeNumbers": "false", "removeSpecialCharacters": "false", "sourceColumn": "info_url" } } }
{ "RecipeAction": { "Operation": "REMOVE_COMBINED", "Parameters": { "collapseConsecutiveWhitespace": "true", "customValue": "M", "removeAllPunctuation": "true", "removeAllQuotes": "false", "removeAllWhitespace": "false", "removeCustomCharacters": "false", "removeCustomValue": "true", "removeLeadingAndTrailingPunctuation": "false", "removeLeadingAndTrailingQuotes": "true", "removeLeadingAndTrailingWhitespace": "true", "removeLetters": "true", "removeNumbers": "true", "removeSpecialCharacters": "false", "sourceColumn": "info_url" } } }
{ "RecipeAction": { "Operation": "REMOVE_COMBINED", "Parameters": { "collapseConsecutiveWhitespace": "false", "removeAllPunctuation": "false", "removeAllQuotes": "false", "removeAllWhitespace": "false", "removeCustomCharacters": "false", "removeCustomValue": "false", "removeLeadingAndTrailingPunctuation": "false", "removeLeadingAndTrailingQuotes": "false", "removeLeadingAndTrailingWhitespace": "false", "removeLetters": "false", "removeNumbers": "true", "removeSpecialCharacters": "false", "sourceColumn": "first_name" } } }
{ "RecipeAction": { "Operation": "REMOVE_COMBINED", "Parameters": { "collapseConsecutiveWhitespace": "false", "removeAllPunctuation": "false", "removeAllQuotes": "false", "removeAllWhitespace": "false", "removeCustomCharacters": "false", "removeCustomValue": "false", "removeLeadingAndTrailingPunctuation": "false", "removeLeadingAndTrailingQuotes": "false", "removeLeadingAndTrailingWhitespace": "false", "removeLetters": "false", "removeNumbers": "true", "removeSpecialCharacters": "false", "sourceColumn": "first_name" } } }