{
  "$schema": "https://json-schema.org/draft/2020-12/schema",
  "$id": "https://raw.githubusercontent.com/api-evangelist/amazon-glue-databrew/refs/heads/main/json-schema/glue-databrew-entity-detector-configuration-schema.json",
  "title": "EntityDetectorConfiguration",
  "description": "Configuration of entity detection for a profile job. When undefined, entity detection is disabled.",
  "type": "object",
  "properties": {
    "EntityTypes": {
      "allOf": [
        {
          "$ref": "#/components/schemas/EntityTypeList"
        },
        {
          "description": "\nEntity types to detect. Can be any of the following:\nUSA_SSN\nUSA_ITIN\nUSA_PASSPORT_NUMBER\nPHONE_NUMBER\nUSA_DRIVING_LICENSE\nBANK_ACCOUNT\nCREDIT_CARD\nIP_ADDRESS\nMAC_ADDRESS\nUSA_DEA_NUMBER\nUSA_HCPCS_CODE\nUSA_NATIONAL_PROVIDER_IDENTIFIER\nUSA_NATIONAL_DRUG_CODE\nUSA_HEALTH_INSURANCE_CLAIM_NUMBER\nUSA_MEDICARE_BENEFICIARY_IDENTIFIER\nUSA_CPT_CODE\nPERSON_NAME\nDATE\nThe Entity type group USA_ALL is also supported, and includes all of the above entity types except PERSON_NAME and DATE.\n"
        }
      ]
    },
    "AllowedStatistics": {
      "allOf": [
        {
          "$ref": "#/components/schemas/AllowedStatisticList"
        },
        {
          "description": "Configuration of statistics that are allowed to be run on columns that contain detected entities. When undefined, no statistics will be computed on columns that contain detected entities."
        }
      ]
    }
  },
  "required": [
    "EntityTypes"
  ]
}