AWS Glue Crawlers

GPTKB entity

Statements (51)
Predicate Object
gptkbp:instanceOf gptkb:cloud_service
gptkbp:canAutomate true
gptkbp:canBeManagedBy gptkb:AWS_CLI
gptkb:AWS_Management_Console
gptkb:AWS_SDKs
gptkbp:canBeTriggeredByEvent true
gptkbp:canBeUsedForAnalytics true
gptkbp:canBeUsedForDataCataloging true
gptkbp:canBeUsedForDataDiscovery true
gptkbp:canBeUsedForDataLake true
gptkbp:canBeUsedForDataPreparation true
gptkbp:canBeUsedForDataWarehouse true
gptkbp:canBeUsedForETL true
gptkbp:canBeUsedForMachineLearning true
gptkbp:canBeUsedForPartitionDetection true
gptkbp:canBeUsedForSchemaEvolution true
gptkbp:canClassifyData true
gptkbp:canDetectPartitions true
gptkbp:canInferSchemaChanges true
gptkbp:canRunOnDemand true
gptkbp:canSchedule true
gptkbp:canTagData true
gptkbp:detectsSchema true
gptkbp:documentation https://docs.aws.amazon.com/glue/latest/dg/add-crawler.html
gptkbp:firstReleased 2017
https://www.w3.org/2000/01/rdf-schema#label AWS Glue Crawlers
gptkbp:integratesWith gptkb:AWS_DataBrew
gptkb:AWS_Lake_Formation
gptkb:Amazon_Redshift_Spectrum
gptkb:AWS_Athena
gptkbp:monitors gptkb:Amazon_CloudWatch
gptkbp:output tables in AWS Glue Data Catalog
gptkbp:partOf gptkb:AWS_Glue
gptkbp:priceRange pay-as-you-go
gptkbp:provides gptkb:Amazon_Web_Services
gptkbp:purpose automatically discover and catalog data
gptkbp:regionAvailability global
gptkbp:supportsDataSource gptkb:Amazon_S3
gptkb:Amazon_Redshift
gptkb:DynamoDB
JDBC data stores
gptkbp:supportsFormat gptkb:Avro
gptkb:ORC
gptkb:JSON
CSV
Parquet
gptkbp:supportsIAM true
gptkbp:usedFor creating or updating AWS Glue Data Catalog tables
gptkbp:usesClassifiers true
gptkbp:bfsParent gptkb:AWS_Glue
gptkbp:bfsLayer 5