Skip to content

Commit ae81bc8

Browse files
author
AWS
committed
AWS Glue Update: This release enables the new ListCrawls API for viewing the AWS Glue Crawler run history.
1 parent 56c3850 commit ae81bc8

File tree

2 files changed

+170
-5
lines changed

2 files changed

+170
-5
lines changed
Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,6 @@
1+
{
2+
"type": "feature",
3+
"category": "AWS Glue",
4+
"contributor": "",
5+
"description": "This release enables the new ListCrawls API for viewing the AWS Glue Crawler run history."
6+
}

services/glue/src/main/resources/codegen-resources/service-2.json

Lines changed: 164 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -2076,6 +2076,21 @@
20762076
],
20772077
"documentation":"<p>Retrieves the names of all crawler resources in this Amazon Web Services account, or the resources with the specified tag. This operation allows you to see which resources are available in your account, and their names.</p> <p>This operation takes the optional <code>Tags</code> field, which you can use as a filter on the response so that tagged resources can be retrieved as a group. If you choose to use tags filtering, only resources with the tag are retrieved.</p>"
20782078
},
2079+
"ListCrawls":{
2080+
"name":"ListCrawls",
2081+
"http":{
2082+
"method":"POST",
2083+
"requestUri":"/"
2084+
},
2085+
"input":{"shape":"ListCrawlsRequest"},
2086+
"output":{"shape":"ListCrawlsResponse"},
2087+
"errors":[
2088+
{"shape":"EntityNotFoundException"},
2089+
{"shape":"OperationTimeoutException"},
2090+
{"shape":"InvalidInputException"}
2091+
],
2092+
"documentation":"<p>Returns all the crawls of a specified crawler. Returns only the crawls that have occurred since the launch date of the crawler history feature, and only retains up to 12 months of crawls. Older crawls will not be returned.</p> <p>You may use this API to:</p> <ul> <li> <p>Retrive all the crawls of a specified crawler.</p> </li> <li> <p>Retrieve all the crawls of a specified crawler within a limited count.</p> </li> <li> <p>Retrieve all the crawls of a specified crawler in a specific time range.</p> </li> <li> <p>Retrieve all the crawls of a specified crawler with a particular state, crawl ID, or DPU hour value.</p> </li> </ul>"
2093+
},
20792094
"ListCustomEntityTypes":{
20802095
"name":"ListCustomEntityTypes",
20812096
"http":{
@@ -5299,6 +5314,7 @@
52995314
},
53005315
"documentation":"<p>The details of a crawl in the workflow.</p>"
53015316
},
5317+
"CrawlId":{"type":"string"},
53025318
"CrawlList":{
53035319
"type":"list",
53045320
"member":{"shape":"Crawl"}
@@ -5394,12 +5410,71 @@
53945410
},
53955411
"LakeFormationConfiguration":{
53965412
"shape":"LakeFormationConfiguration",
5397-
"documentation":"<p>Specifies whether the crawler should use AWS Lake Formation credentials for the crawler instead of the IAM role credentials.</p>"
5413+
"documentation":"<p>Specifies whether the crawler should use Lake Formation credentials for the crawler instead of the IAM role credentials.</p>"
53985414
}
53995415
},
54005416
"documentation":"<p>Specifies a crawler program that examines a data source and uses classifiers to try to determine its schema. If successful, the crawler records metadata concerning the data source in the Glue Data Catalog.</p>"
54015417
},
54025418
"CrawlerConfiguration":{"type":"string"},
5419+
"CrawlerHistory":{
5420+
"type":"structure",
5421+
"members":{
5422+
"CrawlId":{
5423+
"shape":"CrawlId",
5424+
"documentation":"<p>A UUID identifier for each crawl.</p>"
5425+
},
5426+
"State":{
5427+
"shape":"CrawlerHistoryState",
5428+
"documentation":"<p>The state of the crawl.</p>"
5429+
},
5430+
"StartTime":{
5431+
"shape":"Timestamp",
5432+
"documentation":"<p>The date and time on which the crawl started.</p>"
5433+
},
5434+
"EndTime":{
5435+
"shape":"Timestamp",
5436+
"documentation":"<p>The date and time on which the crawl ended.</p>"
5437+
},
5438+
"Summary":{
5439+
"shape":"NameString",
5440+
"documentation":"<p>A run summary for the specific crawl in JSON. Contains the catalog tables and partitions that were added, updated, or deleted.</p>"
5441+
},
5442+
"ErrorMessage":{
5443+
"shape":"DescriptionString",
5444+
"documentation":"<p>If an error occurred, the error message associated with the crawl.</p>"
5445+
},
5446+
"LogGroup":{
5447+
"shape":"LogGroup",
5448+
"documentation":"<p>The log group associated with the crawl.</p>"
5449+
},
5450+
"LogStream":{
5451+
"shape":"LogStream",
5452+
"documentation":"<p>The log stream associated with the crawl.</p>"
5453+
},
5454+
"MessagePrefix":{
5455+
"shape":"MessagePrefix",
5456+
"documentation":"<p>The prefix for a CloudWatch message about this crawl.</p>"
5457+
},
5458+
"DPUHour":{
5459+
"shape":"NonNegativeDouble",
5460+
"documentation":"<p>The number of data processing units (DPU) used in hours for the crawl.</p>"
5461+
}
5462+
},
5463+
"documentation":"<p>Contains the information for a run of a crawler.</p>"
5464+
},
5465+
"CrawlerHistoryList":{
5466+
"type":"list",
5467+
"member":{"shape":"CrawlerHistory"}
5468+
},
5469+
"CrawlerHistoryState":{
5470+
"type":"string",
5471+
"enum":[
5472+
"RUNNING",
5473+
"COMPLETED",
5474+
"FAILED",
5475+
"STOPPED"
5476+
]
5477+
},
54035478
"CrawlerLineageSettings":{
54045479
"type":"string",
54055480
"enum":[
@@ -5545,6 +5620,28 @@
55455620
},
55465621
"documentation":"<p>Specifies data stores to crawl.</p>"
55475622
},
5623+
"CrawlsFilter":{
5624+
"type":"structure",
5625+
"members":{
5626+
"FieldName":{
5627+
"shape":"FieldName",
5628+
"documentation":"<p>A key used to filter the crawler runs for a specified crawler. Valid values for each of the field names are:</p> <ul> <li> <p> <code>CRAWL_ID</code>: A string representing the UUID identifier for a crawl.</p> </li> <li> <p> <code>STATE</code>: A string representing the state of the crawl.</p> </li> <li> <p> <code>START_TIME</code> and <code>END_TIME</code>: The epoch timestamp in milliseconds.</p> </li> <li> <p> <code>DPU_HOUR</code>: The number of data processing unit (DPU) hours used for the crawl.</p> </li> </ul>"
5629+
},
5630+
"FilterOperator":{
5631+
"shape":"FilterOperator",
5632+
"documentation":"<p>A defined comparator that operates on the value. The available operators are:</p> <ul> <li> <p> <code>GT</code>: Greater than.</p> </li> <li> <p> <code>GE</code>: Greater than or equal to.</p> </li> <li> <p> <code>LT</code>: Less than.</p> </li> <li> <p> <code>LE</code>: Less than or equal to.</p> </li> <li> <p> <code>EQ</code>: Equal to.</p> </li> <li> <p> <code>NE</code>: Not equal to.</p> </li> </ul>"
5633+
},
5634+
"FieldValue":{
5635+
"shape":"GenericString",
5636+
"documentation":"<p>The value provided for comparison on the crawl field. </p>"
5637+
}
5638+
},
5639+
"documentation":"<p>A list of fields, comparators and value that you can use to filter the crawler runs for a specified crawler.</p>"
5640+
},
5641+
"CrawlsFilterList":{
5642+
"type":"list",
5643+
"member":{"shape":"CrawlsFilter"}
5644+
},
55485645
"CreateBlueprintRequest":{
55495646
"type":"structure",
55505647
"required":[
@@ -5680,7 +5777,10 @@
56805777
"shape":"LineageConfiguration",
56815778
"documentation":"<p>Specifies data lineage configuration settings for the crawler.</p>"
56825779
},
5683-
"LakeFormationConfiguration":{"shape":"LakeFormationConfiguration"},
5780+
"LakeFormationConfiguration":{
5781+
"shape":"LakeFormationConfiguration",
5782+
"documentation":"<p>Specifies Lake Formation configuration settings for the crawler.</p>"
5783+
},
56845784
"Configuration":{
56855785
"shape":"CrawlerConfiguration",
56865786
"documentation":"<p>Crawler configuration information. This versioned JSON string allows users to specify aspects of a crawler's behavior. For more information, see <a href=\"https://docs.aws.amazon.com/glue/latest/dg/crawler-configuration.html\">Configuring a Crawler</a>.</p>"
@@ -8172,6 +8272,16 @@
81728272
"type":"string",
81738273
"pattern":"[\\s\\S]*"
81748274
},
8275+
"FieldName":{
8276+
"type":"string",
8277+
"enum":[
8278+
"CRAWL_ID",
8279+
"STATE",
8280+
"START_TIME",
8281+
"END_TIME",
8282+
"DPU_HOUR"
8283+
]
8284+
},
81758285
"FieldType":{"type":"string"},
81768286
"FillMissingValues":{
81778287
"type":"structure",
@@ -8273,6 +8383,17 @@
82738383
"ISNULL"
82748384
]
82758385
},
8386+
"FilterOperator":{
8387+
"type":"string",
8388+
"enum":[
8389+
"GT",
8390+
"GE",
8391+
"LT",
8392+
"LE",
8393+
"EQ",
8394+
"NE"
8395+
]
8396+
},
82768397
"FilterString":{
82778398
"type":"string",
82788399
"max":2048,
@@ -11656,14 +11777,14 @@
1165611777
"members":{
1165711778
"UseLakeFormationCredentials":{
1165811779
"shape":"NullableBoolean",
11659-
"documentation":"<p>Specifies whether to use AWS Lake Formation credentials for the crawler instead of the IAM role credentials.</p>"
11780+
"documentation":"<p>Specifies whether to use Lake Formation credentials for the crawler instead of the IAM role credentials.</p>"
1166011781
},
1166111782
"AccountId":{
1166211783
"shape":"AccountId",
1166311784
"documentation":"<p>Required for cross account crawls. For same account crawls as the target data, this can be left as null.</p>"
1166411785
}
1166511786
},
11666-
"documentation":"<p>Specifies AWS Lake Formation configuration settings for the crawler.</p>"
11787+
"documentation":"<p>Specifies Lake Formation configuration settings for the crawler.</p>"
1166711788
},
1166811789
"Language":{
1166911790
"type":"string",
@@ -11815,6 +11936,41 @@
1181511936
}
1181611937
}
1181711938
},
11939+
"ListCrawlsRequest":{
11940+
"type":"structure",
11941+
"required":["CrawlerName"],
11942+
"members":{
11943+
"CrawlerName":{
11944+
"shape":"NameString",
11945+
"documentation":"<p>The name of the crawler whose runs you want to retrieve.</p>"
11946+
},
11947+
"MaxResults":{
11948+
"shape":"PageSize",
11949+
"documentation":"<p>The maximum number of results to return. The default is 20, and maximum is 100.</p>"
11950+
},
11951+
"Filters":{
11952+
"shape":"CrawlsFilterList",
11953+
"documentation":"<p>Filters the crawls by the criteria you specify in a list of <code>CrawlsFilter</code> objects.</p>"
11954+
},
11955+
"NextToken":{
11956+
"shape":"Token",
11957+
"documentation":"<p>A continuation token, if this is a continuation call.</p>"
11958+
}
11959+
}
11960+
},
11961+
"ListCrawlsResponse":{
11962+
"type":"structure",
11963+
"members":{
11964+
"Crawls":{
11965+
"shape":"CrawlerHistoryList",
11966+
"documentation":"<p>A list of <code>CrawlerHistory</code> objects representing the crawl runs that meet your criteria.</p>"
11967+
},
11968+
"NextToken":{
11969+
"shape":"Token",
11970+
"documentation":"<p>A continuation token for paginating the returned list of tokens, returned if the current segment of the list is not the last.</p>"
11971+
}
11972+
}
11973+
},
1181811974
"ListCustomEntityTypesRequest":{
1181911975
"type":"structure",
1182011976
"members":{
@@ -16895,7 +17051,10 @@
1689517051
"shape":"LineageConfiguration",
1689617052
"documentation":"<p>Specifies data lineage configuration settings for the crawler.</p>"
1689717053
},
16898-
"LakeFormationConfiguration":{"shape":"LakeFormationConfiguration"},
17054+
"LakeFormationConfiguration":{
17055+
"shape":"LakeFormationConfiguration",
17056+
"documentation":"<p>Specifies Lake Formation configuration settings for the crawler.</p>"
17057+
},
1689917058
"Configuration":{
1690017059
"shape":"CrawlerConfiguration",
1690117060
"documentation":"<p>Crawler configuration information. This versioned JSON string allows users to specify aspects of a crawler's behavior. For more information, see <a href=\"https://docs.aws.amazon.com/glue/latest/dg/crawler-configuration.html\">Configuring a Crawler</a>.</p>"

0 commit comments

Comments
 (0)