Skip to content

Commit 331deed

Browse files
author
AWS
committed
AWS Glue Update: Added ability to create data quality rulesets for shared, cross-account Glue Data Catalog tables. Added support for dataset comparison rules through a new parameter called AdditionalDataSources. Enhanced the data quality results with a map containing profiled metric values.
1 parent a457c0a commit 331deed

File tree

2 files changed

+92
-3
lines changed

2 files changed

+92
-3
lines changed
Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,6 @@
1+
{
2+
"type": "feature",
3+
"category": "AWS Glue",
4+
"contributor": "",
5+
"description": "Added ability to create data quality rulesets for shared, cross-account Glue Data Catalog tables. Added support for dataset comparison rules through a new parameter called AdditionalDataSources. Enhanced the data quality results with a map containing profiled metric values."
6+
}

services/glue/src/main/resources/codegen-resources/service-2.json

Lines changed: 86 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -3420,6 +3420,10 @@
34203420
"type":"list",
34213421
"member":{"shape":"Action"}
34223422
},
3423+
"AdditionalOptionKeys":{
3424+
"type":"string",
3425+
"enum":["performanceTuning.caching"]
3426+
},
34233427
"AdditionalOptions":{
34243428
"type":"map",
34253429
"key":{"shape":"EnclosedInStringProperty"},
@@ -3518,14 +3522,14 @@
35183522
"members":{
35193523
"Key":{
35203524
"shape":"GenericString",
3521-
"documentation":"<p>The key when specifying a key-value pair.</p>"
3525+
"documentation":"<p>The key for the additional connection option.</p>"
35223526
},
35233527
"Value":{
35243528
"shape":"GenericString",
3525-
"documentation":"<p>The value when specifying a key-value pair.</p>"
3529+
"documentation":"<p>The value for the additional connection option.</p>"
35263530
}
35273531
},
3528-
"documentation":"<p>Specifies an Amazon Redshift data store.</p>"
3532+
"documentation":"<p>Specifies an optional value when connecting to the Redshift cluster.</p>"
35293533
},
35303534
"AmazonRedshiftAdvancedOptions":{
35313535
"type":"list",
@@ -5369,6 +5373,10 @@
53695373
"AmazonRedshiftTarget":{
53705374
"shape":"AmazonRedshiftTarget",
53715375
"documentation":"<p>Specifies a target that writes to a data target in Amazon Redshift.</p>"
5376+
},
5377+
"EvaluateDataQualityMultiFrame":{
5378+
"shape":"EvaluateDataQualityMultiFrame",
5379+
"documentation":"<p>Specifies your data quality evaluation criteria. Accepts multiple inputs and returns a collection of Dynamic Frames.</p>"
53725380
}
53735381
},
53745382
"documentation":"<p> <code>CodeGenConfigurationNode</code> enumerates all valid Node types. One and only one of its member variables can be populated.</p>"
@@ -7674,6 +7682,16 @@
76747682
"min":0,
76757683
"pattern":"[\\u0020-\\uD7FF\\uE000-\\uFFFD\\uD800\\uDC00-\\uDBFF\\uDFFF\\r\\n\\t]*"
76767684
},
7685+
"DQAdditionalOptions":{
7686+
"type":"map",
7687+
"key":{"shape":"AdditionalOptionKeys"},
7688+
"value":{"shape":"GenericString"}
7689+
},
7690+
"DQDLAliases":{
7691+
"type":"map",
7692+
"key":{"shape":"NodeName"},
7693+
"value":{"shape":"EnclosedInStringProperty"}
7694+
},
76777695
"DQDLString":{
76787696
"type":"string",
76797697
"max":65536,
@@ -7970,6 +7988,10 @@
79707988
"Result":{
79717989
"shape":"DataQualityRuleResultStatus",
79727990
"documentation":"<p>A pass or fail status for the rule.</p>"
7991+
},
7992+
"EvaluatedMetrics":{
7993+
"shape":"EvaluatedMetricsMap",
7994+
"documentation":"<p>A map of metrics associated with the evaluation of the rule.</p>"
79737995
}
79747996
},
79757997
"documentation":"<p>Describes the result of the evaluation of a data quality rule.</p>"
@@ -8124,6 +8146,10 @@
81248146
"DatabaseName":{
81258147
"shape":"NameString",
81268148
"documentation":"<p>The name of the database where the Glue table exists.</p>"
8149+
},
8150+
"CatalogId":{
8151+
"shape":"NameString",
8152+
"documentation":"<p>The catalog id where the Glue table exists.</p>"
81278153
}
81288154
},
81298155
"documentation":"<p>An object representing a Glue table.</p>"
@@ -8139,6 +8165,11 @@
81398165
},
81408166
"documentation":"<p>A data source (a Glue table) for which you want data quality results.</p>"
81418167
},
8168+
"DataSourceMap":{
8169+
"type":"map",
8170+
"key":{"shape":"NameString"},
8171+
"value":{"shape":"DataSource"}
8172+
},
81428173
"Database":{
81438174
"type":"structure",
81448175
"required":["Name"],
@@ -9551,6 +9582,50 @@
95519582
},
95529583
"documentation":"<p>Specifies your data quality evaluation criteria.</p>"
95539584
},
9585+
"EvaluateDataQualityMultiFrame":{
9586+
"type":"structure",
9587+
"required":[
9588+
"Name",
9589+
"Inputs",
9590+
"Ruleset"
9591+
],
9592+
"members":{
9593+
"Name":{
9594+
"shape":"NodeName",
9595+
"documentation":"<p>The name of the data quality evaluation.</p>"
9596+
},
9597+
"Inputs":{
9598+
"shape":"ManyInputs",
9599+
"documentation":"<p>The inputs of your data quality evaluation. The first input in this list is the primary data source.</p>"
9600+
},
9601+
"AdditionalDataSources":{
9602+
"shape":"DQDLAliases",
9603+
"documentation":"<p>The aliases of all data sources except primary.</p>"
9604+
},
9605+
"Ruleset":{
9606+
"shape":"DQDLString",
9607+
"documentation":"<p>The ruleset for your data quality evaluation.</p>"
9608+
},
9609+
"PublishingOptions":{
9610+
"shape":"DQResultsPublishingOptions",
9611+
"documentation":"<p>Options to configure how your results are published.</p>"
9612+
},
9613+
"AdditionalOptions":{
9614+
"shape":"DQAdditionalOptions",
9615+
"documentation":"<p>Options to configure runtime behavior of the transform.</p>"
9616+
},
9617+
"StopJobOnFailureOptions":{
9618+
"shape":"DQStopJobOnFailureOptions",
9619+
"documentation":"<p>Options to configure how your job will stop if your data quality evaluation fails.</p>"
9620+
}
9621+
},
9622+
"documentation":"<p>Specifies your data quality evaluation criteria.</p>"
9623+
},
9624+
"EvaluatedMetricsMap":{
9625+
"type":"map",
9626+
"key":{"shape":"NameString"},
9627+
"value":{"shape":"NullableDouble"}
9628+
},
95549629
"EvaluationMetrics":{
95559630
"type":"structure",
95569631
"required":["TransformType"],
@@ -10590,6 +10665,10 @@
1059010665
"ResultIds":{
1059110666
"shape":"DataQualityResultIdList",
1059210667
"documentation":"<p>A list of result IDs for the data quality results for the run.</p>"
10668+
},
10669+
"AdditionalDataSources":{
10670+
"shape":"DataSourceMap",
10671+
"documentation":"<p>A map of reference strings to additional data sources you can specify for an evaluation run.</p>"
1059310672
}
1059410673
}
1059510674
},
@@ -17996,6 +18075,10 @@
1799618075
"RulesetNames":{
1799718076
"shape":"RulesetNames",
1799818077
"documentation":"<p>A list of ruleset names.</p>"
18078+
},
18079+
"AdditionalDataSources":{
18080+
"shape":"DataSourceMap",
18081+
"documentation":"<p>A map of reference strings to additional data sources you can specify for an evaluation run.</p>"
1799918082
}
1800018083
}
1800118084
},

0 commit comments

Comments
 (0)