|
669 | 669 | "max":20,
|
670 | 670 | "min":0
|
671 | 671 | },
|
| 672 | + "ColumnSelector":{ |
| 673 | + "type":"structure", |
| 674 | + "members":{ |
| 675 | + "Regex":{ |
| 676 | + "shape":"ColumnName", |
| 677 | + "documentation":"<p>A regular expression for selecting a column from a dataset.</p>" |
| 678 | + }, |
| 679 | + "Name":{ |
| 680 | + "shape":"ColumnName", |
| 681 | + "documentation":"<p>The name of a column from a dataset.</p>" |
| 682 | + } |
| 683 | + }, |
| 684 | + "documentation":"<p>Selector of a column from a dataset for profile job configuration. One selector includes either a column name or a regular expression.</p>" |
| 685 | + }, |
| 686 | + "ColumnSelectorList":{ |
| 687 | + "type":"list", |
| 688 | + "member":{"shape":"ColumnSelector"}, |
| 689 | + "min":1 |
| 690 | + }, |
| 691 | + "ColumnStatisticsConfiguration":{ |
| 692 | + "type":"structure", |
| 693 | + "required":["Statistics"], |
| 694 | + "members":{ |
| 695 | + "Selectors":{ |
| 696 | + "shape":"ColumnSelectorList", |
| 697 | + "documentation":"<p>List of column selectors. Selectors can be used to select columns from the dataset. When selectors are undefined, configuration will be applied to all supported columns. </p>" |
| 698 | + }, |
| 699 | + "Statistics":{ |
| 700 | + "shape":"StatisticsConfiguration", |
| 701 | + "documentation":"<p>Configuration for evaluations. Statistics can be used to select evaluations and override parameters of evaluations. </p>" |
| 702 | + } |
| 703 | + }, |
| 704 | + "documentation":"<p>Configuration for column evaluations for a profile job. ColumnStatisticsConfiguration can be used to select evaluations and override parameters of evaluations for particular columns. </p>" |
| 705 | + }, |
| 706 | + "ColumnStatisticsConfigurationList":{ |
| 707 | + "type":"list", |
| 708 | + "member":{"shape":"ColumnStatisticsConfiguration"}, |
| 709 | + "min":1 |
| 710 | + }, |
672 | 711 | "CompressionFormat":{
|
673 | 712 | "type":"string",
|
674 | 713 | "enum":[
|
|
804 | 843 | "documentation":"<p>The maximum number of times to retry the job after a job run fails.</p>"
|
805 | 844 | },
|
806 | 845 | "OutputLocation":{"shape":"S3Location"},
|
| 846 | + "Configuration":{ |
| 847 | + "shape":"ProfileConfiguration", |
| 848 | + "documentation":"<p>Configuration for profile jobs. Used to select columns, do evaluations, and override default parameters of evaluations. When configuration is null, the profile job will run with default settings.</p>" |
| 849 | + }, |
807 | 850 | "RoleArn":{
|
808 | 851 | "shape":"Arn",
|
809 | 852 | "documentation":"<p>The Amazon Resource Name (ARN) of the Identity and Access Management (IAM) role to be assumed when DataBrew runs the job.</p>"
|
|
915 | 958 | },
|
916 | 959 | "DataCatalogOutputs":{
|
917 | 960 | "shape":"DataCatalogOutputList",
|
918 |
| - "documentation":"<p>One or more artifacts that represent the AWS Glue Data Catalog output from running the job.</p>" |
| 961 | + "documentation":"<p>One or more artifacts that represent the Glue Data Catalog output from running the job.</p>" |
| 962 | + }, |
| 963 | + "DatabaseOutputs":{ |
| 964 | + "shape":"DatabaseOutputList", |
| 965 | + "documentation":"<p>Represents a list of JDBC database output objects which defines the output destination for a DataBrew recipe job to write into.</p>" |
919 | 966 | },
|
920 | 967 | "ProjectName":{
|
921 | 968 | "shape":"ProjectName",
|
|
1081 | 1128 | "members":{
|
1082 | 1129 | "CatalogId":{
|
1083 | 1130 | "shape":"CatalogId",
|
1084 |
| - "documentation":"<p>The unique identifier of the AWS account that holds the Data Catalog that stores the data.</p>" |
| 1131 | + "documentation":"<p>The unique identifier of the Amazon Web Services account that holds the Data Catalog that stores the data.</p>" |
1085 | 1132 | },
|
1086 | 1133 | "DatabaseName":{
|
1087 | 1134 | "shape":"DatabaseName",
|
|
1093 | 1140 | },
|
1094 | 1141 | "S3Options":{
|
1095 | 1142 | "shape":"S3TableOutputOptions",
|
1096 |
| - "documentation":"<p>Represents options that specify how and where DataBrew writes the S3 output generated by recipe jobs.</p>" |
| 1143 | + "documentation":"<p>Represents options that specify how and where DataBrew writes the Amazon S3 output generated by recipe jobs.</p>" |
1097 | 1144 | },
|
1098 | 1145 | "DatabaseOptions":{
|
1099 | 1146 | "shape":"DatabaseTableOutputOptions",
|
|
1104 | 1151 | "documentation":"<p>A value that, if true, means that any data in the location specified for output is overwritten with new output. Not supported with DatabaseOptions.</p>"
|
1105 | 1152 | }
|
1106 | 1153 | },
|
1107 |
| - "documentation":"<p>Represents options that specify how and where DataBrew writes the output generated by recipe jobs.</p>" |
| 1154 | + "documentation":"<p>Represents options that specify how and where in the Glue Data Catalog DataBrew writes the output generated by recipe jobs.</p>" |
1108 | 1155 | },
|
1109 | 1156 | "DataCatalogOutputList":{
|
1110 | 1157 | "type":"list",
|
|
1135 | 1182 | "max":255,
|
1136 | 1183 | "min":1
|
1137 | 1184 | },
|
| 1185 | + "DatabaseOutput":{ |
| 1186 | + "type":"structure", |
| 1187 | + "required":[ |
| 1188 | + "GlueConnectionName", |
| 1189 | + "DatabaseOptions" |
| 1190 | + ], |
| 1191 | + "members":{ |
| 1192 | + "GlueConnectionName":{ |
| 1193 | + "shape":"GlueConnectionName", |
| 1194 | + "documentation":"<p>The Glue connection that stores the connection information for the target database.</p>" |
| 1195 | + }, |
| 1196 | + "DatabaseOptions":{ |
| 1197 | + "shape":"DatabaseTableOutputOptions", |
| 1198 | + "documentation":"<p>Represents options that specify how and where DataBrew writes the database output generated by recipe jobs.</p>" |
| 1199 | + }, |
| 1200 | + "DatabaseOutputMode":{ |
| 1201 | + "shape":"DatabaseOutputMode", |
| 1202 | + "documentation":"<p>The output mode to write into the database. Currently supported option: NEW_TABLE.</p>" |
| 1203 | + } |
| 1204 | + }, |
| 1205 | + "documentation":"<p>Represents a JDBC database output object which defines the output destination for a DataBrew recipe job to write into.</p>" |
| 1206 | + }, |
| 1207 | + "DatabaseOutputList":{ |
| 1208 | + "type":"list", |
| 1209 | + "member":{"shape":"DatabaseOutput"}, |
| 1210 | + "min":1 |
| 1211 | + }, |
| 1212 | + "DatabaseOutputMode":{ |
| 1213 | + "type":"string", |
| 1214 | + "enum":["NEW_TABLE"] |
| 1215 | + }, |
1138 | 1216 | "DatabaseTableName":{
|
1139 | 1217 | "type":"string",
|
1140 | 1218 | "max":255,
|
|
1545 | 1623 | },
|
1546 | 1624 | "DataCatalogOutputs":{
|
1547 | 1625 | "shape":"DataCatalogOutputList",
|
1548 |
| - "documentation":"<p>One or more artifacts that represent the AWS Glue Data Catalog output from running the job.</p>" |
| 1626 | + "documentation":"<p>One or more artifacts that represent the Glue Data Catalog output from running the job.</p>" |
| 1627 | + }, |
| 1628 | + "DatabaseOutputs":{ |
| 1629 | + "shape":"DatabaseOutputList", |
| 1630 | + "documentation":"<p>Represents a list of JDBC database output objects which defines the output destination for a DataBrew recipe job to write into.</p>" |
1549 | 1631 | },
|
1550 | 1632 | "ProjectName":{
|
1551 | 1633 | "shape":"ProjectName",
|
1552 | 1634 | "documentation":"<p>The DataBrew project associated with this job.</p>"
|
1553 | 1635 | },
|
| 1636 | + "ProfileConfiguration":{ |
| 1637 | + "shape":"ProfileConfiguration", |
| 1638 | + "documentation":"<p>Configuration for profile jobs. Used to select columns, do evaluations, and override default parameters of evaluations. When configuration is null, the profile job will run with default settings.</p>" |
| 1639 | + }, |
1554 | 1640 | "RecipeReference":{"shape":"RecipeReference"},
|
1555 | 1641 | "ResourceArn":{
|
1556 | 1642 | "shape":"Arn",
|
|
1623 | 1709 | "shape":"JobName",
|
1624 | 1710 | "documentation":"<p>The name of the job being processed during this run.</p>"
|
1625 | 1711 | },
|
| 1712 | + "ProfileConfiguration":{ |
| 1713 | + "shape":"ProfileConfiguration", |
| 1714 | + "documentation":"<p>Configuration for profile jobs. Used to select columns, do evaluations, and override default parameters of evaluations. When configuration is null, the profile job will run with default settings.</p>" |
| 1715 | + }, |
1626 | 1716 | "RunId":{
|
1627 | 1717 | "shape":"JobRunId",
|
1628 | 1718 | "documentation":"<p>The unique identifier of the job run.</p>"
|
|
1645 | 1735 | },
|
1646 | 1736 | "DataCatalogOutputs":{
|
1647 | 1737 | "shape":"DataCatalogOutputList",
|
1648 |
| - "documentation":"<p>One or more artifacts that represent the AWS Glue Data Catalog output from running the job.</p>" |
| 1738 | + "documentation":"<p>One or more artifacts that represent the Glue Data Catalog output from running the job.</p>" |
| 1739 | + }, |
| 1740 | + "DatabaseOutputs":{ |
| 1741 | + "shape":"DatabaseOutputList", |
| 1742 | + "documentation":"<p>Represents a list of JDBC database output objects which defines the output destination for a DataBrew recipe job to write into.</p>" |
1649 | 1743 | },
|
1650 | 1744 | "RecipeReference":{"shape":"RecipeReference"},
|
1651 | 1745 | "StartedBy":{
|
|
2067 | 2161 | },
|
2068 | 2162 | "DataCatalogOutputs":{
|
2069 | 2163 | "shape":"DataCatalogOutputList",
|
2070 |
| - "documentation":"<p>One or more artifacts that represent the AWS Glue Data Catalog output from running the job.</p>" |
| 2164 | + "documentation":"<p>One or more artifacts that represent the Glue Data Catalog output from running the job.</p>" |
| 2165 | + }, |
| 2166 | + "DatabaseOutputs":{ |
| 2167 | + "shape":"DatabaseOutputList", |
| 2168 | + "documentation":"<p>Represents a list of JDBC database output objects which defines the output destination for a DataBrew recipe job to write into.</p>" |
2071 | 2169 | },
|
2072 | 2170 | "ProjectName":{
|
2073 | 2171 | "shape":"ProjectName",
|
|
2163 | 2261 | },
|
2164 | 2262 | "DataCatalogOutputs":{
|
2165 | 2263 | "shape":"DataCatalogOutputList",
|
2166 |
| - "documentation":"<p>One or more artifacts that represent the AWS Glue Data Catalog output from running the job.</p>" |
| 2264 | + "documentation":"<p>One or more artifacts that represent the Glue Data Catalog output from running the job.</p>" |
| 2265 | + }, |
| 2266 | + "DatabaseOutputs":{ |
| 2267 | + "shape":"DatabaseOutputList", |
| 2268 | + "documentation":"<p>Represents a list of JDBC database output objects which defines the output destination for a DataBrew recipe job to write into.</p>" |
2167 | 2269 | },
|
2168 | 2270 | "RecipeReference":{
|
2169 | 2271 | "shape":"RecipeReference",
|
|
2606 | 2708 | "documentation":"<p>Represents options that define how DataBrew formats job output files.</p>"
|
2607 | 2709 | }
|
2608 | 2710 | },
|
2609 |
| - "documentation":"<p>Represents options that specify how and where DataBrew writes the output generated by recipe jobs or profile jobs.</p>" |
| 2711 | + "documentation":"<p>Represents options that specify how and where in Amazon S3 DataBrew writes the output generated by recipe jobs or profile jobs.</p>" |
2610 | 2712 | },
|
2611 | 2713 | "OutputFormat":{
|
2612 | 2714 | "type":"string",
|
|
2657 | 2759 | },
|
2658 | 2760 | "ParameterValue":{
|
2659 | 2761 | "type":"string",
|
2660 |
| - "max":12288, |
| 2762 | + "max":32768, |
2661 | 2763 | "min":1
|
2662 | 2764 | },
|
2663 | 2765 | "PathOptions":{
|
|
2692 | 2794 | "min":1
|
2693 | 2795 | },
|
2694 | 2796 | "Preview":{"type":"boolean"},
|
| 2797 | + "ProfileConfiguration":{ |
| 2798 | + "type":"structure", |
| 2799 | + "members":{ |
| 2800 | + "DatasetStatisticsConfiguration":{ |
| 2801 | + "shape":"StatisticsConfiguration", |
| 2802 | + "documentation":"<p>Configuration for inter-column evaluations. Configuration can be used to select evaluations and override parameters of evaluations. When configuration is undefined, the profile job will run all supported inter-column evaluations. </p>" |
| 2803 | + }, |
| 2804 | + "ProfileColumns":{ |
| 2805 | + "shape":"ColumnSelectorList", |
| 2806 | + "documentation":"<p>List of column selectors. ProfileColumns can be used to select columns from the dataset. When ProfileColumns is undefined, the profile job will profile all supported columns. </p>" |
| 2807 | + }, |
| 2808 | + "ColumnStatisticsConfigurations":{ |
| 2809 | + "shape":"ColumnStatisticsConfigurationList", |
| 2810 | + "documentation":"<p>List of configurations for column evaluations. ColumnStatisticsConfigurations are used to select evaluations and override parameters of evaluations for particular columns. When ColumnStatisticsConfigurations is undefined, the profile job will profile all supported columns and run all supported evaluations. </p>" |
| 2811 | + } |
| 2812 | + }, |
| 2813 | + "documentation":"<p>Configuration for profile jobs. Configuration can be used to select columns, do evaluations, and override default parameters of evaluations. When configuration is undefined, the profile job will apply default settings to all supported columns. </p>" |
| 2814 | + }, |
2695 | 2815 | "Project":{
|
2696 | 2816 | "type":"structure",
|
2697 | 2817 | "required":[
|
|
2983 | 3103 | "documentation":"<p>Represents an Amazon S3 location (bucket name and object key) where DataBrew can write output from a job.</p>"
|
2984 | 3104 | }
|
2985 | 3105 | },
|
2986 |
| - "documentation":"<p>Represents options that specify how and where DataBrew writes the S3 output generated by recipe jobs.</p>" |
| 3106 | + "documentation":"<p>Represents options that specify how and where DataBrew writes the Amazon S3 output generated by recipe jobs.</p>" |
2987 | 3107 | },
|
2988 | 3108 | "Sample":{
|
2989 | 3109 | "type":"structure",
|
|
3231 | 3351 | }
|
3232 | 3352 | },
|
3233 | 3353 | "StartedBy":{"type":"string"},
|
| 3354 | + "Statistic":{ |
| 3355 | + "type":"string", |
| 3356 | + "max":128, |
| 3357 | + "min":1, |
| 3358 | + "pattern":"^[A-Z\\_]+$" |
| 3359 | + }, |
| 3360 | + "StatisticList":{ |
| 3361 | + "type":"list", |
| 3362 | + "member":{"shape":"Statistic"}, |
| 3363 | + "min":1 |
| 3364 | + }, |
| 3365 | + "StatisticOverride":{ |
| 3366 | + "type":"structure", |
| 3367 | + "required":[ |
| 3368 | + "Statistic", |
| 3369 | + "Parameters" |
| 3370 | + ], |
| 3371 | + "members":{ |
| 3372 | + "Statistic":{ |
| 3373 | + "shape":"Statistic", |
| 3374 | + "documentation":"<p>The name of an evaluation.</p>" |
| 3375 | + }, |
| 3376 | + "Parameters":{ |
| 3377 | + "shape":"ParameterMap", |
| 3378 | + "documentation":"<p>A map that includes overrides of an evaluation’s parameters.</p>" |
| 3379 | + } |
| 3380 | + }, |
| 3381 | + "documentation":"<p>Override of a particular evaluation for a profile job. </p>" |
| 3382 | + }, |
| 3383 | + "StatisticOverrideList":{ |
| 3384 | + "type":"list", |
| 3385 | + "member":{"shape":"StatisticOverride"}, |
| 3386 | + "min":1 |
| 3387 | + }, |
| 3388 | + "StatisticsConfiguration":{ |
| 3389 | + "type":"structure", |
| 3390 | + "members":{ |
| 3391 | + "IncludedStatistics":{ |
| 3392 | + "shape":"StatisticList", |
| 3393 | + "documentation":"<p>List of included evaluations. When the list is undefined, all supported evaluations will be included.</p>" |
| 3394 | + }, |
| 3395 | + "Overrides":{ |
| 3396 | + "shape":"StatisticOverrideList", |
| 3397 | + "documentation":"<p>List of overrides for evaluations.</p>" |
| 3398 | + } |
| 3399 | + }, |
| 3400 | + "documentation":"<p>Configuration of evaluations for a profile job. This configuration can be used to select evaluations and override the parameters of selected evaluations. </p>" |
| 3401 | + }, |
3234 | 3402 | "StepIndex":{
|
3235 | 3403 | "type":"integer",
|
3236 | 3404 | "min":0
|
|
3401 | 3569 | "RoleArn"
|
3402 | 3570 | ],
|
3403 | 3571 | "members":{
|
| 3572 | + "Configuration":{ |
| 3573 | + "shape":"ProfileConfiguration", |
| 3574 | + "documentation":"<p>Configuration for profile jobs. Used to select columns, do evaluations, and override default parameters of evaluations. When configuration is null, the profile job will run with default settings.</p>" |
| 3575 | + }, |
3404 | 3576 | "EncryptionKeyArn":{
|
3405 | 3577 | "shape":"EncryptionKeyArn",
|
3406 | 3578 | "documentation":"<p>The Amazon Resource Name (ARN) of an encryption key that is used to protect the job.</p>"
|
|
3525 | 3697 | },
|
3526 | 3698 | "DataCatalogOutputs":{
|
3527 | 3699 | "shape":"DataCatalogOutputList",
|
3528 |
| - "documentation":"<p>One or more artifacts that represent the AWS Glue Data Catalog output from running the job.</p>" |
| 3700 | + "documentation":"<p>One or more artifacts that represent the Glue Data Catalog output from running the job.</p>" |
| 3701 | + }, |
| 3702 | + "DatabaseOutputs":{ |
| 3703 | + "shape":"DatabaseOutputList", |
| 3704 | + "documentation":"<p>Represents a list of JDBC database output objects which defines the output destination for a DataBrew recipe job to write into.</p>" |
3529 | 3705 | },
|
3530 | 3706 | "RoleArn":{
|
3531 | 3707 | "shape":"Arn",
|
|
0 commit comments