|
14 | 14 | "$ref": "#/$defs/DataCatererValidation" |
15 | 15 | } |
16 | 16 | ], |
17 | | - "additionalProperties": false, |
18 | 17 | "$defs": { |
19 | 18 | "DataCatererPlan": { |
20 | 19 | "type": "object", |
|
76 | 75 | "$ref": "#/$defs/ForeignKeyRelation" |
77 | 76 | } |
78 | 77 | } |
79 | | - } |
| 78 | + }, |
| 79 | + "required": ["source"], |
| 80 | + "additionalProperties": false |
80 | 81 | } |
81 | 82 | }, |
82 | 83 | "seed": { |
|
156 | 157 | }, |
157 | 158 | "perField": { |
158 | 159 | "type": "object", |
159 | | - "description": "Generate records per unique set of column values. For example, generate 5 transactions for each 'account_number'.", |
| 160 | + "description": "Generate records per unique set of field values. For example, generate 5 transactions for each 'account_number'.", |
160 | 161 | "properties": { |
161 | 162 | "fieldNames": { |
162 | 163 | "type": "array", |
163 | | - "description": "Array of column names to generate records for each set of unique values.", |
| 164 | + "description": "Array of field names; records are generated for each unique set of values of these fields.", |
164 | 165 | "items": { |
165 | 166 | "type": "string", |
166 | | - "description": "Column name found within schema fields." |
| 167 | + "description": "Field name found within schema fields." |
167 | 168 | } |
168 | 169 | }, |
169 | 170 | "count": { |
170 | 171 | "type": "integer", |
171 | | - "description": "Static number of records per unique set of column values." |
| 172 | + "description": "Static number of records per unique set of field values." |
172 | 173 | }, |
173 | 174 | "options": { |
174 | | - "description": "Random number of records per unique set of column values.", |
| 175 | + "description": "Random number of records per unique set of field values.", |
175 | 176 | "$ref": "#/$defs/CountGeneratorOptions" |
176 | 177 | } |
177 | 178 | }, |
|
272 | 273 | }, |
273 | 274 | "partitionBy": { |
274 | 275 | "type": "string", |
275 | | - "description": "Column name(s) to partition dataset by (comma separated)." |
| 276 | + "description": "Field name(s) to partition dataset by (comma separated)." |
276 | 277 | } |
277 | 278 | }, |
278 | 279 | "required": ["path"] |
|
539 | 540 | "unevaluatedProperties": false |
540 | 541 | } |
541 | 542 | } |
542 | | - }, |
543 | | - "additionalProperties": false |
| 543 | + } |
544 | 544 | }, |
545 | 545 | "DataCatererValidation": { |
546 | 546 | "type": "object", |
|
589 | 589 | "$ref": "#/$defs/UpstreamValidation" |
590 | 590 | }, |
591 | 591 | { |
592 | | - "$ref": "#/$defs/ColumnNameValidation" |
| 592 | + "$ref": "#/$defs/FieldNameValidation" |
593 | 593 | } |
594 | 594 | ] |
595 | 595 | } |
|
612 | 612 | "type": "array", |
613 | 613 | "description": "Name of the field(s) to relate with." |
614 | 614 | } |
615 | | - } |
| 615 | + }, |
| 616 | + "additionalProperties": false |
616 | 617 | }, |
617 | 618 | "EnvironmentVariables": { |
618 | 619 | "type": "object", |
|
714 | 715 | "type": "number", |
715 | 716 | "description": "Mean of generated values.", |
716 | 717 | "default": 500.0 |
| 718 | + }, |
| 719 | + "distribution": { |
| 720 | + "type": "string", |
| 721 | + "description": "Type of distribution that generated values follow.", |
| 722 | + "enum": ["normal", "exponential"] |
| 723 | + }, |
| 724 | + "distributionRateParam": { |
| 725 | + "type": "number", |
| 726 | + "description": "Rate parameter of the exponential distribution. Only used when distribution is `exponential`." |
717 | 727 | } |
718 | 728 | }, |
719 | 729 | "allOf": [ |
|
1097 | 1107 | }, |
1098 | 1108 | "ValidationSelectExpression": { |
1099 | 1109 | "const": "selectExpr", |
1100 | | - "description": "SQL expression used to apply to columns before running validations." |
| 1110 | + "description": "SQL expression applied to fields before running validations." |
1101 | 1111 | }, |
1102 | 1112 | "ValidationAggregateExpression": { |
1103 | 1113 | "const": "aggExpr", |
1104 | 1114 | "description": "SQL expression to define validation after aggregation. Check https://spark.apache.org/docs/latest/api/sql for reference." |
1105 | 1115 | }, |
1106 | | - "ValidationAggregateColumn": { |
1107 | | - "const": "aggCol", |
1108 | | - "description": "Column name to run aggregation on." |
| 1116 | + "ValidationAggregateField": { |
| 1117 | + "const": "aggField", |
| 1118 | + "description": "Field name to run aggregation on." |
1109 | 1119 | }, |
1110 | 1120 | "ValidationAggregateType": { |
1111 | 1121 | "const": "aggType", |
1112 | 1122 | "description": "Type of aggregation to run. One of: sum, avg, max, min, mean, stddev, count." |
1113 | 1123 | }, |
1114 | | - "ValidationAggregateGroupByColumns": { |
1115 | | - "const": "groupByCols", |
1116 | | - "description": "Column names to group by for aggregation calculation." |
| 1124 | + "ValidationAggregateGroupByFields": { |
| 1125 | + "const": "groupByFields", |
| 1126 | + "description": "Field names to group by for aggregation calculation." |
1117 | 1127 | }, |
1118 | | - "ValidationUpstreamJoinColumns": { |
1119 | | - "const": "joinColumns", |
1120 | | - "description": "Column names to run join operation on." |
| 1128 | + "ValidationUpstreamJoinFields": { |
| 1129 | + "const": "joinFields", |
| 1130 | + "description": "Field names to run join operation on." |
1121 | 1131 | }, |
1122 | 1132 | "ValidationUpstreamJoinType": { |
1123 | 1133 | "const": "joinType", |
|
1135 | 1145 | "const": "validation", |
1136 | 1146 | "description": "Validation to run after join with upstream data source." |
1137 | 1147 | }, |
1138 | | - "ValidationColumnNameType": { |
1139 | | - "const": "columnNameType", |
1140 | | - "description": "Type of column name validation to run." |
| 1148 | + "ValidationFieldNameType": { |
| 1149 | + "const": "fieldNameType", |
| 1150 | + "description": "Type of field name validation to run." |
1141 | 1151 | }, |
1142 | | - "ValidationColumnNameCount": { |
| 1152 | + "ValidationFieldNameCount": { |
1143 | 1153 | "const": "count", |
1144 | | - "description": "Expected number of column names." |
| 1154 | + "description": "Expected number of field names." |
1145 | 1155 | }, |
1146 | | - "ValidationColumnNameMaxCount": { |
| 1156 | + "ValidationFieldNameMaxCount": { |
1147 | 1157 | "const": "maxCount", |
1148 | | - "description": "Maximum number of column names." |
| 1158 | + "description": "Maximum number of field names." |
1149 | 1159 | }, |
1150 | | - "ValidationColumnNameMinCount": { |
| 1160 | + "ValidationFieldNameMinCount": { |
1151 | 1161 | "const": "minCount", |
1152 | | - "description": "Minimum number of column names." |
| 1162 | + "description": "Minimum number of field names." |
1153 | 1163 | }, |
1154 | | - "ValidationColumnNames": { |
| 1164 | + "ValidationFieldNames": { |
1155 | 1165 | "const": "names", |
1156 | | - "description": "Expected column names." |
| 1166 | + "description": "Expected field names." |
1157 | 1167 | }, |
1158 | 1168 | "BasicValidation": { |
1159 | 1169 | "type": "object", |
|
1191 | 1201 | "$ref": "#/$defs/ValidationPreFilterExpression" |
1192 | 1202 | }, |
1193 | 1203 | { |
1194 | | - "$ref": "#/$defs/ValidationAggregateColumn" |
| 1204 | + "$ref": "#/$defs/ValidationAggregateField" |
1195 | 1205 | }, |
1196 | 1206 | { |
1197 | 1207 | "$ref": "#/$defs/ValidationAggregateExpression" |
1198 | 1208 | }, |
1199 | 1209 | { |
1200 | | - "$ref": "#/$defs/ValidationAggregateGroupByColumns" |
| 1210 | + "$ref": "#/$defs/ValidationAggregateGroupByFields" |
1201 | 1211 | }, |
1202 | 1212 | { |
1203 | 1213 | "$ref": "#/$defs/ValidationAggregateType" |
|
1222 | 1232 | "$ref": "#/$defs/ValidationUpstreamDataSource" |
1223 | 1233 | }, |
1224 | 1234 | { |
1225 | | - "$ref": "#/$defs/ValidationUpstreamJoinColumns" |
| 1235 | + "$ref": "#/$defs/ValidationUpstreamJoinFields" |
1226 | 1236 | }, |
1227 | 1237 | { |
1228 | 1238 | "$ref": "#/$defs/ValidationUpstreamJoinType" |
|
1236 | 1246 | ] |
1237 | 1247 | } |
1238 | 1248 | }, |
1239 | | - "ColumnNameValidation": { |
| 1249 | + "FieldNameValidation": { |
1240 | 1250 | "type": "object", |
1241 | 1251 | "propertyNames": { |
1242 | 1252 | "anyOf": [ |
|
1250 | 1260 | "$ref": "#/$defs/ValidationPreFilterExpression" |
1251 | 1261 | }, |
1252 | 1262 | { |
1253 | | - "$ref": "#/$defs/ValidationColumnNameCount" |
| 1263 | + "$ref": "#/$defs/ValidationFieldNameCount" |
1254 | 1264 | }, |
1255 | 1265 | { |
1256 | | - "$ref": "#/$defs/ValidationColumnNameMaxCount" |
| 1266 | + "$ref": "#/$defs/ValidationFieldNameMaxCount" |
1257 | 1267 | }, |
1258 | 1268 | { |
1259 | | - "$ref": "#/$defs/ValidationColumnNameMinCount" |
| 1269 | + "$ref": "#/$defs/ValidationFieldNameMinCount" |
1260 | 1270 | }, |
1261 | 1271 | { |
1262 | | - "$ref": "#/$defs/ValidationColumnNames" |
| 1272 | + "$ref": "#/$defs/ValidationFieldNames" |
1263 | 1273 | }, |
1264 | 1274 | { |
1265 | | - "$ref": "#/$defs/ValidationColumnNameType" |
| 1275 | + "$ref": "#/$defs/ValidationFieldNameType" |
1266 | 1276 | } |
1267 | 1277 | ] |
1268 | 1278 | } |
|
0 commit comments