[
{
"name": "No rows with ill-formed text",
"description": "Asserts that there are no rows with more non-alpha characters than alpha characters",
"type": "integrity",
"subtype": "illFormedRowCount",
"thresholds": [
{
"insightName": "illFormedRowCount",
"insightParameters": [{ "name": "column_name", "value": "output" }], // Check column `output`
"measurement": "illFormedRowCount", // Using the absolute row count
"operator": "<=",
"value": 0
}
],
"subpopulationFilters": null,
"mode": "development",
"usesValidationDataset": true, // Apply test to the validation set
"usesTrainingDataset": false,
"usesMlModel": false,
"syncId": "b4dee7dc-4f15-48ca-a282-63e2c04e0689" // Some unique id
},
{
"name": "Less than 20% of rows with ill-formed text",
"description": "Asserts that less than 20% of the rows have more non-alpha characters than alpha characters",
"type": "integrity",
"subtype": "illFormedRowCount",
"thresholds": [
{
"insightName": "illFormedRowCount",
"insightParameters": [{ "name": "column_name", "value": "output" }], // Check column `output`
"measurement": "illFormedRowPercentage", // Using the absolute row count
"operator": "<",
"value": 0.2
}
],
"subpopulationFilters": null,
"mode": "development",
"usesValidationDataset": true, // Apply test to the validation set
"usesTrainingDataset": false,
"usesMlModel": false,
"syncId": "96622fba-ea00-4e42-8f42-5e8f5f60805f" // Some unique id
}
]