/
config-example.json
94 lines (94 loc) · 1.54 KB
/
config-example.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
{
"table": "file:///PATH TO data.csv found in examples directory",
"inferSchema": true,
"delimiter": ",",
"header": true,
"output": "/tmp/output.json",
"verbose": true,
"metrics": [
{
"metric": "completeness"
},
{
"metric": "completeness",
"columns": [
0,
1
]
},
{
"metric": "deduplication",
"columns": [
"c0",
"c1"
]
},
{
"metric": "deduplication"
},
{
"metric": "rule",
"conditions": [ {
"column": 0,
"operator": "lt",
"value": 5
}, {
"column": 0,
"operator": "gt",
"value": 1
} ]
},
{
"metric": "groupRule",
"columns": [
"c0",
"c1"
],
"having": [
{
"column": "*",
"aggregator": "count",
"operator": "gt",
"value": 2
}
],
"conditions": [
{
"column": 2,
"operator": "lt",
"value": 4
}
]
},
{
"metric": "entropy",
"column": 0
},
{
"metric": "entropy",
"column": "c0"
},
{
"metric": "mutual_info",
"when": "c0",
"then": "c1"
},
{
"metric": "constraint",
"when": [
"c0",
1
],
"then": [
2
],
"conditions": [
{
"column": "d0",
"operator": "lt",
"value": 4
}
]
}
]
}