-
Notifications
You must be signed in to change notification settings - Fork 0
/
diff_result.json
173 lines (173 loc) · 6.05 KB
/
diff_result.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
{
"dataMatch": false,
"differencessForKey": [
{
"columnsNotMatching": [
"age"
],
"computedUnmatchPair": [
{
"badCols": [
"age"
],
"distFormatted": [
{
"col": "name",
"colType": "string",
"value": "david"
},
{
"col": "age",
"colType": "string",
"value": "29"
},
{
"col": "zip",
"colType": "string",
"value": "2311"
},
{
"col": "location",
"colType": "string",
"value": "NC"
}
],
"srcFormatted": [
{
"col": "name",
"colType": "string",
"value": "david"
},
{
"col": "age",
"colType": "string",
"value": "31"
},
{
"col": "zip",
"colType": "string",
"value": "2311"
},
{
"col": "location",
"colType": "string",
"value": "NC"
}
]
}
],
"dist": [
"Vector(name:david \t , age:29 \t , zip:2311 \t , location:NC \t )\n"
],
"distRecordsCount": 1,
"key": [
{
"col": "name",
"colType": "string",
"value": "david"
}
],
"src": [
"Vector(name:david \t , age:31 \t , zip:2311 \t , location:NC \t )\n"
],
"srcRecordsCount": 1,
"totalRecordsMatched": 1
},
{
"columnsNotMatching": [],
"computedUnmatchPair": [
{
"badCols": [],
"distFormatted": [
{
"col": "name",
"colType": "string",
"value": "don"
},
{
"col": "age",
"colType": "string",
"value": "25"
},
{
"col": "zip",
"colType": "string",
"value": "2311"
},
{
"col": "location",
"colType": "string",
"value": "SC"
}
]
}
],
"dist": [
"Vector(name:don \t , age:25 \t , zip:2311 \t , location:SC \t )\n"
],
"distRecordsCount": 1,
"key": [
{
"col": "name",
"colType": "string",
"value": "don"
}
],
"src": [],
"srcRecordsCount": 0,
"totalRecordsMatched": 0
}
],
"distPath": "/data/input/person.csv",
"distRowCount": 4,
"inputData": {
"compareColumns": false,
"compareCommonColumnsOnly": false,
"distFile": {
"excludeColmns": [],
"header": true,
"srcDelimiter": ",",
"srcFormat": "CSV",
"srcPath": "/data/input/person.csv",
"transformations": [],
"useOtherSchema": false
},
"matchBoth": true,
"primaryKey": [
"name"
],
"process": true,
"srcFile": {
"excludeColmns": [],
"header": true,
"srcDelimiter": ",",
"srcFormat": "CSV",
"srcPath": "/data/input/person1.csv",
"transformations": [],
"useOtherSchema": false
},
"validateRowsCount": true
},
"reason": "TO_BE_IMPLEMENTED",
"srcPath": "/data/input/person1.csv",
"srcRowCount": 4,
"srcSampleStr": "RecordByKey(List(Cell(name,david,string)),List(age),1,1,1,List(Vector(name:david \t , age:31 \t , zip:2311 \t , location:NC \t )\n),List(Vector(name:david \t , age:29 \t , zip:2311 \t , location:NC \t )\n),Some(List(ComputedUnmatchPair(Some(List(Cell(name,david,string), Cell(age,31,string), Cell(zip,2311,string), Cell(location,NC,string))),Some(List(Cell(name,david,string), Cell(age,29,string), Cell(zip,2311,string), Cell(location,NC,string))),Some(List(age))))),None,None,None) \n RecordByKey(List(Cell(name,don,string)),List(),0,1,0,List(),List(Vector(name:don \t , age:25 \t , zip:2311 \t , location:SC \t )\n),Some(List(ComputedUnmatchPair(None,Some(List(Cell(name,don,string), Cell(age,25,string), Cell(zip,2311,string), Cell(location,SC,string))),Some(List())))),None,None,None)",
"stats": {
"columnsNotMatching": {
"age": 1
},
"columnsNotMatchingMap": {
"age": 1
},
"distDuplicateRecords": -1,
"distKeyCount": 3,
"distRecordsCount": 4,
"srcDuplicateRecords": -1,
"srcKeyCount": 3,
"srcRecordsCount": 4,
"totalDistRecordsMatching": 2,
"totalDistRecordsNotMatching": 2,
"totalSrcRecordsMatching": 2,
"totalSrcRecordsNotMatching": 1
}
}