Skip to content

Commit 2d623bb

Browse files
Add dataset cleaning operations for multiple columns
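This JSON file contains a series of four text-transform operations, one for each of the 'materialDS', 'centuryDS', 'placeDS', and 'dsItemID' columns of a dataset. Each operation uses the GREL expression value.replace(...) to replace every occurrence of the literal string "https://catalog.digital-scriptorium.org/entity/" with an empty string. The match is a plain string match, not a regular expression, and a cell keeps its original value if the expression raises an error.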
1 parent a954fc0 commit 2d623bb

1 file changed

Lines changed: 54 additions & 0 deletions

File tree

Lines changed: 54 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,54 @@
1+
[
2+
{
3+
"op": "core/text-transform",
4+
"engineConfig": {
5+
"facets": [],
6+
"mode": "row-based"
7+
},
8+
"columnName": "materialDS",
9+
"expression": "grel:value.replace(\"https://catalog.digital-scriptorium.org/entity/\",\"\")",
10+
"onError": "keep-original",
11+
"repeat": false,
12+
"repeatCount": 10,
13+
"description": "Text transform on cells in column materialDS using expression grel:value.replace(\"https://catalog.digital-scriptorium.org/entity/\",\"\")"
14+
},
15+
{
16+
"op": "core/text-transform",
17+
"engineConfig": {
18+
"facets": [],
19+
"mode": "row-based"
20+
},
21+
"columnName": "centuryDS",
22+
"expression": "grel:value.replace(\"https://catalog.digital-scriptorium.org/entity/\",\"\")",
23+
"onError": "keep-original",
24+
"repeat": false,
25+
"repeatCount": 10,
26+
"description": "Text transform on cells in column centuryDS using expression grel:value.replace(\"https://catalog.digital-scriptorium.org/entity/\",\"\")"
27+
},
28+
{
29+
"op": "core/text-transform",
30+
"engineConfig": {
31+
"facets": [],
32+
"mode": "row-based"
33+
},
34+
"columnName": "placeDS",
35+
"expression": "grel:value.replace(\"https://catalog.digital-scriptorium.org/entity/\",\"\")",
36+
"onError": "keep-original",
37+
"repeat": false,
38+
"repeatCount": 10,
39+
"description": "Text transform on cells in column placeDS using expression grel:value.replace(\"https://catalog.digital-scriptorium.org/entity/\",\"\")"
40+
},
41+
{
42+
"op": "core/text-transform",
43+
"engineConfig": {
44+
"facets": [],
45+
"mode": "row-based"
46+
},
47+
"columnName": "dsItemID",
48+
"expression": "grel:value.replace(\"https://catalog.digital-scriptorium.org/entity/\",\"\")",
49+
"onError": "keep-original",
50+
"repeat": false,
51+
"repeatCount": 10,
52+
"description": "Text transform on cells in column dsItemID using expression grel:value.replace(\"https://catalog.digital-scriptorium.org/entity/\",\"\")"
53+
}
54+
]

0 commit comments

Comments
 (0)