Skip to content

Instantly share code, notes, and snippets.

@magdmartin
Created April 24, 2015 19:53
Show Gist options
  • Save magdmartin/39dc178aeb1cb05759d7 to your computer and use it in GitHub Desktop.
Save magdmartin/39dc178aeb1cb05759d7 to your computer and use it in GitHub Desktop.
Extract Related Subjects from OCLC MARC XML in OpenRefine
[
  {
    "op": "core/multivalued-cell-split",
    "description": "Split multi-valued cells in column results",
    "columnName": "results",
    "keyColumnName": "OCLC_ID",
    "separator": "datafield",
    "mode": "plain"
  },
  {
    "op": "core/row-removal",
    "description": "Remove rows",
    "engineConfig": {
      "mode": "row-based",
      "facets": [
        {
          "type": "list",
          "name": "results",
          "columnName": "results",
          "expression": "value",
          "invert": false,
          "selectBlank": false,
          "selectError": false,
          "omitBlank": false,
          "omitError": false,
          "selection": [
            {
              "v": {
                "v": ">\n <",
                "l": ">\n <"
              }
            }
          ]
        }
      ]
    }
  },
  {
    "op": "core/column-split",
    "description": "Split column results by separator",
    "engineConfig": {
      "mode": "row-based",
      "facets": []
    },
    "columnName": "results",
    "mode": "separator",
    "separator": "<subfield",
    "regex": false,
    "maxColumns": 0,
    "guessCellType": true,
    "removeOriginalColumn": true
  },
  {
    "op": "core/fill-down",
    "description": "Fill down cells in column OCLC_ID",
    "engineConfig": {
      "mode": "row-based",
      "facets": []
    },
    "columnName": "OCLC_ID"
  },
  {
    "op": "core/column-reorder",
    "description": "Reorder columns",
    "columnNames": [
      "OCLC_ID",
      "results 1",
      "results 2"
    ]
  },
  {
    "op": "core/row-star",
    "description": "Star rows",
    "engineConfig": {
      "mode": "row-based",
      "facets": [
        {
          "type": "text",
          "name": "results 1",
          "columnName": "results 1",
          "query": "650",
          "mode": "text",
          "caseSensitive": false
        }
      ]
    },
    "starred": true
  },
  {
    "op": "core/row-removal",
    "description": "Remove rows",
    "engineConfig": {
      "mode": "row-based",
      "facets": [
        {
          "type": "list",
          "name": "Starred Rows",
          "columnName": "",
          "expression": "row.starred",
          "invert": false,
          "selectBlank": false,
          "selectError": false,
          "omitBlank": false,
          "omitError": false,
          "selection": [
            {
              "v": {
                "v": false,
                "l": "false"
              }
            }
          ]
        }
      ]
    }
  }
]
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment