Skip to content

Instantly share code, notes, and snippets.

@hpiedcoq
Created March 27, 2015 14:02
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save hpiedcoq/e0c32ef72727ce65e80c to your computer and use it in GitHub Desktop.
Save hpiedcoq/e0c32ef72727ce65e80c to your computer and use it in GitHub Desktop.
Log IP traité via OpenRefine
[
{
"op": "core/row-removal",
"description": "Remove rows",
"engineConfig": {
"facets": [
{
"expression": "row.starred",
"invert": false,
"selectError": false,
"omitError": false,
"name": "Starred Rows",
"selectBlank": false,
"columnName": "",
"omitBlank": false,
"type": "list",
"selection": [
{
"v": {
"v": true,
"l": "true"
}
}
]
}
],
"mode": "row-based"
}
},
{
"op": "core/column-addition",
"description": "Create column IP at index 1 based on column Column 1 using expression grel:value.partition(\"ip=\\\"\")[2].partition(\"\\\"\")[0]",
"engineConfig": {
"facets": [],
"mode": "row-based"
},
"newColumnName": "IP",
"columnInsertIndex": 1,
"baseColumnName": "Column 1",
"expression": "grel:value.partition(\"ip=\\\"\")[2].partition(\"\\\"\")[0]",
"onError": "set-to-blank"
},
{
"op": "core/column-addition",
"description": "Create column Date at index 1 based on column Column 1 using expression grel:value.partition(\"date=\\\"\")[2].partition(\" \")[0]",
"engineConfig": {
"facets": [],
"mode": "row-based"
},
"newColumnName": "Date",
"columnInsertIndex": 1,
"baseColumnName": "Column 1",
"expression": "grel:value.partition(\"date=\\\"\")[2].partition(\" \")[0]",
"onError": "set-to-blank"
},
{
"op": "core/column-addition",
"description": "Create column Heure at index 1 based on column Column 1 using expression grel:value.partition(\"date=\\\"\")[2].partition(\" \")[2].partition(\"\\\"\")[0]",
"engineConfig": {
"facets": [],
"mode": "row-based"
},
"newColumnName": "Heure",
"columnInsertIndex": 1,
"baseColumnName": "Column 1",
"expression": "grel:value.partition(\"date=\\\"\")[2].partition(\" \")[2].partition(\"\\\"\")[0]",
"onError": "set-to-blank"
},
{
"op": "core/column-move",
"description": "Move column IP to position 0",
"columnName": "IP",
"index": 0
},
{
"op": "core/column-removal",
"description": "Remove column Column 1",
"columnName": "Column 1"
},
{
"op": "core/column-addition",
"description": "Create column Date et heure at index 2 based on column Heure using expression grel:cells[\"Date\"].value+\"-\"+value",
"engineConfig": {
"facets": [],
"mode": "row-based"
},
"newColumnName": "Date et heure",
"columnInsertIndex": 2,
"baseColumnName": "Heure",
"expression": "grel:cells[\"Date\"].value+\"-\"+value",
"onError": "set-to-blank"
},
{
"op": "core/column-removal",
"description": "Remove column Heure",
"columnName": "Heure"
},
{
"op": "core/column-removal",
"description": "Remove column Date",
"columnName": "Date"
},
{
"op": "core/row-reorder",
"description": "Reorder rows",
"mode": "record-based",
"sorting": {
"criteria": [
{
"reverse": true,
"column": "IP",
"caseSensitive": false,
"valueType": "string",
"blankPosition": 2,
"errorPosition": 1
}
]
}
},
{
"op": "core/blank-down",
"description": "Blank down cells in column IP",
"engineConfig": {
"facets": [],
"mode": "record-based"
},
"columnName": "IP"
},
{
"op": "core/multivalued-cell-join",
"description": "Join multi-valued cells in column Date et heure",
"columnName": "Date et heure",
"keyColumnName": "IP",
"separator": ";"
},
{
"op": "core/column-addition",
"description": "Create column URL at index 1 based on column IP using expression grel:\"http://www.telize.com/geoip/\"+value",
"engineConfig": {
"facets": [],
"mode": "record-based"
},
"newColumnName": "URL",
"columnInsertIndex": 1,
"baseColumnName": "IP",
"expression": "grel:\"http://www.telize.com/geoip/\"+value",
"onError": "set-to-blank"
},
{
"op": "core/column-addition-by-fetching-urls",
"description": "Create column Json at index 2 by fetching URLs based on column URL using expression grel:value",
"engineConfig": {
"facets": [],
"mode": "record-based"
},
"newColumnName": "Json",
"columnInsertIndex": 2,
"baseColumnName": "URL",
"urlExpression": "grel:value",
"onError": "set-to-blank",
"delay": 250
},
{
"op": "core/column-addition",
"description": "Create column Provider at index 3 based on column Json using expression grel:value.parseJson().isp",
"engineConfig": {
"facets": [],
"mode": "record-based"
},
"newColumnName": "Provider",
"columnInsertIndex": 3,
"baseColumnName": "Json",
"expression": "grel:value.parseJson().isp",
"onError": "set-to-blank"
},
{
"op": "core/column-addition",
"description": "Create column Pays at index 3 based on column Json using expression grel:value.parseJson().country",
"engineConfig": {
"facets": [],
"mode": "record-based"
},
"newColumnName": "Pays",
"columnInsertIndex": 3,
"baseColumnName": "Json",
"expression": "grel:value.parseJson().country",
"onError": "set-to-blank"
},
{
"op": "core/column-addition",
"description": "Create column Région at index 3 based on column Json using expression grel:value.parseJson().region",
"engineConfig": {
"facets": [],
"mode": "record-based"
},
"newColumnName": "Région",
"columnInsertIndex": 3,
"baseColumnName": "Json",
"expression": "grel:value.parseJson().region",
"onError": "set-to-blank"
},
{
"op": "core/column-addition",
"description": "Create column Lat at index 3 based on column Json using expression grel:value.parseJson().latitude",
"engineConfig": {
"facets": [],
"mode": "record-based"
},
"newColumnName": "Lat",
"columnInsertIndex": 3,
"baseColumnName": "Json",
"expression": "grel:value.parseJson().latitude",
"onError": "set-to-blank"
},
{
"op": "core/column-addition",
"description": "Create column Lon at index 3 based on column Json using expression grel:value.parseJson().longitude",
"engineConfig": {
"facets": [],
"mode": "record-based"
},
"newColumnName": "Lon",
"columnInsertIndex": 3,
"baseColumnName": "Json",
"expression": "grel:value.parseJson().longitude",
"onError": "set-to-blank"
},
{
"op": "core/column-removal",
"description": "Remove column Json",
"columnName": "Json"
},
{
"op": "core/column-removal",
"description": "Remove column URL",
"columnName": "URL"
},
{
"op": "core/column-addition",
"description": "Create column Lat,Lon at index 3 based on column Lat using expression grel:value+\", \"+cells[\"Lon\"].value",
"engineConfig": {
"facets": [],
"mode": "record-based"
},
"newColumnName": "Lat,Lon",
"columnInsertIndex": 3,
"baseColumnName": "Lat",
"expression": "grel:value+\", \"+cells[\"Lon\"].value",
"onError": "set-to-blank"
},
{
"op": "core/multivalued-cell-split",
"description": "Split multi-valued cells in column Date et heure",
"columnName": "Date et heure",
"keyColumnName": "IP",
"separator": ";",
"mode": "plain"
},
{
"op": "core/fill-down",
"description": "Fill down cells in column IP",
"engineConfig": {
"facets": [],
"mode": "record-based"
},
"columnName": "IP"
},
{
"op": "core/column-addition",
"description": "Create column Nbre de connexions at index 1 based on column IP using expression grel:facetCount(value,\"value\",\"IP\")",
"engineConfig": {
"facets": [],
"mode": "record-based"
},
"newColumnName": "Nbre de connexions",
"columnInsertIndex": 1,
"baseColumnName": "IP",
"expression": "grel:facetCount(value,\"value\",\"IP\")",
"onError": "set-to-blank"
},
{
"op": "core/blank-down",
"description": "Blank down cells in column Nbre de connexions",
"engineConfig": {
"facets": [],
"mode": "record-based"
},
"columnName": "Nbre de connexions"
},
{
"op": "core/blank-down",
"description": "Blank down cells in column IP",
"engineConfig": {
"facets": [],
"mode": "record-based"
},
"columnName": "IP"
},
{
"op": "core/multivalued-cell-join",
"description": "Join multi-valued cells in column Date et heure",
"columnName": "Date et heure",
"keyColumnName": "IP",
"separator": ";"
},
{
"op": "core/row-reorder",
"description": "Reorder rows",
"mode": "record-based",
"sorting": {
"criteria": [
{
"reverse": true,
"column": "Nbre de connexions",
"valueType": "number",
"blankPosition": 2,
"errorPosition": 1
}
]
}
},
{
"op": "core/row-removal",
"description": "Remove rows",
"engineConfig": {
"facets": [
{
"invert": false,
"expression": "row.starred",
"selectError": false,
"omitError": false,
"selectBlank": false,
"name": "Starred Rows",
"omitBlank": false,
"columnName": "",
"type": "list",
"selection": [
{
"v": {
"v": true,
"l": "true"
}
}
]
}
],
"mode": "row-based"
}
},
{
"op": "core/column-move",
"description": "Move column IP to position 0",
"columnName": "IP",
"index": 0
},
{
"op": "core/row-reorder",
"description": "Reorder rows",
"mode": "record-based",
"sorting": {
"criteria": [
{
"reverse": true,
"caseSensitive": false,
"column": "IP",
"valueType": "string",
"blankPosition": 2,
"errorPosition": 1
}
]
}
},
{
"op": "core/blank-down",
"description": "Blank down cells in column IP",
"engineConfig": {
"facets": [],
"mode": "record-based"
},
"columnName": "IP"
},
{
"op": "core/multivalued-cell-join",
"description": "Join multi-valued cells in column Date et heure",
"columnName": "Date et heure",
"keyColumnName": "IP",
"separator": ";"
},
{
"op": "core/column-addition",
"description": "Create column URL at index 1 based on column IP using expression grel:\"http://www.telize.com/geoip/\"+value",
"engineConfig": {
"facets": [],
"mode": "record-based"
},
"newColumnName": "URL",
"columnInsertIndex": 1,
"baseColumnName": "IP",
"expression": "grel:\"http://www.telize.com/geoip/\"+value",
"onError": "set-to-blank"
},
{
"op": "core/column-addition-by-fetching-urls",
"description": "Create column test at index 2 by fetching URLs based on column URL using expression grel:value",
"engineConfig": {
"facets": [
{
"invert": false,
"expression": "row.starred",
"selectError": false,
"omitError": false,
"selectBlank": false,
"name": "Starred Rows",
"omitBlank": false,
"columnName": "",
"type": "list",
"selection": [
{
"v": {
"v": true,
"l": "true"
}
}
]
}
],
"mode": "row-based"
},
"newColumnName": "test",
"columnInsertIndex": 2,
"baseColumnName": "URL",
"urlExpression": "grel:value",
"onError": "set-to-blank",
"delay": 6000
},
{
"op": "core/column-removal",
"description": "Remove column test",
"columnName": "test"
},
{
"op": "core/column-addition-by-fetching-urls",
"description": "Create column tesing at index 2 by fetching URLs based on column URL using expression grel:value",
"engineConfig": {
"facets": [
{
"invert": false,
"expression": "row.starred",
"selectError": false,
"omitError": false,
"selectBlank": false,
"name": "Starred Rows",
"omitBlank": false,
"columnName": "",
"type": "list",
"selection": [
{
"v": {
"v": true,
"l": "true"
}
}
]
}
],
"mode": "row-based"
},
"newColumnName": "tesing",
"columnInsertIndex": 2,
"baseColumnName": "URL",
"urlExpression": "grel:value",
"onError": "set-to-blank",
"delay": 10000
},
{
"op": "core/column-removal",
"description": "Remove column tesing",
"columnName": "tesing"
},
{
"op": "core/column-addition-by-fetching-urls",
"description": "Create column tesdt at index 2 by fetching URLs based on column URL using expression grel:value",
"engineConfig": {
"facets": [
{
"invert": false,
"expression": "row.starred",
"selectError": false,
"omitError": false,
"selectBlank": false,
"name": "Starred Rows",
"omitBlank": false,
"columnName": "",
"type": "list",
"selection": [
{
"v": {
"v": true,
"l": "true"
}
}
]
}
],
"mode": "row-based"
},
"newColumnName": "tesdt",
"columnInsertIndex": 2,
"baseColumnName": "URL",
"urlExpression": "grel:value",
"onError": "set-to-blank",
"delay": 15000
},
{
"op": "core/column-removal",
"description": "Remove column tesdt",
"columnName": "tesdt"
},
{
"op": "core/column-addition-by-fetching-urls",
"description": "Create column test at index 2 by fetching URLs based on column URL using expression grel:value",
"engineConfig": {
"facets": [
{
"invert": false,
"expression": "row.starred",
"selectError": false,
"omitError": false,
"selectBlank": false,
"name": "Starred Rows",
"omitBlank": false,
"columnName": "",
"type": "list",
"selection": [
{
"v": {
"v": true,
"l": "true"
}
}
]
}
],
"mode": "row-based"
},
"newColumnName": "test",
"columnInsertIndex": 2,
"baseColumnName": "URL",
"urlExpression": "grel:value",
"onError": "set-to-blank",
"delay": 5000
},
{
"op": "core/column-removal",
"description": "Remove column test",
"columnName": "test"
},
{
"op": "core/column-addition-by-fetching-urls",
"description": "Create column test at index 2 by fetching URLs based on column URL using expression grel:value",
"engineConfig": {
"facets": [
{
"invert": false,
"expression": "row.starred",
"selectError": false,
"omitError": false,
"selectBlank": false,
"name": "Starred Rows",
"omitBlank": false,
"columnName": "",
"type": "list",
"selection": [
{
"v": {
"v": true,
"l": "true"
}
}
]
}
],
"mode": "row-based"
},
"newColumnName": "test",
"columnInsertIndex": 2,
"baseColumnName": "URL",
"urlExpression": "grel:value",
"onError": "set-to-blank",
"delay": 5000
},
{
"op": "core/column-removal",
"description": "Remove column test",
"columnName": "test"
},
{
"op": "core/column-addition-by-fetching-urls",
"description": "Create column tes at index 2 by fetching URLs based on column URL using expression grel:value",
"engineConfig": {
"facets": [
{
"invert": false,
"expression": "row.starred",
"selectError": false,
"omitError": false,
"selectBlank": false,
"name": "Starred Rows",
"omitBlank": false,
"columnName": "",
"type": "list",
"selection": [
{
"v": {
"v": true,
"l": "true"
}
}
]
}
],
"mode": "row-based"
},
"newColumnName": "tes",
"columnInsertIndex": 2,
"baseColumnName": "URL",
"urlExpression": "grel:value",
"onError": "set-to-blank",
"delay": 5000
},
{
"op": "core/column-addition-by-fetching-urls",
"description": "Create column testt at index 2 by fetching URLs based on column URL using expression grel:value",
"engineConfig": {
"facets": [
{
"invert": false,
"expression": "row.starred",
"selectError": false,
"omitError": false,
"selectBlank": false,
"name": "Starred Rows",
"omitBlank": false,
"columnName": "",
"type": "list",
"selection": [
{
"v": {
"v": true,
"l": "true"
}
}
]
}
],
"mode": "row-based"
},
"newColumnName": "testt",
"columnInsertIndex": 2,
"baseColumnName": "URL",
"urlExpression": "grel:value",
"onError": "set-to-blank",
"delay": 5000
},
{
"op": "core/column-removal",
"description": "Remove column tes",
"columnName": "tes"
},
{
"op": "core/column-removal",
"description": "Remove column testt",
"columnName": "testt"
}
]
@hpiedcoq
Copy link
Author

Ouvrir le fichier history.xml, virer les deux premières lignes et créer un projet OpenRefine.

Dans Undo/Redo, cliquer sur Apply puis coller simplement le code.

Cliquer sur Perform Operations.

ENJOY!

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment