Skip to content

Instantly share code, notes, and snippets.

Embed
What would you like to do?
{
  "type": "index_hadoop",
  "spec": {
    "dataSchema": {
      "dataSource": "wikipedia",
      "parser": {
        "type": "hadoopyString",
        "parseSpec": {
          "format": "json",
          "timestampSpec": {
            "column": "timestamp",
            "format": "auto"
          },
          "dimensionsSpec": {
            "dimensions": [
              "page",
              "language",
              "user",
              "unpatrolled",
              "newPage",
              "robot",
              "anonymous",
              "namespace",
              "continent",
              "country",
              "region",
              "city"
            ],
            "dimensionExclusions": [],
            "spatialDimensions": []
          }
        }
      },
      "metricsSpec": [
        {
          "type": "count",
          "name": "count"
        },
        {
          "type": "doubleSum",
          "name": "added",
          "fieldName": "added"
        },
        {
          "type": "doubleSum",
          "name": "deleted",
          "fieldName": "deleted"
        },
        {
          "type": "doubleSum",
          "name": "delta",
          "fieldName": "delta"
        }
      ],
      "granularitySpec": {
        "type": "uniform",
        "segmentGranularity": "DAY",
        "queryGranularity": "NONE",
        "intervals": ["2013-08-31/2013-09-01"]
      }
    },
    "ioConfig": {
      "type": "hadoop",
      "inputSpec": {
        "type": "granularity",
        "dataGranularity": "HOUR",
        "inputPath": "/MyDirectory/examples/indexing/",
        "filePattern": ".*\\.json",
        "pathFormat": "'y'=yyyy/'m'=MM/'d'=dd/'H'=HH"
      }
    },
    "tuningConfig": {
      "type": "hadoop"
    }
  }
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment