2016-03-28 03:51:36 -04:00
|
|
|
{
|
|
|
|
"type": "index_hadoop",
|
|
|
|
"spec": {
|
|
|
|
"ioConfig": {
|
|
|
|
"type": "hadoop",
|
|
|
|
"inputSpec": {
|
|
|
|
"type": "static",
|
2018-11-06 00:33:42 -05:00
|
|
|
"inputFormat": "%s",
|
|
|
|
"paths": "example/compat/parquet-1217.parquet"
|
2016-03-28 03:51:36 -04:00
|
|
|
},
|
|
|
|
"metadataUpdateSpec": {
|
|
|
|
"type": "postgresql",
|
|
|
|
"connectURI": "jdbc:postgresql://localhost/druid",
|
2018-11-06 00:33:42 -05:00
|
|
|
"user": "druid",
|
|
|
|
"password": "asdf",
|
2016-03-28 03:51:36 -04:00
|
|
|
"segmentTable": "druid_segments"
|
|
|
|
},
|
|
|
|
"segmentOutputPath": "/tmp/segments"
|
|
|
|
},
|
|
|
|
"dataSchema": {
|
2018-11-06 00:33:42 -05:00
|
|
|
"dataSource": "test",
|
2016-03-28 03:51:36 -04:00
|
|
|
"parser": {
|
2018-11-06 00:33:42 -05:00
|
|
|
"type": "%s",
|
2016-03-28 03:51:36 -04:00
|
|
|
"parseSpec": {
|
2018-11-06 00:33:42 -05:00
|
|
|
"format": "%s",
|
|
|
|
"flattenSpec": {
|
|
|
|
"useFieldDiscovery": true,
|
|
|
|
"fields": [
|
|
|
|
{
|
|
|
|
"type": "root",
|
|
|
|
"name": "col"
|
|
|
|
},
|
|
|
|
{
|
|
|
|
"type": "path",
|
|
|
|
"name": "metric1",
|
|
|
|
"expr": "$.col"
|
|
|
|
}
|
|
|
|
]
|
|
|
|
},
|
2016-03-28 03:51:36 -04:00
|
|
|
"timestampSpec": {
|
|
|
|
"column": "timestamp",
|
2018-11-06 00:33:42 -05:00
|
|
|
"format": "auto",
|
|
|
|
"missingValue": "2018-09-01T00:00:00.000Z"
|
2016-03-28 03:51:36 -04:00
|
|
|
},
|
|
|
|
"dimensionsSpec": {
|
2018-11-06 00:33:42 -05:00
|
|
|
"dimensions": [],
|
2016-03-28 03:51:36 -04:00
|
|
|
"dimensionExclusions": [],
|
|
|
|
"spatialDimensions": []
|
|
|
|
}
|
|
|
|
}
|
|
|
|
},
|
2018-11-06 00:33:42 -05:00
|
|
|
"metricsSpec": [
|
|
|
|
{
|
|
|
|
"type": "count",
|
|
|
|
"name": "count"
|
|
|
|
},
|
|
|
|
{
|
|
|
|
"type": "longSum",
|
|
|
|
"name": "metric1",
|
|
|
|
"fieldName": "metric1"
|
|
|
|
}
|
|
|
|
],
|
2016-03-28 03:51:36 -04:00
|
|
|
"granularitySpec": {
|
|
|
|
"type": "uniform",
|
|
|
|
"segmentGranularity": "DAY",
|
|
|
|
"queryGranularity": "NONE",
|
2018-11-06 00:33:42 -05:00
|
|
|
"intervals": [
|
|
|
|
"2018-08-30/2020-09-02"
|
|
|
|
]
|
2016-03-28 03:51:36 -04:00
|
|
|
}
|
|
|
|
},
|
|
|
|
"tuningConfig": {
|
|
|
|
"type": "hadoop",
|
|
|
|
"workingPath": "tmp/working_path",
|
|
|
|
"partitionsSpec": {
|
|
|
|
"targetPartitionSize": 5000000
|
|
|
|
},
|
2018-11-06 00:33:42 -05:00
|
|
|
"jobProperties": {
|
2016-03-28 03:51:36 -04:00
|
|
|
"mapreduce.map.java.opts": "-server -Duser.timezone=UTC -Dfile.encoding=UTF-8 -XX:+PrintGCDetails -XX:+PrintGCTimeStamps",
|
|
|
|
"mapreduce.reduce.java.opts": "-server -Duser.timezone=UTC -Dfile.encoding=UTF-8 -XX:+PrintGCDetails -XX:+PrintGCTimeStamps",
|
|
|
|
"mapred.child.java.opts": "-server -XX:+PrintGCDetails -XX:+PrintGCTimeStamps"
|
|
|
|
},
|
|
|
|
"leaveIntermediate": true
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|