druid/examples/twitter/twitter_realtime.spec

37 lines
1.8 KiB
Python

[{
"schema" : { "dataSource":"twitterstream",
"aggregators":[
{"type":"count", "name":"tweets"},
{"type":"doubleSum","fieldName":"follower_count","name":"total_follower_count"},
{"type":"doubleSum","fieldName":"retweet_count","name":"total_retweet_count"},
{"type":"doubleSum","fieldName":"friends_count","name":"total_friends_count"},
{"type":"doubleSum","fieldName":"statuses_count","name":"total_statuses_count"},
{"type":"min","fieldName":"follower_count","name":"min_follower_count"},
{"type":"max","fieldName":"follower_count","name":"max_follower_count"},
{"type":"min","fieldName":"friends_count","name":"min_friends_count"},
{"type":"max","fieldName":"friends_count","name":"max_friends_count"},
{"type":"min","fieldName":"statuses_count","name":"min_statuses_count"},
{"type":"max","fieldName":"statuses_count","name":"max_statuses_count"},
{"type":"min","fieldName":"retweet_count","name":"min_retweet_count"},
{"type":"max","fieldName":"retweet_count","name":"max_retweet_count"}
],
"indexGranularity":"minute",
"shardSpec" : { "type": "none" } },
"config" : { "maxRowsInMemory" : 50000,
"intermediatePersistPeriod" : "PT2m" },
"firehose" : { "type" : "twitzer",
"maxEventCount": 50000,
"maxRunMinutes" : 10
},
"plumber" : { "type" : "realtime",
"windowPeriod" : "PT3m",
"segmentGranularity":"hour",
"basePersistDirectory" : "/tmp/twitter_realtime/basePersist" }
}]