% Bibliography database (classic BibTeX conventions).
%
% Conventions used in this file:
%   * One field per line; values are brace-delimited.
%   * Person names use the "Last, First" form; corporate authors carry an
%     extra pair of braces so they are treated as one indivisible name.
%   * Titles are stored in Title Case; acronyms and proper nouns are wrapped
%     in braces so that styles which sentence-case titles keep their capitals.
%   * Months use the standard three-letter macros (jan .. dec), unquoted.
%   * Non-ASCII characters are written as LaTeX escapes.
%   * Web resources keep their address in howpublished, wrapped in \url, so
%     that styles without a url field still print it (needs the url or
%     hyperref package in the document).
%   * Venue names that occur more than once are defined once as string
%     macros directly below.
%
% Citation keys are stable identifiers used by the documents that cite this
% file; do not rename them.

@string{sigmodrecord = {ACM SIGMOD Record}}
@string{sigopsosr    = {ACM SIGOPS Operating Systems Review}}
@string{pvldb        = {Proceedings of the VLDB Endowment}}

@article{cattell2011scalable,
  author    = {Cattell, Rick},
  title     = {Scalable {SQL} and {NoSQL} Data Stores},
  journal   = sigmodrecord,
  volume    = {39},
  number    = {4},
  pages     = {12--27},
  year      = {2011},
  publisher = {ACM},
}

@article{chang2008bigtable,
  author    = {Chang, Fay and Dean, Jeffrey and Ghemawat, Sanjay and
               Hsieh, Wilson C. and Wallach, Deborah A. and Burrows, Mike and
               Chandra, Tushar and Fikes, Andrew and Gruber, Robert E.},
  title     = {Bigtable: A Distributed Storage System for Structured Data},
  journal   = {ACM Transactions on Computer Systems (TOCS)},
  volume    = {26},
  number    = {2},
  pages     = {4},
  year      = {2008},
  publisher = {ACM},
}

% The recorded venue data (journal name, volume, issue) describes a journal
% issue, so this is typed as an article rather than a proceedings paper.
@article{decandia2007dynamo,
  author    = {DeCandia, Giuseppe and Hastorun, Deniz and Jampani, Madan and
               Kakulapati, Gunavardhan and Lakshman, Avinash and
               Pilchin, Alex and Sivasubramanian, Swaminathan and
               Vosshall, Peter and Vogels, Werner},
  title     = {Dynamo: {Amazon}'s Highly Available Key-Value Store},
  journal   = sigopsosr,
  volume    = {41},
  number    = {6},
  pages     = {205--220},
  year      = {2007},
  publisher = {ACM},
}

@inproceedings{abadi2008column,
  author    = {Abadi, Daniel J. and Madden, Samuel R. and Hachem, Nabil},
  title     = {Column-Stores vs.\ Row-Stores: How Different Are They Really?},
  booktitle = {Proceedings of the 2008 {ACM} {SIGMOD} International Conference on Management of Data},
  pages     = {967--980},
  year      = {2008},
  publisher = {ACM},
}

@inproceedings{bear2012vertica,
  author    = {Bear, Chuck and Lamb, Andrew and Tran, Nga},
  title     = {The {Vertica} Database: {SQL} {RDBMS} for Managing Big Data},
  booktitle = {Proceedings of the 2012 Workshop on Management of Big Data Systems},
  pages     = {37--38},
  year      = {2012},
  publisher = {ACM},
}

@article{lakshman2010cassandra,
  author    = {Lakshman, Avinash and Malik, Prashant},
  title     = {Cassandra---A Decentralized Structured Storage System},
  journal   = sigopsosr,
  volume    = {44},
  number    = {2},
  pages     = {35},
  year      = {2010},
}

@article{melnik2010dremel,
  author    = {Melnik, Sergey and Gubarev, Andrey and Long, Jing Jing and
               Romer, Geoffrey and Shivakumar, Shiva and Tolton, Matt and
               Vassilakis, Theo},
  title     = {Dremel: Interactive Analysis of Web-Scale Datasets},
  journal   = pvldb,
  volume    = {3},
  number    = {1--2},
  pages     = {330--339},
  year      = {2010},
  publisher = {VLDB Endowment},
}

@article{hall2012processing,
  author    = {Hall, Alexander and Bachmann, Olaf and B{\"u}ssow, Robert and
               G{\u{a}}nceanu, Silviu and Nunkesser, Marc},
  title     = {Processing a Trillion Cells per Mouse Click},
  journal   = pvldb,
  volume    = {5},
  number    = {11},
  pages     = {1436--1446},
  year      = {2012},
  publisher = {VLDB Endowment},
}

@inproceedings{shvachko2010hadoop,
  author    = {Shvachko, Konstantin and Kuang, Hairong and Radia, Sanjay and
               Chansler, Robert},
  title     = {The {Hadoop} Distributed File System},
  booktitle = {2010 {IEEE} 26th Symposium on Mass Storage Systems and Technologies ({MSST})},
  pages     = {1--10},
  year      = {2010},
  publisher = {IEEE},
}

@article{colantonio2010concise,
  author    = {Colantonio, Alessandro and Di Pietro, Roberto},
  title     = {Concise: {Compressed `n' Composable Integer Set}},
  journal   = {Information Processing Letters},
  volume    = {110},
  number    = {16},
  pages     = {644--650},
  year      = {2010},
  publisher = {Elsevier},
}

@inproceedings{stonebraker2005c,
  author    = {Stonebraker, Mike and Abadi, Daniel J. and Batkin, Adam and
               Chen, Xuedong and Cherniack, Mitch and Ferreira, Miguel and
               Lau, Edmond and Lin, Amerson and Madden, Sam and
               O'Neil, Elizabeth and others},
  title     = {{C-Store}: A Column-Oriented {DBMS}},
  booktitle = {Proceedings of the 31st International Conference on Very Large Data Bases},
  pages     = {553--564},
  year      = {2005},
  publisher = {VLDB Endowment},
}

@inproceedings{engle2012shark,
  author    = {Engle, Cliff and Lupher, Antonio and Xin, Reynold and
               Zaharia, Matei and Franklin, Michael J. and Shenker, Scott and
               Stoica, Ion},
  title     = {Shark: Fast Data Analysis Using Coarse-Grained Distributed Memory},
  booktitle = {Proceedings of the 2012 {ACM} {SIGMOD} International Conference on Management of Data},
  pages     = {689--692},
  year      = {2012},
  publisher = {ACM},
}

@inproceedings{zaharia2012discretized,
  author    = {Zaharia, Matei and Das, Tathagata and Li, Haoyuan and
               Shenker, Scott and Stoica, Ion},
  title     = {Discretized Streams: An Efficient and Fault-Tolerant Model for Stream Processing on Large Clusters},
  booktitle = {Proceedings of the 4th {USENIX} Conference on Hot Topics in Cloud Computing},
  pages     = {10},
  year      = {2012},
  publisher = {USENIX Association},
}

@misc{marz2013storm,
  author       = {Marz, Nathan},
  title        = {Storm: Distributed and Fault-Tolerant Realtime Computation},
  month        = feb,
  year         = {2013},
  howpublished = {\url{http://storm-project.net/}},
}

@misc{tschetter2011druid,
  author       = {Tschetter, Eric},
  title        = {Introducing {Druid}: Real-Time Analytics at a Billion Rows Per Second},
  month        = apr,
  year         = {2011},
  howpublished = {\url{http://metamarkets.com/2011/druid-part-i-real-time-analytics-at-a-billion-rows-per-second/}},
}

@article{farber2012sap,
  author    = {F{\"a}rber, Franz and Cha, Sang Kyun and Primsch, J{\"u}rgen and
               Bornh{\"o}vd, Christof and Sigg, Stefan and Lehner, Wolfgang},
  title     = {{SAP HANA} Database: Data Management for Modern Business Applications},
  journal   = sigmodrecord,
  volume    = {40},
  number    = {4},
  pages     = {45--51},
  year      = {2012},
  publisher = {ACM},
}

% Corporate author: the inner braces stop the comma from being read as a
% "Last, First" separator.
@misc{voltdb2010voltdb,
  author       = {{VoltDB, LLC}},
  title        = {{VoltDB} Technical Overview},
  year         = {2010},
  howpublished = {\url{https://voltdb.com/}},
}

@inproceedings{macnicol2004sybase,
  author    = {MacNicol, Roger and French, Blaine},
  title     = {{Sybase IQ} Multiplex---Designed for Analytics},
  booktitle = {Proceedings of the Thirtieth International Conference on Very Large Data Bases---Volume 30},
  pages     = {1227--1230},
  year      = {2004},
  publisher = {VLDB Endowment},
}

@inproceedings{singh2011introduction,
  author    = {Singh, Malcolm and Leonhardi, Ben},
  title     = {Introduction to the {IBM Netezza} Warehouse Appliance},
  booktitle = {Proceedings of the 2011 Conference of the Center for Advanced Studies on Collaborative Research},
  pages     = {385--386},
  year      = {2011},
  publisher = {IBM Corp.},
}

@inproceedings{miner2012unified,
  author    = {Miner, Donald},
  title     = {Unified Analytics Platform for Big Data},
  booktitle = {Proceedings of the {WICSA/ECSA} 2012 Companion Volume},
  pages     = {176},
  year      = {2012},
  publisher = {ACM},
}

@inproceedings{fink2012distributed,
  author    = {Fink, Bryan},
  title     = {Distributed Computation on {Dynamo}-Style Distributed Storage: {Riak Pipe}},
  booktitle = {Proceedings of the Eleventh {ACM} {SIGPLAN} {Erlang} Workshop},
  pages     = {43--50},
  year      = {2012},
  publisher = {ACM},
}

% Entries without an author carry a key field, which styles use for sorting
% and label generation.
@misc{paraccel2013,
  key          = {ParAccel Analytic Database},
  title        = {{ParAccel} Analytic Database},
  month        = mar,
  year         = {2013},
  howpublished = {\url{http://www.paraccel.com/resources/Datasheets/ParAccel-Core-Analytic-Database.pdf}},
}

@misc{cloudera2013,
  key          = {Cloudera Impala},
  title        = {{Cloudera} {Impala}},
  month        = mar,
  year         = {2013},
  howpublished = {\url{http://blog.cloudera.com/blog}},
}

@inproceedings{hunt2010zookeeper,
  author    = {Hunt, Patrick and Konar, Mahadev and Junqueira, Flavio P. and
               Reed, Benjamin},
  title     = {{ZooKeeper}: Wait-Free Coordination for {Internet}-Scale Systems},
  booktitle = {{USENIX} {ATC}},
  volume    = {10},
  year      = {2010},
}

@inproceedings{kreps2011kafka,
  author    = {Kreps, Jay and Narkhede, Neha and Rao, Jun},
  title     = {Kafka: A Distributed Messaging System for Log Processing},
  booktitle = {Proceedings of the 6th International Workshop on Networking Meets Databases ({NetDB}), Athens, Greece},
  year      = {2011},
}

@misc{liblzf2013,
  key          = {LibLZF},
  title        = {{LibLZF}},
  month        = mar,
  year         = {2013},
  howpublished = {\url{http://freecode.com/projects/liblzf}},
}

@inproceedings{tomasic1993performance,
  author    = {Tomasic, Anthony and Garcia-Molina, Hector},
  title     = {Performance of Inverted Indices in Shared-Nothing Distributed Text Document Information Retrieval Systems},
  booktitle = {Proceedings of the Second International Conference on Parallel and Distributed Information Systems},
  pages     = {8--17},
  year      = {1993},
  publisher = {IEEE},
}

@inproceedings{antoshenkov1995byte,
  author    = {Antoshenkov, Gennady},
  title     = {Byte-Aligned Bitmap Compression},
  booktitle = {Proceedings of the Data Compression Conference ({DCC}'95)},
  pages     = {476},
  year      = {1995},
  publisher = {IEEE},
}

@inproceedings{van2011memory,
  author    = {van Schaik, Sebastiaan J. and de Moor, Oege},
  title     = {A Memory Efficient Reachability Data Structure Through Bit Vector Compression},
  booktitle = {Proceedings of the 2011 {ACM} {SIGMOD} International Conference on Management of Data},
  pages     = {913--924},
  year      = {2011},
  publisher = {ACM},
}

% The recorded venue data (journal name, volume, issue) describes a journal
% issue, so this is typed as an article rather than a proceedings paper.
@article{o1993lru,
  author    = {O'Neil, Elizabeth J. and O'Neil, Patrick E. and Weikum, Gerhard},
  title     = {The {LRU-K} Page Replacement Algorithm for Database Disk Buffering},
  journal   = sigmodrecord,
  volume    = {22},
  number    = {2},
  pages     = {297--306},
  year      = {1993},
  publisher = {ACM},
}

% NOTE(review): only one author and no page range are recorded here;
% verify the author list and pages against the publisher's record.
@article{kim2001lrfu,
  author    = {Kim, Chong Sang},
  title     = {{LRFU}: A Spectrum of Policies That Subsumes the Least Recently Used and Least Frequently Used Policies},
  journal   = {{IEEE} Transactions on Computers},
  volume    = {50},
  number    = {12},
  year      = {2001},
}

@article{wu2006optimizing,
  author    = {Wu, Kesheng and Otoo, Ekow J. and Shoshani, Arie},
  title     = {Optimizing Bitmap Indices with Efficient Compression},
  journal   = {ACM Transactions on Database Systems (TODS)},
  volume    = {31},
  number    = {1},
  pages     = {1--38},
  year      = {2006},
  publisher = {ACM},
}

@misc{twitter2013,
  key          = {Twitter Public Streams},
  title        = {{Twitter} Public Streams},
  month        = mar,
  year         = {2013},
  howpublished = {\url{https://dev.twitter.com/docs/streaming-apis/streams/public}},
}

@article{fitzpatrick2004distributed,
  author    = {Fitzpatrick, Brad},
  title     = {Distributed Caching with {memcached}},
  journal   = {Linux Journal},
  number    = {124},
  pages     = {72--74},
  year      = {2004},
}

@inproceedings{amdahl1967validity,
  author    = {Amdahl, Gene M.},
  title     = {Validity of the Single Processor Approach to Achieving Large Scale Computing Capabilities},
  booktitle = {Proceedings of the April 18--20, 1967, Spring Joint Computer Conference},
  pages     = {483--485},
  year      = {1967},
  publisher = {ACM},
}

@book{sarawagi1998discovery,
  author    = {Sarawagi, Sunita and Agrawal, Rakesh and Megiddo, Nimrod},
  title     = {Discovery-Driven Exploration of {OLAP} Data Cubes},
  year      = {1998},
  publisher = {Springer},
}

% No journal is recorded for this survey, so it is typed as misc; an article
% entry without a journal field is reported as incomplete by standard styles.
@misc{hu2011stream,
  author    = {Hu, Bo},
  title     = {Stream Database Survey},
  year      = {2011},
}

@article{dean2008mapreduce,
  author    = {Dean, Jeffrey and Ghemawat, Sanjay},
  title     = {{MapReduce}: Simplified Data Processing on Large Clusters},
  journal   = {Communications of the ACM},
  volume    = {51},
  number    = {1},
  pages     = {107--113},
  year      = {2008},
  publisher = {ACM},
}

@misc{linkedin2013senseidb,
  author       = {{LinkedIn}},
  title        = {{SenseiDB}},
  month        = jul,
  year         = {2013},
  howpublished = {\url{http://www.senseidb.com/}},
}

@misc{apache2013solr,
  author       = {{Apache}},
  title        = {{Apache} {Solr}},
  month        = feb,
  year         = {2013},
  howpublished = {\url{http://lucene.apache.org/solr/}},
}

@misc{banon2013elasticsearch,
  author       = {Banon, Shay},
  title        = {{ElasticSearch}},
  month        = jul,
  year         = {2013},
  howpublished = {\url{http://www.elasticsearch.com/}},
}