updates to images in paper and some fixes

This commit is contained in:
fjy 2013-12-04 13:56:16 -08:00
parent 929b2336a9
commit 1e2cb839d4
2 changed files with 1033 additions and 904 deletions

View File

@ -1,348 +1,368 @@
@article{cattell2011scalable, @article{cattell2011scalable,
title={Scalable SQL and NoSQL data stores}, title={Scalable SQL and NoSQL data stores},
author={Cattell, Rick}, author={Cattell, Rick},
journal={ACM SIGMOD Record}, journal={ACM SIGMOD Record},
volume={39}, volume={39},
number={4}, number={4},
pages={12--27}, pages={12--27},
year={2011}, year={2011},
publisher={ACM} publisher={ACM}
} }
@article{chang2008bigtable, @article{chang2008bigtable,
title={Bigtable: A distributed storage system for structured data}, title={Bigtable: A distributed storage system for structured data},
author={Chang, Fay and Dean, Jeffrey and Ghemawat, Sanjay and Hsieh, Wilson C and Wallach, Deborah A and Burrows, Mike and Chandra, Tushar and Fikes, Andrew and Gruber, Robert E}, author={Chang, Fay and Dean, Jeffrey and Ghemawat, Sanjay and Hsieh, Wilson C and Wallach, Deborah A and Burrows, Mike and Chandra, Tushar and Fikes, Andrew and Gruber, Robert E},
journal={ACM Transactions on Computer Systems (TOCS)}, journal={ACM Transactions on Computer Systems (TOCS)},
volume={26}, volume={26},
number={2}, number={2},
pages={4}, pages={4},
year={2008}, year={2008},
publisher={ACM} publisher={ACM}
} }
@inproceedings{decandia2007dynamo, @inproceedings{decandia2007dynamo,
title={Dynamo: amazon's highly available key-value store}, title={Dynamo: amazon's highly available key-value store},
author={DeCandia, Giuseppe and Hastorun, Deniz and Jampani, Madan and Kakulapati, Gunavardhan and Lakshman, Avinash and Pilchin, Alex and Sivasubramanian, Swaminathan and Vosshall, Peter and Vogels, Werner}, author={DeCandia, Giuseppe and Hastorun, Deniz and Jampani, Madan and Kakulapati, Gunavardhan and Lakshman, Avinash and Pilchin, Alex and Sivasubramanian, Swaminathan and Vosshall, Peter and Vogels, Werner},
booktitle={ACM SIGOPS Operating Systems Review}, booktitle={ACM SIGOPS Operating Systems Review},
volume={41}, volume={41},
number={6}, number={6},
pages={205--220}, pages={205--220},
year={2007}, year={2007},
organization={ACM} organization={ACM}
} }
@inproceedings{bear2012vertica, @inproceedings{bear2012vertica,
title={The vertica database: SQL RDBMS for managing big data}, title={The vertica database: SQL RDBMS for managing big data},
author={Bear, Chuck and Lamb, Andrew and Tran, Nga}, author={Bear, Chuck and Lamb, Andrew and Tran, Nga},
booktitle={Proceedings of the 2012 workshop on Management of big data systems}, booktitle={Proceedings of the 2012 workshop on Management of big data systems},
pages={37--38}, pages={37--38},
year={2012}, year={2012},
organization={ACM} organization={ACM}
} }
@article{lakshman2010cassandra, @article{lakshman2010cassandra,
title={Cassandra---A decentralized structured storage system}, title={Cassandra---A decentralized structured storage system},
author={Lakshman, Avinash and Malik, Prashant}, author={Lakshman, Avinash and Malik, Prashant},
journal={Operating systems review}, journal={Operating systems review},
volume={44}, volume={44},
number={2}, number={2},
pages={35}, pages={35},
year={2010} year={2010}
} }
@article{melnik2010dremel, @article{melnik2010dremel,
title={Dremel: interactive analysis of web-scale datasets}, title={Dremel: interactive analysis of web-scale datasets},
author={Melnik, Sergey and Gubarev, Andrey and Long, Jing Jing and Romer, Geoffrey and Shivakumar, Shiva and Tolton, Matt and Vassilakis, Theo}, author={Melnik, Sergey and Gubarev, Andrey and Long, Jing Jing and Romer, Geoffrey and Shivakumar, Shiva and Tolton, Matt and Vassilakis, Theo},
journal={Proceedings of the VLDB Endowment}, journal={Proceedings of the VLDB Endowment},
volume={3}, volume={3},
number={1-2}, number={1-2},
pages={330--339}, pages={330--339},
year={2010}, year={2010},
publisher={VLDB Endowment} publisher={VLDB Endowment}
} }
@article{hall2012processing, @article{hall2012processing,
title={Processing a trillion cells per mouse click}, title={Processing a trillion cells per mouse click},
author={Hall, Alexander and Bachmann, Olaf and B{\"u}ssow, Robert and G{\u{a}}nceanu, Silviu and Nunkesser, Marc}, author={Hall, Alexander and Bachmann, Olaf and B{\"u}ssow, Robert and G{\u{a}}nceanu, Silviu and Nunkesser, Marc},
journal={Proceedings of the VLDB Endowment}, journal={Proceedings of the VLDB Endowment},
volume={5}, volume={5},
number={11}, number={11},
pages={1436--1446}, pages={1436--1446},
year={2012}, year={2012},
publisher={VLDB Endowment} publisher={VLDB Endowment}
} }
@inproceedings{shvachko2010hadoop, @inproceedings{shvachko2010hadoop,
title={The hadoop distributed file system}, title={The hadoop distributed file system},
author={Shvachko, Konstantin and Kuang, Hairong and Radia, Sanjay and Chansler, Robert}, author={Shvachko, Konstantin and Kuang, Hairong and Radia, Sanjay and Chansler, Robert},
booktitle={Mass Storage Systems and Technologies (MSST), 2010 IEEE 26th Symposium on}, booktitle={Mass Storage Systems and Technologies (MSST), 2010 IEEE 26th Symposium on},
pages={1--10}, pages={1--10},
year={2010}, year={2010},
organization={IEEE} organization={IEEE}
} }
@article{colantonio2010concise, @article{colantonio2010concise,
title={Concise: Compressed 'n' Composable Integer Set}, title={Concise: Compressed 'n' Composable Integer Set},
author={Colantonio, Alessandro and Di Pietro, Roberto}, author={Colantonio, Alessandro and Di Pietro, Roberto},
journal={Information Processing Letters}, journal={Information Processing Letters},
volume={110}, volume={110},
number={16}, number={16},
pages={644--650}, pages={644--650},
year={2010}, year={2010},
publisher={Elsevier} publisher={Elsevier}
} }
@article{lerner2010redis, @inproceedings{stonebraker2005c,
title={At the Forge: Redis}, title={C-store: a column-oriented DBMS},
author={Lerner, Richard}, author={Stonebraker, Mike and Abadi, Daniel J and Batkin, Adam and Chen, Xuedong and Cherniack, Mitch and Ferreira, Miguel and Lau, Edmond and Lin, Amerson and Madden, Sam and O'Neil, Elizabeth and others},
journal={Linux Journal}, booktitle={Proceedings of the 31st international conference on Very large data bases},
volume={2010}, pages={553--564},
number={197}, year={2005},
pages={3}, organization={VLDB Endowment}
year={2010} }
}
@inproceedings{stonebraker2005c, @inproceedings{engle2012shark,
title={C-store: a column-oriented DBMS}, title={Shark: fast data analysis using coarse-grained distributed memory},
author={Stonebraker, Mike and Abadi, Daniel J and Batkin, Adam and Chen, Xuedong and Cherniack, Mitch and Ferreira, Miguel and Lau, Edmond and Lin, Amerson and Madden, Sam and O'Neil, Elizabeth and others}, author={Engle, Cliff and Lupher, Antonio and Xin, Reynold and Zaharia, Matei and Franklin, Michael J and Shenker, Scott and Stoica, Ion},
booktitle={Proceedings of the 31st international conference on Very large data bases}, booktitle={Proceedings of the 2012 international conference on Management of Data},
pages={553--564}, pages={689--692},
year={2005}, year={2012},
organization={VLDB Endowment} organization={ACM}
} }
@inproceedings{engle2012shark, @inproceedings{zaharia2012discretized,
title={Shark: fast data analysis using coarse-grained distributed memory}, title={Discretized streams: an efficient and fault-tolerant model for stream processing on large clusters},
author={Engle, Cliff and Lupher, Antonio and Xin, Reynold and Zaharia, Matei and Franklin, Michael J and Shenker, Scott and Stoica, Ion}, author={Zaharia, Matei and Das, Tathagata and Li, Haoyuan and Shenker, Scott and Stoica, Ion},
booktitle={Proceedings of the 2012 international conference on Management of Data}, booktitle={Proceedings of the 4th USENIX conference on Hot Topics in Cloud Computing},
pages={689--692}, pages={10--10},
year={2012}, year={2012},
organization={ACM} organization={USENIX Association}
} }
@inproceedings{zaharia2012discretized, @misc{marz2013storm,
title={Discretized streams: an efficient and fault-tolerant model for stream processing on large clusters}, author = {Marz, Nathan},
author={Zaharia, Matei and Das, Tathagata and Li, Haoyuan and Shenker, Scott and Stoica, Ion}, title = {Storm: Distributed and Fault-Tolerant Realtime Computation},
booktitle={Proceedings of the 4th USENIX conference on Hot Topics in Cloud Computing}, month = {February},
pages={10--10}, year = {2013},
year={2012}, howpublished = "\url{http://storm-project.net/}"
organization={USENIX Association} }
}
@misc{marz2013storm, @misc{tschetter2011druid,
author = {Marz, Nathan}, author = {Eric Tschetter},
title = {Storm: Distributed and Fault-Tolerant Realtime Computation}, title = {Introducing Druid: Real-Time Analytics at a Billion Rows Per Second},
month = {February}, month = {April},
year = {2013}, year = {2011},
howpublished = "\url{http://storm-project.net/}" howpublished = "\url{http://metamarkets.com/2011/druid-part-i-real-time-analytics-at-a-billion-rows-per-second/}"
} }
@article{farber2012sap, @article{farber2012sap,
title={SAP HANA database: data management for modern business applications}, title={SAP HANA database: data management for modern business applications},
author={F{\"a}rber, Franz and Cha, Sang Kyun and Primsch, J{\"u}rgen and Bornh{\"o}vd, Christof and Sigg, Stefan and Lehner, Wolfgang}, author={F{\"a}rber, Franz and Cha, Sang Kyun and Primsch, J{\"u}rgen and Bornh{\"o}vd, Christof and Sigg, Stefan and Lehner, Wolfgang},
journal={ACM Sigmod Record}, journal={ACM Sigmod Record},
volume={40}, volume={40},
number={4}, number={4},
pages={45--51}, pages={45--51},
year={2012}, year={2012},
publisher={ACM} publisher={ACM}
} }
@misc{voltdb2010voltdb, @misc{voltdb2010voltdb,
title={VoltDB Technical Overview}, title={VoltDB Technical Overview},
author={VoltDB, LLC}, author={VoltDB, LLC},
year={2010}, year={2010},
howpublished = "\url{https://voltdb.com/}" howpublished = "\url{https://voltdb.com/}"
} }
@inproceedings{macnicol2004sybase, @inproceedings{macnicol2004sybase,
title={Sybase IQ multiplex-designed for analytics}, title={Sybase IQ multiplex-designed for analytics},
author={MacNicol, Roger and French, Blaine}, author={MacNicol, Roger and French, Blaine},
booktitle={Proceedings of the Thirtieth international conference on Very large data bases-Volume 30}, booktitle={Proceedings of the Thirtieth international conference on Very large data bases-Volume 30},
pages={1227--1230}, pages={1227--1230},
year={2004}, year={2004},
organization={VLDB Endowment} organization={VLDB Endowment}
} }
@inproceedings{singh2011introduction, @inproceedings{singh2011introduction,
title={Introduction to the IBM Netezza warehouse appliance}, title={Introduction to the IBM Netezza warehouse appliance},
author={Singh, Malcolm and Leonhardi, Ben}, author={Singh, Malcolm and Leonhardi, Ben},
booktitle={Proceedings of the 2011 Conference of the Center for Advanced Studies on Collaborative Research}, booktitle={Proceedings of the 2011 Conference of the Center for Advanced Studies on Collaborative Research},
pages={385--386}, pages={385--386},
year={2011}, year={2011},
organization={IBM Corp.} organization={IBM Corp.}
} }
@inproceedings{miner2012unified, @inproceedings{miner2012unified,
title={Unified analytics platform for big data}, title={Unified analytics platform for big data},
author={Miner, Donald}, author={Miner, Donald},
booktitle={Proceedings of the WICSA/ECSA 2012 Companion Volume}, booktitle={Proceedings of the WICSA/ECSA 2012 Companion Volume},
pages={176--176}, pages={176--176},
year={2012}, year={2012},
organization={ACM} organization={ACM}
} }
@inproceedings{fink2012distributed, @inproceedings{fink2012distributed,
title={Distributed computation on dynamo-style distributed storage: riak pipe}, title={Distributed computation on dynamo-style distributed storage: riak pipe},
author={Fink, Bryan}, author={Fink, Bryan},
booktitle={Proceedings of the eleventh ACM SIGPLAN workshop on Erlang workshop}, booktitle={Proceedings of the eleventh ACM SIGPLAN workshop on Erlang workshop},
pages={43--50}, pages={43--50},
year={2012}, year={2012},
organization={ACM} organization={ACM}
} }
@misc{paraccel2013, @misc{paraccel2013,
key = {ParAccel Analytic Database}, key = {ParAccel Analytic Database},
title = {ParAccel Analytic Database}, title = {ParAccel Analytic Database},
month = {March}, month = {March},
year = {2013}, year = {2013},
howpublished = "\url{http://www.paraccel.com/resources/Datasheets/ParAccel-Core-Analytic-Database.pdf}" howpublished = "\url{http://www.paraccel.com/resources/Datasheets/ParAccel-Core-Analytic-Database.pdf}"
} }
@article{barroso2009datacenter, @misc{cloudera2013,
title={The datacenter as a computer: An introduction to the design of warehouse-scale machines}, key = {Cloudera Impala},
author={Barroso, Luiz Andr{\'e} and H{\"o}lzle, Urs}, title = {Cloudera Impala},
journal={Synthesis Lectures on Computer Architecture}, month = {March},
volume={4}, year = {2013},
number={1}, url = {},
pages={1--108}, howpublished = "\url{http://blog.cloudera.com/blog}"
year={2009}, }
publisher={Morgan \& Claypool Publishers}
}
@article{chaudhuri1997overview, @inproceedings{hunt2010zookeeper,
title={An overview of data warehousing and OLAP technology}, title={ZooKeeper: Wait-free coordination for Internet-scale systems},
author={Chaudhuri, Surajit and Dayal, Umeshwar}, author={Hunt, Patrick and Konar, Mahadev and Junqueira, Flavio P and Reed, Benjamin},
journal={ACM Sigmod record}, booktitle={USENIX ATC},
volume={26}, volume={10},
number={1}, year={2010}
pages={65--74}, }
year={1997}
}
@article{dewitt1992parallel, @inproceedings{kreps2011kafka,
title={Parallel database systems: the future of high performance database systems}, title={Kafka: A distributed messaging system for log processing},
author={DeWitt, David and Gray, Jim}, author={Kreps, Jay and Narkhede, Neha and Rao, Jun},
journal={Communications of the ACM}, booktitle={Proceedings of 6th International Workshop on Networking Meets Databases (NetDB), Athens, Greece},
volume={35}, year={2011}
number={6}, }
pages={85--98},
year={1992},
publisher={ACM}
}
@misc{cloudera2013, @misc{liblzf2013,
key = {Cloudera Impala}, title = {LibLZF},
title = {Cloudera Impala}, key = {LibLZF},
month = {March}, month = {March},
year = {2013}, year = {2013},
url = {}, howpublished = "\url{http://freecode.com/projects/liblzf}"
howpublished = "\url{http://blog.cloudera.com/blog}" }
}
@inproceedings{hunt2010zookeeper, @inproceedings{tomasic1993performance,
title={ZooKeeper: Wait-free coordination for Internet-scale systems}, title={Performance of inverted indices in shared-nothing distributed text document information retrieval systems},
author={Hunt, Patrick and Konar, Mahadev and Junqueira, Flavio P and Reed, Benjamin}, author={Tomasic, Anthony and Garcia-Molina, Hector},
booktitle={USENIX ATC}, booktitle={Parallel and Distributed Information Systems, 1993., Proceedings of the Second International Conference on},
volume={10}, pages={8--17},
year={2010} year={1993},
} organization={IEEE}
}
@inproceedings{kreps2011kafka, @inproceedings{antoshenkov1995byte,
title={Kafka: A distributed messaging system for log processing}, title={Byte-aligned bitmap compression},
author={Kreps, Jay and Narkhede, Neha and Rao, Jun}, author={Antoshenkov, Gennady},
booktitle={Proceedings of 6th International Workshop on Networking Meets Databases (NetDB), Athens, Greece}, booktitle={Data Compression Conference, 1995. DCC'95. Proceedings},
year={2011} pages={476},
} year={1995},
organization={IEEE}
}
@misc{liblzf2013, @inproceedings{van2011memory,
title = {LibLZF}, title={A memory efficient reachability data structure through bit vector compression},
key = {LibLZF}, author={van Schaik, Sebastiaan J and de Moor, Oege},
month = {March}, booktitle={Proceedings of the 2011 international conference on Management of data},
year = {2013}, pages={913--924},
howpublished = "\url{http://freecode.com/projects/liblzf}" year={2011},
} organization={ACM}
}
@inproceedings{tomasic1993performance, @inproceedings{o1993lru,
title={Performance of inverted indices in shared-nothing distributed text document information retrieval systems}, title={The LRU-K page replacement algorithm for database disk buffering},
author={Tomasic, Anthony and Garcia-Molina, Hector}, author={O'Neil, Elizabeth J and O'Neil, Patrick E and Weikum, Gerhard},
booktitle={Parallel and Distributed Information Systems, 1993., Proceedings of the Second International Conference on}, booktitle={ACM SIGMOD Record},
pages={8--17}, volume={22},
year={1993}, number={2},
organization={IEEE} pages={297--306},
} year={1993},
organization={ACM}
}
@inproceedings{antoshenkov1995byte, @article{kim2001lrfu,
title={Byte-aligned bitmap compression}, title={LRFU: A spectrum of policies that subsumes the least recently used and least frequently used policies},
author={Antoshenkov, Gennady}, author={Kim, Chong Sang},
booktitle={Data Compression Conference, 1995. DCC'95. Proceedings}, journal={IEEE Transactions on Computers},
pages={476}, volume={50},
year={1995}, number={12},
organization={IEEE} year={2001}
} }
@inproceedings{van2011memory, @article{wu2006optimizing,
title={A memory efficient reachability data structure through bit vector compression}, title={Optimizing bitmap indices with efficient compression},
author={van Schaik, Sebastiaan J and de Moor, Oege}, author={Wu, Kesheng and Otoo, Ekow J and Shoshani, Arie},
booktitle={Proceedings of the 2011 international conference on Management of data}, journal={ACM Transactions on Database Systems (TODS)},
pages={913--924}, volume={31},
year={2011}, number={1},
organization={ACM} pages={1--38},
} year={2006},
publisher={ACM}
}
@inproceedings{o1993lru, @misc{twitter2013,
title={The LRU-K page replacement algorithm for database disk buffering}, key = {Twitter Public Streams},
author={O'Neil, Elizabeth J and O'Neil, Patrick E and Weikum, Gerhard}, author={Kim, Chong Sang},
booktitle={ACM SIGMOD Record}, month = {March},
volume={22}, year = {2013},
number={2}, howpublished = "\url{https://dev.twitter.com/docs/streaming-apis/streams/public}"
pages={297--306}, }
year={1993},
organization={ACM}
}
@article{kim2001lrfu, @article{fitzpatrick2004distributed,
title={LRFU: A spectrum of policies that subsumes the least recently used and least frequently used policies}, title={Distributed caching with memcached},
author={Kim, Chong Sang}, author={Fitzpatrick, Brad},
journal={IEEE Transactions on Computers}, journal={Linux journal},
volume={50}, number={124},
number={12}, pages={72--74},
year={2001} year={2004}
} }
@article{wu2006optimizing, @inproceedings{amdahl1967validity,
title={Optimizing bitmap indices with efficient compression}, title={Validity of the single processor approach to achieving large scale computing capabilities},
author={Wu, Kesheng and Otoo, Ekow J and Shoshani, Arie}, author={Amdahl, Gene M},
journal={ACM Transactions on Database Systems (TODS)}, booktitle={Proceedings of the April 18-20, 1967, spring joint computer conference},
volume={31}, pages={483--485},
number={1}, year={1967},
pages={1--38}, organization={ACM}
year={2006}, }
publisher={ACM} @book{sarawagi1998discovery,
} title={Discovery-driven exploration of OLAP data cubes},
author={Sarawagi, Sunita and Agrawal, Rakesh and Megiddo, Nimrod},
year={1998},
publisher={Springer}
}
@inproceedings{abadi2008column,
title={Column-Stores vs. Row-Stores: How different are they really?},
author={Abadi, Daniel J and Madden, Samuel R and Hachem, Nabil},
booktitle={Proceedings of the 2008 ACM SIGMOD international conference on Management of data},
pages={967--980},
year={2008},
organization={ACM}
}
@article{hu2011stream,
title={Stream Database Survey},
author={Hu, Bo},
year={2011}
}
@misc{twitter2013, @article{dean2008mapreduce,
key = {Twitter Public Streams}, title={MapReduce: simplified data processing on large clusters},
title = {Twitter Public Streams}, author={Dean, Jeffrey and Ghemawat, Sanjay},
month = {March}, journal={Communications of the ACM},
year = {2013}, volume={51},
howpublished = "\url{https://dev.twitter.com/docs/streaming-apis/streams/public}" number={1},
} pages={107--113},
year={2008},
publisher={ACM}
}
@article{fitzpatrick2004distributed, @misc{linkedin2013senseidb,
title={Distributed caching with memcached}, author = {LinkedIn},
author={Fitzpatrick, Brad}, title = {SenseiDB},
journal={Linux journal}, month = {July},
number={124}, year = {2013},
pages={72--74}, howpublished = "\url{http://www.senseidb.com/}"
year={2004} }
}
@inproceedings{amdahl1967validity, @misc{apache2013solr,
title={Validity of the single processor approach to achieving large scale computing capabilities}, author = {Apache},
author={Amdahl, Gene M}, title = {Apache Solr},
booktitle={Proceedings of the April 18-20, 1967, spring joint computer conference}, month = {February},
pages={483--485}, year = {2013},
year={1967}, howpublished = "\url{http://lucene.apache.org/solr/}"
organization={ACM} }
}
@misc{banon2013elasticsearch,
author = {Banon, Shay},
title = {ElasticSearch},
month = {July},
year = {2013},
howpublished = "\url{http://www.elasticsearch.com/}"
}

File diff suppressed because it is too large Load Diff