NoSQL databases have emerged as a backend to support Big Data applications. NoSQL databases are characterized by horizontal scalability, schema-free data models, and easy cloud deployment. To avoid overprovisioning, it is essential to be able to identify the correct number of nodes required for a specific system before deployment. This paper benchmarks and compares three of the most common NoSQL databases: Cassandra, MongoDB and HBase. We deploy them on the Amazon EC2 cloud platform using different types of virtual machines and cluster sizes to study the effect of different configurations. We then compare the behavior of these systems to high-level queueing network models. Our results show that the models are able to capture the main performance characteristics of the studied databases and form the basis for a capacity planning tool for service providers and service users.
Description
Performance Evaluation of NoSQL Databases - Springer
%0 Book Section
%1 noKey
%A Gandini, Andrea
%A Gribaudo, Marco
%A Knottenbelt, WilliamJ.
%A Osman, Rasha
%A Piazzolla, Pietro
%B Computer Performance Engineering
%D 2014
%E Horváth, András
%E Wolter, Katinka
%I Springer International Publishing
%K database nosql webbackend
%P 16-29
%R 10.1007/978-3-319-10885-8_2
%T Performance Evaluation of NoSQL Databases
%U http://dx.doi.org/10.1007/978-3-319-10885-8_2
%V 8721
%X NoSQL databases have emerged as a backend to support Big Data applications. NoSQL databases are characterized by horizontal scalability, schema-free data models, and easy cloud deployment. To avoid overprovisioning, it is essential to be able to identify the correct number of nodes required for a specific system before deployment. This paper benchmarks and compares three of the most common NoSQL databases: Cassandra, MongoDB and HBase. We deploy them on the Amazon EC2 cloud platform using different types of virtual machines and cluster sizes to study the effect of different configurations. We then compare the behavior of these systems to high-level queueing network models. Our results show that the models are able to capture the main performance characteristics of the studied databases and form the basis for a capacity planning tool for service providers and service users.
%@ 978-3-319-10884-1
@incollection{noKey,
abstract = {NoSQL databases have emerged as a backend to support Big Data applications. NoSQL databases are characterized by horizontal scalability, schema-free data models, and easy cloud deployment. To avoid overprovisioning, it is essential to be able to identify the correct number of nodes required for a specific system before deployment. This paper benchmarks and compares three of the most common NoSQL databases: Cassandra, MongoDB and HBase. We deploy them on the Amazon EC2 cloud platform using different types of virtual machines and cluster sizes to study the effect of different configurations. We then compare the behavior of these systems to high-level queueing network models. Our results show that the models are able to capture the main performance characteristics of the studied databases and form the basis for a capacity planning tool for service providers and service users.},
added-at = {2015-02-09T10:47:50.000+0100},
author = {Gandini, Andrea and Gribaudo, Marco and Knottenbelt, WilliamJ. and Osman, Rasha and Piazzolla, Pietro},
biburl = {https://www.bibsonomy.org/bibtex/272d67215f426e14b0ee6be58e8339231/mbruschi},
booktitle = {Computer Performance Engineering},
description = {Performance Evaluation of NoSQL Databases - Springer},
doi = {10.1007/978-3-319-10885-8_2},
editor = {Horváth, András and Wolter, Katinka},
interhash = {88fdfe530230126ea40bbca84f91ece4},
intrahash = {72d67215f426e14b0ee6be58e8339231},
isbn = {978-3-319-10884-1},
keywords = {database nosql webbackend},
language = {English},
pages = {16-29},
publisher = {Springer International Publishing},
series = {Lecture Notes in Computer Science},
timestamp = {2015-02-09T10:47:50.000+0100},
title = {Performance Evaluation of NoSQL Databases},
url = {http://dx.doi.org/10.1007/978-3-319-10885-8_2},
volume = 8721,
year = 2014
}