% Conference paper: Kang and Bader, IPDPSW 2010.
% The citation key is left unchanged so existing citations keep resolving.
% The former "series" field was a verbatim copy of "booktitle" and has been
% dropped; conference dates are kept in "note".
@inproceedings{bedf4258a4ba4045bd638008a698d56e,
  author    = {Kang, Seunghwa and Bader, David A.},
  title     = {Large Scale Complex Network Analysis Using the Hybrid Combination of a {MapReduce} Cluster and a Highly Multithreaded System},
  booktitle = {Proceedings of the 2010 {IEEE} International Symposium on Parallel and Distributed Processing, Workshops and {PhD} Forum, {IPDPSW} 2010},
  year      = {2010},
  doi       = {10.1109/IPDPSW.2010.5470691},
  isbn      = {9781424465347},
  language  = {English (US)},
  keywords  = {Cloud computing, Parallel algorithms, Power-law graph},
  abstract  = {Complex networks capture interactions among entities in various application areas in a graph representation. Analyzing large scale complex networks often answers important questions---e.g. estimate the spread of epidemic diseases---but also imposes computing challenges mainly due to large volumes of data and the irregular structure of the graphs. In this paper, we aim to solve such a challenge: finding relationships in a subgraph extracted from the data. We solve this problem using three different platforms: a MapReduce cluster, a highly multithreaded system, and a hybrid system of the two. The MapReduce cluster and the highly multithreaded system reveal limitations in efficiently solving this problem, whereas the hybrid system exploits the strengths of the two in a synergistic way and solves the problem at hand. In particular, once the subgraph is extracted and loaded into memory, the hybrid system analyzes the subgraph five orders of magnitude faster than the MapReduce cluster.},
  note      = {2010 IEEE International Symposium on Parallel and Distributed Processing, Workshops and PhD Forum, IPDPSW 2010 ; Conference date: 19-04-2010 Through 23-04-2010},
}