% Workshop paper (ROSS 2014) on the overhead of a decentralized gossip algorithm.
% The citation key is kept exactly as it was so existing \cite commands still resolve.
% NOTE(review): the conference date in the note field is kept as exported; it
% presumably reads DD-MM-YYYY (10 June 2014) -- confirm before converting it
% to a month/date field.
@inproceedings{8c731bc41e084c5aaf3af62609724c2c,
  author    = {Levy, Ely and Barak, Amnon and Shiloh, Amnon and Lieber, Matthias and Weinhold, Carsten and H{\"a}rtig, Hermann},
  title     = {Overhead of a decentralized gossip algorithm on the performance of {HPC} applications},
  booktitle = {Proceedings of the 4th International Workshop on Runtime and Operating Systems for Supercomputers, {ROSS} 2014 - In Conjunction with {ICS} 2014},
  publisher = {Association for Computing Machinery},
  year      = {2014},
  doi       = {10.1145/2612262.2612271},
  isbn      = {9781450329507},
  language  = {English},
  keywords  = {Benchmarking, Cluster management, Gossip algorithm, High performance computing},
  abstract  = {Gossip algorithms can provide online information about the availability and the state of the resources in supercomputers. These algorithms require minimal computing and storage capabilities at each node and when properly tuned, they are not expected to overload the nodes or the network that connects these nodes. These properties make gossip interesting for future exascale systems. This paper examines the overhead of a decentralized gossip algorithm on the performance of parallel MPI applications running on up to 8192 nodes of an IBM BlueGene/Q supercomputer. The applications that were used in the experiments include PTRANS and MPI-FFT from the HPCC benchmark suite as well as the coupled weather and cloud simulation model COSMOSPECS+ FD4. In most cases, no gossip overhead was observed when the gossip messages were sent at intervals of 256ms or more. As expected, the overhead that is observed at higher rates is sensitive to the communication pattern of the application and the amount of gossip information being circulated.},
  note      = {Conference date: 10-06-2014},
}