@inproceedings{882ab7e12fb64814b1cbd7dff7f4ce86,
title = "Adapting irregular computations to large CPU-GPU clusters in the MADNESS framework",
abstract = "Graphics Processing Units (GPUs) are becoming the workhorse of scalable computations. MADNESS is a scientific framework used especially for computational chemistry. Most MADNESS applications use operators that involve many small tensor computations, resulting in a less regular organization of computations on GPUs. A single GPU kernel may have to multiply by hundreds of small square matrices (with fixed dimension ranging from 10 to 28). We demonstrate a scalable CPU-GPU implementation of the MADNESS framework over a 500-node partition on the Titan supercomputer. For this hybrid CPU-GPU implementation, we observe up to a 2.3-times speedup compared to an equivalent CPU-only implementation with 16 cores per node. For smaller matrices, we demonstrate a speedup of 2.2-times by using a custom CUDA kernel rather than a cuBLAS-based kernel.",
keywords = "GPU, heterogeneous CPU-GPU, hybrid CPU-GPU, irregular computation, supercomputing",
author = "Vlad Slavici and Raghu Varier and Gene Cooperman and Harrison, \{Robert J.\}",
year = "2012",
doi = "10.1109/CLUSTER.2012.42",
language = "English",
isbn = "9780768548074",
series = "Proceedings - 2012 IEEE International Conference on Cluster Computing, CLUSTER 2012",
publisher = "IEEE Computer Society",
pages = "1--9",
booktitle = "Proceedings - 2012 IEEE International Conference on Cluster Computing, CLUSTER 2012",
note = "2012 IEEE International Conference on Cluster Computing, CLUSTER 2012 ; Conference date: 24-09-2012 Through 28-09-2012",
}