Publications¶
Citing Kokkos Kernels¶
The main Kokkos Kernels paper to cite for general use of the library is:
@misc{rajamanickam2021kokkoskernelsperformanceportable,
title={Kokkos Kernels: Performance Portable Sparse/Dense Linear Algebra and Graph Kernels},
author={Sivasankaran Rajamanickam and Seher Acer and Luc Berger-Vergiat and Vinh Dang and Nathan Ellingwood and Evan Harvey and Brian Kelley and Christian R. Trott and Jeremiah Wilke and Ichitaro Yamazaki},
year={2021},
eprint={2103.11991},
archivePrefix={arXiv},
primaryClass={cs.MS},
url={https://arxiv.org/abs/2103.11991}}
If you use more than one Kokkos Ecosystem package, please also cite:
@article{9502936,
author={Trott, Christian and Berger-Vergiat, Luc and Poliakoff, David and Rajamanickam, Sivasankaran and Lebrun-Grandie, Damien and Madsen, Jonathan and Al Awar, Nader and Gligoric, Milos and Shipman, Galen and Womeldorff, Geoff},
journal={Computing in Science Engineering},
title={The Kokkos Ecosystem: Comprehensive Performance Portability for High Performance Computing},
year={2021},
volume={23},
number={5},
pages={10-18},
doi={10.1109/MCSE.2021.3098509}}
Kokkos Kernels algorithm publications¶
SPGEMM¶
Original publication on the sparse matrix-matrix multiplication algorithm
@article{DEVECI201833,
title = {Multithreaded sparse matrix-matrix multiplication for many-core and GPU architectures},
journal = {Parallel Computing},
volume = {78},
pages = {33-46},
year = {2018},
issn = {0167-8191},
doi = {https://doi.org/10.1016/j.parco.2018.06.009},
url = {https://www.sciencedirect.com/science/article/pii/S0167819118301923},
author = {Mehmet Deveci and Christian Trott and Sivasankaran Rajamanickam}}
Supernode-based Sparse Triangular Solver¶
@inproceedings{10.1145/3404397.3404428,
author = {Yamazaki, Ichitaro and Rajamanickam, Sivasankaran and Ellingwood, Nathan},
title = {Performance Portable Supernode-based Sparse Triangular Solver for Manycore Architectures},
year = {2020},
isbn = {9781450388160},
publisher = {Association for Computing Machinery},
address = {New York, NY, USA},
url = {https://doi.org/10.1145/3404397.3404428},
doi = {10.1145/3404397.3404428},
booktitle = {Proceedings of the 49th International Conference on Parallel Processing},
articleno = {70},
numpages = {11},
location = {Edmonton, AB, Canada},
series = {ICPP '20}}
Two-stage Gauss-Seidel¶
@misc{bergervergiat2021twostagegaussseidelpreconditionerssmoothers,
title={Two-Stage Gauss--Seidel Preconditioners and Smoothers for Krylov Solvers on a GPU cluster},
author={Luc Berger-Vergiat and Brian Kelley and Sivasankaran Rajamanickam and Jonathan Hu and Katarzyna Swirydowicz and Paul Mullowney and Stephen Thomas and Ichitaro Yamazaki},
year={2021},
eprint={2104.01196},
archivePrefix={arXiv},
primaryClass={math.NA},
url={https://arxiv.org/abs/2104.01196}}
Distance-2 Maximal Independent Set and Graph Coarsening¶
@INPROCEEDINGS{9820696,
author={Kelley, Brian and Rajamanickam, Sivasankaran},
booktitle={2022 IEEE International Parallel and Distributed Processing Symposium (IPDPS)},
title={Parallel, Portable Algorithms for Distance-2 Maximal Independent Set and Graph Coarsening},
year={2022},
volume={},
number={},
pages={280-290},
keywords={Distributed processing;Clustering algorithms;Programming;Libraries;Hardware;Partitioning algorithms;graph algorithms;preconditioners;performance portability},
doi={10.1109/IPDPS53621.2022.00035}}
Batched Sparse Linear Solvers¶
@ARTICLE{10054414,
author={Liegeois, Kim and Rajamanickam, Sivasankaran and Berger-Vergiat, Luc},
journal={IEEE Transactions on Parallel and Distributed Systems},
title={Performance Portable Batched Sparse Linear Solvers},
year={2023},
volume={34},
number={5},
pages={1524-1535},
keywords={Linear systems;Kernel;Graphics processing units;Tensors;Sparse matrices;Libraries;Instruction sets;Batch sparse solvers;batch BLAS;kokkos kernels;performance portable},
doi={10.1109/TPDS.2023.3249110}}