% Journal article describing MAGMA's GPU-only Cholesky factorization (batch and native modes).
@article{1102,
  author   = {Abdelfattah, Ahmad and Haidar, Azzam and Tomov, Stanimire and Dongarra, Jack},
  title    = {Fast {Cholesky} Factorization on {GPUs} for Batch and Native Modes in {MAGMA}},
  journal  = {Journal of Computational Science},
  volume   = {20},
  pages    = {85--93},
  year     = {2017},
  month    = may,
  doi      = {10.1016/j.jocs.2016.12.009},
  keywords = {GPU computing; Cholesky factorization; Batched execution},
  abstract = {This paper presents a GPU-accelerated Cholesky factorization for two different modes of operation. The first one is the batch mode, where many independent factorizations on small matrices can be performed concurrently. This mode supports fixed size and variable size problems, and is found in many scientific applications. The second mode is the native mode, where one factorization is performed on a large matrix without any CPU involvement, which allows the CPU do other useful work. We show that, despite the different workloads, both modes of operation share a common code-base that uses the GPU only. We also show that the developed routines achieve significant speedups against a multicore CPU using the MKL library, and against a GPU implementation by cuSOLVER. This work is part of the MAGMA library.},
}