2 title = {{P}arallel iterative algorithms: from sequential to grid computing},
3 author = {Bahi, J.M. and Contassot-Vivier, S. and Couturier, R.},
4 booktitle = {Numerical Analysis and Scientific Computing},
5 publisher = {Chapman \& Hall/CRC},
10 title = {An efficient multi-algorithms sparse linear solver for {GPU}s},
11 author = {Jost, T. and Contassot-Vivier, S. and Vialle, S.},
12 booktitle = {International conference on parallel computing, ParCo2009},
17 title={Parallel iterative linear solvers on {GPU}: a financial engineering case},
18 author={Gaikwad, A. and Toke, I.M.},
19 booktitle = {Proceedings of the 2010 18th Euromicro Conference on Parallel, Distributed and Network-based Processing},
22 publisher = {IEEE Computer Society},
26 title = {Efficient {GPU} data structures and methods to solve sparse linear systems in dynamics applications},
27 author = {Weber, D. and Bender, J. and Schnoes, M. and Stork, A. and Fellner, D.},
28 journal = {Computer Graphics Forum},
35 title = {Sparse matrix solvers on the {GPU}: conjugate gradients and multigrid},
36 author = {Bolz, J. and Farmer, I. and Grinspun, E. and Schr{\"o}der, P.},
37 journal = {ACM Trans. Graph.},
45 title={A parallel preconditioned {B}i-{C}onjugate {G}radient stabilized solver for the {P}oisson problem},
46 author={Zhao, N. and Wang, X.},
47 journal={Journal of Computers},
54 title={Solving sparse linear systems on {NVIDIA} {T}esla {GPU}s},
55 author={Wang, M. and Klie, H. and Parashar, M. and Sudan, H.},
56 booktitle={Computational Science -- ICCS 2009},
65 title = {Sparse systems solving on {GPUs} with {GMRES}},
66 author = {Couturier, R. and Domas, S.},
67 journal = {The Journal of Supercomputing},
71 publisher = {Springer},
76 title = {{GPU}-Accelerated Preconditioned Iterative Linear Solvers},
77 author = {Li, R. and Saad, Y.},
78 journal = {The Journal of Supercomputing},
86 title = {Accelerating the {GMRES} Iterative Linear Solver of an Oil Reservoir Simulator using the Multi-Processing Power of Compute Unified Device Architecture of Graphics Cards},
87 author = {Ghaemian, N. and Abdollahzadeh, A. and Heinemann, Z. and Harrer, A. and Sharifi, M. and Heinemann, G.},
88 booktitle = {PARA 2008},
93 title = {Fast Conjugate Gradients with Multiple {GPU}s},
94 author = {Cevahir, A. and Nukada, A. and Matsuoka, S.},
95 booktitle = {Computational Science -- ICCS 2009},
99 publisher = {Springer},
104 author = {Ament, M. and Knittel, G. and Weiskopf, D. and Strasser, W.},
105 title = {A Parallel Preconditioned Conjugate Gradient Solver for the Poisson Problem on a Multi-{GPU} Platform},
106 booktitle = {Proceedings of the 2010 18th Euromicro Conference on Parallel, Distributed and Network-based Processing},
109 publisher = {IEEE Computer Society},
113 title = {Parallel Implementations of {FGMRES} for Solving Large, Sparse Non-symmetric Linear Systems},
114 journal = {Procedia Computer Science},
118 author = {DeVries, B. and Iannelli, J. and Trefftz, C. and O'Hearn, K.A. and Wolffe, G.},
122 title = {A Parallel Algebraic Multigrid Solver on Graphics Processing Units},
123 author = {Haase, G. and Liebmann, M. and Douglas, C.C. and Plank, G.},
124 booktitle = {High Performance Computing and Applications},
128 publisher = {Springer},
133 author = {G{\"o}ddeke, D. and Strzodka, R. and Mohd-Yusof, J. and McCormick, P. and Buijssen, S.H.M. and Grajewski, M. and Turek, S.},
134 title = {Exploring weak scalability for {FEM} calculations on a {GPU}-enhanced cluster},
135 journal = {Parallel Computing, Special issue: High-performance computing using accelerators},
140 publisher = {Elsevier},
144 author = {Bahi, J.M. and Couturier, R. and Ziane Khodja, L.},
145 title = {Parallel {GMRES} implementation for solving sparse linear systems on {GPU} clusters},
146 booktitle = {Proceedings of the 19th High Performance Computing Symposia},
150 publisher = {SCS International},
154 title = {Algebraic Multigrid Solver on Clusters of {CPU}s and {GPU}s},
155 author = {Neic, A. and Liebmann, M. and Haase, G. and Plank, G.},
156 booktitle = {Applied Parallel and Scientific Computing},
160 publisher = {Springer},
165 author = {Cevahir, A. and Nukada, A. and Matsuoka, S.},
166 title = {High Performance Conjugate Gradient Solver on Multi-{GPU} Clusters using Hypergraph Partitioning},
167 journal = {Computer Science - Research and Development},
168 publisher = {Springer Berlin / Heidelberg},
175 author = {Cataly{\"u}rek, U.V. and Aykanat, C.},
176 title = {{PaToH}: Partitioning Tool for Hypergraphs},
181 title={Parallel Sparse Linear Solver {GMRES} for {GPU} Clusters with Compression of Exchanged Data},
182 author={Bahi, J.M. and Couturier, R. and Ziane Khodja, L.},
183 booktitle={{Euro-Par} 2011: Parallel Processing Workshops},
188 publisher={Springer},
193 booktitle={Applied Parallel and Scientific Computing},
196 title={Impact of Asynchronism on {GPU} Accelerated Parallel Iterative Computations},
197 publisher={Springer},
198 author={Contassot-Vivier, S. and Jost, T. and Vialle, S.},
204 journal={Cluster Computing},
205 title={A communication reduction approach to iteratively solve large sparse linear systems on a {GPGPU} cluster},
206 publisher={Springer US},
207 author={Chen, C. and Taha, T.},
212 organization = {NVIDIA Corporation},
213 title = {{NVIDIA CUDA C} Programming Guide},
215 Note = {Version 4.0},
219 author = {Saad, Y. and Schultz, M.H.},
220 title = {{GMRES}: A Generalized Minimal Residual Algorithm for Solving Nonsymmetric Linear Systems},
221 journal = {SIAM J. Sci. Stat. Comput.},
226 publisher = {Society for Industrial and Applied Mathematics},
227 address = {Philadelphia, PA, USA},
231 author = {Paige, C.C. and Saunders, M.A.},
232 title = {Solution of Sparse Indefinite Systems of Linear Equations},
233 journal ={SIAM Journal on Numerical Analysis},
238 publisher = {Society for Industrial and Applied Mathematics},
243 author = {Arnoldi, W.},
244 title = {The Principle of Minimized Iteration in the Solution of the Matrix Eigenvalue Problem},
245 journal = {Quart. Appl. Math.},
253 title = {Iterative Methods for Sparse Linear Systems},
255 publisher = {Society for Industrial and Applied Mathematics},
256 address = {Philadelphia, PA, USA},
261 title = {{CUSP} Library},
262 Note = {\url{http://code.google.com/p/cusp-library/}},
265 @inproceedings{Bel09,
266 author = {Bell, N. and Garland, M.},
267 title = {Implementing Sparse Matrix-Vector Multiplication on Throughput-Oriented Processors},
272 address = {Portland, Oregon, USA},
276 title = {{NVIDIA} {CUDA} {C} {P}rogramming {G}uide},
277 organization = {NVIDIA Corporation},
278 howpublished = {Version 4.2},
279 note = {\url{http://developer.download.nvidia.com/compute/DevZone/docs/html/C/doc/CUDA_C_Programming_Guide.pdf}},
284 title = {{CUDA} {T}oolkit 4.2 {CUBLAS} {L}ibrary},
285 organization = {NVIDIA Corporation},
286 note = {\url{http://developer.download.nvidia.com/compute/DevZone/docs/html/CUDALibraries/doc/CUBLAS_Library.pdf}},
291 author = {Davis, T. and Hu, Y.},
292 title = {The {U}niversity of {F}lorida Sparse Matrix Collection},
294 note = {Digest, \url{http://www.cise.ufl.edu/research/sparse/matrices/}},
298 author = {Cataly{\"u}rek, U. and Aykanat, C.},
299 title = {Hypergraph-Partitioning-Based Decomposition for Parallel Sparse-Matrix Vector Multiplication},
300 journal = {IEEE Trans. Parallel Distrib. Syst.},
305 publisher = {IEEE Press},
309 author = {Karypis, G. and Kumar, V.},
310 title = {{hMETIS}: A Hypergraph Partitioning Package},
314 @inproceedings{Dev06,
315 author = {Devine, K.D. and Boman, E.G. and Heaphy, R.T. and Bisseling, R.H. and Cataly{\"u}rek, U.V.},
316 title = {Parallel Hypergraph Partitioning for Scientific Computing},
317 booktitle = {Proceedings of the 20th international conference on Parallel and distributed processing},
321 publisher = {IEEE Computer Society},
326 title = {{PHG} -- {P}arallel Hypergraph and Graph Partitioning with {Z}oltan},
327 note = {\url{http://www.cs.sandia.gov/Zoltan/ug_html/ug_alg_phg.html}},
332 title = {{Zoltan}: Parallel Partitioning, Load Balancing and Data-Management Services. User's Guide},
333 note = {\url{http://www.cs.sandia.gov/Zoltan/ug_html/ug.html}},