bib.bib

   1 @book{ref18,
   2   author    = {Bahi, J. M. and Contassot-Vivier, S. and Couturier, R.},
   3   title     = {Parallel Iterative Algorithms: From Sequential to Grid Computing},
   4   series    = {Numerical Analysis and Scientific Computing},
   5   publisher = {Chapman \& Hall/CRC},
   6   year      = {2008},
   7 }
   8
   9 @inproceedings{refa,
  10   author    = {Jost, T. and Contassot-Vivier, S. and Vialle, S.},
  11   title     = {An efficient multi-algorithms sparse linear solver for {GPU}s},
  12   booktitle = {International conference on parallel computing, ParCo2009},
  13   year      = {2009},
  14 }
  15
  16 @inproceedings{refd,
  17   author    = {Gaikwad, A. and Toke, I. M.},
  18   title     = {Parallel iterative linear solvers on {GPU}: a financial engineering case},
  19   booktitle = {Proceedings of the 2010 18th Euromicro Conference on Parallel, Distributed and Network-based Processing},
  20   pages     = {607--614},
  21   publisher = {IEEE Computer Society},
  22   year      = {2010},
  23 }
  24
  25 @article{refe,
  26   author  = {Weber, D. and Bender, J. and Schnoes, M. and Stork, A. and Fellner, D.},
  27   title   = {Efficient {GPU} data structures and methods to solve sparse linear systems in dynamics applications},
  28   journal = {Computer Graphics Forum},
  29   volume  = {32},
  30   pages   = {16--26},
  31   year    = {2013},
  32 }
  33
  34 @article{reff,
  35   author  = {Bolz, J. and Farmer, I. and Grinspun, E. and Schr{\"o}der, P.},
  36   title   = {Sparse matrix solvers on the {GPU}: conjugate gradients and multigrid},
  37   journal = {ACM Trans. Graph.},
  38   volume  = {22},
  39   number  = {3},
  40   pages   = {917--924},
  41   year    = {2003},
  42 }
  43
  44 @article{refj,
  45   author  = {Zhao, N. and Wang, X.},
  46   title   = {A parallel preconditioned {B}i-{C}onjugate {G}radient stabilized solver for the {P}oisson problem},
  47   journal = {Journal of Computers},
  48   volume  = {7},
  49   number  = {12},
  50   year    = {2012},
  51 }
  52
  53 @inproceedings{refb,
  54   author    = {Wang, M. and Klie, H. and Parashar, M. and Sudan, H.},
  55   title     = {Solving sparse linear systems on {NVIDIA} {T}esla {GPU}s},
  56   booktitle = {Computational Science -- ICCS 2009},
  57   series    = {LNCS},
  58   volume    = {5544},
  59   pages     = {864--873},
  60   publisher = {Springer},
  61   year      = {2009},
  62 }
  63
  64 @article{refc,
  65   author    = {Couturier, R. and Domas, S.},
  66   title     = {Sparse systems solving on {GPUs} with {GMRES}},
  67   journal   = {The Journal of Supercomputing},
  68   volume    = {59},
  69   number    = {3},
  70   pages     = {1504--1516},
  71   publisher = {Springer},
  72   year      = {2012},
  73 }
  74
  75 @article{refg,
  76   author  = {Li, R. and Saad, Y.},
  77   title   = {{GPU}-Accelerated Preconditioned Iterative Linear Solvers},
  78   journal = {The Journal of Supercomputing},
  79   volume  = {63},
  80   number  = {2},
  81   pages   = {443--466},
  82   year    = {2013},
  83 }
  84
  85 @inproceedings{refm,
  86   author    = {Ghaemian, N. and Abdollahzadeh, A. and Heinemann, Z. and Harrer, A. and Sharifi, M. and Heinemann, G.},
  87   title     = {Accelerating the {GMRES} Iterative Linear Solver of an Oil Reservoir Simulator using the Multi-Processing Power of {Compute Unified Device Architecture} of Graphics Cards},
  88   booktitle = {PARA 2008},
  89   year      = {2008},
  90 }
  91
  92 @inproceedings{refh,
  93   author    = {Cevahir, A. and Nukada, A. and Matsuoka, S.},
  94   title     = {Fast Conjugate Gradients with Multiple {GPU}s},
  95   booktitle = {Computational Science -- ICCS 2009},
  96   series    = {LNCS},
  97   volume    = {5544},
  98   pages     = {893--903},
  99   publisher = {Springer},
 100   year      = {2009},
 101 }
 102
 103 @inproceedings{refi,
 104   author    = {Ament, M. and Knittel, G. and Weiskopf, D. and Strasser, W.},
 105   title     = {A Parallel Preconditioned Conjugate Gradient Solver for the {Poisson} Problem on a Multi-{GPU} Platform},
 106   booktitle = {Proceedings of the 2010 18th Euromicro Conference on Parallel, Distributed and Network-based Processing},
 107   pages     = {583--592},
 108   publisher = {IEEE Computer Society},
 109   year      = {2010},
 110 }
 111
 112 @article{refk,
 113   author  = {DeVries, B. and Iannelli, J. and Trefftz, C. and O'Hearn, K. A. and Wolffe, G.},
 114   title   = {Parallel Implementations of {FGMRES} for Solving Large, Sparse Non-symmetric Linear Systems},
 115   journal = {Procedia Computer Science},
 116   volume  = {18},
 117   pages   = {491--500},
 118   year    = {2013},
 119 }
 120
 121 @inproceedings{refl,
 122   author    = {Haase, G. and Liebmann, M. and Douglas, C. C. and Plank, G.},
 123   title     = {A Parallel Algebraic Multigrid Solver on Graphics Processing Units},
 124   booktitle = {High Performance Computing and Applications},
 125   series    = {LNCS},
 126   volume    = {5938},
 127   pages     = {38--47},
 128   publisher = {Springer},
 129   year      = {2010},
 130 }
 131
 132 @article{refn,
 133   author    = {G{\"o}ddeke, D. and Strzodka, R. and Mohd-Yusof, J. and McCormick, P. and Buijssen, S. H. M. and Grajewski, M. and Turek, S.},
 134   title     = {Exploring weak scalability for {FEM} calculations on a {GPU}-enhanced cluster},
 135   journal   = {Parallel Computing, Special issue: High-performance computing using accelerators},
 136   volume    = {33},
 137   number    = {10--11},
 138   pages     = {685--699},
 139   publisher = {Elsevier},
 140   year      = {2007},
 141 }
 142
 143 @inproceedings{refo,
 144   author    = {Bahi, J. M. and Couturier, R. and Ziane Khodja, L.},
 145   title     = {Parallel {GMRES} implementation for solving sparse linear systems on {GPU} clusters},
 146   booktitle = {Proceedings of the 19th High Performance Computing Symposia},
 147   series    = {HPC '11},
 148   pages     = {12--19},
 149   publisher = {SCS International},
 150   year      = {2011},
 151 }
 152
 153 @inproceedings{refp,
 154   author    = {Neic, A. and Liebmann, M. and Haase, G. and Plank, G.},
 155   title     = {Algebraic Multigrid Solver on Clusters of {CPU}s and {GPU}s},
 156   booktitle = {Applied Parallel and Scientific Computing},
 157   series    = {LNCS},
 158   volume    = {7134},
 159   pages     = {389--398},
 160   publisher = {Springer},
 161   year      = {2012},
 162 }
 163
 164 @article{Cev10,
 165   author    = {Cevahir, A. and Nukada, A. and Matsuoka, S.},
 166   title     = {High Performance Conjugate Gradient Solver on Multi-{GPU} Clusters using Hypergraph Partitioning},
 167   journal   = {Computer Science - Research and Development},
 168   volume    = {25},
 169   pages     = {83--91},
 170   publisher = {Springer Berlin / Heidelberg},
 171   year      = {2010},
 172 }
 173
 174 @manual{Cata99,
 175   author = {Cataly{\"u}rek, U. V. and Aykanat, C.},
 176   title  = {{PaToH}: Partitioning Tool for Hypergraphs},
 177   year   = {1999},
 178 }
 179
 180 @inproceedings{refq,
 181   author    = {Bahi, J. M. and Couturier, R. and Ziane Khodja, L.},
 182   title     = {Parallel Sparse Linear Solver {GMRES} for {GPU} Clusters with Compression of Exchanged Data},
 183   booktitle = {{Euro-Par} 2011: Parallel Processing Workshops},
 184   series    = {LNCS},
 185   volume    = {7155},
 186   pages     = {471--480},
 187   publisher = {Springer},
 188   year      = {2012},
 189 }
 190
 191 @inproceedings{refr,
 192   author    = {Contassot-Vivier, S. and Jost, T. and Vialle, S.},
 193   title     = {Impact of Asynchronism on {GPU} Accelerated Parallel Iterative Computations},
 194   booktitle = {Applied Parallel and Scientific Computing},
 195   series    = {LNCS},
 196   volume    = {7133},
 197   pages     = {43--53},
 198   publisher = {Springer},
 199   year      = {2012},
 200 }
 201
 202 @article{refs,
 203   author    = {Chen, C. and Taha, T.},
 204   title     = {A communication reduction approach to iteratively solve large sparse linear systems on a {GPGPU} cluster},
 205   journal   = {Cluster Computing},
 206   pages     = {1--11},
 207   publisher = {Springer US},
 208   year      = {2013},
 209 }
 210
 211 @manual{Nvi10,
 212   title        = {{NVIDIA CUDA C} Programming Guide},
 213   organization = {NVIDIA Corporation},
 214   year         = {2010},
 215   note         = {Version 4.0},
 216 }
 217
 218 @article{Saa86,
 219   author    = {Saad, Y. and Schultz, M. H.},
 220   title     = {{GMRES}: A Generalized Minimal Residual Algorithm for Solving Nonsymmetric Linear Systems},
 221   journal   = {SIAM J. Sci. Stat. Comput.},
 222   volume    = {7},
 223   number    = {3},
 224   pages     = {856--869},
 225   publisher = {Society for Industrial and Applied Mathematics},
 226   address   = {Philadelphia, PA, USA},
 227   year      = {1986},
 228 }
 229
 230 @article{Pai75,
 231   author    = {Paige, C. C. and Saunders, M. A.},
 232   title     = {Solution of Sparse Indefinite Systems of Linear Equations},
 233   journal   = {SIAM Journal on Numerical Analysis},
 234   volume    = {12},
 235   number    = {4},
 236   pages     = {617--629},
 237   publisher = {Society for Industrial and Applied Mathematics},
 238   year      = {1975},
 239 }
 240
 241
 242 @article{Arn51,
 243   author  = {Arnoldi, W.},
 244   title   = {The Principle of Minimized Iteration in the Solution of the Matrix Eigenvalue Problem},
 245   journal = {Quart. Appl. Math.},
 246   volume  = {9},
 247   pages   = {17--29},
 248   year    = {1951},
 249 }
 250
 251 @book{Saa03,
 252   author    = {Saad, Y.},
 253   title     = {Iterative Methods for Sparse Linear Systems},
 254   publisher = {Society for Industrial and Applied Mathematics},
 255   address   = {Philadelphia, PA, USA},
 256   year      = {2003},
 257 }
 258
 259 @manual{CUSP,
 260   key   = {CUSP},
 261   title = {{CUSP} Library},
 262   note  = {\url{http://code.google.com/p/cusp-library/}},
 263 }
 264
 265 @inproceedings{Bel09,
 266   author    = {Bell, N. and Garland, M.},
 267   title     = {Implementing Sparse Matrix-Vector Multiplication on Throughput-Oriented Processors},
 268   booktitle = {SC'09},
 269   pages     = {1--11},
 270   publisher = {ACM},
 271   address   = {Portland, Oregon, USA},
 272   year      = {2009},
 273 }
 274
 275 @manual{ref19,
 276   title        = {{NVIDIA} {CUDA} {C} {P}rogramming {G}uide},
 277   organization = {NVIDIA Corporation},
 278   note         = {Version 4.2,
 279                   \url{http://developer.download.nvidia.com/compute/DevZone/docs/html/C/doc/CUDA_C_Programming_Guide.pdf}},
 280   year         = {2012},
 281 }
 282
 283 @manual{ref37,
 284   title        = {{CUDA} {T}oolkit 4.2 {CUBLAS} {L}ibrary},
 285   organization = {NVIDIA Corporation},
 286   year         = {2012},
 287   note         = {\url{http://developer.download.nvidia.com/compute/DevZone/docs/html/CUDALibraries/doc/CUBLAS_Library.pdf}},
 288 }
 289
 290 @misc{Dav97,
 291   author = {Davis, T. and Hu, Y.},
 292   title  = {The {U}niversity of {F}lorida Sparse Matrix Collection},
 293   note   = {Digest, \url{http://www.cise.ufl.edu/research/sparse/matrices/}},
 294   year   = {1997},
 295 }
 296
 297 @article{Cat99,
 298   author    = {Cataly{\"u}rek, U. and Aykanat, C.},
 299   title     = {Hypergraph-Partitioning-Based Decomposition for Parallel Sparse-Matrix Vector Multiplication},
 300   journal   = {IEEE Trans. Parallel Distrib. Syst.},
 301   volume    = {10},
 302   number    = {7},
 303   pages     = {673--693},
 304   publisher = {IEEE Press},
 305   year      = {1999},
 306 }
 307
 308 @manual{Kar98,
 309   title  = {{hMETIS}: A Hypergraph Partitioning Package},
 310   author = {Karypis, G. and Kumar, V.},
 311   year   = {1998},
 312 }
 313
 314 @inproceedings{Dev06,
 315   author    = {Devine, K. D. and Boman, E. G. and Heaphy, R. T. and Bisseling, R. H. and Cataly{\"u}rek, U. V.},
 316   title     = {Parallel Hypergraph Partitioning for Scientific Computing},
 317   booktitle = {Proceedings of the 20th international conference on Parallel and distributed processing},
 318   series    = {IPDPS'06},
 319   pages     = {124},
 320   publisher = {IEEE Computer Society},
 321   year      = {2006},
 322 }
 323
 324 @manual{ref20,
 325   key   = {PHG},
 326   title = {{PHG} - {P}arallel Hypergraph and Graph Partitioning with {Z}oltan},
 327   note  = {\url{http://www.cs.sandia.gov/Zoltan/ug_html/ug_alg_phg.html}},
 328 }
 329
 330 @manual{ref21,
 331   key   = {Zoltan},
 332   title = {Zoltan: Parallel Partitioning, Load Balancing and Data-Management Services. User's Guide.},
 333   note  = {\url{http://www.cs.sandia.gov/Zoltan/ug_html/ug.html}},
 334 }
 335
 336
 337
 338
 339
 340
 341