BookGPU/Chapters/chapter19/biblio.bib

   1 @article{ch19:matrix-collection,
   2  author = {Duff, I. S. and Grimes, R. G. and Lewis, J. G.},
   3  title = {Sparse matrix test problems},
   4  journal = {ACM Trans. Math. Softw.},
   5  issue_date = {March 1989},
   6  volume = {15},
   7  number = {1},
   8  month = mar,
   9  year = {1989},
  10  pages = {1--14},
  11  acmid = {62043},
  12  publisher = {ACM},
  13  address = {New York, NY, USA},
  14 }
  15
  16 @inproceedings{ch19:spmv-iccs,
  17   author = {Dang, H.-V. and Schmidt, B.},
  18   title = {{The Sliced COO format for Sparse Matrix-Vector Multiplication on CUDA-enabled GPUs}},
  19   booktitle = {Proc. ICCS, Procedia Vol. 9},
  20   pages = {57--66},
  21   year = {2012}
  22 }
  23
  24 @article{ch19:spmv-ccpe,
  25   author    = {B. Schmidt and
  26                H. Aribowo and
  27                H.-V. Dang},
  28   title     = {{Iterative Sparse Matrix-Vector Multiplication for accelerating
  29                the Block Wiedemann Algorithm over GF(2) on Multi-graphics
  30                Processing Unit Systems}},
  31   journal   = {Concurrency and Computation: Practice and Experience},
  32   volume    = {25},
  33   number    = {4},
  34   year      = {2013},
  35   pages     = {586--603},
  36 }
  37
  38 @misc{ch19:matview,
  39   author = { J. Kohl },
  40   title  = {MatView: Scalable Sparse Matrix Viewer},
  41   year   = {2008},
  42   url    = {http://www.csm.ornl.gov/~kohl/MatView/},
  43 }
  44
  45 @inproceedings{ch19:nvidia-spmv,
  46  author = {Bell, N. and Garland, M.},
  47  title = {Implementing sparse matrix-vector multiplication on throughput-oriented processors},
  48  booktitle = {SC '09: Proceedings of the Conference on High Performance Computing Networking, Storage and Analysis},
  49  year = {2009},
  50  isbn = {978-1-60558-744-8},
  51  pages = {1--11},
  52  location = {Portland, Oregon},
  53  doi = {10.1145/1654059.1654078},
  54  publisher = {ACM},
  55  address = {New York, NY, USA},
  56 }
  57
  58 @article{ch19:bellpack,
  59  author = {Choi, J. W. and Singh, A. and Vuduc, R. W.},
  60  title = {{Model-driven autotuning of sparse matrix-vector multiply on GPUs}},
  61  journal = {SIGPLAN Not.},
  62  volume = {45},
  63  number = {5},
  64  month = jan,
  65  year = {2010},
  66  issn = {0362-1340},
  67  pages = {115--126},
  68  numpages = {12},
  69  acmid = {1693471},
  70  publisher = {ACM},
  71  address = {New York, NY, USA},
  72  keywords = {gpu, performance modeling, sparse matrix-vector multiplication},
  73 }
  74
  75 @inproceedings{ch19:europar,
  76   author    = {Bertil Schmidt and
  77                Hans Aribowo and
  78                Hoang-Vu Dang},
  79   title     = { {Iterative Sparse Matrix-Vector Multiplication for Integer
  80                Factorization on GPUs} },
  81   booktitle = {Euro-Par (2)},
  82   year      = {2011},
  83   pages     = {413--424},
  84   ee        = {http://dx.doi.org/10.1007/978-3-642-23397-5_41},
  85   crossref  = {ch19:DBLP:conf/europar/2011-2},
  86   bibsource = {DBLP, http://dblp.uni-trier.de}
  87 }
  88
  89 @proceedings{ch19:DBLP:conf/europar/2011-2,
  90   title = {Euro-Par 2011 Parallel Processing - 17th International Conference,
  91            Euro-Par 2011, Bordeaux, France, August 29 - September 2,
  92            2011, Proceedings, Part II},
  93   booktitle = {Euro-Par (2)},
  94   editor = {Emmanuel Jeannot and
  95             Raymond Namyst and
  96             Jean Roman},
  97   series = {Lecture Notes in Computer Science},
  98   volume = {6853},
  99   publisher = {Springer},
 100   year = {2011},
 101   isbn = {978-3-642-23396-8},
 102   ee = {http://dx.doi.org/10.1007/978-3-642-23397-5},
 103   bibsource = {DBLP, http://dblp.uni-trier.de},
 104 }
 105
 106 @article{ch19:Thome:subqad,
 107  author = {Thom{\'e}, E.},
 108  title = { {Subquadratic Computation of Vector Generating Polynomials and Improvement of the Block Wiedemann Algorithm} },
 109  journal = {J. Symb. Comput.},
 110  volume = {33},
 111  number = {5},
 112  month = may,
 113  year = {2002},
 114  issn = {0747-7171},
 115  pages = {757--775},
 116  numpages = {19},
 117  url = {http://portal.acm.org/citation.cfm?id=612306.612319},
 118  doi = {10.1006/jsco.2002.0533},
 119  acmid = {612319},
 120  publisher = {Academic Press, Inc.},
 121  address = {Duluth, MN, USA},
 122 }
 123
 124 @article{ch19:nfs,
 125   author  = {Peter L. Montgomery},
 126   title   = {A Survey of Modern Integer Factorization Algorithms},
 127   journal = {CWI Quarterly},
 128   volume  = {7},
 129   pages   = {337--366},
 130   year    = {1994},
 131 }
 132
 133 @article{ch19:wie,
 134  author = {Wiedemann, D. H.},
 135  title = {Solving sparse linear equations over finite fields},
 136  journal = {IEEE Trans. Inf. Theor.},
 137  volume = {32},
 138  number = {1},
 139  month = jan,
 140  year = {1986},
 141  issn = {0018-9448},
 142  pages = {54--62},
 143  numpages = {9},
 144  url = {http://dl.acm.org/citation.cfm?id=13738.13744},
 145  doi = {10.1109/TIT.1986.1057137},
 146  acmid = {13744},
 147  publisher = {IEEE Press},
 148  address = {Piscataway, NJ, USA},
 149 }
 150
 151 @inproceedings{ch19:wie-guass,
 152  author = {LaMacchia, Brian A. and Odlyzko, Andrew M.},
 153  title = {Solving Large Sparse Linear Systems over Finite Fields},
 154  booktitle = {Proceedings of the 10th Annual International Cryptology Conference on Advances in Cryptology},
 155  series = {CRYPTO '90},
 156  year = {1991},
 157  isbn = {3-540-54508-5},
 158  pages = {109--133},
 159  numpages = {25},
 160  url = {http://dl.acm.org/citation.cfm?id=646755.705355},
 161  acmid = {705355},
 162  publisher = {Springer-Verlag},
 163  address = {London, UK},
 164 }
 165
 166 @book{ch19:book:mpi,
 167     author = {Quinn, Michael},
 168     edition = {First},
 169     howpublished = {Hardcover},
 170     isbn = {0072822562},
 171     month = jun,
 172     posted-at = {2010-04-02 13:14:26},
 173     priority = {2},
 174     publisher = {McGraw-Hill Science/Engineering/Math},
 175     title = {{Parallel Programming in C with MPI and OpenMP}},
 176     year = {2003}
 177 }
 178
 179 @inproceedings{ch19:mpi:col,
 180     author = {Rajeev Thakur},
 181     title = {Improving the performance of collective operations in MPICH},
 182     booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing Interface, 10th European PVM/MPI User's Group Meeting, LNCS 2840},
 183     year = {2003},
 184     pages = {257--267},
 185     publisher = {Springer Verlag}
 186 }
 187
 188 @inproceedings{ch19:reduce_tree,
 189   author    = {Pitch Patarasuk and Xin Yuan},
 190   title     = {Bandwidth Efficient Allreduce Operation on Tree Topologies},
 191   booktitle = {IEEE IPDPS Workshop on High-Level Parallel Programming Models and Supportive Environments},
 192   year      = {2007},
 193 }
 194
 195 @inproceedings{ch19:aoki,
 196   author    = {Aoki, K. and Shimoyama, T. and Ueda, H.},
 197   title     = {{Experiments on the Linear Algebra Step in the Number Field Sieve}},
 198   booktitle = {Proceedings of the Security 2nd international conference on Advances in information and computer security},
 199   series    = {IWSEC'07},
 200   location  = {Nara, Japan},
 201   pages     = {58--73},
 202   numpages  = {16},
 203   year      = {2007},
 204   publisher = {Springer-Verlag},
 205   address   = {Berlin, Heidelberg},
 206   isbn      = {3-540-75650-7, 978-3-540-75650-7},
 207   acmid     = {1778909},
 208   _url      = {http://portal.acm.org/citation.cfm?id=1778902.1778909},
 209   keywords  = {block Lanczos, ethernet, integer factoring, number field sieve, parallel computation},
 210 }
 211
 212 @InProceedings{ch19:kilobit,
 213 author = {K. Aoki and J. Franke and T. Kleinjung and A. K. Lenstra and D. A. Osvik},
 214 title = {{A Kilobit Special Number Field Sieve Factorization}},
 215 booktitle = {ASIACRYPT},
 216 year = {2007}
 217 }
 218
 219 @techreport{ch19:nvidia,
 220   author      = {N. Bell and M. Garland},
 221   title       = {{Efficient Sparse Matrix-Vector Multiplication on {CUDA}}},
 222   institution = {NVIDIA Corporation},
 223   type        = {NVIDIA Technical Report},
 224   number      = {NVR-2008-004},
 225   month       = dec,
 226   year        = {2008},
 227 }
 228
 229 @techreport{ch19:rsa170,
 230   author      = {Dominik Bonenberger and Martin Krone},
 231   title       = {{Factorization of RSA-170}},
 232   institution = {Ostfalia University of Applied Sciences},
 233   url         = {http://public.rz.fh-wolfenbuettel.de/~kronema/pdf/rsa170.pdf},
 234   year        = {2010},
 235 }
 236
 237 @article{ch19:exactspmv,
 238   title = {{Exact Sparse Matrix-Vector Multiplication on GPU's and Multicore
 239            Architectures}},
 240   author = {B. Boyer and
 241             J.-G. Dumas and
 242             P. Giorgi},
 243   journal = {CoRR},
 244   volume = {abs/1004.3719},
 245   year = {2010},
 246   ee = {http://arxiv.org/abs/1004.3719},
 247   bibsource = {DBLP, http://dblp.uni-trier.de},
 248 }
 249
 250 @article{ch19:bw,
 251   author  = {D. Coppersmith},
 252   title   = {{Solving Homogeneous Linear Equations Over GF(2) via Block Wiedemann Algorithm}},
 253   journal = {Mathematics of Computation},
 254   volume  = {62},
 255   year    = {1994},
 256   doi     = {10.2307/2153413},
 257   masid   = {1254705},
 258 }
 259
 260 @InProceedings{ch19:hwang,
 261   author    = {W. Hwang and
 262                D. Kim},
 263   title     = {{Load Balanced Block Lanczos Algorithm over GF(2) for Factorization
 264                of Large Keys}},
 265   booktitle = {HiPC},
 266   year      = {2006},
 267   pages     = {375--386},
 268   ee        = {http://dx.doi.org/10.1007/11945918_38},
 269   bibsource = {DBLP, http://dblp.uni-trier.de}
 270 }
 271
 272 @InProceedings{ch19:rsa768,
 273 author = {Kleinjung, T. and others},
 274 title = {{Factorization of a 768-Bit RSA Modulus}},
 275 booktitle = {International Cryptology Conference},
 276 year = {2010},
 277 pages = {333--350},
 278 doi = {10.1007/978-3-642-14623-7_18},
 279 masid = {13669015}
 280 }
 281
 282 @article{ch19:hetero768,
 283     author = {Kleinjung, T. and others},
 284     HAL_ID = {inria-00535765},
 285     _URL = {http://hal.inria.fr/inria-00535765/en/},
 286     title = {A {Heterogeneous} {Computing} {Environment} to {Solve} the 768-bit {RSA} {Challenge}},
 287     language = {{A}nglais},
 288     affiliation = {{L}aboratory for {C}ryptologic {A}lgorithms - {LACAL} - {\'E}cole {P}olytechnique {F}{\'e}d{\'e}rale de {L}ausanne - {NTT} {I}nformation {S}haring {P}latform {L}aboratories - {ISL} - {N}ippon {T}elegraph \& {T}elephone {C}orporation - {NTT} - {S}ilverbrook {R}esearch - silverbrook research - {D}epartment of {M}athematics - {U}niversity of {B}onn - {B}onn {U}niversit{\"a}t - {U}niversity of {B}onn - {CARAMEL} - {INRIA} {N}ancy - {G}rand {E}st / {LORIA} - {INRIA} - {CNRS} : {UMR}7503 - {U}niversit{\'e} {H}enri {P}oincar{\'e} - {N}ancy {I} - {U}niversit{\'e} {N}ancy {II} - {I}nstitut {N}ational {P}olytechnique de {L}orraine - {EPFL} / {D}omaine {IT} - {DIT} - {\'E}cole {P}olytechnique {F}{\'e}d{\'e}rale de {L}ausanne - {M}icrosoft {R}esearch - {M}icrosoft - {S}cientific {C}omputing and {C}ontrol {T}heory - {MAS}2 - {CWI} - {S}wiss {I}nstitute of {B}ioinformatics - {L}ausanne - {SIB} - {S}wiss {I}nstitute of {B}ioinformatics },
 289     publisher = {Springer-Verlag},
 290     journal = {Cluster Computing},
 291     audience = {internationale },
 292     year = {2010},
 293 }
 294
 295 @inproceedings{ch19:grid,
 296     HAL_ID = {inria-00502899},
 297     _URL = {http://hal.inria.fr/inria-00502899/en/},
 298     title = {{Using a Grid Platform for Solving Large Sparse Linear Systems over {GF}(2)}},
 299     author = {Kleinjung, T. and Nussbaum, L. and Thom{\'e}, E.},
 300     language = {{A}nglais},
 301     affiliation = {{L}aboratory for {C}ryptologic {A}lgorithms - {LACAL} - {\'E}cole {P}olytechnique {F}{\'e}d{\'e}rale de {L}ausanne - {ALGORILLE} - {INRIA} {L}orraine - {LORIA} - {INRIA} - {CNRS} : {UMR}7503 - {U}niversit{\'e} {H}enri {P}oincar{\'e} - {N}ancy {I} - {U}niversit{\'e} {N}ancy {II} - {I}nstitut {N}ational {P}olytechnique de {L}orraine - {CARAMEL} - {INRIA} {N}ancy - {G}rand {E}st / {LORIA} - {INRIA} - {CNRS} : {UMR}7503 - {U}niversit{\'e} {H}enri {P}oincar{\'e} - {N}ancy {I} - {U}niversit{\'e} {N}ancy {II} - {I}nstitut {N}ational {P}olytechnique de {L}orraine },
 302     booktitle = {11th {ACM}/{IEEE} International Conference on Grid Computing (Grid 2010)},
 303     address = {{B}russels {B}elgique },
 304     audience = {internationale },
 305     month = oct,
 306     year = {2010},
 307 }
 308
 309 @inproceedings{ch19:sle,
 310   author    = {A. Monakov and
 311                A. Lokhmotov and
 312                A. Avetisyan},
 313   title     = {{Automatically Tuning Sparse Matrix-Vector Multiplication
 314                for GPU Architectures}},
 315   booktitle = {HiPEAC},
 316   year      = {2010},
 317   pages     = {111--125},
 318   ee        = {http://dx.doi.org/10.1007/978-3-642-11515-8_10},
 319   bibsource = {DBLP, http://dblp.uni-trier.de}
 320 }
 321
 322 @inproceedings{ch19:bl,
 323   author    = {Peter L. Montgomery},
 324   title     = {{A Block Lanczos Algorithm for Finding Dependencies Over GF(2)}},
 325   booktitle = {Theory and Application of Cryptographic Techniques},
 326   pages     = {106--120},
 327   year      = {1995},
 328   masid     = {674965},
 329 }
 330
 331 @article{ch19:cuda,
 332  author = {Nickolls, John and Buck, Ian and Garland, Michael and Skadron, Kevin},
 333  title = {{Scalable Parallel Programming with CUDA}},
 334  journal = {Queue},
 335  issue_date = {March/April 2008},
 336  volume = {6},
 337  number = {2},
 338  month = mar,
 339  year = {2008},
 340  issn = {1542-7730},
 341  pages = {40--53},
 342  numpages = {14},
 343  _url = {http://doi.acm.org/10.1145/1365490.1365500},
 344  doi = {10.1145/1365490.1365500},
 345  acmid = {1365500},
 346  publisher = {ACM},
 347  address = {New York, NY, USA},
 348 }
 349
 350 @article{ch19:gpu,
 351  author = {Nickolls, John and Dally, William J.},
 352  title = {{The GPU Computing Era}},
 353  journal = {IEEE Micro},
 354  volume = {30},
 355  number = {2},
 356  month = mar,
 357  year = {2010},
 358  issn = {0272-1732},
 359  pages = {56--69},
 360  numpages = {14},
 361  acmid = {1804055},
 362  publisher = {IEEE Computer Society Press},
 363  address = {Los Alamitos, CA, USA},
 364  keywords = {GPU computing, CUDA, scalable parallel computing, heterogeneous CPU+GPU coprocessing, Tesla GPU architecture, Fermi GPU architecture, NVIDIA},
 365 }
 366
 367 @misc{ch19:cuda-guide,
 368   author = {NVIDIA},
 369   title  = {{CUDA C Programming Guide}},
 370   year   = {2011},
 371   url    = {http://developer.download.nvidia.com/compute/DevZone/docs/html/C/doc/CUDA_C_Programming_Guide.pdf},
 372 }
 373
 374 @misc{ch19:p-reduction,
 375   author = {Mark Harris},
 376   title  = {{Optimizing parallel reduction in CUDA}},
 377   year   = {2007},
 378   url    = {http://developer.download.nvidia.com/compute/cuda/1_1/Website/projects/reduction/doc/reduction.pdf},
 379 }
 380
 381 @misc{ch19:rsa190-factored,
 382   title = {{RSA190 factored}},
 383   year  = {2010},
 384   url   = {http://www.mersenneforum.org/showthread.php?t=14177},
 385 }
 386
 387 @misc{ch19:cadonfs,
 388   author = {Gaudry, P. and others},
 389   title = {{CADO-NFS}},
 390   url = {http://cado-nfs.gforge.inria.fr/},
 391   year = {2010}
 392 }
 393
 394 @misc{ch19:cusp,
 395   author = {N. Bell and M. Garland},
 396   title  = {{Cusp: Generic Parallel Algorithms for Sparse Matrix and Graph Computations}},
 397   note   = {Version 0.1.0},
 398   url    = {http://cusp-library.googlecode.com},
 399   year   = {2010},
 400 }
 401
 402 @misc{ch19:msieve,
 403   author = {Jason Papadopoulos},
 404   title  = {{Msieve}},
 405   year   = {2010},
 406   url    = {http://sourceforge.net/projects/msieve/},
 407 }