1 @article{ch19:matrix-collection,
2 author = {Duff, I. S. and Grimes, Roger G. and Lewis, John G.},
3 title = {Sparse matrix test problems},
4 journal = {ACM Trans. Math. Softw.},
5 issue_date = {March 1989},
13 address = {New York, NY, USA},
16 @Conference{ch19:spmv-iccs,
17 author = {Dang, Hoang-Vu and Schmidt, Bertil},
18 title = {{The Sliced COO format for Sparse Matrix-Vector Multiplication on CUDA-enabled GPUs}},
21 booktitle = {Proc. ICCS, Procedia Vol. 9}
24 @article{ch19:spmv-ccpe,
25 author = {Bertil Schmidt and
28 title = {{Iterative Sparse Matrix-Vector Multiplication for accelerating
29 the Block Wiedemann Algorithm over GF(2) on Multi-graphics
30 Processing Unit Systems}},
31 journal = {Concurrency and Computation: Practice and Experience},
39 author = { Jim Kohl },
40 url = {http://www.csm.ornl.gov/~kohl/MatView/},
41 title = {MatView: Scalable Sparse Matrix Viewer},
45 @inproceedings{ch19:nvidia-spmv,
46 author = {Bell, Nathan and Garland, Michael},
47 title = {Implementing sparse matrix-vector multiplication on throughput-oriented processors},
48 booktitle = {SC '09: Proceedings of the Conference on High Performance Computing Networking, Storage and Analysis},
50 isbn = {978-1-60558-744-8},
52 location = {Portland, Oregon},
53 doi = {10.1145/1654059.1654078},
55 address = {New York, NY, USA},
58 @article{ch19:bellpack,
59 author = {Choi, Jee W. and Singh, Amik and Vuduc, Richard W.},
60 title = {{Model-driven autotuning of sparse matrix-vector multiply on GPUs}},
61 journal = {SIGPLAN Not.},
71 address = {New York, NY, USA},
72 keywords = {gpu, performance modeling, sparse matrix-vector multiplication},
75 @inproceedings{ch19:europar,
76 author = {Bertil Schmidt and
79 title = { {Iterative Sparse Matrix-Vector Multiplication for Integer
80 Factorization on GPUs} },
81 booktitle = {Euro-Par (2)},
84 ee = {http://dx.doi.org/10.1007/978-3-642-23397-5_41},
85 crossref = {ch19:DBLP:conf/europar/2011-2},
86 bibsource = {DBLP, http://dblp.uni-trier.de}
89 @proceedings{ch19:DBLP:conf/europar/2011-2,
90 editor = {Emmanuel Jeannot and
93 title = {Euro-Par 2011 Parallel Processing - 17th International Conference,
94 Euro-Par 2011, Bordeaux, France, August 29 - September 2,
95 2011, Proceedings, Part II},
96 booktitle = {Euro-Par (2)},
97 publisher = {Springer},
98 series = {Lecture Notes in Computer Science},
101 isbn = {978-3-642-23396-8},
102 ee = {http://dx.doi.org/10.1007/978-3-642-23397-5},
103 bibsource = {DBLP, http://dblp.uni-trier.de}
106 @article{ch19:Thome:subqad,
107 author = {Thom{\'e}, Emmanuel},
108 title = { {Subquadratic Computation of Vector Generating Polynomials and Improvement of the Block Wiedemann Algorithm} },
109 journal = {J. Symb. Comput.},
117 url = {http://portal.acm.org/citation.cfm?id=612306.612319},
118 doi = {10.1006/jsco.2002.0533},
120 publisher = {Academic Press, Inc.},
121 address = {Duluth, MN, USA},
125 author = {Peter L. Montgomery},
126 title = {A Survey of Modern Integer Factorization Algorithms},
127 journal = {CWI Quarterly},
134 author = {Wiedemann, D. H.},
135 title = {Solving sparse linear equations over finite fields},
136 journal = {IEEE Trans. Inf. Theor.},
144 url = {http://dl.acm.org/citation.cfm?id=13738.13744},
145 doi = {10.1109/TIT.1986.1057137},
147 publisher = {IEEE Press},
148 address = {Piscataway, NJ, USA},
151 @inproceedings{ch19:wie-guass,
152 author = {LaMacchia, Brian A. and Odlyzko, Andrew M.},
153 title = {Solving Large Sparse Linear Systems over Finite Fields},
154 booktitle = {Proceedings of the 10th Annual International Cryptology Conference on Advances in Cryptology},
155 series = {CRYPTO '90},
157 isbn = {3-540-54508-5},
160 url = {http://dl.acm.org/citation.cfm?id=646755.705355},
162 publisher = {Springer-Verlag},
163 address = {London, UK},
167 author = {Quinn, Michael},
169 howpublished = {Hardcover},
172 posted-at = {2010-04-02 13:14:26},
174 publisher = {McGraw-Hill Science/Engineering/Math},
175 title = {{Parallel Programming in C with MPI and OpenMP}},
179 @INPROCEEDINGS{ch19:mpi:col,
180 author = {Rajeev Thakur},
181 title = {Improving the performance of collective operations in MPICH},
182 booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing Interface. Number 2840 in LNCS, Springer Verlag (2003) 257--267 10th European PVM/MPI User's Group Meeting},
185 publisher = {Springer Verlag}
188 @INPROCEEDINGS{ch19:reduce_tree,
189 author = {Pitch Patarasuk and Xin Yuan},
190 title = {Bandwidth Efficient Allreduce Operation on Tree Topologies},
191 booktitle = {IEEE IPDPS Workshop on High-Level Parallel Programming Models and Supportive Environments},
195 @InProceedings{ch19:aoki,
196 author = {Aoki, Kazumaro and Shimoyama, Takeshi and Ueda, Hiroki},
197 title = {{Experiments on the Linear Algebra Step in the Number Field Sieve}},
198 booktitle = {Proceedings of the 2nd international conference on Advances in information and computer security},
201 isbn = {3-540-75650-7, 978-3-540-75650-7},
202 location = {Nara, Japan},
205 _url = {http://portal.acm.org/citation.cfm?id=1778902.1778909},
207 publisher = {Springer-Verlag},
208 address = {Berlin, Heidelberg},
209 keywords = {block Lanczos, ethernet, integer factoring, number field sieve, parallel computation},
212 @InProceedings{ch19:kilobit,
213 author = {Kazumaro Aoki and Jens Franke and Thorsten Kleinjung and Arjen K. Lenstra and Dag Arne Osvik},
214 title = {{A Kilobit Special Number Field Sieve Factorization}},
215 booktitle = {ASIACRYPT},
219 @techreport{ch19:nvidia,
220 author = {Nathan Bell and Michael Garland},
221 title = {{Efficient Sparse Matrix-Vector Multiplication on {CUDA}}},
224 institution = {NVIDIA Corporation},
225 type = {NVIDIA Technical Report},
226 number = {NVR-2008-004},
229 @TechReport{ch19:rsa170,
230 author = {Dominik Bonenberger and Martin Krone},
231 title = {{Factorization of RSA-170}},
232 institution = {Ostfalia University of Applied Sciences},
234 url = {http://public.rz.fh-wolfenbuettel.de/~kronema/pdf/rsa170.pdf},
237 @article{ch19:exactspmv,
238 author = {Brice Boyer and
239 Jean-Guillaume Dumas and
241 title = {{Exact Sparse Matrix-Vector Multiplication on GPU's and Multicore
244 volume = {abs/1004.3719},
246 ee = {http://arxiv.org/abs/1004.3719},
247 bibsource = {DBLP, http://dblp.uni-trier.de}
251 author = {Don Coppersmith},
252 title = {{Solving Homogeneous Linear Equations Over GF(2) via Block Wiedemann Algorithm}},
253 journal = {Mathematics of Computation},
256 doi = {10.2307/2153413},
260 @InProceedings{ch19:hwang,
261 author = {Wontae Hwang and
263 title = {{Load Balanced Block Lanczos Algorithm over GF(2) for Factorization
268 ee = {http://dx.doi.org/10.1007/11945918_38},
269 bibsource = {DBLP, http://dblp.uni-trier.de}
272 @InProceedings{ch19:rsa768,
273 author = {Kleinjung, Thorsten and others},
274 title = {{Factorization of a 768-Bit RSA Modulus}},
275 booktitle = {International Cryptology Conference},
278 doi = {10.1007/978-3-642-14623-7_18},
282 @article{ch19:hetero768,
283 author = {Kleinjung, Thorsten and others},
284 HAL_ID = {inria-00535765},
285 _URL = {http://hal.inria.fr/inria-00535765/en/},
286 title = { {A} {H}eterogeneous {C}omputing {E}nvironment to {S}olve the 768-bit {RSA} {C}hallenge},
287 language = {{A}nglais},
288 affiliation = {{L}aboratory for {C}ryptologic {A}lgorithms - {LACAL} - {\'E}cole {P}olytechnique {F}{\'e}d{\'e}rale de {L}ausanne - {NTT} {I}nformation {S}haring {P}latform {L}aboratories - {ISL} - {N}ippon {T}elegraph \& {T}elephone {C}orporation - {NTT} - {S}ilverbrook {R}esearch - silverbrook research - {D}epartment of {M}athematics - {U}niversity of {B}onn - {B}onn {U}niversit{\"a}t - {U}niversity of {B}onn - {CARAMEL} - {INRIA} {N}ancy - {G}rand {E}st / {LORIA} - {INRIA} - {CNRS} : {UMR}7503 - {U}niversit{\'e} {H}enri {P}oincar{\'e} - {N}ancy {I} - {U}niversit{\'e} {N}ancy {II} - {I}nstitut {N}ational {P}olytechnique de {L}orraine - {EPFL} / {D}omaine {IT} - {DIT} - {\'E}cole {P}olytechnique {F}{\'e}d{\'e}rale de {L}ausanne - {M}icrosoft {R}esearch - {M}icrosoft - {S}cientific {C}omputing and {C}ontrol {T}heory - {MAS}2 - {CWI} - {S}wiss {I}nstitute of {B}ioinformatics - {L}ausanne - {SIB} - {S}wiss {I}nstitute of {B}ioinformatics },
289 publisher = {{S}pringer-{V}erlag },
290 journal = {{C}luster {C}omputing },
291 audience = {internationale },
295 @inproceedings{ch19:grid,
296 HAL_ID = {inria-00502899},
297 _URL = {http://hal.inria.fr/inria-00502899/en/},
298 title = { {Using a Grid Platform for Solving Large Sparse Linear Systems over {GF}(2)}},
299 author = {{K}leinjung, {T}horsten and {N}ussbaum, {L}ucas and {T}hom{\'e}, {E}mmanuel},
300 language = {{A}nglais},
301 affiliation = {{L}aboratory for {C}ryptologic {A}lgorithms - {LACAL} - {\'E}cole {P}olytechnique {F}{\'e}d{\'e}rale de {L}ausanne - {ALGORILLE} - {INRIA} {L}orraine - {LORIA} - {INRIA} - {CNRS} : {UMR}7503 - {U}niversit{\'e} {H}enri {P}oincar{\'e} - {N}ancy {I} - {U}niversit{\'e} {N}ancy {II} - {I}nstitut {N}ational {P}olytechnique de {L}orraine - {CARAMEL} - {INRIA} {N}ancy - {G}rand {E}st / {LORIA} - {INRIA} - {CNRS} : {UMR}7503 - {U}niversit{\'e} {H}enri {P}oincar{\'e} - {N}ancy {I} - {U}niversit{\'e} {N}ancy {II} - {I}nstitut {N}ational {P}olytechnique de {L}orraine },
302 booktitle = {11th {ACM}/{IEEE} {I}nternational {C}onference on {G}rid {C}omputing ({G}rid 2010) },
303 address = {{B}russels, {B}elgium },
304 audience = {internationale },
309 @inproceedings{ch19:sle,
310 author = {Alexander Monakov and
313 title = {{Automatically Tuning Sparse Matrix-Vector Multiplication
314 for GPU Architectures}},
315 booktitle = {HiPEAC},
318 ee = {http://dx.doi.org/10.1007/978-3-642-11515-8_10},
319 bibsource = {DBLP, http://dblp.uni-trier.de}
322 @inproceedings{ch19:bl,
323 author = {Peter L. Montgomery},
324 title = {{A Block Lanczos Algorithm for Finding Dependencies Over GF(2)}},
325 booktitle = {Theory and Application of Cryptographic Techniques},
332 author = {Nickolls, John and Buck, Ian and Garland, Michael and Skadron, Kevin},
333 title = {{Scalable Parallel Programming with CUDA}},
335 issue_date = {March/April 2008},
343 _url = {http://doi.acm.org/10.1145/1365490.1365500},
344 doi = {10.1145/1365490.1365500},
347 address = {New York, NY, USA},
351 author = {Nickolls, John and Dally, William J.},
352 title = {{The GPU Computing Era}},
353 journal = {IEEE Micro},
362 publisher = {IEEE Computer Society Press},
363 address = {Los Alamitos, CA, USA},
364 keywords = {GPU computing, CUDA, scalable parallel computing, heterogeneous CPU+GPU coprocessing, Tesla GPU architecture, Fermi GPU architecture, NVIDIA.},
367 @misc{ch19:cuda-guide,
369 url = {http://developer.download.nvidia.com/compute/DevZone/docs/html/C/doc/CUDA_C_Programming_Guide.pdf},
370 title = {{CUDA C Programming Guide}},
374 @misc{ch19:p-reduction,
375 author = {Mark Harris},
376 url = {http://developer.download.nvidia.com/compute/cuda/1_1/Website/projects/reduction/doc/reduction.pdf},
377 title = {{Optimizing parallel reduction in CUDA}},
381 @misc{ch19:rsa190-factored,
382 url = {http://www.mersenneforum.org/showthread.php?t=14177},
383 title = {{RSA190 factored}},
388 author = {Gaudry, P. and others},
389 title = {{CADO-NFS}},
390 url = {http://cado-nfs.gforge.inria.fr/},
395 author = "Nathan Bell and Michael Garland",
396 title = {{Cusp: Generic Parallel Algorithms for Sparse Matrix and Graph Computations}},
398 url = "http://cusp-library.googlecode.com",
399 note = "Version 0.1.0"
403 author = {Jason Papadopoulos},
405 url = {http://sourceforge.net/projects/msieve/},