last

[book_gpu.git] / BookGPU / Chapters / chapter5 / biblio5.bib
diff --git a/BookGPU/Chapters/chapter5/biblio5.bib b/BookGPU/Chapters/chapter5/biblio5.bib

index 04267a14de408d418e82a9839fb7cdcb6fd39aff..f0d230b4781ec4cbc5c47de517f033d8ba215839 100644 (file)
--- a/BookGPU/Chapters/chapter5/biblio5.bib
+++ b/BookGPU/Chapters/chapter5/biblio5.bib
@@ -3,7 +3,7 @@
  
  @INCOLLECTION{ch5:Bajrovic2011,
    author = {Bajrovic, E. and Traff, J.},
-  title = {Using MPI Derived Datatypes in Numerical Libraries},
+  title = {Using {MPI} Derived Datatypes in Numerical Libraries},
    booktitle = {Recent Advances in the Message Passing Interface},
    publisher = {Springer Berlin / Heidelberg},
    year = {2011},
@@ -24,13 +24,11 @@
  
  @ARTICLE{ch5:Bell2011,
    author = {N. Bell and J. Hoberock},
-  title = {Thrust: A Productivity-Oriented Library for CUDA},
-  journal = {in GPU Computing Gems, Jade Edition, Edited by Wen-mei W. Hwu},
+  title = {Thrust: A Productivity-Oriented Library for {CUDA}},
+  journal = {In GPU Computing Gems, {\rm Jade Edition, Edited by Wen-mei W. Hwu. Elsevier Science}},
    year = {2011},
    volume = {2},
    pages = {359-371},
-  owner = {slgl},
-  timestamp = {2012.09.12}
  }
  
  @ARTICLE{ch5:Engsig-Karup2011,
@@ -45,7 +43,7 @@
  }
  
  @BOOK{ch5:Gamma1995,
-  title = {Design Patterns - Elements of Reusable Object-Oriented Software},
+  title = {Design Patterns--Elements of Reusable Object-Oriented Software},
    publisher = {Addison-Wesley Professional Computing Series},
    year = {1995},
    author = {E. Gamma and R. Helm and R. Johnson and J. Vlissides},
@@ -76,10 +74,10 @@
  
  @INCOLLECTION{ch5:Hoefler2011,
    author = {Hoefler, T. and Snir, M.},
-  title = {Writing Parallel Libraries with MPI - Common Practice, Issues, and
+  title = {Writing Parallel Libraries with {MPI}--{C}ommon Practice, Issues, and
         Extensions},
    booktitle = {Recent Advances in the Message Passing Interface},
-  publisher = {Springer Berlin / Heidelberg},
+  publisher = {Springer, Berlin/Heidelberg},
    year = {2011},
    editor = {Cotronis, Y. and Danalis, A. and Nikolopoulos, D.
         and Dongarra, J.},
@@ -96,9 +94,9 @@
  }
  
  @BOOK{ch5:LeVeque2007,
-  title = {Finite difference methods for ordinary and partial differential equations
-       - steady-state and time-dependent problems},
+  title = {Finite Difference Methods for Ordinary and Partial Differential Equations--Steady-State and Time-Dependent Problems},
    publisher = {SIAM},
+  address = {Philadelphia, PA},
    year = {2007},
    author = {R. J. LeVeque},
    pages = {I-XV, 1-341},
@@ -109,13 +107,12 @@
  
  @TECHREPORT{ch5:Skjellum1994,
    author = {A. Skjellum and N. E. Doss and P. V. Bangaloret},
-  title = {Writing Libraries in MPI},
+  title = {Writing Libraries in {MPI}},
    institution = {Department of Computer Science and NSF Engineering Research Center
         for Computational Fiels Simulation. Mississippi State University},
    year = {1994},
    file = {Skjellum1994.pdf:Skjellum1994.pdf:PDF},
-  owner = {slgl},
-  timestamp = {2012.09.10}
+  type = {Technical {R}eport},
  }
  
  @BOOK{ch5:Smith1996,
@@ -135,7 +132,6 @@
    year = {2002},
    author = {D. Vandevoorde and N. M. Josuttis},
    pages = {552},
-  edition = {1st},
    month = {November},
    owner = {slgl},
    timestamp = {2011.07.15},
@@ -177,28 +173,12 @@
  }
  
  @techreport{ch5:Asanovic:EECS-2006-183,
-  Author = {Asanovic, K. and Bodik, R. and Catanzaro, B. C. and Gebis, Joseph, J. and Husbands, P. and Keutzer, K. and Patterson, D. A. and Plishker, W. L. and Shalf, J. and Williams, S. W. and Yelick, K. A.},
-  Title = {The Landscape of Parallel Computing Research: A View from Berkeley},
+  Author = {Asanovic, K. and Bodik, R. and Catanzaro, B. C. and Gebis, J. J. and Husbands, P. and Keutzer, K. and Patterson, D. A. and Plishker, W. L. and Shalf, J. and Williams, S. W. and Yelick, K. A.},
+  Title = {The Landscape of Parallel Computing Research: A View from {B}erkeley},
    Institution = {EECS Department, University of California, Berkeley},
    Year = {2006},
    Month = {Dec},
    Number = {UCB/EECS-2006-183},
-  Abstract = {The recent switch to parallel microprocessors is a milestone in the history of computing. Industry has laid out a roadmap for multicore designs that preserves the programming paradigm of the past via binary compatibility and cache coherence. Conventional wisdom is now to double the number of cores on a chip with each silicon generation.
-A multidisciplinary group of Berkeley researchers met nearly two years to discuss this change. Our view is that this evolutionary approach to parallel hardware and software may work from 2 or 8 processor systems, but is likely to face diminishing returns as 16 and 32 processor systems are realized, just as returns fell with greater instruction-level parallelism.
-We believe that much can be learned by examining the success of parallelism at the extremes of the computing spectrum, namely embedded computing and high performance computing. This led us to frame the parallel landscape with seven questions, and to recommend the following:
-<ul>
-<li>The overarching goal should be to make it easy to write programs that execute efficiently on highly parallel computing systems
-<li>The target should be 1000s of cores per chip, as these chips are built from processing elements that are the most efficient in MIPS (Million Instructions per Second) per watt, MIPS per area of silicon, and MIPS per development dollar.
-<li>Instead of traditional benchmarks, use 13 "Dwarfs" to design and evaluate parallel programming models and architectures. (A dwarf is an algorithmic method that captures a pattern of computation and communication.)
-<li>"Autotuners" should play a larger role than conventional compilers in translating parallel programs.
-<li>To maximize programmer productivity, future programming models must be more human-centric than the conventional focus on hardware or applications.
-<li>To be successful, programming models should be independent of the number of processors.
-<li>To maximize application efficiency, programming models should support a wide range of data types and successful models of parallelism: task-level parallelism, word-level parallelism, and bit-level parallelism.
-<li>Architects should not include features that significantly affect performance or energy if programmers cannot accurately measure their impact via performance counters and energy counters.
-<li>Traditional operating systems will be deconstructed and operating system functionality will be orchestrated using libraries and virtual machines.
-<li>To explore the design space rapidly, use system emulators based on Field Programmable Gate Arrays (FPGAs) that are highly scalable and low cost.
-</ul>
-Since real world applications are naturally parallel and hardware is naturally parallel, what we need is a programming model, system software, and a supporting architecture that are naturally parallel. Researchers have the rare opportunity to re-invent these cornerstones of computing, provided they simplify the efficient programming of highly parallel systems.}
  }
  
  @article{ch5:mooreslaw1965,
@@ -216,20 +196,20 @@ Since real world applications are naturally parallel and hardware is naturally p
    author = "A. Kloeckner, T. Warburton and J. S. Hesthaven",
    institution = "Scientific Computing Group, Brown University",
    number = "2011-13",
-  address = "Providence, RI, USA",
+  address = "Providence, RI",
    year = "2011",
    month = jun,
  }
  
  @book{ch5:Ferziger1996,
-  title={Computational methods for fluid dynamics},
+  title={Computational Methods for Fluid Dynamics},
    author={Ferziger, J.H. and Peri{\'c}, M.},
    isbn={9783540594345},
    lccn={98231766},
-  series={Numerical methods: Research and development},
+  series={Numerical Methods: Research and Development},
    url={http://books.google.dk/books?id=SJkeAQAAIAAJ},
    year={1996},
-  publisher={Springer-Verlag}
+  publisher={Springer-Verlag, Berlin Heidelberg New York}
  }
  
  @book{ch5:chorin1993,
@@ -240,9 +220,11 @@ Since real world applications are naturally parallel and hardware is naturally p
    series={Texts in Applied Mathematics},
    url={http://books.google.dk/books?id=0Iglq1WA5PQC},
    year={1993},
-  publisher={Springer}
+  publisher={Springer, New York, NY},
+  edition={3rd},  
  }
  
+
  @book{ch5:Saad2003,
   author = {Saad, Y.},
   title = {Iterative Methods for Sparse Linear Systems},
@@ -250,7 +232,7 @@ Since real world applications are naturally parallel and hardware is naturally p
   isbn = {0898715342},
   edition = {2nd},
   publisher = {Society for Industrial and Applied Mathematics},
- address = {Philadelphia, PA, USA},
+ address = {Philadelphia, PA},
  }
  
  @book{ch5:Kelley1995,
@@ -261,13 +243,13 @@ Since real world applications are naturally parallel and hardware is naturally p
    series={Frontiers in Applied Mathematics Series},
    url={http://books.google.dk/books?id=3J4XEAooQOoC},
    year={1995},
-  publisher={Society for Industrial and Applied Mathematics (SIAM, 3600 Market Street, Floor 6, Philadelphia, PA 19104)}
+  publisher={Society for Industrial and Applied Mathematics, Philadelphia, PA}
  }
  
  @techreport{ch5:YMTR08,
         author = {Y. Maday},
         title = {The parareal in time algorithm},
-       institution = {Universite Pierr\'{e} et Marie Curie},
+       institution = {Universit{\'e} Pierre et Marie Curie, Paris},
         year = {2008},
         type = {Technical Report},
         number = {R08030}
@@ -276,7 +258,7 @@ Since real world applications are naturally parallel and hardware is naturally p
  @article{ch5:MS07,
         author = {M. Gander and S. Vandewalle},
         title = {Analysis of the parareal time-parallel time-integration method},
-       journal = {SIAM Journal of scientific computing},
+       journal = {SIAM Journal on Scientific Computing},
         year = {2007},
         volume = {29},
         number = {2},
@@ -286,25 +268,31 @@ Since real world applications are naturally parallel and hardware is naturally p
  @article{ch5:LMT01,
         author = {J.-L. Lions and Y. Maday and G. Turinici},
         title = {R\'{e}solution d'EDP par un sch\'{e}ma en temps parar\'{e}el},
-       journal = {C.R. Acad Sci. Paris S\'{e}r. I math},
+       journal = {C.R. Acad. Sci. Paris S\'{e}r. I Math},
         year = {2001},
         volume = {332},
         pages = {661-668}
  }
  
  @article{ch5:LSY02,
-       author = {L. Baffico and S. Bernard and Y. Maday and G. Turinici and G. Z\'{e}rah},
-       title = {Parallel in time molecular dynamics simulations},
-       journal = {Physical Review E.},
-       year = {2002},
-       volume = {66},
-       number = {057701}
+  title = {Parallel-in-time molecular-dynamics simulations},
+  author = {Baffico, L. and Bernard, S. and Maday, Y. and Turinici, G. and Z\'erah, G.},
+  journal = {Phys. Rev. E},
+  volume = {66},
+  issue = {5},
+  pages = {057701},
+  numpages = {4},
+  year = {2002},
+  month = {Nov},
+  doi = {10.1103/PhysRevE.66.057701},
+  url = {http://link.aps.org/doi/10.1103/PhysRevE.66.057701},
+  publisher = {American Physical Society}
  }
  
  @mastersthesis{ch5:ASNP12,
         author = {A. S. Nielsen},
         title = {Feasibility study of the Parareal algorithm},
-       school = {Technical University of Denmark, Department of Informatics and Mathematical Modeling},
+       school = {Technical University of Denmark, Department of Informatics and Mathematical Modeling, Lyngby},
         year = {2012},
         type = {Master Thesis}
  }
@@ -320,19 +308,21 @@ Since real world applications are naturally parallel and hardware is naturally p
  
  @BOOK{ch5:Barrett1994,
    AUTHOR = {R. Barrett and M. Berry and T. F. Chan and J. Demmel and J. Donato and J. Dongarra and V. Eijkhout and R. Pozo and C. Romine and H. Van der Vorst },
-  TITLE = {Templates for the Solution of Linear Systems: Building Blocks for Iterative Methods, 2nd Edition},
+  TITLE = {Templates for the Solution of Linear Systems: Building Blocks for Iterative Methods},
+  edition = {2nd},  
    PUBLISHER = {SIAM},
    YEAR = {1994},
    ADDRESS = {Philadelphia, PA}
  }
  
  @TECHREPORT{ch5:ScientificGrandChallenges2010,
-  author = {D. L. Brown and P. Messina et. al},
+  author = {D. L. Brown and P. Messina and others},
    title = {Scientific Grand Challenges, Crosscutting technologies for computing at the exascale},
    institution = {U.S. Department of Energy},
    year = {2010},
    month = {February},
    address = {Washington, D.C.},
+  type = {Technical {R}eport},  
  }
  
  @article{ch5:Keyes2011,
@@ -366,7 +356,7 @@ masid = {49649121}
  
  @misc{ch5:cudaguide,
     author = {{NVIDIA Corporation}},
-   title = {CUDA C Programming Guide},
+   title = {{CUDA C} {P}rogramming {G}uide},
     publisher = {NVIDIA Corporation},
     year = {2012},
     url = {http://docs.nvidia.com/cuda/cuda-c-programming-guide/index.html}
@@ -374,7 +364,7 @@ masid = {49649121}
  
  @misc{ch5:cudapractice,
     author = {{NVIDIA Corporation}},
-   title = {CUDA C Best Practices Guide},
+   title = {{CUDA C} {B}est {P}ractices {G}uide},
     publisher = {NVIDIA Corporation},
     year = {2012},
     url = {http://docs.nvidia.com/cuda/cuda-c-best-practices-guide/index.html}
@@ -390,7 +380,7 @@ masid = {49649121}
   location = {Portland, Oregon},
   doi = {http://doi.acm.org/10.1145/1654059.1654078},
   publisher = {ACM},
- address = {New York, NY, USA},
+ address = {New York, NY},
   }
  
  @book{ch5:Kirk2010,
@@ -398,9 +388,8 @@ masid = {49649121}
   title = {Programming Massively Parallel Processors: A Hands-on Approach},
   year = {2010},
   isbn = {0123814723, 9780123814722},
- edition = {1st},
   publisher = {Morgan Kaufmann Publishers Inc.},
- address = {San Francisco, CA, USA},
+ address = {San Francisco, CA},
  }
  
  @book{ch5:Trottenberg2001,
@@ -410,5 +399,6 @@ masid = {49649121}
    lccn={00103940},
    url={http://books.google.dk/books?id=9ysyNPZoR24C},
    year={2001},
-  publisher={Academic Press}
+  publisher={Elsevier Academic Press},
+  address={London}
  }