Merge

author Christophe Guyeux <guyeux@gmail.com>

Fri, 10 Oct 2014 12:44:09 +0000 (14:44 +0200)

committer Christophe Guyeux <guyeux@gmail.com>

Fri, 10 Oct 2014 12:44:09 +0000 (14:44 +0200)
author Christophe Guyeux <guyeux@gmail.com>
Fri, 10 Oct 2014 12:44:09 +0000 (14:44 +0200)
committer Christophe Guyeux <guyeux@gmail.com>
Fri, 10 Oct 2014 12:44:09 +0000 (14:44 +0200)
diff --combined paper.tex

index 517cb8e283f8f514809af58f2bd9b75309d1358e,063cbf9acbeb195e2500a1bbacaa905fa9327143..4e407309a44605787351dec9043baa5b54742bc7
--- 1/paper.tex
--- 2/paper.tex
+++ b/paper.tex
@@@ -760,9 -760,8 +760,9 @@@ Each step of the TSIRM algorithm \
   $\min_{\alpha \in \mathbb{R}^s} ||b-R\alpha ||_2 = \min_{\alpha \in \mathbb{R}^s} ||b-AS\alpha ||_2$
   
   $\begin{array}{ll}
- -& = \min_{x \in Vect\left(x_0, x_1, \hdots, x_{k-1} \right)} ||b-AS\alpha ||_2\\
- -& \leqslant \min_{x \in Vect\left( S_{k-1} \right)} ||b-Ax ||_2\\
+ +& = \min_{x \in Vect\left(S_{k-s}, S_{k-s+1}, \hdots, S_{k-1} \right)} ||b-AS\alpha ||_2\\
+ +& = \min_{x \in Vect\left(x_{k-s}, x_{k-s+1}, \hdots, x_{k-1} \right)} ||b-AS\alpha ||_2\\
+ +& \leqslant \min_{x \in Vect\left( x_{k-1} \right)} ||b-Ax ||_2\\
   & \leqslant ||b-Ax_{k-1}||_2
   \end{array}$
   \end{proof}
@@@ -838,7 -837,7 +838,7 @@@ torso3             & fgmres / sor  & 37
   \hline
   
   \end{tabular}
- \caption{Comparison of (F)GMRES and 2 stage (F)GMRES algorithms in sequential with some matrices, time is expressed in seconds.}
+ \caption{Comparison of (F)GMRES and TSIRM with (F)GMRES in sequential with some matrices, time is expressed in seconds.}
   \label{tab:02}
   \end{center}
   \end{table}
@@@ -897,7 -896,7 +897,7 @@@ Table~\ref{tab:03} shows  the executio
   example ex15  of PETSc on the  Juqueen architecture. Different  numbers of cores
  are  studied ranging  from  2,048  up to 16,383.   Two  preconditioners have  been
   tested: {\it mg} and {\it sor}.   For those experiments,  the number  of components  (or unknowns  of the
- problems)  per processor  is fixed  to 25,000,  also called  weak  scaling. This
+ problems)  per core  is fixed  to 25,000,  also called  weak  scaling. This
   number can seem relatively small. In fact, for some applications that need a lot
  of  memory, the  number of  components per  processor sometimes  needs  to be
   small.
@@@ -944,7 -943,7 +944,7 @@@ the number of iterations. So, the overa
   \begin{tabular}{|r|r|r|r|r|r|r|r|r|} 
   \hline
   
-   nb. cores & threshold   & \multicolumn{2}{c|}{GMRES} & \multicolumn{2}{c|}{TSIRM CGLS} &  \multicolumn{2}{c|}{TSIRM LSQR} & best gain \\ 
+   nb. cores & threshold   & \multicolumn{2}{c|}{FGMRES} & \multicolumn{2}{c|}{TSIRM CGLS} &  \multicolumn{2}{c|}{TSIRM LSQR} & best gain \\ 
   \cline{3-8}
                &                       & Time  & \# Iter.  & Time  & \# Iter. & Time  & \# Iter. & \\\hline \hline
     2,048      & 8e-5                  & 108.88 & 16,560  & 23.06  &  3,630  & 22.79  & 3,630   & 4.77 \\
@@@ -957,7 -956,7 +957,7 @@@
   \hline
   
   \end{tabular}
- \caption{Comparison of FGMRES  and 2 stage FGMRES algorithms for ex54 of Petsc (both with the MG preconditioner) with 25000 components per core on Curie (restart=30, s=12),  time is expressed in seconds.}
+ \caption{Comparison of FGMRES  and TSIRM with FGMRES algorithms for ex54 of PETSc (both with the MG preconditioner) with 25,000 components per core on Curie (restart=30, s=12),  time is expressed in seconds.}
   \label{tab:04}
   \end{center}
   \end{table*}
@@@ -971,9 -970,9 +971,9 @@@ In Table~\ref{tab:04}, some experiment
   \begin{tabular}{|r|r|r|r|r|r|r|r|r|r|r|} 
   \hline
   
-   nb. cores   & \multicolumn{2}{c|}{GMRES} & \multicolumn{2}{c|}{TSIRM CGLS} &  \multicolumn{2}{c|}{TSIRM LSQR} & best gain & \multicolumn{3}{c|}{efficiency} \\ 
+   nb. cores   & \multicolumn{2}{c|}{FGMRES} & \multicolumn{2}{c|}{TSIRM CGLS} &  \multicolumn{2}{c|}{TSIRM LSQR} & best gain & \multicolumn{3}{c|}{efficiency} \\ 
   \cline{2-7} \cline{9-11}
-                     & Time  & \# Iter.  & Time  & \# Iter. & Time  & \# Iter. &   & GMRES & TS CGLS & TS LSQR\\\hline \hline
+                     & Time  & \# Iter.  & Time  & \# Iter. & Time  & \# Iter. &   & FGMRES & TS CGLS & TS LSQR\\\hline \hline
      512              & 3,969.69 & 33,120 & 709.57 & 5,790  & 622.76 & 5,070  & 6.37  &   1    &    1    &     1     \\
      1024             & 1,530.06  & 25,860 & 290.95 & 4,830  & 307.71 & 5,070 & 5.25  &  1.30  &    1.21  &   1.01     \\
      2048             & 919.62    & 31,470 & 237.52 & 8,040  & 194.22 & 6,510 & 4.73  & 1.08   &    .75   &   .80\\
@@@ -983,7 -982,7 +983,7 @@@
   \hline
   
   \end{tabular}
- \caption{Comparison of FGMRES  and 2 stage FGMRES algorithms for ex54 of Petsc (both with the MG preconditioner) with 204,919,225 components on Curie with different number of cores (restart=30, s=12, threshol 5e-5),  time is expressed in seconds.}
+ \caption{Comparison of FGMRES  and TSIRM with FGMRES for ex54 of PETSc (both with the MG preconditioner) with 204,919,225 components on Curie with different numbers of cores (restart=30, s=12, threshold 5e-5),  time is expressed in seconds.}
   \label{tab:05}
   \end{center}
   \end{table*}
@@@ -1011,7 -1010,7 +1011,7 @@@
   
   future plan : \\
   - study other kinds of matrices, problems, inner solvers\\
- - test the influence of all the parameters\\
+ - test the influence of all parameters\\
  - adaptive number of outer iterations to minimize\\
   - other methods to minimize the residuals?\\
   - implement our solver inside PETSc
@@@ -1026,7 -1025,7 +1026,7 @@@
   %%%*********************************************************
   \section*{Acknowledgment}
   This  paper  is   partially  funded  by  the  Labex   ACTION  program  (contract
- ANR-11-LABX-01-01).   We acknowledge PRACE  for awarding  us access  to resource
+ ANR-11-LABX-01-01).   We acknowledge PRACE  for awarding  us access  to resources
   Curie and Juqueen respectively based in France and Germany.
author	Christophe Guyeux <guyeux@gmail.com>
	Fri, 10 Oct 2014 12:44:09 +0000 (14:44 +0200)
committer	Christophe Guyeux <guyeux@gmail.com>
	Fri, 10 Oct 2014 12:44:09 +0000 (14:44 +0200)