X-Git-Url: https://bilbo.iut-bm.univ-fcomte.fr/and/gitweb/book_gpu.git/blobdiff_plain/8ed172dc793f429438af9d60c35ae52b85986b14..ac699bb490942cea02be7b088a0cfa4e0dcdd105:/BookGPU/Chapters/chapter15/ch15.tex?ds=sidebyside diff --git a/BookGPU/Chapters/chapter15/ch15.tex b/BookGPU/Chapters/chapter15/ch15.tex index 5dae9b2..c0de11e 100644 --- a/BookGPU/Chapters/chapter15/ch15.tex +++ b/BookGPU/Chapters/chapter15/ch15.tex @@ -5,9 +5,9 @@ \chapterauthor{Stan Scott}{School of Electronics, Electrical Engineering \& Computer Science, The Queen's University of Belfast} -\newcommand{\fixme}[1]{{\bf #1}} +%\newcommand{\fixme}[1]{{\bf #1}} -\chapter[Numerical validation and performance optimization on GPUs in atomic physics]{Numerical validation and performance optimization on GPUs of an application in atomic physics} +\chapter[Numerical validation on GPUs in atomic physics]{Numerical validation and performance optimization on GPUs of an application in atomic physics} \label{chapter15} \section{Introduction}\label{ch15:intro} @@ -275,20 +275,36 @@ $\Re^{O}$. the output $R$-matrix becomes the input $R$-matrix for the next evaluation. 
+%% \begin{algorithm} +%% \caption{\label{prop-algo}PROP algorithm} +%% \begin{algorithmic} +%% \FOR{all scattering energies} +%% \FOR{all sectors} +%% \STATE Read amplitude arrays +%% \STATE Read correction data +%% \STATE Construct local $R$-matrices +%% \STATE From $\Re^{I}$ and local $R$-matrices, compute $\Re^{O}$ +%% \STATE $\Re^{O}$ becomes $\Re^{I}$ for the next sector +%% \ENDFOR +%% \STATE Compute physical $R$-Matrix +%% \ENDFOR +%% \end{algorithmic} +%% \end{algorithm} + \begin{algorithm} \caption{\label{prop-algo}PROP algorithm} -\begin{algorithmic} -\FOR{all scattering energies} - \FOR{all sectors} - \STATE Read amplitude arrays - \STATE Read correction data -\STATE Construct local $R$-matrices -\STATE From $\Re^{I}$ and local $R$-matrices, compute $\Re^{O}$ -\STATE $\Re^{O}$ becomes $\Re^{I}$ for the next sector - \ENDFOR - \STATE Compute physical $R$-Matrix -\ENDFOR -\end{algorithmic} +%\begin{algorithmic} +\For{all scattering energies} { + \For{all sectors}{ + Read amplitude arrays\; + Read correction data\; + Construct local $R$-matrices\; + From $\Re^{I}$ and local $R$-matrices, compute $\Re^{O}$\; + $\Re^{O}$ becomes $\Re^{I}$ for the next sector\; + } + Compute physical $R$-Matrix \; +} +%\end{algorithmic} \end{algorithm} @@ -809,7 +825,7 @@ as the matrices increase in size during the propagation \section{Performance results} \subsection{PROP deployment on GPU} -\begin{table*}[ht] +\begin{table}[ht] \begin{center} \begin{tabular}{|c||c|c||} \hline @@ -833,13 +849,13 @@ GPU version & C1060 & C2050 \\ GPU V5 (\S~\ref{gpuv5}) & 24m27s & 12m39s \\ \hline \end{tabular} -\caption{\label{table:time} -Execution time of PROP on CPU and GPU} \end{center} -\end{table*} +\caption{Execution time of PROP on CPU and GPU} +\label{table:time} +\end{table} -\begin{comment} -\begin{table*}[ht] + +\begin{table}[ht] \begin{center} \begin{tabular}{|c||c|c||} \hline @@ -860,11 +876,10 @@ GPU version & C1060 & C2050 \\ GPU V5 (\ref{gpuv5}) & 24m27s & 12m39s \\ \hline 
\end{tabular} -\caption{\label{table:time} -Execution time of the successive GPU versions} \end{center} -\end{table*} -\end{comment} +\caption{Execution time of the successive GPU versions} +\label{table:time-versions} +\end{table} \begin{figure}[h] \centering