AND Private Git Repository - book_gpu.git/blobdiff - BookGPU/Chapters/chapter2/ex2.cu
Logo AND Algorithmique Numérique Distribuée

Private GIT Repository
ch17
[book_gpu.git] / BookGPU / Chapters / chapter2 / ex2.cu
index b27d619dd19b41e679df5fe9477a08bcbea22901..62931cdce0dc439a8bca3de46d8926d21723ce5a 100644 (file)
@@ -6,7 +6,6 @@
 #include "cutil_inline.h"
 #include <cublas_v2.h>
 
-
 const int nbThreadsPerBloc=256;
 
 __global__ 
@@ -28,19 +27,15 @@ void inverse(int size, double *d_x) {
 
 int main( int argc, char** argv) 
 {
-
        if(argc!=2) { 
                printf("usage: ex2 nb_components\n");
                exit(0);
        }
 
        int size=atoi(argv[1]);
-
        cublasStatus_t stat;
        cublasHandle_t handle; 
        stat=cublasCreate(&handle);
-
-
        int i;
        double *h_arrayA=(double*)malloc(size*sizeof(double));
        double *h_arrayB=(double*)malloc(size*sizeof(double));
@@ -48,7 +43,6 @@ int main( int argc, char** argv)
        double *h_arrayCgpu=(double*)malloc(size*sizeof(double));
        double *d_arrayA, *d_arrayB, *d_arrayC;
 
-
        cudaMalloc((void**)&d_arrayA,size*sizeof(double));
        cudaMalloc((void**)&d_arrayB,size*sizeof(double));
        cudaMalloc((void**)&d_arrayC,size*sizeof(double));
@@ -58,10 +52,9 @@ int main( int argc, char** argv)
                h_arrayB[i]=2*(i+1);
        }
 
-
        unsigned int timer_cpu = 0;
        cutilCheckError(cutCreateTimer(&timer_cpu));
-  cutilCheckError(cutStartTimer(timer_cpu));
+       cutilCheckError(cutStartTimer(timer_cpu));
        double dot=0;
        for(i=0;i<size;i++) {
                h_arrayC[i]=h_arrayA[i]+h_arrayB[i];
@@ -71,10 +64,9 @@ int main( int argc, char** argv)
        printf("CPU processing time : %f (ms) \n", cutGetTimerValue(timer_cpu));
        cutDeleteTimer(timer_cpu);
 
-
        unsigned int timer_gpu = 0;
        cutilCheckError(cutCreateTimer(&timer_gpu));
-  cutilCheckError(cutStartTimer(timer_gpu));
+       cutilCheckError(cutStartTimer(timer_gpu));
        stat = cublasSetVector(size,sizeof(double),h_arrayA,1,d_arrayA,1);
        stat = cublasSetVector(size,sizeof(double),h_arrayB,1,d_arrayB,1);
        int nbBlocs=(size+nbThreadsPerBloc-1)/nbThreadsPerBloc;
@@ -85,7 +77,6 @@ int main( int argc, char** argv)
        double dot_gpu=0;
        stat = cublasDdot(handle,size,d_arrayC,1,d_arrayA,1,&dot_gpu);
 
-
        cutilCheckError(cutStopTimer(timer_gpu));
        printf("GPU processing time : %f (ms) \n", cutGetTimerValue(timer_gpu));
        cutDeleteTimer(timer_gpu);
@@ -98,8 +89,6 @@ int main( int argc, char** argv)
        free(h_arrayB);
        free(h_arrayC);
        free(h_arrayCgpu);
-
        cublasDestroy(handle);
        return 0;
-
 }