From 52ab767b35cd7488bc292d69e0e288566baba399 Mon Sep 17 00:00:00 2001 From: zianekhodja Date: Fri, 25 Dec 2015 21:47:45 +0100 Subject: [PATCH] Figures --- Full.pdf | Bin 0 -> 7264 bytes Full_mpi.pdf | Bin 0 -> 8036 bytes Full_omp.pdf | Bin 0 -> 8045 bytes MPI.pdf | Bin 0 -> 7429 bytes OMP.pdf | Bin 0 -> 7431 bytes Simulations/Full.eps | 871 +++++++++++++++++ Simulations/Full_mpi.eps | 899 ++++++++++++++++++ Simulations/Full_omp.eps | 899 ++++++++++++++++++ Simulations/MPI.eps | 871 +++++++++++++++++ Simulations/OMP.eps | 871 +++++++++++++++++ Simulations/Sparse.eps | 829 ++++++++++++++++ Simulations/Sparse_mpi.eps | 899 ++++++++++++++++++ Simulations/Sparse_omp.eps | 899 ++++++++++++++++++ Simulations/full_mpi/full_mpi_1GPU.o140161 | 515 ++++++++++ Simulations/full_mpi/full_mpi_1GPU.sge | 25 + Simulations/full_mpi/full_mpi_2GPU.o140160 | 562 +++++++++++ Simulations/full_mpi/full_mpi_2GPU.sge | 25 + Simulations/full_mpi/full_mpi_3GPU.o140159 | 604 ++++++++++++ Simulations/full_mpi/full_mpi_3GPU.sge | 25 + Simulations/full_mpi/full_mpi_4GPU.o140132 | 622 ++++++++++++ Simulations/full_mpi/full_mpi_4GPU.sge | 25 + .../full_mpi_bis/full_mpi_1GPU.o140351 | 573 +++++++++++ .../full_mpi_bis/full_mpi_2GPU.o140350 | 620 ++++++++++++ .../full_mpi_bis/full_mpi_3GPU.o140349 | 720 ++++++++++++++ .../full_mpi_bis/full_mpi_4GPU.o140348 | 706 ++++++++++++++ .../full_openmp/full_openmp_1GPU.o140165 | 511 ++++++++++ Simulations/full_openmp/full_openmp_1GPU.sge | 27 + .../full_openmp/full_openmp_2GPU.o140164 | 540 +++++++++++ Simulations/full_openmp/full_openmp_2GPU.sge | 27 + .../full_openmp/full_openmp_3GPU.o140163 | 565 +++++++++++ Simulations/full_openmp/full_openmp_3GPU.sge | 27 + .../full_openmp/full_openmp_4GPU.o140162 | 590 ++++++++++++ Simulations/full_openmp/full_openmp_4GPU.sge | 27 + .../full_openmp_bis/full_openmp_1GPU.o140355 | 569 +++++++++++ .../full_openmp_bis/full_openmp_2GPU.o140354 | 593 ++++++++++++ .../full_openmp_bis/full_openmp_2GPU.o140354~ | 593 ++++++++++++ .../full_openmp_bis/full_openmp_3GPU.o140353 | 676 +++++++++++++ .../full_openmp_bis/full_openmp_4GPU.o140352 | 650 +++++++++++++ .../full_openmp_bis/full_openmp_4GPU.o140352~ | 650 +++++++++++++ Simulations/mpi.txt | 9 + Simulations/mpivsomp.txt | 5 + Simulations/omp.txt | 9 + .../sparse_mpi/sparse_mpi_1GPU.o140032 | 642 +++++++++++++ Simulations/sparse_mpi/sparse_mpi_1GPU.sge | 25 + .../sparse_mpi/sparse_mpi_2GPU.o140031 | 662 +++++++++++++ Simulations/sparse_mpi/sparse_mpi_2GPU.sge | 25 + .../sparse_mpi/sparse_mpi_3GPU.o140030 | 758 +++++++++++++++ Simulations/sparse_mpi/sparse_mpi_3GPU.sge | 25 + .../sparse_mpi/sparse_mpi_4GPU.o140023 | 841 ++++++++++++++++ Simulations/sparse_mpi/sparse_mpi_4GPU.sge | 25 + .../sparse_openmp/sparse_openmp_1GPU.o140100 | 512 ++++++++++ .../sparse_openmp/sparse_openmp_1GPU.sge | 27 + .../sparse_openmp/sparse_openmp_2GPU.o140099 | 534 +++++++++++ .../sparse_openmp/sparse_openmp_2GPU.sge | 27 + .../sparse_openmp/sparse_openmp_3GPU.o140098 | 602 ++++++++++++ .../sparse_openmp/sparse_openmp_3GPU.sge | 27 + .../sparse_openmp/sparse_openmp_4GPU.o140097 | 621 ++++++++++++ .../sparse_openmp/sparse_openmp_4GPU.o140097~ | 621 ++++++++++++ .../sparse_openmp/sparse_openmp_4GPU.sge | 27 + Sparse.pdf | Bin 0 -> 7162 bytes Sparse_mpi.pdf | Bin 0 -> 8041 bytes Sparse_omp.pdf | Bin 0 -> 8031 bytes paper.tex | 12 +- 63 files changed, 24135 insertions(+), 6 deletions(-) create mode 100644 Full.pdf create mode 100644 Full_mpi.pdf create mode 100644 Full_omp.pdf create mode 100644 MPI.pdf create mode 100644 OMP.pdf create mode 100644 Simulations/Full.eps create mode 100644 Simulations/Full_mpi.eps create mode 100644 Simulations/Full_omp.eps create mode 100644 Simulations/MPI.eps create mode 100644 Simulations/OMP.eps create mode 100644 Simulations/Sparse.eps create mode 100644 Simulations/Sparse_mpi.eps create mode 100644 Simulations/Sparse_omp.eps create mode 100644 Simulations/full_mpi/full_mpi_1GPU.o140161 create mode 100755 Simulations/full_mpi/full_mpi_1GPU.sge create mode 100644 Simulations/full_mpi/full_mpi_2GPU.o140160 create mode 100755 Simulations/full_mpi/full_mpi_2GPU.sge create mode 100644 Simulations/full_mpi/full_mpi_3GPU.o140159 create mode 100755 Simulations/full_mpi/full_mpi_3GPU.sge create mode 100644 Simulations/full_mpi/full_mpi_4GPU.o140132 create mode 100755 Simulations/full_mpi/full_mpi_4GPU.sge create mode 100644 Simulations/full_mpi_bis/full_mpi_1GPU.o140351 create mode 100644 Simulations/full_mpi_bis/full_mpi_2GPU.o140350 create mode 100644 Simulations/full_mpi_bis/full_mpi_3GPU.o140349 create mode 100644 Simulations/full_mpi_bis/full_mpi_4GPU.o140348 create mode 100644 Simulations/full_openmp/full_openmp_1GPU.o140165 create mode 100755 Simulations/full_openmp/full_openmp_1GPU.sge create mode 100644 Simulations/full_openmp/full_openmp_2GPU.o140164 create mode 100755 Simulations/full_openmp/full_openmp_2GPU.sge create mode 100644 Simulations/full_openmp/full_openmp_3GPU.o140163 create mode 100755 Simulations/full_openmp/full_openmp_3GPU.sge create mode 100644 Simulations/full_openmp/full_openmp_4GPU.o140162 create mode 100755 Simulations/full_openmp/full_openmp_4GPU.sge create mode 100644 Simulations/full_openmp_bis/full_openmp_1GPU.o140355 create mode 100644 Simulations/full_openmp_bis/full_openmp_2GPU.o140354 create mode 100644 Simulations/full_openmp_bis/full_openmp_2GPU.o140354~ create mode 100644 Simulations/full_openmp_bis/full_openmp_3GPU.o140353 create mode 100644 Simulations/full_openmp_bis/full_openmp_4GPU.o140352 create mode 100644 Simulations/full_openmp_bis/full_openmp_4GPU.o140352~ create mode 100644 Simulations/mpi.txt create mode 100644 Simulations/mpivsomp.txt create mode 100644 Simulations/omp.txt create mode 100644 Simulations/sparse_mpi/sparse_mpi_1GPU.o140032 create mode 100755 Simulations/sparse_mpi/sparse_mpi_1GPU.sge create mode 100644 Simulations/sparse_mpi/sparse_mpi_2GPU.o140031 create mode 100755 Simulations/sparse_mpi/sparse_mpi_2GPU.sge create mode 100644 Simulations/sparse_mpi/sparse_mpi_3GPU.o140030 create mode 100755 Simulations/sparse_mpi/sparse_mpi_3GPU.sge create mode 100644 Simulations/sparse_mpi/sparse_mpi_4GPU.o140023 create mode 100755 Simulations/sparse_mpi/sparse_mpi_4GPU.sge create mode 100644 Simulations/sparse_openmp/sparse_openmp_1GPU.o140100 create mode 100755 Simulations/sparse_openmp/sparse_openmp_1GPU.sge create mode 100644 Simulations/sparse_openmp/sparse_openmp_2GPU.o140099 create mode 100755 Simulations/sparse_openmp/sparse_openmp_2GPU.sge create mode 100644 Simulations/sparse_openmp/sparse_openmp_3GPU.o140098 create mode 100755 Simulations/sparse_openmp/sparse_openmp_3GPU.sge create mode 100644 Simulations/sparse_openmp/sparse_openmp_4GPU.o140097 create mode 100644 Simulations/sparse_openmp/sparse_openmp_4GPU.o140097~ create mode 100755 Simulations/sparse_openmp/sparse_openmp_4GPU.sge create mode 100644 Sparse.pdf create mode 100644 Sparse_mpi.pdf create mode 100644 Sparse_omp.pdf diff --git a/Full.pdf b/Full.pdf new file mode 100644 index 0000000000000000000000000000000000000000..62a34e7a00ee499fd86cd70984087b283d9143d9 GIT binary patch literal 7264 zcmb_B2{@G9_mz;5BvK;1EsSEkvlwQ^*4V|^$C_%)yv#6WGz()XMbavylu}7PQb{B! zib^Vxipr8wk`|$4&DZ~(LG{(|zdg@49_HS&-*e8r_uNCv#mWYS(KkS7)qLD{5`hQM z05>2QVPXP0LYyE06EK7!ZlDc|Er56cXv3xnAS;N@Wk6CxkQ;h~+~ z<6Vo{$2Q;Y{qVRW_o*=YOaHXZV?%TOTlMGYJzIC3aH{R*6MCyt+)GooZO0?`rv691 zH~P(Q-&f?$>1COYs$DN|Zher>%nwbzRBNnqV{p%%<0Tb;6Z5UBCkQfjxq4Y;LvA*b0xEH_9J0pum|vb%e%v>*q7_CWNR8rJwISktat* z>Aer|S)ubDTg)uX<3A~%tAfwUPq5C+=t_{FO&TAzr*6!99pgZAt?8mt2+Qiu^15to zNvB>SY+9~*TVAw#;39kcW644&dt0#2AtOZHJj>*!J(i~4jq{5pm+89Tys^@x;P@+! zldD{lu`uqWwns@}9{usH3B8G=XMWf@!b9AZdhcD}Ra!`tB`!Kg$WxawDZM2Bb&t?_ z)Yq}x`6SINIl^cE;7V=Jc?vmz?(U~8K>=D1T@Xds=#u(dYffgVq-9He?3`vy*lD;lIm_TVbA6&O&YsmovMjmn60|YM-GG^m{7%*4+$Vd#)vO)gF<4mO@mdXjfC5XKP``{d^lx zi``gF?})iPzPTI#bLrv;E^0n2%myy>unT>B6qeVxQR)|KByDjtdU1F;oTHh$h+#OqAx;y>){qdmk zi*f6`mLI@n`XH-(%M3Ra%Dde6d93BuzYn-QWAhc&fqCjt59S!>g2S;p2Na+46Kl71 zGnc+t5|g~@wyIY`-^=*5M_z9}`c!d-vktLI_)TuXJ8h*q(i-7>`{2({dl!Ip>%G*& zk!NgQe$%E7WxNdK8`BXQRQE5 zG^*TcTA<97{`ObLs!dDpbUWt1yBD={;NdaMm(EDg+-#-PnugiTgVTFx)oWdcU*DgW zu~#km2sAC5G3`cdCDJ zMi4wwBxp&`iLc#oU8!a(sX&IW@j7g6$(R~RzenS3L{e?Y1GS`^#SLp@S6!;{fA{Q* zPG&_$sthT-$%iD``^n+m{jIK~+HK2gvU2?2&1~y(Bk?z+)nhw!rhmBlNbbUDj-abj zCli`+&ZWhTgfGa+e&9>m{f(7lnV8L39g!1MmUvmve?ovTauzjM5EXqdm~7C9oK|)1 z>dUQ0AiC-Ev_-=u32QWm=e$MCa$6ZBKdWK1c}Cpmf#TfiUh3+X%9(G5D>i>^_cc#Z zSNzzbST9sEws_B*)3Nt)xz1V6OtjG}!@9k9x^9o#U(~zbev6$+mCn+m<~;DF8sojF z2%#4>IoK~hcn*`=gX}|C%h*t9-&)Z|Og+1y)2sRl4<1lp z`lFPY3AzgEVKg3X02pD>{sxMgGDnmOgo-O>kP$1T;1`XiCJS^%O`z zW55^yGXeOi+vuMHel7z6I=fH+jG5V_k&;zSs&X?zi22-pijgdH3QIr`{)rV&Cy^F3 zJ|uPwxW>xf+QUKD4q}Hx0v4SnahDaur}J200xl0AibY7=A;G}zWbya{OD2s6;IN=0 zZE}pkqCqbfL%`(wA+SbbMgQH81dG7q4T0Z(Cpg5=fAAuH&I}F3>oteRu zwqV5=!~|r5M-2PP{bMANDAA6FGi}n6DXXzRc*IgCu@VlPcn))jDW|N2=i;Q}z_kjC z69l_}L+0>VKj!Yj0D(Be#Yq9ja4OTpPW>fae)G9x>O>2L{&R3F;7tPW5fm0)vmv}@ z1B}18VhZBJS%tx%4G|!jPZw_)7z1ZJEzAyL1u-Y5;>e0|FgF6UhjWxgCv$?>5P(L2 z?gA*(6W%rk2#~_!^WpVKA}U@l0`#7gg2xeIp>X)&ou>m@gSMbO=m1hcC(s#m0jXdB zNCz1p1WI&*fnXrKT|pKY3UWX$$mKv_7{p_786XejgZwZW9RdZQfXRd4?+7j^1VvyJ z#N)1%_yDd4Asm1a$MDx27tbfXH&HSES}?-P_|@l@Qxzr_hlK<1qn4yn)MiTT}!)84t|f@^gEiX*XVgb^?+{E$Vf)a(;~+b&tjjli{5@~eXrzLyj#$Fezv@v zoWhEI(z?5aM=l-IecYt=X3YUC#r-n%jQ&_1VC}jq6}1z3V?TOsWo>EbJ-?LeZu@-; z^9h!@duAcz6pk!$ay{L+>R$Sq+$S!ZJ!B5p*X4A%`goWeSS{_k(*s?ShR90Ia|u@a zDpQg=&$T@biBCv%!@j5P%1zrw-nDf9kc)rgp*%YVFS-tOGqm`~!*lC3wA+`OAtR|p z-j7y{B&>7nJ$a-%(NRzN!CENFCpMfIogx2{*O3PFulB!<@MzHOQQJ|bIJUilF{sJt zgruBaZz4SSdo1`t{P_oOPj?Qd(@rr^wFRU1ph4zRhjir{AD<#$^DSKpJ2FrWkdmcx za995ani*j_(tA_ol69pOTfFV$Vw0p)qUpmmUi3bXk7XnhK__$?1E>fr(lybjic=dr zOuOn6Tr8XA8-&7&?#|UqRMM=&8V6N{s{{lx6f;ZcBnH5}qgErTl!}WvM~&JC45jXE z<5yjK8~6McV%)a%L8eLg#dp~sqRW)Rqk9S}jHR6nQwxQh98rGpa2n z(EM0i#iBrjMtS)6dUy9v3C)yUdD-@{s1Xll|20vE$I$bxRD20fvBtGRE&NEwWuKN{ z+2w0@8${ndnxuE@%dqc?G%8jUyc!r>ml{(ZnjNz#Xs31I#^eE<<2GQfVvh8pPUl0V zm5L5FVQF)bgqcN~HP~w3Y}(Q3*T_4FIlb2Wt2wb-{RtV2 zft4CSo8A_plE}&8k&%FCDIB8&E$pV}(2yF$0>#*|*Oo<3Y9a*B4f&l#vk ze_WE(gWR=xzB}Zcf|(IfcyHiVpUT&=R^BZe!uYd3<9FuD;891r5(KtF9ARiyo5c zq^r8taZ1!hR()CqpOdF8dAN1zfDIt68 zptyzc1H9OeXn}7zV}82aLCj*^GoP;4-qAm6@|60>cyXuUiKTM_RLd(r55Gt+xaU=A zuNre9rS!$xZMiS)byXAYuQ#1}>}BMpJNd)snNCX8?CrVVWYfbpyG9lj`U|m1cLF`p z2VW92LfzvO9o0T2dVQELf4E29C|`M|zKCL8K4V=vWnYx9QFW8@!=Z{(r(W!u<6WJ{ zT$QKP;8aKw917a_@DTC|$%N(T;-`d8emirtv}$qj>bHHVW}pu~YM&J{WMAc8M^~@W zomMjfZ5FC_=p1EMEjyHxOpVnQXng-Xr}W~!>Lxpic58uk$}Hshq>LrypQHPx?elwK zzAO*1?&N6wu1?Pj^hG1RF}ax=oyg%WPZMt4J8{=ZcRb)|_jJ2Y+xw=!Bc9?1FG)_d z{#qEnV0-)Z;rixRvaXqb&)mTUXj-Z@W*O4woluHJttg?yZ0{XL zBjx6c`z}GMrbRbzx?=KP>T2d63b~QK@3Ru_4ok2Uk{KFf54S(L9k^int1#u$Ei1odUm)aM=xbHr zH5XftM4maB+i}`_Tim=f^JiPqYi$y$%GFbXi1(|=*S-gQdXy$Cb2xZ5q@wkCdrNNR z;(5)u4|M}O5>CI%l6O0=p!lLZc=3Y{e#)D&g^!MZDGo9ZS{Idmcg2+r@v27_IuVM7 zRhE{V+TdT07%$&=J%&50c7x`9{QlQL#&=5p#*Hoc9G65zrb_Gkem;fTGVI{wbRyPe zP%&BVaH#XKJO+)fpuvwjLHe)eU8Hux>15OK(Ps-5 zzi^b=XI&v89jhQLlKptl?{LL}K_ks?jbWEc`gc_xZs7$K=L<%-y7yi*Z7w{yonIX^ z^E>&}GLDHAb79;<%^L5eUDYQPTQ2XZ97>Yj*hL-%^7;19sxV^q=oG$qVJz8g=UJ^0UD5rZ`SjR~Q4L(U0oN#9Ray zb|H`e2!MiE98+ZP)$2%r#V|#B;VEcJm?gwy*+uan_b4Y1dQ=FV$UvH#Axz9^@PiRT ziD+S{KuIHz55UE$=`u?gysE%jl2RyKN5`ZOPNLV6?gau5%-zeeW z!>pEYBN%QB{~uU?q5OrF%kzL!!Yqg*3}bTzfPuat5JnTwnQSN=Vgu+2trFHrN)u2V zr(ZnuZ~KfEMxp%AUJDHsr?r@lWW}WmL*d7pz19CGY5wgvGw44I4ioa&k{!aJgAf}M z+s21Oje#v@&`E(@UMLODZ(3Lw{K}*W;Is$fyhNIrz(@g0z=q5u`;W{PObpm8@qQw) zX`CQaqzJ`;0%=0F0BL3;WV7|5F#bd|*etV&frJnIDGMIa#R|2?#!N;7kI49B5_;;9vUudxCzR z;_%&Iii{AS(SO_$zdXgKjvJl-blR+hdj{gzz-|?9UmfwzhyTF?VDSJ}vgvVH0E@=p zVLJGHkdRoB!~hHyi^pONus9=KGzN)ABVh^;aqj3$WyO?eE>CAFKEH2lm;`PL1VePe z4-#<*VK7-JV8V=&^jP_$$0p)IfpEtMV}KB!!4n_A5Rb> z8e-u7)IVVuBQ)%!-(YzBAG~OIv47Ix{-DDUuyB9uH+e+tA9~?_2i))ajgBDhpZyLa z{sF@p;{Jfa4OzHnImIjB(cs<;5B?7x0J^iH;AX1<0J?GELsi@fbpt?qP9PVMG;ZKF zlNI1+LL_6Yh&Fh#wGkQa72+|LWE=r&g|{Z-$nf=QX=V1mQ}~M;u6zNFCy)flkbuJ= Lw6v_9Z4mzjN9Zck literal 0 HcmV?d00001 diff --git a/Full_mpi.pdf b/Full_mpi.pdf new file mode 100644 index 0000000000000000000000000000000000000000..462b271262637f130179e1d179577e809c559265 GIT binary patch literal 8036 zcmb_h2|SeD_is<56d|pqq!Ep07BiSE*#>3bca8C2GGoTfSY}izr9vcB%2LXbwa8Mo z$kIz%$d;red!bZ>{GS){Dh*T0A)CS3PS5Qq2#$q!;5)I}b7jNqr z8jo97re5A%nz!TJ6-)9^kT$9b9jLN44d%=Q%6nrFLK4&YRvd{36WIq;37CtLV0S9r5c#Bd}Hk@|OwS zy<9u*J6n^BP12RQ9KtD=RF^YHL@XXYD0!;1M}ARkgGt+oijQcSIh57Dg7??&yS++w zv&8Tr(`5p_j;1>$hRqb@7gg*^qaM7?YAssCH}O>baP;a^@h!WLR~U85UA^XiJ1OXU>UO)ITVB{tStlSLSv7r?M|Um5F?*TTs#RU`|Da zk>k>(>!>H{R*3uFHOGkhI;1XJu@_HXFKP`f?cG&J)vTgt;RBBLGD#;#hm{(Nk8h7a-a&YcGP?uH+Xm$G>$kU>A$jL$8E z-9qnsRChyXAJuB(6|vxgK}~zGVu_rcL$#QdcW63c&%x82+;Fj+cjjjJBC}d0GvCg> z&PaQ?*OE(xi`%}fPkz_ws#Hk)P_C#rnE8PEt=$|c&3S@L;kJCgp0e@4Aq|5R zo$sqs0vPx9pIo^i5tY4mQ0A}0k*%iA;fXFKExp~C1R%_FMW4#mFRO#SOUh>jHa{I( zj1IhsdNn@ycvtJKGv{M+X3GM<^hwesCBxNUCyYcCuB|;iWgW3LNBw+ze(7`J@P_8e zC{bsXvZ=neW7A(R`6V7va_TDQ1O`4OJT;FW=>9x?@N%znV#29+S2w6IzUYh8q^3#zO9>s_%kO7eRy%I{!l6Ao_gRB*{bF)|aX6~JFZ3_cMcvX6 zul`PB8Blus8T+K|{fJjfhw47`WZp+M$|vtRX?G*sU;Nu8RW>Jja=$;`CwC`BRZ_%O z_j2--(BZxAr8AohTG!iu!c=WxSLKZwQ=YvyJ>%qat3SstLQ+HbG8njGLXX&RINIae ztrg?!oTX#WN;Z{QoxOkMbnzWUliBxbD!nW3yK0vRj3){)6V;C<47X-_2&)5yAs=2H zd7IPJkKAN_$Nx%~gylP_C-|Hn;YTgM4j9sfoqKC=-R_OqQ{VOR7wr1_^ZP$a7u8Q# zovkkS*hB1I=V+QRfiG0D{>x<_x&CCO_uZsYMl@~AON4x;#${r^eQsLB_T^7jg$Be( zXer=psGf0xA~R7My#*6*&Ry2&bv`PmxTCQlgsV5htXNgI> z8M!lP|K{lBXA@+vXpG;xw$Y-VEBy5WGRTdSzj`n^XM;g|f@p(!q=uAj;kD_vn{7&$ zPCa{7;Zctyb(Cc0OUT}t7Cl!jbMV^i%`nc8x>9lP)`)@R`J8Xjw2d8(8*z4$Me zN8dAC9w!ZFUaCRKb8l6}w7|B}^0nLX5&8Jw?CjOg+tLk39%dbVMfM3$@3ko)1U+)H zB(`}vwY-!#zb81eycIKIWqdl&%2@Y@$GPt3R@b9xpKUzd9}U(VtEusL?X*N8@qS0w z@<+B=bcw9*snqz^d~q%5f)gGNrAXM3RUR|%j+Y_b>Vt>;k109D_%yi0;&O)SN}jb& zH^jtDrCPKcwzTcr^jSLmg!tDwy8-L7Z2`13b`_n|Fw-aAoHVeL^Z|r)K+x%VD-a6g0^%COPp{fIR zvQJ_L2|bhD50W-1+a%jKWW0=z13v0nnD@&)oxPE6?O#@8los4>VHM(ZD|@rL^Q*En zU#pnm`&PJ>@j#q(dKT^0XUXQ11<|Z4W?K1UO&;`m-T+ z9e=j2IUBkJz|lM$NQ6j-#L;N}19T?d0aP%D3FWriN z2l%xN7+`E-2uG`_%^S&I)x0V*MHo-c>=z7wnG3T@Fr~lG@*d|WHAyUx=NN!!YG$}! zQ%(=0`hsiAX0SW{ft z9xQtpMv#|D#mxfsxS|5u zk$0JPXTcR`NY_sG-0o8w8s0DUOyDP#>VcPa>l12AWUG%IND zK@f%%77OwZKSy{zgaJ15FgUC-gbF1Tw3lT79Y7Z_0W1L$Kn7d^5a6o<+@MVlxC0b` z3eW&AfDX{TK!5?cfbI$~s6MRUJOVHQ7QmwT11tuK3<7L`?ZE`0Z$CQV1NZ|RfD1C| zyZP>biUtr1NAvRJ_dUdWo_FM2S@C;S0WIqH&}uD|As8GQucr31;IOn5v{-MwDM12* zwX43s*4B$nONkySf|qShKzu?C|Yybp)&$+lU=e3%CbGa>^ov%xJ+z+u~`1G z9TuWpA!jV{8cQXrbS@QGbj%?7YVrbtQm2&MpQy4%Ud@(w9iIIbXuVH)^^IjqD$eNT z?{dznH?VAXPbkSaCaE5l2-mjp?DRy67+#Ckbq>>%I^}UwYjQ$3p!y*D#KRlcN0026 zStojNi|uXsVi^QhRSV%48sXUc@$K8mF0sU8#}-WvCaIS_didgA?10^*=%))gEt&OC z%shRLe_HNZNQ{b=HEtCJ-FxaRDU?Bl0Gkv0Z#c=Vefq-H%{{07QZbToX^I;#Wq^1% ztP^XS@tOJFTb7pXusgyswU1(UG2 zN5786D~Bezq*cEVl?}Jsf6sKxVu{#(X)}EbiR5dQyCr2WgrxME2;S0(#!6pvkh!=? z|6EF(3|jiS+BK#9Mlv@&a*u3iHYgQy6)<>MBNQt6HG`3EB1dH~eA>Dhj?pr*B95Z@ z&$o@6+C6=AnbAvjllpv&(@>MQ_H>iUxh-2J-L%xodn1cFC0?xwD2|h!`A~8^N`e;b zl?MK3Z~T#&kGI@iJv-R_K1}*P7-G>Vc~T_rf>ygzu=Y?`NvbKMW=Vti_PCy>4FB|z zom+w*auLV(8hn^q)2s0!Q?X5}0C72>T_mjb&GQ2%O5Cb8X)NjXOgS2RqggPPl(R9U zp}XwI#=~c`PPXnn;6EWa&Y0HDqwNs={Mya#(<`e__|VoU#n6r&YQ#*qQ;fe`41fS`iA436c+fs^p@>K2D$qk&<&1jWh>*6f@W^dPG`t1i+ zq30udx8Cc_k;;B&dZs!&(8@?K%`oU&o@+|wQ1$ysy$=_n$G!Xaf4RPXvavx|O+B|X zI9`9`;fAq^&PXZB$2bR=Ofq}>FTX{e1F3?IpLGSxCF1m4}yi3 z7s_oLdrkDtS}qj%5E$)JVA}hA*w-PP(dpk4z1j;sBW!qC(6l!h)MMqTH@wUb`;fBs zm8w0cN!9&uU)y$D5ayGj4(*{7UhIQSF~>CAZF$H+=~D?==<-7RCFgtFV;uC_0%gC2 z44Jaidd3%v8y^=C%IYZCuB%%>!C2D`nCGml6`iwg9X_hp5-{3UR;RV+mNI5^Id`$c zF_=*0!Ez76xoRcx(Ct<|`VW^l1aELD?H5}ke}457C0m7kQ8Jl0d-Z366L(JPOe3x$ zw$%oN9HyAG)wO=7JDJ-Q z;!XP5mo1g>!gr^UUE&tWin1A+XM1*WNh`O61by#8t%@V;eG`O{kHs_jFi@-)Hed*g$ZR6ga-nV zG*rEe+Ee#-g{OLZKY_PnwT#uu?+!Th<~^wYxN|CcVA&THm62-g%P^_pm&fqyUfdrQ z8;F!yoRw)~?L7L$-Fc+!@x{B|D_3~E8X#s)8dVKDdbECY)S}UkjWn1X5-;gL-M3WJ zq>?5S((l<{`JC0&oT&c#*vC8+DO)&DrrP?o+n1)2jHS_$bG6f3bKCtt|q8Te(6J}P+Fk1+r)!T*QRbE#BMjtd1VrmoqKp-b#8d)(QhXv*DZPI zR4KaKx$gY*ql0Uj1YhbgjYWpP;p-E=jLk}L3TC`7u3pWVG%wzLCAQqLwApuRug^`< z@)$FcB5c)V|dWb;x#ig+5lB3BNj;Oq7-c6MM#Gvx7WYO zRYjG*mkjF1rytn6r9xz^p_hAQL%{bM?Wb#O+P)@z>qQD)zx};4wo4`0A*v_^xWCpn z>iD$qNZs1LZOztkcRaO}>a{nuQQX#v6D@Df7MaO%R27jv-p`a&dJ&T6gQio}-rT&f z_(d#N>dlr=+ldQ9MbRSLVxlpDN6ltt3TnRBVqW#YIh_I6CtbjheY?x}s8)HNO_aV#>q^`a&9u9_n5Hts;$6Er*PpN+ zwG^sWh>V`3xFw~#obR1EQtdc!C8ath^2{2hfAbp+2RUWV{i!f9b&VxE6-u}ueYvZl z=z|KU?OS>dDB0`h;JjDes5o)L(0_V`6$OyW9nB{$mfQy`YOQP!Zc1(~zjbGNv_9sJ zy7S~);oNJR?^#>ATe@G`8mg@(!=%|6gmVwnWiO`!rQaHVqzAo!@3X-eC-wEOhPLxX z5trneK&SfKSG&?5(b_srwLTk3w|c$!YM6^t%LXIambF6_RY&w&hlSTDBtIT=yz=J# zo$kh=r(n;Db4Ys@`$O!RuVIUmqIUyGR5oyfViaS5Y2yxdq?~^D!26@ra0ue`GEzi* zqZ8M-vn&KK?tj{B?Vyu+Ydgou#nkF0(e`8Nm92t)d0%I-#{v*JJGafAd^Wo5gz}bG zf)(XHM%~sr*rJExa#t!Iyf+f+dv<=QpLY0t=Id*xPjNwI+NS5969z&fr2_Wrh9{*3 zE*%a$j|~kD0*BbXwEgVAagy*%B~1?HJFMz396|u@v#>o?5jKV6;}H-f)76b&1{K(IfY6gF!h_9b5CFi>&rjYDD^F*- z188MsWdMZ%Fc>7nfn;&K*d%|X7fTA#$2Wvx^Ha==CC|4>o=m3!6dM37j{+7HEz~O% zx)+?MnB+qDVXGp1d?>C2WhG^-0*FyYf>^u)5{-64AyLo=iN~UpNoX?O4TD21sAK$Q z=HK)|6OckI`MM=FvEvQ`MHdu~9b@b(jdO7e17Mff9K zK{t{Qm5op%`cSFPGzLW;WU%HULZzt94fwLaFFa^O<|PT8IR|MDdM{wBQ7Kdk=?{7S zJWu|o6f}07ZxBHS{}W{)d3YK0-+}!N;6J1gp9CE{P&NTS4>dIy{9pR~dqBTVa_Ie_ zityu|)Bku={MJ!eIC5nE(}}YiYJ~7&1G$yAg=KiVANny9j={k({EZLw#xN)}4&sB( z2tJE8fk!}NFgOfa0i%GGL!l8U6awO~;N_3Z@0qaxPiM+3#OTir4zWP}jYA-r{gZ_k zMu@E8!}fp#`6;sdXFJlL3A#b;F*FXwJB#N&a6Ar&#lhX+^E9ac2etipAGp^7O%aQS z+OL17VbHjL(oj$%_zyl5wBSE!Xk}h&@ee$VBGeQ6gN9Xt+JJx1lyFeP@(&so^G`l3 z?jJNPS_x`b{voS~{|61Hs01}F7x>sr64ZKPLce0e0doo$>Q&?5fEgV+aQSU&IH2$4 zMu+qJQczD#8*ZfZbNZ_jgQ9_D=SdAIW}=bZQbWXyH+6j4gbFqwwYxGWeJ zj)XJZ55d&b027ez$?<~YAc!TPN2PH<797x{kvO0ZNM?9|8X7P*hXs;+V1a4r_J+}E z_>Gk_MYD8Yew#ml&Ty2(D*HV-XNflu^$&dB$?Tq+vFNyNnfGE7Go=5qS=-*kE6=Zt z1)L0cGcg5RYHiJ7gdJ*V+K}@)uFCAs>33f@ZHm2=k-^$BDUr9s^Zx5l6_?eW=Tbj+ zzWOx!-F|m(m0IQHxj|Qrj7xFjW7*e^96S7S0d@LKpo#HAzhRobBHd$0T*arMCkb<3 z##-CsE8637B%2~liBTzzOt{-7 zD;%;*ap=#L5vJzd_uV?%mN3^=#9X1B;7;GTanO+#QJujo-V&Mqm9Qzo-M8MzGhggG zjcBH*RC<{sZsdFdXPjgHtWd%|ozEJDEW*UT7Y~0#k)=Iwn~_LZ6uq`$jq^Hq7hj^F zfWNZ~AHP2q5E1Z~8x~*E;m&o}6+9iP4|pdF98aeu-*?LyOEfiCXto=QVU%(nJ?WrQ z$1S6&_RmeWhq}CQKXqKhs`>ui$B&cAE6}N#H`YY+nx9FJ zluAqz)}40Q?*cZZ@Zg4XmzW1^bh8BeUnv3Kl*^ z#U?n<1mXK^qGp=**UEpM*2xRR%e53(%#AmnAz+Xrm6ltc=U$6PB^cqUiLYLCoH*~? z=BR(zt)e(7t9%Qwj1x~Es&o!`^h&oQeaGYUMg??MDvD!_A4+=l!Y{`z-L_|XWls== z-q9>kel?Y2JpQ4a%}>uA`xZVX5^viRlj&G)ST^;luwwRg+u++*GrhCHdBOc(GOukh z_R37PG9DMt9eeOzUP{X8@cuh4xtIAq={o6GsvbH0(IGWDTg_FrlfNZMY-C8_U0~Sv zEd;4|D^Z%35_AVYz4(y?9fPL$u(3 z*b`D(pI6I{nAM5C{GNw3TQMg+SAFyRv-*b+w5W{okafLb&rK9AMX%jbK-W>?{X$(I zva!HL7dK^M-e%;be#iadnt^jUpTzEYO%CQAoV8CmMS{hT)wXKbOqQpdtSH8rFT5wH^{;l`waZ22OHqlIqsTcwY_dz`{DO_4dN+$--IKr&kr6fJ?z^4F)+9|uc1}EBE7Td=Gi&R ziP4eap2|J+)G+T>_fyAE6#g5n*OPOMh^d#n<52KoUG2$JeAA!XR+S}J6=l?ITu0_} z>HhddLf+kduJW_QYLRW^B-^r}u&G3w^0_K5!135qop#5~RxRs7Bn`MMP(~jmw`~iQAuPBf9?s@Azt#HCXVQqv=a#AfbP3}+|CRu2^c=?%LNv%)Lqvbm0 zWHqt=ia&5u4D^9@3hR=n*4F!ryi3RV_o%N5q zI|a^m?JAqQ(QzZiM)#dXT3Nkk{p2DYFhTS&QI6u|8S=^yj zdb>l5^y2oTTd2n+)@{CtDD(EIs52?0hw^3<`(bpSJ38Iol58J=bmuL*iow)Zl_kM1 ziR=({imOY|+6*6iy)K**G(9Cj?8oc9W94DDpD0d=oqZx%SD;9g3pqnBJd;_nm$>`0 z>h6<&VjR#HUaj9)lG6M5=DckY+GAli@!53&`y$M4v|DC!c)uonuqP`4*6zFd2<>8r z9_q}Qk-KOm&bBJmlB791;Jp1OYf3u%(Y9S84qX`Ut3@KkpPz5N=QJ4#Rt&c{=1-aC zzcOv>^P-s6(cekG=(*Cq-4yLTv%%xp=v=nkoj8T$iQ07yCDEWnJ!4BN<@wvDh${tq zEgYxc3&9CReKqKo#9W_`hl@$VXYRTgigjjLv zY_t5|4n(($KY3O2z-Iy}llw=uQ3VN%P^B{(solbPO29t7%uU z&P{wdGZL0jrJ3<G`9+3f`B>669h~_ z4=PEU5eRogLep5JG8~UaI>Vqz7D(s7G2HVW23Ue@h98RzvZ0%RIg3F)2yz?&=&k?< ztiV7HgsvON(Lcz6ZUb->mk&gu$AHLDDBc5fIRJ>zGsKY%=Uyr-VGw9ZEv|^gO9sRZ z(hJU0j132jsUB>&BaExICCnKPaq#1^{DqXued&I(NJ%7dNHm7$GK(ecO+gOH1Db)O z7J2=YjsGiypUZ#&X6B}Fl!nHVlDt(diL%7QxOA33+3=RRJgWjz`RgqAacNSU#0I&B z0rV^^O^vko8h|u^kV7Stc;?ap*<==#$zibIs$3R4bMR&$b5dDs4$+Imf@9Et32AAJ zLZbj%st3o5?Fd8Txq^Ov(P*xDxL>Racil)h4+Dn9;^2S(gK!||^8cSakg%U)9FDtc z{NJQN^RUI4MNB*z&6D+$jyHn%EJ;8vj((MgUZUats$ek7+VNy#xX%y`SNBC4h@Q&> z$&FH7I&}A>(mmlQo~wa_e(oG@Xmg_ha^7-?@n(Mslpk~e*CESHAWPD<=xpkbXB{eq z0zzp3#l0g8qYC)?F`#QN)zgdP{F67=Q@^t2y7#9edEPrf@&W&|$F-r%gAz{>jZ%T* zacDSR8Rg8qReQ4G$}m8SP3Gnx1ccIu#54f8q8A^z61a0*N*G`WMLm_QMfaqEkUM~b z9MH!G$~}mMDV5EJ?8A!@t_@*;-4YutMit@;1r(IavVbn2510ei00|%i9smgNL;(~i z=>boG3eW%_fDSMK1|0;LkO>$b0F&m&{>35y3t$6mY9PR7lE@&y0XSYP5c&;Z0DeFq z5CjB+EQTD<98mQDV&Eulocx+Y+~*}jF4h;nmKV^XeswKzxgJ4dQ8*2aAC-r-^?IvK zwp%kK&=`lh^Bf(W_*~~TT0yfbJXY#fdta927u$@|<~wwX|IJnRg3^11Ueo(StxWku zjVeTMh3~T3+#7Yu8mF~dqE61x+T_-JThDuZQo@jJX8YvGeZnRunP)Jwe|!MqB#0*A?R2tZ+!38z-XX za^^&+k?h9JNs{(AlqzHq7X3(>*(V9vfRt~X?FuLrrcSGw_4~l0|Q*wnOGx=+9 z$X63Y&8Y50`|F=r?|tQc3Z3NQtaApaR;u623@j2%Dh`~B-4uH>tJ-pV$y1rsF94Np_Rnd->c@-=FOs2-~DnsVNJG)`u6E{bY*tr|_WW`jQPN+s)5NO3qP;8dd%0ZudyM6bz|IlUew1 z_h`I?&k1@i_^rF`TmCJawOrlz;kWN&WXi!PtF|4-L`u#RyIoG`jKti{v0&D(Y8Km> z*4N4myf(gD@SY z>o1auwnR0*z4vX);nM}jI`OPi0l=+1cjD>0*e)tHFG z_C>QRwZ;^Ng4|9n+!y+~JCYEK&nP1J&G&s93F(r`zTH=%?znO9&}seaok|uo z>s`sXao;BTY+V2LJ3U3xh3_m*)y0O{99W-g8aY$qkzGAf_kPac!})|M-$A44%uRD` z&H5UeH!Dx18;;jpex7unueQ2tEF>~Jq5Mw-c(g(KUR%a~tWxsuwHITTo+v4vBRIs3 zJi5^?kkkD3%Ms-LTPsRRYAL3DszR>o!_!u6jhnm>>)fxOLAR4}K4R~!6{?^!50iFV z%YUi%K&P?mlaU94`=(y+?~4{2bhn+AOCk$bwhBN~hN52Lo~E1U{|}ds+MN-R6=ktATNYp!(ka`bXvBGkb-P31c(p zhwq;dT2r=HYVwtyZ^0U&b2Y$3uQJOq;KTkG!q?(pRVkv8)++>bt6rifgaLKNBb|yL* zbcM;!M2%Q*a{H!MikThd7bH}jl!~@xn6S>+*y3Fa@(v#{cos6zb+3`Akf(~C zSQEU`DI6wL?N;SQI8&!07QNG^&#-2d(+P3+%0W>!H&{2exan-d=Z* zEhWS*#J#?D`uVeJc-gy?ioIf1SMl=KwNLl$2`2p}85Q}Z54kRlu?w(-IUIVOxQG8)w3+>DR_A;}%Xz_hoVOT)I@KV`(PKMZ zjp*Ax9=%3o<6Z^36`R2Gf|^;`?c!s_Z{oJxJ!*TdIka2}69-YHH(kIu~Hl70<(Q z8=sa>hz^~TU0INCXX`pK?ddvx?@`hpzQ3)dzZ}xbpF2=H>g?4y=1lZqgpW6y9}>Ge zcyeI1wt2OWP}HFJVD%GrZ^tFgSK(tNNK&D2m~5TxE6Q~H-Rr9pv{!w)8x-W`R?TwV zXPNKw8)DzBEy2EtYwnE;p$Nu=AckfBMm;psaoWQA%3lA;2MR(N&V{+g3F*dE`!La4 zS<#7t1vFe_b!lN^XFt_OH1yb0*%Fh0{E3I9H7~Art8(&EeNi!bdpO_wT)piL2j-0R z9Y|9u8Y#Q$kFURTuYcocO!`|QB^cQLu|%w$eNnn^BN@GUzsu3zZ#nX}^NWO~W=5A% zRA)_xv$q#`b12uXfWe^w{i*eHdX`v6xpz`xktZ8+BncOHnijn@k1V`-cu3%8Y|oLI zh`EicYFw%}%egk5oqy;i*uMU`0n1EebOzUyF+KTRBB*r1H%UMsXzpNzT*}2N=gJQM zulxM2Y_3`$2alLIB!o7axw+K4`rGDy6h|0h6|Y6{zfD>VOSpUF>iJN$ryYB4gTrVw z%(~%AMCVIqdk>%)D{y@)v&}bJ=2|x*=Y_``Hw;L1*rpYG6IGgYwsuh|8^!djuYA94DIcVcSM>9JtfJPB*l{*; zK1bvAmGdi~UJRCgEg5Y;dw%40f{0XN0y^x7<-$T~{g(#x%RYEePY9-^7ueI{>Hp|f zVPUFbC0}*$^}#c<^zV(qtUE7dl+Etdj@nzMr5C4LWAIh8pLYdU3yB=c&~~p_(fIuM zVeFu48Y~Z%7Ijc`{|SHi!HS)i@vEA)?X0bQv&ZZRv8u!_-q5`BH*BbO?jL(t7P5L3 zd*p<i6eum8m}vnK(wJWLU6*+7lprgx$~pqgNO*z!1=W{R6zRX#4Wv*JNCnFcUE_wXusN7 zl~+7J(Ue%M={omD_~!51?$}y;T6-pMkJizUW%)Rm#0DET7OtTIl{0PMu0_6o?b`W&+|D?tuWL>2;$w*Nm<_ge*gEOv=j{w~aksE}u4g}%ld^q%K*{ItnD7up(Qc{l z#~x4cMW{-?T>qfT@4#DIUCiwovArn|?!P}EH1PQB>HwYCa@MQgPaY2jReiQT`IIpf zeNH;WNIy0!H*EFDAi;@yh5u`5%PZo3y>Ty>cR%llcBUrF7eo{m2^9iM9Mm)eq1&l9 z$bq|qo>aOzV!WaX0jGMXBW$szNK+;e^r9LBv%rJF2dv1!-egq|gr){eO_K!G)SzM@ ziK$58b-vkf==!a`i)d-0w~LDqNC@;{`ao4CJkW_0BpN`Y6(I~ob`YII3RI-Cr6GAdMW}W^$mnb(o=!?+h7Uls z15ipxU|G;|y+UQs;atHacZMHF9pUFk^&pT`l`&*xw5lSA!6_@EP!yyh68b1oP$;wt zl0^2vkjTs8n7^p`7kSVGBoG7H0U8mY4uXdt8Dyy=^vzA+`d$n+XR+{wt12O}2w-XX z|CUyeZ~n6tAcroQK@Gwom_nr_B}fNqVrb~GsBlFcP>~F`LSqSVGyzG#q6q{nTn+de zCggmGlnA}~fZl}sA4q?}{DqXkvVuZF!;|jEq%k;fWhES(N#c;bXrMnxgCiHE@<^93 z)c~%aezDNMZ8H+n)bxM0nvV}Rthsmu9R}IY2P#Jmb^bp=^KbjvgZx8brXP#O%McGT z0MbCNZfwZaC`e-uGJ(Qi`H-OaCNY^%*-YXyATJ7#}j@E<~m2ZFX8D4KvDo03^IQzjPFqw;b93wByJ@jS#MHAhU8)SeBdp&|6J78Vg7B z5+BPQps)}gv`6qzbO>Ak3XR61QOXz;YA+InKq3(kh7~t{WPgo}W%dk~?6Qykp5PD) z)ZaJ+k~u$6xNd~NT7Dcah>#Z|azEOUfh>>$wZ~9c7Kk(3K6{r#US6Vbi1?rRi4W`0v zDE4iP%iyp`Q0s{Wz0QUM2dTkOuNn&nEE&*- z%WG4^0Yf^40q6Clpq`oz+)+&rsf*On#Uk;_NNp5WR~fIPf>&0>siKL>+E}czvc~_8 a;mqw2{@En_&7y0qLQU(`4o-)o1K{$*;8cfWSwR{W*9SL7E9DEWhqLuD3MfhOD>X< zR=H6sm8=z&y%Ne&Dg3?}wA}9RzdX;Kc|3E@yPx-c&pGdTX;G|f4A6!+gjRK5%1Hzs zKmnZ1!3Yx*&>mt32^atYhB$*ZOqKxR0iX?wDuApY8ix*%$q2rH2T?;2k(mXa_t`#1 z^I9KyFj@?GdT$FtcK}H%tq+vvpGayf-l>EQry&_;H)Ga&j4CDWy=5K~&)0mLW};MR zM!dOWX!z7k&@o{}oBOBN6B2FX{6uel;e2~8$A6h~f5k}i3p*fke!q6vux-LL!}FLXA~Za8#pq;uz0<7GE0@h|1v%fW+&WgXin!&1gu+LNplA{wWAw8Aw*=u&Mr7pr<3ZOPI zQWt5nVyjg2`_hgTFF_nTQ7kRD<`ZL@t7f0DXs)jM>j11uc<`##QuvPKy|vAliH6-a zp!c7Km*sg&b{{{wZ-2E5`XFBsR~`E$Gbg2d!Ch8-jk|uI%B|*kaSo50W8-`)Hm;;J zOYJrAY=&G@*HY8HtoOual{Cann~@hN)R@AzgqdhrLe*am#>Oo>W<)T5h@+jtZsVP? zM0i)&e>G@aV0$L$+)l@i;>9)Qb2EY}VknGLC@IXboD0fwS1kwx%c*s#a*zwB*R@oi zK5NQ~tTg5LX@%8+aWe|3B83TJg>M5E)w^N|qz+`B+I1FX*=m!^mo|(%5IT-}CV$S{ zRbRN43^_FBEk+;MkCDcdL_Q_23RHAHvoxk6a^-J zE#qRflVr}mT8b_0&l0e{Ma701=j1^>?AGk&_U2T;*SqvLC4OJ|nsVNT*RLMA)cus4 zdNn`NY@QVH&V-3M=Ngi@v9xaFD36Makzk z)w^H{lkenb+{+h%bDGZkb-Wcma5W#ga+=UQIJmS>`Z{4GBi`e_-}>f1lWbqV@ZEZ+ z8>C16?Z0sBu*A~N0w>8Qqu}KA@^2r%biCjD_1gzQ7rCwMYySP`$3A`P3_qT4L{hDR z-rah)ZGty8^tQIu@2bbmZ&jTV+lEX#_9wDm($cO?-fNv4uWlW0h}o6Q*K7V;&F+aH zG)t;cm!EDVtllSgar5TvD0_{*lX8UWD(B+MSNi29{8x@w%KCPkZ)&$u|1$9^sULm4 zOmEjnlGMS7v@pM$vWMOi8yY5(y~^zrc@NbIg0mrrmXY+1FsZ(*N`*N2t_YtG$5rp2 z&$j7Y9NZbR_$loHmRC>2^NP1;rydv|tj~#Pe!Do04s!FcKD1B~jC3I{x{*qPF=4pt5^ww<06Rb!eY1P`mPke32|q z-TD?~5AdoN9q*ob0AH2!fDy;Wp1nS2mZ~K8#)^9~)s5TS$vLNoK30U?$UNj&`*JBQ?^6G8pw(r0D34~~RwiuPq(0wPVK9zUBcnSf7@7US ztE(i)<@MSD2)SZu-n*6AOv)F1IYxp+!TZid7JW%EXUw}w^j|Go+1IsbP&qvH5$?~J z!_pTmnMpChK3%kI2eRCF)W@6+&Ye3QyHgX`P$vu~R!Ef+W&#<|<*pz56&6kDBu zngXQ&4@5xWV542GQt&~1k)zpF4*Ah?M@>*E>xxh+_{G{}_lYMT_l3OxrdtPh} zXxhpBpc2+*@7upBlWep?G^Jy9CF2-B)*FaQ`_dzJz!D|gc zPmh|ERTDce%&8G~sd~^wbv`^ zp+?k^OYoX1*KAN9Z{dEc82qFAo>9W2M6aLfS%^)aKE>gY=;Rlj_o81kj$n+KhT(qP z3a(LH2&7PhAkYD#GpQDwNWdEfqwy#lV1z;WB48vBVhaGQ=-xnp&Jdp?C^Yz6sILsKxJ`)W<*R| z?*Iv?bQlAmrvN{68~rNa$1)J0BgFwglgZOYidQwQ%Gn4Z;&c8XM!d`!tTDp)SFC6{ zjkKWhA(3N1PfL4SH*>vp5Gx!KFlkh=yR0BSjmP8)I6QzT5+Qbn7z4YL$>R$w8B`vC z#enwI=`k9E0zH^?0fX<2z!-@X{cm3}7Jq%5i_!v);!LiI-1<|({KMmX(jV|pqItOzG!MSym2jxuTH>>w5d zI|g(SK%wsNPQf8S2PU5nuSOhE(P|N(=d>6+mIzCQ!w>H~ZO|ID1vh{W;6{)Fx`9-1 zGe`sJAOwn4f`MQlyjeje$O1z_Hpl@vYzX9nT!_cy&_N!^2l-qo4FUzAfWd>{-v|yU z1S7#M5RaoH_5oZcLRbJTipkGeE}Bn!Z>o~~xsZex^0Ut^XDUw&j({VRzt@;8zF9|rPrU3v`^l<{8?%6r<+8hUgTH zF-Dni!+NfC>|VU>N<@-w(h!fgp^L3!r}x6t#AMQ}LtRNp)8FIESdt0mswSAXwtu}} zO^I8a_1nJKx_~GtuL9>TsD|%)$oh&F4{~=8KP>b<=X@v&^iRvH(bLt{Prqtic7Hr3 zCZ;E~I(C=INcjcDs0$ZPSS?37*3{~_=p;?z?3@l>J5i*4uFT45)0uAp9pw)`pWoFt zvSG;CH8|=-dP?ETm_PQcKYiHwzP5+%(M=n#IO(|RDsPN(X1Yo#+eJA!9W*N45cmp+uV1n@U4*86sB@LIvC z(D=}T_j0MO7kveL1DQso^tSc$pO9AX)Cu?tZ9~YoUXk%yiSurIIj)PbHM=YVB~Tho zHny|BzOK@4jzNZ#@uP2_HVsrp_h36tfBv*kGibQD$tPFQMK=3Pt!$9|ycST!#$W25&7t|;%%U6QhId%dxfs!K5}=S4%R~&ZGLt;0m%=- z0=q!@lh*vwc6JEDV|Zg)1>5J=UW-+&hwJ?6Dob8{l$BaAFIDc=ocnY|7tQR0*~*U; z;xH8D>TyAcM)=>H)%wG!c5`|__4u=>k*Xr|?tsy5VUewjw_x+BdvXn)!IZ26QWY|& zsvIxUef{Rx7{SHP)ZFevY7MDI^tpM#oDu-T5Uz4`{z z%dVLBl)N%1wZHnI>hKtk{5-0wW`3nd(29wZKIJ2K^K8i>P|wro4+oD!r~~!mwY{xD z&+w|b7_YYMueIBZ&ePae z*|hUSS!~r)lWuCyohL}J;Lu-h^&bz}s3_fxT^6~6Ys~b^8rHck`J(9kVukMU&xv)X zhqwRf=J_`bsgi!%zHc`3=Dbpct;m9Gy>h$lM7L)N-J^+@BM&M)wJZ9&7aNJ7u4*#($e^O1M!5)it7N7x1otZSCYQPa&{ z9Tkt;QMNM`Y5S#G`%!D^%GHnCt3JPUm^g$A-On*=nb*kV7O75q=ksK{Cp)fKhe2Lf>e5c8)L(TkIwg32IVhvlWDWNQ%E7&A z@JiP)+9lf6hlkdDyu4Z|zb;BzucbE%{BSwiccj%QH!bPxSG5i0zWY8VglufQ(5$Sq z)W7Wdxw3=$E?ouBFV<-hzPdIwG@h|dfZ{EyM+wUU3rwCKS@llJaq}zf0UsIt z@Rdb5VXAv}DfBL&MypM-7w+DF_uZjqbS*@oxw3FpnXLR$tJ~x!CTdAxiYk_AcMrtN z#z<6mke;}xWopdMxqMQ39ZELo2={3j6U&8MEn4IA{<2tqp*hm@h^sN=H5fCn zYej|RQugHMBlOa3nEVy<)&(!f$U9IrWU%^Kd!qeHkC4@K)EtTzTY<>!%XjrIA6%i7 zZ5f>ORs*ddkhsMAHkg-gl>IPz@rySb6~nS@DRV2SDM1y{0cLfxFUFs6F4r_gW;k|v z7%5$Hi}`Xdy&;R`FyCX%wxL?>M{oPJRr=Z^+y>GXnlDt)-f}C~F(#RzEBO2EMw#7b zz6poll+%KOKMgii=gvQ}H~RAXzuH?KC*!G@o7&ceT3e-Z-yNOXUU5@UpvT??k;}LX)9W+vg6?*?xB<8^LCrf-73Xjlf?QXjL(2(ZxykZ7 zK`hT@)uRU%IXY10-guj!SWwomIAmAwM?eNp9iG$F)cAOFoON%ZRxCerMQj{ep7^rx z@cQH6gBl+-%reKXEvlWsWQ%O3E2efn)HaWFf3u1LZ+3c<{%)@;fgjorg?@^D_IwN~ zt91YPf~!YF0qB+p^Y)R{RPUyFi~bmmTRUkXdk-ul^8Fqk=+0|E7%t9f(B8G0uclgw zR5|Z|bfN!SBDL&!La~$y^{;)nDg(gatIoLho3VYl4o^(fH-8;YlPQi*PLAsLdt+v) zd)jZySp73%6hA{kVaYD8YyBVl2f;1_dJZWQC1Hsb?{56osXdGcS;=XCEiyb zo>2EMeOve~?`xKSdExMfEfazF+`5)@9aXMA8RbtVnduc9M?cT-U3h*+8$Zf_C}(U; zZj#;C-tyYpE-B5-M>&1fkl&8hS&cTFYI5y5JkyS1CUH#W&bmM!ivU8!oX0$wH;t_) zKkUN~d^Kc?+u{m?4l zdNwEc4rW?wG}H3x*ACn$y8QZ;sxaue+Fu{fk2>3UZptNv95~;(s$t*f;Kohab6zA+ zmZIyZvno-$c*gY-IbcHIsnX(k%ZoI3Ut8R}w4IBVzr(fdq-;vT2^aXQdN_u>uWGB` z#^#t^dbtf@JwCsA%Nm}jPX6^FDSk5jTr$r*rhe3Wo(}di#U2_*Bz!OSOw1zTIx_?k z0Gpv8CfgJ_aP=k)T85v<>MulInkU=Ds zYY-^zSMmY4d^TNa>1=PaQbZ6*iVWq3!f!etGL*&UlOj!#VipoS7J)$|ASMxnm?AwL zD1d;&VTCXS0LGALh&DiD^?^VhT;xY^cp(7Vkbs0m^5}siXZSfgB@mvOA{hb!mjr?l z5fO$FSVImk2t*T!L=c4mF&G1w!hj#e7EmJ%*!)$nKCvN8&+lw(zMolbaD2mfh z9{R6+M&&v<{GYuR8Y)U_5go~jLlcI=&q+J0|DUA!uj5RoeK(jZKw&dt$t)&|N&N@E z7%$@g&IOO@)14UD*59Sf6%m5rg0p2TmmL`*}u20RPeFzZ3N15Qnb@ zQ)Gnbi2m)8_^B~4bJ}SC+hL;v_b^1Uf!!+Fz1pIU5C0nqz~BLlc+bO4C=3dXhw0$s zK}=#r5&_T{3?75VVKHbu6dH*_Az=zvQR-+dI!T)9iKo{l~xc7?#KxYnoq>9_V0BFY!65RE&0=!KK z1PgOxtQFeQ$^wnEvL@oK2^dQwEYaG+0*glBu;l+cg|Ddp%NJ020&#!{L?Qv9rDg4C GgZLkT!*s6z literal 0 HcmV?d00001 diff --git a/OMP.pdf b/OMP.pdf new file mode 100644 index 0000000000000000000000000000000000000000..654b7e8a30869981286b01f8da4e6513423b584d GIT binary patch literal 7431 zcmb_>3pmql_dX)%C zQ93G0QHdgw97}~Hiq!ABp~Ktz`ya0B-7eRj=RSO%`?>G?Io;GKW)>)n4i2GK^EUYe z0uP`8wtp~!L;`Ig7M&ji=)n{x(1O9_LtFr~U{d*z8AM|TKx8t4$LB)SP=qkEFx`&r zjb9KqHs&UjO;|!MCfg=k-ukYd^V7<@)766~aOWK1NFoygOrBYgoSO=z7_hv5ushxq12T za?4`hT}#ReS5e3gB8@8>={OA3$jxh7p&A~x&x8X8Ax`_<@3(1>9KPY5sqliDJqUg! zR#qBR68_qMxqe3pKVw#o{f1?TvWWvObsE7Yu5zWsQA*tA{Y{CchVG5>eD#Mmu) zr$QR<%kIsfG~GO*Q*k=Ou`xDZNl7r^*pw(@4^e7@gKy?o;P9oVoJ%toBq`E25lYW~ zaszP|Ehd7B(ESOh5wF)WE$w?9d#z7J?~2IE@${BCml1YKI^mKO1%L9CtSd^pA3g%od(Hc}1;@QuF!n%@av=XEHbixYF7q z*_92ecNKQnOrV}D2+i$tlFoixwhTHEtL%}EMARWnr>CTNF8>d6yHmkb$E8KO3zy(? z@^_gZ+xfRGWok+`o0m<`nD+SQ0x>(D*zAc_5Tvs;wfiY{b_RztJbLas_yi}OGZvJ0 zRFpk;dQdiC?VGTt&l=Z>7}gGH*tU01s+prKn{<sSmw@Sm*A&%VQJO%{ABa#um@J z4fHFceeOyZyduLfp>=taCId;GlMrx6d-Q{B*R3e04wrQ+zZJ5d>k}0H_AQH?BY#&L zW2q~(vd|$}`O=Fy&yJpm!w2_kGF$@p5HmFUgSJIB#yWo3t^D-VmOKQ_FfCU;GD2wI z7~|NwJ3~AFtdC8(sc3{I5kK4DB`l{V)BqO(-cpKABqsc~8 z)jeMN#b?cA%{*^sH!t)2<6nm)h8HCvsFQ$k&isef5tD$6^674ur=#??+@sniXCtcQ zz56qqwoLX2&&OWjm7Bhd8(u#ud~mGiY_>KpaV>9qdkU@Ka7AN6ppMeDdzp#xr3x$8 zoqeX(jBL(VA2!I|*w=Su+=`L7>QzKDsd|MKd3akJz7egwWu-9IMR<$ak{&IQw2LsH z9DF!#oAj#HX*Tj(q~b5QdfwbmCOQO{z|kY}RpgD*%BweQ zTt6Y1+3TO(f__`d?^yVXnLa98GJcy}N^PdU-mv!2h335KCh~Z}s7LpM()lY7_^WKa zr!@vNH@vAC)vS!ax%1eejX8?zq%2TUm*q{s+cvW+d$c!Ly|LHIr8pDmYe*#x5sM?p zPW9<`#yC&RP}|onj&|S|&~eVMBh-hYggxANow00J>9It;C-m!2mZXVq@ zMWMH#1)W(2&!nG=Hjd(;>*8J(fII*?2S# z(8r>^5ipYrvG{~uiUk{1$6&-A_?Q7r;XaJW14PG@69OhpnbQc@V7maZVLSlb$Ozy8o(PfI zP6%%RMi7V~e^M2pPoH#Cnx<4fmC2^hKulY22l1%^FbBX)5q^xV|0}?cX&^uciXDI< zlc$Xo&uV%oCw+uS&*=w@c$za@1BAh^Tv2zLX+q^eBFBL4rnZ)@#_Oyg<`#(0pi#x{ zGJ|+DE`!5oa{+<~LhKGP2X-fe%j25{QMrIF7PO^Kw=q~W=*9@(2k|@+Sbfnz|Jzs0 zMd0yzz(4<{G(^;2bP+##dU~Sy>VLKo|l!nuM4(1@x2l)RYoE0U-OqkSJ2{i8i& zGggEHe?`9{+-X^{y=XvJM1i$L(ld6#eNo!6;9CrXMTechGG_4@-}}x2f4(TkMQH&? zaVFP9Zv81?{^50T*Pa>*{d;&!;AH}@5)>9=0O;#s0eu|CTXdPC^Wc~uKw}2+$hNQ3lPJMQ1{=V?bv<6uJpsDL4dZ$Kdhc*@z=5nk@o! zpN7Hf5@1v~{P4=t0L?*5a3g33+Jh9(6{LdxAPo!vAy7Od7zhT!ixp&mOfVE=fozb? zfe3gVJ^0UuPXYQU@oF0x${(j4Jb(M2j?53Qx0IQq3TkW;gLc0^Alm*>tO8cc! z;%C>I8gm>eYXQol4OubCWo3o6yEi>~dPz%jH>Gv$sWat>Iafnm|B|vfKHD~N->PS2 z!DH75`dI_=D;`{+_ufAe)z|**>o@%uW0P}gpTsSak=*jAC4cyBL#1u5pnH#(WKf)Z zhGutIbVPE66Yk*N_2WVW8|;1;`i9=TO+AikX@FJKyJ{{g6|)a-xdxG-mGFVf-Pps@ zv|iU{NFseR>RP^JiK?&L=kWv*_OdFNw_(7>r?%8}mwEr&myaSG!J2OFQkddHKD`ty{PDrPRd4l0IHKwru+u#a zH?1R^?JFELU9=SKBb*p6l8V+5j*f@)%VM1A)(mFph+wO(C#U)tiw+q`Vum!m_Kg(pMfLJQx?rMR5;=I;w+=o8c0ZRS5B zs_)eFJBzW<%eZnQPw3SQXW$ z+x6F{v4yJik&>rgxr>}-vj47^q07%}@h0vjNlT$3Up2_Rlnj136t%rHOf?C2e{Q(& z!KXzxf$DEkqx;_}^kjL--F`gO2(51SvEB*HelIAr4wOG(&MWI=g&^EU><`>vd0pRU zviAAm2A_ti(vD#n$p!OLR)a!u~Rlw$`aZ%Cu7b3BOmw3}nL^3QjtKzY z$mXr=SREa(%lONV?k?3oqWo@mMJpyRo@d0Vob=*#y2cZZLcmpP_ksZ z_t*RdqngG6eX48HMutj!cKfGDxJ`P6NjSXpcsrC&HtYc>jsou!e2PQArJ9g+L%t^F~1tCOmp?mS)|Q~j9KOYOV;2niOZp6%Cu z_`yPH$+ei3!f1{G!{^wD=9SrP#qX9W^iF=--SF4Qj#IAgw`fSEw41hXB^cM{l__jP z7G|%zWW9sn`YgV8boaN}*&Pc^Qt6b9#U8T;=XQp#Rea&m%@0l(XL)&|L!6^ql~nka}{m3sd}iQ=P2z0?Q&h}`r(V}OU^VzNUdvm z6#>4#80G!(xqj|}gwqqs8!ve$4abMrKRMT|xMYQI`IY?gL)y+gg{|is)bu7?o;E%C z+cF-CGp!lbTNzkLdYr!YjijmiYU;!bg7Bc1wDy)Y#W`V1_r@x`T0o6b{>ECkXaAiy zsm}t`5Jkp{f;r_f@+-`4k{^+j6T%iLnI5=vFivLcteP(3BWLBz)e@PUxS-6ehqYY! zy^l?Tj+I9NOiAJ%zuL=n!2_uoDK7GDd1^}+)e96yDt0u=tdWU-C!xam#2jTT3K-{w?TdW1!lP|a^|VQ=wcx<$hPDlTTh#Q;Qvw1%QD-YuJ4R~n z@W5I(jcu*Dn-JcjHaYLCiOsoYp<%j<0pu~Xbud=t#_ScWZ=ccw%C=+AsLZnpUXYP@ zu>1o`{aNR3+cj<>>T{LtN|u>{$Q`R$whF6N9w)xBBg+_x$}uF!K5mjUGHU)Krr@KYd@+#dl{r zTOKCjsn}~8=0$4TBy-;!k?p*3jbH4G6f$EhyG(ZPWE-6NtLVeh-9Z&n-VXlw_fEp;*P~h^6{Ydvu`57WLJ^$m1TPx&tYDKJ7b%k9X*{;br7+{(MIJ*`RrENh`a(c$rdk z-C|DaiOG3;jASF{%MMuUNmn{~o*ey_Gq}WqjlBEG?9Jy#!DYnW_%j!yt`d%|MBOg( zna{o$aN9jTNd1Fq?qfq6kE{G#7lB>NabOi`)onV{ePzw)!Nm@C6xpl&@rw$}o0f&d z1`h+$z|xVqPoF+{=)cSSRgqc@FH^a2sbG0S#bU!i_sWrlfd2owxYU z(Onz9naJD)%LzQ6hX;G}nh-k6a+)+^)p^QGtB^_szDE}N_7kY(t??z2Br**;sBQM3YwI6( z!LA|KTj3ej6r)*3rEgmWdYSm?-I)83EB*S(^Aqor@PiX5hmWIH*S>sl{^ND1we%B} zI=16TZ_>f9z2j!{AMdMJIjDb6^}zss`}6nD`5gD=c<-T1^VQ9?yv7ZKSBo#c>{u$G zw<@0l_CDJw7y)Hzk?Sgt|itQ;^t@MKxZyj8`j zdn%W`TG7eD$lvBzc2hPd;{*$Qm%2HGysK_++|FVfU3jq_VLmy(IdVN$bWi^EAt`<` z{d{Gfc})Gd@44IA&Rq5|ID+2y%O1%{2;Vb9AU@y^(HSg5_>v#a z=7sFD`DL}Yqhz#QMIYbZ)4-eM~*VSQj=^%zcAb@Brh{d8{2^24a z#it5UEZ$mpJh34R_wQ;fo{rci9U40nWVnME9W*#I(9AQB!Da!XfvNs%0pAcQ5HJFW z{#acc0Z*l(AYDBi3WEtmqtNgNg(Fb)2?kgi9z*k=8IJRlnZJw&GvEPrVL!kvBK%$t z5YQm5A<~j!3s?rRdHktoCP2_Z^#3cX;Mn}T7vO+SyMYAD5bfZHTVRA4TrwbA za2Wu~3_{TW7c8C#V2K!_E`dlS03`4ql5p^0Ra3ZP4Og)LA5?#m{7IF~b%9fYOlJu= zOg10D>F5C*DxVg_gtkCT06jITSan*G1d8JHlZXCmpHVq>cK>Iug@%gKS|mp_W77no z@N?4I?Efce{_8jg(7qeY5pbE}6%s%LAtofUjR%Js16v$GBL=d$p;S1(sT>ac?4|PI zv1l?|^=6;_%U6hzu8P(Z3xMKNSXMb{ma<+iW!98ipt~ zuv_ zQR-++C&dgho2xMso_{WDSOl(61Vc3bcM(wpVY0D+9|S9kvqSTH$xq0I0^zb1T$d5; zz*8SU50BTy1A)La4Wn-Wmor5lfHgzY`xhEU9}Ab)ewD-E^?%bv!*l&z4*xsN01ubT z{((op!}ZW#Y4B~A!zo*rB-{S^-m0vziZ8lOvr3q@S`AB_O$%!q_* zzc>JNV#8Z13pfxLy4T!5qaMjBU@Fbb)VQ~g923i+up=V-&H!(BC>X}*K%`J4z iEzIzy> matrix makepattern +/Pat1 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke + 0 4 M 4 8 L 8 4 L 4 0 L 0 4 L stroke} +>> matrix makepattern +/Pat2 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 0 8 L + 8 8 L 8 0 L 0 0 L fill} +>> matrix makepattern +/Pat3 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 8 M 8 -4 L + 0 12 M 12 0 L stroke} +>> matrix makepattern +/Pat4 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 0 M 8 12 L + 0 -4 M 12 8 L stroke} +>> matrix makepattern +/Pat5 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 8 M 4 -4 L + 0 12 M 8 -4 L 4 12 M 10 0 L stroke} +>> matrix makepattern +/Pat6 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 0 M 4 12 L + 0 -4 M 8 12 L 4 -4 M 10 8 L stroke} +>> matrix makepattern +/Pat7 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 8 -2 M -4 4 L + 12 0 M -4 8 L 12 4 M 0 10 L stroke} +>> matrix makepattern +/Pat8 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 -2 M 12 4 L + -4 0 M 12 8 L -4 4 M 8 10 L stroke} +>> matrix makepattern +/Pat9 exch def +/Pattern1 {PatternBgnd KeepColor Pat1 setpattern} bind def +/Pattern2 {PatternBgnd KeepColor Pat2 setpattern} bind def +/Pattern3 {PatternBgnd KeepColor Pat3 setpattern} bind def +/Pattern4 {PatternBgnd KeepColor Landscape {Pat5} {Pat4} ifelse setpattern} bind def +/Pattern5 {PatternBgnd KeepColor Landscape {Pat4} {Pat5} ifelse setpattern} bind def +/Pattern6 {PatternBgnd KeepColor Landscape {Pat9} {Pat6} ifelse setpattern} bind def +/Pattern7 {PatternBgnd KeepColor Landscape {Pat8} {Pat7} ifelse setpattern} bind def +} def +% +% +%End of PostScript Level 2 code +% +/PatternBgnd { + TransparentPatterns {} {gsave 1 setgray fill grestore} ifelse +} def +% +% Substitute for Level 2 pattern fill codes with +% grayscale if Level 2 support is not selected. +% +/Level1PatternFill { +/Pattern1 {0.250 Density} bind def +/Pattern2 {0.500 Density} bind def +/Pattern3 {0.750 Density} bind def +/Pattern4 {0.125 Density} bind def +/Pattern5 {0.375 Density} bind def +/Pattern6 {0.625 Density} bind def +/Pattern7 {0.875 Density} bind def +} def +% +% Now test for support of Level 2 code +% +Level1 {Level1PatternFill} {Level2PatternFill} ifelse +% +/Symbol-Oblique /Symbol findfont [1 0 .167 1 0 0] makefont +dup length dict begin {1 index /FID eq {pop pop} {def} ifelse} forall +currentdict end definefont pop +/MFshow { + { dup 5 get 3 ge + { 5 get 3 eq {gsave} {grestore} ifelse } + {dup dup 0 get findfont exch 1 get scalefont setfont + [ currentpoint ] exch dup 2 get 0 exch R dup 5 get 2 ne {dup dup 6 + get exch 4 get {Gshow} {stringwidth pop 0 R} ifelse }if dup 5 get 0 eq + {dup 3 get {2 get neg 0 exch R pop} {pop aload pop M} ifelse} {dup 5 + get 1 eq {dup 2 get exch dup 3 get exch 6 get stringwidth pop -2 div + dup 0 R} {dup 6 get stringwidth pop -2 div 0 R 6 get + show 2 index {aload pop M neg 3 -1 roll neg R pop pop} {pop pop pop + pop aload pop M} ifelse }ifelse }ifelse } + ifelse } + forall} def +/Gswidth {dup type /stringtype eq {stringwidth} {pop (n) stringwidth} ifelse} def +/MFwidth {0 exch { dup 5 get 3 ge { 5 get 3 eq { 0 } { pop } ifelse } + {dup 3 get{dup dup 0 get findfont exch 1 get scalefont setfont + 6 get Gswidth pop add} {pop} ifelse} ifelse} forall} def +/MLshow { currentpoint stroke M + 0 exch R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MRshow { currentpoint stroke M + exch dup MFwidth neg 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MCshow { currentpoint stroke M + exch dup MFwidth -2 div 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/XYsave { [( ) 1 2 true false 3 ()] } bind def +/XYrestore { [( ) 1 2 true false 4 ()] } bind def +Level1 SuppressPDFMark or +{} { +/SDict 10 dict def +systemdict /pdfmark known not { + userdict /pdfmark systemdict /cleartomark get put +} if +SDict begin [ + /Title (Full.eps) + /Subject (gnuplot plot) + /Creator (gnuplot 4.6 patchlevel 0) + /Author (lilia) +% /Producer (gnuplot) +% /Keywords () + /CreationDate (Fri Dec 25 21:29:32 2015) + /DOCINFO pdfmark +end +} ifelse +end +%%EndProlog +%%Page: 1 1 +gnudict begin +gsave +doclip +50 50 translate +0.100 0.100 scale +90 rotate +0 -5040 translate +0 setgray +newpath +(Helvetica) findfont 140 scalefont setfont +BackgroundColor 0 lt 3 1 roll 0 lt exch 0 lt or or not {gsave BackgroundColor C clippath fill grestore} if +1.000 UL +LTb +938 448 M +63 0 V +5946 0 R +-63 0 V +stroke +854 448 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10)] +] -46.7 MRshow +1.000 UL +LTb +938 781 M +31 0 V +5978 0 R +-31 0 V +938 976 M +31 0 V +5978 0 R +-31 0 V +938 1114 M +31 0 V +5978 0 R +-31 0 V +938 1221 M +31 0 V +5978 0 R +-31 0 V +938 1308 M +31 0 V +5978 0 R +-31 0 V +938 1382 M +31 0 V +5978 0 R +-31 0 V +938 1447 M +31 0 V +5978 0 R +-31 0 V +938 1503 M +31 0 V +5978 0 R +-31 0 V +938 1554 M +63 0 V +5946 0 R +-63 0 V +stroke +854 1554 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100)] +] -46.7 MRshow +1.000 UL +LTb +938 1887 M +31 0 V +5978 0 R +-31 0 V +938 2081 M +31 0 V +5978 0 R +-31 0 V +938 2219 M +31 0 V +5978 0 R +-31 0 V +938 2327 M +31 0 V +5978 0 R +-31 0 V +938 2414 M +31 0 V +5978 0 R +-31 0 V +938 2488 M +31 0 V +5978 0 R +-31 0 V +938 2552 M +31 0 V +5978 0 R +-31 0 V +938 2609 M +31 0 V +5978 0 R +-31 0 V +938 2660 M +63 0 V +5946 0 R +-63 0 V +stroke +854 2660 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1000)] +] -46.7 MRshow +1.000 UL +LTb +938 2992 M +31 0 V +5978 0 R +-31 0 V +938 3187 M +31 0 V +5978 0 R +-31 0 V +938 3325 M +31 0 V +5978 0 R +-31 0 V +938 3432 M +31 0 V +5978 0 R +-31 0 V +938 3520 M +31 0 V +5978 0 R +-31 0 V +938 3594 M +31 0 V +5978 0 R +-31 0 V +938 3658 M +31 0 V +5978 0 R +-31 0 V +938 3715 M +31 0 V +5978 0 R +-31 0 V +938 3765 M +63 0 V +5946 0 R +-63 0 V +stroke +854 3765 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MRshow +1.000 UL +LTb +938 4098 M +31 0 V +5978 0 R +-31 0 V +938 4293 M +31 0 V +5978 0 R +-31 0 V +938 4431 M +31 0 V +5978 0 R +-31 0 V +938 4538 M +31 0 V +5978 0 R +-31 0 V +938 4626 M +31 0 V +5978 0 R +-31 0 V +938 4700 M +31 0 V +5978 0 R +-31 0 V +938 4764 M +31 0 V +5978 0 R +-31 0 V +938 4820 M +31 0 V +5978 0 R +-31 0 V +938 4871 M +63 0 V +5946 0 R +-63 0 V +stroke +854 4871 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100000)] +] -46.7 MRshow +1.000 UL +LTb +938 448 M +0 63 V +0 4360 R +0 -63 V +stroke +938 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (1)] +] -46.7 MCshow +1.000 UL +LTb +2941 448 M +0 63 V +0 4360 R +0 -63 V +stroke +2941 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (2)] +] -46.7 MCshow +1.000 UL +LTb +4944 448 M +0 63 V +0 4360 R +0 -63 V +stroke +4944 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (3)] +] -46.7 MCshow +1.000 UL +LTb +6947 448 M +0 63 V +0 4360 R +0 -63 V +stroke +6947 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (4)] +] -46.7 MCshow +1.000 UL +LTb +1.000 UL +LTb +938 4871 N +938 448 L +6009 0 V +0 4423 V +-6009 0 V +Z stroke +LCb setrgbcolor +112 2659 M +currentpoint gsave translate -270 rotate 0 0 moveto +[ [(Helvetica) 140.0 0.0 true true 0 (Execution time in seconds)] +] -46.7 MCshow +grestore +LTb +LCb setrgbcolor +3942 98 M +[ [(Helvetica) 140.0 0.0 true true 0 (Number of GPUs)] +] -46.7 MCshow +LTb +1.000 UP +1.000 UL +LTb +% Begin plot #1 +1.000 UP +3.000 UL +LT0 +LCb setrgbcolor +6296 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (200K MPI)] +] -46.7 MRshow +LT0 +6380 4738 M +399 0 V +938 2013 M +2941 1685 L +4944 1538 L +6947 1430 L +938 2013 BoxF +2941 1685 BoxF +4944 1538 BoxF +6947 1430 BoxF +6579 4738 BoxF +% End plot #1 +% Begin plot #2 +1.000 UP +3.000 UL +LT1 +LCb setrgbcolor +6296 4598 M +[ [(Helvetica) 140.0 0.0 true true 0 (200K OMP)] +] -46.7 MRshow +LT1 +6380 4598 M +399 0 V +938 2014 M +2941 1703 L +4944 1544 L +6947 1437 L +938 2014 TriUF +2941 1703 TriUF +4944 1544 TriUF +6947 1437 TriUF +6579 4598 TriUF +% End plot #2 +% Begin plot #3 +1.000 UP +3.000 UL +LT2 +LCb setrgbcolor +6296 4458 M +[ [(Helvetica) 140.0 0.0 true true 0 (800K MPI)] +] -46.7 MRshow +LT2 +6380 4458 M +399 0 V +938 3346 M +2941 3008 L +4944 2816 L +6947 2690 L +938 3346 BoxF +2941 3008 BoxF +4944 2816 BoxF +6947 2690 BoxF +6579 4458 BoxF +% End plot #3 +% Begin plot #4 +1.000 UP +3.000 UL +LT3 +LCb setrgbcolor +6296 4318 M +[ [(Helvetica) 140.0 0.0 true true 0 (800K OMP)] +] -46.7 MRshow +LT3 +6380 4318 M +399 0 V +938 3315 M +2941 3006 L +4944 2820 L +6947 2685 L +938 3315 TriUF +2941 3006 TriUF +4944 2820 TriUF +6947 2685 TriUF +6579 4318 TriUF +% End plot #4 +% Begin plot #5 +1.000 UP +3.000 UL +LT4 +LCb setrgbcolor +6296 4178 M +[ [(Helvetica) 140.0 0.0 true true 0 (1.4M MPI)] +] -46.7 MRshow +LT4 +6380 4178 M +399 0 V +938 3917 M +2941 3542 L +4944 3370 L +6947 3230 L +938 3917 BoxF +2941 3542 BoxF +4944 3370 BoxF +6947 3230 BoxF +6579 4178 BoxF +% End plot #5 +% Begin plot #6 +1.000 UP +3.000 UL +LT5 +LC7 setrgbcolor +LCb setrgbcolor +6296 4038 M +[ [(Helvetica) 140.0 0.0 true true 0 (1.4M OMP)] +] -46.7 MRshow +LT5 +LC7 setrgbcolor +6380 4038 M +399 0 V +938 3929 M +2941 3577 L +4944 3377 L +6947 3237 L +938 3929 TriUF +2941 3577 TriUF +4944 3377 TriUF +6947 3237 TriUF +6579 4038 TriUF +% End plot #6 +1.000 UL +LTb +938 4871 N +938 448 L +6009 0 V +0 4423 V +-6009 0 V +Z stroke +1.000 UP +1.000 UL +LTb +stroke +grestore +end +showpage +%%Trailer +%%DocumentFonts: Helvetica +%%Pages: 1 diff --git a/Simulations/Full_mpi.eps b/Simulations/Full_mpi.eps new file mode 100644 index 0000000..a53246c --- /dev/null +++ b/Simulations/Full_mpi.eps @@ -0,0 +1,899 @@ +%!PS-Adobe-2.0 +%%Title: Full_mpi.eps +%%Creator: gnuplot 4.6 patchlevel 0 +%%CreationDate: Fri Dec 25 20:51:56 2015 +%%DocumentFonts: (atend) +%%BoundingBox: 50 50 554 770 +%%Orientation: Landscape +%%Pages: (atend) +%%EndComments +%%BeginProlog +/gnudict 256 dict def +gnudict begin +% +% The following true/false flags may be edited by hand if desired. +% The unit line width and grayscale image gamma correction may also be changed. +% +/Color true def +/Blacktext false def +/Solid false def +/Dashlength 1 def +/Landscape true def +/Level1 false def +/Rounded false def +/ClipToBoundingBox false def +/SuppressPDFMark false def +/TransparentPatterns false def +/gnulinewidth 5.000 def +/userlinewidth gnulinewidth def +/Gamma 1.0 def +/BackgroundColor {-1.000 -1.000 -1.000} def +% +/vshift -46 def +/dl1 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul sub dup 0 le { pop 0.01 } if } if +} def +/dl2 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul add } if +} def +/hpt_ 31.5 def +/vpt_ 31.5 def +/hpt hpt_ def +/vpt vpt_ def +/doclip { + ClipToBoundingBox { + newpath 50 50 moveto 554 50 lineto 554 770 lineto 50 770 lineto closepath + clip + } if +} def +% +% Gnuplot Prolog Version 4.4 (August 2010) +% +%/SuppressPDFMark true def +% +/M {moveto} bind def +/L {lineto} bind def +/R {rmoveto} bind def +/V {rlineto} bind def +/N {newpath moveto} bind def +/Z {closepath} bind def +/C {setrgbcolor} bind def +/f {rlineto fill} bind def +/g {setgray} bind def +/Gshow {show} def % May be redefined later in the file to support UTF-8 +/vpt2 vpt 2 mul def +/hpt2 hpt 2 mul def +/Lshow {currentpoint stroke M 0 vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Rshow {currentpoint stroke M dup stringwidth pop neg vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Cshow {currentpoint stroke M dup stringwidth pop -2 div vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/UP {dup vpt_ mul /vpt exch def hpt_ mul /hpt exch def + /hpt2 hpt 2 mul def /vpt2 vpt 2 mul def} def +/DL {Color {setrgbcolor Solid {pop []} if 0 setdash} + {pop pop pop 0 setgray Solid {pop []} if 0 setdash} ifelse} def +/BL {stroke userlinewidth 2 mul setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/AL {stroke userlinewidth 2 div setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/UL {dup gnulinewidth mul /userlinewidth exch def + dup 1 lt {pop 1} if 10 mul /udl exch def} def +/PL {stroke userlinewidth setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +3.8 setmiterlimit +% Default Line colors +/LCw {1 1 1} def +/LCb {0 0 0} def +/LCa {0 0 0} def +/LC0 {1 0 0} def +/LC1 {0 1 0} def +/LC2 {0 0 1} def +/LC3 {1 0 1} def +/LC4 {0 1 1} def +/LC5 {1 1 0} def +/LC6 {0 0 0} def +/LC7 {1 0.3 0} def +/LC8 {0.5 0.5 0.5} def +% Default Line Types +/LTw {PL [] 1 setgray} def +/LTb {BL [] LCb DL} def +/LTa {AL [1 udl mul 2 udl mul] 0 setdash LCa setrgbcolor} def +/LT0 {PL [] LC0 DL} def +/LT1 {PL [4 dl1 2 dl2] LC1 DL} def +/LT2 {PL [2 dl1 3 dl2] LC2 DL} def +/LT3 {PL [1 dl1 1.5 dl2] LC3 DL} def +/LT4 {PL [6 dl1 2 dl2 1 dl1 2 dl2] LC4 DL} def +/LT5 {PL [3 dl1 3 dl2 1 dl1 3 dl2] LC5 DL} def +/LT6 {PL [2 dl1 2 dl2 2 dl1 6 dl2] LC6 DL} def +/LT7 {PL [1 dl1 2 dl2 6 dl1 2 dl2 1 dl1 2 dl2] LC7 DL} def +/LT8 {PL [2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 4 dl2] LC8 DL} def +/Pnt {stroke [] 0 setdash gsave 1 setlinecap M 0 0 V stroke grestore} def +/Dia {stroke [] 0 setdash 2 copy vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke + Pnt} def +/Pls {stroke [] 0 setdash vpt sub M 0 vpt2 V + currentpoint stroke M + hpt neg vpt neg R hpt2 0 V stroke + } def +/Box {stroke [] 0 setdash 2 copy exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke + Pnt} def +/Crs {stroke [] 0 setdash exch hpt sub exch vpt add M + hpt2 vpt2 neg V currentpoint stroke M + hpt2 neg 0 R hpt2 vpt2 V stroke} def +/TriU {stroke [] 0 setdash 2 copy vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke + Pnt} def +/Star {2 copy Pls Crs} def +/BoxF {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath fill} def +/TriUF {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath fill} def +/TriD {stroke [] 0 setdash 2 copy vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke + Pnt} def +/TriDF {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath fill} def +/DiaF {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath fill} def +/Pent {stroke [] 0 setdash 2 copy gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore Pnt} def +/PentF {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath fill grestore} def +/Circle {stroke [] 0 setdash 2 copy + hpt 0 360 arc stroke Pnt} def +/CircleF {stroke [] 0 setdash hpt 0 360 arc fill} def +/C0 {BL [] 0 setdash 2 copy moveto vpt 90 450 arc} bind def +/C1 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + vpt 0 360 arc closepath} bind def +/C2 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C3 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C4 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C5 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc + 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc} bind def +/C6 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C7 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C8 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C9 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 450 arc closepath fill + vpt 0 360 arc closepath} bind def +/C10 {BL [] 0 setdash 2 copy 2 copy moveto vpt 270 360 arc closepath fill + 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C11 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C12 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C13 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C14 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 360 arc closepath fill + vpt 0 360 arc} bind def +/C15 {BL [] 0 setdash 2 copy vpt 0 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/Rec {newpath 4 2 roll moveto 1 index 0 rlineto 0 exch rlineto + neg 0 rlineto closepath} bind def +/Square {dup Rec} bind def +/Bsquare {vpt sub exch vpt sub exch vpt2 Square} bind def +/S0 {BL [] 0 setdash 2 copy moveto 0 vpt rlineto BL Bsquare} bind def +/S1 {BL [] 0 setdash 2 copy vpt Square fill Bsquare} bind def +/S2 {BL [] 0 setdash 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S3 {BL [] 0 setdash 2 copy exch vpt sub exch vpt2 vpt Rec fill Bsquare} bind def +/S4 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S5 {BL [] 0 setdash 2 copy 2 copy vpt Square fill + exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S6 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S7 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S8 {BL [] 0 setdash 2 copy vpt sub vpt Square fill Bsquare} bind def +/S9 {BL [] 0 setdash 2 copy vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S10 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt Square fill + Bsquare} bind def +/S11 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt2 vpt Rec fill + Bsquare} bind def +/S12 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill Bsquare} bind def +/S13 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S14 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S15 {BL [] 0 setdash 2 copy Bsquare fill Bsquare} bind def +/D0 {gsave translate 45 rotate 0 0 S0 stroke grestore} bind def +/D1 {gsave translate 45 rotate 0 0 S1 stroke grestore} bind def +/D2 {gsave translate 45 rotate 0 0 S2 stroke grestore} bind def +/D3 {gsave translate 45 rotate 0 0 S3 stroke grestore} bind def +/D4 {gsave translate 45 rotate 0 0 S4 stroke grestore} bind def +/D5 {gsave translate 45 rotate 0 0 S5 stroke grestore} bind def +/D6 {gsave translate 45 rotate 0 0 S6 stroke grestore} bind def +/D7 {gsave translate 45 rotate 0 0 S7 stroke grestore} bind def +/D8 {gsave translate 45 rotate 0 0 S8 stroke grestore} bind def +/D9 {gsave translate 45 rotate 0 0 S9 stroke grestore} bind def +/D10 {gsave translate 45 rotate 0 0 S10 stroke grestore} bind def +/D11 {gsave translate 45 rotate 0 0 S11 stroke grestore} bind def +/D12 {gsave translate 45 rotate 0 0 S12 stroke grestore} bind def +/D13 {gsave translate 45 rotate 0 0 S13 stroke grestore} bind def +/D14 {gsave translate 45 rotate 0 0 S14 stroke grestore} bind def +/D15 {gsave translate 45 rotate 0 0 S15 stroke grestore} bind def +/DiaE {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke} def +/BoxE {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke} def +/TriUE {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke} def +/TriDE {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke} def +/PentE {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore} def +/CircE {stroke [] 0 setdash + hpt 0 360 arc stroke} def +/Opaque {gsave closepath 1 setgray fill grestore 0 setgray closepath} def +/DiaW {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V Opaque stroke} def +/BoxW {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V Opaque stroke} def +/TriUW {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V Opaque stroke} def +/TriDW {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V Opaque stroke} def +/PentW {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + Opaque stroke grestore} def +/CircW {stroke [] 0 setdash + hpt 0 360 arc Opaque stroke} def +/BoxFill {gsave Rec 1 setgray fill grestore} def +/Density { + /Fillden exch def + currentrgbcolor + /ColB exch def /ColG exch def /ColR exch def + /ColR ColR Fillden mul Fillden sub 1 add def + /ColG ColG Fillden mul Fillden sub 1 add def + /ColB ColB Fillden mul Fillden sub 1 add def + ColR ColG ColB setrgbcolor} def +/BoxColFill {gsave Rec PolyFill} def +/PolyFill {gsave Density fill grestore grestore} def +/h {rlineto rlineto rlineto gsave closepath fill grestore} bind def +% +% PostScript Level 1 Pattern Fill routine for rectangles +% Usage: x y w h s a XX PatternFill +% x,y = lower left corner of box to be filled +% w,h = width and height of box +% a = angle in degrees between lines and x-axis +% XX = 0/1 for no/yes cross-hatch +% +/PatternFill {gsave /PFa [ 9 2 roll ] def + PFa 0 get PFa 2 get 2 div add PFa 1 get PFa 3 get 2 div add translate + PFa 2 get -2 div PFa 3 get -2 div PFa 2 get PFa 3 get Rec + gsave 1 setgray fill grestore clip + currentlinewidth 0.5 mul setlinewidth + /PFs PFa 2 get dup mul PFa 3 get dup mul add sqrt def + 0 0 M PFa 5 get rotate PFs -2 div dup translate + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 M 0 PFs V} for + 0 PFa 6 get ne { + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 2 1 roll M PFs 0 V} for + } if + stroke grestore} def +% +/languagelevel where + {pop languagelevel} {1} ifelse + 2 lt + {/InterpretLevel1 true def} + {/InterpretLevel1 Level1 def} + ifelse +% +% PostScript level 2 pattern fill definitions +% +/Level2PatternFill { +/Tile8x8 {/PaintType 2 /PatternType 1 /TilingType 1 /BBox [0 0 8 8] /XStep 8 /YStep 8} + bind def +/KeepColor {currentrgbcolor [/Pattern /DeviceRGB] setcolorspace} bind def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke} +>> matrix makepattern +/Pat1 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke + 0 4 M 4 8 L 8 4 L 4 0 L 0 4 L stroke} +>> matrix makepattern +/Pat2 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 0 8 L + 8 8 L 8 0 L 0 0 L fill} +>> matrix makepattern +/Pat3 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 8 M 8 -4 L + 0 12 M 12 0 L stroke} +>> matrix makepattern +/Pat4 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 0 M 8 12 L + 0 -4 M 12 8 L stroke} +>> matrix makepattern +/Pat5 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 8 M 4 -4 L + 0 12 M 8 -4 L 4 12 M 10 0 L stroke} +>> matrix makepattern +/Pat6 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 0 M 4 12 L + 0 -4 M 8 12 L 4 -4 M 10 8 L stroke} +>> matrix makepattern +/Pat7 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 8 -2 M -4 4 L + 12 0 M -4 8 L 12 4 M 0 10 L stroke} +>> matrix makepattern +/Pat8 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 -2 M 12 4 L + -4 0 M 12 8 L -4 4 M 8 10 L stroke} +>> matrix makepattern +/Pat9 exch def +/Pattern1 {PatternBgnd KeepColor Pat1 setpattern} bind def +/Pattern2 {PatternBgnd KeepColor Pat2 setpattern} bind def +/Pattern3 {PatternBgnd KeepColor Pat3 setpattern} bind def +/Pattern4 {PatternBgnd KeepColor Landscape {Pat5} {Pat4} ifelse setpattern} bind def +/Pattern5 {PatternBgnd KeepColor Landscape {Pat4} {Pat5} ifelse setpattern} bind def +/Pattern6 {PatternBgnd KeepColor Landscape {Pat9} {Pat6} ifelse setpattern} bind def +/Pattern7 {PatternBgnd KeepColor Landscape {Pat8} {Pat7} ifelse setpattern} bind def +} def +% +% +%End of PostScript Level 2 code +% +/PatternBgnd { + TransparentPatterns {} {gsave 1 setgray fill grestore} ifelse +} def +% +% Substitute for Level 2 pattern fill codes with +% grayscale if Level 2 support is not selected. +% +/Level1PatternFill { +/Pattern1 {0.250 Density} bind def +/Pattern2 {0.500 Density} bind def +/Pattern3 {0.750 Density} bind def +/Pattern4 {0.125 Density} bind def +/Pattern5 {0.375 Density} bind def +/Pattern6 {0.625 Density} bind def +/Pattern7 {0.875 Density} bind def +} def +% +% Now test for support of Level 2 code +% +Level1 {Level1PatternFill} {Level2PatternFill} ifelse +% +/Symbol-Oblique /Symbol findfont [1 0 .167 1 0 0] makefont +dup length dict begin {1 index /FID eq {pop pop} {def} ifelse} forall +currentdict end definefont pop +/MFshow { + { dup 5 get 3 ge + { 5 get 3 eq {gsave} {grestore} ifelse } + {dup dup 0 get findfont exch 1 get scalefont setfont + [ currentpoint ] exch dup 2 get 0 exch R dup 5 get 2 ne {dup dup 6 + get exch 4 get {Gshow} {stringwidth pop 0 R} ifelse }if dup 5 get 0 eq + {dup 3 get {2 get neg 0 exch R pop} {pop aload pop M} ifelse} {dup 5 + get 1 eq {dup 2 get exch dup 3 get exch 6 get stringwidth pop -2 div + dup 0 R} {dup 6 get stringwidth pop -2 div 0 R 6 get + show 2 index {aload pop M neg 3 -1 roll neg R pop pop} {pop pop pop + pop aload pop M} ifelse }ifelse }ifelse } + ifelse } + forall} def +/Gswidth {dup type /stringtype eq {stringwidth} {pop (n) stringwidth} ifelse} def +/MFwidth {0 exch { dup 5 get 3 ge { 5 get 3 eq { 0 } { pop } ifelse } + {dup 3 get{dup dup 0 get findfont exch 1 get scalefont setfont + 6 get Gswidth pop add} {pop} ifelse} ifelse} forall} def +/MLshow { currentpoint stroke M + 0 exch R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MRshow { currentpoint stroke M + exch dup MFwidth neg 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MCshow { currentpoint stroke M + exch dup MFwidth -2 div 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/XYsave { [( ) 1 2 true false 3 ()] } bind def +/XYrestore { [( ) 1 2 true false 4 ()] } bind def +Level1 SuppressPDFMark or +{} { +/SDict 10 dict def +systemdict /pdfmark known not { + userdict /pdfmark systemdict /cleartomark get put +} if +SDict begin [ + /Title (Full_mpi.eps) + /Subject (gnuplot plot) + /Creator (gnuplot 4.6 patchlevel 0) + /Author (lilia) +% /Producer (gnuplot) +% /Keywords () + /CreationDate (Fri Dec 25 20:51:56 2015) + /DOCINFO pdfmark +end +} ifelse +end +%%EndProlog +%%Page: 1 1 +gnudict begin +gsave +doclip +50 50 translate +0.100 0.100 scale +90 rotate +0 -5040 translate +0 setgray +newpath +(Helvetica) findfont 140 scalefont setfont +BackgroundColor 0 lt 3 1 roll 0 lt exch 0 lt or or not {gsave BackgroundColor C clippath fill grestore} if +1.000 UL +LTb +938 448 M +63 0 V +5946 0 R +-63 0 V +stroke +854 448 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10)] +] -46.7 MRshow +1.000 UL +LTb +938 781 M +31 0 V +5978 0 R +-31 0 V +938 976 M +31 0 V +5978 0 R +-31 0 V +938 1114 M +31 0 V +5978 0 R +-31 0 V +938 1221 M +31 0 V +5978 0 R +-31 0 V +938 1308 M +31 0 V +5978 0 R +-31 0 V +938 1382 M +31 0 V +5978 0 R +-31 0 V +938 1447 M +31 0 V +5978 0 R +-31 0 V +938 1503 M +31 0 V +5978 0 R +-31 0 V +938 1554 M +63 0 V +5946 0 R +-63 0 V +stroke +854 1554 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100)] +] -46.7 MRshow +1.000 UL +LTb +938 1887 M +31 0 V +5978 0 R +-31 0 V +938 2081 M +31 0 V +5978 0 R +-31 0 V +938 2219 M +31 0 V +5978 0 R +-31 0 V +938 2327 M +31 0 V +5978 0 R +-31 0 V +938 2414 M +31 0 V +5978 0 R +-31 0 V +938 2488 M +31 0 V +5978 0 R +-31 0 V +938 2552 M +31 0 V +5978 0 R +-31 0 V +938 2609 M +31 0 V +5978 0 R +-31 0 V +938 2660 M +63 0 V +5946 0 R +-63 0 V +stroke +854 2660 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1000)] +] -46.7 MRshow +1.000 UL +LTb +938 2992 M +31 0 V +5978 0 R +-31 0 V +938 3187 M +31 0 V +5978 0 R +-31 0 V +938 3325 M +31 0 V +5978 0 R +-31 0 V +938 3432 M +31 0 V +5978 0 R +-31 0 V +938 3520 M +31 0 V +5978 0 R +-31 0 V +938 3594 M +31 0 V +5978 0 R +-31 0 V +938 3658 M +31 0 V +5978 0 R +-31 0 V +938 3715 M +31 0 V +5978 0 R +-31 0 V +938 3765 M +63 0 V +5946 0 R +-63 0 V +stroke +854 3765 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MRshow +1.000 UL +LTb +938 4098 M +31 0 V +5978 0 R +-31 0 V +938 4293 M +31 0 V +5978 0 R +-31 0 V +938 4431 M +31 0 V +5978 0 R +-31 0 V +938 4538 M +31 0 V +5978 0 R +-31 0 V +938 4626 M +31 0 V +5978 0 R +-31 0 V +938 4700 M +31 0 V +5978 0 R +-31 0 V +938 4764 M +31 0 V +5978 0 R +-31 0 V +938 4820 M +31 0 V +5978 0 R +-31 0 V +938 4871 M +63 0 V +5946 0 R +-63 0 V +stroke +854 4871 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100000)] +] -46.7 MRshow +1.000 UL +LTb +938 448 M +0 63 V +0 4360 R +0 -63 V +stroke +938 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 0)] +] -46.7 MCshow +1.000 UL +LTb +1796 448 M +0 63 V +0 4360 R +0 -63 V +stroke +1796 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 200000)] +] -46.7 MCshow +1.000 UL +LTb +2655 448 M +0 63 V +0 4360 R +0 -63 V +stroke +2655 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 400000)] +] -46.7 MCshow +1.000 UL +LTb +3513 448 M +0 63 V +0 4360 R +0 -63 V +stroke +3513 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 600000)] +] -46.7 MCshow +1.000 UL +LTb +4372 448 M +0 63 V +0 4360 R +0 -63 V +stroke +4372 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 800000)] +] -46.7 MCshow +1.000 UL +LTb +5230 448 M +0 63 V +0 4360 R +0 -63 V +stroke +5230 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1e+06)] +] -46.7 MCshow +1.000 UL +LTb +6089 448 M +0 63 V +0 4360 R +0 -63 V +stroke +6089 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1.2e+06)] +] -46.7 MCshow +1.000 UL +LTb +6947 448 M +0 63 V +0 4360 R +0 -63 V +stroke +6947 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1.4e+06)] +] -46.7 MCshow +1.000 UL +LTb +1.000 UL +LTb +938 4871 N +938 448 L +6009 0 V +0 4423 V +-6009 0 V +Z stroke +LCb setrgbcolor +112 2659 M +currentpoint gsave translate -270 rotate 0 0 moveto +[ [(Helvetica) 140.0 0.0 true true 0 (Execution time in seconds)] +] -46.7 MCshow +grestore +LTb +LCb setrgbcolor +3942 98 M +[ [(Helvetica) 140.0 0.0 true true 0 (Polynomial's degrees)] +] -46.7 MCshow +LTb +1.000 UP +1.000 UL +LTb +% Begin plot #1 +1.000 UP +3.000 UL +LT0 +LCb setrgbcolor +3335 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (1 GPU)] +] -46.7 MRshow +LT0 +3419 4738 M +399 0 V +1367 1305 M +429 708 V +859 787 V +858 391 V +859 155 V +858 338 V +859 83 V +858 150 V +1367 1305 Pls +1796 2013 Pls +2655 2800 Pls +3513 3191 Pls +4372 3346 Pls +5230 3684 Pls +6089 3767 Pls +6947 3917 Pls +3618 4738 Pls +% End plot #1 +% Begin plot #2 +1.000 UP +3.000 UL +LT1 +LCb setrgbcolor +4322 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (2 GPU)] +] -46.7 MRshow +LT1 +4406 4738 M +399 0 V +1367 1220 M +429 465 V +859 799 V +858 456 V +859 68 V +858 372 V +859 150 V +858 12 V +1367 1220 Crs +1796 1685 Crs +2655 2484 Crs +3513 2940 Crs +4372 3008 Crs +5230 3380 Crs +6089 3530 Crs +6947 3542 Crs +4605 4738 Crs +% End plot #2 +% Begin plot #3 +1.000 UP +3.000 UL +LT2 +LCb setrgbcolor +5309 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (3 GPU)] +] -46.7 MRshow +LT2 +5393 4738 M +399 0 V +1367 1138 M +429 400 V +859 843 V +858 805 V +859 -370 V +858 366 V +859 199 V +858 -11 V +1367 1138 Star +1796 1538 Star +2655 2381 Star +3513 3186 Star +4372 2816 Star +5230 3182 Star +6089 3381 Star +6947 3370 Star +5592 4738 Star +% End plot #3 +% Begin plot #4 +1.000 UP +3.000 UL +LT3 +LCb setrgbcolor +6296 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (4 GPU)] +] -46.7 MRshow +LT3 +6380 4738 M +399 0 V +1367 936 M +429 494 V +859 761 V +858 527 V +859 -28 V +858 416 V +859 100 V +858 24 V +1367 936 Box +1796 1430 Box +2655 2191 Box +3513 2718 Box +4372 2690 Box +5230 3106 Box +6089 3206 Box +6947 3230 Box +6579 4738 Box +% End plot #4 +1.000 UL +LTb +938 4871 N +938 448 L +6009 0 V +0 4423 V +-6009 0 V +Z stroke +1.000 UP +1.000 UL +LTb +stroke +grestore +end +showpage +%%Trailer +%%DocumentFonts: Helvetica +%%Pages: 1 diff --git a/Simulations/Full_omp.eps b/Simulations/Full_omp.eps new file mode 100644 index 0000000..2d1772f --- /dev/null +++ b/Simulations/Full_omp.eps @@ -0,0 +1,899 @@ +%!PS-Adobe-2.0 +%%Title: Full_omp.eps +%%Creator: gnuplot 4.6 patchlevel 0 +%%CreationDate: Fri Dec 25 20:52:55 2015 +%%DocumentFonts: (atend) +%%BoundingBox: 50 50 554 770 +%%Orientation: Landscape +%%Pages: (atend) +%%EndComments +%%BeginProlog +/gnudict 256 dict def +gnudict begin +% +% The following true/false flags may be edited by hand if desired. +% The unit line width and grayscale image gamma correction may also be changed. +% +/Color true def +/Blacktext false def +/Solid false def +/Dashlength 1 def +/Landscape true def +/Level1 false def +/Rounded false def +/ClipToBoundingBox false def +/SuppressPDFMark false def +/TransparentPatterns false def +/gnulinewidth 5.000 def +/userlinewidth gnulinewidth def +/Gamma 1.0 def +/BackgroundColor {-1.000 -1.000 -1.000} def +% +/vshift -46 def +/dl1 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul sub dup 0 le { pop 0.01 } if } if +} def +/dl2 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul add } if +} def +/hpt_ 31.5 def +/vpt_ 31.5 def +/hpt hpt_ def +/vpt vpt_ def +/doclip { + ClipToBoundingBox { + newpath 50 50 moveto 554 50 lineto 554 770 lineto 50 770 lineto closepath + clip + } if +} def +% +% Gnuplot Prolog Version 4.4 (August 2010) +% +%/SuppressPDFMark true def +% +/M {moveto} bind def +/L {lineto} bind def +/R {rmoveto} bind def +/V {rlineto} bind def +/N {newpath moveto} bind def +/Z {closepath} bind def +/C {setrgbcolor} bind def +/f {rlineto fill} bind def +/g {setgray} bind def +/Gshow {show} def % May be redefined later in the file to support UTF-8 +/vpt2 vpt 2 mul def +/hpt2 hpt 2 mul def +/Lshow {currentpoint stroke M 0 vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Rshow {currentpoint stroke M dup stringwidth pop neg vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Cshow {currentpoint stroke M dup stringwidth pop -2 div vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/UP {dup vpt_ mul /vpt exch def hpt_ mul /hpt exch def + /hpt2 hpt 2 mul def /vpt2 vpt 2 mul def} def +/DL {Color {setrgbcolor Solid {pop []} if 0 setdash} + {pop pop pop 0 setgray Solid {pop []} if 0 setdash} ifelse} def +/BL {stroke userlinewidth 2 mul setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/AL {stroke userlinewidth 2 div setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/UL {dup gnulinewidth mul /userlinewidth exch def + dup 1 lt {pop 1} if 10 mul /udl exch def} def +/PL {stroke userlinewidth setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +3.8 setmiterlimit +% Default Line colors +/LCw {1 1 1} def +/LCb {0 0 0} def +/LCa {0 0 0} def +/LC0 {1 0 0} def +/LC1 {0 1 0} def +/LC2 {0 0 1} def +/LC3 {1 0 1} def +/LC4 {0 1 1} def +/LC5 {1 1 0} def +/LC6 {0 0 0} def +/LC7 {1 0.3 0} def +/LC8 {0.5 0.5 0.5} def +% Default Line Types +/LTw {PL [] 1 setgray} def +/LTb {BL [] LCb DL} def +/LTa {AL [1 udl mul 2 udl mul] 0 setdash LCa setrgbcolor} def +/LT0 {PL [] LC0 DL} def +/LT1 {PL [4 dl1 2 dl2] LC1 DL} def +/LT2 {PL [2 dl1 3 dl2] LC2 DL} def +/LT3 {PL [1 dl1 1.5 dl2] LC3 DL} def +/LT4 {PL [6 dl1 2 dl2 1 dl1 2 dl2] LC4 DL} def +/LT5 {PL [3 dl1 3 dl2 1 dl1 3 dl2] LC5 DL} def +/LT6 {PL [2 dl1 2 dl2 2 dl1 6 dl2] LC6 DL} def +/LT7 {PL [1 dl1 2 dl2 6 dl1 2 dl2 1 dl1 2 dl2] LC7 DL} def +/LT8 {PL [2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 4 dl2] LC8 DL} def +/Pnt {stroke [] 0 setdash gsave 1 setlinecap M 0 0 V stroke grestore} def +/Dia {stroke [] 0 setdash 2 copy vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke + Pnt} def +/Pls {stroke [] 0 setdash vpt sub M 0 vpt2 V + currentpoint stroke M + hpt neg vpt neg R hpt2 0 V stroke + } def +/Box {stroke [] 0 setdash 2 copy exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke + Pnt} def +/Crs {stroke [] 0 setdash exch hpt sub exch vpt add M + hpt2 vpt2 neg V currentpoint stroke M + hpt2 neg 0 R hpt2 vpt2 V stroke} def +/TriU {stroke [] 0 setdash 2 copy vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke + Pnt} def +/Star {2 copy Pls Crs} def +/BoxF {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath fill} def +/TriUF {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath fill} def +/TriD {stroke [] 0 setdash 2 copy vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke + Pnt} def +/TriDF {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath fill} def +/DiaF {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath fill} def +/Pent {stroke [] 0 setdash 2 copy gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore Pnt} def +/PentF {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath fill grestore} def +/Circle {stroke [] 0 setdash 2 copy + hpt 0 360 arc stroke Pnt} def +/CircleF {stroke [] 0 setdash hpt 0 360 arc fill} def +/C0 {BL [] 0 setdash 2 copy moveto vpt 90 450 arc} bind def +/C1 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + vpt 0 360 arc closepath} bind def +/C2 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C3 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C4 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C5 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc + 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc} bind def +/C6 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C7 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C8 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C9 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 450 arc closepath fill + vpt 0 360 arc closepath} bind def +/C10 {BL [] 0 setdash 2 copy 2 copy moveto vpt 270 360 arc closepath fill + 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C11 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C12 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C13 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C14 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 360 arc closepath fill + vpt 0 360 arc} bind def +/C15 {BL [] 0 setdash 2 copy vpt 0 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/Rec {newpath 4 2 roll moveto 1 index 0 rlineto 0 exch rlineto + neg 0 rlineto closepath} bind def +/Square {dup Rec} bind def +/Bsquare {vpt sub exch vpt sub exch vpt2 Square} bind def +/S0 {BL [] 0 setdash 2 copy moveto 0 vpt rlineto BL Bsquare} bind def +/S1 {BL [] 0 setdash 2 copy vpt Square fill Bsquare} bind def +/S2 {BL [] 0 setdash 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S3 {BL [] 0 setdash 2 copy exch vpt sub exch vpt2 vpt Rec fill Bsquare} bind def +/S4 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S5 {BL [] 0 setdash 2 copy 2 copy vpt Square fill + exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S6 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S7 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S8 {BL [] 0 setdash 2 copy vpt sub vpt Square fill Bsquare} bind def +/S9 {BL [] 0 setdash 2 copy vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S10 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt Square fill + Bsquare} bind def +/S11 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt2 vpt Rec fill + Bsquare} bind def +/S12 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill Bsquare} bind def +/S13 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S14 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S15 {BL [] 0 setdash 2 copy Bsquare fill Bsquare} bind def +/D0 {gsave translate 45 rotate 0 0 S0 stroke grestore} bind def +/D1 {gsave translate 45 rotate 0 0 S1 stroke grestore} bind def +/D2 {gsave translate 45 rotate 0 0 S2 stroke grestore} bind def +/D3 {gsave translate 45 rotate 0 0 S3 stroke grestore} bind def +/D4 {gsave translate 45 rotate 0 0 S4 stroke grestore} bind def +/D5 {gsave translate 45 rotate 0 0 S5 stroke grestore} bind def +/D6 {gsave translate 45 rotate 0 0 S6 stroke grestore} bind def +/D7 {gsave translate 45 rotate 0 0 S7 stroke grestore} bind def +/D8 {gsave translate 45 rotate 0 0 S8 stroke grestore} bind def +/D9 {gsave translate 45 rotate 0 0 S9 stroke grestore} bind def +/D10 {gsave translate 45 rotate 0 0 S10 stroke grestore} bind def +/D11 {gsave translate 45 rotate 0 0 S11 stroke grestore} bind def +/D12 {gsave translate 45 rotate 0 0 S12 stroke grestore} bind def +/D13 {gsave translate 45 rotate 0 0 S13 stroke grestore} bind def +/D14 {gsave translate 45 rotate 0 0 S14 stroke grestore} bind def +/D15 {gsave translate 45 rotate 0 0 S15 stroke grestore} bind def +/DiaE {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke} def +/BoxE {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke} def +/TriUE {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke} def +/TriDE {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke} def +/PentE {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore} def +/CircE {stroke [] 0 setdash + hpt 0 360 arc stroke} def +/Opaque {gsave closepath 1 setgray fill grestore 0 setgray closepath} def +/DiaW {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V Opaque stroke} def +/BoxW {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V Opaque stroke} def +/TriUW {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V Opaque stroke} def +/TriDW {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V Opaque stroke} def +/PentW {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + Opaque stroke grestore} def +/CircW {stroke [] 0 setdash + hpt 0 360 arc Opaque stroke} def +/BoxFill {gsave Rec 1 setgray fill grestore} def +/Density { + /Fillden exch def + currentrgbcolor + /ColB exch def /ColG exch def /ColR exch def + /ColR ColR Fillden mul Fillden sub 1 add def + /ColG ColG Fillden mul Fillden sub 1 add def + /ColB ColB Fillden mul Fillden sub 1 add def + ColR ColG ColB setrgbcolor} def +/BoxColFill {gsave Rec PolyFill} def +/PolyFill {gsave Density fill grestore grestore} def +/h {rlineto rlineto rlineto gsave closepath fill grestore} bind def +% +% PostScript Level 1 Pattern Fill routine for rectangles +% Usage: x y w h s a XX PatternFill +% x,y = lower left corner of box to be filled +% w,h = width and height of box +% a = angle in degrees between lines and x-axis +% XX = 0/1 for no/yes cross-hatch +% +/PatternFill {gsave /PFa [ 9 2 roll ] def + PFa 0 get PFa 2 get 2 div add PFa 1 get PFa 3 get 2 div add translate + PFa 2 get -2 div PFa 3 get -2 div PFa 2 get PFa 3 get Rec + gsave 1 setgray fill grestore clip + currentlinewidth 0.5 mul setlinewidth + /PFs PFa 2 get dup mul PFa 3 get dup mul add sqrt def + 0 0 M PFa 5 get rotate PFs -2 div dup translate + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 M 0 PFs V} for + 0 PFa 6 get ne { + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 2 1 roll M PFs 0 V} for + } if + stroke grestore} def +% +/languagelevel where + {pop languagelevel} {1} ifelse + 2 lt + {/InterpretLevel1 true def} + {/InterpretLevel1 Level1 def} + ifelse +% +% PostScript level 2 pattern fill definitions +% +/Level2PatternFill { +/Tile8x8 {/PaintType 2 /PatternType 1 /TilingType 1 /BBox [0 0 8 8] /XStep 8 /YStep 8} + bind def +/KeepColor {currentrgbcolor [/Pattern /DeviceRGB] setcolorspace} bind def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke} +>> matrix makepattern +/Pat1 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke + 0 4 M 4 8 L 8 4 L 4 0 L 0 4 L stroke} +>> matrix makepattern +/Pat2 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 0 8 L + 8 8 L 8 0 L 0 0 L fill} +>> matrix makepattern +/Pat3 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 8 M 8 -4 L + 0 12 M 12 0 L stroke} +>> matrix makepattern +/Pat4 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 0 M 8 12 L + 0 -4 M 12 8 L stroke} +>> matrix makepattern +/Pat5 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 8 M 4 -4 L + 0 12 M 8 -4 L 4 12 M 10 0 L stroke} +>> matrix makepattern +/Pat6 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 0 M 4 12 L + 0 -4 M 8 12 L 4 -4 M 10 8 L stroke} +>> matrix makepattern +/Pat7 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 8 -2 M -4 4 L + 12 0 M -4 8 L 12 4 M 0 10 L stroke} +>> matrix makepattern +/Pat8 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 -2 M 12 4 L + -4 0 M 12 8 L -4 4 M 8 10 L stroke} +>> matrix makepattern +/Pat9 exch def +/Pattern1 {PatternBgnd KeepColor Pat1 setpattern} bind def +/Pattern2 {PatternBgnd KeepColor Pat2 setpattern} bind def +/Pattern3 {PatternBgnd KeepColor Pat3 setpattern} bind def +/Pattern4 {PatternBgnd KeepColor Landscape {Pat5} {Pat4} ifelse setpattern} bind def +/Pattern5 {PatternBgnd KeepColor Landscape {Pat4} {Pat5} ifelse setpattern} bind def +/Pattern6 {PatternBgnd KeepColor Landscape {Pat9} {Pat6} ifelse setpattern} bind def +/Pattern7 {PatternBgnd KeepColor Landscape {Pat8} {Pat7} ifelse setpattern} bind def +} def +% +% +%End of PostScript Level 2 code +% +/PatternBgnd { + TransparentPatterns {} {gsave 1 setgray fill grestore} ifelse +} def +% +% Substitute for Level 2 pattern fill codes with +% grayscale if Level 2 support is not selected. +% +/Level1PatternFill { +/Pattern1 {0.250 Density} bind def +/Pattern2 {0.500 Density} bind def +/Pattern3 {0.750 Density} bind def +/Pattern4 {0.125 Density} bind def +/Pattern5 {0.375 Density} bind def +/Pattern6 {0.625 Density} bind def +/Pattern7 {0.875 Density} bind def +} def +% +% Now test for support of Level 2 code +% +Level1 {Level1PatternFill} {Level2PatternFill} ifelse +% +/Symbol-Oblique /Symbol findfont [1 0 .167 1 0 0] makefont +dup length dict begin {1 index /FID eq {pop pop} {def} ifelse} forall +currentdict end definefont pop +/MFshow { + { dup 5 get 3 ge + { 5 get 3 eq {gsave} {grestore} ifelse } + {dup dup 0 get findfont exch 1 get scalefont setfont + [ currentpoint ] exch dup 2 get 0 exch R dup 5 get 2 ne {dup dup 6 + get exch 4 get {Gshow} {stringwidth pop 0 R} ifelse }if dup 5 get 0 eq + {dup 3 get {2 get neg 0 exch R pop} {pop aload pop M} ifelse} {dup 5 + get 1 eq {dup 2 get exch dup 3 get exch 6 get stringwidth pop -2 div + dup 0 R} {dup 6 get stringwidth pop -2 div 0 R 6 get + show 2 index {aload pop M neg 3 -1 roll neg R pop pop} {pop pop pop + pop aload pop M} ifelse }ifelse }ifelse } + ifelse } + forall} def +/Gswidth {dup type /stringtype eq {stringwidth} {pop (n) stringwidth} ifelse} def +/MFwidth {0 exch { dup 5 get 3 ge { 5 get 3 eq { 0 } { pop } ifelse } + {dup 3 get{dup dup 0 get findfont exch 1 get scalefont setfont + 6 get Gswidth pop add} {pop} ifelse} ifelse} forall} def +/MLshow { currentpoint stroke M + 0 exch R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MRshow { currentpoint stroke M + exch dup MFwidth neg 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MCshow { currentpoint stroke M + exch dup MFwidth -2 div 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/XYsave { [( ) 1 2 true false 3 ()] } bind def +/XYrestore { [( ) 1 2 true false 4 ()] } bind def +Level1 SuppressPDFMark or +{} { +/SDict 10 dict def +systemdict /pdfmark known not { + userdict /pdfmark systemdict /cleartomark get put +} if +SDict begin [ + /Title (Full_omp.eps) + /Subject (gnuplot plot) + /Creator (gnuplot 4.6 patchlevel 0) + /Author (lilia) +% /Producer (gnuplot) +% /Keywords () + /CreationDate (Fri Dec 25 20:52:55 2015) + /DOCINFO pdfmark +end +} ifelse +end +%%EndProlog +%%Page: 1 1 +gnudict begin +gsave +doclip +50 50 translate +0.100 0.100 scale +90 rotate +0 -5040 translate +0 setgray +newpath +(Helvetica) findfont 140 scalefont setfont +BackgroundColor 0 lt 3 1 roll 0 lt exch 0 lt or or not {gsave BackgroundColor C clippath fill grestore} if +1.000 UL +LTb +938 448 M +63 0 V +5946 0 R +-63 0 V +stroke +854 448 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10)] +] -46.7 MRshow +1.000 UL +LTb +938 781 M +31 0 V +5978 0 R +-31 0 V +938 976 M +31 0 V +5978 0 R +-31 0 V +938 1114 M +31 0 V +5978 0 R +-31 0 V +938 1221 M +31 0 V +5978 0 R +-31 0 V +938 1308 M +31 0 V +5978 0 R +-31 0 V +938 1382 M +31 0 V +5978 0 R +-31 0 V +938 1447 M +31 0 V +5978 0 R +-31 0 V +938 1503 M +31 0 V +5978 0 R +-31 0 V +938 1554 M +63 0 V +5946 0 R +-63 0 V +stroke +854 1554 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100)] +] -46.7 MRshow +1.000 UL +LTb +938 1887 M +31 0 V +5978 0 R +-31 0 V +938 2081 M +31 0 V +5978 0 R +-31 0 V +938 2219 M +31 0 V +5978 0 R +-31 0 V +938 2327 M +31 0 V +5978 0 R +-31 0 V +938 2414 M +31 0 V +5978 0 R +-31 0 V +938 2488 M +31 0 V +5978 0 R +-31 0 V +938 2552 M +31 0 V +5978 0 R +-31 0 V +938 2609 M +31 0 V +5978 0 R +-31 0 V +938 2660 M +63 0 V +5946 0 R +-63 0 V +stroke +854 2660 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1000)] +] -46.7 MRshow +1.000 UL +LTb +938 2992 M +31 0 V +5978 0 R +-31 0 V +938 3187 M +31 0 V +5978 0 R +-31 0 V +938 3325 M +31 0 V +5978 0 R +-31 0 V +938 3432 M +31 0 V +5978 0 R +-31 0 V +938 3520 M +31 0 V +5978 0 R +-31 0 V +938 3594 M +31 0 V +5978 0 R +-31 0 V +938 3658 M +31 0 V +5978 0 R +-31 0 V +938 3715 M +31 0 V +5978 0 R +-31 0 V +938 3765 M +63 0 V +5946 0 R +-63 0 V +stroke +854 3765 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MRshow +1.000 UL +LTb +938 4098 M +31 0 V +5978 0 R +-31 0 V +938 4293 M +31 0 V +5978 0 R +-31 0 V +938 4431 M +31 0 V +5978 0 R +-31 0 V +938 4538 M +31 0 V +5978 0 R +-31 0 V +938 4626 M +31 0 V +5978 0 R +-31 0 V +938 4700 M +31 0 V +5978 0 R +-31 0 V +938 4764 M +31 0 V +5978 0 R +-31 0 V +938 4820 M +31 0 V +5978 0 R +-31 0 V +938 4871 M +63 0 V +5946 0 R +-63 0 V +stroke +854 4871 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100000)] +] -46.7 MRshow +1.000 UL +LTb +938 448 M +0 63 V +0 4360 R +0 -63 V +stroke +938 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 0)] +] -46.7 MCshow +1.000 UL +LTb +1796 448 M +0 63 V +0 4360 R +0 -63 V +stroke +1796 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 200000)] +] -46.7 MCshow +1.000 UL +LTb +2655 448 M +0 63 V +0 4360 R +0 -63 V +stroke +2655 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 400000)] +] -46.7 MCshow +1.000 UL +LTb +3513 448 M +0 63 V +0 4360 R +0 -63 V +stroke +3513 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 600000)] +] -46.7 MCshow +1.000 UL +LTb +4372 448 M +0 63 V +0 4360 R +0 -63 V +stroke +4372 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 800000)] +] -46.7 MCshow +1.000 UL +LTb +5230 448 M +0 63 V +0 4360 R +0 -63 V +stroke +5230 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1e+06)] +] -46.7 MCshow +1.000 UL +LTb +6089 448 M +0 63 V +0 4360 R +0 -63 V +stroke +6089 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1.2e+06)] +] -46.7 MCshow +1.000 UL +LTb +6947 448 M +0 63 V +0 4360 R +0 -63 V +stroke +6947 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1.4e+06)] +] -46.7 MCshow +1.000 UL +LTb +1.000 UL +LTb +938 4871 N +938 448 L +6009 0 V +0 4423 V +-6009 0 V +Z stroke +LCb setrgbcolor +112 2659 M +currentpoint gsave translate -270 rotate 0 0 moveto +[ [(Helvetica) 140.0 0.0 true true 0 (Execution time in seconds)] +] -46.7 MCshow +grestore +LTb +LCb setrgbcolor +3942 98 M +[ [(Helvetica) 140.0 0.0 true true 0 (Polynomial's degrees)] +] -46.7 MCshow +LTb +1.000 UP +1.000 UL +LTb +% Begin plot #1 +1.000 UP +3.000 UL +LT0 +LCb setrgbcolor +3335 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (1 GPU)] +] -46.7 MRshow +LT0 +3419 4738 M +399 0 V +1367 1304 M +429 710 V +859 779 V +858 432 V +859 90 V +858 380 V +859 125 V +858 109 V +1367 1304 Pls +1796 2014 Pls +2655 2793 Pls +3513 3225 Pls +4372 3315 Pls +5230 3695 Pls +6089 3820 Pls +6947 3929 Pls +3618 4738 Pls +% End plot #1 +% Begin plot #2 +1.000 UP +3.000 UL +LT1 +LCb setrgbcolor +4322 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (2 GPU)] +] -46.7 MRshow +LT1 +4406 4738 M +399 0 V +1367 1208 M +429 495 V +859 797 V +858 408 V +859 98 V +858 371 V +859 101 V +858 99 V +1367 1208 Crs +1796 1703 Crs +2655 2500 Crs +3513 2908 Crs +4372 3006 Crs +5230 3377 Crs +6089 3478 Crs +6947 3577 Crs +4605 4738 Crs +% End plot #2 +% Begin plot #3 +1.000 UP +3.000 UL +LT2 +LCb setrgbcolor +5309 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (3 GPU)] +] -46.7 MRshow +LT2 +5393 4738 M +399 0 V +1367 1149 M +429 395 V +859 826 V +858 819 V +859 -369 V +858 371 V +859 131 V +858 55 V +1367 1149 Star +1796 1544 Star +2655 2370 Star +3513 3189 Star +4372 2820 Star +5230 3191 Star +6089 3322 Star +6947 3377 Star +5592 4738 Star +% End plot #3 +% Begin plot #4 +1.000 UP +3.000 UL +LT3 +LCb setrgbcolor +6296 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (4 GPU)] +] -46.7 MRshow +LT3 +6380 4738 M +399 0 V +1367 932 M +429 505 V +859 782 V +858 513 V +859 -47 V +858 412 V +859 132 V +858 8 V +1367 932 Box +1796 1437 Box +2655 2219 Box +3513 2732 Box +4372 2685 Box +5230 3097 Box +6089 3229 Box +6947 3237 Box +6579 4738 Box +% End plot #4 +1.000 UL +LTb +938 4871 N +938 448 L +6009 0 V +0 4423 V +-6009 0 V +Z stroke +1.000 UP +1.000 UL +LTb +stroke +grestore +end +showpage +%%Trailer +%%DocumentFonts: Helvetica +%%Pages: 1 diff --git a/Simulations/MPI.eps b/Simulations/MPI.eps new file mode 100644 index 0000000..c0daa18 --- /dev/null +++ b/Simulations/MPI.eps @@ -0,0 +1,871 @@ +%!PS-Adobe-2.0 +%%Title: MPI.eps +%%Creator: gnuplot 4.6 patchlevel 0 +%%CreationDate: Fri Dec 25 21:35:56 2015 +%%DocumentFonts: (atend) +%%BoundingBox: 50 50 554 770 +%%Orientation: Landscape +%%Pages: (atend) +%%EndComments +%%BeginProlog +/gnudict 256 dict def +gnudict begin +% +% The following true/false flags may be edited by hand if desired. +% The unit line width and grayscale image gamma correction may also be changed. +% +/Color true def +/Blacktext false def +/Solid false def +/Dashlength 1 def +/Landscape true def +/Level1 false def +/Rounded false def +/ClipToBoundingBox false def +/SuppressPDFMark false def +/TransparentPatterns false def +/gnulinewidth 5.000 def +/userlinewidth gnulinewidth def +/Gamma 1.0 def +/BackgroundColor {-1.000 -1.000 -1.000} def +% +/vshift -46 def +/dl1 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul sub dup 0 le { pop 0.01 } if } if +} def +/dl2 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul add } if +} def +/hpt_ 31.5 def +/vpt_ 31.5 def +/hpt hpt_ def +/vpt vpt_ def +/doclip { + ClipToBoundingBox { + newpath 50 50 moveto 554 50 lineto 554 770 lineto 50 770 lineto closepath + clip + } if +} def +% +% Gnuplot Prolog Version 4.4 (August 2010) +% +%/SuppressPDFMark true def +% +/M {moveto} bind def +/L {lineto} bind def +/R {rmoveto} bind def +/V {rlineto} bind def +/N {newpath moveto} bind def +/Z {closepath} bind def +/C {setrgbcolor} bind def +/f {rlineto fill} bind def +/g {setgray} bind def +/Gshow {show} def % May be redefined later in the file to support UTF-8 +/vpt2 vpt 2 mul def +/hpt2 hpt 2 mul def +/Lshow {currentpoint stroke M 0 vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Rshow {currentpoint stroke M dup stringwidth pop neg vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Cshow {currentpoint stroke M dup stringwidth pop -2 div vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/UP {dup vpt_ mul /vpt exch def hpt_ mul /hpt exch def + /hpt2 hpt 2 mul def /vpt2 vpt 2 mul def} def +/DL {Color {setrgbcolor Solid {pop []} if 0 setdash} + {pop pop pop 0 setgray Solid {pop []} if 0 setdash} ifelse} def +/BL {stroke userlinewidth 2 mul setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/AL {stroke userlinewidth 2 div setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/UL {dup gnulinewidth mul /userlinewidth exch def + dup 1 lt {pop 1} if 10 mul /udl exch def} def +/PL {stroke userlinewidth setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +3.8 setmiterlimit +% Default Line colors +/LCw {1 1 1} def +/LCb {0 0 0} def +/LCa {0 0 0} def +/LC0 {1 0 0} def +/LC1 {0 1 0} def +/LC2 {0 0 1} def +/LC3 {1 0 1} def +/LC4 {0 1 1} def +/LC5 {1 1 0} def +/LC6 {0 0 0} def +/LC7 {1 0.3 0} def +/LC8 {0.5 0.5 0.5} def +% Default Line Types +/LTw {PL [] 1 setgray} def +/LTb {BL [] LCb DL} def +/LTa {AL [1 udl mul 2 udl mul] 0 setdash LCa setrgbcolor} def +/LT0 {PL [] LC0 DL} def +/LT1 {PL [4 dl1 2 dl2] LC1 DL} def +/LT2 {PL [2 dl1 3 dl2] LC2 DL} def +/LT3 {PL [1 dl1 1.5 dl2] LC3 DL} def +/LT4 {PL [6 dl1 2 dl2 1 dl1 2 dl2] LC4 DL} def +/LT5 {PL [3 dl1 3 dl2 1 dl1 3 dl2] LC5 DL} def +/LT6 {PL [2 dl1 2 dl2 2 dl1 6 dl2] LC6 DL} def +/LT7 {PL [1 dl1 2 dl2 6 dl1 2 dl2 1 dl1 2 dl2] LC7 DL} def +/LT8 {PL [2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 4 dl2] LC8 DL} def +/Pnt {stroke [] 0 setdash gsave 1 setlinecap M 0 0 V stroke grestore} def +/Dia {stroke [] 0 setdash 2 copy vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke + Pnt} def +/Pls {stroke [] 0 setdash vpt sub M 0 vpt2 V + currentpoint stroke M + hpt neg vpt neg R hpt2 0 V stroke + } def +/Box {stroke [] 0 setdash 2 copy exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke + Pnt} def +/Crs {stroke [] 0 setdash exch hpt sub exch vpt add M + hpt2 vpt2 neg V currentpoint stroke M + hpt2 neg 0 R hpt2 vpt2 V stroke} def +/TriU {stroke [] 0 setdash 2 copy vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke + Pnt} def +/Star {2 copy Pls Crs} def +/BoxF {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath fill} def +/TriUF {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath fill} def +/TriD {stroke [] 0 setdash 2 copy vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke + Pnt} def +/TriDF {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath fill} def +/DiaF {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath fill} def +/Pent {stroke [] 0 setdash 2 copy gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore Pnt} def +/PentF {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath fill grestore} def +/Circle {stroke [] 0 setdash 2 copy + hpt 0 360 arc stroke Pnt} def +/CircleF {stroke [] 0 setdash hpt 0 360 arc fill} def +/C0 {BL [] 0 setdash 2 copy moveto vpt 90 450 arc} bind def +/C1 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + vpt 0 360 arc closepath} bind def +/C2 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C3 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C4 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C5 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc + 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc} bind def +/C6 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C7 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C8 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C9 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 450 arc closepath fill + vpt 0 360 arc closepath} bind def +/C10 {BL [] 0 setdash 2 copy 2 copy moveto vpt 270 360 arc closepath fill + 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C11 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C12 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C13 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C14 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 360 arc closepath fill + vpt 0 360 arc} bind def +/C15 {BL [] 0 setdash 2 copy vpt 0 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/Rec {newpath 4 2 roll moveto 1 index 0 rlineto 0 exch rlineto + neg 0 rlineto closepath} bind def +/Square {dup Rec} bind def +/Bsquare {vpt sub exch vpt sub exch vpt2 Square} bind def +/S0 {BL [] 0 setdash 2 copy moveto 0 vpt rlineto BL Bsquare} bind def +/S1 {BL [] 0 setdash 2 copy vpt Square fill Bsquare} bind def +/S2 {BL [] 0 setdash 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S3 {BL [] 0 setdash 2 copy exch vpt sub exch vpt2 vpt Rec fill Bsquare} bind def +/S4 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S5 {BL [] 0 setdash 2 copy 2 copy vpt Square fill + exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S6 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S7 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S8 {BL [] 0 setdash 2 copy vpt sub vpt Square fill Bsquare} bind def +/S9 {BL [] 0 setdash 2 copy vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S10 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt Square fill + Bsquare} bind def +/S11 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt2 vpt Rec fill + Bsquare} bind def +/S12 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill Bsquare} bind def +/S13 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S14 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S15 {BL [] 0 setdash 2 copy Bsquare fill Bsquare} bind def +/D0 {gsave translate 45 rotate 0 0 S0 stroke grestore} bind def +/D1 {gsave translate 45 rotate 0 0 S1 stroke grestore} bind def +/D2 {gsave translate 45 rotate 0 0 S2 stroke grestore} bind def +/D3 {gsave translate 45 rotate 0 0 S3 stroke grestore} bind def +/D4 {gsave translate 45 rotate 0 0 S4 stroke grestore} bind def +/D5 {gsave translate 45 rotate 0 0 S5 stroke grestore} bind def +/D6 {gsave translate 45 rotate 0 0 S6 stroke grestore} bind def +/D7 {gsave translate 45 rotate 0 0 S7 stroke grestore} bind def +/D8 {gsave translate 45 rotate 0 0 S8 stroke grestore} bind def +/D9 {gsave translate 45 rotate 0 0 S9 stroke grestore} bind def +/D10 {gsave translate 45 rotate 0 0 S10 stroke grestore} bind def +/D11 {gsave translate 45 rotate 0 0 S11 stroke grestore} bind def +/D12 {gsave translate 45 rotate 0 0 S12 stroke grestore} bind def +/D13 {gsave translate 45 rotate 0 0 S13 stroke grestore} bind def +/D14 {gsave translate 45 rotate 0 0 S14 stroke grestore} bind def +/D15 {gsave translate 45 rotate 0 0 S15 stroke grestore} bind def +/DiaE {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke} def +/BoxE {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke} def +/TriUE {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke} def +/TriDE {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke} def +/PentE {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore} def +/CircE {stroke [] 0 setdash + hpt 0 360 arc stroke} def +/Opaque {gsave closepath 1 setgray fill grestore 0 setgray closepath} def +/DiaW {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V Opaque stroke} def +/BoxW {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V Opaque stroke} def +/TriUW {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V Opaque stroke} def +/TriDW {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V Opaque stroke} def +/PentW {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + Opaque stroke grestore} def +/CircW {stroke [] 0 setdash + hpt 0 360 arc Opaque stroke} def +/BoxFill {gsave Rec 1 setgray fill grestore} def +/Density { + /Fillden exch def + currentrgbcolor + /ColB exch def /ColG exch def /ColR exch def + /ColR ColR Fillden mul Fillden sub 1 add def + /ColG ColG Fillden mul Fillden sub 1 add def + /ColB ColB Fillden mul Fillden sub 1 add def + ColR ColG ColB setrgbcolor} def +/BoxColFill {gsave Rec PolyFill} def +/PolyFill {gsave Density fill grestore grestore} def +/h {rlineto rlineto rlineto gsave closepath fill grestore} bind def +% +% PostScript Level 1 Pattern Fill routine for rectangles +% Usage: x y w h s a XX PatternFill +% x,y = lower left corner of box to be filled +% w,h = width and height of box +% a = angle in degrees between lines and x-axis +% XX = 0/1 for no/yes cross-hatch +% +/PatternFill {gsave /PFa [ 9 2 roll ] def + PFa 0 get PFa 2 get 2 div add PFa 1 get PFa 3 get 2 div add translate + PFa 2 get -2 div PFa 3 get -2 div PFa 2 get PFa 3 get Rec + gsave 1 setgray fill grestore clip + currentlinewidth 0.5 mul setlinewidth + /PFs PFa 2 get dup mul PFa 3 get dup mul add sqrt def + 0 0 M PFa 5 get rotate PFs -2 div dup translate + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 M 0 PFs V} for + 0 PFa 6 get ne { + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 2 1 roll M PFs 0 V} for + } if + stroke grestore} def +% +/languagelevel where + {pop languagelevel} {1} ifelse + 2 lt + {/InterpretLevel1 true def} + {/InterpretLevel1 Level1 def} + ifelse +% +% PostScript level 2 pattern fill definitions +% +/Level2PatternFill { +/Tile8x8 {/PaintType 2 /PatternType 1 /TilingType 1 /BBox [0 0 8 8] /XStep 8 /YStep 8} + bind def +/KeepColor {currentrgbcolor [/Pattern /DeviceRGB] setcolorspace} bind def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke} +>> matrix makepattern +/Pat1 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke + 0 4 M 4 8 L 8 4 L 4 0 L 0 4 L stroke} +>> matrix makepattern +/Pat2 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 0 8 L + 8 8 L 8 0 L 0 0 L fill} +>> matrix makepattern +/Pat3 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 8 M 8 -4 L + 0 12 M 12 0 L stroke} +>> matrix makepattern +/Pat4 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 0 M 8 12 L + 0 -4 M 12 8 L stroke} +>> matrix makepattern +/Pat5 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 8 M 4 -4 L + 0 12 M 8 -4 L 4 12 M 10 0 L stroke} +>> matrix makepattern +/Pat6 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 0 M 4 12 L + 0 -4 M 8 12 L 4 -4 M 10 8 L stroke} +>> matrix makepattern +/Pat7 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 8 -2 M -4 4 L + 12 0 M -4 8 L 12 4 M 0 10 L stroke} +>> matrix makepattern +/Pat8 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 -2 M 12 4 L + -4 0 M 12 8 L -4 4 M 8 10 L stroke} +>> matrix makepattern +/Pat9 exch def +/Pattern1 {PatternBgnd KeepColor Pat1 setpattern} bind def +/Pattern2 {PatternBgnd KeepColor Pat2 setpattern} bind def +/Pattern3 {PatternBgnd KeepColor Pat3 setpattern} bind def +/Pattern4 {PatternBgnd KeepColor Landscape {Pat5} {Pat4} ifelse setpattern} bind def +/Pattern5 {PatternBgnd KeepColor Landscape {Pat4} {Pat5} ifelse setpattern} bind def +/Pattern6 {PatternBgnd KeepColor Landscape {Pat9} {Pat6} ifelse setpattern} bind def +/Pattern7 {PatternBgnd KeepColor Landscape {Pat8} {Pat7} ifelse setpattern} bind def +} def +% +% +%End of PostScript Level 2 code +% +/PatternBgnd { + TransparentPatterns {} {gsave 1 setgray fill grestore} ifelse +} def +% +% Substitute for Level 2 pattern fill codes with +% grayscale if Level 2 support is not selected. +% +/Level1PatternFill { +/Pattern1 {0.250 Density} bind def +/Pattern2 {0.500 Density} bind def +/Pattern3 {0.750 Density} bind def +/Pattern4 {0.125 Density} bind def +/Pattern5 {0.375 Density} bind def +/Pattern6 {0.625 Density} bind def +/Pattern7 {0.875 Density} bind def +} def +% +% Now test for support of Level 2 code +% +Level1 {Level1PatternFill} {Level2PatternFill} ifelse +% +/Symbol-Oblique /Symbol findfont [1 0 .167 1 0 0] makefont +dup length dict begin {1 index /FID eq {pop pop} {def} ifelse} forall +currentdict end definefont pop +/MFshow { + { dup 5 get 3 ge + { 5 get 3 eq {gsave} {grestore} ifelse } + {dup dup 0 get findfont exch 1 get scalefont setfont + [ currentpoint ] exch dup 2 get 0 exch R dup 5 get 2 ne {dup dup 6 + get exch 4 get {Gshow} {stringwidth pop 0 R} ifelse }if dup 5 get 0 eq + {dup 3 get {2 get neg 0 exch R pop} {pop aload pop M} ifelse} {dup 5 + get 1 eq {dup 2 get exch dup 3 get exch 6 get stringwidth pop -2 div + dup 0 R} {dup 6 get stringwidth pop -2 div 0 R 6 get + show 2 index {aload pop M neg 3 -1 roll neg R pop pop} {pop pop pop + pop aload pop M} ifelse }ifelse }ifelse } + ifelse } + forall} def +/Gswidth {dup type /stringtype eq {stringwidth} {pop (n) stringwidth} ifelse} def +/MFwidth {0 exch { dup 5 get 3 ge { 5 get 3 eq { 0 } { pop } ifelse } + {dup 3 get{dup dup 0 get findfont exch 1 get scalefont setfont + 6 get Gswidth pop add} {pop} ifelse} ifelse} forall} def +/MLshow { currentpoint stroke M + 0 exch R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MRshow { currentpoint stroke M + exch dup MFwidth neg 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MCshow { currentpoint stroke M + exch dup MFwidth -2 div 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/XYsave { [( ) 1 2 true false 3 ()] } bind def +/XYrestore { [( ) 1 2 true false 4 ()] } bind def +Level1 SuppressPDFMark or +{} { +/SDict 10 dict def +systemdict /pdfmark known not { + userdict /pdfmark systemdict /cleartomark get put +} if +SDict begin [ + /Title (MPI.eps) + /Subject (gnuplot plot) + /Creator (gnuplot 4.6 patchlevel 0) + /Author (lilia) +% /Producer (gnuplot) +% /Keywords () + /CreationDate (Fri Dec 25 21:35:56 2015) + /DOCINFO pdfmark +end +} ifelse +end +%%EndProlog +%%Page: 1 1 +gnudict begin +gsave +doclip +50 50 translate +0.100 0.100 scale +90 rotate +0 -5040 translate +0 setgray +newpath +(Helvetica) findfont 140 scalefont setfont +BackgroundColor 0 lt 3 1 roll 0 lt exch 0 lt or or not {gsave BackgroundColor C clippath fill grestore} if +1.000 UL +LTb +938 448 M +63 0 V +5946 0 R +-63 0 V +stroke +854 448 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10)] +] -46.7 MRshow +1.000 UL +LTb +938 781 M +31 0 V +5978 0 R +-31 0 V +938 976 M +31 0 V +5978 0 R +-31 0 V +938 1114 M +31 0 V +5978 0 R +-31 0 V +938 1221 M +31 0 V +5978 0 R +-31 0 V +938 1308 M +31 0 V +5978 0 R +-31 0 V +938 1382 M +31 0 V +5978 0 R +-31 0 V +938 1447 M +31 0 V +5978 0 R +-31 0 V +938 1503 M +31 0 V +5978 0 R +-31 0 V +938 1554 M +63 0 V +5946 0 R +-63 0 V +stroke +854 1554 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100)] +] -46.7 MRshow +1.000 UL +LTb +938 1887 M +31 0 V +5978 0 R +-31 0 V +938 2081 M +31 0 V +5978 0 R +-31 0 V +938 2219 M +31 0 V +5978 0 R +-31 0 V +938 2327 M +31 0 V +5978 0 R +-31 0 V +938 2414 M +31 0 V +5978 0 R +-31 0 V +938 2488 M +31 0 V +5978 0 R +-31 0 V +938 2552 M +31 0 V +5978 0 R +-31 0 V +938 2609 M +31 0 V +5978 0 R +-31 0 V +938 2660 M +63 0 V +5946 0 R +-63 0 V +stroke +854 2660 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1000)] +] -46.7 MRshow +1.000 UL +LTb +938 2992 M +31 0 V +5978 0 R +-31 0 V +938 3187 M +31 0 V +5978 0 R +-31 0 V +938 3325 M +31 0 V +5978 0 R +-31 0 V +938 3432 M +31 0 V +5978 0 R +-31 0 V +938 3520 M +31 0 V +5978 0 R +-31 0 V +938 3594 M +31 0 V +5978 0 R +-31 0 V +938 3658 M +31 0 V +5978 0 R +-31 0 V +938 3715 M +31 0 V +5978 0 R +-31 0 V +938 3765 M +63 0 V +5946 0 R +-63 0 V +stroke +854 3765 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MRshow +1.000 UL +LTb +938 4098 M +31 0 V +5978 0 R +-31 0 V +938 4293 M +31 0 V +5978 0 R +-31 0 V +938 4431 M +31 0 V +5978 0 R +-31 0 V +938 4538 M +31 0 V +5978 0 R +-31 0 V +938 4626 M +31 0 V +5978 0 R +-31 0 V +938 4700 M +31 0 V +5978 0 R +-31 0 V +938 4764 M +31 0 V +5978 0 R +-31 0 V +938 4820 M +31 0 V +5978 0 R +-31 0 V +938 4871 M +63 0 V +5946 0 R +-63 0 V +stroke +854 4871 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100000)] +] -46.7 MRshow +1.000 UL +LTb +938 448 M +0 63 V +0 4360 R +0 -63 V +stroke +938 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (1)] +] -46.7 MCshow +1.000 UL +LTb +2941 448 M +0 63 V +0 4360 R +0 -63 V +stroke +2941 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (2)] +] -46.7 MCshow +1.000 UL +LTb +4944 448 M +0 63 V +0 4360 R +0 -63 V +stroke +4944 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (3)] +] -46.7 MCshow +1.000 UL +LTb +6947 448 M +0 63 V +0 4360 R +0 -63 V +stroke +6947 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (4)] +] -46.7 MCshow +1.000 UL +LTb +1.000 UL +LTb +938 4871 N +938 448 L +6009 0 V +0 4423 V +-6009 0 V +Z stroke +LCb setrgbcolor +112 2659 M +currentpoint gsave translate -270 rotate 0 0 moveto +[ [(Helvetica) 140.0 0.0 true true 0 (Execution time in seconds)] +] -46.7 MCshow +grestore +LTb +LCb setrgbcolor +3942 98 M +[ [(Helvetica) 140.0 0.0 true true 0 (Number of GPUs)] +] -46.7 MCshow +LTb +1.000 UP +1.000 UL +LTb +% Begin plot #1 +1.000 UP +3.000 UL +LT0 +LCb setrgbcolor +6296 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (200K sparse)] +] -46.7 MRshow +LT0 +6380 4738 M +399 0 V +938 1336 M +2941 1125 L +2003 -17 V +6947 818 L +938 1336 BoxF +2941 1125 BoxF +4944 1108 BoxF +6947 818 BoxF +6579 4738 BoxF +% End plot #1 +% Begin plot #2 +1.000 UP +3.000 UL +LT1 +LCb setrgbcolor +6296 4598 M +[ [(Helvetica) 140.0 0.0 true true 0 (200K full)] +] -46.7 MRshow +LT1 +6380 4598 M +399 0 V +938 2013 M +2941 1685 L +4944 1538 L +6947 1430 L +938 2013 TriUF +2941 1685 TriUF +4944 1538 TriUF +6947 1430 TriUF +6579 4598 TriUF +% End plot #2 +% Begin plot #3 +1.000 UP +3.000 UL +LT2 +LCb setrgbcolor +6296 4458 M +[ [(Helvetica) 140.0 0.0 true true 0 (800K sparse)] +] -46.7 MRshow +LT2 +6380 4458 M +399 0 V +938 2902 M +2941 2519 L +4944 2368 L +6947 2052 L +938 2902 BoxF +2941 2519 BoxF +4944 2368 BoxF +6947 2052 BoxF +6579 4458 BoxF +% End plot #3 +% Begin plot #4 +1.000 UP +3.000 UL +LT3 +LCb setrgbcolor +6296 4318 M +[ [(Helvetica) 140.0 0.0 true true 0 (800K full)] +] -46.7 MRshow +LT3 +6380 4318 M +399 0 V +938 3346 M +2941 3008 L +4944 2816 L +6947 2690 L +938 3346 TriUF +2941 3008 TriUF +4944 2816 TriUF +6947 2690 TriUF +6579 4318 TriUF +% End plot #4 +% Begin plot #5 +1.000 UP +3.000 UL +LT4 +LCb setrgbcolor +6296 4178 M +[ [(Helvetica) 140.0 0.0 true true 0 (1.4M sparse)] +] -46.7 MRshow +LT4 +6380 4178 M +399 0 V +938 3223 M +2941 2990 L +2003 -74 V +2003 -69 V +938 3223 BoxF +2941 2990 BoxF +4944 2916 BoxF +6947 2847 BoxF +6579 4178 BoxF +% End plot #5 +% Begin plot #6 +1.000 UP +3.000 UL +LT5 +LC7 setrgbcolor +LCb setrgbcolor +6296 4038 M +[ [(Helvetica) 140.0 0.0 true true 0 (1.4M full)] +] -46.7 MRshow +LT5 +LC7 setrgbcolor +6380 4038 M +399 0 V +938 3917 M +2941 3542 L +4944 3370 L +6947 3230 L +938 3917 TriUF +2941 3542 TriUF +4944 3370 TriUF +6947 3230 TriUF +6579 4038 TriUF +% End plot #6 +1.000 UL +LTb +938 4871 N +938 448 L +6009 0 V +0 4423 V +-6009 0 V +Z stroke +1.000 UP +1.000 UL +LTb +stroke +grestore +end +showpage +%%Trailer +%%DocumentFonts: Helvetica +%%Pages: 1 diff --git a/Simulations/OMP.eps b/Simulations/OMP.eps new file mode 100644 index 0000000..554272c --- /dev/null +++ b/Simulations/OMP.eps @@ -0,0 +1,871 @@ +%!PS-Adobe-2.0 +%%Title: OMP.eps +%%Creator: gnuplot 4.6 patchlevel 0 +%%CreationDate: Fri Dec 25 21:39:39 2015 +%%DocumentFonts: (atend) +%%BoundingBox: 50 50 554 770 +%%Orientation: Landscape +%%Pages: (atend) +%%EndComments +%%BeginProlog +/gnudict 256 dict def +gnudict begin +% +% The following true/false flags may be edited by hand if desired. +% The unit line width and grayscale image gamma correction may also be changed. +% +/Color true def +/Blacktext false def +/Solid false def +/Dashlength 1 def +/Landscape true def +/Level1 false def +/Rounded false def +/ClipToBoundingBox false def +/SuppressPDFMark false def +/TransparentPatterns false def +/gnulinewidth 5.000 def +/userlinewidth gnulinewidth def +/Gamma 1.0 def +/BackgroundColor {-1.000 -1.000 -1.000} def +% +/vshift -46 def +/dl1 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul sub dup 0 le { pop 0.01 } if } if +} def +/dl2 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul add } if +} def +/hpt_ 31.5 def +/vpt_ 31.5 def +/hpt hpt_ def +/vpt vpt_ def +/doclip { + ClipToBoundingBox { + newpath 50 50 moveto 554 50 lineto 554 770 lineto 50 770 lineto closepath + clip + } if +} def +% +% Gnuplot Prolog Version 4.4 (August 2010) +% +%/SuppressPDFMark true def +% +/M {moveto} bind def +/L {lineto} bind def +/R {rmoveto} bind def +/V {rlineto} bind def +/N {newpath moveto} bind def +/Z {closepath} bind def +/C {setrgbcolor} bind def +/f {rlineto fill} bind def +/g {setgray} bind def +/Gshow {show} def % May be redefined later in the file to support UTF-8 +/vpt2 vpt 2 mul def +/hpt2 hpt 2 mul def +/Lshow {currentpoint stroke M 0 vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Rshow {currentpoint stroke M dup stringwidth pop neg vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Cshow {currentpoint stroke M dup stringwidth pop -2 div vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/UP {dup vpt_ mul /vpt exch def hpt_ mul /hpt exch def + /hpt2 hpt 2 mul def /vpt2 vpt 2 mul def} def +/DL {Color {setrgbcolor Solid {pop []} if 0 setdash} + {pop pop pop 0 setgray Solid {pop []} if 0 setdash} ifelse} def +/BL {stroke userlinewidth 2 mul setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/AL {stroke userlinewidth 2 div setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/UL {dup gnulinewidth mul /userlinewidth exch def + dup 1 lt {pop 1} if 10 mul /udl exch def} def +/PL {stroke userlinewidth setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +3.8 setmiterlimit +% Default Line colors +/LCw {1 1 1} def +/LCb {0 0 0} def +/LCa {0 0 0} def +/LC0 {1 0 0} def +/LC1 {0 1 0} def +/LC2 {0 0 1} def +/LC3 {1 0 1} def +/LC4 {0 1 1} def +/LC5 {1 1 0} def +/LC6 {0 0 0} def +/LC7 {1 0.3 0} def +/LC8 {0.5 0.5 0.5} def +% Default Line Types +/LTw {PL [] 1 setgray} def +/LTb {BL [] LCb DL} def +/LTa {AL [1 udl mul 2 udl mul] 0 setdash LCa setrgbcolor} def +/LT0 {PL [] LC0 DL} def +/LT1 {PL [4 dl1 2 dl2] LC1 DL} def +/LT2 {PL [2 dl1 3 dl2] LC2 DL} def +/LT3 {PL [1 dl1 1.5 dl2] LC3 DL} def +/LT4 {PL [6 dl1 2 dl2 1 dl1 2 dl2] LC4 DL} def +/LT5 {PL [3 dl1 3 dl2 1 dl1 3 dl2] LC5 DL} def +/LT6 {PL [2 dl1 2 dl2 2 dl1 6 dl2] LC6 DL} def +/LT7 {PL [1 dl1 2 dl2 6 dl1 2 dl2 1 dl1 2 dl2] LC7 DL} def +/LT8 {PL [2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 4 dl2] LC8 DL} def +/Pnt {stroke [] 0 setdash gsave 1 setlinecap M 0 0 V stroke grestore} def +/Dia {stroke [] 0 setdash 2 copy vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke + Pnt} def +/Pls {stroke [] 0 setdash vpt sub M 0 vpt2 V + currentpoint stroke M + hpt neg vpt neg R hpt2 0 V stroke + } def +/Box {stroke [] 0 setdash 2 copy exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke + Pnt} def +/Crs {stroke [] 0 setdash exch hpt sub exch vpt add M + hpt2 vpt2 neg V currentpoint stroke M + hpt2 neg 0 R hpt2 vpt2 V stroke} def +/TriU {stroke [] 0 setdash 2 copy vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke + Pnt} def +/Star {2 copy Pls Crs} def +/BoxF {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath fill} def +/TriUF {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath fill} def +/TriD {stroke [] 0 setdash 2 copy vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke + Pnt} def +/TriDF {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath fill} def +/DiaF {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath fill} def +/Pent {stroke [] 0 setdash 2 copy gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore Pnt} def +/PentF {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath fill grestore} def +/Circle {stroke [] 0 setdash 2 copy + hpt 0 360 arc stroke Pnt} def +/CircleF {stroke [] 0 setdash hpt 0 360 arc fill} def +/C0 {BL [] 0 setdash 2 copy moveto vpt 90 450 arc} bind def +/C1 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + vpt 0 360 arc closepath} bind def +/C2 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C3 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C4 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C5 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc + 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc} bind def +/C6 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C7 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C8 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C9 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 450 arc closepath fill + vpt 0 360 arc closepath} bind def +/C10 {BL [] 0 setdash 2 copy 2 copy moveto vpt 270 360 arc closepath fill + 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C11 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C12 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C13 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C14 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 360 arc closepath fill + vpt 0 360 arc} bind def +/C15 {BL [] 0 setdash 2 copy vpt 0 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/Rec {newpath 4 2 roll moveto 1 index 0 rlineto 0 exch rlineto + neg 0 rlineto closepath} bind def +/Square {dup Rec} bind def +/Bsquare {vpt sub exch vpt sub exch vpt2 Square} bind def +/S0 {BL [] 0 setdash 2 copy moveto 0 vpt rlineto BL Bsquare} bind def +/S1 {BL [] 0 setdash 2 copy vpt Square fill Bsquare} bind def +/S2 {BL [] 0 setdash 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S3 {BL [] 0 setdash 2 copy exch vpt sub exch vpt2 vpt Rec fill Bsquare} bind def +/S4 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S5 {BL [] 0 setdash 2 copy 2 copy vpt Square fill + exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S6 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S7 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S8 {BL [] 0 setdash 2 copy vpt sub vpt Square fill Bsquare} bind def +/S9 {BL [] 0 setdash 2 copy vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S10 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt Square fill + Bsquare} bind def +/S11 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt2 vpt Rec fill + Bsquare} bind def +/S12 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill Bsquare} bind def +/S13 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S14 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S15 {BL [] 0 setdash 2 copy Bsquare fill Bsquare} bind def +/D0 {gsave translate 45 rotate 0 0 S0 stroke grestore} bind def +/D1 {gsave translate 45 rotate 0 0 S1 stroke grestore} bind def +/D2 {gsave translate 45 rotate 0 0 S2 stroke grestore} bind def +/D3 {gsave translate 45 rotate 0 0 S3 stroke grestore} bind def +/D4 {gsave translate 45 rotate 0 0 S4 stroke grestore} bind def +/D5 {gsave translate 45 rotate 0 0 S5 stroke grestore} bind def +/D6 {gsave translate 45 rotate 0 0 S6 stroke grestore} bind def +/D7 {gsave translate 45 rotate 0 0 S7 stroke grestore} bind def +/D8 {gsave translate 45 rotate 0 0 S8 stroke grestore} bind def +/D9 {gsave translate 45 rotate 0 0 S9 stroke grestore} bind def +/D10 {gsave translate 45 rotate 0 0 S10 stroke grestore} bind def +/D11 {gsave translate 45 rotate 0 0 S11 stroke grestore} bind def +/D12 {gsave translate 45 rotate 0 0 S12 stroke grestore} bind def +/D13 {gsave translate 45 rotate 0 0 S13 stroke grestore} bind def +/D14 {gsave translate 45 rotate 0 0 S14 stroke grestore} bind def +/D15 {gsave translate 45 rotate 0 0 S15 stroke grestore} bind def +/DiaE {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke} def +/BoxE {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke} def +/TriUE {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke} def +/TriDE {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke} def +/PentE {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore} def +/CircE {stroke [] 0 setdash + hpt 0 360 arc stroke} def +/Opaque {gsave closepath 1 setgray fill grestore 0 setgray closepath} def +/DiaW {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V Opaque stroke} def +/BoxW {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V Opaque stroke} def +/TriUW {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V Opaque stroke} def +/TriDW {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V Opaque stroke} def +/PentW {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + Opaque stroke grestore} def +/CircW {stroke [] 0 setdash + hpt 0 360 arc Opaque stroke} def +/BoxFill {gsave Rec 1 setgray fill grestore} def +/Density { + /Fillden exch def + currentrgbcolor + /ColB exch def /ColG exch def /ColR exch def + /ColR ColR Fillden mul Fillden sub 1 add def + /ColG ColG Fillden mul Fillden sub 1 add def + /ColB ColB Fillden mul Fillden sub 1 add def + ColR ColG ColB setrgbcolor} def +/BoxColFill {gsave Rec PolyFill} def +/PolyFill {gsave Density fill grestore grestore} def +/h {rlineto rlineto rlineto gsave closepath fill grestore} bind def +% +% PostScript Level 1 Pattern Fill routine for rectangles +% Usage: x y w h s a XX PatternFill +% x,y = lower left corner of box to be filled +% w,h = width and height of box +% a = angle in degrees between lines and x-axis +% XX = 0/1 for no/yes cross-hatch +% +/PatternFill {gsave /PFa [ 9 2 roll ] def + PFa 0 get PFa 2 get 2 div add PFa 1 get PFa 3 get 2 div add translate + PFa 2 get -2 div PFa 3 get -2 div PFa 2 get PFa 3 get Rec + gsave 1 setgray fill grestore clip + currentlinewidth 0.5 mul setlinewidth + /PFs PFa 2 get dup mul PFa 3 get dup mul add sqrt def + 0 0 M PFa 5 get rotate PFs -2 div dup translate + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 M 0 PFs V} for + 0 PFa 6 get ne { + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 2 1 roll M PFs 0 V} for + } if + stroke grestore} def +% +/languagelevel where + {pop languagelevel} {1} ifelse + 2 lt + {/InterpretLevel1 true def} + {/InterpretLevel1 Level1 def} + ifelse +% +% PostScript level 2 pattern fill definitions +% +/Level2PatternFill { +/Tile8x8 {/PaintType 2 /PatternType 1 /TilingType 1 /BBox [0 0 8 8] /XStep 8 /YStep 8} + bind def +/KeepColor {currentrgbcolor [/Pattern /DeviceRGB] setcolorspace} bind def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke} +>> matrix makepattern +/Pat1 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke + 0 4 M 4 8 L 8 4 L 4 0 L 0 4 L stroke} +>> matrix makepattern +/Pat2 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 0 8 L + 8 8 L 8 0 L 0 0 L fill} +>> matrix makepattern +/Pat3 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 8 M 8 -4 L + 0 12 M 12 0 L stroke} +>> matrix makepattern +/Pat4 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 0 M 8 12 L + 0 -4 M 12 8 L stroke} +>> matrix makepattern +/Pat5 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 8 M 4 -4 L + 0 12 M 8 -4 L 4 12 M 10 0 L stroke} +>> matrix makepattern +/Pat6 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 0 M 4 12 L + 0 -4 M 8 12 L 4 -4 M 10 8 L stroke} +>> matrix makepattern +/Pat7 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 8 -2 M -4 4 L + 12 0 M -4 8 L 12 4 M 0 10 L stroke} +>> matrix makepattern +/Pat8 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 -2 M 12 4 L + -4 0 M 12 8 L -4 4 M 8 10 L stroke} +>> matrix makepattern +/Pat9 exch def +/Pattern1 {PatternBgnd KeepColor Pat1 setpattern} bind def +/Pattern2 {PatternBgnd KeepColor Pat2 setpattern} bind def +/Pattern3 {PatternBgnd KeepColor Pat3 setpattern} bind def +/Pattern4 {PatternBgnd KeepColor Landscape {Pat5} {Pat4} ifelse setpattern} bind def +/Pattern5 {PatternBgnd KeepColor Landscape {Pat4} {Pat5} ifelse setpattern} bind def +/Pattern6 {PatternBgnd KeepColor Landscape {Pat9} {Pat6} ifelse setpattern} bind def +/Pattern7 {PatternBgnd KeepColor Landscape {Pat8} {Pat7} ifelse setpattern} bind def +} def +% +% +%End of PostScript Level 2 code +% +/PatternBgnd { + TransparentPatterns {} {gsave 1 setgray fill grestore} ifelse +} def +% +% Substitute for Level 2 pattern fill codes with +% grayscale if Level 2 support is not selected. +% +/Level1PatternFill { +/Pattern1 {0.250 Density} bind def +/Pattern2 {0.500 Density} bind def +/Pattern3 {0.750 Density} bind def +/Pattern4 {0.125 Density} bind def +/Pattern5 {0.375 Density} bind def +/Pattern6 {0.625 Density} bind def +/Pattern7 {0.875 Density} bind def +} def +% +% Now test for support of Level 2 code +% +Level1 {Level1PatternFill} {Level2PatternFill} ifelse +% +/Symbol-Oblique /Symbol findfont [1 0 .167 1 0 0] makefont +dup length dict begin {1 index /FID eq {pop pop} {def} ifelse} forall +currentdict end definefont pop +/MFshow { + { dup 5 get 3 ge + { 5 get 3 eq {gsave} {grestore} ifelse } + {dup dup 0 get findfont exch 1 get scalefont setfont + [ currentpoint ] exch dup 2 get 0 exch R dup 5 get 2 ne {dup dup 6 + get exch 4 get {Gshow} {stringwidth pop 0 R} ifelse }if dup 5 get 0 eq + {dup 3 get {2 get neg 0 exch R pop} {pop aload pop M} ifelse} {dup 5 + get 1 eq {dup 2 get exch dup 3 get exch 6 get stringwidth pop -2 div + dup 0 R} {dup 6 get stringwidth pop -2 div 0 R 6 get + show 2 index {aload pop M neg 3 -1 roll neg R pop pop} {pop pop pop + pop aload pop M} ifelse }ifelse }ifelse } + ifelse } + forall} def +/Gswidth {dup type /stringtype eq {stringwidth} {pop (n) stringwidth} ifelse} def +/MFwidth {0 exch { dup 5 get 3 ge { 5 get 3 eq { 0 } { pop } ifelse } + {dup 3 get{dup dup 0 get findfont exch 1 get scalefont setfont + 6 get Gswidth pop add} {pop} ifelse} ifelse} forall} def +/MLshow { currentpoint stroke M + 0 exch R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MRshow { currentpoint stroke M + exch dup MFwidth neg 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MCshow { currentpoint stroke M + exch dup MFwidth -2 div 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/XYsave { [( ) 1 2 true false 3 ()] } bind def +/XYrestore { [( ) 1 2 true false 4 ()] } bind def +Level1 SuppressPDFMark or +{} { +/SDict 10 dict def +systemdict /pdfmark known not { + userdict /pdfmark systemdict /cleartomark get put +} if +SDict begin [ + /Title (OMP.eps) + /Subject (gnuplot plot) + /Creator (gnuplot 4.6 patchlevel 0) + /Author (lilia) +% /Producer (gnuplot) +% /Keywords () + /CreationDate (Fri Dec 25 21:39:39 2015) + /DOCINFO pdfmark +end +} ifelse +end +%%EndProlog +%%Page: 1 1 +gnudict begin +gsave +doclip +50 50 translate +0.100 0.100 scale +90 rotate +0 -5040 translate +0 setgray +newpath +(Helvetica) findfont 140 scalefont setfont +BackgroundColor 0 lt 3 1 roll 0 lt exch 0 lt or or not {gsave BackgroundColor C clippath fill grestore} if +1.000 UL +LTb +938 448 M +63 0 V +5946 0 R +-63 0 V +stroke +854 448 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10)] +] -46.7 MRshow +1.000 UL +LTb +938 781 M +31 0 V +5978 0 R +-31 0 V +938 976 M +31 0 V +5978 0 R +-31 0 V +938 1114 M +31 0 V +5978 0 R +-31 0 V +938 1221 M +31 0 V +5978 0 R +-31 0 V +938 1308 M +31 0 V +5978 0 R +-31 0 V +938 1382 M +31 0 V +5978 0 R +-31 0 V +938 1447 M +31 0 V +5978 0 R +-31 0 V +938 1503 M +31 0 V +5978 0 R +-31 0 V +938 1554 M +63 0 V +5946 0 R +-63 0 V +stroke +854 1554 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100)] +] -46.7 MRshow +1.000 UL +LTb +938 1887 M +31 0 V +5978 0 R +-31 0 V +938 2081 M +31 0 V +5978 0 R +-31 0 V +938 2219 M +31 0 V +5978 0 R +-31 0 V +938 2327 M +31 0 V +5978 0 R +-31 0 V +938 2414 M +31 0 V +5978 0 R +-31 0 V +938 2488 M +31 0 V +5978 0 R +-31 0 V +938 2552 M +31 0 V +5978 0 R +-31 0 V +938 2609 M +31 0 V +5978 0 R +-31 0 V +938 2660 M +63 0 V +5946 0 R +-63 0 V +stroke +854 2660 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1000)] +] -46.7 MRshow +1.000 UL +LTb +938 2992 M +31 0 V +5978 0 R +-31 0 V +938 3187 M +31 0 V +5978 0 R +-31 0 V +938 3325 M +31 0 V +5978 0 R +-31 0 V +938 3432 M +31 0 V +5978 0 R +-31 0 V +938 3520 M +31 0 V +5978 0 R +-31 0 V +938 3594 M +31 0 V +5978 0 R +-31 0 V +938 3658 M +31 0 V +5978 0 R +-31 0 V +938 3715 M +31 0 V +5978 0 R +-31 0 V +938 3765 M +63 0 V +5946 0 R +-63 0 V +stroke +854 3765 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MRshow +1.000 UL +LTb +938 4098 M +31 0 V +5978 0 R +-31 0 V +938 4293 M +31 0 V +5978 0 R +-31 0 V +938 4431 M +31 0 V +5978 0 R +-31 0 V +938 4538 M +31 0 V +5978 0 R +-31 0 V +938 4626 M +31 0 V +5978 0 R +-31 0 V +938 4700 M +31 0 V +5978 0 R +-31 0 V +938 4764 M +31 0 V +5978 0 R +-31 0 V +938 4820 M +31 0 V +5978 0 R +-31 0 V +938 4871 M +63 0 V +5946 0 R +-63 0 V +stroke +854 4871 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100000)] +] -46.7 MRshow +1.000 UL +LTb +938 448 M +0 63 V +0 4360 R +0 -63 V +stroke +938 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (1)] +] -46.7 MCshow +1.000 UL +LTb +2941 448 M +0 63 V +0 4360 R +0 -63 V +stroke +2941 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (2)] +] -46.7 MCshow +1.000 UL +LTb +4944 448 M +0 63 V +0 4360 R +0 -63 V +stroke +4944 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (3)] +] -46.7 MCshow +1.000 UL +LTb +6947 448 M +0 63 V +0 4360 R +0 -63 V +stroke +6947 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (4)] +] -46.7 MCshow +1.000 UL +LTb +1.000 UL +LTb +938 4871 N +938 448 L +6009 0 V +0 4423 V +-6009 0 V +Z stroke +LCb setrgbcolor +112 2659 M +currentpoint gsave translate -270 rotate 0 0 moveto +[ [(Helvetica) 140.0 0.0 true true 0 (Execution time in seconds)] +] -46.7 MCshow +grestore +LTb +LCb setrgbcolor +3942 98 M +[ [(Helvetica) 140.0 0.0 true true 0 (Number of GPUs)] +] -46.7 MCshow +LTb +1.000 UP +1.000 UL +LTb +% Begin plot #1 +1.000 UP +3.000 UL +LT0 +LCb setrgbcolor +6296 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (200K sparse)] +] -46.7 MRshow +LT0 +6380 4738 M +399 0 V +938 1383 M +2941 1058 L +2003 29 V +6947 847 L +938 1383 BoxF +2941 1058 BoxF +4944 1087 BoxF +6947 847 BoxF +6579 4738 BoxF +% End plot #1 +% Begin plot #2 +1.000 UP +3.000 UL +LT1 +LCb setrgbcolor +6296 4598 M +[ [(Helvetica) 140.0 0.0 true true 0 (200K full)] +] -46.7 MRshow +LT1 +6380 4598 M +399 0 V +938 2014 M +2941 1703 L +4944 1544 L +6947 1437 L +938 2014 TriUF +2941 1703 TriUF +4944 1544 TriUF +6947 1437 TriUF +6579 4598 TriUF +% End plot #2 +% Begin plot #3 +1.000 UP +3.000 UL +LT2 +LCb setrgbcolor +6296 4458 M +[ [(Helvetica) 140.0 0.0 true true 0 (800K sparse)] +] -46.7 MRshow +LT2 +6380 4458 M +399 0 V +938 2739 M +2941 2395 L +4944 2157 L +6947 2010 L +938 2739 BoxF +2941 2395 BoxF +4944 2157 BoxF +6947 2010 BoxF +6579 4458 BoxF +% End plot #3 +% Begin plot #4 +1.000 UP +3.000 UL +LT3 +LCb setrgbcolor +6296 4318 M +[ [(Helvetica) 140.0 0.0 true true 0 (800K full)] +] -46.7 MRshow +LT3 +6380 4318 M +399 0 V +938 3315 M +2941 3006 L +4944 2820 L +6947 2685 L +938 3315 TriUF +2941 3006 TriUF +4944 2820 TriUF +6947 2685 TriUF +6579 4318 TriUF +% End plot #4 +% Begin plot #5 +1.000 UP +3.000 UL +LT4 +LCb setrgbcolor +6296 4178 M +[ [(Helvetica) 140.0 0.0 true true 0 (1.4M sparse)] +] -46.7 MRshow +LT4 +6380 4178 M +399 0 V +938 3264 M +2941 3074 L +4944 2938 L +2003 -22 V +938 3264 BoxF +2941 3074 BoxF +4944 2938 BoxF +6947 2916 BoxF +6579 4178 BoxF +% End plot #5 +% Begin plot #6 +1.000 UP +3.000 UL +LT5 +LC7 setrgbcolor +LCb setrgbcolor +6296 4038 M +[ [(Helvetica) 140.0 0.0 true true 0 (1.4M full)] +] -46.7 MRshow +LT5 +LC7 setrgbcolor +6380 4038 M +399 0 V +938 3929 M +2941 3577 L +4944 3377 L +6947 3237 L +938 3929 TriUF +2941 3577 TriUF +4944 3377 TriUF +6947 3237 TriUF +6579 4038 TriUF +% End plot #6 +1.000 UL +LTb +938 4871 N +938 448 L +6009 0 V +0 4423 V +-6009 0 V +Z stroke +1.000 UP +1.000 UL +LTb +stroke +grestore +end +showpage +%%Trailer +%%DocumentFonts: Helvetica +%%Pages: 1 diff --git a/Simulations/Sparse.eps b/Simulations/Sparse.eps new file mode 100644 index 0000000..e340085 --- /dev/null +++ b/Simulations/Sparse.eps @@ -0,0 +1,829 @@ +%!PS-Adobe-2.0 +%%Title: Sparse.eps +%%Creator: gnuplot 4.6 patchlevel 0 +%%CreationDate: Fri Dec 25 21:06:52 2015 +%%DocumentFonts: (atend) +%%BoundingBox: 50 50 554 770 +%%Orientation: Landscape +%%Pages: (atend) +%%EndComments +%%BeginProlog +/gnudict 256 dict def +gnudict begin +% +% The following true/false flags may be edited by hand if desired. +% The unit line width and grayscale image gamma correction may also be changed. +% +/Color true def +/Blacktext false def +/Solid false def +/Dashlength 1 def +/Landscape true def +/Level1 false def +/Rounded false def +/ClipToBoundingBox false def +/SuppressPDFMark false def +/TransparentPatterns false def +/gnulinewidth 5.000 def +/userlinewidth gnulinewidth def +/Gamma 1.0 def +/BackgroundColor {-1.000 -1.000 -1.000} def +% +/vshift -46 def +/dl1 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul sub dup 0 le { pop 0.01 } if } if +} def +/dl2 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul add } if +} def +/hpt_ 31.5 def +/vpt_ 31.5 def +/hpt hpt_ def +/vpt vpt_ def +/doclip { + ClipToBoundingBox { + newpath 50 50 moveto 554 50 lineto 554 770 lineto 50 770 lineto closepath + clip + } if +} def +% +% Gnuplot Prolog Version 4.4 (August 2010) +% +%/SuppressPDFMark true def +% +/M {moveto} bind def +/L {lineto} bind def +/R {rmoveto} bind def +/V {rlineto} bind def +/N {newpath moveto} bind def +/Z {closepath} bind def +/C {setrgbcolor} bind def +/f {rlineto fill} bind def +/g {setgray} bind def +/Gshow {show} def % May be redefined later in the file to support UTF-8 +/vpt2 vpt 2 mul def +/hpt2 hpt 2 mul def +/Lshow {currentpoint stroke M 0 vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Rshow {currentpoint stroke M dup stringwidth pop neg vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Cshow {currentpoint stroke M dup stringwidth pop -2 div vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/UP {dup vpt_ mul /vpt exch def hpt_ mul /hpt exch def + /hpt2 hpt 2 mul def /vpt2 vpt 2 mul def} def +/DL {Color {setrgbcolor Solid {pop []} if 0 setdash} + {pop pop pop 0 setgray Solid {pop []} if 0 setdash} ifelse} def +/BL {stroke userlinewidth 2 mul setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/AL {stroke userlinewidth 2 div setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/UL {dup gnulinewidth mul /userlinewidth exch def + dup 1 lt {pop 1} if 10 mul /udl exch def} def +/PL {stroke userlinewidth setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +3.8 setmiterlimit +% Default Line colors +/LCw {1 1 1} def +/LCb {0 0 0} def +/LCa {0 0 0} def +/LC0 {1 0 0} def +/LC1 {0 1 0} def +/LC2 {0 0 1} def +/LC3 {1 0 1} def +/LC4 {0 1 1} def +/LC5 {1 1 0} def +/LC6 {0 0 0} def +/LC7 {1 0.3 0} def +/LC8 {0.5 0.5 0.5} def +% Default Line Types +/LTw {PL [] 1 setgray} def +/LTb {BL [] LCb DL} def +/LTa {AL [1 udl mul 2 udl mul] 0 setdash LCa setrgbcolor} def +/LT0 {PL [] LC0 DL} def +/LT1 {PL [4 dl1 2 dl2] LC1 DL} def +/LT2 {PL [2 dl1 3 dl2] LC2 DL} def +/LT3 {PL [1 dl1 1.5 dl2] LC3 DL} def +/LT4 {PL [6 dl1 2 dl2 1 dl1 2 dl2] LC4 DL} def +/LT5 {PL [3 dl1 3 dl2 1 dl1 3 dl2] LC5 DL} def +/LT6 {PL [2 dl1 2 dl2 2 dl1 6 dl2] LC6 DL} def +/LT7 {PL [1 dl1 2 dl2 6 dl1 2 dl2 1 dl1 2 dl2] LC7 DL} def +/LT8 {PL [2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 4 dl2] LC8 DL} def +/Pnt {stroke [] 0 setdash gsave 1 setlinecap M 0 0 V stroke grestore} def +/Dia {stroke [] 0 setdash 2 copy vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke + Pnt} def +/Pls {stroke [] 0 setdash vpt sub M 0 vpt2 V + currentpoint stroke M + hpt neg vpt neg R hpt2 0 V stroke + } def +/Box {stroke [] 0 setdash 2 copy exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke + Pnt} def +/Crs {stroke [] 0 setdash exch hpt sub exch vpt add M + hpt2 vpt2 neg V currentpoint stroke M + hpt2 neg 0 R hpt2 vpt2 V stroke} def +/TriU {stroke [] 0 setdash 2 copy vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke + Pnt} def +/Star {2 copy Pls Crs} def +/BoxF {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath fill} def +/TriUF {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath fill} def +/TriD {stroke [] 0 setdash 2 copy vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke + Pnt} def +/TriDF {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath fill} def +/DiaF {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath fill} def +/Pent {stroke [] 0 setdash 2 copy gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore Pnt} def +/PentF {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath fill grestore} def +/Circle {stroke [] 0 setdash 2 copy + hpt 0 360 arc stroke Pnt} def +/CircleF {stroke [] 0 setdash hpt 0 360 arc fill} def +/C0 {BL [] 0 setdash 2 copy moveto vpt 90 450 arc} bind def +/C1 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + vpt 0 360 arc closepath} bind def +/C2 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C3 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C4 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C5 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc + 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc} bind def +/C6 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C7 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C8 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C9 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 450 arc closepath fill + vpt 0 360 arc closepath} bind def +/C10 {BL [] 0 setdash 2 copy 2 copy moveto vpt 270 360 arc closepath fill + 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C11 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C12 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C13 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C14 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 360 arc closepath fill + vpt 0 360 arc} bind def +/C15 {BL [] 0 setdash 2 copy vpt 0 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/Rec {newpath 4 2 roll moveto 1 index 0 rlineto 0 exch rlineto + neg 0 rlineto closepath} bind def +/Square {dup Rec} bind def +/Bsquare {vpt sub exch vpt sub exch vpt2 Square} bind def +/S0 {BL [] 0 setdash 2 copy moveto 0 vpt rlineto BL Bsquare} bind def +/S1 {BL [] 0 setdash 2 copy vpt Square fill Bsquare} bind def +/S2 {BL [] 0 setdash 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S3 {BL [] 0 setdash 2 copy exch vpt sub exch vpt2 vpt Rec fill Bsquare} bind def +/S4 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S5 {BL [] 0 setdash 2 copy 2 copy vpt Square fill + exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S6 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S7 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S8 {BL [] 0 setdash 2 copy vpt sub vpt Square fill Bsquare} bind def +/S9 {BL [] 0 setdash 2 copy vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S10 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt Square fill + Bsquare} bind def +/S11 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt2 vpt Rec fill + Bsquare} bind def +/S12 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill Bsquare} bind def +/S13 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S14 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S15 {BL [] 0 setdash 2 copy Bsquare fill Bsquare} bind def +/D0 {gsave translate 45 rotate 0 0 S0 stroke grestore} bind def +/D1 {gsave translate 45 rotate 0 0 S1 stroke grestore} bind def +/D2 {gsave translate 45 rotate 0 0 S2 stroke grestore} bind def +/D3 {gsave translate 45 rotate 0 0 S3 stroke grestore} bind def +/D4 {gsave translate 45 rotate 0 0 S4 stroke grestore} bind def +/D5 {gsave translate 45 rotate 0 0 S5 stroke grestore} bind def +/D6 {gsave translate 45 rotate 0 0 S6 stroke grestore} bind def +/D7 {gsave translate 45 rotate 0 0 S7 stroke grestore} bind def +/D8 {gsave translate 45 rotate 0 0 S8 stroke grestore} bind def +/D9 {gsave translate 45 rotate 0 0 S9 stroke grestore} bind def +/D10 {gsave translate 45 rotate 0 0 S10 stroke grestore} bind def +/D11 {gsave translate 45 rotate 0 0 S11 stroke grestore} bind def +/D12 {gsave translate 45 rotate 0 0 S12 stroke grestore} bind def +/D13 {gsave translate 45 rotate 0 0 S13 stroke grestore} bind def +/D14 {gsave translate 45 rotate 0 0 S14 stroke grestore} bind def +/D15 {gsave translate 45 rotate 0 0 S15 stroke grestore} bind def +/DiaE {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke} def +/BoxE {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke} def +/TriUE {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke} def +/TriDE {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke} def +/PentE {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore} def +/CircE {stroke [] 0 setdash + hpt 0 360 arc stroke} def +/Opaque {gsave closepath 1 setgray fill grestore 0 setgray closepath} def +/DiaW {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V Opaque stroke} def +/BoxW {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V Opaque stroke} def +/TriUW {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V Opaque stroke} def +/TriDW {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V Opaque stroke} def +/PentW {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + Opaque stroke grestore} def +/CircW {stroke [] 0 setdash + hpt 0 360 arc Opaque stroke} def +/BoxFill {gsave Rec 1 setgray fill grestore} def +/Density { + /Fillden exch def + currentrgbcolor + /ColB exch def /ColG exch def /ColR exch def + /ColR ColR Fillden mul Fillden sub 1 add def + /ColG ColG Fillden mul Fillden sub 1 add def + /ColB ColB Fillden mul Fillden sub 1 add def + ColR ColG ColB setrgbcolor} def +/BoxColFill {gsave Rec PolyFill} def +/PolyFill {gsave Density fill grestore grestore} def +/h {rlineto rlineto rlineto gsave closepath fill grestore} bind def +% +% PostScript Level 1 Pattern Fill routine for rectangles +% Usage: x y w h s a XX PatternFill +% x,y = lower left corner of box to be filled +% w,h = width and height of box +% a = angle in degrees between lines and x-axis +% XX = 0/1 for no/yes cross-hatch +% +/PatternFill {gsave /PFa [ 9 2 roll ] def + PFa 0 get PFa 2 get 2 div add PFa 1 get PFa 3 get 2 div add translate + PFa 2 get -2 div PFa 3 get -2 div PFa 2 get PFa 3 get Rec + gsave 1 setgray fill grestore clip + currentlinewidth 0.5 mul setlinewidth + /PFs PFa 2 get dup mul PFa 3 get dup mul add sqrt def + 0 0 M PFa 5 get rotate PFs -2 div dup translate + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 M 0 PFs V} for + 0 PFa 6 get ne { + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 2 1 roll M PFs 0 V} for + } if + stroke grestore} def +% +/languagelevel where + {pop languagelevel} {1} ifelse + 2 lt + {/InterpretLevel1 true def} + {/InterpretLevel1 Level1 def} + ifelse +% +% PostScript level 2 pattern fill definitions +% +/Level2PatternFill { +/Tile8x8 {/PaintType 2 /PatternType 1 /TilingType 1 /BBox [0 0 8 8] /XStep 8 /YStep 8} + bind def +/KeepColor {currentrgbcolor [/Pattern /DeviceRGB] setcolorspace} bind def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke} +>> matrix makepattern +/Pat1 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke + 0 4 M 4 8 L 8 4 L 4 0 L 0 4 L stroke} +>> matrix makepattern +/Pat2 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 0 8 L + 8 8 L 8 0 L 0 0 L fill} +>> matrix makepattern +/Pat3 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 8 M 8 -4 L + 0 12 M 12 0 L stroke} +>> matrix makepattern +/Pat4 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 0 M 8 12 L + 0 -4 M 12 8 L stroke} +>> matrix makepattern +/Pat5 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 8 M 4 -4 L + 0 12 M 8 -4 L 4 12 M 10 0 L stroke} +>> matrix makepattern +/Pat6 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 0 M 4 12 L + 0 -4 M 8 12 L 4 -4 M 10 8 L stroke} +>> matrix makepattern +/Pat7 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 8 -2 M -4 4 L + 12 0 M -4 8 L 12 4 M 0 10 L stroke} +>> matrix makepattern +/Pat8 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 -2 M 12 4 L + -4 0 M 12 8 L -4 4 M 8 10 L stroke} +>> matrix makepattern +/Pat9 exch def +/Pattern1 {PatternBgnd KeepColor Pat1 setpattern} bind def +/Pattern2 {PatternBgnd KeepColor Pat2 setpattern} bind def +/Pattern3 {PatternBgnd KeepColor Pat3 setpattern} bind def +/Pattern4 {PatternBgnd KeepColor Landscape {Pat5} {Pat4} ifelse setpattern} bind def +/Pattern5 {PatternBgnd KeepColor Landscape {Pat4} {Pat5} ifelse setpattern} bind def +/Pattern6 {PatternBgnd KeepColor Landscape {Pat9} {Pat6} ifelse setpattern} bind def +/Pattern7 {PatternBgnd KeepColor Landscape {Pat8} {Pat7} ifelse setpattern} bind def +} def +% +% +%End of PostScript Level 2 code +% +/PatternBgnd { + TransparentPatterns {} {gsave 1 setgray fill grestore} ifelse +} def +% +% Substitute for Level 2 pattern fill codes with +% grayscale if Level 2 support is not selected. +% +/Level1PatternFill { +/Pattern1 {0.250 Density} bind def +/Pattern2 {0.500 Density} bind def +/Pattern3 {0.750 Density} bind def +/Pattern4 {0.125 Density} bind def +/Pattern5 {0.375 Density} bind def +/Pattern6 {0.625 Density} bind def +/Pattern7 {0.875 Density} bind def +} def +% +% Now test for support of Level 2 code +% +Level1 {Level1PatternFill} {Level2PatternFill} ifelse +% +/Symbol-Oblique /Symbol findfont [1 0 .167 1 0 0] makefont +dup length dict begin {1 index /FID eq {pop pop} {def} ifelse} forall +currentdict end definefont pop +/MFshow { + { dup 5 get 3 ge + { 5 get 3 eq {gsave} {grestore} ifelse } + {dup dup 0 get findfont exch 1 get scalefont setfont + [ currentpoint ] exch dup 2 get 0 exch R dup 5 get 2 ne {dup dup 6 + get exch 4 get {Gshow} {stringwidth pop 0 R} ifelse }if dup 5 get 0 eq + {dup 3 get {2 get neg 0 exch R pop} {pop aload pop M} ifelse} {dup 5 + get 1 eq {dup 2 get exch dup 3 get exch 6 get stringwidth pop -2 div + dup 0 R} {dup 6 get stringwidth pop -2 div 0 R 6 get + show 2 index {aload pop M neg 3 -1 roll neg R pop pop} {pop pop pop + pop aload pop M} ifelse }ifelse }ifelse } + ifelse } + forall} def +/Gswidth {dup type /stringtype eq {stringwidth} {pop (n) stringwidth} ifelse} def +/MFwidth {0 exch { dup 5 get 3 ge { 5 get 3 eq { 0 } { pop } ifelse } + {dup 3 get{dup dup 0 get findfont exch 1 get scalefont setfont + 6 get Gswidth pop add} {pop} ifelse} ifelse} forall} def +/MLshow { currentpoint stroke M + 0 exch R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MRshow { currentpoint stroke M + exch dup MFwidth neg 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MCshow { currentpoint stroke M + exch dup MFwidth -2 div 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/XYsave { [( ) 1 2 true false 3 ()] } bind def +/XYrestore { [( ) 1 2 true false 4 ()] } bind def +Level1 SuppressPDFMark or +{} { +/SDict 10 dict def +systemdict /pdfmark known not { + userdict /pdfmark systemdict /cleartomark get put +} if +SDict begin [ + /Title (Sparse.eps) + /Subject (gnuplot plot) + /Creator (gnuplot 4.6 patchlevel 0) + /Author (lilia) +% /Producer (gnuplot) +% /Keywords () + /CreationDate (Fri Dec 25 21:06:52 2015) + /DOCINFO pdfmark +end +} ifelse +end +%%EndProlog +%%Page: 1 1 +gnudict begin +gsave +doclip +50 50 translate +0.100 0.100 scale +90 rotate +0 -5040 translate +0 setgray +newpath +(Helvetica) findfont 140 scalefont setfont +BackgroundColor 0 lt 3 1 roll 0 lt exch 0 lt or or not {gsave BackgroundColor C clippath fill grestore} if +1.000 UL +LTb +854 448 M +63 0 V +6030 0 R +-63 0 V +stroke +770 448 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10)] +] -46.7 MRshow +1.000 UL +LTb +854 892 M +31 0 V +6062 0 R +-31 0 V +854 1151 M +31 0 V +6062 0 R +-31 0 V +854 1336 M +31 0 V +6062 0 R +-31 0 V +854 1479 M +31 0 V +6062 0 R +-31 0 V +854 1595 M +31 0 V +6062 0 R +-31 0 V +854 1694 M +31 0 V +6062 0 R +-31 0 V +854 1779 M +31 0 V +6062 0 R +-31 0 V +854 1855 M +31 0 V +6062 0 R +-31 0 V +854 1922 M +63 0 V +6030 0 R +-63 0 V +stroke +770 1922 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100)] +] -46.7 MRshow +1.000 UL +LTb +854 2366 M +31 0 V +6062 0 R +-31 0 V +854 2626 M +31 0 V +6062 0 R +-31 0 V +854 2810 M +31 0 V +6062 0 R +-31 0 V +854 2953 M +31 0 V +6062 0 R +-31 0 V +854 3070 M +31 0 V +6062 0 R +-31 0 V +854 3168 M +31 0 V +6062 0 R +-31 0 V +854 3254 M +31 0 V +6062 0 R +-31 0 V +854 3329 M +31 0 V +6062 0 R +-31 0 V +854 3397 M +63 0 V +6030 0 R +-63 0 V +stroke +770 3397 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1000)] +] -46.7 MRshow +1.000 UL +LTb +854 3840 M +31 0 V +6062 0 R +-31 0 V +854 4100 M +31 0 V +6062 0 R +-31 0 V +854 4284 M +31 0 V +6062 0 R +-31 0 V +854 4427 M +31 0 V +6062 0 R +-31 0 V +854 4544 M +31 0 V +6062 0 R +-31 0 V +854 4643 M +31 0 V +6062 0 R +-31 0 V +854 4728 M +31 0 V +6062 0 R +-31 0 V +854 4804 M +31 0 V +6062 0 R +-31 0 V +854 4871 M +63 0 V +6030 0 R +-63 0 V +stroke +770 4871 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MRshow +1.000 UL +LTb +854 448 M +0 63 V +0 4360 R +0 -63 V +stroke +854 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (1)] +] -46.7 MCshow +1.000 UL +LTb +2885 448 M +0 63 V +0 4360 R +0 -63 V +stroke +2885 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (2)] +] -46.7 MCshow +1.000 UL +LTb +4916 448 M +0 63 V +0 4360 R +0 -63 V +stroke +4916 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (3)] +] -46.7 MCshow +1.000 UL +LTb +6947 448 M +0 63 V +0 4360 R +0 -63 V +stroke +6947 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (4)] +] -46.7 MCshow +1.000 UL +LTb +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +LCb setrgbcolor +112 2659 M +currentpoint gsave translate -270 rotate 0 0 moveto +[ [(Helvetica) 140.0 0.0 true true 0 (Execution time in seconds)] +] -46.7 MCshow +grestore +LTb +LCb setrgbcolor +3900 98 M +[ [(Helvetica) 140.0 0.0 true true 0 (Number of GPUs)] +] -46.7 MCshow +LTb +1.000 UP +1.000 UL +LTb +% Begin plot #1 +1.000 UP +3.000 UL +LT0 +LCb setrgbcolor +6296 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (200K MPI)] +] -46.7 MRshow +LT0 +6380 4738 M +399 0 V +854 1632 M +2885 1351 L +2031 -23 V +6947 941 L +854 1632 BoxF +2885 1351 BoxF +4916 1328 BoxF +6947 941 BoxF +6579 4738 BoxF +% End plot #1 +% Begin plot #2 +1.000 UP +3.000 UL +LT1 +LCb setrgbcolor +6296 4598 M +[ [(Helvetica) 140.0 0.0 true true 0 (200K OMP)] +] -46.7 MRshow +LT1 +6380 4598 M +399 0 V +854 1695 M +2885 1261 L +2031 39 V +6947 980 L +854 1695 TriUF +2885 1261 TriUF +4916 1300 TriUF +6947 980 TriUF +6579 4598 TriUF +% End plot #2 +% Begin plot #3 +1.000 UP +3.000 UL +LT2 +LCb setrgbcolor +6296 4458 M +[ [(Helvetica) 140.0 0.0 true true 0 (800K MPI)] +] -46.7 MRshow +LT2 +6380 4458 M +399 0 V +854 3720 M +2885 3209 L +4916 3008 L +6947 2587 L +854 3720 BoxF +2885 3209 BoxF +4916 3008 BoxF +6947 2587 BoxF +6579 4458 BoxF +% End plot #3 +% Begin plot #4 +1.000 UP +3.000 UL +LT3 +LCb setrgbcolor +6296 4318 M +[ [(Helvetica) 140.0 0.0 true true 0 (800K OMP)] +] -46.7 MRshow +LT3 +6380 4318 M +399 0 V +854 3503 M +2885 3044 L +4916 2727 L +6947 2531 L +854 3503 TriUF +2885 3044 TriUF +4916 2727 TriUF +6947 2531 TriUF +6579 4318 TriUF +% End plot #4 +% Begin plot #5 +1.000 UP +3.000 UL +LT4 +LCb setrgbcolor +6296 4178 M +[ [(Helvetica) 140.0 0.0 true true 0 (1.4M MPI)] +] -46.7 MRshow +LT4 +6380 4178 M +399 0 V +854 4147 M +2885 3838 L +2031 -99 V +2031 -92 V +854 4147 BoxF +2885 3838 BoxF +4916 3739 BoxF +6947 3647 BoxF +6579 4178 BoxF +% End plot #5 +% Begin plot #6 +1.000 UP +3.000 UL +LT5 +LC7 setrgbcolor +LCb setrgbcolor +6296 4038 M +[ [(Helvetica) 140.0 0.0 true true 0 (1.4M OMP)] +] -46.7 MRshow +LT5 +LC7 setrgbcolor +6380 4038 M +399 0 V +854 4203 M +2885 3949 L +4916 3768 L +2031 -30 V +854 4203 TriUF +2885 3949 TriUF +4916 3768 TriUF +6947 3738 TriUF +6579 4038 TriUF +% End plot #6 +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +1.000 UP +1.000 UL +LTb +stroke +grestore +end +showpage +%%Trailer +%%DocumentFonts: Helvetica +%%Pages: 1 diff --git a/Simulations/Sparse_mpi.eps b/Simulations/Sparse_mpi.eps new file mode 100644 index 0000000..6b3baa5 --- /dev/null +++ b/Simulations/Sparse_mpi.eps @@ -0,0 +1,899 @@ +%!PS-Adobe-2.0 +%%Title: Sparse_mpi.eps +%%Creator: gnuplot 4.6 patchlevel 0 +%%CreationDate: Fri Dec 25 20:48:48 2015 +%%DocumentFonts: (atend) +%%BoundingBox: 50 50 554 770 +%%Orientation: Landscape +%%Pages: (atend) +%%EndComments +%%BeginProlog +/gnudict 256 dict def +gnudict begin +% +% The following true/false flags may be edited by hand if desired. +% The unit line width and grayscale image gamma correction may also be changed. +% +/Color true def +/Blacktext false def +/Solid false def +/Dashlength 1 def +/Landscape true def +/Level1 false def +/Rounded false def +/ClipToBoundingBox false def +/SuppressPDFMark false def +/TransparentPatterns false def +/gnulinewidth 5.000 def +/userlinewidth gnulinewidth def +/Gamma 1.0 def +/BackgroundColor {-1.000 -1.000 -1.000} def +% +/vshift -46 def +/dl1 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul sub dup 0 le { pop 0.01 } if } if +} def +/dl2 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul add } if +} def +/hpt_ 31.5 def +/vpt_ 31.5 def +/hpt hpt_ def +/vpt vpt_ def +/doclip { + ClipToBoundingBox { + newpath 50 50 moveto 554 50 lineto 554 770 lineto 50 770 lineto closepath + clip + } if +} def +% +% Gnuplot Prolog Version 4.4 (August 2010) +% +%/SuppressPDFMark true def +% +/M {moveto} bind def +/L {lineto} bind def +/R {rmoveto} bind def +/V {rlineto} bind def +/N {newpath moveto} bind def +/Z {closepath} bind def +/C {setrgbcolor} bind def +/f {rlineto fill} bind def +/g {setgray} bind def +/Gshow {show} def % May be redefined later in the file to support UTF-8 +/vpt2 vpt 2 mul def +/hpt2 hpt 2 mul def +/Lshow {currentpoint stroke M 0 vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Rshow {currentpoint stroke M dup stringwidth pop neg vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Cshow {currentpoint stroke M dup stringwidth pop -2 div vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/UP {dup vpt_ mul /vpt exch def hpt_ mul /hpt exch def + /hpt2 hpt 2 mul def /vpt2 vpt 2 mul def} def +/DL {Color {setrgbcolor Solid {pop []} if 0 setdash} + {pop pop pop 0 setgray Solid {pop []} if 0 setdash} ifelse} def +/BL {stroke userlinewidth 2 mul setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/AL {stroke userlinewidth 2 div setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/UL {dup gnulinewidth mul /userlinewidth exch def + dup 1 lt {pop 1} if 10 mul /udl exch def} def +/PL {stroke userlinewidth setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +3.8 setmiterlimit +% Default Line colors +/LCw {1 1 1} def +/LCb {0 0 0} def +/LCa {0 0 0} def +/LC0 {1 0 0} def +/LC1 {0 1 0} def +/LC2 {0 0 1} def +/LC3 {1 0 1} def +/LC4 {0 1 1} def +/LC5 {1 1 0} def +/LC6 {0 0 0} def +/LC7 {1 0.3 0} def +/LC8 {0.5 0.5 0.5} def +% Default Line Types +/LTw {PL [] 1 setgray} def +/LTb {BL [] LCb DL} def +/LTa {AL [1 udl mul 2 udl mul] 0 setdash LCa setrgbcolor} def +/LT0 {PL [] LC0 DL} def +/LT1 {PL [4 dl1 2 dl2] LC1 DL} def +/LT2 {PL [2 dl1 3 dl2] LC2 DL} def +/LT3 {PL [1 dl1 1.5 dl2] LC3 DL} def +/LT4 {PL [6 dl1 2 dl2 1 dl1 2 dl2] LC4 DL} def +/LT5 {PL [3 dl1 3 dl2 1 dl1 3 dl2] LC5 DL} def +/LT6 {PL [2 dl1 2 dl2 2 dl1 6 dl2] LC6 DL} def +/LT7 {PL [1 dl1 2 dl2 6 dl1 2 dl2 1 dl1 2 dl2] LC7 DL} def +/LT8 {PL [2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 4 dl2] LC8 DL} def +/Pnt {stroke [] 0 setdash gsave 1 setlinecap M 0 0 V stroke grestore} def +/Dia {stroke [] 0 setdash 2 copy vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke + Pnt} def +/Pls {stroke [] 0 setdash vpt sub M 0 vpt2 V + currentpoint stroke M + hpt neg vpt neg R hpt2 0 V stroke + } def +/Box {stroke [] 0 setdash 2 copy exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke + Pnt} def +/Crs {stroke [] 0 setdash exch hpt sub exch vpt add M + hpt2 vpt2 neg V currentpoint stroke M + hpt2 neg 0 R hpt2 vpt2 V stroke} def +/TriU {stroke [] 0 setdash 2 copy vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke + Pnt} def +/Star {2 copy Pls Crs} def +/BoxF {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath fill} def +/TriUF {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath fill} def +/TriD {stroke [] 0 setdash 2 copy vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke + Pnt} def +/TriDF {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath fill} def +/DiaF {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath fill} def +/Pent {stroke [] 0 setdash 2 copy gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore Pnt} def +/PentF {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath fill grestore} def +/Circle {stroke [] 0 setdash 2 copy + hpt 0 360 arc stroke Pnt} def +/CircleF {stroke [] 0 setdash hpt 0 360 arc fill} def +/C0 {BL [] 0 setdash 2 copy moveto vpt 90 450 arc} bind def +/C1 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + vpt 0 360 arc closepath} bind def +/C2 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C3 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C4 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C5 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc + 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc} bind def +/C6 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C7 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C8 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C9 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 450 arc closepath fill + vpt 0 360 arc closepath} bind def +/C10 {BL [] 0 setdash 2 copy 2 copy moveto vpt 270 360 arc closepath fill + 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C11 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C12 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C13 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C14 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 360 arc closepath fill + vpt 0 360 arc} bind def +/C15 {BL [] 0 setdash 2 copy vpt 0 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/Rec {newpath 4 2 roll moveto 1 index 0 rlineto 0 exch rlineto + neg 0 rlineto closepath} bind def +/Square {dup Rec} bind def +/Bsquare {vpt sub exch vpt sub exch vpt2 Square} bind def +/S0 {BL [] 0 setdash 2 copy moveto 0 vpt rlineto BL Bsquare} bind def +/S1 {BL [] 0 setdash 2 copy vpt Square fill Bsquare} bind def +/S2 {BL [] 0 setdash 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S3 {BL [] 0 setdash 2 copy exch vpt sub exch vpt2 vpt Rec fill Bsquare} bind def +/S4 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S5 {BL [] 0 setdash 2 copy 2 copy vpt Square fill + exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S6 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S7 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S8 {BL [] 0 setdash 2 copy vpt sub vpt Square fill Bsquare} bind def +/S9 {BL [] 0 setdash 2 copy vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S10 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt Square fill + Bsquare} bind def +/S11 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt2 vpt Rec fill + Bsquare} bind def +/S12 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill Bsquare} bind def +/S13 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S14 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S15 {BL [] 0 setdash 2 copy Bsquare fill Bsquare} bind def +/D0 {gsave translate 45 rotate 0 0 S0 stroke grestore} bind def +/D1 {gsave translate 45 rotate 0 0 S1 stroke grestore} bind def +/D2 {gsave translate 45 rotate 0 0 S2 stroke grestore} bind def +/D3 {gsave translate 45 rotate 0 0 S3 stroke grestore} bind def +/D4 {gsave translate 45 rotate 0 0 S4 stroke grestore} bind def +/D5 {gsave translate 45 rotate 0 0 S5 stroke grestore} bind def +/D6 {gsave translate 45 rotate 0 0 S6 stroke grestore} bind def +/D7 {gsave translate 45 rotate 0 0 S7 stroke grestore} bind def +/D8 {gsave translate 45 rotate 0 0 S8 stroke grestore} bind def +/D9 {gsave translate 45 rotate 0 0 S9 stroke grestore} bind def +/D10 {gsave translate 45 rotate 0 0 S10 stroke grestore} bind def +/D11 {gsave translate 45 rotate 0 0 S11 stroke grestore} bind def +/D12 {gsave translate 45 rotate 0 0 S12 stroke grestore} bind def +/D13 {gsave translate 45 rotate 0 0 S13 stroke grestore} bind def +/D14 {gsave translate 45 rotate 0 0 S14 stroke grestore} bind def +/D15 {gsave translate 45 rotate 0 0 S15 stroke grestore} bind def +/DiaE {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke} def +/BoxE {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke} def +/TriUE {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke} def +/TriDE {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke} def +/PentE {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore} def +/CircE {stroke [] 0 setdash + hpt 0 360 arc stroke} def +/Opaque {gsave closepath 1 setgray fill grestore 0 setgray closepath} def +/DiaW {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V Opaque stroke} def +/BoxW {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V Opaque stroke} def +/TriUW {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V Opaque stroke} def +/TriDW {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V Opaque stroke} def +/PentW {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + Opaque stroke grestore} def +/CircW {stroke [] 0 setdash + hpt 0 360 arc Opaque stroke} def +/BoxFill {gsave Rec 1 setgray fill grestore} def +/Density { + /Fillden exch def + currentrgbcolor + /ColB exch def /ColG exch def /ColR exch def + /ColR ColR Fillden mul Fillden sub 1 add def + /ColG ColG Fillden mul Fillden sub 1 add def + /ColB ColB Fillden mul Fillden sub 1 add def + ColR ColG ColB setrgbcolor} def +/BoxColFill {gsave Rec PolyFill} def +/PolyFill {gsave Density fill grestore grestore} def +/h {rlineto rlineto rlineto gsave closepath fill grestore} bind def +% +% PostScript Level 1 Pattern Fill routine for rectangles +% Usage: x y w h s a XX PatternFill +% x,y = lower left corner of box to be filled +% w,h = width and height of box +% a = angle in degrees between lines and x-axis +% XX = 0/1 for no/yes cross-hatch +% +/PatternFill {gsave /PFa [ 9 2 roll ] def + PFa 0 get PFa 2 get 2 div add PFa 1 get PFa 3 get 2 div add translate + PFa 2 get -2 div PFa 3 get -2 div PFa 2 get PFa 3 get Rec + gsave 1 setgray fill grestore clip + currentlinewidth 0.5 mul setlinewidth + /PFs PFa 2 get dup mul PFa 3 get dup mul add sqrt def + 0 0 M PFa 5 get rotate PFs -2 div dup translate + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 M 0 PFs V} for + 0 PFa 6 get ne { + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 2 1 roll M PFs 0 V} for + } if + stroke grestore} def +% +/languagelevel where + {pop languagelevel} {1} ifelse + 2 lt + {/InterpretLevel1 true def} + {/InterpretLevel1 Level1 def} + ifelse +% +% PostScript level 2 pattern fill definitions +% +/Level2PatternFill { +/Tile8x8 {/PaintType 2 /PatternType 1 /TilingType 1 /BBox [0 0 8 8] /XStep 8 /YStep 8} + bind def +/KeepColor {currentrgbcolor [/Pattern /DeviceRGB] setcolorspace} bind def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke} +>> matrix makepattern +/Pat1 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke + 0 4 M 4 8 L 8 4 L 4 0 L 0 4 L stroke} +>> matrix makepattern +/Pat2 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 0 8 L + 8 8 L 8 0 L 0 0 L fill} +>> matrix makepattern +/Pat3 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 8 M 8 -4 L + 0 12 M 12 0 L stroke} +>> matrix makepattern +/Pat4 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 0 M 8 12 L + 0 -4 M 12 8 L stroke} +>> matrix makepattern +/Pat5 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 8 M 4 -4 L + 0 12 M 8 -4 L 4 12 M 10 0 L stroke} +>> matrix makepattern +/Pat6 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 0 M 4 12 L + 0 -4 M 8 12 L 4 -4 M 10 8 L stroke} +>> matrix makepattern +/Pat7 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 8 -2 M -4 4 L + 12 0 M -4 8 L 12 4 M 0 10 L stroke} +>> matrix makepattern +/Pat8 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 -2 M 12 4 L + -4 0 M 12 8 L -4 4 M 8 10 L stroke} +>> matrix makepattern +/Pat9 exch def +/Pattern1 {PatternBgnd KeepColor Pat1 setpattern} bind def +/Pattern2 {PatternBgnd KeepColor Pat2 setpattern} bind def +/Pattern3 {PatternBgnd KeepColor Pat3 setpattern} bind def +/Pattern4 {PatternBgnd KeepColor Landscape {Pat5} {Pat4} ifelse setpattern} bind def +/Pattern5 {PatternBgnd KeepColor Landscape {Pat4} {Pat5} ifelse setpattern} bind def +/Pattern6 {PatternBgnd KeepColor Landscape {Pat9} {Pat6} ifelse setpattern} bind def +/Pattern7 {PatternBgnd KeepColor Landscape {Pat8} {Pat7} ifelse setpattern} bind def +} def +% +% +%End of PostScript Level 2 code +% +/PatternBgnd { + TransparentPatterns {} {gsave 1 setgray fill grestore} ifelse +} def +% +% Substitute for Level 2 pattern fill codes with +% grayscale if Level 2 support is not selected. +% +/Level1PatternFill { +/Pattern1 {0.250 Density} bind def +/Pattern2 {0.500 Density} bind def +/Pattern3 {0.750 Density} bind def +/Pattern4 {0.125 Density} bind def +/Pattern5 {0.375 Density} bind def +/Pattern6 {0.625 Density} bind def +/Pattern7 {0.875 Density} bind def +} def +% +% Now test for support of Level 2 code +% +Level1 {Level1PatternFill} {Level2PatternFill} ifelse +% +/Symbol-Oblique /Symbol findfont [1 0 .167 1 0 0] makefont +dup length dict begin {1 index /FID eq {pop pop} {def} ifelse} forall +currentdict end definefont pop +/MFshow { + { dup 5 get 3 ge + { 5 get 3 eq {gsave} {grestore} ifelse } + {dup dup 0 get findfont exch 1 get scalefont setfont + [ currentpoint ] exch dup 2 get 0 exch R dup 5 get 2 ne {dup dup 6 + get exch 4 get {Gshow} {stringwidth pop 0 R} ifelse }if dup 5 get 0 eq + {dup 3 get {2 get neg 0 exch R pop} {pop aload pop M} ifelse} {dup 5 + get 1 eq {dup 2 get exch dup 3 get exch 6 get stringwidth pop -2 div + dup 0 R} {dup 6 get stringwidth pop -2 div 0 R 6 get + show 2 index {aload pop M neg 3 -1 roll neg R pop pop} {pop pop pop + pop aload pop M} ifelse }ifelse }ifelse } + ifelse } + forall} def +/Gswidth {dup type /stringtype eq {stringwidth} {pop (n) stringwidth} ifelse} def +/MFwidth {0 exch { dup 5 get 3 ge { 5 get 3 eq { 0 } { pop } ifelse } + {dup 3 get{dup dup 0 get findfont exch 1 get scalefont setfont + 6 get Gswidth pop add} {pop} ifelse} ifelse} forall} def +/MLshow { currentpoint stroke M + 0 exch R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MRshow { currentpoint stroke M + exch dup MFwidth neg 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MCshow { currentpoint stroke M + exch dup MFwidth -2 div 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/XYsave { [( ) 1 2 true false 3 ()] } bind def +/XYrestore { [( ) 1 2 true false 4 ()] } bind def +Level1 SuppressPDFMark or +{} { +/SDict 10 dict def +systemdict /pdfmark known not { + userdict /pdfmark systemdict /cleartomark get put +} if +SDict begin [ + /Title (Sparse_mpi.eps) + /Subject (gnuplot plot) + /Creator (gnuplot 4.6 patchlevel 0) + /Author (lilia) +% /Producer (gnuplot) +% /Keywords () + /CreationDate (Fri Dec 25 20:48:48 2015) + /DOCINFO pdfmark +end +} ifelse +end +%%EndProlog +%%Page: 1 1 +gnudict begin +gsave +doclip +50 50 translate +0.100 0.100 scale +90 rotate +0 -5040 translate +0 setgray +newpath +(Helvetica) findfont 140 scalefont setfont +BackgroundColor 0 lt 3 1 roll 0 lt exch 0 lt or or not {gsave BackgroundColor C clippath fill grestore} if +1.000 UL +LTb +854 448 M +63 0 V +6030 0 R +-63 0 V +stroke +770 448 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1)] +] -46.7 MRshow +1.000 UL +LTb +854 781 M +31 0 V +6062 0 R +-31 0 V +854 976 M +31 0 V +6062 0 R +-31 0 V +854 1114 M +31 0 V +6062 0 R +-31 0 V +854 1221 M +31 0 V +6062 0 R +-31 0 V +854 1308 M +31 0 V +6062 0 R +-31 0 V +854 1382 M +31 0 V +6062 0 R +-31 0 V +854 1447 M +31 0 V +6062 0 R +-31 0 V +854 1503 M +31 0 V +6062 0 R +-31 0 V +854 1554 M +63 0 V +6030 0 R +-63 0 V +stroke +770 1554 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10)] +] -46.7 MRshow +1.000 UL +LTb +854 1887 M +31 0 V +6062 0 R +-31 0 V +854 2081 M +31 0 V +6062 0 R +-31 0 V +854 2219 M +31 0 V +6062 0 R +-31 0 V +854 2327 M +31 0 V +6062 0 R +-31 0 V +854 2414 M +31 0 V +6062 0 R +-31 0 V +854 2488 M +31 0 V +6062 0 R +-31 0 V +854 2552 M +31 0 V +6062 0 R +-31 0 V +854 2609 M +31 0 V +6062 0 R +-31 0 V +854 2660 M +63 0 V +6030 0 R +-63 0 V +stroke +770 2660 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100)] +] -46.7 MRshow +1.000 UL +LTb +854 2992 M +31 0 V +6062 0 R +-31 0 V +854 3187 M +31 0 V +6062 0 R +-31 0 V +854 3325 M +31 0 V +6062 0 R +-31 0 V +854 3432 M +31 0 V +6062 0 R +-31 0 V +854 3520 M +31 0 V +6062 0 R +-31 0 V +854 3594 M +31 0 V +6062 0 R +-31 0 V +854 3658 M +31 0 V +6062 0 R +-31 0 V +854 3715 M +31 0 V +6062 0 R +-31 0 V +854 3765 M +63 0 V +6030 0 R +-63 0 V +stroke +770 3765 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1000)] +] -46.7 MRshow +1.000 UL +LTb +854 4098 M +31 0 V +6062 0 R +-31 0 V +854 4293 M +31 0 V +6062 0 R +-31 0 V +854 4431 M +31 0 V +6062 0 R +-31 0 V +854 4538 M +31 0 V +6062 0 R +-31 0 V +854 4626 M +31 0 V +6062 0 R +-31 0 V +854 4700 M +31 0 V +6062 0 R +-31 0 V +854 4764 M +31 0 V +6062 0 R +-31 0 V +854 4820 M +31 0 V +6062 0 R +-31 0 V +854 4871 M +63 0 V +6030 0 R +-63 0 V +stroke +770 4871 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MRshow +1.000 UL +LTb +854 448 M +0 63 V +0 4360 R +0 -63 V +stroke +854 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 0)] +] -46.7 MCshow +1.000 UL +LTb +1724 448 M +0 63 V +0 4360 R +0 -63 V +stroke +1724 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 200000)] +] -46.7 MCshow +1.000 UL +LTb +2595 448 M +0 63 V +0 4360 R +0 -63 V +stroke +2595 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 400000)] +] -46.7 MCshow +1.000 UL +LTb +3465 448 M +0 63 V +0 4360 R +0 -63 V +stroke +3465 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 600000)] +] -46.7 MCshow +1.000 UL +LTb +4336 448 M +0 63 V +0 4360 R +0 -63 V +stroke +4336 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 800000)] +] -46.7 MCshow +1.000 UL +LTb +5206 448 M +0 63 V +0 4360 R +0 -63 V +stroke +5206 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1e+06)] +] -46.7 MCshow +1.000 UL +LTb +6077 448 M +0 63 V +0 4360 R +0 -63 V +stroke +6077 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1.2e+06)] +] -46.7 MCshow +1.000 UL +LTb +6947 448 M +0 63 V +0 4360 R +0 -63 V +stroke +6947 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1.4e+06)] +] -46.7 MCshow +1.000 UL +LTb +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +LCb setrgbcolor +112 2659 M +currentpoint gsave translate -270 rotate 0 0 moveto +[ [(Helvetica) 140.0 0.0 true true 0 (Execution time in seconds)] +] -46.7 MCshow +grestore +LTb +LCb setrgbcolor +3900 98 M +[ [(Helvetica) 140.0 0.0 true true 0 (Polynomial's degrees)] +] -46.7 MCshow +LTb +1.000 UP +1.000 UL +LTb +% Begin plot #1 +1.000 UP +3.000 UL +LT0 +LCb setrgbcolor +3335 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (1 GPU)] +] -46.7 MRshow +LT0 +3419 4738 M +399 0 V +1289 1782 M +435 660 V +871 942 V +870 171 V +871 453 V +870 312 V +871 100 V +870 -92 V +1289 1782 Pls +1724 2442 Pls +2595 3384 Pls +3465 3555 Pls +4336 4008 Pls +5206 4320 Pls +6077 4420 Pls +6947 4328 Pls +3618 4738 Pls +% End plot #1 +% Begin plot #2 +1.000 UP +3.000 UL +LT1 +LCb setrgbcolor +4322 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (2 GPU)] +] -46.7 MRshow +LT1 +4406 4738 M +399 0 V +1289 1484 M +435 747 V +871 525 V +870 426 V +871 443 V +870 41 V +871 339 V +870 91 V +1289 1484 Crs +1724 2231 Crs +2595 2756 Crs +3465 3182 Crs +4336 3625 Crs +5206 3666 Crs +6077 4005 Crs +6947 4096 Crs +4605 4738 Crs +% End plot #2 +% Begin plot #3 +1.000 UP +3.000 UL +LT2 +LCb setrgbcolor +5309 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (3 GPU)] +] -46.7 MRshow +LT2 +5393 4738 M +399 0 V +1289 1391 M +435 823 V +871 345 V +870 418 V +871 497 V +870 -2 V +871 524 V +870 26 V +1289 1391 Star +1724 2214 Star +2595 2559 Star +3465 2977 Star +4336 3474 Star +5206 3472 Star +6077 3996 Star +6947 4022 Star +5592 4738 Star +% End plot #3 +% Begin plot #4 +1.000 UP +3.000 UL +LT3 +LCb setrgbcolor +6296 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (4 GPU)] +] -46.7 MRshow +LT3 +6380 4738 M +399 0 V +1289 1181 M +435 742 V +871 519 V +870 423 V +871 293 V +870 213 V +871 666 V +870 -84 V +1289 1181 Box +1724 1923 Box +2595 2442 Box +3465 2865 Box +4336 3158 Box +5206 3371 Box +6077 4037 Box +6947 3953 Box +6579 4738 Box +% End plot #4 +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +1.000 UP +1.000 UL +LTb +stroke +grestore +end +showpage +%%Trailer +%%DocumentFonts: Helvetica +%%Pages: 1 diff --git a/Simulations/Sparse_omp.eps b/Simulations/Sparse_omp.eps new file mode 100644 index 0000000..ce681c3 --- /dev/null +++ b/Simulations/Sparse_omp.eps @@ -0,0 +1,899 @@ +%!PS-Adobe-2.0 +%%Title: Sparse_omp.eps +%%Creator: gnuplot 4.6 patchlevel 0 +%%CreationDate: Fri Dec 25 20:50:16 2015 +%%DocumentFonts: (atend) +%%BoundingBox: 50 50 554 770 +%%Orientation: Landscape +%%Pages: (atend) +%%EndComments +%%BeginProlog +/gnudict 256 dict def +gnudict begin +% +% The following true/false flags may be edited by hand if desired. +% The unit line width and grayscale image gamma correction may also be changed. +% +/Color true def +/Blacktext false def +/Solid false def +/Dashlength 1 def +/Landscape true def +/Level1 false def +/Rounded false def +/ClipToBoundingBox false def +/SuppressPDFMark false def +/TransparentPatterns false def +/gnulinewidth 5.000 def +/userlinewidth gnulinewidth def +/Gamma 1.0 def +/BackgroundColor {-1.000 -1.000 -1.000} def +% +/vshift -46 def +/dl1 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul sub dup 0 le { pop 0.01 } if } if +} def +/dl2 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul add } if +} def +/hpt_ 31.5 def +/vpt_ 31.5 def +/hpt hpt_ def +/vpt vpt_ def +/doclip { + ClipToBoundingBox { + newpath 50 50 moveto 554 50 lineto 554 770 lineto 50 770 lineto closepath + clip + } if +} def +% +% Gnuplot Prolog Version 4.4 (August 2010) +% +%/SuppressPDFMark true def +% +/M {moveto} bind def +/L {lineto} bind def +/R {rmoveto} bind def +/V {rlineto} bind def +/N {newpath moveto} bind def +/Z {closepath} bind def +/C {setrgbcolor} bind def +/f {rlineto fill} bind def +/g {setgray} bind def +/Gshow {show} def % May be redefined later in the file to support UTF-8 +/vpt2 vpt 2 mul def +/hpt2 hpt 2 mul def +/Lshow {currentpoint stroke M 0 vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Rshow {currentpoint stroke M dup stringwidth pop neg vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Cshow {currentpoint stroke M dup stringwidth pop -2 div vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/UP {dup vpt_ mul /vpt exch def hpt_ mul /hpt exch def + /hpt2 hpt 2 mul def /vpt2 vpt 2 mul def} def +/DL {Color {setrgbcolor Solid {pop []} if 0 setdash} + {pop pop pop 0 setgray Solid {pop []} if 0 setdash} ifelse} def +/BL {stroke userlinewidth 2 mul setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/AL {stroke userlinewidth 2 div setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/UL {dup gnulinewidth mul /userlinewidth exch def + dup 1 lt {pop 1} if 10 mul /udl exch def} def +/PL {stroke userlinewidth setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +3.8 setmiterlimit +% Default Line colors +/LCw {1 1 1} def +/LCb {0 0 0} def +/LCa {0 0 0} def +/LC0 {1 0 0} def +/LC1 {0 1 0} def +/LC2 {0 0 1} def +/LC3 {1 0 1} def +/LC4 {0 1 1} def +/LC5 {1 1 0} def +/LC6 {0 0 0} def +/LC7 {1 0.3 0} def +/LC8 {0.5 0.5 0.5} def +% Default Line Types +/LTw {PL [] 1 setgray} def +/LTb {BL [] LCb DL} def +/LTa {AL [1 udl mul 2 udl mul] 0 setdash LCa setrgbcolor} def +/LT0 {PL [] LC0 DL} def +/LT1 {PL [4 dl1 2 dl2] LC1 DL} def +/LT2 {PL [2 dl1 3 dl2] LC2 DL} def +/LT3 {PL [1 dl1 1.5 dl2] LC3 DL} def +/LT4 {PL [6 dl1 2 dl2 1 dl1 2 dl2] LC4 DL} def +/LT5 {PL [3 dl1 3 dl2 1 dl1 3 dl2] LC5 DL} def +/LT6 {PL [2 dl1 2 dl2 2 dl1 6 dl2] LC6 DL} def +/LT7 {PL [1 dl1 2 dl2 6 dl1 2 dl2 1 dl1 2 dl2] LC7 DL} def +/LT8 {PL [2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 4 dl2] LC8 DL} def +/Pnt {stroke [] 0 setdash gsave 1 setlinecap M 0 0 V stroke grestore} def +/Dia {stroke [] 0 setdash 2 copy vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke + Pnt} def +/Pls {stroke [] 0 setdash vpt sub M 0 vpt2 V + currentpoint stroke M + hpt neg vpt neg R hpt2 0 V stroke + } def +/Box {stroke [] 0 setdash 2 copy exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke + Pnt} def +/Crs {stroke [] 0 setdash exch hpt sub exch vpt add M + hpt2 vpt2 neg V currentpoint stroke M + hpt2 neg 0 R hpt2 vpt2 V stroke} def +/TriU {stroke [] 0 setdash 2 copy vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke + Pnt} def +/Star {2 copy Pls Crs} def +/BoxF {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath fill} def +/TriUF {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath fill} def +/TriD {stroke [] 0 setdash 2 copy vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke + Pnt} def +/TriDF {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath fill} def +/DiaF {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath fill} def +/Pent {stroke [] 0 setdash 2 copy gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore Pnt} def +/PentF {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath fill grestore} def +/Circle {stroke [] 0 setdash 2 copy + hpt 0 360 arc stroke Pnt} def +/CircleF {stroke [] 0 setdash hpt 0 360 arc fill} def +/C0 {BL [] 0 setdash 2 copy moveto vpt 90 450 arc} bind def +/C1 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + vpt 0 360 arc closepath} bind def +/C2 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C3 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C4 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C5 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc + 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc} bind def +/C6 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C7 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C8 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C9 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 450 arc closepath fill + vpt 0 360 arc closepath} bind def +/C10 {BL [] 0 setdash 2 copy 2 copy moveto vpt 270 360 arc closepath fill + 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C11 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C12 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C13 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C14 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 360 arc closepath fill + vpt 0 360 arc} bind def +/C15 {BL [] 0 setdash 2 copy vpt 0 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/Rec {newpath 4 2 roll moveto 1 index 0 rlineto 0 exch rlineto + neg 0 rlineto closepath} bind def +/Square {dup Rec} bind def +/Bsquare {vpt sub exch vpt sub exch vpt2 Square} bind def +/S0 {BL [] 0 setdash 2 copy moveto 0 vpt rlineto BL Bsquare} bind def +/S1 {BL [] 0 setdash 2 copy vpt Square fill Bsquare} bind def +/S2 {BL [] 0 setdash 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S3 {BL [] 0 setdash 2 copy exch vpt sub exch vpt2 vpt Rec fill Bsquare} bind def +/S4 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S5 {BL [] 0 setdash 2 copy 2 copy vpt Square fill + exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S6 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S7 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S8 {BL [] 0 setdash 2 copy vpt sub vpt Square fill Bsquare} bind def +/S9 {BL [] 0 setdash 2 copy vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S10 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt Square fill + Bsquare} bind def +/S11 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt2 vpt Rec fill + Bsquare} bind def +/S12 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill Bsquare} bind def +/S13 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S14 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S15 {BL [] 0 setdash 2 copy Bsquare fill Bsquare} bind def +/D0 {gsave translate 45 rotate 0 0 S0 stroke grestore} bind def +/D1 {gsave translate 45 rotate 0 0 S1 stroke grestore} bind def +/D2 {gsave translate 45 rotate 0 0 S2 stroke grestore} bind def +/D3 {gsave translate 45 rotate 0 0 S3 stroke grestore} bind def +/D4 {gsave translate 45 rotate 0 0 S4 stroke grestore} bind def +/D5 {gsave translate 45 rotate 0 0 S5 stroke grestore} bind def +/D6 {gsave translate 45 rotate 0 0 S6 stroke grestore} bind def +/D7 {gsave translate 45 rotate 0 0 S7 stroke grestore} bind def +/D8 {gsave translate 45 rotate 0 0 S8 stroke grestore} bind def +/D9 {gsave translate 45 rotate 0 0 S9 stroke grestore} bind def +/D10 {gsave translate 45 rotate 0 0 S10 stroke grestore} bind def +/D11 {gsave translate 45 rotate 0 0 S11 stroke grestore} bind def +/D12 {gsave translate 45 rotate 0 0 S12 stroke grestore} bind def +/D13 {gsave translate 45 rotate 0 0 S13 stroke grestore} bind def +/D14 {gsave translate 45 rotate 0 0 S14 stroke grestore} bind def +/D15 {gsave translate 45 rotate 0 0 S15 stroke grestore} bind def +/DiaE {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke} def +/BoxE {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke} def +/TriUE {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke} def +/TriDE {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke} def +/PentE {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore} def +/CircE {stroke [] 0 setdash + hpt 0 360 arc stroke} def +/Opaque {gsave closepath 1 setgray fill grestore 0 setgray closepath} def +/DiaW {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V Opaque stroke} def +/BoxW {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V Opaque stroke} def +/TriUW {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V Opaque stroke} def +/TriDW {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V Opaque stroke} def +/PentW {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + Opaque stroke grestore} def +/CircW {stroke [] 0 setdash + hpt 0 360 arc Opaque stroke} def +/BoxFill {gsave Rec 1 setgray fill grestore} def +/Density { + /Fillden exch def + currentrgbcolor + /ColB exch def /ColG exch def /ColR exch def + /ColR ColR Fillden mul Fillden sub 1 add def + /ColG ColG Fillden mul Fillden sub 1 add def + /ColB ColB Fillden mul Fillden sub 1 add def + ColR ColG ColB setrgbcolor} def +/BoxColFill {gsave Rec PolyFill} def +/PolyFill {gsave Density fill grestore grestore} def +/h {rlineto rlineto rlineto gsave closepath fill grestore} bind def +% +% PostScript Level 1 Pattern Fill routine for rectangles +% Usage: x y w h s a XX PatternFill +% x,y = lower left corner of box to be filled +% w,h = width and height of box +% a = angle in degrees between lines and x-axis +% XX = 0/1 for no/yes cross-hatch +% +/PatternFill {gsave /PFa [ 9 2 roll ] def + PFa 0 get PFa 2 get 2 div add PFa 1 get PFa 3 get 2 div add translate + PFa 2 get -2 div PFa 3 get -2 div PFa 2 get PFa 3 get Rec + gsave 1 setgray fill grestore clip + currentlinewidth 0.5 mul setlinewidth + /PFs PFa 2 get dup mul PFa 3 get dup mul add sqrt def + 0 0 M PFa 5 get rotate PFs -2 div dup translate + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 M 0 PFs V} for + 0 PFa 6 get ne { + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 2 1 roll M PFs 0 V} for + } if + stroke grestore} def +% +/languagelevel where + {pop languagelevel} {1} ifelse + 2 lt + {/InterpretLevel1 true def} + {/InterpretLevel1 Level1 def} + ifelse +% +% PostScript level 2 pattern fill definitions +% +/Level2PatternFill { +/Tile8x8 {/PaintType 2 /PatternType 1 /TilingType 1 /BBox [0 0 8 8] /XStep 8 /YStep 8} + bind def +/KeepColor {currentrgbcolor [/Pattern /DeviceRGB] setcolorspace} bind def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke} +>> matrix makepattern +/Pat1 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke + 0 4 M 4 8 L 8 4 L 4 0 L 0 4 L stroke} +>> matrix makepattern +/Pat2 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 0 8 L + 8 8 L 8 0 L 0 0 L fill} +>> matrix makepattern +/Pat3 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 8 M 8 -4 L + 0 12 M 12 0 L stroke} +>> matrix makepattern +/Pat4 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 0 M 8 12 L + 0 -4 M 12 8 L stroke} +>> matrix makepattern +/Pat5 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 8 M 4 -4 L + 0 12 M 8 -4 L 4 12 M 10 0 L stroke} +>> matrix makepattern +/Pat6 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 0 M 4 12 L + 0 -4 M 8 12 L 4 -4 M 10 8 L stroke} +>> matrix makepattern +/Pat7 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 8 -2 M -4 4 L + 12 0 M -4 8 L 12 4 M 0 10 L stroke} +>> matrix makepattern +/Pat8 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 -2 M 12 4 L + -4 0 M 12 8 L -4 4 M 8 10 L stroke} +>> matrix makepattern +/Pat9 exch def +/Pattern1 {PatternBgnd KeepColor Pat1 setpattern} bind def +/Pattern2 {PatternBgnd KeepColor Pat2 setpattern} bind def +/Pattern3 {PatternBgnd KeepColor Pat3 setpattern} bind def +/Pattern4 {PatternBgnd KeepColor Landscape {Pat5} {Pat4} ifelse setpattern} bind def +/Pattern5 {PatternBgnd KeepColor Landscape {Pat4} {Pat5} ifelse setpattern} bind def +/Pattern6 {PatternBgnd KeepColor Landscape {Pat9} {Pat6} ifelse setpattern} bind def +/Pattern7 {PatternBgnd KeepColor Landscape {Pat8} {Pat7} ifelse setpattern} bind def +} def +% +% +%End of PostScript Level 2 code +% +/PatternBgnd { + TransparentPatterns {} {gsave 1 setgray fill grestore} ifelse +} def +% +% Substitute for Level 2 pattern fill codes with +% grayscale if Level 2 support is not selected. +% +/Level1PatternFill { +/Pattern1 {0.250 Density} bind def +/Pattern2 {0.500 Density} bind def +/Pattern3 {0.750 Density} bind def +/Pattern4 {0.125 Density} bind def +/Pattern5 {0.375 Density} bind def +/Pattern6 {0.625 Density} bind def +/Pattern7 {0.875 Density} bind def +} def +% +% Now test for support of Level 2 code +% +Level1 {Level1PatternFill} {Level2PatternFill} ifelse +% +/Symbol-Oblique /Symbol findfont [1 0 .167 1 0 0] makefont +dup length dict begin {1 index /FID eq {pop pop} {def} ifelse} forall +currentdict end definefont pop +/MFshow { + { dup 5 get 3 ge + { 5 get 3 eq {gsave} {grestore} ifelse } + {dup dup 0 get findfont exch 1 get scalefont setfont + [ currentpoint ] exch dup 2 get 0 exch R dup 5 get 2 ne {dup dup 6 + get exch 4 get {Gshow} {stringwidth pop 0 R} ifelse }if dup 5 get 0 eq + {dup 3 get {2 get neg 0 exch R pop} {pop aload pop M} ifelse} {dup 5 + get 1 eq {dup 2 get exch dup 3 get exch 6 get stringwidth pop -2 div + dup 0 R} {dup 6 get stringwidth pop -2 div 0 R 6 get + show 2 index {aload pop M neg 3 -1 roll neg R pop pop} {pop pop pop + pop aload pop M} ifelse }ifelse }ifelse } + ifelse } + forall} def +/Gswidth {dup type /stringtype eq {stringwidth} {pop (n) stringwidth} ifelse} def +/MFwidth {0 exch { dup 5 get 3 ge { 5 get 3 eq { 0 } { pop } ifelse } + {dup 3 get{dup dup 0 get findfont exch 1 get scalefont setfont + 6 get Gswidth pop add} {pop} ifelse} ifelse} forall} def +/MLshow { currentpoint stroke M + 0 exch R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MRshow { currentpoint stroke M + exch dup MFwidth neg 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MCshow { currentpoint stroke M + exch dup MFwidth -2 div 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/XYsave { [( ) 1 2 true false 3 ()] } bind def +/XYrestore { [( ) 1 2 true false 4 ()] } bind def +Level1 SuppressPDFMark or +{} { +/SDict 10 dict def +systemdict /pdfmark known not { + userdict /pdfmark systemdict /cleartomark get put +} if +SDict begin [ + /Title (Sparse_omp.eps) + /Subject (gnuplot plot) + /Creator (gnuplot 4.6 patchlevel 0) + /Author (lilia) +% /Producer (gnuplot) +% /Keywords () + /CreationDate (Fri Dec 25 20:50:16 2015) + /DOCINFO pdfmark +end +} ifelse +end +%%EndProlog +%%Page: 1 1 +gnudict begin +gsave +doclip +50 50 translate +0.100 0.100 scale +90 rotate +0 -5040 translate +0 setgray +newpath +(Helvetica) findfont 140 scalefont setfont +BackgroundColor 0 lt 3 1 roll 0 lt exch 0 lt or or not {gsave BackgroundColor C clippath fill grestore} if +1.000 UL +LTb +854 448 M +63 0 V +6030 0 R +-63 0 V +stroke +770 448 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1)] +] -46.7 MRshow +1.000 UL +LTb +854 781 M +31 0 V +6062 0 R +-31 0 V +854 976 M +31 0 V +6062 0 R +-31 0 V +854 1114 M +31 0 V +6062 0 R +-31 0 V +854 1221 M +31 0 V +6062 0 R +-31 0 V +854 1308 M +31 0 V +6062 0 R +-31 0 V +854 1382 M +31 0 V +6062 0 R +-31 0 V +854 1447 M +31 0 V +6062 0 R +-31 0 V +854 1503 M +31 0 V +6062 0 R +-31 0 V +854 1554 M +63 0 V +6030 0 R +-63 0 V +stroke +770 1554 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10)] +] -46.7 MRshow +1.000 UL +LTb +854 1887 M +31 0 V +6062 0 R +-31 0 V +854 2081 M +31 0 V +6062 0 R +-31 0 V +854 2219 M +31 0 V +6062 0 R +-31 0 V +854 2327 M +31 0 V +6062 0 R +-31 0 V +854 2414 M +31 0 V +6062 0 R +-31 0 V +854 2488 M +31 0 V +6062 0 R +-31 0 V +854 2552 M +31 0 V +6062 0 R +-31 0 V +854 2609 M +31 0 V +6062 0 R +-31 0 V +854 2660 M +63 0 V +6030 0 R +-63 0 V +stroke +770 2660 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100)] +] -46.7 MRshow +1.000 UL +LTb +854 2992 M +31 0 V +6062 0 R +-31 0 V +854 3187 M +31 0 V +6062 0 R +-31 0 V +854 3325 M +31 0 V +6062 0 R +-31 0 V +854 3432 M +31 0 V +6062 0 R +-31 0 V +854 3520 M +31 0 V +6062 0 R +-31 0 V +854 3594 M +31 0 V +6062 0 R +-31 0 V +854 3658 M +31 0 V +6062 0 R +-31 0 V +854 3715 M +31 0 V +6062 0 R +-31 0 V +854 3765 M +63 0 V +6030 0 R +-63 0 V +stroke +770 3765 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1000)] +] -46.7 MRshow +1.000 UL +LTb +854 4098 M +31 0 V +6062 0 R +-31 0 V +854 4293 M +31 0 V +6062 0 R +-31 0 V +854 4431 M +31 0 V +6062 0 R +-31 0 V +854 4538 M +31 0 V +6062 0 R +-31 0 V +854 4626 M +31 0 V +6062 0 R +-31 0 V +854 4700 M +31 0 V +6062 0 R +-31 0 V +854 4764 M +31 0 V +6062 0 R +-31 0 V +854 4820 M +31 0 V +6062 0 R +-31 0 V +854 4871 M +63 0 V +6030 0 R +-63 0 V +stroke +770 4871 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MRshow +1.000 UL +LTb +854 448 M +0 63 V +0 4360 R +0 -63 V +stroke +854 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 0)] +] -46.7 MCshow +1.000 UL +LTb +1724 448 M +0 63 V +0 4360 R +0 -63 V +stroke +1724 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 200000)] +] -46.7 MCshow +1.000 UL +LTb +2595 448 M +0 63 V +0 4360 R +0 -63 V +stroke +2595 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 400000)] +] -46.7 MCshow +1.000 UL +LTb +3465 448 M +0 63 V +0 4360 R +0 -63 V +stroke +3465 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 600000)] +] -46.7 MCshow +1.000 UL +LTb +4336 448 M +0 63 V +0 4360 R +0 -63 V +stroke +4336 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 800000)] +] -46.7 MCshow +1.000 UL +LTb +5206 448 M +0 63 V +0 4360 R +0 -63 V +stroke +5206 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1e+06)] +] -46.7 MCshow +1.000 UL +LTb +6077 448 M +0 63 V +0 4360 R +0 -63 V +stroke +6077 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1.2e+06)] +] -46.7 MCshow +1.000 UL +LTb +6947 448 M +0 63 V +0 4360 R +0 -63 V +stroke +6947 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1.4e+06)] +] -46.7 MCshow +1.000 UL +LTb +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +LCb setrgbcolor +112 2659 M +currentpoint gsave translate -270 rotate 0 0 moveto +[ [(Helvetica) 140.0 0.0 true true 0 (Execution time in seconds)] +] -46.7 MCshow +grestore +LTb +LCb setrgbcolor +3900 98 M +[ [(Helvetica) 140.0 0.0 true true 0 (Polynomial's degrees)] +] -46.7 MCshow +LTb +1.000 UP +1.000 UL +LTb +% Begin plot #1 +1.000 UP +3.000 UL +LT0 +LCb setrgbcolor +3335 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (1 GPU)] +] -46.7 MRshow +LT0 +3419 4738 M +399 0 V +1289 1785 M +435 704 V +871 608 V +870 415 V +871 333 V +870 152 V +871 451 V +870 -78 V +1289 1785 Pls +1724 2489 Pls +2595 3097 Pls +3465 3512 Pls +4336 3845 Pls +5206 3997 Pls +6077 4448 Pls +6947 4370 Pls +3618 4738 Pls +% End plot #1 +% Begin plot #2 +1.000 UP +3.000 UL +LT1 +LCb setrgbcolor +4322 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (2 GPU)] +] -46.7 MRshow +LT1 +4406 4738 M +399 0 V +1289 1510 M +435 654 V +871 592 V +870 428 V +871 317 V +870 186 V +871 313 V +870 180 V +1289 1510 Crs +1724 2164 Crs +2595 2756 Crs +3465 3184 Crs +4336 3501 Crs +5206 3687 Crs +6077 4000 Crs +6947 4180 Crs +4605 4738 Crs +% End plot #2 +% Begin plot #3 +1.000 UP +3.000 UL +LT2 +LCb setrgbcolor +5309 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (3 GPU)] +] -46.7 MRshow +LT2 +5393 4738 M +399 0 V +1289 1447 M +435 746 V +871 395 V +870 410 V +871 265 V +870 256 V +871 592 V +870 -67 V +1289 1447 Star +1724 2193 Star +2595 2588 Star +3465 2998 Star +4336 3263 Star +5206 3519 Star +6077 4111 Star +6947 4044 Star +5592 4738 Star +% End plot #3 +% Begin plot #4 +1.000 UP +3.000 UL +LT3 +LCb setrgbcolor +6296 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (4 GPU)] +] -46.7 MRshow +LT3 +6380 4738 M +399 0 V +1289 1298 M +435 655 V +871 522 V +870 393 V +871 248 V +870 235 V +871 627 V +870 43 V +1289 1298 Box +1724 1953 Box +2595 2475 Box +3465 2868 Box +4336 3116 Box +5206 3351 Box +6077 3978 Box +6947 4021 Box +6579 4738 Box +% End plot #4 +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +1.000 UP +1.000 UL +LTb +stroke +grestore +end +showpage +%%Trailer +%%DocumentFonts: Helvetica +%%Pages: 1 diff --git a/Simulations/full_mpi/full_mpi_1GPU.o140161 b/Simulations/full_mpi/full_mpi_1GPU.o140161 new file mode 100644 index 0000000..a833c6c --- /dev/null +++ b/Simulations/full_mpi/full_mpi_1GPU.o140161 @@ -0,0 +1,515 @@ +REMAINING: 1 +Taking GPU #3 +proc 0 +zone limite de 'log-exp' 1.00593 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 0, start 0 size 60160 +proc 0 start 0 size 60160 +iter : 1 Arret : 4.93627E-05 s/iter 0.751338 +iter : 2 Arret : 4.72892E-05 s/iter 0.751311 +iter : 3 Arret : 4.32282E-05 s/iter 0.751351 +iter : 4 Arret : 4.40808E-05 s/iter 0.751390 +iter : 5 Arret : 4.31866E-05 s/iter 0.751343 +iter : 6 Arret : 4.51897E-05 s/iter 0.751236 +iter : 7 Arret : 5.50757E-05 s/iter 0.751346 +iter : 8 Arret : 0.000600625 s/iter 0.751189 +iter : 9 Arret : 0.00351745 s/iter 0.751224 +iter : 10 Arret : 0.0225499 s/iter 0.751147 +iter : 11 Arret : 1.92525 s/iter 1.257596 +iter : 12 Arret : 0.0724798 s/iter 0.751219 +iter : 13 Arret : 0.100634 s/iter 0.751209 +iter : 14 Arret : 0.104374 s/iter 1.286622 +iter : 15 Arret : 0.016746 s/iter 1.271784 +iter : 16 Arret : 0.00784681 s/iter 1.261270 +iter : 17 Arret : 0.00523028 s/iter 1.249434 +iter : 18 Arret : 0.00797883 s/iter 0.731764 +iter : 19 Arret : 0.00389307 s/iter 0.711145 +iter : 20 Arret : 0.00132613 s/iter 0.695894 +iter : 21 Arret : 0.00054363 s/iter 0.683618 +iter : 22 Arret : 0.00764188 s/iter 0.655728 +iter : 23 Arret : 0.0109632 s/iter 0.663047 +iter : 24 Arret : 0.000483636 s/iter 0.647992 +iter : 25 Arret : 0.000266785 s/iter 0.645841 +iter : 26 Arret : 9.21069E-05 s/iter 0.650690 +iter : 27 Arret : 0.00137817 s/iter 0.518549 +iter : 28 Arret : 0.00413942 s/iter 0.516303 +iter : 29 Arret : 1.28264E-05 s/iter 0.521554 +iter : 30 Arret : 2.62246E-10 s/iter 0.521585 +iter : 31 Arret : 8.10539E-15 s/iter 0.520315 +temps : 24.1491 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.35784E-10 +Stabilite : 8.10539E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540783 +i* 0.841162| 1|-7.58456E-14 +i* 3.78031E-14| +| 2| -0.992343 +i* -0.123513| 1|-4.36456E-15 +i* 3.59435E-15| +| 3| 0.0563346 +i* 0.998412| 1| 5.70377E-15 +i* 3.3501E-14| +| 4| -0.802793 +i* -0.596258| 1| 2.03657E-15 +i* 1.01915E-14| +| 5| 0.730552 +i* -0.682857| 1|-7.48429E-14 +i* 6.77011E-14| +| 6| -0.442728 +i* 0.896656| 1|-3.77198E-14 +i*-1.89779E-15| +| 7| -0.404888 +i* -0.914366| 1| 3.20195E-14 +i* 9.65894E-15| +| 8| 0.972126 +i* -0.23446| 1| 4.02421E-14 +i*-1.54755E-14| +| 9| -0.826939 +i* 0.562292| 1| -2.4928E-14 +i*-1.59889E-14| +| 10| 0.0979895 +i* -0.995187| 1| 2.27804E-14 +i*-1.97481E-14| +| 11| 0.961513 +i* 0.27476| 1|-9.39769E-14 +i*-2.63912E-13| +| 12| -0.996627 +i* 0.0820589| 1| 2.39773E-14 +i* 1.74825E-14| +| 13| 0.575447 +i* -0.817839| 1|-3.49894E-14 +i*-7.98545E-14| +| 14| 0.701466 +i* 0.712703| 1| 7.52211E-14 +i* 1.53991E-14| +| 15| 0.259346 +i* 0.965785| 1|-2.14863E-14 +i*-2.81355E-14| +| 16| -0.907773 +i* -0.419461| 1|-3.62869E-14 +i*-9.49414E-15| +| 17| 0.903623 +i* -0.428329| 1|-1.24969E-14 +i* 7.51222E-14| +| 18| -0.249979 +i* 0.968251| 1|-1.59074E-14 +i*-1.09721E-14| +| 19| -0.583341 +i* -0.812227| 1| 1.92242E-14 +i* 2.27058E-14| +| 20| 0.997383 +i* 0.072297| 1| 2.53037E-13 +i*-5.92819E-13| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00237 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 0, start 0 size 150016 +proc 0 start 0 size 150016 +iter : 1 Arret : 1.64136E-05 s/iter 4.670410 +iter : 2 Arret : 1.62219E-05 s/iter 4.668737 +iter : 3 Arret : 1.59634E-05 s/iter 4.668001 +iter : 4 Arret : 1.57203E-05 s/iter 4.668096 +iter : 5 Arret : 1.61134E-05 s/iter 4.668095 +iter : 6 Arret : 1.68096E-05 s/iter 4.667823 +iter : 7 Arret : 1.83395E-05 s/iter 4.668957 +iter : 8 Arret : 2.23347E-05 s/iter 4.668718 +iter : 9 Arret : 0.000193284 s/iter 4.669886 +iter : 10 Arret : 0.00650657 s/iter 4.666547 +iter : 11 Arret : 0.00202338 s/iter 4.668819 +iter : 12 Arret : 0.00858027 s/iter 4.668152 +iter : 13 Arret : 1.50198 s/iter 6.718188 +iter : 14 Arret : 0.0716136 s/iter 5.989323 +iter : 15 Arret : 0.0462949 s/iter 4.653326 +iter : 16 Arret : 0.0250802 s/iter 4.654335 +iter : 17 Arret : 0.014323 s/iter 6.635287 +iter : 18 Arret : 0.0102749 s/iter 6.598926 +iter : 19 Arret : 0.0107553 s/iter 6.248834 +iter : 20 Arret : 0.0163074 s/iter 5.917159 +iter : 21 Arret : 0.00966464 s/iter 5.868624 +iter : 22 Arret : 0.0126723 s/iter 4.502515 +iter : 23 Arret : 0.0194806 s/iter 5.728295 +iter : 24 Arret : 0.00314943 s/iter 4.460393 +iter : 25 Arret : 0.00455918 s/iter 4.451818 +iter : 26 Arret : 0.000131011 s/iter 4.482879 +iter : 27 Arret : 1.27601E-05 s/iter 4.481150 +iter : 28 Arret : 8.90079E-08 s/iter 4.447335 +iter : 29 Arret : 8.10668E-13 s/iter 4.446139 +temps : 146.49 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.26507E-09 +Stabilite : 8.10668E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540528 +i* 0.841326| 1| 8.68923E-14 +i* 2.2979E-13| +| 2| -0.905603 +i* -0.424127| 1| 6.50001E-14 +i* -3.0061E-14| +| 3| -0.774122 +i* 0.633037| 1|-3.89619E-14 +i*-6.71876E-14| +| 4| 0.317935 +i* -0.948113| 1| 4.656E-15 +i* 1.15645E-13| +| 5| 0.235897 +i* 0.971778| 1|-3.15963E-14 +i*-8.88994E-14| +| 6| -0.717299 +i* -0.696766| 1| 5.63785E-15 +i*-6.71685E-14| +| 7| 0.992349 +i* -0.123462| 1|-4.81056E-13 +i* 9.00335E-13| +| 8| -0.938482 +i* 0.345329| 1|-6.95555E-14 +i*-3.79159E-14| +| 9| 0.610294 +i* -0.792175| 1| -5.4852E-14 +i*-3.26232E-14| +| 10| -0.0945977 +i* 0.995516| 1| 4.45165E-14 +i* 9.42527E-14| +| 11| -0.450242 +i* -0.892906| 1| 2.41855E-14 +i*-3.23699E-15| +| 12| 0.978218 +i* 0.207583| 1|-2.84429E-13 +i* 4.69725E-13| +| 13| -0.999806 +i* 0.0197069| 1|-4.72365E-14 +i*-2.55716E-14| +| 14| 0.835648 +i* -0.549265| 1|-2.95892E-13 +i* 2.34143E-13| +| 15| -0.414707 +i* 0.909955| 1| 7.26225E-14 +i*-1.70003E-15| +| 16| -0.133754 +i* -0.991015| 1|-2.88485E-14 +i* 2.14499E-14| +| 17| 0.856687 +i* 0.515837| 1| 1.49106E-13 +i* 3.95153E-14| +| 18| -0.951361 +i* -0.308079| 1| 3.78308E-14 +i* 4.65843E-14| +| 19| 0.969257 +i* -0.24605| 1| 5.51163E-13 +i*-4.79498E-13| +| 20| -0.689285 +i* 0.724491| 1| 2.40086E-15 +i*-3.61777E-14| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00142 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 0, start 0 size 250112 +proc 0 start 0 size 250112 +iter : 1 Arret : 1.15411E-05 s/iter 13.046733 +iter : 2 Arret : 9.858E-06 s/iter 13.081326 +iter : 3 Arret : 1.15382E-05 s/iter 13.069120 +iter : 4 Arret : 9.47232E-06 s/iter 13.076010 +iter : 5 Arret : 1.17256E-05 s/iter 13.072118 +iter : 6 Arret : 9.56386E-06 s/iter 13.076291 +iter : 7 Arret : 9.97104E-06 s/iter 13.066170 +iter : 8 Arret : 1.14103E-05 s/iter 13.081314 +iter : 9 Arret : 2.05919E-05 s/iter 13.071473 +iter : 10 Arret : 0.000825792 s/iter 13.076037 +iter : 11 Arret : 0.00118923 s/iter 13.070033 +iter : 12 Arret : 0.000993305 s/iter 13.084702 +iter : 13 Arret : 0.00173445 s/iter 13.089852 +iter : 14 Arret : 0.00725752 s/iter 13.071956 +iter : 15 Arret : 0.00431675 s/iter 12.991545 +iter : 16 Arret : 0.00223336 s/iter 10.557352 +iter : 17 Arret : 0.00768504 s/iter 7.919767 +iter : 18 Arret : 0.0589957 s/iter 7.694604 +iter : 19 Arret : 0.25159 s/iter 7.214844 +iter : 20 Arret : 0.00281777 s/iter 7.197502 +iter : 21 Arret : 0.000159366 s/iter 7.094188 +iter : 22 Arret : 6.57562E-05 s/iter 7.066874 +iter : 23 Arret : 3.10389E-05 s/iter 7.014897 +iter : 24 Arret : 1.40727E-05 s/iter 7.069989 +iter : 25 Arret : 1.97654E-05 s/iter 7.070010 +iter : 26 Arret : 1.37694E-05 s/iter 7.006386 +iter : 27 Arret : 7.84672E-07 s/iter 7.000436 +iter : 28 Arret : 2.76696E-10 s/iter 6.995541 +iter : 29 Arret : 5.23691E-16 s/iter 6.993836 +temps : 300.171 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.05316E-09 +Stabilite : 5.23691E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540427 +i* 0.841391| 1| 9.7148E-14 +i*-1.98189E-13| +| 2| -0.997949 +i* 0.0640067| 1| 1.02696E-14 +i* 2.88415E-14| +| 3| 0.450991 +i* -0.892528| 1| 2.39739E-15 +i* 7.66835E-14| +| 4| 0.42851 +i* -0.903537| 1| 1.03733E-13 +i* 1.27433E-14| +| 5| -0.996035 +i* 0.0889649| 1| 5.1386E-14 +i* 4.21729E-14| +| 6| 0.581876 +i* 0.813277| 1| 3.29906E-13 +i* -3.5718E-15| +| 7| 0.405761 +i* -0.913979| 1| 1.69923E-13 +i*-8.86062E-14| +| 8| -0.993496 +i* 0.113867| 1| 6.34562E-14 +i* 6.04291E-14| +| 9| 0.60205 +i* 0.798458| 1| 2.39371E-13 +i* -2.2848E-13| +| 10| 0.382757 +i* -0.923849| 1| 6.36852E-14 +i* 1.1601E-13| +| 11| -0.990335 +i* 0.138698| 1| 8.32286E-14 +i* 4.57395E-14| +| 12| 0.621846 +i* 0.783139| 1| 3.5482E-14 +i*-1.57841E-13| +| 13| 0.359514 +i* -0.93314| 1| 1.00985E-13 +i*-2.52237E-13| +| 14| -0.986553 +i* 0.163442| 1| 3.24636E-14 +i* 4.58574E-14| +| 15| 0.641253 +i* 0.767329| 1| 1.79533E-13 +i* 3.03096E-13| +| 16| 0.336045 +i* -0.941846| 1| 1.38948E-13 +i*-8.14071E-14| +| 17| -0.982153 +i* 0.188084| 1| 6.94549E-14 +i* 3.09405E-14| +| 18| 0.660258 +i* 0.751039| 1| 4.21871E-13 +i* 5.02185E-14| +| 19| 0.312366 +i* -0.949962| 1|-6.37199E-14 +i*-7.39669E-14| +| 20| -0.977138 +i* 0.212608| 1|-3.80633E-14 +i* -8.4285E-14| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00101 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 0, start 0 size 350208 +proc 0 start 0 size 350208 +iter : 1 Arret : 8.60988E-06 s/iter 25.315090 +iter : 2 Arret : 7.40762E-06 s/iter 25.250569 +iter : 3 Arret : 7.04966E-06 s/iter 25.240912 +iter : 4 Arret : 7.00431E-06 s/iter 25.295865 +iter : 5 Arret : 6.902E-06 s/iter 25.229976 +iter : 6 Arret : 7.05582E-06 s/iter 25.295774 +iter : 7 Arret : 7.08998E-06 s/iter 25.244072 +iter : 8 Arret : 7.80153E-06 s/iter 25.319330 +iter : 9 Arret : 3.47E-05 s/iter 25.270429 +iter : 10 Arret : 0.000704728 s/iter 25.254028 +iter : 11 Arret : 0.00103416 s/iter 25.267890 +iter : 12 Arret : 0.00106397 s/iter 25.219715 +iter : 13 Arret : 0.860111 s/iter 25.358661 +iter : 14 Arret : 3.1212 s/iter 25.438830 +iter : 15 Arret : 0.0931888 s/iter 25.230396 +iter : 16 Arret : 0.0389072 s/iter 25.512462 +iter : 17 Arret : 0.0434458 s/iter 25.567784 +iter : 18 Arret : 0.0492605 s/iter 25.737787 +iter : 19 Arret : 0.0322665 s/iter 25.683394 +iter : 20 Arret : 0.0311855 s/iter 25.569362 +iter : 21 Arret : 0.0249899 s/iter 24.998756 +iter : 22 Arret : 0.0236284 s/iter 25.007239 +iter : 23 Arret : 0.0147332 s/iter 24.894940 +iter : 24 Arret : 0.0045927 s/iter 25.318951 +iter : 25 Arret : 0.00241036 s/iter 24.996102 +iter : 26 Arret : 0.000981942 s/iter 24.881214 +iter : 27 Arret : 0.000188842 s/iter 24.914979 +iter : 28 Arret : 1.13979E-05 s/iter 24.908900 +iter : 29 Arret : 4.63289E-09 s/iter 24.885179 +iter : 30 Arret : 2.06854E-14 s/iter 24.907560 +temps : 757.352 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.46096E-08 +Stabilite : 2.06854E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540399 +i* 0.841409| 1| 5.12961E-13 +i*-3.37404E-15| +| 2| -0.385479 +i* 0.922716| 1| -1.616E-13 +i*-2.73566E-14| +| 3| -0.770131 +i* 0.637886| 1|-1.38431E-15 +i* 1.70921E-13| +| 4| -0.978357 +i* 0.206925| 1|-3.07393E-15 +i* 4.96131E-15| +| 5| -0.962455 +i* -0.27144| 1|-5.85088E-14 +i* 7.9714E-14| +| 6| -0.72607 +i* -0.687621| 1| -2.0612E-14 +i* 2.87948E-13| +| 7| -0.323352 +i* -0.946279| 1| 2.27159E-13 +i* 7.30891E-14| +| 8| 0.153441 +i* -0.988158| 1| 2.08479E-14 +i* 5.5551E-14| +| 9| 0.595097 +i* -0.803654| 1|-3.46265E-13 +i* 1.60098E-14| +| 10| 0.900408 +i* -0.435047| 1| 3.20081E-13 +i*-1.77827E-14| +| 11| 0.999448 +i* 0.0332229| 1|-5.70342E-13 +i* 1.21308E-12| +| 12| 0.869529 +i* 0.493882| 1| 3.01252E-14 +i* 6.11216E-13| +| 13| 0.211292 +i* 0.977423| 1|-6.97532E-14 +i* 1.23212E-13| +| 14| -0.267139 +i* 0.963658| 1|-9.26238E-14 +i*-7.20968E-14| +| 15| -0.684372 +i* 0.729133| 1| 1.64042E-13 +i*-1.89831E-14| +| 16| -0.944825 +i* 0.327574| 1| 3.70572E-14 +i*-6.84904E-14| +| 17| -0.988833 +i* -0.149027| 1|-1.41002E-13 +i* 2.02581E-14| +| 18| -0.806314 +i* -0.591488| 1| 1.24668E-13 +i*-2.62805E-13| +| 19| -0.439079 +i* -0.898448| 1|-1.76949E-13 +i*-1.05707E-13| +| 20| 0.0287415 +i* -0.999587| 1| 1.62724E-13 +i*-6.82891E-14| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00071 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 0, start 0 size 500224 +proc 0 start 0 size 500224 +iter : 1 Arret : 6.15685E-06 s/iter 51.380314 +iter : 2 Arret : 6.30268E-06 s/iter 51.404717 +iter : 3 Arret : 5.43665E-06 s/iter 51.327440 +iter : 4 Arret : 5.82943E-06 s/iter 51.330423 +iter : 5 Arret : 5.29982E-06 s/iter 51.375294 +iter : 6 Arret : 5.48392E-06 s/iter 51.311003 +iter : 7 Arret : 4.9788E-06 s/iter 51.305802 +iter : 8 Arret : 5.28812E-06 s/iter 51.293377 +iter : 9 Arret : 8.66477E-06 s/iter 51.300327 +iter : 10 Arret : 6.18367E-05 s/iter 51.365604 +iter : 11 Arret : 0.00106682 s/iter 51.326802 +iter : 12 Arret : 0.00302391 s/iter 51.361010 +iter : 13 Arret : 0.00805823 s/iter 51.856360 +iter : 14 Arret : 0.00569434 s/iter 51.969477 +iter : 15 Arret : 0.0032212 s/iter 47.185741 +iter : 16 Arret : 1.43264 s/iter 37.596552 +iter : 17 Arret : 0.0261708 s/iter 34.701842 +iter : 18 Arret : 0.0335751 s/iter 32.177584 +iter : 19 Arret : 0.00563912 s/iter 31.261275 +iter : 20 Arret : 0.0024634 s/iter 29.073429 +iter : 21 Arret : 0.00305489 s/iter 28.085556 +iter : 22 Arret : 0.00365771 s/iter 26.833086 +iter : 23 Arret : 0.00250143 s/iter 25.441707 +iter : 24 Arret : 0.00549424 s/iter 24.484295 +iter : 25 Arret : 0.00252639 s/iter 23.169509 +iter : 26 Arret : 5.43905E-05 s/iter 22.350315 +iter : 27 Arret : 1.35324E-06 s/iter 21.912846 +iter : 28 Arret : 9.26795E-09 s/iter 22.036576 +iter : 29 Arret : 2.63961E-14 s/iter 21.824040 +temps : 1148.46 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.48768E-08 +Stabilite : 2.63961E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540372 +i* 0.841426| 1|-3.05235E-13 +i* 1.38721E-13| +| 2| 0.561316 +i* 0.827602| 1|-2.60021E-13 +i* 1.9206E-13| +| 3| 0.57165 +i* 0.820497| 1|-1.83308E-13 +i* 6.15844E-14| +| 4| 0.581895 +i* 0.813264| 1| 3.05839E-13 +i* 6.52482E-14| +| 5| 0.592048 +i* 0.805902| 1|-7.14016E-13 +i*-3.98882E-14| +| 6| 0.602109 +i* 0.798414| 1| 2.66658E-13 +i*-4.75979E-13| +| 7| 0.612074 +i* 0.7908| 1| 3.16743E-13 +i*-3.40844E-13| +| 8| 0.621943 +i* 0.783062| 1| 5.64146E-13 +i*-3.14632E-13| +| 9| 0.631715 +i* 0.775201| 1|-3.83756E-14 +i* 5.41086E-13| +| 10| 0.641387 +i* 0.767218| 1| 4.00499E-13 +i*-3.71465E-13| +| 11| 0.650958 +i* 0.759114| 1| 7.58768E-15 +i*-5.54055E-13| +| 12| 0.660427 +i* 0.750891| 1| 7.47999E-13 +i* 2.73089E-13| +| 13| 0.669792 +i* 0.742549| 1| 9.40577E-13 +i* 3.39433E-14| +| 14| 0.679051 +i* 0.734091| 1| 4.34264E-13 +i*-1.04887E-13| +| 15| 0.688204 +i* 0.725517| 1|-6.26926E-13 +i*-1.86798E-13| +| 16| 0.697248 +i* 0.71683| 1| 2.2389E-13 +i*-9.46795E-14| +| 17| 0.706183 +i* 0.708029| 1| 4.79186E-13 +i* 4.75144E-13| +| 18| 0.715007 +i* 0.699117| 1| 6.39138E-13 +i* 4.95824E-13| +| 19| 0.723718 +i* 0.690096| 1| -1.2694E-13 +i* 4.44528E-13| +| 20| 0.732316 +i* 0.680965| 1|-2.76158E-13 +i* 1.17734E-13| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 600064 +proc 0 start 0 size 600064 +iter : 1 Arret : 4.88741E-06 s/iter 73.643121 +iter : 2 Arret : 4.97199E-06 s/iter 73.660774 +iter : 3 Arret : 4.86258E-06 s/iter 73.959554 +iter : 4 Arret : 4.28624E-06 s/iter 73.918069 +iter : 5 Arret : 4.70264E-06 s/iter 73.933005 +iter : 6 Arret : 4.85459E-06 s/iter 73.951374 +iter : 7 Arret : 4.4341E-06 s/iter 73.800704 +iter : 8 Arret : 4.56391E-06 s/iter 73.596272 +iter : 9 Arret : 5.75896E-06 s/iter 73.751223 +iter : 10 Arret : 0.000763198 s/iter 73.862761 +iter : 11 Arret : 0.000582931 s/iter 81.937266 +iter : 12 Arret : 0.00224489 s/iter 73.950715 +iter : 13 Arret : 1.80799 s/iter 73.968738 +iter : 14 Arret : 0.0742277 s/iter 74.508413 +iter : 15 Arret : 0.0962999 s/iter 74.277195 +iter : 16 Arret : 0.108643 s/iter 73.517886 +iter : 17 Arret : 0.0724179 s/iter 71.659228 +iter : 18 Arret : 0.105199 s/iter 70.746803 +iter : 19 Arret : 0.146372 s/iter 69.276722 +iter : 20 Arret : 0.117759 s/iter 68.338548 +iter : 21 Arret : 0.00754357 s/iter 67.172870 +iter : 22 Arret : 0.000921826 s/iter 65.662508 +iter : 23 Arret : 0.000616312 s/iter 65.353341 +iter : 24 Arret : 0.00179901 s/iter 65.174928 +iter : 25 Arret : 1.77897E-05 s/iter 65.467629 +iter : 26 Arret : 3.63702E-06 s/iter 65.144205 +iter : 27 Arret : 1.82722E-07 s/iter 65.288149 +iter : 28 Arret : 3.58982E-11 s/iter 64.840549 +iter : 29 Arret : 1.57009E-16 s/iter 64.759606 +temps : 2059.61 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.553493 +i* -0.832854| 1|-5.02858E-13 +i* 3.83374E-15| +| 3| -0.579338 +i* -0.815087| 1| 4.42365E-13 +i* 2.65846E-14| +| 4| 0.592057 +i* 0.805896| 1| 2.06783E-13 +i* 1.94549E-13| +| 5| -0.604613 +i* -0.796519| 1| 2.39135E-13 +i* 2.96967E-13| +| 6| 0.617037 +i* 0.786934| 1|-3.70964E-13 +i* 2.85104E-13| +| 7| -0.629293 +i* -0.777168| 1| 3.4002E-13 +i* 1.14925E-14| +| 8| 0.641411 +i* 0.767198| 1|-6.01835E-13 +i* 5.70316E-13| +| 9| -0.653354 +i* -0.757052| 1| 3.00003E-14 +i* 4.1084E-13| +| 10| 0.665153 +i* 0.746707| 1|-9.55243E-14 +i* 7.739E-13| +| 11| -0.676773 +i* -0.736192| 1|-3.70891E-13 +i* 4.31963E-14| +| 12| 0.688242 +i* 0.725482| 1| 4.17319E-13 +i*-2.25125E-13| +| 13| -0.699526 +i* -0.714607| 1|-1.55074E-13 +i* 3.9467E-13| +| 14| 0.710653 +i* 0.703543| 1|-7.94843E-13 +i* 5.61671E-13| +| 15| -0.721591 +i* -0.69232| 1|-8.20351E-14 +i* 3.39909E-13| +| 16| 0.732366 +i* 0.680912| 1| 5.01595E-13 +i* 2.59279E-13| +| 17| -0.742946 +i* -0.669351| 1|-1.90181E-13 +i* 1.23972E-13| +| 18| 0.753358 +i* 0.657611| 1|-7.14661E-13 +i*-3.96187E-13| +| 19| -0.76357 +i* -0.645725| 1|-3.31242E-13 +i*-8.50865E-14| +| 20| 0.773609 +i* 0.633664| 1|-7.93813E-13 +i* 2.09313E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00051 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 0, start 0 size 700160 +proc 0 start 0 size 700160 +iter : 1 Arret : 4.36089E-06 s/iter 100.538329 +iter : 2 Arret : 4.20009E-06 s/iter 100.086525 +iter : 3 Arret : 4.27261E-06 s/iter 100.410161 +iter : 4 Arret : 3.90142E-06 s/iter 100.336287 +iter : 5 Arret : 3.60563E-06 s/iter 100.308817 +iter : 6 Arret : 3.93135E-06 s/iter 100.373492 +iter : 7 Arret : 3.83714E-06 s/iter 100.283845 +iter : 8 Arret : 3.69157E-06 s/iter 100.391852 +iter : 9 Arret : 4.92428E-06 s/iter 100.459479 +iter : 10 Arret : 9.37908E-05 s/iter 100.446598 +iter : 11 Arret : 0.00213526 s/iter 100.396625 +iter : 12 Arret : 0.002542 s/iter 100.503838 +iter : 13 Arret : 0.0125219 s/iter 100.940510 +iter : 14 Arret : 0.010999 s/iter 109.789990 +iter : 15 Arret : 0.00932865 s/iter 109.205901 +iter : 16 Arret : 0.0450638 s/iter 100.884592 +iter : 17 Arret : 0.184973 s/iter 102.656255 +iter : 18 Arret : 0.0519142 s/iter 101.300314 +iter : 19 Arret : 0.0302111 s/iter 100.763046 +iter : 20 Arret : 0.0177202 s/iter 100.248985 +iter : 21 Arret : 0.00863847 s/iter 99.989614 +iter : 22 Arret : 0.00156575 s/iter 99.794924 +iter : 23 Arret : 0.000367723 s/iter 99.510307 +iter : 24 Arret : 0.000179924 s/iter 99.548317 +iter : 25 Arret : 2.80728E-05 s/iter 99.520822 +iter : 26 Arret : 9.99898E-06 s/iter 99.579748 +iter : 27 Arret : 2.46675E-08 s/iter 99.458855 +iter : 28 Arret : 9.85491E-15 s/iter 99.607347 +temps : 2827.9 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.46263E-08 +Stabilite : 9.85491E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540352 +i* 0.841439| 1| 4.39978E-13 +i* 6.25043E-13| +| 2| -0.996034 +i* 0.0889731| 1| 2.2073E-13 +i* 1.55296E-13| +| 3| 0.439836 +i* -0.898078| 1|-3.55927E-13 +i*-1.21738E-13| +| 4| 0.38266 +i* -0.923889| 1|-2.56142E-13 +i*-7.02285E-14| +| 5| -0.988496 +i* 0.15125| 1|-1.52652E-13 +i*-1.11329E-13| +| 6| 0.641421 +i* 0.767189| 1|-1.31044E-13 +i* 5.61736E-13| +| 7| 0.323979 +i* -0.946064| 1|-4.52336E-13 +i* 8.74596E-14| +| 8| -0.977067 +i* 0.212932| 1| 8.58341E-14 +i* 1.73412E-13| +| 9| 0.688262 +i* 0.725462| 1| 4.28754E-14 +i* 1.08849E-12| +| 10| 0.264022 +i* -0.964517| 1|-3.63883E-13 +i*-8.14886E-14| +| 11| -0.961793 +i* 0.273776| 1| -3.0213E-13 +i*-2.13897E-13| +| 12| 0.732395 +i* 0.68088| 1|-3.65194E-14 +i* 7.95483E-13| +| 13| 0.203027 +i* -0.979173| 1|-3.14502E-13 +i* 2.96924E-13| +| 14| -0.942735 +i* 0.333543| 1| 1.82947E-13 +i*-4.73458E-14| +| 15| 0.773646 +i* 0.633619| 1| 2.24352E-13 +i* 2.79674E-13| +| 16| 0.141232 +i* -0.989977| 1| -1.0035E-13 +i* 1.5693E-13| +| 17| -0.919967 +i* 0.391997| 1| 2.89213E-14 +i*-1.86252E-13| +| 18| 0.811852 +i* 0.583864| 1|-1.59939E-12 +i*-4.13669E-13| +| 19| 0.0788818 +i* -0.996884| 1|-2.83003E-13 +i* 1.04711E-13| +| 20| -0.893578 +i* 0.448908| 1| 4.59736E-14 +i* 1.31414E-13| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 800000 +proc 0 start 0 size 800000 +iter : 1 Arret : 3.83515E-06 s/iter 131.128367 +iter : 2 Arret : 3.31342E-06 s/iter 130.895719 +iter : 3 Arret : 3.46185E-06 s/iter 130.774185 +iter : 4 Arret : 3.77822E-06 s/iter 130.629629 +iter : 5 Arret : 3.54151E-06 s/iter 131.099737 +iter : 6 Arret : 3.39913E-06 s/iter 130.729467 +iter : 7 Arret : 3.37038E-06 s/iter 130.632620 +iter : 8 Arret : 3.66135E-06 s/iter 130.656450 +iter : 9 Arret : 5.18164E-06 s/iter 130.618912 +iter : 10 Arret : 3.60623E-05 s/iter 130.609820 +iter : 11 Arret : 0.000919045 s/iter 130.931691 +iter : 12 Arret : 0.0269508 s/iter 130.735832 +iter : 13 Arret : 2.00753 s/iter 131.562739 +iter : 14 Arret : 0.113163 s/iter 131.675926 +iter : 15 Arret : 0.114468 s/iter 132.383980 +iter : 16 Arret : 0.0343723 s/iter 131.231628 +iter : 17 Arret : 0.0118406 s/iter 126.227547 +iter : 18 Arret : 0.00584689 s/iter 120.723541 +iter : 19 Arret : 0.00603455 s/iter 116.384134 +iter : 20 Arret : 0.00445856 s/iter 111.422234 +iter : 21 Arret : 0.00344019 s/iter 106.222631 +iter : 22 Arret : 0.000542325 s/iter 99.990260 +iter : 23 Arret : 0.00265194 s/iter 95.378338 +iter : 24 Arret : 0.00180528 s/iter 92.586290 +iter : 25 Arret : 4.07819E-06 s/iter 91.103601 +iter : 26 Arret : 1.49379E-06 s/iter 89.796006 +iter : 27 Arret : 7.96771E-09 s/iter 90.012737 +iter : 28 Arret : 1.91442E-14 s/iter 90.007579 +temps : 3326.77 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 1.91442E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| 0.592061 +i* 0.805893| 1|-1.57249E-13 +i*-4.43364E-13| +| 3| 0.617051 +i* 0.786923| 1|-6.42805E-13 +i*-3.49094E-13| +| 4| 0.641434 +i* 0.767178| 1| 1.00022E-12 +i*-5.90578E-13| +| 5| 0.665186 +i* 0.746678| 1|-2.53998E-14 +i*-1.14684E-12| +| 6| 0.688283 +i* 0.725442| 1|-8.68732E-13 +i* 8.52696E-13| +| 7| 0.710703 +i* 0.703493| 1| 2.02581E-13 +i* 4.54699E-13| +| 8| 0.732422 +i* 0.680851| 1|-5.22353E-13 +i*-3.99873E-13| +| 9| 0.753421 +i* 0.657538| 1| 1.23356E-13 +i*-1.05986E-12| +| 10| 0.773678 +i* 0.633579| 1|-6.75196E-13 +i* 3.60108E-13| +| 11| 0.793174 +i* 0.608995| 1| 4.43853E-13 +i*-1.42398E-12| +| 12| 0.811888 +i* 0.583813| 1|-4.10491E-13 +i*-4.46651E-13| +| 13| 0.829804 +i* 0.558055| 1| 1.30045E-12 +i* 1.12788E-13| +| 14| 0.846902 +i* 0.531748| 1|-8.09419E-13 +i* 4.98091E-13| +| 15| 0.863167 +i* 0.504918| 1| 2.98522E-13 +i* 3.81547E-13| +| 16| 0.878582 +i* 0.477591| 1|-3.06581E-13 +i*-6.95869E-13| +| 17| 0.893133 +i* 0.449793| 1| 1.24355E-13 +i* -1.3239E-12| +| 18| 0.906804 +i* 0.421553| 1|-1.23117E-12 +i*-5.57117E-13| +| 19| 0.919582 +i* 0.392898| 1|-1.03648E-12 +i* 2.90445E-14| +| 20| 0.931455 +i* 0.363856| 1|-6.42708E-13 +i*-1.50318E-12| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 diff --git a/Simulations/full_mpi/full_mpi_1GPU.sge b/Simulations/full_mpi/full_mpi_1GPU.sge new file mode 100755 index 0000000..fd35afa --- /dev/null +++ b/Simulations/full_mpi/full_mpi_1GPU.sge @@ -0,0 +1,25 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=1 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -V +#$ -cwd +#$ -N full_mpi_1GPU +#$ -pe mpi 1 + + +module load cuda/7.0 +module load ompi/gcc + +mpirun -np $NSLOTS ./template -r -i 60000 40000 +mpirun -np $NSLOTS ./template -r -i 150000 50000 +mpirun -np $NSLOTS ./template -r -i 250000 150000 +mpirun -np $NSLOTS ./template -r -i 350000 250000 +mpirun -np $NSLOTS ./template -r -i 500000 300000 +mpirun -np $NSLOTS ./template -r -i 600000 400000 +mpirun -np $NSLOTS ./template -r -i 700000 500000 +mpirun -np $NSLOTS ./template -r -i 800000 600000 +#mpirun -np $NSLOTS ./template -r -i 900000 700000 +#mpirun -np $NSLOTS ./template -r -i 1000000 800000 +#mpirun -np $NSLOTS ./template -r -i 1500000 500000 diff --git a/Simulations/full_mpi/full_mpi_2GPU.o140160 b/Simulations/full_mpi/full_mpi_2GPU.o140160 new file mode 100644 index 0000000..8016229 --- /dev/null +++ b/Simulations/full_mpi/full_mpi_2GPU.o140160 @@ -0,0 +1,562 @@ +REMAINING: 2 +Taking GPU #0 +Taking GPU #1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00593 +zone limite de 'log-exp' 1.00593 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 1, start 30080 size 30080 +proc 1 start 30080 size 30080 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 0, start 0 size 30080 +proc 0 start 0 size 30080 +iter : 1 Arret : 3.94715E-05 s/iter 0.376579 +iter : 2 Arret : 4.00498E-05 s/iter 0.376426 +iter : 3 Arret : 3.94982E-05 s/iter 0.376469 +iter : 4 Arret : 3.91196E-05 s/iter 0.376474 +iter : 5 Arret : 4.06401E-05 s/iter 0.376476 +iter : 6 Arret : 4.41482E-05 s/iter 0.376495 +iter : 7 Arret : 5.50716E-05 s/iter 0.376547 +iter : 8 Arret : 0.000118504 s/iter 0.376518 +iter : 9 Arret : 0.00115954 s/iter 0.376505 +iter : 10 Arret : 0.0219062 s/iter 0.376584 +iter : 11 Arret : 2.08077 s/iter 1.164908 +iter : 12 Arret : 0.274053 s/iter 0.376485 +iter : 13 Arret : 0.163438 s/iter 1.196444 +iter : 14 Arret : 0.0502837 s/iter 1.195663 +iter : 15 Arret : 0.0171551 s/iter 1.191447 +iter : 16 Arret : 0.00931569 s/iter 1.183639 +iter : 17 Arret : 0.00645054 s/iter 1.167546 +iter : 18 Arret : 0.00448467 s/iter 0.370707 +iter : 19 Arret : 0.00168489 s/iter 0.366051 +iter : 20 Arret : 0.00126146 s/iter 0.365448 +iter : 21 Arret : 0.0157645 s/iter 0.356946 +iter : 22 Arret : 0.00414432 s/iter 0.349791 +iter : 23 Arret : 0.0293605 s/iter 0.344674 +iter : 24 Arret : 0.000309791 s/iter 0.347406 +iter : 25 Arret : 0.000479548 s/iter 0.344763 +iter : 26 Arret : 0.000172889 s/iter 0.342501 +iter : 27 Arret : 2.54873E-05 s/iter 0.344592 +iter : 28 Arret : 6.36446E-08 s/iter 0.343705 +iter : 29 Arret : 1.95655E-12 s/iter 0.343232 +iter : 30 Arret : 1.11022E-16 s/iter 0.343867 +temps : 15.9313 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.35784E-10 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540783 +i* 0.841162| 1|-7.58456E-14 +i* 3.78031E-14| +| 2| -0.992343 +i* -0.123513| 1|-2.28637E-15 +i*-5.45917E-15| +| 3| 0.0563346 +i* 0.998412| 1| 5.70377E-15 +i* 3.3501E-14| +| 4| -0.802793 +i* -0.596258| 1| 2.03657E-15 +i* 1.01915E-14| +| 5| 0.730552 +i* -0.682857| 1|-7.48429E-14 +i* 6.77011E-14| +| 6| -0.442728 +i* 0.896656| 1|-3.77198E-14 +i*-1.89779E-15| +| 7| -0.404888 +i* -0.914366| 1| 3.20195E-14 +i* 9.65894E-15| +| 8| 0.972126 +i* -0.23446| 1| 4.02421E-14 +i*-1.54755E-14| +| 9| -0.826939 +i* 0.562292| 1| -2.4928E-14 +i*-1.59889E-14| +| 10| 0.0979895 +i* -0.995187| 1| 2.90878E-14 +i*-6.75675E-15| +| 11| 0.961513 +i* 0.27476| 1|-9.39769E-14 +i*-2.63912E-13| +| 12| -0.996627 +i* 0.0820589| 1| 2.39773E-14 +i* 1.74825E-14| +| 13| 0.575447 +i* -0.817839| 1|-3.49894E-14 +i*-7.98545E-14| +| 14| 0.701466 +i* 0.712703| 1| 7.52211E-14 +i* 1.53991E-14| +| 15| 0.259346 +i* 0.965785| 1|-2.14863E-14 +i*-2.81355E-14| +| 16| -0.907773 +i* -0.419461| 1|-3.62869E-14 +i*-9.49414E-15| +| 17| 0.903623 +i* -0.428329| 1|-1.24969E-14 +i* 7.51222E-14| +| 18| -0.249979 +i* 0.968251| 1|-1.59074E-14 +i*-1.09721E-14| +| 19| -0.583341 +i* -0.812227| 1| 1.92242E-14 +i* 2.27058E-14| +| 20| 0.997383 +i* 0.072297| 1| 2.53037E-13 +i*-5.92819E-13| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 1 +proc 1 +proc 0 +zone limite de 'log-exp' 1.00237 +zone limite de 'log-exp' 1.00237 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 1, start 75008 size 75008 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 0, start 0 size 75008 +proc 0 start 0 size 75008 +proc 1 start 75008 size 75008 +iter : 1 Arret : 1.60943E-05 s/iter 2.350355 +iter : 2 Arret : 1.67528E-05 s/iter 2.342992 +iter : 3 Arret : 1.68978E-05 s/iter 2.337485 +iter : 4 Arret : 1.60377E-05 s/iter 2.337553 +iter : 5 Arret : 1.62156E-05 s/iter 2.337558 +iter : 6 Arret : 1.69292E-05 s/iter 2.337450 +iter : 7 Arret : 1.84639E-05 s/iter 2.337768 +iter : 8 Arret : 2.25051E-05 s/iter 2.337545 +iter : 9 Arret : 4.76681E-05 s/iter 2.337634 +iter : 10 Arret : 0.00245562 s/iter 2.337594 +iter : 11 Arret : 0.00371283 s/iter 2.337716 +iter : 12 Arret : 0.010769 s/iter 2.910185 +iter : 13 Arret : 1.55694 s/iter 4.438167 +iter : 14 Arret : 0.116538 s/iter 2.911091 +iter : 15 Arret : 0.0585023 s/iter 3.939639 +iter : 16 Arret : 0.0321741 s/iter 3.902393 +iter : 17 Arret : 0.0186974 s/iter 3.930056 +iter : 18 Arret : 0.00687909 s/iter 3.962909 +iter : 19 Arret : 0.0214989 s/iter 2.321178 +iter : 20 Arret : 0.00865216 s/iter 3.260664 +iter : 21 Arret : 0.0168761 s/iter 3.221472 +iter : 22 Arret : 0.0147692 s/iter 4.261763 +iter : 23 Arret : 0.0125239 s/iter 2.251272 +iter : 24 Arret : 0.000664965 s/iter 2.239406 +iter : 25 Arret : 1.59841E-05 s/iter 2.245565 +iter : 26 Arret : 5.40825E-07 s/iter 2.231696 +iter : 27 Arret : 8.52059E-11 s/iter 2.240876 +iter : 28 Arret : 7.75295E-16 s/iter 2.238326 +temps : 78.4263 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.26535E-09 +Stabilite : 7.75295E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540528 +i* 0.841326| 1| 8.68923E-14 +i* 2.2979E-13| +| 2| -0.905603 +i* -0.424127| 1| 6.50001E-14 +i* -3.0061E-14| +| 3| -0.774122 +i* 0.633037| 1|-3.89619E-14 +i*-6.71876E-14| +| 4| 0.317935 +i* -0.948113| 1| 4.656E-15 +i* 1.15645E-13| +| 5| 0.23606 +i* 0.971739| 1| 2.9924E-14 +i*-1.32854E-13| +| 6| -0.717299 +i* -0.696766| 1| 5.63785E-15 +i*-6.71685E-14| +| 7| 0.992349 +i* -0.123462| 1|-4.81056E-13 +i* 9.00335E-13| +| 8| -0.938482 +i* 0.345329| 1|-6.95555E-14 +i*-3.79159E-14| +| 9| 0.610294 +i* -0.792175| 1| -5.4852E-14 +i*-3.26232E-14| +| 10| -0.0946394 +i* 0.995512| 1|-4.73788E-14 +i*-8.10827E-14| +| 11| -0.450242 +i* -0.892906| 1| 2.41855E-14 +i*-3.23699E-15| +| 12| 0.978218 +i* 0.207583| 1|-2.84429E-13 +i* 4.69725E-13| +| 13| -0.999806 +i* 0.0197069| 1|-4.72365E-14 +i*-2.55716E-14| +| 14| 0.835648 +i* -0.549265| 1|-2.95892E-13 +i* 2.34143E-13| +| 15| -0.414707 +i* 0.909955| 1| 7.26225E-14 +i*-1.70003E-15| +| 16| -0.133754 +i* -0.991015| 1|-2.88485E-14 +i* 2.14499E-14| +| 17| 0.856687 +i* 0.515837| 1| 1.49106E-13 +i* 3.95153E-14| +| 18| -0.951361 +i* -0.308079| 1| 3.78308E-14 +i* 4.65843E-14| +| 19| 0.969257 +i* -0.24605| 1| 5.51163E-13 +i*-4.79498E-13| +| 20| -0.689285 +i* 0.724491| 1| 2.40086E-15 +i*-3.61777E-14| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00142 +zone limite de 'log-exp' 1.00142 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 0, start 0 size 125056 +proc 0 start 0 size 125056 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 1, start 125056 size 125056 +proc 1 start 125056 size 125056 +iter : 1 Arret : 1.04122E-05 s/iter 6.893601 +iter : 2 Arret : 9.66995E-06 s/iter 6.882320 +iter : 3 Arret : 9.55261E-06 s/iter 6.898899 +iter : 4 Arret : 9.22665E-06 s/iter 6.899113 +iter : 5 Arret : 9.50477E-06 s/iter 6.894819 +iter : 6 Arret : 9.562E-06 s/iter 6.896301 +iter : 7 Arret : 9.85225E-06 s/iter 6.898079 +iter : 8 Arret : 1.00444E-05 s/iter 6.895828 +iter : 9 Arret : 1.26197E-05 s/iter 6.906197 +iter : 10 Arret : 0.000374245 s/iter 6.892279 +iter : 11 Arret : 0.000473147 s/iter 6.894504 +iter : 12 Arret : 0.00101736 s/iter 6.894983 +iter : 13 Arret : 0.00428892 s/iter 6.893815 +iter : 14 Arret : 0.0152171 s/iter 6.896640 +iter : 15 Arret : 0.00947972 s/iter 6.813081 +iter : 16 Arret : 0.00590834 s/iter 8.502086 +iter : 17 Arret : 0.0148154 s/iter 4.292037 +iter : 18 Arret : 0.303776 s/iter 4.191474 +iter : 19 Arret : 0.00212739 s/iter 4.153373 +iter : 20 Arret : 0.00703257 s/iter 3.618613 +iter : 21 Arret : 0.00722956 s/iter 5.063281 +iter : 22 Arret : 0.000539584 s/iter 3.599227 +iter : 23 Arret : 0.000175798 s/iter 3.593595 +iter : 24 Arret : 1.72224E-05 s/iter 3.538749 +iter : 25 Arret : 0.000115569 s/iter 3.554657 +iter : 26 Arret : 0.000113543 s/iter 3.546651 +iter : 27 Arret : 4.63885E-05 s/iter 3.544304 +iter : 28 Arret : 1.37358E-05 s/iter 3.565583 +iter : 29 Arret : 2.47356E-07 s/iter 3.564036 +iter : 30 Arret : 2.5459E-12 s/iter 3.540899 +iter : 31 Arret : 1.11022E-16 s/iter 3.548698 +temps : 169.022 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.05316E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540427 +i* 0.841391| 1| 9.7148E-14 +i*-1.98189E-13| +| 2| -0.997949 +i* 0.0640067| 1| 1.02696E-14 +i* 2.88415E-14| +| 3| 0.450991 +i* -0.892528| 1| 2.39739E-15 +i* 7.66835E-14| +| 4| 0.42851 +i* -0.903537| 1| 1.03733E-13 +i* 1.27433E-14| +| 5| -0.996035 +i* 0.0889649| 1| 5.1386E-14 +i* 4.21729E-14| +| 6| 0.581876 +i* 0.813277| 1| 3.29906E-13 +i* -3.5718E-15| +| 7| 0.405761 +i* -0.913979| 1| 1.69923E-13 +i*-8.86062E-14| +| 8| -0.993496 +i* 0.113867| 1| 6.34562E-14 +i* 6.04291E-14| +| 9| 0.60205 +i* 0.798458| 1| 2.39371E-13 +i* -2.2848E-13| +| 10| 0.382757 +i* -0.923849| 1| 6.36852E-14 +i* 1.1601E-13| +| 11| -0.990335 +i* 0.138698| 1| 8.32286E-14 +i* 4.57395E-14| +| 12| 0.621846 +i* 0.783139| 1| 3.5482E-14 +i*-1.57841E-13| +| 13| 0.359514 +i* -0.93314| 1| 1.00985E-13 +i*-2.52237E-13| +| 14| -0.986553 +i* 0.163442| 1| 3.24636E-14 +i* 4.58574E-14| +| 15| 0.641253 +i* 0.767329| 1| 1.79533E-13 +i* 3.03096E-13| +| 16| 0.336045 +i* -0.941846| 1| 1.38948E-13 +i*-8.14071E-14| +| 17| -0.982153 +i* 0.188084| 1| 6.94549E-14 +i* 3.09405E-14| +| 18| 0.660258 +i* 0.751039| 1| 4.21871E-13 +i* 5.02185E-14| +| 19| 0.312366 +i* -0.949962| 1|-6.37199E-14 +i*-7.39669E-14| +| 20| -0.977138 +i* 0.212608| 1|-3.80633E-14 +i* -8.4285E-14| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 1 +proc 1 +proc 0 +zone limite de 'log-exp' 1.00101 +zone limite de 'log-exp' 1.00101 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 1, start 175104 size 175104 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 0, start 0 size 175104 +proc 0 start 0 size 175104 +proc 1 start 175104 size 175104 +iter : 1 Arret : 7.23955E-06 s/iter 12.988714 +iter : 2 Arret : 8.17362E-06 s/iter 12.961404 +iter : 3 Arret : 7.81796E-06 s/iter 12.964651 +iter : 4 Arret : 7.21292E-06 s/iter 12.968827 +iter : 5 Arret : 7.55071E-06 s/iter 12.967829 +iter : 6 Arret : 7.49029E-06 s/iter 12.964916 +iter : 7 Arret : 7.62064E-06 s/iter 12.963339 +iter : 8 Arret : 7.80044E-06 s/iter 12.963493 +iter : 9 Arret : 9.75039E-06 s/iter 12.964925 +iter : 10 Arret : 0.000863071 s/iter 12.969839 +iter : 11 Arret : 0.000849607 s/iter 12.969054 +iter : 12 Arret : 0.00104766 s/iter 12.964139 +iter : 13 Arret : 0.831471 s/iter 12.972067 +iter : 14 Arret : 3.38426 s/iter 12.966001 +iter : 15 Arret : 0.107189 s/iter 12.934545 +iter : 16 Arret : 0.0542638 s/iter 16.933464 +iter : 17 Arret : 0.0319719 s/iter 16.802921 +iter : 18 Arret : 0.0123162 s/iter 17.515009 +iter : 19 Arret : 0.021246 s/iter 17.702219 +iter : 20 Arret : 0.0113278 s/iter 17.796152 +iter : 21 Arret : 0.0245772 s/iter 17.074640 +iter : 22 Arret : 0.00540155 s/iter 17.506599 +iter : 23 Arret : 0.00765026 s/iter 12.838465 +iter : 24 Arret : 0.0115831 s/iter 12.839289 +iter : 25 Arret : 0.0115203 s/iter 12.887210 +iter : 26 Arret : 0.000774924 s/iter 12.835436 +iter : 27 Arret : 0.000228102 s/iter 12.835530 +iter : 28 Arret : 0.000225979 s/iter 12.834198 +iter : 29 Arret : 2.70389E-05 s/iter 12.835221 +iter : 30 Arret : 1.29617E-05 s/iter 12.835156 +iter : 31 Arret : 1.12344E-06 s/iter 12.834214 +iter : 32 Arret : 1.60825E-09 s/iter 12.834300 +iter : 33 Arret : 5.97777E-15 s/iter 12.836140 +temps : 457.417 seconde(s) +Nb iterations : 33 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.46096E-08 +Stabilite : 5.97777E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540399 +i* 0.841409| 1| 5.12961E-13 +i*-3.37404E-15| +| 2| -0.385479 +i* 0.922716| 1| -1.616E-13 +i*-2.73566E-14| +| 3| -0.770131 +i* 0.637886| 1|-1.38431E-15 +i* 1.70921E-13| +| 4| -0.978357 +i* 0.206925| 1|-3.07393E-15 +i* 4.96131E-15| +| 5| -0.962455 +i* -0.27144| 1|-5.85088E-14 +i* 7.9714E-14| +| 6| -0.72607 +i* -0.687621| 1| -2.0612E-14 +i* 2.87948E-13| +| 7| -0.323352 +i* -0.946279| 1| 2.27159E-13 +i* 7.30891E-14| +| 8| 0.153441 +i* -0.988158| 1| 2.08479E-14 +i* 5.5551E-14| +| 9| 0.595097 +i* -0.803654| 1|-3.46265E-13 +i* 1.60098E-14| +| 10| 0.900408 +i* -0.435047| 1| 3.20081E-13 +i*-1.77827E-14| +| 11| 0.999448 +i* 0.0332229| 1|-5.70342E-13 +i* 1.21308E-12| +| 12| 0.869529 +i* 0.493882| 1| 3.01252E-14 +i* 6.11216E-13| +| 13| 0.211292 +i* 0.977423| 1|-6.97532E-14 +i* 1.23212E-13| +| 14| -0.267139 +i* 0.963658| 1|-9.26238E-14 +i*-7.20968E-14| +| 15| -0.684372 +i* 0.729133| 1| 1.64042E-13 +i*-1.89831E-14| +| 16| -0.944825 +i* 0.327574| 1| 3.70572E-14 +i*-6.84904E-14| +| 17| -0.988833 +i* -0.149027| 1|-1.41002E-13 +i* 2.02581E-14| +| 18| -0.806314 +i* -0.591488| 1| 1.24668E-13 +i*-2.62805E-13| +| 19| -0.439079 +i* -0.898448| 1|-1.76949E-13 +i*-1.05707E-13| +| 20| 0.0287415 +i* -0.999587| 1| 1.62724E-13 +i*-6.82891E-14| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00071 +zone limite de 'log-exp' 1.00071 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 1, start 250112 size 250112 +proc 1 start 250112 size 250112 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 0, start 0 size 250112 +proc 0 start 0 size 250112 +iter : 1 Arret : 4.9348E-06 s/iter 26.306811 +iter : 2 Arret : 5.74497E-06 s/iter 26.125397 +iter : 3 Arret : 5.90879E-06 s/iter 26.122962 +iter : 4 Arret : 5.45965E-06 s/iter 26.117846 +iter : 5 Arret : 5.51053E-06 s/iter 26.113294 +iter : 6 Arret : 5.44166E-06 s/iter 26.107906 +iter : 7 Arret : 5.61587E-06 s/iter 26.108065 +iter : 8 Arret : 5.37769E-06 s/iter 26.112535 +iter : 9 Arret : 6.392E-06 s/iter 26.112787 +iter : 10 Arret : 0.000222412 s/iter 26.105165 +iter : 11 Arret : 0.00364174 s/iter 26.108847 +iter : 12 Arret : 0.00224664 s/iter 28.294492 +iter : 13 Arret : 0.00428508 s/iter 29.203574 +iter : 14 Arret : 0.00509531 s/iter 32.497063 +iter : 15 Arret : 0.00237252 s/iter 26.034125 +iter : 16 Arret : 0.0225054 s/iter 21.475326 +iter : 17 Arret : 1.39022 s/iter 22.775590 +iter : 18 Arret : 0.0380632 s/iter 21.509248 +iter : 19 Arret : 0.0147501 s/iter 20.099820 +iter : 20 Arret : 0.0175634 s/iter 15.352961 +iter : 21 Arret : 0.00896774 s/iter 19.613858 +iter : 22 Arret : 0.00146838 s/iter 16.233299 +iter : 23 Arret : 0.000316321 s/iter 13.214624 +iter : 24 Arret : 0.000122654 s/iter 13.000460 +iter : 25 Arret : 4.91927E-05 s/iter 12.525060 +iter : 26 Arret : 2.33271E-06 s/iter 11.550850 +iter : 27 Arret : 3.0703E-06 s/iter 11.616325 +iter : 28 Arret : 4.34623E-07 s/iter 11.570420 +iter : 29 Arret : 4.32022E-10 s/iter 11.514451 +iter : 30 Arret : 1.24127E-15 s/iter 11.583468 +temps : 637.538 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.48768E-08 +Stabilite : 1.24127E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540372 +i* 0.841426| 1|-3.05235E-13 +i* 1.38721E-13| +| 2| 0.561316 +i* 0.827602| 1|-2.60021E-13 +i* 1.9206E-13| +| 3| 0.57165 +i* 0.820497| 1|-1.83308E-13 +i* 6.15844E-14| +| 4| 0.581895 +i* 0.813264| 1| 3.05839E-13 +i* 6.52482E-14| +| 5| 0.592048 +i* 0.805902| 1|-7.14016E-13 +i*-3.98882E-14| +| 6| 0.602109 +i* 0.798414| 1| 2.66658E-13 +i*-4.75979E-13| +| 7| 0.612074 +i* 0.7908| 1| 3.16743E-13 +i*-3.40844E-13| +| 8| 0.621943 +i* 0.783062| 1| 5.64146E-13 +i*-3.14632E-13| +| 9| 0.631715 +i* 0.775201| 1|-3.83756E-14 +i* 5.41086E-13| +| 10| 0.641387 +i* 0.767218| 1| 4.00499E-13 +i*-3.71465E-13| +| 11| 0.650958 +i* 0.759114| 1| 7.58768E-15 +i*-5.54055E-13| +| 12| 0.660427 +i* 0.750891| 1| 7.47999E-13 +i* 2.73089E-13| +| 13| 0.669792 +i* 0.742549| 1| 9.40577E-13 +i* 3.39433E-14| +| 14| 0.679051 +i* 0.734091| 1| 4.34264E-13 +i*-1.04887E-13| +| 15| 0.688204 +i* 0.725517| 1|-6.26926E-13 +i*-1.86798E-13| +| 16| 0.697248 +i* 0.71683| 1| 2.2389E-13 +i*-9.46795E-14| +| 17| 0.706183 +i* 0.708029| 1| 4.79186E-13 +i* 4.75144E-13| +| 18| 0.715007 +i* 0.699117| 1| 6.39138E-13 +i* 4.95824E-13| +| 19| 0.723718 +i* 0.690096| 1| -1.2694E-13 +i* 4.44528E-13| +| 20| 0.732316 +i* 0.680965| 1|-2.76158E-13 +i* 1.17734E-13| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 1, start 300032 size 300032 +proc 1 start 300032 size 300032 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 300032 +proc 0 start 0 size 300032 +iter : 1 Arret : 4.75638E-06 s/iter 37.194622 +iter : 2 Arret : 4.76706E-06 s/iter 37.169379 +iter : 3 Arret : 4.56609E-06 s/iter 37.187098 +iter : 4 Arret : 4.96449E-06 s/iter 37.189698 +iter : 5 Arret : 4.6101E-06 s/iter 37.190980 +iter : 6 Arret : 4.67386E-06 s/iter 37.170837 +iter : 7 Arret : 4.4173E-06 s/iter 37.184958 +iter : 8 Arret : 4.5841E-06 s/iter 37.189119 +iter : 9 Arret : 5.81936E-06 s/iter 37.194076 +iter : 10 Arret : 9.61381E-05 s/iter 37.202796 +iter : 11 Arret : 0.00253702 s/iter 37.201994 +iter : 12 Arret : 0.00382237 s/iter 43.720161 +iter : 13 Arret : 1.98237 s/iter 37.268722 +iter : 14 Arret : 0.139529 s/iter 43.928325 +iter : 15 Arret : 0.0833681 s/iter 37.165670 +iter : 16 Arret : 0.0902433 s/iter 37.013464 +iter : 17 Arret : 0.0538083 s/iter 36.747709 +iter : 18 Arret : 0.0285517 s/iter 42.040931 +iter : 19 Arret : 0.0244232 s/iter 35.402712 +iter : 20 Arret : 0.0156356 s/iter 34.951257 +iter : 21 Arret : 0.00306159 s/iter 34.044015 +iter : 22 Arret : 0.00259881 s/iter 33.314225 +iter : 23 Arret : 0.0020894 s/iter 33.562042 +iter : 24 Arret : 0.000144328 s/iter 32.902500 +iter : 25 Arret : 4.2377E-05 s/iter 32.909701 +iter : 26 Arret : 7.50207E-06 s/iter 33.017508 +iter : 27 Arret : 4.17723E-07 s/iter 32.694117 +iter : 28 Arret : 3.57073E-10 s/iter 32.849709 +iter : 29 Arret : 1.04738E-15 s/iter 32.706464 +temps : 1055.82 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.553493 +i* -0.832854| 1|-5.02858E-13 +i* 3.83374E-15| +| 3| -0.579338 +i* -0.815087| 1| 4.42365E-13 +i* 2.65846E-14| +| 4| 0.592057 +i* 0.805896| 1| 2.06783E-13 +i* 1.94549E-13| +| 5| -0.604613 +i* -0.796519| 1| 2.39135E-13 +i* 2.96967E-13| +| 6| 0.617037 +i* 0.786934| 1|-3.70964E-13 +i* 2.85104E-13| +| 7| -0.629293 +i* -0.777168| 1| 3.4002E-13 +i* 1.14925E-14| +| 8| 0.641411 +i* 0.767198| 1|-6.01835E-13 +i* 5.70316E-13| +| 9| -0.653354 +i* -0.757052| 1| 3.00003E-14 +i* 4.1084E-13| +| 10| 0.665153 +i* 0.746707| 1|-9.55243E-14 +i* 7.739E-13| +| 11| -0.676773 +i* -0.736192| 1|-3.70891E-13 +i* 4.31963E-14| +| 12| 0.688242 +i* 0.725482| 1| 4.17319E-13 +i*-2.25125E-13| +| 13| -0.699526 +i* -0.714607| 1|-1.55074E-13 +i* 3.9467E-13| +| 14| 0.710653 +i* 0.703543| 1|-7.94843E-13 +i* 5.61671E-13| +| 15| -0.721591 +i* -0.69232| 1|-8.20351E-14 +i* 3.39909E-13| +| 16| 0.732366 +i* 0.680912| 1| 5.01595E-13 +i* 2.59279E-13| +| 17| -0.742946 +i* -0.669351| 1|-1.90181E-13 +i* 1.23972E-13| +| 18| 0.753358 +i* 0.657611| 1|-7.14661E-13 +i*-3.96187E-13| +| 19| -0.76357 +i* -0.645725| 1|-3.31242E-13 +i*-8.50865E-14| +| 20| 0.773609 +i* 0.633664| 1|-7.93813E-13 +i* 2.09313E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00051 +zone limite de 'log-exp' 1.00051 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 1, start 350080 size 350080 +proc 1 start 350080 size 350080 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 0, start 0 size 350080 +proc 0 start 0 size 350080 +iter : 1 Arret : 4.07504E-06 s/iter 50.276924 +iter : 2 Arret : 4.14637E-06 s/iter 50.316736 +iter : 3 Arret : 3.92125E-06 s/iter 50.311941 +iter : 4 Arret : 3.96177E-06 s/iter 50.319644 +iter : 5 Arret : 3.60866E-06 s/iter 50.315146 +iter : 6 Arret : 3.73875E-06 s/iter 50.345034 +iter : 7 Arret : 3.91631E-06 s/iter 50.311163 +iter : 8 Arret : 3.82723E-06 s/iter 50.332321 +iter : 9 Arret : 4.24177E-06 s/iter 50.340320 +iter : 10 Arret : 9.18215E-05 s/iter 50.349367 +iter : 11 Arret : 0.000848166 s/iter 50.316912 +iter : 12 Arret : 0.00161125 s/iter 50.303456 +iter : 13 Arret : 0.0024668 s/iter 57.717511 +iter : 14 Arret : 0.00479788 s/iter 53.570757 +iter : 15 Arret : 0.00495555 s/iter 52.732469 +iter : 16 Arret : 0.0099658 s/iter 51.316983 +iter : 17 Arret : 0.0910784 s/iter 52.848267 +iter : 18 Arret : 0.0669533 s/iter 53.379948 +iter : 19 Arret : 0.196091 s/iter 50.742367 +iter : 20 Arret : 0.0404469 s/iter 53.773228 +iter : 21 Arret : 0.0140031 s/iter 50.742372 +iter : 22 Arret : 0.00221639 s/iter 52.968592 +iter : 23 Arret : 0.00849041 s/iter 50.251971 +iter : 24 Arret : 0.00450336 s/iter 50.017079 +iter : 25 Arret : 0.000556405 s/iter 50.012361 +iter : 26 Arret : 2.14523E-05 s/iter 50.016154 +iter : 27 Arret : 3.07624E-05 s/iter 50.035967 +iter : 28 Arret : 4.85785E-07 s/iter 49.957854 +iter : 29 Arret : 3.24294E-13 s/iter 50.017899 +temps : 1484.54 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.46263E-08 +Stabilite : 3.24294E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540352 +i* 0.841439| 1| 4.39978E-13 +i* 6.25043E-13| +| 2| -0.996034 +i* 0.0889731| 1| 2.2073E-13 +i* 1.55296E-13| +| 3| 0.439836 +i* -0.898078| 1|-3.55927E-13 +i*-1.21738E-13| +| 4| 0.38266 +i* -0.923889| 1|-2.56142E-13 +i*-7.02285E-14| +| 5| -0.988496 +i* 0.15125| 1|-1.52652E-13 +i*-1.11329E-13| +| 6| 0.641421 +i* 0.767189| 1|-1.31044E-13 +i* 5.61736E-13| +| 7| 0.323979 +i* -0.946064| 1|-4.52336E-13 +i* 8.74596E-14| +| 8| -0.977067 +i* 0.212932| 1| 8.58341E-14 +i* 1.73412E-13| +| 9| 0.688262 +i* 0.725462| 1| 4.28754E-14 +i* 1.08849E-12| +| 10| 0.264022 +i* -0.964517| 1|-3.63883E-13 +i*-8.14886E-14| +| 11| -0.961793 +i* 0.273776| 1| -3.0213E-13 +i*-2.13897E-13| +| 12| 0.732395 +i* 0.68088| 1|-3.65194E-14 +i* 7.95483E-13| +| 13| 0.203027 +i* -0.979173| 1|-3.14502E-13 +i* 2.96924E-13| +| 14| -0.942735 +i* 0.333543| 1| 1.82947E-13 +i*-4.73458E-14| +| 15| 0.773646 +i* 0.633619| 1| 2.24352E-13 +i* 2.79674E-13| +| 16| 0.141232 +i* -0.989977| 1| -1.0035E-13 +i* 1.5693E-13| +| 17| -0.919967 +i* 0.391997| 1| 2.89213E-14 +i*-1.86252E-13| +| 18| 0.811852 +i* 0.583864| 1|-1.59939E-12 +i*-4.13669E-13| +| 19| 0.0788818 +i* -0.996884| 1|-2.83003E-13 +i* 1.04711E-13| +| 20| -0.893578 +i* 0.448908| 1| 4.59736E-14 +i* 1.31414E-13| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 1, start 400000 size 400000 +proc 1 start 400000 size 400000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 400000 +proc 0 start 0 size 400000 +iter : 1 Arret : 3.43314E-06 s/iter 66.451646 +iter : 2 Arret : 3.25458E-06 s/iter 66.371208 +iter : 3 Arret : 3.1756E-06 s/iter 66.365954 +iter : 4 Arret : 3.16632E-06 s/iter 66.323972 +iter : 5 Arret : 3.35307E-06 s/iter 66.379156 +iter : 6 Arret : 3.06929E-06 s/iter 66.310093 +iter : 7 Arret : 3.05638E-06 s/iter 66.375498 +iter : 8 Arret : 3.30698E-06 s/iter 66.345679 +iter : 9 Arret : 4.07579E-06 s/iter 66.346425 +iter : 10 Arret : 1.06648E-05 s/iter 66.343012 +iter : 11 Arret : 0.00084876 s/iter 66.372100 +iter : 12 Arret : 0.00143415 s/iter 66.363225 +iter : 13 Arret : 1.46402 s/iter 66.856335 +iter : 14 Arret : 0.713405 s/iter 68.042881 +iter : 15 Arret : 2.95761 s/iter 73.478889 +iter : 16 Arret : 0.205334 s/iter 66.190886 +iter : 17 Arret : 0.294322 s/iter 63.619134 +iter : 18 Arret : 0.0487392 s/iter 60.944788 +iter : 19 Arret : 0.0248874 s/iter 62.800018 +iter : 20 Arret : 0.0170499 s/iter 62.693475 +iter : 21 Arret : 0.00846661 s/iter 60.956662 +iter : 22 Arret : 0.0198831 s/iter 55.137303 +iter : 23 Arret : 0.00364888 s/iter 51.869775 +iter : 24 Arret : 2.68554E-05 s/iter 47.810142 +iter : 25 Arret : 2.14844E-05 s/iter 46.502062 +iter : 26 Arret : 4.9054E-06 s/iter 46.126008 +iter : 27 Arret : 4.4697E-07 s/iter 45.649153 +iter : 28 Arret : 7.89107E-11 s/iter 45.613504 +iter : 29 Arret : 2.23773E-16 s/iter 45.669074 +temps : 1766.95 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 2.23773E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| 0.592061 +i* 0.805893| 1|-1.57249E-13 +i*-4.43364E-13| +| 3| 0.617051 +i* 0.786923| 1|-6.42805E-13 +i*-3.49094E-13| +| 4| 0.641434 +i* 0.767178| 1| 1.00022E-12 +i*-5.90578E-13| +| 5| 0.665186 +i* 0.746678| 1|-2.53998E-14 +i*-1.14684E-12| +| 6| 0.688283 +i* 0.725442| 1|-8.68732E-13 +i* 8.52696E-13| +| 7| 0.710703 +i* 0.703493| 1| 2.02581E-13 +i* 4.54699E-13| +| 8| 0.732422 +i* 0.680851| 1|-5.22353E-13 +i*-3.99873E-13| +| 9| 0.753421 +i* 0.657538| 1| 1.23356E-13 +i*-1.05986E-12| +| 10| 0.773678 +i* 0.633579| 1|-6.75196E-13 +i* 3.60108E-13| +| 11| 0.793174 +i* 0.608995| 1| 4.43853E-13 +i*-1.42398E-12| +| 12| 0.811888 +i* 0.583813| 1|-4.10491E-13 +i*-4.46651E-13| +| 13| 0.829804 +i* 0.558055| 1| 1.30045E-12 +i* 1.12788E-13| +| 14| 0.846902 +i* 0.531748| 1|-8.09419E-13 +i* 4.98091E-13| +| 15| 0.863167 +i* 0.504918| 1| 2.98522E-13 +i* 3.81547E-13| +| 16| 0.878582 +i* 0.477591| 1|-3.06581E-13 +i*-6.95869E-13| +| 17| 0.893133 +i* 0.449793| 1| 1.24355E-13 +i* -1.3239E-12| +| 18| 0.906804 +i* 0.421553| 1|-1.23117E-12 +i*-5.57117E-13| +| 19| 0.919582 +i* 0.392898| 1|-1.03648E-12 +i* 2.90445E-14| +| 20| 0.931455 +i* 0.363856| 1|-6.42708E-13 +i*-1.50318E-12| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 diff --git a/Simulations/full_mpi/full_mpi_2GPU.sge b/Simulations/full_mpi/full_mpi_2GPU.sge new file mode 100755 index 0000000..ea411bb --- /dev/null +++ b/Simulations/full_mpi/full_mpi_2GPU.sge @@ -0,0 +1,25 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=2 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -V +#$ -cwd +#$ -N full_mpi_2GPU +#$ -pe mpi 2 + + +module load cuda/7.0 +module load ompi/gcc + +mpirun -np $NSLOTS ./template -r -i 60000 40000 +mpirun -np $NSLOTS ./template -r -i 150000 50000 +mpirun -np $NSLOTS ./template -r -i 250000 150000 +mpirun -np $NSLOTS ./template -r -i 350000 250000 +mpirun -np $NSLOTS ./template -r -i 500000 300000 +mpirun -np $NSLOTS ./template -r -i 600000 400000 +mpirun -np $NSLOTS ./template -r -i 700000 500000 +mpirun -np $NSLOTS ./template -r -i 800000 600000 +#mpirun -np $NSLOTS ./template -r -i 900000 700000 +#mpirun -np $NSLOTS ./template -r -i 1000000 800000 +#mpirun -np $NSLOTS ./template -r -i 1500000 500000 diff --git a/Simulations/full_mpi/full_mpi_3GPU.o140159 b/Simulations/full_mpi/full_mpi_3GPU.o140159 new file mode 100644 index 0000000..158cd8f --- /dev/null +++ b/Simulations/full_mpi/full_mpi_3GPU.o140159 @@ -0,0 +1,604 @@ +REMAINING: 3 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +proc 1 +proc 2 +proc 0 +zone limite de 'log-exp' 1.00593 +zone limite de 'log-exp' 1.00593 +zone limite de 'log-exp' 1.00593 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 1, start 20053 size 20053 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 0, start 0 size 20053 +proc 0 start 0 size 20053 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 2, start 40106 size 20053 +proc 2 start 40106 size 20053 +proc 1 start 20053 size 20053 +iter : 1 Arret : 4.51053E-05 s/iter 0.366915 +iter : 2 Arret : 3.79748E-05 s/iter 0.366823 +iter : 3 Arret : 3.83563E-05 s/iter 0.366880 +iter : 4 Arret : 3.91196E-05 s/iter 0.366902 +iter : 5 Arret : 4.35007E-05 s/iter 0.366756 +iter : 6 Arret : 4.41483E-05 s/iter 0.366710 +iter : 7 Arret : 5.50718E-05 s/iter 0.366766 +iter : 8 Arret : 0.000118505 s/iter 0.366821 +iter : 9 Arret : 0.00208632 s/iter 0.366803 +iter : 10 Arret : 0.0219374 s/iter 0.366869 +iter : 11 Arret : 2.12364 s/iter 1.163790 +iter : 12 Arret : 0.290713 s/iter 0.366853 +iter : 13 Arret : 0.144909 s/iter 1.195713 +iter : 14 Arret : 0.0571799 s/iter 1.188579 +iter : 15 Arret : 0.017729 s/iter 1.192088 +iter : 16 Arret : 0.00942695 s/iter 1.186675 +iter : 17 Arret : 0.00614493 s/iter 1.170362 +iter : 18 Arret : 0.0046828 s/iter 1.012161 +iter : 19 Arret : 0.0210424 s/iter 0.356542 +iter : 20 Arret : 0.0167084 s/iter 0.355054 +iter : 21 Arret : 0.00421459 s/iter 0.348901 +iter : 22 Arret : 0.00178855 s/iter 0.342348 +iter : 23 Arret : 0.00897727 s/iter 0.340678 +iter : 24 Arret : 0.00287444 s/iter 0.336510 +iter : 25 Arret : 0.000362565 s/iter 0.336936 +iter : 26 Arret : 0.000252972 s/iter 0.337141 +iter : 27 Arret : 3.73204E-05 s/iter 0.328363 +iter : 28 Arret : 8.45973E-06 s/iter 0.334747 +iter : 29 Arret : 1.8159E-08 s/iter 0.324239 +iter : 30 Arret : 5.61914E-13 s/iter 0.337980 +temps : 16.3645 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.35784E-10 +Stabilite : 5.61914E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540783 +i* 0.841162| 1|-7.58456E-14 +i* 3.78031E-14| +| 2| -0.992343 +i* -0.123513| 1|-4.36456E-15 +i* 3.59435E-15| +| 3| 0.0563346 +i* 0.998412| 1| 5.70377E-15 +i* 3.3501E-14| +| 4| -0.802793 +i* -0.596258| 1| 2.03657E-15 +i* 1.01915E-14| +| 5| 0.730552 +i* -0.682857| 1|-7.48429E-14 +i* 6.77011E-14| +| 6| -0.442728 +i* 0.896656| 1|-3.77198E-14 +i*-1.89779E-15| +| 7| -0.404888 +i* -0.914366| 1| 3.20195E-14 +i* 9.65894E-15| +| 8| 0.972126 +i* -0.23446| 1| 4.02421E-14 +i*-1.54755E-14| +| 9| -0.826939 +i* 0.562292| 1| -2.4928E-14 +i*-1.59889E-14| +| 10| 0.0979895 +i* -0.995187| 1| 2.90878E-14 +i*-6.75675E-15| +| 11| 0.961513 +i* 0.27476| 1|-9.39769E-14 +i*-2.63912E-13| +| 12| -0.996627 +i* 0.0820589| 1| 2.39773E-14 +i* 1.74825E-14| +| 13| 0.575447 +i* -0.817839| 1|-3.49894E-14 +i*-7.98545E-14| +| 14| 0.701466 +i* 0.712703| 1| 7.52211E-14 +i* 1.53991E-14| +| 15| 0.259346 +i* 0.965785| 1|-2.14863E-14 +i*-2.81355E-14| +| 16| -0.907773 +i* -0.419461| 1|-3.62869E-14 +i*-9.49414E-15| +| 17| 0.903623 +i* -0.428329| 1|-1.24969E-14 +i* 7.51222E-14| +| 18| -0.249979 +i* 0.968251| 1|-1.59074E-14 +i*-1.09721E-14| +| 19| -0.583426 +i* -0.812166| 1| 4.94882E-14 +i*-9.16107E-15| +| 20| 0.997383 +i* 0.072297| 1| 2.53037E-13 +i*-5.92819E-13| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 1 +proc 1 +proc 2 +proc 0 +zone limite de 'log-exp' 1.00237 +zone limite de 'log-exp' 1.00237 +zone limite de 'log-exp' 1.00237 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 1, start 50005 size 50005 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 0, start 0 size 50005 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 2, start 100010 size 50005 +proc 1 start 50005 size 50005 +proc 0 start 0 size 50005 +proc 2 start 100010 size 50005 +iter : 1 Arret : 1.83619E-05 s/iter 1.833058 +iter : 2 Arret : 1.73853E-05 s/iter 1.832458 +iter : 3 Arret : 1.70553E-05 s/iter 1.832448 +iter : 4 Arret : 1.72513E-05 s/iter 1.832684 +iter : 5 Arret : 1.69749E-05 s/iter 1.832295 +iter : 6 Arret : 1.78708E-05 s/iter 1.832450 +iter : 7 Arret : 2.02323E-05 s/iter 1.832391 +iter : 8 Arret : 2.61959E-05 s/iter 1.832666 +iter : 9 Arret : 0.000263463 s/iter 1.832325 +iter : 10 Arret : 0.00201062 s/iter 1.832469 +iter : 11 Arret : 0.0177962 s/iter 1.832459 +iter : 12 Arret : 0.00945112 s/iter 1.832643 +iter : 13 Arret : 1.13842 s/iter 3.083910 +iter : 14 Arret : 0.0340957 s/iter 3.886935 +iter : 15 Arret : 0.0812119 s/iter 1.824686 +iter : 16 Arret : 0.16371 s/iter 3.884591 +iter : 17 Arret : 0.0770217 s/iter 3.594364 +iter : 18 Arret : 0.0145081 s/iter 3.552164 +iter : 19 Arret : 0.00446866 s/iter 2.726939 +iter : 20 Arret : 0.00786537 s/iter 1.794160 +iter : 21 Arret : 0.0166355 s/iter 1.779567 +iter : 22 Arret : 0.0278383 s/iter 2.763164 +iter : 23 Arret : 0.00838616 s/iter 1.758182 +iter : 24 Arret : 0.000453907 s/iter 1.764407 +iter : 25 Arret : 3.67653E-05 s/iter 1.749282 +iter : 26 Arret : 1.55532E-05 s/iter 1.735726 +iter : 27 Arret : 9.01062E-07 s/iter 1.753730 +iter : 28 Arret : 4.37903E-10 s/iter 1.730440 +iter : 29 Arret : 3.95673E-15 s/iter 1.728429 +temps : 63.3058 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.26535E-09 +Stabilite : 3.95673E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540528 +i* 0.841326| 1| 8.68923E-14 +i* 2.2979E-13| +| 2| -0.905603 +i* -0.424127| 1| 6.50001E-14 +i* -3.0061E-14| +| 3| -0.774122 +i* 0.633037| 1|-3.89619E-14 +i*-6.71876E-14| +| 4| 0.317935 +i* -0.948113| 1| 4.656E-15 +i* 1.15645E-13| +| 5| 0.235775 +i* 0.971808| 1|-4.13627E-14 +i* -1.0803E-13| +| 6| -0.717299 +i* -0.696766| 1| 5.63785E-15 +i*-6.71685E-14| +| 7| 0.992349 +i* -0.123462| 1|-4.81056E-13 +i* 9.00335E-13| +| 8| -0.938482 +i* 0.345329| 1|-6.95555E-14 +i*-3.79159E-14| +| 9| 0.610294 +i* -0.792175| 1| -5.4852E-14 +i*-3.26232E-14| +| 10| -0.0945977 +i* 0.995516| 1| 4.45165E-14 +i* 9.42527E-14| +| 11| -0.450242 +i* -0.892906| 1| 2.41855E-14 +i*-3.23699E-15| +| 12| 0.978218 +i* 0.207583| 1|-2.84429E-13 +i* 4.69725E-13| +| 13| -0.999806 +i* 0.0197069| 1|-4.72365E-14 +i*-2.55716E-14| +| 14| 0.835648 +i* -0.549265| 1|-2.95892E-13 +i* 2.34143E-13| +| 15| -0.414707 +i* 0.909955| 1| 7.26225E-14 +i*-1.70003E-15| +| 16| -0.133754 +i* -0.991015| 1|-2.88485E-14 +i* 2.14499E-14| +| 17| 0.856687 +i* 0.515837| 1| 1.49106E-13 +i* 3.95153E-14| +| 18| -0.951361 +i* -0.308079| 1| 3.78308E-14 +i* 4.65843E-14| +| 19| 0.969257 +i* -0.24605| 1| 5.51163E-13 +i*-4.79498E-13| +| 20| -0.689285 +i* 0.724491| 1| 2.40086E-15 +i*-3.61777E-14| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1 +proc 1 +proc 2 +proc 0 +zone limite de 'log-exp' 1.00142 +zone limite de 'log-exp' 1.00142 +zone limite de 'log-exp' 1.00142 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 1, start 83370 size 83370 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 2, start 166740 size 83370 +proc 2 start 166740 size 83370 +proc 1 start 83370 size 83370 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 0, start 0 size 83370 +proc 0 start 0 size 83370 +iter : 1 Arret : 1.04122E-05 s/iter 4.603075 +iter : 2 Arret : 9.85149E-06 s/iter 4.604055 +iter : 3 Arret : 1.14683E-05 s/iter 4.603262 +iter : 4 Arret : 1.02226E-05 s/iter 4.602431 +iter : 5 Arret : 1.00729E-05 s/iter 4.602619 +iter : 6 Arret : 1.06838E-05 s/iter 4.601869 +iter : 7 Arret : 1.12564E-05 s/iter 4.604882 +iter : 8 Arret : 1.08854E-05 s/iter 4.602271 +iter : 9 Arret : 1.68728E-05 s/iter 4.602965 +iter : 10 Arret : 0.000908721 s/iter 4.605369 +iter : 11 Arret : 0.00208199 s/iter 4.606164 +iter : 12 Arret : 0.00236846 s/iter 4.603500 +iter : 13 Arret : 0.00395957 s/iter 4.603136 +iter : 14 Arret : 0.000973404 s/iter 4.602278 +iter : 15 Arret : 0.00182712 s/iter 4.583661 +iter : 16 Arret : 0.00194671 s/iter 3.758842 +iter : 17 Arret : 0.00719321 s/iter 2.889771 +iter : 18 Arret : 0.295953 s/iter 2.852424 +iter : 19 Arret : 0.00337128 s/iter 4.408132 +iter : 20 Arret : 0.00333381 s/iter 2.836731 +iter : 21 Arret : 0.00266677 s/iter 2.831149 +iter : 22 Arret : 0.00107544 s/iter 2.801808 +iter : 23 Arret : 0.000320605 s/iter 2.803352 +iter : 24 Arret : 0.000173629 s/iter 2.830132 +iter : 25 Arret : 0.000233464 s/iter 2.803594 +iter : 26 Arret : 0.000160813 s/iter 2.829786 +iter : 27 Arret : 0.000120024 s/iter 2.786102 +iter : 28 Arret : 9.55845E-05 s/iter 2.819982 +iter : 29 Arret : 2.30991E-05 s/iter 2.839073 +iter : 30 Arret : 9.78684E-06 s/iter 2.820049 +iter : 31 Arret : 1.81912E-06 s/iter 2.795290 +iter : 32 Arret : 6.40862E-09 s/iter 2.814603 +iter : 33 Arret : 7.74157E-15 s/iter 2.794434 +temps : 122.621 seconde(s) +Nb iterations : 33 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.05316E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540427 +i* 0.841391| 1| 9.7148E-14 +i*-1.98189E-13| +| 2| -0.997949 +i* 0.0640067| 1| 1.02696E-14 +i* 2.88415E-14| +| 3| 0.450991 +i* -0.892528| 1| 2.39739E-15 +i* 7.66835E-14| +| 4| 0.42851 +i* -0.903537| 1| 1.03733E-13 +i* 1.27433E-14| +| 5| -0.996035 +i* 0.0889649| 1| 5.1386E-14 +i* 4.21729E-14| +| 6| 0.581876 +i* 0.813277| 1| 3.29906E-13 +i* -3.5718E-15| +| 7| 0.405761 +i* -0.913979| 1| 1.69923E-13 +i*-8.86062E-14| +| 8| -0.993496 +i* 0.113867| 1| 6.34562E-14 +i* 6.04291E-14| +| 9| 0.60205 +i* 0.798458| 1| 2.39371E-13 +i* -2.2848E-13| +| 10| 0.382757 +i* -0.923849| 1| 6.36852E-14 +i* 1.1601E-13| +| 11| -0.990335 +i* 0.138698| 1| 8.32286E-14 +i* 4.57395E-14| +| 12| 0.621846 +i* 0.783139| 1| 3.5482E-14 +i*-1.57841E-13| +| 13| 0.359514 +i* -0.93314| 1| 1.00985E-13 +i*-2.52237E-13| +| 14| -0.986553 +i* 0.163442| 1| 3.24636E-14 +i* 4.58574E-14| +| 15| 0.641253 +i* 0.767329| 1| 1.79533E-13 +i* 3.03096E-13| +| 16| 0.336045 +i* -0.941846| 1| 1.38948E-13 +i*-8.14071E-14| +| 17| -0.982153 +i* 0.188084| 1| 6.94549E-14 +i* 3.09405E-14| +| 18| 0.660258 +i* 0.751039| 1| 4.21871E-13 +i* 5.02185E-14| +| 19| 0.312366 +i* -0.949962| 1|-6.37199E-14 +i*-7.39669E-14| +| 20| -0.977138 +i* 0.212608| 1|-3.80633E-14 +i* -8.4285E-14| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 1 +proc 1 +proc 2 +proc 0 +zone limite de 'log-exp' 1.00101 +zone limite de 'log-exp' 1.00101 +zone limite de 'log-exp' 1.00101 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 1, start 116736 size 116736 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 2, start 233472 size 116736 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 0, start 0 size 116736 +proc 0 start 0 size 116736 +proc 1 start 116736 size 116736 +proc 2 start 233472 size 116736 +iter : 1 Arret : 7.25108E-06 s/iter 8.701598 +iter : 2 Arret : 7.01169E-06 s/iter 8.695411 +iter : 3 Arret : 7.08063E-06 s/iter 8.691498 +iter : 4 Arret : 6.71613E-06 s/iter 8.696067 +iter : 5 Arret : 8.00231E-06 s/iter 8.693456 +iter : 6 Arret : 6.92129E-06 s/iter 8.693906 +iter : 7 Arret : 7.08909E-06 s/iter 8.691731 +iter : 8 Arret : 7.80014E-06 s/iter 8.689556 +iter : 9 Arret : 1.05064E-05 s/iter 8.687045 +iter : 10 Arret : 0.000743236 s/iter 8.683404 +iter : 11 Arret : 0.000665165 s/iter 8.679771 +iter : 12 Arret : 0.00104331 s/iter 8.679382 +iter : 13 Arret : 0.820946 s/iter 8.680273 +iter : 14 Arret : 3.39143 s/iter 10.141868 +iter : 15 Arret : 0.124079 s/iter 10.120875 +iter : 16 Arret : 0.060865 s/iter 10.097925 +iter : 17 Arret : 0.0362188 s/iter 10.080714 +iter : 18 Arret : 0.0235232 s/iter 13.316578 +iter : 19 Arret : 0.019308 s/iter 10.793160 +iter : 20 Arret : 0.0181476 s/iter 10.220050 +iter : 21 Arret : 0.0341411 s/iter 13.317077 +iter : 22 Arret : 0.0238257 s/iter 13.520573 +iter : 23 Arret : 0.0622072 s/iter 13.384251 +iter : 24 Arret : 0.0384535 s/iter 13.405236 +iter : 25 Arret : 0.0315007 s/iter 13.389625 +iter : 26 Arret : 0.0793407 s/iter 13.377513 +iter : 27 Arret : 0.00511819 s/iter 13.311241 +iter : 28 Arret : 0.000404404 s/iter 8.624483 +iter : 29 Arret : 8.29183E-05 s/iter 8.623864 +iter : 30 Arret : 0.000107024 s/iter 8.624427 +iter : 31 Arret : 1.83455E-05 s/iter 8.626520 +iter : 32 Arret : 9.95568E-06 s/iter 8.624102 +iter : 33 Arret : 3.50874E-06 s/iter 8.630894 +iter : 34 Arret : 3.09608E-08 s/iter 8.626743 +iter : 35 Arret : 1.44506E-13 s/iter 8.626785 +temps : 350.829 seconde(s) +Nb iterations : 35 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.46096E-08 +Stabilite : 1.11023E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540399 +i* 0.841409| 1| 5.12961E-13 +i*-3.37404E-15| +| 2| -0.385479 +i* 0.922716| 1| -1.616E-13 +i*-2.73566E-14| +| 3| -0.770131 +i* 0.637886| 1|-1.38431E-15 +i* 1.70921E-13| +| 4| -0.978357 +i* 0.206925| 1|-3.07393E-15 +i* 4.96131E-15| +| 5| -0.962455 +i* -0.27144| 1|-5.85088E-14 +i* 7.9714E-14| +| 6| -0.72607 +i* -0.687621| 1| -2.0612E-14 +i* 2.87948E-13| +| 7| -0.323352 +i* -0.946279| 1| 2.27159E-13 +i* 7.30891E-14| +| 8| 0.153459 +i* -0.988155| 1| 4.60049E-15 +i*-2.43555E-14| +| 9| 0.595097 +i* -0.803654| 1|-3.46265E-13 +i* 1.60098E-14| +| 10| 0.900408 +i* -0.435047| 1| 3.20081E-13 +i*-1.77827E-14| +| 11| 0.999448 +i* 0.0332229| 1|-5.70342E-13 +i* 1.21308E-12| +| 12| 0.869529 +i* 0.493882| 1| 3.01252E-14 +i* 6.11216E-13| +| 13| 0.211292 +i* 0.977423| 1|-6.97532E-14 +i* 1.23212E-13| +| 14| -0.267139 +i* 0.963658| 1|-9.26238E-14 +i*-7.20968E-14| +| 15| -0.684372 +i* 0.729133| 1| 1.64042E-13 +i*-1.89831E-14| +| 16| -0.944825 +i* 0.327574| 1| 3.70572E-14 +i*-6.84904E-14| +| 17| -0.988833 +i* -0.149027| 1|-1.41002E-13 +i* 2.02581E-14| +| 18| -0.806314 +i* -0.591488| 1| 1.24668E-13 +i*-2.62805E-13| +| 19| -0.439079 +i* -0.898448| 1|-1.76949E-13 +i*-1.05707E-13| +| 20| 0.0287415 +i* -0.999587| 1| 1.62724E-13 +i*-6.82891E-14| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 1 +proc 1 +proc 2 +proc 0 +zone limite de 'log-exp' 1.00071 +zone limite de 'log-exp' 1.00071 +zone limite de 'log-exp' 1.00071 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 2, start 333482 size 166741 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 1, start 166741 size 166741 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 0, start 0 size 166741 +proc 0 start 0 size 166741 +proc 1 start 166741 size 166741 +proc 2 start 333482 size 166741 +iter : 1 Arret : 5.44829E-06 s/iter 17.188421 +iter : 2 Arret : 5.42874E-06 s/iter 17.137695 +iter : 3 Arret : 5.23492E-06 s/iter 17.123244 +iter : 4 Arret : 5.51556E-06 s/iter 17.128160 +iter : 5 Arret : 5.22118E-06 s/iter 17.122102 +iter : 6 Arret : 5.01816E-06 s/iter 17.123783 +iter : 7 Arret : 5.0087E-06 s/iter 17.115281 +iter : 8 Arret : 5.28527E-06 s/iter 17.120375 +iter : 9 Arret : 6.38913E-06 s/iter 17.121394 +iter : 10 Arret : 2.99276E-05 s/iter 17.125175 +iter : 11 Arret : 0.000916092 s/iter 17.123111 +iter : 12 Arret : 0.00112622 s/iter 17.129686 +iter : 13 Arret : 0.00199901 s/iter 18.785503 +iter : 14 Arret : 0.00536103 s/iter 17.609054 +iter : 15 Arret : 0.00620338 s/iter 18.429826 +iter : 16 Arret : 0.00463214 s/iter 16.044795 +iter : 17 Arret : 1.5572 s/iter 16.371044 +iter : 18 Arret : 0.084601 s/iter 14.529226 +iter : 19 Arret : 0.0115579 s/iter 15.452523 +iter : 20 Arret : 0.00599505 s/iter 14.669002 +iter : 21 Arret : 0.00192484 s/iter 10.219969 +iter : 22 Arret : 0.0109349 s/iter 10.105479 +iter : 23 Arret : 0.00351895 s/iter 9.786904 +iter : 24 Arret : 8.50621E-05 s/iter 8.935303 +iter : 25 Arret : 3.28381E-05 s/iter 8.653848 +iter : 26 Arret : 4.45938E-06 s/iter 8.532165 +iter : 27 Arret : 1.46328E-08 s/iter 8.457670 +iter : 28 Arret : 4.31796E-14 s/iter 8.370340 +temps : 410.952 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.48768E-08 +Stabilite : 1.44695E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540372 +i* 0.841426| 1|-3.05235E-13 +i* 1.38721E-13| +| 2| 0.561316 +i* 0.827602| 1|-2.60021E-13 +i* 1.9206E-13| +| 3| 0.57165 +i* 0.820497| 1|-1.83308E-13 +i* 6.15844E-14| +| 4| 0.581895 +i* 0.813264| 1| 3.05839E-13 +i* 6.52482E-14| +| 5| 0.592048 +i* 0.805902| 1|-7.14016E-13 +i*-3.98882E-14| +| 6| 0.602109 +i* 0.798414| 1| 2.66658E-13 +i*-4.75979E-13| +| 7| 0.612074 +i* 0.7908| 1| 3.16743E-13 +i*-3.40844E-13| +| 8| 0.621943 +i* 0.783062| 1| 5.64146E-13 +i*-3.14632E-13| +| 9| 0.631715 +i* 0.775201| 1|-3.83756E-14 +i* 5.41086E-13| +| 10| 0.641387 +i* 0.767218| 1| 4.00499E-13 +i*-3.71465E-13| +| 11| 0.650958 +i* 0.759114| 1| 7.58768E-15 +i*-5.54055E-13| +| 12| 0.660427 +i* 0.750891| 1| 7.47999E-13 +i* 2.73089E-13| +| 13| 0.669792 +i* 0.742549| 1| 9.40577E-13 +i* 3.39433E-14| +| 14| 0.679051 +i* 0.734091| 1| 4.34264E-13 +i*-1.04887E-13| +| 15| 0.688204 +i* 0.725517| 1|-6.26926E-13 +i*-1.86798E-13| +| 16| 0.697248 +i* 0.71683| 1| 2.2389E-13 +i*-9.46795E-14| +| 17| 0.706183 +i* 0.708029| 1| 4.79186E-13 +i* 4.75144E-13| +| 18| 0.715007 +i* 0.699117| 1| 6.39138E-13 +i* 4.95824E-13| +| 19| 0.723718 +i* 0.690096| 1| -1.2694E-13 +i* 4.44528E-13| +| 20| 0.732316 +i* 0.680965| 1|-2.76158E-13 +i* 1.17734E-13| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +proc 0 +proc 1 +proc 2 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 1, start 200021 size 200021 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 2, start 400042 size 200021 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 200021 +proc 0 start 0 size 200021 +proc 2 start 400042 size 200021 +proc 1 start 200021 size 200021 +iter : 1 Arret : 4.17374E-06 s/iter 25.553089 +iter : 2 Arret : 4.24471E-06 s/iter 25.497354 +iter : 3 Arret : 4.02926E-06 s/iter 25.510295 +iter : 4 Arret : 3.90309E-06 s/iter 25.498014 +iter : 5 Arret : 4.14737E-06 s/iter 25.505852 +iter : 6 Arret : 4.14451E-06 s/iter 25.510250 +iter : 7 Arret : 4.54952E-06 s/iter 25.534869 +iter : 8 Arret : 4.39097E-06 s/iter 25.519822 +iter : 9 Arret : 5.39778E-06 s/iter 25.501601 +iter : 10 Arret : 1.06277E-05 s/iter 25.514311 +iter : 11 Arret : 0.000466846 s/iter 25.483886 +iter : 12 Arret : 0.00147408 s/iter 25.506990 +iter : 13 Arret : 0.917202 s/iter 25.532816 +iter : 14 Arret : 0.738772 s/iter 25.543670 +iter : 15 Arret : 1.09406 s/iter 33.427707 +iter : 16 Arret : 0.0147818 s/iter 30.484631 +iter : 17 Arret : 0.00982586 s/iter 27.428111 +iter : 18 Arret : 0.00305155 s/iter 23.911742 +iter : 19 Arret : 0.00879189 s/iter 27.378373 +iter : 20 Arret : 0.0148466 s/iter 27.330975 +iter : 21 Arret : 0.00541507 s/iter 27.053957 +iter : 22 Arret : 0.00917579 s/iter 22.028199 +iter : 23 Arret : 0.00176967 s/iter 24.447698 +iter : 24 Arret : 0.000776941 s/iter 21.846447 +iter : 25 Arret : 1.85979E-05 s/iter 21.763637 +iter : 26 Arret : 5.99112E-08 s/iter 21.943537 +iter : 27 Arret : 6.36688E-13 s/iter 21.839783 +temps : 688.615 seconde(s) +Nb iterations : 27 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.72079E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.553493 +i* -0.832854| 1|-5.02858E-13 +i* 3.83374E-15| +| 3| -0.579338 +i* -0.815087| 1| 4.42365E-13 +i* 2.65846E-14| +| 4| 0.592057 +i* 0.805896| 1| 2.06783E-13 +i* 1.94549E-13| +| 5| -0.604613 +i* -0.796519| 1| 2.39135E-13 +i* 2.96967E-13| +| 6| 0.617037 +i* 0.786934| 1|-3.70964E-13 +i* 2.85104E-13| +| 7| -0.629293 +i* -0.777168| 1| 3.4002E-13 +i* 1.14925E-14| +| 8| 0.641411 +i* 0.767198| 1|-6.01835E-13 +i* 5.70316E-13| +| 9| -0.653354 +i* -0.757052| 1| 3.00003E-14 +i* 4.1084E-13| +| 10| 0.665153 +i* 0.746707| 1|-9.55243E-14 +i* 7.739E-13| +| 11| -0.676773 +i* -0.736192| 1|-3.70891E-13 +i* 4.31963E-14| +| 12| 0.688242 +i* 0.725482| 1| 4.17319E-13 +i*-2.25125E-13| +| 13| -0.699526 +i* -0.714607| 1|-1.55074E-13 +i* 3.9467E-13| +| 14| 0.710653 +i* 0.703543| 1|-7.94843E-13 +i* 5.61671E-13| +| 15| -0.721591 +i* -0.69232| 1|-8.20351E-14 +i* 3.39909E-13| +| 16| 0.732366 +i* 0.680912| 1| 5.01595E-13 +i* 2.59279E-13| +| 17| -0.742946 +i* -0.669351| 1|-1.90181E-13 +i* 1.23972E-13| +| 18| 0.753358 +i* 0.657611| 1|-7.14661E-13 +i*-3.96187E-13| +| 19| -0.76357 +i* -0.645725| 1|-3.31242E-13 +i*-8.50865E-14| +| 20| 0.773609 +i* 0.633664| 1|-7.93813E-13 +i* 2.09313E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +proc 1 +proc 2 +proc 0 +zone limite de 'log-exp' 1.00051 +zone limite de 'log-exp' 1.00051 +zone limite de 'log-exp' 1.00051 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 2, start 466772 size 233386 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 1, start 233386 size 233386 +proc 2 start 466772 size 233386 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 0, start 0 size 233386 +proc 0 start 0 size 233386 +proc 1 start 233386 size 233386 +iter : 1 Arret : 3.63067E-06 s/iter 34.355771 +iter : 2 Arret : 3.51666E-06 s/iter 34.313476 +iter : 3 Arret : 3.37718E-06 s/iter 34.302244 +iter : 4 Arret : 3.51452E-06 s/iter 34.331891 +iter : 5 Arret : 3.53495E-06 s/iter 34.305875 +iter : 6 Arret : 3.54533E-06 s/iter 34.270154 +iter : 7 Arret : 3.57791E-06 s/iter 34.269601 +iter : 8 Arret : 3.49843E-06 s/iter 34.269532 +iter : 9 Arret : 3.56279E-06 s/iter 34.267016 +iter : 10 Arret : 6.70933E-06 s/iter 34.264316 +iter : 11 Arret : 0.000744895 s/iter 34.272504 +iter : 12 Arret : 0.0168677 s/iter 34.261719 +iter : 13 Arret : 0.0132741 s/iter 41.631459 +iter : 14 Arret : 0.0144504 s/iter 34.370399 +iter : 15 Arret : 0.0148871 s/iter 34.380936 +iter : 16 Arret : 0.117079 s/iter 42.029927 +iter : 17 Arret : 0.125622 s/iter 35.777828 +iter : 18 Arret : 0.0338842 s/iter 34.659887 +iter : 19 Arret : 0.0255305 s/iter 34.785339 +iter : 20 Arret : 0.0303666 s/iter 35.462034 +iter : 21 Arret : 0.0337579 s/iter 34.650721 +iter : 22 Arret : 0.0214608 s/iter 34.657778 +iter : 23 Arret : 0.00401409 s/iter 37.611052 +iter : 24 Arret : 0.00127792 s/iter 34.577885 +iter : 25 Arret : 0.000708122 s/iter 34.760828 +iter : 26 Arret : 1.94192E-06 s/iter 34.694471 +iter : 27 Arret : 3.18954E-08 s/iter 34.634308 +iter : 28 Arret : 1.15496E-13 s/iter 34.588120 +temps : 985.364 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.46263E-08 +Stabilite : 1.15496E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540352 +i* 0.841439| 1| 4.39978E-13 +i* 6.25043E-13| +| 2| -0.996034 +i* 0.0889731| 1| 2.2073E-13 +i* 1.55296E-13| +| 3| 0.439836 +i* -0.898078| 1|-3.55927E-13 +i*-1.21738E-13| +| 4| 0.38266 +i* -0.923889| 1|-2.56142E-13 +i*-7.02285E-14| +| 5| -0.988496 +i* 0.15125| 1|-1.52652E-13 +i*-1.11329E-13| +| 6| 0.641421 +i* 0.767189| 1|-1.31044E-13 +i* 5.61736E-13| +| 7| 0.323979 +i* -0.946064| 1|-4.52336E-13 +i* 8.74596E-14| +| 8| -0.977067 +i* 0.212932| 1| 8.58341E-14 +i* 1.73412E-13| +| 9| 0.688262 +i* 0.725462| 1| 4.28754E-14 +i* 1.08849E-12| +| 10| 0.264022 +i* -0.964517| 1|-3.63883E-13 +i*-8.14886E-14| +| 11| -0.961793 +i* 0.273776| 1| -3.0213E-13 +i*-2.13897E-13| +| 12| 0.732395 +i* 0.68088| 1|-3.65194E-14 +i* 7.95483E-13| +| 13| 0.203027 +i* -0.979173| 1|-3.14502E-13 +i* 2.96924E-13| +| 14| -0.942735 +i* 0.333543| 1| 1.82947E-13 +i*-4.73458E-14| +| 15| 0.773646 +i* 0.633619| 1| 2.24352E-13 +i* 2.79674E-13| +| 16| 0.141232 +i* -0.989977| 1| -1.0035E-13 +i* 1.5693E-13| +| 17| -0.919967 +i* 0.391997| 1| 2.89213E-14 +i*-1.86252E-13| +| 18| 0.811852 +i* 0.583864| 1|-1.59939E-12 +i*-4.13669E-13| +| 19| 0.0788818 +i* -0.996884| 1|-2.83003E-13 +i* 1.04711E-13| +| 20| -0.893578 +i* 0.448908| 1| 4.59736E-14 +i* 1.31414E-13| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 1 +proc 1 +proc 2 +proc 0 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 2, start 533332 size 266666 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 266666 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 1, start 266666 size 266666 +proc 1 start 266666 size 266666 +proc 2 start 533332 size 266666 +proc 0 start 0 size 266666 +iter : 1 Arret : 3.65034E-06 s/iter 44.298468 +iter : 2 Arret : 3.20717E-06 s/iter 44.362840 +iter : 3 Arret : 3.28214E-06 s/iter 44.348033 +iter : 4 Arret : 3.53473E-06 s/iter 44.372779 +iter : 5 Arret : 3.64435E-06 s/iter 44.339393 +iter : 6 Arret : 3.48715E-06 s/iter 44.311216 +iter : 7 Arret : 3.20236E-06 s/iter 44.195501 +iter : 8 Arret : 3.46765E-06 s/iter 44.337231 +iter : 9 Arret : 4.55782E-06 s/iter 44.336266 +iter : 10 Arret : 3.03387E-05 s/iter 44.344481 +iter : 11 Arret : 0.000895058 s/iter 44.372449 +iter : 12 Arret : 0.00155707 s/iter 51.112648 +iter : 13 Arret : 1.43645 s/iter 52.743256 +iter : 14 Arret : 1.09102 s/iter 44.524633 +iter : 15 Arret : 0.0755624 s/iter 44.574228 +iter : 16 Arret : 0.0191023 s/iter 48.607142 +iter : 17 Arret : 0.0113021 s/iter 49.878872 +iter : 18 Arret : 0.0136773 s/iter 47.858875 +iter : 19 Arret : 0.0252439 s/iter 39.188313 +iter : 20 Arret : 0.034702 s/iter 39.327917 +iter : 21 Arret : 0.0204901 s/iter 41.570418 +iter : 22 Arret : 0.00860925 s/iter 42.424027 +iter : 23 Arret : 0.0024318 s/iter 40.816516 +iter : 24 Arret : 0.000206468 s/iter 32.760844 +iter : 25 Arret : 0.000152172 s/iter 31.523865 +iter : 26 Arret : 0.000466464 s/iter 30.993628 +iter : 27 Arret : 7.31094E-05 s/iter 30.855992 +iter : 28 Arret : 3.56766E-10 s/iter 31.007972 +iter : 29 Arret : 8.9509E-16 s/iter 30.809036 +temps : 1218.9 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 0.0233219 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| 0.592061 +i* 0.805893| 1|-1.57249E-13 +i*-4.43364E-13| +| 3| 0.617051 +i* 0.786923| 1|-6.42805E-13 +i*-3.49094E-13| +| 4| 0.641434 +i* 0.767178| 1| 1.00022E-12 +i*-5.90578E-13| +| 5| 0.665186 +i* 0.746678| 1|-2.53998E-14 +i*-1.14684E-12| +| 6| 0.688283 +i* 0.725442| 1|-8.68732E-13 +i* 8.52696E-13| +| 7| 0.710703 +i* 0.703493| 1| 2.02581E-13 +i* 4.54699E-13| +| 8| 0.732422 +i* 0.680851| 1|-5.22353E-13 +i*-3.99873E-13| +| 9| 0.753421 +i* 0.657538| 1| 1.23356E-13 +i*-1.05986E-12| +| 10| 0.773678 +i* 0.633579| 1|-6.75196E-13 +i* 3.60108E-13| +| 11| 0.793174 +i* 0.608995| 1| 4.43853E-13 +i*-1.42398E-12| +| 12| 0.811888 +i* 0.583813| 1|-4.10491E-13 +i*-4.46651E-13| +| 13| 0.829804 +i* 0.558055| 1| 1.30045E-12 +i* 1.12788E-13| +| 14| 0.846902 +i* 0.531748| 1|-8.09419E-13 +i* 4.98091E-13| +| 15| 0.863167 +i* 0.504918| 1| 2.98522E-13 +i* 3.81547E-13| +| 16| 0.878582 +i* 0.477591| 1|-3.06581E-13 +i*-6.95869E-13| +| 17| 0.893133 +i* 0.449793| 1| 1.24355E-13 +i* -1.3239E-12| +| 18| 0.906804 +i* 0.421553| 1|-1.23117E-12 +i*-5.57117E-13| +| 19| 0.919582 +i* 0.392898| 1|-1.03648E-12 +i* 2.90445E-14| +| 20| 0.931455 +i* 0.363856| 1|-6.42708E-13 +i*-1.50318E-12| ++---+----------------------------+------------+----------------------------+ +799998 racines de module = 1 + 2 racines de module = 0.999973 diff --git a/Simulations/full_mpi/full_mpi_3GPU.sge b/Simulations/full_mpi/full_mpi_3GPU.sge new file mode 100755 index 0000000..53261fe --- /dev/null +++ b/Simulations/full_mpi/full_mpi_3GPU.sge @@ -0,0 +1,25 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=3 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -V +#$ -cwd +#$ -N full_mpi_3GPU +#$ -pe mpi 3 + + +module load cuda/7.0 +module load ompi/gcc + +mpirun -np $NSLOTS ./template -r -i 60000 40000 +mpirun -np $NSLOTS ./template -r -i 150000 50000 +mpirun -np $NSLOTS ./template -r -i 250000 150000 +mpirun -np $NSLOTS ./template -r -i 350000 250000 +mpirun -np $NSLOTS ./template -r -i 500000 300000 +mpirun -np $NSLOTS ./template -r -i 600000 400000 +mpirun -np $NSLOTS ./template -r -i 700000 500000 +mpirun -np $NSLOTS ./template -r -i 800000 600000 +#mpirun -np $NSLOTS ./template -r -i 900000 700000 +#mpirun -np $NSLOTS ./template -r -i 1000000 800000 +#mpirun -np $NSLOTS ./template -r -i 1500000 500000 diff --git a/Simulations/full_mpi/full_mpi_4GPU.o140132 b/Simulations/full_mpi/full_mpi_4GPU.o140132 new file mode 100644 index 0000000..2c3dc2a --- /dev/null +++ b/Simulations/full_mpi/full_mpi_4GPU.o140132 @@ -0,0 +1,622 @@ +REMAINING: 4 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +Taking GPU #3 +proc 1 +proc 2 +proc 3 +proc 0 +zone limite de 'log-exp' 1.00593 +zone limite de 'log-exp' 1.00593 +zone limite de 'log-exp' 1.00593 +zone limite de 'log-exp' 1.00593 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 1, start 15040 size 15040 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 3, start 45120 size 15040 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 0, start 0 size 15040 +proc 1 start 15040 size 15040 +proc 3 start 45120 size 15040 +proc 0 start 0 size 15040 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 2, start 30080 size 15040 +proc 2 start 30080 size 15040 +iter : 1 Arret : 4.54253E-05 s/iter 0.190120 +iter : 2 Arret : 4.02349E-05 s/iter 0.189998 +iter : 3 Arret : 4.05851E-05 s/iter 0.190002 +iter : 4 Arret : 3.90123E-05 s/iter 0.189988 +iter : 5 Arret : 4.05115E-05 s/iter 0.189940 +iter : 6 Arret : 4.39547E-05 s/iter 0.189985 +iter : 7 Arret : 5.458E-05 s/iter 0.189984 +iter : 8 Arret : 0.000119494 s/iter 0.189981 +iter : 9 Arret : 0.00168327 s/iter 0.189962 +iter : 10 Arret : 0.0030417 s/iter 0.189891 +iter : 11 Arret : 2.15612 s/iter 0.189972 +iter : 12 Arret : 0.346227 s/iter 0.190014 +iter : 13 Arret : 0.126669 s/iter 1.018201 +iter : 14 Arret : 0.0535949 s/iter 1.016001 +iter : 15 Arret : 0.0185974 s/iter 1.012376 +iter : 16 Arret : 0.0101783 s/iter 1.010000 +iter : 17 Arret : 0.00628304 s/iter 1.004893 +iter : 18 Arret : 0.00442205 s/iter 0.867780 +iter : 19 Arret : 0.00334052 s/iter 0.850989 +iter : 20 Arret : 0.166672 s/iter 0.833688 +iter : 21 Arret : 0.154722 s/iter 0.185018 +iter : 22 Arret : 0.0369513 s/iter 0.857692 +iter : 23 Arret : 0.00795041 s/iter 0.183896 +iter : 24 Arret : 0.00113436 s/iter 0.179252 +iter : 25 Arret : 0.000916314 s/iter 0.179162 +iter : 26 Arret : 0.000437934 s/iter 0.173024 +iter : 27 Arret : 0.000164013 s/iter 0.173156 +iter : 28 Arret : 0.000120343 s/iter 0.173113 +iter : 29 Arret : 0.000163904 s/iter 0.173138 +iter : 30 Arret : 9.69458E-05 s/iter 0.173072 +iter : 31 Arret : 8.66273E-06 s/iter 0.172998 +iter : 32 Arret : 2.89696E-08 s/iter 0.173059 +iter : 33 Arret : 8.96067E-13 s/iter 0.173085 +temps : 13.0123 seconde(s) +Nb iterations : 33 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.35784E-10 +Stabilite : 8.96067E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540783 +i* 0.841162| 1|-7.58456E-14 +i* 3.78031E-14| +| 2| -0.992343 +i* -0.123513| 1|-2.28637E-15 +i*-5.45917E-15| +| 3| 0.0563346 +i* 0.998412| 1| 5.70377E-15 +i* 3.3501E-14| +| 4| -0.802793 +i* -0.596258| 1| 2.03657E-15 +i* 1.01915E-14| +| 5| 0.730552 +i* -0.682857| 1|-7.48429E-14 +i* 6.77011E-14| +| 6| -0.442728 +i* 0.896656| 1|-3.77198E-14 +i*-1.89779E-15| +| 7| -0.404888 +i* -0.914366| 1| 3.20195E-14 +i* 9.65894E-15| +| 8| 0.972126 +i* -0.23446| 1| 4.02421E-14 +i*-1.54755E-14| +| 9| -0.826939 +i* 0.562292| 1| -2.4928E-14 +i*-1.59889E-14| +| 10| 0.0979895 +i* -0.995187| 1| 2.90878E-14 +i*-6.75675E-15| +| 11| 0.961513 +i* 0.27476| 1|-9.39769E-14 +i*-2.63912E-13| +| 12| -0.996627 +i* 0.0820589| 1| 2.39773E-14 +i* 1.74825E-14| +| 13| 0.575447 +i* -0.817839| 1|-3.49894E-14 +i*-7.98545E-14| +| 14| 0.701466 +i* 0.712703| 1| 7.52211E-14 +i* 1.53991E-14| +| 15| 0.259346 +i* 0.965785| 1|-2.14863E-14 +i*-2.81355E-14| +| 16| -0.907773 +i* -0.419461| 1|-3.62869E-14 +i*-9.49414E-15| +| 17| 0.903623 +i* -0.428329| 1|-1.24969E-14 +i* 7.51222E-14| +| 18| -0.249979 +i* 0.968251| 1|-1.59074E-14 +i*-1.09721E-14| +| 19| -0.584107 +i* -0.811677| 1| 1.93838E-14 +i* -1.0613E-14| +| 20| 0.997383 +i* 0.072297| 1| 2.53037E-13 +i*-5.92819E-13| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 1 +proc 2 +proc 3 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00237 +zone limite de 'log-exp' 1.00237 +zone limite de 'log-exp' 1.00237 +zone limite de 'log-exp' 1.00237 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 0, start 0 size 37504 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 3, start 112512 size 37504 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 1, start 37504 size 37504 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 2, start 75008 size 37504 +proc 2 start 75008 size 37504 +proc 0 start 0 size 37504 +proc 3 start 112512 size 37504 +proc 1 start 37504 size 37504 +iter : 1 Arret : 1.61155E-05 s/iter 1.388910 +iter : 2 Arret : 1.5292E-05 s/iter 1.388566 +iter : 3 Arret : 1.53382E-05 s/iter 1.388256 +iter : 4 Arret : 1.53436E-05 s/iter 1.388459 +iter : 5 Arret : 1.56797E-05 s/iter 1.388267 +iter : 6 Arret : 1.62943E-05 s/iter 1.388223 +iter : 7 Arret : 1.78031E-05 s/iter 1.388438 +iter : 8 Arret : 2.07609E-05 s/iter 1.388272 +iter : 9 Arret : 4.52349E-05 s/iter 1.388452 +iter : 10 Arret : 0.00148307 s/iter 1.388277 +iter : 11 Arret : 0.00381365 s/iter 1.388380 +iter : 12 Arret : 0.00454231 s/iter 2.679420 +iter : 13 Arret : 0.017103 s/iter 2.976033 +iter : 14 Arret : 1.38869 s/iter 1.383510 +iter : 15 Arret : 0.0597475 s/iter 1.384033 +iter : 16 Arret : 0.0363329 s/iter 2.973069 +iter : 17 Arret : 0.0127731 s/iter 3.418217 +iter : 18 Arret : 0.0103682 s/iter 3.020991 +iter : 19 Arret : 0.00840855 s/iter 2.969344 +iter : 20 Arret : 0.00415465 s/iter 3.306301 +iter : 21 Arret : 0.00116781 s/iter 1.346551 +iter : 22 Arret : 0.00222874 s/iter 1.341294 +iter : 23 Arret : 0.00230842 s/iter 1.334988 +iter : 24 Arret : 0.00269266 s/iter 1.337748 +iter : 25 Arret : 0.000589182 s/iter 1.335027 +iter : 26 Arret : 1.15656E-05 s/iter 1.331811 +iter : 27 Arret : 2.039E-06 s/iter 1.328004 +iter : 28 Arret : 3.02093E-09 s/iter 1.343235 +iter : 29 Arret : 2.75813E-14 s/iter 1.332966 +temps : 51.6331 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.26507E-09 +Stabilite : 2.75813E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540528 +i* 0.841326| 1| 8.68923E-14 +i* 2.2979E-13| +| 2| -0.905603 +i* -0.424127| 1| 6.50001E-14 +i* -3.0061E-14| +| 3| -0.774122 +i* 0.633037| 1|-3.89619E-14 +i*-6.71876E-14| +| 4| 0.317935 +i* -0.948113| 1| 4.656E-15 +i* 1.15645E-13| +| 5| 0.235978 +i* 0.971758| 1|-2.91295E-14 +i*-3.06716E-14| +| 6| -0.717299 +i* -0.696766| 1| 5.63785E-15 +i*-6.71685E-14| +| 7| 0.992349 +i* -0.123462| 1|-4.81056E-13 +i* 9.00335E-13| +| 8| -0.938482 +i* 0.345329| 1|-6.95555E-14 +i*-3.79159E-14| +| 9| 0.610294 +i* -0.792175| 1| -5.4852E-14 +i*-3.26232E-14| +| 10| -0.0946394 +i* 0.995512| 1|-4.73788E-14 +i*-8.10827E-14| +| 11| -0.450242 +i* -0.892906| 1| 2.41855E-14 +i*-3.23699E-15| +| 12| 0.978218 +i* 0.207583| 1|-2.84429E-13 +i* 4.69725E-13| +| 13| -0.999806 +i* 0.0197069| 1|-4.72365E-14 +i*-2.55716E-14| +| 14| 0.835648 +i* -0.549265| 1|-2.95892E-13 +i* 2.34143E-13| +| 15| -0.414707 +i* 0.909955| 1| 7.26225E-14 +i*-1.70003E-15| +| 16| -0.133754 +i* -0.991015| 1|-2.88485E-14 +i* 2.14499E-14| +| 17| 0.856687 +i* 0.515837| 1| 1.49106E-13 +i* 3.95153E-14| +| 18| -0.951361 +i* -0.308079| 1| 3.78308E-14 +i* 4.65843E-14| +| 19| 0.969257 +i* -0.24605| 1| 5.51163E-13 +i*-4.79498E-13| +| 20| -0.689285 +i* 0.724491| 1| 2.40086E-15 +i*-3.61777E-14| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1 +proc 1 +proc 2 +proc 3 +proc 0 +zone limite de 'log-exp' 1.00142 +zone limite de 'log-exp' 1.00142 +zone limite de 'log-exp' 1.00142 +zone limite de 'log-exp' 1.00142 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 2, start 125056 size 62528 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 0, start 0 size 62528 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 3, start 187584 size 62528 +proc 3 start 187584 size 62528 +proc 2 start 125056 size 62528 +proc 0 start 0 size 62528 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 1, start 62528 size 62528 +proc 1 start 62528 size 62528 +iter : 1 Arret : 1.11968E-05 s/iter 3.825242 +iter : 2 Arret : 1.00799E-05 s/iter 3.807837 +iter : 3 Arret : 9.41078E-06 s/iter 3.813149 +iter : 4 Arret : 9.26536E-06 s/iter 3.814952 +iter : 5 Arret : 9.34813E-06 s/iter 3.812300 +iter : 6 Arret : 9.56148E-06 s/iter 3.818827 +iter : 7 Arret : 9.85158E-06 s/iter 3.809789 +iter : 8 Arret : 1.00436E-05 s/iter 3.817985 +iter : 9 Arret : 3.01654E-05 s/iter 3.810639 +iter : 10 Arret : 0.000664555 s/iter 3.818425 +iter : 11 Arret : 0.000737975 s/iter 3.818479 +iter : 12 Arret : 0.000983341 s/iter 3.816886 +iter : 13 Arret : 0.00169178 s/iter 3.818781 +iter : 14 Arret : 0.00246696 s/iter 3.818401 +iter : 15 Arret : 0.00246605 s/iter 3.779944 +iter : 16 Arret : 0.00658304 s/iter 2.977729 +iter : 17 Arret : 0.00690937 s/iter 5.004823 +iter : 18 Arret : 0.300013 s/iter 4.828460 +iter : 19 Arret : 0.0468449 s/iter 4.960936 +iter : 20 Arret : 0.00243593 s/iter 2.120119 +iter : 21 Arret : 0.000654892 s/iter 2.126485 +iter : 22 Arret : 0.00213423 s/iter 2.116250 +iter : 23 Arret : 0.000510708 s/iter 2.110308 +iter : 24 Arret : 0.00102843 s/iter 2.108799 +iter : 25 Arret : 0.000140837 s/iter 2.110467 +iter : 26 Arret : 9.44179E-05 s/iter 2.106952 +iter : 27 Arret : 2.22669E-05 s/iter 2.108487 +iter : 28 Arret : 1.36769E-06 s/iter 2.108960 +iter : 29 Arret : 2.186E-10 s/iter 2.111770 +iter : 30 Arret : 2.77556E-16 s/iter 2.094068 +temps : 98.5095 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.05316E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540427 +i* 0.841391| 1| 9.7148E-14 +i*-1.98189E-13| +| 2| -0.997949 +i* 0.0640067| 1| 1.02696E-14 +i* 2.88415E-14| +| 3| 0.450991 +i* -0.892528| 1| 2.39739E-15 +i* 7.66835E-14| +| 4| 0.42851 +i* -0.903537| 1| 1.03733E-13 +i* 1.27433E-14| +| 5| -0.996035 +i* 0.0889649| 1| 5.1386E-14 +i* 4.21729E-14| +| 6| 0.581876 +i* 0.813277| 1| 3.29906E-13 +i* -3.5718E-15| +| 7| 0.405761 +i* -0.913979| 1| 1.69923E-13 +i*-8.86062E-14| +| 8| -0.993496 +i* 0.113867| 1| 6.34562E-14 +i* 6.04291E-14| +| 9| 0.60205 +i* 0.798458| 1| 2.39371E-13 +i* -2.2848E-13| +| 10| 0.382757 +i* -0.923849| 1| 6.36852E-14 +i* 1.1601E-13| +| 11| -0.990335 +i* 0.138698| 1| 8.32286E-14 +i* 4.57395E-14| +| 12| 0.621846 +i* 0.783139| 1| 3.5482E-14 +i*-1.57841E-13| +| 13| 0.359514 +i* -0.93314| 1| 1.00985E-13 +i*-2.52237E-13| +| 14| -0.986553 +i* 0.163442| 1| 3.24636E-14 +i* 4.58574E-14| +| 15| 0.641253 +i* 0.767329| 1| 1.79533E-13 +i* 3.03096E-13| +| 16| 0.336045 +i* -0.941846| 1| 1.38948E-13 +i*-8.14071E-14| +| 17| -0.982153 +i* 0.188084| 1| 6.94549E-14 +i* 3.09405E-14| +| 18| 0.660258 +i* 0.751039| 1| 4.21871E-13 +i* 5.02185E-14| +| 19| 0.312366 +i* -0.949962| 1|-6.37199E-14 +i*-7.39669E-14| +| 20| -0.977138 +i* 0.212608| 1|-3.80633E-14 +i* -8.4285E-14| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 1 +proc 0 +proc 1 +proc 2 +proc 3 +zone limite de 'log-exp' 1.00101 +zone limite de 'log-exp' 1.00101 +zone limite de 'log-exp' 1.00101 +zone limite de 'log-exp' 1.00101 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 3, start 262656 size 87552 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 1, start 87552 size 87552 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 2, start 175104 size 87552 +proc 1 start 87552 size 87552 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 0, start 0 size 87552 +proc 0 start 0 size 87552 +proc 3 start 262656 size 87552 +proc 2 start 175104 size 87552 +iter : 1 Arret : 7.37223E-06 s/iter 6.537086 +iter : 2 Arret : 6.87852E-06 s/iter 6.540337 +iter : 3 Arret : 6.62662E-06 s/iter 6.539807 +iter : 4 Arret : 6.78716E-06 s/iter 6.537314 +iter : 5 Arret : 6.73158E-06 s/iter 6.543333 +iter : 6 Arret : 7.46053E-06 s/iter 6.536618 +iter : 7 Arret : 7.08865E-06 s/iter 6.536382 +iter : 8 Arret : 7.79945E-06 s/iter 6.534593 +iter : 9 Arret : 9.74861E-06 s/iter 6.536504 +iter : 10 Arret : 0.000745782 s/iter 6.537362 +iter : 11 Arret : 0.000455744 s/iter 6.535194 +iter : 12 Arret : 0.00342228 s/iter 6.534104 +iter : 13 Arret : 0.810408 s/iter 6.536777 +iter : 14 Arret : 3.37422 s/iter 10.380895 +iter : 15 Arret : 0.136557 s/iter 11.212541 +iter : 16 Arret : 0.0661427 s/iter 9.571236 +iter : 17 Arret : 0.0390301 s/iter 11.168500 +iter : 18 Arret : 0.056921 s/iter 11.419060 +iter : 19 Arret : 0.0851919 s/iter 11.272764 +iter : 20 Arret : 0.0308655 s/iter 11.252338 +iter : 21 Arret : 0.0183277 s/iter 11.252867 +iter : 22 Arret : 0.0401954 s/iter 10.205076 +iter : 23 Arret : 0.0540968 s/iter 11.305983 +iter : 24 Arret : 0.0434344 s/iter 10.978858 +iter : 25 Arret : 0.0335517 s/iter 11.237082 +iter : 26 Arret : 0.115944 s/iter 11.039900 +iter : 27 Arret : 0.0492573 s/iter 8.777420 +iter : 28 Arret : 0.0191575 s/iter 6.485398 +iter : 29 Arret : 0.0184729 s/iter 7.151590 +iter : 30 Arret : 0.00124008 s/iter 6.484897 +iter : 31 Arret : 6.47966E-05 s/iter 6.485006 +iter : 32 Arret : 4.59568E-05 s/iter 6.485609 +iter : 33 Arret : 3.27878E-06 s/iter 6.484358 +iter : 34 Arret : 2.62749E-10 s/iter 6.485211 +iter : 35 Arret : 1.0339E-15 s/iter 6.482394 +temps : 289.016 seconde(s) +Nb iterations : 35 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.46096E-08 +Stabilite : 1.11023E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540399 +i* 0.841409| 1| 5.12961E-13 +i*-3.37404E-15| +| 2| -0.385479 +i* 0.922716| 1| -1.616E-13 +i*-2.73566E-14| +| 3| -0.770131 +i* 0.637886| 1|-1.38431E-15 +i* 1.70921E-13| +| 4| -0.978357 +i* 0.206925| 1|-3.07393E-15 +i* 4.96131E-15| +| 5| -0.962455 +i* -0.27144| 1|-5.85088E-14 +i* 7.9714E-14| +| 6| -0.72607 +i* -0.687621| 1| -2.0612E-14 +i* 2.87948E-13| +| 7| -0.323352 +i* -0.946279| 1| 2.27159E-13 +i* 7.30891E-14| +| 8| 0.153459 +i* -0.988155| 1| 4.60049E-15 +i*-2.43555E-14| +| 9| 0.595097 +i* -0.803654| 1|-3.46265E-13 +i* 1.60098E-14| +| 10| 0.900408 +i* -0.435047| 1| 3.20081E-13 +i*-1.77827E-14| +| 11| 0.999448 +i* 0.0332229| 1|-5.70342E-13 +i* 1.21308E-12| +| 12| 0.869529 +i* 0.493882| 1| 3.01252E-14 +i* 6.11216E-13| +| 13| 0.211292 +i* 0.977423| 1|-6.97532E-14 +i* 1.23212E-13| +| 14| -0.267139 +i* 0.963658| 1|-9.26238E-14 +i*-7.20968E-14| +| 15| -0.684372 +i* 0.729133| 1| 1.64042E-13 +i*-1.89831E-14| +| 16| -0.944825 +i* 0.327574| 1| 3.70572E-14 +i*-6.84904E-14| +| 17| -0.988833 +i* -0.149027| 1|-1.41002E-13 +i* 2.02581E-14| +| 18| -0.806314 +i* -0.591488| 1| 1.24668E-13 +i*-2.62805E-13| +| 19| -0.439079 +i* -0.898448| 1|-1.76949E-13 +i*-1.05707E-13| +| 20| 0.0287595 +i* -0.999586| 1| 4.76598E-14 +i*-1.43895E-14| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 1 +proc 0 +proc 1 +proc 2 +proc 3 +zone limite de 'log-exp' 1.00071 +zone limite de 'log-exp' 1.00071 +zone limite de 'log-exp' 1.00071 +zone limite de 'log-exp' 1.00071 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 3, start 375168 size 125056 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 1, start 125056 size 125056 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 2, start 250112 size 125056 +proc 1 start 125056 size 125056 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 0, start 0 size 125056 +proc 0 start 0 size 125056 +proc 3 start 375168 size 125056 +proc 2 start 250112 size 125056 +iter : 1 Arret : 5.43999E-06 s/iter 13.794000 +iter : 2 Arret : 4.91286E-06 s/iter 13.791136 +iter : 3 Arret : 4.80927E-06 s/iter 13.796273 +iter : 4 Arret : 4.84881E-06 s/iter 13.800496 +iter : 5 Arret : 4.97591E-06 s/iter 13.796980 +iter : 6 Arret : 4.79153E-06 s/iter 13.804318 +iter : 7 Arret : 4.83022E-06 s/iter 13.810851 +iter : 8 Arret : 5.21278E-06 s/iter 13.801380 +iter : 9 Arret : 6.23421E-06 s/iter 13.799572 +iter : 10 Arret : 6.92488E-05 s/iter 13.809235 +iter : 11 Arret : 0.00410439 s/iter 13.803771 +iter : 12 Arret : 0.00309009 s/iter 13.812651 +iter : 13 Arret : 0.0029815 s/iter 18.000127 +iter : 14 Arret : 0.00820943 s/iter 19.596298 +iter : 15 Arret : 0.0062262 s/iter 19.403564 +iter : 16 Arret : 1.4696 s/iter 14.578745 +iter : 17 Arret : 0.0225548 s/iter 15.759602 +iter : 18 Arret : 0.00265918 s/iter 11.703397 +iter : 19 Arret : 0.0066924 s/iter 8.696998 +iter : 20 Arret : 0.00187233 s/iter 14.112555 +iter : 21 Arret : 0.00910475 s/iter 8.336565 +iter : 22 Arret : 0.0385392 s/iter 8.037996 +iter : 23 Arret : 0.0216755 s/iter 9.237626 +iter : 24 Arret : 0.0024009 s/iter 7.207663 +iter : 25 Arret : 0.00123955 s/iter 6.955790 +iter : 26 Arret : 3.53765E-05 s/iter 6.696812 +iter : 27 Arret : 7.34783E-06 s/iter 6.014489 +iter : 28 Arret : 1.71411E-07 s/iter 5.956492 +iter : 29 Arret : 3.11637E-12 s/iter 5.922541 +iter : 30 Arret : 1.57009E-16 s/iter 5.957097 +temps : 358.278 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.48768E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540372 +i* 0.841426| 1|-3.05235E-13 +i* 1.38721E-13| +| 2| 0.561316 +i* 0.827602| 1|-2.60021E-13 +i* 1.9206E-13| +| 3| 0.57165 +i* 0.820497| 1|-1.83308E-13 +i* 6.15844E-14| +| 4| 0.581895 +i* 0.813264| 1| 3.05839E-13 +i* 6.52482E-14| +| 5| 0.592048 +i* 0.805902| 1|-7.14016E-13 +i*-3.98882E-14| +| 6| 0.602109 +i* 0.798414| 1| 2.66658E-13 +i*-4.75979E-13| +| 7| 0.612074 +i* 0.7908| 1| 3.16743E-13 +i*-3.40844E-13| +| 8| 0.621943 +i* 0.783062| 1| 5.64146E-13 +i*-3.14632E-13| +| 9| 0.631715 +i* 0.775201| 1|-3.83756E-14 +i* 5.41086E-13| +| 10| 0.641387 +i* 0.767218| 1| 4.00499E-13 +i*-3.71465E-13| +| 11| 0.650958 +i* 0.759114| 1| 7.58768E-15 +i*-5.54055E-13| +| 12| 0.660427 +i* 0.750891| 1| 7.47999E-13 +i* 2.73089E-13| +| 13| 0.669792 +i* 0.742549| 1| 9.40577E-13 +i* 3.39433E-14| +| 14| 0.679051 +i* 0.734091| 1| 4.34264E-13 +i*-1.04887E-13| +| 15| 0.688204 +i* 0.725517| 1|-6.26926E-13 +i*-1.86798E-13| +| 16| 0.697248 +i* 0.71683| 1| 2.2389E-13 +i*-9.46795E-14| +| 17| 0.706183 +i* 0.708029| 1| 4.79186E-13 +i* 4.75144E-13| +| 18| 0.715007 +i* 0.699117| 1| 6.39138E-13 +i* 4.95824E-13| +| 19| 0.723718 +i* 0.690096| 1| -1.2694E-13 +i* 4.44528E-13| +| 20| 0.732316 +i* 0.680965| 1|-2.76158E-13 +i* 1.17734E-13| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +proc 2 +proc 3 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 1, start 150016 size 150016 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 3, start 450048 size 150016 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 2, start 300032 size 150016 +proc 1 start 150016 size 150016 +proc 3 start 450048 size 150016 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 150016 +proc 0 start 0 size 150016 +proc 2 start 300032 size 150016 +iter : 1 Arret : 4.20321E-06 s/iter 18.775985 +iter : 2 Arret : 4.09855E-06 s/iter 18.747734 +iter : 3 Arret : 3.93391E-06 s/iter 18.730793 +iter : 4 Arret : 4.03193E-06 s/iter 18.732680 +iter : 5 Arret : 4.10736E-06 s/iter 18.735318 +iter : 6 Arret : 4.01386E-06 s/iter 18.743326 +iter : 7 Arret : 4.19451E-06 s/iter 18.739337 +iter : 8 Arret : 4.62309E-06 s/iter 18.741333 +iter : 9 Arret : 6.05422E-06 s/iter 18.740129 +iter : 10 Arret : 4.11892E-05 s/iter 18.733834 +iter : 11 Arret : 0.000517404 s/iter 18.736838 +iter : 12 Arret : 0.00114025 s/iter 18.735603 +iter : 13 Arret : 0.00285906 s/iter 18.781157 +iter : 14 Arret : 1.38645 s/iter 26.334716 +iter : 15 Arret : 0.623951 s/iter 22.498967 +iter : 16 Arret : 0.011785 s/iter 22.383771 +iter : 17 Arret : 0.0286509 s/iter 18.675149 +iter : 18 Arret : 0.0199337 s/iter 21.455577 +iter : 19 Arret : 0.00279992 s/iter 23.472538 +iter : 20 Arret : 0.00154477 s/iter 24.299102 +iter : 21 Arret : 0.000859833 s/iter 17.698308 +iter : 22 Arret : 0.000296794 s/iter 17.754719 +iter : 23 Arret : 3.50155E-05 s/iter 17.796812 +iter : 24 Arret : 1.46092E-05 s/iter 16.575301 +iter : 25 Arret : 1.13486E-05 s/iter 16.409288 +iter : 26 Arret : 2.08371E-06 s/iter 16.504363 +iter : 27 Arret : 4.3351E-08 s/iter 16.502863 +iter : 28 Arret : 1.78892E-13 s/iter 17.369262 +temps : 539.966 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.553493 +i* -0.832854| 1|-5.02858E-13 +i* 3.83374E-15| +| 3| -0.579338 +i* -0.815087| 1| 4.42365E-13 +i* 2.65846E-14| +| 4| 0.592057 +i* 0.805896| 1| 2.06783E-13 +i* 1.94549E-13| +| 5| -0.604613 +i* -0.796519| 1| 2.39135E-13 +i* 2.96967E-13| +| 6| 0.617037 +i* 0.786934| 1|-3.70964E-13 +i* 2.85104E-13| +| 7| -0.629293 +i* -0.777168| 1| 3.4002E-13 +i* 1.14925E-14| +| 8| 0.641411 +i* 0.767198| 1|-6.01835E-13 +i* 5.70316E-13| +| 9| -0.653354 +i* -0.757052| 1| 3.00003E-14 +i* 4.1084E-13| +| 10| 0.665153 +i* 0.746707| 1|-9.55243E-14 +i* 7.739E-13| +| 11| -0.676773 +i* -0.736192| 1|-3.70891E-13 +i* 4.31963E-14| +| 12| 0.688242 +i* 0.725482| 1| 4.17319E-13 +i*-2.25125E-13| +| 13| -0.699526 +i* -0.714607| 1|-1.55074E-13 +i* 3.9467E-13| +| 14| 0.710653 +i* 0.703543| 1|-7.94843E-13 +i* 5.61671E-13| +| 15| -0.721591 +i* -0.69232| 1|-8.20351E-14 +i* 3.39909E-13| +| 16| 0.732366 +i* 0.680912| 1| 5.01595E-13 +i* 2.59279E-13| +| 17| -0.742946 +i* -0.669351| 1|-1.90181E-13 +i* 1.23972E-13| +| 18| 0.753358 +i* 0.657611| 1|-7.14661E-13 +i*-3.96187E-13| +| 19| -0.76357 +i* -0.645725| 1|-3.31242E-13 +i*-8.50865E-14| +| 20| 0.773609 +i* 0.633664| 1|-7.93813E-13 +i* 2.09313E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +proc 2 +proc 3 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00051 +zone limite de 'log-exp' 1.00051 +zone limite de 'log-exp' 1.00051 +zone limite de 'log-exp' 1.00051 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 2, start 350080 size 175040 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 1, start 175040 size 175040 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 3, start 525120 size 175040 +proc 3 start 525120 size 175040 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 0, start 0 size 175040 +proc 0 start 0 size 175040 +proc 2 start 350080 size 175040 +proc 1 start 175040 size 175040 +iter : 1 Arret : 4.05426E-06 s/iter 26.055375 +iter : 2 Arret : 3.62462E-06 s/iter 26.017320 +iter : 3 Arret : 3.57426E-06 s/iter 26.031338 +iter : 4 Arret : 3.57393E-06 s/iter 26.019895 +iter : 5 Arret : 3.53387E-06 s/iter 26.031664 +iter : 6 Arret : 3.57381E-06 s/iter 26.022006 +iter : 7 Arret : 4.05236E-06 s/iter 26.018695 +iter : 8 Arret : 3.5632E-06 s/iter 26.018506 +iter : 9 Arret : 3.74898E-06 s/iter 26.036369 +iter : 10 Arret : 1.82635E-05 s/iter 26.019377 +iter : 11 Arret : 0.0017458 s/iter 26.032260 +iter : 12 Arret : 0.00155961 s/iter 33.564621 +iter : 13 Arret : 0.00513024 s/iter 27.283039 +iter : 14 Arret : 0.00473339 s/iter 33.669836 +iter : 15 Arret : 0.00281261 s/iter 31.946913 +iter : 16 Arret : 0.00468659 s/iter 28.606391 +iter : 17 Arret : 0.0122921 s/iter 30.427694 +iter : 18 Arret : 0.0156527 s/iter 31.617517 +iter : 19 Arret : 0.0320085 s/iter 25.851204 +iter : 20 Arret : 0.22003 s/iter 25.842946 +iter : 21 Arret : 0.012535 s/iter 28.965802 +iter : 22 Arret : 0.00376424 s/iter 28.796070 +iter : 23 Arret : 0.00220948 s/iter 25.734592 +iter : 24 Arret : 0.00248624 s/iter 25.743976 +iter : 25 Arret : 0.000364428 s/iter 25.732814 +iter : 26 Arret : 0.000719089 s/iter 25.747749 +iter : 27 Arret : 0.000438507 s/iter 25.790591 +iter : 28 Arret : 1.26042E-05 s/iter 25.738843 +iter : 29 Arret : 3.25839E-06 s/iter 25.855423 +iter : 30 Arret : 1.74243E-07 s/iter 25.753106 +iter : 31 Arret : 3.09364E-11 s/iter 25.736769 +iter : 32 Arret : 1.57009E-16 s/iter 25.740011 +temps : 871.12 seconde(s) +Nb iterations : 32 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.46262E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540352 +i* 0.841439| 1| 4.39978E-13 +i* 6.25043E-13| +| 2| -0.996034 +i* 0.0889731| 1| 2.2073E-13 +i* 1.55296E-13| +| 3| 0.439836 +i* -0.898078| 1|-3.55927E-13 +i*-1.21738E-13| +| 4| 0.38266 +i* -0.923889| 1|-2.56142E-13 +i*-7.02285E-14| +| 5| -0.988496 +i* 0.15125| 1|-1.52652E-13 +i*-1.11329E-13| +| 6| 0.641421 +i* 0.767189| 1|-1.31044E-13 +i* 5.61736E-13| +| 7| 0.323979 +i* -0.946064| 1|-4.52336E-13 +i* 8.74596E-14| +| 8| -0.977067 +i* 0.212932| 1| 8.58341E-14 +i* 1.73412E-13| +| 9| 0.688262 +i* 0.725462| 1| 4.28754E-14 +i* 1.08849E-12| +| 10| 0.264022 +i* -0.964517| 1|-3.63883E-13 +i*-8.14886E-14| +| 11| -0.961793 +i* 0.273776| 1| -3.0213E-13 +i*-2.13897E-13| +| 12| 0.732395 +i* 0.68088| 1|-3.65194E-14 +i* 7.95483E-13| +| 13| 0.203027 +i* -0.979173| 1|-3.14502E-13 +i* 2.96924E-13| +| 14| -0.942735 +i* 0.333543| 1| 1.82947E-13 +i*-4.73458E-14| +| 15| 0.773646 +i* 0.633619| 1| 2.24352E-13 +i* 2.79674E-13| +| 16| 0.141232 +i* -0.989977| 1| -1.0035E-13 +i* 1.5693E-13| +| 17| -0.919967 +i* 0.391997| 1| 2.89213E-14 +i*-1.86252E-13| +| 18| 0.811852 +i* 0.583864| 1|-1.59939E-12 +i*-4.13669E-13| +| 19| 0.0788818 +i* -0.996884| 1|-2.83003E-13 +i* 1.04711E-13| +| 20| -0.893578 +i* 0.448908| 1| 4.59736E-14 +i* 1.31414E-13| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 1 +proc 0 +proc 1 +proc 2 +proc 3 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 3, start 600000 size 200000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 1, start 200000 size 200000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 2, start 400000 size 200000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 200000 +proc 1 start 200000 size 200000 +proc 2 start 400000 size 200000 +proc 3 start 600000 size 200000 +proc 0 start 0 size 200000 +iter : 1 Arret : 3.03518E-06 s/iter 34.128856 +iter : 2 Arret : 3.06784E-06 s/iter 34.090727 +iter : 3 Arret : 3.06891E-06 s/iter 34.094241 +iter : 4 Arret : 2.95036E-06 s/iter 34.084829 +iter : 5 Arret : 2.99138E-06 s/iter 34.097352 +iter : 6 Arret : 3.04517E-06 s/iter 34.105084 +iter : 7 Arret : 3.18905E-06 s/iter 34.137020 +iter : 8 Arret : 3.30369E-06 s/iter 34.092524 +iter : 9 Arret : 4.0676E-06 s/iter 34.099620 +iter : 10 Arret : 8.80539E-06 s/iter 34.123961 +iter : 11 Arret : 0.000853991 s/iter 34.124027 +iter : 12 Arret : 0.000833381 s/iter 39.333820 +iter : 13 Arret : 2.00076 s/iter 34.135418 +iter : 14 Arret : 1.04464 s/iter 39.211608 +iter : 15 Arret : 0.956436 s/iter 35.763699 +iter : 16 Arret : 1.05412 s/iter 34.269226 +iter : 17 Arret : 0.887869 s/iter 32.651104 +iter : 18 Arret : 2.49443 s/iter 39.662531 +iter : 19 Arret : 0.0130108 s/iter 30.564624 +iter : 20 Arret : 0.0127308 s/iter 29.378733 +iter : 21 Arret : 0.00448902 s/iter 28.875435 +iter : 22 Arret : 0.0025421 s/iter 27.743883 +iter : 23 Arret : 0.000929422 s/iter 25.969572 +iter : 24 Arret : 4.42165E-05 s/iter 25.190779 +iter : 25 Arret : 1.79364E-05 s/iter 23.938702 +iter : 26 Arret : 5.68442E-06 s/iter 23.601870 +iter : 27 Arret : 4.0515E-07 s/iter 23.613905 +iter : 28 Arret : 2.68075E-10 s/iter 23.702620 +iter : 29 Arret : 6.86635E-16 s/iter 23.681104 +temps : 917.174 seconde(s) diff --git a/Simulations/full_mpi/full_mpi_4GPU.sge b/Simulations/full_mpi/full_mpi_4GPU.sge new file mode 100755 index 0000000..dafa0cf --- /dev/null +++ b/Simulations/full_mpi/full_mpi_4GPU.sge @@ -0,0 +1,25 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=4 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -V +#$ -cwd +#$ -N full_mpi_4GPU +#$ -pe mpi 4 + + +module load cuda/7.0 +module load ompi/gcc + +mpirun -np $NSLOTS ./template -r -i 60000 40000 +mpirun -np $NSLOTS ./template -r -i 150000 50000 +mpirun -np $NSLOTS ./template -r -i 250000 150000 +mpirun -np $NSLOTS ./template -r -i 350000 250000 +mpirun -np $NSLOTS ./template -r -i 500000 300000 +mpirun -np $NSLOTS ./template -r -i 600000 400000 +mpirun -np $NSLOTS ./template -r -i 700000 500000 +mpirun -np $NSLOTS ./template -r -i 800000 600000 +mpirun -np $NSLOTS ./template -r -i 900000 700000 +mpirun -np $NSLOTS ./template -r -i 1000000 800000 +mpirun -np $NSLOTS ./template -r -i 1500000 500000 diff --git a/Simulations/full_mpi_bis/full_mpi_1GPU.o140351 b/Simulations/full_mpi_bis/full_mpi_1GPU.o140351 new file mode 100644 index 0000000..e5994d4 --- /dev/null +++ b/Simulations/full_mpi_bis/full_mpi_1GPU.o140351 @@ -0,0 +1,573 @@ +REMAINING: 1 +Taking GPU #3 +proc 0 +zone limite de 'log-exp' 1.00356 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 0, start 0 size 100096 +proc 0 start 0 size 100096 +iter : 1 Arret : 2.57124E-05 s/iter 2.159876 +iter : 2 Arret : 2.45005E-05 s/iter 2.159265 +iter : 3 Arret : 2.39829E-05 s/iter 2.159267 +iter : 4 Arret : 2.46334E-05 s/iter 2.159223 +iter : 5 Arret : 2.36504E-05 s/iter 2.159218 +iter : 6 Arret : 2.48396E-05 s/iter 2.159305 +iter : 7 Arret : 2.76062E-05 s/iter 2.159351 +iter : 8 Arret : 3.59957E-05 s/iter 2.159303 +iter : 9 Arret : 0.000531126 s/iter 2.159380 +iter : 10 Arret : 0.00197252 s/iter 2.159496 +iter : 11 Arret : 0.00158765 s/iter 2.159268 +iter : 12 Arret : 0.247795 s/iter 2.159256 +iter : 13 Arret : 1.55484 s/iter 2.371449 +iter : 14 Arret : 0.00731985 s/iter 2.158830 +iter : 15 Arret : 0.00394835 s/iter 2.152148 +iter : 16 Arret : 0.00432084 s/iter 2.146166 +iter : 17 Arret : 0.0035879 s/iter 1.230891 +iter : 18 Arret : 0.00202383 s/iter 0.906115 +iter : 19 Arret : 0.00146188 s/iter 0.895430 +iter : 20 Arret : 0.0030635 s/iter 0.894637 +iter : 21 Arret : 0.0186656 s/iter 0.903878 +iter : 22 Arret : 0.0416525 s/iter 2.218711 +iter : 23 Arret : 0.0160884 s/iter 1.979886 +iter : 24 Arret : 0.0114388 s/iter 1.934919 +iter : 25 Arret : 0.022992 s/iter 2.001234 +iter : 26 Arret : 0.00173685 s/iter 0.903897 +iter : 27 Arret : 0.00166066 s/iter 0.894054 +iter : 28 Arret : 0.00173218 s/iter 0.897927 +iter : 29 Arret : 0.00199788 s/iter 0.911160 +iter : 30 Arret : 0.00168642 s/iter 0.892173 +iter : 31 Arret : 0.000952047 s/iter 0.894389 +iter : 32 Arret : 0.000313822 s/iter 0.893952 +iter : 33 Arret : 3.28903E-05 s/iter 0.898839 +iter : 34 Arret : 3.40913E-05 s/iter 0.902159 +iter : 35 Arret : 3.18794E-05 s/iter 0.885296 +iter : 36 Arret : 4.81227E-06 s/iter 0.892958 +iter : 37 Arret : 1.31242E-09 s/iter 0.894199 +iter : 38 Arret : 1.94667E-14 s/iter 0.907347 +temps : 59.5799 seconde(s) +Nb iterations : 38 +Nb de depassements de capacite exponentielle : 0 +Precision : 8.34887E-10 +Stabilite : 1.94667E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540601 +i* 0.841279| 1| -4.3885E-14 +i*-7.30839E-15| +| 2| -0.281748 +i* -0.959489| 1|-5.73395E-14 +i*-4.24574E-14| +| 3|-4.71234E-05 +i* 1| 1| 8.60423E-16 +i* 1.94809E-15| +| 4| 0.281778 +i* -0.95948| 1|-1.23963E-14 +i* 1.02314E-14| +| 5| -0.54068 +i* 0.841228| 1| 5.53932E-14 +i*-7.48533E-15| +| 6| 0.75578 +i* -0.654825| 1|-1.78253E-13 +i* 5.35631E-14| +| 7| -0.909652 +i* 0.415372| 1|-2.24577E-14 +i*-2.99309E-14| +| 8| 0.989828 +i* -0.142268| 1|-1.55837E-13 +i* 5.3703E-13| +| 9| -0.989815 +i* -0.142361| 1| 4.10505E-14 +i* 1.22957E-14| +| 10| 0.909612 +i* 0.415458| 1|-9.85774E-14 +i* 2.25852E-13| +| 11| -0.755719 +i* -0.654896| 1|-4.50195E-14 +i* 3.70867E-14| +| 12| 0.540548 +i* 0.841313| 1| 1.15279E-13 +i*-6.26114E-14| +| 13| -0.281687 +i* -0.959506| 1| 6.72067E-14 +i*-1.86153E-14| +| 14|-0.000109955 +i* 1| 1| 1.79023E-14 +i* 5.46507E-14| +| 15| 0.281838 +i* -0.959462| 1|-5.44356E-14 +i* 4.87822E-14| +| 16| -0.540733 +i* 0.841194| 1| 1.93526E-14 +i* 3.41446E-14| +| 17| 0.755822 +i* -0.654778| 1| 1.41439E-13 +i* 1.77344E-13| +| 18| -0.909678 +i* 0.415315| 1| 3.90799E-14 +i* 2.50217E-14| +| 19| 0.989837 +i* -0.142206| 1| 1.87558E-13 +i*-4.17969E-13| +| 20| -0.989806 +i* -0.142424| 1|-4.45512E-14 +i*-1.49828E-14| ++---+----------------------------+------------+----------------------------+ +100000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00178 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 0, start 0 size 200192 +proc 0 start 0 size 200192 +iter : 1 Arret : 1.19577E-05 s/iter 8.522040 +iter : 2 Arret : 1.18507E-05 s/iter 8.485238 +iter : 3 Arret : 1.14926E-05 s/iter 8.496162 +iter : 4 Arret : 1.1843E-05 s/iter 8.514133 +iter : 5 Arret : 1.16132E-05 s/iter 8.490152 +iter : 6 Arret : 1.20299E-05 s/iter 8.489505 +iter : 7 Arret : 1.29547E-05 s/iter 8.484424 +iter : 8 Arret : 1.56044E-05 s/iter 8.492668 +iter : 9 Arret : 2.79641E-05 s/iter 8.495207 +iter : 10 Arret : 0.000384812 s/iter 8.504677 +iter : 11 Arret : 0.00189433 s/iter 8.492448 +iter : 12 Arret : 1.42613 s/iter 8.503569 +iter : 13 Arret : 0.362747 s/iter 9.006349 +iter : 14 Arret : 0.0667832 s/iter 8.952271 +iter : 15 Arret : 0.0268254 s/iter 8.939640 +iter : 16 Arret : 0.00407931 s/iter 8.450261 +iter : 17 Arret : 0.00185579 s/iter 8.435865 +iter : 18 Arret : 0.000960313 s/iter 8.407624 +iter : 19 Arret : 0.000563292 s/iter 8.160915 +iter : 20 Arret : 0.000141206 s/iter 8.091496 +iter : 21 Arret : 7.13547E-05 s/iter 8.083957 +iter : 22 Arret : 0.000381432 s/iter 8.127284 +iter : 23 Arret : 0.0129992 s/iter 8.205428 +iter : 24 Arret : 0.0126853 s/iter 8.300228 +iter : 25 Arret : 0.000213679 s/iter 8.166408 +iter : 26 Arret : 4.37206E-05 s/iter 8.112350 +iter : 27 Arret : 4.21984E-05 s/iter 8.074991 +iter : 28 Arret : 1.6149E-05 s/iter 8.082737 +iter : 29 Arret : 1.07878E-06 s/iter 8.076879 +iter : 30 Arret : 2.95387E-10 s/iter 8.118469 +iter : 31 Arret : 2.55593E-15 s/iter 8.124712 +temps : 260.107 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.64385E-09 +Stabilite : 2.55593E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540465 +i* 0.841367| 1| 1.87479E-13 +i*-5.02237E-14| +| 2| 0.176081 +i* -0.984376| 1|-5.37799E-14 +i* 6.92554E-14| +| 3| -0.852009 +i* -0.523527| 1| 3.18461E-14 +i* 4.03913E-14| +| 4| -0.79862 +i* 0.601836| 1| 5.14346E-14 +i* 3.91354E-14| +| 5| 0.980657 +i* -0.195736| 1| 6.46188E-13 +i*-7.37166E-13| +| 6| 0.268452 +i* 0.963293| 1|-8.54421E-14 +i* 3.23248E-14| +| 7| 0.458412 +i* -0.88874| 1| 2.7818E-14 +i* 6.11247E-14| +| 8| -0.659865 +i* -0.751385| 1| 2.17222E-14 +i*-1.50038E-13| +| 9| 0.994783 +i* 0.102018| 1| 6.80962E-13 +i*-1.84925E-12| +| 10| -0.940535 +i* 0.339697| 1| 2.92266E-14 +i* 1.23877E-14| +| 11| -0.0274147 +i* 0.999624| 1|-2.15418E-14 +i* -6.3281E-14| +| 12| 0.70001 +i* -0.714133| 1| 5.4335E-14 +i* -1.5535E-13| +| 13| 0.920515 +i* 0.390707| 1|-2.49037E-13 +i*-1.72111E-13| +| 14| -0.409013 +i* -0.912529| 1|-5.60801E-14 +i* 3.37699E-14| +| 15| -0.998877 +i* 0.047373| 1|-3.52392E-14 +i*-1.99354E-14| +| 16| -0.320845 +i* 0.947132| 1| 1.35437E-13 +i* 4.41019E-14| +| 17| 0.764454 +i* 0.644679| 1|-2.19425E-13 +i* -1.9223E-13| +| 18| 0.879407 +i* -0.47607| 1| 3.13968E-13 +i*-3.31275E-13| +| 19| -0.121864 +i* -0.992547| 1| 1.45647E-13 +i* 1.68268E-16| +| 20| -0.968462 +i* -0.24916| 1| 5.32629E-14 +i* 1.07952E-14| ++---+----------------------------+------------+----------------------------+ +200000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00089 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 0, start 0 size 400128 +proc 0 start 0 size 400128 +iter : 1 Arret : 6.81139E-06 s/iter 33.032996 +iter : 2 Arret : 6.06103E-06 s/iter 33.015096 +iter : 3 Arret : 5.93507E-06 s/iter 33.005369 +iter : 4 Arret : 5.92314E-06 s/iter 33.004657 +iter : 5 Arret : 5.92649E-06 s/iter 32.980033 +iter : 6 Arret : 5.78169E-06 s/iter 32.990352 +iter : 7 Arret : 5.94971E-06 s/iter 32.954192 +iter : 8 Arret : 6.19093E-06 s/iter 32.991129 +iter : 9 Arret : 6.32363E-06 s/iter 33.026221 +iter : 10 Arret : 1.54616E-05 s/iter 32.987263 +iter : 11 Arret : 0.00173932 s/iter 32.958812 +iter : 12 Arret : 0.00609254 s/iter 33.307167 +iter : 13 Arret : 0.00641692 s/iter 33.125638 +iter : 14 Arret : 0.00422127 s/iter 33.201310 +iter : 15 Arret : 0.2325 s/iter 33.016109 +iter : 16 Arret : 0.661386 s/iter 32.931174 +iter : 17 Arret : 0.391113 s/iter 34.017744 +iter : 18 Arret : 0.0847938 s/iter 33.202072 +iter : 19 Arret : 0.0429007 s/iter 34.565508 +iter : 20 Arret : 0.0386724 s/iter 37.182121 +iter : 21 Arret : 0.0200606 s/iter 36.684337 +iter : 22 Arret : 0.0153609 s/iter 32.948029 +iter : 23 Arret : 0.0123135 s/iter 34.090465 +iter : 24 Arret : 0.00975591 s/iter 36.698390 +iter : 25 Arret : 0.00938908 s/iter 36.054373 +iter : 26 Arret : 0.0642206 s/iter 34.102047 +iter : 27 Arret : 0.435754 s/iter 33.200030 +iter : 28 Arret : 0.710465 s/iter 33.054960 +iter : 29 Arret : 0.0884008 s/iter 33.137682 +iter : 30 Arret : 0.00601235 s/iter 33.067903 +iter : 31 Arret : 0.000106392 s/iter 32.965130 +iter : 32 Arret : 0.000107693 s/iter 32.986111 +iter : 33 Arret : 6.85378E-05 s/iter 32.989838 +iter : 34 Arret : 3.93845E-05 s/iter 32.899698 +iter : 35 Arret : 4.83198E-06 s/iter 32.935500 +iter : 36 Arret : 3.8562E-06 s/iter 32.899226 +iter : 37 Arret : 3.12033E-06 s/iter 32.874657 +iter : 38 Arret : 1.60088E-07 s/iter 32.989440 +iter : 39 Arret : 1.0643E-11 s/iter 32.879179 +iter : 40 Arret : 1.11022E-16 s/iter 32.998282 +temps : 1340.32 seconde(s) +Nb iterations : 40 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.12993E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540383 +i* 0.841419| 1| 1.25143E-14 +i* 6.97793E-14| +| 2| -0.98885 +i* 0.148913| 1|-1.87034E-13 +i*-1.52024E-13| +| 3| 0.412505 +i* -0.910956| 1|-2.05679E-13 +i* 8.74266E-14| +| 4| 0.268615 +i* -0.963248| 1| 1.23929E-14 +i* 2.02841E-14| +| 5| -0.954531 +i* 0.298113| 1| 6.68562E-14 +i* 8.87016E-14| +| 6| 0.769081 +i* 0.639152| 1|-2.56017E-13 +i* 6.90161E-13| +| 7| 0.11843 +i* -0.992962| 1| -1.5522E-13 +i* 8.29944E-14| +| 8| -0.897838 +i* 0.440326| 1|-2.57121E-14 +i* 6.84192E-14| +| 9| 0.857632 +i* 0.514263| 1| 7.84754E-13 +i* 2.86151E-13| +| 10| -0.0345309 +i* -0.999404| 1|-3.27058E-13 +i* 9.31755E-14| +| 11| 0.662503 +i* 0.74906| 1| 7.42843E-14 +i*-6.06277E-13| +| 12| -0.820101 +i* 0.572218| 1|-4.91863E-14 +i*-2.00555E-13| +| 13| -0.186683 +i* -0.98242| 1| -1.8106E-13 +i* 3.61083E-14| +| 14| 0.926088 +i* 0.377307| 1| 6.5396E-13 +i* 7.07941E-13| +| 15| -0.723143 +i* 0.690699| 1|-1.75058E-13 +i* 1.33799E-14| +| 16| -0.334459 +i* -0.94241| 1| 2.20716E-13 +i*-8.68958E-14| +| 17| 0.97283 +i* 0.23152| 1|-1.36773E-13 +i*-4.46509E-13| +| 18| -0.609235 +i* 0.79299| 1|-8.90538E-14 +i* 1.42372E-13| +| 19| -0.474396 +i* -0.880312| 1| 2.76109E-13 +i* 7.19095E-14| +| 20| 0.99677 +i* 0.0803066| 1| 1.32664E-12 +i*-5.68624E-12| ++---+----------------------------+------------+----------------------------+ +400000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 600064 +proc 0 start 0 size 600064 +iter : 1 Arret : 5.03443E-06 s/iter 73.696929 +iter : 2 Arret : 4.61584E-06 s/iter 73.771737 +iter : 3 Arret : 4.97785E-06 s/iter 73.915402 +iter : 4 Arret : 5.01515E-06 s/iter 74.050809 +iter : 5 Arret : 5.02386E-06 s/iter 74.014277 +iter : 6 Arret : 4.99324E-06 s/iter 74.016897 +iter : 7 Arret : 4.90554E-06 s/iter 73.958392 +iter : 8 Arret : 4.38936E-06 s/iter 73.839302 +iter : 9 Arret : 6.21887E-06 s/iter 73.927269 +iter : 10 Arret : 0.000108223 s/iter 73.865281 +iter : 11 Arret : 0.000411941 s/iter 73.854431 +iter : 12 Arret : 0.000623661 s/iter 74.029655 +iter : 13 Arret : 1.80723 s/iter 73.811829 +iter : 14 Arret : 0.102793 s/iter 74.088517 +iter : 15 Arret : 0.0532764 s/iter 74.812682 +iter : 16 Arret : 0.0261347 s/iter 73.818984 +iter : 17 Arret : 0.0156151 s/iter 73.751168 +iter : 18 Arret : 0.00966403 s/iter 73.685324 +iter : 19 Arret : 0.00585551 s/iter 73.712934 +iter : 20 Arret : 0.00418415 s/iter 73.374676 +iter : 21 Arret : 0.026185 s/iter 74.284150 +iter : 22 Arret : 0.0439678 s/iter 73.991674 +iter : 23 Arret : 0.00925561 s/iter 73.914083 +iter : 24 Arret : 0.0124615 s/iter 74.159142 +iter : 25 Arret : 0.0315205 s/iter 74.142722 +iter : 26 Arret : 0.0321732 s/iter 74.311005 +iter : 27 Arret : 0.0105212 s/iter 73.453333 +iter : 28 Arret : 0.00485509 s/iter 73.717891 +iter : 29 Arret : 0.000470819 s/iter 73.323142 +iter : 30 Arret : 0.00110535 s/iter 73.429113 +iter : 31 Arret : 0.000637739 s/iter 73.538252 +iter : 32 Arret : 0.00062533 s/iter 73.285690 +iter : 33 Arret : 0.00316706 s/iter 73.428711 +iter : 34 Arret : 0.00477625 s/iter 73.330301 +iter : 35 Arret : 0.000753017 s/iter 73.590922 +iter : 36 Arret : 0.000462137 s/iter 73.646608 +iter : 37 Arret : 3.49599E-05 s/iter 73.278894 +iter : 38 Arret : 3.93073E-06 s/iter 73.310440 +iter : 39 Arret : 1.18018E-07 s/iter 73.398618 +iter : 40 Arret : 7.61643E-12 s/iter 73.261412 +iter : 41 Arret : 1.11022E-16 s/iter 73.471338 +temps : 3024.78 seconde(s) +Nb iterations : 41 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.996672 +i* 0.0815122| 1|-4.60361E-14 +i*-1.54911E-15| +| 3| 0.396458 +i* -0.918053| 1|-3.61742E-13 +i* 4.28426E-13| +| 4| -0.983009 +i* 0.183558| 1| 2.27839E-14 +i* 1.21547E-13| +| 5| 0.299962 +i* -0.953951| 1| 3.10155E-13 +i*-4.52272E-13| +| 6| 0.701062 +i* 0.7131| 1| 6.08482E-13 +i* 3.68603E-13| +| 7| -0.958925 +i* 0.283658| 1|-3.43857E-14 +i*-4.33108E-14| +| 8| 0.200287 +i* -0.979737| 1| 4.39829E-13 +i*-3.61119E-13| +| 9| 0.770667 +i* 0.637238| 1| -2.7036E-13 +i*-8.38747E-13| +| 10| -0.924677 +i* 0.380752| 1| 1.44957E-13 +i* 1.13251E-13| +| 11| 0.0984885 +i* -0.995138| 1| 3.5235E-13 +i*-2.31698E-13| +| 12| 0.832104 +i* 0.55462| 1| 8.49546E-13 +i* -8.3842E-13| +| 13| -0.880627 +i* 0.473809| 1|-9.58227E-14 +i* -1.6529E-13| +| 14| -0.0043537 +i* -0.999991| 1| 1.63446E-13 +i*-5.45449E-14| +| 15| 0.88472 +i* 0.466123| 1| -6.8268E-13 +i* -3.8889E-13| +| 16| 0.624025 +i* 0.781404| 1| 9.47506E-15 +i*-6.78554E-13| +| 17| -0.827243 +i* 0.561844| 1|-1.79082E-13 +i*-3.05719E-13| +| 18| -0.10715 +i* -0.994243| 1| 3.32474E-13 +i*-4.57395E-14| +| 19| 0.927958 +i* 0.372686| 1| 1.0255E-13 +i* 1.0692E-13| +| 20| -0.765083 +i* 0.643932| 1| 3.06144E-14 +i*-3.59443E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 800000 +proc 0 start 0 size 800000 +iter : 1 Arret : 3.0223E-06 s/iter 130.910451 +iter : 2 Arret : 3.05312E-06 s/iter 130.776649 +iter : 3 Arret : 2.97193E-06 s/iter 131.189959 +iter : 4 Arret : 3.38837E-06 s/iter 130.938921 +iter : 5 Arret : 3.11255E-06 s/iter 131.156592 +iter : 6 Arret : 3.03853E-06 s/iter 130.803128 +iter : 7 Arret : 3.14049E-06 s/iter 131.179805 +iter : 8 Arret : 3.18043E-06 s/iter 131.407983 +iter : 9 Arret : 3.76919E-06 s/iter 130.828589 +iter : 10 Arret : 6.64299E-06 s/iter 130.912457 +iter : 11 Arret : 0.000184934 s/iter 130.849476 +iter : 12 Arret : 0.00113133 s/iter 130.609739 +iter : 13 Arret : 0.75957 s/iter 131.109558 +iter : 14 Arret : 0.969861 s/iter 130.735075 +iter : 15 Arret : 2.30034 s/iter 131.282231 +iter : 16 Arret : 0.0222707 s/iter 130.482018 +iter : 17 Arret : 0.0120899 s/iter 130.435161 +iter : 18 Arret : 0.00213689 s/iter 130.113007 +iter : 19 Arret : 0.00216319 s/iter 130.119966 +iter : 20 Arret : 0.00191413 s/iter 130.688058 +iter : 21 Arret : 0.000561228 s/iter 130.127500 +iter : 22 Arret : 0.00080725 s/iter 130.113179 +iter : 23 Arret : 0.000942131 s/iter 130.109476 +iter : 24 Arret : 0.000121077 s/iter 130.137272 +iter : 25 Arret : 6.87574E-05 s/iter 130.098610 +iter : 26 Arret : 1.12148E-05 s/iter 130.139358 +iter : 27 Arret : 1.91953E-05 s/iter 130.166965 +iter : 28 Arret : 1.46847E-05 s/iter 130.137866 +iter : 29 Arret : 2.25755E-06 s/iter 130.165937 +iter : 30 Arret : 7.71791E-08 s/iter 130.157443 +iter : 31 Arret : 5.12239E-12 s/iter 130.161648 +iter : 32 Arret : 1.57009E-16 s/iter 130.091430 +temps : 4178.79 seconde(s) +Nb iterations : 32 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| -0.942555 +i* -0.334052| 1| 2.1929E-13 +i*-2.49686E-13| +| 3| -0.558601 +i* 0.829437| 1|-3.51628E-14 +i*-4.09232E-13| +| 4| -0.0665975 +i* -0.99778| 1|-3.91888E-13 +i* 9.06636E-14| +| 5| 0.949627 +i* -0.313383| 1|-1.12544E-12 +i* 2.13597E-12| +| 6| -0.982853 +i* -0.184391| 1| 8.57613E-14 +i* 1.33506E-13| +| 7| 0.889798 +i* -0.456354| 1| 1.27488E-12 +i* 5.17779E-13| +| 8| -0.423729 +i* 0.905789| 1|-7.25461E-15 +i*-1.33088E-14| +| 9| -0.219973 +i* -0.975506| 1| 4.34097E-13 +i*-4.24712E-14| +| 10| 0.771464 +i* 0.636273| 1| -4.4266E-13 +i*-2.07773E-13| +| 11| -0.999541 +i* -0.0303078| 1| 3.54265E-14 +i* 1.32862E-14| +| 12| 0.808597 +i* -0.588363| 1|-5.90212E-13 +i*-1.43182E-12| +| 13| 0.663883 +i* 0.747836| 1| 4.13159E-13 +i* 1.10149E-12| +| 14| -0.27868 +i* 0.960384| 1|-1.03539E-13 +i*-1.45998E-13| +| 15| -0.368064 +i* -0.929801| 1| 4.60916E-14 +i*-1.09841E-13| +| 16| -0.992219 +i* 0.124503| 1| 2.74294E-13 +i* 2.11383E-13| +| 17| 0.707973 +i* -0.706239| 1|-1.10575E-12 +i*-7.41631E-13| +| 18| 0.860514 +i* 0.509426| 1| 9.86579E-13 +i* 1.10532E-12| +| 19| -0.126936 +i* 0.991911| 1| 1.67744E-13 +i* 5.51772E-13| +| 20| -0.507314 +i* -0.861761| 1| 5.50185E-14 +i* 3.42273E-13| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00035 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 0, start 0 size 1000192 +proc 0 start 0 size 1000192 +iter : 1 Arret : 2.73502E-06 s/iter 204.279286 +iter : 2 Arret : 2.44464E-06 s/iter 204.498903 +iter : 3 Arret : 2.9324E-06 s/iter 204.374941 +iter : 4 Arret : 2.98966E-06 s/iter 204.075626 +iter : 5 Arret : 2.61797E-06 s/iter 203.959656 +iter : 6 Arret : 2.4979E-06 s/iter 203.988927 +iter : 7 Arret : 2.51762E-06 s/iter 204.231126 +iter : 8 Arret : 2.58671E-06 s/iter 204.166994 +iter : 9 Arret : 2.90834E-06 s/iter 204.332702 +iter : 10 Arret : 4.27749E-06 s/iter 204.314957 +iter : 11 Arret : 5.07307E-05 s/iter 203.530475 +iter : 12 Arret : 0.000123753 s/iter 204.108996 +iter : 13 Arret : 0.000131719 s/iter 204.098813 +iter : 14 Arret : 0.0021029 s/iter 204.342794 +iter : 15 Arret : 1.57047 s/iter 204.198189 +iter : 16 Arret : 0.0813952 s/iter 206.610273 +iter : 17 Arret : 0.0433113 s/iter 206.520683 +iter : 18 Arret : 0.0270058 s/iter 206.275171 +iter : 19 Arret : 0.0276935 s/iter 206.479388 +iter : 20 Arret : 0.0378979 s/iter 207.701222 +iter : 21 Arret : 0.0313855 s/iter 207.827615 +iter : 22 Arret : 0.0233655 s/iter 208.441193 +iter : 23 Arret : 0.0287783 s/iter 208.089309 +iter : 24 Arret : 0.100552 s/iter 207.729643 +iter : 25 Arret : 0.102695 s/iter 210.217294 +iter : 26 Arret : 0.02599 s/iter 207.019354 +iter : 27 Arret : 0.00608491 s/iter 209.059541 +iter : 28 Arret : 0.00162589 s/iter 208.815464 +iter : 29 Arret : 0.00099098 s/iter 206.703004 +iter : 30 Arret : 0.000945613 s/iter 206.381661 +iter : 31 Arret : 0.00119593 s/iter 206.382920 +iter : 32 Arret : 0.000135248 s/iter 206.201614 +iter : 33 Arret : 4.70878E-05 s/iter 206.372532 +iter : 34 Arret : 2.28065E-05 s/iter 206.465031 +iter : 35 Arret : 5.77295E-05 s/iter 206.597149 +iter : 36 Arret : 3.67008E-05 s/iter 206.794068 +iter : 37 Arret : 1.74792E-05 s/iter 206.834265 +iter : 38 Arret : 4.82238E-06 s/iter 206.391187 +iter : 39 Arret : 2.30742E-06 s/iter 206.223089 +iter : 40 Arret : 7.43635E-08 s/iter 206.381485 +iter : 41 Arret : 6.21299E-13 s/iter 206.681826 +temps : 8448.53 seconde(s) +Nb iterations : 41 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.80137E-07 +Stabilite : 6.21299E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54034 +i* 0.841447| 1| 4.08253E-13 +i*-6.65317E-13| +| 2| -0.513915 +i* -0.857841| 1|-9.07486E-13 +i* 1.86417E-13| +| 3| 0.486982 +i* 0.873412| 1|-6.63601E-14 +i*-1.18344E-12| +| 4| -0.459589 +i* -0.888132| 1|-5.16153E-13 +i*-2.68006E-13| +| 5| 0.43174 +i* 0.901998| 1|-6.77361E-13 +i* 7.93272E-13| +| 6| -0.403485 +i* -0.914986| 1|-3.20004E-13 +i* 2.65225E-13| +| 7| 0.374828 +i* 0.927094| 1| 3.65041E-13 +i* 3.54812E-13| +| 8| -0.345815 +i* -0.938303| 1| 5.50778E-13 +i* 8.9059E-14| +| 9| 0.316466 +i* 0.948604| 1|-2.87419E-13 +i* 5.21678E-13| +| 10| -0.286806 +i* -0.957989| 1|-2.69538E-13 +i* 2.95529E-13| +| 11| 0.25688 +i* 0.966443| 1|-4.31814E-13 +i* 5.6624E-13| +| 12| -0.226699 +i* -0.973965| 1| 4.35089E-13 +i* -6.6197E-14| +| 13| 0.196299 +i* 0.980544| 1| 3.90278E-14 +i*-7.14062E-13| +| 14| -0.16571 +i* -0.986175| 1| 2.49276E-13 +i*-1.75918E-13| +| 15| 0.13496 +i* 0.990851| 1| 1.03566E-13 +i*-6.61428E-13| +| 16| -0.104079 +i* -0.994569| 1| 7.90108E-13 +i*-1.74942E-13| +| 17| 0.0730977 +i* 0.997325| 1| 1.11931E-13 +i* 4.68587E-13| +| 18| -0.0420456 +i* -0.999116| 1| 2.29268E-13 +i*-1.21795E-14| +| 19| 0.0109529 +i* 0.99994| 1|-2.47309E-13 +i*-7.90307E-13| +| 20| 0.0201504 +i* -0.999797| 1| 6.69503E-13 +i*-2.16847E-13| ++---+----------------------------+------------+----------------------------+ +1000000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.0003 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 0, start 0 size 1200128 +proc 0 start 0 size 1200128 +iter : 1 Arret : 2.4754E-06 s/iter 294.181649 +iter : 2 Arret : 2.55346E-06 s/iter 294.312460 +iter : 3 Arret : 2.19653E-06 s/iter 293.897603 +iter : 4 Arret : 2.15762E-06 s/iter 293.179922 +iter : 5 Arret : 2.17822E-06 s/iter 293.072674 +iter : 6 Arret : 2.02989E-06 s/iter 293.272996 +iter : 7 Arret : 2.03558E-06 s/iter 293.858388 +iter : 8 Arret : 2.41822E-06 s/iter 294.218898 +iter : 9 Arret : 2.30694E-06 s/iter 294.061104 +iter : 10 Arret : 8.15704E-06 s/iter 294.067083 +iter : 11 Arret : 4.27575E-05 s/iter 293.122401 +iter : 12 Arret : 0.00227073 s/iter 293.366596 +iter : 13 Arret : 0.000832685 s/iter 297.997094 +iter : 14 Arret : 0.000890514 s/iter 297.007020 +iter : 15 Arret : 0.0876147 s/iter 294.457487 +iter : 16 Arret : 1.31578 s/iter 297.437556 +iter : 17 Arret : 0.0429794 s/iter 295.107633 +iter : 18 Arret : 0.0308472 s/iter 296.336437 +iter : 19 Arret : 0.0219224 s/iter 296.183862 +iter : 20 Arret : 0.0173264 s/iter 295.691127 +iter : 21 Arret : 0.0681916 s/iter 299.846405 +iter : 22 Arret : 0.16453 s/iter 300.455513 +iter : 23 Arret : 0.259379 s/iter 298.873861 +iter : 24 Arret : 0.133491 s/iter 298.480044 +iter : 25 Arret : 0.0906637 s/iter 297.372981 +iter : 26 Arret : 0.0535533 s/iter 296.127023 +iter : 27 Arret : 0.0520641 s/iter 293.474277 +iter : 28 Arret : 0.0265199 s/iter 294.979085 +iter : 29 Arret : 0.00979862 s/iter 293.527378 +iter : 30 Arret : 0.000786488 s/iter 291.877183 +iter : 31 Arret : 5.11539E-05 s/iter 292.065401 +iter : 32 Arret : 1.82435E-06 s/iter 292.152352 +iter : 33 Arret : 3.41709E-08 s/iter 292.070505 +iter : 34 Arret : 3.9427E-13 s/iter 291.989170 +temps : 10029.1 seconde(s) +Nb iterations : 34 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.34152E-07 +Stabilite : 3.9427E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.841451| 1|-1.40868E-12 +i*-1.55069E-13| +| 2| -0.583871 +i* 0.811846| 1| 5.87586E-14 +i* 2.63177E-13| +| 3| 0.0263196 +i* -0.999654| 1| 9.89594E-13 +i*-3.85265E-13| +| 4| -0.969647 +i* -0.244511| 1|-5.84047E-14 +i*-6.69829E-14| +| 5| 0.939323 +i* -0.343035| 1| 7.60725E-13 +i* 1.68227E-12| +| 6| -0.129097 +i* -0.991632| 1| -2.278E-13 +i*-2.09967E-13| +| 7| -0.450842 +i* 0.892604| 1| 3.34819E-13 +i* 5.30987E-13| +| 8| 0.874726 +i* -0.484618| 1| 6.94573E-13 +i* 1.33379E-12| +| 9| -0.995841 +i* -0.0911079| 1| 6.65572E-13 +i* 2.21578E-13| +| 10| 0.772266 +i* 0.635299| 1|-1.10511E-12 +i*-6.88458E-13| +| 11| -0.281387 +i* -0.959594| 1|-6.93022E-14 +i* 4.40275E-13| +| 12| -0.306893 +i* 0.951744| 1| 1.0443E-15 +i* 1.24753E-13| +| 13| 0.788944 +i* -0.614465| 1| -2.2269E-12 +i*-9.13604E-13| +| 14| -0.997918 +i* 0.0645018| 1| 2.81913E-13 +i* 2.2426E-13| +| 15| 0.861482 +i* 0.507788| 1| 2.41178E-12 +i* 5.79845E-13| +| 16| -0.426862 +i* -0.904317| 1| 6.20323E-13 +i* 5.74424E-13| +| 17| 0.664347 +i* 0.747424| 1| 4.99219E-13 +i* 1.52752E-12| +| 18| -0.155512 +i* 0.987834| 1| 2.30305E-13 +i* 4.37822E-13| +| 19| -0.975826 +i* 0.218549| 1| 1.82913E-13 +i* 5.28258E-14| +| 20| 0.684055 +i* -0.72943| 1|-1.32506E-12 +i*-1.70394E-12| ++---+----------------------------+------------+----------------------------+ +1200000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00025 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 0, start 0 size 1400064 +proc 0 start 0 size 1400064 +iter : 1 Arret : 2.15917E-06 s/iter 399.723385 +iter : 2 Arret : 1.85088E-06 s/iter 400.081884 +iter : 3 Arret : 1.77547E-06 s/iter 399.972031 +iter : 4 Arret : 1.70334E-06 s/iter 400.104702 +iter : 5 Arret : 2.04999E-06 s/iter 398.636646 +iter : 6 Arret : 1.75711E-06 s/iter 399.861327 +iter : 7 Arret : 2.07853E-06 s/iter 399.248399 +iter : 8 Arret : 2.04246E-06 s/iter 400.060464 +iter : 9 Arret : 1.77029E-06 s/iter 399.691512 +iter : 10 Arret : 2.16444E-06 s/iter 398.773864 +iter : 11 Arret : 4.00026E-05 s/iter 399.545536 +iter : 12 Arret : 0.00062797 s/iter 399.345225 +iter : 13 Arret : 0.00137915 s/iter 410.635534 +iter : 14 Arret : 0.00118537 s/iter 401.201832 +iter : 15 Arret : 0.0014988 s/iter 416.951641 +iter : 16 Arret : 0.00924381 s/iter 420.806756 +iter : 17 Arret : 0.0111252 s/iter 405.291240 +iter : 18 Arret : 0.00690489 s/iter 400.950454 +iter : 19 Arret : 0.0231913 s/iter 420.075291 +iter : 20 Arret : 0.558603 s/iter 420.972938 +iter : 21 Arret : 0.377538 s/iter 420.162170 +iter : 22 Arret : 0.0534435 s/iter 403.124652 +iter : 23 Arret : 0.016058 s/iter 401.027424 +iter : 24 Arret : 0.00747446 s/iter 415.903713 +iter : 25 Arret : 0.00321124 s/iter 398.031216 +iter : 26 Arret : 0.0189268 s/iter 399.060242 +iter : 27 Arret : 0.000769252 s/iter 398.576199 +iter : 28 Arret : 0.000237512 s/iter 397.202227 +iter : 29 Arret : 4.17772E-05 s/iter 397.561175 +iter : 30 Arret : 9.03671E-06 s/iter 397.602643 +iter : 31 Arret : 7.65256E-06 s/iter 396.777496 +iter : 32 Arret : 5.68144E-07 s/iter 397.700035 +iter : 33 Arret : 5.85116E-09 s/iter 397.976888 +iter : 34 Arret : 5.58763E-15 s/iter 396.271102 +temps : 13710 seconde(s) +Nb iterations : 34 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.63785E-07 +Stabilite : 5.58763E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540329 +i* 0.841454| 1| 4.3987E-13 +i* 1.7418E-12| +| 2| -0.0530086 +i* 0.998594| 1| 3.8728E-13 +i* 8.41422E-13| +| 3| -0.626376 +i* 0.779521| 1| 2.93654E-14 +i*-2.95439E-13| +| 4| -0.96376 +i* 0.26677| 1|-1.31943E-13 +i* 5.03167E-13| +| 5| -0.938055 +i* -0.346485| 1| 6.12451E-13 +i*-2.34033E-13| +| 6| -0.558945 +i* -0.829205| 1| 2.12923E-13 +i* 6.04209E-13| +| 7| 0.0307435 +i* -0.999527| 1|-3.70079E-13 +i* 1.04685E-13| +| 8| 0.60885 +i* -0.793286| 1| -1.5142E-12 +i* 2.45191E-13| +| 9| 0.957576 +i* -0.288179| 1|-2.69526E-12 +i* 1.63797E-12| +| 10| 0.945542 +i* 0.325501| 1|-1.50276E-12 +i* 3.84538E-13| +| 11| -0.00847209 +i* 0.999964| 1| 8.68958E-14 +i* 2.94643E-13| +| 12| -0.591029 +i* 0.80665| 1|-5.75824E-14 +i*-8.87086E-13| +| 13| -0.95092 +i* 0.309437| 1|-6.93591E-13 +i*-5.52411E-13| +| 14| -0.952559 +i* -0.304354| 1|-3.04982E-13 +i* 1.60452E-13| +| 15| -0.595328 +i* -0.803482| 1|-1.05039E-12 +i* 2.37501E-13| +| 16| -0.0138125 +i* -0.999905| 1|-8.72476E-13 +i* 2.69644E-13| +| 17| 0.572907 +i* -0.81962| 1| 1.32405E-12 +i*-6.73803E-13| +| 18| 0.943789 +i* -0.33055| 1| 1.94401E-12 +i*-8.36756E-13| +| 19| 0.959103 +i* 0.283057| 1|-2.75633E-12 +i* 3.49955E-12| +| 20| 0.613081 +i* 0.79002| 1| 4.49453E-13 +i*-4.47541E-14| ++---+----------------------------+------------+----------------------------+ +1400000 racines de module = 1 diff --git a/Simulations/full_mpi_bis/full_mpi_2GPU.o140350 b/Simulations/full_mpi_bis/full_mpi_2GPU.o140350 new file mode 100644 index 0000000..a3ae963 --- /dev/null +++ b/Simulations/full_mpi_bis/full_mpi_2GPU.o140350 @@ -0,0 +1,620 @@ +REMAINING: 2 +Taking GPU #0 +Taking GPU #1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00356 +zone limite de 'log-exp' 1.00356 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 0, start 0 size 50048 +proc 0 start 0 size 50048 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 1, start 50048 size 50048 +proc 1 start 50048 size 50048 +iter : 1 Arret : 2.54272E-05 s/iter 1.224784 +iter : 2 Arret : 2.39932E-05 s/iter 1.222242 +iter : 3 Arret : 2.30492E-05 s/iter 1.222005 +iter : 4 Arret : 2.30448E-05 s/iter 1.222506 +iter : 5 Arret : 2.36504E-05 s/iter 1.221949 +iter : 6 Arret : 2.48396E-05 s/iter 1.222824 +iter : 7 Arret : 2.76062E-05 s/iter 1.224550 +iter : 8 Arret : 3.59957E-05 s/iter 1.223351 +iter : 9 Arret : 0.000362412 s/iter 1.228701 +iter : 10 Arret : 0.000790437 s/iter 1.228129 +iter : 11 Arret : 0.00158756 s/iter 1.223561 +iter : 12 Arret : 0.247734 s/iter 1.223772 +iter : 13 Arret : 1.53144 s/iter 2.141741 +iter : 14 Arret : 0.0037855 s/iter 2.115060 +iter : 15 Arret : 0.00281732 s/iter 2.138643 +iter : 16 Arret : 0.00225403 s/iter 2.133266 +iter : 17 Arret : 0.00179177 s/iter 2.076951 +iter : 18 Arret : 0.00156427 s/iter 1.971566 +iter : 19 Arret : 0.00145078 s/iter 1.971490 +iter : 20 Arret : 0.00140889 s/iter 1.948742 +iter : 21 Arret : 0.00281494 s/iter 0.878177 +iter : 22 Arret : 0.0586086 s/iter 0.888041 +iter : 23 Arret : 0.0106937 s/iter 0.873504 +iter : 24 Arret : 0.0537105 s/iter 2.196119 +iter : 25 Arret : 0.02261 s/iter 2.192403 +iter : 26 Arret : 0.00135471 s/iter 0.884303 +iter : 27 Arret : 0.000883021 s/iter 0.882295 +iter : 28 Arret : 0.000445113 s/iter 0.884919 +iter : 29 Arret : 0.000371295 s/iter 0.885823 +iter : 30 Arret : 8.15432E-05 s/iter 0.897732 +iter : 31 Arret : 0.000123838 s/iter 0.896645 +iter : 32 Arret : 5.28388E-05 s/iter 0.886006 +iter : 33 Arret : 8.66297E-05 s/iter 0.882256 +iter : 34 Arret : 5.41229E-05 s/iter 0.884733 +iter : 35 Arret : 2.64238E-05 s/iter 0.879048 +iter : 36 Arret : 1.21433E-06 s/iter 0.885124 +iter : 37 Arret : 3.61565E-10 s/iter 0.885369 +iter : 38 Arret : 5.35474E-15 s/iter 0.885785 +temps : 49.9266 seconde(s) +Nb iterations : 38 +Nb de depassements de capacite exponentielle : 0 +Precision : 8.34887E-10 +Stabilite : 5.35474E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540601 +i* 0.841279| 1| -4.3885E-14 +i*-7.30839E-15| +| 2| -0.281748 +i* -0.959489| 1|-5.73395E-14 +i*-4.24574E-14| +| 3|-4.71234E-05 +i* 1| 1| 8.11851E-16 +i* 1.95503E-15| +| 4| 0.281778 +i* -0.95948| 1|-1.23963E-14 +i* 1.02314E-14| +| 5| -0.54068 +i* 0.841228| 1| 5.53932E-14 +i*-7.48533E-15| +| 6| 0.75578 +i* -0.654825| 1|-1.78253E-13 +i* 5.35631E-14| +| 7| -0.909652 +i* 0.415372| 1|-2.24577E-14 +i*-2.99309E-14| +| 8| 0.989828 +i* -0.142268| 1|-4.88647E-13 +i* 2.69096E-13| +| 9| -0.989815 +i* -0.142361| 1| 4.10505E-14 +i* 1.22957E-14| +| 10| 0.909612 +i* 0.415458| 1|-9.85774E-14 +i* 2.25852E-13| +| 11| -0.755719 +i* -0.654896| 1|-4.50195E-14 +i* 3.70867E-14| +| 12| 0.540548 +i* 0.841313| 1| 1.15279E-13 +i*-6.26114E-14| +| 13| -0.281687 +i* -0.959506| 1| 6.72067E-14 +i*-1.86153E-14| +| 14|-0.000109955 +i* 1| 1| 1.76317E-14 +i* 5.4734E-14| +| 15| 0.281838 +i* -0.959462| 1|-5.44356E-14 +i* 4.87822E-14| +| 16| -0.540733 +i* 0.841194| 1| 1.93526E-14 +i* 3.41446E-14| +| 17| 0.755822 +i* -0.654778| 1| 1.41439E-13 +i* 1.77344E-13| +| 18| -0.909678 +i* 0.415315| 1| 3.90799E-14 +i* 2.50217E-14| +| 19| 0.989837 +i* -0.142206| 1| 1.87558E-13 +i*-4.17969E-13| +| 20| -0.989806 +i* -0.142424| 1|-4.45512E-14 +i*-1.49828E-14| ++---+----------------------------+------------+----------------------------+ +100000 racines de module = 1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00178 +zone limite de 'log-exp' 1.00178 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 1, start 100096 size 100096 +proc 1 start 100096 size 100096 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 0, start 0 size 100096 +proc 0 start 0 size 100096 +iter : 1 Arret : 1.22107E-05 s/iter 4.322402 +iter : 2 Arret : 1.32817E-05 s/iter 4.322068 +iter : 3 Arret : 1.18476E-05 s/iter 4.332042 +iter : 4 Arret : 1.30794E-05 s/iter 4.320178 +iter : 5 Arret : 1.44771E-05 s/iter 4.314866 +iter : 6 Arret : 1.32861E-05 s/iter 4.322297 +iter : 7 Arret : 1.30094E-05 s/iter 4.320581 +iter : 8 Arret : 1.57289E-05 s/iter 4.321287 +iter : 9 Arret : 3.86451E-05 s/iter 4.320423 +iter : 10 Arret : 0.000543891 s/iter 4.320183 +iter : 11 Arret : 0.00145339 s/iter 4.321120 +iter : 12 Arret : 1.79442 s/iter 4.320944 +iter : 13 Arret : 0.533237 s/iter 4.322201 +iter : 14 Arret : 0.70441 s/iter 5.187062 +iter : 15 Arret : 0.0611495 s/iter 5.169668 +iter : 16 Arret : 0.0229271 s/iter 5.149185 +iter : 17 Arret : 0.0061891 s/iter 4.285429 +iter : 18 Arret : 0.00210453 s/iter 4.282596 +iter : 19 Arret : 0.00109911 s/iter 4.274796 +iter : 20 Arret : 0.000622571 s/iter 4.266318 +iter : 21 Arret : 0.000386564 s/iter 4.270395 +iter : 22 Arret : 0.00170309 s/iter 4.244927 +iter : 23 Arret : 0.00230236 s/iter 4.241676 +iter : 24 Arret : 0.000633673 s/iter 4.246116 +iter : 25 Arret : 0.000558961 s/iter 4.245510 +iter : 26 Arret : 1.46803E-05 s/iter 4.242904 +iter : 27 Arret : 2.13349E-05 s/iter 4.251720 +iter : 28 Arret : 1.08022E-06 s/iter 4.246058 +iter : 29 Arret : 7.30296E-12 s/iter 4.247629 +iter : 30 Arret : 1.11076E-16 s/iter 4.239168 +temps : 131.492 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.64385E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540465 +i* 0.841367| 1| 1.87479E-13 +i*-5.02237E-14| +| 2| 0.176081 +i* -0.984376| 1|-5.37799E-14 +i* 6.92554E-14| +| 3| -0.852009 +i* -0.523527| 1| 3.18461E-14 +i* 4.03913E-14| +| 4| -0.79862 +i* 0.601836| 1| 5.14346E-14 +i* 3.91354E-14| +| 5| 0.980657 +i* -0.195736| 1| 6.46188E-13 +i*-7.37166E-13| +| 6| 0.268452 +i* 0.963293| 1|-8.54421E-14 +i* 3.23248E-14| +| 7| 0.458412 +i* -0.88874| 1| 2.7818E-14 +i* 6.11247E-14| +| 8| -0.659841 +i* -0.751405| 1|-6.41605E-14 +i*-6.23928E-14| +| 9| 0.994783 +i* 0.102018| 1| 6.80962E-13 +i*-1.84925E-12| +| 10| -0.940535 +i* 0.339697| 1| 2.92266E-14 +i* 1.23877E-14| +| 11| -0.0274147 +i* 0.999624| 1|-2.15418E-14 +i* -6.3281E-14| +| 12| 0.70001 +i* -0.714133| 1| 5.4335E-14 +i* -1.5535E-13| +| 13| 0.920515 +i* 0.390707| 1|-2.49037E-13 +i*-1.72111E-13| +| 14| -0.409041 +i* -0.912516| 1|-2.16806E-14 +i*-1.57877E-14| +| 15| -0.998877 +i* 0.047373| 1|-3.52392E-14 +i*-1.99354E-14| +| 16| -0.320845 +i* 0.947132| 1| 1.35437E-13 +i* 4.41019E-14| +| 17| 0.764454 +i* 0.644679| 1|-2.19425E-13 +i* -1.9223E-13| +| 18| 0.879407 +i* -0.47607| 1| 3.13968E-13 +i*-3.31275E-13| +| 19| -0.121864 +i* -0.992547| 1| 1.45647E-13 +i* 1.68268E-16| +| 20| -0.968462 +i* -0.24916| 1| 5.32629E-14 +i* 1.07952E-14| ++---+----------------------------+------------+----------------------------+ +200000 racines de module = 1 +proc 1 +proc 0 +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 1, start 200064 size 200064 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 0, start 0 size 200064 +proc 0 start 0 size 200064 +proc 1 start 200064 size 200064 +iter : 1 Arret : 5.92769E-06 s/iter 17.091881 +iter : 2 Arret : 5.92861E-06 s/iter 17.079067 +iter : 3 Arret : 5.65084E-06 s/iter 17.071253 +iter : 4 Arret : 5.90123E-06 s/iter 17.075667 +iter : 5 Arret : 5.67405E-06 s/iter 17.086203 +iter : 6 Arret : 5.78163E-06 s/iter 17.085519 +iter : 7 Arret : 5.94963E-06 s/iter 17.071917 +iter : 8 Arret : 6.19084E-06 s/iter 17.072228 +iter : 9 Arret : 6.32356E-06 s/iter 17.066944 +iter : 10 Arret : 1.31102E-05 s/iter 17.080496 +iter : 11 Arret : 0.00173232 s/iter 17.074923 +iter : 12 Arret : 0.00543612 s/iter 17.071795 +iter : 13 Arret : 0.0042724 s/iter 17.070175 +iter : 14 Arret : 0.00387295 s/iter 17.065166 +iter : 15 Arret : 0.0699239 s/iter 21.304928 +iter : 16 Arret : 1.07204 s/iter 21.363177 +iter : 17 Arret : 0.838916 s/iter 17.021405 +iter : 18 Arret : 0.628391 s/iter 21.328594 +iter : 19 Arret : 0.10484 s/iter 21.427763 +iter : 20 Arret : 0.052212 s/iter 21.324082 +iter : 21 Arret : 0.0749816 s/iter 21.277334 +iter : 22 Arret : 0.186026 s/iter 21.527592 +iter : 23 Arret : 0.0844323 s/iter 21.678553 +iter : 24 Arret : 0.072278 s/iter 21.297469 +iter : 25 Arret : 0.0465913 s/iter 17.593773 +iter : 26 Arret : 0.124099 s/iter 16.983604 +iter : 27 Arret : 0.199717 s/iter 21.427746 +iter : 28 Arret : 0.0458777 s/iter 20.234226 +iter : 29 Arret : 0.00810233 s/iter 16.830607 +iter : 30 Arret : 0.00802723 s/iter 16.877332 +iter : 31 Arret : 0.000715802 s/iter 16.808412 +iter : 32 Arret : 0.000233133 s/iter 16.830470 +iter : 33 Arret : 3.40438E-05 s/iter 16.843692 +iter : 34 Arret : 1.56366E-05 s/iter 16.804982 +iter : 35 Arret : 8.38478E-06 s/iter 16.844967 +iter : 36 Arret : 5.53343E-07 s/iter 16.824226 +iter : 37 Arret : 4.68738E-10 s/iter 16.832721 +iter : 38 Arret : 5.97873E-16 s/iter 16.861706 +temps : 693.598 seconde(s) +Nb iterations : 38 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.12993E-08 +Stabilite : 5.97873E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540383 +i* 0.841419| 1| 1.25143E-14 +i* 6.97793E-14| +| 2| -0.98885 +i* 0.148913| 1|-1.87034E-13 +i*-1.52024E-13| +| 3| 0.412505 +i* -0.910956| 1|-2.05679E-13 +i* 8.74266E-14| +| 4| 0.268615 +i* -0.963248| 1| 1.23929E-14 +i* 2.02841E-14| +| 5| -0.954531 +i* 0.298113| 1| 6.68562E-14 +i* 8.87016E-14| +| 6| 0.769061 +i* 0.639176| 1|-1.82375E-13 +i* 1.0897E-12| +| 7| 0.11843 +i* -0.992962| 1| -1.5522E-13 +i* 8.29944E-14| +| 8| -0.897838 +i* 0.440326| 1|-2.57121E-14 +i* 6.84192E-14| +| 9| 0.857616 +i* 0.51429| 1|-4.74988E-13 +i*-1.42508E-14| +| 10| -0.0345309 +i* -0.999404| 1| 3.31561E-13 +i*-9.06705E-14| +| 11| 0.662491 +i* 0.74907| 1| 5.75581E-15 +i*-3.34004E-14| +| 12| -0.820101 +i* 0.572218| 1|-4.91863E-14 +i*-2.00555E-13| +| 13| -0.186683 +i* -0.98242| 1| -1.8106E-13 +i* 3.61083E-14| +| 14| 0.9261 +i* 0.377277| 1|-4.84647E-14 +i*-1.93776E-13| +| 15| -0.723143 +i* 0.690699| 1|-1.75058E-13 +i* 1.33799E-14| +| 16| -0.334459 +i* -0.94241| 1| 2.20716E-13 +i*-8.68958E-14| +| 17| 0.972834 +i* 0.231505| 1| 3.9433E-13 +i*-1.27901E-14| +| 18| -0.609235 +i* 0.79299| 1|-8.90538E-14 +i* 1.42372E-13| +| 19| -0.474396 +i* -0.880312| 1| 2.76109E-13 +i* 7.19095E-14| +| 20| 0.99677 +i* 0.0803066| 1| 1.32664E-12 +i*-5.68624E-12| ++---+----------------------------+------------+----------------------------+ +400000 racines de module = 1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 1, start 300032 size 300032 +proc 1 start 300032 size 300032 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 300032 +proc 0 start 0 size 300032 +iter : 1 Arret : 4.69807E-06 s/iter 37.173976 +iter : 2 Arret : 5.03632E-06 s/iter 37.197736 +iter : 3 Arret : 4.52279E-06 s/iter 37.204045 +iter : 4 Arret : 4.45961E-06 s/iter 37.182431 +iter : 5 Arret : 4.70176E-06 s/iter 37.202778 +iter : 6 Arret : 4.16249E-06 s/iter 37.226442 +iter : 7 Arret : 4.44064E-06 s/iter 37.196239 +iter : 8 Arret : 4.86579E-06 s/iter 37.186716 +iter : 9 Arret : 5.22739E-06 s/iter 37.197811 +iter : 10 Arret : 3.13209E-05 s/iter 37.209556 +iter : 11 Arret : 0.000592076 s/iter 37.205383 +iter : 12 Arret : 0.000623857 s/iter 37.198123 +iter : 13 Arret : 1.78387 s/iter 37.207116 +iter : 14 Arret : 0.0628737 s/iter 41.602455 +iter : 15 Arret : 0.0454104 s/iter 42.064364 +iter : 16 Arret : 0.0306142 s/iter 37.146438 +iter : 17 Arret : 0.0187871 s/iter 40.174276 +iter : 18 Arret : 0.0120648 s/iter 37.140989 +iter : 19 Arret : 0.00826764 s/iter 37.218162 +iter : 20 Arret : 0.00721269 s/iter 43.538072 +iter : 21 Arret : 0.0049902 s/iter 42.294953 +iter : 22 Arret : 0.00681901 s/iter 36.981513 +iter : 23 Arret : 0.0226017 s/iter 44.791326 +iter : 24 Arret : 0.0423507 s/iter 44.356512 +iter : 25 Arret : 0.12069 s/iter 37.294818 +iter : 26 Arret : 0.0692912 s/iter 37.644635 +iter : 27 Arret : 0.0896514 s/iter 43.861766 +iter : 28 Arret : 0.00897008 s/iter 37.216239 +iter : 29 Arret : 0.00654192 s/iter 37.294418 +iter : 30 Arret : 0.00766928 s/iter 37.138645 +iter : 31 Arret : 0.0038097 s/iter 37.374897 +iter : 32 Arret : 0.00660869 s/iter 37.307820 +iter : 33 Arret : 0.00728531 s/iter 37.253897 +iter : 34 Arret : 0.00359169 s/iter 37.200093 +iter : 35 Arret : 0.00382107 s/iter 37.112699 +iter : 36 Arret : 0.00265225 s/iter 36.946149 +iter : 37 Arret : 0.000747329 s/iter 37.000942 +iter : 38 Arret : 0.000401385 s/iter 37.146111 +iter : 39 Arret : 0.000340744 s/iter 36.948884 +iter : 40 Arret : 0.000615944 s/iter 36.982747 +iter : 41 Arret : 0.000873228 s/iter 37.007010 +iter : 42 Arret : 5.51285E-05 s/iter 37.158816 +iter : 43 Arret : 2.43301E-05 s/iter 36.996671 +iter : 44 Arret : 1.56734E-05 s/iter 37.039054 +iter : 45 Arret : 3.51799E-06 s/iter 37.021331 +iter : 46 Arret : 3.01666E-08 s/iter 36.946668 +iter : 47 Arret : 1.00879E-13 s/iter 36.974289 +temps : 1792.33 seconde(s) +Nb iterations : 47 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.996672 +i* 0.0815122| 1|-4.60361E-14 +i*-1.54911E-15| +| 3| 0.396458 +i* -0.918053| 1|-3.61742E-13 +i* 4.28426E-13| +| 4| -0.983009 +i* 0.183558| 1| 2.27839E-14 +i* 1.21547E-13| +| 5| 0.299962 +i* -0.953951| 1| 3.10155E-13 +i*-4.52272E-13| +| 6| 0.701062 +i* 0.7131| 1| 6.08482E-13 +i* 3.68603E-13| +| 7| -0.958925 +i* 0.283658| 1|-3.43857E-14 +i*-4.33108E-14| +| 8| 0.200287 +i* -0.979737| 1| 4.39829E-13 +i*-3.61119E-13| +| 9| 0.770667 +i* 0.637238| 1| -2.7036E-13 +i*-8.38747E-13| +| 10| -0.924677 +i* 0.380752| 1| 1.44957E-13 +i* 1.13251E-13| +| 11| 0.0984885 +i* -0.995138| 1| 3.5235E-13 +i*-2.31698E-13| +| 12| 0.832104 +i* 0.55462| 1| 8.49546E-13 +i* -8.3842E-13| +| 13| -0.880627 +i* 0.473809| 1|-9.58227E-14 +i* -1.6529E-13| +| 14| -0.0043537 +i* -0.999991| 1| 1.63446E-13 +i*-5.45449E-14| +| 15| 0.88472 +i* 0.466123| 1| -6.8268E-13 +i* -3.8889E-13| +| 16| 0.624025 +i* 0.781404| 1| 9.47506E-15 +i*-6.78554E-13| +| 17| -0.827243 +i* 0.561844| 1|-1.79082E-13 +i*-3.05719E-13| +| 18| -0.10715 +i* -0.994243| 1| 3.32474E-13 +i*-4.57395E-14| +| 19| 0.927958 +i* 0.372686| 1| 1.0255E-13 +i* 1.0692E-13| +| 20| -0.765083 +i* 0.643932| 1| 3.06144E-14 +i*-3.59443E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 1, start 400000 size 400000 +proc 1 start 400000 size 400000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 400000 +proc 0 start 0 size 400000 +iter : 1 Arret : 2.99198E-06 s/iter 66.413211 +iter : 2 Arret : 2.96778E-06 s/iter 66.392956 +iter : 3 Arret : 3.00937E-06 s/iter 66.339632 +iter : 4 Arret : 2.97226E-06 s/iter 66.349986 +iter : 5 Arret : 2.96286E-06 s/iter 66.378994 +iter : 6 Arret : 2.87376E-06 s/iter 66.345904 +iter : 7 Arret : 2.97178E-06 s/iter 66.395986 +iter : 8 Arret : 3.18041E-06 s/iter 66.374924 +iter : 9 Arret : 3.76916E-06 s/iter 66.312303 +iter : 10 Arret : 6.64281E-06 s/iter 66.353184 +iter : 11 Arret : 0.000184944 s/iter 66.327534 +iter : 12 Arret : 0.00113193 s/iter 66.326579 +iter : 13 Arret : 0.756784 s/iter 66.399690 +iter : 14 Arret : 0.953926 s/iter 66.384267 +iter : 15 Arret : 2.42788 s/iter 75.196469 +iter : 16 Arret : 0.0380351 s/iter 66.146967 +iter : 17 Arret : 0.00135087 s/iter 65.963185 +iter : 18 Arret : 0.00163803 s/iter 65.845992 +iter : 19 Arret : 0.00428499 s/iter 65.903836 +iter : 20 Arret : 0.0038067 s/iter 73.688871 +iter : 21 Arret : 0.000657342 s/iter 68.105543 +iter : 22 Arret : 0.000335199 s/iter 65.711333 +iter : 23 Arret : 0.000193741 s/iter 65.724966 +iter : 24 Arret : 0.000965407 s/iter 65.748314 +iter : 25 Arret : 0.000199254 s/iter 65.737120 +iter : 26 Arret : 4.1099E-05 s/iter 65.758689 +iter : 27 Arret : 1.24027E-05 s/iter 65.752451 +iter : 28 Arret : 3.05369E-06 s/iter 65.731804 +iter : 29 Arret : 1.17116E-07 s/iter 65.757803 +iter : 30 Arret : 2.27328E-11 s/iter 65.725830 +iter : 31 Arret : 1.57009E-16 s/iter 65.718433 +temps : 2067.97 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| -0.942555 +i* -0.334052| 1| 2.1929E-13 +i*-2.49686E-13| +| 3| -0.558601 +i* 0.829437| 1|-3.51628E-14 +i*-4.09232E-13| +| 4| -0.0665975 +i* -0.99778| 1|-3.91888E-13 +i* 9.06636E-14| +| 5| 0.949627 +i* -0.313383| 1|-1.12544E-12 +i* 2.13597E-12| +| 6| -0.982853 +i* -0.184391| 1| 8.57613E-14 +i* 1.33506E-13| +| 7| 0.889798 +i* -0.456354| 1| 1.27488E-12 +i* 5.17779E-13| +| 8| -0.423729 +i* 0.905789| 1|-7.25461E-15 +i*-1.33088E-14| +| 9| -0.219973 +i* -0.975506| 1| 4.34097E-13 +i*-4.24712E-14| +| 10| 0.771464 +i* 0.636273| 1| -4.4266E-13 +i*-2.07773E-13| +| 11| -0.999541 +i* -0.0303078| 1| 3.54265E-14 +i* 1.32862E-14| +| 12| 0.808597 +i* -0.588363| 1|-5.90212E-13 +i*-1.43182E-12| +| 13| 0.663883 +i* 0.747836| 1| 4.13159E-13 +i* 1.10149E-12| +| 14| -0.27868 +i* 0.960384| 1|-1.03539E-13 +i*-1.45998E-13| +| 15| -0.368064 +i* -0.929801| 1| 4.60916E-14 +i*-1.09841E-13| +| 16| -0.992219 +i* 0.124503| 1| 2.74294E-13 +i* 2.11383E-13| +| 17| 0.707973 +i* -0.706239| 1|-1.10575E-12 +i*-7.41631E-13| +| 18| 0.860514 +i* 0.509426| 1| 9.86579E-13 +i* 1.10532E-12| +| 19| -0.126936 +i* 0.991911| 1| 1.67744E-13 +i* 5.51772E-13| +| 20| -0.507314 +i* -0.861761| 1| 5.50185E-14 +i* 3.42273E-13| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 1, start 500096 size 500096 +proc 1 start 500096 size 500096 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 0, start 0 size 500096 +proc 0 start 0 size 500096 +iter : 1 Arret : 2.67114E-06 s/iter 102.819162 +iter : 2 Arret : 2.95315E-06 s/iter 102.252390 +iter : 3 Arret : 2.95969E-06 s/iter 102.326420 +iter : 4 Arret : 2.88779E-06 s/iter 102.301752 +iter : 5 Arret : 2.5581E-06 s/iter 102.372224 +iter : 6 Arret : 2.45683E-06 s/iter 102.364442 +iter : 7 Arret : 2.82722E-06 s/iter 102.364753 +iter : 8 Arret : 2.82432E-06 s/iter 102.261531 +iter : 9 Arret : 2.83699E-06 s/iter 102.313325 +iter : 10 Arret : 4.13032E-06 s/iter 102.332750 +iter : 11 Arret : 2.98919E-05 s/iter 102.321802 +iter : 12 Arret : 0.00010546 s/iter 102.183593 +iter : 13 Arret : 0.000196723 s/iter 102.213055 +iter : 14 Arret : 0.0866546 s/iter 102.220017 +iter : 15 Arret : 1.30889 s/iter 105.826907 +iter : 16 Arret : 0.252188 s/iter 104.637764 +iter : 17 Arret : 0.0921487 s/iter 105.496435 +iter : 18 Arret : 0.0494945 s/iter 105.312989 +iter : 19 Arret : 0.0729582 s/iter 114.285097 +iter : 20 Arret : 0.0422052 s/iter 116.523673 +iter : 21 Arret : 0.0595401 s/iter 114.447696 +iter : 22 Arret : 0.162804 s/iter 118.042214 +iter : 23 Arret : 0.649592 s/iter 117.511534 +iter : 24 Arret : 2.08783 s/iter 117.356798 +iter : 25 Arret : 0.139314 s/iter 116.842982 +iter : 26 Arret : 0.0404474 s/iter 103.939125 +iter : 27 Arret : 0.00407747 s/iter 115.878294 +iter : 28 Arret : 0.00207881 s/iter 103.573382 +iter : 29 Arret : 0.00103713 s/iter 116.131131 +iter : 30 Arret : 0.00321163 s/iter 116.112791 +iter : 31 Arret : 0.00537381 s/iter 103.809744 +iter : 32 Arret : 0.00145604 s/iter 116.197046 +iter : 33 Arret : 0.000282152 s/iter 103.606134 +iter : 34 Arret : 4.69677E-05 s/iter 103.606208 +iter : 35 Arret : 5.60351E-05 s/iter 103.499492 +iter : 36 Arret : 4.0077E-05 s/iter 103.645810 +iter : 37 Arret : 0.000111497 s/iter 103.598334 +iter : 38 Arret : 0.000135537 s/iter 103.560749 +iter : 39 Arret : 1.34079E-05 s/iter 103.613093 +iter : 40 Arret : 5.51686E-06 s/iter 103.871715 +iter : 41 Arret : 5.82845E-08 s/iter 103.484481 +iter : 42 Arret : 4.86438E-13 s/iter 103.585562 +temps : 4481.5 seconde(s) +Nb iterations : 42 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.80136E-07 +Stabilite : 4.86438E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54034 +i* 0.841447| 1| 4.08253E-13 +i*-6.65317E-13| +| 2| -0.513915 +i* -0.857841| 1|-9.07486E-13 +i* 1.86417E-13| +| 3| 0.486982 +i* 0.873412| 1|-6.63601E-14 +i*-1.18344E-12| +| 4| -0.459589 +i* -0.888132| 1|-5.16153E-13 +i*-2.68006E-13| +| 5| 0.43174 +i* 0.901998| 1|-6.77361E-13 +i* 7.93272E-13| +| 6| -0.403485 +i* -0.914986| 1|-3.20004E-13 +i* 2.65225E-13| +| 7| 0.374828 +i* 0.927094| 1| 3.65041E-13 +i* 3.54812E-13| +| 8| -0.345815 +i* -0.938303| 1| 5.50778E-13 +i* 8.9059E-14| +| 9| 0.316466 +i* 0.948604| 1|-2.87419E-13 +i* 5.21678E-13| +| 10| -0.286812 +i* -0.957987| 1| 6.43516E-13 +i* 2.73696E-13| +| 11| 0.25688 +i* 0.966443| 1|-4.31814E-13 +i* 5.6624E-13| +| 12| -0.226699 +i* -0.973965| 1| 4.35089E-13 +i* -6.6197E-14| +| 13| 0.196299 +i* 0.980544| 1| 3.90278E-14 +i*-7.14062E-13| +| 14| -0.16571 +i* -0.986175| 1| 2.49276E-13 +i*-1.75918E-13| +| 15| 0.13496 +i* 0.990851| 1| 1.03566E-13 +i*-6.61428E-13| +| 16| -0.104079 +i* -0.994569| 1| 7.90108E-13 +i*-1.74942E-13| +| 17| 0.0730977 +i* 0.997325| 1| 1.11931E-13 +i* 4.68587E-13| +| 18| -0.0420456 +i* -0.999116| 1| 2.29268E-13 +i*-1.21795E-14| +| 19| 0.0109529 +i* 0.99994| 1|-2.47309E-13 +i*-7.90307E-13| +| 20| 0.0201504 +i* -0.999797| 1| 6.69503E-13 +i*-2.16847E-13| ++---+----------------------------+------------+----------------------------+ +1000000 racines de module = 1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.0003 +zone limite de 'log-exp' 1.0003 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 1, start 600064 size 600064 +proc 1 start 600064 size 600064 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 0, start 0 size 600064 +proc 0 start 0 size 600064 +iter : 1 Arret : 2.32004E-06 s/iter 147.703091 +iter : 2 Arret : 2.41214E-06 s/iter 147.409302 +iter : 3 Arret : 2.18674E-06 s/iter 147.497496 +iter : 4 Arret : 2.29706E-06 s/iter 147.538618 +iter : 5 Arret : 2.29919E-06 s/iter 147.526595 +iter : 6 Arret : 2.25616E-06 s/iter 147.463773 +iter : 7 Arret : 2.32928E-06 s/iter 147.468515 +iter : 8 Arret : 2.10724E-06 s/iter 147.496893 +iter : 9 Arret : 2.29426E-06 s/iter 147.454209 +iter : 10 Arret : 2.67582E-06 s/iter 147.514097 +iter : 11 Arret : 8.24755E-05 s/iter 147.502532 +iter : 12 Arret : 0.00054508 s/iter 147.464990 +iter : 13 Arret : 0.00120005 s/iter 147.846365 +iter : 14 Arret : 0.00114159 s/iter 147.880756 +iter : 15 Arret : 0.00131473 s/iter 163.989918 +iter : 16 Arret : 3.03972 s/iter 159.348073 +iter : 17 Arret : 0.889441 s/iter 164.805690 +iter : 18 Arret : 0.728527 s/iter 163.890706 +iter : 19 Arret : 0.0284674 s/iter 166.182627 +iter : 20 Arret : 0.062266 s/iter 165.979919 +iter : 21 Arret : 0.234486 s/iter 165.737189 +iter : 22 Arret : 0.176675 s/iter 166.748944 +iter : 23 Arret : 0.0331294 s/iter 160.311184 +iter : 24 Arret : 0.0989117 s/iter 166.807740 +iter : 25 Arret : 0.0610064 s/iter 163.279540 +iter : 26 Arret : 0.194465 s/iter 165.941854 +iter : 27 Arret : 0.107536 s/iter 161.639438 +iter : 28 Arret : 0.0807225 s/iter 162.357391 +iter : 29 Arret : 0.0218584 s/iter 147.466888 +iter : 30 Arret : 0.0691534 s/iter 147.403771 +iter : 31 Arret : 0.0561441 s/iter 147.311133 +iter : 32 Arret : 0.00353269 s/iter 147.289484 +iter : 33 Arret : 0.000572685 s/iter 147.319084 +iter : 34 Arret : 0.000175169 s/iter 147.322464 +iter : 35 Arret : 7.25501E-05 s/iter 147.086067 +iter : 36 Arret : 8.75366E-06 s/iter 147.379819 +iter : 37 Arret : 2.60684E-06 s/iter 147.344248 +iter : 38 Arret : 2.17689E-07 s/iter 147.346281 +iter : 39 Arret : 3.28086E-10 s/iter 147.331241 +iter : 40 Arret : 3.14018E-16 s/iter 147.328046 +temps : 6131.73 seconde(s) +Nb iterations : 40 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.34152E-07 +Stabilite : 3.14018E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.841451| 1|-1.40868E-12 +i*-1.55069E-13| +| 2| -0.583871 +i* 0.811846| 1| 5.87586E-14 +i* 2.63177E-13| +| 3| 0.0263196 +i* -0.999654| 1| 9.89594E-13 +i*-3.85265E-13| +| 4| -0.969647 +i* -0.244511| 1|-5.84047E-14 +i*-6.69829E-14| +| 5| 0.939323 +i* -0.343035| 1| 7.60725E-13 +i* 1.68227E-12| +| 6| -0.129097 +i* -0.991632| 1| -2.278E-13 +i*-2.09967E-13| +| 7| -0.450842 +i* 0.892604| 1| 3.34819E-13 +i* 5.30987E-13| +| 8| 0.874726 +i* -0.484618| 1| 6.94573E-13 +i* 1.33379E-12| +| 9| -0.995841 +i* -0.0911079| 1| 6.65572E-13 +i* 2.21578E-13| +| 10| 0.772266 +i* 0.635299| 1|-1.10511E-12 +i*-6.88458E-13| +| 11| -0.281387 +i* -0.959594| 1|-6.93022E-14 +i* 4.40275E-13| +| 12| -0.306893 +i* 0.951744| 1| 1.0443E-15 +i* 1.24753E-13| +| 13| 0.788944 +i* -0.614465| 1| -2.2269E-12 +i*-9.13604E-13| +| 14| -0.997918 +i* 0.0645018| 1| 2.81913E-13 +i* 2.2426E-13| +| 15| 0.861482 +i* 0.507788| 1| 2.41178E-12 +i* 5.79845E-13| +| 16| -0.426862 +i* -0.904317| 1| 6.20323E-13 +i* 5.74424E-13| +| 17| 0.664347 +i* 0.747424| 1| 4.99219E-13 +i* 1.52752E-12| +| 18| -0.155512 +i* 0.987834| 1| 2.30305E-13 +i* 4.37822E-13| +| 19| -0.975826 +i* 0.218549| 1| 1.82913E-13 +i* 5.28258E-14| +| 20| 0.684055 +i* -0.72943| 1|-1.32506E-12 +i*-1.70394E-12| ++---+----------------------------+------------+----------------------------+ +1200000 racines de module = 1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00025 +zone limite de 'log-exp' 1.00025 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 0, start 0 size 700032 +proc 0 start 0 size 700032 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 1, start 700032 size 700032 +proc 1 start 700032 size 700032 +iter : 1 Arret : 1.71503E-06 s/iter 201.302757 +iter : 2 Arret : 2.08877E-06 s/iter 201.236342 +iter : 3 Arret : 1.80367E-06 s/iter 201.159959 +iter : 4 Arret : 1.72863E-06 s/iter 200.629208 +iter : 5 Arret : 2.02585E-06 s/iter 200.910093 +iter : 6 Arret : 1.75888E-06 s/iter 201.365208 +iter : 7 Arret : 1.76501E-06 s/iter 200.487957 +iter : 8 Arret : 1.72307E-06 s/iter 200.934009 +iter : 9 Arret : 1.76155E-06 s/iter 201.213512 +iter : 10 Arret : 2.12943E-06 s/iter 200.659277 +iter : 11 Arret : 3.32069E-05 s/iter 201.152277 +iter : 12 Arret : 0.000536706 s/iter 200.822344 +iter : 13 Arret : 0.00427681 s/iter 201.483572 +iter : 14 Arret : 0.00530359 s/iter 201.400972 +iter : 15 Arret : 0.0021808 s/iter 205.001900 +iter : 16 Arret : 0.00140702 s/iter 201.467662 +iter : 17 Arret : 0.00456042 s/iter 200.335860 +iter : 18 Arret : 0.00329506 s/iter 214.967030 +iter : 19 Arret : 0.00401452 s/iter 215.162153 +iter : 20 Arret : 0.0282907 s/iter 213.064879 +iter : 21 Arret : 0.554695 s/iter 200.569211 +iter : 22 Arret : 0.113844 s/iter 211.670465 +iter : 23 Arret : 0.0880466 s/iter 200.889715 +iter : 24 Arret : 0.00814891 s/iter 201.083685 +iter : 25 Arret : 0.00200474 s/iter 202.183564 +iter : 26 Arret : 0.00211039 s/iter 200.462930 +iter : 27 Arret : 0.0122898 s/iter 200.464215 +iter : 28 Arret : 0.0143102 s/iter 200.195416 +iter : 29 Arret : 0.000201512 s/iter 199.914634 +iter : 30 Arret : 2.5176E-08 s/iter 199.896196 +iter : 31 Arret : 1.06587E-14 s/iter 200.075278 +temps : 6283.33 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.63785E-07 +Stabilite : 1.06587E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540329 +i* 0.841454| 1| 4.3987E-13 +i* 1.7418E-12| +| 2| -0.0530086 +i* 0.998594| 1| 3.8728E-13 +i* 8.41422E-13| +| 3| -0.626376 +i* 0.779521| 1| 2.93654E-14 +i*-2.95439E-13| +| 4| -0.96376 +i* 0.26677| 1|-1.31943E-13 +i* 5.03167E-13| +| 5| -0.938055 +i* -0.346485| 1| 6.12451E-13 +i*-2.34033E-13| +| 6| -0.558945 +i* -0.829205| 1| 2.12923E-13 +i* 6.04209E-13| +| 7| 0.0307435 +i* -0.999527| 1|-3.70079E-13 +i* 1.04685E-13| +| 8| 0.60885 +i* -0.793286| 1| -1.5142E-12 +i* 2.45191E-13| +| 9| 0.957578 +i* -0.288175| 1|-3.17266E-12 +i* 2.02057E-12| +| 10| 0.945542 +i* 0.325501| 1|-1.50276E-12 +i* 3.84538E-13| +| 11| -0.00847209 +i* 0.999964| 1| 8.68958E-14 +i* 2.94643E-13| +| 12| -0.591029 +i* 0.80665| 1|-5.75824E-14 +i*-8.87086E-13| +| 13| -0.95092 +i* 0.309437| 1|-6.93591E-13 +i*-5.52411E-13| +| 14| -0.952559 +i* -0.304354| 1|-3.04982E-13 +i* 1.60452E-13| +| 15| -0.595328 +i* -0.803482| 1|-1.05039E-12 +i* 2.37501E-13| +| 16| -0.0138125 +i* -0.999905| 1|-8.72476E-13 +i* 2.69644E-13| +| 17| 0.572907 +i* -0.81962| 1| 1.32405E-12 +i*-6.73803E-13| +| 18| 0.94379 +i* -0.330546| 1|-1.85401E-12 +i* 2.58533E-12| +| 19| 0.959103 +i* 0.283057| 1|-2.75633E-12 +i* 3.49955E-12| +| 20| 0.613081 +i* 0.79002| 1| 4.49453E-13 +i*-4.47541E-14| ++---+----------------------------+------------+----------------------------+ +1400000 racines de module = 1 diff --git a/Simulations/full_mpi_bis/full_mpi_3GPU.o140349 b/Simulations/full_mpi_bis/full_mpi_3GPU.o140349 new file mode 100644 index 0000000..30aa16b --- /dev/null +++ b/Simulations/full_mpi_bis/full_mpi_3GPU.o140349 @@ -0,0 +1,720 @@ +REMAINING: 3 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +proc 0 +proc 1 +proc 2 +zone limite de 'log-exp' 1.00356 +zone limite de 'log-exp' 1.00356 +zone limite de 'log-exp' 1.00356 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 2, start 66730 size 33365 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 1, start 33365 size 33365 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 0, start 0 size 33365 +proc 0 start 0 size 33365 +proc 2 start 66730 size 33365 +proc 1 start 33365 size 33365 +iter : 1 Arret : 2.36932E-05 s/iter 0.912595 +iter : 2 Arret : 2.25678E-05 s/iter 0.909870 +iter : 3 Arret : 2.27127E-05 s/iter 0.910905 +iter : 4 Arret : 2.30448E-05 s/iter 0.911916 +iter : 5 Arret : 2.36504E-05 s/iter 0.911890 +iter : 6 Arret : 2.48395E-05 s/iter 0.912035 +iter : 7 Arret : 2.76062E-05 s/iter 0.911594 +iter : 8 Arret : 3.59956E-05 s/iter 0.911731 +iter : 9 Arret : 0.000409875 s/iter 0.912179 +iter : 10 Arret : 0.000461544 s/iter 0.912231 +iter : 11 Arret : 0.00158737 s/iter 0.912026 +iter : 12 Arret : 0.247612 s/iter 0.912226 +iter : 13 Arret : 1.46428 s/iter 2.005755 +iter : 14 Arret : 0.0428271 s/iter 1.994579 +iter : 15 Arret : 0.0404634 s/iter 2.019498 +iter : 16 Arret : 0.011376 s/iter 2.014857 +iter : 17 Arret : 0.00573682 s/iter 1.968383 +iter : 18 Arret : 0.003628 s/iter 1.952685 +iter : 19 Arret : 0.0150183 s/iter 1.947536 +iter : 20 Arret : 0.0215975 s/iter 1.958206 +iter : 21 Arret : 0.0144709 s/iter 1.928139 +iter : 22 Arret : 0.00509184 s/iter 1.923413 +iter : 23 Arret : 0.00288936 s/iter 1.930780 +iter : 24 Arret : 0.00750083 s/iter 1.637255 +iter : 25 Arret : 0.0165955 s/iter 1.635785 +iter : 26 Arret : 0.00632453 s/iter 0.603414 +iter : 27 Arret : 0.000946387 s/iter 0.600817 +iter : 28 Arret : 0.00086876 s/iter 0.603653 +iter : 29 Arret : 0.000774268 s/iter 0.600645 +iter : 30 Arret : 0.000140958 s/iter 0.603676 +iter : 31 Arret : 5.59454E-05 s/iter 0.600412 +iter : 32 Arret : 1.74974E-05 s/iter 0.603616 +iter : 33 Arret : 2.92221E-06 s/iter 0.599461 +iter : 34 Arret : 3.73024E-09 s/iter 0.600284 +iter : 35 Arret : 5.53272E-14 s/iter 0.600305 +temps : 42.0352 seconde(s) +Nb iterations : 35 +Nb de depassements de capacite exponentielle : 0 +Precision : 8.34887E-10 +Stabilite : 5.53272E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540601 +i* 0.841279| 1| -4.3885E-14 +i*-7.30839E-15| +| 2| -0.281748 +i* -0.959489| 1|-5.73395E-14 +i*-4.24574E-14| +| 3|-4.71234E-05 +i* 1| 1| 8.60423E-16 +i* 1.94116E-15| +| 4| 0.281778 +i* -0.95948| 1|-1.23963E-14 +i* 1.02314E-14| +| 5| -0.54068 +i* 0.841228| 1| 5.53932E-14 +i*-7.48533E-15| +| 6| 0.75578 +i* -0.654825| 1|-1.78253E-13 +i* 5.35631E-14| +| 7| -0.909652 +i* 0.415372| 1|-2.24577E-14 +i*-2.99309E-14| +| 8| 0.989828 +i* -0.142268| 1|-4.88647E-13 +i* 2.69096E-13| +| 9| -0.989815 +i* -0.142361| 1| 4.10505E-14 +i* 1.22957E-14| +| 10| 0.909612 +i* 0.415458| 1|-9.85774E-14 +i* 2.25852E-13| +| 11| -0.755719 +i* -0.654896| 1|-4.50195E-14 +i* 3.70867E-14| +| 12| 0.540548 +i* 0.841313| 1| 1.15279E-13 +i*-6.26114E-14| +| 13| -0.281687 +i* -0.959506| 1| 6.72067E-14 +i*-1.86153E-14| +| 14|-0.000109955 +i* 1| 1| 1.76109E-14 +i* 5.4734E-14| +| 15| 0.281838 +i* -0.959462| 1|-5.44356E-14 +i* 4.87822E-14| +| 16| -0.540733 +i* 0.841194| 1| 1.93526E-14 +i* 3.41446E-14| +| 17| 0.755822 +i* -0.654778| 1| 1.41439E-13 +i* 1.77344E-13| +| 18| -0.909678 +i* 0.415315| 1| 3.90799E-14 +i* 2.50217E-14| +| 19| 0.989837 +i* -0.142206| 1| 1.87558E-13 +i*-4.17969E-13| +| 20| -0.989806 +i* -0.142424| 1|-4.45512E-14 +i*-1.49828E-14| ++---+----------------------------+------------+----------------------------+ +100000 racines de module = 1 +proc 2 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00178 +zone limite de 'log-exp' 1.00178 +zone limite de 'log-exp' 1.00178 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 1, start 66730 size 66730 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 2, start 133460 size 66730 +proc 2 start 133460 size 66730 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 0, start 0 size 66730 +proc 0 start 0 size 66730 +proc 1 start 66730 size 66730 +iter : 1 Arret : 1.44509E-05 s/iter 3.056522 +iter : 2 Arret : 1.25749E-05 s/iter 3.056221 +iter : 3 Arret : 1.19709E-05 s/iter 3.057224 +iter : 4 Arret : 1.30543E-05 s/iter 3.056335 +iter : 5 Arret : 1.1608E-05 s/iter 3.059617 +iter : 6 Arret : 1.22313E-05 s/iter 3.055644 +iter : 7 Arret : 1.30346E-05 s/iter 3.056063 +iter : 8 Arret : 1.56192E-05 s/iter 3.055124 +iter : 9 Arret : 6.68978E-05 s/iter 3.056442 +iter : 10 Arret : 0.000611118 s/iter 3.055986 +iter : 11 Arret : 0.00182592 s/iter 3.056033 +iter : 12 Arret : 1.45412 s/iter 3.055856 +iter : 13 Arret : 0.246956 s/iter 5.884261 +iter : 14 Arret : 0.0936304 s/iter 5.835022 +iter : 15 Arret : 0.0431016 s/iter 5.831153 +iter : 16 Arret : 0.00010426 s/iter 3.040880 +iter : 17 Arret : 0.000256513 s/iter 3.053460 +iter : 18 Arret : 0.00035685 s/iter 3.052776 +iter : 19 Arret : 0.000601826 s/iter 3.053361 +iter : 20 Arret : 0.000107673 s/iter 3.045606 +iter : 21 Arret : 0.000214887 s/iter 3.025303 +iter : 22 Arret : 0.000475078 s/iter 3.016260 +iter : 23 Arret : 8.34148E-05 s/iter 3.018181 +iter : 24 Arret : 5.40535E-05 s/iter 3.018212 +iter : 25 Arret : 0.000430829 s/iter 3.020718 +iter : 26 Arret : 0.000304356 s/iter 3.012919 +iter : 27 Arret : 1.88367E-07 s/iter 3.013620 +iter : 28 Arret : 1.68394E-12 s/iter 3.013730 +iter : 29 Arret : 1.11076E-16 s/iter 3.025222 +temps : 96.864 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.64385E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540465 +i* 0.841367| 1| 1.87479E-13 +i*-5.02237E-14| +| 2| 0.176081 +i* -0.984376| 1|-5.37799E-14 +i* 6.92554E-14| +| 3| -0.852009 +i* -0.523527| 1| 3.18461E-14 +i* 4.03913E-14| +| 4| -0.79862 +i* 0.601836| 1| 5.14346E-14 +i* 3.91354E-14| +| 5| 0.980657 +i* -0.195736| 1| 6.46188E-13 +i*-7.37166E-13| +| 6| 0.268452 +i* 0.963293| 1|-8.54421E-14 +i* 3.23248E-14| +| 7| 0.458412 +i* -0.88874| 1| 2.7818E-14 +i* 6.11247E-14| +| 8| -0.659841 +i* -0.751405| 1|-6.41605E-14 +i*-6.23928E-14| +| 9| 0.994783 +i* 0.102018| 1| 6.80962E-13 +i*-1.84925E-12| +| 10| -0.940535 +i* 0.339697| 1| 2.92266E-14 +i* 1.23877E-14| +| 11| -0.0274147 +i* 0.999624| 1|-2.15418E-14 +i* -6.3281E-14| +| 12| 0.70001 +i* -0.714133| 1| 5.4335E-14 +i* -1.5535E-13| +| 13| 0.920515 +i* 0.390707| 1|-2.49037E-13 +i*-1.72111E-13| +| 14| -0.409041 +i* -0.912516| 1|-2.16806E-14 +i*-1.57877E-14| +| 15| -0.998877 +i* 0.047373| 1|-3.52392E-14 +i*-1.99354E-14| +| 16| -0.320845 +i* 0.947132| 1| 1.35437E-13 +i* 4.41019E-14| +| 17| 0.764454 +i* 0.644679| 1|-2.19425E-13 +i* -1.9223E-13| +| 18| 0.879407 +i* -0.47607| 1| 3.13968E-13 +i*-3.31275E-13| +| 19| -0.121864 +i* -0.992547| 1| 1.45647E-13 +i* 1.68268E-16| +| 20| -0.968462 +i* -0.24916| 1| 5.32629E-14 +i* 1.07952E-14| ++---+----------------------------+------------+----------------------------+ +200000 racines de module = 1 +proc 2 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 1, start 133376 size 133376 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 2, start 266752 size 133376 +proc 2 start 266752 size 133376 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 0, start 0 size 133376 +proc 0 start 0 size 133376 +proc 1 start 133376 size 133376 +iter : 1 Arret : 5.94905E-06 s/iter 11.257002 +iter : 2 Arret : 5.92558E-06 s/iter 11.204605 +iter : 3 Arret : 5.93122E-06 s/iter 11.166970 +iter : 4 Arret : 5.81174E-06 s/iter 11.168481 +iter : 5 Arret : 5.84437E-06 s/iter 11.165503 +iter : 6 Arret : 5.79144E-06 s/iter 11.168625 +iter : 7 Arret : 6.02557E-06 s/iter 11.167508 +iter : 8 Arret : 6.18739E-06 s/iter 11.162197 +iter : 9 Arret : 6.32181E-06 s/iter 11.169666 +iter : 10 Arret : 1.42434E-05 s/iter 11.158620 +iter : 11 Arret : 0.00172969 s/iter 11.161216 +iter : 12 Arret : 0.00557729 s/iter 13.454871 +iter : 13 Arret : 0.00434213 s/iter 11.157652 +iter : 14 Arret : 0.0314963 s/iter 11.162740 +iter : 15 Arret : 1.27983 s/iter 12.035655 +iter : 16 Arret : 1.95018 s/iter 12.012789 +iter : 17 Arret : 0.184317 s/iter 11.160210 +iter : 18 Arret : 0.412458 s/iter 14.538525 +iter : 19 Arret : 0.0528625 s/iter 15.550555 +iter : 20 Arret : 0.0340417 s/iter 15.411354 +iter : 21 Arret : 0.0239426 s/iter 14.493841 +iter : 22 Arret : 0.0142968 s/iter 16.200717 +iter : 23 Arret : 0.0287953 s/iter 16.378609 +iter : 24 Arret : 0.0216321 s/iter 16.406179 +iter : 25 Arret : 1.56829 s/iter 15.574619 +iter : 26 Arret : 0.528381 s/iter 16.233114 +iter : 27 Arret : 0.161933 s/iter 15.567062 +iter : 28 Arret : 0.0623358 s/iter 11.834575 +iter : 29 Arret : 0.0572874 s/iter 15.681484 +iter : 30 Arret : 0.00836878 s/iter 16.653970 +iter : 31 Arret : 0.00723158 s/iter 16.633490 +iter : 32 Arret : 0.00861441 s/iter 15.702041 +iter : 33 Arret : 0.00165411 s/iter 11.138865 +iter : 34 Arret : 0.000409009 s/iter 11.076497 +iter : 35 Arret : 0.000176011 s/iter 11.139679 +iter : 36 Arret : 0.000101507 s/iter 11.068780 +iter : 37 Arret : 8.8136E-05 s/iter 11.092742 +iter : 38 Arret : 3.91964E-05 s/iter 11.100536 +iter : 39 Arret : 2.81821E-05 s/iter 11.121540 +iter : 40 Arret : 2.67571E-05 s/iter 11.106333 +iter : 41 Arret : 1.12165E-05 s/iter 11.102930 +iter : 42 Arret : 5.58588E-07 s/iter 11.093405 +iter : 43 Arret : 1.3188E-10 s/iter 11.108241 +iter : 44 Arret : 2.48253E-16 s/iter 11.073402 +temps : 560.426 seconde(s) +Nb iterations : 44 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.12993E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540383 +i* 0.841419| 1| 1.25143E-14 +i* 6.97793E-14| +| 2| -0.98885 +i* 0.148913| 1|-1.87034E-13 +i*-1.52024E-13| +| 3| 0.412505 +i* -0.910956| 1|-2.05679E-13 +i* 8.74266E-14| +| 4| 0.268615 +i* -0.963248| 1| 1.23929E-14 +i* 2.02841E-14| +| 5| -0.954531 +i* 0.298113| 1| 6.68562E-14 +i* 8.87016E-14| +| 6| 0.769071 +i* 0.639164| 1|-1.31544E-13 +i* 4.65595E-13| +| 7| 0.11843 +i* -0.992962| 1| -1.5522E-13 +i* 8.29944E-14| +| 8| -0.897838 +i* 0.440326| 1|-2.57121E-14 +i* 6.84192E-14| +| 9| 0.857624 +i* 0.514277| 1| 3.15342E-13 +i* 8.14579E-13| +| 10| -0.0345309 +i* -0.999404| 1| 3.31561E-13 +i*-9.06705E-14| +| 11| 0.662491 +i* 0.74907| 1| 5.75581E-15 +i*-3.34004E-14| +| 12| -0.820101 +i* 0.572218| 1|-4.91863E-14 +i*-2.00555E-13| +| 13| -0.186683 +i* -0.98242| 1| -1.8106E-13 +i* 3.61083E-14| +| 14| 0.926112 +i* 0.377248| 1| 4.98601E-13 +i* 1.04792E-12| +| 15| -0.723143 +i* 0.690699| 1|-1.75058E-13 +i* 1.33799E-14| +| 16| -0.334459 +i* -0.94241| 1| 2.20716E-13 +i*-8.68958E-14| +| 17| 0.972834 +i* 0.231505| 1| 3.9433E-13 +i*-1.27901E-14| +| 18| -0.609235 +i* 0.79299| 1|-8.90538E-14 +i* 1.42372E-13| +| 19| -0.474396 +i* -0.880312| 1| 2.76109E-13 +i* 7.19095E-14| +| 20| 0.996769 +i* 0.0803222| 1| 1.85257E-12 +i*-5.24946E-12| ++---+----------------------------+------------+----------------------------+ +400000 racines de module = 1 +proc 1 +proc 2 +proc 0 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 1, start 200021 size 200021 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 2, start 400042 size 200021 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 200021 +proc 0 start 0 size 200021 +proc 1 start 200021 size 200021 +proc 2 start 400042 size 200021 +iter : 1 Arret : 3.9836E-06 s/iter 25.525561 +iter : 2 Arret : 3.95184E-06 s/iter 25.499626 +iter : 3 Arret : 3.95265E-06 s/iter 25.498954 +iter : 4 Arret : 4.3017E-06 s/iter 25.509370 +iter : 5 Arret : 3.95279E-06 s/iter 25.486493 +iter : 6 Arret : 3.85622E-06 s/iter 25.524103 +iter : 7 Arret : 4.27696E-06 s/iter 25.508367 +iter : 8 Arret : 4.31858E-06 s/iter 25.499364 +iter : 9 Arret : 5.22735E-06 s/iter 25.476088 +iter : 10 Arret : 9.55242E-06 s/iter 25.498282 +iter : 11 Arret : 0.000408813 s/iter 25.499924 +iter : 12 Arret : 0.000623962 s/iter 25.479031 +iter : 13 Arret : 2.07139 s/iter 30.576596 +iter : 14 Arret : 0.369572 s/iter 25.666070 +iter : 15 Arret : 0.0917113 s/iter 30.847343 +iter : 16 Arret : 0.014644 s/iter 30.823046 +iter : 17 Arret : 0.08377 s/iter 30.598259 +iter : 18 Arret : 0.122673 s/iter 29.319598 +iter : 19 Arret : 0.0541091 s/iter 30.620000 +iter : 20 Arret : 0.00949308 s/iter 30.742138 +iter : 21 Arret : 0.00771035 s/iter 30.781286 +iter : 22 Arret : 0.0322107 s/iter 30.666529 +iter : 23 Arret : 0.0185899 s/iter 30.740687 +iter : 24 Arret : 0.0148294 s/iter 30.870237 +iter : 25 Arret : 0.00825526 s/iter 32.570814 +iter : 26 Arret : 0.00715596 s/iter 30.852198 +iter : 27 Arret : 0.00420726 s/iter 30.886487 +iter : 28 Arret : 0.0531924 s/iter 31.004936 +iter : 29 Arret : 0.117022 s/iter 30.827523 +iter : 30 Arret : 0.0476926 s/iter 30.852345 +iter : 31 Arret : 0.0147319 s/iter 30.830238 +iter : 32 Arret : 0.00915774 s/iter 30.849625 +iter : 33 Arret : 0.00853895 s/iter 30.764715 +iter : 34 Arret : 0.00882479 s/iter 30.734756 +iter : 35 Arret : 0.00698376 s/iter 30.758187 +iter : 36 Arret : 0.00434219 s/iter 30.755631 +iter : 37 Arret : 0.00443135 s/iter 30.830488 +iter : 38 Arret : 0.00307639 s/iter 30.886661 +iter : 39 Arret : 0.00232794 s/iter 33.124359 +iter : 40 Arret : 0.00166971 s/iter 33.347585 +iter : 41 Arret : 0.00122295 s/iter 33.337013 +iter : 42 Arret : 0.00134613 s/iter 33.285912 +iter : 43 Arret : 0.00166112 s/iter 33.142078 +iter : 44 Arret : 0.000672024 s/iter 33.237063 +iter : 45 Arret : 0.00102215 s/iter 33.355120 +iter : 46 Arret : 0.000576134 s/iter 33.216977 +iter : 47 Arret : 0.000573071 s/iter 33.377160 +iter : 48 Arret : 0.000353889 s/iter 33.363547 +iter : 49 Arret : 0.000700172 s/iter 33.256834 +iter : 50 Arret : 0.000743481 s/iter 33.311955 +iter : 51 Arret : 0.000608469 s/iter 33.215625 +iter : 52 Arret : 0.000457263 s/iter 33.235940 +iter : 53 Arret : 0.000589296 s/iter 33.259107 +iter : 54 Arret : 0.00029042 s/iter 33.275375 +iter : 55 Arret : 0.000315472 s/iter 33.281962 +iter : 56 Arret : 0.000339342 s/iter 33.300298 +iter : 57 Arret : 0.000360241 s/iter 32.539274 +iter : 58 Arret : 0.000378409 s/iter 32.618195 +iter : 59 Arret : 0.000391962 s/iter 33.119674 +iter : 60 Arret : 0.000399828 s/iter 32.899002 +iter : 61 Arret : 0.000401281 s/iter 32.644672 +iter : 62 Arret : 0.000397059 s/iter 32.640126 +iter : 63 Arret : 0.000388639 s/iter 32.641116 +iter : 64 Arret : 0.00037597 s/iter 32.632602 +iter : 65 Arret : 0.000360455 s/iter 32.986045 +iter : 66 Arret : 0.000717297 s/iter 32.532920 +iter : 67 Arret : 0.00150294 s/iter 32.611614 +iter : 68 Arret : 0.000598521 s/iter 32.918210 +iter : 69 Arret : 0.000758787 s/iter 32.757914 +iter : 70 Arret : 0.000686837 s/iter 32.509446 +iter : 71 Arret : 0.000570881 s/iter 32.470879 +iter : 72 Arret : 0.000666462 s/iter 32.695344 +iter : 73 Arret : 0.00186755 s/iter 32.494798 +iter : 74 Arret : 0.00081939 s/iter 32.340122 +iter : 75 Arret : 0.00201132 s/iter 32.271960 +iter : 76 Arret : 0.002594 s/iter 32.320544 +iter : 77 Arret : 0.00723111 s/iter 32.265210 +iter : 78 Arret : 0.0396512 s/iter 32.353911 +iter : 79 Arret : 0.0862068 s/iter 32.342476 +iter : 80 Arret : 0.0251405 s/iter 32.348286 +iter : 81 Arret : 0.00613878 s/iter 32.351287 +iter : 82 Arret : 0.00228496 s/iter 32.701677 +iter : 83 Arret : 0.00108013 s/iter 32.346807 +iter : 84 Arret : 0.000639188 s/iter 25.993462 +iter : 85 Arret : 0.000657107 s/iter 25.901633 +iter : 86 Arret : 0.000334682 s/iter 25.818396 +iter : 87 Arret : 0.000190014 s/iter 25.496927 +iter : 88 Arret : 0.000130996 s/iter 25.552346 +iter : 89 Arret : 9.44195E-05 s/iter 25.504032 +iter : 90 Arret : 7.21415E-05 s/iter 25.545409 +iter : 91 Arret : 6.63758E-05 s/iter 25.516656 +iter : 92 Arret : 6.94495E-05 s/iter 25.530970 +iter : 93 Arret : 5.93857E-05 s/iter 25.505281 +iter : 94 Arret : 6.09831E-05 s/iter 25.539102 +iter : 95 Arret : 2.42734E-05 s/iter 25.538370 +iter : 96 Arret : 1.33758E-05 s/iter 25.540559 +iter : 97 Arret : 4.98428E-07 s/iter 25.505833 +iter : 98 Arret : 1.66718E-11 s/iter 25.536699 +iter : 99 Arret : 1.57009E-16 s/iter 25.524236 +temps : 2990.26 seconde(s) +Nb iterations : 99 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.996672 +i* 0.0815122| 1|-4.60361E-14 +i*-1.54911E-15| +| 3| 0.396458 +i* -0.918053| 1|-3.61742E-13 +i* 4.28426E-13| +| 4| -0.983009 +i* 0.183558| 1| 2.27839E-14 +i* 1.21547E-13| +| 5| 0.299962 +i* -0.953951| 1| 3.10155E-13 +i*-4.52272E-13| +| 6| 0.701062 +i* 0.7131| 1| 6.08482E-13 +i* 3.68603E-13| +| 7| -0.958925 +i* 0.283658| 1|-3.43857E-14 +i*-4.33108E-14| +| 8| 0.200287 +i* -0.979737| 1| 4.39829E-13 +i*-3.61119E-13| +| 9| 0.770667 +i* 0.637238| 1| -2.7036E-13 +i*-8.38747E-13| +| 10| -0.924677 +i* 0.380752| 1| 1.44957E-13 +i* 1.13251E-13| +| 11| 0.0984885 +i* -0.995138| 1| 3.5235E-13 +i*-2.31698E-13| +| 12| 0.832104 +i* 0.55462| 1| 8.49546E-13 +i* -8.3842E-13| +| 13| -0.880627 +i* 0.473809| 1|-9.58227E-14 +i* -1.6529E-13| +| 14| -0.0043537 +i* -0.999991| 1| 1.63446E-13 +i*-5.45449E-14| +| 15| 0.88472 +i* 0.466123| 1| -6.8268E-13 +i* -3.8889E-13| +| 16| 0.624025 +i* 0.781404| 1| 9.47506E-15 +i*-6.78554E-13| +| 17| -0.827243 +i* 0.561844| 1|-1.79082E-13 +i*-3.05719E-13| +| 18| -0.10715 +i* -0.994243| 1| 3.32474E-13 +i*-4.57395E-14| +| 19| 0.927958 +i* 0.372686| 1| 1.0255E-13 +i* 1.0692E-13| +| 20| -0.76509 +i* 0.643924| 1| 2.51882E-15 +i*-2.49661E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +proc 1 +proc 2 +proc 0 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 2, start 533332 size 266666 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 1, start 266666 size 266666 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 266666 +proc 0 start 0 size 266666 +proc 1 start 266666 size 266666 +proc 2 start 533332 size 266666 +iter : 1 Arret : 3.51402E-06 s/iter 44.294763 +iter : 2 Arret : 3.80357E-06 s/iter 44.319418 +iter : 3 Arret : 3.56184E-06 s/iter 44.328022 +iter : 4 Arret : 3.94545E-06 s/iter 44.304192 +iter : 5 Arret : 3.59077E-06 s/iter 44.249235 +iter : 6 Arret : 3.37535E-06 s/iter 44.261256 +iter : 7 Arret : 3.50756E-06 s/iter 44.236566 +iter : 8 Arret : 3.32785E-06 s/iter 44.304981 +iter : 9 Arret : 3.76915E-06 s/iter 44.299164 +iter : 10 Arret : 9.49674E-06 s/iter 44.332812 +iter : 11 Arret : 0.000293847 s/iter 44.217077 +iter : 12 Arret : 0.00113222 s/iter 44.131781 +iter : 13 Arret : 0.75504 s/iter 44.201398 +iter : 14 Arret : 0.948015 s/iter 49.079893 +iter : 15 Arret : 2.42978 s/iter 44.298151 +iter : 16 Arret : 0.042389 s/iter 44.184047 +iter : 17 Arret : 0.0110299 s/iter 44.615420 +iter : 18 Arret : 0.00252208 s/iter 44.609085 +iter : 19 Arret : 0.00162899 s/iter 44.829789 +iter : 20 Arret : 0.000831396 s/iter 44.821825 +iter : 21 Arret : 0.00100286 s/iter 44.786377 +iter : 22 Arret : 0.00241153 s/iter 44.690141 +iter : 23 Arret : 0.00162026 s/iter 44.718089 +iter : 24 Arret : 0.00177008 s/iter 44.710724 +iter : 25 Arret : 0.000154585 s/iter 44.844071 +iter : 26 Arret : 0.000152704 s/iter 44.760597 +iter : 27 Arret : 7.71707E-05 s/iter 44.702686 +iter : 28 Arret : 2.73778E-05 s/iter 44.701397 +iter : 29 Arret : 8.07591E-06 s/iter 44.876078 +iter : 30 Arret : 1.99761E-08 s/iter 44.710043 +iter : 31 Arret : 5.01256E-14 s/iter 44.939607 +temps : 1385.04 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 0.0233219 +Stabilite : 5.01256E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| -0.942555 +i* -0.334052| 1| 2.1929E-13 +i*-2.49686E-13| +| 3| -0.558601 +i* 0.829437| 1|-3.51628E-14 +i*-4.09232E-13| +| 4| -0.0665975 +i* -0.99778| 1|-3.91888E-13 +i* 9.06636E-14| +| 5| 0.949627 +i* -0.313383| 1|-1.12544E-12 +i* 2.13597E-12| +| 6| -0.982853 +i* -0.184391| 1| 8.57613E-14 +i* 1.33506E-13| +| 7| 0.889798 +i* -0.456354| 1| 1.27488E-12 +i* 5.17779E-13| +| 8| -0.423729 +i* 0.905789| 1|-7.25461E-15 +i*-1.33088E-14| +| 9| -0.219973 +i* -0.975506| 1| 4.34097E-13 +i*-4.24712E-14| +| 10| 0.771464 +i* 0.636273| 1| -4.4266E-13 +i*-2.07773E-13| +| 11| -0.999541 +i* -0.0303078| 1| 3.54265E-14 +i* 1.32862E-14| +| 12| 0.808597 +i* -0.588363| 1|-5.90212E-13 +i*-1.43182E-12| +| 13| 0.663883 +i* 0.747836| 1| 4.13159E-13 +i* 1.10149E-12| +| 14| -0.27868 +i* 0.960384| 1|-1.03539E-13 +i*-1.45998E-13| +| 15| -0.368064 +i* -0.929801| 1| 4.60916E-14 +i*-1.09841E-13| +| 16| -0.992219 +i* 0.124503| 1| 2.74294E-13 +i* 2.11383E-13| +| 17| 0.707973 +i* -0.706239| 1|-1.10575E-12 +i*-7.41631E-13| +| 18| 0.860514 +i* 0.509426| 1| 9.86579E-13 +i* 1.10532E-12| +| 19| -0.126936 +i* 0.991911| 1| 1.67744E-13 +i* 5.51772E-13| +| 20| -0.507314 +i* -0.861761| 1| 5.50185E-14 +i* 3.42273E-13| ++---+----------------------------+------------+----------------------------+ +799998 racines de module = 1 + 2 racines de module = 0.999973 +proc 0 +proc 1 +proc 2 +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 1, start 333397 size 333397 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 2, start 666794 size 333397 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 0, start 0 size 333397 +proc 0 start 0 size 333397 +proc 2 start 666794 size 333397 +proc 1 start 333397 size 333397 +iter : 1 Arret : 2.8451E-06 s/iter 68.382486 +iter : 2 Arret : 2.78948E-06 s/iter 68.433560 +iter : 3 Arret : 2.75233E-06 s/iter 68.300025 +iter : 4 Arret : 2.48943E-06 s/iter 68.458525 +iter : 5 Arret : 3.00008E-06 s/iter 68.432090 +iter : 6 Arret : 3.01453E-06 s/iter 68.524897 +iter : 7 Arret : 3.01551E-06 s/iter 68.446182 +iter : 8 Arret : 3.04535E-06 s/iter 68.434743 +iter : 9 Arret : 3.16579E-06 s/iter 68.422035 +iter : 10 Arret : 4.01535E-06 s/iter 68.414166 +iter : 11 Arret : 7.65071E-05 s/iter 68.321480 +iter : 12 Arret : 5.74976E-05 s/iter 68.468346 +iter : 13 Arret : 0.000147002 s/iter 68.502897 +iter : 14 Arret : 0.010635 s/iter 68.536016 +iter : 15 Arret : 1.48474 s/iter 69.952485 +iter : 16 Arret : 0.144549 s/iter 70.174661 +iter : 17 Arret : 0.072159 s/iter 71.191994 +iter : 18 Arret : 0.0444524 s/iter 71.740517 +iter : 19 Arret : 0.0333598 s/iter 71.272424 +iter : 20 Arret : 0.0200395 s/iter 84.578496 +iter : 21 Arret : 0.0382658 s/iter 71.993384 +iter : 22 Arret : 0.0565025 s/iter 84.082613 +iter : 23 Arret : 0.12442 s/iter 82.942989 +iter : 24 Arret : 0.115553 s/iter 83.042270 +iter : 25 Arret : 0.127644 s/iter 70.585446 +iter : 26 Arret : 0.0940982 s/iter 70.689985 +iter : 27 Arret : 0.408598 s/iter 69.739812 +iter : 28 Arret : 0.146925 s/iter 69.482126 +iter : 29 Arret : 0.117833 s/iter 69.445977 +iter : 30 Arret : 0.00176567 s/iter 69.543260 +iter : 31 Arret : 0.000770263 s/iter 69.219228 +iter : 32 Arret : 0.000776806 s/iter 69.180679 +iter : 33 Arret : 0.00227798 s/iter 69.395829 +iter : 34 Arret : 0.00273768 s/iter 69.480777 +iter : 35 Arret : 2.35509E-05 s/iter 69.247466 +iter : 36 Arret : 1.12109E-05 s/iter 69.338594 +iter : 37 Arret : 7.87711E-06 s/iter 69.330499 +iter : 38 Arret : 4.9475E-06 s/iter 69.070098 +iter : 39 Arret : 1.46624E-06 s/iter 69.286034 +iter : 40 Arret : 6.57085E-08 s/iter 69.209367 +iter : 41 Arret : 2.62868E-12 s/iter 69.216136 +iter : 42 Arret : 1.57009E-16 s/iter 69.263657 +temps : 2970.64 seconde(s) +Nb iterations : 42 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.80137E-07 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54034 +i* 0.841447| 1| 4.08253E-13 +i*-6.65317E-13| +| 2| -0.513915 +i* -0.857841| 1|-9.07486E-13 +i* 1.86417E-13| +| 3| 0.486982 +i* 0.873412| 1|-6.63601E-14 +i*-1.18344E-12| +| 4| -0.459589 +i* -0.888132| 1|-5.16153E-13 +i*-2.68006E-13| +| 5| 0.43174 +i* 0.901998| 1|-6.77361E-13 +i* 7.93272E-13| +| 6| -0.40348 +i* -0.914989| 1|-3.45956E-13 +i*-2.59726E-13| +| 7| 0.374828 +i* 0.927094| 1| 3.65041E-13 +i* 3.54812E-13| +| 8| -0.345815 +i* -0.938303| 1| 5.50778E-13 +i* 8.9059E-14| +| 9| 0.316466 +i* 0.948604| 1|-2.87419E-13 +i* 5.21678E-13| +| 10| -0.286812 +i* -0.957987| 1| 6.43516E-13 +i* 2.73696E-13| +| 11| 0.25688 +i* 0.966443| 1|-4.31814E-13 +i* 5.6624E-13| +| 12| -0.226699 +i* -0.973965| 1| 4.35089E-13 +i* -6.6197E-14| +| 13| 0.196299 +i* 0.980544| 1| 3.90278E-14 +i*-7.14062E-13| +| 14| -0.16571 +i* -0.986175| 1| 2.49276E-13 +i*-1.75918E-13| +| 15| 0.13496 +i* 0.990851| 1| 1.03566E-13 +i*-6.61428E-13| +| 16| -0.104079 +i* -0.994569| 1| 7.90108E-13 +i*-1.74942E-13| +| 17| 0.0730977 +i* 0.997325| 1| 1.11931E-13 +i* 4.68587E-13| +| 18| -0.0420456 +i* -0.999116| 1| 2.29268E-13 +i*-1.21795E-14| +| 19| 0.0109529 +i* 0.99994| 1|-2.47309E-13 +i*-7.90307E-13| +| 20| 0.0201504 +i* -0.999797| 1| 6.69503E-13 +i*-2.16847E-13| ++---+----------------------------+------------+----------------------------+ +1000000 racines de module = 1 +proc 1 +proc 2 +proc 0 +zone limite de 'log-exp' 1.0003 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 0, start 0 size 400042 +zone limite de 'log-exp' 1.0003 +zone limite de 'log-exp' 1.0003 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 1, start 400042 size 400042 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 2, start 800084 size 400042 +proc 2 start 800084 size 400042 +proc 0 start 0 size 400042 +proc 1 start 400042 size 400042 +iter : 1 Arret : 2.21726E-06 s/iter 98.933516 +iter : 2 Arret : 2.40944E-06 s/iter 99.024194 +iter : 3 Arret : 2.26938E-06 s/iter 98.935143 +iter : 4 Arret : 2.18952E-06 s/iter 98.915619 +iter : 5 Arret : 2.11829E-06 s/iter 98.890602 +iter : 6 Arret : 2.15946E-06 s/iter 99.042635 +iter : 7 Arret : 2.21461E-06 s/iter 98.822289 +iter : 8 Arret : 2.0517E-06 s/iter 98.833670 +iter : 9 Arret : 2.19174E-06 s/iter 98.820760 +iter : 10 Arret : 3.53644E-06 s/iter 98.877812 +iter : 11 Arret : 2.93712E-05 s/iter 98.816823 +iter : 12 Arret : 0.000329486 s/iter 98.801491 +iter : 13 Arret : 0.00111564 s/iter 99.137713 +iter : 14 Arret : 0.00153883 s/iter 98.876762 +iter : 15 Arret : 0.00119076 s/iter 109.789116 +iter : 16 Arret : 0.00186074 s/iter 112.218069 +iter : 17 Arret : 0.00210628 s/iter 109.255968 +iter : 18 Arret : 0.00980243 s/iter 107.550669 +iter : 19 Arret : 0.0184337 s/iter 114.843464 +iter : 20 Arret : 0.862797 s/iter 116.811287 +iter : 21 Arret : 1.29623 s/iter 117.220983 +iter : 22 Arret : 0.0557788 s/iter 118.439918 +iter : 23 Arret : 0.0754259 s/iter 118.702708 +iter : 24 Arret : 0.127579 s/iter 117.589152 +iter : 25 Arret : 0.243013 s/iter 116.977342 +iter : 26 Arret : 0.180211 s/iter 115.451612 +iter : 27 Arret : 0.132259 s/iter 110.412441 +iter : 28 Arret : 0.0619261 s/iter 111.019579 +iter : 29 Arret : 0.0360536 s/iter 101.119496 +iter : 30 Arret : 0.00610072 s/iter 110.162545 +iter : 31 Arret : 0.004289 s/iter 100.407968 +iter : 32 Arret : 0.000108571 s/iter 100.118461 +iter : 33 Arret : 6.29846E-06 s/iter 100.405665 +iter : 34 Arret : 2.52712E-05 s/iter 100.269833 +iter : 35 Arret : 1.38101E-05 s/iter 99.930403 +iter : 36 Arret : 2.18198E-05 s/iter 100.236092 +iter : 37 Arret : 1.62692E-05 s/iter 100.270854 +iter : 38 Arret : 5.12509E-06 s/iter 100.438752 +iter : 39 Arret : 4.17055E-05 s/iter 100.172456 +iter : 40 Arret : 3.74078E-05 s/iter 100.444459 +iter : 41 Arret : 9.75528E-07 s/iter 100.287457 +iter : 42 Arret : 5.34138E-11 s/iter 100.361764 +iter : 43 Arret : 1.57009E-16 s/iter 100.186348 +temps : 4497 seconde(s) +Nb iterations : 43 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.34152E-07 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.841451| 1|-1.40868E-12 +i*-1.55069E-13| +| 2| -0.583871 +i* 0.811846| 1| 5.87586E-14 +i* 2.63177E-13| +| 3| 0.0263196 +i* -0.999654| 1| 9.89594E-13 +i*-3.85265E-13| +| 4| -0.969647 +i* -0.244511| 1|-5.84047E-14 +i*-6.69829E-14| +| 5| 0.939323 +i* -0.343035| 1| 7.60725E-13 +i* 1.68227E-12| +| 6| -0.129097 +i* -0.991632| 1| -2.278E-13 +i*-2.09967E-13| +| 7| -0.450842 +i* 0.892604| 1| 3.34819E-13 +i* 5.30987E-13| +| 8| 0.874726 +i* -0.484618| 1| 6.94573E-13 +i* 1.33379E-12| +| 9| -0.995841 +i* -0.0911079| 1| 6.65572E-13 +i* 2.21578E-13| +| 10| 0.772266 +i* 0.635299| 1|-1.10511E-12 +i*-6.88458E-13| +| 11| -0.281387 +i* -0.959594| 1|-6.93022E-14 +i* 4.40275E-13| +| 12| -0.306893 +i* 0.951744| 1| 1.0443E-15 +i* 1.24753E-13| +| 13| 0.788944 +i* -0.614465| 1| -2.2269E-12 +i*-9.13604E-13| +| 14| -0.997918 +i* 0.0645018| 1| 2.81913E-13 +i* 2.2426E-13| +| 15| 0.861482 +i* 0.507788| 1| 2.41178E-12 +i* 5.79845E-13| +| 16| -0.426862 +i* -0.904317| 1| 6.20323E-13 +i* 5.74424E-13| +| 17| 0.664347 +i* 0.747424| 1| 4.99219E-13 +i* 1.52752E-12| +| 18| -0.155512 +i* 0.987834| 1| 2.30305E-13 +i* 4.37822E-13| +| 19| -0.975826 +i* 0.218549| 1| 1.82913E-13 +i* 5.28258E-14| +| 20| 0.684055 +i* -0.72943| 1|-1.32506E-12 +i*-1.70394E-12| ++---+----------------------------+------------+----------------------------+ +1200000 racines de module = 1 +proc 0 +proc 1 +proc 2 +zone limite de 'log-exp' 1.00025 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 1, start 466688 size 466688 +zone limite de 'log-exp' 1.00025 +zone limite de 'log-exp' 1.00025 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 2, start 933376 size 466688 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 0, start 0 size 466688 +proc 0 start 0 size 466688 +proc 1 start 466688 size 466688 +proc 2 start 933376 size 466688 +iter : 1 Arret : 2.08542E-06 s/iter 134.328776 +iter : 2 Arret : 2.15308E-06 s/iter 134.586017 +iter : 3 Arret : 2.11841E-06 s/iter 134.599024 +iter : 4 Arret : 2.04952E-06 s/iter 134.624374 +iter : 5 Arret : 2.06699E-06 s/iter 134.596768 +iter : 6 Arret : 1.83796E-06 s/iter 134.584295 +iter : 7 Arret : 2.00923E-06 s/iter 134.519336 +iter : 8 Arret : 1.86075E-06 s/iter 134.440160 +iter : 9 Arret : 2.1628E-06 s/iter 134.425205 +iter : 10 Arret : 1.9984E-06 s/iter 134.420418 +iter : 11 Arret : 2.90225E-05 s/iter 134.483615 +iter : 12 Arret : 0.000247724 s/iter 134.359944 +iter : 13 Arret : 0.000608129 s/iter 134.284262 +iter : 14 Arret : 0.00965224 s/iter 139.172750 +iter : 15 Arret : 0.00945937 s/iter 148.248623 +iter : 16 Arret : 0.00602604 s/iter 150.503292 +iter : 17 Arret : 0.0120208 s/iter 134.363579 +iter : 18 Arret : 0.69183 s/iter 152.465158 +iter : 19 Arret : 0.028323 s/iter 154.120630 +iter : 20 Arret : 0.0425547 s/iter 152.801781 +iter : 21 Arret : 0.0245225 s/iter 136.641648 +iter : 22 Arret : 0.0380377 s/iter 134.593207 +iter : 23 Arret : 0.0169297 s/iter 134.362628 +iter : 24 Arret : 0.00832844 s/iter 134.078323 +iter : 25 Arret : 0.00715569 s/iter 133.946911 +iter : 26 Arret : 0.000358787 s/iter 133.666167 +iter : 27 Arret : 0.000457827 s/iter 133.611801 +iter : 28 Arret : 8.98119E-05 s/iter 133.662721 +iter : 29 Arret : 6.67621E-05 s/iter 133.612559 +iter : 30 Arret : 5.46875E-06 s/iter 133.693580 +iter : 31 Arret : 1.14937E-09 s/iter 133.691083 +iter : 32 Arret : 4.44089E-16 s/iter 133.664082 +temps : 4390.32 seconde(s) +Nb iterations : 32 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.63785E-07 +Stabilite : 4.44089E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540329 +i* 0.841454| 1| 4.3987E-13 +i* 1.7418E-12| +| 2| -0.0530086 +i* 0.998594| 1| 3.8728E-13 +i* 8.41422E-13| +| 3| -0.626376 +i* 0.779521| 1| 2.93654E-14 +i*-2.95439E-13| +| 4| -0.96376 +i* 0.26677| 1|-1.31943E-13 +i* 5.03167E-13| +| 5| -0.938055 +i* -0.346485| 1| 6.12451E-13 +i*-2.34033E-13| +| 6| -0.558945 +i* -0.829205| 1| 2.12923E-13 +i* 6.04209E-13| +| 7| 0.0307435 +i* -0.999527| 1|-3.70079E-13 +i* 1.04685E-13| +| 8| 0.60885 +i* -0.793286| 1| -1.5142E-12 +i* 2.45191E-13| +| 9| 0.957578 +i* -0.288175| 1|-3.17266E-12 +i* 2.02057E-12| +| 10| 0.945542 +i* 0.325501| 1|-1.50276E-12 +i* 3.84538E-13| +| 11| -0.00847209 +i* 0.999964| 1| 8.68958E-14 +i* 2.94643E-13| +| 12| -0.591029 +i* 0.80665| 1|-5.75824E-14 +i*-8.87086E-13| +| 13| -0.95092 +i* 0.309437| 1|-6.93591E-13 +i*-5.52411E-13| +| 14| -0.952559 +i* -0.304354| 1|-3.04982E-13 +i* 1.60452E-13| +| 15| -0.595328 +i* -0.803482| 1|-1.05039E-12 +i* 2.37501E-13| +| 16| -0.0138125 +i* -0.999905| 1|-8.72476E-13 +i* 2.69644E-13| +| 17| 0.572907 +i* -0.81962| 1| 1.32405E-12 +i*-6.73803E-13| +| 18| 0.94379 +i* -0.330546| 1|-1.85401E-12 +i* 2.58533E-12| +| 19| 0.959103 +i* 0.283057| 1|-2.75633E-12 +i* 3.49955E-12| +| 20| 0.613081 +i* 0.79002| 1| 4.49453E-13 +i*-4.47541E-14| ++---+----------------------------+------------+----------------------------+ +1400000 racines de module = 1 diff --git a/Simulations/full_mpi_bis/full_mpi_4GPU.o140348 b/Simulations/full_mpi_bis/full_mpi_4GPU.o140348 new file mode 100644 index 0000000..a8b585d --- /dev/null +++ b/Simulations/full_mpi_bis/full_mpi_4GPU.o140348 @@ -0,0 +1,706 @@ +REMAINING: 4 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +Taking GPU #3 +proc 0 +proc 1 +proc 2 +proc 3 +zone limite de 'log-exp' 1.00356 +zone limite de 'log-exp' 1.00356 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 3, start 75072 size 25024 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 2, start 50048 size 25024 +zone limite de 'log-exp' 1.00356 +zone limite de 'log-exp' 1.00356 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 1, start 25024 size 25024 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 0, start 0 size 25024 +proc 0 start 0 size 25024 +proc 2 start 50048 size 25024 +proc 3 start 75072 size 25024 +proc 1 start 25024 size 25024 +iter : 1 Arret : 2.3698E-05 s/iter 0.622464 +iter : 2 Arret : 2.40774E-05 s/iter 0.619322 +iter : 3 Arret : 2.33816E-05 s/iter 0.622254 +iter : 4 Arret : 2.55691E-05 s/iter 0.619500 +iter : 5 Arret : 2.365E-05 s/iter 0.622231 +iter : 6 Arret : 2.4839E-05 s/iter 0.619471 +iter : 7 Arret : 2.76054E-05 s/iter 0.622258 +iter : 8 Arret : 3.59937E-05 s/iter 0.622274 +iter : 9 Arret : 0.000553325 s/iter 0.622136 +iter : 10 Arret : 0.000469003 s/iter 0.622260 +iter : 11 Arret : 0.00158435 s/iter 0.619193 +iter : 12 Arret : 0.246132 s/iter 0.619279 +iter : 13 Arret : 1.48068 s/iter 1.975105 +iter : 14 Arret : 0.103644 s/iter 1.943167 +iter : 15 Arret : 0.171523 s/iter 1.967974 +iter : 16 Arret : 0.02354 s/iter 0.615229 +iter : 17 Arret : 0.0107071 s/iter 0.613145 +iter : 18 Arret : 0.00621909 s/iter 0.605147 +iter : 19 Arret : 0.00420462 s/iter 0.609331 +iter : 20 Arret : 0.00306936 s/iter 0.594530 +iter : 21 Arret : 0.00511681 s/iter 0.597070 +iter : 22 Arret : 0.0196508 s/iter 1.625667 +iter : 23 Arret : 0.0198844 s/iter 1.658483 +iter : 24 Arret : 0.00719091 s/iter 0.596861 +iter : 25 Arret : 0.00764461 s/iter 0.596707 +iter : 26 Arret : 0.00231209 s/iter 0.596872 +iter : 27 Arret : 0.00336988 s/iter 0.585655 +iter : 28 Arret : 0.0032107 s/iter 0.604600 +iter : 29 Arret : 0.0004392 s/iter 0.597593 +iter : 30 Arret : 8.96988E-05 s/iter 0.604060 +iter : 31 Arret : 4.52E-05 s/iter 0.598907 +iter : 32 Arret : 1.11158E-05 s/iter 0.598888 +iter : 33 Arret : 3.29001E-07 s/iter 0.598027 +iter : 34 Arret : 9.9053E-12 s/iter 0.599338 +iter : 35 Arret : 1.47523E-16 s/iter 0.599264 +temps : 27.6039 seconde(s) +Nb iterations : 35 +Nb de depassements de capacite exponentielle : 0 +Precision : 8.34887E-10 +Stabilite : 1.18572E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540601 +i* 0.841279| 1| -4.3885E-14 +i*-7.30839E-15| +| 2| -0.281748 +i* -0.959489| 1|-5.73395E-14 +i*-4.24574E-14| +| 3|-4.71234E-05 +i* 1| 1| 9.92262E-16 +i* 1.94116E-15| +| 4| 0.281778 +i* -0.95948| 1|-1.23963E-14 +i* 1.02314E-14| +| 5| -0.54068 +i* 0.841228| 1| 5.53932E-14 +i*-7.48533E-15| +| 6| 0.75578 +i* -0.654825| 1|-1.78253E-13 +i* 5.35631E-14| +| 7| -0.909652 +i* 0.415372| 1|-2.24577E-14 +i*-2.99309E-14| +| 8| 0.989828 +i* -0.142268| 1|-4.88647E-13 +i* 2.69096E-13| +| 9| -0.989815 +i* -0.142361| 1| 4.10505E-14 +i* 1.22957E-14| +| 10| 0.909612 +i* 0.415458| 1|-9.85774E-14 +i* 2.25852E-13| +| 11| -0.755719 +i* -0.654896| 1|-4.50195E-14 +i* 3.70867E-14| +| 12| 0.540548 +i* 0.841313| 1| 1.15279E-13 +i*-6.26114E-14| +| 13| -0.281687 +i* -0.959506| 1| 6.72067E-14 +i*-1.86153E-14| +| 14|-0.000109955 +i* 1| 1| 1.76803E-14 +i* 5.46854E-14| +| 15| 0.281838 +i* -0.959462| 1|-5.44356E-14 +i* 4.87822E-14| +| 16| -0.540733 +i* 0.841194| 1| 1.93526E-14 +i* 3.41446E-14| +| 17| 0.755822 +i* -0.654778| 1| 1.41439E-13 +i* 1.77344E-13| +| 18| -0.909678 +i* 0.415315| 1| 3.90799E-14 +i* 2.50217E-14| +| 19| 0.989837 +i* -0.142206| 1| 1.87558E-13 +i*-4.17969E-13| +| 20| -0.989806 +i* -0.142424| 1|-4.45512E-14 +i*-1.49828E-14| ++---+----------------------------+------------+----------------------------+ +100000 racines de module = 1 +proc 2 +proc 3 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00178 +zone limite de 'log-exp' 1.00178 +zone limite de 'log-exp' 1.00178 +zone limite de 'log-exp' 1.00178 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 1, start 50048 size 50048 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 3, start 150144 size 50048 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 0, start 0 size 50048 +proc 1 start 50048 size 50048 +proc 3 start 150144 size 50048 +proc 0 start 0 size 50048 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 2, start 100096 size 50048 +proc 2 start 100096 size 50048 +iter : 1 Arret : 1.39753E-05 s/iter 2.454701 +iter : 2 Arret : 1.16206E-05 s/iter 2.453722 +iter : 3 Arret : 1.21137E-05 s/iter 2.453840 +iter : 4 Arret : 1.23953E-05 s/iter 2.453810 +iter : 5 Arret : 1.17605E-05 s/iter 2.453887 +iter : 6 Arret : 1.20661E-05 s/iter 2.453606 +iter : 7 Arret : 1.30094E-05 s/iter 2.453480 +iter : 8 Arret : 1.57289E-05 s/iter 2.453754 +iter : 9 Arret : 3.34285E-05 s/iter 2.453454 +iter : 10 Arret : 0.000544613 s/iter 2.453478 +iter : 11 Arret : 0.00145338 s/iter 2.453591 +iter : 12 Arret : 1.7916 s/iter 2.453592 +iter : 13 Arret : 0.5341 s/iter 2.453540 +iter : 14 Arret : 0.701316 s/iter 4.785432 +iter : 15 Arret : 0.0709253 s/iter 4.772111 +iter : 16 Arret : 0.0253489 s/iter 4.760393 +iter : 17 Arret : 0.00880876 s/iter 2.439729 +iter : 18 Arret : 0.00540524 s/iter 2.428756 +iter : 19 Arret : 0.00751501 s/iter 4.246084 +iter : 20 Arret : 0.000696017 s/iter 2.423215 +iter : 21 Arret : 0.000258851 s/iter 2.411144 +iter : 22 Arret : 0.000852084 s/iter 2.411313 +iter : 23 Arret : 0.00216745 s/iter 2.410298 +iter : 24 Arret : 0.000101556 s/iter 2.410149 +iter : 25 Arret : 3.90454E-05 s/iter 2.410818 +iter : 26 Arret : 4.27421E-06 s/iter 2.410450 +iter : 27 Arret : 8.23315E-09 s/iter 2.410253 +iter : 28 Arret : 7.23968E-14 s/iter 2.410321 +temps : 77.3108 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.64385E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540465 +i* 0.841367| 1| 1.87479E-13 +i*-5.02237E-14| +| 2| 0.176081 +i* -0.984376| 1|-5.37799E-14 +i* 6.92554E-14| +| 3| -0.852009 +i* -0.523527| 1| 3.18461E-14 +i* 4.03913E-14| +| 4| -0.79862 +i* 0.601836| 1| 5.14346E-14 +i* 3.91354E-14| +| 5| 0.980657 +i* -0.195736| 1| 6.46188E-13 +i*-7.37166E-13| +| 6| 0.268452 +i* 0.963293| 1|-8.54421E-14 +i* 3.23248E-14| +| 7| 0.458412 +i* -0.88874| 1| 2.7818E-14 +i* 6.11247E-14| +| 8| -0.659841 +i* -0.751405| 1|-6.41605E-14 +i*-6.23928E-14| +| 9| 0.994783 +i* 0.102018| 1| 6.80962E-13 +i*-1.84925E-12| +| 10| -0.940535 +i* 0.339697| 1| 2.92266E-14 +i* 1.23877E-14| +| 11| -0.0274147 +i* 0.999624| 1|-2.15418E-14 +i* -6.3281E-14| +| 12| 0.70001 +i* -0.714133| 1| 5.4335E-14 +i* -1.5535E-13| +| 13| 0.920515 +i* 0.390707| 1|-2.49037E-13 +i*-1.72111E-13| +| 14| -0.409041 +i* -0.912516| 1|-2.16806E-14 +i*-1.57877E-14| +| 15| -0.998877 +i* 0.047373| 1|-3.52392E-14 +i*-1.99354E-14| +| 16| -0.320845 +i* 0.947132| 1| 1.35437E-13 +i* 4.41019E-14| +| 17| 0.764454 +i* 0.644679| 1|-2.19425E-13 +i* -1.9223E-13| +| 18| 0.879407 +i* -0.47607| 1| 3.13968E-13 +i*-3.31275E-13| +| 19| -0.121864 +i* -0.992547| 1| 1.45647E-13 +i* 1.68268E-16| +| 20| -0.968462 +i* -0.24916| 1| 5.32629E-14 +i* 1.07952E-14| ++---+----------------------------+------------+----------------------------+ +200000 racines de module = 1 +proc 1 +proc 2 +proc 3 +proc 0 +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 1, start 100032 size 100032 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 3, start 300096 size 100032 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 2, start 200064 size 100032 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 0, start 0 size 100032 +proc 0 start 0 size 100032 +proc 3 start 300096 size 100032 +proc 1 start 100032 size 100032 +proc 2 start 200064 size 100032 +iter : 1 Arret : 6.83306E-06 s/iter 8.677004 +iter : 2 Arret : 5.9257E-06 s/iter 8.697850 +iter : 3 Arret : 6.91668E-06 s/iter 8.659525 +iter : 4 Arret : 5.9062E-06 s/iter 8.678462 +iter : 5 Arret : 6.02571E-06 s/iter 8.669431 +iter : 6 Arret : 6.06088E-06 s/iter 8.668278 +iter : 7 Arret : 6.7324E-06 s/iter 8.669384 +iter : 8 Arret : 6.68447E-06 s/iter 8.672863 +iter : 9 Arret : 6.32239E-06 s/iter 8.670323 +iter : 10 Arret : 1.42876E-05 s/iter 8.668937 +iter : 11 Arret : 0.00172685 s/iter 8.670461 +iter : 12 Arret : 0.00544908 s/iter 12.914516 +iter : 13 Arret : 0.00431593 s/iter 10.171823 +iter : 14 Arret : 0.00293852 s/iter 9.404589 +iter : 15 Arret : 0.044057 s/iter 12.996197 +iter : 16 Arret : 4.91968 s/iter 13.158558 +iter : 17 Arret : 1.81247 s/iter 8.618251 +iter : 18 Arret : 0.688864 s/iter 8.615137 +iter : 19 Arret : 0.196386 s/iter 14.110223 +iter : 20 Arret : 0.0903125 s/iter 12.832674 +iter : 21 Arret : 0.0537492 s/iter 11.060473 +iter : 22 Arret : 0.0403772 s/iter 10.156647 +iter : 23 Arret : 0.111806 s/iter 8.580673 +iter : 24 Arret : 0.142564 s/iter 13.127274 +iter : 25 Arret : 0.154624 s/iter 12.185580 +iter : 26 Arret : 0.544118 s/iter 13.839476 +iter : 27 Arret : 0.571895 s/iter 13.142991 +iter : 28 Arret : 0.00312334 s/iter 10.141662 +iter : 29 Arret : 0.00151621 s/iter 8.584536 +iter : 30 Arret : 0.0012406 s/iter 8.589488 +iter : 31 Arret : 0.00305995 s/iter 8.624266 +iter : 32 Arret : 0.000527656 s/iter 8.604648 +iter : 33 Arret : 0.000120024 s/iter 8.586316 +iter : 34 Arret : 0.000957696 s/iter 8.600210 +iter : 35 Arret : 0.000158139 s/iter 8.586223 +iter : 36 Arret : 4.18049E-07 s/iter 8.594167 +iter : 37 Arret : 2.54857E-11 s/iter 8.618119 +iter : 38 Arret : 1.11022E-16 s/iter 8.588337 +temps : 376.869 seconde(s) +Nb iterations : 38 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.12993E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540383 +i* 0.841419| 1| 1.25143E-14 +i* 6.97793E-14| +| 2| -0.98885 +i* 0.148913| 1|-1.87034E-13 +i*-1.52024E-13| +| 3| 0.412505 +i* -0.910956| 1|-2.05679E-13 +i* 8.74266E-14| +| 4| 0.268615 +i* -0.963248| 1| 1.23929E-14 +i* 2.02841E-14| +| 5| -0.954531 +i* 0.298113| 1| 6.68562E-14 +i* 8.87016E-14| +| 6| 0.769081 +i* 0.639152| 1|-2.56017E-13 +i* 6.90161E-13| +| 7| 0.11843 +i* -0.992962| 1| -1.5522E-13 +i* 8.29944E-14| +| 8| -0.897838 +i* 0.440326| 1|-2.57121E-14 +i* 6.84192E-14| +| 9| 0.857632 +i* 0.514263| 1| 7.84754E-13 +i* 2.86151E-13| +| 10| -0.0345309 +i* -0.999404| 1| 3.31561E-13 +i*-9.06705E-14| +| 11| 0.662503 +i* 0.74906| 1| 7.42843E-14 +i*-6.06277E-13| +| 12| -0.820101 +i* 0.572218| 1|-4.91863E-14 +i*-2.00555E-13| +| 13| -0.186683 +i* -0.98242| 1| -1.8106E-13 +i* 3.61083E-14| +| 14| 0.926248 +i* 0.376914| 1|-6.80071E-13 +i*-7.41305E-13| +| 15| -0.723143 +i* 0.690699| 1|-1.75058E-13 +i* 1.33799E-14| +| 16| -0.334459 +i* -0.94241| 1| 2.20716E-13 +i*-8.68958E-14| +| 17| 0.972932 +i* 0.231092| 1| 1.37213E-13 +i* 8.45104E-13| +| 18| -0.609235 +i* 0.79299| 1|-8.90538E-14 +i* 1.42372E-13| +| 19| -0.474396 +i* -0.880312| 1| 2.76109E-13 +i* 7.19095E-14| +| 20| 0.99677 +i* 0.0803066| 1| 1.32664E-12 +i*-5.68624E-12| ++---+----------------------------+------------+----------------------------+ +400000 racines de module = 1 +proc 0 +proc 1 +proc 2 +proc 3 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 3, start 450048 size 150016 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 1, start 150016 size 150016 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 2, start 300032 size 150016 +proc 1 start 150016 size 150016 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 150016 +proc 0 start 0 size 150016 +proc 3 start 450048 size 150016 +proc 2 start 300032 size 150016 +iter : 1 Arret : 4.48435E-06 s/iter 18.838750 +iter : 2 Arret : 4.09959E-06 s/iter 18.766680 +iter : 3 Arret : 4.30879E-06 s/iter 18.762113 +iter : 4 Arret : 4.06302E-06 s/iter 18.763030 +iter : 5 Arret : 4.23595E-06 s/iter 18.764860 +iter : 6 Arret : 4.05416E-06 s/iter 18.761836 +iter : 7 Arret : 4.0595E-06 s/iter 18.757295 +iter : 8 Arret : 4.31359E-06 s/iter 18.756544 +iter : 9 Arret : 5.21531E-06 s/iter 18.755317 +iter : 10 Arret : 7.11795E-05 s/iter 18.758724 +iter : 11 Arret : 0.000408395 s/iter 18.756923 +iter : 12 Arret : 0.000706561 s/iter 18.760370 +iter : 13 Arret : 2.19093 s/iter 18.767510 +iter : 14 Arret : 0.451996 s/iter 18.759994 +iter : 15 Arret : 0.348648 s/iter 26.298146 +iter : 16 Arret : 0.184683 s/iter 18.925862 +iter : 17 Arret : 0.0408743 s/iter 18.697730 +iter : 18 Arret : 0.0214141 s/iter 23.426390 +iter : 19 Arret : 0.0133603 s/iter 18.929979 +iter : 20 Arret : 0.0171829 s/iter 19.527202 +iter : 21 Arret : 0.00669583 s/iter 20.574190 +iter : 22 Arret : 0.00488704 s/iter 24.911488 +iter : 23 Arret : 0.0145923 s/iter 24.829937 +iter : 24 Arret : 0.0160802 s/iter 25.179566 +iter : 25 Arret : 0.0887648 s/iter 25.160136 +iter : 26 Arret : 0.0156067 s/iter 24.806243 +iter : 27 Arret : 0.151029 s/iter 26.284457 +iter : 28 Arret : 0.0885446 s/iter 25.017191 +iter : 29 Arret : 0.0748154 s/iter 25.250652 +iter : 30 Arret : 0.0147904 s/iter 20.680925 +iter : 31 Arret : 0.00566475 s/iter 20.785703 +iter : 32 Arret : 0.0035956 s/iter 23.782230 +iter : 33 Arret : 0.00308793 s/iter 26.338575 +iter : 34 Arret : 0.00266822 s/iter 26.493405 +iter : 35 Arret : 0.00323756 s/iter 26.510053 +iter : 36 Arret : 0.00687861 s/iter 26.545076 +iter : 37 Arret : 0.0120672 s/iter 26.612693 +iter : 38 Arret : 0.00281708 s/iter 26.555146 +iter : 39 Arret : 0.00327894 s/iter 26.457712 +iter : 40 Arret : 0.00190532 s/iter 26.330070 +iter : 41 Arret : 0.000453493 s/iter 18.630883 +iter : 42 Arret : 0.00146626 s/iter 18.621114 +iter : 43 Arret : 0.00184988 s/iter 18.599559 +iter : 44 Arret : 0.00339119 s/iter 18.641018 +iter : 45 Arret : 0.000958132 s/iter 18.631149 +iter : 46 Arret : 0.000169759 s/iter 18.630007 +iter : 47 Arret : 4.09905E-05 s/iter 18.609641 +iter : 48 Arret : 1.22208E-05 s/iter 18.636672 +iter : 49 Arret : 1.7664E-05 s/iter 18.641179 +iter : 50 Arret : 9.49112E-06 s/iter 18.587389 +iter : 51 Arret : 1.73378E-06 s/iter 18.640660 +iter : 52 Arret : 1.6208E-08 s/iter 18.642526 +iter : 53 Arret : 3.34934E-14 s/iter 18.667701 +temps : 1130.49 seconde(s) +Nb iterations : 53 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.996672 +i* 0.0815122| 1|-4.60361E-14 +i*-1.54911E-15| +| 3| 0.396458 +i* -0.918053| 1|-3.61742E-13 +i* 4.28426E-13| +| 4| -0.983009 +i* 0.183558| 1| 2.27839E-14 +i* 1.21547E-13| +| 5| 0.299962 +i* -0.953951| 1| 3.10155E-13 +i*-4.52272E-13| +| 6| 0.701062 +i* 0.7131| 1| 6.08482E-13 +i* 3.68603E-13| +| 7| -0.958925 +i* 0.283658| 1|-3.43857E-14 +i*-4.33108E-14| +| 8| 0.200287 +i* -0.979737| 1| 4.39829E-13 +i*-3.61119E-13| +| 9| 0.770667 +i* 0.637238| 1| -2.7036E-13 +i*-8.38747E-13| +| 10| -0.924677 +i* 0.380752| 1| 1.44957E-13 +i* 1.13251E-13| +| 11| 0.0984885 +i* -0.995138| 1| 3.5235E-13 +i*-2.31698E-13| +| 12| 0.832104 +i* 0.55462| 1| 8.49546E-13 +i* -8.3842E-13| +| 13| -0.880627 +i* 0.473809| 1|-9.58227E-14 +i* -1.6529E-13| +| 14| -0.0043537 +i* -0.999991| 1| 1.63446E-13 +i*-5.45449E-14| +| 15| 0.88472 +i* 0.466123| 1| -6.8268E-13 +i* -3.8889E-13| +| 16| 0.624025 +i* 0.781404| 1| 9.47506E-15 +i*-6.78554E-13| +| 17| -0.827243 +i* 0.561844| 1|-1.79082E-13 +i*-3.05719E-13| +| 18| -0.10715 +i* -0.994243| 1| 3.32474E-13 +i*-4.57395E-14| +| 19| 0.927958 +i* 0.372686| 1| 1.0255E-13 +i* 1.0692E-13| +| 20| -0.76509 +i* 0.643924| 1| 2.51882E-15 +i*-2.49661E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +proc 2 +proc 3 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 1, start 200000 size 200000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 3, start 600000 size 200000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 2, start 400000 size 200000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 200000 +proc 0 start 0 size 200000 +proc 3 start 600000 size 200000 +proc 1 start 200000 size 200000 +proc 2 start 400000 size 200000 +iter : 1 Arret : 2.99282E-06 s/iter 34.171307 +iter : 2 Arret : 2.96802E-06 s/iter 34.158886 +iter : 3 Arret : 2.87918E-06 s/iter 34.169609 +iter : 4 Arret : 2.96246E-06 s/iter 34.166563 +iter : 5 Arret : 3.22003E-06 s/iter 34.133966 +iter : 6 Arret : 2.96197E-06 s/iter 34.137747 +iter : 7 Arret : 2.97177E-06 s/iter 34.159250 +iter : 8 Arret : 3.1804E-06 s/iter 34.124814 +iter : 9 Arret : 3.76914E-06 s/iter 34.159243 +iter : 10 Arret : 6.64269E-06 s/iter 34.114240 +iter : 11 Arret : 0.000184945 s/iter 34.138524 +iter : 12 Arret : 0.00113219 s/iter 34.181721 +iter : 13 Arret : 0.754059 s/iter 34.135705 +iter : 14 Arret : 0.94401 s/iter 34.137755 +iter : 15 Arret : 2.44482 s/iter 34.169116 +iter : 16 Arret : 0.0480063 s/iter 35.766805 +iter : 17 Arret : 0.0138416 s/iter 33.976349 +iter : 18 Arret : 0.00117539 s/iter 34.110213 +iter : 19 Arret : 0.000995536 s/iter 33.875032 +iter : 20 Arret : 0.000973739 s/iter 43.110544 +iter : 21 Arret : 0.00036675 s/iter 33.895194 +iter : 22 Arret : 0.000735728 s/iter 33.856600 +iter : 23 Arret : 0.000600918 s/iter 33.874131 +iter : 24 Arret : 0.00149682 s/iter 33.873086 +iter : 25 Arret : 0.000266766 s/iter 33.874950 +iter : 26 Arret : 1.51897E-05 s/iter 33.908056 +iter : 27 Arret : 1.44525E-05 s/iter 33.906010 +iter : 28 Arret : 1.31808E-05 s/iter 33.929499 +iter : 29 Arret : 6.49441E-07 s/iter 33.876616 +iter : 30 Arret : 3.93534E-11 s/iter 33.895171 +iter : 31 Arret : 1.57009E-16 s/iter 33.905376 +temps : 1066.62 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| -0.942555 +i* -0.334052| 1| 2.1929E-13 +i*-2.49686E-13| +| 3| -0.558601 +i* 0.829437| 1|-3.51628E-14 +i*-4.09232E-13| +| 4| -0.0665975 +i* -0.99778| 1|-3.91888E-13 +i* 9.06636E-14| +| 5| 0.949627 +i* -0.313383| 1|-1.12544E-12 +i* 2.13597E-12| +| 6| -0.982853 +i* -0.184391| 1| 8.57613E-14 +i* 1.33506E-13| +| 7| 0.889798 +i* -0.456354| 1| 1.27488E-12 +i* 5.17779E-13| +| 8| -0.423729 +i* 0.905789| 1|-7.25461E-15 +i*-1.33088E-14| +| 9| -0.219973 +i* -0.975506| 1| 4.34097E-13 +i*-4.24712E-14| +| 10| 0.771464 +i* 0.636273| 1| -4.4266E-13 +i*-2.07773E-13| +| 11| -0.999541 +i* -0.0303078| 1| 3.54265E-14 +i* 1.32862E-14| +| 12| 0.808597 +i* -0.588363| 1|-5.90212E-13 +i*-1.43182E-12| +| 13| 0.663883 +i* 0.747836| 1| 4.13159E-13 +i* 1.10149E-12| +| 14| -0.27868 +i* 0.960384| 1|-1.03539E-13 +i*-1.45998E-13| +| 15| -0.368064 +i* -0.929801| 1| 4.60916E-14 +i*-1.09841E-13| +| 16| -0.992219 +i* 0.124503| 1| 2.74294E-13 +i* 2.11383E-13| +| 17| 0.707973 +i* -0.706239| 1|-1.10575E-12 +i*-7.41631E-13| +| 18| 0.860514 +i* 0.509426| 1| 9.86579E-13 +i* 1.10532E-12| +| 19| -0.126936 +i* 0.991911| 1| 1.67744E-13 +i* 5.51772E-13| +| 20| -0.507314 +i* -0.861761| 1| 5.50185E-14 +i* 3.42273E-13| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 +proc 2 +proc 3 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 2, start 500096 size 250048 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 1, start 250048 size 250048 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 3, start 750144 size 250048 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 0, start 0 size 250048 +proc 3 start 750144 size 250048 +proc 2 start 500096 size 250048 +proc 1 start 250048 size 250048 +proc 0 start 0 size 250048 +iter : 1 Arret : 2.94061E-06 s/iter 52.698297 +iter : 2 Arret : 2.46698E-06 s/iter 52.503169 +iter : 3 Arret : 2.38127E-06 s/iter 52.386678 +iter : 4 Arret : 2.45221E-06 s/iter 52.386869 +iter : 5 Arret : 2.37409E-06 s/iter 52.369643 +iter : 6 Arret : 2.34372E-06 s/iter 52.374742 +iter : 7 Arret : 2.42042E-06 s/iter 52.378495 +iter : 8 Arret : 2.56887E-06 s/iter 52.390410 +iter : 9 Arret : 2.94319E-06 s/iter 52.379257 +iter : 10 Arret : 4.31763E-06 s/iter 52.380104 +iter : 11 Arret : 7.0141E-05 s/iter 52.403495 +iter : 12 Arret : 8.5522E-05 s/iter 52.383667 +iter : 13 Arret : 0.000141081 s/iter 52.398851 +iter : 14 Arret : 0.000759031 s/iter 52.396152 +iter : 15 Arret : 1.40075 s/iter 52.404926 +iter : 16 Arret : 0.156713 s/iter 54.411397 +iter : 17 Arret : 0.0802383 s/iter 61.981037 +iter : 18 Arret : 0.0488319 s/iter 63.074060 +iter : 19 Arret : 0.0700232 s/iter 65.986060 +iter : 20 Arret : 0.03747 s/iter 66.688981 +iter : 21 Arret : 0.732169 s/iter 66.379021 +iter : 22 Arret : 0.410928 s/iter 66.653050 +iter : 23 Arret : 0.788357 s/iter 59.935701 +iter : 24 Arret : 0.511921 s/iter 57.188880 +iter : 25 Arret : 1.0748 s/iter 66.455577 +iter : 26 Arret : 0.368191 s/iter 59.881724 +iter : 27 Arret : 0.248818 s/iter 52.766966 +iter : 28 Arret : 0.0947681 s/iter 53.773916 +iter : 29 Arret : 0.0146321 s/iter 52.795623 +iter : 30 Arret : 0.00257161 s/iter 53.551575 +iter : 31 Arret : 0.00302759 s/iter 52.794541 +iter : 32 Arret : 0.00133269 s/iter 52.882850 +iter : 33 Arret : 0.000334162 s/iter 52.761972 +iter : 34 Arret : 9.99262E-05 s/iter 52.689483 +iter : 35 Arret : 8.89289E-05 s/iter 52.759587 +iter : 36 Arret : 0.000225158 s/iter 52.695735 +iter : 37 Arret : 0.000221213 s/iter 52.610617 +iter : 38 Arret : 9.32626E-05 s/iter 52.752684 +iter : 39 Arret : 4.11315E-05 s/iter 52.828352 +iter : 40 Arret : 2.26747E-05 s/iter 52.792785 +iter : 41 Arret : 1.46142E-05 s/iter 52.752167 +iter : 42 Arret : 9.1881E-06 s/iter 52.801503 +iter : 43 Arret : 2.40363E-06 s/iter 52.785495 +iter : 44 Arret : 6.67512E-08 s/iter 52.788539 +iter : 45 Arret : 1.20655E-12 s/iter 52.741635 +iter : 46 Arret : 1.57009E-16 s/iter 52.604045 +temps : 2532.79 seconde(s) +Nb iterations : 46 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.80136E-07 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54034 +i* 0.841447| 1| 4.08253E-13 +i*-6.65317E-13| +| 2| -0.513915 +i* -0.857841| 1|-9.07486E-13 +i* 1.86417E-13| +| 3| 0.486982 +i* 0.873412| 1|-6.63601E-14 +i*-1.18344E-12| +| 4| -0.459584 +i* -0.888135| 1| 1.26007E-13 +i* 2.45656E-13| +| 5| 0.43174 +i* 0.901998| 1|-6.77361E-13 +i* 7.93272E-13| +| 6| -0.40348 +i* -0.914989| 1|-3.45956E-13 +i*-2.59726E-13| +| 7| 0.374828 +i* 0.927094| 1| 3.65041E-13 +i* 3.54812E-13| +| 8| -0.345815 +i* -0.938303| 1| 5.50778E-13 +i* 8.9059E-14| +| 9| 0.316466 +i* 0.948604| 1|-2.87419E-13 +i* 5.21678E-13| +| 10| -0.286812 +i* -0.957987| 1| 6.43516E-13 +i* 2.73696E-13| +| 11| 0.25688 +i* 0.966443| 1|-4.31814E-13 +i* 5.6624E-13| +| 12| -0.226699 +i* -0.973965| 1| 4.35089E-13 +i* -6.6197E-14| +| 13| 0.196299 +i* 0.980544| 1| 3.90278E-14 +i*-7.14062E-13| +| 14| -0.16571 +i* -0.986175| 1| 2.49276E-13 +i*-1.75918E-13| +| 15| 0.13496 +i* 0.990851| 1| 1.03566E-13 +i*-6.61428E-13| +| 16| -0.104079 +i* -0.994569| 1| 7.90108E-13 +i*-1.74942E-13| +| 17| 0.0730977 +i* 0.997325| 1| 1.11931E-13 +i* 4.68587E-13| +| 18| -0.0420456 +i* -0.999116| 1| 2.29268E-13 +i*-1.21795E-14| +| 19| 0.0109529 +i* 0.99994| 1|-2.47309E-13 +i*-7.90307E-13| +| 20| 0.0201504 +i* -0.999797| 1| 6.69503E-13 +i*-2.16847E-13| ++---+----------------------------+------------+----------------------------+ +1000000 racines de module = 1 +proc 0 +proc 1 +proc 2 +proc 3 +zone limite de 'log-exp' 1.0003 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 2, start 600064 size 300032 +zone limite de 'log-exp' 1.0003 +zone limite de 'log-exp' 1.0003 +zone limite de 'log-exp' 1.0003 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 1, start 300032 size 300032 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 3, start 900096 size 300032 +proc 1 start 300032 size 300032 +proc 2 start 600064 size 300032 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 0, start 0 size 300032 +proc 0 start 0 size 300032 +proc 3 start 900096 size 300032 +iter : 1 Arret : 2.41684E-06 s/iter 74.680415 +iter : 2 Arret : 2.34934E-06 s/iter 74.513298 +iter : 3 Arret : 2.24361E-06 s/iter 74.568412 +iter : 4 Arret : 2.30139E-06 s/iter 74.569489 +iter : 5 Arret : 2.19502E-06 s/iter 74.565946 +iter : 6 Arret : 2.16257E-06 s/iter 74.508327 +iter : 7 Arret : 2.21483E-06 s/iter 74.536184 +iter : 8 Arret : 2.16891E-06 s/iter 74.586815 +iter : 9 Arret : 2.23011E-06 s/iter 74.528038 +iter : 10 Arret : 2.69124E-06 s/iter 74.517197 +iter : 11 Arret : 4.92984E-05 s/iter 74.550859 +iter : 12 Arret : 0.000427572 s/iter 74.538977 +iter : 13 Arret : 0.00110562 s/iter 74.557139 +iter : 14 Arret : 0.00102196 s/iter 74.760683 +iter : 15 Arret : 0.00211358 s/iter 74.751961 +iter : 16 Arret : 0.00149598 s/iter 74.741455 +iter : 17 Arret : 0.00917911 s/iter 87.872447 +iter : 18 Arret : 1.253 s/iter 90.016573 +iter : 19 Arret : 0.0371056 s/iter 84.387165 +iter : 20 Arret : 0.0186204 s/iter 90.834430 +iter : 21 Arret : 0.0131853 s/iter 91.289375 +iter : 22 Arret : 0.0291424 s/iter 92.240706 +iter : 23 Arret : 0.0691475 s/iter 94.076629 +iter : 24 Arret : 0.124602 s/iter 92.439627 +iter : 25 Arret : 0.139498 s/iter 91.484030 +iter : 26 Arret : 0.177367 s/iter 90.934003 +iter : 27 Arret : 0.042046 s/iter 93.280120 +iter : 28 Arret : 0.0741543 s/iter 90.804921 +iter : 29 Arret : 0.0180153 s/iter 89.835217 +iter : 30 Arret : 0.00564118 s/iter 74.949138 +iter : 31 Arret : 0.00120143 s/iter 74.227934 +iter : 32 Arret : 0.00302603 s/iter 74.689866 +iter : 33 Arret : 8.92387E-06 s/iter 74.235900 +iter : 34 Arret : 6.14653E-06 s/iter 74.384440 +iter : 35 Arret : 3.82669E-06 s/iter 74.235345 +iter : 36 Arret : 2.31748E-06 s/iter 74.303943 +iter : 37 Arret : 3.45691E-07 s/iter 74.373067 +iter : 38 Arret : 2.5251E-10 s/iter 74.478555 +iter : 39 Arret : 2.22045E-16 s/iter 74.276414 +temps : 3118.23 seconde(s) +Nb iterations : 39 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.34152E-07 +Stabilite : 2.22045E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.841451| 1|-1.40868E-12 +i*-1.55069E-13| +| 2| -0.583871 +i* 0.811846| 1| 5.87586E-14 +i* 2.63177E-13| +| 3| 0.0263196 +i* -0.999654| 1| 9.89594E-13 +i*-3.85265E-13| +| 4| -0.969647 +i* -0.244511| 1|-5.84047E-14 +i*-6.69829E-14| +| 5| 0.939323 +i* -0.343035| 1| 7.60725E-13 +i* 1.68227E-12| +| 6| -0.129097 +i* -0.991632| 1| -2.278E-13 +i*-2.09967E-13| +| 7| -0.450842 +i* 0.892604| 1| 3.34819E-13 +i* 5.30987E-13| +| 8| 0.874726 +i* -0.484618| 1| 6.94573E-13 +i* 1.33379E-12| +| 9| -0.995841 +i* -0.0911079| 1| 6.65572E-13 +i* 2.21578E-13| +| 10| 0.772266 +i* 0.635299| 1|-1.10511E-12 +i*-6.88458E-13| +| 11| -0.281387 +i* -0.959594| 1|-6.93022E-14 +i* 4.40275E-13| +| 12| -0.306893 +i* 0.951744| 1| 1.0443E-15 +i* 1.24753E-13| +| 13| 0.788944 +i* -0.614465| 1| -2.2269E-12 +i*-9.13604E-13| +| 14| -0.997918 +i* 0.0645018| 1| 2.81913E-13 +i* 2.2426E-13| +| 15| 0.861482 +i* 0.507788| 1| 2.41178E-12 +i* 5.79845E-13| +| 16| -0.426862 +i* -0.904317| 1| 6.20323E-13 +i* 5.74424E-13| +| 17| 0.664347 +i* 0.747424| 1| 4.99219E-13 +i* 1.52752E-12| +| 18| -0.155512 +i* 0.987834| 1| 2.30305E-13 +i* 4.37822E-13| +| 19| -0.975826 +i* 0.218549| 1| 1.82913E-13 +i* 5.28258E-14| +| 20| 0.684055 +i* -0.72943| 1|-1.32506E-12 +i*-1.70394E-12| ++---+----------------------------+------------+----------------------------+ +1200000 racines de module = 1 +proc 1 +proc 2 +proc 3 +proc 0 +zone limite de 'log-exp' 1.00025 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 0, start 0 size 350016 +zone limite de 'log-exp' 1.00025 +zone limite de 'log-exp' 1.00025 +zone limite de 'log-exp' 1.00025 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 2, start 700032 size 350016 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 1, start 350016 size 350016 +proc 1 start 350016 size 350016 +proc 2 start 700032 size 350016 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 3, start 1050048 size 350016 +proc 3 start 1050048 size 350016 +proc 0 start 0 size 350016 +iter : 1 Arret : 1.92064E-06 s/iter 101.461628 +iter : 2 Arret : 1.78121E-06 s/iter 101.017849 +iter : 3 Arret : 1.78964E-06 s/iter 100.947596 +iter : 4 Arret : 1.80649E-06 s/iter 100.948699 +iter : 5 Arret : 1.71769E-06 s/iter 101.184394 +iter : 6 Arret : 1.89005E-06 s/iter 100.925437 +iter : 7 Arret : 1.82286E-06 s/iter 100.967525 +iter : 8 Arret : 2.15308E-06 s/iter 101.001567 +iter : 9 Arret : 2.01412E-06 s/iter 101.354707 +iter : 10 Arret : 2.22413E-06 s/iter 101.335558 +iter : 11 Arret : 7.15679E-06 s/iter 101.339374 +iter : 12 Arret : 0.000420126 s/iter 100.981074 +iter : 13 Arret : 0.000823069 s/iter 107.792026 +iter : 14 Arret : 0.000795469 s/iter 102.230789 +iter : 15 Arret : 0.0022651 s/iter 116.821157 +iter : 16 Arret : 0.00190062 s/iter 101.354024 +iter : 17 Arret : 0.00221737 s/iter 112.635492 +iter : 18 Arret : 0.00588407 s/iter 119.719044 +iter : 19 Arret : 0.0113476 s/iter 119.316722 +iter : 20 Arret : 0.0559943 s/iter 119.966814 +iter : 21 Arret : 0.650611 s/iter 119.535510 +iter : 22 Arret : 0.0308283 s/iter 119.594304 +iter : 23 Arret : 0.00600492 s/iter 102.153319 +iter : 24 Arret : 0.00490094 s/iter 119.690249 +iter : 25 Arret : 0.0066092 s/iter 101.435132 +iter : 26 Arret : 0.00847932 s/iter 100.564152 +iter : 27 Arret : 0.000210646 s/iter 100.779524 +iter : 28 Arret : 5.44574E-06 s/iter 100.820292 +iter : 29 Arret : 5.18108E-07 s/iter 100.812661 +iter : 30 Arret : 3.48173E-10 s/iter 100.617382 +iter : 31 Arret : 1.57009E-16 s/iter 100.975151 +temps : 3281.76 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.63785E-07 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540329 +i* 0.841454| 1| 4.3987E-13 +i* 1.7418E-12| +| 2| -0.0530086 +i* 0.998594| 1| 3.8728E-13 +i* 8.41422E-13| +| 3| -0.626376 +i* 0.779521| 1| 2.93654E-14 +i*-2.95439E-13| +| 4| -0.96376 +i* 0.26677| 1|-1.31943E-13 +i* 5.03167E-13| +| 5| -0.938055 +i* -0.346485| 1| 6.12451E-13 +i*-2.34033E-13| +| 6| -0.558945 +i* -0.829205| 1| 2.12923E-13 +i* 6.04209E-13| +| 7| 0.0307435 +i* -0.999527| 1|-3.70079E-13 +i* 1.04685E-13| +| 8| 0.60885 +i* -0.793286| 1| -1.5142E-12 +i* 2.45191E-13| +| 9| 0.957578 +i* -0.288175| 1|-3.17266E-12 +i* 2.02057E-12| +| 10| 0.945542 +i* 0.325501| 1|-1.50276E-12 +i* 3.84538E-13| +| 11| -0.00847209 +i* 0.999964| 1| 8.68958E-14 +i* 2.94643E-13| +| 12| -0.591029 +i* 0.80665| 1|-5.75824E-14 +i*-8.87086E-13| +| 13| -0.95092 +i* 0.309437| 1|-6.93591E-13 +i*-5.52411E-13| +| 14| -0.952559 +i* -0.304354| 1|-3.04982E-13 +i* 1.60452E-13| +| 15| -0.595328 +i* -0.803482| 1|-1.05039E-12 +i* 2.37501E-13| +| 16| -0.0138125 +i* -0.999905| 1|-8.72476E-13 +i* 2.69644E-13| +| 17| 0.572907 +i* -0.81962| 1| 1.32405E-12 +i*-6.73803E-13| +| 18| 0.94379 +i* -0.330546| 1|-1.85401E-12 +i* 2.58533E-12| +| 19| 0.959103 +i* 0.283057| 1|-2.75633E-12 +i* 3.49955E-12| +| 20| 0.613081 +i* 0.79002| 1| 4.49453E-13 +i*-4.47541E-14| ++---+----------------------------+------------+----------------------------+ +1400000 racines de module = 1 diff --git a/Simulations/full_openmp/full_openmp_1GPU.o140165 b/Simulations/full_openmp/full_openmp_1GPU.o140165 new file mode 100644 index 0000000..84aa3b6 --- /dev/null +++ b/Simulations/full_openmp/full_openmp_1GPU.o140165 @@ -0,0 +1,511 @@ +REMAINING: 1 +Taking GPU #3 +zone limite de 'log-exp' 1.00593 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 0 dimgrid2 235 start 0 size 60160 +gpu 0 iter : 1 Arret : 5.01505E-05 s/iter 0.752555 +gpu 0 iter : 2 Arret : 4.32789E-05 s/iter 0.752365 +gpu 0 iter : 3 Arret : 4.45615E-05 s/iter 0.752417 +gpu 0 iter : 4 Arret : 4.42697E-05 s/iter 0.752431 +gpu 0 iter : 5 Arret : 4.06411E-05 s/iter 0.752415 +gpu 0 iter : 6 Arret : 4.41499E-05 s/iter 0.752420 +gpu 0 iter : 7 Arret : 5.50757E-05 s/iter 0.752345 +gpu 0 iter : 8 Arret : 0.000694531 s/iter 0.752443 +gpu 0 iter : 9 Arret : 0.00117193 s/iter 0.752305 +gpu 0 iter : 10 Arret : 0.0225506 s/iter 0.752371 +gpu 0 iter : 11 Arret : 1.92499 s/iter 1.259044 +gpu 0 iter : 12 Arret : 0.0745471 s/iter 0.752271 +gpu 0 iter : 13 Arret : 0.0973834 s/iter 0.752268 +gpu 0 iter : 14 Arret : 0.106004 s/iter 1.275597 +gpu 0 iter : 15 Arret : 0.0165737 s/iter 1.272023 +gpu 0 iter : 16 Arret : 0.00779384 s/iter 1.273056 +gpu 0 iter : 17 Arret : 0.00519845 s/iter 1.250155 +gpu 0 iter : 18 Arret : 0.00892143 s/iter 0.736177 +gpu 0 iter : 19 Arret : 0.00448482 s/iter 0.708562 +gpu 0 iter : 20 Arret : 0.020935 s/iter 0.700305 +gpu 0 iter : 21 Arret : 0.0174876 s/iter 0.906835 +gpu 0 iter : 22 Arret : 0.00111891 s/iter 0.676895 +gpu 0 iter : 23 Arret : 0.000389286 s/iter 0.656019 +gpu 0 iter : 24 Arret : 0.00124195 s/iter 0.661695 +gpu 0 iter : 25 Arret : 0.00324262 s/iter 0.649796 +gpu 0 iter : 26 Arret : 6.61927E-05 s/iter 0.524316 +gpu 0 iter : 27 Arret : 2.71425E-05 s/iter 0.519333 +gpu 0 iter : 28 Arret : 9.63588E-07 s/iter 0.525346 +gpu 0 iter : 29 Arret : 1.01411E-10 s/iter 0.521530 +gpu 0 iter : 30 Arret : 3.15975E-15 s/iter 0.517480 +temps : 24.3248 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.35784E-10 +Stabilite : 3.15975E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540783 +i* 0.841162| 1|-7.58456E-14 +i* 3.78031E-14| +| 2| -0.992343 +i* -0.123513| 1|-4.36456E-15 +i* 3.59435E-15| +| 3| 0.0563346 +i* 0.998412| 1| 5.70377E-15 +i* 3.3501E-14| +| 4| -0.80273 +i* -0.596342| 1|-1.96995E-14 +i* -2.6033E-14| +| 5| 0.730552 +i* -0.682857| 1|-7.48429E-14 +i* 6.77011E-14| +| 6| -0.442728 +i* 0.896656| 1|-3.77198E-14 +i*-1.89779E-15| +| 7| -0.404888 +i* -0.914366| 1| 3.20195E-14 +i* 9.65894E-15| +| 8| 0.972126 +i* -0.23446| 1| 4.02421E-14 +i*-1.54755E-14| +| 9| -0.826939 +i* 0.562292| 1| -2.4928E-14 +i*-1.59889E-14| +| 10| 0.0979895 +i* -0.995187| 1| 2.27804E-14 +i*-1.97481E-14| +| 11| 0.961513 +i* 0.27476| 1|-9.39769E-14 +i*-2.63912E-13| +| 12| -0.996627 +i* 0.0820589| 1| 2.39773E-14 +i* 1.74825E-14| +| 13| 0.575447 +i* -0.817839| 1|-3.49894E-14 +i*-7.98545E-14| +| 14| 0.701466 +i* 0.712703| 1| 7.52211E-14 +i* 1.53991E-14| +| 15| 0.259346 +i* 0.965785| 1|-2.14863E-14 +i*-2.81355E-14| +| 16| -0.907773 +i* -0.419461| 1|-3.62869E-14 +i*-9.49414E-15| +| 17| 0.903623 +i* -0.428329| 1|-1.24969E-14 +i* 7.51222E-14| +| 18| -0.249979 +i* 0.968251| 1|-1.59074E-14 +i*-1.09721E-14| +| 19| -0.583256 +i* -0.812288| 1|-6.17215E-15 +i* 4.85358E-14| +| 20| 0.997383 +i* 0.072297| 1| 2.53037E-13 +i*-5.92819E-13| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 1 +zone limite de 'log-exp' 1.00237 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 0 dimgrid2 586 start 0 size 150016 +gpu 0 iter : 1 Arret : 1.63964E-05 s/iter 4.677497 +gpu 0 iter : 2 Arret : 1.6127E-05 s/iter 4.675437 +gpu 0 iter : 3 Arret : 1.62587E-05 s/iter 4.673977 +gpu 0 iter : 4 Arret : 1.57168E-05 s/iter 4.675710 +gpu 0 iter : 5 Arret : 1.60975E-05 s/iter 4.675592 +gpu 0 iter : 6 Arret : 1.68058E-05 s/iter 4.675951 +gpu 0 iter : 7 Arret : 1.83433E-05 s/iter 4.674129 +gpu 0 iter : 8 Arret : 2.23201E-05 s/iter 4.676196 +gpu 0 iter : 9 Arret : 0.000120962 s/iter 4.674233 +gpu 0 iter : 10 Arret : 0.0050599 s/iter 4.675473 +gpu 0 iter : 11 Arret : 0.00201552 s/iter 4.674922 +gpu 0 iter : 12 Arret : 0.00812397 s/iter 4.675066 +gpu 0 iter : 13 Arret : 1.49892 s/iter 6.735627 +gpu 0 iter : 14 Arret : 0.0726739 s/iter 4.672589 +gpu 0 iter : 15 Arret : 0.0439834 s/iter 6.675641 +gpu 0 iter : 16 Arret : 0.0237516 s/iter 4.667633 +gpu 0 iter : 17 Arret : 0.0164273 s/iter 6.591866 +gpu 0 iter : 18 Arret : 0.0544284 s/iter 6.683422 +gpu 0 iter : 19 Arret : 0.0693187 s/iter 5.846457 +gpu 0 iter : 20 Arret : 0.0244663 s/iter 6.575941 +gpu 0 iter : 21 Arret : 0.0170064 s/iter 5.851392 +gpu 0 iter : 22 Arret : 0.0132914 s/iter 4.512540 +gpu 0 iter : 23 Arret : 0.000340596 s/iter 4.492501 +gpu 0 iter : 24 Arret : 0.000818373 s/iter 4.462503 +gpu 0 iter : 25 Arret : 0.000816806 s/iter 4.471482 +gpu 0 iter : 26 Arret : 2.75366E-05 s/iter 4.467418 +gpu 0 iter : 27 Arret : 1.11905E-05 s/iter 4.471479 +gpu 0 iter : 28 Arret : 1.25333E-07 s/iter 4.486611 +gpu 0 iter : 29 Arret : 1.10046E-12 s/iter 4.460078 +gpu 0 iter : 30 Arret : 1.11022E-16 s/iter 4.443078 +temps : 151.38 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.26535E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540528 +i* 0.841326| 1| 8.68923E-14 +i* 2.2979E-13| +| 2| -0.905603 +i* -0.424127| 1| 6.50001E-14 +i* -3.0061E-14| +| 3| -0.774122 +i* 0.633037| 1|-3.89619E-14 +i*-6.71876E-14| +| 4| 0.317935 +i* -0.948113| 1| 4.656E-15 +i* 1.15645E-13| +| 5| 0.235897 +i* 0.971778| 1|-3.15963E-14 +i*-8.88994E-14| +| 6| -0.717299 +i* -0.696766| 1| 5.63785E-15 +i*-6.71685E-14| +| 7| 0.992349 +i* -0.123462| 1|-4.81056E-13 +i* 9.00335E-13| +| 8| -0.938482 +i* 0.345329| 1|-6.95555E-14 +i*-3.79159E-14| +| 9| 0.610294 +i* -0.792175| 1| -5.4852E-14 +i*-3.26232E-14| +| 10| -0.0945977 +i* 0.995516| 1| 4.45165E-14 +i* 9.42527E-14| +| 11| -0.450242 +i* -0.892906| 1| 2.41855E-14 +i*-3.23699E-15| +| 12| 0.978218 +i* 0.207583| 1|-2.84429E-13 +i* 4.69725E-13| +| 13| -0.999806 +i* 0.0197069| 1|-4.72365E-14 +i*-2.55716E-14| +| 14| 0.835648 +i* -0.549265| 1|-2.95892E-13 +i* 2.34143E-13| +| 15| -0.414707 +i* 0.909955| 1| 7.26225E-14 +i*-1.70003E-15| +| 16| -0.133754 +i* -0.991015| 1|-2.88485E-14 +i* 2.14499E-14| +| 17| 0.856687 +i* 0.515837| 1| 1.49106E-13 +i* 3.95153E-14| +| 18| -0.951361 +i* -0.308079| 1| 3.78308E-14 +i* 4.65843E-14| +| 19| 0.969257 +i* -0.24605| 1| 5.51163E-13 +i*-4.79498E-13| +| 20| -0.689285 +i* 0.724491| 1| 2.40086E-15 +i*-3.61777E-14| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1 +zone limite de 'log-exp' 1.00142 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 0 dimgrid2 977 start 0 size 250112 +gpu 0 iter : 1 Arret : 1.15543E-05 s/iter 13.064328 +gpu 0 iter : 2 Arret : 1.05743E-05 s/iter 13.099577 +gpu 0 iter : 3 Arret : 1.00182E-05 s/iter 13.092478 +gpu 0 iter : 4 Arret : 9.77217E-06 s/iter 13.098796 +gpu 0 iter : 5 Arret : 1.10944E-05 s/iter 13.096321 +gpu 0 iter : 6 Arret : 1.15644E-05 s/iter 13.098761 +gpu 0 iter : 7 Arret : 9.85482E-06 s/iter 13.095612 +gpu 0 iter : 8 Arret : 1.06459E-05 s/iter 13.079031 +gpu 0 iter : 9 Arret : 2.17082E-05 s/iter 13.095096 +gpu 0 iter : 10 Arret : 0.00106372 s/iter 13.097410 +gpu 0 iter : 11 Arret : 0.00274403 s/iter 13.098142 +gpu 0 iter : 12 Arret : 0.00233621 s/iter 15.172668 +gpu 0 iter : 13 Arret : 0.00104775 s/iter 13.090864 +gpu 0 iter : 14 Arret : 0.00142817 s/iter 13.093375 +gpu 0 iter : 15 Arret : 0.00192709 s/iter 13.017860 +gpu 0 iter : 16 Arret : 0.0176279 s/iter 11.468330 +gpu 0 iter : 17 Arret : 0.0577522 s/iter 7.983525 +gpu 0 iter : 18 Arret : 0.0271883 s/iter 9.498511 +gpu 0 iter : 19 Arret : 0.32067 s/iter 9.329063 +gpu 0 iter : 20 Arret : 0.0289407 s/iter 9.296524 +gpu 0 iter : 21 Arret : 0.00140766 s/iter 7.142933 +gpu 0 iter : 22 Arret : 0.000475428 s/iter 7.123373 +gpu 0 iter : 23 Arret : 0.000240166 s/iter 7.094510 +gpu 0 iter : 24 Arret : 1.51927E-05 s/iter 7.077023 +gpu 0 iter : 25 Arret : 1.77863E-06 s/iter 7.010421 +gpu 0 iter : 26 Arret : 8.08854E-10 s/iter 7.130576 +gpu 0 iter : 27 Arret : 1.00074E-15 s/iter 7.048493 +temps : 296.321 seconde(s) +Nb iterations : 27 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.05316E-09 +Stabilite : 1.00074E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540427 +i* 0.841391| 1| 9.7148E-14 +i*-1.98189E-13| +| 2| -0.997949 +i* 0.0640067| 1| 1.02696E-14 +i* 2.88415E-14| +| 3| 0.450991 +i* -0.892528| 1| 2.39739E-15 +i* 7.66835E-14| +| 4| 0.42851 +i* -0.903537| 1| 1.03733E-13 +i* 1.27433E-14| +| 5| -0.996035 +i* 0.0889649| 1| 5.1386E-14 +i* 4.21729E-14| +| 6| 0.581876 +i* 0.813277| 1| 3.29906E-13 +i* -3.5718E-15| +| 7| 0.405761 +i* -0.913979| 1| 1.69923E-13 +i*-8.86062E-14| +| 8| -0.993496 +i* 0.113867| 1| 6.34562E-14 +i* 6.04291E-14| +| 9| 0.60205 +i* 0.798458| 1| 2.39371E-13 +i* -2.2848E-13| +| 10| 0.382757 +i* -0.923849| 1| 6.36852E-14 +i* 1.1601E-13| +| 11| -0.990335 +i* 0.138698| 1| 8.32286E-14 +i* 4.57395E-14| +| 12| 0.621846 +i* 0.783139| 1| 3.5482E-14 +i*-1.57841E-13| +| 13| 0.359514 +i* -0.93314| 1| 1.00985E-13 +i*-2.52237E-13| +| 14| -0.986553 +i* 0.163442| 1| 3.24636E-14 +i* 4.58574E-14| +| 15| 0.641253 +i* 0.767329| 1| 1.79533E-13 +i* 3.03096E-13| +| 16| 0.336045 +i* -0.941846| 1| 1.38948E-13 +i*-8.14071E-14| +| 17| -0.982153 +i* 0.188084| 1| 6.94549E-14 +i* 3.09405E-14| +| 18| 0.660258 +i* 0.751039| 1| 4.21871E-13 +i* 5.02185E-14| +| 19| 0.312366 +i* -0.949962| 1|-6.37199E-14 +i*-7.39669E-14| +| 20| -0.977138 +i* 0.212608| 1|-3.80633E-14 +i* -8.4285E-14| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 1 +zone limite de 'log-exp' 1.00101 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 0 dimgrid2 1368 start 0 size 350208 +gpu 0 iter : 1 Arret : 8.60936E-06 s/iter 25.332348 +gpu 0 iter : 2 Arret : 7.40646E-06 s/iter 25.331263 +gpu 0 iter : 3 Arret : 7.97813E-06 s/iter 25.297466 +gpu 0 iter : 4 Arret : 7.23099E-06 s/iter 25.306792 +gpu 0 iter : 5 Arret : 6.85143E-06 s/iter 25.280568 +gpu 0 iter : 6 Arret : 6.79155E-06 s/iter 25.305357 +gpu 0 iter : 7 Arret : 7.08999E-06 s/iter 25.314962 +gpu 0 iter : 8 Arret : 7.80158E-06 s/iter 25.279543 +gpu 0 iter : 9 Arret : 2.6561E-05 s/iter 25.267836 +gpu 0 iter : 10 Arret : 0.00102009 s/iter 25.308796 +gpu 0 iter : 11 Arret : 0.00106765 s/iter 25.285841 +gpu 0 iter : 12 Arret : 0.00106457 s/iter 25.305366 +gpu 0 iter : 13 Arret : 0.857755 s/iter 25.292478 +gpu 0 iter : 14 Arret : 3.15407 s/iter 25.495050 +gpu 0 iter : 15 Arret : 0.0928667 s/iter 25.354315 +gpu 0 iter : 16 Arret : 0.0413768 s/iter 25.910028 +gpu 0 iter : 17 Arret : 0.0497463 s/iter 25.748876 +gpu 0 iter : 18 Arret : 0.0497904 s/iter 25.748583 +gpu 0 iter : 19 Arret : 0.0354662 s/iter 25.596173 +gpu 0 iter : 20 Arret : 0.0431719 s/iter 25.648011 +gpu 0 iter : 21 Arret : 0.0230133 s/iter 25.155342 +gpu 0 iter : 22 Arret : 0.00525789 s/iter 25.160092 +gpu 0 iter : 23 Arret : 0.00203657 s/iter 24.929404 +gpu 0 iter : 24 Arret : 0.000600149 s/iter 24.929483 +gpu 0 iter : 25 Arret : 0.00016638 s/iter 24.931502 +gpu 0 iter : 26 Arret : 0.000154787 s/iter 24.957389 +gpu 0 iter : 27 Arret : 0.000302699 s/iter 24.917011 +gpu 0 iter : 28 Arret : 2.13113E-05 s/iter 24.916750 +gpu 0 iter : 29 Arret : 1.51643E-05 s/iter 24.917954 +gpu 0 iter : 30 Arret : 3.76262E-06 s/iter 24.943057 +gpu 0 iter : 31 Arret : 1.29245E-07 s/iter 24.913031 +gpu 0 iter : 32 Arret : 6.35329E-12 s/iter 24.917417 +gpu 0 iter : 33 Arret : 1.24127E-16 s/iter 24.950893 +temps : 833.807 seconde(s) +Nb iterations : 33 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.46096E-08 +Stabilite : 1.24127E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540399 +i* 0.841409| 1| 5.12961E-13 +i*-3.37404E-15| +| 2| -0.385479 +i* 0.922716| 1| -1.616E-13 +i*-2.73566E-14| +| 3| -0.770131 +i* 0.637886| 1|-1.38431E-15 +i* 1.70921E-13| +| 4| -0.978357 +i* 0.206925| 1|-3.07393E-15 +i* 4.96131E-15| +| 5| -0.962455 +i* -0.27144| 1|-5.85088E-14 +i* 7.9714E-14| +| 6| -0.72607 +i* -0.687621| 1| -2.0612E-14 +i* 2.87948E-13| +| 7| -0.323352 +i* -0.946279| 1| 2.27159E-13 +i* 7.30891E-14| +| 8| 0.153459 +i* -0.988155| 1| 4.60049E-15 +i*-2.43555E-14| +| 9| 0.595097 +i* -0.803654| 1|-3.46265E-13 +i* 1.60098E-14| +| 10| 0.900408 +i* -0.435047| 1| 3.20081E-13 +i*-1.77827E-14| +| 11| 0.999448 +i* 0.0332229| 1|-5.70342E-13 +i* 1.21308E-12| +| 12| 0.869529 +i* 0.493882| 1| 3.01252E-14 +i* 6.11216E-13| +| 13| 0.211292 +i* 0.977423| 1|-6.97532E-14 +i* 1.23212E-13| +| 14| -0.267139 +i* 0.963658| 1|-9.26238E-14 +i*-7.20968E-14| +| 15| -0.684372 +i* 0.729133| 1| 1.64042E-13 +i*-1.89831E-14| +| 16| -0.944825 +i* 0.327574| 1| 3.70572E-14 +i*-6.84904E-14| +| 17| -0.988833 +i* -0.149027| 1|-1.41002E-13 +i* 2.02581E-14| +| 18| -0.806314 +i* -0.591488| 1| 1.24668E-13 +i*-2.62805E-13| +| 19| -0.439079 +i* -0.898448| 1|-1.76949E-13 +i*-1.05707E-13| +| 20| 0.0287415 +i* -0.999587| 1| 1.62724E-13 +i*-6.82891E-14| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 1 +zone limite de 'log-exp' 1.00071 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 0 dimgrid2 1954 start 0 size 500224 +gpu 0 iter : 1 Arret : 6.12242E-06 s/iter 51.505107 +gpu 0 iter : 2 Arret : 6.31918E-06 s/iter 51.453063 +gpu 0 iter : 3 Arret : 5.33763E-06 s/iter 51.408046 +gpu 0 iter : 4 Arret : 5.41422E-06 s/iter 51.400436 +gpu 0 iter : 5 Arret : 5.39348E-06 s/iter 51.382269 +gpu 0 iter : 6 Arret : 5.60111E-06 s/iter 51.438183 +gpu 0 iter : 7 Arret : 5.01475E-06 s/iter 51.488070 +gpu 0 iter : 8 Arret : 5.29744E-06 s/iter 51.358997 +gpu 0 iter : 9 Arret : 6.66838E-06 s/iter 51.085502 +gpu 0 iter : 10 Arret : 6.73287E-05 s/iter 51.335479 +gpu 0 iter : 11 Arret : 0.00990101 s/iter 51.464874 +gpu 0 iter : 12 Arret : 0.00823435 s/iter 51.403521 +gpu 0 iter : 13 Arret : 0.0131909 s/iter 51.825163 +gpu 0 iter : 14 Arret : 0.00701993 s/iter 52.176993 +gpu 0 iter : 15 Arret : 0.0153428 s/iter 47.885546 +gpu 0 iter : 16 Arret : 1.40554 s/iter 37.523257 +gpu 0 iter : 17 Arret : 0.017993 s/iter 33.363730 +gpu 0 iter : 18 Arret : 0.0130545 s/iter 31.485423 +gpu 0 iter : 19 Arret : 0.00840726 s/iter 29.781113 +gpu 0 iter : 20 Arret : 0.0195837 s/iter 30.113452 +gpu 0 iter : 21 Arret : 0.0204301 s/iter 30.982105 +gpu 0 iter : 22 Arret : 0.0051956 s/iter 26.750718 +gpu 0 iter : 23 Arret : 0.000187857 s/iter 25.344565 +gpu 0 iter : 24 Arret : 9.72305E-05 s/iter 24.719137 +gpu 0 iter : 25 Arret : 3.47336E-05 s/iter 23.203467 +gpu 0 iter : 26 Arret : 1.4149E-05 s/iter 22.255267 +gpu 0 iter : 27 Arret : 9.26981E-06 s/iter 22.153239 +gpu 0 iter : 28 Arret : 2.81196E-06 s/iter 22.023657 +gpu 0 iter : 29 Arret : 1.36843E-07 s/iter 21.837417 +gpu 0 iter : 30 Arret : 1.32082E-11 s/iter 21.847546 +gpu 0 iter : 31 Arret : 1.11022E-16 s/iter 21.866344 +temps : 1194.76 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.48768E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540372 +i* 0.841426| 1|-3.05235E-13 +i* 1.38721E-13| +| 2| 0.561316 +i* 0.827602| 1|-2.60021E-13 +i* 1.9206E-13| +| 3| 0.57165 +i* 0.820497| 1|-1.83308E-13 +i* 6.15844E-14| +| 4| 0.581895 +i* 0.813264| 1| 3.05839E-13 +i* 6.52482E-14| +| 5| 0.592048 +i* 0.805902| 1|-7.14016E-13 +i*-3.98882E-14| +| 6| 0.602109 +i* 0.798414| 1| 2.66658E-13 +i*-4.75979E-13| +| 7| 0.612074 +i* 0.7908| 1| 3.16743E-13 +i*-3.40844E-13| +| 8| 0.621943 +i* 0.783062| 1| 5.64146E-13 +i*-3.14632E-13| +| 9| 0.631715 +i* 0.775201| 1|-3.83756E-14 +i* 5.41086E-13| +| 10| 0.641387 +i* 0.767218| 1| 4.00499E-13 +i*-3.71465E-13| +| 11| 0.650958 +i* 0.759114| 1| 7.58768E-15 +i*-5.54055E-13| +| 12| 0.660427 +i* 0.750891| 1| 7.47999E-13 +i* 2.73089E-13| +| 13| 0.669792 +i* 0.742549| 1| 9.40577E-13 +i* 3.39433E-14| +| 14| 0.679051 +i* 0.734091| 1| 4.34264E-13 +i*-1.04887E-13| +| 15| 0.688204 +i* 0.725517| 1|-6.26926E-13 +i*-1.86798E-13| +| 16| 0.697248 +i* 0.71683| 1| 2.2389E-13 +i*-9.46795E-14| +| 17| 0.706183 +i* 0.708029| 1| 4.79186E-13 +i* 4.75144E-13| +| 18| 0.715007 +i* 0.699117| 1| 6.39138E-13 +i* 4.95824E-13| +| 19| 0.723718 +i* 0.690096| 1| -1.2694E-13 +i* 4.44528E-13| +| 20| 0.732316 +i* 0.680965| 1|-2.76158E-13 +i* 1.17734E-13| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +zone limite de 'log-exp' 1.00059 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 2344 start 0 size 600064 +gpu 0 iter : 1 Arret : 5.11012E-06 s/iter 73.756595 +gpu 0 iter : 2 Arret : 5.49594E-06 s/iter 74.121359 +gpu 0 iter : 3 Arret : 4.95278E-06 s/iter 74.139359 +gpu 0 iter : 4 Arret : 4.31967E-06 s/iter 74.012268 +gpu 0 iter : 5 Arret : 4.586E-06 s/iter 74.059945 +gpu 0 iter : 6 Arret : 4.28143E-06 s/iter 74.091814 +gpu 0 iter : 7 Arret : 4.14913E-06 s/iter 74.022009 +gpu 0 iter : 8 Arret : 4.768E-06 s/iter 74.045411 +gpu 0 iter : 9 Arret : 6.32809E-06 s/iter 74.020498 +gpu 0 iter : 10 Arret : 0.000551734 s/iter 74.008861 +gpu 0 iter : 11 Arret : 0.000854623 s/iter 74.075006 +gpu 0 iter : 12 Arret : 0.00526383 s/iter 74.351997 +gpu 0 iter : 13 Arret : 1.86671 s/iter 74.338451 +gpu 0 iter : 14 Arret : 0.044381 s/iter 74.401470 +gpu 0 iter : 15 Arret : 0.0449663 s/iter 77.708059 +gpu 0 iter : 16 Arret : 0.0459647 s/iter 73.860654 +gpu 0 iter : 17 Arret : 0.0457241 s/iter 72.117134 +gpu 0 iter : 18 Arret : 0.0378989 s/iter 71.687519 +gpu 0 iter : 19 Arret : 0.0321851 s/iter 69.198666 +gpu 0 iter : 20 Arret : 0.0124933 s/iter 68.613221 +gpu 0 iter : 21 Arret : 0.00730326 s/iter 67.130299 +gpu 0 iter : 22 Arret : 0.00446236 s/iter 65.916847 +gpu 0 iter : 23 Arret : 0.000497812 s/iter 65.967574 +gpu 0 iter : 24 Arret : 0.000892713 s/iter 65.658481 +gpu 0 iter : 25 Arret : 4.7836E-06 s/iter 64.891775 +gpu 0 iter : 26 Arret : 1.04505E-09 s/iter 65.003588 +gpu 0 iter : 27 Arret : 3.1578E-15 s/iter 65.348519 +temps : 1931.46 seconde(s) +Nb iterations : 27 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 3.1578E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.553493 +i* -0.832854| 1|-5.02858E-13 +i* 3.83374E-15| +| 3| -0.579338 +i* -0.815087| 1| 4.42365E-13 +i* 2.65846E-14| +| 4| 0.592057 +i* 0.805896| 1| 2.06783E-13 +i* 1.94549E-13| +| 5| -0.604613 +i* -0.796519| 1| 2.39135E-13 +i* 2.96967E-13| +| 6| 0.617037 +i* 0.786934| 1|-3.70964E-13 +i* 2.85104E-13| +| 7| -0.629293 +i* -0.777168| 1| 3.4002E-13 +i* 1.14925E-14| +| 8| 0.641411 +i* 0.767198| 1|-6.01835E-13 +i* 5.70316E-13| +| 9| -0.653354 +i* -0.757052| 1| 3.00003E-14 +i* 4.1084E-13| +| 10| 0.665153 +i* 0.746707| 1|-9.55243E-14 +i* 7.739E-13| +| 11| -0.676773 +i* -0.736192| 1|-3.70891E-13 +i* 4.31963E-14| +| 12| 0.688242 +i* 0.725482| 1| 4.17319E-13 +i*-2.25125E-13| +| 13| -0.699526 +i* -0.714607| 1|-1.55074E-13 +i* 3.9467E-13| +| 14| 0.710653 +i* 0.703543| 1|-7.94843E-13 +i* 5.61671E-13| +| 15| -0.721591 +i* -0.69232| 1|-8.20351E-14 +i* 3.39909E-13| +| 16| 0.732366 +i* 0.680912| 1| 5.01595E-13 +i* 2.59279E-13| +| 17| -0.742946 +i* -0.669351| 1|-1.90181E-13 +i* 1.23972E-13| +| 18| 0.753358 +i* 0.657611| 1|-7.14661E-13 +i*-3.96187E-13| +| 19| -0.76357 +i* -0.645725| 1|-3.31242E-13 +i*-8.50865E-14| +| 20| 0.773609 +i* 0.633664| 1|-7.93813E-13 +i* 2.09313E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +zone limite de 'log-exp' 1.00051 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 0 dimgrid2 2735 start 0 size 700160 +gpu 0 iter : 1 Arret : 4.40509E-06 s/iter 100.694769 +gpu 0 iter : 2 Arret : 4.14157E-06 s/iter 100.469337 +gpu 0 iter : 3 Arret : 4.41135E-06 s/iter 100.605636 +gpu 0 iter : 4 Arret : 3.77329E-06 s/iter 100.474382 +gpu 0 iter : 5 Arret : 3.66086E-06 s/iter 100.585159 +gpu 0 iter : 6 Arret : 3.72953E-06 s/iter 100.453144 +gpu 0 iter : 7 Arret : 3.69827E-06 s/iter 100.534472 +gpu 0 iter : 8 Arret : 4.0146E-06 s/iter 100.527939 +gpu 0 iter : 9 Arret : 4.40501E-06 s/iter 100.506852 +gpu 0 iter : 10 Arret : 0.000145438 s/iter 100.425934 +gpu 0 iter : 11 Arret : 0.000853238 s/iter 100.356423 +gpu 0 iter : 12 Arret : 0.00173408 s/iter 100.698172 +gpu 0 iter : 13 Arret : 0.00406782 s/iter 102.669605 +gpu 0 iter : 14 Arret : 0.00525798 s/iter 100.740660 +gpu 0 iter : 15 Arret : 0.00912631 s/iter 101.481624 +gpu 0 iter : 16 Arret : 0.0564377 s/iter 100.156723 +gpu 0 iter : 17 Arret : 0.173647 s/iter 101.052747 +gpu 0 iter : 18 Arret : 0.0415567 s/iter 103.159864 +gpu 0 iter : 19 Arret : 0.0291844 s/iter 101.678094 +gpu 0 iter : 20 Arret : 0.0193248 s/iter 101.283426 +gpu 0 iter : 21 Arret : 0.00828239 s/iter 100.513861 +gpu 0 iter : 22 Arret : 0.00218532 s/iter 99.669534 +gpu 0 iter : 23 Arret : 0.00038288 s/iter 99.672435 +gpu 0 iter : 24 Arret : 0.00053382 s/iter 99.680679 +gpu 0 iter : 25 Arret : 0.000180417 s/iter 99.792193 +gpu 0 iter : 26 Arret : 6.23119E-05 s/iter 99.656799 +gpu 0 iter : 27 Arret : 1.31328E-05 s/iter 99.708395 +gpu 0 iter : 28 Arret : 1.46741E-06 s/iter 99.655086 +gpu 0 iter : 29 Arret : 1.39344E-08 s/iter 99.775734 +gpu 0 iter : 30 Arret : 6.13969E-15 s/iter 99.639756 +temps : 3017.33 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.46262E-08 +Stabilite : 6.13969E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540352 +i* 0.841439| 1| 4.39978E-13 +i* 6.25043E-13| +| 2| -0.996034 +i* 0.0889731| 1| 2.2073E-13 +i* 1.55296E-13| +| 3| 0.439836 +i* -0.898078| 1|-3.55927E-13 +i*-1.21738E-13| +| 4| 0.38266 +i* -0.923889| 1|-2.56142E-13 +i*-7.02285E-14| +| 5| -0.988496 +i* 0.15125| 1|-1.52652E-13 +i*-1.11329E-13| +| 6| 0.641421 +i* 0.767189| 1|-1.31044E-13 +i* 5.61736E-13| +| 7| 0.323979 +i* -0.946064| 1|-4.52336E-13 +i* 8.74596E-14| +| 8| -0.977067 +i* 0.212932| 1| 8.58341E-14 +i* 1.73412E-13| +| 9| 0.688262 +i* 0.725462| 1| 4.28754E-14 +i* 1.08849E-12| +| 10| 0.264022 +i* -0.964517| 1|-3.63883E-13 +i*-8.14886E-14| +| 11| -0.961793 +i* 0.273776| 1| -3.0213E-13 +i*-2.13897E-13| +| 12| 0.732395 +i* 0.68088| 1|-3.65194E-14 +i* 7.95483E-13| +| 13| 0.203027 +i* -0.979173| 1|-3.14502E-13 +i* 2.96924E-13| +| 14| -0.942735 +i* 0.333543| 1| 1.82947E-13 +i*-4.73458E-14| +| 15| 0.773646 +i* 0.633619| 1| 2.24352E-13 +i* 2.79674E-13| +| 16| 0.141232 +i* -0.989977| 1| -1.0035E-13 +i* 1.5693E-13| +| 17| -0.919967 +i* 0.391997| 1| 2.89213E-14 +i*-1.86252E-13| +| 18| 0.811852 +i* 0.583864| 1|-1.59939E-12 +i*-4.13669E-13| +| 19| 0.0788818 +i* -0.996884| 1|-2.83003E-13 +i* 1.04711E-13| +| 20| -0.893578 +i* 0.448908| 1| 4.59736E-14 +i* 1.31414E-13| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 1 +zone limite de 'log-exp' 1.00044 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 3125 start 0 size 800000 +gpu 0 iter : 1 Arret : 3.74909E-06 s/iter 131.738179 +gpu 0 iter : 2 Arret : 3.49254E-06 s/iter 131.503382 +gpu 0 iter : 3 Arret : 3.79247E-06 s/iter 130.862896 +gpu 0 iter : 4 Arret : 3.40119E-06 s/iter 130.832910 +gpu 0 iter : 5 Arret : 3.64216E-06 s/iter 131.517237 +gpu 0 iter : 6 Arret : 3.50994E-06 s/iter 131.403093 +gpu 0 iter : 7 Arret : 3.54522E-06 s/iter 131.315477 +gpu 0 iter : 8 Arret : 3.57706E-06 s/iter 131.206471 +gpu 0 iter : 9 Arret : 4.78249E-06 s/iter 131.242355 +gpu 0 iter : 10 Arret : 0.000445854 s/iter 131.325342 +gpu 0 iter : 11 Arret : 0.00106438 s/iter 131.005859 +gpu 0 iter : 12 Arret : 0.0159228 s/iter 130.855281 +gpu 0 iter : 13 Arret : 1.96586 s/iter 131.580736 +gpu 0 iter : 14 Arret : 0.0310235 s/iter 139.161956 +gpu 0 iter : 15 Arret : 0.288368 s/iter 132.380708 +gpu 0 iter : 16 Arret : 0.268505 s/iter 131.753751 +gpu 0 iter : 17 Arret : 0.055019 s/iter 130.693875 +gpu 0 iter : 18 Arret : 0.0095986 s/iter 120.836692 +gpu 0 iter : 19 Arret : 0.0067465 s/iter 121.133462 +gpu 0 iter : 20 Arret : 0.00486301 s/iter 111.958685 +gpu 0 iter : 21 Arret : 0.00150462 s/iter 106.824156 +gpu 0 iter : 22 Arret : 0.00367623 s/iter 100.023867 +gpu 0 iter : 23 Arret : 0.000649555 s/iter 95.844251 +gpu 0 iter : 24 Arret : 1.61661E-05 s/iter 92.179310 +gpu 0 iter : 25 Arret : 1.57748E-05 s/iter 90.746510 +gpu 0 iter : 26 Arret : 2.71821E-06 s/iter 90.684064 +gpu 0 iter : 27 Arret : 5.01324E-07 s/iter 90.550543 +gpu 0 iter : 28 Arret : 6.04245E-10 s/iter 90.007638 +gpu 0 iter : 29 Arret : 1.57426E-15 s/iter 90.215782 +temps : 3442.42 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 1.57426E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| 0.592061 +i* 0.805893| 1|-1.57249E-13 +i*-4.43364E-13| +| 3| 0.617051 +i* 0.786923| 1|-6.42805E-13 +i*-3.49094E-13| +| 4| 0.641434 +i* 0.767178| 1| 1.00022E-12 +i*-5.90578E-13| +| 5| 0.665186 +i* 0.746678| 1|-2.53998E-14 +i*-1.14684E-12| +| 6| 0.688283 +i* 0.725442| 1|-8.68732E-13 +i* 8.52696E-13| +| 7| 0.710703 +i* 0.703493| 1| 2.02581E-13 +i* 4.54699E-13| +| 8| 0.732422 +i* 0.680851| 1|-5.22353E-13 +i*-3.99873E-13| +| 9| 0.753421 +i* 0.657538| 1| 1.23356E-13 +i*-1.05986E-12| +| 10| 0.773678 +i* 0.633579| 1|-6.75196E-13 +i* 3.60108E-13| +| 11| 0.793174 +i* 0.608995| 1| 4.43853E-13 +i*-1.42398E-12| +| 12| 0.811888 +i* 0.583813| 1|-4.10491E-13 +i*-4.46651E-13| +| 13| 0.829804 +i* 0.558055| 1| 1.30045E-12 +i* 1.12788E-13| +| 14| 0.846902 +i* 0.531748| 1|-8.09419E-13 +i* 4.98091E-13| +| 15| 0.863167 +i* 0.504918| 1| 2.98522E-13 +i* 3.81547E-13| +| 16| 0.878582 +i* 0.477591| 1|-3.06581E-13 +i*-6.95869E-13| +| 17| 0.893133 +i* 0.449793| 1| 1.24355E-13 +i* -1.3239E-12| +| 18| 0.906804 +i* 0.421553| 1|-1.23117E-12 +i*-5.57117E-13| +| 19| 0.919582 +i* 0.392898| 1|-1.03648E-12 +i* 2.90445E-14| +| 20| 0.931455 +i* 0.363856| 1|-6.42708E-13 +i*-1.50318E-12| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 diff --git a/Simulations/full_openmp/full_openmp_1GPU.sge b/Simulations/full_openmp/full_openmp_1GPU.sge new file mode 100755 index 0000000..038b92b --- /dev/null +++ b/Simulations/full_openmp/full_openmp_1GPU.sge @@ -0,0 +1,27 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=1 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -pe openmp 1 +#$ -V +#$ -cwd +#$ -N full_openmp_1GPU + +module load gcc/4.9.0 +module load cuda/7.0 +export OMP_NUM_THREADS=1 + +./template -r -i 60000 40000 +./template -r -i 150000 50000 +./template -r -i 250000 150000 +./template -r -i 350000 250000 +./template -r -i 500000 300000 +./template -r -i 600000 400000 +./template -r -i 700000 500000 +./template -r -i 800000 600000 +#./template -r -i 900000 700000 +#./template -r -i 1000000 800000 +#./template -r -i 1500000 500000 + + diff --git a/Simulations/full_openmp/full_openmp_2GPU.o140164 b/Simulations/full_openmp/full_openmp_2GPU.o140164 new file mode 100644 index 0000000..09208b1 --- /dev/null +++ b/Simulations/full_openmp/full_openmp_2GPU.o140164 @@ -0,0 +1,540 @@ +REMAINING: 2 +Taking GPU #2 +Taking GPU #3 +zone limite de 'log-exp' 1.00593 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 0 dimgrid2 118 start 0 size 30080 +gpu 1 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 1 dimgrid2 118 start 30080 size 30080 +gpu 0 iter : 1 Arret : 4.09766E-05 s/iter 0.377749 +gpu 0 iter : 2 Arret : 3.79749E-05 s/iter 0.377727 +gpu 0 iter : 3 Arret : 3.85767E-05 s/iter 0.377765 +gpu 0 iter : 4 Arret : 3.91197E-05 s/iter 0.377744 +gpu 0 iter : 5 Arret : 4.06402E-05 s/iter 0.377742 +gpu 0 iter : 6 Arret : 4.41484E-05 s/iter 0.377649 +gpu 0 iter : 7 Arret : 5.50721E-05 s/iter 0.377635 +gpu 0 iter : 8 Arret : 0.000118507 s/iter 0.377582 +gpu 0 iter : 9 Arret : 0.00116121 s/iter 0.377567 +gpu 0 iter : 10 Arret : 0.0219727 s/iter 0.377659 +gpu 0 iter : 11 Arret : 2.07933 s/iter 1.180745 +gpu 0 iter : 12 Arret : 0.27049 s/iter 0.377586 +gpu 0 iter : 13 Arret : 0.1554 s/iter 1.212301 +gpu 0 iter : 14 Arret : 0.0487107 s/iter 1.213253 +gpu 0 iter : 15 Arret : 0.0169372 s/iter 1.208391 +gpu 0 iter : 16 Arret : 0.00924961 s/iter 1.200600 +gpu 0 iter : 17 Arret : 0.00644126 s/iter 1.173874 +gpu 0 iter : 18 Arret : 0.00441137 s/iter 0.370745 +gpu 0 iter : 19 Arret : 0.00203274 s/iter 0.364311 +gpu 0 iter : 20 Arret : 0.00318275 s/iter 0.364538 +gpu 0 iter : 21 Arret : 0.009373 s/iter 0.355906 +gpu 0 iter : 22 Arret : 0.0125472 s/iter 0.351740 +gpu 0 iter : 23 Arret : 0.0298136 s/iter 0.350290 +gpu 0 iter : 24 Arret : 0.00227002 s/iter 0.351832 +gpu 0 iter : 25 Arret : 0.000622083 s/iter 0.342077 +gpu 0 iter : 26 Arret : 0.000137321 s/iter 0.346191 +gpu 0 iter : 27 Arret : 4.34709E-05 s/iter 0.348120 +gpu 0 iter : 28 Arret : 3.54366E-06 s/iter 0.343417 +gpu 0 iter : 29 Arret : 2.7858E-09 s/iter 0.341845 +gpu 0 iter : 30 Arret : 8.62089E-14 s/iter 0.341833 +temps : 16.8078 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.35784E-10 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540783 +i* 0.841162| 1|-7.58456E-14 +i* 3.78031E-14| +| 2| -0.992343 +i* -0.123513| 1|-2.28637E-15 +i*-5.45917E-15| +| 3| 0.0563346 +i* 0.998412| 1| 5.70377E-15 +i* 3.3501E-14| +| 4| -0.802793 +i* -0.596258| 1| 2.03657E-15 +i* 1.01915E-14| +| 5| 0.730552 +i* -0.682857| 1|-7.48429E-14 +i* 6.77011E-14| +| 6| -0.442728 +i* 0.896656| 1|-3.77198E-14 +i*-1.89779E-15| +| 7| -0.404888 +i* -0.914366| 1| 3.20195E-14 +i* 9.65894E-15| +| 8| 0.972126 +i* -0.23446| 1| 4.02421E-14 +i*-1.54755E-14| +| 9| -0.826939 +i* 0.562292| 1| -2.4928E-14 +i*-1.59889E-14| +| 10| 0.0979895 +i* -0.995187| 1| 2.90878E-14 +i*-6.75675E-15| +| 11| 0.961513 +i* 0.27476| 1|-9.39769E-14 +i*-2.63912E-13| +| 12| -0.996627 +i* 0.0820589| 1| 2.39773E-14 +i* 1.74825E-14| +| 13| 0.575447 +i* -0.817839| 1|-3.49894E-14 +i*-7.98545E-14| +| 14| 0.701466 +i* 0.712703| 1| 7.52211E-14 +i* 1.53991E-14| +| 15| 0.259346 +i* 0.965785| 1|-2.14863E-14 +i*-2.81355E-14| +| 16| -0.907773 +i* -0.419461| 1|-3.62869E-14 +i*-9.49414E-15| +| 17| 0.903623 +i* -0.428329| 1|-1.24969E-14 +i* 7.51222E-14| +| 18| -0.249979 +i* 0.968251| 1|-1.59074E-14 +i*-1.09721E-14| +| 19| -0.583341 +i* -0.812227| 1| 1.92242E-14 +i* 2.27058E-14| +| 20| 0.997383 +i* 0.072297| 1| 2.53037E-13 +i*-5.92819E-13| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 1 +zone limite de 'log-exp' 1.00237 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 0 dimgrid2 293 start 0 size 75008 +gpu 1 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 1 dimgrid2 293 start 75008 size 75008 +gpu 0 iter : 1 Arret : 1.60819E-05 s/iter 2.345593 +gpu 0 iter : 2 Arret : 1.52654E-05 s/iter 2.345397 +gpu 0 iter : 3 Arret : 1.58146E-05 s/iter 2.345455 +gpu 0 iter : 4 Arret : 1.54189E-05 s/iter 2.345151 +gpu 0 iter : 5 Arret : 1.57815E-05 s/iter 2.345049 +gpu 0 iter : 6 Arret : 1.6413E-05 s/iter 2.345470 +gpu 0 iter : 7 Arret : 1.77314E-05 s/iter 2.345388 +gpu 0 iter : 8 Arret : 2.1072E-05 s/iter 2.345347 +gpu 0 iter : 9 Arret : 4.09887E-05 s/iter 2.344913 +gpu 0 iter : 10 Arret : 0.00231734 s/iter 2.344920 +gpu 0 iter : 11 Arret : 0.00364869 s/iter 2.344545 +gpu 0 iter : 12 Arret : 0.00595916 s/iter 2.901608 +gpu 0 iter : 13 Arret : 0.433645 s/iter 2.901110 +gpu 0 iter : 14 Arret : 2.16599 s/iter 4.403684 +gpu 0 iter : 15 Arret : 0.0451248 s/iter 2.331735 +gpu 0 iter : 16 Arret : 0.0269953 s/iter 4.010657 +gpu 0 iter : 17 Arret : 0.0143832 s/iter 2.323230 +gpu 0 iter : 18 Arret : 0.0101457 s/iter 4.336764 +gpu 0 iter : 19 Arret : 0.00443502 s/iter 3.973966 +gpu 0 iter : 20 Arret : 0.00482918 s/iter 2.285743 +gpu 0 iter : 21 Arret : 0.00559571 s/iter 3.957234 +gpu 0 iter : 22 Arret : 0.00102978 s/iter 2.262199 +gpu 0 iter : 23 Arret : 0.000982733 s/iter 2.250995 +gpu 0 iter : 24 Arret : 0.000314964 s/iter 2.256563 +gpu 0 iter : 25 Arret : 9.62593E-05 s/iter 2.257743 +gpu 0 iter : 26 Arret : 2.22765E-05 s/iter 2.274003 +gpu 0 iter : 27 Arret : 3.08519E-05 s/iter 2.262628 +gpu 0 iter : 28 Arret : 9.19951E-06 s/iter 2.243517 +gpu 0 iter : 29 Arret : 5.62649E-07 s/iter 2.241072 +gpu 0 iter : 30 Arret : 9.17827E-11 s/iter 2.245254 +gpu 0 iter : 31 Arret : 8.04912E-16 s/iter 2.239630 +temps : 82.6744 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.26507E-09 +Stabilite : 8.04912E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540528 +i* 0.841326| 1| 8.68923E-14 +i* 2.2979E-13| +| 2| -0.905603 +i* -0.424127| 1| 6.50001E-14 +i* -3.0061E-14| +| 3| -0.774122 +i* 0.633037| 1|-3.89619E-14 +i*-6.71876E-14| +| 4| 0.317935 +i* -0.948113| 1| 4.656E-15 +i* 1.15645E-13| +| 5| 0.23606 +i* 0.971739| 1| 2.9924E-14 +i*-1.32854E-13| +| 6| -0.717299 +i* -0.696766| 1| 5.63785E-15 +i*-6.71685E-14| +| 7| 0.992349 +i* -0.123462| 1|-4.81056E-13 +i* 9.00335E-13| +| 8| -0.938482 +i* 0.345329| 1|-6.95555E-14 +i*-3.79159E-14| +| 9| 0.610294 +i* -0.792175| 1| -5.4852E-14 +i*-3.26232E-14| +| 10| -0.0946394 +i* 0.995512| 1|-4.73788E-14 +i*-8.10827E-14| +| 11| -0.450242 +i* -0.892906| 1| 2.41855E-14 +i*-3.23699E-15| +| 12| 0.978218 +i* 0.207583| 1|-2.84429E-13 +i* 4.69725E-13| +| 13| -0.999806 +i* 0.0197069| 1|-4.72365E-14 +i*-2.55716E-14| +| 14| 0.835648 +i* -0.549265| 1|-2.95892E-13 +i* 2.34143E-13| +| 15| -0.414707 +i* 0.909955| 1| 7.26225E-14 +i*-1.70003E-15| +| 16| -0.133754 +i* -0.991015| 1|-2.88485E-14 +i* 2.14499E-14| +| 17| 0.856687 +i* 0.515837| 1| 1.49106E-13 +i* 3.95153E-14| +| 18| -0.951361 +i* -0.308079| 1| 3.78308E-14 +i* 4.65843E-14| +| 19| 0.969257 +i* -0.24605| 1| 5.51163E-13 +i*-4.79498E-13| +| 20| -0.689285 +i* 0.724491| 1| 2.40086E-15 +i*-3.61777E-14| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1 +zone limite de 'log-exp' 1.00142 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 0 dimgrid2 489 start 0 size 125056 +gpu 1 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 1 dimgrid2 489 start 125056 size 125056 +gpu 0 iter : 1 Arret : 1.04122E-05 s/iter 6.895757 +gpu 0 iter : 2 Arret : 9.66998E-06 s/iter 6.877326 +gpu 0 iter : 3 Arret : 9.65609E-06 s/iter 6.885434 +gpu 0 iter : 4 Arret : 1.03183E-05 s/iter 6.886343 +gpu 0 iter : 5 Arret : 9.75367E-06 s/iter 6.875198 +gpu 0 iter : 6 Arret : 9.56197E-06 s/iter 6.877253 +gpu 0 iter : 7 Arret : 9.85222E-06 s/iter 6.888180 +gpu 0 iter : 8 Arret : 1.00444E-05 s/iter 6.876080 +gpu 0 iter : 9 Arret : 1.14954E-05 s/iter 6.871764 +gpu 0 iter : 10 Arret : 0.00617074 s/iter 6.872061 +gpu 0 iter : 11 Arret : 0.00502727 s/iter 9.108306 +gpu 0 iter : 12 Arret : 0.00709612 s/iter 6.884838 +gpu 0 iter : 13 Arret : 0.00636365 s/iter 9.133645 +gpu 0 iter : 14 Arret : 0.000962158 s/iter 6.881477 +gpu 0 iter : 15 Arret : 0.00515317 s/iter 6.879637 +gpu 0 iter : 16 Arret : 0.00489618 s/iter 7.799484 +gpu 0 iter : 17 Arret : 0.0126101 s/iter 6.409073 +gpu 0 iter : 18 Arret : 0.306794 s/iter 4.221095 +gpu 0 iter : 19 Arret : 0.00788796 s/iter 5.229623 +gpu 0 iter : 20 Arret : 0.000261124 s/iter 4.114536 +gpu 0 iter : 21 Arret : 0.000181317 s/iter 3.590034 +gpu 0 iter : 22 Arret : 0.000215766 s/iter 3.589880 +gpu 0 iter : 23 Arret : 0.000292282 s/iter 3.567063 +gpu 0 iter : 24 Arret : 7.59488E-05 s/iter 3.557992 +gpu 0 iter : 25 Arret : 8.78575E-06 s/iter 3.569234 +gpu 0 iter : 26 Arret : 1.71E-07 s/iter 3.545083 +gpu 0 iter : 27 Arret : 3.25965E-13 s/iter 3.556937 +temps : 161.369 seconde(s) +Nb iterations : 27 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.32861E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540427 +i* 0.841391| 1| 9.7148E-14 +i*-1.98189E-13| +| 2| -0.997949 +i* 0.0640067| 1| 1.02696E-14 +i* 2.88415E-14| +| 3| 0.450991 +i* -0.892528| 1| 2.39739E-15 +i* 7.66835E-14| +| 4| 0.42851 +i* -0.903537| 1| 1.03733E-13 +i* 1.27433E-14| +| 5| -0.996035 +i* 0.0889649| 1| 5.1386E-14 +i* 4.21729E-14| +| 6| 0.581876 +i* 0.813277| 1| 3.29906E-13 +i* -3.5718E-15| +| 7| 0.405761 +i* -0.913979| 1| 1.69923E-13 +i*-8.86062E-14| +| 8| -0.993496 +i* 0.113867| 1| 6.34562E-14 +i* 6.04291E-14| +| 9| 0.60205 +i* 0.798458| 1| 2.39371E-13 +i* -2.2848E-13| +| 10| 0.382757 +i* -0.923849| 1| 6.36852E-14 +i* 1.1601E-13| +| 11| -0.990335 +i* 0.138698| 1| 8.32286E-14 +i* 4.57395E-14| +| 12| 0.621846 +i* 0.783139| 1| 3.5482E-14 +i*-1.57841E-13| +| 13| 0.359514 +i* -0.93314| 1| 1.00985E-13 +i*-2.52237E-13| +| 14| -0.986553 +i* 0.163442| 1| 3.24636E-14 +i* 4.58574E-14| +| 15| 0.641253 +i* 0.767329| 1| 1.79533E-13 +i* 3.03096E-13| +| 16| 0.336045 +i* -0.941846| 1| 1.38948E-13 +i*-8.14071E-14| +| 17| -0.982153 +i* 0.188084| 1| 6.94549E-14 +i* 3.09405E-14| +| 18| 0.660258 +i* 0.751039| 1| 4.21871E-13 +i* 5.02185E-14| +| 19| 0.312366 +i* -0.949962| 1|-6.37199E-14 +i*-7.39669E-14| +| 20| -0.977138 +i* 0.212608| 1|-3.80633E-14 +i* -8.4285E-14| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 1 +zone limite de 'log-exp' 1.00101 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 1 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 1 dimgrid2 684 start 175104 size 175104 +gpu 0 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 0 dimgrid2 684 start 0 size 175104 +gpu 0 iter : 1 Arret : 7.32344E-06 s/iter 12.954303 +gpu 0 iter : 2 Arret : 7.07863E-06 s/iter 12.981308 +gpu 0 iter : 3 Arret : 6.90431E-06 s/iter 12.986614 +gpu 0 iter : 4 Arret : 7.26859E-06 s/iter 12.992632 +gpu 0 iter : 5 Arret : 6.9268E-06 s/iter 13.005304 +gpu 0 iter : 6 Arret : 6.766E-06 s/iter 12.980752 +gpu 0 iter : 7 Arret : 7.08928E-06 s/iter 12.936596 +gpu 0 iter : 8 Arret : 7.80045E-06 s/iter 12.948599 +gpu 0 iter : 9 Arret : 9.75059E-06 s/iter 12.933171 +gpu 0 iter : 10 Arret : 0.000389813 s/iter 12.982388 +gpu 0 iter : 11 Arret : 0.00168924 s/iter 12.933771 +gpu 0 iter : 12 Arret : 0.00163024 s/iter 16.015025 +gpu 0 iter : 13 Arret : 0.831287 s/iter 12.991337 +gpu 0 iter : 14 Arret : 3.41318 s/iter 13.007981 +gpu 0 iter : 15 Arret : 0.111579 s/iter 13.648097 +gpu 0 iter : 16 Arret : 0.0536558 s/iter 13.532104 +gpu 0 iter : 17 Arret : 0.0316379 s/iter 12.902939 +gpu 0 iter : 18 Arret : 0.0221392 s/iter 15.777843 +gpu 0 iter : 19 Arret : 0.023782 s/iter 13.053666 +gpu 0 iter : 20 Arret : 0.0188987 s/iter 16.564822 +gpu 0 iter : 21 Arret : 0.0391672 s/iter 17.699510 +gpu 0 iter : 22 Arret : 0.0433525 s/iter 14.316996 +gpu 0 iter : 23 Arret : 0.0310573 s/iter 12.886593 +gpu 0 iter : 24 Arret : 0.0130632 s/iter 14.221913 +gpu 0 iter : 25 Arret : 0.00228986 s/iter 12.848043 +gpu 0 iter : 26 Arret : 0.00142186 s/iter 12.844861 +gpu 0 iter : 27 Arret : 0.000342562 s/iter 12.846961 +gpu 0 iter : 28 Arret : 7.29744E-05 s/iter 12.848477 +gpu 0 iter : 29 Arret : 6.11624E-06 s/iter 12.846333 +gpu 0 iter : 30 Arret : 1.04055E-05 s/iter 12.845798 +gpu 0 iter : 31 Arret : 8.14262E-06 s/iter 12.846716 +gpu 0 iter : 32 Arret : 2.39311E-06 s/iter 12.848384 +gpu 0 iter : 33 Arret : 1.15675E-08 s/iter 12.847822 +gpu 0 iter : 34 Arret : 4.74404E-14 s/iter 12.843750 +temps : 458.792 seconde(s) +Nb iterations : 34 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.46096E-08 +Stabilite : 1.14439E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540399 +i* 0.841409| 1| 5.12961E-13 +i*-3.37404E-15| +| 2| -0.385479 +i* 0.922716| 1| -1.616E-13 +i*-2.73566E-14| +| 3| -0.770131 +i* 0.637886| 1|-1.38431E-15 +i* 1.70921E-13| +| 4| -0.978357 +i* 0.206925| 1|-3.07393E-15 +i* 4.96131E-15| +| 5| -0.962455 +i* -0.27144| 1|-5.85088E-14 +i* 7.9714E-14| +| 6| -0.72607 +i* -0.687621| 1| -2.0612E-14 +i* 2.87948E-13| +| 7| -0.323352 +i* -0.946279| 1| 2.27159E-13 +i* 7.30891E-14| +| 8| 0.153459 +i* -0.988155| 1| 4.60049E-15 +i*-2.43555E-14| +| 9| 0.595097 +i* -0.803654| 1|-3.46265E-13 +i* 1.60098E-14| +| 10| 0.900408 +i* -0.435047| 1| 3.20081E-13 +i*-1.77827E-14| +| 11| 0.999448 +i* 0.0332229| 1|-5.70342E-13 +i* 1.21308E-12| +| 12| 0.869529 +i* 0.493882| 1| 3.01252E-14 +i* 6.11216E-13| +| 13| 0.211292 +i* 0.977423| 1|-6.97532E-14 +i* 1.23212E-13| +| 14| -0.267139 +i* 0.963658| 1|-9.26238E-14 +i*-7.20968E-14| +| 15| -0.684372 +i* 0.729133| 1| 1.64042E-13 +i*-1.89831E-14| +| 16| -0.944825 +i* 0.327574| 1| 3.70572E-14 +i*-6.84904E-14| +| 17| -0.988833 +i* -0.149027| 1|-1.41002E-13 +i* 2.02581E-14| +| 18| -0.806314 +i* -0.591488| 1| 1.24668E-13 +i*-2.62805E-13| +| 19| -0.439079 +i* -0.898448| 1|-1.76949E-13 +i*-1.05707E-13| +| 20| 0.0287595 +i* -0.999586| 1| 4.76598E-14 +i*-1.43895E-14| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 1 +zone limite de 'log-exp' 1.00071 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 1 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 1 dimgrid2 977 start 250112 size 250112 +gpu 0 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 0 dimgrid2 977 start 0 size 250112 +gpu 0 iter : 1 Arret : 5.66981E-06 s/iter 26.243500 +gpu 0 iter : 2 Arret : 4.82614E-06 s/iter 26.155609 +gpu 0 iter : 3 Arret : 5.08487E-06 s/iter 26.220032 +gpu 0 iter : 4 Arret : 4.81813E-06 s/iter 26.206135 +gpu 0 iter : 5 Arret : 5.52439E-06 s/iter 26.225948 +gpu 0 iter : 6 Arret : 4.73134E-06 s/iter 26.199860 +gpu 0 iter : 7 Arret : 4.95057E-06 s/iter 26.197320 +gpu 0 iter : 8 Arret : 5.2867E-06 s/iter 26.218407 +gpu 0 iter : 9 Arret : 6.39202E-06 s/iter 26.195373 +gpu 0 iter : 10 Arret : 5.44877E-05 s/iter 26.194619 +gpu 0 iter : 11 Arret : 0.00113955 s/iter 26.198648 +gpu 0 iter : 12 Arret : 0.00233295 s/iter 26.205898 +gpu 0 iter : 13 Arret : 0.00269137 s/iter 26.219943 +gpu 0 iter : 14 Arret : 0.00436419 s/iter 26.210349 +gpu 0 iter : 15 Arret : 0.0325608 s/iter 26.028106 +gpu 0 iter : 16 Arret : 0.0458093 s/iter 20.473858 +gpu 0 iter : 17 Arret : 1.39035 s/iter 21.967251 +gpu 0 iter : 18 Arret : 0.0686378 s/iter 22.648105 +gpu 0 iter : 19 Arret : 0.0167258 s/iter 19.073745 +gpu 0 iter : 20 Arret : 0.0073255 s/iter 18.809805 +gpu 0 iter : 21 Arret : 0.00825181 s/iter 16.400626 +gpu 0 iter : 22 Arret : 0.00369807 s/iter 17.676396 +gpu 0 iter : 23 Arret : 0.00143206 s/iter 14.057186 +gpu 0 iter : 24 Arret : 0.000362864 s/iter 12.988505 +gpu 0 iter : 25 Arret : 5.99505E-05 s/iter 12.740882 +gpu 0 iter : 26 Arret : 1.38177E-05 s/iter 11.720352 +gpu 0 iter : 27 Arret : 7.95915E-06 s/iter 11.636867 +gpu 0 iter : 28 Arret : 2.45128E-06 s/iter 11.537776 +gpu 0 iter : 29 Arret : 4.00503E-08 s/iter 11.539953 +gpu 0 iter : 30 Arret : 2.18749E-13 s/iter 11.544507 +temps : 628.842 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.48768E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540372 +i* 0.841426| 1|-3.05235E-13 +i* 1.38721E-13| +| 2| 0.561316 +i* 0.827602| 1|-2.60021E-13 +i* 1.9206E-13| +| 3| 0.57165 +i* 0.820497| 1|-1.83308E-13 +i* 6.15844E-14| +| 4| 0.581895 +i* 0.813264| 1| 3.05839E-13 +i* 6.52482E-14| +| 5| 0.592048 +i* 0.805902| 1|-7.14016E-13 +i*-3.98882E-14| +| 6| 0.602109 +i* 0.798414| 1| 2.66658E-13 +i*-4.75979E-13| +| 7| 0.612074 +i* 0.7908| 1| 3.16743E-13 +i*-3.40844E-13| +| 8| 0.621943 +i* 0.783062| 1| 5.64146E-13 +i*-3.14632E-13| +| 9| 0.631715 +i* 0.775201| 1|-3.83756E-14 +i* 5.41086E-13| +| 10| 0.641387 +i* 0.767218| 1| 4.00499E-13 +i*-3.71465E-13| +| 11| 0.650958 +i* 0.759114| 1| 7.58768E-15 +i*-5.54055E-13| +| 12| 0.660427 +i* 0.750891| 1| 7.47999E-13 +i* 2.73089E-13| +| 13| 0.669792 +i* 0.742549| 1| 9.40577E-13 +i* 3.39433E-14| +| 14| 0.679051 +i* 0.734091| 1| 4.34264E-13 +i*-1.04887E-13| +| 15| 0.688204 +i* 0.725517| 1|-6.26926E-13 +i*-1.86798E-13| +| 16| 0.697248 +i* 0.71683| 1| 2.2389E-13 +i*-9.46795E-14| +| 17| 0.706183 +i* 0.708029| 1| 4.79186E-13 +i* 4.75144E-13| +| 18| 0.715007 +i* 0.699117| 1| 6.39138E-13 +i* 4.95824E-13| +| 19| 0.723718 +i* 0.690096| 1| -1.2694E-13 +i* 4.44528E-13| +| 20| 0.732316 +i* 0.680965| 1|-2.76158E-13 +i* 1.17734E-13| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +zone limite de 'log-exp' 1.00059 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 1172 start 0 size 300032 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 1172 start 300032 size 300032 +gpu 0 iter : 1 Arret : 4.27998E-06 s/iter 37.322864 +gpu 0 iter : 2 Arret : 4.10617E-06 s/iter 37.241818 +gpu 0 iter : 3 Arret : 4.53518E-06 s/iter 37.266422 +gpu 0 iter : 4 Arret : 4.06183E-06 s/iter 37.257521 +gpu 0 iter : 5 Arret : 4.08957E-06 s/iter 37.242975 +gpu 0 iter : 6 Arret : 4.1063E-06 s/iter 37.243477 +gpu 0 iter : 7 Arret : 4.11679E-06 s/iter 37.260449 +gpu 0 iter : 8 Arret : 4.55908E-06 s/iter 37.268788 +gpu 0 iter : 9 Arret : 5.63978E-06 s/iter 37.274568 +gpu 0 iter : 10 Arret : 3.12352E-05 s/iter 37.263840 +gpu 0 iter : 11 Arret : 0.000760143 s/iter 37.275869 +gpu 0 iter : 12 Arret : 0.00101593 s/iter 37.272537 +gpu 0 iter : 13 Arret : 2.01147 s/iter 45.273128 +gpu 0 iter : 14 Arret : 0.399191 s/iter 37.620123 +gpu 0 iter : 15 Arret : 0.349288 s/iter 37.631719 +gpu 0 iter : 16 Arret : 0.208253 s/iter 39.378074 +gpu 0 iter : 17 Arret : 0.0357115 s/iter 36.777203 +gpu 0 iter : 18 Arret : 0.00764262 s/iter 36.020848 +gpu 0 iter : 19 Arret : 0.00870865 s/iter 35.507205 +gpu 0 iter : 20 Arret : 0.00636133 s/iter 36.016380 +gpu 0 iter : 21 Arret : 0.00247744 s/iter 34.115098 +gpu 0 iter : 22 Arret : 0.00232921 s/iter 33.193981 +gpu 0 iter : 23 Arret : 0.000237628 s/iter 33.032645 +gpu 0 iter : 24 Arret : 2.29813E-05 s/iter 32.946598 +gpu 0 iter : 25 Arret : 2.02338E-05 s/iter 32.928243 +gpu 0 iter : 26 Arret : 2.55188E-05 s/iter 32.809567 +gpu 0 iter : 27 Arret : 5.88928E-06 s/iter 32.589015 +gpu 0 iter : 28 Arret : 5.50518E-09 s/iter 32.619895 +gpu 0 iter : 29 Arret : 1.64317E-14 s/iter 32.704855 +temps : 1049.55 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.553493 +i* -0.832854| 1|-5.02858E-13 +i* 3.83374E-15| +| 3| -0.579338 +i* -0.815087| 1| 4.42365E-13 +i* 2.65846E-14| +| 4| 0.592057 +i* 0.805896| 1| 2.06783E-13 +i* 1.94549E-13| +| 5| -0.604613 +i* -0.796519| 1| 2.39135E-13 +i* 2.96967E-13| +| 6| 0.617037 +i* 0.786934| 1|-3.70964E-13 +i* 2.85104E-13| +| 7| -0.629293 +i* -0.777168| 1| 3.4002E-13 +i* 1.14925E-14| +| 8| 0.641411 +i* 0.767198| 1|-6.01835E-13 +i* 5.70316E-13| +| 9| -0.653354 +i* -0.757052| 1| 3.00003E-14 +i* 4.1084E-13| +| 10| 0.665153 +i* 0.746707| 1|-9.55243E-14 +i* 7.739E-13| +| 11| -0.676773 +i* -0.736192| 1|-3.70891E-13 +i* 4.31963E-14| +| 12| 0.688242 +i* 0.725482| 1| 4.17319E-13 +i*-2.25125E-13| +| 13| -0.699526 +i* -0.714607| 1|-1.55074E-13 +i* 3.9467E-13| +| 14| 0.710653 +i* 0.703543| 1|-7.94843E-13 +i* 5.61671E-13| +| 15| -0.721591 +i* -0.69232| 1|-8.20351E-14 +i* 3.39909E-13| +| 16| 0.732366 +i* 0.680912| 1| 5.01595E-13 +i* 2.59279E-13| +| 17| -0.742946 +i* -0.669351| 1|-1.90181E-13 +i* 1.23972E-13| +| 18| 0.753358 +i* 0.657611| 1|-7.14661E-13 +i*-3.96187E-13| +| 19| -0.76357 +i* -0.645725| 1|-3.31242E-13 +i*-8.50865E-14| +| 20| 0.773609 +i* 0.633664| 1|-7.93813E-13 +i* 2.09313E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +zone limite de 'log-exp' 1.00051 +CPU thread 1 (of 2) uses CUDA device 1 +CPU thread 0 (of 2) uses CUDA device 0 +gpu 1 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 1 dimgrid2 1368 start 350080 size 350080 +gpu 0 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 0 dimgrid2 1368 start 0 size 350080 +gpu 0 iter : 1 Arret : 3.85506E-06 s/iter 50.537882 +gpu 0 iter : 2 Arret : 3.66998E-06 s/iter 50.446787 +gpu 0 iter : 3 Arret : 3.5726E-06 s/iter 50.500062 +gpu 0 iter : 4 Arret : 3.62569E-06 s/iter 50.536621 +gpu 0 iter : 5 Arret : 3.53038E-06 s/iter 50.517457 +gpu 0 iter : 6 Arret : 3.56934E-06 s/iter 50.509400 +gpu 0 iter : 7 Arret : 3.64216E-06 s/iter 50.424296 +gpu 0 iter : 8 Arret : 3.67185E-06 s/iter 50.440541 +gpu 0 iter : 9 Arret : 3.63502E-06 s/iter 50.438151 +gpu 0 iter : 10 Arret : 9.16823E-06 s/iter 50.456984 +gpu 0 iter : 11 Arret : 0.000775983 s/iter 50.442631 +gpu 0 iter : 12 Arret : 0.00172532 s/iter 50.492134 +gpu 0 iter : 13 Arret : 0.00299803 s/iter 51.124560 +gpu 0 iter : 14 Arret : 0.00358296 s/iter 56.913865 +gpu 0 iter : 15 Arret : 0.00444746 s/iter 51.832479 +gpu 0 iter : 16 Arret : 0.0771326 s/iter 55.051554 +gpu 0 iter : 17 Arret : 0.187135 s/iter 50.619418 +gpu 0 iter : 18 Arret : 0.0318843 s/iter 52.931554 +gpu 0 iter : 19 Arret : 0.0152072 s/iter 50.308926 +gpu 0 iter : 20 Arret : 0.0163219 s/iter 56.692462 +gpu 0 iter : 21 Arret : 0.00872806 s/iter 57.177894 +gpu 0 iter : 22 Arret : 0.0115686 s/iter 50.015870 +gpu 0 iter : 23 Arret : 0.0199021 s/iter 50.011047 +gpu 0 iter : 24 Arret : 0.00353983 s/iter 50.010630 +gpu 0 iter : 25 Arret : 0.000449015 s/iter 50.024349 +gpu 0 iter : 26 Arret : 0.000359858 s/iter 50.022460 +gpu 0 iter : 27 Arret : 0.000264692 s/iter 50.007880 +gpu 0 iter : 28 Arret : 9.80473E-05 s/iter 50.011312 +gpu 0 iter : 29 Arret : 1.12945E-05 s/iter 50.013302 +gpu 0 iter : 30 Arret : 1.06056E-08 s/iter 49.925806 +gpu 0 iter : 31 Arret : 5.50569E-15 s/iter 49.926960 +temps : 1589.66 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.46262E-08 +Stabilite : 5.50569E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540352 +i* 0.841439| 1| 4.39978E-13 +i* 6.25043E-13| +| 2| -0.996034 +i* 0.0889731| 1| 2.2073E-13 +i* 1.55296E-13| +| 3| 0.439836 +i* -0.898078| 1|-3.55927E-13 +i*-1.21738E-13| +| 4| 0.38266 +i* -0.923889| 1|-2.56142E-13 +i*-7.02285E-14| +| 5| -0.988496 +i* 0.15125| 1|-1.52652E-13 +i*-1.11329E-13| +| 6| 0.641421 +i* 0.767189| 1|-1.31044E-13 +i* 5.61736E-13| +| 7| 0.323979 +i* -0.946064| 1|-4.52336E-13 +i* 8.74596E-14| +| 8| -0.977067 +i* 0.212932| 1| 8.58341E-14 +i* 1.73412E-13| +| 9| 0.688262 +i* 0.725462| 1| 4.28754E-14 +i* 1.08849E-12| +| 10| 0.264022 +i* -0.964517| 1|-3.63883E-13 +i*-8.14886E-14| +| 11| -0.961793 +i* 0.273776| 1| -3.0213E-13 +i*-2.13897E-13| +| 12| 0.732395 +i* 0.68088| 1|-3.65194E-14 +i* 7.95483E-13| +| 13| 0.203027 +i* -0.979173| 1|-3.14502E-13 +i* 2.96924E-13| +| 14| -0.942735 +i* 0.333543| 1| 1.82947E-13 +i*-4.73458E-14| +| 15| 0.773646 +i* 0.633619| 1| 2.24352E-13 +i* 2.79674E-13| +| 16| 0.141232 +i* -0.989977| 1| -1.0035E-13 +i* 1.5693E-13| +| 17| -0.919967 +i* 0.391997| 1| 2.89213E-14 +i*-1.86252E-13| +| 18| 0.811852 +i* 0.583864| 1|-1.59939E-12 +i*-4.13669E-13| +| 19| 0.0788818 +i* -0.996884| 1|-2.83003E-13 +i* 1.04711E-13| +| 20| -0.893578 +i* 0.448908| 1| 4.59736E-14 +i* 1.31414E-13| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 1 +zone limite de 'log-exp' 1.00044 +CPU thread 1 (of 2) uses CUDA device 1 +CPU thread 0 (of 2) uses CUDA device 0 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 1563 start 0 size 400000 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 1563 start 400000 size 400000 +gpu 0 iter : 1 Arret : 3.10089E-06 s/iter 66.233735 +gpu 0 iter : 2 Arret : 3.0838E-06 s/iter 65.987108 +gpu 0 iter : 3 Arret : 3.06149E-06 s/iter 66.189454 +gpu 0 iter : 4 Arret : 3.0062E-06 s/iter 65.996849 +gpu 0 iter : 5 Arret : 3.0175E-06 s/iter 65.939646 +gpu 0 iter : 6 Arret : 3.04713E-06 s/iter 65.973994 +gpu 0 iter : 7 Arret : 3.05645E-06 s/iter 66.066266 +gpu 0 iter : 8 Arret : 3.30702E-06 s/iter 65.988454 +gpu 0 iter : 9 Arret : 4.07591E-06 s/iter 65.937363 +gpu 0 iter : 10 Arret : 8.87751E-06 s/iter 65.957225 +gpu 0 iter : 11 Arret : 0.00223658 s/iter 66.065550 +gpu 0 iter : 12 Arret : 0.00280193 s/iter 66.350461 +gpu 0 iter : 13 Arret : 2.16738 s/iter 71.352901 +gpu 0 iter : 14 Arret : 0.942103 s/iter 66.359607 +gpu 0 iter : 15 Arret : 4.73642 s/iter 71.197413 +gpu 0 iter : 16 Arret : 0.106528 s/iter 66.581428 +gpu 0 iter : 17 Arret : 0.126902 s/iter 68.405076 +gpu 0 iter : 18 Arret : 0.0671442 s/iter 65.117577 +gpu 0 iter : 19 Arret : 0.0842362 s/iter 64.328947 +gpu 0 iter : 20 Arret : 0.06511 s/iter 58.256373 +gpu 0 iter : 21 Arret : 0.0412827 s/iter 62.163236 +gpu 0 iter : 22 Arret : 0.0193263 s/iter 56.316208 +gpu 0 iter : 23 Arret : 0.0142222 s/iter 56.754546 +gpu 0 iter : 24 Arret : 0.00245535 s/iter 47.889436 +gpu 0 iter : 25 Arret : 0.000939196 s/iter 46.695509 +gpu 0 iter : 26 Arret : 2.31722E-05 s/iter 46.175563 +gpu 0 iter : 27 Arret : 1.05871E-06 s/iter 45.766439 +gpu 0 iter : 28 Arret : 1.17662E-11 s/iter 45.536542 +gpu 0 iter : 29 Arret : 1.57009E-16 s/iter 45.801905 +temps : 1778.69 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| 0.592061 +i* 0.805893| 1|-1.57249E-13 +i*-4.43364E-13| +| 3| 0.617051 +i* 0.786923| 1|-6.42805E-13 +i*-3.49094E-13| +| 4| 0.641434 +i* 0.767178| 1| 1.00022E-12 +i*-5.90578E-13| +| 5| 0.665186 +i* 0.746678| 1|-2.53998E-14 +i*-1.14684E-12| +| 6| 0.688283 +i* 0.725442| 1|-8.68732E-13 +i* 8.52696E-13| +| 7| 0.710703 +i* 0.703493| 1| 2.02581E-13 +i* 4.54699E-13| +| 8| 0.732422 +i* 0.680851| 1|-5.22353E-13 +i*-3.99873E-13| +| 9| 0.753421 +i* 0.657538| 1| 1.23356E-13 +i*-1.05986E-12| +| 10| 0.773678 +i* 0.633579| 1|-6.75196E-13 +i* 3.60108E-13| +| 11| 0.793174 +i* 0.608995| 1| 4.43853E-13 +i*-1.42398E-12| +| 12| 0.811888 +i* 0.583813| 1|-4.10491E-13 +i*-4.46651E-13| +| 13| 0.829804 +i* 0.558055| 1| 1.30045E-12 +i* 1.12788E-13| +| 14| 0.846902 +i* 0.531748| 1|-8.09419E-13 +i* 4.98091E-13| +| 15| 0.863167 +i* 0.504918| 1| 2.98522E-13 +i* 3.81547E-13| +| 16| 0.878582 +i* 0.477591| 1|-3.06581E-13 +i*-6.95869E-13| +| 17| 0.893133 +i* 0.449793| 1| 1.24355E-13 +i* -1.3239E-12| +| 18| 0.906804 +i* 0.421553| 1|-1.23117E-12 +i*-5.57117E-13| +| 19| 0.919582 +i* 0.392898| 1|-1.03648E-12 +i* 2.90445E-14| +| 20| 0.931455 +i* 0.363856| 1|-6.42708E-13 +i*-1.50318E-12| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 diff --git a/Simulations/full_openmp/full_openmp_2GPU.sge b/Simulations/full_openmp/full_openmp_2GPU.sge new file mode 100755 index 0000000..82276b2 --- /dev/null +++ b/Simulations/full_openmp/full_openmp_2GPU.sge @@ -0,0 +1,27 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=2 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -pe openmp 2 +#$ -V +#$ -cwd +#$ -N full_openmp_2GPU + +module load gcc/4.9.0 +module load cuda/7.0 +export OMP_NUM_THREADS=2 + +./template -r -i 60000 40000 +./template -r -i 150000 50000 +./template -r -i 250000 150000 +./template -r -i 350000 250000 +./template -r -i 500000 300000 +./template -r -i 600000 400000 +./template -r -i 700000 500000 +./template -r -i 800000 600000 +#./template -r -i 900000 700000 +#./template -r -i 1000000 800000 +#./template -r -i 1500000 500000 + + diff --git a/Simulations/full_openmp/full_openmp_3GPU.o140163 b/Simulations/full_openmp/full_openmp_3GPU.o140163 new file mode 100644 index 0000000..693fb02 --- /dev/null +++ b/Simulations/full_openmp/full_openmp_3GPU.o140163 @@ -0,0 +1,565 @@ +REMAINING: 3 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +zone limite de 'log-exp' 1.00593 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 0 (of 3) uses CUDA device 0 +gpu 1 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 1 dimgrid2 79 start 20053 size 20053 +gpu 2 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 0 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 0 dimgrid2 79 start 0 size 20053 +gpu 2 dimgrid2 79 start 40106 size 20053 +gpu 0 iter : 1 Arret : 4.45023E-05 s/iter 0.365910 +gpu 0 iter : 2 Arret : 3.97664E-05 s/iter 0.365783 +gpu 0 iter : 3 Arret : 3.83563E-05 s/iter 0.365808 +gpu 0 iter : 4 Arret : 4.09098E-05 s/iter 0.365792 +gpu 0 iter : 5 Arret : 4.06402E-05 s/iter 0.365790 +gpu 0 iter : 6 Arret : 4.41483E-05 s/iter 0.365795 +gpu 0 iter : 7 Arret : 5.50719E-05 s/iter 0.365797 +gpu 0 iter : 8 Arret : 0.000118506 s/iter 0.365824 +gpu 0 iter : 9 Arret : 0.00173508 s/iter 0.365741 +gpu 0 iter : 10 Arret : 0.0219619 s/iter 0.365806 +gpu 0 iter : 11 Arret : 2.12669 s/iter 1.163297 +gpu 0 iter : 12 Arret : 0.293659 s/iter 0.365830 +gpu 0 iter : 13 Arret : 0.150913 s/iter 1.192984 +gpu 0 iter : 14 Arret : 0.0525383 s/iter 1.193344 +gpu 0 iter : 15 Arret : 0.017941 s/iter 1.188756 +gpu 0 iter : 16 Arret : 0.00949223 s/iter 1.183377 +gpu 0 iter : 17 Arret : 0.00618922 s/iter 1.174720 +gpu 0 iter : 18 Arret : 0.00478541 s/iter 1.021119 +gpu 0 iter : 19 Arret : 0.0209781 s/iter 0.355703 +gpu 0 iter : 20 Arret : 0.00277186 s/iter 0.354432 +gpu 0 iter : 21 Arret : 0.00126164 s/iter 0.350947 +gpu 0 iter : 22 Arret : 0.0813 s/iter 0.342869 +gpu 0 iter : 23 Arret : 0.0695633 s/iter 0.341054 +gpu 0 iter : 24 Arret : 0.0249049 s/iter 0.344095 +gpu 0 iter : 25 Arret : 0.0236872 s/iter 0.333915 +gpu 0 iter : 26 Arret : 0.000649816 s/iter 0.333141 +gpu 0 iter : 27 Arret : 0.000117833 s/iter 0.336843 +gpu 0 iter : 28 Arret : 3.89955E-05 s/iter 0.333571 +gpu 0 iter : 29 Arret : 2.68794E-06 s/iter 0.331813 +gpu 0 iter : 30 Arret : 1.05565E-09 s/iter 0.327860 +gpu 0 iter : 31 Arret : 3.2677E-14 s/iter 0.331070 +temps : 17.7034 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.35784E-10 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540783 +i* 0.841162| 1|-7.58456E-14 +i* 3.78031E-14| +| 2| -0.992343 +i* -0.123513| 1|-4.36456E-15 +i* 3.59435E-15| +| 3| 0.0563346 +i* 0.998412| 1| 5.70377E-15 +i* 3.3501E-14| +| 4| -0.802793 +i* -0.596258| 1| 2.03657E-15 +i* 1.01915E-14| +| 5| 0.730552 +i* -0.682857| 1|-7.48429E-14 +i* 6.77011E-14| +| 6| -0.442728 +i* 0.896656| 1|-3.77198E-14 +i*-1.89779E-15| +| 7| -0.404888 +i* -0.914366| 1| 3.20195E-14 +i* 9.65894E-15| +| 8| 0.972126 +i* -0.23446| 1| 4.02421E-14 +i*-1.54755E-14| +| 9| -0.826939 +i* 0.562292| 1| -2.4928E-14 +i*-1.59889E-14| +| 10| 0.0979895 +i* -0.995187| 1| 2.90878E-14 +i*-6.75675E-15| +| 11| 0.961513 +i* 0.27476| 1|-9.39769E-14 +i*-2.63912E-13| +| 12| -0.996627 +i* 0.0820589| 1| 2.39773E-14 +i* 1.74825E-14| +| 13| 0.575447 +i* -0.817839| 1|-3.49894E-14 +i*-7.98545E-14| +| 14| 0.701466 +i* 0.712703| 1| 7.52211E-14 +i* 1.53991E-14| +| 15| 0.259346 +i* 0.965785| 1|-2.14863E-14 +i*-2.81355E-14| +| 16| -0.907773 +i* -0.419461| 1|-3.62869E-14 +i*-9.49414E-15| +| 17| 0.903623 +i* -0.428329| 1|-1.24969E-14 +i* 7.51222E-14| +| 18| -0.249979 +i* 0.968251| 1|-1.59074E-14 +i*-1.09721E-14| +| 19| -0.583426 +i* -0.812166| 1| 4.94882E-14 +i*-9.16107E-15| +| 20| 0.997383 +i* 0.072297| 1| 2.53037E-13 +i*-5.92819E-13| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 1 +zone limite de 'log-exp' 1.00237 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 0 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 0 dimgrid2 196 start 0 size 50005 +gpu 1 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 1 dimgrid2 196 start 50005 size 50005 +gpu 2 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 2 dimgrid2 196 start 100010 size 50005 +gpu 0 iter : 1 Arret : 1.83196E-05 s/iter 1.828662 +gpu 0 iter : 2 Arret : 1.8175E-05 s/iter 1.828375 +gpu 0 iter : 3 Arret : 1.80869E-05 s/iter 1.828381 +gpu 0 iter : 4 Arret : 1.75155E-05 s/iter 1.828566 +gpu 0 iter : 5 Arret : 1.69231E-05 s/iter 1.828230 +gpu 0 iter : 6 Arret : 1.76582E-05 s/iter 1.828408 +gpu 0 iter : 7 Arret : 1.98465E-05 s/iter 1.828242 +gpu 0 iter : 8 Arret : 2.53794E-05 s/iter 1.828046 +gpu 0 iter : 9 Arret : 0.00032835 s/iter 1.833783 +gpu 0 iter : 10 Arret : 0.00175922 s/iter 1.828220 +gpu 0 iter : 11 Arret : 0.0175731 s/iter 1.828275 +gpu 0 iter : 12 Arret : 0.00953654 s/iter 1.828216 +gpu 0 iter : 13 Arret : 1.39903 s/iter 3.476936 +gpu 0 iter : 14 Arret : 0.171392 s/iter 1.827262 +gpu 0 iter : 15 Arret : 0.0745773 s/iter 2.751869 +gpu 0 iter : 16 Arret : 0.035733 s/iter 3.807813 +gpu 0 iter : 17 Arret : 0.00850526 s/iter 1.825655 +gpu 0 iter : 18 Arret : 0.00549164 s/iter 1.822042 +gpu 0 iter : 19 Arret : 0.00323678 s/iter 1.812501 +gpu 0 iter : 20 Arret : 0.00178409 s/iter 1.787063 +gpu 0 iter : 21 Arret : 0.00194964 s/iter 1.769047 +gpu 0 iter : 22 Arret : 0.00146162 s/iter 1.771480 +gpu 0 iter : 23 Arret : 0.000624549 s/iter 1.753749 +gpu 0 iter : 24 Arret : 0.000211682 s/iter 1.776112 +gpu 0 iter : 25 Arret : 8.45179E-05 s/iter 1.740231 +gpu 0 iter : 26 Arret : 0.000326207 s/iter 1.768913 +gpu 0 iter : 27 Arret : 0.000200902 s/iter 1.745549 +gpu 0 iter : 28 Arret : 1.1316E-05 s/iter 1.732325 +gpu 0 iter : 29 Arret : 8.18684E-09 s/iter 1.758605 +gpu 0 iter : 30 Arret : 7.64211E-14 s/iter 1.747829 +temps : 59.7653 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.26507E-09 +Stabilite : 7.64211E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540528 +i* 0.841326| 1| 8.68923E-14 +i* 2.2979E-13| +| 2| -0.905603 +i* -0.424127| 1| 6.50001E-14 +i* -3.0061E-14| +| 3| -0.774122 +i* 0.633037| 1|-3.89619E-14 +i*-6.71876E-14| +| 4| 0.317935 +i* -0.948113| 1| 4.656E-15 +i* 1.15645E-13| +| 5| 0.235938 +i* 0.971768| 1|-1.10779E-14 +i* 1.06056E-13| +| 6| -0.717299 +i* -0.696766| 1| 5.63785E-15 +i*-6.71685E-14| +| 7| 0.992349 +i* -0.123462| 1|-4.81056E-13 +i* 9.00335E-13| +| 8| -0.938482 +i* 0.345329| 1|-6.95555E-14 +i*-3.79159E-14| +| 9| 0.610294 +i* -0.792175| 1| -5.4852E-14 +i*-3.26232E-14| +| 10| -0.0945977 +i* 0.995516| 1| 4.45165E-14 +i* 9.42527E-14| +| 11| -0.450242 +i* -0.892906| 1| 2.41855E-14 +i*-3.23699E-15| +| 12| 0.978218 +i* 0.207583| 1|-2.84429E-13 +i* 4.69725E-13| +| 13| -0.999806 +i* 0.0197069| 1|-4.72365E-14 +i*-2.55716E-14| +| 14| 0.835648 +i* -0.549265| 1|-2.95892E-13 +i* 2.34143E-13| +| 15| -0.414707 +i* 0.909955| 1| 7.26225E-14 +i*-1.70003E-15| +| 16| -0.133754 +i* -0.991015| 1|-2.88485E-14 +i* 2.14499E-14| +| 17| 0.856687 +i* 0.515837| 1| 1.49106E-13 +i* 3.95153E-14| +| 18| -0.951361 +i* -0.308079| 1| 3.78308E-14 +i* 4.65843E-14| +| 19| 0.969257 +i* -0.24605| 1| 5.51163E-13 +i*-4.79498E-13| +| 20| -0.689285 +i* 0.724491| 1| 2.40086E-15 +i*-3.61777E-14| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1 +zone limite de 'log-exp' 1.00142 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 1 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 1 dimgrid2 326 start 83370 size 83370 +gpu 0 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 0 dimgrid2 326 start 0 size 83370 +gpu 2 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 2 dimgrid2 326 start 166740 size 83370 +gpu 0 iter : 1 Arret : 1.04122E-05 s/iter 4.597080 +gpu 0 iter : 2 Arret : 9.66981E-06 s/iter 4.598575 +gpu 0 iter : 3 Arret : 9.74545E-06 s/iter 4.597108 +gpu 0 iter : 4 Arret : 9.44307E-06 s/iter 4.597489 +gpu 0 iter : 5 Arret : 9.34819E-06 s/iter 4.598001 +gpu 0 iter : 6 Arret : 1.14416E-05 s/iter 4.598661 +gpu 0 iter : 7 Arret : 1.00875E-05 s/iter 4.598097 +gpu 0 iter : 8 Arret : 1.00498E-05 s/iter 4.597534 +gpu 0 iter : 9 Arret : 1.32154E-05 s/iter 4.597416 +gpu 0 iter : 10 Arret : 0.00051254 s/iter 4.597729 +gpu 0 iter : 11 Arret : 0.000628345 s/iter 4.596129 +gpu 0 iter : 12 Arret : 0.00250283 s/iter 4.597678 +gpu 0 iter : 13 Arret : 0.0026566 s/iter 4.597471 +gpu 0 iter : 14 Arret : 0.00107482 s/iter 4.597721 +gpu 0 iter : 15 Arret : 0.0010467 s/iter 4.579817 +gpu 0 iter : 16 Arret : 0.000858809 s/iter 3.750659 +gpu 0 iter : 17 Arret : 0.00453371 s/iter 2.883509 +gpu 0 iter : 18 Arret : 0.298024 s/iter 5.041367 +gpu 0 iter : 19 Arret : 0.0060016 s/iter 5.070989 +gpu 0 iter : 20 Arret : 0.0020976 s/iter 2.833299 +gpu 0 iter : 21 Arret : 0.000787752 s/iter 2.821846 +gpu 0 iter : 22 Arret : 0.00114118 s/iter 2.808072 +gpu 0 iter : 23 Arret : 0.000242876 s/iter 2.800882 +gpu 0 iter : 24 Arret : 6.73756E-05 s/iter 2.794362 +gpu 0 iter : 25 Arret : 2.16461E-05 s/iter 2.813139 +gpu 0 iter : 26 Arret : 2.86679E-06 s/iter 2.821334 +gpu 0 iter : 27 Arret : 9.41388E-09 s/iter 2.791395 +gpu 0 iter : 28 Arret : 1.06079E-14 s/iter 2.796462 +temps : 112.147 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.05316E-09 +Stabilite : 1.06079E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540427 +i* 0.841391| 1| 9.7148E-14 +i*-1.98189E-13| +| 2| -0.997949 +i* 0.0640067| 1| 1.02696E-14 +i* 2.88415E-14| +| 3| 0.450991 +i* -0.892528| 1| 2.39739E-15 +i* 7.66835E-14| +| 4| 0.42851 +i* -0.903537| 1| 1.03733E-13 +i* 1.27433E-14| +| 5| -0.996035 +i* 0.0889649| 1| 5.1386E-14 +i* 4.21729E-14| +| 6| 0.581876 +i* 0.813277| 1| 3.29906E-13 +i* -3.5718E-15| +| 7| 0.405761 +i* -0.913979| 1| 1.69923E-13 +i*-8.86062E-14| +| 8| -0.993496 +i* 0.113867| 1| 6.34562E-14 +i* 6.04291E-14| +| 9| 0.60205 +i* 0.798458| 1| 2.39371E-13 +i* -2.2848E-13| +| 10| 0.382757 +i* -0.923849| 1| 6.36852E-14 +i* 1.1601E-13| +| 11| -0.990335 +i* 0.138698| 1| 8.32286E-14 +i* 4.57395E-14| +| 12| 0.621846 +i* 0.783139| 1| 3.5482E-14 +i*-1.57841E-13| +| 13| 0.359514 +i* -0.93314| 1| 1.00985E-13 +i*-2.52237E-13| +| 14| -0.986553 +i* 0.163442| 1| 3.24636E-14 +i* 4.58574E-14| +| 15| 0.641253 +i* 0.767329| 1| 1.79533E-13 +i* 3.03096E-13| +| 16| 0.336045 +i* -0.941846| 1| 1.38948E-13 +i*-8.14071E-14| +| 17| -0.982153 +i* 0.188084| 1| 6.94549E-14 +i* 3.09405E-14| +| 18| 0.660258 +i* 0.751039| 1| 4.21871E-13 +i* 5.02185E-14| +| 19| 0.312366 +i* -0.949962| 1|-6.37199E-14 +i*-7.39669E-14| +| 20| -0.977138 +i* 0.212608| 1|-3.80633E-14 +i* -8.4285E-14| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 1 +zone limite de 'log-exp' 1.00101 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 0 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 0 dimgrid2 456 start 0 size 116736 +gpu 2 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 2 dimgrid2 456 start 233472 size 116736 +gpu 1 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 1 dimgrid2 456 start 116736 size 116736 +gpu 0 iter : 1 Arret : 7.55039E-06 s/iter 8.728409 +gpu 0 iter : 2 Arret : 7.39793E-06 s/iter 8.712889 +gpu 0 iter : 3 Arret : 7.14478E-06 s/iter 8.682208 +gpu 0 iter : 4 Arret : 8.2105E-06 s/iter 8.682867 +gpu 0 iter : 5 Arret : 7.11502E-06 s/iter 8.683783 +gpu 0 iter : 6 Arret : 6.76587E-06 s/iter 8.680714 +gpu 0 iter : 7 Arret : 7.0891E-06 s/iter 8.680860 +gpu 0 iter : 8 Arret : 7.80018E-06 s/iter 8.676771 +gpu 0 iter : 9 Arret : 1.16108E-05 s/iter 8.679747 +gpu 0 iter : 10 Arret : 0.000768653 s/iter 8.679484 +gpu 0 iter : 11 Arret : 0.00361976 s/iter 8.676534 +gpu 0 iter : 12 Arret : 0.00104415 s/iter 8.674304 +gpu 0 iter : 13 Arret : 0.820674 s/iter 8.674523 +gpu 0 iter : 14 Arret : 3.33533 s/iter 11.712432 +gpu 0 iter : 15 Arret : 0.122884 s/iter 11.716566 +gpu 0 iter : 16 Arret : 0.0600695 s/iter 11.005801 +gpu 0 iter : 17 Arret : 0.0359638 s/iter 10.051106 +gpu 0 iter : 18 Arret : 0.0231638 s/iter 13.260628 +gpu 0 iter : 19 Arret : 0.0116355 s/iter 13.296853 +gpu 0 iter : 20 Arret : 0.102796 s/iter 11.567596 +gpu 0 iter : 21 Arret : 0.0633274 s/iter 11.618611 +gpu 0 iter : 22 Arret : 0.0252937 s/iter 12.797589 +gpu 0 iter : 23 Arret : 0.0319937 s/iter 11.830702 +gpu 0 iter : 24 Arret : 0.0268738 s/iter 13.413124 +gpu 0 iter : 25 Arret : 0.0121216 s/iter 10.946927 +gpu 0 iter : 26 Arret : 0.00234992 s/iter 8.617752 +gpu 0 iter : 27 Arret : 0.00204079 s/iter 8.617732 +gpu 0 iter : 28 Arret : 0.000634889 s/iter 8.617224 +gpu 0 iter : 29 Arret : 0.000124399 s/iter 8.616406 +gpu 0 iter : 30 Arret : 3.10052E-05 s/iter 8.615337 +gpu 0 iter : 31 Arret : 1.67246E-05 s/iter 8.616948 +gpu 0 iter : 32 Arret : 2.0926E-06 s/iter 8.616524 +gpu 0 iter : 33 Arret : 1.35583E-08 s/iter 8.618103 +gpu 0 iter : 34 Arret : 5.09118E-14 s/iter 8.615345 +temps : 334.994 seconde(s) +Nb iterations : 34 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.46096E-08 +Stabilite : 5.09118E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540399 +i* 0.841409| 1| 5.12961E-13 +i*-3.37404E-15| +| 2| -0.385479 +i* 0.922716| 1| -1.616E-13 +i*-2.73566E-14| +| 3| -0.770131 +i* 0.637886| 1|-1.38431E-15 +i* 1.70921E-13| +| 4| -0.978357 +i* 0.206925| 1|-3.07393E-15 +i* 4.96131E-15| +| 5| -0.962455 +i* -0.27144| 1|-5.85088E-14 +i* 7.9714E-14| +| 6| -0.72607 +i* -0.687621| 1| -2.0612E-14 +i* 2.87948E-13| +| 7| -0.323352 +i* -0.946279| 1| 2.27159E-13 +i* 7.30891E-14| +| 8| 0.153459 +i* -0.988155| 1| 4.60049E-15 +i*-2.43555E-14| +| 9| 0.595097 +i* -0.803654| 1|-3.46265E-13 +i* 1.60098E-14| +| 10| 0.900408 +i* -0.435047| 1| 3.20081E-13 +i*-1.77827E-14| +| 11| 0.999448 +i* 0.0332229| 1|-5.70342E-13 +i* 1.21308E-12| +| 12| 0.869529 +i* 0.493882| 1| 3.01252E-14 +i* 6.11216E-13| +| 13| 0.211292 +i* 0.977423| 1|-6.97532E-14 +i* 1.23212E-13| +| 14| -0.267139 +i* 0.963658| 1|-9.26238E-14 +i*-7.20968E-14| +| 15| -0.684372 +i* 0.729133| 1| 1.64042E-13 +i*-1.89831E-14| +| 16| -0.944825 +i* 0.327574| 1| 3.70572E-14 +i*-6.84904E-14| +| 17| -0.988833 +i* -0.149027| 1|-1.41002E-13 +i* 2.02581E-14| +| 18| -0.806314 +i* -0.591488| 1| 1.24668E-13 +i*-2.62805E-13| +| 19| -0.439079 +i* -0.898448| 1|-1.76949E-13 +i*-1.05707E-13| +| 20| 0.0287415 +i* -0.999587| 1| 1.62724E-13 +i*-6.82891E-14| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 1 +zone limite de 'log-exp' 1.00071 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 2 (of 3) uses CUDA device 2 +gpu 1 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 1 dimgrid2 652 start 166741 size 166741 +gpu 0 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 0 dimgrid2 652 start 0 size 166741 +gpu 2 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 2 dimgrid2 652 start 333482 size 166741 +gpu 0 iter : 1 Arret : 5.71659E-06 s/iter 17.161724 +gpu 0 iter : 2 Arret : 4.8241E-06 s/iter 17.102931 +gpu 0 iter : 3 Arret : 4.62087E-06 s/iter 17.128111 +gpu 0 iter : 4 Arret : 5.16204E-06 s/iter 17.101919 +gpu 0 iter : 5 Arret : 4.94408E-06 s/iter 17.092405 +gpu 0 iter : 6 Arret : 4.816E-06 s/iter 17.112302 +gpu 0 iter : 7 Arret : 4.87888E-06 s/iter 17.096377 +gpu 0 iter : 8 Arret : 5.28527E-06 s/iter 17.102422 +gpu 0 iter : 9 Arret : 6.38912E-06 s/iter 17.095757 +gpu 0 iter : 10 Arret : 0.000225655 s/iter 17.102543 +gpu 0 iter : 11 Arret : 0.000912484 s/iter 17.099976 +gpu 0 iter : 12 Arret : 0.001168 s/iter 17.099389 +gpu 0 iter : 13 Arret : 0.00167187 s/iter 21.294197 +gpu 0 iter : 14 Arret : 0.00151006 s/iter 17.896733 +gpu 0 iter : 15 Arret : 0.00184196 s/iter 17.074701 +gpu 0 iter : 16 Arret : 0.00799101 s/iter 18.651210 +gpu 0 iter : 17 Arret : 1.57022 s/iter 15.558990 +gpu 0 iter : 18 Arret : 0.0777881 s/iter 13.332881 +gpu 0 iter : 19 Arret : 0.020549 s/iter 14.677134 +gpu 0 iter : 20 Arret : 0.00806741 s/iter 15.739566 +gpu 0 iter : 21 Arret : 0.00459564 s/iter 12.928791 +gpu 0 iter : 22 Arret : 0.000774045 s/iter 10.091239 +gpu 0 iter : 23 Arret : 0.000687203 s/iter 9.870933 +gpu 0 iter : 24 Arret : 0.000321475 s/iter 8.758152 +gpu 0 iter : 25 Arret : 7.13963E-05 s/iter 8.577885 +gpu 0 iter : 26 Arret : 4.18738E-05 s/iter 8.536888 +gpu 0 iter : 27 Arret : 7.77414E-06 s/iter 8.435734 +gpu 0 iter : 28 Arret : 4.61674E-07 s/iter 8.385966 +gpu 0 iter : 29 Arret : 3.96914E-10 s/iter 8.211682 +gpu 0 iter : 30 Arret : 1.11723E-15 s/iter 8.267906 +temps : 432.911 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.48768E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540372 +i* 0.841426| 1|-3.05235E-13 +i* 1.38721E-13| +| 2| 0.561316 +i* 0.827602| 1|-2.60021E-13 +i* 1.9206E-13| +| 3| 0.57165 +i* 0.820497| 1|-1.83308E-13 +i* 6.15844E-14| +| 4| 0.581895 +i* 0.813264| 1| 3.05839E-13 +i* 6.52482E-14| +| 5| 0.592048 +i* 0.805902| 1|-7.14016E-13 +i*-3.98882E-14| +| 6| 0.602109 +i* 0.798414| 1| 2.66658E-13 +i*-4.75979E-13| +| 7| 0.612074 +i* 0.7908| 1| 3.16743E-13 +i*-3.40844E-13| +| 8| 0.621943 +i* 0.783062| 1| 5.64146E-13 +i*-3.14632E-13| +| 9| 0.631715 +i* 0.775201| 1|-3.83756E-14 +i* 5.41086E-13| +| 10| 0.641387 +i* 0.767218| 1| 4.00499E-13 +i*-3.71465E-13| +| 11| 0.650958 +i* 0.759114| 1| 7.58768E-15 +i*-5.54055E-13| +| 12| 0.660427 +i* 0.750891| 1| 7.47999E-13 +i* 2.73089E-13| +| 13| 0.669792 +i* 0.742549| 1| 9.40577E-13 +i* 3.39433E-14| +| 14| 0.679051 +i* 0.734091| 1| 4.34264E-13 +i*-1.04887E-13| +| 15| 0.688204 +i* 0.725517| 1|-6.26926E-13 +i*-1.86798E-13| +| 16| 0.697248 +i* 0.71683| 1| 2.2389E-13 +i*-9.46795E-14| +| 17| 0.706183 +i* 0.708029| 1| 4.79186E-13 +i* 4.75144E-13| +| 18| 0.715007 +i* 0.699117| 1| 6.39138E-13 +i* 4.95824E-13| +| 19| 0.723718 +i* 0.690096| 1| -1.2694E-13 +i* 4.44528E-13| +| 20| 0.732316 +i* 0.680965| 1|-2.76158E-13 +i* 1.17734E-13| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +zone limite de 'log-exp' 1.00059 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 0 (of 3) uses CUDA device 0 +gpu 2 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 2 dimgrid2 782 start 400042 size 200021 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 782 start 200021 size 200021 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 782 start 0 size 200021 +gpu 0 iter : 1 Arret : 4.17374E-06 s/iter 25.502913 +gpu 0 iter : 2 Arret : 4.12988E-06 s/iter 25.466465 +gpu 0 iter : 3 Arret : 3.89098E-06 s/iter 25.456717 +gpu 0 iter : 4 Arret : 3.93498E-06 s/iter 25.471780 +gpu 0 iter : 5 Arret : 4.075E-06 s/iter 25.480147 +gpu 0 iter : 6 Arret : 4.05328E-06 s/iter 25.490152 +gpu 0 iter : 7 Arret : 4.09388E-06 s/iter 25.467915 +gpu 0 iter : 8 Arret : 4.4692E-06 s/iter 25.472589 +gpu 0 iter : 9 Arret : 5.3977E-06 s/iter 25.487936 +gpu 0 iter : 10 Arret : 1.31096E-05 s/iter 25.504106 +gpu 0 iter : 11 Arret : 0.000429141 s/iter 25.483586 +gpu 0 iter : 12 Arret : 0.00225971 s/iter 25.488006 +gpu 0 iter : 13 Arret : 0.918253 s/iter 25.485654 +gpu 0 iter : 14 Arret : 0.738628 s/iter 28.610440 +gpu 0 iter : 15 Arret : 1.06679 s/iter 25.657526 +gpu 0 iter : 16 Arret : 0.00754293 s/iter 28.023636 +gpu 0 iter : 17 Arret : 0.00928206 s/iter 27.385101 +gpu 0 iter : 18 Arret : 0.00238733 s/iter 27.805420 +gpu 0 iter : 19 Arret : 0.0221226 s/iter 23.602314 +gpu 0 iter : 20 Arret : 0.00167275 s/iter 23.298279 +gpu 0 iter : 21 Arret : 0.000828652 s/iter 23.099043 +gpu 0 iter : 22 Arret : 0.00089783 s/iter 22.283044 +gpu 0 iter : 23 Arret : 0.000189743 s/iter 21.934545 +gpu 0 iter : 24 Arret : 5.2959E-05 s/iter 21.894963 +gpu 0 iter : 25 Arret : 1.63869E-05 s/iter 21.689444 +gpu 0 iter : 26 Arret : 5.47754E-06 s/iter 21.811193 +gpu 0 iter : 27 Arret : 1.27747E-07 s/iter 21.641069 +gpu 0 iter : 28 Arret : 4.20926E-13 s/iter 21.740517 +temps : 693.102 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 4.20926E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.553493 +i* -0.832854| 1|-5.02858E-13 +i* 3.83374E-15| +| 3| -0.579338 +i* -0.815087| 1| 4.42365E-13 +i* 2.65846E-14| +| 4| 0.592057 +i* 0.805896| 1| 2.06783E-13 +i* 1.94549E-13| +| 5| -0.604613 +i* -0.796519| 1| 2.39135E-13 +i* 2.96967E-13| +| 6| 0.617037 +i* 0.786934| 1|-3.70964E-13 +i* 2.85104E-13| +| 7| -0.629293 +i* -0.777168| 1| 3.4002E-13 +i* 1.14925E-14| +| 8| 0.641411 +i* 0.767198| 1|-6.01835E-13 +i* 5.70316E-13| +| 9| -0.653354 +i* -0.757052| 1| 3.00003E-14 +i* 4.1084E-13| +| 10| 0.665153 +i* 0.746707| 1|-9.55243E-14 +i* 7.739E-13| +| 11| -0.676773 +i* -0.736192| 1|-3.70891E-13 +i* 4.31963E-14| +| 12| 0.688242 +i* 0.725482| 1| 4.17319E-13 +i*-2.25125E-13| +| 13| -0.699526 +i* -0.714607| 1|-1.55074E-13 +i* 3.9467E-13| +| 14| 0.710653 +i* 0.703543| 1|-7.94843E-13 +i* 5.61671E-13| +| 15| -0.721591 +i* -0.69232| 1|-8.20351E-14 +i* 3.39909E-13| +| 16| 0.732366 +i* 0.680912| 1| 5.01595E-13 +i* 2.59279E-13| +| 17| -0.742946 +i* -0.669351| 1|-1.90181E-13 +i* 1.23972E-13| +| 18| 0.753358 +i* 0.657611| 1|-7.14661E-13 +i*-3.96187E-13| +| 19| -0.76357 +i* -0.645725| 1|-3.31242E-13 +i*-8.50865E-14| +| 20| 0.773609 +i* 0.633664| 1|-7.93813E-13 +i* 2.09313E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +zone limite de 'log-exp' 1.00051 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 0 (of 3) uses CUDA device 0 +gpu 2 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 2 dimgrid2 912 start 466772 size 233386 +gpu 1 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 1 dimgrid2 912 start 233386 size 233386 +gpu 0 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 0 dimgrid2 912 start 0 size 233386 +gpu 0 iter : 1 Arret : 4.07574E-06 s/iter 34.223058 +gpu 0 iter : 2 Arret : 3.55154E-06 s/iter 34.224642 +gpu 0 iter : 3 Arret : 3.46878E-06 s/iter 34.212867 +gpu 0 iter : 4 Arret : 3.42717E-06 s/iter 34.222285 +gpu 0 iter : 5 Arret : 3.26935E-06 s/iter 34.215281 +gpu 0 iter : 6 Arret : 3.34195E-06 s/iter 34.197991 +gpu 0 iter : 7 Arret : 3.3903E-06 s/iter 34.208738 +gpu 0 iter : 8 Arret : 3.49838E-06 s/iter 34.196075 +gpu 0 iter : 9 Arret : 3.56276E-06 s/iter 34.209024 +gpu 0 iter : 10 Arret : 5.84108E-06 s/iter 34.213481 +gpu 0 iter : 11 Arret : 0.00066379 s/iter 34.219783 +gpu 0 iter : 12 Arret : 0.00134105 s/iter 34.213025 +gpu 0 iter : 13 Arret : 0.00258505 s/iter 34.466511 +gpu 0 iter : 14 Arret : 0.0103479 s/iter 43.404986 +gpu 0 iter : 15 Arret : 0.00921676 s/iter 37.016770 +gpu 0 iter : 16 Arret : 0.00524991 s/iter 34.402114 +gpu 0 iter : 17 Arret : 0.00461832 s/iter 34.685302 +gpu 0 iter : 18 Arret : 0.0111077 s/iter 37.320698 +gpu 0 iter : 19 Arret : 0.277174 s/iter 35.309915 +gpu 0 iter : 20 Arret : 0.0136382 s/iter 37.689142 +gpu 0 iter : 21 Arret : 0.0160865 s/iter 34.656561 +gpu 0 iter : 22 Arret : 0.0117015 s/iter 34.545629 +gpu 0 iter : 23 Arret : 0.00660409 s/iter 34.694858 +gpu 0 iter : 24 Arret : 0.0024069 s/iter 35.413033 +gpu 0 iter : 25 Arret : 0.00112793 s/iter 34.552170 +gpu 0 iter : 26 Arret : 0.000118329 s/iter 34.545882 +gpu 0 iter : 27 Arret : 7.75369E-06 s/iter 34.554405 +gpu 0 iter : 28 Arret : 1.97801E-06 s/iter 34.600018 +gpu 0 iter : 29 Arret : 1.19455E-08 s/iter 34.514124 +gpu 0 iter : 30 Arret : 5.31286E-15 s/iter 34.636400 +temps : 1053.03 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.46263E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540352 +i* 0.841439| 1| 4.39978E-13 +i* 6.25043E-13| +| 2| -0.996034 +i* 0.0889731| 1| 2.2073E-13 +i* 1.55296E-13| +| 3| 0.439836 +i* -0.898078| 1|-3.55927E-13 +i*-1.21738E-13| +| 4| 0.38266 +i* -0.923889| 1|-2.56142E-13 +i*-7.02285E-14| +| 5| -0.988496 +i* 0.15125| 1|-1.52652E-13 +i*-1.11329E-13| +| 6| 0.641421 +i* 0.767189| 1|-1.31044E-13 +i* 5.61736E-13| +| 7| 0.323979 +i* -0.946064| 1|-4.52336E-13 +i* 8.74596E-14| +| 8| -0.977067 +i* 0.212932| 1| 8.58341E-14 +i* 1.73412E-13| +| 9| 0.688262 +i* 0.725462| 1| 4.28754E-14 +i* 1.08849E-12| +| 10| 0.264022 +i* -0.964517| 1|-3.63883E-13 +i*-8.14886E-14| +| 11| -0.961793 +i* 0.273776| 1| -3.0213E-13 +i*-2.13897E-13| +| 12| 0.732395 +i* 0.68088| 1|-3.65194E-14 +i* 7.95483E-13| +| 13| 0.203027 +i* -0.979173| 1|-3.14502E-13 +i* 2.96924E-13| +| 14| -0.942735 +i* 0.333543| 1| 1.82947E-13 +i*-4.73458E-14| +| 15| 0.773646 +i* 0.633619| 1| 2.24352E-13 +i* 2.79674E-13| +| 16| 0.141232 +i* -0.989977| 1| -1.0035E-13 +i* 1.5693E-13| +| 17| -0.919967 +i* 0.391997| 1| 2.89213E-14 +i*-1.86252E-13| +| 18| 0.811852 +i* 0.583864| 1|-1.59939E-12 +i*-4.13669E-13| +| 19| 0.0788818 +i* -0.996884| 1|-2.83003E-13 +i* 1.04711E-13| +| 20| -0.893578 +i* 0.448908| 1| 4.59736E-14 +i* 1.31414E-13| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 1 +zone limite de 'log-exp' 1.00044 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 1042 start 0 size 266666 +gpu 2 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 2 dimgrid2 1042 start 533332 size 266666 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 1042 start 266666 size 266666 +gpu 0 iter : 1 Arret : 3.43128E-06 s/iter 44.316497 +gpu 0 iter : 2 Arret : 3.77153E-06 s/iter 44.131572 +gpu 0 iter : 3 Arret : 3.23873E-06 s/iter 44.315408 +gpu 0 iter : 4 Arret : 3.15113E-06 s/iter 44.328033 +gpu 0 iter : 5 Arret : 3.60598E-06 s/iter 44.311559 +gpu 0 iter : 6 Arret : 3.57581E-06 s/iter 44.316239 +gpu 0 iter : 7 Arret : 3.25175E-06 s/iter 44.224296 +gpu 0 iter : 8 Arret : 3.4699E-06 s/iter 44.325585 +gpu 0 iter : 9 Arret : 4.55022E-06 s/iter 44.283208 +gpu 0 iter : 10 Arret : 3.7857E-05 s/iter 44.288810 +gpu 0 iter : 11 Arret : 0.000824026 s/iter 44.305832 +gpu 0 iter : 12 Arret : 0.00406403 s/iter 49.181390 +gpu 0 iter : 13 Arret : 1.91903 s/iter 44.281962 +gpu 0 iter : 14 Arret : 0.315909 s/iter 52.995186 +gpu 0 iter : 15 Arret : 0.325705 s/iter 48.752573 +gpu 0 iter : 16 Arret : 0.25171 s/iter 48.906019 +gpu 0 iter : 17 Arret : 0.107387 s/iter 44.063529 +gpu 0 iter : 18 Arret : 0.063654 s/iter 40.922131 +gpu 0 iter : 19 Arret : 0.0247294 s/iter 39.343896 +gpu 0 iter : 20 Arret : 0.015705 s/iter 38.504441 +gpu 0 iter : 21 Arret : 0.00670205 s/iter 39.597806 +gpu 0 iter : 22 Arret : 0.00378517 s/iter 35.764039 +gpu 0 iter : 23 Arret : 0.00973025 s/iter 33.436854 +gpu 0 iter : 24 Arret : 0.00954051 s/iter 32.742842 +gpu 0 iter : 25 Arret : 0.000557232 s/iter 31.071844 +gpu 0 iter : 26 Arret : 2.73926E-05 s/iter 30.889921 +gpu 0 iter : 27 Arret : 2.78216E-06 s/iter 30.780761 +gpu 0 iter : 28 Arret : 2.46904E-08 s/iter 30.743643 +gpu 0 iter : 29 Arret : 6.07909E-14 s/iter 30.869112 +temps : 1191.46 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 0.0233219 +Stabilite : 3.24723E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| 0.592061 +i* 0.805893| 1|-1.57249E-13 +i*-4.43364E-13| +| 3| 0.617051 +i* 0.786923| 1|-6.42805E-13 +i*-3.49094E-13| +| 4| 0.641434 +i* 0.767178| 1| 1.00022E-12 +i*-5.90578E-13| +| 5| 0.665186 +i* 0.746678| 1|-2.53998E-14 +i*-1.14684E-12| +| 6| 0.688283 +i* 0.725442| 1|-8.68732E-13 +i* 8.52696E-13| +| 7| 0.710703 +i* 0.703493| 1| 2.02581E-13 +i* 4.54699E-13| +| 8| 0.732422 +i* 0.680851| 1|-5.22353E-13 +i*-3.99873E-13| +| 9| 0.753421 +i* 0.657538| 1| 1.23356E-13 +i*-1.05986E-12| +| 10| 0.773678 +i* 0.633579| 1|-6.75196E-13 +i* 3.60108E-13| +| 11| 0.793174 +i* 0.608995| 1| 4.43853E-13 +i*-1.42398E-12| +| 12| 0.811888 +i* 0.583813| 1|-4.10491E-13 +i*-4.46651E-13| +| 13| 0.829804 +i* 0.558055| 1| 1.30045E-12 +i* 1.12788E-13| +| 14| 0.846902 +i* 0.531748| 1|-8.09419E-13 +i* 4.98091E-13| +| 15| 0.863167 +i* 0.504918| 1| 2.98522E-13 +i* 3.81547E-13| +| 16| 0.878582 +i* 0.477591| 1|-3.06581E-13 +i*-6.95869E-13| +| 17| 0.893133 +i* 0.449793| 1| 1.24355E-13 +i* -1.3239E-12| +| 18| 0.906804 +i* 0.421553| 1|-1.23117E-12 +i*-5.57117E-13| +| 19| 0.919582 +i* 0.392898| 1|-1.03648E-12 +i* 2.90445E-14| +| 20| 0.931455 +i* 0.363856| 1|-6.42708E-13 +i*-1.50318E-12| ++---+----------------------------+------------+----------------------------+ +799998 racines de module = 1 + 2 racines de module = 0.999973 diff --git a/Simulations/full_openmp/full_openmp_3GPU.sge b/Simulations/full_openmp/full_openmp_3GPU.sge new file mode 100755 index 0000000..c3a277c --- /dev/null +++ b/Simulations/full_openmp/full_openmp_3GPU.sge @@ -0,0 +1,27 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=3 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -pe openmp 3 +#$ -V +#$ -cwd +#$ -N full_openmp_3GPU + +module load gcc/4.9.0 +module load cuda/7.0 + + +./template -r -i 60000 40000 +./template -r -i 150000 50000 +./template -r -i 250000 150000 +./template -r -i 350000 250000 +./template -r -i 500000 300000 +./template -r -i 600000 400000 +./template -r -i 700000 500000 +./template -r -i 800000 600000 +#./template -r -i 900000 700000 +#./template -r -i 1000000 800000 +#./template -r -i 1500000 500000 + + diff --git a/Simulations/full_openmp/full_openmp_4GPU.o140162 b/Simulations/full_openmp/full_openmp_4GPU.o140162 new file mode 100644 index 0000000..5a3649d --- /dev/null +++ b/Simulations/full_openmp/full_openmp_4GPU.o140162 @@ -0,0 +1,590 @@ +REMAINING: 4 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +Taking GPU #3 +zone limite de 'log-exp' 1.00593 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 3 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 3 dimgrid2 59 start 45120 size 15040 +gpu 2 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 2 dimgrid2 59 start 30080 size 15040 +gpu 0 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 0 dimgrid2 59 start 0 size 15040 +gpu 1 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 1 dimgrid2 59 start 15040 size 15040 +gpu 0 iter : 1 Arret : 4.54253E-05 s/iter 0.204175 +gpu 0 iter : 2 Arret : 4.02349E-05 s/iter 0.189665 +gpu 0 iter : 3 Arret : 3.82695E-05 s/iter 0.189681 +gpu 0 iter : 4 Arret : 3.90123E-05 s/iter 0.189717 +gpu 0 iter : 5 Arret : 4.05115E-05 s/iter 0.189657 +gpu 0 iter : 6 Arret : 4.39547E-05 s/iter 0.189790 +gpu 0 iter : 7 Arret : 5.45799E-05 s/iter 0.189703 +gpu 0 iter : 8 Arret : 0.000119388 s/iter 0.189738 +gpu 0 iter : 9 Arret : 0.00119487 s/iter 0.189634 +gpu 0 iter : 10 Arret : 0.00289573 s/iter 0.189661 +gpu 0 iter : 11 Arret : 2.16041 s/iter 0.189628 +gpu 0 iter : 12 Arret : 0.350069 s/iter 0.189703 +gpu 0 iter : 13 Arret : 0.131331 s/iter 1.021619 +gpu 0 iter : 14 Arret : 0.0516998 s/iter 1.018752 +gpu 0 iter : 15 Arret : 0.0205122 s/iter 1.016639 +gpu 0 iter : 16 Arret : 0.012334 s/iter 1.013349 +gpu 0 iter : 17 Arret : 0.00704057 s/iter 1.007092 +gpu 0 iter : 18 Arret : 0.00458473 s/iter 0.868843 +gpu 0 iter : 19 Arret : 0.00325386 s/iter 0.853210 +gpu 0 iter : 20 Arret : 0.00249036 s/iter 0.836780 +gpu 0 iter : 21 Arret : 0.0018094 s/iter 0.184672 +gpu 0 iter : 22 Arret : 0.00401767 s/iter 0.184541 +gpu 0 iter : 23 Arret : 0.048161 s/iter 0.183544 +gpu 0 iter : 24 Arret : 0.00734855 s/iter 0.178753 +gpu 0 iter : 25 Arret : 0.0107124 s/iter 0.178628 +gpu 0 iter : 26 Arret : 0.00180991 s/iter 0.172491 +gpu 0 iter : 27 Arret : 0.000329189 s/iter 0.172292 +gpu 0 iter : 28 Arret : 7.3153E-05 s/iter 0.172287 +gpu 0 iter : 29 Arret : 9.70999E-06 s/iter 0.172276 +gpu 0 iter : 30 Arret : 5.49374E-08 s/iter 0.172248 +gpu 0 iter : 31 Arret : 1.71107E-12 s/iter 0.172323 +gpu 0 iter : 32 Arret : 1.57009E-16 s/iter 0.172301 +temps : 13.5366 seconde(s) +Nb iterations : 32 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.35784E-10 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540783 +i* 0.841162| 1|-7.58456E-14 +i* 3.78031E-14| +| 2| -0.992343 +i* -0.123513| 1|-4.36456E-15 +i* 3.59435E-15| +| 3| 0.0563346 +i* 0.998412| 1| 5.70377E-15 +i* 3.3501E-14| +| 4| -0.802793 +i* -0.596258| 1| 2.03657E-15 +i* 1.01915E-14| +| 5| 0.730552 +i* -0.682857| 1|-7.48429E-14 +i* 6.77011E-14| +| 6| -0.442728 +i* 0.896656| 1|-3.77198E-14 +i*-1.89779E-15| +| 7| -0.404888 +i* -0.914366| 1| 3.20195E-14 +i* 9.65894E-15| +| 8| 0.972126 +i* -0.23446| 1| 4.02421E-14 +i*-1.54755E-14| +| 9| -0.826939 +i* 0.562292| 1| -2.4928E-14 +i*-1.59889E-14| +| 10| 0.0979895 +i* -0.995187| 1| 2.90878E-14 +i*-6.75675E-15| +| 11| 0.961513 +i* 0.27476| 1|-9.39769E-14 +i*-2.63912E-13| +| 12| -0.996627 +i* 0.0820589| 1| 2.39773E-14 +i* 1.74825E-14| +| 13| 0.575447 +i* -0.817839| 1|-3.49894E-14 +i*-7.98545E-14| +| 14| 0.701466 +i* 0.712703| 1| 7.52211E-14 +i* 1.53991E-14| +| 15| 0.259346 +i* 0.965785| 1|-2.14863E-14 +i*-2.81355E-14| +| 16| -0.907773 +i* -0.419461| 1|-3.62869E-14 +i*-9.49414E-15| +| 17| 0.903623 +i* -0.428329| 1|-1.24969E-14 +i* 7.51222E-14| +| 18| -0.249979 +i* 0.968251| 1|-1.59074E-14 +i*-1.09721E-14| +| 19| -0.583341 +i* -0.812227| 1| 1.92242E-14 +i* 2.27058E-14| +| 20| 0.997383 +i* 0.072297| 1| 2.53037E-13 +i*-5.92819E-13| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 1 +zone limite de 'log-exp' 1.00237 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 0 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 0 dimgrid2 147 start 0 size 37504 +gpu 3 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 3 dimgrid2 147 start 112512 size 37504 +gpu 1 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 1 dimgrid2 147 start 37504 size 37504 +gpu 2 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 2 dimgrid2 147 start 75008 size 37504 +gpu 0 iter : 1 Arret : 1.6116E-05 s/iter 1.403394 +gpu 0 iter : 2 Arret : 1.52925E-05 s/iter 1.387067 +gpu 0 iter : 3 Arret : 1.51523E-05 s/iter 1.386759 +gpu 0 iter : 4 Arret : 1.86476E-05 s/iter 1.382149 +gpu 0 iter : 5 Arret : 1.57671E-05 s/iter 1.386808 +gpu 0 iter : 6 Arret : 1.6295E-05 s/iter 1.386892 +gpu 0 iter : 7 Arret : 1.80188E-05 s/iter 1.386856 +gpu 0 iter : 8 Arret : 2.08003E-05 s/iter 1.386801 +gpu 0 iter : 9 Arret : 3.59837E-05 s/iter 1.386900 +gpu 0 iter : 10 Arret : 0.00139949 s/iter 1.381972 +gpu 0 iter : 11 Arret : 0.00379917 s/iter 1.387000 +gpu 0 iter : 12 Arret : 0.00480593 s/iter 2.678954 +gpu 0 iter : 13 Arret : 0.0063728 s/iter 2.972359 +gpu 0 iter : 14 Arret : 0.0158488 s/iter 1.381889 +gpu 0 iter : 15 Arret : 0.0137848 s/iter 3.041156 +gpu 0 iter : 16 Arret : 0.0131859 s/iter 1.379081 +gpu 0 iter : 17 Arret : 1.29468 s/iter 3.020840 +gpu 0 iter : 18 Arret : 0.0424345 s/iter 3.418165 +gpu 0 iter : 19 Arret : 0.0201069 s/iter 3.422654 +gpu 0 iter : 20 Arret : 0.00607561 s/iter 2.950185 +gpu 0 iter : 21 Arret : 0.00629018 s/iter 3.290739 +gpu 0 iter : 22 Arret : 0.00557589 s/iter 1.335444 +gpu 0 iter : 23 Arret : 0.000991862 s/iter 1.330521 +gpu 0 iter : 24 Arret : 0.00206487 s/iter 1.322392 +gpu 0 iter : 25 Arret : 0.000365679 s/iter 1.334823 +gpu 0 iter : 26 Arret : 0.000144648 s/iter 1.333867 +gpu 0 iter : 27 Arret : 0.00033044 s/iter 1.332139 +gpu 0 iter : 28 Arret : 1.48376E-05 s/iter 1.334037 +gpu 0 iter : 29 Arret : 4.12386E-10 s/iter 1.324928 +gpu 0 iter : 30 Arret : 4.00547E-15 s/iter 1.333918 +temps : 56.2628 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.26535E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540528 +i* 0.841326| 1| 8.68923E-14 +i* 2.2979E-13| +| 2| -0.905603 +i* -0.424127| 1| 6.50001E-14 +i* -3.0061E-14| +| 3| -0.774122 +i* 0.633037| 1|-3.89619E-14 +i*-6.71876E-14| +| 4| 0.317935 +i* -0.948113| 1| 4.656E-15 +i* 1.15645E-13| +| 5| 0.235978 +i* 0.971758| 1|-2.91295E-14 +i*-3.06716E-14| +| 6| -0.717299 +i* -0.696766| 1| 5.63785E-15 +i*-6.71685E-14| +| 7| 0.992349 +i* -0.123462| 1|-4.81056E-13 +i* 9.00335E-13| +| 8| -0.938482 +i* 0.345329| 1|-6.95555E-14 +i*-3.79159E-14| +| 9| 0.610294 +i* -0.792175| 1| -5.4852E-14 +i*-3.26232E-14| +| 10| -0.0946394 +i* 0.995512| 1|-4.73788E-14 +i*-8.10827E-14| +| 11| -0.450242 +i* -0.892906| 1| 2.41855E-14 +i*-3.23699E-15| +| 12| 0.978218 +i* 0.207583| 1|-2.84429E-13 +i* 4.69725E-13| +| 13| -0.999806 +i* 0.0197069| 1|-4.72365E-14 +i*-2.55716E-14| +| 14| 0.835648 +i* -0.549265| 1|-2.95892E-13 +i* 2.34143E-13| +| 15| -0.414707 +i* 0.909955| 1| 7.26225E-14 +i*-1.70003E-15| +| 16| -0.133754 +i* -0.991015| 1|-2.88485E-14 +i* 2.14499E-14| +| 17| 0.856687 +i* 0.515837| 1| 1.49106E-13 +i* 3.95153E-14| +| 18| -0.951361 +i* -0.308079| 1| 3.78308E-14 +i* 4.65843E-14| +| 19| 0.969257 +i* -0.24605| 1| 5.51163E-13 +i*-4.79498E-13| +| 20| -0.689285 +i* 0.724491| 1| 2.40086E-15 +i*-3.61777E-14| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1 +zone limite de 'log-exp' 1.00142 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 2 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 2 dimgrid2 245 start 125056 size 62528 +gpu 0 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 0 dimgrid2 245 start 0 size 62528 +gpu 3 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 3 dimgrid2 245 start 187584 size 62528 +gpu 1 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 1 dimgrid2 245 start 62528 size 62528 +gpu 0 iter : 1 Arret : 1.14841E-05 s/iter 3.820958 +gpu 0 iter : 2 Arret : 9.97904E-06 s/iter 3.814972 +gpu 0 iter : 3 Arret : 1.0158E-05 s/iter 3.809374 +gpu 0 iter : 4 Arret : 9.50123E-06 s/iter 3.808973 +gpu 0 iter : 5 Arret : 9.84188E-06 s/iter 3.808465 +gpu 0 iter : 6 Arret : 9.56156E-06 s/iter 3.815126 +gpu 0 iter : 7 Arret : 9.85167E-06 s/iter 3.816179 +gpu 0 iter : 8 Arret : 1.00437E-05 s/iter 3.818435 +gpu 0 iter : 9 Arret : 3.05444E-05 s/iter 3.817012 +gpu 0 iter : 10 Arret : 0.00147405 s/iter 3.816247 +gpu 0 iter : 11 Arret : 0.00154571 s/iter 3.810174 +gpu 0 iter : 12 Arret : 0.000731342 s/iter 3.808902 +gpu 0 iter : 13 Arret : 0.00122682 s/iter 3.808356 +gpu 0 iter : 14 Arret : 0.00109532 s/iter 3.815259 +gpu 0 iter : 15 Arret : 0.0011892 s/iter 3.779459 +gpu 0 iter : 16 Arret : 0.000794066 s/iter 2.968072 +gpu 0 iter : 17 Arret : 0.00960632 s/iter 2.174069 +gpu 0 iter : 18 Arret : 0.3054 s/iter 4.920214 +gpu 0 iter : 19 Arret : 0.00164869 s/iter 2.134462 +gpu 0 iter : 20 Arret : 0.00100296 s/iter 2.137935 +gpu 0 iter : 21 Arret : 0.000263024 s/iter 2.128112 +gpu 0 iter : 22 Arret : 0.0007086 s/iter 2.111936 +gpu 0 iter : 23 Arret : 0.00101441 s/iter 2.112455 +gpu 0 iter : 24 Arret : 0.000848875 s/iter 2.109033 +gpu 0 iter : 25 Arret : 0.00150539 s/iter 2.111749 +gpu 0 iter : 26 Arret : 5.16459E-05 s/iter 2.096918 +gpu 0 iter : 27 Arret : 1.87546E-07 s/iter 2.098589 +gpu 0 iter : 28 Arret : 2.77608E-13 s/iter 2.110056 +temps : 89.8766 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.3128E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540427 +i* 0.841391| 1| 9.7148E-14 +i*-1.98189E-13| +| 2| -0.997949 +i* 0.0640067| 1| 1.02696E-14 +i* 2.88415E-14| +| 3| 0.450991 +i* -0.892528| 1| 2.39739E-15 +i* 7.66835E-14| +| 4| 0.42851 +i* -0.903537| 1| 1.03733E-13 +i* 1.27433E-14| +| 5| -0.996035 +i* 0.0889649| 1| 5.1386E-14 +i* 4.21729E-14| +| 6| 0.581876 +i* 0.813277| 1| 3.29906E-13 +i* -3.5718E-15| +| 7| 0.405761 +i* -0.913979| 1| 1.69923E-13 +i*-8.86062E-14| +| 8| -0.993496 +i* 0.113867| 1| 6.34562E-14 +i* 6.04291E-14| +| 9| 0.60205 +i* 0.798458| 1| 2.39371E-13 +i* -2.2848E-13| +| 10| 0.382757 +i* -0.923849| 1| 6.36852E-14 +i* 1.1601E-13| +| 11| -0.990335 +i* 0.138698| 1| 8.32286E-14 +i* 4.57395E-14| +| 12| 0.621846 +i* 0.783139| 1| 3.5482E-14 +i*-1.57841E-13| +| 13| 0.359514 +i* -0.93314| 1| 1.00985E-13 +i*-2.52237E-13| +| 14| -0.986553 +i* 0.163442| 1| 3.24636E-14 +i* 4.58574E-14| +| 15| 0.641253 +i* 0.767329| 1| 1.79533E-13 +i* 3.03096E-13| +| 16| 0.336045 +i* -0.941846| 1| 1.38948E-13 +i*-8.14071E-14| +| 17| -0.982153 +i* 0.188084| 1| 6.94549E-14 +i* 3.09405E-14| +| 18| 0.660258 +i* 0.751039| 1| 4.21871E-13 +i* 5.02185E-14| +| 19| 0.312366 +i* -0.949962| 1|-6.37199E-14 +i*-7.39669E-14| +| 20| -0.977138 +i* 0.212608| 1|-3.80633E-14 +i* -8.4285E-14| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 1 +zone limite de 'log-exp' 1.00101 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 0 (of 4) uses CUDA device 0 +gpu 3 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 3 dimgrid2 342 start 262656 size 87552 +gpu 2 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 2 dimgrid2 342 start 175104 size 87552 +gpu 1 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 1 dimgrid2 342 start 87552 size 87552 +gpu 0 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 0 dimgrid2 342 start 0 size 87552 +gpu 0 iter : 1 Arret : 6.88539E-06 s/iter 6.540061 +gpu 0 iter : 2 Arret : 6.8684E-06 s/iter 6.536458 +gpu 0 iter : 3 Arret : 7.55734E-06 s/iter 6.535814 +gpu 0 iter : 4 Arret : 6.96901E-06 s/iter 6.536741 +gpu 0 iter : 5 Arret : 6.72451E-06 s/iter 6.533504 +gpu 0 iter : 6 Arret : 6.76555E-06 s/iter 6.534876 +gpu 0 iter : 7 Arret : 7.08866E-06 s/iter 6.534819 +gpu 0 iter : 8 Arret : 7.79946E-06 s/iter 6.533534 +gpu 0 iter : 9 Arret : 9.74863E-06 s/iter 6.531511 +gpu 0 iter : 10 Arret : 0.000378804 s/iter 6.530246 +gpu 0 iter : 11 Arret : 0.000478777 s/iter 6.545753 +gpu 0 iter : 12 Arret : 0.0010319 s/iter 6.531644 +gpu 0 iter : 13 Arret : 0.810083 s/iter 6.532661 +gpu 0 iter : 14 Arret : 3.38477 s/iter 9.611632 +gpu 0 iter : 15 Arret : 0.137317 s/iter 9.586509 +gpu 0 iter : 16 Arret : 0.0655441 s/iter 11.282824 +gpu 0 iter : 17 Arret : 0.0396702 s/iter 11.222823 +gpu 0 iter : 18 Arret : 0.165636 s/iter 11.248406 +gpu 0 iter : 19 Arret : 0.114767 s/iter 11.345882 +gpu 0 iter : 20 Arret : 0.0535778 s/iter 11.198285 +gpu 0 iter : 21 Arret : 0.0468459 s/iter 10.374819 +gpu 0 iter : 22 Arret : 0.0531479 s/iter 11.376048 +gpu 0 iter : 23 Arret : 0.0587573 s/iter 9.681631 +gpu 0 iter : 24 Arret : 0.380742 s/iter 9.616663 +gpu 0 iter : 25 Arret : 0.158886 s/iter 6.481929 +gpu 0 iter : 26 Arret : 0.19048 s/iter 10.400978 +gpu 0 iter : 27 Arret : 0.115233 s/iter 7.157960 +gpu 0 iter : 28 Arret : 0.0624603 s/iter 7.226846 +gpu 0 iter : 29 Arret : 0.00065803 s/iter 6.480500 +gpu 0 iter : 30 Arret : 2.18809E-05 s/iter 6.480583 +gpu 0 iter : 31 Arret : 3.02291E-05 s/iter 6.478820 +gpu 0 iter : 32 Arret : 6.59107E-06 s/iter 6.479051 +gpu 0 iter : 33 Arret : 1.18098E-07 s/iter 6.480090 +gpu 0 iter : 34 Arret : 1.37334E-12 s/iter 6.481310 +gpu 0 iter : 35 Arret : 1.11023E-16 s/iter 6.479636 +temps : 279.804 seconde(s) +Nb iterations : 35 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.46096E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540399 +i* 0.841409| 1| 5.12961E-13 +i*-3.37404E-15| +| 2| -0.385479 +i* 0.922716| 1| -1.616E-13 +i*-2.73566E-14| +| 3| -0.770131 +i* 0.637886| 1|-1.38431E-15 +i* 1.70921E-13| +| 4| -0.978357 +i* 0.206925| 1|-3.07393E-15 +i* 4.96131E-15| +| 5| -0.962455 +i* -0.27144| 1|-5.85088E-14 +i* 7.9714E-14| +| 6| -0.72607 +i* -0.687621| 1| -2.0612E-14 +i* 2.87948E-13| +| 7| -0.323352 +i* -0.946279| 1| 2.27159E-13 +i* 7.30891E-14| +| 8| 0.153459 +i* -0.988155| 1| 4.60049E-15 +i*-2.43555E-14| +| 9| 0.595097 +i* -0.803654| 1|-3.46265E-13 +i* 1.60098E-14| +| 10| 0.900408 +i* -0.435047| 1| 3.20081E-13 +i*-1.77827E-14| +| 11| 0.999448 +i* 0.0332229| 1|-5.70342E-13 +i* 1.21308E-12| +| 12| 0.869529 +i* 0.493882| 1| 3.01252E-14 +i* 6.11216E-13| +| 13| 0.211292 +i* 0.977423| 1|-6.97532E-14 +i* 1.23212E-13| +| 14| -0.267139 +i* 0.963658| 1|-9.26238E-14 +i*-7.20968E-14| +| 15| -0.684372 +i* 0.729133| 1| 1.64042E-13 +i*-1.89831E-14| +| 16| -0.944825 +i* 0.327574| 1| 3.70572E-14 +i*-6.84904E-14| +| 17| -0.988833 +i* -0.149027| 1|-1.41002E-13 +i* 2.02581E-14| +| 18| -0.806314 +i* -0.591488| 1| 1.24668E-13 +i*-2.62805E-13| +| 19| -0.439079 +i* -0.898448| 1|-1.76949E-13 +i*-1.05707E-13| +| 20| 0.0287415 +i* -0.999587| 1| 1.62724E-13 +i*-6.82891E-14| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 1 +zone limite de 'log-exp' 1.00071 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 3 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 3 dimgrid2 489 start 375168 size 125056 +gpu 1 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 1 dimgrid2 489 start 125056 size 125056 +gpu 0 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 0 dimgrid2 489 start 0 size 125056 +gpu 2 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 2 dimgrid2 489 start 250112 size 125056 +gpu 0 iter : 1 Arret : 5.43682E-06 s/iter 13.802902 +gpu 0 iter : 2 Arret : 4.91044E-06 s/iter 13.790958 +gpu 0 iter : 3 Arret : 4.91315E-06 s/iter 13.790511 +gpu 0 iter : 4 Arret : 4.67858E-06 s/iter 13.806112 +gpu 0 iter : 5 Arret : 4.77709E-06 s/iter 13.805612 +gpu 0 iter : 6 Arret : 4.66912E-06 s/iter 13.804348 +gpu 0 iter : 7 Arret : 4.83022E-06 s/iter 13.804019 +gpu 0 iter : 8 Arret : 5.21278E-06 s/iter 13.800214 +gpu 0 iter : 9 Arret : 6.23421E-06 s/iter 13.801225 +gpu 0 iter : 10 Arret : 0.000564578 s/iter 13.800687 +gpu 0 iter : 11 Arret : 0.000810388 s/iter 13.802100 +gpu 0 iter : 12 Arret : 0.00138997 s/iter 13.800427 +gpu 0 iter : 13 Arret : 0.00220275 s/iter 18.005536 +gpu 0 iter : 14 Arret : 0.00421803 s/iter 13.791507 +gpu 0 iter : 15 Arret : 0.00623459 s/iter 13.530051 +gpu 0 iter : 16 Arret : 1.4756 s/iter 11.805523 +gpu 0 iter : 17 Arret : 0.0156198 s/iter 14.532176 +gpu 0 iter : 18 Arret : 0.0107648 s/iter 13.020495 +gpu 0 iter : 19 Arret : 0.0045075 s/iter 12.656318 +gpu 0 iter : 20 Arret : 0.00121976 s/iter 8.450054 +gpu 0 iter : 21 Arret : 0.000890648 s/iter 11.499489 +gpu 0 iter : 22 Arret : 0.00233504 s/iter 7.388259 +gpu 0 iter : 23 Arret : 0.00149094 s/iter 7.283653 +gpu 0 iter : 24 Arret : 0.00113868 s/iter 11.307597 +gpu 0 iter : 25 Arret : 0.000125947 s/iter 7.035207 +gpu 0 iter : 26 Arret : 2.52318E-05 s/iter 6.864347 +gpu 0 iter : 27 Arret : 3.0855E-08 s/iter 6.748053 +gpu 0 iter : 28 Arret : 9.3245E-14 s/iter 5.878949 +temps : 337.034 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.48768E-08 +Stabilite : 1.41899E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540372 +i* 0.841426| 1|-3.05235E-13 +i* 1.38721E-13| +| 2| 0.561316 +i* 0.827602| 1|-2.60021E-13 +i* 1.9206E-13| +| 3| 0.57165 +i* 0.820497| 1|-1.83308E-13 +i* 6.15844E-14| +| 4| 0.581895 +i* 0.813264| 1| 3.05839E-13 +i* 6.52482E-14| +| 5| 0.592048 +i* 0.805902| 1|-7.14016E-13 +i*-3.98882E-14| +| 6| 0.602109 +i* 0.798414| 1| 2.66658E-13 +i*-4.75979E-13| +| 7| 0.612074 +i* 0.7908| 1| 3.16743E-13 +i*-3.40844E-13| +| 8| 0.621943 +i* 0.783062| 1| 5.64146E-13 +i*-3.14632E-13| +| 9| 0.631715 +i* 0.775201| 1|-3.83756E-14 +i* 5.41086E-13| +| 10| 0.641387 +i* 0.767218| 1| 4.00499E-13 +i*-3.71465E-13| +| 11| 0.650958 +i* 0.759114| 1| 7.58768E-15 +i*-5.54055E-13| +| 12| 0.660427 +i* 0.750891| 1| 7.47999E-13 +i* 2.73089E-13| +| 13| 0.669792 +i* 0.742549| 1| 9.40577E-13 +i* 3.39433E-14| +| 14| 0.679051 +i* 0.734091| 1| 4.34264E-13 +i*-1.04887E-13| +| 15| 0.688204 +i* 0.725517| 1|-6.26926E-13 +i*-1.86798E-13| +| 16| 0.697248 +i* 0.71683| 1| 2.2389E-13 +i*-9.46795E-14| +| 17| 0.706183 +i* 0.708029| 1| 4.79186E-13 +i* 4.75144E-13| +| 18| 0.715007 +i* 0.699117| 1| 6.39138E-13 +i* 4.95824E-13| +| 19| 0.723718 +i* 0.690096| 1| -1.2694E-13 +i* 4.44528E-13| +| 20| 0.732316 +i* 0.680965| 1|-2.76158E-13 +i* 1.17734E-13| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +zone limite de 'log-exp' 1.00059 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 586 start 0 size 150016 +gpu 2 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 2 dimgrid2 586 start 300032 size 150016 +gpu 3 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 3 dimgrid2 586 start 450048 size 150016 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 586 start 150016 size 150016 +gpu 0 iter : 1 Arret : 4.20321E-06 s/iter 18.776658 +gpu 0 iter : 2 Arret : 4.13056E-06 s/iter 18.721323 +gpu 0 iter : 3 Arret : 4.11084E-06 s/iter 18.739702 +gpu 0 iter : 4 Arret : 4.14768E-06 s/iter 18.725990 +gpu 0 iter : 5 Arret : 3.97777E-06 s/iter 18.735245 +gpu 0 iter : 6 Arret : 4.16195E-06 s/iter 18.723334 +gpu 0 iter : 7 Arret : 4.19454E-06 s/iter 18.733188 +gpu 0 iter : 8 Arret : 4.62315E-06 s/iter 18.730439 +gpu 0 iter : 9 Arret : 6.05437E-06 s/iter 18.723590 +gpu 0 iter : 10 Arret : 1.53978E-05 s/iter 18.723454 +gpu 0 iter : 11 Arret : 0.000456524 s/iter 18.740808 +gpu 0 iter : 12 Arret : 0.00137167 s/iter 18.729445 +gpu 0 iter : 13 Arret : 0.00165831 s/iter 18.748008 +gpu 0 iter : 14 Arret : 1.38016 s/iter 18.749001 +gpu 0 iter : 15 Arret : 0.619057 s/iter 19.564421 +gpu 0 iter : 16 Arret : 0.0544873 s/iter 20.890543 +gpu 0 iter : 17 Arret : 0.0338392 s/iter 23.493737 +gpu 0 iter : 18 Arret : 0.0124964 s/iter 20.037893 +gpu 0 iter : 19 Arret : 0.00639686 s/iter 21.581791 +gpu 0 iter : 20 Arret : 0.00399724 s/iter 18.002558 +gpu 0 iter : 21 Arret : 0.00256288 s/iter 17.692790 +gpu 0 iter : 22 Arret : 0.000413689 s/iter 17.539980 +gpu 0 iter : 23 Arret : 0.0010819 s/iter 17.582527 +gpu 0 iter : 24 Arret : 0.000517706 s/iter 17.387151 +gpu 0 iter : 25 Arret : 1.40294E-05 s/iter 17.415382 +gpu 0 iter : 26 Arret : 1.44098E-06 s/iter 17.345061 +gpu 0 iter : 27 Arret : 2.93009E-09 s/iter 16.538716 +gpu 0 iter : 28 Arret : 8.5314E-15 s/iter 16.484147 +temps : 525.532 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 8.5314E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.553493 +i* -0.832854| 1|-5.02858E-13 +i* 3.83374E-15| +| 3| -0.579338 +i* -0.815087| 1| 4.42365E-13 +i* 2.65846E-14| +| 4| 0.592057 +i* 0.805896| 1| 2.06783E-13 +i* 1.94549E-13| +| 5| -0.604613 +i* -0.796519| 1| 2.39135E-13 +i* 2.96967E-13| +| 6| 0.617037 +i* 0.786934| 1|-3.70964E-13 +i* 2.85104E-13| +| 7| -0.629293 +i* -0.777168| 1| 3.4002E-13 +i* 1.14925E-14| +| 8| 0.641411 +i* 0.767198| 1|-6.01835E-13 +i* 5.70316E-13| +| 9| -0.653354 +i* -0.757052| 1| 3.00003E-14 +i* 4.1084E-13| +| 10| 0.665153 +i* 0.746707| 1|-9.55243E-14 +i* 7.739E-13| +| 11| -0.676773 +i* -0.736192| 1|-3.70891E-13 +i* 4.31963E-14| +| 12| 0.688242 +i* 0.725482| 1| 4.17319E-13 +i*-2.25125E-13| +| 13| -0.699526 +i* -0.714607| 1|-1.55074E-13 +i* 3.9467E-13| +| 14| 0.710653 +i* 0.703543| 1|-7.94843E-13 +i* 5.61671E-13| +| 15| -0.721591 +i* -0.69232| 1|-8.20351E-14 +i* 3.39909E-13| +| 16| 0.732366 +i* 0.680912| 1| 5.01595E-13 +i* 2.59279E-13| +| 17| -0.742946 +i* -0.669351| 1|-1.90181E-13 +i* 1.23972E-13| +| 18| 0.753358 +i* 0.657611| 1|-7.14661E-13 +i*-3.96187E-13| +| 19| -0.76357 +i* -0.645725| 1|-3.31242E-13 +i*-8.50865E-14| +| 20| 0.773609 +i* 0.633664| 1|-7.93813E-13 +i* 2.09313E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +zone limite de 'log-exp' 1.00051 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 3 (of 4) uses CUDA device 3 +gpu 2 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 2 dimgrid2 684 start 350080 size 175040 +gpu 0 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 1 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 1 dimgrid2 684 start 175040 size 175040 +gpu 0 dimgrid2 684 start 0 size 175040 +gpu 3 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 3 dimgrid2 684 start 525120 size 175040 +gpu 0 iter : 1 Arret : 4.05179E-06 s/iter 26.057760 +gpu 0 iter : 2 Arret : 3.69041E-06 s/iter 26.006401 +gpu 0 iter : 3 Arret : 3.54349E-06 s/iter 26.017285 +gpu 0 iter : 4 Arret : 3.54342E-06 s/iter 26.011286 +gpu 0 iter : 5 Arret : 3.59693E-06 s/iter 26.022969 +gpu 0 iter : 6 Arret : 3.48529E-06 s/iter 26.021812 +gpu 0 iter : 7 Arret : 3.57662E-06 s/iter 26.011888 +gpu 0 iter : 8 Arret : 3.69147E-06 s/iter 26.008709 +gpu 0 iter : 9 Arret : 3.94782E-06 s/iter 26.004937 +gpu 0 iter : 10 Arret : 6.25107E-05 s/iter 26.012739 +gpu 0 iter : 11 Arret : 0.00192614 s/iter 26.023084 +gpu 0 iter : 12 Arret : 0.00191367 s/iter 26.017884 +gpu 0 iter : 13 Arret : 0.0032574 s/iter 26.009004 +gpu 0 iter : 14 Arret : 0.00729301 s/iter 35.180983 +gpu 0 iter : 15 Arret : 0.00245317 s/iter 26.015276 +gpu 0 iter : 16 Arret : 0.00433319 s/iter 25.893105 +gpu 0 iter : 17 Arret : 0.00843918 s/iter 31.680916 +gpu 0 iter : 18 Arret : 0.00512235 s/iter 31.753281 +gpu 0 iter : 19 Arret : 0.161408 s/iter 28.844658 +gpu 0 iter : 20 Arret : 0.0369396 s/iter 28.748462 +gpu 0 iter : 21 Arret : 0.0443209 s/iter 28.918638 +gpu 0 iter : 22 Arret : 0.00926227 s/iter 28.518098 +gpu 0 iter : 23 Arret : 0.10139 s/iter 28.915161 +gpu 0 iter : 24 Arret : 0.087367 s/iter 28.998391 +gpu 0 iter : 25 Arret : 0.00915331 s/iter 28.869297 +gpu 0 iter : 26 Arret : 0.000166928 s/iter 25.732016 +gpu 0 iter : 27 Arret : 8.36929E-05 s/iter 25.736037 +gpu 0 iter : 28 Arret : 1.72536E-05 s/iter 25.733697 +gpu 0 iter : 29 Arret : 7.0611E-08 s/iter 25.745297 +gpu 0 iter : 30 Arret : 2.0544E-12 s/iter 25.733511 +gpu 0 iter : 31 Arret : 1.57009E-16 s/iter 25.739637 +temps : 846.791 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.46262E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540352 +i* 0.841439| 1| 4.39978E-13 +i* 6.25043E-13| +| 2| -0.996034 +i* 0.0889731| 1| 2.2073E-13 +i* 1.55296E-13| +| 3| 0.439836 +i* -0.898078| 1|-3.55927E-13 +i*-1.21738E-13| +| 4| 0.38266 +i* -0.923889| 1|-2.56142E-13 +i*-7.02285E-14| +| 5| -0.988496 +i* 0.15125| 1|-1.52652E-13 +i*-1.11329E-13| +| 6| 0.641421 +i* 0.767189| 1|-1.31044E-13 +i* 5.61736E-13| +| 7| 0.323979 +i* -0.946064| 1|-4.52336E-13 +i* 8.74596E-14| +| 8| -0.977067 +i* 0.212932| 1| 8.58341E-14 +i* 1.73412E-13| +| 9| 0.688262 +i* 0.725462| 1| 4.28754E-14 +i* 1.08849E-12| +| 10| 0.264022 +i* -0.964517| 1|-3.63883E-13 +i*-8.14886E-14| +| 11| -0.961793 +i* 0.273776| 1| -3.0213E-13 +i*-2.13897E-13| +| 12| 0.732395 +i* 0.68088| 1|-3.65194E-14 +i* 7.95483E-13| +| 13| 0.203027 +i* -0.979173| 1|-3.14502E-13 +i* 2.96924E-13| +| 14| -0.942735 +i* 0.333543| 1| 1.82947E-13 +i*-4.73458E-14| +| 15| 0.773646 +i* 0.633619| 1| 2.24352E-13 +i* 2.79674E-13| +| 16| 0.141232 +i* -0.989977| 1| -1.0035E-13 +i* 1.5693E-13| +| 17| -0.919967 +i* 0.391997| 1| 2.89213E-14 +i*-1.86252E-13| +| 18| 0.811852 +i* 0.583864| 1|-1.59939E-12 +i*-4.13669E-13| +| 19| 0.0788818 +i* -0.996884| 1|-2.83003E-13 +i* 1.04711E-13| +| 20| -0.893578 +i* 0.448908| 1| 4.59736E-14 +i* 1.31414E-13| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 1 +zone limite de 'log-exp' 1.00044 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 3 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 3 dimgrid2 782 start 600000 size 200000 +gpu 2 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 2 dimgrid2 782 start 400000 size 200000 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 782 start 0 size 200000 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 782 start 200000 size 200000 +gpu 0 iter : 1 Arret : 3.03518E-06 s/iter 34.140422 +gpu 0 iter : 2 Arret : 3.08048E-06 s/iter 34.112195 +gpu 0 iter : 3 Arret : 3.01956E-06 s/iter 34.096993 +gpu 0 iter : 4 Arret : 3.09293E-06 s/iter 34.110543 +gpu 0 iter : 5 Arret : 3.08006E-06 s/iter 34.076662 +gpu 0 iter : 6 Arret : 3.01434E-06 s/iter 34.084058 +gpu 0 iter : 7 Arret : 3.18584E-06 s/iter 34.136831 +gpu 0 iter : 8 Arret : 3.3042E-06 s/iter 34.131267 +gpu 0 iter : 9 Arret : 4.06872E-06 s/iter 34.106772 +gpu 0 iter : 10 Arret : 8.81449E-06 s/iter 34.108408 +gpu 0 iter : 11 Arret : 0.000633965 s/iter 34.129789 +gpu 0 iter : 12 Arret : 0.00092939 s/iter 34.108349 +gpu 0 iter : 13 Arret : 2.168 s/iter 34.099124 +gpu 0 iter : 14 Arret : 0.959162 s/iter 39.514454 +gpu 0 iter : 15 Arret : 1.25264 s/iter 39.163345 +gpu 0 iter : 16 Arret : 0.0492202 s/iter 41.068013 +gpu 0 iter : 17 Arret : 0.0215834 s/iter 32.733350 +gpu 0 iter : 18 Arret : 0.0247446 s/iter 37.879052 +gpu 0 iter : 19 Arret : 0.0179454 s/iter 29.650763 +gpu 0 iter : 20 Arret : 0.0206764 s/iter 29.407317 +gpu 0 iter : 21 Arret : 0.0222049 s/iter 35.012713 +gpu 0 iter : 22 Arret : 0.00255914 s/iter 27.067142 +gpu 0 iter : 23 Arret : 0.000919373 s/iter 25.980531 +gpu 0 iter : 24 Arret : 0.0031468 s/iter 24.573430 +gpu 0 iter : 25 Arret : 0.00100214 s/iter 23.918440 +gpu 0 iter : 26 Arret : 4.12095E-06 s/iter 23.670339 +gpu 0 iter : 27 Arret : 1.25002E-07 s/iter 23.794441 +gpu 0 iter : 28 Arret : 1.03352E-11 s/iter 23.663739 +gpu 0 iter : 29 Arret : 1.57009E-16 s/iter 23.563580 +temps : 925.912 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| 0.592061 +i* 0.805893| 1|-1.57249E-13 +i*-4.43364E-13| +| 3| 0.617051 +i* 0.786923| 1|-6.42805E-13 +i*-3.49094E-13| +| 4| 0.641434 +i* 0.767178| 1| 1.00022E-12 +i*-5.90578E-13| +| 5| 0.665186 +i* 0.746678| 1|-2.53998E-14 +i*-1.14684E-12| +| 6| 0.688283 +i* 0.725442| 1|-8.68732E-13 +i* 8.52696E-13| +| 7| 0.710703 +i* 0.703493| 1| 2.02581E-13 +i* 4.54699E-13| +| 8| 0.732422 +i* 0.680851| 1|-5.22353E-13 +i*-3.99873E-13| +| 9| 0.753421 +i* 0.657538| 1| 1.23356E-13 +i*-1.05986E-12| +| 10| 0.773678 +i* 0.633579| 1|-6.75196E-13 +i* 3.60108E-13| +| 11| 0.793174 +i* 0.608995| 1| 4.43853E-13 +i*-1.42398E-12| +| 12| 0.811888 +i* 0.583813| 1|-4.10491E-13 +i*-4.46651E-13| +| 13| 0.829804 +i* 0.558055| 1| 1.30045E-12 +i* 1.12788E-13| +| 14| 0.846902 +i* 0.531748| 1|-8.09419E-13 +i* 4.98091E-13| +| 15| 0.863167 +i* 0.504918| 1| 2.98522E-13 +i* 3.81547E-13| +| 16| 0.878582 +i* 0.477591| 1|-3.06581E-13 +i*-6.95869E-13| +| 17| 0.893133 +i* 0.449793| 1| 1.24355E-13 +i* -1.3239E-12| +| 18| 0.906804 +i* 0.421553| 1|-1.23117E-12 +i*-5.57117E-13| +| 19| 0.919582 +i* 0.392898| 1|-1.03648E-12 +i* 2.90445E-14| +| 20| 0.931455 +i* 0.363856| 1|-6.42708E-13 +i*-1.50318E-12| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 diff --git a/Simulations/full_openmp/full_openmp_4GPU.sge b/Simulations/full_openmp/full_openmp_4GPU.sge new file mode 100755 index 0000000..4aab3cf --- /dev/null +++ b/Simulations/full_openmp/full_openmp_4GPU.sge @@ -0,0 +1,27 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=4 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -pe openmp 4 +#$ -V +#$ -cwd +#$ -N full_openmp_4GPU + +module load gcc/4.9.0 +module load cuda/7.0 + + +./template -r -i 60000 40000 +./template -r -i 150000 50000 +./template -r -i 250000 150000 +./template -r -i 350000 250000 +./template -r -i 500000 300000 +./template -r -i 600000 400000 +./template -r -i 700000 500000 +./template -r -i 800000 600000 +#./template -r -i 900000 700000 +#./template -r -i 1000000 800000 +#./template -r -i 1500000 500000 + + diff --git a/Simulations/full_openmp_bis/full_openmp_1GPU.o140355 b/Simulations/full_openmp_bis/full_openmp_1GPU.o140355 new file mode 100644 index 0000000..88b9457 --- /dev/null +++ b/Simulations/full_openmp_bis/full_openmp_1GPU.o140355 @@ -0,0 +1,569 @@ +REMAINING: 1 +Taking GPU #3 +zone limite de 'log-exp' 1.00356 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 0 dimgrid2 391 start 0 size 100096 +gpu 0 iter : 1 Arret : 2.58226E-05 s/iter 2.159486 +gpu 0 iter : 2 Arret : 2.45531E-05 s/iter 2.159234 +gpu 0 iter : 3 Arret : 2.40163E-05 s/iter 2.159105 +gpu 0 iter : 4 Arret : 2.46521E-05 s/iter 2.159089 +gpu 0 iter : 5 Arret : 2.52796E-05 s/iter 2.159243 +gpu 0 iter : 6 Arret : 2.48396E-05 s/iter 2.159045 +gpu 0 iter : 7 Arret : 2.76062E-05 s/iter 2.159048 +gpu 0 iter : 8 Arret : 3.59957E-05 s/iter 2.159248 +gpu 0 iter : 9 Arret : 0.000373167 s/iter 2.159075 +gpu 0 iter : 10 Arret : 0.000980965 s/iter 2.158969 +gpu 0 iter : 11 Arret : 0.00158765 s/iter 2.158925 +gpu 0 iter : 12 Arret : 0.247827 s/iter 2.158915 +gpu 0 iter : 13 Arret : 1.55457 s/iter 2.371759 +gpu 0 iter : 14 Arret : 0.00728343 s/iter 2.158707 +gpu 0 iter : 15 Arret : 0.00391977 s/iter 2.151495 +gpu 0 iter : 16 Arret : 0.00434237 s/iter 2.149256 +gpu 0 iter : 17 Arret : 0.00364574 s/iter 1.230796 +gpu 0 iter : 18 Arret : 0.00202513 s/iter 0.905599 +gpu 0 iter : 19 Arret : 0.00146278 s/iter 0.897221 +gpu 0 iter : 20 Arret : 0.00325677 s/iter 0.895872 +gpu 0 iter : 21 Arret : 0.0132291 s/iter 0.894311 +gpu 0 iter : 22 Arret : 0.0348168 s/iter 2.191648 +gpu 0 iter : 23 Arret : 0.0104306 s/iter 1.997714 +gpu 0 iter : 24 Arret : 0.00811772 s/iter 1.979664 +gpu 0 iter : 25 Arret : 0.00278534 s/iter 1.964636 +gpu 0 iter : 26 Arret : 0.000888664 s/iter 0.897993 +gpu 0 iter : 27 Arret : 0.0119282 s/iter 0.900904 +gpu 0 iter : 28 Arret : 0.0102688 s/iter 1.998468 +gpu 0 iter : 29 Arret : 0.000612955 s/iter 0.893189 +gpu 0 iter : 30 Arret : 0.000227055 s/iter 0.890419 +gpu 0 iter : 31 Arret : 0.000227812 s/iter 0.898160 +gpu 0 iter : 32 Arret : 0.000163655 s/iter 0.895300 +gpu 0 iter : 33 Arret : 1.43229E-05 s/iter 0.887696 +gpu 0 iter : 34 Arret : 5.4895E-07 s/iter 0.893540 +gpu 0 iter : 35 Arret : 2.16271E-11 s/iter 0.908081 +gpu 0 iter : 36 Arret : 3.55445E-16 s/iter 0.896091 +temps : 59.4099 seconde(s) +Nb iterations : 36 +Nb de depassements de capacite exponentielle : 0 +Precision : 8.34887E-10 +Stabilite : 3.55445E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540601 +i* 0.841279| 1| -4.3885E-14 +i*-7.30839E-15| +| 2| -0.281748 +i* -0.959489| 1|-5.73395E-14 +i*-4.24574E-14| +| 3|-4.71234E-05 +i* 1| 1| 8.74301E-16 +i* 1.94116E-15| +| 4| 0.281778 +i* -0.95948| 1|-1.23963E-14 +i* 1.02314E-14| +| 5| -0.54068 +i* 0.841228| 1| 5.53932E-14 +i*-7.48533E-15| +| 6| 0.75578 +i* -0.654825| 1|-1.78253E-13 +i* 5.35631E-14| +| 7| -0.909652 +i* 0.415372| 1|-2.24577E-14 +i*-2.99309E-14| +| 8| 0.989828 +i* -0.142268| 1|-1.55837E-13 +i* 5.3703E-13| +| 9| -0.989815 +i* -0.142361| 1| 4.10505E-14 +i* 1.22957E-14| +| 10| 0.909612 +i* 0.415458| 1|-9.85774E-14 +i* 2.25852E-13| +| 11| -0.755719 +i* -0.654896| 1|-4.50195E-14 +i* 3.70867E-14| +| 12| 0.540548 +i* 0.841313| 1| 1.15279E-13 +i*-6.26114E-14| +| 13| -0.281687 +i* -0.959506| 1| 6.72067E-14 +i*-1.86153E-14| +| 14|-0.000109955 +i* 1| 1| 1.79579E-14 +i* 5.47271E-14| +| 15| 0.281838 +i* -0.959462| 1|-5.44356E-14 +i* 4.87822E-14| +| 16| -0.540733 +i* 0.841194| 1| 1.93526E-14 +i* 3.41446E-14| +| 17| 0.755822 +i* -0.654778| 1| 1.25063E-13 +i*-1.80201E-13| +| 18| -0.909678 +i* 0.415315| 1| 3.90799E-14 +i* 2.50217E-14| +| 19| 0.989837 +i* -0.142206| 1| 1.87558E-13 +i*-4.17969E-13| +| 20| -0.989806 +i* -0.142424| 1|-4.45512E-14 +i*-1.49828E-14| ++---+----------------------------+------------+----------------------------+ +100000 racines de module = 1 +zone limite de 'log-exp' 1.00178 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 0 dimgrid2 782 start 0 size 200192 +gpu 0 iter : 1 Arret : 1.19577E-05 s/iter 8.518021 +gpu 0 iter : 2 Arret : 1.18544E-05 s/iter 8.493295 +gpu 0 iter : 3 Arret : 1.18465E-05 s/iter 8.498027 +gpu 0 iter : 4 Arret : 1.14898E-05 s/iter 8.493370 +gpu 0 iter : 5 Arret : 1.16046E-05 s/iter 8.500819 +gpu 0 iter : 6 Arret : 1.20283E-05 s/iter 8.508273 +gpu 0 iter : 7 Arret : 1.29539E-05 s/iter 8.506512 +gpu 0 iter : 8 Arret : 1.56022E-05 s/iter 8.489532 +gpu 0 iter : 9 Arret : 2.79622E-05 s/iter 8.492543 +gpu 0 iter : 10 Arret : 0.00167591 s/iter 8.483745 +gpu 0 iter : 11 Arret : 0.00190247 s/iter 8.493757 +gpu 0 iter : 12 Arret : 1.42579 s/iter 8.502998 +gpu 0 iter : 13 Arret : 0.3622 s/iter 8.970736 +gpu 0 iter : 14 Arret : 0.0671407 s/iter 8.976913 +gpu 0 iter : 15 Arret : 0.0268324 s/iter 8.944642 +gpu 0 iter : 16 Arret : 0.0040824 s/iter 8.439861 +gpu 0 iter : 17 Arret : 0.00185582 s/iter 8.440204 +gpu 0 iter : 18 Arret : 0.000960302 s/iter 8.404752 +gpu 0 iter : 19 Arret : 0.000563258 s/iter 8.104206 +gpu 0 iter : 20 Arret : 0.000141038 s/iter 8.091827 +gpu 0 iter : 21 Arret : 7.1234E-05 s/iter 8.154739 +gpu 0 iter : 22 Arret : 0.000377766 s/iter 8.147061 +gpu 0 iter : 23 Arret : 0.0146003 s/iter 8.109327 +gpu 0 iter : 24 Arret : 0.0135886 s/iter 8.343876 +gpu 0 iter : 25 Arret : 0.000297131 s/iter 8.189923 +gpu 0 iter : 26 Arret : 9.38967E-05 s/iter 8.214499 +gpu 0 iter : 27 Arret : 0.000426801 s/iter 8.057328 +gpu 0 iter : 28 Arret : 0.000145068 s/iter 8.038564 +gpu 0 iter : 29 Arret : 9.80028E-07 s/iter 8.042612 +gpu 0 iter : 30 Arret : 2.84216E-10 s/iter 8.170034 +gpu 0 iter : 31 Arret : 2.45256E-15 s/iter 8.066322 +temps : 260.63 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.64385E-09 +Stabilite : 2.45256E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540465 +i* 0.841367| 1| 1.87479E-13 +i*-5.02237E-14| +| 2| 0.176081 +i* -0.984376| 1|-5.37799E-14 +i* 6.92554E-14| +| 3| -0.852009 +i* -0.523527| 1| 3.18461E-14 +i* 4.03913E-14| +| 4| -0.79862 +i* 0.601836| 1| 5.14346E-14 +i* 3.91354E-14| +| 5| 0.980657 +i* -0.195736| 1| 6.46188E-13 +i*-7.37166E-13| +| 6| 0.268452 +i* 0.963293| 1|-8.54421E-14 +i* 3.23248E-14| +| 7| 0.458412 +i* -0.88874| 1| 2.7818E-14 +i* 6.11247E-14| +| 8| -0.659865 +i* -0.751385| 1| 2.17222E-14 +i*-1.50038E-13| +| 9| 0.994783 +i* 0.102018| 1| 6.80962E-13 +i*-1.84925E-12| +| 10| -0.940535 +i* 0.339697| 1| 2.92266E-14 +i* 1.23877E-14| +| 11| -0.0274147 +i* 0.999624| 1|-2.15418E-14 +i* -6.3281E-14| +| 12| 0.70001 +i* -0.714133| 1| 5.4335E-14 +i* -1.5535E-13| +| 13| 0.920515 +i* 0.390707| 1|-2.49037E-13 +i*-1.72111E-13| +| 14| -0.409013 +i* -0.912529| 1|-5.60801E-14 +i* 3.37699E-14| +| 15| -0.998877 +i* 0.047373| 1|-3.52392E-14 +i*-1.99354E-14| +| 16| -0.320845 +i* 0.947132| 1| 1.35437E-13 +i* 4.41019E-14| +| 17| 0.764454 +i* 0.644679| 1|-2.19425E-13 +i* -1.9223E-13| +| 18| 0.879407 +i* -0.47607| 1| 3.13968E-13 +i*-3.31275E-13| +| 19| -0.121864 +i* -0.992547| 1| 1.45647E-13 +i* 1.68268E-16| +| 20| -0.968462 +i* -0.24916| 1| 5.32629E-14 +i* 1.07952E-14| ++---+----------------------------+------------+----------------------------+ +200000 racines de module = 1 +zone limite de 'log-exp' 1.00089 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 0 dimgrid2 1563 start 0 size 400128 +gpu 0 iter : 1 Arret : 6.89717E-06 s/iter 33.035643 +gpu 0 iter : 2 Arret : 6.09277E-06 s/iter 33.002321 +gpu 0 iter : 3 Arret : 6.18401E-06 s/iter 32.966130 +gpu 0 iter : 4 Arret : 6.20392E-06 s/iter 32.970641 +gpu 0 iter : 5 Arret : 6.02588E-06 s/iter 32.953697 +gpu 0 iter : 6 Arret : 5.96691E-06 s/iter 33.002518 +gpu 0 iter : 7 Arret : 5.94972E-06 s/iter 33.004551 +gpu 0 iter : 8 Arret : 6.19095E-06 s/iter 32.980457 +gpu 0 iter : 9 Arret : 6.32652E-06 s/iter 32.941630 +gpu 0 iter : 10 Arret : 1.87729E-05 s/iter 32.968007 +gpu 0 iter : 11 Arret : 0.00174004 s/iter 32.975771 +gpu 0 iter : 12 Arret : 0.006455 s/iter 33.311216 +gpu 0 iter : 13 Arret : 0.00619341 s/iter 33.149516 +gpu 0 iter : 14 Arret : 0.00514904 s/iter 35.574066 +gpu 0 iter : 15 Arret : 0.686768 s/iter 35.420293 +gpu 0 iter : 16 Arret : 0.0967736 s/iter 32.983094 +gpu 0 iter : 17 Arret : 0.0585811 s/iter 33.051496 +gpu 0 iter : 18 Arret : 0.196737 s/iter 33.861740 +gpu 0 iter : 19 Arret : 0.193586 s/iter 33.039494 +gpu 0 iter : 20 Arret : 0.274238 s/iter 37.595186 +gpu 0 iter : 21 Arret : 0.134712 s/iter 32.615388 +gpu 0 iter : 22 Arret : 0.0560146 s/iter 37.446376 +gpu 0 iter : 23 Arret : 0.0311159 s/iter 38.261918 +gpu 0 iter : 24 Arret : 0.0248535 s/iter 37.121915 +gpu 0 iter : 25 Arret : 0.0895173 s/iter 37.431548 +gpu 0 iter : 26 Arret : 0.0556182 s/iter 32.958188 +gpu 0 iter : 27 Arret : 0.0378553 s/iter 36.029371 +gpu 0 iter : 28 Arret : 0.0220943 s/iter 33.124627 +gpu 0 iter : 29 Arret : 0.0616201 s/iter 33.340346 +gpu 0 iter : 30 Arret : 0.306501 s/iter 33.214060 +gpu 0 iter : 31 Arret : 0.0429906 s/iter 33.060634 +gpu 0 iter : 32 Arret : 0.0503025 s/iter 33.013435 +gpu 0 iter : 33 Arret : 0.00545981 s/iter 33.060662 +gpu 0 iter : 34 Arret : 0.000411005 s/iter 33.003953 +gpu 0 iter : 35 Arret : 1.74978E-05 s/iter 32.871800 +gpu 0 iter : 36 Arret : 6.62978E-06 s/iter 32.869981 +gpu 0 iter : 37 Arret : 5.96879E-07 s/iter 32.947857 +gpu 0 iter : 38 Arret : 7.70723E-10 s/iter 33.009008 +gpu 0 iter : 39 Arret : 2.98937E-16 s/iter 33.033254 +temps : 1320.13 seconde(s) +Nb iterations : 39 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.12974E-08 +Stabilite : 2.98937E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540383 +i* 0.841419| 1| 1.25143E-14 +i* 6.97793E-14| +| 2| -0.98885 +i* 0.148913| 1|-1.87034E-13 +i*-1.52024E-13| +| 3| 0.412505 +i* -0.910956| 1|-2.05679E-13 +i* 8.74266E-14| +| 4| 0.268615 +i* -0.963248| 1| 1.23929E-14 +i* 2.02841E-14| +| 5| -0.954531 +i* 0.298113| 1| 6.68562E-14 +i* 8.87016E-14| +| 6| 0.769081 +i* 0.639152| 1|-2.56017E-13 +i* 6.90161E-13| +| 7| 0.11843 +i* -0.992962| 1| -1.5522E-13 +i* 8.29944E-14| +| 8| -0.897838 +i* 0.440326| 1|-2.57121E-14 +i* 6.84192E-14| +| 9| 0.857632 +i* 0.514263| 1| 7.84754E-13 +i* 2.86151E-13| +| 10| -0.0345309 +i* -0.999404| 1|-3.27058E-13 +i* 9.31755E-14| +| 11| 0.662503 +i* 0.74906| 1| 7.42843E-14 +i*-6.06277E-13| +| 12| -0.820101 +i* 0.572218| 1|-4.91863E-14 +i*-2.00555E-13| +| 13| -0.186683 +i* -0.98242| 1| -1.8106E-13 +i* 3.61083E-14| +| 14| 0.926088 +i* 0.377307| 1| 6.5396E-13 +i* 7.07941E-13| +| 15| -0.723143 +i* 0.690699| 1|-1.75058E-13 +i* 1.33799E-14| +| 16| -0.334459 +i* -0.94241| 1| 2.20716E-13 +i*-8.68958E-14| +| 17| 0.97283 +i* 0.23152| 1|-1.36773E-13 +i*-4.46509E-13| +| 18| -0.609235 +i* 0.79299| 1|-8.90538E-14 +i* 1.42372E-13| +| 19| -0.474396 +i* -0.880312| 1| 2.76109E-13 +i* 7.19095E-14| +| 20| 0.99677 +i* 0.0803066| 1| 1.32664E-12 +i*-5.68624E-12| ++---+----------------------------+------------+----------------------------+ +400000 racines de module = 1 +zone limite de 'log-exp' 1.00059 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 2344 start 0 size 600064 +gpu 0 iter : 1 Arret : 5.12901E-06 s/iter 73.685421 +gpu 0 iter : 2 Arret : 4.67865E-06 s/iter 73.891510 +gpu 0 iter : 3 Arret : 4.44293E-06 s/iter 73.940974 +gpu 0 iter : 4 Arret : 4.97803E-06 s/iter 74.035697 +gpu 0 iter : 5 Arret : 4.5111E-06 s/iter 74.103515 +gpu 0 iter : 6 Arret : 5.27464E-06 s/iter 73.917797 +gpu 0 iter : 7 Arret : 4.58131E-06 s/iter 73.960314 +gpu 0 iter : 8 Arret : 4.45902E-06 s/iter 73.837035 +gpu 0 iter : 9 Arret : 7.73118E-06 s/iter 73.811103 +gpu 0 iter : 10 Arret : 0.000221116 s/iter 73.910635 +gpu 0 iter : 11 Arret : 0.000537969 s/iter 73.999742 +gpu 0 iter : 12 Arret : 0.00062373 s/iter 73.935382 +gpu 0 iter : 13 Arret : 1.81094 s/iter 73.779410 +gpu 0 iter : 14 Arret : 0.0983124 s/iter 74.253973 +gpu 0 iter : 15 Arret : 0.0573313 s/iter 75.355839 +gpu 0 iter : 16 Arret : 0.025899 s/iter 73.752295 +gpu 0 iter : 17 Arret : 0.0161024 s/iter 73.677921 +gpu 0 iter : 18 Arret : 0.0318784 s/iter 73.497434 +gpu 0 iter : 19 Arret : 0.0231649 s/iter 73.463585 +gpu 0 iter : 20 Arret : 0.00926319 s/iter 73.655131 +gpu 0 iter : 21 Arret : 0.00647533 s/iter 73.431285 +gpu 0 iter : 22 Arret : 0.00266543 s/iter 73.868304 +gpu 0 iter : 23 Arret : 0.00275887 s/iter 73.853686 +gpu 0 iter : 24 Arret : 0.00207089 s/iter 73.806260 +gpu 0 iter : 25 Arret : 0.0060336 s/iter 74.563180 +gpu 0 iter : 26 Arret : 0.0232617 s/iter 73.515326 +gpu 0 iter : 27 Arret : 0.0530779 s/iter 73.901640 +gpu 0 iter : 28 Arret : 0.0992673 s/iter 73.931922 +gpu 0 iter : 29 Arret : 0.236569 s/iter 73.666367 +gpu 0 iter : 30 Arret : 0.0198351 s/iter 73.569145 +gpu 0 iter : 31 Arret : 0.00162818 s/iter 73.834910 +gpu 0 iter : 32 Arret : 0.00100554 s/iter 73.949973 +gpu 0 iter : 33 Arret : 0.001858 s/iter 73.272998 +gpu 0 iter : 34 Arret : 0.00117769 s/iter 73.566613 +gpu 0 iter : 35 Arret : 0.000929485 s/iter 73.374602 +gpu 0 iter : 36 Arret : 0.00194808 s/iter 73.262272 +gpu 0 iter : 37 Arret : 0.00243946 s/iter 73.361974 +gpu 0 iter : 38 Arret : 2.62282E-05 s/iter 73.353860 +gpu 0 iter : 39 Arret : 9.95281E-06 s/iter 73.499781 +gpu 0 iter : 40 Arret : 2.46923E-05 s/iter 73.607334 +gpu 0 iter : 41 Arret : 3.03977E-05 s/iter 73.265665 +gpu 0 iter : 42 Arret : 5.02702E-06 s/iter 73.382297 +gpu 0 iter : 43 Arret : 7.70155E-09 s/iter 73.281891 +gpu 0 iter : 44 Arret : 2.25842E-14 s/iter 73.261871 +temps : 3245.93 seconde(s) +Nb iterations : 44 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 2.25842E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.996672 +i* 0.0815122| 1|-4.60361E-14 +i*-1.54911E-15| +| 3| 0.396458 +i* -0.918053| 1|-3.61742E-13 +i* 4.28426E-13| +| 4| -0.983009 +i* 0.183558| 1| 2.27839E-14 +i* 1.21547E-13| +| 5| 0.299962 +i* -0.953951| 1| 3.10155E-13 +i*-4.52272E-13| +| 6| 0.701062 +i* 0.7131| 1| 6.08482E-13 +i* 3.68603E-13| +| 7| -0.958925 +i* 0.283658| 1|-3.43857E-14 +i*-4.33108E-14| +| 8| 0.200287 +i* -0.979737| 1| 4.39829E-13 +i*-3.61119E-13| +| 9| 0.770667 +i* 0.637238| 1| -2.7036E-13 +i*-8.38747E-13| +| 10| -0.924677 +i* 0.380752| 1| 1.44957E-13 +i* 1.13251E-13| +| 11| 0.0984885 +i* -0.995138| 1| 3.5235E-13 +i*-2.31698E-13| +| 12| 0.832104 +i* 0.55462| 1| 8.49546E-13 +i* -8.3842E-13| +| 13| -0.880618 +i* 0.473828| 1| 6.7276E-14 +i* 2.01556E-13| +| 14| -0.0043537 +i* -0.999991| 1| 1.63446E-13 +i*-5.45449E-14| +| 15| 0.88472 +i* 0.466123| 1| -6.8268E-13 +i* -3.8889E-13| +| 16| 0.624025 +i* 0.781404| 1| 9.47506E-15 +i*-6.78554E-13| +| 17| -0.827237 +i* 0.561853| 1|-1.75169E-13 +i*-1.39104E-13| +| 18| -0.10715 +i* -0.994243| 1| 3.32474E-13 +i*-4.57395E-14| +| 19| 0.927958 +i* 0.372686| 1| 1.0255E-13 +i* 1.0692E-13| +| 20| -0.765083 +i* 0.643932| 1| 3.06144E-14 +i*-3.59443E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +zone limite de 'log-exp' 1.00044 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 3125 start 0 size 800000 +gpu 0 iter : 1 Arret : 3.01856E-06 s/iter 131.241325 +gpu 0 iter : 2 Arret : 3.11262E-06 s/iter 131.070876 +gpu 0 iter : 3 Arret : 2.98017E-06 s/iter 131.134178 +gpu 0 iter : 4 Arret : 3.31167E-06 s/iter 131.213355 +gpu 0 iter : 5 Arret : 3.49019E-06 s/iter 130.717520 +gpu 0 iter : 6 Arret : 2.98626E-06 s/iter 130.739891 +gpu 0 iter : 7 Arret : 3.0474E-06 s/iter 131.072598 +gpu 0 iter : 8 Arret : 3.46218E-06 s/iter 130.814937 +gpu 0 iter : 9 Arret : 3.76918E-06 s/iter 130.887124 +gpu 0 iter : 10 Arret : 6.64295E-06 s/iter 130.616269 +gpu 0 iter : 11 Arret : 0.000287123 s/iter 131.061993 +gpu 0 iter : 12 Arret : 0.0011314 s/iter 131.096953 +gpu 0 iter : 13 Arret : 0.758828 s/iter 130.517209 +gpu 0 iter : 14 Arret : 0.970871 s/iter 130.728334 +gpu 0 iter : 15 Arret : 2.27673 s/iter 131.219621 +gpu 0 iter : 16 Arret : 0.0177119 s/iter 130.593046 +gpu 0 iter : 17 Arret : 0.0177252 s/iter 130.374984 +gpu 0 iter : 18 Arret : 0.00390068 s/iter 130.607194 +gpu 0 iter : 19 Arret : 0.00164255 s/iter 130.576165 +gpu 0 iter : 20 Arret : 0.000668822 s/iter 130.128284 +gpu 0 iter : 21 Arret : 0.000778681 s/iter 130.140695 +gpu 0 iter : 22 Arret : 0.000235 s/iter 130.130882 +gpu 0 iter : 23 Arret : 0.000193184 s/iter 130.139223 +gpu 0 iter : 24 Arret : 0.000165967 s/iter 130.093578 +gpu 0 iter : 25 Arret : 6.36482E-05 s/iter 130.126442 +gpu 0 iter : 26 Arret : 1.17867E-05 s/iter 130.157075 +gpu 0 iter : 27 Arret : 1.80291E-05 s/iter 130.154475 +gpu 0 iter : 28 Arret : 7.5224E-07 s/iter 130.130959 +gpu 0 iter : 29 Arret : 6.55358E-12 s/iter 130.147007 +gpu 0 iter : 30 Arret : 1.11886E-16 s/iter 130.165996 +temps : 3918.85 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 1.11886E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| -0.942555 +i* -0.334052| 1| 2.1929E-13 +i*-2.49686E-13| +| 3| -0.558601 +i* 0.829437| 1|-3.51628E-14 +i*-4.09232E-13| +| 4| -0.0665975 +i* -0.99778| 1|-3.91888E-13 +i* 9.06636E-14| +| 5| 0.949627 +i* -0.313383| 1|-1.12544E-12 +i* 2.13597E-12| +| 6| -0.982853 +i* -0.184391| 1| 8.57613E-14 +i* 1.33506E-13| +| 7| 0.889798 +i* -0.456354| 1| 1.27488E-12 +i* 5.17779E-13| +| 8| -0.423729 +i* 0.905789| 1|-7.25461E-15 +i*-1.33088E-14| +| 9| -0.219973 +i* -0.975506| 1| 4.34097E-13 +i*-4.24712E-14| +| 10| 0.771464 +i* 0.636273| 1| -4.4266E-13 +i*-2.07773E-13| +| 11| -0.999541 +i* -0.0303078| 1| 3.54265E-14 +i* 1.32862E-14| +| 12| 0.808597 +i* -0.588363| 1|-5.90212E-13 +i*-1.43182E-12| +| 13| 0.663883 +i* 0.747836| 1| 4.13159E-13 +i* 1.10149E-12| +| 14| -0.27868 +i* 0.960384| 1|-1.03539E-13 +i*-1.45998E-13| +| 15| -0.368064 +i* -0.929801| 1| 4.60916E-14 +i*-1.09841E-13| +| 16| -0.992219 +i* 0.124503| 1| 2.74294E-13 +i* 2.11383E-13| +| 17| 0.707973 +i* -0.706239| 1|-1.10575E-12 +i*-7.41631E-13| +| 18| 0.860514 +i* 0.509426| 1| 9.86579E-13 +i* 1.10532E-12| +| 19| -0.126936 +i* 0.991911| 1| 1.67744E-13 +i* 5.51772E-13| +| 20| -0.507314 +i* -0.861761| 1| 5.50185E-14 +i* 3.42273E-13| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 +zone limite de 'log-exp' 1.00035 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 0 dimgrid2 3907 start 0 size 1000192 +gpu 0 iter : 1 Arret : 2.98257E-06 s/iter 204.592404 +gpu 0 iter : 2 Arret : 2.9E-06 s/iter 204.216721 +gpu 0 iter : 3 Arret : 2.54328E-06 s/iter 204.150315 +gpu 0 iter : 4 Arret : 2.94527E-06 s/iter 204.539015 +gpu 0 iter : 5 Arret : 2.571E-06 s/iter 204.048569 +gpu 0 iter : 6 Arret : 2.72596E-06 s/iter 204.454699 +gpu 0 iter : 7 Arret : 2.76401E-06 s/iter 204.321715 +gpu 0 iter : 8 Arret : 2.5796E-06 s/iter 204.045143 +gpu 0 iter : 9 Arret : 3.02161E-06 s/iter 203.819798 +gpu 0 iter : 10 Arret : 3.11776E-05 s/iter 204.121557 +gpu 0 iter : 11 Arret : 4.06009E-05 s/iter 204.318926 +gpu 0 iter : 12 Arret : 0.000242232 s/iter 204.174687 +gpu 0 iter : 13 Arret : 0.000656278 s/iter 203.971756 +gpu 0 iter : 14 Arret : 0.00152688 s/iter 204.607105 +gpu 0 iter : 15 Arret : 1.5754 s/iter 206.101068 +gpu 0 iter : 16 Arret : 0.0775864 s/iter 206.867317 +gpu 0 iter : 17 Arret : 0.0425266 s/iter 206.476680 +gpu 0 iter : 18 Arret : 0.0273753 s/iter 206.039938 +gpu 0 iter : 19 Arret : 0.0492683 s/iter 206.207176 +gpu 0 iter : 20 Arret : 0.152167 s/iter 207.326719 +gpu 0 iter : 21 Arret : 0.111598 s/iter 207.858495 +gpu 0 iter : 22 Arret : 0.0599443 s/iter 206.944468 +gpu 0 iter : 23 Arret : 0.0482603 s/iter 207.305659 +gpu 0 iter : 24 Arret : 0.0570369 s/iter 206.944140 +gpu 0 iter : 25 Arret : 0.0169728 s/iter 206.896150 +gpu 0 iter : 26 Arret : 0.0215828 s/iter 206.840083 +gpu 0 iter : 27 Arret : 0.00102729 s/iter 206.717689 +gpu 0 iter : 28 Arret : 0.000868114 s/iter 206.564478 +gpu 0 iter : 29 Arret : 0.000551725 s/iter 206.747089 +gpu 0 iter : 30 Arret : 0.000194227 s/iter 206.534220 +gpu 0 iter : 31 Arret : 0.000171752 s/iter 206.656897 +gpu 0 iter : 32 Arret : 7.08378E-05 s/iter 206.465671 +gpu 0 iter : 33 Arret : 2.72559E-05 s/iter 206.327374 +gpu 0 iter : 34 Arret : 1.67371E-05 s/iter 206.627970 +gpu 0 iter : 35 Arret : 1.20545E-05 s/iter 206.506207 +gpu 0 iter : 36 Arret : 1.13808E-05 s/iter 206.655490 +gpu 0 iter : 37 Arret : 4.72892E-06 s/iter 206.414689 +gpu 0 iter : 38 Arret : 5.87488E-06 s/iter 206.321397 +gpu 0 iter : 39 Arret : 2.6099E-06 s/iter 206.602598 +gpu 0 iter : 40 Arret : 3.99174E-08 s/iter 206.546842 +gpu 0 iter : 41 Arret : 1.47709E-12 s/iter 206.466833 +gpu 0 iter : 42 Arret : 1.57009E-16 s/iter 206.344233 +temps : 8646.97 seconde(s) +Nb iterations : 42 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.80137E-07 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54034 +i* 0.841447| 1| 4.08253E-13 +i*-6.65317E-13| +| 2| -0.513915 +i* -0.857841| 1|-9.07486E-13 +i* 1.86417E-13| +| 3| 0.486982 +i* 0.873412| 1|-6.63601E-14 +i*-1.18344E-12| +| 4| -0.459589 +i* -0.888132| 1|-5.16153E-13 +i*-2.68006E-13| +| 5| 0.43174 +i* 0.901998| 1|-6.77361E-13 +i* 7.93272E-13| +| 6| -0.403485 +i* -0.914986| 1|-3.20004E-13 +i* 2.65225E-13| +| 7| 0.374828 +i* 0.927094| 1| 3.65041E-13 +i* 3.54812E-13| +| 8| -0.34582 +i* -0.938301| 1| -3.3851E-13 +i* 1.59258E-13| +| 9| 0.316466 +i* 0.948604| 1|-2.87419E-13 +i* 5.21678E-13| +| 10| -0.286812 +i* -0.957987| 1| 6.43516E-13 +i* 2.73696E-13| +| 11| 0.25688 +i* 0.966443| 1|-4.31814E-13 +i* 5.6624E-13| +| 12| -0.226699 +i* -0.973965| 1| 4.35089E-13 +i* -6.6197E-14| +| 13| 0.196299 +i* 0.980544| 1| 3.90278E-14 +i*-7.14062E-13| +| 14| -0.16571 +i* -0.986175| 1| 2.49276E-13 +i*-1.75918E-13| +| 15| 0.13496 +i* 0.990851| 1| 1.03566E-13 +i*-6.61428E-13| +| 16| -0.104079 +i* -0.994569| 1| 7.90108E-13 +i*-1.74942E-13| +| 17| 0.0730977 +i* 0.997325| 1| 1.11931E-13 +i* 4.68587E-13| +| 18| -0.0420456 +i* -0.999116| 1| 2.29268E-13 +i*-1.21795E-14| +| 19| 0.0109529 +i* 0.99994| 1|-2.47309E-13 +i*-7.90307E-13| +| 20| 0.0201504 +i* -0.999797| 1| 6.69503E-13 +i*-2.16847E-13| ++---+----------------------------+------------+----------------------------+ +1000000 racines de module = 1 +zone limite de 'log-exp' 1.0003 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 0 dimgrid2 4688 start 0 size 1200128 +gpu 0 iter : 1 Arret : 2.56175E-06 s/iter 294.198739 +gpu 0 iter : 2 Arret : 2.39645E-06 s/iter 293.539567 +gpu 0 iter : 3 Arret : 2.28545E-06 s/iter 293.019301 +gpu 0 iter : 4 Arret : 2.55013E-06 s/iter 293.130575 +gpu 0 iter : 5 Arret : 2.15054E-06 s/iter 293.718429 +gpu 0 iter : 6 Arret : 2.26473E-06 s/iter 293.411570 +gpu 0 iter : 7 Arret : 2.12003E-06 s/iter 293.199118 +gpu 0 iter : 8 Arret : 2.11596E-06 s/iter 293.205357 +gpu 0 iter : 9 Arret : 2.25693E-06 s/iter 294.020328 +gpu 0 iter : 10 Arret : 7.52194E-06 s/iter 293.568331 +gpu 0 iter : 11 Arret : 2.46681E-05 s/iter 293.905181 +gpu 0 iter : 12 Arret : 0.000134592 s/iter 293.275672 +gpu 0 iter : 13 Arret : 0.00122896 s/iter 293.689459 +gpu 0 iter : 14 Arret : 0.00140185 s/iter 294.001347 +gpu 0 iter : 15 Arret : 0.0011181 s/iter 293.816219 +gpu 0 iter : 16 Arret : 0.349778 s/iter 296.209339 +gpu 0 iter : 17 Arret : 1.66625 s/iter 298.554357 +gpu 0 iter : 18 Arret : 0.0121283 s/iter 306.025724 +gpu 0 iter : 19 Arret : 0.0193251 s/iter 300.409278 +gpu 0 iter : 20 Arret : 0.0223402 s/iter 297.671022 +gpu 0 iter : 21 Arret : 0.0359641 s/iter 298.853459 +gpu 0 iter : 22 Arret : 0.0453806 s/iter 302.203155 +gpu 0 iter : 23 Arret : 0.0430981 s/iter 300.736284 +gpu 0 iter : 24 Arret : 0.053164 s/iter 302.487489 +gpu 0 iter : 25 Arret : 0.062259 s/iter 297.583054 +gpu 0 iter : 26 Arret : 0.167003 s/iter 296.365662 +gpu 0 iter : 27 Arret : 0.153706 s/iter 295.151437 +gpu 0 iter : 28 Arret : 0.02344 s/iter 295.988707 +gpu 0 iter : 29 Arret : 0.019249 s/iter 294.785475 +gpu 0 iter : 30 Arret : 0.099235 s/iter 294.566553 +gpu 0 iter : 31 Arret : 0.0407263 s/iter 292.557322 +gpu 0 iter : 32 Arret : 0.00216205 s/iter 292.117083 +gpu 0 iter : 33 Arret : 9.5696E-06 s/iter 291.151411 +gpu 0 iter : 34 Arret : 3.22754E-06 s/iter 291.182878 +gpu 0 iter : 35 Arret : 3.94819E-06 s/iter 292.068117 +gpu 0 iter : 36 Arret : 4.93119E-07 s/iter 292.697469 +gpu 0 iter : 37 Arret : 3.02926E-10 s/iter 292.192247 +gpu 0 iter : 38 Arret : 2.48253E-16 s/iter 292.207138 +temps : 11218.8 seconde(s) +Nb iterations : 38 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.34152E-07 +Stabilite : 2.48253E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.841451| 1|-1.40868E-12 +i*-1.55069E-13| +| 2| -0.583871 +i* 0.811846| 1| 5.87586E-14 +i* 2.63177E-13| +| 3| 0.0263196 +i* -0.999654| 1| 9.89594E-13 +i*-3.85265E-13| +| 4| -0.969647 +i* -0.244511| 1|-5.84047E-14 +i*-6.69829E-14| +| 5| 0.939323 +i* -0.343035| 1| 7.60725E-13 +i* 1.68227E-12| +| 6| -0.129097 +i* -0.991632| 1| -2.278E-13 +i*-2.09967E-13| +| 7| -0.450842 +i* 0.892604| 1| 3.34819E-13 +i* 5.30987E-13| +| 8| 0.874726 +i* -0.484618| 1| 6.94573E-13 +i* 1.33379E-12| +| 9| -0.995841 +i* -0.0911079| 1| 6.65572E-13 +i* 2.21578E-13| +| 10| 0.772266 +i* 0.635299| 1|-1.10511E-12 +i*-6.88458E-13| +| 11| -0.281387 +i* -0.959594| 1|-6.93022E-14 +i* 4.40275E-13| +| 12| -0.306893 +i* 0.951744| 1| 1.0443E-15 +i* 1.24753E-13| +| 13| 0.788944 +i* -0.614465| 1| -2.2269E-12 +i*-9.13604E-13| +| 14| -0.997918 +i* 0.0645018| 1| 2.81913E-13 +i* 2.2426E-13| +| 15| 0.861482 +i* 0.507788| 1| 2.41178E-12 +i* 5.79845E-13| +| 16| -0.426862 +i* -0.904317| 1| 6.20323E-13 +i* 5.74424E-13| +| 17| 0.664347 +i* 0.747424| 1| 4.99219E-13 +i* 1.52752E-12| +| 18| -0.155512 +i* 0.987834| 1| 2.30305E-13 +i* 4.37822E-13| +| 19| -0.975826 +i* 0.218549| 1| 1.82913E-13 +i* 5.28258E-14| +| 20| 0.684055 +i* -0.72943| 1|-1.32506E-12 +i*-1.70394E-12| ++---+----------------------------+------------+----------------------------+ +1200000 racines de module = 1 +zone limite de 'log-exp' 1.00025 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 0 dimgrid2 5469 start 0 size 1400064 +gpu 0 iter : 1 Arret : 2.11199E-06 s/iter 400.367337 +gpu 0 iter : 2 Arret : 1.81115E-06 s/iter 400.561038 +gpu 0 iter : 3 Arret : 2.12516E-06 s/iter 399.216992 +gpu 0 iter : 4 Arret : 2.02501E-06 s/iter 399.315468 +gpu 0 iter : 5 Arret : 1.89087E-06 s/iter 398.861869 +gpu 0 iter : 6 Arret : 1.90349E-06 s/iter 400.315587 +gpu 0 iter : 7 Arret : 2.16521E-06 s/iter 399.773331 +gpu 0 iter : 8 Arret : 1.75819E-06 s/iter 399.966079 +gpu 0 iter : 9 Arret : 1.78992E-06 s/iter 399.869453 +gpu 0 iter : 10 Arret : 2.12339E-06 s/iter 399.539904 +gpu 0 iter : 11 Arret : 8.89567E-06 s/iter 399.287349 +gpu 0 iter : 12 Arret : 0.00276075 s/iter 399.209467 +gpu 0 iter : 13 Arret : 0.000960174 s/iter 401.383177 +gpu 0 iter : 14 Arret : 0.00107461 s/iter 401.924658 +gpu 0 iter : 15 Arret : 0.000789748 s/iter 401.933082 +gpu 0 iter : 16 Arret : 0.00192311 s/iter 401.622946 +gpu 0 iter : 17 Arret : 0.00430932 s/iter 408.912321 +gpu 0 iter : 18 Arret : 0.0099758 s/iter 402.244107 +gpu 0 iter : 19 Arret : 0.0148989 s/iter 409.999325 +gpu 0 iter : 20 Arret : 0.237196 s/iter 415.371469 +gpu 0 iter : 21 Arret : 0.317447 s/iter 414.041756 +gpu 0 iter : 22 Arret : 0.166749 s/iter 416.053077 +gpu 0 iter : 23 Arret : 0.0349229 s/iter 408.339436 +gpu 0 iter : 24 Arret : 0.0118277 s/iter 400.150371 +gpu 0 iter : 25 Arret : 0.015135 s/iter 400.148135 +gpu 0 iter : 26 Arret : 0.00785199 s/iter 399.324366 +gpu 0 iter : 27 Arret : 0.00104749 s/iter 397.117949 +gpu 0 iter : 28 Arret : 0.00021138 s/iter 398.172226 +gpu 0 iter : 29 Arret : 1.32785E-05 s/iter 397.711467 +gpu 0 iter : 30 Arret : 7.17584E-06 s/iter 397.144030 +gpu 0 iter : 31 Arret : 2.35657E-06 s/iter 397.064502 +gpu 0 iter : 32 Arret : 1.32198E-06 s/iter 396.047174 +gpu 0 iter : 33 Arret : 7.61437E-08 s/iter 398.367619 +gpu 0 iter : 34 Arret : 2.00647E-11 s/iter 397.319188 +gpu 0 iter : 35 Arret : 1.57009E-16 s/iter 397.972018 +temps : 14056.1 seconde(s) +Nb iterations : 35 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.63785E-07 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540329 +i* 0.841454| 1| 4.3987E-13 +i* 1.7418E-12| +| 2| -0.0530086 +i* 0.998594| 1| 3.8728E-13 +i* 8.41422E-13| +| 3| -0.626376 +i* 0.779521| 1| 2.93654E-14 +i*-2.95439E-13| +| 4| -0.96376 +i* 0.26677| 1|-1.31943E-13 +i* 5.03167E-13| +| 5| -0.938055 +i* -0.346485| 1| 6.12451E-13 +i*-2.34033E-13| +| 6| -0.558945 +i* -0.829205| 1| 2.12923E-13 +i* 6.04209E-13| +| 7| 0.0307435 +i* -0.999527| 1|-3.70079E-13 +i* 1.04685E-13| +| 8| 0.60885 +i* -0.793286| 1| -1.5142E-12 +i* 2.45191E-13| +| 9| 0.957578 +i* -0.288175| 1|-3.17266E-12 +i* 2.02057E-12| +| 10| 0.945542 +i* 0.325501| 1|-1.50276E-12 +i* 3.84538E-13| +| 11| -0.00847209 +i* 0.999964| 1| 8.68958E-14 +i* 2.94643E-13| +| 12| -0.591029 +i* 0.80665| 1|-5.75824E-14 +i*-8.87086E-13| +| 13| -0.95092 +i* 0.309437| 1|-6.93591E-13 +i*-5.52411E-13| +| 14| -0.952559 +i* -0.304354| 1|-3.04982E-13 +i* 1.60452E-13| +| 15| -0.595328 +i* -0.803482| 1|-1.05039E-12 +i* 2.37501E-13| +| 16| -0.0138125 +i* -0.999905| 1|-8.72476E-13 +i* 2.69644E-13| +| 17| 0.572907 +i* -0.81962| 1| 1.32405E-12 +i*-6.73803E-13| +| 18| 0.94379 +i* -0.330546| 1|-1.85401E-12 +i* 2.58533E-12| +| 19| 0.959103 +i* 0.283057| 1|-2.75633E-12 +i* 3.49955E-12| +| 20| 0.613081 +i* 0.79002| 1| 4.49453E-13 +i*-4.47541E-14| ++---+----------------------------+------------+----------------------------+ +1400000 racines de module = 1 diff --git a/Simulations/full_openmp_bis/full_openmp_2GPU.o140354 b/Simulations/full_openmp_bis/full_openmp_2GPU.o140354 new file mode 100644 index 0000000..b443ef7 --- /dev/null +++ b/Simulations/full_openmp_bis/full_openmp_2GPU.o140354 @@ -0,0 +1,593 @@ +REMAINING: 2 +Taking GPU #2 +Taking GPU #3 +zone limite de 'log-exp' 1.00356 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 0 dimgrid2 196 start 0 size 50048 +gpu 1 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 1 dimgrid2 196 start 50048 size 50048 +gpu 0 iter : 1 Arret : 2.5392E-05 s/iter 1.227021 +gpu 0 iter : 2 Arret : 2.59923E-05 s/iter 1.226750 +gpu 0 iter : 3 Arret : 2.47588E-05 s/iter 1.226783 +gpu 0 iter : 4 Arret : 2.53721E-05 s/iter 1.226649 +gpu 0 iter : 5 Arret : 2.5768E-05 s/iter 1.226634 +gpu 0 iter : 6 Arret : 2.48396E-05 s/iter 1.226693 +gpu 0 iter : 7 Arret : 2.76062E-05 s/iter 1.226668 +gpu 0 iter : 8 Arret : 3.59957E-05 s/iter 1.226645 +gpu 0 iter : 9 Arret : 0.000362414 s/iter 1.226815 +gpu 0 iter : 10 Arret : 0.000438012 s/iter 1.226710 +gpu 0 iter : 11 Arret : 0.00158759 s/iter 1.226730 +gpu 0 iter : 12 Arret : 0.24777 s/iter 1.226734 +gpu 0 iter : 13 Arret : 1.53158 s/iter 2.168072 +gpu 0 iter : 14 Arret : 0.00387914 s/iter 2.141910 +gpu 0 iter : 15 Arret : 0.0028678 s/iter 2.126936 +gpu 0 iter : 16 Arret : 0.00228624 s/iter 2.099248 +gpu 0 iter : 17 Arret : 0.00181064 s/iter 2.101025 +gpu 0 iter : 18 Arret : 0.00157799 s/iter 1.985627 +gpu 0 iter : 19 Arret : 0.00145605 s/iter 1.977177 +gpu 0 iter : 20 Arret : 0.00140844 s/iter 1.961196 +gpu 0 iter : 21 Arret : 0.00253228 s/iter 0.894142 +gpu 0 iter : 22 Arret : 0.0332674 s/iter 0.893625 +gpu 0 iter : 23 Arret : 0.00414247 s/iter 0.888148 +gpu 0 iter : 24 Arret : 0.025916 s/iter 1.976938 +gpu 0 iter : 25 Arret : 0.00757988 s/iter 1.974905 +gpu 0 iter : 26 Arret : 0.00188449 s/iter 0.898490 +gpu 0 iter : 27 Arret : 0.000748859 s/iter 0.894305 +gpu 0 iter : 28 Arret : 0.000523018 s/iter 0.887614 +gpu 0 iter : 29 Arret : 0.000199226 s/iter 0.881339 +gpu 0 iter : 30 Arret : 0.000179502 s/iter 0.887366 +gpu 0 iter : 31 Arret : 0.000108553 s/iter 0.893577 +gpu 0 iter : 32 Arret : 3.9397E-05 s/iter 0.882608 +gpu 0 iter : 33 Arret : 9.99937E-06 s/iter 0.893968 +gpu 0 iter : 34 Arret : 3.14055E-07 s/iter 0.880895 +gpu 0 iter : 35 Arret : 8.35537E-12 s/iter 0.878925 +gpu 0 iter : 36 Arret : 1.57009E-16 s/iter 0.896426 +temps : 48.6545 seconde(s) +Nb iterations : 36 +Nb de depassements de capacite exponentielle : 0 +Precision : 8.34887E-10 +Stabilite : 0 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540601 +i* 0.841279| 1| -4.3885E-14 +i*-7.30839E-15| +| 2| -0.281748 +i* -0.959489| 1|-5.73395E-14 +i*-4.24574E-14| +| 3|-4.71234E-05 +i* 1| 1| 1.01308E-15 +i* 1.94116E-15| +| 4| 0.281778 +i* -0.95948| 1|-1.23963E-14 +i* 1.02314E-14| +| 5| -0.54068 +i* 0.841228| 1| 5.53932E-14 +i*-7.48533E-15| +| 6| 0.75578 +i* -0.654825| 1|-1.78253E-13 +i* 5.35631E-14| +| 7| -0.909652 +i* 0.415372| 1|-2.24577E-14 +i*-2.99309E-14| +| 8| 0.989828 +i* -0.142268| 1|-4.88647E-13 +i* 2.69096E-13| +| 9| -0.989815 +i* -0.142361| 1| 4.10505E-14 +i* 1.22957E-14| +| 10| 0.909612 +i* 0.415458| 1|-9.85774E-14 +i* 2.25852E-13| +| 11| -0.755719 +i* -0.654896| 1|-4.50195E-14 +i* 3.70867E-14| +| 12| 0.540548 +i* 0.841313| 1| 1.15279E-13 +i*-6.26114E-14| +| 13| -0.281687 +i* -0.959506| 1| 6.72067E-14 +i*-1.86153E-14| +| 14|-0.000109955 +i* 1| 1| 1.76317E-14 +i* 5.4734E-14| +| 15| 0.281838 +i* -0.959462| 1|-5.44356E-14 +i* 4.87822E-14| +| 16| -0.540733 +i* 0.841194| 1| 1.93526E-14 +i* 3.41446E-14| +| 17| 0.755822 +i* -0.654778| 1| 1.41439E-13 +i* 1.77344E-13| +| 18| -0.909678 +i* 0.415315| 1| 3.90799E-14 +i* 2.50217E-14| +| 19| 0.989837 +i* -0.142206| 1| 1.87558E-13 +i*-4.17969E-13| +| 20| -0.989806 +i* -0.142424| 1|-4.45512E-14 +i*-1.49828E-14| ++---+----------------------------+------------+----------------------------+ +100000 racines de module = 1 +zone limite de 'log-exp' 1.00178 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 1 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 1 dimgrid2 391 start 100096 size 100096 +gpu 0 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 0 dimgrid2 391 start 0 size 100096 +gpu 0 iter : 1 Arret : 1.21972E-05 s/iter 4.327451 +gpu 0 iter : 2 Arret : 1.18497E-05 s/iter 4.328801 +gpu 0 iter : 3 Arret : 1.14287E-05 s/iter 4.326593 +gpu 0 iter : 4 Arret : 1.14892E-05 s/iter 4.327311 +gpu 0 iter : 5 Arret : 1.16344E-05 s/iter 4.327558 +gpu 0 iter : 6 Arret : 1.24439E-05 s/iter 4.325758 +gpu 0 iter : 7 Arret : 1.30094E-05 s/iter 4.327196 +gpu 0 iter : 8 Arret : 1.57289E-05 s/iter 4.325790 +gpu 0 iter : 9 Arret : 2.86271E-05 s/iter 4.325443 +gpu 0 iter : 10 Arret : 0.000543962 s/iter 4.327012 +gpu 0 iter : 11 Arret : 0.00145339 s/iter 4.325004 +gpu 0 iter : 12 Arret : 1.7939 s/iter 4.326489 +gpu 0 iter : 13 Arret : 0.533681 s/iter 4.324580 +gpu 0 iter : 14 Arret : 0.706956 s/iter 5.153741 +gpu 0 iter : 15 Arret : 0.0614646 s/iter 5.142447 +gpu 0 iter : 16 Arret : 0.0230012 s/iter 5.125435 +gpu 0 iter : 17 Arret : 0.00620497 s/iter 4.284011 +gpu 0 iter : 18 Arret : 0.00210797 s/iter 4.270133 +gpu 0 iter : 19 Arret : 0.00110036 s/iter 4.266432 +gpu 0 iter : 20 Arret : 0.000623092 s/iter 4.271061 +gpu 0 iter : 21 Arret : 0.000386689 s/iter 4.258397 +gpu 0 iter : 22 Arret : 0.00169576 s/iter 4.255822 +gpu 0 iter : 23 Arret : 0.0018211 s/iter 4.243791 +gpu 0 iter : 24 Arret : 0.000306093 s/iter 4.250944 +gpu 0 iter : 25 Arret : 5.98974E-05 s/iter 4.247305 +gpu 0 iter : 26 Arret : 4.79522E-05 s/iter 4.244456 +gpu 0 iter : 27 Arret : 2.55686E-05 s/iter 4.265305 +gpu 0 iter : 28 Arret : 9.95609E-06 s/iter 4.237758 +gpu 0 iter : 29 Arret : 5.32771E-07 s/iter 4.256034 +gpu 0 iter : 30 Arret : 1.63124E-10 s/iter 4.257015 +gpu 0 iter : 31 Arret : 1.44755E-15 s/iter 4.243120 +temps : 136.465 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.64385E-09 +Stabilite : 1.37327E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540465 +i* 0.841367| 1| 1.87479E-13 +i*-5.02237E-14| +| 2| 0.176081 +i* -0.984376| 1|-5.37799E-14 +i* 6.92554E-14| +| 3| -0.852009 +i* -0.523527| 1| 3.18461E-14 +i* 4.03913E-14| +| 4| -0.79862 +i* 0.601836| 1| 5.14346E-14 +i* 3.91354E-14| +| 5| 0.980657 +i* -0.195736| 1| 6.46188E-13 +i*-7.37166E-13| +| 6| 0.268452 +i* 0.963293| 1|-8.54421E-14 +i* 3.23248E-14| +| 7| 0.458412 +i* -0.88874| 1| 2.7818E-14 +i* 6.11247E-14| +| 8| -0.659841 +i* -0.751405| 1|-6.41605E-14 +i*-6.23928E-14| +| 9| 0.994783 +i* 0.102018| 1| 6.80962E-13 +i*-1.84925E-12| +| 10| -0.940535 +i* 0.339697| 1| 2.92266E-14 +i* 1.23877E-14| +| 11| -0.0274147 +i* 0.999624| 1|-2.15418E-14 +i* -6.3281E-14| +| 12| 0.70001 +i* -0.714133| 1| 5.4335E-14 +i* -1.5535E-13| +| 13| 0.920515 +i* 0.390707| 1|-2.49037E-13 +i*-1.72111E-13| +| 14| -0.409041 +i* -0.912516| 1|-2.16806E-14 +i*-1.57877E-14| +| 15| -0.998877 +i* 0.047373| 1|-3.52392E-14 +i*-1.99354E-14| +| 16| -0.320845 +i* 0.947132| 1| 1.35437E-13 +i* 4.41019E-14| +| 17| 0.764454 +i* 0.644679| 1|-2.19425E-13 +i* -1.9223E-13| +| 18| 0.879407 +i* -0.47607| 1| 3.13968E-13 +i*-3.31275E-13| +| 19| -0.121864 +i* -0.992547| 1| 1.45647E-13 +i* 1.68268E-16| +| 20| -0.968462 +i* -0.24916| 1| 5.32629E-14 +i* 1.07952E-14| ++---+----------------------------+------------+----------------------------+ +200000 racines de module = 1 +zone limite de 'log-exp' 1.00089 +CPU thread 1 (of 2) uses CUDA device 1 +CPU thread 0 (of 2) uses CUDA device 0 +gpu 0 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 0 dimgrid2 782 start 0 size 200064 +gpu 1 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 1 dimgrid2 782 start 200064 size 200064 +gpu 0 iter : 1 Arret : 5.94484E-06 s/iter 17.057815 +gpu 0 iter : 2 Arret : 5.92537E-06 s/iter 17.005169 +gpu 0 iter : 3 Arret : 5.74413E-06 s/iter 17.007141 +gpu 0 iter : 4 Arret : 5.92275E-06 s/iter 17.027536 +gpu 0 iter : 5 Arret : 5.93915E-06 s/iter 17.012176 +gpu 0 iter : 6 Arret : 5.90525E-06 s/iter 16.985779 +gpu 0 iter : 7 Arret : 5.94978E-06 s/iter 17.018302 +gpu 0 iter : 8 Arret : 6.191E-06 s/iter 17.004448 +gpu 0 iter : 9 Arret : 6.3237E-06 s/iter 17.002791 +gpu 0 iter : 10 Arret : 1.57957E-05 s/iter 17.007149 +gpu 0 iter : 11 Arret : 0.00173253 s/iter 16.988073 +gpu 0 iter : 12 Arret : 0.00576526 s/iter 17.188808 +gpu 0 iter : 13 Arret : 0.00490441 s/iter 17.078098 +gpu 0 iter : 14 Arret : 0.0136849 s/iter 17.088044 +gpu 0 iter : 15 Arret : 1.53569 s/iter 21.726923 +gpu 0 iter : 16 Arret : 0.714931 s/iter 19.519499 +gpu 0 iter : 17 Arret : 0.105859 s/iter 20.538553 +gpu 0 iter : 18 Arret : 0.0748796 s/iter 21.335769 +gpu 0 iter : 19 Arret : 0.051079 s/iter 20.554353 +gpu 0 iter : 20 Arret : 0.0359769 s/iter 21.367481 +gpu 0 iter : 21 Arret : 0.111166 s/iter 18.581125 +gpu 0 iter : 22 Arret : 0.154418 s/iter 16.808041 +gpu 0 iter : 23 Arret : 0.0583836 s/iter 21.831216 +gpu 0 iter : 24 Arret : 0.0179636 s/iter 18.796732 +gpu 0 iter : 25 Arret : 0.0125988 s/iter 20.543469 +gpu 0 iter : 26 Arret : 0.0281888 s/iter 16.905579 +gpu 0 iter : 27 Arret : 0.0767977 s/iter 17.046640 +gpu 0 iter : 28 Arret : 0.200845 s/iter 19.345275 +gpu 0 iter : 29 Arret : 0.413856 s/iter 16.933703 +gpu 0 iter : 30 Arret : 0.0209415 s/iter 16.868628 +gpu 0 iter : 31 Arret : 0.00722393 s/iter 16.918768 +gpu 0 iter : 32 Arret : 0.000890817 s/iter 16.871308 +gpu 0 iter : 33 Arret : 0.000258155 s/iter 16.808999 +gpu 0 iter : 34 Arret : 1.5274E-05 s/iter 16.862227 +gpu 0 iter : 35 Arret : 8.86275E-06 s/iter 16.885301 +gpu 0 iter : 36 Arret : 1.5192E-05 s/iter 16.877196 +gpu 0 iter : 37 Arret : 6.0864E-06 s/iter 16.848153 +gpu 0 iter : 38 Arret : 1.18965E-07 s/iter 16.804611 +gpu 0 iter : 39 Arret : 2.01826E-12 s/iter 16.797437 +gpu 0 iter : 40 Arret : 1.11022E-16 s/iter 16.815375 +temps : 716.812 seconde(s) +Nb iterations : 40 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.12974E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540383 +i* 0.841419| 1| 1.25143E-14 +i* 6.97793E-14| +| 2| -0.98885 +i* 0.148913| 1|-1.87034E-13 +i*-1.52024E-13| +| 3| 0.412505 +i* -0.910956| 1|-2.05679E-13 +i* 8.74266E-14| +| 4| 0.268615 +i* -0.963248| 1| 1.23929E-14 +i* 2.02841E-14| +| 5| -0.954531 +i* 0.298113| 1| 6.68562E-14 +i* 8.87016E-14| +| 6| 0.769061 +i* 0.639176| 1|-1.82375E-13 +i* 1.0897E-12| +| 7| 0.11843 +i* -0.992962| 1| -1.5522E-13 +i* 8.29944E-14| +| 8| -0.897838 +i* 0.440326| 1|-2.57121E-14 +i* 6.84192E-14| +| 9| 0.857616 +i* 0.51429| 1|-4.74988E-13 +i*-1.42508E-14| +| 10| -0.0345309 +i* -0.999404| 1|-3.27058E-13 +i* 9.31755E-14| +| 11| 0.662491 +i* 0.74907| 1| 5.75581E-15 +i*-3.34004E-14| +| 12| -0.820101 +i* 0.572218| 1|-4.91863E-14 +i*-2.00555E-13| +| 13| -0.186683 +i* -0.98242| 1| -1.8106E-13 +i* 3.61083E-14| +| 14| 0.926094 +i* 0.377292| 1|-5.15376E-13 +i* 7.96363E-13| +| 15| -0.723143 +i* 0.690699| 1|-1.75058E-13 +i* 1.33799E-14| +| 16| -0.334459 +i* -0.94241| 1| 2.20716E-13 +i*-8.68958E-14| +| 17| 0.972834 +i* 0.231505| 1| 3.9433E-13 +i*-1.27901E-14| +| 18| -0.609235 +i* 0.79299| 1|-8.90538E-14 +i* 1.42372E-13| +| 19| -0.474396 +i* -0.880312| 1| 2.76109E-13 +i* 7.19095E-14| +| 20| 0.99677 +i* 0.0803066| 1| 1.32664E-12 +i*-5.68624E-12| ++---+----------------------------+------------+----------------------------+ +400000 racines de module = 1 +zone limite de 'log-exp' 1.00059 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 1172 start 300032 size 300032 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 1172 start 0 size 300032 +gpu 0 iter : 1 Arret : 4.6999E-06 s/iter 37.313393 +gpu 0 iter : 2 Arret : 4.61211E-06 s/iter 37.199898 +gpu 0 iter : 3 Arret : 4.94232E-06 s/iter 37.196508 +gpu 0 iter : 4 Arret : 5.06404E-06 s/iter 37.291584 +gpu 0 iter : 5 Arret : 4.61546E-06 s/iter 37.202708 +gpu 0 iter : 6 Arret : 4.74158E-06 s/iter 37.200857 +gpu 0 iter : 7 Arret : 4.88982E-06 s/iter 37.276950 +gpu 0 iter : 8 Arret : 4.31859E-06 s/iter 37.262072 +gpu 0 iter : 9 Arret : 5.22739E-06 s/iter 37.253123 +gpu 0 iter : 10 Arret : 0.000130977 s/iter 37.254715 +gpu 0 iter : 11 Arret : 0.00041028 s/iter 37.194791 +gpu 0 iter : 12 Arret : 0.000623887 s/iter 37.318498 +gpu 0 iter : 13 Arret : 1.78898 s/iter 37.254605 +gpu 0 iter : 14 Arret : 0.0673819 s/iter 37.266139 +gpu 0 iter : 15 Arret : 0.0472277 s/iter 38.530516 +gpu 0 iter : 16 Arret : 0.030634 s/iter 37.174736 +gpu 0 iter : 17 Arret : 0.018818 s/iter 37.025610 +gpu 0 iter : 18 Arret : 0.0120862 s/iter 36.938528 +gpu 0 iter : 19 Arret : 0.00824809 s/iter 40.395626 +gpu 0 iter : 20 Arret : 0.00588075 s/iter 36.954404 +gpu 0 iter : 21 Arret : 0.00447832 s/iter 37.105898 +gpu 0 iter : 22 Arret : 0.00350155 s/iter 37.014229 +gpu 0 iter : 23 Arret : 0.00654542 s/iter 37.161474 +gpu 0 iter : 24 Arret : 0.0134571 s/iter 37.742687 +gpu 0 iter : 25 Arret : 0.0780491 s/iter 37.521204 +gpu 0 iter : 26 Arret : 0.0332669 s/iter 37.456467 +gpu 0 iter : 27 Arret : 0.00587749 s/iter 37.241220 +gpu 0 iter : 28 Arret : 0.0127476 s/iter 37.329206 +gpu 0 iter : 29 Arret : 0.0122203 s/iter 37.210345 +gpu 0 iter : 30 Arret : 0.00587852 s/iter 37.185516 +gpu 0 iter : 31 Arret : 0.0344622 s/iter 37.308553 +gpu 0 iter : 32 Arret : 0.0186991 s/iter 37.281719 +gpu 0 iter : 33 Arret : 0.00503143 s/iter 37.356625 +gpu 0 iter : 34 Arret : 0.00367461 s/iter 37.018488 +gpu 0 iter : 35 Arret : 0.00234557 s/iter 36.973784 +gpu 0 iter : 36 Arret : 0.000768482 s/iter 37.070586 +gpu 0 iter : 37 Arret : 0.000303551 s/iter 36.869699 +gpu 0 iter : 38 Arret : 0.000225245 s/iter 37.079451 +gpu 0 iter : 39 Arret : 0.000745948 s/iter 36.872638 +gpu 0 iter : 40 Arret : 4.12409E-05 s/iter 36.883019 +gpu 0 iter : 41 Arret : 2.49694E-05 s/iter 36.926393 +gpu 0 iter : 42 Arret : 9.2154E-06 s/iter 37.059010 +gpu 0 iter : 43 Arret : 1.44835E-06 s/iter 36.872101 +gpu 0 iter : 44 Arret : 2.90428E-08 s/iter 37.076104 +gpu 0 iter : 45 Arret : 2.43246E-13 s/iter 36.981771 +temps : 1678.41 seconde(s) +Nb iterations : 45 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.996672 +i* 0.0815122| 1|-4.60361E-14 +i*-1.54911E-15| +| 3| 0.396458 +i* -0.918053| 1|-3.61742E-13 +i* 4.28426E-13| +| 4| -0.983009 +i* 0.183558| 1| 2.27839E-14 +i* 1.21547E-13| +| 5| 0.299962 +i* -0.953951| 1| 3.10155E-13 +i*-4.52272E-13| +| 6| 0.701062 +i* 0.7131| 1| 6.08482E-13 +i* 3.68603E-13| +| 7| -0.958925 +i* 0.283658| 1|-3.43857E-14 +i*-4.33108E-14| +| 8| 0.200287 +i* -0.979737| 1| 4.39829E-13 +i*-3.61119E-13| +| 9| 0.770667 +i* 0.637238| 1| -2.7036E-13 +i*-8.38747E-13| +| 10| -0.924677 +i* 0.380752| 1| 1.44957E-13 +i* 1.13251E-13| +| 11| 0.0984885 +i* -0.995138| 1| 3.5235E-13 +i*-2.31698E-13| +| 12| 0.832104 +i* 0.55462| 1| 8.49546E-13 +i* -8.3842E-13| +| 13| -0.880627 +i* 0.473809| 1|-9.58227E-14 +i* -1.6529E-13| +| 14| -0.0043537 +i* -0.999991| 1| 1.63446E-13 +i*-5.45449E-14| +| 15| 0.88472 +i* 0.466123| 1| -6.8268E-13 +i* -3.8889E-13| +| 16| 0.624025 +i* 0.781404| 1| 9.47506E-15 +i*-6.78554E-13| +| 17| -0.827231 +i* 0.561862| 1| 3.25472E-13 +i* 1.93899E-13| +| 18| -0.10715 +i* -0.994243| 1| 3.32474E-13 +i*-4.57395E-14| +| 19| 0.927958 +i* 0.372686| 1| 1.0255E-13 +i* 1.0692E-13| +| 20| -0.76509 +i* 0.643924| 1| 2.51882E-15 +i*-2.49661E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +zone limite de 'log-exp' 1.00044 +CPU thread 1 (of 2) uses CUDA device 1 +CPU thread 0 (of 2) uses CUDA device 0 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 1563 start 0 size 400000 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 1563 start 400000 size 400000 +gpu 0 iter : 1 Arret : 2.97022E-06 s/iter 66.087244 +gpu 0 iter : 2 Arret : 3.74348E-06 s/iter 65.802142 +gpu 0 iter : 3 Arret : 2.96662E-06 s/iter 65.920112 +gpu 0 iter : 4 Arret : 2.97125E-06 s/iter 65.980555 +gpu 0 iter : 5 Arret : 2.96707E-06 s/iter 65.949526 +gpu 0 iter : 6 Arret : 3.02716E-06 s/iter 66.021381 +gpu 0 iter : 7 Arret : 2.97561E-06 s/iter 65.922781 +gpu 0 iter : 8 Arret : 3.18042E-06 s/iter 65.987064 +gpu 0 iter : 9 Arret : 3.76916E-06 s/iter 66.059465 +gpu 0 iter : 10 Arret : 6.64283E-06 s/iter 66.062157 +gpu 0 iter : 11 Arret : 0.000184939 s/iter 66.074614 +gpu 0 iter : 12 Arret : 0.00113173 s/iter 66.196432 +gpu 0 iter : 13 Arret : 0.75738 s/iter 66.106674 +gpu 0 iter : 14 Arret : 0.957228 s/iter 65.895454 +gpu 0 iter : 15 Arret : 2.3861 s/iter 68.828840 +gpu 0 iter : 16 Arret : 0.0351307 s/iter 69.377122 +gpu 0 iter : 17 Arret : 0.00895093 s/iter 65.983080 +gpu 0 iter : 18 Arret : 0.00109369 s/iter 72.736098 +gpu 0 iter : 19 Arret : 0.00106938 s/iter 65.849790 +gpu 0 iter : 20 Arret : 0.0006038 s/iter 65.737084 +gpu 0 iter : 21 Arret : 0.000521615 s/iter 65.668256 +gpu 0 iter : 22 Arret : 0.000188695 s/iter 65.742637 +gpu 0 iter : 23 Arret : 0.000484126 s/iter 65.703178 +gpu 0 iter : 24 Arret : 0.000502331 s/iter 65.740277 +gpu 0 iter : 25 Arret : 0.000122768 s/iter 65.782861 +gpu 0 iter : 26 Arret : 2.91772E-05 s/iter 65.801943 +gpu 0 iter : 27 Arret : 1.10661E-05 s/iter 65.604207 +gpu 0 iter : 28 Arret : 7.78588E-06 s/iter 65.895470 +gpu 0 iter : 29 Arret : 1.31457E-06 s/iter 65.723774 +gpu 0 iter : 30 Arret : 2.21556E-08 s/iter 65.693485 +gpu 0 iter : 31 Arret : 1.26249E-13 s/iter 65.705821 +temps : 2056.91 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 1.26249E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| -0.942555 +i* -0.334052| 1| 2.1929E-13 +i*-2.49686E-13| +| 3| -0.558601 +i* 0.829437| 1|-3.51628E-14 +i*-4.09232E-13| +| 4| -0.0665975 +i* -0.99778| 1|-3.91888E-13 +i* 9.06636E-14| +| 5| 0.949627 +i* -0.313383| 1|-1.12544E-12 +i* 2.13597E-12| +| 6| -0.982852 +i* -0.184398| 1| 3.90184E-13 +i* -1.1725E-14| +| 7| 0.889798 +i* -0.456354| 1| 1.27488E-12 +i* 5.17779E-13| +| 8| -0.423729 +i* 0.905789| 1|-7.25461E-15 +i*-1.33088E-14| +| 9| -0.219973 +i* -0.975506| 1| 4.34097E-13 +i*-4.24712E-14| +| 10| 0.771464 +i* 0.636273| 1| -4.4266E-13 +i*-2.07773E-13| +| 11| -0.999541 +i* -0.0303078| 1| 3.54265E-14 +i* 1.32862E-14| +| 12| 0.808597 +i* -0.588363| 1|-5.90212E-13 +i*-1.43182E-12| +| 13| 0.663883 +i* 0.747836| 1| 4.13159E-13 +i* 1.10149E-12| +| 14| -0.27868 +i* 0.960384| 1|-1.03539E-13 +i*-1.45998E-13| +| 15| -0.368064 +i* -0.929801| 1| 4.60916E-14 +i*-1.09841E-13| +| 16| -0.992219 +i* 0.124503| 1| 2.74294E-13 +i* 2.11383E-13| +| 17| 0.707973 +i* -0.706239| 1|-1.10575E-12 +i*-7.41631E-13| +| 18| 0.860514 +i* 0.509426| 1| 9.86579E-13 +i* 1.10532E-12| +| 19| -0.126936 +i* 0.991911| 1| 1.67744E-13 +i* 5.51772E-13| +| 20| -0.507314 +i* -0.861761| 1| 5.50185E-14 +i* 3.42273E-13| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 +zone limite de 'log-exp' 1.00035 +CPU thread 1 (of 2) uses CUDA device 1 +CPU thread 0 (of 2) uses CUDA device 0 +gpu 1 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 1 dimgrid2 1954 start 500096 size 500096 +gpu 0 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 0 dimgrid2 1954 start 0 size 500096 +gpu 0 iter : 1 Arret : 2.94731E-06 s/iter 102.732772 +gpu 0 iter : 2 Arret : 3.05081E-06 s/iter 102.843725 +gpu 0 iter : 3 Arret : 3.02796E-06 s/iter 102.640965 +gpu 0 iter : 4 Arret : 2.95782E-06 s/iter 102.653967 +gpu 0 iter : 5 Arret : 2.56925E-06 s/iter 102.649656 +gpu 0 iter : 6 Arret : 2.71245E-06 s/iter 102.688581 +gpu 0 iter : 7 Arret : 2.67546E-06 s/iter 102.677506 +gpu 0 iter : 8 Arret : 2.93452E-06 s/iter 102.648119 +gpu 0 iter : 9 Arret : 3.44573E-06 s/iter 102.623089 +gpu 0 iter : 10 Arret : 4.80208E-06 s/iter 102.787478 +gpu 0 iter : 11 Arret : 8.94492E-05 s/iter 102.642135 +gpu 0 iter : 12 Arret : 0.000113514 s/iter 102.696405 +gpu 0 iter : 13 Arret : 0.0413548 s/iter 102.645274 +gpu 0 iter : 14 Arret : 1.35231 s/iter 102.638889 +gpu 0 iter : 15 Arret : 0.218731 s/iter 105.058576 +gpu 0 iter : 16 Arret : 0.0914886 s/iter 105.240190 +gpu 0 iter : 17 Arret : 0.0521127 s/iter 104.928961 +gpu 0 iter : 18 Arret : 0.0335715 s/iter 115.056330 +gpu 0 iter : 19 Arret : 0.0228248 s/iter 115.271436 +gpu 0 iter : 20 Arret : 0.0335467 s/iter 105.716331 +gpu 0 iter : 21 Arret : 1.29299 s/iter 117.813180 +gpu 0 iter : 22 Arret : 0.639664 s/iter 118.012366 +gpu 0 iter : 23 Arret : 0.333285 s/iter 117.160199 +gpu 0 iter : 24 Arret : 0.0818296 s/iter 117.167589 +gpu 0 iter : 25 Arret : 0.0801346 s/iter 105.298720 +gpu 0 iter : 26 Arret : 0.0631355 s/iter 104.466518 +gpu 0 iter : 27 Arret : 0.0340934 s/iter 104.104847 +gpu 0 iter : 28 Arret : 0.681646 s/iter 104.037494 +gpu 0 iter : 29 Arret : 0.465431 s/iter 117.512319 +gpu 0 iter : 30 Arret : 0.298835 s/iter 103.821795 +gpu 0 iter : 31 Arret : 0.00351419 s/iter 103.489177 +gpu 0 iter : 32 Arret : 0.000864466 s/iter 116.712174 +gpu 0 iter : 33 Arret : 0.000214957 s/iter 103.493343 +gpu 0 iter : 34 Arret : 0.000148302 s/iter 103.592701 +gpu 0 iter : 35 Arret : 3.2437E-05 s/iter 103.513605 +gpu 0 iter : 36 Arret : 4.52266E-05 s/iter 103.356971 +gpu 0 iter : 37 Arret : 1.03998E-05 s/iter 103.617528 +gpu 0 iter : 38 Arret : 5.09091E-06 s/iter 103.526121 +gpu 0 iter : 39 Arret : 3.7292E-06 s/iter 103.546718 +gpu 0 iter : 40 Arret : 5.35044E-07 s/iter 103.922018 +gpu 0 iter : 41 Arret : 4.20397E-09 s/iter 103.482205 +gpu 0 iter : 42 Arret : 6.71777E-15 s/iter 103.673030 +temps : 4455.65 seconde(s) +Nb iterations : 42 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.80137E-07 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54034 +i* 0.841447| 1| 4.08253E-13 +i*-6.65317E-13| +| 2| -0.513915 +i* -0.857841| 1|-9.07486E-13 +i* 1.86417E-13| +| 3| 0.486982 +i* 0.873412| 1|-6.63601E-14 +i*-1.18344E-12| +| 4| -0.459589 +i* -0.888132| 1|-5.16153E-13 +i*-2.68006E-13| +| 5| 0.43174 +i* 0.901998| 1|-6.77361E-13 +i* 7.93272E-13| +| 6| -0.403485 +i* -0.914986| 1|-3.20004E-13 +i* 2.65225E-13| +| 7| 0.374828 +i* 0.927094| 1| 3.65041E-13 +i* 3.54812E-13| +| 8| -0.34582 +i* -0.938301| 1| -3.3851E-13 +i* 1.59258E-13| +| 9| 0.316466 +i* 0.948604| 1|-2.87419E-13 +i* 5.21678E-13| +| 10| -0.286812 +i* -0.957987| 1| 6.43516E-13 +i* 2.73696E-13| +| 11| 0.25688 +i* 0.966443| 1|-4.31814E-13 +i* 5.6624E-13| +| 12| -0.226699 +i* -0.973965| 1| 4.35089E-13 +i* -6.6197E-14| +| 13| 0.196299 +i* 0.980544| 1| 3.90278E-14 +i*-7.14062E-13| +| 14| -0.16571 +i* -0.986175| 1| 2.49276E-13 +i*-1.75918E-13| +| 15| 0.13496 +i* 0.990851| 1| 1.03566E-13 +i*-6.61428E-13| +| 16| -0.104079 +i* -0.994569| 1| 7.90108E-13 +i*-1.74942E-13| +| 17| 0.0730977 +i* 0.997325| 1| 1.11931E-13 +i* 4.68587E-13| +| 18| -0.0420456 +i* -0.999116| 1| 2.29268E-13 +i*-1.21795E-14| +| 19| 0.0109529 +i* 0.99994| 1|-2.47309E-13 +i*-7.90307E-13| +| 20| 0.0201504 +i* -0.999797| 1| 6.69503E-13 +i*-2.16847E-13| ++---+----------------------------+------------+----------------------------+ +1000000 racines de module = 1 +zone limite de 'log-exp' 1.0003 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 1 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 1 dimgrid2 2344 start 600064 size 600064 +gpu 0 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 0 dimgrid2 2344 start 0 size 600064 +gpu 0 iter : 1 Arret : 2.44684E-06 s/iter 147.702152 +gpu 0 iter : 2 Arret : 2.10878E-06 s/iter 147.782081 +gpu 0 iter : 3 Arret : 2.05128E-06 s/iter 147.808831 +gpu 0 iter : 4 Arret : 1.98115E-06 s/iter 147.750313 +gpu 0 iter : 5 Arret : 1.98739E-06 s/iter 147.944152 +gpu 0 iter : 6 Arret : 2.0117E-06 s/iter 147.921565 +gpu 0 iter : 7 Arret : 1.98746E-06 s/iter 147.932493 +gpu 0 iter : 8 Arret : 2.29692E-06 s/iter 147.976951 +gpu 0 iter : 9 Arret : 2.31674E-06 s/iter 147.798701 +gpu 0 iter : 10 Arret : 2.64613E-06 s/iter 147.944050 +gpu 0 iter : 11 Arret : 2.65583E-05 s/iter 147.896073 +gpu 0 iter : 12 Arret : 0.00125155 s/iter 147.939067 +gpu 0 iter : 13 Arret : 0.00119101 s/iter 148.040908 +gpu 0 iter : 14 Arret : 0.001522 s/iter 148.794269 +gpu 0 iter : 15 Arret : 0.00804167 s/iter 160.863284 +gpu 0 iter : 16 Arret : 1.3178 s/iter 161.088149 +gpu 0 iter : 17 Arret : 0.0515059 s/iter 160.853214 +gpu 0 iter : 18 Arret : 0.0362208 s/iter 159.671026 +gpu 0 iter : 19 Arret : 0.0248425 s/iter 158.567943 +gpu 0 iter : 20 Arret : 0.0167257 s/iter 149.166188 +gpu 0 iter : 21 Arret : 0.127462 s/iter 166.296276 +gpu 0 iter : 22 Arret : 0.163762 s/iter 166.569107 +gpu 0 iter : 23 Arret : 0.0719382 s/iter 166.686464 +gpu 0 iter : 24 Arret : 0.0374022 s/iter 168.683200 +gpu 0 iter : 25 Arret : 0.0173532 s/iter 166.375173 +gpu 0 iter : 26 Arret : 0.254433 s/iter 167.257077 +gpu 0 iter : 27 Arret : 0.102685 s/iter 147.935462 +gpu 0 iter : 28 Arret : 0.0763967 s/iter 147.480570 +gpu 0 iter : 29 Arret : 0.0328496 s/iter 147.287576 +gpu 0 iter : 30 Arret : 0.000947375 s/iter 147.250547 +gpu 0 iter : 31 Arret : 0.000512767 s/iter 147.251333 +gpu 0 iter : 32 Arret : 0.000577297 s/iter 147.329319 +gpu 0 iter : 33 Arret : 0.000408862 s/iter 147.414464 +gpu 0 iter : 34 Arret : 4.17915E-05 s/iter 147.305507 +gpu 0 iter : 35 Arret : 1.97858E-07 s/iter 147.287049 +gpu 0 iter : 36 Arret : 1.9156E-13 s/iter 147.242774 +temps : 5498.65 seconde(s) +Nb iterations : 36 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.34152E-07 +Stabilite : 1.9156E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.841451| 1|-1.40868E-12 +i*-1.55069E-13| +| 2| -0.583871 +i* 0.811846| 1| 5.87586E-14 +i* 2.63177E-13| +| 3| 0.0263196 +i* -0.999654| 1| 9.89594E-13 +i*-3.85265E-13| +| 4| -0.969647 +i* -0.244511| 1|-5.84047E-14 +i*-6.69829E-14| +| 5| 0.939323 +i* -0.343035| 1| 7.60725E-13 +i* 1.68227E-12| +| 6| -0.129097 +i* -0.991632| 1| -2.278E-13 +i*-2.09967E-13| +| 7| -0.450842 +i* 0.892604| 1| 3.34819E-13 +i* 5.30987E-13| +| 8| 0.874726 +i* -0.484618| 1| 6.94573E-13 +i* 1.33379E-12| +| 9| -0.995841 +i* -0.0911079| 1| 6.65572E-13 +i* 2.21578E-13| +| 10| 0.772266 +i* 0.635299| 1|-1.10511E-12 +i*-6.88458E-13| +| 11| -0.281387 +i* -0.959594| 1|-6.93022E-14 +i* 4.40275E-13| +| 12| -0.306893 +i* 0.951744| 1| 1.0443E-15 +i* 1.24753E-13| +| 13| 0.788944 +i* -0.614465| 1| -2.2269E-12 +i*-9.13604E-13| +| 14| -0.997918 +i* 0.0645018| 1| 2.81913E-13 +i* 2.2426E-13| +| 15| 0.861482 +i* 0.507788| 1| 2.41178E-12 +i* 5.79845E-13| +| 16| -0.426862 +i* -0.904317| 1| 6.20323E-13 +i* 5.74424E-13| +| 17| 0.664347 +i* 0.747424| 1| 4.99219E-13 +i* 1.52752E-12| +| 18| -0.155512 +i* 0.987834| 1| 2.30305E-13 +i* 4.37822E-13| +| 19| -0.975826 +i* 0.218549| 1| 1.82913E-13 +i* 5.28258E-14| +| 20| 0.684055 +i* -0.72943| 1|-1.32506E-12 +i*-1.70394E-12| ++---+----------------------------+------------+----------------------------+ +1200000 racines de module = 1 +zone limite de 'log-exp' 1.00025 +CPU thread 1 (of 2) uses CUDA device 1 +CPU thread 0 (of 2) uses CUDA device 0 +gpu 0 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 0 dimgrid2 2735 start 0 size 700032 +gpu 1 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 1 dimgrid2 2735 start 700032 size 700032 +gpu 0 iter : 1 Arret : 2.07918E-06 s/iter 200.785971 +gpu 0 iter : 2 Arret : 2.14654E-06 s/iter 200.847374 +gpu 0 iter : 3 Arret : 2.09733E-06 s/iter 200.966795 +gpu 0 iter : 4 Arret : 2.17414E-06 s/iter 200.742012 +gpu 0 iter : 5 Arret : 2.14915E-06 s/iter 200.888842 +gpu 0 iter : 6 Arret : 1.73848E-06 s/iter 201.043988 +gpu 0 iter : 7 Arret : 1.7679E-06 s/iter 201.346581 +gpu 0 iter : 8 Arret : 1.75688E-06 s/iter 201.213462 +gpu 0 iter : 9 Arret : 2.09733E-06 s/iter 200.837430 +gpu 0 iter : 10 Arret : 2.37165E-06 s/iter 200.784259 +gpu 0 iter : 11 Arret : 2.03214E-05 s/iter 200.752392 +gpu 0 iter : 12 Arret : 0.000682738 s/iter 200.690430 +gpu 0 iter : 13 Arret : 0.00122186 s/iter 200.708074 +gpu 0 iter : 14 Arret : 0.00275961 s/iter 201.044696 +gpu 0 iter : 15 Arret : 0.00833316 s/iter 212.473429 +gpu 0 iter : 16 Arret : 0.00960814 s/iter 220.623179 +gpu 0 iter : 17 Arret : 0.00894371 s/iter 218.919552 +gpu 0 iter : 18 Arret : 0.0200361 s/iter 219.943687 +gpu 0 iter : 19 Arret : 0.00844372 s/iter 218.952200 +gpu 0 iter : 20 Arret : 0.029693 s/iter 218.757398 +gpu 0 iter : 21 Arret : 0.53477 s/iter 211.752218 +gpu 0 iter : 22 Arret : 0.0210435 s/iter 219.038056 +gpu 0 iter : 23 Arret : 0.0210357 s/iter 202.148847 +gpu 0 iter : 24 Arret : 0.0100972 s/iter 200.483076 +gpu 0 iter : 25 Arret : 0.00218231 s/iter 199.870622 +gpu 0 iter : 26 Arret : 7.97101E-05 s/iter 199.797464 +gpu 0 iter : 27 Arret : 0.000160077 s/iter 200.323425 +gpu 0 iter : 28 Arret : 0.000253845 s/iter 199.948448 +gpu 0 iter : 29 Arret : 1.67041E-05 s/iter 200.118545 +gpu 0 iter : 30 Arret : 3.98407E-05 s/iter 199.961802 +gpu 0 iter : 31 Arret : 3.20727E-05 s/iter 200.252811 +gpu 0 iter : 32 Arret : 1.71338E-08 s/iter 200.171925 +gpu 0 iter : 33 Arret : 7.14435E-15 s/iter 200.023251 +temps : 6757.87 seconde(s) +Nb iterations : 33 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.63785E-07 +Stabilite : 7.14435E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540329 +i* 0.841454| 1| 4.3987E-13 +i* 1.7418E-12| +| 2| -0.0530086 +i* 0.998594| 1| 3.8728E-13 +i* 8.41422E-13| +| 3| -0.626376 +i* 0.779521| 1| 2.93654E-14 +i*-2.95439E-13| +| 4| -0.96376 +i* 0.26677| 1|-1.31943E-13 +i* 5.03167E-13| +| 5| -0.938055 +i* -0.346485| 1| 6.12451E-13 +i*-2.34033E-13| +| 6| -0.558945 +i* -0.829205| 1| 2.12923E-13 +i* 6.04209E-13| +| 7| 0.0307435 +i* -0.999527| 1|-3.70079E-13 +i* 1.04685E-13| +| 8| 0.60885 +i* -0.793286| 1| -1.5142E-12 +i* 2.45191E-13| +| 9| 0.957578 +i* -0.288175| 1|-3.17266E-12 +i* 2.02057E-12| +| 10| 0.945542 +i* 0.325501| 1|-1.50276E-12 +i* 3.84538E-13| +| 11| -0.00847209 +i* 0.999964| 1| 8.68958E-14 +i* 2.94643E-13| +| 12| -0.591029 +i* 0.80665| 1|-5.75824E-14 +i*-8.87086E-13| +| 13| -0.95092 +i* 0.309437| 1|-6.93591E-13 +i*-5.52411E-13| +| 14| -0.952559 +i* -0.304354| 1|-3.04982E-13 +i* 1.60452E-13| +| 15| -0.595328 +i* -0.803482| 1|-1.05039E-12 +i* 2.37501E-13| +| 16| -0.0138125 +i* -0.999905| 1|-8.72476E-13 +i* 2.69644E-13| +| 17| 0.572907 +i* -0.81962| 1| 1.32405E-12 +i*-6.73803E-13| +| 18| 0.94379 +i* -0.330546| 1|-1.85401E-12 +i* 2.58533E-12| +| 19| 0.959103 +i* 0.283057| 1|-2.75633E-12 +i* 3.49955E-12| +| 20| 0.613081 +i* 0.79002| 1| 4.49453E-13 +i*-4.47541E-14| ++---+----------------------------+------------+----------------------------+ +1400000 racines de module = 1 diff --git a/Simulations/full_openmp_bis/full_openmp_2GPU.o140354~ b/Simulations/full_openmp_bis/full_openmp_2GPU.o140354~ new file mode 100644 index 0000000..b443ef7 --- /dev/null +++ b/Simulations/full_openmp_bis/full_openmp_2GPU.o140354~ @@ -0,0 +1,593 @@ +REMAINING: 2 +Taking GPU #2 +Taking GPU #3 +zone limite de 'log-exp' 1.00356 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 0 dimgrid2 196 start 0 size 50048 +gpu 1 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 1 dimgrid2 196 start 50048 size 50048 +gpu 0 iter : 1 Arret : 2.5392E-05 s/iter 1.227021 +gpu 0 iter : 2 Arret : 2.59923E-05 s/iter 1.226750 +gpu 0 iter : 3 Arret : 2.47588E-05 s/iter 1.226783 +gpu 0 iter : 4 Arret : 2.53721E-05 s/iter 1.226649 +gpu 0 iter : 5 Arret : 2.5768E-05 s/iter 1.226634 +gpu 0 iter : 6 Arret : 2.48396E-05 s/iter 1.226693 +gpu 0 iter : 7 Arret : 2.76062E-05 s/iter 1.226668 +gpu 0 iter : 8 Arret : 3.59957E-05 s/iter 1.226645 +gpu 0 iter : 9 Arret : 0.000362414 s/iter 1.226815 +gpu 0 iter : 10 Arret : 0.000438012 s/iter 1.226710 +gpu 0 iter : 11 Arret : 0.00158759 s/iter 1.226730 +gpu 0 iter : 12 Arret : 0.24777 s/iter 1.226734 +gpu 0 iter : 13 Arret : 1.53158 s/iter 2.168072 +gpu 0 iter : 14 Arret : 0.00387914 s/iter 2.141910 +gpu 0 iter : 15 Arret : 0.0028678 s/iter 2.126936 +gpu 0 iter : 16 Arret : 0.00228624 s/iter 2.099248 +gpu 0 iter : 17 Arret : 0.00181064 s/iter 2.101025 +gpu 0 iter : 18 Arret : 0.00157799 s/iter 1.985627 +gpu 0 iter : 19 Arret : 0.00145605 s/iter 1.977177 +gpu 0 iter : 20 Arret : 0.00140844 s/iter 1.961196 +gpu 0 iter : 21 Arret : 0.00253228 s/iter 0.894142 +gpu 0 iter : 22 Arret : 0.0332674 s/iter 0.893625 +gpu 0 iter : 23 Arret : 0.00414247 s/iter 0.888148 +gpu 0 iter : 24 Arret : 0.025916 s/iter 1.976938 +gpu 0 iter : 25 Arret : 0.00757988 s/iter 1.974905 +gpu 0 iter : 26 Arret : 0.00188449 s/iter 0.898490 +gpu 0 iter : 27 Arret : 0.000748859 s/iter 0.894305 +gpu 0 iter : 28 Arret : 0.000523018 s/iter 0.887614 +gpu 0 iter : 29 Arret : 0.000199226 s/iter 0.881339 +gpu 0 iter : 30 Arret : 0.000179502 s/iter 0.887366 +gpu 0 iter : 31 Arret : 0.000108553 s/iter 0.893577 +gpu 0 iter : 32 Arret : 3.9397E-05 s/iter 0.882608 +gpu 0 iter : 33 Arret : 9.99937E-06 s/iter 0.893968 +gpu 0 iter : 34 Arret : 3.14055E-07 s/iter 0.880895 +gpu 0 iter : 35 Arret : 8.35537E-12 s/iter 0.878925 +gpu 0 iter : 36 Arret : 1.57009E-16 s/iter 0.896426 +temps : 48.6545 seconde(s) +Nb iterations : 36 +Nb de depassements de capacite exponentielle : 0 +Precision : 8.34887E-10 +Stabilite : 0 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540601 +i* 0.841279| 1| -4.3885E-14 +i*-7.30839E-15| +| 2| -0.281748 +i* -0.959489| 1|-5.73395E-14 +i*-4.24574E-14| +| 3|-4.71234E-05 +i* 1| 1| 1.01308E-15 +i* 1.94116E-15| +| 4| 0.281778 +i* -0.95948| 1|-1.23963E-14 +i* 1.02314E-14| +| 5| -0.54068 +i* 0.841228| 1| 5.53932E-14 +i*-7.48533E-15| +| 6| 0.75578 +i* -0.654825| 1|-1.78253E-13 +i* 5.35631E-14| +| 7| -0.909652 +i* 0.415372| 1|-2.24577E-14 +i*-2.99309E-14| +| 8| 0.989828 +i* -0.142268| 1|-4.88647E-13 +i* 2.69096E-13| +| 9| -0.989815 +i* -0.142361| 1| 4.10505E-14 +i* 1.22957E-14| +| 10| 0.909612 +i* 0.415458| 1|-9.85774E-14 +i* 2.25852E-13| +| 11| -0.755719 +i* -0.654896| 1|-4.50195E-14 +i* 3.70867E-14| +| 12| 0.540548 +i* 0.841313| 1| 1.15279E-13 +i*-6.26114E-14| +| 13| -0.281687 +i* -0.959506| 1| 6.72067E-14 +i*-1.86153E-14| +| 14|-0.000109955 +i* 1| 1| 1.76317E-14 +i* 5.4734E-14| +| 15| 0.281838 +i* -0.959462| 1|-5.44356E-14 +i* 4.87822E-14| +| 16| -0.540733 +i* 0.841194| 1| 1.93526E-14 +i* 3.41446E-14| +| 17| 0.755822 +i* -0.654778| 1| 1.41439E-13 +i* 1.77344E-13| +| 18| -0.909678 +i* 0.415315| 1| 3.90799E-14 +i* 2.50217E-14| +| 19| 0.989837 +i* -0.142206| 1| 1.87558E-13 +i*-4.17969E-13| +| 20| -0.989806 +i* -0.142424| 1|-4.45512E-14 +i*-1.49828E-14| ++---+----------------------------+------------+----------------------------+ +100000 racines de module = 1 +zone limite de 'log-exp' 1.00178 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 1 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 1 dimgrid2 391 start 100096 size 100096 +gpu 0 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 0 dimgrid2 391 start 0 size 100096 +gpu 0 iter : 1 Arret : 1.21972E-05 s/iter 4.327451 +gpu 0 iter : 2 Arret : 1.18497E-05 s/iter 4.328801 +gpu 0 iter : 3 Arret : 1.14287E-05 s/iter 4.326593 +gpu 0 iter : 4 Arret : 1.14892E-05 s/iter 4.327311 +gpu 0 iter : 5 Arret : 1.16344E-05 s/iter 4.327558 +gpu 0 iter : 6 Arret : 1.24439E-05 s/iter 4.325758 +gpu 0 iter : 7 Arret : 1.30094E-05 s/iter 4.327196 +gpu 0 iter : 8 Arret : 1.57289E-05 s/iter 4.325790 +gpu 0 iter : 9 Arret : 2.86271E-05 s/iter 4.325443 +gpu 0 iter : 10 Arret : 0.000543962 s/iter 4.327012 +gpu 0 iter : 11 Arret : 0.00145339 s/iter 4.325004 +gpu 0 iter : 12 Arret : 1.7939 s/iter 4.326489 +gpu 0 iter : 13 Arret : 0.533681 s/iter 4.324580 +gpu 0 iter : 14 Arret : 0.706956 s/iter 5.153741 +gpu 0 iter : 15 Arret : 0.0614646 s/iter 5.142447 +gpu 0 iter : 16 Arret : 0.0230012 s/iter 5.125435 +gpu 0 iter : 17 Arret : 0.00620497 s/iter 4.284011 +gpu 0 iter : 18 Arret : 0.00210797 s/iter 4.270133 +gpu 0 iter : 19 Arret : 0.00110036 s/iter 4.266432 +gpu 0 iter : 20 Arret : 0.000623092 s/iter 4.271061 +gpu 0 iter : 21 Arret : 0.000386689 s/iter 4.258397 +gpu 0 iter : 22 Arret : 0.00169576 s/iter 4.255822 +gpu 0 iter : 23 Arret : 0.0018211 s/iter 4.243791 +gpu 0 iter : 24 Arret : 0.000306093 s/iter 4.250944 +gpu 0 iter : 25 Arret : 5.98974E-05 s/iter 4.247305 +gpu 0 iter : 26 Arret : 4.79522E-05 s/iter 4.244456 +gpu 0 iter : 27 Arret : 2.55686E-05 s/iter 4.265305 +gpu 0 iter : 28 Arret : 9.95609E-06 s/iter 4.237758 +gpu 0 iter : 29 Arret : 5.32771E-07 s/iter 4.256034 +gpu 0 iter : 30 Arret : 1.63124E-10 s/iter 4.257015 +gpu 0 iter : 31 Arret : 1.44755E-15 s/iter 4.243120 +temps : 136.465 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.64385E-09 +Stabilite : 1.37327E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540465 +i* 0.841367| 1| 1.87479E-13 +i*-5.02237E-14| +| 2| 0.176081 +i* -0.984376| 1|-5.37799E-14 +i* 6.92554E-14| +| 3| -0.852009 +i* -0.523527| 1| 3.18461E-14 +i* 4.03913E-14| +| 4| -0.79862 +i* 0.601836| 1| 5.14346E-14 +i* 3.91354E-14| +| 5| 0.980657 +i* -0.195736| 1| 6.46188E-13 +i*-7.37166E-13| +| 6| 0.268452 +i* 0.963293| 1|-8.54421E-14 +i* 3.23248E-14| +| 7| 0.458412 +i* -0.88874| 1| 2.7818E-14 +i* 6.11247E-14| +| 8| -0.659841 +i* -0.751405| 1|-6.41605E-14 +i*-6.23928E-14| +| 9| 0.994783 +i* 0.102018| 1| 6.80962E-13 +i*-1.84925E-12| +| 10| -0.940535 +i* 0.339697| 1| 2.92266E-14 +i* 1.23877E-14| +| 11| -0.0274147 +i* 0.999624| 1|-2.15418E-14 +i* -6.3281E-14| +| 12| 0.70001 +i* -0.714133| 1| 5.4335E-14 +i* -1.5535E-13| +| 13| 0.920515 +i* 0.390707| 1|-2.49037E-13 +i*-1.72111E-13| +| 14| -0.409041 +i* -0.912516| 1|-2.16806E-14 +i*-1.57877E-14| +| 15| -0.998877 +i* 0.047373| 1|-3.52392E-14 +i*-1.99354E-14| +| 16| -0.320845 +i* 0.947132| 1| 1.35437E-13 +i* 4.41019E-14| +| 17| 0.764454 +i* 0.644679| 1|-2.19425E-13 +i* -1.9223E-13| +| 18| 0.879407 +i* -0.47607| 1| 3.13968E-13 +i*-3.31275E-13| +| 19| -0.121864 +i* -0.992547| 1| 1.45647E-13 +i* 1.68268E-16| +| 20| -0.968462 +i* -0.24916| 1| 5.32629E-14 +i* 1.07952E-14| ++---+----------------------------+------------+----------------------------+ +200000 racines de module = 1 +zone limite de 'log-exp' 1.00089 +CPU thread 1 (of 2) uses CUDA device 1 +CPU thread 0 (of 2) uses CUDA device 0 +gpu 0 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 0 dimgrid2 782 start 0 size 200064 +gpu 1 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 1 dimgrid2 782 start 200064 size 200064 +gpu 0 iter : 1 Arret : 5.94484E-06 s/iter 17.057815 +gpu 0 iter : 2 Arret : 5.92537E-06 s/iter 17.005169 +gpu 0 iter : 3 Arret : 5.74413E-06 s/iter 17.007141 +gpu 0 iter : 4 Arret : 5.92275E-06 s/iter 17.027536 +gpu 0 iter : 5 Arret : 5.93915E-06 s/iter 17.012176 +gpu 0 iter : 6 Arret : 5.90525E-06 s/iter 16.985779 +gpu 0 iter : 7 Arret : 5.94978E-06 s/iter 17.018302 +gpu 0 iter : 8 Arret : 6.191E-06 s/iter 17.004448 +gpu 0 iter : 9 Arret : 6.3237E-06 s/iter 17.002791 +gpu 0 iter : 10 Arret : 1.57957E-05 s/iter 17.007149 +gpu 0 iter : 11 Arret : 0.00173253 s/iter 16.988073 +gpu 0 iter : 12 Arret : 0.00576526 s/iter 17.188808 +gpu 0 iter : 13 Arret : 0.00490441 s/iter 17.078098 +gpu 0 iter : 14 Arret : 0.0136849 s/iter 17.088044 +gpu 0 iter : 15 Arret : 1.53569 s/iter 21.726923 +gpu 0 iter : 16 Arret : 0.714931 s/iter 19.519499 +gpu 0 iter : 17 Arret : 0.105859 s/iter 20.538553 +gpu 0 iter : 18 Arret : 0.0748796 s/iter 21.335769 +gpu 0 iter : 19 Arret : 0.051079 s/iter 20.554353 +gpu 0 iter : 20 Arret : 0.0359769 s/iter 21.367481 +gpu 0 iter : 21 Arret : 0.111166 s/iter 18.581125 +gpu 0 iter : 22 Arret : 0.154418 s/iter 16.808041 +gpu 0 iter : 23 Arret : 0.0583836 s/iter 21.831216 +gpu 0 iter : 24 Arret : 0.0179636 s/iter 18.796732 +gpu 0 iter : 25 Arret : 0.0125988 s/iter 20.543469 +gpu 0 iter : 26 Arret : 0.0281888 s/iter 16.905579 +gpu 0 iter : 27 Arret : 0.0767977 s/iter 17.046640 +gpu 0 iter : 28 Arret : 0.200845 s/iter 19.345275 +gpu 0 iter : 29 Arret : 0.413856 s/iter 16.933703 +gpu 0 iter : 30 Arret : 0.0209415 s/iter 16.868628 +gpu 0 iter : 31 Arret : 0.00722393 s/iter 16.918768 +gpu 0 iter : 32 Arret : 0.000890817 s/iter 16.871308 +gpu 0 iter : 33 Arret : 0.000258155 s/iter 16.808999 +gpu 0 iter : 34 Arret : 1.5274E-05 s/iter 16.862227 +gpu 0 iter : 35 Arret : 8.86275E-06 s/iter 16.885301 +gpu 0 iter : 36 Arret : 1.5192E-05 s/iter 16.877196 +gpu 0 iter : 37 Arret : 6.0864E-06 s/iter 16.848153 +gpu 0 iter : 38 Arret : 1.18965E-07 s/iter 16.804611 +gpu 0 iter : 39 Arret : 2.01826E-12 s/iter 16.797437 +gpu 0 iter : 40 Arret : 1.11022E-16 s/iter 16.815375 +temps : 716.812 seconde(s) +Nb iterations : 40 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.12974E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540383 +i* 0.841419| 1| 1.25143E-14 +i* 6.97793E-14| +| 2| -0.98885 +i* 0.148913| 1|-1.87034E-13 +i*-1.52024E-13| +| 3| 0.412505 +i* -0.910956| 1|-2.05679E-13 +i* 8.74266E-14| +| 4| 0.268615 +i* -0.963248| 1| 1.23929E-14 +i* 2.02841E-14| +| 5| -0.954531 +i* 0.298113| 1| 6.68562E-14 +i* 8.87016E-14| +| 6| 0.769061 +i* 0.639176| 1|-1.82375E-13 +i* 1.0897E-12| +| 7| 0.11843 +i* -0.992962| 1| -1.5522E-13 +i* 8.29944E-14| +| 8| -0.897838 +i* 0.440326| 1|-2.57121E-14 +i* 6.84192E-14| +| 9| 0.857616 +i* 0.51429| 1|-4.74988E-13 +i*-1.42508E-14| +| 10| -0.0345309 +i* -0.999404| 1|-3.27058E-13 +i* 9.31755E-14| +| 11| 0.662491 +i* 0.74907| 1| 5.75581E-15 +i*-3.34004E-14| +| 12| -0.820101 +i* 0.572218| 1|-4.91863E-14 +i*-2.00555E-13| +| 13| -0.186683 +i* -0.98242| 1| -1.8106E-13 +i* 3.61083E-14| +| 14| 0.926094 +i* 0.377292| 1|-5.15376E-13 +i* 7.96363E-13| +| 15| -0.723143 +i* 0.690699| 1|-1.75058E-13 +i* 1.33799E-14| +| 16| -0.334459 +i* -0.94241| 1| 2.20716E-13 +i*-8.68958E-14| +| 17| 0.972834 +i* 0.231505| 1| 3.9433E-13 +i*-1.27901E-14| +| 18| -0.609235 +i* 0.79299| 1|-8.90538E-14 +i* 1.42372E-13| +| 19| -0.474396 +i* -0.880312| 1| 2.76109E-13 +i* 7.19095E-14| +| 20| 0.99677 +i* 0.0803066| 1| 1.32664E-12 +i*-5.68624E-12| ++---+----------------------------+------------+----------------------------+ +400000 racines de module = 1 +zone limite de 'log-exp' 1.00059 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 1172 start 300032 size 300032 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 1172 start 0 size 300032 +gpu 0 iter : 1 Arret : 4.6999E-06 s/iter 37.313393 +gpu 0 iter : 2 Arret : 4.61211E-06 s/iter 37.199898 +gpu 0 iter : 3 Arret : 4.94232E-06 s/iter 37.196508 +gpu 0 iter : 4 Arret : 5.06404E-06 s/iter 37.291584 +gpu 0 iter : 5 Arret : 4.61546E-06 s/iter 37.202708 +gpu 0 iter : 6 Arret : 4.74158E-06 s/iter 37.200857 +gpu 0 iter : 7 Arret : 4.88982E-06 s/iter 37.276950 +gpu 0 iter : 8 Arret : 4.31859E-06 s/iter 37.262072 +gpu 0 iter : 9 Arret : 5.22739E-06 s/iter 37.253123 +gpu 0 iter : 10 Arret : 0.000130977 s/iter 37.254715 +gpu 0 iter : 11 Arret : 0.00041028 s/iter 37.194791 +gpu 0 iter : 12 Arret : 0.000623887 s/iter 37.318498 +gpu 0 iter : 13 Arret : 1.78898 s/iter 37.254605 +gpu 0 iter : 14 Arret : 0.0673819 s/iter 37.266139 +gpu 0 iter : 15 Arret : 0.0472277 s/iter 38.530516 +gpu 0 iter : 16 Arret : 0.030634 s/iter 37.174736 +gpu 0 iter : 17 Arret : 0.018818 s/iter 37.025610 +gpu 0 iter : 18 Arret : 0.0120862 s/iter 36.938528 +gpu 0 iter : 19 Arret : 0.00824809 s/iter 40.395626 +gpu 0 iter : 20 Arret : 0.00588075 s/iter 36.954404 +gpu 0 iter : 21 Arret : 0.00447832 s/iter 37.105898 +gpu 0 iter : 22 Arret : 0.00350155 s/iter 37.014229 +gpu 0 iter : 23 Arret : 0.00654542 s/iter 37.161474 +gpu 0 iter : 24 Arret : 0.0134571 s/iter 37.742687 +gpu 0 iter : 25 Arret : 0.0780491 s/iter 37.521204 +gpu 0 iter : 26 Arret : 0.0332669 s/iter 37.456467 +gpu 0 iter : 27 Arret : 0.00587749 s/iter 37.241220 +gpu 0 iter : 28 Arret : 0.0127476 s/iter 37.329206 +gpu 0 iter : 29 Arret : 0.0122203 s/iter 37.210345 +gpu 0 iter : 30 Arret : 0.00587852 s/iter 37.185516 +gpu 0 iter : 31 Arret : 0.0344622 s/iter 37.308553 +gpu 0 iter : 32 Arret : 0.0186991 s/iter 37.281719 +gpu 0 iter : 33 Arret : 0.00503143 s/iter 37.356625 +gpu 0 iter : 34 Arret : 0.00367461 s/iter 37.018488 +gpu 0 iter : 35 Arret : 0.00234557 s/iter 36.973784 +gpu 0 iter : 36 Arret : 0.000768482 s/iter 37.070586 +gpu 0 iter : 37 Arret : 0.000303551 s/iter 36.869699 +gpu 0 iter : 38 Arret : 0.000225245 s/iter 37.079451 +gpu 0 iter : 39 Arret : 0.000745948 s/iter 36.872638 +gpu 0 iter : 40 Arret : 4.12409E-05 s/iter 36.883019 +gpu 0 iter : 41 Arret : 2.49694E-05 s/iter 36.926393 +gpu 0 iter : 42 Arret : 9.2154E-06 s/iter 37.059010 +gpu 0 iter : 43 Arret : 1.44835E-06 s/iter 36.872101 +gpu 0 iter : 44 Arret : 2.90428E-08 s/iter 37.076104 +gpu 0 iter : 45 Arret : 2.43246E-13 s/iter 36.981771 +temps : 1678.41 seconde(s) +Nb iterations : 45 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.996672 +i* 0.0815122| 1|-4.60361E-14 +i*-1.54911E-15| +| 3| 0.396458 +i* -0.918053| 1|-3.61742E-13 +i* 4.28426E-13| +| 4| -0.983009 +i* 0.183558| 1| 2.27839E-14 +i* 1.21547E-13| +| 5| 0.299962 +i* -0.953951| 1| 3.10155E-13 +i*-4.52272E-13| +| 6| 0.701062 +i* 0.7131| 1| 6.08482E-13 +i* 3.68603E-13| +| 7| -0.958925 +i* 0.283658| 1|-3.43857E-14 +i*-4.33108E-14| +| 8| 0.200287 +i* -0.979737| 1| 4.39829E-13 +i*-3.61119E-13| +| 9| 0.770667 +i* 0.637238| 1| -2.7036E-13 +i*-8.38747E-13| +| 10| -0.924677 +i* 0.380752| 1| 1.44957E-13 +i* 1.13251E-13| +| 11| 0.0984885 +i* -0.995138| 1| 3.5235E-13 +i*-2.31698E-13| +| 12| 0.832104 +i* 0.55462| 1| 8.49546E-13 +i* -8.3842E-13| +| 13| -0.880627 +i* 0.473809| 1|-9.58227E-14 +i* -1.6529E-13| +| 14| -0.0043537 +i* -0.999991| 1| 1.63446E-13 +i*-5.45449E-14| +| 15| 0.88472 +i* 0.466123| 1| -6.8268E-13 +i* -3.8889E-13| +| 16| 0.624025 +i* 0.781404| 1| 9.47506E-15 +i*-6.78554E-13| +| 17| -0.827231 +i* 0.561862| 1| 3.25472E-13 +i* 1.93899E-13| +| 18| -0.10715 +i* -0.994243| 1| 3.32474E-13 +i*-4.57395E-14| +| 19| 0.927958 +i* 0.372686| 1| 1.0255E-13 +i* 1.0692E-13| +| 20| -0.76509 +i* 0.643924| 1| 2.51882E-15 +i*-2.49661E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +zone limite de 'log-exp' 1.00044 +CPU thread 1 (of 2) uses CUDA device 1 +CPU thread 0 (of 2) uses CUDA device 0 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 1563 start 0 size 400000 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 1563 start 400000 size 400000 +gpu 0 iter : 1 Arret : 2.97022E-06 s/iter 66.087244 +gpu 0 iter : 2 Arret : 3.74348E-06 s/iter 65.802142 +gpu 0 iter : 3 Arret : 2.96662E-06 s/iter 65.920112 +gpu 0 iter : 4 Arret : 2.97125E-06 s/iter 65.980555 +gpu 0 iter : 5 Arret : 2.96707E-06 s/iter 65.949526 +gpu 0 iter : 6 Arret : 3.02716E-06 s/iter 66.021381 +gpu 0 iter : 7 Arret : 2.97561E-06 s/iter 65.922781 +gpu 0 iter : 8 Arret : 3.18042E-06 s/iter 65.987064 +gpu 0 iter : 9 Arret : 3.76916E-06 s/iter 66.059465 +gpu 0 iter : 10 Arret : 6.64283E-06 s/iter 66.062157 +gpu 0 iter : 11 Arret : 0.000184939 s/iter 66.074614 +gpu 0 iter : 12 Arret : 0.00113173 s/iter 66.196432 +gpu 0 iter : 13 Arret : 0.75738 s/iter 66.106674 +gpu 0 iter : 14 Arret : 0.957228 s/iter 65.895454 +gpu 0 iter : 15 Arret : 2.3861 s/iter 68.828840 +gpu 0 iter : 16 Arret : 0.0351307 s/iter 69.377122 +gpu 0 iter : 17 Arret : 0.00895093 s/iter 65.983080 +gpu 0 iter : 18 Arret : 0.00109369 s/iter 72.736098 +gpu 0 iter : 19 Arret : 0.00106938 s/iter 65.849790 +gpu 0 iter : 20 Arret : 0.0006038 s/iter 65.737084 +gpu 0 iter : 21 Arret : 0.000521615 s/iter 65.668256 +gpu 0 iter : 22 Arret : 0.000188695 s/iter 65.742637 +gpu 0 iter : 23 Arret : 0.000484126 s/iter 65.703178 +gpu 0 iter : 24 Arret : 0.000502331 s/iter 65.740277 +gpu 0 iter : 25 Arret : 0.000122768 s/iter 65.782861 +gpu 0 iter : 26 Arret : 2.91772E-05 s/iter 65.801943 +gpu 0 iter : 27 Arret : 1.10661E-05 s/iter 65.604207 +gpu 0 iter : 28 Arret : 7.78588E-06 s/iter 65.895470 +gpu 0 iter : 29 Arret : 1.31457E-06 s/iter 65.723774 +gpu 0 iter : 30 Arret : 2.21556E-08 s/iter 65.693485 +gpu 0 iter : 31 Arret : 1.26249E-13 s/iter 65.705821 +temps : 2056.91 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 1.26249E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| -0.942555 +i* -0.334052| 1| 2.1929E-13 +i*-2.49686E-13| +| 3| -0.558601 +i* 0.829437| 1|-3.51628E-14 +i*-4.09232E-13| +| 4| -0.0665975 +i* -0.99778| 1|-3.91888E-13 +i* 9.06636E-14| +| 5| 0.949627 +i* -0.313383| 1|-1.12544E-12 +i* 2.13597E-12| +| 6| -0.982852 +i* -0.184398| 1| 3.90184E-13 +i* -1.1725E-14| +| 7| 0.889798 +i* -0.456354| 1| 1.27488E-12 +i* 5.17779E-13| +| 8| -0.423729 +i* 0.905789| 1|-7.25461E-15 +i*-1.33088E-14| +| 9| -0.219973 +i* -0.975506| 1| 4.34097E-13 +i*-4.24712E-14| +| 10| 0.771464 +i* 0.636273| 1| -4.4266E-13 +i*-2.07773E-13| +| 11| -0.999541 +i* -0.0303078| 1| 3.54265E-14 +i* 1.32862E-14| +| 12| 0.808597 +i* -0.588363| 1|-5.90212E-13 +i*-1.43182E-12| +| 13| 0.663883 +i* 0.747836| 1| 4.13159E-13 +i* 1.10149E-12| +| 14| -0.27868 +i* 0.960384| 1|-1.03539E-13 +i*-1.45998E-13| +| 15| -0.368064 +i* -0.929801| 1| 4.60916E-14 +i*-1.09841E-13| +| 16| -0.992219 +i* 0.124503| 1| 2.74294E-13 +i* 2.11383E-13| +| 17| 0.707973 +i* -0.706239| 1|-1.10575E-12 +i*-7.41631E-13| +| 18| 0.860514 +i* 0.509426| 1| 9.86579E-13 +i* 1.10532E-12| +| 19| -0.126936 +i* 0.991911| 1| 1.67744E-13 +i* 5.51772E-13| +| 20| -0.507314 +i* -0.861761| 1| 5.50185E-14 +i* 3.42273E-13| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 +zone limite de 'log-exp' 1.00035 +CPU thread 1 (of 2) uses CUDA device 1 +CPU thread 0 (of 2) uses CUDA device 0 +gpu 1 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 1 dimgrid2 1954 start 500096 size 500096 +gpu 0 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 0 dimgrid2 1954 start 0 size 500096 +gpu 0 iter : 1 Arret : 2.94731E-06 s/iter 102.732772 +gpu 0 iter : 2 Arret : 3.05081E-06 s/iter 102.843725 +gpu 0 iter : 3 Arret : 3.02796E-06 s/iter 102.640965 +gpu 0 iter : 4 Arret : 2.95782E-06 s/iter 102.653967 +gpu 0 iter : 5 Arret : 2.56925E-06 s/iter 102.649656 +gpu 0 iter : 6 Arret : 2.71245E-06 s/iter 102.688581 +gpu 0 iter : 7 Arret : 2.67546E-06 s/iter 102.677506 +gpu 0 iter : 8 Arret : 2.93452E-06 s/iter 102.648119 +gpu 0 iter : 9 Arret : 3.44573E-06 s/iter 102.623089 +gpu 0 iter : 10 Arret : 4.80208E-06 s/iter 102.787478 +gpu 0 iter : 11 Arret : 8.94492E-05 s/iter 102.642135 +gpu 0 iter : 12 Arret : 0.000113514 s/iter 102.696405 +gpu 0 iter : 13 Arret : 0.0413548 s/iter 102.645274 +gpu 0 iter : 14 Arret : 1.35231 s/iter 102.638889 +gpu 0 iter : 15 Arret : 0.218731 s/iter 105.058576 +gpu 0 iter : 16 Arret : 0.0914886 s/iter 105.240190 +gpu 0 iter : 17 Arret : 0.0521127 s/iter 104.928961 +gpu 0 iter : 18 Arret : 0.0335715 s/iter 115.056330 +gpu 0 iter : 19 Arret : 0.0228248 s/iter 115.271436 +gpu 0 iter : 20 Arret : 0.0335467 s/iter 105.716331 +gpu 0 iter : 21 Arret : 1.29299 s/iter 117.813180 +gpu 0 iter : 22 Arret : 0.639664 s/iter 118.012366 +gpu 0 iter : 23 Arret : 0.333285 s/iter 117.160199 +gpu 0 iter : 24 Arret : 0.0818296 s/iter 117.167589 +gpu 0 iter : 25 Arret : 0.0801346 s/iter 105.298720 +gpu 0 iter : 26 Arret : 0.0631355 s/iter 104.466518 +gpu 0 iter : 27 Arret : 0.0340934 s/iter 104.104847 +gpu 0 iter : 28 Arret : 0.681646 s/iter 104.037494 +gpu 0 iter : 29 Arret : 0.465431 s/iter 117.512319 +gpu 0 iter : 30 Arret : 0.298835 s/iter 103.821795 +gpu 0 iter : 31 Arret : 0.00351419 s/iter 103.489177 +gpu 0 iter : 32 Arret : 0.000864466 s/iter 116.712174 +gpu 0 iter : 33 Arret : 0.000214957 s/iter 103.493343 +gpu 0 iter : 34 Arret : 0.000148302 s/iter 103.592701 +gpu 0 iter : 35 Arret : 3.2437E-05 s/iter 103.513605 +gpu 0 iter : 36 Arret : 4.52266E-05 s/iter 103.356971 +gpu 0 iter : 37 Arret : 1.03998E-05 s/iter 103.617528 +gpu 0 iter : 38 Arret : 5.09091E-06 s/iter 103.526121 +gpu 0 iter : 39 Arret : 3.7292E-06 s/iter 103.546718 +gpu 0 iter : 40 Arret : 5.35044E-07 s/iter 103.922018 +gpu 0 iter : 41 Arret : 4.20397E-09 s/iter 103.482205 +gpu 0 iter : 42 Arret : 6.71777E-15 s/iter 103.673030 +temps : 4455.65 seconde(s) +Nb iterations : 42 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.80137E-07 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54034 +i* 0.841447| 1| 4.08253E-13 +i*-6.65317E-13| +| 2| -0.513915 +i* -0.857841| 1|-9.07486E-13 +i* 1.86417E-13| +| 3| 0.486982 +i* 0.873412| 1|-6.63601E-14 +i*-1.18344E-12| +| 4| -0.459589 +i* -0.888132| 1|-5.16153E-13 +i*-2.68006E-13| +| 5| 0.43174 +i* 0.901998| 1|-6.77361E-13 +i* 7.93272E-13| +| 6| -0.403485 +i* -0.914986| 1|-3.20004E-13 +i* 2.65225E-13| +| 7| 0.374828 +i* 0.927094| 1| 3.65041E-13 +i* 3.54812E-13| +| 8| -0.34582 +i* -0.938301| 1| -3.3851E-13 +i* 1.59258E-13| +| 9| 0.316466 +i* 0.948604| 1|-2.87419E-13 +i* 5.21678E-13| +| 10| -0.286812 +i* -0.957987| 1| 6.43516E-13 +i* 2.73696E-13| +| 11| 0.25688 +i* 0.966443| 1|-4.31814E-13 +i* 5.6624E-13| +| 12| -0.226699 +i* -0.973965| 1| 4.35089E-13 +i* -6.6197E-14| +| 13| 0.196299 +i* 0.980544| 1| 3.90278E-14 +i*-7.14062E-13| +| 14| -0.16571 +i* -0.986175| 1| 2.49276E-13 +i*-1.75918E-13| +| 15| 0.13496 +i* 0.990851| 1| 1.03566E-13 +i*-6.61428E-13| +| 16| -0.104079 +i* -0.994569| 1| 7.90108E-13 +i*-1.74942E-13| +| 17| 0.0730977 +i* 0.997325| 1| 1.11931E-13 +i* 4.68587E-13| +| 18| -0.0420456 +i* -0.999116| 1| 2.29268E-13 +i*-1.21795E-14| +| 19| 0.0109529 +i* 0.99994| 1|-2.47309E-13 +i*-7.90307E-13| +| 20| 0.0201504 +i* -0.999797| 1| 6.69503E-13 +i*-2.16847E-13| ++---+----------------------------+------------+----------------------------+ +1000000 racines de module = 1 +zone limite de 'log-exp' 1.0003 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 1 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 1 dimgrid2 2344 start 600064 size 600064 +gpu 0 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 0 dimgrid2 2344 start 0 size 600064 +gpu 0 iter : 1 Arret : 2.44684E-06 s/iter 147.702152 +gpu 0 iter : 2 Arret : 2.10878E-06 s/iter 147.782081 +gpu 0 iter : 3 Arret : 2.05128E-06 s/iter 147.808831 +gpu 0 iter : 4 Arret : 1.98115E-06 s/iter 147.750313 +gpu 0 iter : 5 Arret : 1.98739E-06 s/iter 147.944152 +gpu 0 iter : 6 Arret : 2.0117E-06 s/iter 147.921565 +gpu 0 iter : 7 Arret : 1.98746E-06 s/iter 147.932493 +gpu 0 iter : 8 Arret : 2.29692E-06 s/iter 147.976951 +gpu 0 iter : 9 Arret : 2.31674E-06 s/iter 147.798701 +gpu 0 iter : 10 Arret : 2.64613E-06 s/iter 147.944050 +gpu 0 iter : 11 Arret : 2.65583E-05 s/iter 147.896073 +gpu 0 iter : 12 Arret : 0.00125155 s/iter 147.939067 +gpu 0 iter : 13 Arret : 0.00119101 s/iter 148.040908 +gpu 0 iter : 14 Arret : 0.001522 s/iter 148.794269 +gpu 0 iter : 15 Arret : 0.00804167 s/iter 160.863284 +gpu 0 iter : 16 Arret : 1.3178 s/iter 161.088149 +gpu 0 iter : 17 Arret : 0.0515059 s/iter 160.853214 +gpu 0 iter : 18 Arret : 0.0362208 s/iter 159.671026 +gpu 0 iter : 19 Arret : 0.0248425 s/iter 158.567943 +gpu 0 iter : 20 Arret : 0.0167257 s/iter 149.166188 +gpu 0 iter : 21 Arret : 0.127462 s/iter 166.296276 +gpu 0 iter : 22 Arret : 0.163762 s/iter 166.569107 +gpu 0 iter : 23 Arret : 0.0719382 s/iter 166.686464 +gpu 0 iter : 24 Arret : 0.0374022 s/iter 168.683200 +gpu 0 iter : 25 Arret : 0.0173532 s/iter 166.375173 +gpu 0 iter : 26 Arret : 0.254433 s/iter 167.257077 +gpu 0 iter : 27 Arret : 0.102685 s/iter 147.935462 +gpu 0 iter : 28 Arret : 0.0763967 s/iter 147.480570 +gpu 0 iter : 29 Arret : 0.0328496 s/iter 147.287576 +gpu 0 iter : 30 Arret : 0.000947375 s/iter 147.250547 +gpu 0 iter : 31 Arret : 0.000512767 s/iter 147.251333 +gpu 0 iter : 32 Arret : 0.000577297 s/iter 147.329319 +gpu 0 iter : 33 Arret : 0.000408862 s/iter 147.414464 +gpu 0 iter : 34 Arret : 4.17915E-05 s/iter 147.305507 +gpu 0 iter : 35 Arret : 1.97858E-07 s/iter 147.287049 +gpu 0 iter : 36 Arret : 1.9156E-13 s/iter 147.242774 +temps : 5498.65 seconde(s) +Nb iterations : 36 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.34152E-07 +Stabilite : 1.9156E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.841451| 1|-1.40868E-12 +i*-1.55069E-13| +| 2| -0.583871 +i* 0.811846| 1| 5.87586E-14 +i* 2.63177E-13| +| 3| 0.0263196 +i* -0.999654| 1| 9.89594E-13 +i*-3.85265E-13| +| 4| -0.969647 +i* -0.244511| 1|-5.84047E-14 +i*-6.69829E-14| +| 5| 0.939323 +i* -0.343035| 1| 7.60725E-13 +i* 1.68227E-12| +| 6| -0.129097 +i* -0.991632| 1| -2.278E-13 +i*-2.09967E-13| +| 7| -0.450842 +i* 0.892604| 1| 3.34819E-13 +i* 5.30987E-13| +| 8| 0.874726 +i* -0.484618| 1| 6.94573E-13 +i* 1.33379E-12| +| 9| -0.995841 +i* -0.0911079| 1| 6.65572E-13 +i* 2.21578E-13| +| 10| 0.772266 +i* 0.635299| 1|-1.10511E-12 +i*-6.88458E-13| +| 11| -0.281387 +i* -0.959594| 1|-6.93022E-14 +i* 4.40275E-13| +| 12| -0.306893 +i* 0.951744| 1| 1.0443E-15 +i* 1.24753E-13| +| 13| 0.788944 +i* -0.614465| 1| -2.2269E-12 +i*-9.13604E-13| +| 14| -0.997918 +i* 0.0645018| 1| 2.81913E-13 +i* 2.2426E-13| +| 15| 0.861482 +i* 0.507788| 1| 2.41178E-12 +i* 5.79845E-13| +| 16| -0.426862 +i* -0.904317| 1| 6.20323E-13 +i* 5.74424E-13| +| 17| 0.664347 +i* 0.747424| 1| 4.99219E-13 +i* 1.52752E-12| +| 18| -0.155512 +i* 0.987834| 1| 2.30305E-13 +i* 4.37822E-13| +| 19| -0.975826 +i* 0.218549| 1| 1.82913E-13 +i* 5.28258E-14| +| 20| 0.684055 +i* -0.72943| 1|-1.32506E-12 +i*-1.70394E-12| ++---+----------------------------+------------+----------------------------+ +1200000 racines de module = 1 +zone limite de 'log-exp' 1.00025 +CPU thread 1 (of 2) uses CUDA device 1 +CPU thread 0 (of 2) uses CUDA device 0 +gpu 0 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 0 dimgrid2 2735 start 0 size 700032 +gpu 1 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 1 dimgrid2 2735 start 700032 size 700032 +gpu 0 iter : 1 Arret : 2.07918E-06 s/iter 200.785971 +gpu 0 iter : 2 Arret : 2.14654E-06 s/iter 200.847374 +gpu 0 iter : 3 Arret : 2.09733E-06 s/iter 200.966795 +gpu 0 iter : 4 Arret : 2.17414E-06 s/iter 200.742012 +gpu 0 iter : 5 Arret : 2.14915E-06 s/iter 200.888842 +gpu 0 iter : 6 Arret : 1.73848E-06 s/iter 201.043988 +gpu 0 iter : 7 Arret : 1.7679E-06 s/iter 201.346581 +gpu 0 iter : 8 Arret : 1.75688E-06 s/iter 201.213462 +gpu 0 iter : 9 Arret : 2.09733E-06 s/iter 200.837430 +gpu 0 iter : 10 Arret : 2.37165E-06 s/iter 200.784259 +gpu 0 iter : 11 Arret : 2.03214E-05 s/iter 200.752392 +gpu 0 iter : 12 Arret : 0.000682738 s/iter 200.690430 +gpu 0 iter : 13 Arret : 0.00122186 s/iter 200.708074 +gpu 0 iter : 14 Arret : 0.00275961 s/iter 201.044696 +gpu 0 iter : 15 Arret : 0.00833316 s/iter 212.473429 +gpu 0 iter : 16 Arret : 0.00960814 s/iter 220.623179 +gpu 0 iter : 17 Arret : 0.00894371 s/iter 218.919552 +gpu 0 iter : 18 Arret : 0.0200361 s/iter 219.943687 +gpu 0 iter : 19 Arret : 0.00844372 s/iter 218.952200 +gpu 0 iter : 20 Arret : 0.029693 s/iter 218.757398 +gpu 0 iter : 21 Arret : 0.53477 s/iter 211.752218 +gpu 0 iter : 22 Arret : 0.0210435 s/iter 219.038056 +gpu 0 iter : 23 Arret : 0.0210357 s/iter 202.148847 +gpu 0 iter : 24 Arret : 0.0100972 s/iter 200.483076 +gpu 0 iter : 25 Arret : 0.00218231 s/iter 199.870622 +gpu 0 iter : 26 Arret : 7.97101E-05 s/iter 199.797464 +gpu 0 iter : 27 Arret : 0.000160077 s/iter 200.323425 +gpu 0 iter : 28 Arret : 0.000253845 s/iter 199.948448 +gpu 0 iter : 29 Arret : 1.67041E-05 s/iter 200.118545 +gpu 0 iter : 30 Arret : 3.98407E-05 s/iter 199.961802 +gpu 0 iter : 31 Arret : 3.20727E-05 s/iter 200.252811 +gpu 0 iter : 32 Arret : 1.71338E-08 s/iter 200.171925 +gpu 0 iter : 33 Arret : 7.14435E-15 s/iter 200.023251 +temps : 6757.87 seconde(s) +Nb iterations : 33 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.63785E-07 +Stabilite : 7.14435E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540329 +i* 0.841454| 1| 4.3987E-13 +i* 1.7418E-12| +| 2| -0.0530086 +i* 0.998594| 1| 3.8728E-13 +i* 8.41422E-13| +| 3| -0.626376 +i* 0.779521| 1| 2.93654E-14 +i*-2.95439E-13| +| 4| -0.96376 +i* 0.26677| 1|-1.31943E-13 +i* 5.03167E-13| +| 5| -0.938055 +i* -0.346485| 1| 6.12451E-13 +i*-2.34033E-13| +| 6| -0.558945 +i* -0.829205| 1| 2.12923E-13 +i* 6.04209E-13| +| 7| 0.0307435 +i* -0.999527| 1|-3.70079E-13 +i* 1.04685E-13| +| 8| 0.60885 +i* -0.793286| 1| -1.5142E-12 +i* 2.45191E-13| +| 9| 0.957578 +i* -0.288175| 1|-3.17266E-12 +i* 2.02057E-12| +| 10| 0.945542 +i* 0.325501| 1|-1.50276E-12 +i* 3.84538E-13| +| 11| -0.00847209 +i* 0.999964| 1| 8.68958E-14 +i* 2.94643E-13| +| 12| -0.591029 +i* 0.80665| 1|-5.75824E-14 +i*-8.87086E-13| +| 13| -0.95092 +i* 0.309437| 1|-6.93591E-13 +i*-5.52411E-13| +| 14| -0.952559 +i* -0.304354| 1|-3.04982E-13 +i* 1.60452E-13| +| 15| -0.595328 +i* -0.803482| 1|-1.05039E-12 +i* 2.37501E-13| +| 16| -0.0138125 +i* -0.999905| 1|-8.72476E-13 +i* 2.69644E-13| +| 17| 0.572907 +i* -0.81962| 1| 1.32405E-12 +i*-6.73803E-13| +| 18| 0.94379 +i* -0.330546| 1|-1.85401E-12 +i* 2.58533E-12| +| 19| 0.959103 +i* 0.283057| 1|-2.75633E-12 +i* 3.49955E-12| +| 20| 0.613081 +i* 0.79002| 1| 4.49453E-13 +i*-4.47541E-14| ++---+----------------------------+------------+----------------------------+ +1400000 racines de module = 1 diff --git a/Simulations/full_openmp_bis/full_openmp_3GPU.o140353 b/Simulations/full_openmp_bis/full_openmp_3GPU.o140353 new file mode 100644 index 0000000..abcf363 --- /dev/null +++ b/Simulations/full_openmp_bis/full_openmp_3GPU.o140353 @@ -0,0 +1,676 @@ +REMAINING: 3 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +zone limite de 'log-exp' 1.00356 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 2 (of 3) uses CUDA device 2 +gpu 1 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 1 dimgrid2 131 start 33365 size 33365 +gpu 2 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 2 dimgrid2 131 start 66730 size 33365 +gpu 0 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 0 dimgrid2 131 start 0 size 33365 +gpu 0 iter : 1 Arret : 2.36933E-05 s/iter 0.912105 +gpu 0 iter : 2 Arret : 2.25678E-05 s/iter 0.910489 +gpu 0 iter : 3 Arret : 2.27127E-05 s/iter 0.912053 +gpu 0 iter : 4 Arret : 2.30448E-05 s/iter 0.910005 +gpu 0 iter : 5 Arret : 2.36504E-05 s/iter 0.910131 +gpu 0 iter : 6 Arret : 2.48395E-05 s/iter 0.910253 +gpu 0 iter : 7 Arret : 2.76062E-05 s/iter 0.910741 +gpu 0 iter : 8 Arret : 3.59956E-05 s/iter 0.909947 +gpu 0 iter : 9 Arret : 0.000409875 s/iter 0.910245 +gpu 0 iter : 10 Arret : 0.000461544 s/iter 0.910290 +gpu 0 iter : 11 Arret : 0.00158737 s/iter 0.910149 +gpu 0 iter : 12 Arret : 0.247611 s/iter 0.910788 +gpu 0 iter : 13 Arret : 1.46429 s/iter 2.007602 +gpu 0 iter : 14 Arret : 0.0428258 s/iter 1.993064 +gpu 0 iter : 15 Arret : 0.0404824 s/iter 2.015318 +gpu 0 iter : 16 Arret : 0.0113811 s/iter 2.013062 +gpu 0 iter : 17 Arret : 0.00573837 s/iter 1.969456 +gpu 0 iter : 18 Arret : 0.00362863 s/iter 1.969720 +gpu 0 iter : 19 Arret : 0.0145957 s/iter 1.939594 +gpu 0 iter : 20 Arret : 0.0218949 s/iter 1.942380 +gpu 0 iter : 21 Arret : 0.0145668 s/iter 1.940447 +gpu 0 iter : 22 Arret : 0.00511795 s/iter 1.925449 +gpu 0 iter : 23 Arret : 0.00289866 s/iter 1.907045 +gpu 0 iter : 24 Arret : 0.0074939 s/iter 1.633175 +gpu 0 iter : 25 Arret : 0.0165795 s/iter 1.633093 +gpu 0 iter : 26 Arret : 0.00637562 s/iter 0.600606 +gpu 0 iter : 27 Arret : 0.000948084 s/iter 0.600496 +gpu 0 iter : 28 Arret : 0.000688755 s/iter 0.602971 +gpu 0 iter : 29 Arret : 0.000708471 s/iter 0.600812 +gpu 0 iter : 30 Arret : 0.000130964 s/iter 0.602700 +gpu 0 iter : 31 Arret : 5.64767E-05 s/iter 0.600363 +gpu 0 iter : 32 Arret : 2.43897E-05 s/iter 0.600069 +gpu 0 iter : 33 Arret : 3.99072E-06 s/iter 0.602441 +gpu 0 iter : 34 Arret : 8.82092E-09 s/iter 0.599942 +gpu 0 iter : 35 Arret : 1.30953E-13 s/iter 0.602836 +temps : 43.054 seconde(s) +Nb iterations : 35 +Nb de depassements de capacite exponentielle : 0 +Precision : 8.34887E-10 +Stabilite : 1.30953E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540601 +i* 0.841279| 1| -4.3885E-14 +i*-7.30839E-15| +| 2| -0.281748 +i* -0.959489| 1|-5.73395E-14 +i*-4.24574E-14| +| 3|-4.71234E-05 +i* 1| 1| 8.60423E-16 +i* 1.94116E-15| +| 4| 0.281778 +i* -0.95948| 1|-1.23963E-14 +i* 1.02314E-14| +| 5| -0.54068 +i* 0.841228| 1| 5.53932E-14 +i*-7.48533E-15| +| 6| 0.75578 +i* -0.654825| 1|-1.78253E-13 +i* 5.35631E-14| +| 7| -0.909652 +i* 0.415372| 1|-2.24577E-14 +i*-2.99309E-14| +| 8| 0.989828 +i* -0.142268| 1|-4.88647E-13 +i* 2.69096E-13| +| 9| -0.989815 +i* -0.142361| 1| 4.10505E-14 +i* 1.22957E-14| +| 10| 0.909612 +i* 0.415458| 1|-9.85774E-14 +i* 2.25852E-13| +| 11| -0.755719 +i* -0.654896| 1|-4.50195E-14 +i* 3.70867E-14| +| 12| 0.540548 +i* 0.841313| 1| 1.15279E-13 +i*-6.26114E-14| +| 13| -0.281687 +i* -0.959506| 1| 6.72067E-14 +i*-1.86153E-14| +| 14|-0.000109955 +i* 1| 1| 1.77636E-14 +i* 5.47062E-14| +| 15| 0.281838 +i* -0.959462| 1|-5.44356E-14 +i* 4.87822E-14| +| 16| -0.540733 +i* 0.841194| 1| 1.93526E-14 +i* 3.41446E-14| +| 17| 0.755822 +i* -0.654778| 1| 1.41439E-13 +i* 1.77344E-13| +| 18| -0.909678 +i* 0.415315| 1| 3.90799E-14 +i* 2.50217E-14| +| 19| 0.989837 +i* -0.142206| 1| 1.87558E-13 +i*-4.17969E-13| +| 20| -0.989806 +i* -0.142424| 1|-4.45512E-14 +i*-1.49828E-14| ++---+----------------------------+------------+----------------------------+ +100000 racines de module = 1 +zone limite de 'log-exp' 1.00178 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 2 (of 3) uses CUDA device 2 +gpu 0 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 0 dimgrid2 261 start 0 size 66730 +gpu 1 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 1 dimgrid2 261 start 66730 size 66730 +gpu 2 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 2 dimgrid2 261 start 133460 size 66730 +gpu 0 iter : 1 Arret : 1.42239E-05 s/iter 3.058157 +gpu 0 iter : 2 Arret : 1.33237E-05 s/iter 3.057661 +gpu 0 iter : 3 Arret : 1.45399E-05 s/iter 3.057902 +gpu 0 iter : 4 Arret : 1.44001E-05 s/iter 3.060916 +gpu 0 iter : 5 Arret : 1.21495E-05 s/iter 3.057114 +gpu 0 iter : 6 Arret : 1.24537E-05 s/iter 3.056895 +gpu 0 iter : 7 Arret : 1.29621E-05 s/iter 3.056594 +gpu 0 iter : 8 Arret : 1.56185E-05 s/iter 3.058429 +gpu 0 iter : 9 Arret : 2.80434E-05 s/iter 3.058080 +gpu 0 iter : 10 Arret : 0.000611146 s/iter 3.056594 +gpu 0 iter : 11 Arret : 0.00182901 s/iter 3.057135 +gpu 0 iter : 12 Arret : 1.45413 s/iter 3.056957 +gpu 0 iter : 13 Arret : 0.244871 s/iter 5.891327 +gpu 0 iter : 14 Arret : 0.0953068 s/iter 5.886920 +gpu 0 iter : 15 Arret : 0.0440287 s/iter 5.925775 +gpu 0 iter : 16 Arret : 0.00186276 s/iter 3.043476 +gpu 0 iter : 17 Arret : 0.000441252 s/iter 3.055191 +gpu 0 iter : 18 Arret : 0.00274545 s/iter 3.055363 +gpu 0 iter : 19 Arret : 0.00243858 s/iter 3.054491 +gpu 0 iter : 20 Arret : 0.000179277 s/iter 3.050175 +gpu 0 iter : 21 Arret : 0.000300628 s/iter 3.025675 +gpu 0 iter : 22 Arret : 0.000469664 s/iter 3.023116 +gpu 0 iter : 23 Arret : 9.34152E-05 s/iter 3.022761 +gpu 0 iter : 24 Arret : 3.32355E-05 s/iter 3.017888 +gpu 0 iter : 25 Arret : 7.24854E-05 s/iter 3.021478 +gpu 0 iter : 26 Arret : 0.000569912 s/iter 3.021195 +gpu 0 iter : 27 Arret : 0.000198032 s/iter 3.022745 +gpu 0 iter : 28 Arret : 6.05783E-09 s/iter 3.015186 +gpu 0 iter : 29 Arret : 5.32141E-14 s/iter 3.018484 +temps : 97.9976 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.64385E-09 +Stabilite : 1.11076E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540465 +i* 0.841367| 1| 1.87479E-13 +i*-5.02237E-14| +| 2| 0.176081 +i* -0.984376| 1|-5.37799E-14 +i* 6.92554E-14| +| 3| -0.852009 +i* -0.523527| 1| 3.18461E-14 +i* 4.03913E-14| +| 4| -0.79862 +i* 0.601836| 1| 5.14346E-14 +i* 3.91354E-14| +| 5| 0.980657 +i* -0.195736| 1| 6.46188E-13 +i*-7.37166E-13| +| 6| 0.268452 +i* 0.963293| 1|-8.54421E-14 +i* 3.23248E-14| +| 7| 0.458412 +i* -0.88874| 1| 2.7818E-14 +i* 6.11247E-14| +| 8| -0.659841 +i* -0.751405| 1|-6.41605E-14 +i*-6.23928E-14| +| 9| 0.994783 +i* 0.102018| 1| 6.80962E-13 +i*-1.84925E-12| +| 10| -0.940535 +i* 0.339697| 1| 2.92266E-14 +i* 1.23877E-14| +| 11| -0.0274147 +i* 0.999624| 1|-2.15418E-14 +i* -6.3281E-14| +| 12| 0.70001 +i* -0.714133| 1| 5.4335E-14 +i* -1.5535E-13| +| 13| 0.920515 +i* 0.390707| 1|-2.49037E-13 +i*-1.72111E-13| +| 14| -0.409041 +i* -0.912516| 1|-2.16806E-14 +i*-1.57877E-14| +| 15| -0.998877 +i* 0.047373| 1|-3.52392E-14 +i*-1.99354E-14| +| 16| -0.320845 +i* 0.947132| 1| 1.35437E-13 +i* 4.41019E-14| +| 17| 0.764454 +i* 0.644679| 1|-2.19425E-13 +i* -1.9223E-13| +| 18| 0.879407 +i* -0.47607| 1| 3.13968E-13 +i*-3.31275E-13| +| 19| -0.121864 +i* -0.992547| 1| 1.45647E-13 +i* 1.68268E-16| +| 20| -0.968462 +i* -0.24916| 1| 5.32629E-14 +i* 1.07952E-14| ++---+----------------------------+------------+----------------------------+ +200000 racines de module = 1 +zone limite de 'log-exp' 1.00089 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 0 (of 3) uses CUDA device 0 +gpu 1 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 1 dimgrid2 521 start 133376 size 133376 +gpu 0 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 0 dimgrid2 521 start 0 size 133376 +gpu 2 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 2 dimgrid2 521 start 266752 size 133376 +gpu 0 iter : 1 Arret : 6.13232E-06 s/iter 11.259812 +gpu 0 iter : 2 Arret : 5.92558E-06 s/iter 11.177361 +gpu 0 iter : 3 Arret : 5.74898E-06 s/iter 11.169113 +gpu 0 iter : 4 Arret : 5.74683E-06 s/iter 11.167439 +gpu 0 iter : 5 Arret : 5.9256E-06 s/iter 11.172006 +gpu 0 iter : 6 Arret : 5.84193E-06 s/iter 11.165888 +gpu 0 iter : 7 Arret : 5.94654E-06 s/iter 11.166336 +gpu 0 iter : 8 Arret : 6.18739E-06 s/iter 11.163405 +gpu 0 iter : 9 Arret : 6.32181E-06 s/iter 11.165346 +gpu 0 iter : 10 Arret : 1.41892E-05 s/iter 11.167820 +gpu 0 iter : 11 Arret : 0.00173091 s/iter 11.170827 +gpu 0 iter : 12 Arret : 0.00554495 s/iter 13.459397 +gpu 0 iter : 13 Arret : 0.0044383 s/iter 11.169515 +gpu 0 iter : 14 Arret : 0.031501 s/iter 11.165297 +gpu 0 iter : 15 Arret : 1.16288 s/iter 11.985429 +gpu 0 iter : 16 Arret : 6.27627 s/iter 12.095485 +gpu 0 iter : 17 Arret : 0.0403092 s/iter 11.172693 +gpu 0 iter : 18 Arret : 0.055556 s/iter 11.161876 +gpu 0 iter : 19 Arret : 0.0302831 s/iter 16.167669 +gpu 0 iter : 20 Arret : 0.0369686 s/iter 15.569488 +gpu 0 iter : 21 Arret : 0.0194517 s/iter 11.110141 +gpu 0 iter : 22 Arret : 0.0118511 s/iter 12.759873 +gpu 0 iter : 23 Arret : 0.0345743 s/iter 13.506285 +gpu 0 iter : 24 Arret : 0.0304606 s/iter 13.923765 +gpu 0 iter : 25 Arret : 0.0950833 s/iter 15.324505 +gpu 0 iter : 26 Arret : 0.201849 s/iter 13.760715 +gpu 0 iter : 27 Arret : 0.31272 s/iter 13.783168 +gpu 0 iter : 28 Arret : 0.0668102 s/iter 13.817758 +gpu 0 iter : 29 Arret : 0.069483 s/iter 15.595241 +gpu 0 iter : 30 Arret : 0.0481386 s/iter 14.677669 +gpu 0 iter : 31 Arret : 0.0342776 s/iter 16.431418 +gpu 0 iter : 32 Arret : 0.0203788 s/iter 14.590231 +gpu 0 iter : 33 Arret : 0.0236131 s/iter 13.744418 +gpu 0 iter : 34 Arret : 0.0103173 s/iter 13.780697 +gpu 0 iter : 35 Arret : 0.00216207 s/iter 12.470543 +gpu 0 iter : 36 Arret : 0.000283986 s/iter 11.120697 +gpu 0 iter : 37 Arret : 7.56411E-05 s/iter 11.129267 +gpu 0 iter : 38 Arret : 5.05174E-05 s/iter 11.119664 +gpu 0 iter : 39 Arret : 4.00197E-05 s/iter 11.136501 +gpu 0 iter : 40 Arret : 2.85744E-05 s/iter 11.060818 +gpu 0 iter : 41 Arret : 1.87363E-05 s/iter 11.175765 +gpu 0 iter : 42 Arret : 3.67393E-06 s/iter 11.101930 +gpu 0 iter : 43 Arret : 1.49816E-08 s/iter 11.105783 +gpu 0 iter : 44 Arret : 3.15022E-14 s/iter 11.164847 +temps : 547.721 seconde(s) +Nb iterations : 44 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.12974E-08 +Stabilite : 3.15022E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540383 +i* 0.841419| 1| 1.25143E-14 +i* 6.97793E-14| +| 2| -0.98885 +i* 0.148913| 1|-1.87034E-13 +i*-1.52024E-13| +| 3| 0.412505 +i* -0.910956| 1|-2.05679E-13 +i* 8.74266E-14| +| 4| 0.268615 +i* -0.963248| 1| 1.23929E-14 +i* 2.02841E-14| +| 5| -0.954531 +i* 0.298113| 1| 6.68562E-14 +i* 8.87016E-14| +| 6| 0.769071 +i* 0.639164| 1|-1.31544E-13 +i* 4.65595E-13| +| 7| 0.11843 +i* -0.992962| 1| -1.5522E-13 +i* 8.29944E-14| +| 8| -0.897838 +i* 0.440326| 1|-2.57121E-14 +i* 6.84192E-14| +| 9| 0.857616 +i* 0.51429| 1|-4.74988E-13 +i*-1.42508E-14| +| 10| -0.0345309 +i* -0.999404| 1| 3.31561E-13 +i*-9.06705E-14| +| 11| 0.662491 +i* 0.74907| 1| 5.75581E-15 +i*-3.34004E-14| +| 12| -0.820101 +i* 0.572218| 1|-4.91863E-14 +i*-2.00555E-13| +| 13| -0.186683 +i* -0.98242| 1| -1.8106E-13 +i* 3.61083E-14| +| 14| 0.9261 +i* 0.377277| 1|-4.84647E-14 +i*-1.93776E-13| +| 15| -0.723143 +i* 0.690699| 1|-1.75058E-13 +i* 1.33799E-14| +| 16| -0.334459 +i* -0.94241| 1| 2.20716E-13 +i*-8.68958E-14| +| 17| 0.972834 +i* 0.231505| 1| 3.9433E-13 +i*-1.27901E-14| +| 18| -0.609235 +i* 0.79299| 1|-8.90538E-14 +i* 1.42372E-13| +| 19| -0.474396 +i* -0.880312| 1| 2.76109E-13 +i* 7.19095E-14| +| 20| 0.996768 +i* 0.0803379| 1| 1.8463E-13 +i* 1.59803E-12| ++---+----------------------------+------------+----------------------------+ +400000 racines de module = 1 +zone limite de 'log-exp' 1.00059 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 2 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 782 start 0 size 200021 +gpu 2 dimgrid2 782 start 400042 size 200021 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 782 start 200021 size 200021 +gpu 0 iter : 1 Arret : 4.42115E-06 s/iter 25.532168 +gpu 0 iter : 2 Arret : 4.01411E-06 s/iter 25.511018 +gpu 0 iter : 3 Arret : 3.79048E-06 s/iter 25.523219 +gpu 0 iter : 4 Arret : 3.87826E-06 s/iter 25.501777 +gpu 0 iter : 5 Arret : 3.77658E-06 s/iter 25.513780 +gpu 0 iter : 6 Arret : 3.85622E-06 s/iter 25.528563 +gpu 0 iter : 7 Arret : 4.00228E-06 s/iter 25.502697 +gpu 0 iter : 8 Arret : 4.31857E-06 s/iter 25.528176 +gpu 0 iter : 9 Arret : 5.22735E-06 s/iter 25.511069 +gpu 0 iter : 10 Arret : 9.5524E-06 s/iter 25.503897 +gpu 0 iter : 11 Arret : 0.000408501 s/iter 25.504020 +gpu 0 iter : 12 Arret : 0.000623968 s/iter 25.494891 +gpu 0 iter : 13 Arret : 2.07482 s/iter 30.574894 +gpu 0 iter : 14 Arret : 0.370284 s/iter 25.683751 +gpu 0 iter : 15 Arret : 0.0936332 s/iter 30.867923 +gpu 0 iter : 16 Arret : 0.0158122 s/iter 30.826508 +gpu 0 iter : 17 Arret : 0.0848863 s/iter 30.624568 +gpu 0 iter : 18 Arret : 0.0984771 s/iter 30.770613 +gpu 0 iter : 19 Arret : 0.0293052 s/iter 30.707411 +gpu 0 iter : 20 Arret : 0.015694 s/iter 30.625140 +gpu 0 iter : 21 Arret : 0.00993732 s/iter 30.738745 +gpu 0 iter : 22 Arret : 0.00974188 s/iter 30.679134 +gpu 0 iter : 23 Arret : 0.0156848 s/iter 33.722340 +gpu 0 iter : 24 Arret : 0.0118472 s/iter 34.000126 +gpu 0 iter : 25 Arret : 0.0180113 s/iter 34.012466 +gpu 0 iter : 26 Arret : 0.18738 s/iter 34.043297 +gpu 0 iter : 27 Arret : 0.107568 s/iter 34.157580 +gpu 0 iter : 28 Arret : 0.137713 s/iter 33.201182 +gpu 0 iter : 29 Arret : 0.0137755 s/iter 33.285894 +gpu 0 iter : 30 Arret : 0.00474748 s/iter 33.212318 +gpu 0 iter : 31 Arret : 0.00489404 s/iter 33.244301 +gpu 0 iter : 32 Arret : 0.00381072 s/iter 33.261318 +gpu 0 iter : 33 Arret : 0.00498548 s/iter 33.243623 +gpu 0 iter : 34 Arret : 0.00531641 s/iter 33.338206 +gpu 0 iter : 35 Arret : 0.00515556 s/iter 33.400232 +gpu 0 iter : 36 Arret : 0.00408584 s/iter 33.287904 +gpu 0 iter : 37 Arret : 0.00348274 s/iter 33.304307 +gpu 0 iter : 38 Arret : 0.00365564 s/iter 33.256264 +gpu 0 iter : 39 Arret : 0.00921371 s/iter 33.343042 +gpu 0 iter : 40 Arret : 0.0176099 s/iter 33.282810 +gpu 0 iter : 41 Arret : 0.0239859 s/iter 33.342108 +gpu 0 iter : 42 Arret : 0.0149358 s/iter 33.431581 +gpu 0 iter : 43 Arret : 0.00682354 s/iter 33.323957 +gpu 0 iter : 44 Arret : 0.00375261 s/iter 33.436075 +gpu 0 iter : 45 Arret : 0.00230738 s/iter 33.440640 +gpu 0 iter : 46 Arret : 0.00130962 s/iter 33.450702 +gpu 0 iter : 47 Arret : 0.00089917 s/iter 33.300875 +gpu 0 iter : 48 Arret : 0.000635547 s/iter 33.309161 +gpu 0 iter : 49 Arret : 0.000508468 s/iter 33.277050 +gpu 0 iter : 50 Arret : 0.000827291 s/iter 33.274590 +gpu 0 iter : 51 Arret : 0.000650233 s/iter 33.240408 +gpu 0 iter : 52 Arret : 0.000700256 s/iter 33.278291 +gpu 0 iter : 53 Arret : 0.000412659 s/iter 33.124736 +gpu 0 iter : 54 Arret : 0.000586589 s/iter 32.422683 +gpu 0 iter : 55 Arret : 0.0012868 s/iter 32.436270 +gpu 0 iter : 56 Arret : 0.00106518 s/iter 32.806249 +gpu 0 iter : 57 Arret : 0.000445726 s/iter 32.814593 +gpu 0 iter : 58 Arret : 0.000485601 s/iter 32.710351 +gpu 0 iter : 59 Arret : 0.000213682 s/iter 32.374542 +gpu 0 iter : 60 Arret : 0.000208775 s/iter 32.778982 +gpu 0 iter : 61 Arret : 0.000203004 s/iter 32.334758 +gpu 0 iter : 62 Arret : 0.000196855 s/iter 32.292382 +gpu 0 iter : 63 Arret : 0.000190277 s/iter 32.733295 +gpu 0 iter : 64 Arret : 0.000183901 s/iter 32.300771 +gpu 0 iter : 65 Arret : 0.000176756 s/iter 32.415378 +gpu 0 iter : 66 Arret : 0.000167493 s/iter 32.589207 +gpu 0 iter : 67 Arret : 0.00018076 s/iter 32.873886 +gpu 0 iter : 68 Arret : 0.000619032 s/iter 32.346507 +gpu 0 iter : 69 Arret : 0.000188413 s/iter 32.273915 +gpu 0 iter : 70 Arret : 0.000324167 s/iter 32.260261 +gpu 0 iter : 71 Arret : 0.000790055 s/iter 32.250504 +gpu 0 iter : 72 Arret : 0.0020091 s/iter 32.306464 +gpu 0 iter : 73 Arret : 0.00145307 s/iter 32.266935 +gpu 0 iter : 74 Arret : 0.000909746 s/iter 32.669586 +gpu 0 iter : 75 Arret : 0.00121515 s/iter 32.619090 +gpu 0 iter : 76 Arret : 0.00228086 s/iter 32.561584 +gpu 0 iter : 77 Arret : 0.00495307 s/iter 26.104182 +gpu 0 iter : 78 Arret : 0.0192162 s/iter 26.100281 +gpu 0 iter : 79 Arret : 0.0837333 s/iter 26.128891 +gpu 0 iter : 80 Arret : 0.0431442 s/iter 26.129669 +gpu 0 iter : 81 Arret : 0.00677511 s/iter 26.019917 +gpu 0 iter : 82 Arret : 0.00212692 s/iter 26.064682 +gpu 0 iter : 83 Arret : 0.00135281 s/iter 26.064123 +gpu 0 iter : 84 Arret : 0.000914556 s/iter 26.035560 +gpu 0 iter : 85 Arret : 0.000781515 s/iter 26.017245 +gpu 0 iter : 86 Arret : 0.000747597 s/iter 25.929151 +gpu 0 iter : 87 Arret : 0.000367635 s/iter 25.546043 +gpu 0 iter : 88 Arret : 0.000164338 s/iter 25.481507 +gpu 0 iter : 89 Arret : 0.000107136 s/iter 25.564070 +gpu 0 iter : 90 Arret : 9.91585E-05 s/iter 25.537950 +gpu 0 iter : 91 Arret : 7.76196E-05 s/iter 25.546276 +gpu 0 iter : 92 Arret : 5.97554E-05 s/iter 25.578209 +gpu 0 iter : 93 Arret : 5.73454E-05 s/iter 25.601675 +gpu 0 iter : 94 Arret : 0.000614403 s/iter 25.598729 +gpu 0 iter : 95 Arret : 0.000605289 s/iter 25.573868 +gpu 0 iter : 96 Arret : 5.81091E-05 s/iter 25.569256 +gpu 0 iter : 97 Arret : 3.26024E-05 s/iter 25.593508 +gpu 0 iter : 98 Arret : 6.21714E-07 s/iter 25.536712 +gpu 0 iter : 99 Arret : 1.32706E-11 s/iter 25.560915 +gpu 0 iter : 100 Arret : 1.11022E-16 s/iter 25.566948 +temps : 3012.17 seconde(s) +Nb iterations : 100 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.996672 +i* 0.0815122| 1|-4.60361E-14 +i*-1.54911E-15| +| 3| 0.396458 +i* -0.918053| 1|-3.61742E-13 +i* 4.28426E-13| +| 4| -0.983009 +i* 0.183558| 1| 2.27839E-14 +i* 1.21547E-13| +| 5| 0.299962 +i* -0.953951| 1| 3.10155E-13 +i*-4.52272E-13| +| 6| 0.701062 +i* 0.7131| 1| 6.08482E-13 +i* 3.68603E-13| +| 7| -0.958925 +i* 0.283658| 1|-3.43857E-14 +i*-4.33108E-14| +| 8| 0.200287 +i* -0.979737| 1| 4.39829E-13 +i*-3.61119E-13| +| 9| 0.770667 +i* 0.637238| 1| -2.7036E-13 +i*-8.38747E-13| +| 10| -0.924677 +i* 0.380752| 1| 1.44957E-13 +i* 1.13251E-13| +| 11| 0.0984885 +i* -0.995138| 1| 3.5235E-13 +i*-2.31698E-13| +| 12| 0.832104 +i* 0.55462| 1| 8.49546E-13 +i* -8.3842E-13| +| 13| -0.880627 +i* 0.473809| 1|-9.58227E-14 +i* -1.6529E-13| +| 14| -0.0043537 +i* -0.999991| 1| 1.63446E-13 +i*-5.45449E-14| +| 15| 0.88472 +i* 0.466123| 1| -6.8268E-13 +i* -3.8889E-13| +| 16| 0.624025 +i* 0.781404| 1| 9.47506E-15 +i*-6.78554E-13| +| 17| -0.827243 +i* 0.561844| 1|-1.79082E-13 +i*-3.05719E-13| +| 18| -0.10715 +i* -0.994243| 1| 3.32474E-13 +i*-4.57395E-14| +| 19| 0.927958 +i* 0.372686| 1| 1.0255E-13 +i* 1.0692E-13| +| 20| -0.76509 +i* 0.643924| 1| 2.51882E-15 +i*-2.49661E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +zone limite de 'log-exp' 1.00044 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 2 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 1042 start 0 size 266666 +gpu 2 dimgrid2 1042 start 533332 size 266666 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 1042 start 266666 size 266666 +gpu 0 iter : 1 Arret : 3.39518E-06 s/iter 44.286440 +gpu 0 iter : 2 Arret : 3.55621E-06 s/iter 44.282503 +gpu 0 iter : 3 Arret : 3.81988E-06 s/iter 44.283858 +gpu 0 iter : 4 Arret : 3.20229E-06 s/iter 44.283196 +gpu 0 iter : 5 Arret : 3.61794E-06 s/iter 44.245554 +gpu 0 iter : 6 Arret : 3.25514E-06 s/iter 44.291484 +gpu 0 iter : 7 Arret : 3.5522E-06 s/iter 44.280702 +gpu 0 iter : 8 Arret : 3.69717E-06 s/iter 44.319658 +gpu 0 iter : 9 Arret : 3.76915E-06 s/iter 44.307083 +gpu 0 iter : 10 Arret : 6.95138E-06 s/iter 44.280166 +gpu 0 iter : 11 Arret : 0.000806968 s/iter 44.267355 +gpu 0 iter : 12 Arret : 0.00113229 s/iter 44.272240 +gpu 0 iter : 13 Arret : 0.75505 s/iter 44.163437 +gpu 0 iter : 14 Arret : 0.946508 s/iter 44.259421 +gpu 0 iter : 15 Arret : 2.43927 s/iter 44.329431 +gpu 0 iter : 16 Arret : 0.043497 s/iter 52.961254 +gpu 0 iter : 17 Arret : 0.0102184 s/iter 44.527790 +gpu 0 iter : 18 Arret : 0.00204126 s/iter 52.269867 +gpu 0 iter : 19 Arret : 0.00161291 s/iter 44.780673 +gpu 0 iter : 20 Arret : 0.00175389 s/iter 44.816386 +gpu 0 iter : 21 Arret : 0.000461718 s/iter 44.686271 +gpu 0 iter : 22 Arret : 0.000951687 s/iter 44.701369 +gpu 0 iter : 23 Arret : 0.000476023 s/iter 44.907447 +gpu 0 iter : 24 Arret : 0.000353722 s/iter 44.773719 +gpu 0 iter : 25 Arret : 5.60121E-05 s/iter 44.795957 +gpu 0 iter : 26 Arret : 0.000108991 s/iter 44.803320 +gpu 0 iter : 27 Arret : 0.000112326 s/iter 44.808614 +gpu 0 iter : 28 Arret : 2.88849E-05 s/iter 44.668869 +gpu 0 iter : 29 Arret : 7.56739E-07 s/iter 44.826463 +gpu 0 iter : 30 Arret : 1.3212E-11 s/iter 44.848912 +gpu 0 iter : 31 Arret : 1.57009E-16 s/iter 44.944694 +temps : 1397.8 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 0.0233219 +Stabilite : 1.11886E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| -0.942555 +i* -0.334052| 1| 2.1929E-13 +i*-2.49686E-13| +| 3| -0.558601 +i* 0.829437| 1|-3.51628E-14 +i*-4.09232E-13| +| 4| -0.0665975 +i* -0.99778| 1|-3.91888E-13 +i* 9.06636E-14| +| 5| 0.949627 +i* -0.313383| 1|-1.12544E-12 +i* 2.13597E-12| +| 6| -0.98285 +i* -0.184406| 1|-3.98841E-13 +i*-7.47926E-14| +| 7| 0.889798 +i* -0.456354| 1| 1.27488E-12 +i* 5.17779E-13| +| 8| -0.423729 +i* 0.905789| 1|-7.25461E-15 +i*-1.33088E-14| +| 9| -0.219973 +i* -0.975506| 1| 4.34097E-13 +i*-4.24712E-14| +| 10| 0.771464 +i* 0.636273| 1| -4.4266E-13 +i*-2.07773E-13| +| 11| -0.999541 +i* -0.0303078| 1| 3.54265E-14 +i* 1.32862E-14| +| 12| 0.808597 +i* -0.588363| 1|-5.90212E-13 +i*-1.43182E-12| +| 13| 0.663883 +i* 0.747836| 1| 4.13159E-13 +i* 1.10149E-12| +| 14| -0.27868 +i* 0.960384| 1|-1.03539E-13 +i*-1.45998E-13| +| 15| -0.368064 +i* -0.929801| 1| 4.60916E-14 +i*-1.09841E-13| +| 16| -0.992219 +i* 0.124503| 1| 2.74294E-13 +i* 2.11383E-13| +| 17| 0.707973 +i* -0.706239| 1|-1.10575E-12 +i*-7.41631E-13| +| 18| 0.860514 +i* 0.509426| 1| 9.86579E-13 +i* 1.10532E-12| +| 19| -0.126936 +i* 0.991911| 1| 1.67744E-13 +i* 5.51772E-13| +| 20| -0.507314 +i* -0.861761| 1| 5.50185E-14 +i* 3.42273E-13| ++---+----------------------------+------------+----------------------------+ +799998 racines de module = 1 + 2 racines de module = 0.999973 +zone limite de 'log-exp' 1.00035 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 1 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 1 dimgrid2 1303 start 333397 size 333397 +gpu 0 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 0 dimgrid2 1303 start 0 size 333397 +gpu 2 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 2 dimgrid2 1303 start 666794 size 333397 +gpu 0 iter : 1 Arret : 2.59037E-06 s/iter 68.488379 +gpu 0 iter : 2 Arret : 2.69491E-06 s/iter 68.553223 +gpu 0 iter : 3 Arret : 2.97632E-06 s/iter 68.432077 +gpu 0 iter : 4 Arret : 3.11124E-06 s/iter 68.493633 +gpu 0 iter : 5 Arret : 3.04203E-06 s/iter 68.560718 +gpu 0 iter : 6 Arret : 3.05018E-06 s/iter 68.496612 +gpu 0 iter : 7 Arret : 2.74538E-06 s/iter 68.552569 +gpu 0 iter : 8 Arret : 3.10002E-06 s/iter 68.510878 +gpu 0 iter : 9 Arret : 2.82417E-06 s/iter 68.498986 +gpu 0 iter : 10 Arret : 4.54309E-06 s/iter 68.425008 +gpu 0 iter : 11 Arret : 4.79488E-05 s/iter 68.552577 +gpu 0 iter : 12 Arret : 0.000125717 s/iter 68.569825 +gpu 0 iter : 13 Arret : 0.000326339 s/iter 68.464165 +gpu 0 iter : 14 Arret : 0.000519728 s/iter 68.498582 +gpu 0 iter : 15 Arret : 1.47955 s/iter 68.521357 +gpu 0 iter : 16 Arret : 0.134232 s/iter 70.315716 +gpu 0 iter : 17 Arret : 0.0690512 s/iter 82.408199 +gpu 0 iter : 18 Arret : 0.0429404 s/iter 83.567721 +gpu 0 iter : 19 Arret : 0.0388433 s/iter 83.433066 +gpu 0 iter : 20 Arret : 0.0306758 s/iter 83.859032 +gpu 0 iter : 21 Arret : 0.0262957 s/iter 71.910490 +gpu 0 iter : 22 Arret : 0.0834022 s/iter 75.058900 +gpu 0 iter : 23 Arret : 0.581045 s/iter 83.985067 +gpu 0 iter : 24 Arret : 0.0651466 s/iter 84.660088 +gpu 0 iter : 25 Arret : 0.0409901 s/iter 84.216377 +gpu 0 iter : 26 Arret : 0.133715 s/iter 83.240685 +gpu 0 iter : 27 Arret : 0.562724 s/iter 71.666377 +gpu 0 iter : 28 Arret : 0.117979 s/iter 69.556080 +gpu 0 iter : 29 Arret : 0.00855429 s/iter 69.607828 +gpu 0 iter : 30 Arret : 0.00577175 s/iter 69.441755 +gpu 0 iter : 31 Arret : 0.00265769 s/iter 69.350066 +gpu 0 iter : 32 Arret : 0.00168914 s/iter 69.363060 +gpu 0 iter : 33 Arret : 0.00284192 s/iter 69.402571 +gpu 0 iter : 34 Arret : 0.000175291 s/iter 69.288887 +gpu 0 iter : 35 Arret : 4.78997E-05 s/iter 69.215592 +gpu 0 iter : 36 Arret : 0.000129689 s/iter 69.157034 +gpu 0 iter : 37 Arret : 2.9427E-05 s/iter 69.183780 +gpu 0 iter : 38 Arret : 5.5704E-06 s/iter 69.215726 +gpu 0 iter : 39 Arret : 3.28608E-06 s/iter 69.302036 +gpu 0 iter : 40 Arret : 1.2153E-06 s/iter 69.342960 +gpu 0 iter : 41 Arret : 2.69925E-08 s/iter 69.288879 +gpu 0 iter : 42 Arret : 5.24082E-13 s/iter 69.195992 +temps : 3027.59 seconde(s) +Nb iterations : 42 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.80137E-07 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54034 +i* 0.841447| 1| 4.08253E-13 +i*-6.65317E-13| +| 2| -0.513915 +i* -0.857841| 1|-9.07486E-13 +i* 1.86417E-13| +| 3| 0.486982 +i* 0.873412| 1|-6.63601E-14 +i*-1.18344E-12| +| 4| -0.459589 +i* -0.888132| 1|-5.16153E-13 +i*-2.68006E-13| +| 5| 0.43174 +i* 0.901998| 1|-6.77361E-13 +i* 7.93272E-13| +| 6| -0.40348 +i* -0.914989| 1|-3.45956E-13 +i*-2.59726E-13| +| 7| 0.374828 +i* 0.927094| 1| 3.65041E-13 +i* 3.54812E-13| +| 8| -0.345815 +i* -0.938303| 1| 5.50778E-13 +i* 8.9059E-14| +| 9| 0.316466 +i* 0.948604| 1|-2.87419E-13 +i* 5.21678E-13| +| 10| -0.286812 +i* -0.957987| 1| 6.43516E-13 +i* 2.73696E-13| +| 11| 0.25688 +i* 0.966443| 1|-4.31814E-13 +i* 5.6624E-13| +| 12| -0.226699 +i* -0.973965| 1| 4.35089E-13 +i* -6.6197E-14| +| 13| 0.196299 +i* 0.980544| 1| 3.90278E-14 +i*-7.14062E-13| +| 14| -0.16571 +i* -0.986175| 1| 2.49276E-13 +i*-1.75918E-13| +| 15| 0.13496 +i* 0.990851| 1| 1.03566E-13 +i*-6.61428E-13| +| 16| -0.104079 +i* -0.994569| 1| 7.90108E-13 +i*-1.74942E-13| +| 17| 0.0730977 +i* 0.997325| 1| 1.11931E-13 +i* 4.68587E-13| +| 18| -0.0420456 +i* -0.999116| 1| 2.29268E-13 +i*-1.21795E-14| +| 19| 0.0109529 +i* 0.99994| 1|-2.47309E-13 +i*-7.90307E-13| +| 20| 0.0201504 +i* -0.999797| 1| 6.69503E-13 +i*-2.16847E-13| ++---+----------------------------+------------+----------------------------+ +1000000 racines de module = 1 +zone limite de 'log-exp' 1.0003 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 2 (of 3) uses CUDA device 2 +gpu 0 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 0 dimgrid2 1563 start 0 size 400042 +gpu 1 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 1 dimgrid2 1563 start 400042 size 400042 +gpu 2 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 2 dimgrid2 1563 start 800084 size 400042 +gpu 0 iter : 1 Arret : 2.25216E-06 s/iter 98.802488 +gpu 0 iter : 2 Arret : 2.28156E-06 s/iter 98.869005 +gpu 0 iter : 3 Arret : 2.42149E-06 s/iter 98.869812 +gpu 0 iter : 4 Arret : 2.32642E-06 s/iter 98.888019 +gpu 0 iter : 5 Arret : 2.24106E-06 s/iter 98.881288 +gpu 0 iter : 6 Arret : 2.14078E-06 s/iter 98.768679 +gpu 0 iter : 7 Arret : 2.01977E-06 s/iter 98.829212 +gpu 0 iter : 8 Arret : 2.35568E-06 s/iter 98.865141 +gpu 0 iter : 9 Arret : 2.60008E-06 s/iter 98.812073 +gpu 0 iter : 10 Arret : 3.66078E-06 s/iter 98.815473 +gpu 0 iter : 11 Arret : 4.12489E-05 s/iter 98.871039 +gpu 0 iter : 12 Arret : 0.000570792 s/iter 98.872405 +gpu 0 iter : 13 Arret : 0.0011127 s/iter 98.856310 +gpu 0 iter : 14 Arret : 0.000811219 s/iter 98.938678 +gpu 0 iter : 15 Arret : 0.0035539 s/iter 99.304829 +gpu 0 iter : 16 Arret : 0.00751945 s/iter 99.166318 +gpu 0 iter : 17 Arret : 0.00281235 s/iter 112.579500 +gpu 0 iter : 18 Arret : 0.0119292 s/iter 115.248029 +gpu 0 iter : 19 Arret : 0.143732 s/iter 115.377954 +gpu 0 iter : 20 Arret : 0.154299 s/iter 117.172520 +gpu 0 iter : 21 Arret : 0.60856 s/iter 117.625351 +gpu 0 iter : 22 Arret : 0.435799 s/iter 118.396988 +gpu 0 iter : 23 Arret : 0.0170261 s/iter 119.934649 +gpu 0 iter : 24 Arret : 0.0538555 s/iter 116.719157 +gpu 0 iter : 25 Arret : 0.0861365 s/iter 117.930533 +gpu 0 iter : 26 Arret : 0.196912 s/iter 115.048511 +gpu 0 iter : 27 Arret : 0.296216 s/iter 117.136696 +gpu 0 iter : 28 Arret : 0.0248666 s/iter 100.414803 +gpu 0 iter : 29 Arret : 0.0108495 s/iter 100.959491 +gpu 0 iter : 30 Arret : 0.00622199 s/iter 100.460369 +gpu 0 iter : 31 Arret : 0.000227881 s/iter 100.164439 +gpu 0 iter : 32 Arret : 2.13476E-05 s/iter 100.505370 +gpu 0 iter : 33 Arret : 3.38983E-05 s/iter 100.295807 +gpu 0 iter : 34 Arret : 2.03881E-05 s/iter 100.206498 +gpu 0 iter : 35 Arret : 9.58301E-06 s/iter 100.337401 +gpu 0 iter : 36 Arret : 1.08404E-06 s/iter 100.087649 +gpu 0 iter : 37 Arret : 2.10757E-09 s/iter 100.316101 +gpu 0 iter : 38 Arret : 2.45077E-15 s/iter 100.255925 +temps : 3971.4 seconde(s) +Nb iterations : 38 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.34152E-07 +Stabilite : 2.45077E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.841451| 1|-1.40868E-12 +i*-1.55069E-13| +| 2| -0.583871 +i* 0.811846| 1| 5.87586E-14 +i* 2.63177E-13| +| 3| 0.0263196 +i* -0.999654| 1| 9.89594E-13 +i*-3.85265E-13| +| 4| -0.969647 +i* -0.244511| 1|-5.84047E-14 +i*-6.69829E-14| +| 5| 0.939323 +i* -0.343035| 1| 7.60725E-13 +i* 1.68227E-12| +| 6| -0.129097 +i* -0.991632| 1| -2.278E-13 +i*-2.09967E-13| +| 7| -0.450842 +i* 0.892604| 1| 3.34819E-13 +i* 5.30987E-13| +| 8| 0.874726 +i* -0.484618| 1| 6.94573E-13 +i* 1.33379E-12| +| 9| -0.995841 +i* -0.0911079| 1| 6.65572E-13 +i* 2.21578E-13| +| 10| 0.772266 +i* 0.635299| 1|-1.10511E-12 +i*-6.88458E-13| +| 11| -0.281387 +i* -0.959594| 1|-6.93022E-14 +i* 4.40275E-13| +| 12| -0.306893 +i* 0.951744| 1| 1.0443E-15 +i* 1.24753E-13| +| 13| 0.788944 +i* -0.614465| 1| -2.2269E-12 +i*-9.13604E-13| +| 14| -0.997918 +i* 0.0645018| 1| 2.81913E-13 +i* 2.2426E-13| +| 15| 0.861482 +i* 0.507788| 1| 2.41178E-12 +i* 5.79845E-13| +| 16| -0.426862 +i* -0.904317| 1| 6.20323E-13 +i* 5.74424E-13| +| 17| 0.664347 +i* 0.747424| 1| 4.99219E-13 +i* 1.52752E-12| +| 18| -0.155512 +i* 0.987834| 1| 2.30305E-13 +i* 4.37822E-13| +| 19| -0.975826 +i* 0.218549| 1| 1.82913E-13 +i* 5.28258E-14| +| 20| 0.684051 +i* -0.729434| 1| -1.5885E-12 +i* 6.87395E-13| ++---+----------------------------+------------+----------------------------+ +1200000 racines de module = 1 +zone limite de 'log-exp' 1.00025 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 2 (of 3) uses CUDA device 2 +gpu 0 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 1 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 1 dimgrid2 1823 start 466688 size 466688 +gpu 0 dimgrid2 1823 start 0 size 466688 +gpu 2 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 2 dimgrid2 1823 start 933376 size 466688 +gpu 0 iter : 1 Arret : 1.89746E-06 s/iter 134.484937 +gpu 0 iter : 2 Arret : 2.14906E-06 s/iter 134.419714 +gpu 0 iter : 3 Arret : 2.11472E-06 s/iter 134.349447 +gpu 0 iter : 4 Arret : 1.97302E-06 s/iter 134.398359 +gpu 0 iter : 5 Arret : 1.82457E-06 s/iter 134.283270 +gpu 0 iter : 6 Arret : 1.98209E-06 s/iter 134.253889 +gpu 0 iter : 7 Arret : 2.17735E-06 s/iter 134.421904 +gpu 0 iter : 8 Arret : 1.97101E-06 s/iter 134.321893 +gpu 0 iter : 9 Arret : 2.16129E-06 s/iter 134.535647 +gpu 0 iter : 10 Arret : 2.38282E-06 s/iter 134.478409 +gpu 0 iter : 11 Arret : 2.2405E-05 s/iter 134.248329 +gpu 0 iter : 12 Arret : 0.00022004 s/iter 134.464382 +gpu 0 iter : 13 Arret : 0.000932005 s/iter 134.312492 +gpu 0 iter : 14 Arret : 0.00118315 s/iter 149.387710 +gpu 0 iter : 15 Arret : 0.0018287 s/iter 134.929996 +gpu 0 iter : 16 Arret : 0.00180872 s/iter 134.615736 +gpu 0 iter : 17 Arret : 0.00176553 s/iter 151.347445 +gpu 0 iter : 18 Arret : 0.00766227 s/iter 151.119941 +gpu 0 iter : 19 Arret : 0.617872 s/iter 145.803441 +gpu 0 iter : 20 Arret : 0.0381828 s/iter 145.717407 +gpu 0 iter : 21 Arret : 0.0125131 s/iter 153.625414 +gpu 0 iter : 22 Arret : 0.0160462 s/iter 155.085773 +gpu 0 iter : 23 Arret : 0.0115931 s/iter 153.372730 +gpu 0 iter : 24 Arret : 0.00799913 s/iter 148.200528 +gpu 0 iter : 25 Arret : 0.00909452 s/iter 139.420458 +gpu 0 iter : 26 Arret : 0.0028869 s/iter 133.912895 +gpu 0 iter : 27 Arret : 0.00141577 s/iter 133.963731 +gpu 0 iter : 28 Arret : 0.000325039 s/iter 139.908989 +gpu 0 iter : 29 Arret : 8.64942E-06 s/iter 133.630287 +gpu 0 iter : 30 Arret : 8.1623E-07 s/iter 133.636979 +gpu 0 iter : 31 Arret : 5.03685E-10 s/iter 133.618481 +gpu 0 iter : 32 Arret : 2.48253E-16 s/iter 133.648900 +temps : 4453.8 seconde(s) +Nb iterations : 32 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.63785E-07 +Stabilite : 2.48253E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540329 +i* 0.841454| 1| 4.3987E-13 +i* 1.7418E-12| +| 2| -0.0530086 +i* 0.998594| 1| 3.8728E-13 +i* 8.41422E-13| +| 3| -0.626376 +i* 0.779521| 1| 2.93654E-14 +i*-2.95439E-13| +| 4| -0.96376 +i* 0.26677| 1|-1.31943E-13 +i* 5.03167E-13| +| 5| -0.938055 +i* -0.346485| 1| 6.12451E-13 +i*-2.34033E-13| +| 6| -0.558945 +i* -0.829205| 1| 2.12923E-13 +i* 6.04209E-13| +| 7| 0.0307435 +i* -0.999527| 1|-3.70079E-13 +i* 1.04685E-13| +| 8| 0.60885 +i* -0.793286| 1| -1.5142E-12 +i* 2.45191E-13| +| 9| 0.957578 +i* -0.288175| 1|-3.17266E-12 +i* 2.02057E-12| +| 10| 0.945542 +i* 0.325501| 1|-1.50276E-12 +i* 3.84538E-13| +| 11| -0.00847209 +i* 0.999964| 1| 8.68958E-14 +i* 2.94643E-13| +| 12| -0.591029 +i* 0.80665| 1|-5.75824E-14 +i*-8.87086E-13| +| 13| -0.95092 +i* 0.309437| 1|-6.93591E-13 +i*-5.52411E-13| +| 14| -0.952559 +i* -0.304354| 1|-3.04982E-13 +i* 1.60452E-13| +| 15| -0.595328 +i* -0.803482| 1|-1.05039E-12 +i* 2.37501E-13| +| 16| -0.0138125 +i* -0.999905| 1|-8.72476E-13 +i* 2.69644E-13| +| 17| 0.572907 +i* -0.81962| 1| 1.32405E-12 +i*-6.73803E-13| +| 18| 0.94379 +i* -0.330546| 1|-1.85401E-12 +i* 2.58533E-12| +| 19| 0.959103 +i* 0.283057| 1|-2.75633E-12 +i* 3.49955E-12| +| 20| 0.613081 +i* 0.79002| 1| 4.49453E-13 +i*-4.47541E-14| ++---+----------------------------+------------+----------------------------+ +1400000 racines de module = 1 diff --git a/Simulations/full_openmp_bis/full_openmp_4GPU.o140352 b/Simulations/full_openmp_bis/full_openmp_4GPU.o140352 new file mode 100644 index 0000000..510e00e --- /dev/null +++ b/Simulations/full_openmp_bis/full_openmp_4GPU.o140352 @@ -0,0 +1,650 @@ +REMAINING: 4 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +Taking GPU #3 +zone limite de 'log-exp' 1.00356 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 0 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 0 dimgrid2 98 start 0 size 25024 +gpu 1 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 1 dimgrid2 98 start 25024 size 25024 +gpu 3 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 3 dimgrid2 98 start 75072 size 25024 +gpu 2 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 2 dimgrid2 98 start 50048 size 25024 +gpu 0 iter : 1 Arret : 2.36972E-05 s/iter 0.668974 +gpu 0 iter : 2 Arret : 2.36251E-05 s/iter 0.622308 +gpu 0 iter : 3 Arret : 2.27126E-05 s/iter 0.622336 +gpu 0 iter : 4 Arret : 2.57604E-05 s/iter 0.618855 +gpu 0 iter : 5 Arret : 2.365E-05 s/iter 0.622339 +gpu 0 iter : 6 Arret : 2.4839E-05 s/iter 0.622318 +gpu 0 iter : 7 Arret : 2.76054E-05 s/iter 0.618812 +gpu 0 iter : 8 Arret : 3.59937E-05 s/iter 0.622306 +gpu 0 iter : 9 Arret : 0.000294653 s/iter 0.622262 +gpu 0 iter : 10 Arret : 0.000438307 s/iter 0.622307 +gpu 0 iter : 11 Arret : 0.00158434 s/iter 0.622293 +gpu 0 iter : 12 Arret : 0.246104 s/iter 0.618760 +gpu 0 iter : 13 Arret : 1.48046 s/iter 1.977287 +gpu 0 iter : 14 Arret : 0.10412 s/iter 1.945511 +gpu 0 iter : 15 Arret : 0.170314 s/iter 1.965573 +gpu 0 iter : 16 Arret : 0.0234815 s/iter 0.615532 +gpu 0 iter : 17 Arret : 0.0106919 s/iter 0.613697 +gpu 0 iter : 18 Arret : 0.00621352 s/iter 0.605074 +gpu 0 iter : 19 Arret : 0.00420192 s/iter 0.603919 +gpu 0 iter : 20 Arret : 0.00306773 s/iter 0.589799 +gpu 0 iter : 21 Arret : 0.017646 s/iter 0.596300 +gpu 0 iter : 22 Arret : 0.00931167 s/iter 0.596245 +gpu 0 iter : 23 Arret : 0.0648284 s/iter 0.600998 +gpu 0 iter : 24 Arret : 0.0665304 s/iter 1.714998 +gpu 0 iter : 25 Arret : 0.00296603 s/iter 0.588729 +gpu 0 iter : 26 Arret : 0.00111019 s/iter 0.596300 +gpu 0 iter : 27 Arret : 0.000529051 s/iter 0.590093 +gpu 0 iter : 28 Arret : 0.000107964 s/iter 0.591402 +gpu 0 iter : 29 Arret : 4.04502E-05 s/iter 0.591381 +gpu 0 iter : 30 Arret : 4.20399E-05 s/iter 0.591388 +gpu 0 iter : 31 Arret : 4.27625E-05 s/iter 0.591604 +gpu 0 iter : 32 Arret : 1.80992E-05 s/iter 0.590993 +gpu 0 iter : 33 Arret : 5.24579E-08 s/iter 0.591117 +gpu 0 iter : 34 Arret : 7.81263E-13 s/iter 0.603778 +temps : 27.3746 seconde(s) +Nb iterations : 34 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.17553E-09 +Stabilite : 0 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540601 +i* 0.841279| 1| -4.3885E-14 +i*-7.30839E-15| +| 2| -0.281748 +i* -0.959489| 1|-5.73395E-14 +i*-4.24574E-14| +| 3|-4.71234E-05 +i* 1| 1| 8.60423E-16 +i* 1.94116E-15| +| 4| 0.281778 +i* -0.95948| 1|-1.23963E-14 +i* 1.02314E-14| +| 5| -0.54068 +i* 0.841228| 1| 5.53932E-14 +i*-7.48533E-15| +| 6| 0.75578 +i* -0.654825| 1|-1.78253E-13 +i* 5.35631E-14| +| 7| -0.909652 +i* 0.415372| 1|-2.24577E-14 +i*-2.99309E-14| +| 8| 0.989828 +i* -0.142268| 1|-4.88647E-13 +i* 2.69096E-13| +| 9| -0.989815 +i* -0.142361| 1| 4.10505E-14 +i* 1.22957E-14| +| 10| 0.909612 +i* 0.415458| 1|-9.85774E-14 +i* 2.25852E-13| +| 11| -0.755719 +i* -0.654896| 1|-4.50195E-14 +i* 3.70867E-14| +| 12| 0.540548 +i* 0.841313| 1| 1.15279E-13 +i*-6.26114E-14| +| 13| -0.281687 +i* -0.959506| 1| 6.72067E-14 +i*-1.86153E-14| +| 14|-0.000109955 +i* 1| 1| 1.76109E-14 +i* 5.4734E-14| +| 15| 0.281838 +i* -0.959462| 1|-5.44356E-14 +i* 4.87822E-14| +| 16| -0.540733 +i* 0.841194| 1| 1.93526E-14 +i* 3.41446E-14| +| 17| 0.755822 +i* -0.654778| 1| 1.41439E-13 +i* 1.77344E-13| +| 18| -0.909678 +i* 0.415315| 1| 3.90799E-14 +i* 2.50217E-14| +| 19| 0.989837 +i* -0.142206| 1| 1.87558E-13 +i*-4.17969E-13| +| 20| -0.989806 +i* -0.142424| 1|-4.45512E-14 +i*-1.49828E-14| ++---+----------------------------+------------+----------------------------+ +100000 racines de module = 1 +zone limite de 'log-exp' 1.00178 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 0 (of 4) uses CUDA device 0 +gpu 3 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 2 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 2 dimgrid2 196 start 100096 size 50048 +gpu 3 dimgrid2 196 start 150144 size 50048 +gpu 0 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 0 dimgrid2 196 start 0 size 50048 +gpu 1 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 1 dimgrid2 196 start 50048 size 50048 +gpu 0 iter : 1 Arret : 1.19072E-05 s/iter 2.455829 +gpu 0 iter : 2 Arret : 1.33377E-05 s/iter 2.452256 +gpu 0 iter : 3 Arret : 1.13632E-05 s/iter 2.452478 +gpu 0 iter : 4 Arret : 1.14039E-05 s/iter 2.452299 +gpu 0 iter : 5 Arret : 1.16344E-05 s/iter 2.452382 +gpu 0 iter : 6 Arret : 1.20661E-05 s/iter 2.452428 +gpu 0 iter : 7 Arret : 1.30094E-05 s/iter 2.452394 +gpu 0 iter : 8 Arret : 1.57289E-05 s/iter 2.452343 +gpu 0 iter : 9 Arret : 2.8627E-05 s/iter 2.452360 +gpu 0 iter : 10 Arret : 0.00054461 s/iter 2.452022 +gpu 0 iter : 11 Arret : 0.00145338 s/iter 2.452426 +gpu 0 iter : 12 Arret : 1.79253 s/iter 2.452107 +gpu 0 iter : 13 Arret : 0.533977 s/iter 2.452143 +gpu 0 iter : 14 Arret : 0.699076 s/iter 4.765744 +gpu 0 iter : 15 Arret : 0.0709274 s/iter 4.775254 +gpu 0 iter : 16 Arret : 0.0253286 s/iter 4.767205 +gpu 0 iter : 17 Arret : 0.00881713 s/iter 2.437767 +gpu 0 iter : 18 Arret : 0.00533107 s/iter 2.428440 +gpu 0 iter : 19 Arret : 0.00743265 s/iter 4.249640 +gpu 0 iter : 20 Arret : 0.000698696 s/iter 2.420553 +gpu 0 iter : 21 Arret : 0.000259303 s/iter 2.411812 +gpu 0 iter : 22 Arret : 0.000648656 s/iter 2.410234 +gpu 0 iter : 23 Arret : 0.00196532 s/iter 2.410082 +gpu 0 iter : 24 Arret : 0.000107854 s/iter 2.410295 +gpu 0 iter : 25 Arret : 4.09677E-05 s/iter 2.410995 +gpu 0 iter : 26 Arret : 5.37573E-06 s/iter 2.409992 +gpu 0 iter : 27 Arret : 1.62125E-08 s/iter 2.410152 +gpu 0 iter : 28 Arret : 1.42574E-13 s/iter 2.410051 +temps : 78.4901 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.64385E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540465 +i* 0.841367| 1| 1.87479E-13 +i*-5.02237E-14| +| 2| 0.176081 +i* -0.984376| 1|-5.37799E-14 +i* 6.92554E-14| +| 3| -0.852009 +i* -0.523527| 1| 3.18461E-14 +i* 4.03913E-14| +| 4| -0.79862 +i* 0.601836| 1| 5.14346E-14 +i* 3.91354E-14| +| 5| 0.980657 +i* -0.195736| 1| 6.46188E-13 +i*-7.37166E-13| +| 6| 0.268452 +i* 0.963293| 1|-8.54421E-14 +i* 3.23248E-14| +| 7| 0.458412 +i* -0.88874| 1| 2.7818E-14 +i* 6.11247E-14| +| 8| -0.659841 +i* -0.751405| 1|-6.41605E-14 +i*-6.23928E-14| +| 9| 0.994783 +i* 0.102018| 1| 6.80962E-13 +i*-1.84925E-12| +| 10| -0.940535 +i* 0.339697| 1| 2.92266E-14 +i* 1.23877E-14| +| 11| -0.0274147 +i* 0.999624| 1|-2.15418E-14 +i* -6.3281E-14| +| 12| 0.70001 +i* -0.714133| 1| 5.4335E-14 +i* -1.5535E-13| +| 13| 0.920515 +i* 0.390707| 1|-2.49037E-13 +i*-1.72111E-13| +| 14| -0.409041 +i* -0.912516| 1|-2.16806E-14 +i*-1.57877E-14| +| 15| -0.998877 +i* 0.047373| 1|-3.52392E-14 +i*-1.99354E-14| +| 16| -0.320845 +i* 0.947132| 1| 1.35437E-13 +i* 4.41019E-14| +| 17| 0.764454 +i* 0.644679| 1|-2.19425E-13 +i* -1.9223E-13| +| 18| 0.879407 +i* -0.47607| 1| 3.13968E-13 +i*-3.31275E-13| +| 19| -0.121864 +i* -0.992547| 1| 1.45647E-13 +i* 1.68268E-16| +| 20| -0.968462 +i* -0.24916| 1| 5.32629E-14 +i* 1.07952E-14| ++---+----------------------------+------------+----------------------------+ +200000 racines de module = 1 +zone limite de 'log-exp' 1.00089 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 1 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 0 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 0 dimgrid2 391 start 0 size 100032 +gpu 1 dimgrid2 391 start 100032 size 100032 +gpu 3 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 3 dimgrid2 391 start 300096 size 100032 +gpu 2 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 2 dimgrid2 391 start 200064 size 100032 +gpu 0 iter : 1 Arret : 6.83308E-06 s/iter 8.687673 +gpu 0 iter : 2 Arret : 6.78936E-06 s/iter 8.662570 +gpu 0 iter : 3 Arret : 7.21603E-06 s/iter 8.680443 +gpu 0 iter : 4 Arret : 6.21887E-06 s/iter 8.660300 +gpu 0 iter : 5 Arret : 6.53427E-06 s/iter 8.660436 +gpu 0 iter : 6 Arret : 5.95601E-06 s/iter 8.669060 +gpu 0 iter : 7 Arret : 5.94684E-06 s/iter 8.673572 +gpu 0 iter : 8 Arret : 6.66715E-06 s/iter 8.679665 +gpu 0 iter : 9 Arret : 7.17748E-06 s/iter 8.664571 +gpu 0 iter : 10 Arret : 2.83521E-05 s/iter 8.686351 +gpu 0 iter : 11 Arret : 0.00172795 s/iter 8.683895 +gpu 0 iter : 12 Arret : 0.00549103 s/iter 12.889374 +gpu 0 iter : 13 Arret : 0.00456576 s/iter 10.269934 +gpu 0 iter : 14 Arret : 0.00289852 s/iter 9.402838 +gpu 0 iter : 15 Arret : 0.0438506 s/iter 12.988912 +gpu 0 iter : 16 Arret : 3.77879 s/iter 13.166240 +gpu 0 iter : 17 Arret : 2.10534 s/iter 8.617782 +gpu 0 iter : 18 Arret : 0.796087 s/iter 10.512729 +gpu 0 iter : 19 Arret : 0.311035 s/iter 8.624823 +gpu 0 iter : 20 Arret : 0.109701 s/iter 9.275524 +gpu 0 iter : 21 Arret : 0.0600409 s/iter 9.244258 +gpu 0 iter : 22 Arret : 0.0384709 s/iter 13.193445 +gpu 0 iter : 23 Arret : 0.0257604 s/iter 12.886058 +gpu 0 iter : 24 Arret : 0.115342 s/iter 11.285456 +gpu 0 iter : 25 Arret : 0.158851 s/iter 13.051696 +gpu 0 iter : 26 Arret : 0.361498 s/iter 11.279780 +gpu 0 iter : 27 Arret : 0.673522 s/iter 11.353180 +gpu 0 iter : 28 Arret : 0.0406058 s/iter 13.868227 +gpu 0 iter : 29 Arret : 0.016774 s/iter 13.878938 +gpu 0 iter : 30 Arret : 0.0124111 s/iter 14.114049 +gpu 0 iter : 31 Arret : 0.00546513 s/iter 13.998499 +gpu 0 iter : 32 Arret : 0.000358108 s/iter 8.577800 +gpu 0 iter : 33 Arret : 6.85612E-05 s/iter 8.572216 +gpu 0 iter : 34 Arret : 0.00100594 s/iter 8.603434 +gpu 0 iter : 35 Arret : 0.000298069 s/iter 8.578157 +gpu 0 iter : 36 Arret : 2.04019E-05 s/iter 8.587649 +gpu 0 iter : 37 Arret : 2.48589E-06 s/iter 8.588165 +gpu 0 iter : 38 Arret : 3.21069E-08 s/iter 8.581318 +gpu 0 iter : 39 Arret : 1.30873E-13 s/iter 8.589365 +temps : 399.7 seconde(s) +Nb iterations : 39 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.12993E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540383 +i* 0.841419| 1| 1.25143E-14 +i* 6.97793E-14| +| 2| -0.98885 +i* 0.148913| 1|-1.87034E-13 +i*-1.52024E-13| +| 3| 0.412505 +i* -0.910956| 1|-2.05679E-13 +i* 8.74266E-14| +| 4| 0.268615 +i* -0.963248| 1| 1.23929E-14 +i* 2.02841E-14| +| 5| -0.954531 +i* 0.298113| 1| 6.68562E-14 +i* 8.87016E-14| +| 6| 0.769081 +i* 0.639152| 1|-2.56017E-13 +i* 6.90161E-13| +| 7| 0.11843 +i* -0.992962| 1| -1.5522E-13 +i* 8.29944E-14| +| 8| -0.897838 +i* 0.440326| 1|-2.57121E-14 +i* 6.84192E-14| +| 9| 0.857632 +i* 0.514263| 1| 7.84754E-13 +i* 2.86151E-13| +| 10| -0.0345309 +i* -0.999404| 1| 3.31561E-13 +i*-9.06705E-14| +| 11| 0.662503 +i* 0.74906| 1| 7.42843E-14 +i*-6.06277E-13| +| 12| -0.820101 +i* 0.572218| 1|-4.91863E-14 +i*-2.00555E-13| +| 13| -0.186683 +i* -0.98242| 1| -1.8106E-13 +i* 3.61083E-14| +| 14| 0.926088 +i* 0.377307| 1| 6.5396E-13 +i* 7.07941E-13| +| 15| -0.723143 +i* 0.690699| 1|-1.75058E-13 +i* 1.33799E-14| +| 16| -0.334459 +i* -0.94241| 1| 2.20716E-13 +i*-8.68958E-14| +| 17| 0.97283 +i* 0.23152| 1|-1.36773E-13 +i*-4.46509E-13| +| 18| -0.609235 +i* 0.79299| 1|-8.90538E-14 +i* 1.42372E-13| +| 19| -0.474396 +i* -0.880312| 1| 2.76109E-13 +i* 7.19095E-14| +| 20| 0.99677 +i* 0.0803066| 1| 1.32664E-12 +i*-5.68624E-12| ++---+----------------------------+------------+----------------------------+ +400000 racines de module = 1 +zone limite de 'log-exp' 1.00059 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +gpu 2 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 2 dimgrid2 586 start 300032 size 150016 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 586 start 150016 size 150016 +gpu 3 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 3 dimgrid2 586 start 450048 size 150016 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 586 start 0 size 150016 +gpu 0 iter : 1 Arret : 4.50774E-06 s/iter 18.767906 +gpu 0 iter : 2 Arret : 4.46347E-06 s/iter 18.760511 +gpu 0 iter : 3 Arret : 4.08919E-06 s/iter 18.749796 +gpu 0 iter : 4 Arret : 3.95781E-06 s/iter 18.756445 +gpu 0 iter : 5 Arret : 4.12023E-06 s/iter 18.760371 +gpu 0 iter : 6 Arret : 4.06808E-06 s/iter 18.729222 +gpu 0 iter : 7 Arret : 3.99899E-06 s/iter 18.743423 +gpu 0 iter : 8 Arret : 4.31359E-06 s/iter 18.751151 +gpu 0 iter : 9 Arret : 5.21531E-06 s/iter 18.733803 +gpu 0 iter : 10 Arret : 0.000101946 s/iter 18.734289 +gpu 0 iter : 11 Arret : 0.000408516 s/iter 18.733136 +gpu 0 iter : 12 Arret : 0.000706557 s/iter 18.732114 +gpu 0 iter : 13 Arret : 2.1909 s/iter 18.757334 +gpu 0 iter : 14 Arret : 0.451216 s/iter 18.748264 +gpu 0 iter : 15 Arret : 0.339953 s/iter 26.736153 +gpu 0 iter : 16 Arret : 0.169148 s/iter 26.789207 +gpu 0 iter : 17 Arret : 0.0402512 s/iter 26.808647 +gpu 0 iter : 18 Arret : 0.0210284 s/iter 26.763957 +gpu 0 iter : 19 Arret : 0.013235 s/iter 26.768900 +gpu 0 iter : 20 Arret : 0.00905439 s/iter 26.849639 +gpu 0 iter : 21 Arret : 0.00651652 s/iter 26.787569 +gpu 0 iter : 22 Arret : 0.0209755 s/iter 26.999416 +gpu 0 iter : 23 Arret : 0.0283027 s/iter 27.203851 +gpu 0 iter : 24 Arret : 0.0246379 s/iter 26.993683 +gpu 0 iter : 25 Arret : 0.101185 s/iter 26.803558 +gpu 0 iter : 26 Arret : 0.100313 s/iter 26.842046 +gpu 0 iter : 27 Arret : 0.163719 s/iter 26.828628 +gpu 0 iter : 28 Arret : 0.0482315 s/iter 26.845110 +gpu 0 iter : 29 Arret : 0.0103223 s/iter 26.896065 +gpu 0 iter : 30 Arret : 0.00496332 s/iter 26.806043 +gpu 0 iter : 31 Arret : 0.00367192 s/iter 26.760809 +gpu 0 iter : 32 Arret : 0.00341441 s/iter 26.789298 +gpu 0 iter : 33 Arret : 0.00247026 s/iter 26.756686 +gpu 0 iter : 34 Arret : 0.00208061 s/iter 26.652171 +gpu 0 iter : 35 Arret : 0.00185636 s/iter 26.575964 +gpu 0 iter : 36 Arret : 0.00352602 s/iter 26.683145 +gpu 0 iter : 37 Arret : 0.00653739 s/iter 26.590103 +gpu 0 iter : 38 Arret : 0.00492686 s/iter 26.588605 +gpu 0 iter : 39 Arret : 0.00447252 s/iter 26.496367 +gpu 0 iter : 40 Arret : 0.000547314 s/iter 26.592548 +gpu 0 iter : 41 Arret : 0.00136209 s/iter 26.538804 +gpu 0 iter : 42 Arret : 0.00197612 s/iter 26.583277 +gpu 0 iter : 43 Arret : 0.000392726 s/iter 18.622408 +gpu 0 iter : 44 Arret : 0.00131045 s/iter 18.685108 +gpu 0 iter : 45 Arret : 0.00104061 s/iter 19.378597 +gpu 0 iter : 46 Arret : 0.000234145 s/iter 18.609701 +gpu 0 iter : 47 Arret : 4.7188E-05 s/iter 18.577615 +gpu 0 iter : 48 Arret : 5.10545E-06 s/iter 18.608929 +gpu 0 iter : 49 Arret : 3.52111E-08 s/iter 18.602465 +gpu 0 iter : 50 Arret : 1.02528E-13 s/iter 18.651905 +temps : 1163.51 seconde(s) +Nb iterations : 50 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.996672 +i* 0.0815122| 1|-4.60361E-14 +i*-1.54911E-15| +| 3| 0.396458 +i* -0.918053| 1|-3.61742E-13 +i* 4.28426E-13| +| 4| -0.983009 +i* 0.183558| 1| 2.27839E-14 +i* 1.21547E-13| +| 5| 0.299962 +i* -0.953951| 1| 3.10155E-13 +i*-4.52272E-13| +| 6| 0.701062 +i* 0.7131| 1| 6.08482E-13 +i* 3.68603E-13| +| 7| -0.958925 +i* 0.283658| 1|-3.43857E-14 +i*-4.33108E-14| +| 8| 0.200287 +i* -0.979737| 1| 4.39829E-13 +i*-3.61119E-13| +| 9| 0.770667 +i* 0.637238| 1| -2.7036E-13 +i*-8.38747E-13| +| 10| -0.924677 +i* 0.380752| 1| 1.44957E-13 +i* 1.13251E-13| +| 11| 0.0984885 +i* -0.995138| 1| 3.5235E-13 +i*-2.31698E-13| +| 12| 0.832104 +i* 0.55462| 1| 8.49546E-13 +i* -8.3842E-13| +| 13| -0.880627 +i* 0.473809| 1|-9.58227E-14 +i* -1.6529E-13| +| 14| -0.0043537 +i* -0.999991| 1| 1.63446E-13 +i*-5.45449E-14| +| 15| 0.88472 +i* 0.466123| 1| -6.8268E-13 +i* -3.8889E-13| +| 16| 0.624025 +i* 0.781404| 1| 9.47506E-15 +i*-6.78554E-13| +| 17| -0.827243 +i* 0.561844| 1|-1.79082E-13 +i*-3.05719E-13| +| 18| -0.10715 +i* -0.994243| 1| 3.32474E-13 +i*-4.57395E-14| +| 19| 0.927958 +i* 0.372686| 1| 1.0255E-13 +i* 1.0692E-13| +| 20| -0.765083 +i* 0.643932| 1| 3.06144E-14 +i*-3.59443E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +zone limite de 'log-exp' 1.00044 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 782 start 200000 size 200000 +gpu 3 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 3 dimgrid2 782 start 600000 size 200000 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 782 start 0 size 200000 +gpu 2 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 2 dimgrid2 782 start 400000 size 200000 +gpu 0 iter : 1 Arret : 2.9665E-06 s/iter 34.132954 +gpu 0 iter : 2 Arret : 2.96498E-06 s/iter 34.060373 +gpu 0 iter : 3 Arret : 2.9937E-06 s/iter 34.106618 +gpu 0 iter : 4 Arret : 2.99019E-06 s/iter 34.131529 +gpu 0 iter : 5 Arret : 2.96254E-06 s/iter 34.072428 +gpu 0 iter : 6 Arret : 2.96634E-06 s/iter 34.094938 +gpu 0 iter : 7 Arret : 2.97177E-06 s/iter 34.087606 +gpu 0 iter : 8 Arret : 3.1804E-06 s/iter 34.105421 +gpu 0 iter : 9 Arret : 3.76913E-06 s/iter 34.122970 +gpu 0 iter : 10 Arret : 6.64268E-06 s/iter 34.130380 +gpu 0 iter : 11 Arret : 0.000184943 s/iter 34.119757 +gpu 0 iter : 12 Arret : 0.00113217 s/iter 34.095463 +gpu 0 iter : 13 Arret : 0.753916 s/iter 34.085029 +gpu 0 iter : 14 Arret : 0.945227 s/iter 34.115229 +gpu 0 iter : 15 Arret : 2.42544 s/iter 34.084082 +gpu 0 iter : 16 Arret : 0.0394416 s/iter 34.026900 +gpu 0 iter : 17 Arret : 0.0115328 s/iter 33.884844 +gpu 0 iter : 18 Arret : 0.000905462 s/iter 33.872131 +gpu 0 iter : 19 Arret : 0.000346005 s/iter 33.871123 +gpu 0 iter : 20 Arret : 0.000573762 s/iter 33.849199 +gpu 0 iter : 21 Arret : 0.000415648 s/iter 33.868251 +gpu 0 iter : 22 Arret : 0.000562449 s/iter 33.882749 +gpu 0 iter : 23 Arret : 0.0012921 s/iter 33.868629 +gpu 0 iter : 24 Arret : 0.000343321 s/iter 33.877909 +gpu 0 iter : 25 Arret : 6.89541E-05 s/iter 33.851132 +gpu 0 iter : 26 Arret : 2.43828E-05 s/iter 33.849227 +gpu 0 iter : 27 Arret : 1.8909E-05 s/iter 33.872817 +gpu 0 iter : 28 Arret : 2.44076E-05 s/iter 33.860491 +gpu 0 iter : 29 Arret : 3.23083E-06 s/iter 33.868783 +gpu 0 iter : 30 Arret : 1.58E-10 s/iter 33.857784 +gpu 0 iter : 31 Arret : 3.85593E-16 s/iter 33.840967 +temps : 1055.39 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| -0.942555 +i* -0.334052| 1| 2.1929E-13 +i*-2.49686E-13| +| 3| -0.558601 +i* 0.829437| 1|-3.51628E-14 +i*-4.09232E-13| +| 4| -0.0665975 +i* -0.99778| 1|-3.91888E-13 +i* 9.06636E-14| +| 5| 0.949627 +i* -0.313383| 1|-1.12544E-12 +i* 2.13597E-12| +| 6| -0.982853 +i* -0.184391| 1| 8.57613E-14 +i* 1.33506E-13| +| 7| 0.889798 +i* -0.456354| 1| 1.27488E-12 +i* 5.17779E-13| +| 8| -0.423729 +i* 0.905789| 1|-7.25461E-15 +i*-1.33088E-14| +| 9| -0.219973 +i* -0.975506| 1| 4.34097E-13 +i*-4.24712E-14| +| 10| 0.771464 +i* 0.636273| 1| -4.4266E-13 +i*-2.07773E-13| +| 11| -0.999541 +i* -0.0303078| 1| 3.54265E-14 +i* 1.32862E-14| +| 12| 0.808597 +i* -0.588363| 1|-5.90212E-13 +i*-1.43182E-12| +| 13| 0.663883 +i* 0.747836| 1| 4.13159E-13 +i* 1.10149E-12| +| 14| -0.27868 +i* 0.960384| 1|-1.03539E-13 +i*-1.45998E-13| +| 15| -0.368064 +i* -0.929801| 1| 4.60916E-14 +i*-1.09841E-13| +| 16| -0.992219 +i* 0.124503| 1| 2.74294E-13 +i* 2.11383E-13| +| 17| 0.707973 +i* -0.706239| 1|-1.10575E-12 +i*-7.41631E-13| +| 18| 0.860514 +i* 0.509426| 1| 9.86579E-13 +i* 1.10532E-12| +| 19| -0.126936 +i* 0.991911| 1| 1.67744E-13 +i* 5.51772E-13| +| 20| -0.507314 +i* -0.861761| 1| 5.50185E-14 +i* 3.42273E-13| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 +zone limite de 'log-exp' 1.00035 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 0 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 0 dimgrid2 977 start 0 size 250048 +gpu 2 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 2 dimgrid2 977 start 500096 size 250048 +gpu 3 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 3 dimgrid2 977 start 750144 size 250048 +gpu 1 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 1 dimgrid2 977 start 250048 size 250048 +gpu 0 iter : 1 Arret : 2.88781E-06 s/iter 52.567689 +gpu 0 iter : 2 Arret : 2.48174E-06 s/iter 52.412927 +gpu 0 iter : 3 Arret : 2.37734E-06 s/iter 52.445779 +gpu 0 iter : 4 Arret : 2.38169E-06 s/iter 52.428480 +gpu 0 iter : 5 Arret : 2.38448E-06 s/iter 52.401350 +gpu 0 iter : 6 Arret : 2.9427E-06 s/iter 52.358266 +gpu 0 iter : 7 Arret : 2.4276E-06 s/iter 52.420365 +gpu 0 iter : 8 Arret : 2.576E-06 s/iter 52.397873 +gpu 0 iter : 9 Arret : 2.95754E-06 s/iter 52.438769 +gpu 0 iter : 10 Arret : 4.376E-06 s/iter 52.429890 +gpu 0 iter : 11 Arret : 0.000112761 s/iter 52.466360 +gpu 0 iter : 12 Arret : 0.00014018 s/iter 52.402254 +gpu 0 iter : 13 Arret : 0.00011586 s/iter 52.424902 +gpu 0 iter : 14 Arret : 0.00133799 s/iter 52.444410 +gpu 0 iter : 15 Arret : 1.4567 s/iter 54.393527 +gpu 0 iter : 16 Arret : 0.157126 s/iter 54.676459 +gpu 0 iter : 17 Arret : 0.0769879 s/iter 54.372305 +gpu 0 iter : 18 Arret : 0.047361 s/iter 66.600120 +gpu 0 iter : 19 Arret : 0.0316599 s/iter 56.256144 +gpu 0 iter : 20 Arret : 0.0224311 s/iter 58.438101 +gpu 0 iter : 21 Arret : 0.0165373 s/iter 61.741227 +gpu 0 iter : 22 Arret : 0.401359 s/iter 56.531585 +gpu 0 iter : 23 Arret : 0.328672 s/iter 55.269982 +gpu 0 iter : 24 Arret : 0.202796 s/iter 55.021521 +gpu 0 iter : 25 Arret : 0.104584 s/iter 54.616326 +gpu 0 iter : 26 Arret : 0.0261205 s/iter 66.413122 +gpu 0 iter : 27 Arret : 0.0245485 s/iter 52.868792 +gpu 0 iter : 28 Arret : 0.0278169 s/iter 56.569999 +gpu 0 iter : 29 Arret : 0.00143344 s/iter 52.689834 +gpu 0 iter : 30 Arret : 0.00133282 s/iter 52.767469 +gpu 0 iter : 31 Arret : 0.00056116 s/iter 52.674243 +gpu 0 iter : 32 Arret : 0.00122145 s/iter 52.782739 +gpu 0 iter : 33 Arret : 0.00499332 s/iter 52.888671 +gpu 0 iter : 34 Arret : 8.64873E-05 s/iter 52.819841 +gpu 0 iter : 35 Arret : 3.87016E-05 s/iter 52.893826 +gpu 0 iter : 36 Arret : 0.000101821 s/iter 52.680312 +gpu 0 iter : 37 Arret : 0.00108852 s/iter 52.667928 +gpu 0 iter : 38 Arret : 0.00150801 s/iter 52.688010 +gpu 0 iter : 39 Arret : 0.000162458 s/iter 52.662407 +gpu 0 iter : 40 Arret : 4.74398E-05 s/iter 52.683807 +gpu 0 iter : 41 Arret : 2.2996E-05 s/iter 52.734431 +gpu 0 iter : 42 Arret : 1.52502E-05 s/iter 52.717114 +gpu 0 iter : 43 Arret : 5.47596E-06 s/iter 52.767661 +gpu 0 iter : 44 Arret : 7.00943E-07 s/iter 52.627015 +gpu 0 iter : 45 Arret : 3.22655E-09 s/iter 52.686211 +gpu 0 iter : 46 Arret : 5.38916E-15 s/iter 52.697776 +temps : 2489.06 seconde(s) +Nb iterations : 46 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.80137E-07 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54034 +i* 0.841447| 1| 4.08253E-13 +i*-6.65317E-13| +| 2| -0.513915 +i* -0.857841| 1|-9.07486E-13 +i* 1.86417E-13| +| 3| 0.486982 +i* 0.873412| 1|-6.63601E-14 +i*-1.18344E-12| +| 4| -0.459589 +i* -0.888132| 1|-5.16153E-13 +i*-2.68006E-13| +| 5| 0.43174 +i* 0.901998| 1|-6.77361E-13 +i* 7.93272E-13| +| 6| -0.40348 +i* -0.914989| 1|-3.45956E-13 +i*-2.59726E-13| +| 7| 0.374828 +i* 0.927094| 1| 3.65041E-13 +i* 3.54812E-13| +| 8| -0.345815 +i* -0.938303| 1| 5.50778E-13 +i* 8.9059E-14| +| 9| 0.316466 +i* 0.948604| 1|-2.87419E-13 +i* 5.21678E-13| +| 10| -0.286812 +i* -0.957987| 1| 6.43516E-13 +i* 2.73696E-13| +| 11| 0.25688 +i* 0.966443| 1|-4.31814E-13 +i* 5.6624E-13| +| 12| -0.226699 +i* -0.973965| 1| 4.35089E-13 +i* -6.6197E-14| +| 13| 0.196299 +i* 0.980544| 1| 3.90278E-14 +i*-7.14062E-13| +| 14| -0.165685 +i* -0.986179| 1| 7.63278E-16 +i*-3.73816E-14| +| 15| 0.13496 +i* 0.990851| 1| 1.03566E-13 +i*-6.61428E-13| +| 16| -0.104079 +i* -0.994569| 1| 7.90108E-13 +i*-1.74942E-13| +| 17| 0.0730977 +i* 0.997325| 1| 1.11931E-13 +i* 4.68587E-13| +| 18| -0.0420456 +i* -0.999116| 1| 2.29268E-13 +i*-1.21795E-14| +| 19| 0.0109529 +i* 0.99994| 1|-2.47309E-13 +i*-7.90307E-13| +| 20| 0.0201504 +i* -0.999797| 1| 6.69503E-13 +i*-2.16847E-13| ++---+----------------------------+------------+----------------------------+ +1000000 racines de module = 1 +zone limite de 'log-exp' 1.0003 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 2 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 2 dimgrid2 1172 start 600064 size 300032 +gpu 0 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 0 dimgrid2 1172 start 0 size 300032 +gpu 3 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 3 dimgrid2 1172 start 900096 size 300032 +gpu 1 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 1 dimgrid2 1172 start 300032 size 300032 +gpu 0 iter : 1 Arret : 2.42652E-06 s/iter 74.617749 +gpu 0 iter : 2 Arret : 2.49614E-06 s/iter 74.548310 +gpu 0 iter : 3 Arret : 2.21192E-06 s/iter 74.556230 +gpu 0 iter : 4 Arret : 2.11473E-06 s/iter 74.504423 +gpu 0 iter : 5 Arret : 2.29716E-06 s/iter 74.525347 +gpu 0 iter : 6 Arret : 2.20002E-06 s/iter 74.448738 +gpu 0 iter : 7 Arret : 2.19767E-06 s/iter 74.591557 +gpu 0 iter : 8 Arret : 2.319E-06 s/iter 74.518969 +gpu 0 iter : 9 Arret : 2.33977E-06 s/iter 74.417513 +gpu 0 iter : 10 Arret : 3.18561E-06 s/iter 74.428935 +gpu 0 iter : 11 Arret : 2.39196E-05 s/iter 74.427517 +gpu 0 iter : 12 Arret : 0.000318633 s/iter 74.433069 +gpu 0 iter : 13 Arret : 0.00154086 s/iter 74.779282 +gpu 0 iter : 14 Arret : 0.000824248 s/iter 74.717977 +gpu 0 iter : 15 Arret : 0.000938617 s/iter 74.750958 +gpu 0 iter : 16 Arret : 0.00924203 s/iter 74.495587 +gpu 0 iter : 17 Arret : 1.22373 s/iter 89.902699 +gpu 0 iter : 18 Arret : 0.0309579 s/iter 89.741584 +gpu 0 iter : 19 Arret : 0.0522422 s/iter 89.331794 +gpu 0 iter : 20 Arret : 0.0374635 s/iter 89.988148 +gpu 0 iter : 21 Arret : 0.0161203 s/iter 93.229079 +gpu 0 iter : 22 Arret : 0.0347427 s/iter 92.221499 +gpu 0 iter : 23 Arret : 0.0641293 s/iter 93.761623 +gpu 0 iter : 24 Arret : 0.0357214 s/iter 93.514989 +gpu 0 iter : 25 Arret : 0.207308 s/iter 94.107114 +gpu 0 iter : 26 Arret : 0.125661 s/iter 92.472778 +gpu 0 iter : 27 Arret : 0.0748459 s/iter 90.193087 +gpu 0 iter : 28 Arret : 0.0395315 s/iter 91.296280 +gpu 0 iter : 29 Arret : 0.0352008 s/iter 87.646913 +gpu 0 iter : 30 Arret : 0.0383622 s/iter 74.418177 +gpu 0 iter : 31 Arret : 0.0225754 s/iter 74.526286 +gpu 0 iter : 32 Arret : 0.000665957 s/iter 74.146229 +gpu 0 iter : 33 Arret : 1.74739E-05 s/iter 74.377078 +gpu 0 iter : 34 Arret : 8.8614E-06 s/iter 74.306201 +gpu 0 iter : 35 Arret : 6.22465E-06 s/iter 74.346563 +gpu 0 iter : 36 Arret : 1.54539E-05 s/iter 74.268334 +gpu 0 iter : 37 Arret : 1.99901E-05 s/iter 74.305788 +gpu 0 iter : 38 Arret : 2.01663E-06 s/iter 74.513999 +gpu 0 iter : 39 Arret : 2.0507E-07 s/iter 74.179158 +gpu 0 iter : 40 Arret : 3.39098E-11 s/iter 74.283612 +gpu 0 iter : 41 Arret : 1.57009E-16 s/iter 74.098952 +temps : 3274.17 seconde(s) +Nb iterations : 41 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.34152E-07 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.841451| 1|-1.40868E-12 +i*-1.55069E-13| +| 2| -0.583871 +i* 0.811846| 1| 5.87586E-14 +i* 2.63177E-13| +| 3| 0.0263196 +i* -0.999654| 1| 9.89594E-13 +i*-3.85265E-13| +| 4| -0.969647 +i* -0.244511| 1|-5.84047E-14 +i*-6.69829E-14| +| 5| 0.939323 +i* -0.343035| 1| 7.60725E-13 +i* 1.68227E-12| +| 6| -0.129097 +i* -0.991632| 1| -2.278E-13 +i*-2.09967E-13| +| 7| -0.450842 +i* 0.892604| 1| 3.34819E-13 +i* 5.30987E-13| +| 8| 0.874726 +i* -0.484618| 1| 6.94573E-13 +i* 1.33379E-12| +| 9| -0.995841 +i* -0.0911079| 1| 6.65572E-13 +i* 2.21578E-13| +| 10| 0.772266 +i* 0.635299| 1|-1.10511E-12 +i*-6.88458E-13| +| 11| -0.281387 +i* -0.959594| 1|-6.93022E-14 +i* 4.40275E-13| +| 12| -0.306893 +i* 0.951744| 1| 1.0443E-15 +i* 1.24753E-13| +| 13| 0.788944 +i* -0.614465| 1| -2.2269E-12 +i*-9.13604E-13| +| 14| -0.997918 +i* 0.0645018| 1| 2.81913E-13 +i* 2.2426E-13| +| 15| 0.861482 +i* 0.507788| 1| 2.41178E-12 +i* 5.79845E-13| +| 16| -0.426862 +i* -0.904317| 1| 6.20323E-13 +i* 5.74424E-13| +| 17| 0.664347 +i* 0.747424| 1| 4.99219E-13 +i* 1.52752E-12| +| 18| -0.155512 +i* 0.987834| 1| 2.30305E-13 +i* 4.37822E-13| +| 19| -0.975826 +i* 0.218549| 1| 1.82913E-13 +i* 5.28258E-14| +| 20| 0.684055 +i* -0.72943| 1|-1.32506E-12 +i*-1.70394E-12| ++---+----------------------------+------------+----------------------------+ +1200000 racines de module = 1 +zone limite de 'log-exp' 1.00025 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 0 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 0 dimgrid2 1368 start 0 size 350016 +gpu 1 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 1 dimgrid2 1368 start 350016 size 350016 +gpu 3 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 3 dimgrid2 1368 start 1050048 size 350016 +gpu 2 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 2 dimgrid2 1368 start 700032 size 350016 +gpu 0 iter : 1 Arret : 2.03238E-06 s/iter 101.212949 +gpu 0 iter : 2 Arret : 1.8928E-06 s/iter 101.009938 +gpu 0 iter : 3 Arret : 1.76076E-06 s/iter 101.081176 +gpu 0 iter : 4 Arret : 1.69968E-06 s/iter 100.980005 +gpu 0 iter : 5 Arret : 2.05399E-06 s/iter 101.013322 +gpu 0 iter : 6 Arret : 1.85778E-06 s/iter 100.874154 +gpu 0 iter : 7 Arret : 1.7351E-06 s/iter 101.028880 +gpu 0 iter : 8 Arret : 1.82753E-06 s/iter 101.353518 +gpu 0 iter : 9 Arret : 1.78381E-06 s/iter 101.161489 +gpu 0 iter : 10 Arret : 1.95163E-06 s/iter 101.020805 +gpu 0 iter : 11 Arret : 1.11498E-05 s/iter 100.910293 +gpu 0 iter : 12 Arret : 0.000267342 s/iter 101.117136 +gpu 0 iter : 13 Arret : 0.000448589 s/iter 101.072866 +gpu 0 iter : 14 Arret : 0.00117343 s/iter 102.399232 +gpu 0 iter : 15 Arret : 0.0025383 s/iter 101.619405 +gpu 0 iter : 16 Arret : 0.0127207 s/iter 101.389072 +gpu 0 iter : 17 Arret : 0.00589486 s/iter 120.753705 +gpu 0 iter : 18 Arret : 0.00398562 s/iter 114.216025 +gpu 0 iter : 19 Arret : 0.00872604 s/iter 120.471159 +gpu 0 iter : 20 Arret : 0.0658269 s/iter 121.374423 +gpu 0 iter : 21 Arret : 0.643107 s/iter 120.581728 +gpu 0 iter : 22 Arret : 0.0256024 s/iter 101.540440 +gpu 0 iter : 23 Arret : 0.00590733 s/iter 101.350206 +gpu 0 iter : 24 Arret : 0.00290093 s/iter 102.021897 +gpu 0 iter : 25 Arret : 0.000722765 s/iter 102.009174 +gpu 0 iter : 26 Arret : 0.000172667 s/iter 100.437242 +gpu 0 iter : 27 Arret : 9.4954E-05 s/iter 100.408854 +gpu 0 iter : 28 Arret : 0.000102556 s/iter 100.581581 +gpu 0 iter : 29 Arret : 5.13171E-06 s/iter 100.431024 +gpu 0 iter : 30 Arret : 1.97065E-06 s/iter 100.464145 +gpu 0 iter : 31 Arret : 4.62246E-08 s/iter 100.685343 +gpu 0 iter : 32 Arret : 6.27512E-14 s/iter 100.695274 +temps : 3329.48 seconde(s) +Nb iterations : 32 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.63785E-07 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540329 +i* 0.841454| 1| 4.3987E-13 +i* 1.7418E-12| +| 2| -0.0530086 +i* 0.998594| 1| 3.8728E-13 +i* 8.41422E-13| +| 3| -0.626376 +i* 0.779521| 1| 2.93654E-14 +i*-2.95439E-13| +| 4| -0.96376 +i* 0.26677| 1|-1.31943E-13 +i* 5.03167E-13| +| 5| -0.938055 +i* -0.346485| 1| 6.12451E-13 +i*-2.34033E-13| +| 6| -0.558945 +i* -0.829205| 1| 2.12923E-13 +i* 6.04209E-13| +| 7| 0.0307435 +i* -0.999527| 1|-3.70079E-13 +i* 1.04685E-13| +| 8| 0.60885 +i* -0.793286| 1| -1.5142E-12 +i* 2.45191E-13| +| 9| 0.957578 +i* -0.288175| 1|-3.17266E-12 +i* 2.02057E-12| +| 10| 0.945542 +i* 0.325501| 1|-1.50276E-12 +i* 3.84538E-13| +| 11| -0.00847209 +i* 0.999964| 1| 8.68958E-14 +i* 2.94643E-13| +| 12| -0.591029 +i* 0.80665| 1|-5.75824E-14 +i*-8.87086E-13| +| 13| -0.95092 +i* 0.309437| 1|-6.93591E-13 +i*-5.52411E-13| +| 14| -0.952559 +i* -0.304354| 1|-3.04982E-13 +i* 1.60452E-13| +| 15| -0.595328 +i* -0.803482| 1|-1.05039E-12 +i* 2.37501E-13| +| 16| -0.0138125 +i* -0.999905| 1|-8.72476E-13 +i* 2.69644E-13| +| 17| 0.572907 +i* -0.81962| 1| 1.32405E-12 +i*-6.73803E-13| +| 18| 0.94379 +i* -0.330546| 1|-1.85401E-12 +i* 2.58533E-12| +| 19| 0.959103 +i* 0.283057| 1|-2.75633E-12 +i* 3.49955E-12| +| 20| 0.613081 +i* 0.79002| 1| 4.49453E-13 +i*-4.47541E-14| ++---+----------------------------+------------+----------------------------+ +1400000 racines de module = 1 diff --git a/Simulations/full_openmp_bis/full_openmp_4GPU.o140352~ b/Simulations/full_openmp_bis/full_openmp_4GPU.o140352~ new file mode 100644 index 0000000..510e00e --- /dev/null +++ b/Simulations/full_openmp_bis/full_openmp_4GPU.o140352~ @@ -0,0 +1,650 @@ +REMAINING: 4 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +Taking GPU #3 +zone limite de 'log-exp' 1.00356 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 0 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 0 dimgrid2 98 start 0 size 25024 +gpu 1 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 1 dimgrid2 98 start 25024 size 25024 +gpu 3 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 3 dimgrid2 98 start 75072 size 25024 +gpu 2 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 2 dimgrid2 98 start 50048 size 25024 +gpu 0 iter : 1 Arret : 2.36972E-05 s/iter 0.668974 +gpu 0 iter : 2 Arret : 2.36251E-05 s/iter 0.622308 +gpu 0 iter : 3 Arret : 2.27126E-05 s/iter 0.622336 +gpu 0 iter : 4 Arret : 2.57604E-05 s/iter 0.618855 +gpu 0 iter : 5 Arret : 2.365E-05 s/iter 0.622339 +gpu 0 iter : 6 Arret : 2.4839E-05 s/iter 0.622318 +gpu 0 iter : 7 Arret : 2.76054E-05 s/iter 0.618812 +gpu 0 iter : 8 Arret : 3.59937E-05 s/iter 0.622306 +gpu 0 iter : 9 Arret : 0.000294653 s/iter 0.622262 +gpu 0 iter : 10 Arret : 0.000438307 s/iter 0.622307 +gpu 0 iter : 11 Arret : 0.00158434 s/iter 0.622293 +gpu 0 iter : 12 Arret : 0.246104 s/iter 0.618760 +gpu 0 iter : 13 Arret : 1.48046 s/iter 1.977287 +gpu 0 iter : 14 Arret : 0.10412 s/iter 1.945511 +gpu 0 iter : 15 Arret : 0.170314 s/iter 1.965573 +gpu 0 iter : 16 Arret : 0.0234815 s/iter 0.615532 +gpu 0 iter : 17 Arret : 0.0106919 s/iter 0.613697 +gpu 0 iter : 18 Arret : 0.00621352 s/iter 0.605074 +gpu 0 iter : 19 Arret : 0.00420192 s/iter 0.603919 +gpu 0 iter : 20 Arret : 0.00306773 s/iter 0.589799 +gpu 0 iter : 21 Arret : 0.017646 s/iter 0.596300 +gpu 0 iter : 22 Arret : 0.00931167 s/iter 0.596245 +gpu 0 iter : 23 Arret : 0.0648284 s/iter 0.600998 +gpu 0 iter : 24 Arret : 0.0665304 s/iter 1.714998 +gpu 0 iter : 25 Arret : 0.00296603 s/iter 0.588729 +gpu 0 iter : 26 Arret : 0.00111019 s/iter 0.596300 +gpu 0 iter : 27 Arret : 0.000529051 s/iter 0.590093 +gpu 0 iter : 28 Arret : 0.000107964 s/iter 0.591402 +gpu 0 iter : 29 Arret : 4.04502E-05 s/iter 0.591381 +gpu 0 iter : 30 Arret : 4.20399E-05 s/iter 0.591388 +gpu 0 iter : 31 Arret : 4.27625E-05 s/iter 0.591604 +gpu 0 iter : 32 Arret : 1.80992E-05 s/iter 0.590993 +gpu 0 iter : 33 Arret : 5.24579E-08 s/iter 0.591117 +gpu 0 iter : 34 Arret : 7.81263E-13 s/iter 0.603778 +temps : 27.3746 seconde(s) +Nb iterations : 34 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.17553E-09 +Stabilite : 0 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540601 +i* 0.841279| 1| -4.3885E-14 +i*-7.30839E-15| +| 2| -0.281748 +i* -0.959489| 1|-5.73395E-14 +i*-4.24574E-14| +| 3|-4.71234E-05 +i* 1| 1| 8.60423E-16 +i* 1.94116E-15| +| 4| 0.281778 +i* -0.95948| 1|-1.23963E-14 +i* 1.02314E-14| +| 5| -0.54068 +i* 0.841228| 1| 5.53932E-14 +i*-7.48533E-15| +| 6| 0.75578 +i* -0.654825| 1|-1.78253E-13 +i* 5.35631E-14| +| 7| -0.909652 +i* 0.415372| 1|-2.24577E-14 +i*-2.99309E-14| +| 8| 0.989828 +i* -0.142268| 1|-4.88647E-13 +i* 2.69096E-13| +| 9| -0.989815 +i* -0.142361| 1| 4.10505E-14 +i* 1.22957E-14| +| 10| 0.909612 +i* 0.415458| 1|-9.85774E-14 +i* 2.25852E-13| +| 11| -0.755719 +i* -0.654896| 1|-4.50195E-14 +i* 3.70867E-14| +| 12| 0.540548 +i* 0.841313| 1| 1.15279E-13 +i*-6.26114E-14| +| 13| -0.281687 +i* -0.959506| 1| 6.72067E-14 +i*-1.86153E-14| +| 14|-0.000109955 +i* 1| 1| 1.76109E-14 +i* 5.4734E-14| +| 15| 0.281838 +i* -0.959462| 1|-5.44356E-14 +i* 4.87822E-14| +| 16| -0.540733 +i* 0.841194| 1| 1.93526E-14 +i* 3.41446E-14| +| 17| 0.755822 +i* -0.654778| 1| 1.41439E-13 +i* 1.77344E-13| +| 18| -0.909678 +i* 0.415315| 1| 3.90799E-14 +i* 2.50217E-14| +| 19| 0.989837 +i* -0.142206| 1| 1.87558E-13 +i*-4.17969E-13| +| 20| -0.989806 +i* -0.142424| 1|-4.45512E-14 +i*-1.49828E-14| ++---+----------------------------+------------+----------------------------+ +100000 racines de module = 1 +zone limite de 'log-exp' 1.00178 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 0 (of 4) uses CUDA device 0 +gpu 3 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 2 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 2 dimgrid2 196 start 100096 size 50048 +gpu 3 dimgrid2 196 start 150144 size 50048 +gpu 0 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 0 dimgrid2 196 start 0 size 50048 +gpu 1 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 1 dimgrid2 196 start 50048 size 50048 +gpu 0 iter : 1 Arret : 1.19072E-05 s/iter 2.455829 +gpu 0 iter : 2 Arret : 1.33377E-05 s/iter 2.452256 +gpu 0 iter : 3 Arret : 1.13632E-05 s/iter 2.452478 +gpu 0 iter : 4 Arret : 1.14039E-05 s/iter 2.452299 +gpu 0 iter : 5 Arret : 1.16344E-05 s/iter 2.452382 +gpu 0 iter : 6 Arret : 1.20661E-05 s/iter 2.452428 +gpu 0 iter : 7 Arret : 1.30094E-05 s/iter 2.452394 +gpu 0 iter : 8 Arret : 1.57289E-05 s/iter 2.452343 +gpu 0 iter : 9 Arret : 2.8627E-05 s/iter 2.452360 +gpu 0 iter : 10 Arret : 0.00054461 s/iter 2.452022 +gpu 0 iter : 11 Arret : 0.00145338 s/iter 2.452426 +gpu 0 iter : 12 Arret : 1.79253 s/iter 2.452107 +gpu 0 iter : 13 Arret : 0.533977 s/iter 2.452143 +gpu 0 iter : 14 Arret : 0.699076 s/iter 4.765744 +gpu 0 iter : 15 Arret : 0.0709274 s/iter 4.775254 +gpu 0 iter : 16 Arret : 0.0253286 s/iter 4.767205 +gpu 0 iter : 17 Arret : 0.00881713 s/iter 2.437767 +gpu 0 iter : 18 Arret : 0.00533107 s/iter 2.428440 +gpu 0 iter : 19 Arret : 0.00743265 s/iter 4.249640 +gpu 0 iter : 20 Arret : 0.000698696 s/iter 2.420553 +gpu 0 iter : 21 Arret : 0.000259303 s/iter 2.411812 +gpu 0 iter : 22 Arret : 0.000648656 s/iter 2.410234 +gpu 0 iter : 23 Arret : 0.00196532 s/iter 2.410082 +gpu 0 iter : 24 Arret : 0.000107854 s/iter 2.410295 +gpu 0 iter : 25 Arret : 4.09677E-05 s/iter 2.410995 +gpu 0 iter : 26 Arret : 5.37573E-06 s/iter 2.409992 +gpu 0 iter : 27 Arret : 1.62125E-08 s/iter 2.410152 +gpu 0 iter : 28 Arret : 1.42574E-13 s/iter 2.410051 +temps : 78.4901 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.64385E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540465 +i* 0.841367| 1| 1.87479E-13 +i*-5.02237E-14| +| 2| 0.176081 +i* -0.984376| 1|-5.37799E-14 +i* 6.92554E-14| +| 3| -0.852009 +i* -0.523527| 1| 3.18461E-14 +i* 4.03913E-14| +| 4| -0.79862 +i* 0.601836| 1| 5.14346E-14 +i* 3.91354E-14| +| 5| 0.980657 +i* -0.195736| 1| 6.46188E-13 +i*-7.37166E-13| +| 6| 0.268452 +i* 0.963293| 1|-8.54421E-14 +i* 3.23248E-14| +| 7| 0.458412 +i* -0.88874| 1| 2.7818E-14 +i* 6.11247E-14| +| 8| -0.659841 +i* -0.751405| 1|-6.41605E-14 +i*-6.23928E-14| +| 9| 0.994783 +i* 0.102018| 1| 6.80962E-13 +i*-1.84925E-12| +| 10| -0.940535 +i* 0.339697| 1| 2.92266E-14 +i* 1.23877E-14| +| 11| -0.0274147 +i* 0.999624| 1|-2.15418E-14 +i* -6.3281E-14| +| 12| 0.70001 +i* -0.714133| 1| 5.4335E-14 +i* -1.5535E-13| +| 13| 0.920515 +i* 0.390707| 1|-2.49037E-13 +i*-1.72111E-13| +| 14| -0.409041 +i* -0.912516| 1|-2.16806E-14 +i*-1.57877E-14| +| 15| -0.998877 +i* 0.047373| 1|-3.52392E-14 +i*-1.99354E-14| +| 16| -0.320845 +i* 0.947132| 1| 1.35437E-13 +i* 4.41019E-14| +| 17| 0.764454 +i* 0.644679| 1|-2.19425E-13 +i* -1.9223E-13| +| 18| 0.879407 +i* -0.47607| 1| 3.13968E-13 +i*-3.31275E-13| +| 19| -0.121864 +i* -0.992547| 1| 1.45647E-13 +i* 1.68268E-16| +| 20| -0.968462 +i* -0.24916| 1| 5.32629E-14 +i* 1.07952E-14| ++---+----------------------------+------------+----------------------------+ +200000 racines de module = 1 +zone limite de 'log-exp' 1.00089 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 1 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 0 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 0 dimgrid2 391 start 0 size 100032 +gpu 1 dimgrid2 391 start 100032 size 100032 +gpu 3 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 3 dimgrid2 391 start 300096 size 100032 +gpu 2 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 2 dimgrid2 391 start 200064 size 100032 +gpu 0 iter : 1 Arret : 6.83308E-06 s/iter 8.687673 +gpu 0 iter : 2 Arret : 6.78936E-06 s/iter 8.662570 +gpu 0 iter : 3 Arret : 7.21603E-06 s/iter 8.680443 +gpu 0 iter : 4 Arret : 6.21887E-06 s/iter 8.660300 +gpu 0 iter : 5 Arret : 6.53427E-06 s/iter 8.660436 +gpu 0 iter : 6 Arret : 5.95601E-06 s/iter 8.669060 +gpu 0 iter : 7 Arret : 5.94684E-06 s/iter 8.673572 +gpu 0 iter : 8 Arret : 6.66715E-06 s/iter 8.679665 +gpu 0 iter : 9 Arret : 7.17748E-06 s/iter 8.664571 +gpu 0 iter : 10 Arret : 2.83521E-05 s/iter 8.686351 +gpu 0 iter : 11 Arret : 0.00172795 s/iter 8.683895 +gpu 0 iter : 12 Arret : 0.00549103 s/iter 12.889374 +gpu 0 iter : 13 Arret : 0.00456576 s/iter 10.269934 +gpu 0 iter : 14 Arret : 0.00289852 s/iter 9.402838 +gpu 0 iter : 15 Arret : 0.0438506 s/iter 12.988912 +gpu 0 iter : 16 Arret : 3.77879 s/iter 13.166240 +gpu 0 iter : 17 Arret : 2.10534 s/iter 8.617782 +gpu 0 iter : 18 Arret : 0.796087 s/iter 10.512729 +gpu 0 iter : 19 Arret : 0.311035 s/iter 8.624823 +gpu 0 iter : 20 Arret : 0.109701 s/iter 9.275524 +gpu 0 iter : 21 Arret : 0.0600409 s/iter 9.244258 +gpu 0 iter : 22 Arret : 0.0384709 s/iter 13.193445 +gpu 0 iter : 23 Arret : 0.0257604 s/iter 12.886058 +gpu 0 iter : 24 Arret : 0.115342 s/iter 11.285456 +gpu 0 iter : 25 Arret : 0.158851 s/iter 13.051696 +gpu 0 iter : 26 Arret : 0.361498 s/iter 11.279780 +gpu 0 iter : 27 Arret : 0.673522 s/iter 11.353180 +gpu 0 iter : 28 Arret : 0.0406058 s/iter 13.868227 +gpu 0 iter : 29 Arret : 0.016774 s/iter 13.878938 +gpu 0 iter : 30 Arret : 0.0124111 s/iter 14.114049 +gpu 0 iter : 31 Arret : 0.00546513 s/iter 13.998499 +gpu 0 iter : 32 Arret : 0.000358108 s/iter 8.577800 +gpu 0 iter : 33 Arret : 6.85612E-05 s/iter 8.572216 +gpu 0 iter : 34 Arret : 0.00100594 s/iter 8.603434 +gpu 0 iter : 35 Arret : 0.000298069 s/iter 8.578157 +gpu 0 iter : 36 Arret : 2.04019E-05 s/iter 8.587649 +gpu 0 iter : 37 Arret : 2.48589E-06 s/iter 8.588165 +gpu 0 iter : 38 Arret : 3.21069E-08 s/iter 8.581318 +gpu 0 iter : 39 Arret : 1.30873E-13 s/iter 8.589365 +temps : 399.7 seconde(s) +Nb iterations : 39 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.12993E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540383 +i* 0.841419| 1| 1.25143E-14 +i* 6.97793E-14| +| 2| -0.98885 +i* 0.148913| 1|-1.87034E-13 +i*-1.52024E-13| +| 3| 0.412505 +i* -0.910956| 1|-2.05679E-13 +i* 8.74266E-14| +| 4| 0.268615 +i* -0.963248| 1| 1.23929E-14 +i* 2.02841E-14| +| 5| -0.954531 +i* 0.298113| 1| 6.68562E-14 +i* 8.87016E-14| +| 6| 0.769081 +i* 0.639152| 1|-2.56017E-13 +i* 6.90161E-13| +| 7| 0.11843 +i* -0.992962| 1| -1.5522E-13 +i* 8.29944E-14| +| 8| -0.897838 +i* 0.440326| 1|-2.57121E-14 +i* 6.84192E-14| +| 9| 0.857632 +i* 0.514263| 1| 7.84754E-13 +i* 2.86151E-13| +| 10| -0.0345309 +i* -0.999404| 1| 3.31561E-13 +i*-9.06705E-14| +| 11| 0.662503 +i* 0.74906| 1| 7.42843E-14 +i*-6.06277E-13| +| 12| -0.820101 +i* 0.572218| 1|-4.91863E-14 +i*-2.00555E-13| +| 13| -0.186683 +i* -0.98242| 1| -1.8106E-13 +i* 3.61083E-14| +| 14| 0.926088 +i* 0.377307| 1| 6.5396E-13 +i* 7.07941E-13| +| 15| -0.723143 +i* 0.690699| 1|-1.75058E-13 +i* 1.33799E-14| +| 16| -0.334459 +i* -0.94241| 1| 2.20716E-13 +i*-8.68958E-14| +| 17| 0.97283 +i* 0.23152| 1|-1.36773E-13 +i*-4.46509E-13| +| 18| -0.609235 +i* 0.79299| 1|-8.90538E-14 +i* 1.42372E-13| +| 19| -0.474396 +i* -0.880312| 1| 2.76109E-13 +i* 7.19095E-14| +| 20| 0.99677 +i* 0.0803066| 1| 1.32664E-12 +i*-5.68624E-12| ++---+----------------------------+------------+----------------------------+ +400000 racines de module = 1 +zone limite de 'log-exp' 1.00059 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +gpu 2 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 2 dimgrid2 586 start 300032 size 150016 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 586 start 150016 size 150016 +gpu 3 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 3 dimgrid2 586 start 450048 size 150016 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 586 start 0 size 150016 +gpu 0 iter : 1 Arret : 4.50774E-06 s/iter 18.767906 +gpu 0 iter : 2 Arret : 4.46347E-06 s/iter 18.760511 +gpu 0 iter : 3 Arret : 4.08919E-06 s/iter 18.749796 +gpu 0 iter : 4 Arret : 3.95781E-06 s/iter 18.756445 +gpu 0 iter : 5 Arret : 4.12023E-06 s/iter 18.760371 +gpu 0 iter : 6 Arret : 4.06808E-06 s/iter 18.729222 +gpu 0 iter : 7 Arret : 3.99899E-06 s/iter 18.743423 +gpu 0 iter : 8 Arret : 4.31359E-06 s/iter 18.751151 +gpu 0 iter : 9 Arret : 5.21531E-06 s/iter 18.733803 +gpu 0 iter : 10 Arret : 0.000101946 s/iter 18.734289 +gpu 0 iter : 11 Arret : 0.000408516 s/iter 18.733136 +gpu 0 iter : 12 Arret : 0.000706557 s/iter 18.732114 +gpu 0 iter : 13 Arret : 2.1909 s/iter 18.757334 +gpu 0 iter : 14 Arret : 0.451216 s/iter 18.748264 +gpu 0 iter : 15 Arret : 0.339953 s/iter 26.736153 +gpu 0 iter : 16 Arret : 0.169148 s/iter 26.789207 +gpu 0 iter : 17 Arret : 0.0402512 s/iter 26.808647 +gpu 0 iter : 18 Arret : 0.0210284 s/iter 26.763957 +gpu 0 iter : 19 Arret : 0.013235 s/iter 26.768900 +gpu 0 iter : 20 Arret : 0.00905439 s/iter 26.849639 +gpu 0 iter : 21 Arret : 0.00651652 s/iter 26.787569 +gpu 0 iter : 22 Arret : 0.0209755 s/iter 26.999416 +gpu 0 iter : 23 Arret : 0.0283027 s/iter 27.203851 +gpu 0 iter : 24 Arret : 0.0246379 s/iter 26.993683 +gpu 0 iter : 25 Arret : 0.101185 s/iter 26.803558 +gpu 0 iter : 26 Arret : 0.100313 s/iter 26.842046 +gpu 0 iter : 27 Arret : 0.163719 s/iter 26.828628 +gpu 0 iter : 28 Arret : 0.0482315 s/iter 26.845110 +gpu 0 iter : 29 Arret : 0.0103223 s/iter 26.896065 +gpu 0 iter : 30 Arret : 0.00496332 s/iter 26.806043 +gpu 0 iter : 31 Arret : 0.00367192 s/iter 26.760809 +gpu 0 iter : 32 Arret : 0.00341441 s/iter 26.789298 +gpu 0 iter : 33 Arret : 0.00247026 s/iter 26.756686 +gpu 0 iter : 34 Arret : 0.00208061 s/iter 26.652171 +gpu 0 iter : 35 Arret : 0.00185636 s/iter 26.575964 +gpu 0 iter : 36 Arret : 0.00352602 s/iter 26.683145 +gpu 0 iter : 37 Arret : 0.00653739 s/iter 26.590103 +gpu 0 iter : 38 Arret : 0.00492686 s/iter 26.588605 +gpu 0 iter : 39 Arret : 0.00447252 s/iter 26.496367 +gpu 0 iter : 40 Arret : 0.000547314 s/iter 26.592548 +gpu 0 iter : 41 Arret : 0.00136209 s/iter 26.538804 +gpu 0 iter : 42 Arret : 0.00197612 s/iter 26.583277 +gpu 0 iter : 43 Arret : 0.000392726 s/iter 18.622408 +gpu 0 iter : 44 Arret : 0.00131045 s/iter 18.685108 +gpu 0 iter : 45 Arret : 0.00104061 s/iter 19.378597 +gpu 0 iter : 46 Arret : 0.000234145 s/iter 18.609701 +gpu 0 iter : 47 Arret : 4.7188E-05 s/iter 18.577615 +gpu 0 iter : 48 Arret : 5.10545E-06 s/iter 18.608929 +gpu 0 iter : 49 Arret : 3.52111E-08 s/iter 18.602465 +gpu 0 iter : 50 Arret : 1.02528E-13 s/iter 18.651905 +temps : 1163.51 seconde(s) +Nb iterations : 50 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.996672 +i* 0.0815122| 1|-4.60361E-14 +i*-1.54911E-15| +| 3| 0.396458 +i* -0.918053| 1|-3.61742E-13 +i* 4.28426E-13| +| 4| -0.983009 +i* 0.183558| 1| 2.27839E-14 +i* 1.21547E-13| +| 5| 0.299962 +i* -0.953951| 1| 3.10155E-13 +i*-4.52272E-13| +| 6| 0.701062 +i* 0.7131| 1| 6.08482E-13 +i* 3.68603E-13| +| 7| -0.958925 +i* 0.283658| 1|-3.43857E-14 +i*-4.33108E-14| +| 8| 0.200287 +i* -0.979737| 1| 4.39829E-13 +i*-3.61119E-13| +| 9| 0.770667 +i* 0.637238| 1| -2.7036E-13 +i*-8.38747E-13| +| 10| -0.924677 +i* 0.380752| 1| 1.44957E-13 +i* 1.13251E-13| +| 11| 0.0984885 +i* -0.995138| 1| 3.5235E-13 +i*-2.31698E-13| +| 12| 0.832104 +i* 0.55462| 1| 8.49546E-13 +i* -8.3842E-13| +| 13| -0.880627 +i* 0.473809| 1|-9.58227E-14 +i* -1.6529E-13| +| 14| -0.0043537 +i* -0.999991| 1| 1.63446E-13 +i*-5.45449E-14| +| 15| 0.88472 +i* 0.466123| 1| -6.8268E-13 +i* -3.8889E-13| +| 16| 0.624025 +i* 0.781404| 1| 9.47506E-15 +i*-6.78554E-13| +| 17| -0.827243 +i* 0.561844| 1|-1.79082E-13 +i*-3.05719E-13| +| 18| -0.10715 +i* -0.994243| 1| 3.32474E-13 +i*-4.57395E-14| +| 19| 0.927958 +i* 0.372686| 1| 1.0255E-13 +i* 1.0692E-13| +| 20| -0.765083 +i* 0.643932| 1| 3.06144E-14 +i*-3.59443E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +zone limite de 'log-exp' 1.00044 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 782 start 200000 size 200000 +gpu 3 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 3 dimgrid2 782 start 600000 size 200000 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 782 start 0 size 200000 +gpu 2 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 2 dimgrid2 782 start 400000 size 200000 +gpu 0 iter : 1 Arret : 2.9665E-06 s/iter 34.132954 +gpu 0 iter : 2 Arret : 2.96498E-06 s/iter 34.060373 +gpu 0 iter : 3 Arret : 2.9937E-06 s/iter 34.106618 +gpu 0 iter : 4 Arret : 2.99019E-06 s/iter 34.131529 +gpu 0 iter : 5 Arret : 2.96254E-06 s/iter 34.072428 +gpu 0 iter : 6 Arret : 2.96634E-06 s/iter 34.094938 +gpu 0 iter : 7 Arret : 2.97177E-06 s/iter 34.087606 +gpu 0 iter : 8 Arret : 3.1804E-06 s/iter 34.105421 +gpu 0 iter : 9 Arret : 3.76913E-06 s/iter 34.122970 +gpu 0 iter : 10 Arret : 6.64268E-06 s/iter 34.130380 +gpu 0 iter : 11 Arret : 0.000184943 s/iter 34.119757 +gpu 0 iter : 12 Arret : 0.00113217 s/iter 34.095463 +gpu 0 iter : 13 Arret : 0.753916 s/iter 34.085029 +gpu 0 iter : 14 Arret : 0.945227 s/iter 34.115229 +gpu 0 iter : 15 Arret : 2.42544 s/iter 34.084082 +gpu 0 iter : 16 Arret : 0.0394416 s/iter 34.026900 +gpu 0 iter : 17 Arret : 0.0115328 s/iter 33.884844 +gpu 0 iter : 18 Arret : 0.000905462 s/iter 33.872131 +gpu 0 iter : 19 Arret : 0.000346005 s/iter 33.871123 +gpu 0 iter : 20 Arret : 0.000573762 s/iter 33.849199 +gpu 0 iter : 21 Arret : 0.000415648 s/iter 33.868251 +gpu 0 iter : 22 Arret : 0.000562449 s/iter 33.882749 +gpu 0 iter : 23 Arret : 0.0012921 s/iter 33.868629 +gpu 0 iter : 24 Arret : 0.000343321 s/iter 33.877909 +gpu 0 iter : 25 Arret : 6.89541E-05 s/iter 33.851132 +gpu 0 iter : 26 Arret : 2.43828E-05 s/iter 33.849227 +gpu 0 iter : 27 Arret : 1.8909E-05 s/iter 33.872817 +gpu 0 iter : 28 Arret : 2.44076E-05 s/iter 33.860491 +gpu 0 iter : 29 Arret : 3.23083E-06 s/iter 33.868783 +gpu 0 iter : 30 Arret : 1.58E-10 s/iter 33.857784 +gpu 0 iter : 31 Arret : 3.85593E-16 s/iter 33.840967 +temps : 1055.39 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| -0.942555 +i* -0.334052| 1| 2.1929E-13 +i*-2.49686E-13| +| 3| -0.558601 +i* 0.829437| 1|-3.51628E-14 +i*-4.09232E-13| +| 4| -0.0665975 +i* -0.99778| 1|-3.91888E-13 +i* 9.06636E-14| +| 5| 0.949627 +i* -0.313383| 1|-1.12544E-12 +i* 2.13597E-12| +| 6| -0.982853 +i* -0.184391| 1| 8.57613E-14 +i* 1.33506E-13| +| 7| 0.889798 +i* -0.456354| 1| 1.27488E-12 +i* 5.17779E-13| +| 8| -0.423729 +i* 0.905789| 1|-7.25461E-15 +i*-1.33088E-14| +| 9| -0.219973 +i* -0.975506| 1| 4.34097E-13 +i*-4.24712E-14| +| 10| 0.771464 +i* 0.636273| 1| -4.4266E-13 +i*-2.07773E-13| +| 11| -0.999541 +i* -0.0303078| 1| 3.54265E-14 +i* 1.32862E-14| +| 12| 0.808597 +i* -0.588363| 1|-5.90212E-13 +i*-1.43182E-12| +| 13| 0.663883 +i* 0.747836| 1| 4.13159E-13 +i* 1.10149E-12| +| 14| -0.27868 +i* 0.960384| 1|-1.03539E-13 +i*-1.45998E-13| +| 15| -0.368064 +i* -0.929801| 1| 4.60916E-14 +i*-1.09841E-13| +| 16| -0.992219 +i* 0.124503| 1| 2.74294E-13 +i* 2.11383E-13| +| 17| 0.707973 +i* -0.706239| 1|-1.10575E-12 +i*-7.41631E-13| +| 18| 0.860514 +i* 0.509426| 1| 9.86579E-13 +i* 1.10532E-12| +| 19| -0.126936 +i* 0.991911| 1| 1.67744E-13 +i* 5.51772E-13| +| 20| -0.507314 +i* -0.861761| 1| 5.50185E-14 +i* 3.42273E-13| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 +zone limite de 'log-exp' 1.00035 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 0 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 0 dimgrid2 977 start 0 size 250048 +gpu 2 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 2 dimgrid2 977 start 500096 size 250048 +gpu 3 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 3 dimgrid2 977 start 750144 size 250048 +gpu 1 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 1 dimgrid2 977 start 250048 size 250048 +gpu 0 iter : 1 Arret : 2.88781E-06 s/iter 52.567689 +gpu 0 iter : 2 Arret : 2.48174E-06 s/iter 52.412927 +gpu 0 iter : 3 Arret : 2.37734E-06 s/iter 52.445779 +gpu 0 iter : 4 Arret : 2.38169E-06 s/iter 52.428480 +gpu 0 iter : 5 Arret : 2.38448E-06 s/iter 52.401350 +gpu 0 iter : 6 Arret : 2.9427E-06 s/iter 52.358266 +gpu 0 iter : 7 Arret : 2.4276E-06 s/iter 52.420365 +gpu 0 iter : 8 Arret : 2.576E-06 s/iter 52.397873 +gpu 0 iter : 9 Arret : 2.95754E-06 s/iter 52.438769 +gpu 0 iter : 10 Arret : 4.376E-06 s/iter 52.429890 +gpu 0 iter : 11 Arret : 0.000112761 s/iter 52.466360 +gpu 0 iter : 12 Arret : 0.00014018 s/iter 52.402254 +gpu 0 iter : 13 Arret : 0.00011586 s/iter 52.424902 +gpu 0 iter : 14 Arret : 0.00133799 s/iter 52.444410 +gpu 0 iter : 15 Arret : 1.4567 s/iter 54.393527 +gpu 0 iter : 16 Arret : 0.157126 s/iter 54.676459 +gpu 0 iter : 17 Arret : 0.0769879 s/iter 54.372305 +gpu 0 iter : 18 Arret : 0.047361 s/iter 66.600120 +gpu 0 iter : 19 Arret : 0.0316599 s/iter 56.256144 +gpu 0 iter : 20 Arret : 0.0224311 s/iter 58.438101 +gpu 0 iter : 21 Arret : 0.0165373 s/iter 61.741227 +gpu 0 iter : 22 Arret : 0.401359 s/iter 56.531585 +gpu 0 iter : 23 Arret : 0.328672 s/iter 55.269982 +gpu 0 iter : 24 Arret : 0.202796 s/iter 55.021521 +gpu 0 iter : 25 Arret : 0.104584 s/iter 54.616326 +gpu 0 iter : 26 Arret : 0.0261205 s/iter 66.413122 +gpu 0 iter : 27 Arret : 0.0245485 s/iter 52.868792 +gpu 0 iter : 28 Arret : 0.0278169 s/iter 56.569999 +gpu 0 iter : 29 Arret : 0.00143344 s/iter 52.689834 +gpu 0 iter : 30 Arret : 0.00133282 s/iter 52.767469 +gpu 0 iter : 31 Arret : 0.00056116 s/iter 52.674243 +gpu 0 iter : 32 Arret : 0.00122145 s/iter 52.782739 +gpu 0 iter : 33 Arret : 0.00499332 s/iter 52.888671 +gpu 0 iter : 34 Arret : 8.64873E-05 s/iter 52.819841 +gpu 0 iter : 35 Arret : 3.87016E-05 s/iter 52.893826 +gpu 0 iter : 36 Arret : 0.000101821 s/iter 52.680312 +gpu 0 iter : 37 Arret : 0.00108852 s/iter 52.667928 +gpu 0 iter : 38 Arret : 0.00150801 s/iter 52.688010 +gpu 0 iter : 39 Arret : 0.000162458 s/iter 52.662407 +gpu 0 iter : 40 Arret : 4.74398E-05 s/iter 52.683807 +gpu 0 iter : 41 Arret : 2.2996E-05 s/iter 52.734431 +gpu 0 iter : 42 Arret : 1.52502E-05 s/iter 52.717114 +gpu 0 iter : 43 Arret : 5.47596E-06 s/iter 52.767661 +gpu 0 iter : 44 Arret : 7.00943E-07 s/iter 52.627015 +gpu 0 iter : 45 Arret : 3.22655E-09 s/iter 52.686211 +gpu 0 iter : 46 Arret : 5.38916E-15 s/iter 52.697776 +temps : 2489.06 seconde(s) +Nb iterations : 46 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.80137E-07 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54034 +i* 0.841447| 1| 4.08253E-13 +i*-6.65317E-13| +| 2| -0.513915 +i* -0.857841| 1|-9.07486E-13 +i* 1.86417E-13| +| 3| 0.486982 +i* 0.873412| 1|-6.63601E-14 +i*-1.18344E-12| +| 4| -0.459589 +i* -0.888132| 1|-5.16153E-13 +i*-2.68006E-13| +| 5| 0.43174 +i* 0.901998| 1|-6.77361E-13 +i* 7.93272E-13| +| 6| -0.40348 +i* -0.914989| 1|-3.45956E-13 +i*-2.59726E-13| +| 7| 0.374828 +i* 0.927094| 1| 3.65041E-13 +i* 3.54812E-13| +| 8| -0.345815 +i* -0.938303| 1| 5.50778E-13 +i* 8.9059E-14| +| 9| 0.316466 +i* 0.948604| 1|-2.87419E-13 +i* 5.21678E-13| +| 10| -0.286812 +i* -0.957987| 1| 6.43516E-13 +i* 2.73696E-13| +| 11| 0.25688 +i* 0.966443| 1|-4.31814E-13 +i* 5.6624E-13| +| 12| -0.226699 +i* -0.973965| 1| 4.35089E-13 +i* -6.6197E-14| +| 13| 0.196299 +i* 0.980544| 1| 3.90278E-14 +i*-7.14062E-13| +| 14| -0.165685 +i* -0.986179| 1| 7.63278E-16 +i*-3.73816E-14| +| 15| 0.13496 +i* 0.990851| 1| 1.03566E-13 +i*-6.61428E-13| +| 16| -0.104079 +i* -0.994569| 1| 7.90108E-13 +i*-1.74942E-13| +| 17| 0.0730977 +i* 0.997325| 1| 1.11931E-13 +i* 4.68587E-13| +| 18| -0.0420456 +i* -0.999116| 1| 2.29268E-13 +i*-1.21795E-14| +| 19| 0.0109529 +i* 0.99994| 1|-2.47309E-13 +i*-7.90307E-13| +| 20| 0.0201504 +i* -0.999797| 1| 6.69503E-13 +i*-2.16847E-13| ++---+----------------------------+------------+----------------------------+ +1000000 racines de module = 1 +zone limite de 'log-exp' 1.0003 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 2 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 2 dimgrid2 1172 start 600064 size 300032 +gpu 0 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 0 dimgrid2 1172 start 0 size 300032 +gpu 3 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 3 dimgrid2 1172 start 900096 size 300032 +gpu 1 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 1 dimgrid2 1172 start 300032 size 300032 +gpu 0 iter : 1 Arret : 2.42652E-06 s/iter 74.617749 +gpu 0 iter : 2 Arret : 2.49614E-06 s/iter 74.548310 +gpu 0 iter : 3 Arret : 2.21192E-06 s/iter 74.556230 +gpu 0 iter : 4 Arret : 2.11473E-06 s/iter 74.504423 +gpu 0 iter : 5 Arret : 2.29716E-06 s/iter 74.525347 +gpu 0 iter : 6 Arret : 2.20002E-06 s/iter 74.448738 +gpu 0 iter : 7 Arret : 2.19767E-06 s/iter 74.591557 +gpu 0 iter : 8 Arret : 2.319E-06 s/iter 74.518969 +gpu 0 iter : 9 Arret : 2.33977E-06 s/iter 74.417513 +gpu 0 iter : 10 Arret : 3.18561E-06 s/iter 74.428935 +gpu 0 iter : 11 Arret : 2.39196E-05 s/iter 74.427517 +gpu 0 iter : 12 Arret : 0.000318633 s/iter 74.433069 +gpu 0 iter : 13 Arret : 0.00154086 s/iter 74.779282 +gpu 0 iter : 14 Arret : 0.000824248 s/iter 74.717977 +gpu 0 iter : 15 Arret : 0.000938617 s/iter 74.750958 +gpu 0 iter : 16 Arret : 0.00924203 s/iter 74.495587 +gpu 0 iter : 17 Arret : 1.22373 s/iter 89.902699 +gpu 0 iter : 18 Arret : 0.0309579 s/iter 89.741584 +gpu 0 iter : 19 Arret : 0.0522422 s/iter 89.331794 +gpu 0 iter : 20 Arret : 0.0374635 s/iter 89.988148 +gpu 0 iter : 21 Arret : 0.0161203 s/iter 93.229079 +gpu 0 iter : 22 Arret : 0.0347427 s/iter 92.221499 +gpu 0 iter : 23 Arret : 0.0641293 s/iter 93.761623 +gpu 0 iter : 24 Arret : 0.0357214 s/iter 93.514989 +gpu 0 iter : 25 Arret : 0.207308 s/iter 94.107114 +gpu 0 iter : 26 Arret : 0.125661 s/iter 92.472778 +gpu 0 iter : 27 Arret : 0.0748459 s/iter 90.193087 +gpu 0 iter : 28 Arret : 0.0395315 s/iter 91.296280 +gpu 0 iter : 29 Arret : 0.0352008 s/iter 87.646913 +gpu 0 iter : 30 Arret : 0.0383622 s/iter 74.418177 +gpu 0 iter : 31 Arret : 0.0225754 s/iter 74.526286 +gpu 0 iter : 32 Arret : 0.000665957 s/iter 74.146229 +gpu 0 iter : 33 Arret : 1.74739E-05 s/iter 74.377078 +gpu 0 iter : 34 Arret : 8.8614E-06 s/iter 74.306201 +gpu 0 iter : 35 Arret : 6.22465E-06 s/iter 74.346563 +gpu 0 iter : 36 Arret : 1.54539E-05 s/iter 74.268334 +gpu 0 iter : 37 Arret : 1.99901E-05 s/iter 74.305788 +gpu 0 iter : 38 Arret : 2.01663E-06 s/iter 74.513999 +gpu 0 iter : 39 Arret : 2.0507E-07 s/iter 74.179158 +gpu 0 iter : 40 Arret : 3.39098E-11 s/iter 74.283612 +gpu 0 iter : 41 Arret : 1.57009E-16 s/iter 74.098952 +temps : 3274.17 seconde(s) +Nb iterations : 41 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.34152E-07 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.841451| 1|-1.40868E-12 +i*-1.55069E-13| +| 2| -0.583871 +i* 0.811846| 1| 5.87586E-14 +i* 2.63177E-13| +| 3| 0.0263196 +i* -0.999654| 1| 9.89594E-13 +i*-3.85265E-13| +| 4| -0.969647 +i* -0.244511| 1|-5.84047E-14 +i*-6.69829E-14| +| 5| 0.939323 +i* -0.343035| 1| 7.60725E-13 +i* 1.68227E-12| +| 6| -0.129097 +i* -0.991632| 1| -2.278E-13 +i*-2.09967E-13| +| 7| -0.450842 +i* 0.892604| 1| 3.34819E-13 +i* 5.30987E-13| +| 8| 0.874726 +i* -0.484618| 1| 6.94573E-13 +i* 1.33379E-12| +| 9| -0.995841 +i* -0.0911079| 1| 6.65572E-13 +i* 2.21578E-13| +| 10| 0.772266 +i* 0.635299| 1|-1.10511E-12 +i*-6.88458E-13| +| 11| -0.281387 +i* -0.959594| 1|-6.93022E-14 +i* 4.40275E-13| +| 12| -0.306893 +i* 0.951744| 1| 1.0443E-15 +i* 1.24753E-13| +| 13| 0.788944 +i* -0.614465| 1| -2.2269E-12 +i*-9.13604E-13| +| 14| -0.997918 +i* 0.0645018| 1| 2.81913E-13 +i* 2.2426E-13| +| 15| 0.861482 +i* 0.507788| 1| 2.41178E-12 +i* 5.79845E-13| +| 16| -0.426862 +i* -0.904317| 1| 6.20323E-13 +i* 5.74424E-13| +| 17| 0.664347 +i* 0.747424| 1| 4.99219E-13 +i* 1.52752E-12| +| 18| -0.155512 +i* 0.987834| 1| 2.30305E-13 +i* 4.37822E-13| +| 19| -0.975826 +i* 0.218549| 1| 1.82913E-13 +i* 5.28258E-14| +| 20| 0.684055 +i* -0.72943| 1|-1.32506E-12 +i*-1.70394E-12| ++---+----------------------------+------------+----------------------------+ +1200000 racines de module = 1 +zone limite de 'log-exp' 1.00025 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 0 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 0 dimgrid2 1368 start 0 size 350016 +gpu 1 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 1 dimgrid2 1368 start 350016 size 350016 +gpu 3 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 3 dimgrid2 1368 start 1050048 size 350016 +gpu 2 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 2 dimgrid2 1368 start 700032 size 350016 +gpu 0 iter : 1 Arret : 2.03238E-06 s/iter 101.212949 +gpu 0 iter : 2 Arret : 1.8928E-06 s/iter 101.009938 +gpu 0 iter : 3 Arret : 1.76076E-06 s/iter 101.081176 +gpu 0 iter : 4 Arret : 1.69968E-06 s/iter 100.980005 +gpu 0 iter : 5 Arret : 2.05399E-06 s/iter 101.013322 +gpu 0 iter : 6 Arret : 1.85778E-06 s/iter 100.874154 +gpu 0 iter : 7 Arret : 1.7351E-06 s/iter 101.028880 +gpu 0 iter : 8 Arret : 1.82753E-06 s/iter 101.353518 +gpu 0 iter : 9 Arret : 1.78381E-06 s/iter 101.161489 +gpu 0 iter : 10 Arret : 1.95163E-06 s/iter 101.020805 +gpu 0 iter : 11 Arret : 1.11498E-05 s/iter 100.910293 +gpu 0 iter : 12 Arret : 0.000267342 s/iter 101.117136 +gpu 0 iter : 13 Arret : 0.000448589 s/iter 101.072866 +gpu 0 iter : 14 Arret : 0.00117343 s/iter 102.399232 +gpu 0 iter : 15 Arret : 0.0025383 s/iter 101.619405 +gpu 0 iter : 16 Arret : 0.0127207 s/iter 101.389072 +gpu 0 iter : 17 Arret : 0.00589486 s/iter 120.753705 +gpu 0 iter : 18 Arret : 0.00398562 s/iter 114.216025 +gpu 0 iter : 19 Arret : 0.00872604 s/iter 120.471159 +gpu 0 iter : 20 Arret : 0.0658269 s/iter 121.374423 +gpu 0 iter : 21 Arret : 0.643107 s/iter 120.581728 +gpu 0 iter : 22 Arret : 0.0256024 s/iter 101.540440 +gpu 0 iter : 23 Arret : 0.00590733 s/iter 101.350206 +gpu 0 iter : 24 Arret : 0.00290093 s/iter 102.021897 +gpu 0 iter : 25 Arret : 0.000722765 s/iter 102.009174 +gpu 0 iter : 26 Arret : 0.000172667 s/iter 100.437242 +gpu 0 iter : 27 Arret : 9.4954E-05 s/iter 100.408854 +gpu 0 iter : 28 Arret : 0.000102556 s/iter 100.581581 +gpu 0 iter : 29 Arret : 5.13171E-06 s/iter 100.431024 +gpu 0 iter : 30 Arret : 1.97065E-06 s/iter 100.464145 +gpu 0 iter : 31 Arret : 4.62246E-08 s/iter 100.685343 +gpu 0 iter : 32 Arret : 6.27512E-14 s/iter 100.695274 +temps : 3329.48 seconde(s) +Nb iterations : 32 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.63785E-07 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540329 +i* 0.841454| 1| 4.3987E-13 +i* 1.7418E-12| +| 2| -0.0530086 +i* 0.998594| 1| 3.8728E-13 +i* 8.41422E-13| +| 3| -0.626376 +i* 0.779521| 1| 2.93654E-14 +i*-2.95439E-13| +| 4| -0.96376 +i* 0.26677| 1|-1.31943E-13 +i* 5.03167E-13| +| 5| -0.938055 +i* -0.346485| 1| 6.12451E-13 +i*-2.34033E-13| +| 6| -0.558945 +i* -0.829205| 1| 2.12923E-13 +i* 6.04209E-13| +| 7| 0.0307435 +i* -0.999527| 1|-3.70079E-13 +i* 1.04685E-13| +| 8| 0.60885 +i* -0.793286| 1| -1.5142E-12 +i* 2.45191E-13| +| 9| 0.957578 +i* -0.288175| 1|-3.17266E-12 +i* 2.02057E-12| +| 10| 0.945542 +i* 0.325501| 1|-1.50276E-12 +i* 3.84538E-13| +| 11| -0.00847209 +i* 0.999964| 1| 8.68958E-14 +i* 2.94643E-13| +| 12| -0.591029 +i* 0.80665| 1|-5.75824E-14 +i*-8.87086E-13| +| 13| -0.95092 +i* 0.309437| 1|-6.93591E-13 +i*-5.52411E-13| +| 14| -0.952559 +i* -0.304354| 1|-3.04982E-13 +i* 1.60452E-13| +| 15| -0.595328 +i* -0.803482| 1|-1.05039E-12 +i* 2.37501E-13| +| 16| -0.0138125 +i* -0.999905| 1|-8.72476E-13 +i* 2.69644E-13| +| 17| 0.572907 +i* -0.81962| 1| 1.32405E-12 +i*-6.73803E-13| +| 18| 0.94379 +i* -0.330546| 1|-1.85401E-12 +i* 2.58533E-12| +| 19| 0.959103 +i* 0.283057| 1|-2.75633E-12 +i* 3.49955E-12| +| 20| 0.613081 +i* 0.79002| 1| 4.49453E-13 +i*-4.47541E-14| ++---+----------------------------+------------+----------------------------+ +1400000 racines de module = 1 diff --git a/Simulations/mpi.txt b/Simulations/mpi.txt new file mode 100644 index 0000000..dbc59a1 --- /dev/null +++ b/Simulations/mpi.txt @@ -0,0 +1,9 @@ +#degre S1GPU S2GPU S3GPU 4SGPU F1GPU F2GPU F3GPU F4GPU +100000 16.1017 8.65634 7.13273 4.60588 59.5799 49.9266 42.0352 27.6039 +200000 63.5651 40.9684 39.5342 21.5922 260.107 131.492 96.864 77.3108 +400000 452.145 122.138 81.0542 63.5457 1340.32 693.598 560.426 376.869 +600000 646.009 297.134 193.628 153.471 3024.78 1792.33 2990.26 1130.49 +800000 1656.28 746.426 545.367 282.444 4178.79 2067.97 1385.04 1066.62 +1000000 3173.19 812.655 542.745 440.06 8448.53 4481.5 2970.64 2532.79 +1200000 3906.03 1647.22 1617.65 1762.58 10029.1 6131.73 4497 3118.23 +1400000 3229.79 1991.85 1707.73 1478.01 13710 6283.33 4390.32 3281.76 diff --git a/Simulations/mpivsomp.txt b/Simulations/mpivsomp.txt new file mode 100644 index 0000000..45b7a6a --- /dev/null +++ b/Simulations/mpivsomp.txt @@ -0,0 +1,5 @@ +#NB SMPI200K SMPI800K SMPI1.4M SOMP200K SOMP800K SOMP1.4M FMPI200K FMPI800K FMPI1.4M FOMP200K FOMP800K FOMP1.4M +1 63.5651 1656.28 3229.79 70.1186 1180.82 3523.14 260.107 4178.79 13710 260.63 3918.85 14056.1 +2 40.9684 746.426 1991.85 35.62 576.437 2371.12 131.492 2067.97 6283.33 136.465 2056.91 6757.87 +3 39.5342 545.367 1707.73 37.8394 351.42 1786.83 96.864 1385.04 4390.32 97.9976 1397.8 4453.8 +4 21.5922 282.444 1478.01 22.9576 258.82 1704.89 77.3108 1066.62 3281.76 78.4901 1055.39 3329.48 diff --git a/Simulations/omp.txt b/Simulations/omp.txt new file mode 100644 index 0000000..f22b3ab --- /dev/null +++ b/Simulations/omp.txt @@ -0,0 +1,9 @@ +#degre S1GPU S2GPU S3GPU 4SGPU F1GPU F2GPU F3GPU F4GPU +100000 16.1926 9.12342 8.00955 5.86914 59.4099 48.6545 43.054 27.3746 +200000 70.1186 35.62 37.8394 22.9576 260.63 136.465 97.9976 78.4901 +400000 248.893 122.327 86.1208 68.0633 1320.13 716.812 547.721 399.7 +600000 589.718 297.898 202.419 154.313 3245.93 1678.41 3012.17 1163.51 +800000 1180.82 576.437 351.42 258.82 3918.85 2056.91 1397.8 1055.39 +1000000 1621.79 850.208 598.968 422.324 8646.97 4455.65 3027.59 2489.06 +1200000 4148.3 1631.66 2056.31 1556.58 11218.8 5498.65 3971.4 3274.17 +1400000 3523.14 2371.12 1786.83 1704.89 14056.1 6757.87 4453.8 3329.48 diff --git a/Simulations/sparse_mpi/sparse_mpi_1GPU.o140032 b/Simulations/sparse_mpi/sparse_mpi_1GPU.o140032 new file mode 100644 index 0000000..42d7416 --- /dev/null +++ b/Simulations/sparse_mpi/sparse_mpi_1GPU.o140032 @@ -0,0 +1,642 @@ +REMAINING: 1 +Taking GPU #3 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^40000 + (-10 +i*0)*x^60000 + (1 +i*0)*x^100000 + +(-4000 +i*0)*x^39999 + (-600000 +i*0)*x^59999 + (100000 +i*0)*x^99999 + +zone limite de 'log-exp' 1.00356 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 0, start 0 size 100096 +proc 0 start 0 size 100096 +iter : 1 Arret : 0.00679606 s/iter 0.774483 +iter : 2 Arret : 0.0240773 s/iter 0.852783 +iter : 3 Arret : 0.0190607 s/iter 0.841876 +iter : 4 Arret : 0.00753578 s/iter 0.774557 +iter : 5 Arret : 0.0903866 s/iter 0.774496 +iter : 6 Arret : 0.0766923 s/iter 0.843947 +iter : 7 Arret : 0.0135773 s/iter 0.851241 +iter : 8 Arret : 0.00988122 s/iter 0.846496 +iter : 9 Arret : 0.00740796 s/iter 0.842720 +iter : 10 Arret : 0.00490463 s/iter 0.774748 +iter : 11 Arret : 0.00478656 s/iter 0.774554 +iter : 12 Arret : 0.00116597 s/iter 0.774390 +iter : 13 Arret : 0.000965078 s/iter 0.774238 +iter : 14 Arret : 0.000208722 s/iter 0.774212 +iter : 15 Arret : 0.00022059 s/iter 0.774088 +iter : 16 Arret : 2.47061E-05 s/iter 0.774123 +iter : 17 Arret : 2.20962E-07 s/iter 0.774117 +iter : 18 Arret : 7.04174E-10 s/iter 0.774131 +iter : 19 Arret : 2.22676E-12 s/iter 0.773993 +iter : 20 Arret : 7.50806E-15 s/iter 0.774073 +temps : 16.1017 seconde(s) +Nb iterations : 20 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.61117E-09 +Stabilite : 7.50806E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540308 +i* 0.841422| 0.999962|-1.95866E-12 +i*-4.55465E-13| +| 2| -0.113164 +i* 0.993538| 0.999962|-4.34919E-12 +i* 9.60242E-13| +| 3| -0.226711 +i* -0.973923| 0.999962|-4.27658E-13 +i* 6.01027E-13| +| 4| -0.715763 +i* 0.698289| 0.999962| 9.11271E-13 +i* 2.47219E-12| +| 5| 0.439922 +i* -0.897993| 0.999962|-3.49498E-13 +i* 1.66432E-12| +| 6| -0.996021 +i* 0.0886823| 0.999962| 2.0266E-12 +i*-2.01894E-13| +| 7| 0.908546 +i* -0.417692| 0.999962| 4.78506E-13 +i* 1.54377E-13| +| 8| -0.827813 +i* -0.560935| 0.999962| 9.76996E-13 +i*-2.04309E-12| +| 9| 0.968049 +i* 0.250607| 0.999962|-1.07025E-13 +i*-1.15224E-12| +| 10| -0.286815 +i* -0.957946| 0.999962|-6.55254E-13 +i* 1.20869E-12| +| 11| 0.591653 +i* 0.806145| 0.999962|-9.87654E-13 +i*-3.03635E-12| +| 12| -0.0511836 +i* 0.998651| 0.999962|-2.22622E-12 +i*-3.69013E-14| +| 13| -0.67097 +i* 0.741432| 0.999962|-8.03801E-14 +i*-1.68204E-12| +| 14| 0.383249 +i* -0.923603| 0.999962|-1.29119E-12 +i*-1.37426E-12| +| 15| -0.988582 +i* 0.150427| 0.999962|-1.54698E-12 +i*-6.48537E-13| +| 16| 0.880824 +i* -0.473363| 0.999962| 1.58029E-12 +i*-2.34379E-12| +| 17| -0.861082 +i* -0.508391| 0.999962| 9.8066E-13 +i* 3.40478E-12| +| 18| 0.981756 +i* 0.189945| 0.999962|-9.84324E-13 +i*-1.03573E-12| +| 19| -0.345809 +i* -0.938264| 0.999962| 1.03906E-12 +i* 1.95398E-12| +| 20| 0.640621 +i* 0.767807| 0.999962|-6.98774E-13 +i* 1.13798E-12| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 0.999962 +40000 racines de module = 1.00006 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^50000 + (-10 +i*0)*x^150000 + (1 +i*0)*x^200000 + +(-5000 +i*0)*x^49999 + (-1.5E+06 +i*0)*x^149999 + (200000 +i*0)*x^199999 + +zone limite de 'log-exp' 1.00178 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 0, start 0 size 200192 +proc 0 start 0 size 200192 +iter : 1 Arret : 0.000149243 s/iter 3.009897 +iter : 2 Arret : 0.000107669 s/iter 3.006186 +iter : 3 Arret : 0.000104952 s/iter 3.008833 +iter : 4 Arret : 0.000608712 s/iter 3.007077 +iter : 5 Arret : 0.00102516 s/iter 3.006467 +iter : 6 Arret : 0.00265088 s/iter 3.006726 +iter : 7 Arret : 0.0373682 s/iter 3.008694 +iter : 8 Arret : 0.0563565 s/iter 3.008459 +iter : 9 Arret : 0.130843 s/iter 3.042271 +iter : 10 Arret : 0.213629 s/iter 3.036578 +iter : 11 Arret : 0.153708 s/iter 3.075704 +iter : 12 Arret : 0.0916516 s/iter 3.036504 +iter : 13 Arret : 0.0619829 s/iter 3.025077 +iter : 14 Arret : 0.0382728 s/iter 3.001649 +iter : 15 Arret : 0.0125846 s/iter 3.026965 +iter : 16 Arret : 0.00175812 s/iter 3.007895 +iter : 17 Arret : 0.000317125 s/iter 3.006004 +iter : 18 Arret : 1.05887E-05 s/iter 3.006536 +iter : 19 Arret : 5.5903E-08 s/iter 3.012414 +iter : 20 Arret : 5.55768E-12 s/iter 3.013007 +iter : 21 Arret : 5.57854E-16 s/iter 3.013024 +temps : 63.5651 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 9.52377E-08 +Stabilite : 5.57854E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540195 +i* 0.841595| 1.00005|-2.98043E-09 +i*-3.27611E-08| +| 2| -0.837195 +i* 0.546877| 0.999985| 7.09943E-12 +i* 5.1133E-12| +| 3| -0.553418 +i* -0.832885| 0.999985| -1.9722E-12 +i*-7.40397E-12| +| 4| 0.828525 +i* -0.559925| 0.999985|-4.34675E-12 +i* 1.07137E-12| +| 5| -0.819774 +i* 0.572768| 1.00005| 2.53887E-08 +i* 2.42315E-09| +| 6| -0.57917 +i* -0.815188| 0.999985|-5.13034E-12 +i*-1.52645E-12| +| 7| 0.810626 +i* -0.585537| 0.999985|-6.36846E-12 +i*-5.86797E-12| +| 8| 0.591869 +i* 0.806015| 0.999985| 1.73195E-13 +i* 8.72591E-12| +| 9| -0.801379 +i* 0.598131| 0.999985| -1.2701E-12 +i* 3.96189E-12| +| 10| -0.60436 +i* -0.796769| 1.00005|-3.33815E-08 +i* 3.89061E-08| +| 11| 0.791937 +i* -0.610578| 0.999985| 6.0707E-13 +i* 1.52922E-12| +| 12| 0.616763 +i* 0.78713| 0.999985|-4.48042E-12 +i* -2.6295E-12| +| 13| -0.782301 +i* 0.622877| 0.999985|-2.15827E-12 +i*-6.27114E-12| +| 14| -0.628985 +i* -0.777398| 0.999985|-4.05476E-12 +i*-5.17236E-12| +| 15| 0.772548 +i* -0.635029| 1.00005| 1.1634E-09 +i* 1.87351E-08| +| 16| 0.641054 +i* 0.767476| 0.999985|-3.47633E-12 +i* 1.20617E-11| +| 17| -0.762458 +i* 0.647014| 0.999985|-7.74447E-12 +i* 7.566E-12| +| 18| -0.652967 +i* -0.757366| 0.999985| 5.10392E-12 +i*-6.61069E-12| +| 19| 0.752229 +i* -0.658879| 0.999985| 1.34497E-11 +i*-6.49125E-12| +| 20| 0.664729 +i* 0.747146| 1.00005|-1.71597E-08 +i* 8.68463E-09| ++---+----------------------------+------------+----------------------------+ +50000 racines de module = 1.00005 +150000 racines de module = 0.999985 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^150000 + (-10 +i*0)*x^250000 + (1 +i*0)*x^400000 + +(-15000 +i*0)*x^149999 + (-2.5E+06 +i*0)*x^249999 + (400000 +i*0)*x^399999 + +zone limite de 'log-exp' 1.00089 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 0, start 0 size 400128 +proc 0 start 0 size 400128 +iter : 1 Arret : 0.00730522 s/iter 11.729578 +iter : 2 Arret : 8.77601 s/iter 11.759538 +iter : 3 Arret : 1.00039 s/iter 11.791553 +iter : 4 Arret : 1.66037 s/iter 11.980569 +iter : 5 Arret : 1.60415 s/iter 11.887203 +iter : 6 Arret : 1.09308 s/iter 11.903519 +iter : 7 Arret : 1.03725 s/iter 11.950159 +iter : 8 Arret : 0.785865 s/iter 12.039659 +iter : 9 Arret : 0.676674 s/iter 12.064157 +iter : 10 Arret : 0.653102 s/iter 12.043182 +iter : 11 Arret : 0.61815 s/iter 12.032295 +iter : 12 Arret : 0.572922 s/iter 11.944839 +iter : 13 Arret : 0.514395 s/iter 11.923777 +iter : 14 Arret : 0.460854 s/iter 11.923746 +iter : 15 Arret : 0.546102 s/iter 11.925322 +iter : 16 Arret : 0.44308 s/iter 11.925810 +iter : 17 Arret : 0.411387 s/iter 11.926822 +iter : 18 Arret : 0.391387 s/iter 11.925774 +iter : 19 Arret : 0.377716 s/iter 11.927355 +iter : 20 Arret : 0.368007 s/iter 11.928976 +iter : 21 Arret : 0.476382 s/iter 11.927179 +iter : 22 Arret : 0.434562 s/iter 11.925163 +iter : 23 Arret : 0.42152 s/iter 11.926021 +iter : 24 Arret : 0.423381 s/iter 11.925847 +iter : 25 Arret : 0.433232 s/iter 11.929953 +iter : 26 Arret : 0.401895 s/iter 11.931379 +iter : 27 Arret : 0.411949 s/iter 11.917976 +iter : 28 Arret : 0.186193 s/iter 11.913066 +iter : 29 Arret : 0.106074 s/iter 11.943724 +iter : 30 Arret : 0.0412794 s/iter 11.831994 +iter : 31 Arret : 0.0419846 s/iter 11.810695 +iter : 32 Arret : 0.0167499 s/iter 11.814252 +iter : 33 Arret : 0.00536444 s/iter 11.787890 +iter : 34 Arret : 0.000655097 s/iter 11.754599 +iter : 35 Arret : 3.44296E-07 s/iter 11.747199 +iter : 36 Arret : 7.50023E-10 s/iter 11.751889 +iter : 37 Arret : 1.61565E-12 s/iter 11.752682 +iter : 38 Arret : 3.38203E-15 s/iter 11.747277 +temps : 452.145 seconde(s) +Nb iterations : 38 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.49185E-08 +Stabilite : 3.38203E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540313 +i* 0.841453| 0.999991| 9.34197E-12 +i*-1.23633E-11| +| 2| -0.998329 +i* 0.057622| 0.999991| 4.43912E-12 +i* 1.27665E-12| +| 3| 0.439867 +i* -0.898052| 0.999991|-8.50653E-12 +i*-8.85586E-12| +| 4| -0.996033 +i* 0.0888768| 0.999991|-3.15592E-12 +i* 1.17456E-12| +| 5| 0.411533 +i* -0.911385| 0.999991|-2.45048E-12 +i* 4.6238E-12| +| 6| 0.59196 +i* 0.805956| 0.999991| 5.24358E-13 +i*-8.53073E-12| +| 7| -0.992759 +i* 0.120044| 0.999991| 2.58804E-12 +i* 2.47274E-12| +| 8| 0.382796 +i* -0.923823| 0.999991|-1.63092E-11 +i* 4.26312E-12| +| 9| 0.616925 +i* 0.78701| 0.999991| 4.27514E-12 +i*-1.13966E-11| +| 10| -0.98851 +i* 0.151094| 0.999991| 1.67755E-11 +i* 4.06477E-12| +| 11| 0.35366 +i* -0.935364| 0.999991|-1.92664E-11 +i* 1.19958E-11| +| 12| 0.641283 +i* 0.767292| 0.999991| 1.73468E-11 +i*-3.74729E-12| +| 13| -0.983286 +i* 0.18202| 0.999991| 3.21676E-12 +i*-9.48297E-13| +| 14| 0.324176 +i* -0.945987| 0.999991|-5.20695E-12 +i*-7.06984E-12| +| 15| 0.66503 +i* 0.746804| 0.999991| 5.74873E-13 +i* 8.53884E-12| +| 16| -0.977104 +i* 0.212717| 0.999991|-7.47291E-12 +i*-5.77033E-12| +| 17| 0.294374 +i* -0.955681| 0.999991| 1.82907E-11 +i*-2.45448E-12| +| 18| 0.688087 +i* 0.725616| 0.999991|-1.67164E-11 +i*-1.12573E-11| +| 19| -0.969965 +i* 0.243206| 0.999991| 6.88072E-12 +i* 3.20268E-13| +| 20| 0.264283 +i* -0.964436| 0.999991|-6.93356E-12 +i*-6.23118E-12| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 0.999991 +150000 racines de module = 1.00002 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^250000 + (-10 +i*0)*x^350000 + (1 +i*0)*x^600000 + +(-25000 +i*0)*x^249999 + (-3.5E+06 +i*0)*x^349999 + (600000 +i*0)*x^599999 + +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 600064 +proc 0 start 0 size 600064 +iter : 1 Arret : 0.00438586 s/iter 26.290359 +iter : 2 Arret : 0.424079 s/iter 26.667931 +iter : 3 Arret : 0.949363 s/iter 26.761853 +iter : 4 Arret : 11.5671 s/iter 26.845045 +iter : 5 Arret : 0.975219 s/iter 27.289618 +iter : 6 Arret : 9.61533 s/iter 27.433768 +iter : 7 Arret : 1.85508 s/iter 27.722970 +iter : 8 Arret : 0.857551 s/iter 27.711823 +iter : 9 Arret : 1.17971 s/iter 27.827595 +iter : 10 Arret : 0.452875 s/iter 27.966012 +iter : 11 Arret : 0.892919 s/iter 27.734509 +iter : 12 Arret : 0.512768 s/iter 27.492632 +iter : 13 Arret : 0.378076 s/iter 27.324440 +iter : 14 Arret : 0.0806363 s/iter 26.960487 +iter : 15 Arret : 0.0453167 s/iter 26.499557 +iter : 16 Arret : 0.0240592 s/iter 26.395465 +iter : 17 Arret : 0.0199765 s/iter 26.315790 +iter : 18 Arret : 0.00860028 s/iter 26.347303 +iter : 19 Arret : 0.00210663 s/iter 26.347784 +iter : 20 Arret : 5.04056E-05 s/iter 26.356018 +iter : 21 Arret : 4.72721E-06 s/iter 26.365127 +iter : 22 Arret : 3.9901E-08 s/iter 26.360411 +iter : 23 Arret : 1.57869E-10 s/iter 26.353428 +iter : 24 Arret : 6.28564E-13 s/iter 26.351250 +temps : 646.009 seconde(s) +Nb iterations : 24 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.58777E-07 +Stabilite : 6.28564E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540302 +i* 0.841463| 0.999993| 8.34199E-12 +i* -1.9051E-11| +| 2| -0.553438 +i* -0.832883| 0.999993|-4.48197E-12 +i* 2.11486E-11| +| 3| -0.579282 +i* -0.815119| 0.999993|-1.44751E-12 +i* 7.66798E-12| +| 4| 0.592043 +i* 0.805898| 0.999993|-1.75726E-12 +i*-2.31848E-11| +| 5| -0.604557 +i* -0.796554| 0.999993|-2.82974E-12 +i* 9.99473E-12| +| 6| 0.61698 +i* 0.78697| 0.999993| 9.01823E-12 +i*-5.69156E-12| +| 7| -0.629237 +i* -0.777205| 0.999993|-2.92122E-12 +i*-4.85867E-12| +| 8| 0.641354 +i* 0.767237| 0.999993| 1.4493E-11 +i* 1.3687E-11| +| 9| -0.653299 +i* -0.757092| 0.999993|-8.22453E-13 +i* 2.82818E-12| +| 10| 0.665096 +i* 0.746749| 0.999993| -1.2145E-11 +i* 1.89129E-11| +| 11| -0.676717 +i* -0.736234| 0.999993|-1.26079E-11 +i*-1.25073E-11| +| 12| 0.688185 +i* 0.725526| 0.999993| 2.69875E-11 +i* 1.65411E-11| +| 13| -0.699509 +i* -0.714614| 0.999993| 1.85989E-11 +i*-4.93269E-12| +| 14| 0.710597 +i* 0.70359| 0.999993| 1.28564E-11 +i* 1.56626E-11| +| 15| -0.721517 +i* -0.69241| 1.00001| 1.76709E-09 +i*-4.04041E-09| +| 16| 0.73231 +i* 0.680962| 0.999993| 1.34706E-11 +i*-4.43489E-12| +| 17| -0.742916 +i* -0.669375| 0.999993| 1.59349E-11 +i* 1.71025E-11| +| 18| 0.753326 +i* 0.657637| 0.999993| 2.26833E-11 +i* 1.58007E-11| +| 19| -0.76354 +i* -0.64575| 0.999993| 2.24043E-11 +i*-1.30496E-12| +| 20| 0.773555 +i* 0.633743| 1.00001| 3.19794E-09 +i*-4.58601E-10| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 0.999993 +250000 racines de module = 1.00001 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^300000 + (-10 +i*0)*x^500000 + (1 +i*0)*x^800000 + +(-30000 +i*0)*x^299999 + (-5E+06 +i*0)*x^499999 + (800000 +i*0)*x^799999 + +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 800000 +proc 0 start 0 size 800000 +iter : 1 Arret : 0.00154846 s/iter 46.736609 +iter : 2 Arret : 0.00623603 s/iter 46.773178 +iter : 3 Arret : 0.0858187 s/iter 46.841571 +iter : 4 Arret : 1.67232 s/iter 47.156772 +iter : 5 Arret : 1.01806 s/iter 47.406800 +iter : 6 Arret : 1.57506 s/iter 47.457844 +iter : 7 Arret : 1.13953 s/iter 47.697558 +iter : 8 Arret : 0.73881 s/iter 48.174119 +iter : 9 Arret : 0.626435 s/iter 48.572632 +iter : 10 Arret : 0.622256 s/iter 48.458622 +iter : 11 Arret : 0.692053 s/iter 48.464982 +iter : 12 Arret : 1.00181 s/iter 48.341828 +iter : 13 Arret : 0.551097 s/iter 48.068502 +iter : 14 Arret : 1.04389 s/iter 47.905646 +iter : 15 Arret : 1.21414 s/iter 47.815372 +iter : 16 Arret : 2.39612 s/iter 47.598487 +iter : 17 Arret : 0.78181 s/iter 47.580209 +iter : 18 Arret : 1.57712 s/iter 47.513484 +iter : 19 Arret : 0.980627 s/iter 47.491805 +iter : 20 Arret : 2.61529 s/iter 47.318510 +iter : 21 Arret : 0.836959 s/iter 47.192301 +iter : 22 Arret : 0.6961 s/iter 47.065027 +iter : 23 Arret : 1.08455 s/iter 47.015412 +iter : 24 Arret : 0.186278 s/iter 46.892588 +iter : 25 Arret : 0.155923 s/iter 46.834330 +iter : 26 Arret : 0.090441 s/iter 46.771351 +iter : 27 Arret : 0.093651 s/iter 46.749380 +iter : 28 Arret : 0.0452468 s/iter 46.755619 +iter : 29 Arret : 0.00859257 s/iter 46.764196 +iter : 30 Arret : 0.00968923 s/iter 46.773667 +iter : 31 Arret : 0.00619702 s/iter 46.763704 +iter : 32 Arret : 0.000332677 s/iter 46.713764 +iter : 33 Arret : 1.75349E-07 s/iter 46.747193 +iter : 34 Arret : 4.01254E-10 s/iter 46.753422 +iter : 35 Arret : 8.64369E-13 s/iter 46.729435 +temps : 1656.28 seconde(s) +Nb iterations : 35 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.64697E-07 +Stabilite : 8.64369E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841464| 0.999995|-5.33817E-12 +i*-1.81878E-11| +| 2| 0.592014 +i* 0.805922| 0.999995|-1.82734E-11 +i* 2.10218E-11| +| 3| 0.617007 +i* 0.786952| 0.999995| 4.23442E-11 +i* -6.2147E-12| +| 4| 0.641392 +i* 0.767207| 0.999995|-4.99742E-11 +i* 1.43873E-11| +| 5| 0.665146 +i* 0.746707| 0.999995| 2.02977E-11 +i* 7.48579E-12| +| 6| 0.688245 +i* 0.725472| 0.999995|-1.73153E-11 +i* -1.2656E-11| +| 7| 0.710667 +i* 0.703522| 0.999995| 3.69782E-12 +i* 2.3081E-12| +| 8| 0.732388 +i* 0.68088| 0.999995| 9.45355E-12 +i* 2.09024E-11| +| 9| 0.753381 +i* 0.657577| 0.999995| 3.40094E-11 +i* 1.45989E-12| +| 10| 0.77364 +i* 0.633618| 0.999995|-1.72307E-11 +i* 1.22723E-11| +| 11| 0.793138 +i* 0.609034| 0.999995| 3.89222E-12 +i* 2.21356E-11| +| 12| 0.811855 +i* 0.583851| 0.999995|-1.28337E-11 +i*-5.47207E-12| +| 13| 0.829772 +i* 0.558094| 0.999995|-1.63114E-11 +i*-1.64246E-12| +| 14| 0.846873 +i* 0.531786| 0.999995|-3.30451E-11 +i*-8.10676E-12| +| 15| 0.86314 +i* 0.504956| 0.999995|-4.00413E-12 +i* 3.04823E-11| +| 16| 0.878557 +i* 0.477628| 0.999995|-2.16493E-12 +i* 1.10533E-11| +| 17| 0.893104 +i* 0.449841| 0.999995|-1.48552E-11 +i* 1.06063E-11| +| 18| 0.906777 +i* 0.4216| 0.999995|-1.38745E-11 +i* 5.33384E-12| +| 19| 0.919557 +i* 0.392944| 0.999995| 4.13796E-11 +i*-2.48189E-11| +| 20| 0.931433 +i* 0.363901| 0.999995| 4.93219E-11 +i*-2.82651E-11| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 0.999995 +300000 racines de module = 1.00001 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^400000 + (-10 +i*0)*x^600000 + (1 +i*0)*x^1000000 + +(-40000 +i*0)*x^399999 + (-6E+06 +i*0)*x^599999 + (1E+06 +i*0)*x^999999 + +zone limite de 'log-exp' 1.00035 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 0, start 0 size 1000192 +proc 0 start 0 size 1000192 +iter : 1 Arret : 0.00156919 s/iter 72.939595 +iter : 2 Arret : 1.90389 s/iter 73.046565 +iter : 3 Arret : 0.502696 s/iter 73.071131 +iter : 4 Arret : 1.00039 s/iter 73.810096 +iter : 5 Arret : 1.69451 s/iter 73.906653 +iter : 6 Arret : 1.26606 s/iter 73.980438 +iter : 7 Arret : 0.651915 s/iter 74.703433 +iter : 8 Arret : 0.531762 s/iter 74.806612 +iter : 9 Arret : 0.502687 s/iter 74.773948 +iter : 10 Arret : 0.48618 s/iter 74.532337 +iter : 11 Arret : 0.444215 s/iter 74.279878 +iter : 12 Arret : 0.427439 s/iter 74.140663 +iter : 13 Arret : 0.41232 s/iter 74.008804 +iter : 14 Arret : 0.406535 s/iter 74.075135 +iter : 15 Arret : 0.401671 s/iter 74.022094 +iter : 16 Arret : 0.398196 s/iter 74.055174 +iter : 17 Arret : 0.395555 s/iter 73.932752 +iter : 18 Arret : 0.394204 s/iter 74.040270 +iter : 19 Arret : 0.39412 s/iter 73.999365 +iter : 20 Arret : 0.395512 s/iter 74.042163 +iter : 21 Arret : 0.398528 s/iter 73.913334 +iter : 22 Arret : 0.404063 s/iter 74.043199 +iter : 23 Arret : 0.413614 s/iter 74.018474 +iter : 24 Arret : 0.430817 s/iter 73.977216 +iter : 25 Arret : 0.464104 s/iter 73.990264 +iter : 26 Arret : 0.534702 s/iter 73.999109 +iter : 27 Arret : 0.777706 s/iter 73.922712 +iter : 28 Arret : 0.780386 s/iter 73.805326 +iter : 29 Arret : 0.391957 s/iter 73.593419 +iter : 30 Arret : 0.489974 s/iter 73.269694 +iter : 31 Arret : 0.327545 s/iter 73.343344 +iter : 32 Arret : 0.110619 s/iter 73.177304 +iter : 33 Arret : 0.19712 s/iter 73.089524 +iter : 34 Arret : 0.288284 s/iter 73.082763 +iter : 35 Arret : 0.0226925 s/iter 73.058524 +iter : 36 Arret : 0.00572618 s/iter 73.055652 +iter : 37 Arret : 0.00398682 s/iter 72.948081 +iter : 38 Arret : 0.000421174 s/iter 72.910444 +iter : 39 Arret : 5.0226E-07 s/iter 72.907146 +iter : 40 Arret : 7.2296E-09 s/iter 72.950438 +iter : 41 Arret : 1.02029E-10 s/iter 72.929637 +iter : 42 Arret : 1.43894E-12 s/iter 72.923863 +iter : 43 Arret : 2.03366E-14 s/iter 72.908337 +temps : 3173.19 seconde(s) +Nb iterations : 43 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.65132E-08 +Stabilite : 2.03366E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841468| 0.999996| 5.07216E-12 +i* 6.41236E-12| +| 2| 0.52971 +i* 0.848174| 0.999996|-2.56639E-12 +i*-3.27674E-11| +| 3| 0.524361 +i* 0.851491| 0.999996|-2.47296E-11 +i* 1.78327E-11| +| 4| 0.51901 +i* 0.854764| 0.999996| 9.45599E-12 +i* 2.07434E-11| +| 5| 0.513629 +i* 0.858008| 0.999996| 2.32483E-11 +i* 6.70747E-12| +| 6| 0.508237 +i* 0.861213| 0.999996|-1.34339E-11 +i* 9.87854E-12| +| 7| 0.502834 +i* 0.864379| 0.999996|-2.85585E-11 +i* 6.91519E-12| +| 8| 0.497384 +i* 0.867526| 0.999996| 2.97429E-11 +i*-6.06626E-13| +| 9| 0.491932 +i* 0.870629| 0.999996|-1.74121E-11 +i*-2.86359E-11| +| 10| 0.486452 +i* 0.873703| 0.999996| 3.0312E-11 +i* 1.02214E-11| +| 11| 0.480962 +i* 0.876737| 0.999996| 1.81546E-11 +i* 8.04012E-12| +| 12| 0.475463 +i* 0.879732| 0.999996|-5.09415E-12 +i*-3.20905E-11| +| 13| 0.469917 +i* 0.882706| 0.999996|-1.29106E-11 +i*-2.31489E-11| +| 14| 0.46437 +i* 0.885637| 0.999996| 1.38481E-11 +i* -1.517E-11| +| 15| 0.458797 +i* 0.888537| 0.999996| 2.78862E-11 +i* 1.10441E-11| +| 16| 0.453214 +i* 0.891397| 0.999996| 2.45506E-11 +i* 3.1726E-11| +| 17| 0.447623 +i* 0.894218| 0.999996| -2.5447E-11 +i*-4.61239E-11| +| 18| 0.441986 +i* 0.897017| 0.999996| 2.72476E-11 +i* 3.22485E-11| +| 19| 0.436351 +i* 0.899772| 0.999996|-3.70284E-11 +i*-5.06729E-12| +| 20| 0.430689 +i* 0.902496| 0.999996|-1.25435E-11 +i* 3.86925E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 0.999996 +400000 racines de module = 1.00001 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^700000 + (1 +i*0)*x^1200000 + +(-50000 +i*0)*x^499999 + (-7E+06 +i*0)*x^699999 + (1.2E+06 +i*0)*x^1199999 + +zone limite de 'log-exp' 1.0003 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 0, start 0 size 1200128 +proc 0 start 0 size 1200128 +iter : 1 Arret : 0.00677598 s/iter 104.842623 +iter : 2 Arret : 1.43332 s/iter 108.451498 +iter : 3 Arret : 0.428119 s/iter 109.604920 +iter : 4 Arret : 0.429249 s/iter 111.528327 +iter : 5 Arret : 1.08646 s/iter 112.126605 +iter : 6 Arret : 4.298 s/iter 112.878995 +iter : 7 Arret : 1.29187 s/iter 114.015483 +iter : 8 Arret : 4.5768 s/iter 114.431935 +iter : 9 Arret : 0.867548 s/iter 114.405770 +iter : 10 Arret : 1.11265 s/iter 113.890021 +iter : 11 Arret : 0.535846 s/iter 113.718788 +iter : 12 Arret : 0.531876 s/iter 112.691524 +iter : 13 Arret : 2.32463 s/iter 111.476924 +iter : 14 Arret : 0.834993 s/iter 110.712739 +iter : 15 Arret : 1.67285 s/iter 110.494250 +iter : 16 Arret : 1.01044 s/iter 109.494899 +iter : 17 Arret : 0.807065 s/iter 109.193175 +iter : 18 Arret : 0.909238 s/iter 108.712803 +iter : 19 Arret : 1.14066 s/iter 108.492397 +iter : 20 Arret : 0.335581 s/iter 107.960425 +iter : 21 Arret : 0.196963 s/iter 107.373274 +iter : 22 Arret : 0.128663 s/iter 106.913981 +iter : 23 Arret : 0.275217 s/iter 106.284145 +iter : 24 Arret : 0.179897 s/iter 106.054702 +iter : 25 Arret : 0.420437 s/iter 105.799691 +iter : 26 Arret : 0.358355 s/iter 105.198589 +iter : 27 Arret : 0.11514 s/iter 105.120453 +iter : 28 Arret : 0.217484 s/iter 104.911034 +iter : 29 Arret : 0.207195 s/iter 104.903818 +iter : 30 Arret : 0.037319 s/iter 104.938544 +iter : 31 Arret : 0.0122038 s/iter 104.836750 +iter : 32 Arret : 0.000983648 s/iter 104.776137 +iter : 33 Arret : 4.35825E-07 s/iter 104.872755 +iter : 34 Arret : 1.94444E-09 s/iter 104.822262 +iter : 35 Arret : 1.37935E-11 s/iter 104.776349 +iter : 36 Arret : 1.88726E-13 s/iter 104.825146 +temps : 3906.03 seconde(s) +Nb iterations : 36 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.78618E-08 +Stabilite : 1.88726E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540312 +i* 0.841461| 0.999997|-2.16913E-11 +i* 1.91294E-11| +| 2| 0.513645 +i* 0.857999| 0.999997|-6.29718E-12 +i*-2.39364E-12| +| 3| 0.486457 +i* 0.873701| 0.999997| 1.53235E-11 +i* 6.36435E-13| +| 4| 0.458805 +i* 0.888533| 0.999997| 1.78773E-11 +i* 1.55684E-11| +| 5| 0.430685 +i* 0.902499| 0.999997| 2.12053E-13 +i*-1.16324E-11| +| 6| 0.402126 +i* 0.915589| 1| 2.50282E-09 +i*-6.10471E-09| +| 7| 0.3732 +i* 0.927747| 0.999997| -2.5707E-11 +i* 3.11093E-13| +| 8| 0.3439 +i* 0.939003| 0.999997|-1.12714E-11 +i* 1.5453E-11| +| 9| 0.314261 +i* 0.949333| 0.999997| 1.93628E-11 +i* 2.50909E-11| +| 10| 0.284313 +i* 0.958728| 0.999997| 2.69426E-11 +i* 2.77974E-11| +| 11| 0.254084 +i* 0.967179| 0.999997| 1.5277E-11 +i* 4.73027E-12| +| 12| 0.223614 +i* 0.974674| 0.999997| 7.05391E-12 +i* 1.2797E-11| +| 13| 0.192915 +i* 0.981212| 0.999997| 1.07495E-11 +i* 5.766E-12| +| 14| 0.162052 +i* 0.986779| 0.999997|-2.06171E-11 +i* 5.16515E-12| +| 15| 0.130977 +i* 0.991382| 0.999997| 5.89659E-11 +i* 7.29122E-12| +| 16| 0.0998077 +i* 0.995003| 0.999997|-3.45761E-11 +i*-1.61701E-11| +| 17| 0.0685225 +i* 0.997646| 0.999997| 2.33641E-11 +i* 2.51787E-12| +| 18| 0.0371504 +i* 0.999314| 1|-3.18728E-10 +i*-2.97119E-09| +| 19| 0.00578048 +i* 0.99998| 0.999997| 3.46787E-11 +i* 1.94857E-13| +| 20| -0.0256056 +i* 0.999669| 0.999997| 2.04742E-11 +i* 1.15624E-12| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 0.999997 +500000 racines de module = 1 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^600000 + (-10 +i*0)*x^800000 + (1 +i*0)*x^1400000 + +(-60000 +i*0)*x^599999 + (-8E+06 +i*0)*x^799999 + (1.4E+06 +i*0)*x^1399999 + +zone limite de 'log-exp' 1.00025 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 0, start 0 size 1400064 +proc 0 start 0 size 1400064 +iter : 1 Arret : 0.00938725 s/iter 142.328326 +iter : 2 Arret : 0.761578 s/iter 147.052418 +iter : 3 Arret : 1.35081 s/iter 149.289333 +iter : 4 Arret : 0.488828 s/iter 151.454940 +iter : 5 Arret : 0.352825 s/iter 152.322211 +iter : 6 Arret : 0.142284 s/iter 153.010051 +iter : 7 Arret : 0.0560259 s/iter 152.431968 +iter : 8 Arret : 0.196308 s/iter 152.003440 +iter : 9 Arret : 0.124897 s/iter 151.872606 +iter : 10 Arret : 0.0975323 s/iter 151.560877 +iter : 11 Arret : 0.147128 s/iter 149.300671 +iter : 12 Arret : 0.109558 s/iter 147.230298 +iter : 13 Arret : 0.0563761 s/iter 144.834459 +iter : 14 Arret : 0.0352169 s/iter 143.795377 +iter : 15 Arret : 0.0177334 s/iter 143.112879 +iter : 16 Arret : 0.0155926 s/iter 142.695503 +iter : 17 Arret : 0.00246736 s/iter 142.533975 +iter : 18 Arret : 9.78659E-05 s/iter 142.374961 +iter : 19 Arret : 5.69989E-07 s/iter 142.290712 +iter : 20 Arret : 3.43839E-09 s/iter 142.588568 +iter : 21 Arret : 1.59577E-11 s/iter 142.684647 +iter : 22 Arret : 7.40742E-14 s/iter 142.549602 +temps : 3229.79 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.95958E-08 +Stabilite : 7.40742E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841469| 0.999997|-5.74141E-12 +i*-6.39521E-11| +| 2| 0.513623 +i* 0.858013| 0.999997|-2.15776E-11 +i*-2.98557E-11| +| 3| -0.52703 +i* -0.849843| 0.999997|-6.50922E-11 +i* 8.44216E-12| +| 4| 0.486439 +i* 0.873711| 0.999997| 5.60277E-11 +i* 4.36779E-11| +| 5| -0.500096 +i* -0.865967| 0.999997| 3.56147E-11 +i*-3.12713E-11| +| 6| 0.458776 +i* 0.888549| 0.999997|-1.89702E-11 +i* 4.08274E-12| +| 7| -0.472669 +i* -0.881237| 0.999997|-1.66496E-11 +i*-3.61498E-11| +| 8| 0.430661 +i* 0.902511| 0.999997|-1.60558E-11 +i*-1.29949E-11| +| 9| -0.444791 +i* -0.895631| 0.999997|-8.89955E-13 +i* 2.61938E-12| +| 10| 0.402136 +i* 0.915577| 0.999997| 6.5834E-12 +i* -1.3935E-11| +| 11| -0.416439 +i* -0.90916| 0.999997|-1.66807E-11 +i* 2.56219E-11| +| 12| 0.373179 +i* 0.927756| 0.999997|-7.07252E-11 +i*-5.29587E-11| +| 13| -0.387698 +i* -0.921783| 0.999997|-1.86324E-11 +i* -4.6545E-11| +| 14| 0.343875 +i* 0.939012| 0.999997| 3.84962E-11 +i* 2.59646E-11| +| 15| -0.358575 +i* -0.933498| 0.999997|-3.74776E-11 +i*-3.89954E-11| +| 16| 0.314233 +i* 0.949343| 0.999997| 3.86503E-11 +i* 2.08775E-11| +| 17| -0.329098 +i* -0.944293| 0.999997|-1.57903E-11 +i* 2.05052E-11| +| 18| 0.284281 +i* 0.958738| 0.999997| 2.51592E-11 +i* 2.09243E-11| +| 19| -0.299297 +i* -0.954157| 0.999997| 5.03608E-12 +i* 1.70503E-11| +| 20| 0.254048 +i* 0.967189| 0.999997|-2.81228E-11 +i*-1.66302E-11| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 0.999997 +600000 racines de module = 1 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^700000 + (-10 +i*0)*x^900000 + (1 +i*0)*x^1600000 + +(-70000 +i*0)*x^699999 + (-9E+06 +i*0)*x^899999 + (1.6E+06 +i*0)*x^1599999 + + +template:823 terminated with signal 11 at PC=404ae1 SP=7fff080bdf50. Backtrace: +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 0 with PID 823 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^800000 + (-10 +i*0)*x^1000000 + (1 +i*0)*x^1800000 + +(-80000 +i*0)*x^799999 + (-1E+07 +i*0)*x^999999 + (1.8E+06 +i*0)*x^1799999 + + +template:827 terminated with signal 11 at PC=404ae1 SP=7fffb55d2a00. Backtrace: +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 0 with PID 827 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^1500000 + (1 +i*0)*x^2000000 + +(-50000 +i*0)*x^499999 + (-1.5E+07 +i*0)*x^1499999 + (2E+06 +i*0)*x^1999999 + + +template:831 terminated with signal 11 at PC=404ae1 SP=7fff64363320. Backtrace: +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 0 with PID 831 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- diff --git a/Simulations/sparse_mpi/sparse_mpi_1GPU.sge b/Simulations/sparse_mpi/sparse_mpi_1GPU.sge new file mode 100755 index 0000000..8661da2 --- /dev/null +++ b/Simulations/sparse_mpi/sparse_mpi_1GPU.sge @@ -0,0 +1,25 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=1 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -V +#$ -cwd +#$ -N sparse_mpi_1GPU +#$ -pe mpi 1 + + +module load cuda/7.0 +module load ompi/gcc + +mpirun -np $NSLOTS ./template -r -i 60000 40000 +mpirun -np $NSLOTS ./template -r -i 150000 50000 +mpirun -np $NSLOTS ./template -r -i 250000 150000 +mpirun -np $NSLOTS ./template -r -i 350000 250000 +mpirun -np $NSLOTS ./template -r -i 500000 300000 +mpirun -np $NSLOTS ./template -r -i 600000 400000 +mpirun -np $NSLOTS ./template -r -i 700000 500000 +mpirun -np $NSLOTS ./template -r -i 800000 600000 +mpirun -np $NSLOTS ./template -r -i 900000 700000 +mpirun -np $NSLOTS ./template -r -i 1000000 800000 +mpirun -np $NSLOTS ./template -r -i 1500000 500000 diff --git a/Simulations/sparse_mpi/sparse_mpi_2GPU.o140031 b/Simulations/sparse_mpi/sparse_mpi_2GPU.o140031 new file mode 100644 index 0000000..15b43d7 --- /dev/null +++ b/Simulations/sparse_mpi/sparse_mpi_2GPU.o140031 @@ -0,0 +1,662 @@ +REMAINING: 2 +Taking GPU #0 +Taking GPU #1 +proc 0 +proc 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^40000 + (-10 +i*0)*x^60000 + (1 +i*0)*x^100000 + +(-4000 +i*0)*x^39999 + (-600000 +i*0)*x^59999 + (100000 +i*0)*x^99999 + +zone limite de 'log-exp' 1.00356 +zone limite de 'log-exp' 1.00356 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 1, start 50048 size 50048 +proc 1 start 50048 size 50048 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 0, start 0 size 50048 +proc 0 start 0 size 50048 +iter : 1 Arret : 0.00512448 s/iter 0.442006 +iter : 2 Arret : 0.00518524 s/iter 0.441749 +iter : 3 Arret : 0.0136123 s/iter 0.441743 +iter : 4 Arret : 0.0172088 s/iter 0.520551 +iter : 5 Arret : 0.0127637 s/iter 0.441752 +iter : 6 Arret : 0.00575024 s/iter 0.441718 +iter : 7 Arret : 0.00480045 s/iter 0.441722 +iter : 8 Arret : 0.0058672 s/iter 0.441765 +iter : 9 Arret : 0.00681665 s/iter 0.439578 +iter : 10 Arret : 0.00633876 s/iter 0.441755 +iter : 11 Arret : 0.0024546 s/iter 0.441765 +iter : 12 Arret : 0.00167883 s/iter 0.441695 +iter : 13 Arret : 0.000524245 s/iter 0.441627 +iter : 14 Arret : 0.000135332 s/iter 0.441622 +iter : 15 Arret : 4.9518E-06 s/iter 0.441652 +iter : 16 Arret : 7.49618E-08 s/iter 0.441569 +iter : 17 Arret : 1.11657E-09 s/iter 0.441553 +iter : 18 Arret : 1.66345E-11 s/iter 0.441549 +iter : 19 Arret : 2.47882E-13 s/iter 0.441578 +temps : 8.65634 seconde(s) +Nb iterations : 19 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.43376E-08 +Stabilite : 3.20054E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54036 +i* 0.841503| 1.00006|-5.00602E-11 +i* 9.0853E-12| +| 2| -0.113164 +i* 0.993538| 0.999962|-4.34919E-12 +i* 9.60242E-13| +| 3| -0.226732 +i* -0.974016| 1.00006|-1.34468E-09 +i*-3.70749E-10| +| 4| -0.715763 +i* 0.698289| 0.999962| 9.11271E-13 +i* 2.47219E-12| +| 5| 0.439922 +i* -0.897993| 0.999962|-3.49498E-13 +i* 1.66432E-12| +| 6| -0.996122 +i* 0.0886386| 1.00006| 4.72785E-10 +i* 4.13616E-11| +| 7| 0.908546 +i* -0.417692| 0.999962| 2.07334E-12 +i* 2.33003E-12| +| 8| -0.827813 +i* -0.560935| 0.999962| 9.76996E-13 +i*-2.04309E-12| +| 9| 0.968129 +i* 0.250682| 1.00006| 1.35693E-10 +i*-3.47657E-10| +| 10| -0.286842 +i* -0.958038| 1.00006|-5.93554E-10 +i*-2.45345E-10| +| 11| 0.591653 +i* 0.806145| 0.999962|-9.87654E-13 +i*-3.03635E-12| +| 12| -0.0511836 +i* 0.998651| 0.999962|-2.22622E-12 +i*-3.69013E-14| +| 13| -0.67097 +i* 0.741432| 0.999962|-8.03801E-14 +i*-1.68204E-12| +| 14| 0.383249 +i* -0.923603| 0.999962|-1.29119E-12 +i*-1.37426E-12| +| 15| -0.988685 +i* 0.15039| 1.00006|-1.61051E-10 +i* 7.18515E-11| +| 16| 0.880824 +i* -0.473363| 0.999962| 1.58029E-12 +i*-2.34379E-12| +| 17| -0.861082 +i* -0.508391| 0.999962| 9.8066E-13 +i* 3.40478E-12| +| 18| 0.98184 +i* 0.190015| 1.00006| 8.88373E-10 +i*-2.66385E-10| +| 19| -0.345842 +i* -0.938354| 1.00006| 1.38421E-10 +i*-2.31696E-10| +| 20| 0.640621 +i* 0.767807| 0.999962|-6.98774E-13 +i* 1.13798E-12| ++---+----------------------------+------------+----------------------------+ +40000 racines de module = 1.00006 +60000 racines de module = 0.999962 +proc 1 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^50000 + (-10 +i*0)*x^150000 + (1 +i*0)*x^200000 + +(-5000 +i*0)*x^49999 + (-1.5E+06 +i*0)*x^149999 + (200000 +i*0)*x^199999 + +zone limite de 'log-exp' 1.00178 +zone limite de 'log-exp' 1.00178 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 1, start 100096 size 100096 +proc 1 start 100096 size 100096 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 0, start 0 size 100096 +proc 0 start 0 size 100096 +iter : 1 Arret : 0.000100591 s/iter 1.548764 +iter : 2 Arret : 9.98047E-05 s/iter 1.548592 +iter : 3 Arret : 0.000401454 s/iter 1.548606 +iter : 4 Arret : 0.000612146 s/iter 1.548661 +iter : 5 Arret : 0.00261257 s/iter 1.548859 +iter : 6 Arret : 0.00389809 s/iter 1.707848 +iter : 7 Arret : 0.108958 s/iter 1.548567 +iter : 8 Arret : 0.0989986 s/iter 1.548572 +iter : 9 Arret : 0.159452 s/iter 1.549964 +iter : 10 Arret : 0.284956 s/iter 1.552722 +iter : 11 Arret : 0.805953 s/iter 1.552547 +iter : 12 Arret : 0.51544 s/iter 1.711577 +iter : 13 Arret : 0.544938 s/iter 1.707829 +iter : 14 Arret : 0.643974 s/iter 1.548388 +iter : 15 Arret : 1.69207 s/iter 1.548432 +iter : 16 Arret : 0.924273 s/iter 1.548552 +iter : 17 Arret : 0.444862 s/iter 1.548574 +iter : 18 Arret : 4.9242 s/iter 1.549903 +iter : 19 Arret : 0.716282 s/iter 1.548377 +iter : 20 Arret : 0.40305 s/iter 1.548788 +iter : 21 Arret : 0.294354 s/iter 1.548624 +iter : 22 Arret : 0.0209093 s/iter 1.548518 +iter : 23 Arret : 0.00144046 s/iter 1.548527 +iter : 24 Arret : 0.000306925 s/iter 1.548770 +iter : 25 Arret : 3.17447E-10 s/iter 1.548617 +iter : 26 Arret : 3.17541E-14 s/iter 1.548825 +temps : 40.9684 seconde(s) +Nb iterations : 26 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.58606E-05 +Stabilite : 6.47336E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540303 +i* 0.841453| 0.999985| 1.08703E-11 +i*-2.49217E-12| +| 2| -0.837195 +i* 0.546877| 0.999985| -5.4492E-12 +i* 1.09163E-12| +| 3| -0.553418 +i* -0.832885| 0.999985| -1.9722E-12 +i*-7.40397E-12| +| 4| 0.828599 +i* -0.559925| 1.00005|-7.54521E-09 +i* 1.47059E-08| +| 5| -0.8197 +i* 0.572767| 0.999985|-4.21663E-13 +i* -2.8616E-12| +| 6| -0.57917 +i* -0.815188| 0.999985|-5.13034E-12 +i*-1.52645E-12| +| 7| 0.810626 +i* -0.585537| 0.999985|-6.36846E-12 +i*-5.86797E-12| +| 8| 0.591872 +i* 0.806089| 1.00005|-1.69803E-09 +i* 9.43795E-09| +| 9| -0.801454 +i* 0.598134| 1.00005|-3.72767E-08 +i*-1.30274E-08| +| 10| -0.604356 +i* -0.796695| 0.999985|-1.64091E-13 +i* 1.59084E-12| +| 11| 0.791937 +i* -0.610578| 0.999985| 6.0707E-13 +i* 1.52922E-12| +| 12| 0.616763 +i* 0.78713| 0.999985|-4.48042E-12 +i* -2.6295E-12| +| 13| -0.782301 +i* 0.622877| 0.999985|-2.15827E-12 +i*-6.27114E-12| +| 14| -0.628991 +i* -0.777472| 1.00005| 6.93065E-09 +i*-8.65443E-09| +| 15| 0.772474 +i* -0.635023| 0.999985| 1.54783E-11 +i*-1.81338E-12| +| 16| 0.641054 +i* 0.767476| 0.999985| 9.05009E-12 +i*-2.91295E-12| +| 17| -0.762458 +i* 0.647014| 0.999985| 5.81724E-12 +i*-9.99384E-12| +| 18| -0.652967 +i* -0.757366| 0.999985|-6.31406E-12 +i* 8.49495E-12| +| 19| 0.752302 +i* -0.658888| 1.00005| 3.99107E-09 +i* 1.02117E-08| +| 20| 0.66472 +i* 0.747072| 0.999985|-1.93379E-12 +i*-1.29726E-11| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 0.999985 +50000 racines de module = 1.00005 +proc 0 +proc 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^150000 + (-10 +i*0)*x^250000 + (1 +i*0)*x^400000 + +(-15000 +i*0)*x^149999 + (-2.5E+06 +i*0)*x^249999 + (400000 +i*0)*x^399999 + +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 0, start 0 size 200064 +proc 0 start 0 size 200064 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 1, start 200064 size 200064 +proc 1 start 200064 size 200064 +iter : 1 Arret : 0.000550449 s/iter 6.082917 +iter : 2 Arret : 0.00291862 s/iter 6.079734 +iter : 3 Arret : 0.00675438 s/iter 6.082746 +iter : 4 Arret : 0.00891928 s/iter 6.157166 +iter : 5 Arret : 0.0118747 s/iter 6.150345 +iter : 6 Arret : 0.0109883 s/iter 6.091520 +iter : 7 Arret : 0.00656673 s/iter 6.112417 +iter : 8 Arret : 0.00575864 s/iter 6.085608 +iter : 9 Arret : 0.00288805 s/iter 6.150350 +iter : 10 Arret : 0.00168944 s/iter 6.083333 +iter : 11 Arret : 0.00101594 s/iter 6.079295 +iter : 12 Arret : 0.000961205 s/iter 6.079555 +iter : 13 Arret : 0.000805832 s/iter 6.078713 +iter : 14 Arret : 0.00034457 s/iter 6.079666 +iter : 15 Arret : 0.000125967 s/iter 6.080354 +iter : 16 Arret : 2.22934E-05 s/iter 6.079409 +iter : 17 Arret : 5.34301E-06 s/iter 6.079653 +iter : 18 Arret : 3.49738E-08 s/iter 6.081697 +iter : 19 Arret : 7.48893E-11 s/iter 6.080662 +iter : 20 Arret : 1.61404E-13 s/iter 6.081309 +temps : 122.138 seconde(s) +Nb iterations : 20 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.09706E-08 +Stabilite : 1.61404E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.84144| 0.999991| 6.97609E-12 +i* 5.61207E-12| +| 2| -0.998329 +i* 0.057622| 0.999991| 4.43912E-12 +i* 1.27665E-12| +| 3| 0.43989 +i* -0.898041| 0.999991|-2.08855E-12 +i*-1.75276E-12| +| 4| -0.996033 +i* 0.0888768| 0.999991|-3.15592E-12 +i* 1.17456E-12| +| 5| 0.411533 +i* -0.911385| 0.999991|-2.45048E-12 +i* 4.6238E-12| +| 6| 0.59196 +i* 0.805956| 0.999991| 5.24358E-13 +i*-8.53073E-12| +| 7| -0.992759 +i* 0.120044| 0.999991| 2.58804E-12 +i* 2.47274E-12| +| 8| 0.382796 +i* -0.923823| 0.999991|-1.63092E-11 +i* 4.26312E-12| +| 9| 0.616925 +i* 0.78701| 0.999991| 4.27514E-12 +i*-1.13966E-11| +| 10| -0.98851 +i* 0.151094| 0.999991|-1.29017E-11 +i*-4.43427E-12| +| 11| 0.35366 +i* -0.935364| 0.999991|-1.92664E-11 +i* 1.19958E-11| +| 12| 0.641283 +i* 0.767292| 0.999991|-4.70735E-12 +i* -1.4127E-11| +| 13| -0.98329 +i* 0.181995| 0.999991|-6.62759E-12 +i*-5.46796E-12| +| 14| 0.324176 +i* -0.945987| 0.999991|-5.20695E-12 +i*-7.06984E-12| +| 15| 0.665012 +i* 0.746821| 0.999991| 5.27178E-12 +i*-4.27913E-12| +| 16| -0.977104 +i* 0.212717| 0.999991|-1.01148E-11 +i* 2.41479E-12| +| 17| 0.294374 +i* -0.955681| 0.999991|-2.37395E-11 +i*-2.53098E-12| +| 18| 0.688087 +i* 0.725616| 0.999991| 6.67011E-12 +i* 1.57173E-11| +| 19| -0.969965 +i* 0.243206| 0.999991| 6.88072E-12 +i* 3.20268E-13| +| 20| 0.264283 +i* -0.964436| 0.999991|-6.93356E-12 +i*-6.23118E-12| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 0.999991 +150000 racines de module = 1.00002 +proc 1 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^250000 + (-10 +i*0)*x^350000 + (1 +i*0)*x^600000 + +(-25000 +i*0)*x^249999 + (-3.5E+06 +i*0)*x^349999 + (600000 +i*0)*x^599999 + +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 1, start 300032 size 300032 +proc 1 start 300032 size 300032 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 300032 +proc 0 start 0 size 300032 +iter : 1 Arret : 0.00169532 s/iter 13.268293 +iter : 2 Arret : 0.00577451 s/iter 13.754899 +iter : 3 Arret : 0.00560656 s/iter 13.317734 +iter : 4 Arret : 0.026637 s/iter 13.287596 +iter : 5 Arret : 0.0224878 s/iter 13.756785 +iter : 6 Arret : 0.0273249 s/iter 14.009301 +iter : 7 Arret : 0.0242205 s/iter 13.722890 +iter : 8 Arret : 0.0206627 s/iter 14.046207 +iter : 9 Arret : 0.0154355 s/iter 14.068750 +iter : 10 Arret : 0.0112335 s/iter 13.832264 +iter : 11 Arret : 0.00926749 s/iter 13.793343 +iter : 12 Arret : 0.0165133 s/iter 13.276606 +iter : 13 Arret : 0.00281445 s/iter 13.275977 +iter : 14 Arret : 0.0019915 s/iter 13.269355 +iter : 15 Arret : 0.00135028 s/iter 13.267568 +iter : 16 Arret : 0.00186824 s/iter 13.268070 +iter : 17 Arret : 0.000810658 s/iter 13.268154 +iter : 18 Arret : 0.000232438 s/iter 13.268534 +iter : 19 Arret : 3.11501E-07 s/iter 13.267454 +iter : 20 Arret : 1.18566E-09 s/iter 13.267871 +iter : 21 Arret : 9.65413E-12 s/iter 13.268070 +iter : 22 Arret : 1.37719E-13 s/iter 13.267729 +temps : 297.134 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.32595E-08 +Stabilite : 1.37719E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540302 +i* 0.841463| 0.999993| 8.34199E-12 +i* -1.9051E-11| +| 2| -0.553438 +i* -0.832883| 0.999993|-2.10654E-12 +i*-2.55273E-11| +| 3| -0.579282 +i* -0.815119| 0.999993| 1.33613E-11 +i*-1.98701E-11| +| 4| 0.591992 +i* 0.805956| 1.00001|-3.89872E-09 +i* 2.08385E-09| +| 5| -0.604557 +i* -0.796554| 0.999993|-2.82974E-12 +i* 9.99473E-12| +| 6| 0.61698 +i* 0.78697| 0.999993|-4.77973E-12 +i* 2.40621E-11| +| 7| -0.629237 +i* -0.777205| 0.999993|-2.92122E-12 +i*-4.85867E-12| +| 8| 0.641354 +i* 0.767237| 0.999993|-1.64209E-11 +i* 1.12904E-12| +| 9| -0.653299 +i* -0.757092| 0.999993|-8.22453E-13 +i* 2.82818E-12| +| 10| 0.665096 +i* 0.746749| 0.999993| -1.2145E-11 +i* 1.89129E-11| +| 11| -0.676717 +i* -0.736234| 0.999993|-1.26079E-11 +i*-1.25073E-11| +| 12| 0.688185 +i* 0.725526| 0.999993| 2.69875E-11 +i* 1.65411E-11| +| 13| -0.699466 +i* -0.714679| 1.00001| 3.92343E-10 +i*-3.02623E-09| +| 14| 0.710597 +i* 0.70359| 0.999993| -2.6851E-11 +i*-1.44801E-11| +| 15| -0.721524 +i* -0.69238| 0.999993| 2.63193E-11 +i*-6.76318E-13| +| 16| 0.73231 +i* 0.680962| 0.999993| 1.34706E-11 +i*-4.43489E-12| +| 17| -0.74294 +i* -0.669349| 0.999993| 1.02707E-12 +i* 2.14607E-11| +| 18| 0.753317 +i* 0.657672| 1.00001| 2.8295E-09 +i*-3.45603E-09| +| 19| -0.76354 +i* -0.64575| 0.999993| 2.24043E-11 +i*-1.30496E-12| +| 20| 0.773543 +i* 0.633733| 0.999993|-3.47811E-12 +i*-5.94756E-12| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 0.999993 +250000 racines de module = 1.00001 +proc 0 +proc 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^300000 + (-10 +i*0)*x^500000 + (1 +i*0)*x^800000 + +(-30000 +i*0)*x^299999 + (-5E+06 +i*0)*x^499999 + (800000 +i*0)*x^799999 + +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 400000 +proc 0 start 0 size 400000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 1, start 400000 size 400000 +proc 1 start 400000 size 400000 +iter : 1 Arret : 0.00108387 s/iter 23.672446 +iter : 2 Arret : 0.00660333 s/iter 23.805408 +iter : 3 Arret : 1.16255 s/iter 23.798567 +iter : 4 Arret : 1.00538 s/iter 23.799772 +iter : 5 Arret : 4.35503 s/iter 23.835095 +iter : 6 Arret : 2.85741 s/iter 24.191376 +iter : 7 Arret : 1.06724 s/iter 24.343970 +iter : 8 Arret : 0.752896 s/iter 24.414141 +iter : 9 Arret : 0.681451 s/iter 24.504496 +iter : 10 Arret : 0.666362 s/iter 24.940388 +iter : 11 Arret : 0.660981 s/iter 25.494551 +iter : 12 Arret : 0.6721 s/iter 24.530242 +iter : 13 Arret : 0.722307 s/iter 24.518027 +iter : 14 Arret : 0.735973 s/iter 24.579973 +iter : 15 Arret : 1.60274 s/iter 24.425419 +iter : 16 Arret : 1.08224 s/iter 24.263282 +iter : 17 Arret : 1.66761 s/iter 24.117742 +iter : 18 Arret : 0.562533 s/iter 23.946009 +iter : 19 Arret : 0.334526 s/iter 23.926164 +iter : 20 Arret : 0.247191 s/iter 23.871930 +iter : 21 Arret : 0.0856694 s/iter 23.809304 +iter : 22 Arret : 0.100266 s/iter 23.817817 +iter : 23 Arret : 0.0450244 s/iter 23.791545 +iter : 24 Arret : 0.0252731 s/iter 23.803368 +iter : 25 Arret : 0.0214701 s/iter 23.778507 +iter : 26 Arret : 0.00697008 s/iter 23.796671 +iter : 27 Arret : 0.00107605 s/iter 23.651300 +iter : 28 Arret : 1.6145E-06 s/iter 23.654996 +iter : 29 Arret : 4.22205E-09 s/iter 23.650903 +iter : 30 Arret : 9.10881E-12 s/iter 23.650544 +iter : 31 Arret : 1.96015E-14 s/iter 23.654309 +temps : 746.426 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.73089E-06 +Stabilite : 2.22043E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841464| 0.999995| -2.03E-11 +i* 2.74701E-11| +| 2| 0.592014 +i* 0.805922| 0.999995| 2.33948E-11 +i*-2.13005E-11| +| 3| 0.617007 +i* 0.786952| 0.999995| 4.23442E-11 +i* -6.2147E-12| +| 4| 0.641392 +i* 0.767207| 0.999995|-4.99742E-11 +i* 1.43873E-11| +| 5| 0.665146 +i* 0.746707| 0.999995| 2.02977E-11 +i* 7.48579E-12| +| 6| 0.688245 +i* 0.725472| 0.999995|-1.73153E-11 +i* -1.2656E-11| +| 7| 0.710667 +i* 0.703522| 0.999995| 3.69782E-12 +i* 2.3081E-12| +| 8| 0.732388 +i* 0.68088| 0.999995| 9.45355E-12 +i* 2.09024E-11| +| 9| 0.753381 +i* 0.657577| 0.999995| 1.7531E-11 +i*-4.02243E-11| +| 10| 0.77364 +i* 0.633618| 0.999995|-1.72307E-11 +i* 1.22723E-11| +| 11| 0.793138 +i* 0.609034| 0.999995| 3.89222E-12 +i* 2.21356E-11| +| 12| 0.811855 +i* 0.583851| 0.999995|-1.28337E-11 +i*-5.47207E-12| +| 13| 0.829772 +i* 0.558094| 0.999995|-1.63114E-11 +i*-1.64246E-12| +| 14| 0.846873 +i* 0.531786| 0.999995|-3.30451E-11 +i*-8.10676E-12| +| 15| 0.86314 +i* 0.504956| 0.999995|-4.00413E-12 +i* 3.04823E-11| +| 16| 0.878557 +i* 0.477628| 0.999995|-2.16493E-12 +i* 1.10533E-11| +| 17| 0.893104 +i* 0.449841| 0.999995|-1.48552E-11 +i* 1.06063E-11| +| 18| 0.906777 +i* 0.4216| 0.999995|-1.38745E-11 +i* 5.33384E-12| +| 19| 0.919557 +i* 0.392944| 0.999995|-3.33245E-11 +i* 5.94386E-12| +| 20| 0.931433 +i* 0.363901| 0.999995| 4.93219E-11 +i*-2.82651E-11| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 0.999995 +300000 racines de module = 1.00001 +proc 1 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^400000 + (-10 +i*0)*x^600000 + (1 +i*0)*x^1000000 + +(-40000 +i*0)*x^399999 + (-6E+06 +i*0)*x^599999 + (1E+06 +i*0)*x^999999 + +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 1, start 500096 size 500096 +proc 1 start 500096 size 500096 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 0, start 0 size 500096 +proc 0 start 0 size 500096 +iter : 1 Arret : 0.00111034 s/iter 36.535863 +iter : 2 Arret : 0.00130138 s/iter 36.531318 +iter : 3 Arret : 0.095171 s/iter 36.617316 +iter : 4 Arret : 0.110384 s/iter 36.603388 +iter : 5 Arret : 0.0159644 s/iter 37.200734 +iter : 6 Arret : 0.0148525 s/iter 37.186773 +iter : 7 Arret : 0.0189588 s/iter 37.285760 +iter : 8 Arret : 0.0122669 s/iter 37.242480 +iter : 9 Arret : 0.025395 s/iter 37.493437 +iter : 10 Arret : 0.0249756 s/iter 36.552191 +iter : 11 Arret : 0.0032083 s/iter 36.587117 +iter : 12 Arret : 0.00514671 s/iter 36.496415 +iter : 13 Arret : 0.0026206 s/iter 36.537986 +iter : 14 Arret : 0.0021181 s/iter 36.525452 +iter : 15 Arret : 0.000448616 s/iter 36.534784 +iter : 16 Arret : 0.000260446 s/iter 36.531377 +iter : 17 Arret : 9.00305E-05 s/iter 36.520451 +iter : 18 Arret : 0.000137571 s/iter 36.497467 +iter : 19 Arret : 3.90888E-05 s/iter 36.496056 +iter : 20 Arret : 8.22264E-08 s/iter 36.494517 +iter : 21 Arret : 2.59921E-10 s/iter 36.529540 +iter : 22 Arret : 8.21945E-13 s/iter 36.531093 +temps : 812.655 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.28809E-07 +Stabilite : 8.21945E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841476| 1.00001| 4.82795E-10 +i* 3.31212E-09| +| 2| 0.529701 +i* 0.84818| 0.999996|-4.61853E-13 +i*-4.17888E-12| +| 3| 0.524361 +i* 0.851491| 0.999996|-2.47296E-11 +i* 1.78327E-11| +| 4| 0.51901 +i* 0.854764| 0.999996| 9.45599E-12 +i* 2.07434E-11| +| 5| 0.513638 +i* 0.858002| 0.999996|-2.64786E-11 +i* 1.3235E-12| +| 6| 0.508237 +i* 0.861213| 0.999996|-1.34339E-11 +i* 9.87854E-12| +| 7| 0.502825 +i* 0.864384| 0.999996|-3.18459E-11 +i* 7.64744E-12| +| 8| 0.497384 +i* 0.867526| 0.999996| 1.87346E-11 +i* 4.7471E-11| +| 9| 0.491932 +i* 0.870629| 0.999996|-2.65525E-11 +i* 1.22525E-11| +| 10| 0.486462 +i* 0.873698| 0.999996|-2.18452E-11 +i*-1.14808E-11| +| 11| 0.480962 +i* 0.876737| 0.999996| 1.81546E-11 +i* 8.04012E-12| +| 12| 0.475453 +i* 0.879736| 0.999996| 3.09861E-11 +i* 4.093E-12| +| 13| 0.469917 +i* 0.882706| 0.999996|-1.29106E-11 +i*-2.31489E-11| +| 14| 0.46437 +i* 0.885637| 0.999996|-5.47384E-12 +i* 1.02452E-11| +| 15| 0.458801 +i* 0.888545| 1.00001| 8.56622E-10 +i* 9.50588E-10| +| 16| 0.453214 +i* 0.891397| 0.999996| 2.45506E-11 +i* 3.1726E-11| +| 17| 0.447614 +i* 0.894223| 0.999996|-1.08491E-12 +i*-2.12277E-11| +| 18| 0.441986 +i* 0.897017| 0.999996| 2.72476E-11 +i* 3.22485E-11| +| 19| 0.436351 +i* 0.899772| 0.999996|-1.24334E-11 +i*-2.66317E-11| +| 20| 0.430689 +i* 0.902496| 0.999996|-1.25435E-11 +i* 3.86925E-13| ++---+----------------------------+------------+----------------------------+ +400000 racines de module = 1.00001 +600000 racines de module = 0.999996 +proc 0 +proc 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^700000 + (1 +i*0)*x^1200000 + +(-50000 +i*0)*x^499999 + (-7E+06 +i*0)*x^699999 + (1.2E+06 +i*0)*x^1199999 + +zone limite de 'log-exp' 1.0003 +zone limite de 'log-exp' 1.0003 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 0, start 0 size 600064 +proc 0 start 0 size 600064 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 1, start 600064 size 600064 +proc 1 start 600064 size 600064 +iter : 1 Arret : 0.0323131 s/iter 52.941074 +iter : 2 Arret : 2.76888 s/iter 55.568853 +iter : 3 Arret : 2.88621 s/iter 56.575624 +iter : 4 Arret : 1.26993 s/iter 55.935739 +iter : 5 Arret : 3.86036 s/iter 56.102261 +iter : 6 Arret : 5.37784 s/iter 57.046755 +iter : 7 Arret : 1.03129 s/iter 56.920764 +iter : 8 Arret : 3.95796 s/iter 57.471965 +iter : 9 Arret : 1.30769 s/iter 57.104425 +iter : 10 Arret : 1.0707 s/iter 57.036191 +iter : 11 Arret : 1.02855 s/iter 56.856622 +iter : 12 Arret : 0.563478 s/iter 56.398393 +iter : 13 Arret : 1.5244 s/iter 56.034393 +iter : 14 Arret : 1.47905 s/iter 55.457328 +iter : 15 Arret : 0.774422 s/iter 55.020273 +iter : 16 Arret : 10.8889 s/iter 54.981257 +iter : 17 Arret : 0.715912 s/iter 54.702463 +iter : 18 Arret : 0.577843 s/iter 54.436841 +iter : 19 Arret : 0.747995 s/iter 54.297662 +iter : 20 Arret : 0.163426 s/iter 53.892957 +iter : 21 Arret : 0.181209 s/iter 53.840332 +iter : 22 Arret : 0.0761215 s/iter 53.719165 +iter : 23 Arret : 0.0217437 s/iter 53.677726 +iter : 24 Arret : 0.00705727 s/iter 53.242080 +iter : 25 Arret : 0.00154816 s/iter 52.922070 +iter : 26 Arret : 1.96753E-05 s/iter 52.904231 +iter : 27 Arret : 2.53613E-08 s/iter 52.924736 +iter : 28 Arret : 3.62869E-10 s/iter 52.921481 +iter : 29 Arret : 5.17537E-12 s/iter 52.895150 +iter : 30 Arret : 7.38669E-14 s/iter 52.910075 +temps : 1647.22 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.62324E-08 +Stabilite : 7.38669E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540304 +i* 0.841466| 0.999997| 3.08649E-11 +i* 2.05843E-11| +| 2| 0.513629 +i* 0.858008| 0.999997| 3.02357E-11 +i* 3.41858E-11| +| 3| 0.486451 +i* 0.873713| 1|-5.85295E-09 +i*-2.49566E-10| +| 4| 0.458812 +i* 0.888539| 1|-7.79592E-09 +i*-3.64417E-09| +| 5| 0.430677 +i* 0.902502| 0.999997|-2.03271E-11 +i*-3.18325E-11| +| 6| 0.402126 +i* 0.915589| 1| 2.50282E-09 +i*-6.10471E-09| +| 7| 0.3732 +i* 0.927747| 0.999997|-1.54374E-11 +i*-2.76083E-11| +| 8| 0.3439 +i* 0.939003| 0.999997|-1.12714E-11 +i* 1.5453E-11| +| 9| 0.314261 +i* 0.949333| 0.999997| 1.93628E-11 +i* 2.50909E-11| +| 10| 0.284313 +i* 0.958728| 0.999997| 2.69426E-11 +i* 2.77974E-11| +| 11| 0.254084 +i* 0.967179| 0.999997| 1.5277E-11 +i* 4.73027E-12| +| 12| 0.223605 +i* 0.974676| 0.999997| -8.1017E-11 +i*-3.77299E-11| +| 13| 0.192897 +i* 0.981224| 1| 2.91999E-10 +i* 9.18678E-11| +| 14| 0.162017 +i* 0.986785| 0.999997| 4.59321E-12 +i*-4.42106E-13| +| 15| 0.130967 +i* 0.991391| 1| 1.71549E-09 +i* 3.54225E-10| +| 16| 0.099812 +i* 0.995011| 1|-4.01255E-09 +i*-1.01435E-08| +| 17| 0.0685136 +i* 0.997647| 0.999997|-2.98188E-11 +i* 2.79243E-12| +| 18| 0.0371504 +i* 0.999314| 1|-1.38879E-09 +i*-2.32658E-09| +| 19| 0.00578048 +i* 0.99998| 0.999997| 3.46787E-11 +i* 1.94857E-13| +| 20| -0.0256056 +i* 0.999669| 0.999997| 2.01068E-11 +i*-1.22213E-12| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 0.999997 +500000 racines de module = 1 +proc 0 +proc 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^600000 + (-10 +i*0)*x^800000 + (1 +i*0)*x^1400000 + +(-60000 +i*0)*x^599999 + (-8E+06 +i*0)*x^799999 + (1.4E+06 +i*0)*x^1399999 + +zone limite de 'log-exp' 1.00025 +zone limite de 'log-exp' 1.00025 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 0, start 0 size 700032 +proc 0 start 0 size 700032 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 1, start 700032 size 700032 +proc 1 start 700032 size 700032 +iter : 1 Arret : 0.00634591 s/iter 71.315735 +iter : 2 Arret : 0.356583 s/iter 73.499155 +iter : 3 Arret : 0.616585 s/iter 74.055679 +iter : 4 Arret : 0.383366 s/iter 75.001269 +iter : 5 Arret : 0.113316 s/iter 76.417550 +iter : 6 Arret : 0.198101 s/iter 77.541428 +iter : 7 Arret : 0.157259 s/iter 77.127574 +iter : 8 Arret : 0.381996 s/iter 77.411132 +iter : 9 Arret : 0.254414 s/iter 77.254944 +iter : 10 Arret : 0.178383 s/iter 77.505940 +iter : 11 Arret : 0.147268 s/iter 76.909819 +iter : 12 Arret : 0.0894984 s/iter 77.135647 +iter : 13 Arret : 0.117288 s/iter 74.937817 +iter : 14 Arret : 0.0966418 s/iter 73.691614 +iter : 15 Arret : 0.0293232 s/iter 72.705894 +iter : 16 Arret : 0.0436007 s/iter 72.446877 +iter : 17 Arret : 0.0302845 s/iter 72.160465 +iter : 18 Arret : 0.00422446 s/iter 71.431150 +iter : 19 Arret : 0.00359251 s/iter 71.490724 +iter : 20 Arret : 0.00270137 s/iter 71.471506 +iter : 21 Arret : 0.00209394 s/iter 71.343579 +iter : 22 Arret : 0.000416465 s/iter 71.476428 +iter : 23 Arret : 4.15934E-05 s/iter 71.308920 +iter : 24 Arret : 5.37967E-08 s/iter 71.432393 +iter : 25 Arret : 2.48195E-10 s/iter 71.421751 +iter : 26 Arret : 1.15205E-12 s/iter 71.414405 +iter : 27 Arret : 5.31631E-15 s/iter 71.409806 +temps : 1991.85 seconde(s) +Nb iterations : 27 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.8707E-07 +Stabilite : 3.51082E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841469| 0.999997| 5.65794E-11 +i*-4.66756E-12| +| 2| 0.513623 +i* 0.858013| 0.999997|-2.15776E-11 +i*-2.98557E-11| +| 3| -0.52703 +i* -0.849843| 0.999997|-8.72191E-12 +i* 2.97079E-11| +| 4| 0.486439 +i* 0.873711| 0.999997|-3.15932E-11 +i*-1.15957E-12| +| 5| -0.500096 +i* -0.865967| 0.999997| 3.56147E-11 +i*-3.12713E-11| +| 6| 0.458776 +i* 0.888549| 0.999997|-1.89702E-11 +i* 4.08274E-12| +| 7| -0.472673 +i* -0.881242| 1|-5.56631E-09 +i*-2.23833E-09| +| 8| 0.430664 +i* 0.902517| 1|-8.83373E-11 +i*-2.09199E-09| +| 9| -0.444791 +i* -0.895631| 0.999997| 3.68259E-11 +i* 1.36002E-12| +| 10| 0.402136 +i* 0.915577| 0.999997| 6.5834E-12 +i* -1.3935E-11| +| 11| -0.416432 +i* -0.909164| 0.999997| 1.97816E-11 +i* 3.10848E-11| +| 12| 0.373171 +i* 0.927759| 0.999997|-2.17995E-11 +i*-2.96867E-12| +| 13| -0.387698 +i* -0.921783| 0.999997|-1.86324E-11 +i* -4.6545E-11| +| 14| 0.343875 +i* 0.939012| 0.999997| 3.06317E-11 +i* 7.08794E-11| +| 15| -0.358575 +i* -0.933498| 0.999997|-3.74776E-11 +i*-3.89954E-11| +| 16| 0.314233 +i* 0.949343| 0.999997| 1.02587E-11 +i*-4.25648E-11| +| 17| -0.329098 +i* -0.944293| 0.999997|-1.57903E-11 +i* 2.05052E-11| +| 18| 0.284281 +i* 0.958738| 0.999997| 2.51592E-11 +i* 2.09243E-11| +| 19| -0.299297 +i* -0.954157| 0.999997| 5.03608E-12 +i* 1.70503E-11| +| 20| 0.254048 +i* 0.967189| 0.999997|-2.81228E-11 +i*-1.66302E-11| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 0.999997 +600000 racines de module = 1 +proc 1 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^700000 + (-10 +i*0)*x^900000 + (1 +i*0)*x^1600000 + +(-70000 +i*0)*x^699999 + (-9E+06 +i*0)*x^899999 + (1.6E+06 +i*0)*x^1599999 + + +template:32580 terminated with signal 11 at PC=404ae1 SP=7fffd45f56a0. Backtrace: + +template:32579 terminated with signal 11 at PC=404ae1 SP=7fff316ce300. Backtrace: +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 1 with PID 32580 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- +proc 1 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^800000 + (-10 +i*0)*x^1000000 + (1 +i*0)*x^1800000 + +(-80000 +i*0)*x^799999 + (-1E+07 +i*0)*x^999999 + (1.8E+06 +i*0)*x^1799999 + + +template:32586 terminated with signal 11 at PC=404ae1 SP=7fffbfe9f8d0. Backtrace: +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:32587 terminated with signal 11 at PC=404ae1 SP=7fff632aee60. Backtrace: +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 1 with PID 32587 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- +proc 0 +proc 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^1500000 + (1 +i*0)*x^2000000 + +(-50000 +i*0)*x^499999 + (-1.5E+07 +i*0)*x^1499999 + (2E+06 +i*0)*x^1999999 + + +template:32594 terminated with signal 11 at PC=404ae1 SP=7fff28fd9250. Backtrace: +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:32593 terminated with signal 11 at PC=404ae1 SP=7fffe3e03f90. Backtrace: +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 1 with PID 32594 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- diff --git a/Simulations/sparse_mpi/sparse_mpi_2GPU.sge b/Simulations/sparse_mpi/sparse_mpi_2GPU.sge new file mode 100755 index 0000000..2817b6b --- /dev/null +++ b/Simulations/sparse_mpi/sparse_mpi_2GPU.sge @@ -0,0 +1,25 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=2 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -V +#$ -cwd +#$ -N sparse_mpi_2GPU +#$ -pe mpi 2 + + +module load cuda/7.0 +module load ompi/gcc + +mpirun -np $NSLOTS ./template -r -i 60000 40000 +mpirun -np $NSLOTS ./template -r -i 150000 50000 +mpirun -np $NSLOTS ./template -r -i 250000 150000 +mpirun -np $NSLOTS ./template -r -i 350000 250000 +mpirun -np $NSLOTS ./template -r -i 500000 300000 +mpirun -np $NSLOTS ./template -r -i 600000 400000 +mpirun -np $NSLOTS ./template -r -i 700000 500000 +mpirun -np $NSLOTS ./template -r -i 800000 600000 +mpirun -np $NSLOTS ./template -r -i 900000 700000 +mpirun -np $NSLOTS ./template -r -i 1000000 800000 +mpirun -np $NSLOTS ./template -r -i 1500000 500000 diff --git a/Simulations/sparse_mpi/sparse_mpi_3GPU.o140030 b/Simulations/sparse_mpi/sparse_mpi_3GPU.o140030 new file mode 100644 index 0000000..b62c8d1 --- /dev/null +++ b/Simulations/sparse_mpi/sparse_mpi_3GPU.o140030 @@ -0,0 +1,758 @@ +REMAINING: 3 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +proc 0 +proc 1 +proc 2 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^40000 + (-10 +i*0)*x^60000 + (1 +i*0)*x^100000 + +(-4000 +i*0)*x^39999 + (-600000 +i*0)*x^59999 + (100000 +i*0)*x^99999 + +zone limite de 'log-exp' 1.00356 +zone limite de 'log-exp' 1.00356 +zone limite de 'log-exp' 1.00356 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 0, start 0 size 33365 +proc 0 start 0 size 33365 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 1, start 33365 size 33365 +proc 1 start 33365 size 33365 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 2, start 66730 size 33365 +proc 2 start 66730 size 33365 +iter : 1 Arret : 0.00638362 s/iter 0.326715 +iter : 2 Arret : 0.00780885 s/iter 0.399767 +iter : 3 Arret : 0.00278939 s/iter 0.327124 +iter : 4 Arret : 0.00312024 s/iter 0.327290 +iter : 5 Arret : 0.00261461 s/iter 0.327081 +iter : 6 Arret : 0.00443129 s/iter 0.326569 +iter : 7 Arret : 0.00529933 s/iter 0.326526 +iter : 8 Arret : 0.00962751 s/iter 0.327146 +iter : 9 Arret : 0.0107359 s/iter 0.326473 +iter : 10 Arret : 0.00603516 s/iter 0.326463 +iter : 11 Arret : 0.00278461 s/iter 0.327154 +iter : 12 Arret : 0.000336786 s/iter 0.326455 +iter : 13 Arret : 0.000245415 s/iter 0.326273 +iter : 14 Arret : 0.000266948 s/iter 0.326718 +iter : 15 Arret : 0.000254585 s/iter 0.326250 +iter : 16 Arret : 0.000456802 s/iter 0.326186 +iter : 17 Arret : 0.000147565 s/iter 0.326750 +iter : 18 Arret : 2.07387E-07 s/iter 0.326144 +iter : 19 Arret : 3.08546E-09 s/iter 0.326199 +iter : 20 Arret : 4.59676E-11 s/iter 0.326798 +iter : 21 Arret : 6.84814E-13 s/iter 0.326219 +temps : 7.13273 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.61117E-09 +Stabilite : 6.84814E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54036 +i* 0.841503| 1.00006|-5.00602E-11 +i* 9.0853E-12| +| 2| -0.113164 +i* 0.993538| 0.999962|-4.34919E-12 +i* 9.60242E-13| +| 3| -0.226885 +i* -0.973981| 1.00006|-5.81993E-10 +i*-4.18547E-10| +| 4| -0.715763 +i* 0.698289| 0.999962| 9.11271E-13 +i* 2.47219E-12| +| 5| 0.439922 +i* -0.897993| 0.999962|-3.49498E-13 +i* 1.66432E-12| +| 6| -0.996122 +i* 0.0886386| 1.00006| 4.72785E-10 +i* 4.13616E-11| +| 7| 0.908546 +i* -0.417692| 0.999962| 4.78506E-13 +i* 1.54377E-13| +| 8| -0.827813 +i* -0.560935| 0.999962| 9.76996E-13 +i*-2.04309E-12| +| 9| 0.968129 +i* 0.250682| 1.00006|-2.31715E-10 +i* 1.34848E-10| +| 10| -0.286842 +i* -0.958038| 1.00006|-5.93554E-10 +i*-2.45345E-10| +| 11| 0.591653 +i* 0.806145| 0.999962|-9.87654E-13 +i*-3.03635E-12| +| 12| -0.0511836 +i* 0.998651| 0.999962|-2.22622E-12 +i*-3.69013E-14| +| 13| -0.67097 +i* 0.741432| 0.999962|-8.03801E-14 +i*-1.68204E-12| +| 14| 0.383249 +i* -0.923603| 0.999962|-1.29119E-12 +i*-1.37426E-12| +| 15| -0.988685 +i* 0.15039| 1.00006|-1.61051E-10 +i* 7.18515E-11| +| 16| 0.880824 +i* -0.473363| 0.999962| 1.58029E-12 +i*-2.34379E-12| +| 17| -0.861082 +i* -0.508391| 0.999962| 1.02962E-12 +i*-4.51911E-12| +| 18| 0.98184 +i* 0.190015| 1.00006| 8.88373E-10 +i*-2.66385E-10| +| 19| -0.345842 +i* -0.938354| 1.00006| 1.38421E-10 +i*-2.31696E-10| +| 20| 0.640621 +i* 0.767807| 0.999962|-6.98774E-13 +i* 1.13798E-12| ++---+----------------------------+------------+----------------------------+ +40000 racines de module = 1.00006 +60000 racines de module = 0.999962 +proc 0 +proc 1 +proc 2 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^50000 + (-10 +i*0)*x^150000 + (1 +i*0)*x^200000 + +(-5000 +i*0)*x^49999 + (-1.5E+06 +i*0)*x^149999 + (200000 +i*0)*x^199999 + +zone limite de 'log-exp' 1.00178 +zone limite de 'log-exp' 1.00178 +zone limite de 'log-exp' 1.00178 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 2, start 133460 size 66730 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 1, start 66730 size 66730 +proc 1 start 66730 size 66730 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 0, start 0 size 66730 +proc 0 start 0 size 66730 +proc 2 start 133460 size 66730 +iter : 1 Arret : 0.000533936 s/iter 1.097687 +iter : 2 Arret : 0.00054918 s/iter 1.097788 +iter : 3 Arret : 0.000302619 s/iter 1.097094 +iter : 4 Arret : 0.000610723 s/iter 1.097469 +iter : 5 Arret : 0.0013942 s/iter 1.097408 +iter : 6 Arret : 0.0123305 s/iter 1.097332 +iter : 7 Arret : 0.0276413 s/iter 1.097585 +iter : 8 Arret : 0.0390327 s/iter 1.097910 +iter : 9 Arret : 0.0768762 s/iter 1.098286 +iter : 10 Arret : 0.261559 s/iter 1.199021 +iter : 11 Arret : 0.996838 s/iter 1.231967 +iter : 12 Arret : 2.41454 s/iter 1.226149 +iter : 13 Arret : 2.18621 s/iter 1.224592 +iter : 14 Arret : 1.07886 s/iter 1.189416 +iter : 15 Arret : 2.0468 s/iter 1.225182 +iter : 16 Arret : 2.06331 s/iter 1.228381 +iter : 17 Arret : 0.85728 s/iter 1.201017 +iter : 18 Arret : 0.652722 s/iter 1.225600 +iter : 19 Arret : 0.985485 s/iter 1.227406 +iter : 20 Arret : 4.10993 s/iter 1.228101 +iter : 21 Arret : 0.600123 s/iter 1.227670 +iter : 22 Arret : 0.86582 s/iter 1.231663 +iter : 23 Arret : 0.31213 s/iter 1.227752 +iter : 24 Arret : 0.424877 s/iter 1.223962 +iter : 25 Arret : 0.275449 s/iter 1.097197 +iter : 26 Arret : 0.212806 s/iter 1.221990 +iter : 27 Arret : 0.124734 s/iter 1.097336 +iter : 28 Arret : 0.088182 s/iter 1.096934 +iter : 29 Arret : 0.0330763 s/iter 1.097169 +iter : 30 Arret : 0.0100338 s/iter 1.097086 +iter : 31 Arret : 0.000168049 s/iter 1.097161 +iter : 32 Arret : 7.37376E-08 s/iter 1.096969 +iter : 33 Arret : 7.38629E-12 s/iter 1.097234 +iter : 34 Arret : 7.3696E-16 s/iter 1.097489 +temps : 39.5342 seconde(s) +Nb iterations : 34 +Nb de depassements de capacite exponentielle : 0 +Precision : 9.52377E-08 +Stabilite : 7.3696E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540303 +i* 0.841453| 0.999985| 1.08703E-11 +i*-2.49217E-12| +| 2| -0.837195 +i* 0.546877| 0.999985| -5.4492E-12 +i* 1.09163E-12| +| 3| -0.553418 +i* -0.832885| 0.999985| -1.9722E-12 +i*-7.40397E-12| +| 4| 0.828599 +i* -0.559925| 1.00005|-7.54521E-09 +i* 1.47059E-08| +| 5| -0.8197 +i* 0.572767| 0.999985|-4.21663E-13 +i* -2.8616E-12| +| 6| -0.57917 +i* -0.815188| 0.999985|-5.13034E-12 +i*-1.52645E-12| +| 7| 0.810626 +i* -0.585537| 0.999985|-6.36846E-12 +i*-5.86797E-12| +| 8| 0.592783 +i* 0.805419| 1.00005| 1.3403E-08 +i* 2.35166E-09| +| 9| -0.800777 +i* 0.59904| 1.00005|-1.05967E-08 +i* 2.82759E-08| +| 10| -0.604356 +i* -0.796695| 0.999985|-1.64091E-13 +i* 1.59084E-12| +| 11| 0.791937 +i* -0.610578| 0.999985| 6.0707E-13 +i* 1.52922E-12| +| 12| 0.616763 +i* 0.78713| 0.999985|-4.48042E-12 +i* -2.6295E-12| +| 13| -0.782301 +i* 0.622877| 0.999985|-2.15827E-12 +i*-6.27114E-12| +| 14| -0.628991 +i* -0.777472| 1.00005| 6.93065E-09 +i*-8.65443E-09| +| 15| 0.772474 +i* -0.635023| 0.999985| 1.54783E-11 +i*-1.81338E-12| +| 16| 0.641054 +i* 0.767476| 0.999985| 9.05009E-12 +i*-2.91295E-12| +| 17| -0.762458 +i* 0.647014| 0.999985| 5.81724E-12 +i*-9.99384E-12| +| 18| -0.652967 +i* -0.757366| 0.999985|-6.31406E-12 +i* 8.49495E-12| +| 19| 0.752302 +i* -0.658888| 1.00005| 3.99107E-09 +i* 1.02117E-08| +| 20| 0.66472 +i* 0.747072| 0.999985|-7.79776E-12 +i*-2.52076E-13| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 0.999985 +50000 racines de module = 1.00005 +proc 1 +proc 2 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^150000 + (-10 +i*0)*x^250000 + (1 +i*0)*x^400000 + +(-15000 +i*0)*x^149999 + (-2.5E+06 +i*0)*x^249999 + (400000 +i*0)*x^399999 + +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 1, start 133376 size 133376 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 2, start 266752 size 133376 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 0, start 0 size 133376 +proc 2 start 266752 size 133376 +proc 1 start 133376 size 133376 +proc 0 start 0 size 133376 +iter : 1 Arret : 0.000533421 s/iter 3.991725 +iter : 2 Arret : 0.00367072 s/iter 3.993299 +iter : 3 Arret : 0.00493773 s/iter 4.310647 +iter : 4 Arret : 0.00496697 s/iter 3.992603 +iter : 5 Arret : 0.0140779 s/iter 3.991503 +iter : 6 Arret : 0.0122345 s/iter 3.993227 +iter : 7 Arret : 0.0118851 s/iter 4.320085 +iter : 8 Arret : 0.00413608 s/iter 3.992019 +iter : 9 Arret : 0.0042286 s/iter 4.269756 +iter : 10 Arret : 0.00316824 s/iter 3.992259 +iter : 11 Arret : 0.00072238 s/iter 3.992655 +iter : 12 Arret : 0.000430893 s/iter 3.992601 +iter : 13 Arret : 0.000433942 s/iter 3.991813 +iter : 14 Arret : 0.000150382 s/iter 3.993178 +iter : 15 Arret : 0.000238887 s/iter 3.991814 +iter : 16 Arret : 0.000121494 s/iter 3.993291 +iter : 17 Arret : 9.71544E-07 s/iter 3.992093 +iter : 18 Arret : 2.43359E-09 s/iter 3.992688 +iter : 19 Arret : 5.24302E-12 s/iter 3.992746 +iter : 20 Arret : 5.96461E-14 s/iter 3.992444 +temps : 81.0542 seconde(s) +Nb iterations : 20 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.49185E-08 +Stabilite : 1.1328E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.84144| 0.999991| 6.97609E-12 +i* 5.61207E-12| +| 2| -0.998329 +i* 0.057622| 0.999991| 4.43912E-12 +i* 1.27665E-12| +| 3| 0.439867 +i* -0.898052| 0.999991|-8.50653E-12 +i*-8.85586E-12| +| 4| -0.996033 +i* 0.0888768| 0.999991|-3.15592E-12 +i* 1.17456E-12| +| 5| 0.411559 +i* -0.9114| 1.00002| 1.04334E-09 +i*-9.84037E-10| +| 6| 0.59196 +i* 0.805956| 0.999991| 5.24358E-13 +i*-8.53073E-12| +| 7| -0.992759 +i* 0.120044| 0.999991| 2.58804E-12 +i* 2.47274E-12| +| 8| 0.382796 +i* -0.923823| 0.999991|-1.63092E-11 +i* 4.26312E-12| +| 9| 0.616925 +i* 0.78701| 0.999991| 4.27514E-12 +i*-1.13966E-11| +| 10| -0.988534 +i* 0.151098| 1.00002|-8.27014E-10 +i* 9.44171E-10| +| 11| 0.35366 +i* -0.935364| 0.999991|-1.92664E-11 +i* 1.19958E-11| +| 12| 0.641299 +i* 0.767311| 1.00002|-2.44657E-09 +i* -6.7886E-11| +| 13| -0.983286 +i* 0.18202| 0.999991| 3.21676E-12 +i*-9.48297E-13| +| 14| 0.324176 +i* -0.945987| 0.999991| 1.53594E-11 +i*-1.57324E-12| +| 15| 0.66503 +i* 0.746804| 0.999991| 5.74873E-13 +i* 8.53884E-12| +| 16| -0.977132 +i* 0.212706| 1.00002|-2.02093E-10 +i* 3.44548E-10| +| 17| 0.294374 +i* -0.955681| 0.999991| -1.2063E-11 +i* 1.32238E-11| +| 18| 0.688092 +i* 0.725645| 1.00002|-4.51021E-09 +i* 1.95437E-09| +| 19| -0.969965 +i* 0.243206| 0.999991| 6.88072E-12 +i* 3.20268E-13| +| 20| 0.264283 +i* -0.964436| 0.999991| 2.5573E-11 +i*-6.45539E-12| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 0.999991 +150000 racines de module = 1.00002 +proc 2 +proc 0 +proc 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^250000 + (-10 +i*0)*x^350000 + (1 +i*0)*x^600000 + +(-25000 +i*0)*x^249999 + (-3.5E+06 +i*0)*x^349999 + (600000 +i*0)*x^599999 + +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 1, start 200021 size 200021 +proc 1 start 200021 size 200021 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 200021 +proc 0 start 0 size 200021 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 2, start 400042 size 200021 +proc 2 start 400042 size 200021 +iter : 1 Arret : 0.00226498 s/iter 9.046598 +iter : 2 Arret : 0.286514 s/iter 9.041345 +iter : 3 Arret : 0.37126 s/iter 9.194828 +iter : 4 Arret : 0.357158 s/iter 9.425406 +iter : 5 Arret : 0.489627 s/iter 9.503770 +iter : 6 Arret : 0.0394603 s/iter 9.532369 +iter : 7 Arret : 0.0346491 s/iter 9.595128 +iter : 8 Arret : 0.058482 s/iter 9.502225 +iter : 9 Arret : 0.0456855 s/iter 9.517820 +iter : 10 Arret : 0.00888245 s/iter 9.163517 +iter : 11 Arret : 0.00755074 s/iter 9.164057 +iter : 12 Arret : 0.00999277 s/iter 9.132635 +iter : 13 Arret : 0.00331316 s/iter 9.163813 +iter : 14 Arret : 0.00348352 s/iter 9.037872 +iter : 15 Arret : 0.00131143 s/iter 9.062842 +iter : 16 Arret : 0.000194649 s/iter 9.032916 +iter : 17 Arret : 0.000108537 s/iter 9.040569 +iter : 18 Arret : 4.32539E-06 s/iter 9.040533 +iter : 19 Arret : 1.30764E-08 s/iter 9.032518 +iter : 20 Arret : 5.19734E-11 s/iter 9.039277 +iter : 21 Arret : 2.06945E-13 s/iter 9.037120 +temps : 193.628 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.29984E-05 +Stabilite : 6.87034E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540302 +i* 0.841463| 0.999993| 8.34199E-12 +i* -1.9051E-11| +| 2| -0.553438 +i* -0.832883| 0.999993|-4.48197E-12 +i* 2.11486E-11| +| 3| -0.579282 +i* -0.815119| 0.999993| 1.33613E-11 +i*-1.98701E-11| +| 4| 0.592014 +i* 0.805919| 0.999993|-3.98037E-12 +i* 9.55808E-12| +| 5| -0.604557 +i* -0.796554| 0.999993|-2.82974E-12 +i* 9.99473E-12| +| 6| 0.61698 +i* 0.78697| 0.999993|-4.77973E-12 +i* 2.40621E-11| +| 7| -0.629237 +i* -0.777205| 0.999993|-2.92122E-12 +i*-4.85867E-12| +| 8| 0.641354 +i* 0.767237| 0.999993|-1.64209E-11 +i* 1.12904E-12| +| 9| -0.653299 +i* -0.757092| 0.999993|-8.22453E-13 +i* 2.82818E-12| +| 10| 0.665096 +i* 0.746749| 0.999993| -1.2145E-11 +i* 1.89129E-11| +| 11| -0.676717 +i* -0.736234| 0.999993|-1.26079E-11 +i*-1.25073E-11| +| 12| 0.688185 +i* 0.725526| 0.999993|-4.43978E-12 +i*-2.31382E-11| +| 13| -0.699466 +i* -0.714679| 1.00001| 3.92343E-10 +i*-3.02623E-09| +| 14| 0.710597 +i* 0.70359| 0.999993| 1.28564E-11 +i* 1.56626E-11| +| 15| -0.721517 +i* -0.69241| 1.00001| 1.76709E-09 +i*-4.04041E-09| +| 16| 0.73231 +i* 0.680962| 0.999993| 1.34706E-11 +i*-4.43489E-12| +| 17| -0.742904 +i* -0.669389| 0.999993|-7.78222E-12 +i* 1.50098E-11| +| 18| 0.7533 +i* 0.657691| 1.00001| 1.64587E-09 +i*-3.03669E-09| +| 19| -0.763538 +i* -0.645777| 1.00001|-8.22278E-10 +i*-5.86372E-10| +| 20| 0.773539 +i* 0.633763| 1.00001| -4.2314E-09 +i* 1.86243E-09| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 0.999993 +250000 racines de module = 1.00001 +proc 1 +proc 2 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^300000 + (-10 +i*0)*x^500000 + (1 +i*0)*x^800000 + +(-30000 +i*0)*x^299999 + (-5E+06 +i*0)*x^499999 + (800000 +i*0)*x^799999 + +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 1, start 266666 size 266666 +proc 1 start 266666 size 266666 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 2, start 533332 size 266666 +proc 2 start 533332 size 266666 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 266666 +proc 0 start 0 size 266666 +iter : 1 Arret : 0.013303 s/iter 15.845449 +iter : 2 Arret : 1.22368 s/iter 15.831599 +iter : 3 Arret : 0.34478 s/iter 15.835186 +iter : 4 Arret : 0.804966 s/iter 15.861997 +iter : 5 Arret : 0.957981 s/iter 15.872722 +iter : 6 Arret : 0.716801 s/iter 16.172143 +iter : 7 Arret : 0.496135 s/iter 16.224317 +iter : 8 Arret : 0.326979 s/iter 16.181063 +iter : 9 Arret : 0.252467 s/iter 16.538160 +iter : 10 Arret : 0.244395 s/iter 16.297675 +iter : 11 Arret : 0.173672 s/iter 16.136429 +iter : 12 Arret : 0.197369 s/iter 16.323607 +iter : 13 Arret : 0.168305 s/iter 16.324722 +iter : 14 Arret : 0.168579 s/iter 16.212899 +iter : 15 Arret : 0.208926 s/iter 16.207350 +iter : 16 Arret : 0.165995 s/iter 16.153929 +iter : 17 Arret : 0.223284 s/iter 16.250807 +iter : 18 Arret : 0.324113 s/iter 16.164325 +iter : 19 Arret : 0.771739 s/iter 16.136061 +iter : 20 Arret : 1.00477 s/iter 16.138977 +iter : 21 Arret : 1.00247 s/iter 16.140663 +iter : 22 Arret : 0.543015 s/iter 16.140175 +iter : 23 Arret : 0.476319 s/iter 15.852664 +iter : 24 Arret : 0.401176 s/iter 15.844834 +iter : 25 Arret : 0.142005 s/iter 15.837565 +iter : 26 Arret : 0.0393995 s/iter 15.832097 +iter : 27 Arret : 0.0199662 s/iter 15.824967 +iter : 28 Arret : 0.00992138 s/iter 15.835004 +iter : 29 Arret : 0.00549329 s/iter 15.825203 +iter : 30 Arret : 0.000480868 s/iter 15.805032 +iter : 31 Arret : 3.00435E-06 s/iter 15.832975 +iter : 32 Arret : 3.08148E-09 s/iter 15.816239 +iter : 33 Arret : 6.64256E-12 s/iter 15.831931 +iter : 34 Arret : 1.43767E-14 s/iter 15.816196 +temps : 545.367 seconde(s) +Nb iterations : 34 +Nb de depassements de capacite exponentielle : 0 +Precision : 12.9528 +Stabilite : 2.22043E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841464| 0.999995| -2.03E-11 +i* 2.74701E-11| +| 2| 0.592014 +i* 0.805922| 0.999995|-1.82734E-11 +i* 2.10218E-11| +| 3| 0.617007 +i* 0.786952| 0.999995| 4.23442E-11 +i* -6.2147E-12| +| 4| 0.641392 +i* 0.767207| 0.999995| 6.90537E-12 +i*-5.12417E-11| +| 5| 0.665146 +i* 0.746707| 0.999995| 2.02977E-11 +i* 7.48579E-12| +| 6| 0.688245 +i* 0.725472| 0.999995|-1.73153E-11 +i* -1.2656E-11| +| 7| 0.710675 +i* 0.703514| 0.999995|-8.58691E-12 +i* 2.79902E-11| +| 8| 0.732388 +i* 0.68088| 0.999995| 9.45355E-12 +i* 2.09024E-11| +| 9| 0.753381 +i* 0.657577| 0.999995|-1.40248E-11 +i* 5.11502E-11| +| 10| 0.77364 +i* 0.633618| 0.999995|-1.72307E-11 +i* 1.22723E-11| +| 11| 0.793138 +i* 0.609034| 0.999995| 3.89222E-12 +i* 2.21356E-11| +| 12| 0.811855 +i* 0.583851| 0.999995|-1.28337E-11 +i*-5.47207E-12| +| 13| 0.829772 +i* 0.558094| 0.999995|-1.63114E-11 +i*-1.64246E-12| +| 14| 0.846873 +i* 0.531786| 0.999995|-1.80345E-12 +i* 5.96675E-11| +| 15| 0.863146 +i* 0.504945| 0.999995|-1.01228E-11 +i* 1.20409E-11| +| 16| 0.878557 +i* 0.477628| 0.999995|-2.16493E-12 +i* 1.10533E-11| +| 17| 0.893104 +i* 0.449841| 0.999995|-1.48552E-11 +i* 1.06063E-11| +| 18| 0.906777 +i* 0.4216| 0.999995|-1.38745E-11 +i* 5.33384E-12| +| 19| 0.919557 +i* 0.392944| 0.999995|-3.33245E-11 +i* 5.94386E-12| +| 20| 0.931433 +i* 0.363901| 0.999995| 4.93219E-11 +i*-2.82651E-11| ++---+----------------------------+------------+----------------------------+ +499999 racines de module = 0.999995 +299999 racines de module = 1.00001 + 2 racines de module = 1 +proc 0 +proc 1 +proc 2 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^400000 + (-10 +i*0)*x^600000 + (1 +i*0)*x^1000000 + +(-40000 +i*0)*x^399999 + (-6E+06 +i*0)*x^599999 + (1E+06 +i*0)*x^999999 + +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 1, start 333397 size 333397 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 2, start 666794 size 333397 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 0, start 0 size 333397 +proc 0 start 0 size 333397 +proc 1 start 333397 size 333397 +proc 2 start 666794 size 333397 +iter : 1 Arret : 0.000575468 s/iter 24.305180 +iter : 2 Arret : 0.00170361 s/iter 24.785627 +iter : 3 Arret : 0.00222192 s/iter 24.748506 +iter : 4 Arret : 0.017164 s/iter 24.358793 +iter : 5 Arret : 0.0140181 s/iter 24.395447 +iter : 6 Arret : 0.00863706 s/iter 24.606501 +iter : 7 Arret : 0.00646893 s/iter 24.858810 +iter : 8 Arret : 0.00503905 s/iter 24.788762 +iter : 9 Arret : 0.0052262 s/iter 24.427751 +iter : 10 Arret : 0.00485981 s/iter 24.358969 +iter : 11 Arret : 0.00893375 s/iter 24.357900 +iter : 12 Arret : 0.00681765 s/iter 24.368587 +iter : 13 Arret : 0.0016963 s/iter 24.362646 +iter : 14 Arret : 0.00106588 s/iter 24.361655 +iter : 15 Arret : 0.000173681 s/iter 24.354770 +iter : 16 Arret : 1.82719E-05 s/iter 24.350867 +iter : 17 Arret : 2.03911E-05 s/iter 24.358719 +iter : 18 Arret : 3.78438E-06 s/iter 24.284202 +iter : 19 Arret : 1.28475E-07 s/iter 24.295585 +iter : 20 Arret : 1.88663E-09 s/iter 24.290679 +iter : 21 Arret : 2.81124E-11 s/iter 24.288024 +iter : 22 Arret : 4.1882E-13 s/iter 24.288788 +temps : 542.745 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.4225E-07 +Stabilite : 4.77796E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841468| 0.999996| 5.07216E-12 +i* 6.41236E-12| +| 2| 0.529701 +i* 0.84818| 0.999996|-4.61853E-13 +i*-4.17888E-12| +| 3| 0.524361 +i* 0.851491| 0.999996|-2.47296E-11 +i* 1.78327E-11| +| 4| 0.51901 +i* 0.854764| 0.999996| 9.45599E-12 +i* 2.07434E-11| +| 5| 0.513629 +i* 0.858008| 0.999996| 2.32483E-11 +i* 6.70747E-12| +| 6| 0.508237 +i* 0.861213| 0.999996|-1.34339E-11 +i* 9.87854E-12| +| 7| 0.502825 +i* 0.864384| 0.999996|-3.18459E-11 +i* 7.64744E-12| +| 8| 0.497384 +i* 0.867526| 0.999996| 2.97429E-11 +i*-6.06626E-13| +| 9| 0.491932 +i* 0.870629| 0.999996|-1.74121E-11 +i*-2.86359E-11| +| 10| 0.486452 +i* 0.873703| 0.999996| 3.0312E-11 +i* 1.02214E-11| +| 11| 0.480962 +i* 0.876737| 0.999996| 1.81546E-11 +i* 8.04012E-12| +| 12| 0.475453 +i* 0.879736| 0.999996| 3.09861E-11 +i* 4.093E-12| +| 13| 0.469917 +i* 0.882706| 0.999996|-1.29106E-11 +i*-2.31489E-11| +| 14| 0.46437 +i* 0.885637| 0.999996| 1.38481E-11 +i* -1.517E-11| +| 15| 0.458797 +i* 0.888537| 0.999996| 2.78862E-11 +i* 1.10441E-11| +| 16| 0.453214 +i* 0.891397| 0.999996| 2.45506E-11 +i* 3.1726E-11| +| 17| 0.447614 +i* 0.894223| 0.999996|-1.08491E-12 +i*-2.12277E-11| +| 18| 0.441986 +i* 0.897017| 0.999996| 2.72476E-11 +i* 3.22485E-11| +| 19| 0.436351 +i* 0.899772| 0.999996| 2.92226E-11 +i* 2.71536E-11| +| 20| 0.430689 +i* 0.902496| 0.999996|-1.25435E-11 +i* 3.86925E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 0.999996 +400000 racines de module = 1.00001 +proc 1 +proc 2 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^700000 + (1 +i*0)*x^1200000 + +(-50000 +i*0)*x^499999 + (-7E+06 +i*0)*x^699999 + (1.2E+06 +i*0)*x^1199999 + +zone limite de 'log-exp' 1.0003 +zone limite de 'log-exp' 1.0003 +zone limite de 'log-exp' 1.0003 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 1, start 400042 size 400042 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 0, start 0 size 400042 +proc 1 start 400042 size 400042 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 2, start 800084 size 400042 +proc 2 start 800084 size 400042 +proc 0 start 0 size 400042 +iter : 1 Arret : 0.00577737 s/iter 35.191437 +iter : 2 Arret : 1.60124 s/iter 35.687308 +iter : 3 Arret : 2.50845 s/iter 38.522110 +iter : 4 Arret : 0.88974 s/iter 37.972511 +iter : 5 Arret : 1.13571 s/iter 38.354084 +iter : 6 Arret : 0.802875 s/iter 38.309790 +iter : 7 Arret : 1.23189 s/iter 38.251469 +iter : 8 Arret : 2.00112 s/iter 38.369432 +iter : 9 Arret : 0.783463 s/iter 39.250540 +iter : 10 Arret : 1.64822 s/iter 38.419390 +iter : 11 Arret : 1.13791 s/iter 38.520696 +iter : 12 Arret : 4.19099 s/iter 38.244319 +iter : 13 Arret : 1.7036 s/iter 37.449747 +iter : 14 Arret : 0.953437 s/iter 37.710513 +iter : 15 Arret : 0.86512 s/iter 37.422749 +iter : 16 Arret : 3.83001 s/iter 37.601442 +iter : 17 Arret : 1.37636 s/iter 37.548538 +iter : 18 Arret : 1.57226 s/iter 37.331887 +iter : 19 Arret : 0.995472 s/iter 37.376323 +iter : 20 Arret : 0.780537 s/iter 37.065303 +iter : 21 Arret : 3.73222 s/iter 36.965816 +iter : 22 Arret : 1.52875 s/iter 36.851015 +iter : 23 Arret : 0.925666 s/iter 36.788322 +iter : 24 Arret : 0.416457 s/iter 36.673216 +iter : 25 Arret : 1.21819 s/iter 36.551043 +iter : 26 Arret : 0.782138 s/iter 36.720148 +iter : 27 Arret : 0.611118 s/iter 36.382233 +iter : 28 Arret : 1.40936 s/iter 36.605900 +iter : 29 Arret : 0.136834 s/iter 36.551610 +iter : 30 Arret : 0.982775 s/iter 36.549899 +iter : 31 Arret : 0.482303 s/iter 36.446318 +iter : 32 Arret : 0.314354 s/iter 35.262030 +iter : 33 Arret : 0.221468 s/iter 35.437839 +iter : 34 Arret : 0.148832 s/iter 35.903162 +iter : 35 Arret : 0.0771528 s/iter 35.243527 +iter : 36 Arret : 0.00786376 s/iter 35.408694 +iter : 37 Arret : 0.00153832 s/iter 35.423139 +iter : 38 Arret : 0.00226222 s/iter 35.250849 +iter : 39 Arret : 0.000875734 s/iter 35.254600 +iter : 40 Arret : 2.10425E-05 s/iter 35.253398 +iter : 41 Arret : 2.59204E-06 s/iter 35.253869 +iter : 42 Arret : 2.06088E-08 s/iter 35.143640 +iter : 43 Arret : 8.18267E-11 s/iter 35.260245 +iter : 44 Arret : 3.25714E-13 s/iter 35.264980 +temps : 1617.65 seconde(s) +Nb iterations : 44 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.09088E-05 +Stabilite : 2.22047E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54031 +i* 0.841472| 1| 1.4588E-09 +i* 4.51768E-09| +| 2| 0.513629 +i* 0.858008| 0.999997| 3.02357E-11 +i* 3.41858E-11| +| 3| 0.486451 +i* 0.873713| 1|-5.85295E-09 +i*-2.49566E-10| +| 4| 0.458789 +i* 0.888542| 0.999997| 2.48135E-13 +i*-2.88822E-11| +| 5| 0.430677 +i* 0.902502| 0.999997|-2.03271E-11 +i*-3.18325E-11| +| 6| 0.402092 +i* 0.915605| 1| 5.55538E-09 +i*-1.34284E-09| +| 7| 0.3732 +i* 0.927747| 0.999997| -2.5707E-11 +i* 3.11093E-13| +| 8| 0.3439 +i* 0.939003| 0.999997|-1.12714E-11 +i* 1.5453E-11| +| 9| 0.314261 +i* 0.949333| 0.999997| 5.41895E-11 +i*-2.05278E-11| +| 10| 0.284313 +i* 0.958728| 0.999997| 2.69426E-11 +i* 2.77974E-11| +| 11| 0.254084 +i* 0.967179| 0.999997| 1.5277E-11 +i* 4.73027E-12| +| 12| 0.223605 +i* 0.974676| 0.999997| -8.1017E-11 +i*-3.77299E-11| +| 13| 0.192915 +i* 0.981212| 0.999997| 1.07495E-11 +i* 5.766E-12| +| 14| 0.162017 +i* 0.986785| 0.999997| 4.59321E-12 +i*-4.42106E-13| +| 15| 0.130977 +i* 0.991382| 0.999997| 5.89659E-11 +i* 7.29122E-12| +| 16| 0.0997898 +i* 0.995005| 0.999997|-3.84177E-11 +i*-1.21923E-11| +| 17| 0.0685136 +i* 0.997647| 0.999997|-2.98188E-11 +i* 2.79243E-12| +| 18| 0.0371504 +i* 0.999314| 1|-3.18728E-10 +i*-2.97119E-09| +| 19| 0.00578048 +i* 0.99998| 0.999997| 3.46787E-11 +i* 1.94857E-13| +| 20| -0.0256056 +i* 0.999669| 0.999997| 2.01068E-11 +i*-1.22213E-12| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +700000 racines de module = 0.999997 +proc 0 +proc 1 +proc 2 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^600000 + (-10 +i*0)*x^800000 + (1 +i*0)*x^1400000 + +(-60000 +i*0)*x^599999 + (-8E+06 +i*0)*x^799999 + (1.4E+06 +i*0)*x^1399999 + +zone limite de 'log-exp' 1.00025 +zone limite de 'log-exp' 1.00025 +zone limite de 'log-exp' 1.00025 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 1, start 466688 size 466688 +proc 1 start 466688 size 466688 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 2, start 933376 size 466688 +proc 2 start 933376 size 466688 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 0, start 0 size 466688 +proc 0 start 0 size 466688 +iter : 1 Arret : 0.0476652 s/iter 48.053051 +iter : 2 Arret : 1.02145 s/iter 49.162936 +iter : 3 Arret : 3.11851 s/iter 50.138080 +iter : 4 Arret : 1.87547 s/iter 50.661272 +iter : 5 Arret : 1.24028 s/iter 52.617942 +iter : 6 Arret : 1.33274 s/iter 52.723740 +iter : 7 Arret : 1.1089 s/iter 52.451625 +iter : 8 Arret : 1.32856 s/iter 53.817849 +iter : 9 Arret : 0.584436 s/iter 54.233382 +iter : 10 Arret : 0.682561 s/iter 53.018367 +iter : 11 Arret : 1.10899 s/iter 52.903852 +iter : 12 Arret : 1.24673 s/iter 52.699001 +iter : 13 Arret : 2.03756 s/iter 51.822577 +iter : 14 Arret : 0.74595 s/iter 51.940124 +iter : 15 Arret : 0.336711 s/iter 51.566761 +iter : 16 Arret : 0.386748 s/iter 51.449106 +iter : 17 Arret : 0.175345 s/iter 51.008579 +iter : 18 Arret : 0.0799077 s/iter 50.523143 +iter : 19 Arret : 0.106562 s/iter 50.311514 +iter : 20 Arret : 0.102063 s/iter 50.013859 +iter : 21 Arret : 0.0811226 s/iter 48.967237 +iter : 22 Arret : 0.0777804 s/iter 48.802184 +iter : 23 Arret : 0.06176 s/iter 48.968763 +iter : 24 Arret : 0.0274141 s/iter 48.869900 +iter : 25 Arret : 0.0246722 s/iter 48.033190 +iter : 26 Arret : 0.0140326 s/iter 48.024256 +iter : 27 Arret : 0.00823776 s/iter 48.046597 +iter : 28 Arret : 0.00458441 s/iter 48.050189 +iter : 29 Arret : 0.000250093 s/iter 48.028503 +iter : 30 Arret : 6.92011E-06 s/iter 48.046144 +iter : 31 Arret : 1.1801E-07 s/iter 48.051103 +iter : 32 Arret : 1.60292E-09 s/iter 48.032612 +iter : 33 Arret : 2.20691E-11 s/iter 48.032677 +iter : 34 Arret : 3.03651E-13 s/iter 48.049192 +temps : 1707.73 seconde(s) +Nb iterations : 34 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.35409E-07 +Stabilite : 2.22046E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841469| 0.999997|-8.47142E-11 +i* 1.92466E-11| +| 2| 0.513623 +i* 0.858013| 0.999997|-2.15776E-11 +i*-2.98557E-11| +| 3| -0.52703 +i* -0.849843| 0.999997|-6.50922E-11 +i* 8.44216E-12| +| 4| 0.486439 +i* 0.873711| 0.999997|-3.15932E-11 +i*-1.15957E-12| +| 5| -0.500096 +i* -0.865967| 0.999997| 3.56147E-11 +i*-3.12713E-11| +| 6| 0.458776 +i* 0.888549| 0.999997|-1.89702E-11 +i* 4.08274E-12| +| 7| -0.472669 +i* -0.881237| 0.999997|-1.66496E-11 +i*-3.61498E-11| +| 8| 0.430661 +i* 0.902511| 0.999997|-1.60558E-11 +i*-1.29949E-11| +| 9| -0.444791 +i* -0.895631| 0.999997|-8.89955E-13 +i* 2.61938E-12| +| 10| 0.402136 +i* 0.915577| 0.999997| 6.5834E-12 +i* -1.3935E-11| +| 11| -0.416432 +i* -0.909164| 0.999997| 1.97816E-11 +i* 3.10848E-11| +| 12| 0.373171 +i* 0.927759| 0.999997|-2.17995E-11 +i*-2.96867E-12| +| 13| -0.387698 +i* -0.921783| 0.999997|-1.86324E-11 +i* -4.6545E-11| +| 14| 0.343875 +i* 0.939012| 0.999997| 3.84962E-11 +i* 2.59646E-11| +| 15| -0.358575 +i* -0.933498| 0.999997|-3.74776E-11 +i*-3.89954E-11| +| 16| 0.314233 +i* 0.949343| 0.999997| 1.02587E-11 +i*-4.25648E-11| +| 17| -0.329098 +i* -0.944293| 0.999997|-1.57903E-11 +i* 2.05052E-11| +| 18| 0.284281 +i* 0.958738| 0.999997| 2.51592E-11 +i* 2.09243E-11| +| 19| -0.299297 +i* -0.954157| 0.999997| 5.03608E-12 +i* 1.70503E-11| +| 20| 0.254048 +i* 0.967189| 0.999997|-2.81228E-11 +i*-1.66302E-11| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 0.999997 +600000 racines de module = 1 +proc 0 +proc 1 +proc 2 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^700000 + (-10 +i*0)*x^900000 + (1 +i*0)*x^1600000 + +(-70000 +i*0)*x^699999 + (-9E+06 +i*0)*x^899999 + (1.6E+06 +i*0)*x^1599999 + + +template:31135 terminated with signal 11 at PC=404b41 SP=7fffb89650f0. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:31134 terminated with signal 11 at PC=404b41 SP=7fff9a829580. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:31136 terminated with signal 11 at PC=404b41 SP=7fffe0fa8a40. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 1 with PID 31135 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- +proc 1 +proc 2 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^800000 + (-10 +i*0)*x^1000000 + (1 +i*0)*x^1800000 + +(-80000 +i*0)*x^799999 + (-1E+07 +i*0)*x^999999 + (1.8E+06 +i*0)*x^1799999 + + +template:31146 terminated with signal 11 at PC=404b41 SP=7fff82ca5fc0. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:31144 terminated with signal 11 at PC=404b41 SP=7fff0a32a700. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:31145 terminated with signal 11 at PC=404b41 SP=7fff9885ac60. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 1 with PID 31145 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- +proc 1 +proc 2 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^1500000 + (1 +i*0)*x^2000000 + +(-50000 +i*0)*x^499999 + (-1.5E+07 +i*0)*x^1499999 + (2E+06 +i*0)*x^1999999 + + +template:31155 terminated with signal 11 at PC=404b41 SP=7fff5c26c610. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:31154 terminated with signal 11 at PC=404b41 SP=7fffd7c701a0. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:31156 terminated with signal 11 at PC=404b41 SP=7fff9a2a1b00. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 1 with PID 31155 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- diff --git a/Simulations/sparse_mpi/sparse_mpi_3GPU.sge b/Simulations/sparse_mpi/sparse_mpi_3GPU.sge new file mode 100755 index 0000000..e779c55 --- /dev/null +++ b/Simulations/sparse_mpi/sparse_mpi_3GPU.sge @@ -0,0 +1,25 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=3 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -V +#$ -cwd +#$ -N sparse_mpi_3GPU +#$ -pe mpi 3 + + +module load cuda/7.0 +module load ompi/gcc + +mpirun -np $NSLOTS ./template -r -i 60000 40000 +mpirun -np $NSLOTS ./template -r -i 150000 50000 +mpirun -np $NSLOTS ./template -r -i 250000 150000 +mpirun -np $NSLOTS ./template -r -i 350000 250000 +mpirun -np $NSLOTS ./template -r -i 500000 300000 +mpirun -np $NSLOTS ./template -r -i 600000 400000 +mpirun -np $NSLOTS ./template -r -i 700000 500000 +mpirun -np $NSLOTS ./template -r -i 800000 600000 +mpirun -np $NSLOTS ./template -r -i 900000 700000 +mpirun -np $NSLOTS ./template -r -i 1000000 800000 +mpirun -np $NSLOTS ./template -r -i 1500000 500000 diff --git a/Simulations/sparse_mpi/sparse_mpi_4GPU.o140023 b/Simulations/sparse_mpi/sparse_mpi_4GPU.o140023 new file mode 100644 index 0000000..872679a --- /dev/null +++ b/Simulations/sparse_mpi/sparse_mpi_4GPU.o140023 @@ -0,0 +1,841 @@ +REMAINING: 4 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +Taking GPU #3 +proc 2 +proc 3 +proc 0 +proc 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^40000 + (-10 +i*0)*x^60000 + (1 +i*0)*x^100000 + +(-4000 +i*0)*x^39999 + (-600000 +i*0)*x^59999 + (100000 +i*0)*x^99999 + +zone limite de 'log-exp' 1.00356 +zone limite de 'log-exp' 1.00356 +zone limite de 'log-exp' 1.00356 +zone limite de 'log-exp' 1.00356 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 2, start 50048 size 25024 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 0, start 0 size 25024 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 1, start 25024 size 25024 +proc 2 start 50048 size 25024 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 3, start 75072 size 25024 +proc 3 start 75072 size 25024 +proc 0 start 0 size 25024 +proc 1 start 25024 size 25024 +iter : 1 Arret : 0.00317264 s/iter 0.222955 +iter : 2 Arret : 0.00227167 s/iter 0.222762 +iter : 3 Arret : 0.00211003 s/iter 0.222838 +iter : 4 Arret : 0.00200743 s/iter 0.222746 +iter : 5 Arret : 0.00207223 s/iter 0.222703 +iter : 6 Arret : 0.00517083 s/iter 0.222804 +iter : 7 Arret : 0.0188667 s/iter 0.297002 +iter : 8 Arret : 0.0181557 s/iter 0.222717 +iter : 9 Arret : 0.0045178 s/iter 0.295501 +iter : 10 Arret : 0.000994006 s/iter 0.222726 +iter : 11 Arret : 0.00103689 s/iter 0.222762 +iter : 12 Arret : 0.000385068 s/iter 0.222694 +iter : 13 Arret : 0.000378374 s/iter 0.222655 +iter : 14 Arret : 0.000135377 s/iter 0.222528 +iter : 15 Arret : 2.77949E-05 s/iter 0.222508 +iter : 16 Arret : 6.74524E-07 s/iter 0.222580 +iter : 17 Arret : 2.18155E-09 s/iter 0.222640 +iter : 18 Arret : 2.22292E-11 s/iter 0.222554 +iter : 19 Arret : 3.31178E-13 s/iter 0.222495 +temps : 4.60588 seconde(s) +Nb iterations : 19 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.75156E-07 +Stabilite : 1.57015E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540308 +i* 0.841422| 0.999962|-1.95866E-12 +i*-4.55465E-13| +| 2| -0.113164 +i* 0.993538| 0.999962|-4.34919E-12 +i* 9.60242E-13| +| 3| -0.226732 +i* -0.974016| 1.00006|-1.34468E-09 +i*-3.70749E-10| +| 4| -0.715763 +i* 0.698289| 0.999962| 9.11271E-13 +i* 2.47219E-12| +| 5| 0.439922 +i* -0.897993| 0.999962|-3.49498E-13 +i* 1.66432E-12| +| 6| -0.996122 +i* 0.0886386| 1.00006| 4.72785E-10 +i* 4.13616E-11| +| 7| 0.908546 +i* -0.417692| 0.999962| 4.78506E-13 +i* 1.54377E-13| +| 8| -0.827813 +i* -0.560935| 0.999962| 9.76996E-13 +i*-2.04309E-12| +| 9| 0.968129 +i* 0.250682| 1.00006|-2.31715E-10 +i* 1.34848E-10| +| 10| -0.286842 +i* -0.958038| 1.00006|-5.93554E-10 +i*-2.45345E-10| +| 11| 0.591653 +i* 0.806145| 0.999962|-9.87654E-13 +i*-3.03635E-12| +| 12| -0.0511836 +i* 0.998651| 0.999962|-2.22622E-12 +i*-3.69013E-14| +| 13| -0.67097 +i* 0.741432| 0.999962|-8.03801E-14 +i*-1.68204E-12| +| 14| 0.383249 +i* -0.923603| 0.999962|-1.29119E-12 +i*-1.37426E-12| +| 15| -0.988685 +i* 0.15039| 1.00006|-1.61051E-10 +i* 7.18515E-11| +| 16| 0.880824 +i* -0.473363| 0.999962|-4.03455E-13 +i* 2.85139E-12| +| 17| -0.861082 +i* -0.508391| 0.999962| 9.8066E-13 +i* 3.40478E-12| +| 18| 0.98184 +i* 0.190015| 1.00006| 8.88373E-10 +i*-2.66385E-10| +| 19| -0.345842 +i* -0.938354| 1.00006| 1.38421E-10 +i*-2.31696E-10| +| 20| 0.640621 +i* 0.767807| 0.999962|-6.98774E-13 +i* 1.13798E-12| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 0.999962 +40000 racines de module = 1.00006 +proc 0 +proc 1 +proc 2 +proc 3 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^50000 + (-10 +i*0)*x^150000 + (1 +i*0)*x^200000 + +(-5000 +i*0)*x^49999 + (-1.5E+06 +i*0)*x^149999 + (200000 +i*0)*x^199999 + +zone limite de 'log-exp' 1.00178 +zone limite de 'log-exp' 1.00178 +zone limite de 'log-exp' 1.00178 +zone limite de 'log-exp' 1.00178 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 3, start 150144 size 50048 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 2, start 100096 size 50048 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 1, start 50048 size 50048 +proc 2 start 100096 size 50048 +proc 3 start 150144 size 50048 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 0, start 0 size 50048 +proc 0 start 0 size 50048 +proc 1 start 50048 size 50048 +iter : 1 Arret : 0.000151301 s/iter 0.883876 +iter : 2 Arret : 0.000148172 s/iter 0.883954 +iter : 3 Arret : 0.000150921 s/iter 0.883918 +iter : 4 Arret : 0.00104559 s/iter 0.884013 +iter : 5 Arret : 0.00193123 s/iter 0.883951 +iter : 6 Arret : 0.0272836 s/iter 1.046760 +iter : 7 Arret : 0.102911 s/iter 1.039676 +iter : 8 Arret : 0.511951 s/iter 1.007660 +iter : 9 Arret : 0.34938 s/iter 1.017711 +iter : 10 Arret : 0.169476 s/iter 1.028045 +iter : 11 Arret : 0.0996115 s/iter 1.022146 +iter : 12 Arret : 0.0682782 s/iter 1.027682 +iter : 13 Arret : 0.0829552 s/iter 0.882503 +iter : 14 Arret : 0.0066689 s/iter 0.883836 +iter : 15 Arret : 0.0948233 s/iter 0.883899 +iter : 16 Arret : 0.00657146 s/iter 0.883885 +iter : 17 Arret : 0.00573604 s/iter 0.883894 +iter : 18 Arret : 0.00176675 s/iter 0.883914 +iter : 19 Arret : 0.000248502 s/iter 0.883875 +iter : 20 Arret : 6.04596E-05 s/iter 0.883987 +iter : 21 Arret : 4.48743E-06 s/iter 0.883955 +iter : 22 Arret : 4.98896E-09 s/iter 0.883421 +iter : 23 Arret : 4.99197E-13 s/iter 0.883862 +temps : 21.5922 seconde(s) +Nb iterations : 23 +Nb de depassements de capacite exponentielle : 0 +Precision : 0.000249603 +Stabilite : 2.22061E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540303 +i* 0.841453| 0.999985| 1.08703E-11 +i*-2.49217E-12| +| 2| -0.837195 +i* 0.546877| 0.999985| -5.4492E-12 +i* 1.09163E-12| +| 3| -0.553418 +i* -0.832885| 0.999985| -1.9722E-12 +i*-7.40397E-12| +| 4| 0.828599 +i* -0.559925| 1.00005|-7.54521E-09 +i* 1.47059E-08| +| 5| -0.8197 +i* 0.572767| 0.999985|-4.21663E-13 +i* -2.8616E-12| +| 6| -0.57917 +i* -0.815188| 0.999985|-5.13034E-12 +i*-1.52645E-12| +| 7| 0.810626 +i* -0.585537| 0.999985| 8.64808E-12 +i* 7.46794E-12| +| 8| 0.591872 +i* 0.806089| 1.00005|-1.69803E-09 +i* 9.43795E-09| +| 9| -0.801454 +i* 0.598134| 1.00005| 2.77439E-08 +i*-6.74504E-09| +| 10| -0.604356 +i* -0.796695| 0.999985|-1.64091E-13 +i* 1.59084E-12| +| 11| 0.791937 +i* -0.610578| 0.999985| 6.0707E-13 +i* 1.52922E-12| +| 12| 0.616763 +i* 0.78713| 0.999985|-4.48042E-12 +i* -2.6295E-12| +| 13| -0.782301 +i* 0.622877| 0.999985|-2.15827E-12 +i*-6.27114E-12| +| 14| -0.628991 +i* -0.777472| 1.00005| 6.93065E-09 +i*-8.65443E-09| +| 15| 0.772474 +i* -0.635023| 0.999985| 1.54783E-11 +i*-1.81338E-12| +| 16| 0.641054 +i* 0.767476| 0.999985|-3.47633E-12 +i* 1.20617E-11| +| 17| -0.762458 +i* 0.647014| 0.999985|-7.74447E-12 +i* 7.566E-12| +| 18| -0.652967 +i* -0.757366| 0.999985| 5.10392E-12 +i*-6.61069E-12| +| 19| 0.752302 +i* -0.658888| 1.00005| 3.99107E-09 +i* 1.02117E-08| +| 20| 0.66472 +i* 0.747072| 0.999985|-7.79776E-12 +i*-2.52076E-13| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 0.999985 +50000 racines de module = 1.00005 +proc 0 +proc 1 +proc 2 +proc 3 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^150000 + (-10 +i*0)*x^250000 + (1 +i*0)*x^400000 + +(-15000 +i*0)*x^149999 + (-2.5E+06 +i*0)*x^249999 + (400000 +i*0)*x^399999 + +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 1, start 100032 size 100032 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 0, start 0 size 100032 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 2, start 200064 size 100032 +proc 0 start 0 size 100032 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 3, start 300096 size 100032 +proc 3 start 300096 size 100032 +proc 1 start 100032 size 100032 +proc 2 start 200064 size 100032 +iter : 1 Arret : 0.00163991 s/iter 3.109950 +iter : 2 Arret : 0.00132877 s/iter 3.110375 +iter : 3 Arret : 0.00184513 s/iter 3.110742 +iter : 4 Arret : 0.00262495 s/iter 3.111236 +iter : 5 Arret : 0.0150209 s/iter 3.111022 +iter : 6 Arret : 0.0137099 s/iter 3.414358 +iter : 7 Arret : 0.00835719 s/iter 3.385934 +iter : 8 Arret : 0.00440643 s/iter 3.394557 +iter : 9 Arret : 0.0060742 s/iter 3.385816 +iter : 10 Arret : 0.0050336 s/iter 3.099272 +iter : 11 Arret : 0.00112426 s/iter 3.099497 +iter : 12 Arret : 0.000775148 s/iter 3.099486 +iter : 13 Arret : 0.000376719 s/iter 3.099346 +iter : 14 Arret : 0.00024255 s/iter 3.099473 +iter : 15 Arret : 0.00012922 s/iter 3.099323 +iter : 16 Arret : 7.83137E-06 s/iter 3.099139 +iter : 17 Arret : 1.24719E-07 s/iter 3.099356 +iter : 18 Arret : 1.90294E-09 s/iter 3.099211 +iter : 19 Arret : 2.90173E-11 s/iter 3.099200 +iter : 20 Arret : 4.42472E-13 s/iter 3.099323 +temps : 63.5457 seconde(s) +Nb iterations : 20 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.49185E-08 +Stabilite : 4.42472E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540313 +i* 0.841453| 0.999991| 9.34197E-12 +i*-1.23633E-11| +| 2| -0.998329 +i* 0.057622| 0.999991| 4.43912E-12 +i* 1.27665E-12| +| 3| 0.439833 +i* -0.898097| 1.00002| 5.42841E-10 +i*-5.60653E-10| +| 4| -0.996033 +i* 0.0888768| 0.999991|-3.15592E-12 +i* 1.17456E-12| +| 5| 0.411559 +i* -0.9114| 1.00002| 1.04334E-09 +i*-9.84037E-10| +| 6| 0.59196 +i* 0.805956| 0.999991| 5.24358E-13 +i*-8.53073E-12| +| 7| -0.992759 +i* 0.120044| 0.999991| 2.58804E-12 +i* 2.47274E-12| +| 8| 0.382796 +i* -0.923823| 0.999991|-1.63092E-11 +i* 4.26312E-12| +| 9| 0.616925 +i* 0.78701| 0.999991| 4.27514E-12 +i*-1.13966E-11| +| 10| -0.988534 +i* 0.151098| 1.00002|-8.27014E-10 +i* 9.44171E-10| +| 11| 0.35366 +i* -0.935364| 0.999991|-1.92664E-11 +i* 1.19958E-11| +| 12| 0.641299 +i* 0.767311| 1.00002|-2.44657E-09 +i* -6.7886E-11| +| 13| -0.983301 +i* 0.182074| 1.00002| 4.64689E-09 +i* 2.00425E-09| +| 14| 0.324176 +i* -0.945987| 0.999991|-5.20695E-12 +i*-7.06984E-12| +| 15| 0.665084 +i* 0.746789| 1.00002| 1.80952E-09 +i* 3.83855E-09| +| 16| -0.977132 +i* 0.212706| 1.00002|-2.02093E-10 +i* 3.44548E-10| +| 17| 0.294374 +i* -0.955681| 0.999991|-2.37395E-11 +i*-2.53098E-12| +| 18| 0.688092 +i* 0.725645| 1.00002|-4.51021E-09 +i* 1.95437E-09| +| 19| -0.969965 +i* 0.243206| 0.999991| 6.88072E-12 +i* 3.20268E-13| +| 20| 0.264283 +i* -0.964436| 0.999991|-6.93356E-12 +i*-6.23118E-12| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 0.999991 +150000 racines de module = 1.00002 +proc 1 +proc 2 +proc 3 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^250000 + (-10 +i*0)*x^350000 + (1 +i*0)*x^600000 + +(-25000 +i*0)*x^249999 + (-3.5E+06 +i*0)*x^349999 + (600000 +i*0)*x^599999 + +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 150016 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 1, start 150016 size 150016 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 2, start 300032 size 150016 +proc 2 start 300032 size 150016 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 3, start 450048 size 150016 +proc 3 start 450048 size 150016 +proc 0 start 0 size 150016 +proc 1 start 150016 size 150016 +iter : 1 Arret : 0.00232098 s/iter 6.732718 +iter : 2 Arret : 0.0100189 s/iter 7.051391 +iter : 3 Arret : 0.283193 s/iter 6.895968 +iter : 4 Arret : 0.546502 s/iter 7.050469 +iter : 5 Arret : 1.13206 s/iter 7.216506 +iter : 6 Arret : 0.441232 s/iter 7.188011 +iter : 7 Arret : 0.210349 s/iter 7.506718 +iter : 8 Arret : 0.182959 s/iter 7.511723 +iter : 9 Arret : 0.15465 s/iter 7.074342 +iter : 10 Arret : 0.0273709 s/iter 7.116926 +iter : 11 Arret : 0.0179972 s/iter 7.067210 +iter : 12 Arret : 0.00914143 s/iter 7.085819 +iter : 13 Arret : 0.0269815 s/iter 7.021625 +iter : 14 Arret : 0.0268503 s/iter 6.729633 +iter : 15 Arret : 0.00822944 s/iter 6.729247 +iter : 16 Arret : 0.000264736 s/iter 6.731353 +iter : 17 Arret : 8.47333E-05 s/iter 6.730750 +iter : 18 Arret : 5.17416E-06 s/iter 6.730768 +iter : 19 Arret : 1.12397E-07 s/iter 6.731123 +iter : 20 Arret : 1.61278E-09 s/iter 6.731670 +iter : 21 Arret : 2.30014E-11 s/iter 6.731613 +iter : 22 Arret : 3.28041E-13 s/iter 6.730969 +temps : 153.471 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.81388E-08 +Stabilite : 3.28041E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540302 +i* 0.841463| 0.999993| 8.34199E-12 +i* -1.9051E-11| +| 2| -0.553438 +i* -0.832883| 0.999993|-2.10654E-12 +i*-2.55273E-11| +| 3| -0.579282 +i* -0.815119| 0.999993|-1.44751E-12 +i* 7.66798E-12| +| 4| 0.592012 +i* 0.805941| 1.00001| 4.1526E-09 +i* 1.02046E-09| +| 5| -0.604557 +i* -0.796554| 0.999993|-2.82974E-12 +i* 9.99473E-12| +| 6| 0.61698 +i* 0.78697| 0.999993| 9.01823E-12 +i*-5.69156E-12| +| 7| -0.629237 +i* -0.777205| 0.999993|-2.92122E-12 +i*-4.85867E-12| +| 8| 0.641354 +i* 0.767237| 0.999993|-1.64209E-11 +i* 1.12904E-12| +| 9| -0.653299 +i* -0.757092| 0.999993|-8.22453E-13 +i* 2.82818E-12| +| 10| 0.665096 +i* 0.746749| 0.999993| -1.2145E-11 +i* 1.89129E-11| +| 11| -0.676717 +i* -0.736234| 0.999993|-1.26079E-11 +i*-1.25073E-11| +| 12| 0.688185 +i* 0.725526| 0.999993|-4.43978E-12 +i*-2.31382E-11| +| 13| -0.699466 +i* -0.714679| 1.00001| 3.92343E-10 +i*-3.02623E-09| +| 14| 0.710597 +i* 0.70359| 0.999993| 1.28564E-11 +i* 1.56626E-11| +| 15| -0.721517 +i* -0.69241| 1.00001| 1.76709E-09 +i*-4.04041E-09| +| 16| 0.73231 +i* 0.680962| 0.999993| 1.34706E-11 +i*-4.43489E-12| +| 17| -0.742916 +i* -0.669375| 0.999993| 1.59349E-11 +i* 1.71025E-11| +| 18| 0.7533 +i* 0.657691| 1.00001|-2.76219E-09 +i* 4.10298E-09| +| 19| -0.76354 +i* -0.64575| 0.999993| 2.24043E-11 +i*-1.30496E-12| +| 20| 0.773539 +i* 0.633763| 1.00001|-3.80449E-10 +i* 3.97541E-09| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 0.999993 +250000 racines de module = 1.00001 +proc 1 +proc 2 +proc 3 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^300000 + (-10 +i*0)*x^500000 + (1 +i*0)*x^800000 + +(-30000 +i*0)*x^299999 + (-5E+06 +i*0)*x^499999 + (800000 +i*0)*x^799999 + +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 3, start 600000 size 200000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 1, start 200000 size 200000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 200000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 3 start 600000 size 200000 +proc 0 start 0 size 200000 +proc 1 start 200000 size 200000 +proc 2, start 400000 size 200000 +proc 2 start 400000 size 200000 +iter : 1 Arret : 0.00108417 s/iter 12.159097 +iter : 2 Arret : 0.00154617 s/iter 12.285160 +iter : 3 Arret : 0.0140448 s/iter 12.174373 +iter : 4 Arret : 0.150783 s/iter 12.211473 +iter : 5 Arret : 0.984534 s/iter 12.253215 +iter : 6 Arret : 0.846873 s/iter 12.667593 +iter : 7 Arret : 0.850687 s/iter 12.449265 +iter : 8 Arret : 0.239017 s/iter 12.498637 +iter : 9 Arret : 0.0932856 s/iter 12.372293 +iter : 10 Arret : 0.0273595 s/iter 12.770787 +iter : 11 Arret : 0.0236411 s/iter 12.268012 +iter : 12 Arret : 0.0229952 s/iter 12.192238 +iter : 13 Arret : 0.00327267 s/iter 12.153660 +iter : 14 Arret : 0.00103051 s/iter 12.183109 +iter : 15 Arret : 0.000584357 s/iter 12.153559 +iter : 16 Arret : 0.000158231 s/iter 12.151369 +iter : 17 Arret : 9.49875E-05 s/iter 12.153222 +iter : 18 Arret : 4.14038E-05 s/iter 12.152653 +iter : 19 Arret : 3.27846E-05 s/iter 12.153803 +iter : 20 Arret : 7.57551E-06 s/iter 12.157708 +iter : 21 Arret : 4.73473E-08 s/iter 12.155670 +iter : 22 Arret : 1.01116E-10 s/iter 12.154833 +iter : 23 Arret : 2.17895E-13 s/iter 12.155276 +temps : 282.444 seconde(s) +Nb iterations : 23 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.01989E-05 +Stabilite : 2.17895E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841464| 0.999995|-5.33817E-12 +i*-1.81878E-11| +| 2| 0.592014 +i* 0.805922| 0.999995| 2.33948E-11 +i*-2.13005E-11| +| 3| 0.617007 +i* 0.786952| 0.999995| 4.23442E-11 +i* -6.2147E-12| +| 4| 0.641392 +i* 0.767207| 0.999995|-4.99742E-11 +i* 1.43873E-11| +| 5| 0.665146 +i* 0.746707| 0.999995| 2.02977E-11 +i* 7.48579E-12| +| 6| 0.688245 +i* 0.725472| 0.999995|-1.73153E-11 +i* -1.2656E-11| +| 7| 0.710667 +i* 0.703522| 0.999995| 3.69782E-12 +i* 2.3081E-12| +| 8| 0.732388 +i* 0.68088| 0.999995| 9.45355E-12 +i* 2.09024E-11| +| 9| 0.753381 +i* 0.657577| 0.999995| 1.7531E-11 +i*-4.02243E-11| +| 10| 0.77364 +i* 0.633618| 0.999995|-1.72307E-11 +i* 1.22723E-11| +| 11| 0.793138 +i* 0.609034| 0.999995| 3.89222E-12 +i* 2.21356E-11| +| 12| 0.811855 +i* 0.583851| 0.999995|-1.28337E-11 +i*-5.47207E-12| +| 13| 0.829772 +i* 0.558094| 0.999995|-1.63114E-11 +i*-1.64246E-12| +| 14| 0.846873 +i* 0.531786| 0.999995|-1.80345E-12 +i* 5.96675E-11| +| 15| 0.86314 +i* 0.504956| 0.999995|-4.00413E-12 +i* 3.04823E-11| +| 16| 0.878557 +i* 0.477628| 0.999995|-2.16493E-12 +i* 1.10533E-11| +| 17| 0.893104 +i* 0.449841| 0.999995|-1.48552E-11 +i* 1.06063E-11| +| 18| 0.906777 +i* 0.4216| 0.999995|-1.38745E-11 +i* 5.33384E-12| +| 19| 0.919557 +i* 0.392944| 0.999995| 4.13796E-11 +i*-2.48189E-11| +| 20| 0.931433 +i* 0.363901| 0.999995| 4.93219E-11 +i*-2.82651E-11| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 0.999995 +300000 racines de module = 1.00001 +proc 0 +proc 1 +proc 2 +proc 3 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^400000 + (-10 +i*0)*x^600000 + (1 +i*0)*x^1000000 + +(-40000 +i*0)*x^399999 + (-6E+06 +i*0)*x^599999 + (1E+06 +i*0)*x^999999 + +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 1, start 250048 size 250048 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 2, start 500096 size 250048 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 3, start 750144 size 250048 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 0, start 0 size 250048 +proc 0 start 0 size 250048 +proc 1 start 250048 size 250048 +proc 2 start 500096 size 250048 +proc 3 start 750144 size 250048 +iter : 1 Arret : 0.00113008 s/iter 18.764692 +iter : 2 Arret : 0.00490148 s/iter 18.766269 +iter : 3 Arret : 0.00255472 s/iter 18.765964 +iter : 4 Arret : 0.00771565 s/iter 19.551743 +iter : 5 Arret : 0.0148595 s/iter 19.510100 +iter : 6 Arret : 0.079485 s/iter 18.780627 +iter : 7 Arret : 1.0761 s/iter 19.466310 +iter : 8 Arret : 0.523791 s/iter 19.319585 +iter : 9 Arret : 0.256077 s/iter 18.918614 +iter : 10 Arret : 0.128041 s/iter 18.796063 +iter : 11 Arret : 0.0619619 s/iter 18.783666 +iter : 12 Arret : 0.0408163 s/iter 18.797339 +iter : 13 Arret : 0.028885 s/iter 18.787154 +iter : 14 Arret : 0.0101069 s/iter 18.869406 +iter : 15 Arret : 0.00233147 s/iter 18.789676 +iter : 16 Arret : 0.000443751 s/iter 18.784933 +iter : 17 Arret : 2.02171E-05 s/iter 18.760903 +iter : 18 Arret : 3.97233E-05 s/iter 18.758606 +iter : 19 Arret : 4.71594E-06 s/iter 18.782682 +iter : 20 Arret : 1.93517E-07 s/iter 18.760467 +iter : 21 Arret : 1.50186E-09 s/iter 18.801736 +iter : 22 Arret : 2.23717E-11 s/iter 18.757476 +iter : 23 Arret : 3.33298E-13 s/iter 18.760972 +temps : 440.06 seconde(s) +Nb iterations : 23 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.68365E-07 +Stabilite : 2.22044E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540414 +i* 0.841394| 0.999996| 2.27135E-11 +i*-8.06094E-12| +| 2| 0.529701 +i* 0.84818| 0.999996|-4.61853E-13 +i*-4.17888E-12| +| 3| 0.524361 +i* 0.851491| 0.999996|-2.47296E-11 +i* 1.78327E-11| +| 4| 0.51901 +i* 0.854764| 0.999996| 9.45599E-12 +i* 2.07434E-11| +| 5| 0.513629 +i* 0.858008| 0.999996| 2.32483E-11 +i* 6.70747E-12| +| 6| 0.508237 +i* 0.861213| 0.999996|-1.34339E-11 +i* 9.87854E-12| +| 7| 0.502825 +i* 0.864384| 0.999996|-3.18459E-11 +i* 7.64744E-12| +| 8| 0.497384 +i* 0.867526| 0.999996| 1.87346E-11 +i* 4.7471E-11| +| 9| 0.491932 +i* 0.870629| 0.999996|-2.65525E-11 +i* 1.22525E-11| +| 10| 0.486452 +i* 0.873703| 0.999996| 3.0312E-11 +i* 1.02214E-11| +| 11| 0.480962 +i* 0.876737| 0.999996|-3.09397E-11 +i*-1.68578E-11| +| 12| 0.475453 +i* 0.879736| 0.999996| 3.09861E-11 +i* 4.093E-12| +| 13| 0.469917 +i* 0.882706| 0.999996|-1.29106E-11 +i*-2.31489E-11| +| 14| 0.46437 +i* 0.885637| 0.999996|-5.47384E-12 +i* 1.02452E-11| +| 15| 0.458797 +i* 0.888537| 0.999996| 2.78862E-11 +i* 1.10441E-11| +| 16| 0.453214 +i* 0.891397| 0.999996| 2.45506E-11 +i* 3.1726E-11| +| 17| 0.447614 +i* 0.894223| 0.999996|-1.08491E-12 +i*-2.12277E-11| +| 18| 0.441986 +i* 0.897017| 0.999996| 2.72476E-11 +i* 3.22485E-11| +| 19| 0.436351 +i* 0.899772| 0.999996|-1.24334E-11 +i*-2.66317E-11| +| 20| 0.430689 +i* 0.902496| 0.999996|-1.25435E-11 +i* 3.86925E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 0.999996 +400000 racines de module = 1.00001 +proc 1 +proc 2 +proc 3 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^700000 + (1 +i*0)*x^1200000 + +(-50000 +i*0)*x^499999 + (-7E+06 +i*0)*x^699999 + (1.2E+06 +i*0)*x^1199999 + +zone limite de 'log-exp' 1.0003 +zone limite de 'log-exp' 1.0003 +zone limite de 'log-exp' 1.0003 +zone limite de 'log-exp' 1.0003 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 1, start 300032 size 300032 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 0, start 0 size 300032 +proc 0 start 0 size 300032 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 2, start 600064 size 300032 +proc 2 start 600064 size 300032 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 3, start 900096 size 300032 +proc 3 start 900096 size 300032 +proc 1 start 300032 size 300032 +iter : 1 Arret : 0.00819256 s/iter 26.577664 +iter : 2 Arret : 2.02982 s/iter 28.548195 +iter : 3 Arret : 1.20559 s/iter 28.444826 +iter : 4 Arret : 2.45066 s/iter 28.500080 +iter : 5 Arret : 2.54532 s/iter 28.613591 +iter : 6 Arret : 2.62994 s/iter 29.464998 +iter : 7 Arret : 0.906074 s/iter 29.815525 +iter : 8 Arret : 0.993745 s/iter 29.873610 +iter : 9 Arret : 0.405461 s/iter 30.471669 +iter : 10 Arret : 0.367721 s/iter 30.642427 +iter : 11 Arret : 0.351446 s/iter 30.327877 +iter : 12 Arret : 0.35197 s/iter 30.656805 +iter : 13 Arret : 0.356371 s/iter 29.659115 +iter : 14 Arret : 0.361711 s/iter 29.463647 +iter : 15 Arret : 0.337763 s/iter 29.495300 +iter : 16 Arret : 0.31327 s/iter 29.423447 +iter : 17 Arret : 0.311198 s/iter 29.291099 +iter : 18 Arret : 0.318456 s/iter 29.460846 +iter : 19 Arret : 0.32907 s/iter 29.325250 +iter : 20 Arret : 0.301059 s/iter 29.261791 +iter : 21 Arret : 0.265061 s/iter 29.531117 +iter : 22 Arret : 0.259472 s/iter 29.429866 +iter : 23 Arret : 0.281898 s/iter 29.291621 +iter : 24 Arret : 0.346388 s/iter 29.302478 +iter : 25 Arret : 1.26802 s/iter 29.286807 +iter : 26 Arret : 0.283944 s/iter 29.171558 +iter : 27 Arret : 1.48554 s/iter 29.009241 +iter : 28 Arret : 1.52006 s/iter 28.992115 +iter : 29 Arret : 0.739441 s/iter 28.878319 +iter : 30 Arret : 0.752787 s/iter 28.680746 +iter : 31 Arret : 0.846761 s/iter 28.681431 +iter : 32 Arret : 1.66027 s/iter 28.631316 +iter : 33 Arret : 1.18999 s/iter 28.536383 +iter : 34 Arret : 1.7472 s/iter 28.533855 +iter : 35 Arret : 0.99662 s/iter 28.619741 +iter : 36 Arret : 0.685041 s/iter 28.524906 +iter : 37 Arret : 3.10061 s/iter 28.469691 +iter : 38 Arret : 2.19552 s/iter 28.360443 +iter : 39 Arret : 0.82349 s/iter 28.436085 +iter : 40 Arret : 3.50591 s/iter 28.172287 +iter : 41 Arret : 1.02641 s/iter 27.664102 +iter : 42 Arret : 1.74412 s/iter 27.599336 +iter : 43 Arret : 0.666046 s/iter 27.622028 +iter : 44 Arret : 0.436645 s/iter 27.665222 +iter : 45 Arret : 0.362378 s/iter 27.576919 +iter : 46 Arret : 0.355561 s/iter 27.619140 +iter : 47 Arret : 0.261884 s/iter 27.609494 +iter : 48 Arret : 0.135369 s/iter 27.625744 +iter : 49 Arret : 0.0915402 s/iter 27.430183 +iter : 50 Arret : 0.161087 s/iter 27.574724 +iter : 51 Arret : 0.133264 s/iter 27.503435 +iter : 52 Arret : 0.19955 s/iter 27.556902 +iter : 53 Arret : 0.16774 s/iter 27.535538 +iter : 54 Arret : 0.0367464 s/iter 26.597157 +iter : 55 Arret : 0.0226237 s/iter 26.593894 +iter : 56 Arret : 0.0108181 s/iter 26.570226 +iter : 57 Arret : 0.00267111 s/iter 26.648842 +iter : 58 Arret : 0.000387499 s/iter 26.572189 +iter : 59 Arret : 3.11267E-06 s/iter 26.574203 +iter : 60 Arret : 2.51854E-08 s/iter 26.572782 +iter : 61 Arret : 1.01362E-10 s/iter 26.570380 +iter : 62 Arret : 4.03524E-13 s/iter 26.570734 +temps : 1762.58 seconde(s) +Nb iterations : 62 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.06807E-05 +Stabilite : 1.0906E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54031 +i* 0.841472| 1| 1.4588E-09 +i* 4.51768E-09| +| 2| 0.513629 +i* 0.858008| 0.999997| 3.02357E-11 +i* 3.41858E-11| +| 3| 0.486451 +i* 0.873713| 1| 1.95054E-09 +i* 6.77633E-10| +| 4| 0.458789 +i* 0.888542| 0.999997| 2.48135E-13 +i*-2.88822E-11| +| 5| 0.430685 +i* 0.902499| 0.999997| 2.12053E-13 +i*-1.16324E-11| +| 6| 0.402126 +i* 0.915589| 1| 2.50282E-09 +i*-6.10471E-09| +| 7| 0.3732 +i* 0.927747| 0.999997|-1.54374E-11 +i*-2.76083E-11| +| 8| 0.3439 +i* 0.939003| 0.999997|-1.12714E-11 +i* 1.5453E-11| +| 9| 0.314261 +i* 0.949333| 0.999997| 1.93628E-11 +i* 2.50909E-11| +| 10| 0.284313 +i* 0.958728| 0.999997| 2.69426E-11 +i* 2.77974E-11| +| 11| 0.254084 +i* 0.967179| 0.999997| 1.5277E-11 +i* 4.73027E-12| +| 12| 0.223605 +i* 0.974676| 0.999997| -8.1017E-11 +i*-3.77299E-11| +| 13| 0.192897 +i* 0.981224| 1| 2.91999E-10 +i* 9.18678E-11| +| 14| 0.162017 +i* 0.986785| 0.999997| 4.59321E-12 +i*-4.42106E-13| +| 15| 0.130967 +i* 0.991391| 1| 1.71549E-09 +i* 3.54225E-10| +| 16| 0.0997898 +i* 0.995005| 0.999997| -3.8231E-11 +i* 3.92186E-14| +| 17| 0.0685225 +i* 0.997646| 0.999997| 2.33641E-11 +i* 2.51787E-12| +| 18| 0.0371504 +i* 0.999314| 1|-1.38879E-09 +i*-2.32658E-09| +| 19| 0.00578048 +i* 0.99998| 0.999997| 3.46787E-11 +i* 1.94857E-13| +| 20| -0.0256056 +i* 0.999669| 0.999997| 2.01068E-11 +i*-1.22213E-12| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +700000 racines de module = 0.999997 +proc 2 +proc 3 +proc 0 +proc 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^600000 + (-10 +i*0)*x^800000 + (1 +i*0)*x^1400000 + +(-60000 +i*0)*x^599999 + (-8E+06 +i*0)*x^799999 + (1.4E+06 +i*0)*x^1399999 + +zone limite de 'log-exp' 1.00025 +zone limite de 'log-exp' 1.00025 +zone limite de 'log-exp' 1.00025 +zone limite de 'log-exp' 1.00025 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 3, start 1050048 size 350016 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 1, start 350016 size 350016 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 2, start 700032 size 350016 +proc 2 start 700032 size 350016 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 0, start 0 size 350016 +proc 0 start 0 size 350016 +proc 3 start 1050048 size 350016 +proc 1 start 350016 size 350016 +iter : 1 Arret : 0.00218957 s/iter 36.159933 +iter : 2 Arret : 0.133227 s/iter 36.695373 +iter : 3 Arret : 6.01621 s/iter 37.299386 +iter : 4 Arret : 3.16113 s/iter 37.976941 +iter : 5 Arret : 2.89902 s/iter 37.835787 +iter : 6 Arret : 1.55692 s/iter 38.098839 +iter : 7 Arret : 1.64303 s/iter 39.033767 +iter : 8 Arret : 9.63322 s/iter 39.962469 +iter : 9 Arret : 3.25551 s/iter 40.250439 +iter : 10 Arret : 1.80839 s/iter 41.322631 +iter : 11 Arret : 2.10312 s/iter 39.721944 +iter : 12 Arret : 1.27787 s/iter 40.175542 +iter : 13 Arret : 1.28405 s/iter 39.345510 +iter : 14 Arret : 1.10597 s/iter 39.326031 +iter : 15 Arret : 1.54753 s/iter 39.371562 +iter : 16 Arret : 3.97338 s/iter 39.040715 +iter : 17 Arret : 1.16165 s/iter 39.074694 +iter : 18 Arret : 1.33248 s/iter 38.851097 +iter : 19 Arret : 0.864994 s/iter 38.922556 +iter : 20 Arret : 0.781144 s/iter 38.428134 +iter : 21 Arret : 0.717927 s/iter 38.952301 +iter : 22 Arret : 0.651466 s/iter 38.352980 +iter : 23 Arret : 0.458583 s/iter 38.047111 +iter : 24 Arret : 0.283507 s/iter 38.133746 +iter : 25 Arret : 0.279826 s/iter 37.853592 +iter : 26 Arret : 0.243863 s/iter 36.926821 +iter : 27 Arret : 0.220856 s/iter 37.645303 +iter : 28 Arret : 0.139293 s/iter 36.485655 +iter : 29 Arret : 0.66161 s/iter 36.276980 +iter : 30 Arret : 0.269576 s/iter 36.156120 +iter : 31 Arret : 0.139673 s/iter 36.247656 +iter : 32 Arret : 0.055674 s/iter 36.155399 +iter : 33 Arret : 0.0217982 s/iter 36.204812 +iter : 34 Arret : 0.00427148 s/iter 36.153944 +iter : 35 Arret : 0.000628248 s/iter 36.153697 +iter : 36 Arret : 1.01228E-07 s/iter 36.154597 +iter : 37 Arret : 4.84665E-10 s/iter 36.152819 +iter : 38 Arret : 2.2498E-12 s/iter 36.150757 +iter : 39 Arret : 1.80732E-14 s/iter 36.149673 +temps : 1478.01 seconde(s) +Nb iterations : 39 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.34519E-06 +Stabilite : 2.22046E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841469| 0.999997| 5.65794E-11 +i*-4.66756E-12| +| 2| 0.513623 +i* 0.858013| 0.999997|-2.15776E-11 +i*-2.98557E-11| +| 3| -0.52703 +i* -0.849843| 0.999997|-6.50922E-11 +i* 8.44216E-12| +| 4| 0.486439 +i* 0.873711| 0.999997| 5.60277E-11 +i* 4.36779E-11| +| 5| -0.500096 +i* -0.865967| 0.999997| 3.56147E-11 +i*-3.12713E-11| +| 6| 0.458776 +i* 0.888549| 0.999997|-1.89702E-11 +i* 4.08274E-12| +| 7| -0.472673 +i* -0.881242| 1|-5.56631E-09 +i*-2.23833E-09| +| 8| 0.430664 +i* 0.902517| 1|-8.83373E-11 +i*-2.09199E-09| +| 9| -0.444791 +i* -0.895631| 0.999997| 3.68259E-11 +i* 1.36002E-12| +| 10| 0.402136 +i* 0.915577| 0.999997| 6.5834E-12 +i* -1.3935E-11| +| 11| -0.416432 +i* -0.909164| 0.999997| 1.97816E-11 +i* 3.10848E-11| +| 12| 0.373171 +i* 0.927759| 0.999997|-2.17995E-11 +i*-2.96867E-12| +| 13| -0.387698 +i* -0.921783| 0.999997|-1.86324E-11 +i* -4.6545E-11| +| 14| 0.343875 +i* 0.939012| 0.999997| 3.84962E-11 +i* 2.59646E-11| +| 15| -0.358575 +i* -0.933498| 0.999997|-4.93405E-11 +i*-7.15173E-13| +| 16| 0.314233 +i* 0.949343| 0.999997| 3.86503E-11 +i* 2.08775E-11| +| 17| -0.329098 +i* -0.944293| 0.999997|-1.57903E-11 +i* 2.05052E-11| +| 18| 0.284281 +i* 0.958738| 0.999997| 2.51592E-11 +i* 2.09243E-11| +| 19| -0.299297 +i* -0.954157| 0.999997| 5.03608E-12 +i* 1.70503E-11| +| 20| 0.254048 +i* 0.967189| 0.999997|-2.81228E-11 +i*-1.66302E-11| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 0.999997 +600000 racines de module = 1 +proc 0 +proc 1 +proc 2 +proc 3 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^700000 + (-10 +i*0)*x^900000 + (1 +i*0)*x^1600000 + +(-70000 +i*0)*x^699999 + (-9E+06 +i*0)*x^899999 + (1.6E+06 +i*0)*x^1599999 + + +template:29834 terminated with signal 11 at PC=404b41 SP=7fff0b4740b0. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:29835 terminated with signal 11 at PC=404b41 SP=7fff081a2530. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:29833 terminated with signal 11 at PC=404b41 SP=7fffe6ecdf90. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:29836 terminated with signal 11 at PC=404b41 SP=7fff35c7eff0. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 1 with PID 29834 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- +proc 0 +proc 1 +proc 2 +proc 3 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^800000 + (-10 +i*0)*x^1000000 + (1 +i*0)*x^1800000 + +(-80000 +i*0)*x^799999 + (-1E+07 +i*0)*x^999999 + (1.8E+06 +i*0)*x^1799999 + + +template:29849 terminated with signal 11 at PC=404b41 SP=7fff6792aa30. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:29846 terminated with signal 11 at PC=404b41 SP=7ffffaf225e0. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:29848 terminated with signal 11 at PC=404b41 SP=7fff7de06640. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:29847 terminated with signal 11 at PC=404b41 SP=7fff5bacc3f0. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 0 with PID 29846 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- +proc 2 +proc 3 +proc 0 +proc 1 +zone limite de 'log-exp' 1.03613 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^2000 + (-10 +i*0)*x^8000 + (1 +i*0)*x^10000 + +(-200 +i*0)*x^1999 + (-80000 +i*0)*x^7999 + (10000 +i*0)*x^9999 + +zone limite de 'log-exp' 1.03613 +zone limite de 'log-exp' 1.03613 +zone limite de 'log-exp' 1.03613 +dimgrid 40 dimblock 256 degrePoly 10000 +proc 1, start 2560 size 2560 +dimgrid 40 dimblock 256 degrePoly 10000 +proc 0, start 0 size 2560 +dimgrid 40 dimblock 256 degrePoly 10000 +proc 3, start 7680 size 2560 +proc 0 start 0 size 2560 +proc 3 start 7680 size 2560 +proc 1 start 2560 size 2560 +dimgrid 40 dimblock 256 degrePoly 10000 +proc 2, start 5120 size 2560 +proc 2 start 5120 size 2560 +iter : 1 Arret : 0.000540066 s/iter 0.008420 +iter : 2 Arret : 0.0239499 s/iter 0.008298 +iter : 3 Arret : 0.0108994 s/iter 0.008290 +iter : 4 Arret : 0.00347071 s/iter 0.008305 +iter : 5 Arret : 0.00757939 s/iter 0.008311 +iter : 6 Arret : 0.00186666 s/iter 0.008310 +iter : 7 Arret : 0.00179112 s/iter 0.008306 +iter : 8 Arret : 0.00147265 s/iter 0.008305 +iter : 9 Arret : 0.00165602 s/iter 0.008296 +iter : 10 Arret : 0.00248191 s/iter 0.008307 +iter : 11 Arret : 0.000812537 s/iter 0.008297 +iter : 12 Arret : 5.39531E-05 s/iter 0.008412 +iter : 13 Arret : 1.08824E-08 s/iter 0.008404 +iter : 14 Arret : 1.089E-13 s/iter 0.008419 +temps : 0.323036 seconde(s) +Nb iterations : 14 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.17761E-05 +Stabilite : 8.2797E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.547024 +i* 0.838493| 1.00115|-6.21719E-10 +i*-5.53774E-09| +| 2| -0.540305 +i* 0.841127| 0.999712|-1.60982E-13 +i*-4.97213E-14| +| 3| -0.909192 +i* 0.415685| 0.999712| 4.35207E-14 +i* 5.29003E-13| +| 4| -0.989628 +i* -0.141638| 0.999712|-2.84439E-13 +i*-1.69935E-14| +| 5| -0.759236 +i* -0.652585| 1.00115|-6.07508E-09 +i* 4.66733E-09| +| 6| -0.281925 +i* -0.959136| 0.999712|-1.54099E-13 +i* 3.80991E-14| +| 7| 0.281172 +i* -0.959357| 0.999712|-1.43663E-13 +i*-1.53777E-13| +| 8| 0.755064 +i* -0.655212| 0.999712| 4.61076E-13 +i* 3.15322E-13| +| 9| 0.989404 +i* -0.143192| 0.999712|-1.63203E-13 +i*-1.45101E-14| +| 10| 0.912453 +i* 0.411988| 1.00115|-1.77634E-10 +i* 4.15663E-09| +| 11| 0.540966 +i* 0.840703| 0.999712| -2.5091E-14 +i*-1.99096E-13| +| 12| 0.540305 +i* 0.841127| 0.999712| 3.22853E-13 +i* 1.07785E-13| +| 13| 0.00314521 +i* 1.00115| 1.00115| 4.5119E-09 +i*-6.21719E-11| +| 14| -0.540966 +i* 0.840703| 0.999712| -2.5091E-14 +i* 1.99096E-13| +| 15| -0.909518 +i* 0.414971| 0.999712|-1.80966E-13 +i*-6.20692E-14| +| 16| -0.989516 +i* -0.142415| 0.999712| 2.81108E-13 +i* 5.11239E-14| +| 17| -0.755579 +i* -0.654618| 0.999712| 5.59774E-13 +i* 8.84721E-14| +| 18| -0.285348 +i* -0.959626| 1.00115|-9.98303E-09 +i*-1.88292E-09| +| 19| 0.281925 +i* -0.959136| 0.999712| 1.08247E-13 +i*-4.02221E-13| +| 20| 0.755579 +i* -0.654618| 0.999712| 5.59774E-13 +i*-8.84721E-14| ++---+----------------------------+------------+----------------------------+ +2000 racines de module = 1.00115 +8000 racines de module = 0.999712 diff --git a/Simulations/sparse_mpi/sparse_mpi_4GPU.sge b/Simulations/sparse_mpi/sparse_mpi_4GPU.sge new file mode 100755 index 0000000..d9ab42c --- /dev/null +++ b/Simulations/sparse_mpi/sparse_mpi_4GPU.sge @@ -0,0 +1,25 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=4 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -V +#$ -cwd +#$ -N sparse_mpi_4GPU +#$ -pe mpi 4 + + +module load cuda/7.0 +module load ompi/gcc + +mpirun -np $NSLOTS ./template -r -i 60000 40000 +mpirun -np $NSLOTS ./template -r -i 150000 50000 +mpirun -np $NSLOTS ./template -r -i 250000 150000 +mpirun -np $NSLOTS ./template -r -i 350000 250000 +mpirun -np $NSLOTS ./template -r -i 500000 300000 +mpirun -np $NSLOTS ./template -r -i 600000 400000 +mpirun -np $NSLOTS ./template -r -i 700000 500000 +mpirun -np $NSLOTS ./template -r -i 800000 600000 +mpirun -np $NSLOTS ./template -r -i 900000 700000 +mpirun -np $NSLOTS ./template -r -i 1000000 800000 +mpirun -np $NSLOTS ./template -r -i 1500000 500000 diff --git a/Simulations/sparse_openmp/sparse_openmp_1GPU.o140100 b/Simulations/sparse_openmp/sparse_openmp_1GPU.o140100 new file mode 100644 index 0000000..7332981 --- /dev/null +++ b/Simulations/sparse_openmp/sparse_openmp_1GPU.o140100 @@ -0,0 +1,512 @@ +REMAINING: 1 +Taking GPU #3 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^40000 + (-10 +i*0)*x^60000 + (1 +i*0)*x^100000 + +(-4000 +i*0)*x^39999 + (-600000 +i*0)*x^59999 + (100000 +i*0)*x^99999 + +zone limite de 'log-exp' 1.00356 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 0 dimgrid2 391 start 0 size 100096 +gpu 0 iter : 1 Arret : 0.0052669 s/iter 0.775408 +gpu 0 iter : 2 Arret : 0.00752645 s/iter 0.775369 +gpu 0 iter : 3 Arret : 0.0240999 s/iter 0.775305 +gpu 0 iter : 4 Arret : 0.0224589 s/iter 0.850697 +gpu 0 iter : 5 Arret : 0.00804703 s/iter 0.844340 +gpu 0 iter : 6 Arret : 0.00438171 s/iter 0.775251 +gpu 0 iter : 7 Arret : 0.00744568 s/iter 0.775238 +gpu 0 iter : 8 Arret : 0.00764888 s/iter 0.775261 +gpu 0 iter : 9 Arret : 0.00410621 s/iter 0.775320 +gpu 0 iter : 10 Arret : 0.00247273 s/iter 0.775247 +gpu 0 iter : 11 Arret : 0.00227795 s/iter 0.775273 +gpu 0 iter : 12 Arret : 0.00210901 s/iter 0.775117 +gpu 0 iter : 13 Arret : 0.000438336 s/iter 0.774935 +gpu 0 iter : 14 Arret : 0.000273199 s/iter 0.774865 +gpu 0 iter : 15 Arret : 0.000137109 s/iter 0.774789 +gpu 0 iter : 16 Arret : 1.40101E-05 s/iter 0.774828 +gpu 0 iter : 17 Arret : 1.89958E-07 s/iter 0.774719 +gpu 0 iter : 18 Arret : 2.82623E-09 s/iter 0.774706 +gpu 0 iter : 19 Arret : 4.21054E-11 s/iter 0.774674 +gpu 0 iter : 20 Arret : 6.27215E-13 s/iter 0.774731 +temps : 16.1926 seconde(s) +Nb iterations : 20 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.61117E-09 +Stabilite : 6.27215E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540308 +i* 0.841422| 0.999962|-1.95866E-12 +i*-4.55465E-13| +| 2| -0.113164 +i* 0.993538| 0.999962|-4.34919E-12 +i* 9.60242E-13| +| 3| -0.226711 +i* -0.973923| 0.999962|-4.27658E-13 +i* 6.01027E-13| +| 4| -0.715763 +i* 0.698289| 0.999962| 9.11271E-13 +i* 2.47219E-12| +| 5| 0.439922 +i* -0.897993| 0.999962|-3.49498E-13 +i* 1.66432E-12| +| 6| -0.996021 +i* 0.0886823| 0.999962| 1.17772E-12 +i* 6.16285E-13| +| 7| 0.908546 +i* -0.417692| 0.999962| 4.78506E-13 +i* 1.54377E-13| +| 8| -0.827813 +i* -0.560935| 0.999962| 9.76996E-13 +i*-2.04309E-12| +| 9| 0.968049 +i* 0.250607| 0.999962|-1.07025E-13 +i*-1.15224E-12| +| 10| -0.286815 +i* -0.957946| 0.999962|-6.55254E-13 +i* 1.20869E-12| +| 11| 0.591653 +i* 0.806145| 0.999962|-9.87654E-13 +i*-3.03635E-12| +| 12| -0.0511836 +i* 0.998651| 0.999962|-2.22622E-12 +i*-3.69013E-14| +| 13| -0.67097 +i* 0.741432| 0.999962|-8.03801E-14 +i*-1.68204E-12| +| 14| 0.383249 +i* -0.923603| 0.999962|-1.29119E-12 +i*-1.37426E-12| +| 15| -0.988582 +i* 0.150427| 0.999962|-1.54698E-12 +i*-6.48537E-13| +| 16| 0.880824 +i* -0.473363| 0.999962| 1.58029E-12 +i*-2.34379E-12| +| 17| -0.861082 +i* -0.508391| 0.999962| 9.8066E-13 +i* 3.40478E-12| +| 18| 0.981756 +i* 0.189945| 0.999962|-1.13665E-12 +i* 1.13043E-12| +| 19| -0.345809 +i* -0.938264| 0.999962| 1.03906E-12 +i* 1.95398E-12| +| 20| 0.640621 +i* 0.767807| 0.999962|-6.98774E-13 +i* 1.13798E-12| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 0.999962 +40000 racines de module = 1.00006 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^50000 + (-10 +i*0)*x^150000 + (1 +i*0)*x^200000 + +(-5000 +i*0)*x^49999 + (-1.5E+06 +i*0)*x^149999 + (200000 +i*0)*x^199999 + +zone limite de 'log-exp' 1.00178 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 0 dimgrid2 782 start 0 size 200192 +gpu 0 iter : 1 Arret : 0.000149329 s/iter 3.019382 +gpu 0 iter : 2 Arret : 0.000107708 s/iter 3.016857 +gpu 0 iter : 3 Arret : 0.000113605 s/iter 3.016990 +gpu 0 iter : 4 Arret : 0.000830779 s/iter 3.018300 +gpu 0 iter : 5 Arret : 0.00353705 s/iter 3.017239 +gpu 0 iter : 6 Arret : 0.0150507 s/iter 3.033347 +gpu 0 iter : 7 Arret : 0.0172496 s/iter 3.028650 +gpu 0 iter : 8 Arret : 0.032361 s/iter 3.025908 +gpu 0 iter : 9 Arret : 0.0281394 s/iter 3.030298 +gpu 0 iter : 10 Arret : 0.116314 s/iter 3.043482 +gpu 0 iter : 11 Arret : 0.129494 s/iter 3.073542 +gpu 0 iter : 12 Arret : 0.0352338 s/iter 3.047419 +gpu 0 iter : 13 Arret : 0.0316693 s/iter 3.041094 +gpu 0 iter : 14 Arret : 0.0153664 s/iter 3.020001 +gpu 0 iter : 15 Arret : 0.0125995 s/iter 3.011952 +gpu 0 iter : 16 Arret : 0.00505109 s/iter 3.013206 +gpu 0 iter : 17 Arret : 0.0072726 s/iter 3.013400 +gpu 0 iter : 18 Arret : 0.00841241 s/iter 3.012671 +gpu 0 iter : 19 Arret : 0.00316401 s/iter 3.011866 +gpu 0 iter : 20 Arret : 1.36142E-05 s/iter 3.011905 +gpu 0 iter : 21 Arret : 1.07816E-09 s/iter 3.012487 +gpu 0 iter : 22 Arret : 2.83648E-12 s/iter 3.012609 +gpu 0 iter : 23 Arret : 4.24948E-14 s/iter 3.012386 +temps : 70.1186 seconde(s) +Nb iterations : 23 +Nb de depassements de capacite exponentielle : 0 +Precision : 9.52377E-08 +Stabilite : 4.24948E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540195 +i* 0.841595| 1.00005|-2.98043E-09 +i*-3.27611E-08| +| 2| -0.837195 +i* 0.546877| 0.999985| 7.09943E-12 +i* 5.1133E-12| +| 3| -0.553418 +i* -0.832885| 0.999985| -1.9722E-12 +i*-7.40397E-12| +| 4| 0.828525 +i* -0.559925| 0.999985|-4.34675E-12 +i* 1.07137E-12| +| 5| -0.819774 +i* 0.572768| 1.00005| 2.53887E-08 +i* 2.42315E-09| +| 6| -0.57917 +i* -0.815188| 0.999985|-5.13034E-12 +i*-1.52645E-12| +| 7| 0.810626 +i* -0.585537| 0.999985| 8.64808E-12 +i* 7.46794E-12| +| 8| 0.591869 +i* 0.806015| 0.999985| 1.73195E-13 +i* 8.72591E-12| +| 9| -0.801379 +i* 0.598131| 0.999985| -1.2701E-12 +i* 3.96189E-12| +| 10| -0.60436 +i* -0.796769| 1.00005|-3.33815E-08 +i* 3.89061E-08| +| 11| 0.791937 +i* -0.610578| 0.999985| 6.0707E-13 +i* 1.52922E-12| +| 12| 0.616763 +i* 0.78713| 0.999985|-4.48042E-12 +i* -2.6295E-12| +| 13| -0.782301 +i* 0.622877| 0.999985|-2.15827E-12 +i*-6.27114E-12| +| 14| -0.628985 +i* -0.777398| 0.999985|-4.05476E-12 +i*-5.17236E-12| +| 15| 0.772548 +i* -0.635029| 1.00005| 1.1634E-09 +i* 1.87351E-08| +| 16| 0.641054 +i* 0.767476| 0.999985|-3.47633E-12 +i* 1.20617E-11| +| 17| -0.762458 +i* 0.647014| 0.999985|-7.74447E-12 +i* 7.566E-12| +| 18| -0.652967 +i* -0.757366| 0.999985| 5.10392E-12 +i*-6.61069E-12| +| 19| 0.752229 +i* -0.658879| 0.999985|-5.97611E-12 +i* 1.03431E-11| +| 20| 0.664729 +i* 0.747146| 1.00005|-1.71597E-08 +i* 8.68463E-09| ++---+----------------------------+------------+----------------------------+ +50000 racines de module = 1.00005 +150000 racines de module = 0.999985 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^150000 + (-10 +i*0)*x^250000 + (1 +i*0)*x^400000 + +(-15000 +i*0)*x^149999 + (-2.5E+06 +i*0)*x^249999 + (400000 +i*0)*x^399999 + +zone limite de 'log-exp' 1.00089 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 0 dimgrid2 1563 start 0 size 400128 +gpu 0 iter : 1 Arret : 0.00172099 s/iter 11.753718 +gpu 0 iter : 2 Arret : 0.0208557 s/iter 11.747391 +gpu 0 iter : 3 Arret : 0.221528 s/iter 11.807046 +gpu 0 iter : 4 Arret : 0.572248 s/iter 11.998301 +gpu 0 iter : 5 Arret : 0.542189 s/iter 11.842988 +gpu 0 iter : 6 Arret : 0.306206 s/iter 11.822805 +gpu 0 iter : 7 Arret : 0.0317191 s/iter 12.059261 +gpu 0 iter : 8 Arret : 0.0184143 s/iter 12.061589 +gpu 0 iter : 9 Arret : 0.030511 s/iter 11.936705 +gpu 0 iter : 10 Arret : 0.023696 s/iter 11.899096 +gpu 0 iter : 11 Arret : 0.0135298 s/iter 11.850230 +gpu 0 iter : 12 Arret : 0.0119889 s/iter 11.808974 +gpu 0 iter : 13 Arret : 0.00485045 s/iter 11.776383 +gpu 0 iter : 14 Arret : 0.00522437 s/iter 11.809750 +gpu 0 iter : 15 Arret : 0.00252909 s/iter 11.735442 +gpu 0 iter : 16 Arret : 0.000417464 s/iter 11.739448 +gpu 0 iter : 17 Arret : 0.000235756 s/iter 11.733345 +gpu 0 iter : 18 Arret : 6.4985E-07 s/iter 11.743853 +gpu 0 iter : 19 Arret : 1.48939E-09 s/iter 11.732225 +gpu 0 iter : 20 Arret : 3.20792E-12 s/iter 11.734648 +gpu 0 iter : 21 Arret : 1.34164E-14 s/iter 11.732088 +temps : 248.893 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.49185E-08 +Stabilite : 1.34164E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.84144| 0.999991| 6.97609E-12 +i* 5.61207E-12| +| 2| -0.998329 +i* 0.057622| 0.999991| 4.43912E-12 +i* 1.27665E-12| +| 3| 0.439867 +i* -0.898052| 0.999991|-8.50653E-12 +i*-8.85586E-12| +| 4| -0.996033 +i* 0.0888768| 0.999991|-3.15592E-12 +i* 1.17456E-12| +| 5| 0.411533 +i* -0.911385| 0.999991|-2.45048E-12 +i* 4.6238E-12| +| 6| 0.59196 +i* 0.805956| 0.999991| 5.24358E-13 +i*-8.53073E-12| +| 7| -0.992759 +i* 0.120044| 0.999991| 2.58804E-12 +i* 2.47274E-12| +| 8| 0.382796 +i* -0.923823| 0.999991| 1.11042E-11 +i*-9.27687E-12| +| 9| 0.616925 +i* 0.78701| 0.999991| 4.27514E-12 +i*-1.13966E-11| +| 10| -0.98851 +i* 0.151094| 0.999991| 1.67755E-11 +i* 4.06477E-12| +| 11| 0.35366 +i* -0.935364| 0.999991|-1.92664E-11 +i* 1.19958E-11| +| 12| 0.641283 +i* 0.767292| 0.999991| 1.73468E-11 +i*-3.74729E-12| +| 13| -0.98329 +i* 0.181995| 0.999991|-6.62759E-12 +i*-5.46796E-12| +| 14| 0.324176 +i* -0.945987| 0.999991| 1.53594E-11 +i*-1.57324E-12| +| 15| 0.665012 +i* 0.746821| 0.999991| 5.27178E-12 +i*-4.27913E-12| +| 16| -0.977104 +i* 0.212717| 0.999991|-1.01148E-11 +i* 2.41479E-12| +| 17| 0.294374 +i* -0.955681| 0.999991| -1.2063E-11 +i* 1.32238E-11| +| 18| 0.688087 +i* 0.725616| 0.999991|-1.67164E-11 +i*-1.12573E-11| +| 19| -0.969965 +i* 0.243206| 0.999991| 6.88072E-12 +i* 3.20268E-13| +| 20| 0.264283 +i* -0.964436| 0.999991|-6.93356E-12 +i*-6.23118E-12| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 0.999991 +150000 racines de module = 1.00002 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^250000 + (-10 +i*0)*x^350000 + (1 +i*0)*x^600000 + +(-25000 +i*0)*x^249999 + (-3.5E+06 +i*0)*x^349999 + (600000 +i*0)*x^599999 + +zone limite de 'log-exp' 1.00059 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 2344 start 0 size 600064 +gpu 0 iter : 1 Arret : 0.00525558 s/iter 26.336656 +gpu 0 iter : 2 Arret : 0.441677 s/iter 26.703831 +gpu 0 iter : 3 Arret : 0.906705 s/iter 26.966169 +gpu 0 iter : 4 Arret : 3.755 s/iter 26.950936 +gpu 0 iter : 5 Arret : 1.26305 s/iter 27.316144 +gpu 0 iter : 6 Arret : 3.03186 s/iter 27.389925 +gpu 0 iter : 7 Arret : 0.213406 s/iter 27.490831 +gpu 0 iter : 8 Arret : 1.0101 s/iter 27.559501 +gpu 0 iter : 9 Arret : 0.207377 s/iter 27.194849 +gpu 0 iter : 10 Arret : 0.0920517 s/iter 27.466967 +gpu 0 iter : 11 Arret : 0.0893085 s/iter 27.380003 +gpu 0 iter : 12 Arret : 0.0218947 s/iter 26.617878 +gpu 0 iter : 13 Arret : 0.00718218 s/iter 26.491846 +gpu 0 iter : 14 Arret : 0.014641 s/iter 26.379537 +gpu 0 iter : 15 Arret : 0.00209026 s/iter 26.349906 +gpu 0 iter : 16 Arret : 0.00174853 s/iter 26.344560 +gpu 0 iter : 17 Arret : 0.00249398 s/iter 26.348383 +gpu 0 iter : 18 Arret : 0.00020801 s/iter 26.354612 +gpu 0 iter : 19 Arret : 1.26142E-07 s/iter 26.370520 +gpu 0 iter : 20 Arret : 5.14341E-10 s/iter 26.370752 +gpu 0 iter : 21 Arret : 2.04751E-12 s/iter 26.372247 +gpu 0 iter : 22 Arret : 8.06082E-15 s/iter 26.364052 +temps : 589.718 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.32595E-08 +Stabilite : 8.06082E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540302 +i* 0.841463| 0.999993| 8.34199E-12 +i* -1.9051E-11| +| 2| -0.553438 +i* -0.832883| 0.999993| 2.30783E-11 +i*-6.91999E-12| +| 3| -0.579282 +i* -0.815119| 0.999993|-1.44751E-12 +i* 7.66798E-12| +| 4| 0.592029 +i* 0.805909| 0.999993| 8.2111E-12 +i* 2.02799E-11| +| 5| -0.604557 +i* -0.796554| 0.999993|-2.82974E-12 +i* 9.99473E-12| +| 6| 0.61698 +i* 0.78697| 0.999993| 9.01823E-12 +i*-5.69156E-12| +| 7| -0.629237 +i* -0.777205| 0.999993|-2.92122E-12 +i*-4.85867E-12| +| 8| 0.641354 +i* 0.767237| 0.999993|-1.64209E-11 +i* 1.12904E-12| +| 9| -0.653299 +i* -0.757092| 0.999993|-8.22453E-13 +i* 2.82818E-12| +| 10| 0.665096 +i* 0.746749| 0.999993| -1.2145E-11 +i* 1.89129E-11| +| 11| -0.676717 +i* -0.736234| 0.999993|-1.26079E-11 +i*-1.25073E-11| +| 12| 0.688185 +i* 0.725526| 0.999993| 2.69875E-11 +i* 1.65411E-11| +| 13| -0.699466 +i* -0.714679| 1.00001| 3.92343E-10 +i*-3.02623E-09| +| 14| 0.710597 +i* 0.70359| 0.999993| -2.6851E-11 +i*-1.44801E-11| +| 15| -0.721517 +i* -0.69241| 1.00001| 2.88447E-09 +i* 3.69506E-09| +| 16| 0.73231 +i* 0.680962| 0.999993|-5.73186E-12 +i* 1.14335E-11| +| 17| -0.742916 +i* -0.669375| 0.999993| 1.59349E-11 +i* 1.71025E-11| +| 18| 0.7533 +i* 0.657691| 1.00001| 1.64587E-09 +i*-3.03669E-09| +| 19| -0.76354 +i* -0.64575| 0.999993| 2.24043E-11 +i*-1.30496E-12| +| 20| 0.773539 +i* 0.633763| 1.00001| -4.2314E-09 +i* 1.86243E-09| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 0.999993 +250000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^300000 + (-10 +i*0)*x^500000 + (1 +i*0)*x^800000 + +(-30000 +i*0)*x^299999 + (-5E+06 +i*0)*x^499999 + (800000 +i*0)*x^799999 + +zone limite de 'log-exp' 1.00044 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 3125 start 0 size 800000 +gpu 0 iter : 1 Arret : 0.00051726 s/iter 46.868704 +gpu 0 iter : 2 Arret : 0.00517255 s/iter 46.735194 +gpu 0 iter : 3 Arret : 0.0728679 s/iter 46.891988 +gpu 0 iter : 4 Arret : 0.771691 s/iter 46.979491 +gpu 0 iter : 5 Arret : 0.75662 s/iter 47.336136 +gpu 0 iter : 6 Arret : 0.635995 s/iter 47.811859 +gpu 0 iter : 7 Arret : 0.505749 s/iter 48.056193 +gpu 0 iter : 8 Arret : 0.931022 s/iter 48.270194 +gpu 0 iter : 9 Arret : 0.398721 s/iter 48.514679 +gpu 0 iter : 10 Arret : 0.247741 s/iter 48.434629 +gpu 0 iter : 11 Arret : 0.0707263 s/iter 48.136785 +gpu 0 iter : 12 Arret : 0.0344289 s/iter 47.624785 +gpu 0 iter : 13 Arret : 0.0278743 s/iter 46.948359 +gpu 0 iter : 14 Arret : 0.0109553 s/iter 46.857728 +gpu 0 iter : 15 Arret : 0.0093023 s/iter 46.844682 +gpu 0 iter : 16 Arret : 0.00935315 s/iter 46.835990 +gpu 0 iter : 17 Arret : 0.0162429 s/iter 46.715238 +gpu 0 iter : 18 Arret : 0.00648616 s/iter 46.741249 +gpu 0 iter : 19 Arret : 0.000839627 s/iter 46.741507 +gpu 0 iter : 20 Arret : 0.00184254 s/iter 46.754071 +gpu 0 iter : 21 Arret : 4.91346E-06 s/iter 46.769016 +gpu 0 iter : 22 Arret : 4.60158E-08 s/iter 46.820581 +gpu 0 iter : 23 Arret : 6.70363E-10 s/iter 46.824110 +gpu 0 iter : 24 Arret : 9.78247E-12 s/iter 46.828052 +gpu 0 iter : 25 Arret : 1.42634E-13 s/iter 46.828472 +temps : 1180.82 seconde(s) +Nb iterations : 25 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.1101E-08 +Stabilite : 1.42634E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841464| 0.999995|-5.33817E-12 +i*-1.81878E-11| +| 2| 0.592014 +i* 0.805922| 0.999995| 2.33948E-11 +i*-2.13005E-11| +| 3| 0.617007 +i* 0.786952| 0.999995| 4.23442E-11 +i* -6.2147E-12| +| 4| 0.641392 +i* 0.767207| 0.999995|-4.99742E-11 +i* 1.43873E-11| +| 5| 0.665146 +i* 0.746707| 0.999995| 2.02977E-11 +i* 7.48579E-12| +| 6| 0.688245 +i* 0.725472| 0.999995|-1.73153E-11 +i* -1.2656E-11| +| 7| 0.710667 +i* 0.703522| 0.999995| 3.69782E-12 +i* 2.3081E-12| +| 8| 0.732388 +i* 0.68088| 0.999995| 9.45355E-12 +i* 2.09024E-11| +| 9| 0.753381 +i* 0.657577| 0.999995| 3.40094E-11 +i* 1.45989E-12| +| 10| 0.77364 +i* 0.633618| 0.999995|-1.72307E-11 +i* 1.22723E-11| +| 11| 0.793138 +i* 0.609034| 0.999995| 3.89222E-12 +i* 2.21356E-11| +| 12| 0.811855 +i* 0.583851| 0.999995|-1.28337E-11 +i*-5.47207E-12| +| 13| 0.829772 +i* 0.558094| 0.999995|-1.63114E-11 +i*-1.64246E-12| +| 14| 0.846873 +i* 0.531786| 0.999995| 3.88137E-11 +i*-3.00611E-11| +| 15| 0.86314 +i* 0.504956| 0.999995|-4.00413E-12 +i* 3.04823E-11| +| 16| 0.878557 +i* 0.477628| 0.999995|-2.16493E-12 +i* 1.10533E-11| +| 17| 0.893104 +i* 0.449841| 0.999995|-1.48552E-11 +i* 1.06063E-11| +| 18| 0.906777 +i* 0.4216| 0.999995|-1.38745E-11 +i* 5.33384E-12| +| 19| 0.919557 +i* 0.392944| 0.999995|-3.33245E-11 +i* 5.94386E-12| +| 20| 0.931433 +i* 0.363901| 0.999995| 4.93219E-11 +i*-2.82651E-11| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 0.999995 +300000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^400000 + (-10 +i*0)*x^600000 + (1 +i*0)*x^1000000 + +(-40000 +i*0)*x^399999 + (-6E+06 +i*0)*x^599999 + (1E+06 +i*0)*x^999999 + +zone limite de 'log-exp' 1.00035 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 0 dimgrid2 3907 start 0 size 1000192 +gpu 0 iter : 1 Arret : 0.00369829 s/iter 72.960026 +gpu 0 iter : 2 Arret : 0.656453 s/iter 73.009854 +gpu 0 iter : 3 Arret : 1.85379 s/iter 73.909530 +gpu 0 iter : 4 Arret : 0.184697 s/iter 73.870387 +gpu 0 iter : 5 Arret : 0.149335 s/iter 73.917721 +gpu 0 iter : 6 Arret : 0.0961951 s/iter 74.759550 +gpu 0 iter : 7 Arret : 0.0847578 s/iter 74.840915 +gpu 0 iter : 8 Arret : 0.0292103 s/iter 74.694556 +gpu 0 iter : 9 Arret : 0.0283648 s/iter 74.484213 +gpu 0 iter : 10 Arret : 0.0181273 s/iter 73.989131 +gpu 0 iter : 11 Arret : 0.0158134 s/iter 73.602331 +gpu 0 iter : 12 Arret : 0.0047499 s/iter 73.110712 +gpu 0 iter : 13 Arret : 0.00558216 s/iter 73.004439 +gpu 0 iter : 14 Arret : 0.00502349 s/iter 72.957971 +gpu 0 iter : 15 Arret : 0.00203782 s/iter 72.966516 +gpu 0 iter : 16 Arret : 0.000101539 s/iter 72.953065 +gpu 0 iter : 17 Arret : 0.000105985 s/iter 72.981166 +gpu 0 iter : 18 Arret : 7.62032E-06 s/iter 72.955710 +gpu 0 iter : 19 Arret : 2.53593E-08 s/iter 72.953928 +gpu 0 iter : 20 Arret : 2.22162E-10 s/iter 72.808169 +gpu 0 iter : 21 Arret : 3.30983E-12 s/iter 72.824788 +gpu 0 iter : 22 Arret : 4.92853E-14 s/iter 72.871341 +temps : 1621.79 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.65132E-08 +Stabilite : 4.92853E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841476| 1.00001| 4.82795E-10 +i* 3.31212E-09| +| 2| 0.52971 +i* 0.848174| 0.999996|-2.56639E-12 +i*-3.27674E-11| +| 3| 0.524361 +i* 0.851491| 0.999996|-2.47296E-11 +i* 1.78327E-11| +| 4| 0.519019 +i* 0.854758| 0.999996|-1.39375E-11 +i* 5.79731E-12| +| 5| 0.513629 +i* 0.858008| 0.999996| 2.32483E-11 +i* 6.70747E-12| +| 6| 0.508237 +i* 0.861213| 0.999996|-1.34339E-11 +i* 9.87854E-12| +| 7| 0.502834 +i* 0.864379| 0.999996|-2.85585E-11 +i* 6.91519E-12| +| 8| 0.497384 +i* 0.867526| 0.999996| 2.97429E-11 +i*-6.06626E-13| +| 9| 0.491942 +i* 0.870624| 0.999996| -1.9825E-11 +i*-1.52329E-11| +| 10| 0.486452 +i* 0.873703| 0.999996| 3.0312E-11 +i* 1.02214E-11| +| 11| 0.480962 +i* 0.876737| 0.999996| 1.81546E-11 +i* 8.04012E-12| +| 12| 0.475453 +i* 0.879736| 0.999996| 3.09861E-11 +i* 4.093E-12| +| 13| 0.469917 +i* 0.882706| 0.999996|-1.29106E-11 +i*-2.31489E-11| +| 14| 0.46438 +i* 0.885632| 0.999996| 1.33844E-11 +i*-1.06731E-12| +| 15| 0.458797 +i* 0.888537| 0.999996| 2.78862E-11 +i* 1.10441E-11| +| 16| 0.453214 +i* 0.891397| 0.999996| 2.45506E-11 +i* 3.1726E-11| +| 17| 0.447623 +i* 0.894218| 0.999996| 3.85803E-11 +i* 3.3129E-11| +| 18| 0.441986 +i* 0.897017| 0.999996| 2.72476E-11 +i* 3.22485E-11| +| 19| 0.43636 +i* 0.899768| 0.999996| 3.23241E-12 +i* 9.4037E-12| +| 20| 0.430689 +i* 0.902496| 0.999996|-1.25435E-11 +i* 3.86925E-13| ++---+----------------------------+------------+----------------------------+ +400000 racines de module = 1.00001 +600000 racines de module = 0.999996 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^700000 + (1 +i*0)*x^1200000 + +(-50000 +i*0)*x^499999 + (-7E+06 +i*0)*x^699999 + (1.2E+06 +i*0)*x^1199999 + +zone limite de 'log-exp' 1.0003 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 0 dimgrid2 4688 start 0 size 1200128 +gpu 0 iter : 1 Arret : 0.0182376 s/iter 104.837597 +gpu 0 iter : 2 Arret : 1.12373 s/iter 108.563668 +gpu 0 iter : 3 Arret : 0.426381 s/iter 110.022983 +gpu 0 iter : 4 Arret : 0.721244 s/iter 111.488820 +gpu 0 iter : 5 Arret : 1.17091 s/iter 111.916174 +gpu 0 iter : 6 Arret : 0.351155 s/iter 112.354360 +gpu 0 iter : 7 Arret : 0.375654 s/iter 113.067528 +gpu 0 iter : 8 Arret : 1.04032 s/iter 113.381487 +gpu 0 iter : 9 Arret : 1.12875 s/iter 114.128347 +gpu 0 iter : 10 Arret : 12.358 s/iter 114.591594 +gpu 0 iter : 11 Arret : 1.18398 s/iter 114.167437 +gpu 0 iter : 12 Arret : 4.45048 s/iter 113.754284 +gpu 0 iter : 13 Arret : 5.09703 s/iter 112.914247 +gpu 0 iter : 14 Arret : 1.04453 s/iter 112.076259 +gpu 0 iter : 15 Arret : 3.05711 s/iter 111.467739 +gpu 0 iter : 16 Arret : 0.859735 s/iter 110.945464 +gpu 0 iter : 17 Arret : 4.25309 s/iter 110.793391 +gpu 0 iter : 18 Arret : 0.893951 s/iter 110.388272 +gpu 0 iter : 19 Arret : 0.603038 s/iter 110.132291 +gpu 0 iter : 20 Arret : 3.09335 s/iter 109.413247 +gpu 0 iter : 21 Arret : 1.28616 s/iter 109.106140 +gpu 0 iter : 22 Arret : 2.25952 s/iter 109.082492 +gpu 0 iter : 23 Arret : 1.67614 s/iter 108.802369 +gpu 0 iter : 24 Arret : 0.645561 s/iter 108.387380 +gpu 0 iter : 25 Arret : 0.661038 s/iter 108.106268 +gpu 0 iter : 26 Arret : 0.728448 s/iter 107.627940 +gpu 0 iter : 27 Arret : 0.456849 s/iter 107.304474 +gpu 0 iter : 28 Arret : 0.254278 s/iter 106.811137 +gpu 0 iter : 29 Arret : 0.111958 s/iter 106.339104 +gpu 0 iter : 30 Arret : 0.0531874 s/iter 105.891059 +gpu 0 iter : 31 Arret : 0.0531871 s/iter 105.523621 +gpu 0 iter : 32 Arret : 0.013254 s/iter 105.034027 +gpu 0 iter : 33 Arret : 0.00334602 s/iter 104.894966 +gpu 0 iter : 34 Arret : 0.00027649 s/iter 104.840988 +gpu 0 iter : 35 Arret : 1.17344E-07 s/iter 104.858305 +gpu 0 iter : 36 Arret : 4.79311E-10 s/iter 104.840632 +gpu 0 iter : 37 Arret : 1.90774E-12 s/iter 104.820758 +gpu 0 iter : 38 Arret : 8.88875E-15 s/iter 104.804403 +temps : 4148.3 seconde(s) +Nb iterations : 38 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.76717E-08 +Stabilite : 8.88875E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540312 +i* 0.841461| 0.999997|-2.16913E-11 +i* 1.91294E-11| +| 2| 0.513645 +i* 0.857999| 0.999997|-6.29718E-12 +i*-2.39364E-12| +| 3| 0.486457 +i* 0.873701| 0.999997| 1.53235E-11 +i* 6.36435E-13| +| 4| 0.458797 +i* 0.888537| 0.999997| 1.72345E-11 +i* 1.48229E-11| +| 5| 0.430698 +i* 0.902501| 1| 9.83414E-09 +i*-4.46881E-09| +| 6| 0.402138 +i* 0.915584| 1|-5.37264E-09 +i* 9.04446E-09| +| 7| 0.3732 +i* 0.927747| 0.999997|-1.54374E-11 +i*-2.76083E-11| +| 8| 0.3439 +i* 0.939003| 0.999997|-1.12714E-11 +i* 1.5453E-11| +| 9| 0.314261 +i* 0.949333| 0.999997| 1.93628E-11 +i* 2.50909E-11| +| 10| 0.284313 +i* 0.958728| 0.999997| 2.69426E-11 +i* 2.77974E-11| +| 11| 0.254084 +i* 0.967179| 0.999997| 1.5277E-11 +i* 4.73027E-12| +| 12| 0.223605 +i* 0.974676| 0.999997| -8.1017E-11 +i*-3.77299E-11| +| 13| 0.192915 +i* 0.981212| 0.999997| 1.07495E-11 +i* 5.766E-12| +| 14| 0.162034 +i* 0.986782| 0.999997| 3.99512E-11 +i* 6.63664E-12| +| 15| 0.130977 +i* 0.991382| 0.999997| 5.89659E-11 +i* 7.29122E-12| +| 16| 0.0997987 +i* 0.995004| 0.999997|-2.34084E-11 +i*-4.34534E-12| +| 17| 0.0685225 +i* 0.997646| 0.999997| 2.33641E-11 +i* 2.51787E-12| +| 18| 0.0371629 +i* 0.999314| 1| 1.55887E-09 +i*-4.23222E-09| +| 19| 0.00578048 +i* 0.99998| 0.999997| 3.46787E-11 +i* 1.94857E-13| +| 20| -0.0256056 +i* 0.999669| 0.999997| 2.01068E-11 +i*-1.22213E-12| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 0.999997 +500000 racines de module = 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^600000 + (-10 +i*0)*x^800000 + (1 +i*0)*x^1400000 + +(-60000 +i*0)*x^599999 + (-8E+06 +i*0)*x^799999 + (1.4E+06 +i*0)*x^1399999 + +zone limite de 'log-exp' 1.00025 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 0 dimgrid2 5469 start 0 size 1400064 +gpu 0 iter : 1 Arret : 0.00928965 s/iter 142.375846 +gpu 0 iter : 2 Arret : 0.576413 s/iter 147.373084 +gpu 0 iter : 3 Arret : 0.762551 s/iter 150.232559 +gpu 0 iter : 4 Arret : 1.07413 s/iter 151.768093 +gpu 0 iter : 5 Arret : 0.0991065 s/iter 153.056251 +gpu 0 iter : 6 Arret : 0.123507 s/iter 152.742000 +gpu 0 iter : 7 Arret : 0.136183 s/iter 152.857808 +gpu 0 iter : 8 Arret : 0.113786 s/iter 152.881427 +gpu 0 iter : 9 Arret : 0.0800623 s/iter 152.835777 +gpu 0 iter : 10 Arret : 0.0571798 s/iter 151.922898 +gpu 0 iter : 11 Arret : 0.0727241 s/iter 150.276395 +gpu 0 iter : 12 Arret : 0.0702862 s/iter 147.770220 +gpu 0 iter : 13 Arret : 0.0246309 s/iter 145.850735 +gpu 0 iter : 14 Arret : 0.0213611 s/iter 144.099565 +gpu 0 iter : 15 Arret : 0.0247135 s/iter 143.346943 +gpu 0 iter : 16 Arret : 0.0164575 s/iter 142.914262 +gpu 0 iter : 17 Arret : 0.00452215 s/iter 142.729324 +gpu 0 iter : 18 Arret : 0.00260492 s/iter 142.530031 +gpu 0 iter : 19 Arret : 0.000151029 s/iter 142.510219 +gpu 0 iter : 20 Arret : 1.40988E-06 s/iter 142.510180 +gpu 0 iter : 21 Arret : 1.38776E-08 s/iter 142.480080 +gpu 0 iter : 22 Arret : 1.91581E-10 s/iter 142.453226 +gpu 0 iter : 23 Arret : 2.63708E-12 s/iter 142.412633 +gpu 0 iter : 24 Arret : 3.63243E-14 s/iter 142.487841 +temps : 3523.14 seconde(s) +Nb iterations : 24 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.65661E-08 +Stabilite : 3.63243E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841469| 0.999997|-8.47142E-11 +i* 1.92466E-11| +| 2| 0.513623 +i* 0.858013| 0.999997|-2.15776E-11 +i*-2.98557E-11| +| 3| -0.52703 +i* -0.849843| 0.999997|-6.50922E-11 +i* 8.44216E-12| +| 4| 0.486439 +i* 0.873711| 0.999997| 5.60277E-11 +i* 4.36779E-11| +| 5| -0.500096 +i* -0.865967| 0.999997| 3.56147E-11 +i*-3.12713E-11| +| 6| 0.458776 +i* 0.888549| 0.999997|-1.89702E-11 +i* 4.08274E-12| +| 7| -0.472669 +i* -0.881237| 0.999997|-1.66496E-11 +i*-3.61498E-11| +| 8| 0.430661 +i* 0.902511| 0.999997|-1.60558E-11 +i*-1.29949E-11| +| 9| -0.444791 +i* -0.895631| 0.999997| 3.68259E-11 +i* 1.36002E-12| +| 10| 0.402136 +i* 0.915577| 0.999997| 6.5834E-12 +i* -1.3935E-11| +| 11| -0.416439 +i* -0.90916| 0.999997|-1.66807E-11 +i* 2.56219E-11| +| 12| 0.373179 +i* 0.927756| 0.999997| 2.89372E-11 +i*-2.61371E-11| +| 13| -0.387698 +i* -0.921783| 0.999997|-1.86324E-11 +i* -4.6545E-11| +| 14| 0.343875 +i* 0.939012| 0.999997| 3.06317E-11 +i* 7.08794E-11| +| 15| -0.358575 +i* -0.933498| 0.999997|-4.93405E-11 +i*-7.15173E-13| +| 16| 0.314233 +i* 0.949343| 0.999997| 3.86503E-11 +i* 2.08775E-11| +| 17| -0.329098 +i* -0.944293| 0.999997|-1.57903E-11 +i* 2.05052E-11| +| 18| 0.284281 +i* 0.958738| 0.999997| 2.51592E-11 +i* 2.09243E-11| +| 19| -0.299297 +i* -0.954157| 0.999997| 5.03608E-12 +i* 1.70503E-11| +| 20| 0.254048 +i* 0.967189| 0.999997|-2.81228E-11 +i*-1.66302E-11| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 0.999997 +600000 racines de module = 1 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140100: line 23: 13069 Segmentation fault (core dumped) ./template -r -i 900000 700000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140100: line 24: 13073 Segmentation fault (core dumped) ./template -r -i 1000000 800000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140100: line 25: 13075 Segmentation fault (core dumped) ./template -r -i 1500000 500000 diff --git a/Simulations/sparse_openmp/sparse_openmp_1GPU.sge b/Simulations/sparse_openmp/sparse_openmp_1GPU.sge new file mode 100755 index 0000000..ceb97b1 --- /dev/null +++ b/Simulations/sparse_openmp/sparse_openmp_1GPU.sge @@ -0,0 +1,27 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=1 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -pe openmp 1 +#$ -V +#$ -cwd +#$ -N sparse_openmp_1GPU + +module load gcc/4.9.0 +module load cuda/7.0 +export OMP_NUM_THREADS=1 + +./template -r -i 60000 40000 +./template -r -i 150000 50000 +./template -r -i 250000 150000 +./template -r -i 350000 250000 +./template -r -i 500000 300000 +./template -r -i 600000 400000 +./template -r -i 700000 500000 +./template -r -i 800000 600000 +./template -r -i 900000 700000 +./template -r -i 1000000 800000 +./template -r -i 1500000 500000 + + diff --git a/Simulations/sparse_openmp/sparse_openmp_2GPU.o140099 b/Simulations/sparse_openmp/sparse_openmp_2GPU.o140099 new file mode 100644 index 0000000..b18a418 --- /dev/null +++ b/Simulations/sparse_openmp/sparse_openmp_2GPU.o140099 @@ -0,0 +1,534 @@ +REMAINING: 2 +Taking GPU #0 +Taking GPU #1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^40000 + (-10 +i*0)*x^60000 + (1 +i*0)*x^100000 + +(-4000 +i*0)*x^39999 + (-600000 +i*0)*x^59999 + (100000 +i*0)*x^99999 + +zone limite de 'log-exp' 1.00356 +CPU thread 1 (of 2) uses CUDA device 1 +CPU thread 0 (of 2) uses CUDA device 0 +gpu 0 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 0 dimgrid2 196 start 0 size 50048 +gpu 1 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 1 dimgrid2 196 start 50048 size 50048 +gpu 0 iter : 1 Arret : 0.00380313 s/iter 0.441566 +gpu 0 iter : 2 Arret : 0.00367222 s/iter 0.441506 +gpu 0 iter : 3 Arret : 0.00329063 s/iter 0.441545 +gpu 0 iter : 4 Arret : 0.00599232 s/iter 0.441517 +gpu 0 iter : 5 Arret : 0.00559475 s/iter 0.441533 +gpu 0 iter : 6 Arret : 0.0062995 s/iter 0.441538 +gpu 0 iter : 7 Arret : 0.00458799 s/iter 0.441558 +gpu 0 iter : 8 Arret : 0.00622521 s/iter 0.441510 +gpu 0 iter : 9 Arret : 0.0073983 s/iter 0.439550 +gpu 0 iter : 10 Arret : 0.00804763 s/iter 0.441536 +gpu 0 iter : 11 Arret : 0.00548469 s/iter 0.441528 +gpu 0 iter : 12 Arret : 0.00120813 s/iter 0.441416 +gpu 0 iter : 13 Arret : 0.000406962 s/iter 0.441414 +gpu 0 iter : 14 Arret : 0.00112455 s/iter 0.441391 +gpu 0 iter : 15 Arret : 0.000729656 s/iter 0.441398 +gpu 0 iter : 16 Arret : 6.06095E-06 s/iter 0.441340 +gpu 0 iter : 17 Arret : 1.51135E-08 s/iter 0.441471 +gpu 0 iter : 18 Arret : 4.78213E-11 s/iter 0.441372 +gpu 0 iter : 19 Arret : 1.51316E-13 s/iter 0.441309 +temps : 9.12342 seconde(s) +Nb iterations : 19 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.21439E-09 +Stabilite : 1.51316E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54036 +i* 0.841503| 1.00006|-5.00602E-11 +i* 9.0853E-12| +| 2| -0.113164 +i* 0.993538| 0.999962|-4.34919E-12 +i* 9.60242E-13| +| 3| -0.226732 +i* -0.974016| 1.00006|-1.34468E-09 +i*-3.70749E-10| +| 4| -0.715763 +i* 0.698289| 0.999962| 9.11271E-13 +i* 2.47219E-12| +| 5| 0.439922 +i* -0.897993| 0.999962|-3.49498E-13 +i* 1.66432E-12| +| 6| -0.996122 +i* 0.0886386| 1.00006| 4.72785E-10 +i* 4.13616E-11| +| 7| 0.908546 +i* -0.417692| 0.999962| 4.78506E-13 +i* 1.54377E-13| +| 8| -0.827813 +i* -0.560935| 0.999962| 9.76996E-13 +i*-2.04309E-12| +| 9| 0.968129 +i* 0.250682| 1.00006| 1.35693E-10 +i*-3.47657E-10| +| 10| -0.286842 +i* -0.958038| 1.00006|-5.93554E-10 +i*-2.45345E-10| +| 11| 0.591653 +i* 0.806145| 0.999962|-9.87654E-13 +i*-3.03635E-12| +| 12| -0.0511836 +i* 0.998651| 0.999962|-2.22622E-12 +i*-3.69013E-14| +| 13| -0.67097 +i* 0.741432| 0.999962|-8.03801E-14 +i*-1.68204E-12| +| 14| 0.383249 +i* -0.923603| 0.999962|-1.29119E-12 +i*-1.37426E-12| +| 15| -0.988685 +i* 0.15039| 1.00006|-1.61051E-10 +i* 7.18515E-11| +| 16| 0.880824 +i* -0.473363| 0.999962| 1.58029E-12 +i*-2.34379E-12| +| 17| -0.861082 +i* -0.508391| 0.999962| 1.02962E-12 +i*-4.51911E-12| +| 18| 0.981895 +i* 0.189225| 0.999962|-4.05187E-12 +i* 1.36536E-13| +| 19| -0.345842 +i* -0.938354| 1.00006| 1.38421E-10 +i*-2.31696E-10| +| 20| 0.640621 +i* 0.767807| 0.999962|-6.98774E-13 +i* 1.13798E-12| ++---+----------------------------+------------+----------------------------+ +40000 racines de module = 1.00006 +60000 racines de module = 0.999962 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^50000 + (-10 +i*0)*x^150000 + (1 +i*0)*x^200000 + +(-5000 +i*0)*x^49999 + (-1.5E+06 +i*0)*x^149999 + (200000 +i*0)*x^199999 + +zone limite de 'log-exp' 1.00178 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 1 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 1 dimgrid2 391 start 100096 size 100096 +gpu 0 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 0 dimgrid2 391 start 0 size 100096 +gpu 0 iter : 1 Arret : 0.000107626 s/iter 1.547978 +gpu 0 iter : 2 Arret : 9.81369E-05 s/iter 1.548082 +gpu 0 iter : 3 Arret : 0.000765995 s/iter 1.548065 +gpu 0 iter : 4 Arret : 0.000973277 s/iter 1.548057 +gpu 0 iter : 5 Arret : 0.00848586 s/iter 1.548089 +gpu 0 iter : 6 Arret : 0.0120973 s/iter 1.707264 +gpu 0 iter : 7 Arret : 0.029256 s/iter 1.698285 +gpu 0 iter : 8 Arret : 0.134426 s/iter 1.548025 +gpu 0 iter : 9 Arret : 0.152262 s/iter 1.549290 +gpu 0 iter : 10 Arret : 0.121741 s/iter 1.710977 +gpu 0 iter : 11 Arret : 0.196968 s/iter 1.549235 +gpu 0 iter : 12 Arret : 0.832961 s/iter 1.703810 +gpu 0 iter : 13 Arret : 0.389199 s/iter 1.552020 +gpu 0 iter : 14 Arret : 0.303622 s/iter 1.712838 +gpu 0 iter : 15 Arret : 0.0708981 s/iter 1.549269 +gpu 0 iter : 16 Arret : 0.0516286 s/iter 1.547858 +gpu 0 iter : 17 Arret : 0.0237403 s/iter 1.547965 +gpu 0 iter : 18 Arret : 0.00575736 s/iter 1.548048 +gpu 0 iter : 19 Arret : 0.00016543 s/iter 1.547970 +gpu 0 iter : 20 Arret : 8.19796E-06 s/iter 1.547960 +gpu 0 iter : 21 Arret : 1.89926E-09 s/iter 1.548018 +gpu 0 iter : 22 Arret : 1.89968E-13 s/iter 1.548057 +temps : 35.62 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 9.49941E-05 +Stabilite : 5.04191E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540303 +i* 0.841453| 0.999985| 1.08703E-11 +i*-2.49217E-12| +| 2| -0.837195 +i* 0.546877| 0.999985| -5.4492E-12 +i* 1.09163E-12| +| 3| -0.553418 +i* -0.832885| 0.999985| -1.9722E-12 +i*-7.40397E-12| +| 4| 0.828599 +i* -0.559925| 1.00005|-7.54521E-09 +i* 1.47059E-08| +| 5| -0.8197 +i* 0.572767| 0.999985|-4.21663E-13 +i* -2.8616E-12| +| 6| -0.57917 +i* -0.815188| 0.999985|-5.13034E-12 +i*-1.52645E-12| +| 7| 0.810626 +i* -0.585537| 0.999985|-6.36846E-12 +i*-5.86797E-12| +| 8| 0.591872 +i* 0.806089| 1.00005|-1.69803E-09 +i* 9.43795E-09| +| 9| -0.801454 +i* 0.598134| 1.00005|-3.72767E-08 +i*-1.30274E-08| +| 10| -0.604356 +i* -0.796695| 0.999985|-1.64091E-13 +i* 1.59084E-12| +| 11| 0.791937 +i* -0.610578| 0.999985| 6.0707E-13 +i* 1.52922E-12| +| 12| 0.616763 +i* 0.78713| 0.999985|-4.48042E-12 +i* -2.6295E-12| +| 13| -0.782301 +i* 0.622877| 0.999985|-2.15827E-12 +i*-6.27114E-12| +| 14| -0.628991 +i* -0.777472| 1.00005| 6.93065E-09 +i*-8.65443E-09| +| 15| 0.772474 +i* -0.635023| 0.999985| 1.54783E-11 +i*-1.81338E-12| +| 16| 0.641054 +i* 0.767476| 0.999985| 9.05009E-12 +i*-2.91295E-12| +| 17| -0.762458 +i* 0.647014| 0.999985| 5.81724E-12 +i*-9.99384E-12| +| 18| -0.652967 +i* -0.757366| 0.999985|-6.31406E-12 +i* 8.49495E-12| +| 19| 0.752302 +i* -0.658888| 1.00005| 3.99107E-09 +i* 1.02117E-08| +| 20| 0.66472 +i* 0.747072| 0.999985|-7.79776E-12 +i*-2.52076E-13| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 0.999985 +50000 racines de module = 1.00005 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^150000 + (-10 +i*0)*x^250000 + (1 +i*0)*x^400000 + +(-15000 +i*0)*x^149999 + (-2.5E+06 +i*0)*x^249999 + (400000 +i*0)*x^399999 + +zone limite de 'log-exp' 1.00089 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 0 dimgrid2 782 start 0 size 200064 +gpu 1 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 1 dimgrid2 782 start 200064 size 200064 +gpu 0 iter : 1 Arret : 0.000533421 s/iter 6.081044 +gpu 0 iter : 2 Arret : 0.00294166 s/iter 6.077042 +gpu 0 iter : 3 Arret : 0.00816274 s/iter 6.076551 +gpu 0 iter : 4 Arret : 0.0970896 s/iter 6.051363 +gpu 0 iter : 5 Arret : 0.1861 s/iter 6.117092 +gpu 0 iter : 6 Arret : 0.205221 s/iter 6.087839 +gpu 0 iter : 7 Arret : 0.0897097 s/iter 6.084694 +gpu 0 iter : 8 Arret : 0.0591358 s/iter 6.078173 +gpu 0 iter : 9 Arret : 0.023858 s/iter 6.079091 +gpu 0 iter : 10 Arret : 0.00304425 s/iter 6.076912 +gpu 0 iter : 11 Arret : 0.00136708 s/iter 6.063903 +gpu 0 iter : 12 Arret : 0.000789721 s/iter 6.076452 +gpu 0 iter : 13 Arret : 0.00195862 s/iter 6.078631 +gpu 0 iter : 14 Arret : 0.00243823 s/iter 6.075599 +gpu 0 iter : 15 Arret : 0.000282668 s/iter 6.076158 +gpu 0 iter : 16 Arret : 4.27745E-05 s/iter 6.075788 +gpu 0 iter : 17 Arret : 4.20725E-06 s/iter 6.077506 +gpu 0 iter : 18 Arret : 1.6828E-08 s/iter 6.078853 +gpu 0 iter : 19 Arret : 3.63614E-11 s/iter 6.079236 +gpu 0 iter : 20 Arret : 1.38589E-13 s/iter 6.077430 +temps : 122.327 seconde(s) +Nb iterations : 20 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.45366E-07 +Stabilite : 1.02274E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540319 +i* 0.841478| 1.00002|-2.32809E-09 +i* 1.97672E-09| +| 2| -0.998329 +i* 0.057622| 0.999991| 4.43912E-12 +i* 1.27665E-12| +| 3| 0.43989 +i* -0.898041| 0.999991|-2.08855E-12 +i*-1.75276E-12| +| 4| -0.996033 +i* 0.0888768| 0.999991|-3.15592E-12 +i* 1.17456E-12| +| 5| 0.411533 +i* -0.911385| 0.999991|-2.45048E-12 +i* 4.6238E-12| +| 6| 0.59196 +i* 0.805956| 0.999991| 5.24358E-13 +i*-8.53073E-12| +| 7| -0.992759 +i* 0.120044| 0.999991| 2.58804E-12 +i* 2.47274E-12| +| 8| 0.382796 +i* -0.923823| 0.999991| 1.11042E-11 +i*-9.27687E-12| +| 9| 0.616925 +i* 0.78701| 0.999991| 4.27514E-12 +i*-1.13966E-11| +| 10| -0.98851 +i* 0.151094| 0.999991|-1.29017E-11 +i*-4.43427E-12| +| 11| 0.35366 +i* -0.935364| 0.999991|-1.92664E-11 +i* 1.19958E-11| +| 12| 0.641283 +i* 0.767292| 0.999991|-4.70735E-12 +i* -1.4127E-11| +| 13| -0.98329 +i* 0.181995| 0.999991|-6.62759E-12 +i*-5.46796E-12| +| 14| 0.324176 +i* -0.945987| 0.999991|-5.20695E-12 +i*-7.06984E-12| +| 15| 0.665012 +i* 0.746821| 0.999991| 5.27178E-12 +i*-4.27913E-12| +| 16| -0.977104 +i* 0.212717| 0.999991|-1.01148E-11 +i* 2.41479E-12| +| 17| 0.294374 +i* -0.955681| 0.999991|-2.37395E-11 +i*-2.53098E-12| +| 18| 0.688087 +i* 0.725616| 0.999991| 6.67011E-12 +i* 1.57173E-11| +| 19| -0.969965 +i* 0.243206| 0.999991| 6.88072E-12 +i* 3.20268E-13| +| 20| 0.264283 +i* -0.964436| 0.999991|-6.93356E-12 +i*-6.23118E-12| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1.00002 +250000 racines de module = 0.999991 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^250000 + (-10 +i*0)*x^350000 + (1 +i*0)*x^600000 + +(-25000 +i*0)*x^249999 + (-3.5E+06 +i*0)*x^349999 + (600000 +i*0)*x^599999 + +zone limite de 'log-exp' 1.00059 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 1172 start 0 size 300032 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 1172 start 300032 size 300032 +gpu 0 iter : 1 Arret : 0.00183894 s/iter 13.264868 +gpu 0 iter : 2 Arret : 0.00332589 s/iter 13.263027 +gpu 0 iter : 3 Arret : 0.0778545 s/iter 13.329862 +gpu 0 iter : 4 Arret : 0.134953 s/iter 13.784249 +gpu 0 iter : 5 Arret : 0.100777 s/iter 14.153947 +gpu 0 iter : 6 Arret : 0.107368 s/iter 13.911608 +gpu 0 iter : 7 Arret : 0.112184 s/iter 13.982400 +gpu 0 iter : 8 Arret : 0.0819523 s/iter 13.863669 +gpu 0 iter : 9 Arret : 0.0470621 s/iter 13.750970 +gpu 0 iter : 10 Arret : 0.0265395 s/iter 13.686381 +gpu 0 iter : 11 Arret : 0.0114418 s/iter 13.768352 +gpu 0 iter : 12 Arret : 0.0132102 s/iter 13.687711 +gpu 0 iter : 13 Arret : 0.0107799 s/iter 13.263263 +gpu 0 iter : 14 Arret : 0.00702915 s/iter 13.271004 +gpu 0 iter : 15 Arret : 0.00272883 s/iter 13.265259 +gpu 0 iter : 16 Arret : 0.000385595 s/iter 13.264764 +gpu 0 iter : 17 Arret : 0.000332015 s/iter 13.264693 +gpu 0 iter : 18 Arret : 0.000909613 s/iter 13.264925 +gpu 0 iter : 19 Arret : 9.10926E-07 s/iter 13.264547 +gpu 0 iter : 20 Arret : 4.37366E-09 s/iter 13.265195 +gpu 0 iter : 21 Arret : 1.73951E-11 s/iter 13.264664 +gpu 0 iter : 22 Arret : 6.9226E-14 s/iter 13.264587 +temps : 297.898 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.80963E-08 +Stabilite : 6.9226E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540302 +i* 0.841463| 0.999993| 8.34199E-12 +i* -1.9051E-11| +| 2| -0.553438 +i* -0.832883| 0.999993|-2.10654E-12 +i*-2.55273E-11| +| 3| -0.579282 +i* -0.815119| 0.999993|-1.44751E-12 +i* 7.66798E-12| +| 4| 0.592012 +i* 0.805941| 1.00001| 4.1526E-09 +i* 1.02046E-09| +| 5| -0.604557 +i* -0.796554| 0.999993|-2.82974E-12 +i* 9.99473E-12| +| 6| 0.61698 +i* 0.78697| 0.999993|-4.77973E-12 +i* 2.40621E-11| +| 7| -0.629237 +i* -0.777205| 0.999993|-2.92122E-12 +i*-4.85867E-12| +| 8| 0.641354 +i* 0.767237| 0.999993|-1.64209E-11 +i* 1.12904E-12| +| 9| -0.653299 +i* -0.757092| 0.999993|-8.22453E-13 +i* 2.82818E-12| +| 10| 0.665096 +i* 0.746749| 0.999993| -1.2145E-11 +i* 1.89129E-11| +| 11| -0.676717 +i* -0.736234| 0.999993|-1.26079E-11 +i*-1.25073E-11| +| 12| 0.688185 +i* 0.725526| 0.999993|-4.43978E-12 +i*-2.31382E-11| +| 13| -0.699466 +i* -0.714679| 1.00001| 3.92343E-10 +i*-3.02623E-09| +| 14| 0.710597 +i* 0.70359| 0.999993| -2.6851E-11 +i*-1.44801E-11| +| 15| -0.721524 +i* -0.69238| 0.999993| 2.63193E-11 +i*-6.76318E-13| +| 16| 0.73231 +i* 0.680962| 0.999993| 1.34706E-11 +i*-4.43489E-12| +| 17| -0.742928 +i* -0.669362| 0.999993| 3.04134E-12 +i*-9.84154E-12| +| 18| 0.7533 +i* 0.657691| 1.00001|-2.76219E-09 +i* 4.10298E-09| +| 19| -0.76354 +i* -0.64575| 0.999993| 2.24043E-11 +i*-1.30496E-12| +| 20| 0.773543 +i* 0.633733| 0.999993| 6.56308E-12 +i* 2.27492E-11| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 0.999993 +250000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^300000 + (-10 +i*0)*x^500000 + (1 +i*0)*x^800000 + +(-30000 +i*0)*x^299999 + (-5E+06 +i*0)*x^499999 + (800000 +i*0)*x^799999 + +zone limite de 'log-exp' 1.00044 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 1563 start 400000 size 400000 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 1563 start 0 size 400000 +gpu 0 iter : 1 Arret : 0.000985945 s/iter 23.676133 +gpu 0 iter : 2 Arret : 0.00575711 s/iter 23.813100 +gpu 0 iter : 3 Arret : 0.80372 s/iter 23.766696 +gpu 0 iter : 4 Arret : 1.12755 s/iter 23.828097 +gpu 0 iter : 5 Arret : 0.927252 s/iter 23.871271 +gpu 0 iter : 6 Arret : 1.8727 s/iter 23.858341 +gpu 0 iter : 7 Arret : 1.02108 s/iter 24.362443 +gpu 0 iter : 8 Arret : 0.40485 s/iter 24.813205 +gpu 0 iter : 9 Arret : 0.204025 s/iter 24.848475 +gpu 0 iter : 10 Arret : 0.322307 s/iter 24.766030 +gpu 0 iter : 11 Arret : 0.966794 s/iter 24.450352 +gpu 0 iter : 12 Arret : 0.519786 s/iter 24.347418 +gpu 0 iter : 13 Arret : 0.209179 s/iter 24.204030 +gpu 0 iter : 14 Arret : 0.0738373 s/iter 23.789427 +gpu 0 iter : 15 Arret : 0.0394797 s/iter 23.786761 +gpu 0 iter : 16 Arret : 0.0224964 s/iter 23.792150 +gpu 0 iter : 17 Arret : 0.0104646 s/iter 23.802294 +gpu 0 iter : 18 Arret : 0.00882482 s/iter 23.804999 +gpu 0 iter : 19 Arret : 0.000586803 s/iter 23.663425 +gpu 0 iter : 20 Arret : 1.2904E-06 s/iter 23.667331 +gpu 0 iter : 21 Arret : 2.17443E-08 s/iter 23.669417 +gpu 0 iter : 22 Arret : 3.31651E-10 s/iter 23.663042 +gpu 0 iter : 23 Arret : 5.05742E-12 s/iter 23.667395 +gpu 0 iter : 24 Arret : 7.71156E-14 s/iter 23.671701 +temps : 576.437 seconde(s) +Nb iterations : 24 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.80859E-08 +Stabilite : 7.7914E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841464| 0.999995|-5.33817E-12 +i*-1.81878E-11| +| 2| 0.592014 +i* 0.805922| 0.999995|-1.82734E-11 +i* 2.10218E-11| +| 3| 0.617007 +i* 0.786952| 0.999995| 4.23442E-11 +i* -6.2147E-12| +| 4| 0.641392 +i* 0.767207| 0.999995|-4.99742E-11 +i* 1.43873E-11| +| 5| 0.665146 +i* 0.746707| 0.999995| 2.02977E-11 +i* 7.48579E-12| +| 6| 0.688245 +i* 0.725472| 0.999995|-1.73153E-11 +i* -1.2656E-11| +| 7| 0.710667 +i* 0.703522| 0.999995| 3.69782E-12 +i* 2.3081E-12| +| 8| 0.732388 +i* 0.68088| 0.999995| 9.45355E-12 +i* 2.09024E-11| +| 9| 0.753381 +i* 0.657577| 0.999995|-1.40248E-11 +i* 5.11502E-11| +| 10| 0.77364 +i* 0.633618| 0.999995|-1.72307E-11 +i* 1.22723E-11| +| 11| 0.793138 +i* 0.609034| 0.999995| 3.89222E-12 +i* 2.21356E-11| +| 12| 0.811855 +i* 0.583851| 0.999995|-1.28337E-11 +i*-5.47207E-12| +| 13| 0.829772 +i* 0.558094| 0.999995|-1.63114E-11 +i*-1.64246E-12| +| 14| 0.846873 +i* 0.531786| 0.999995|-1.80345E-12 +i* 5.96675E-11| +| 15| 0.86314 +i* 0.504956| 0.999995|-4.00413E-12 +i* 3.04823E-11| +| 16| 0.878557 +i* 0.477628| 0.999995|-2.16493E-12 +i* 1.10533E-11| +| 17| 0.893104 +i* 0.449841| 0.999995|-1.48552E-11 +i* 1.06063E-11| +| 18| 0.906777 +i* 0.4216| 0.999995|-1.38745E-11 +i* 5.33384E-12| +| 19| 0.919557 +i* 0.392944| 0.999995| 4.13796E-11 +i*-2.48189E-11| +| 20| 0.931433 +i* 0.363901| 0.999995| 4.93219E-11 +i*-2.82651E-11| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 0.999995 +300000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^400000 + (-10 +i*0)*x^600000 + (1 +i*0)*x^1000000 + +(-40000 +i*0)*x^399999 + (-6E+06 +i*0)*x^599999 + (1E+06 +i*0)*x^999999 + +zone limite de 'log-exp' 1.00035 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 0 dimgrid2 1954 start 0 size 500096 +gpu 1 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 1 dimgrid2 1954 start 500096 size 500096 +gpu 0 iter : 1 Arret : 0.000661333 s/iter 36.538739 +gpu 0 iter : 2 Arret : 0.00112864 s/iter 36.545395 +gpu 0 iter : 3 Arret : 0.00370767 s/iter 36.541300 +gpu 0 iter : 4 Arret : 0.00748235 s/iter 37.223998 +gpu 0 iter : 5 Arret : 0.0147148 s/iter 37.021293 +gpu 0 iter : 6 Arret : 0.0212816 s/iter 37.146418 +gpu 0 iter : 7 Arret : 0.00895178 s/iter 37.219267 +gpu 0 iter : 8 Arret : 0.00887668 s/iter 37.316626 +gpu 0 iter : 9 Arret : 0.00504713 s/iter 36.647500 +gpu 0 iter : 10 Arret : 0.00709815 s/iter 37.285606 +gpu 0 iter : 11 Arret : 0.00694487 s/iter 36.891551 +gpu 0 iter : 12 Arret : 0.00243476 s/iter 36.546690 +gpu 0 iter : 13 Arret : 0.00268555 s/iter 36.502800 +gpu 0 iter : 14 Arret : 0.000904871 s/iter 36.508349 +gpu 0 iter : 15 Arret : 0.0005848 s/iter 36.503946 +gpu 0 iter : 16 Arret : 8.64186E-05 s/iter 36.503619 +gpu 0 iter : 17 Arret : 8.33778E-05 s/iter 36.511641 +gpu 0 iter : 18 Arret : 1.10486E-05 s/iter 36.503510 +gpu 0 iter : 19 Arret : 1.76382E-05 s/iter 36.534320 +gpu 0 iter : 20 Arret : 1.2926E-06 s/iter 36.537729 +gpu 0 iter : 21 Arret : 5.95413E-09 s/iter 36.503894 +gpu 0 iter : 22 Arret : 1.88485E-11 s/iter 36.540363 +gpu 0 iter : 23 Arret : 5.96427E-14 s/iter 36.541307 +temps : 850.208 seconde(s) +Nb iterations : 23 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.65132E-08 +Stabilite : 5.96427E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841468| 0.999996| 5.07216E-12 +i* 6.41236E-12| +| 2| 0.529701 +i* 0.84818| 0.999996|-4.61853E-13 +i*-4.17888E-12| +| 3| 0.524361 +i* 0.851491| 0.999996|-2.47296E-11 +i* 1.78327E-11| +| 4| 0.51901 +i* 0.854764| 0.999996| 9.45599E-12 +i* 2.07434E-11| +| 5| 0.513629 +i* 0.858008| 0.999996| 2.32483E-11 +i* 6.70747E-12| +| 6| 0.508237 +i* 0.861213| 0.999996|-1.34339E-11 +i* 9.87854E-12| +| 7| 0.502825 +i* 0.864384| 0.999996|-3.18459E-11 +i* 7.64744E-12| +| 8| 0.497384 +i* 0.867526| 0.999996| 1.87346E-11 +i* 4.7471E-11| +| 9| 0.491932 +i* 0.870629| 0.999996|-1.74121E-11 +i*-2.86359E-11| +| 10| 0.486452 +i* 0.873703| 0.999996| 3.0312E-11 +i* 1.02214E-11| +| 11| 0.480962 +i* 0.876737| 0.999996| 1.81546E-11 +i* 8.04012E-12| +| 12| 0.475453 +i* 0.879736| 0.999996| 3.09861E-11 +i* 4.093E-12| +| 13| 0.469917 +i* 0.882706| 0.999996|-1.29106E-11 +i*-2.31489E-11| +| 14| 0.46437 +i* 0.885637| 0.999996| 1.38481E-11 +i* -1.517E-11| +| 15| 0.458797 +i* 0.888537| 0.999996| 2.60997E-11 +i*-9.69844E-12| +| 16| 0.453214 +i* 0.891397| 0.999996| 2.45506E-11 +i* 3.1726E-11| +| 17| 0.447614 +i* 0.894223| 0.999996|-1.08491E-12 +i*-2.12277E-11| +| 18| 0.441986 +i* 0.897017| 0.999996| 2.72476E-11 +i* 3.22485E-11| +| 19| 0.436351 +i* 0.899772| 0.999996|-1.24334E-11 +i*-2.66317E-11| +| 20| 0.430689 +i* 0.902496| 0.999996| 2.73914E-12 +i* 2.25153E-11| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 0.999996 +400000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^700000 + (1 +i*0)*x^1200000 + +(-50000 +i*0)*x^499999 + (-7E+06 +i*0)*x^699999 + (1.2E+06 +i*0)*x^1199999 + +zone limite de 'log-exp' 1.0003 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 0 dimgrid2 2344 start 0 size 600064 +gpu 1 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 1 dimgrid2 2344 start 600064 size 600064 +gpu 0 iter : 1 Arret : 0.00780904 s/iter 52.957678 +gpu 0 iter : 2 Arret : 0.698753 s/iter 54.370408 +gpu 0 iter : 3 Arret : 0.512229 s/iter 55.903856 +gpu 0 iter : 4 Arret : 0.256495 s/iter 56.546686 +gpu 0 iter : 5 Arret : 0.481397 s/iter 56.384400 +gpu 0 iter : 6 Arret : 0.892443 s/iter 56.641431 +gpu 0 iter : 7 Arret : 1.58519 s/iter 56.603728 +gpu 0 iter : 8 Arret : 1.00461 s/iter 56.787414 +gpu 0 iter : 9 Arret : 0.667954 s/iter 56.936636 +gpu 0 iter : 10 Arret : 1.69048 s/iter 56.433809 +gpu 0 iter : 11 Arret : 0.673973 s/iter 56.247309 +gpu 0 iter : 12 Arret : 0.286904 s/iter 55.583712 +gpu 0 iter : 13 Arret : 0.809155 s/iter 54.972406 +gpu 0 iter : 14 Arret : 1.04967 s/iter 54.200475 +gpu 0 iter : 15 Arret : 0.767419 s/iter 54.073912 +gpu 0 iter : 16 Arret : 1.25055 s/iter 53.969523 +gpu 0 iter : 17 Arret : 0.313555 s/iter 53.619940 +gpu 0 iter : 18 Arret : 0.0612844 s/iter 53.103551 +gpu 0 iter : 19 Arret : 0.0812813 s/iter 53.087654 +gpu 0 iter : 20 Arret : 0.0798413 s/iter 52.895378 +gpu 0 iter : 21 Arret : 0.0193508 s/iter 52.929617 +gpu 0 iter : 22 Arret : 0.0112127 s/iter 52.923694 +gpu 0 iter : 23 Arret : 0.00926876 s/iter 52.906420 +gpu 0 iter : 24 Arret : 0.00234025 s/iter 52.924598 +gpu 0 iter : 25 Arret : 0.000902467 s/iter 52.922805 +gpu 0 iter : 26 Arret : 2.88058E-05 s/iter 52.927734 +gpu 0 iter : 27 Arret : 3.35406E-07 s/iter 52.973958 +gpu 0 iter : 28 Arret : 1.39702E-09 s/iter 52.974028 +gpu 0 iter : 29 Arret : 8.02785E-12 s/iter 52.966681 +gpu 0 iter : 30 Arret : 1.1441E-13 s/iter 52.951515 +temps : 1631.66 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.74574E-08 +Stabilite : 2.21335E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540304 +i* 0.841466| 0.999997| 3.08649E-11 +i* 2.05843E-11| +| 2| 0.513629 +i* 0.858008| 0.999997| 3.02357E-11 +i* 3.41858E-11| +| 3| 0.486451 +i* 0.873713| 1| 1.95054E-09 +i* 6.77633E-10| +| 4| 0.458805 +i* 0.888533| 0.999997| 1.78773E-11 +i* 1.55684E-11| +| 5| 0.43071 +i* 0.902487| 0.999997|-9.50928E-12 +i*-1.85143E-11| +| 6| 0.402126 +i* 0.915589| 1| 2.50282E-09 +i*-6.10471E-09| +| 7| 0.3732 +i* 0.927747| 0.999997| -2.5707E-11 +i* 3.11093E-13| +| 8| 0.3439 +i* 0.939003| 0.999997|-1.12714E-11 +i* 1.5453E-11| +| 9| 0.314261 +i* 0.949333| 0.999997| 1.93628E-11 +i* 2.50909E-11| +| 10| 0.284313 +i* 0.958728| 0.999997| 2.69426E-11 +i* 2.77974E-11| +| 11| 0.254084 +i* 0.967179| 0.999997| 1.5277E-11 +i* 4.73027E-12| +| 12| 0.223605 +i* 0.974676| 0.999997| -8.1017E-11 +i*-3.77299E-11| +| 13| 0.192909 +i* 0.981221| 1|-1.95729E-09 +i* 4.84549E-09| +| 14| 0.162017 +i* 0.986785| 0.999997| 4.59321E-12 +i*-4.42106E-13| +| 15| 0.130967 +i* 0.991391| 1|-1.93729E-10 +i*-4.06442E-10| +| 16| 0.0998077 +i* 0.995003| 0.999997| -4.5103E-11 +i*-6.66658E-12| +| 17| 0.0685225 +i* 0.997646| 0.999997| 2.33641E-11 +i* 2.51787E-12| +| 18| 0.0371504 +i* 0.999314| 1|-3.18728E-10 +i*-2.97119E-09| +| 19| 0.00578048 +i* 0.99998| 0.999997| 3.46787E-11 +i* 1.94857E-13| +| 20| -0.0256056 +i* 0.999669| 0.999997| 2.01068E-11 +i*-1.22213E-12| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 0.999997 +500000 racines de module = 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^600000 + (-10 +i*0)*x^800000 + (1 +i*0)*x^1400000 + +(-60000 +i*0)*x^599999 + (-8E+06 +i*0)*x^799999 + (1.4E+06 +i*0)*x^1399999 + +zone limite de 'log-exp' 1.00025 +CPU thread 1 (of 2) uses CUDA device 1 +CPU thread 0 (of 2) uses CUDA device 0 +gpu 1 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 1 dimgrid2 2735 start 700032 size 700032 +gpu 0 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 0 dimgrid2 2735 start 0 size 700032 +gpu 0 iter : 1 Arret : 0.00527111 s/iter 71.308499 +gpu 0 iter : 2 Arret : 0.172644 s/iter 72.713414 +gpu 0 iter : 3 Arret : 0.69639 s/iter 72.958242 +gpu 0 iter : 4 Arret : 1.18582 s/iter 75.255529 +gpu 0 iter : 5 Arret : 0.29345 s/iter 76.866618 +gpu 0 iter : 6 Arret : 0.163076 s/iter 77.369587 +gpu 0 iter : 7 Arret : 1.88246 s/iter 78.558083 +gpu 0 iter : 8 Arret : 1.71023 s/iter 77.826546 +gpu 0 iter : 9 Arret : 1.23231 s/iter 77.642649 +gpu 0 iter : 10 Arret : 0.367931 s/iter 79.759527 +gpu 0 iter : 11 Arret : 1.0997 s/iter 78.755024 +gpu 0 iter : 12 Arret : 2.11197 s/iter 77.725889 +gpu 0 iter : 13 Arret : 0.848296 s/iter 76.267112 +gpu 0 iter : 14 Arret : 0.433295 s/iter 75.435820 +gpu 0 iter : 15 Arret : 0.817759 s/iter 74.683488 +gpu 0 iter : 16 Arret : 0.767209 s/iter 74.057568 +gpu 0 iter : 17 Arret : 0.573024 s/iter 73.720984 +gpu 0 iter : 18 Arret : 0.597274 s/iter 73.499266 +gpu 0 iter : 19 Arret : 0.303085 s/iter 72.741656 +gpu 0 iter : 20 Arret : 0.180774 s/iter 72.806213 +gpu 0 iter : 21 Arret : 0.0722903 s/iter 72.559828 +gpu 0 iter : 22 Arret : 0.146427 s/iter 72.512488 +gpu 0 iter : 23 Arret : 0.129512 s/iter 72.128992 +gpu 0 iter : 24 Arret : 0.0402274 s/iter 71.576335 +gpu 0 iter : 25 Arret : 0.0124264 s/iter 71.526353 +gpu 0 iter : 26 Arret : 0.00203683 s/iter 71.463273 +gpu 0 iter : 27 Arret : 0.000373803 s/iter 71.462289 +gpu 0 iter : 28 Arret : 7.43881E-07 s/iter 71.336304 +gpu 0 iter : 29 Arret : 9.02153E-09 s/iter 71.333249 +gpu 0 iter : 30 Arret : 1.20401E-10 s/iter 71.481701 +gpu 0 iter : 31 Arret : 1.60504E-12 s/iter 71.339739 +gpu 0 iter : 32 Arret : 2.14019E-14 s/iter 71.437524 +temps : 2371.12 seconde(s) +Nb iterations : 32 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.65661E-08 +Stabilite : 5.97875E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841469| 0.999997| 5.65794E-11 +i*-4.66756E-12| +| 2| 0.513623 +i* 0.858013| 0.999997|-2.15776E-11 +i*-2.98557E-11| +| 3| -0.52703 +i* -0.849843| 0.999997|-8.72191E-12 +i* 2.97079E-11| +| 4| 0.486439 +i* 0.873711| 0.999997| 5.60277E-11 +i* 4.36779E-11| +| 5| -0.500096 +i* -0.865967| 0.999997| 3.56147E-11 +i*-3.12713E-11| +| 6| 0.458776 +i* 0.888549| 0.999997|-1.89702E-11 +i* 4.08274E-12| +| 7| -0.472669 +i* -0.881237| 0.999997|-1.66496E-11 +i*-3.61498E-11| +| 8| 0.430661 +i* 0.902511| 0.999997|-1.60558E-11 +i*-1.29949E-11| +| 9| -0.444791 +i* -0.895631| 0.999997| 3.68259E-11 +i* 1.36002E-12| +| 10| 0.402136 +i* 0.915577| 0.999997| 6.5834E-12 +i* -1.3935E-11| +| 11| -0.416432 +i* -0.909164| 0.999997| 1.97816E-11 +i* 3.10848E-11| +| 12| 0.373171 +i* 0.927759| 0.999997|-2.17995E-11 +i*-2.96867E-12| +| 13| -0.387698 +i* -0.921783| 0.999997|-1.86324E-11 +i* -4.6545E-11| +| 14| 0.343875 +i* 0.939012| 0.999997| 3.84962E-11 +i* 2.59646E-11| +| 15| -0.358575 +i* -0.933498| 0.999997| 8.13599E-11 +i*-1.42233E-11| +| 16| 0.314233 +i* 0.949343| 0.999997| 3.86503E-11 +i* 2.08775E-11| +| 17| -0.329098 +i* -0.944293| 0.999997|-1.57903E-11 +i* 2.05052E-11| +| 18| 0.284281 +i* 0.958738| 0.999997| 2.51592E-11 +i* 2.09243E-11| +| 19| -0.299297 +i* -0.954157| 0.999997| 5.03608E-12 +i* 1.70503E-11| +| 20| 0.254048 +i* 0.967189| 0.999997|-2.81228E-11 +i*-1.66302E-11| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 0.999997 +600000 racines de module = 1 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140099: line 23: 12958 Segmentation fault (core dumped) ./template -r -i 900000 700000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140099: line 24: 12962 Segmentation fault (core dumped) ./template -r -i 1000000 800000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140099: line 25: 12964 Segmentation fault (core dumped) ./template -r -i 1500000 500000 diff --git a/Simulations/sparse_openmp/sparse_openmp_2GPU.sge b/Simulations/sparse_openmp/sparse_openmp_2GPU.sge new file mode 100755 index 0000000..769c2b7 --- /dev/null +++ b/Simulations/sparse_openmp/sparse_openmp_2GPU.sge @@ -0,0 +1,27 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=2 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -pe openmp 2 +#$ -V +#$ -cwd +#$ -N sparse_openmp_2GPU + +module load gcc/4.9.0 +module load cuda/7.0 +export OMP_NUM_THREADS=2 + +./template -r -i 60000 40000 +./template -r -i 150000 50000 +./template -r -i 250000 150000 +./template -r -i 350000 250000 +./template -r -i 500000 300000 +./template -r -i 600000 400000 +./template -r -i 700000 500000 +./template -r -i 800000 600000 +./template -r -i 900000 700000 +./template -r -i 1000000 800000 +./template -r -i 1500000 500000 + + diff --git a/Simulations/sparse_openmp/sparse_openmp_3GPU.o140098 b/Simulations/sparse_openmp/sparse_openmp_3GPU.o140098 new file mode 100644 index 0000000..2aea52b --- /dev/null +++ b/Simulations/sparse_openmp/sparse_openmp_3GPU.o140098 @@ -0,0 +1,602 @@ +REMAINING: 3 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^40000 + (-10 +i*0)*x^60000 + (1 +i*0)*x^100000 + +(-4000 +i*0)*x^39999 + (-600000 +i*0)*x^59999 + (100000 +i*0)*x^99999 + +zone limite de 'log-exp' 1.00356 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 0 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 0 dimgrid2 131 start 0 size 33365 +gpu 1 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 1 dimgrid2 131 start 33365 size 33365 +gpu 2 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 2 dimgrid2 131 start 66730 size 33365 +gpu 0 iter : 1 Arret : 0.00638376 s/iter 0.326852 +gpu 0 iter : 2 Arret : 0.00780969 s/iter 0.399828 +gpu 0 iter : 3 Arret : 0.00239395 s/iter 0.326756 +gpu 0 iter : 4 Arret : 0.00316529 s/iter 0.326768 +gpu 0 iter : 5 Arret : 0.0038084 s/iter 0.326767 +gpu 0 iter : 6 Arret : 0.00482452 s/iter 0.326696 +gpu 0 iter : 7 Arret : 0.00928999 s/iter 0.326751 +gpu 0 iter : 8 Arret : 0.0101647 s/iter 0.326710 +gpu 0 iter : 9 Arret : 0.0111077 s/iter 0.326857 +gpu 0 iter : 10 Arret : 0.00655022 s/iter 0.326801 +gpu 0 iter : 11 Arret : 0.00316276 s/iter 0.326810 +gpu 0 iter : 12 Arret : 0.000516233 s/iter 0.326609 +gpu 0 iter : 13 Arret : 0.00040416 s/iter 0.326572 +gpu 0 iter : 14 Arret : 0.000177079 s/iter 0.326480 +gpu 0 iter : 15 Arret : 8.53367E-05 s/iter 0.326486 +gpu 0 iter : 16 Arret : 4.34291E-05 s/iter 0.326528 +gpu 0 iter : 17 Arret : 2.94612E-06 s/iter 0.326471 +gpu 0 iter : 18 Arret : 4.24038E-08 s/iter 0.326469 +gpu 0 iter : 19 Arret : 6.31898E-10 s/iter 0.326431 +gpu 0 iter : 20 Arret : 9.41384E-12 s/iter 0.326448 +gpu 0 iter : 21 Arret : 1.40182E-13 s/iter 0.326484 +temps : 8.00955 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 8.10777E-09 +Stabilite : 1.57015E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54036 +i* 0.841503| 1.00006|-5.00602E-11 +i* 9.0853E-12| +| 2| -0.113164 +i* 0.993538| 0.999962|-4.34919E-12 +i* 9.60242E-13| +| 3| -0.226885 +i* -0.973981| 1.00006|-5.81993E-10 +i*-4.18547E-10| +| 4| -0.715763 +i* 0.698289| 0.999962| 9.11271E-13 +i* 2.47219E-12| +| 5| 0.439922 +i* -0.897993| 0.999962|-3.49498E-13 +i* 1.66432E-12| +| 6| -0.996122 +i* 0.0886386| 1.00006| 4.72785E-10 +i* 4.13616E-11| +| 7| 0.908546 +i* -0.417692| 0.999962| 4.78506E-13 +i* 1.54377E-13| +| 8| -0.827813 +i* -0.560935| 0.999962| 9.76996E-13 +i*-2.04309E-12| +| 9| 0.968129 +i* 0.250682| 1.00006|-2.31715E-10 +i* 1.34848E-10| +| 10| -0.286842 +i* -0.958038| 1.00006|-5.93554E-10 +i*-2.45345E-10| +| 11| 0.591653 +i* 0.806145| 0.999962|-9.87654E-13 +i*-3.03635E-12| +| 12| -0.0511836 +i* 0.998651| 0.999962|-2.22622E-12 +i*-3.69013E-14| +| 13| -0.67097 +i* 0.741432| 0.999962|-8.03801E-14 +i*-1.68204E-12| +| 14| 0.383249 +i* -0.923603| 0.999962|-1.29119E-12 +i*-1.37426E-12| +| 15| -0.988685 +i* 0.15039| 1.00006|-1.61051E-10 +i* 7.18515E-11| +| 16| 0.880824 +i* -0.473363| 0.999962|-4.03455E-13 +i* 2.85139E-12| +| 17| -0.861082 +i* -0.508391| 0.999962| 1.02962E-12 +i*-4.51911E-12| +| 18| 0.98184 +i* 0.190015| 1.00006| -8.9615E-10 +i* 1.84549E-11| +| 19| -0.345842 +i* -0.938354| 1.00006| 1.38421E-10 +i*-2.31696E-10| +| 20| 0.640621 +i* 0.767807| 0.999962|-6.98774E-13 +i* 1.13798E-12| ++---+----------------------------+------------+----------------------------+ +40000 racines de module = 1.00006 +60000 racines de module = 0.999962 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^50000 + (-10 +i*0)*x^150000 + (1 +i*0)*x^200000 + +(-5000 +i*0)*x^49999 + (-1.5E+06 +i*0)*x^149999 + (200000 +i*0)*x^199999 + +zone limite de 'log-exp' 1.00178 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 0 (of 3) uses CUDA device 0 +gpu 1 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 1 dimgrid2 261 start 66730 size 66730 +gpu 0 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 0 dimgrid2 261 start 0 size 66730 +gpu 2 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 2 dimgrid2 261 start 133460 size 66730 +gpu 0 iter : 1 Arret : 0.000229669 s/iter 1.096870 +gpu 0 iter : 2 Arret : 0.00021193 s/iter 1.097026 +gpu 0 iter : 3 Arret : 0.000280313 s/iter 1.096954 +gpu 0 iter : 4 Arret : 0.000636926 s/iter 1.096899 +gpu 0 iter : 5 Arret : 0.00105388 s/iter 1.096829 +gpu 0 iter : 6 Arret : 0.0149052 s/iter 1.096638 +gpu 0 iter : 7 Arret : 0.0123684 s/iter 1.096797 +gpu 0 iter : 8 Arret : 0.0421817 s/iter 1.098043 +gpu 0 iter : 9 Arret : 0.0899445 s/iter 1.098654 +gpu 0 iter : 10 Arret : 0.204522 s/iter 1.186313 +gpu 0 iter : 11 Arret : 2.97201 s/iter 1.218384 +gpu 0 iter : 12 Arret : 0.648253 s/iter 1.218710 +gpu 0 iter : 13 Arret : 1.88772 s/iter 1.241862 +gpu 0 iter : 14 Arret : 1.33785 s/iter 1.208066 +gpu 0 iter : 15 Arret : 1.70034 s/iter 1.098449 +gpu 0 iter : 16 Arret : 1.16245 s/iter 1.197714 +gpu 0 iter : 17 Arret : 2.06315 s/iter 1.228122 +gpu 0 iter : 18 Arret : 1.22433 s/iter 1.198366 +gpu 0 iter : 19 Arret : 0.795342 s/iter 1.228114 +gpu 0 iter : 20 Arret : 0.622909 s/iter 1.095861 +gpu 0 iter : 21 Arret : 1.12395 s/iter 1.224956 +gpu 0 iter : 22 Arret : 1.99041 s/iter 1.227156 +gpu 0 iter : 23 Arret : 1.15739 s/iter 1.209773 +gpu 0 iter : 24 Arret : 0.455675 s/iter 1.226888 +gpu 0 iter : 25 Arret : 0.680625 s/iter 1.097847 +gpu 0 iter : 26 Arret : 0.577238 s/iter 1.095693 +gpu 0 iter : 27 Arret : 0.0687706 s/iter 1.095867 +gpu 0 iter : 28 Arret : 0.0224681 s/iter 1.096036 +gpu 0 iter : 29 Arret : 0.002804 s/iter 1.095993 +gpu 0 iter : 30 Arret : 6.05493E-06 s/iter 1.095754 +gpu 0 iter : 31 Arret : 3.11042E-10 s/iter 1.095829 +gpu 0 iter : 32 Arret : 3.1096E-14 s/iter 1.096050 +temps : 37.8394 seconde(s) +Nb iterations : 32 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.30431E-05 +Stabilite : 3.1096E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540303 +i* 0.841453| 0.999985| 1.08703E-11 +i*-2.49217E-12| +| 2| -0.837195 +i* 0.546877| 0.999985| -5.4492E-12 +i* 1.09163E-12| +| 3| -0.553418 +i* -0.832885| 0.999985| -1.9722E-12 +i*-7.40397E-12| +| 4| 0.828599 +i* -0.559925| 1.00005|-7.54521E-09 +i* 1.47059E-08| +| 5| -0.8197 +i* 0.572767| 0.999985|-4.21663E-13 +i* -2.8616E-12| +| 6| -0.57917 +i* -0.815188| 0.999985|-5.13034E-12 +i*-1.52645E-12| +| 7| 0.810626 +i* -0.585537| 0.999985| 8.64808E-12 +i* 7.46794E-12| +| 8| 0.59177 +i* 0.806164| 1.00005|-6.74238E-09 +i* 4.40492E-09| +| 9| -0.801529 +i* 0.598033| 1.00005| 7.19885E-09 +i* 8.43319E-09| +| 10| -0.604356 +i* -0.796695| 0.999985|-1.64091E-13 +i* 1.59084E-12| +| 11| 0.791937 +i* -0.610578| 0.999985| 6.0707E-13 +i* 1.52922E-12| +| 12| 0.616763 +i* 0.78713| 0.999985|-4.48042E-12 +i* -2.6295E-12| +| 13| -0.782301 +i* 0.622877| 0.999985|-2.15827E-12 +i*-6.27114E-12| +| 14| -0.628894 +i* -0.777551| 1.00005| 2.29838E-09 +i* 1.59417E-08| +| 15| 0.772474 +i* -0.635023| 0.999985| 1.54783E-11 +i*-1.81338E-12| +| 16| 0.641054 +i* 0.767476| 0.999985|-3.47633E-12 +i* 1.20617E-11| +| 17| -0.762458 +i* 0.647014| 0.999985|-7.74447E-12 +i* 7.566E-12| +| 18| -0.652967 +i* -0.757366| 0.999985|-6.31406E-12 +i* 8.49495E-12| +| 19| 0.752302 +i* -0.658888| 1.00005| 3.99107E-09 +i* 1.02117E-08| +| 20| 0.66472 +i* 0.747072| 0.999985|-1.93379E-12 +i*-1.29726E-11| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 0.999985 +50000 racines de module = 1.00005 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^150000 + (-10 +i*0)*x^250000 + (1 +i*0)*x^400000 + +(-15000 +i*0)*x^149999 + (-2.5E+06 +i*0)*x^249999 + (400000 +i*0)*x^399999 + +zone limite de 'log-exp' 1.00089 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 0 (of 3) uses CUDA device 0 +gpu 1 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 1 dimgrid2 521 start 133376 size 133376 +gpu 0 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 0 dimgrid2 521 start 0 size 133376 +gpu 2 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 2 dimgrid2 521 start 266752 size 133376 +gpu 0 iter : 1 Arret : 0.00053336 s/iter 4.015433 +gpu 0 iter : 2 Arret : 0.00165478 s/iter 4.015274 +gpu 0 iter : 3 Arret : 0.00149659 s/iter 4.015225 +gpu 0 iter : 4 Arret : 0.00476307 s/iter 4.014142 +gpu 0 iter : 5 Arret : 0.0270497 s/iter 4.020618 +gpu 0 iter : 6 Arret : 0.0269319 s/iter 4.340327 +gpu 0 iter : 7 Arret : 0.0180523 s/iter 4.298465 +gpu 0 iter : 8 Arret : 0.0146534 s/iter 4.308899 +gpu 0 iter : 9 Arret : 0.00619736 s/iter 4.011731 +gpu 0 iter : 10 Arret : 0.00299981 s/iter 4.010855 +gpu 0 iter : 11 Arret : 0.00111873 s/iter 4.009952 +gpu 0 iter : 12 Arret : 0.000851809 s/iter 4.011669 +gpu 0 iter : 13 Arret : 0.000757841 s/iter 4.011889 +gpu 0 iter : 14 Arret : 0.000509989 s/iter 4.011347 +gpu 0 iter : 15 Arret : 0.000667055 s/iter 4.011093 +gpu 0 iter : 16 Arret : 2.71105E-05 s/iter 4.000315 +gpu 0 iter : 17 Arret : 8.00906E-06 s/iter 3.991624 +gpu 0 iter : 18 Arret : 1.99192E-07 s/iter 3.991746 +gpu 0 iter : 19 Arret : 3.11567E-09 s/iter 3.991734 +gpu 0 iter : 20 Arret : 4.89263E-11 s/iter 3.991803 +gpu 0 iter : 21 Arret : 7.68172E-13 s/iter 3.991754 +temps : 86.1208 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.49185E-08 +Stabilite : 7.68172E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.84144| 0.999991| 6.97609E-12 +i* 5.61207E-12| +| 2| -0.998329 +i* 0.057622| 0.999991| 4.43912E-12 +i* 1.27665E-12| +| 3| 0.43989 +i* -0.898041| 0.999991|-2.08855E-12 +i*-1.75276E-12| +| 4| -0.996033 +i* 0.0888768| 0.999991|-3.15592E-12 +i* 1.17456E-12| +| 5| 0.411533 +i* -0.911385| 0.999991|-2.45048E-12 +i* 4.6238E-12| +| 6| 0.59196 +i* 0.805956| 0.999991| 5.24358E-13 +i*-8.53073E-12| +| 7| -0.992759 +i* 0.120044| 0.999991| 2.58804E-12 +i* 2.47274E-12| +| 8| 0.382796 +i* -0.923823| 0.999991| 1.11042E-11 +i*-9.27687E-12| +| 9| 0.616925 +i* 0.78701| 0.999991| 4.27514E-12 +i*-1.13966E-11| +| 10| -0.98851 +i* 0.151094| 0.999991|-1.29017E-11 +i*-4.43427E-12| +| 11| 0.35366 +i* -0.935364| 0.999991|-1.92664E-11 +i* 1.19958E-11| +| 12| 0.641283 +i* 0.767292| 0.999991| 1.73468E-11 +i*-3.74729E-12| +| 13| -0.98329 +i* 0.181995| 0.999991|-6.62759E-12 +i*-5.46796E-12| +| 14| 0.324176 +i* -0.945987| 0.999991| 1.53594E-11 +i*-1.57324E-12| +| 15| 0.665012 +i* 0.746821| 0.999991| 5.27178E-12 +i*-4.27913E-12| +| 16| -0.977104 +i* 0.212717| 0.999991|-1.01148E-11 +i* 2.41479E-12| +| 17| 0.294374 +i* -0.955681| 0.999991| -1.2063E-11 +i* 1.32238E-11| +| 18| 0.688087 +i* 0.725616| 0.999991| 6.67011E-12 +i* 1.57173E-11| +| 19| -0.969965 +i* 0.243206| 0.999991| 6.88072E-12 +i* 3.20268E-13| +| 20| 0.264283 +i* -0.964436| 0.999991| 2.5573E-11 +i*-6.45539E-12| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 0.999991 +150000 racines de module = 1.00002 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^250000 + (-10 +i*0)*x^350000 + (1 +i*0)*x^600000 + +(-25000 +i*0)*x^249999 + (-3.5E+06 +i*0)*x^349999 + (600000 +i*0)*x^599999 + +zone limite de 'log-exp' 1.00059 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 782 start 200021 size 200021 +gpu 2 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 2 dimgrid2 782 start 400042 size 200021 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 782 start 0 size 200021 +gpu 0 iter : 1 Arret : 0.00574299 s/iter 9.047838 +gpu 0 iter : 2 Arret : 0.00960381 s/iter 9.043639 +gpu 0 iter : 3 Arret : 0.130996 s/iter 9.471525 +gpu 0 iter : 4 Arret : 0.142079 s/iter 9.198199 +gpu 0 iter : 5 Arret : 0.0868349 s/iter 9.506055 +gpu 0 iter : 6 Arret : 0.0882721 s/iter 9.145065 +gpu 0 iter : 7 Arret : 0.114689 s/iter 9.172845 +gpu 0 iter : 8 Arret : 0.108656 s/iter 9.193791 +gpu 0 iter : 9 Arret : 0.0356399 s/iter 9.170752 +gpu 0 iter : 10 Arret : 0.0134072 s/iter 9.594206 +gpu 0 iter : 11 Arret : 0.00832588 s/iter 9.158565 +gpu 0 iter : 12 Arret : 0.00682235 s/iter 9.135471 +gpu 0 iter : 13 Arret : 0.00415856 s/iter 9.143664 +gpu 0 iter : 14 Arret : 0.00311193 s/iter 9.065571 +gpu 0 iter : 15 Arret : 0.000707097 s/iter 9.044745 +gpu 0 iter : 16 Arret : 0.000778409 s/iter 9.042087 +gpu 0 iter : 17 Arret : 0.000667704 s/iter 9.043931 +gpu 0 iter : 18 Arret : 9.33212E-06 s/iter 9.043636 +gpu 0 iter : 19 Arret : 7.71387E-08 s/iter 9.041264 +gpu 0 iter : 20 Arret : 1.09443E-09 s/iter 9.041736 +gpu 0 iter : 21 Arret : 1.56107E-11 s/iter 9.047621 +gpu 0 iter : 22 Arret : 2.22664E-13 s/iter 9.046678 +temps : 202.419 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.53549E-08 +Stabilite : 2.22043E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540302 +i* 0.841463| 0.999993| 8.34199E-12 +i* -1.9051E-11| +| 2| -0.553438 +i* -0.832883| 0.999993|-2.10654E-12 +i*-2.55273E-11| +| 3| -0.579282 +i* -0.815119| 0.999993| 1.33613E-11 +i*-1.98701E-11| +| 4| 0.592014 +i* 0.805919| 0.999993|-3.98037E-12 +i* 9.55808E-12| +| 5| -0.604557 +i* -0.796554| 0.999993|-2.82974E-12 +i* 9.99473E-12| +| 6| 0.61698 +i* 0.78697| 0.999993| 9.01823E-12 +i*-5.69156E-12| +| 7| -0.629237 +i* -0.777205| 0.999993|-2.92122E-12 +i*-4.85867E-12| +| 8| 0.641354 +i* 0.767237| 0.999993|-1.64209E-11 +i* 1.12904E-12| +| 9| -0.653299 +i* -0.757092| 0.999993|-8.22453E-13 +i* 2.82818E-12| +| 10| 0.665096 +i* 0.746749| 0.999993| -1.2145E-11 +i* 1.89129E-11| +| 11| -0.676717 +i* -0.736234| 0.999993|-1.26079E-11 +i*-1.25073E-11| +| 12| 0.688185 +i* 0.725526| 0.999993|-4.43978E-12 +i*-2.31382E-11| +| 13| -0.699466 +i* -0.714679| 1.00001| 3.92343E-10 +i*-3.02623E-09| +| 14| 0.710597 +i* 0.70359| 0.999993| 1.28564E-11 +i* 1.56626E-11| +| 15| -0.721517 +i* -0.69241| 1.00001| 2.88447E-09 +i* 3.69506E-09| +| 16| 0.73231 +i* 0.680962| 0.999993|-5.73186E-12 +i* 1.14335E-11| +| 17| -0.742904 +i* -0.669389| 0.999993|-7.78222E-12 +i* 1.50098E-11| +| 18| 0.7533 +i* 0.657691| 1.00001| 1.64587E-09 +i*-3.03669E-09| +| 19| -0.76354 +i* -0.64575| 0.999993| 2.24043E-11 +i*-1.30496E-12| +| 20| 0.773539 +i* 0.633763| 1.00001| 5.39271E-09 +i*-2.77636E-09| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 0.999993 +250000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^300000 + (-10 +i*0)*x^500000 + (1 +i*0)*x^800000 + +(-30000 +i*0)*x^299999 + (-5E+06 +i*0)*x^499999 + (800000 +i*0)*x^799999 + +zone limite de 'log-exp' 1.00044 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 1042 start 266666 size 266666 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 1042 start 0 size 266666 +gpu 2 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 2 dimgrid2 1042 start 533332 size 266666 +gpu 0 iter : 1 Arret : 0.000985945 s/iter 15.851621 +gpu 0 iter : 2 Arret : 0.00155936 s/iter 15.788402 +gpu 0 iter : 3 Arret : 0.0129473 s/iter 15.851181 +gpu 0 iter : 4 Arret : 0.0558872 s/iter 16.300649 +gpu 0 iter : 5 Arret : 0.19954 s/iter 15.808251 +gpu 0 iter : 6 Arret : 0.377937 s/iter 15.879884 +gpu 0 iter : 7 Arret : 0.514814 s/iter 16.303367 +gpu 0 iter : 8 Arret : 0.338633 s/iter 15.914224 +gpu 0 iter : 9 Arret : 0.206607 s/iter 16.151496 +gpu 0 iter : 10 Arret : 0.138277 s/iter 16.399153 +gpu 0 iter : 11 Arret : 0.113953 s/iter 15.857365 +gpu 0 iter : 12 Arret : 0.0627751 s/iter 15.843953 +gpu 0 iter : 13 Arret : 0.0358213 s/iter 15.848470 +gpu 0 iter : 14 Arret : 0.0221421 s/iter 15.846627 +gpu 0 iter : 15 Arret : 0.00243723 s/iter 15.842171 +gpu 0 iter : 16 Arret : 0.000254217 s/iter 15.843580 +gpu 0 iter : 17 Arret : 0.000130358 s/iter 15.845033 +gpu 0 iter : 18 Arret : 0.00018532 s/iter 15.849105 +gpu 0 iter : 19 Arret : 1.35363E-05 s/iter 15.847663 +gpu 0 iter : 20 Arret : 2.14908E-09 s/iter 15.847042 +gpu 0 iter : 21 Arret : 4.62703E-12 s/iter 15.807436 +gpu 0 iter : 22 Arret : 9.97217E-15 s/iter 15.847751 +temps : 351.42 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 12.9528 +Stabilite : 7.80251E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841464| 0.999995|-5.33817E-12 +i*-1.81878E-11| +| 2| 0.592014 +i* 0.805922| 0.999995| 2.33948E-11 +i*-2.13005E-11| +| 3| 0.617007 +i* 0.786952| 0.999995| 4.23442E-11 +i* -6.2147E-12| +| 4| 0.641392 +i* 0.767207| 0.999995|-4.99742E-11 +i* 1.43873E-11| +| 5| 0.665146 +i* 0.746707| 0.999995| 2.02977E-11 +i* 7.48579E-12| +| 6| 0.688245 +i* 0.725472| 0.999995|-1.73153E-11 +i* -1.2656E-11| +| 7| 0.710667 +i* 0.703522| 0.999995| 3.69782E-12 +i* 2.3081E-12| +| 8| 0.732388 +i* 0.68088| 0.999995| 9.45355E-12 +i* 2.09024E-11| +| 9| 0.753381 +i* 0.657577| 0.999995| 1.7531E-11 +i*-4.02243E-11| +| 10| 0.77364 +i* 0.633618| 0.999995|-1.72307E-11 +i* 1.22723E-11| +| 11| 0.793138 +i* 0.609034| 0.999995| 3.89222E-12 +i* 2.21356E-11| +| 12| 0.811855 +i* 0.583851| 0.999995|-1.28337E-11 +i*-5.47207E-12| +| 13| 0.829772 +i* 0.558094| 0.999995|-1.63114E-11 +i*-1.64246E-12| +| 14| 0.846873 +i* 0.531786| 0.999995|-3.30451E-11 +i*-8.10676E-12| +| 15| 0.86314 +i* 0.504956| 0.999995|-4.00413E-12 +i* 3.04823E-11| +| 16| 0.878557 +i* 0.477628| 0.999995|-2.16493E-12 +i* 1.10533E-11| +| 17| 0.893104 +i* 0.449841| 0.999995|-1.48552E-11 +i* 1.06063E-11| +| 18| 0.906777 +i* 0.4216| 0.999995|-1.38745E-11 +i* 5.33384E-12| +| 19| 0.919557 +i* 0.392944| 0.999995| 4.13796E-11 +i*-2.48189E-11| +| 20| 0.931433 +i* 0.363901| 0.999995| 4.93219E-11 +i*-2.82651E-11| ++---+----------------------------+------------+----------------------------+ +499998 racines de module = 0.999995 +300000 racines de module = 1.00001 + 2 racines de module = 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^400000 + (-10 +i*0)*x^600000 + (1 +i*0)*x^1000000 + +(-40000 +i*0)*x^399999 + (-6E+06 +i*0)*x^599999 + (1E+06 +i*0)*x^999999 + +zone limite de 'log-exp' 1.00035 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 2 (of 3) uses CUDA device 2 +gpu 2 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 2 dimgrid2 1303 start 666794 size 333397 +gpu 1 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 1 dimgrid2 1303 start 333397 size 333397 +gpu 0 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 0 dimgrid2 1303 start 0 size 333397 +gpu 0 iter : 1 Arret : 0.0011104 s/iter 24.284964 +gpu 0 iter : 2 Arret : 0.00309979 s/iter 24.283383 +gpu 0 iter : 3 Arret : 0.247623 s/iter 24.789931 +gpu 0 iter : 4 Arret : 0.461817 s/iter 24.581195 +gpu 0 iter : 5 Arret : 0.334336 s/iter 25.044367 +gpu 0 iter : 6 Arret : 0.274486 s/iter 25.665034 +gpu 0 iter : 7 Arret : 0.159668 s/iter 26.197375 +gpu 0 iter : 8 Arret : 0.0519691 s/iter 25.694996 +gpu 0 iter : 9 Arret : 0.0269291 s/iter 25.673851 +gpu 0 iter : 10 Arret : 0.0602316 s/iter 25.604792 +gpu 0 iter : 11 Arret : 0.0619642 s/iter 24.773954 +gpu 0 iter : 12 Arret : 0.0234 s/iter 24.787706 +gpu 0 iter : 13 Arret : 0.0244077 s/iter 24.353884 +gpu 0 iter : 14 Arret : 0.00963063 s/iter 24.344876 +gpu 0 iter : 15 Arret : 0.00340716 s/iter 24.345219 +gpu 0 iter : 16 Arret : 0.000234823 s/iter 24.297435 +gpu 0 iter : 17 Arret : 0.000256334 s/iter 24.352140 +gpu 0 iter : 18 Arret : 0.000224052 s/iter 24.290971 +gpu 0 iter : 19 Arret : 0.000781478 s/iter 24.296445 +gpu 0 iter : 20 Arret : 0.000194356 s/iter 24.291281 +gpu 0 iter : 21 Arret : 2.40806E-07 s/iter 24.291827 +gpu 0 iter : 22 Arret : 3.31687E-09 s/iter 24.291690 +gpu 0 iter : 23 Arret : 4.67724E-11 s/iter 24.290907 +gpu 0 iter : 24 Arret : 6.59569E-13 s/iter 24.293931 +temps : 598.968 seconde(s) +Nb iterations : 24 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.52682E-07 +Stabilite : 6.59569E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841468| 0.999996| 5.07216E-12 +i* 6.41236E-12| +| 2| 0.529701 +i* 0.84818| 0.999996|-4.61853E-13 +i*-4.17888E-12| +| 3| 0.524361 +i* 0.851491| 0.999996|-2.47296E-11 +i* 1.78327E-11| +| 4| 0.519015 +i* 0.854772| 1.00001| 2.38413E-09 +i*-5.89917E-09| +| 5| 0.513629 +i* 0.858008| 0.999996| 2.32483E-11 +i* 6.70747E-12| +| 6| 0.508237 +i* 0.861213| 0.999996|-1.34339E-11 +i* 9.87854E-12| +| 7| 0.502825 +i* 0.864384| 0.999996|-3.18459E-11 +i* 7.64744E-12| +| 8| 0.497384 +i* 0.867526| 0.999996| 2.97429E-11 +i*-6.06626E-13| +| 9| 0.491942 +i* 0.870624| 0.999996| -1.9825E-11 +i*-1.52329E-11| +| 10| 0.486452 +i* 0.873703| 0.999996| 3.0312E-11 +i* 1.02214E-11| +| 11| 0.480962 +i* 0.876737| 0.999996|-3.09397E-11 +i*-1.68578E-11| +| 12| 0.475453 +i* 0.879736| 0.999996| 3.09861E-11 +i* 4.093E-12| +| 13| 0.469917 +i* 0.882706| 0.999996|-1.29106E-11 +i*-2.31489E-11| +| 14| 0.46438 +i* 0.885632| 0.999996| 1.33844E-11 +i*-1.06731E-12| +| 15| 0.458797 +i* 0.888537| 0.999996| 2.78862E-11 +i* 1.10441E-11| +| 16| 0.453214 +i* 0.891397| 0.999996| 2.45506E-11 +i* 3.1726E-11| +| 17| 0.447614 +i* 0.894223| 0.999996|-1.08491E-12 +i*-2.12277E-11| +| 18| 0.441986 +i* 0.897017| 0.999996| 2.72476E-11 +i* 3.22485E-11| +| 19| 0.436355 +i* 0.899781| 1.00001| 4.84598E-09 +i*-1.12092E-09| +| 20| 0.430689 +i* 0.902496| 0.999996|-1.25435E-11 +i* 3.86925E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 0.999996 +400000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^700000 + (1 +i*0)*x^1200000 + +(-50000 +i*0)*x^499999 + (-7E+06 +i*0)*x^699999 + (1.2E+06 +i*0)*x^1199999 + +zone limite de 'log-exp' 1.0003 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 0 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 0 dimgrid2 1563 start 0 size 400042 +gpu 1 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 1 dimgrid2 1563 start 400042 size 400042 +gpu 2 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 2 dimgrid2 1563 start 800084 size 400042 +gpu 0 iter : 1 Arret : 0.0129118 s/iter 35.194295 +gpu 0 iter : 2 Arret : 1.14226 s/iter 37.357952 +gpu 0 iter : 3 Arret : 1.41831 s/iter 37.472613 +gpu 0 iter : 4 Arret : 1.98712 s/iter 37.475866 +gpu 0 iter : 5 Arret : 0.777118 s/iter 37.323598 +gpu 0 iter : 6 Arret : 0.414132 s/iter 38.133114 +gpu 0 iter : 7 Arret : 0.596053 s/iter 38.249814 +gpu 0 iter : 8 Arret : 0.923957 s/iter 38.214227 +gpu 0 iter : 9 Arret : 1.37764 s/iter 38.802357 +gpu 0 iter : 10 Arret : 3.75882 s/iter 38.537349 +gpu 0 iter : 11 Arret : 3.50583 s/iter 39.060169 +gpu 0 iter : 12 Arret : 3.46154 s/iter 38.314523 +gpu 0 iter : 13 Arret : 1.44838 s/iter 38.304672 +gpu 0 iter : 14 Arret : 2.97866 s/iter 38.101085 +gpu 0 iter : 15 Arret : 1.47363 s/iter 37.961455 +gpu 0 iter : 16 Arret : 3.02916 s/iter 37.963549 +gpu 0 iter : 17 Arret : 3.44273 s/iter 37.562647 +gpu 0 iter : 18 Arret : 9.75818 s/iter 37.462847 +gpu 0 iter : 19 Arret : 3.55089 s/iter 37.388809 +gpu 0 iter : 20 Arret : 1.23127 s/iter 37.253955 +gpu 0 iter : 21 Arret : 2.15757 s/iter 37.181593 +gpu 0 iter : 22 Arret : 1.41689 s/iter 37.239248 +gpu 0 iter : 23 Arret : 2.71181 s/iter 37.183043 +gpu 0 iter : 24 Arret : 1.74358 s/iter 37.093614 +gpu 0 iter : 25 Arret : 1.20275 s/iter 37.190846 +gpu 0 iter : 26 Arret : 4.12739 s/iter 37.151827 +gpu 0 iter : 27 Arret : 0.963355 s/iter 37.085124 +gpu 0 iter : 28 Arret : 0.780804 s/iter 37.089879 +gpu 0 iter : 29 Arret : 1.04543 s/iter 37.116299 +gpu 0 iter : 30 Arret : 0.861461 s/iter 36.766134 +gpu 0 iter : 31 Arret : 0.882203 s/iter 36.884355 +gpu 0 iter : 32 Arret : 1.2718 s/iter 36.769843 +gpu 0 iter : 33 Arret : 2.35224 s/iter 36.354615 +gpu 0 iter : 34 Arret : 0.727156 s/iter 36.255055 +gpu 0 iter : 35 Arret : 1.44624 s/iter 36.206611 +gpu 0 iter : 36 Arret : 0.991076 s/iter 36.090368 +gpu 0 iter : 37 Arret : 1.04914 s/iter 35.800864 +gpu 0 iter : 38 Arret : 1.8416 s/iter 35.547956 +gpu 0 iter : 39 Arret : 73.3357 s/iter 35.569370 +gpu 0 iter : 40 Arret : 1.27526 s/iter 35.589183 +gpu 0 iter : 41 Arret : 0.664432 s/iter 35.572552 +gpu 0 iter : 42 Arret : 2.02267 s/iter 35.596663 +gpu 0 iter : 43 Arret : 3.3247 s/iter 35.518933 +gpu 0 iter : 44 Arret : 0.753208 s/iter 35.558919 +gpu 0 iter : 45 Arret : 0.406779 s/iter 35.517839 +gpu 0 iter : 46 Arret : 0.190344 s/iter 35.499532 +gpu 0 iter : 47 Arret : 0.053701 s/iter 35.454469 +gpu 0 iter : 48 Arret : 0.0180092 s/iter 35.423771 +gpu 0 iter : 49 Arret : 0.0103853 s/iter 35.469037 +gpu 0 iter : 50 Arret : 0.00392672 s/iter 35.295894 +gpu 0 iter : 51 Arret : 0.00130348 s/iter 35.285682 +gpu 0 iter : 52 Arret : 5.94285E-05 s/iter 35.279833 +gpu 0 iter : 53 Arret : 3.66884E-07 s/iter 35.262013 +gpu 0 iter : 54 Arret : 1.24856E-09 s/iter 35.260448 +gpu 0 iter : 55 Arret : 1.23865E-11 s/iter 35.262868 +gpu 0 iter : 56 Arret : 1.69469E-13 s/iter 35.261163 +temps : 2056.31 seconde(s) +Nb iterations : 56 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.48302E-06 +Stabilite : 1.69469E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54031 +i* 0.841472| 1| 1.4588E-09 +i* 4.51768E-09| +| 2| 0.513633 +i* 0.858015| 1| 1.54651E-09 +i*-2.27023E-10| +| 3| 0.486464 +i* 0.873697| 0.999997| 5.22282E-12 +i* 2.0872E-11| +| 4| 0.458789 +i* 0.888542| 0.999997| 2.48135E-13 +i*-2.88822E-11| +| 5| 0.430701 +i* 0.902491| 0.999997| 1.55062E-11 +i*-3.45463E-12| +| 6| 0.402126 +i* 0.915589| 1| 2.50282E-09 +i*-6.10471E-09| +| 7| 0.3732 +i* 0.927747| 0.999997|-1.54374E-11 +i*-2.76083E-11| +| 8| 0.3439 +i* 0.939003| 0.999997|-1.12714E-11 +i* 1.5453E-11| +| 9| 0.314261 +i* 0.949333| 0.999997| 1.93628E-11 +i* 2.50909E-11| +| 10| 0.284313 +i* 0.958728| 0.999997| 2.69426E-11 +i* 2.77974E-11| +| 11| 0.254084 +i* 0.967179| 0.999997| 1.5277E-11 +i* 4.73027E-12| +| 12| 0.223605 +i* 0.974676| 0.999997| -8.1017E-11 +i*-3.77299E-11| +| 13| 0.192909 +i* 0.981221| 1|-1.95729E-09 +i* 4.84549E-09| +| 14| 0.162018 +i* 0.986792| 1| 1.18712E-08 +i* 5.95858E-09| +| 15| 0.128886 +i* 0.991664| 1|-2.36358E-09 +i* 3.79427E-11| +| 16| 0.099787 +i* 0.995013| 1|-7.20324E-09 +i* 2.86361E-09| +| 17| 0.0685404 +i* 0.997645| 0.999997| 1.01124E-11 +i* 3.1089E-12| +| 18| 0.0371504 +i* 0.999314| 1|-3.18728E-10 +i*-2.97119E-09| +| 19| 0.00578048 +i* 0.99998| 0.999997| 3.46787E-11 +i* 1.94857E-13| +| 20| -0.0256056 +i* 0.999669| 0.999997| 2.01068E-11 +i*-1.22213E-12| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +700000 racines de module = 0.999997 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^600000 + (-10 +i*0)*x^800000 + (1 +i*0)*x^1400000 + +(-60000 +i*0)*x^599999 + (-8E+06 +i*0)*x^799999 + (1.4E+06 +i*0)*x^1399999 + +zone limite de 'log-exp' 1.00025 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 0 (of 3) uses CUDA device 0 +gpu 1 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 1 dimgrid2 1823 start 466688 size 466688 +gpu 2 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 2 dimgrid2 1823 start 933376 size 466688 +gpu 0 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 0 dimgrid2 1823 start 0 size 466688 +gpu 0 iter : 1 Arret : 0.047657 s/iter 48.025151 +gpu 0 iter : 2 Arret : 0.964913 s/iter 49.123050 +gpu 0 iter : 3 Arret : 2.4727 s/iter 49.732738 +gpu 0 iter : 4 Arret : 2.06376 s/iter 50.210543 +gpu 0 iter : 5 Arret : 0.958099 s/iter 51.132618 +gpu 0 iter : 6 Arret : 0.828164 s/iter 51.281245 +gpu 0 iter : 7 Arret : 2.24981 s/iter 51.515152 +gpu 0 iter : 8 Arret : 1.27056 s/iter 52.721722 +gpu 0 iter : 9 Arret : 1.7356 s/iter 52.706102 +gpu 0 iter : 10 Arret : 0.542543 s/iter 52.785746 +gpu 0 iter : 11 Arret : 0.703757 s/iter 52.816724 +gpu 0 iter : 12 Arret : 0.310008 s/iter 52.461451 +gpu 0 iter : 13 Arret : 0.443499 s/iter 51.910352 +gpu 0 iter : 14 Arret : 0.600068 s/iter 51.409402 +gpu 0 iter : 15 Arret : 0.482174 s/iter 51.392959 +gpu 0 iter : 16 Arret : 0.771182 s/iter 50.626111 +gpu 0 iter : 17 Arret : 0.532518 s/iter 50.225728 +gpu 0 iter : 18 Arret : 0.257696 s/iter 49.125636 +gpu 0 iter : 19 Arret : 0.177381 s/iter 48.905491 +gpu 0 iter : 20 Arret : 0.130753 s/iter 48.447574 +gpu 0 iter : 21 Arret : 0.0607806 s/iter 48.417696 +gpu 0 iter : 22 Arret : 3.28538 s/iter 48.161859 +gpu 0 iter : 23 Arret : 1.32615 s/iter 48.015609 +gpu 0 iter : 24 Arret : 0.026712 s/iter 48.032029 +gpu 0 iter : 25 Arret : 0.0189921 s/iter 48.023109 +gpu 0 iter : 26 Arret : 0.0252448 s/iter 48.022355 +gpu 0 iter : 27 Arret : 0.0183014 s/iter 48.029077 +gpu 0 iter : 28 Arret : 0.0259939 s/iter 48.031196 +gpu 0 iter : 29 Arret : 0.0148008 s/iter 48.034595 +gpu 0 iter : 30 Arret : 0.00511391 s/iter 48.034650 +gpu 0 iter : 31 Arret : 0.000444388 s/iter 48.016595 +gpu 0 iter : 32 Arret : 1.35417E-05 s/iter 48.015821 +gpu 0 iter : 33 Arret : 5.22681E-07 s/iter 48.020076 +gpu 0 iter : 34 Arret : 2.63971E-09 s/iter 48.039932 +gpu 0 iter : 35 Arret : 1.22535E-11 s/iter 48.040535 +gpu 0 iter : 36 Arret : 5.68579E-14 s/iter 48.039757 +temps : 1786.83 seconde(s) +Nb iterations : 36 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.48488E-08 +Stabilite : 5.68579E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841469| 0.999997|-8.47142E-11 +i* 1.92466E-11| +| 2| 0.513623 +i* 0.858013| 0.999997|-2.15776E-11 +i*-2.98557E-11| +| 3| -0.52703 +i* -0.849843| 0.999997|-6.50922E-11 +i* 8.44216E-12| +| 4| 0.486439 +i* 0.873711| 0.999997| 5.60277E-11 +i* 4.36779E-11| +| 5| -0.500096 +i* -0.865967| 0.999997| 3.56147E-11 +i*-3.12713E-11| +| 6| 0.458776 +i* 0.888549| 0.999997|-1.89702E-11 +i* 4.08274E-12| +| 7| -0.472669 +i* -0.881237| 0.999997|-1.66496E-11 +i*-3.61498E-11| +| 8| 0.430661 +i* 0.902511| 0.999997|-1.60558E-11 +i*-1.29949E-11| +| 9| -0.444791 +i* -0.895631| 0.999997|-8.89955E-13 +i* 2.61938E-12| +| 10| 0.402136 +i* 0.915577| 0.999997| 6.5834E-12 +i* -1.3935E-11| +| 11| -0.416432 +i* -0.909164| 0.999997| 1.97816E-11 +i* 3.10848E-11| +| 12| 0.373171 +i* 0.927759| 0.999997|-2.17995E-11 +i*-2.96867E-12| +| 13| -0.387698 +i* -0.921783| 0.999997|-1.86324E-11 +i* -4.6545E-11| +| 14| 0.343875 +i* 0.939012| 0.999997|-1.30287E-11 +i*-2.87501E-11| +| 15| -0.358575 +i* -0.933498| 0.999997|-4.93405E-11 +i*-7.15173E-13| +| 16| 0.314233 +i* 0.949343| 0.999997| 1.02587E-11 +i*-4.25648E-11| +| 17| -0.329098 +i* -0.944293| 0.999997|-1.57903E-11 +i* 2.05052E-11| +| 18| 0.284281 +i* 0.958738| 0.999997| 2.51592E-11 +i* 2.09243E-11| +| 19| -0.299297 +i* -0.954157| 0.999997| 5.03608E-12 +i* 1.70503E-11| +| 20| 0.254048 +i* 0.967189| 0.999997|-2.81228E-11 +i*-1.66302E-11| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 0.999997 +600000 racines de module = 1 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140098: line 23: 11749 Segmentation fault (core dumped) ./template -r -i 900000 700000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140098: line 24: 11753 Segmentation fault (core dumped) ./template -r -i 1000000 800000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140098: line 25: 11755 Segmentation fault (core dumped) ./template -r -i 1500000 500000 diff --git a/Simulations/sparse_openmp/sparse_openmp_3GPU.sge b/Simulations/sparse_openmp/sparse_openmp_3GPU.sge new file mode 100755 index 0000000..f3bb47b --- /dev/null +++ b/Simulations/sparse_openmp/sparse_openmp_3GPU.sge @@ -0,0 +1,27 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=3 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -pe openmp 3 +#$ -V +#$ -cwd +#$ -N sparse_openmp_3GPU + +module load gcc/4.9.0 +module load cuda/7.0 + + +./template -r -i 60000 40000 +./template -r -i 150000 50000 +./template -r -i 250000 150000 +./template -r -i 350000 250000 +./template -r -i 500000 300000 +./template -r -i 600000 400000 +./template -r -i 700000 500000 +./template -r -i 800000 600000 +./template -r -i 900000 700000 +./template -r -i 1000000 800000 +./template -r -i 1500000 500000 + + diff --git a/Simulations/sparse_openmp/sparse_openmp_4GPU.o140097 b/Simulations/sparse_openmp/sparse_openmp_4GPU.o140097 new file mode 100644 index 0000000..2edc5c1 --- /dev/null +++ b/Simulations/sparse_openmp/sparse_openmp_4GPU.o140097 @@ -0,0 +1,621 @@ +REMAINING: 4 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +Taking GPU #3 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^40000 + (-10 +i*0)*x^60000 + (1 +i*0)*x^100000 + +(-4000 +i*0)*x^39999 + (-600000 +i*0)*x^59999 + (100000 +i*0)*x^99999 + +zone limite de 'log-exp' 1.00356 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 0 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 0 dimgrid2 98 start 0 size 25024 +gpu 2 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 2 dimgrid2 98 start 50048 size 25024 +gpu 3 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 3 dimgrid2 98 start 75072 size 25024 +gpu 1 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 1 dimgrid2 98 start 25024 size 25024 +gpu 0 iter : 1 Arret : 0.00317265 s/iter 0.236357 +gpu 0 iter : 2 Arret : 0.00227157 s/iter 0.222729 +gpu 0 iter : 3 Arret : 0.00205316 s/iter 0.222769 +gpu 0 iter : 4 Arret : 0.00128297 s/iter 0.222748 +gpu 0 iter : 5 Arret : 0.00112626 s/iter 0.222747 +gpu 0 iter : 6 Arret : 0.0020822 s/iter 0.222736 +gpu 0 iter : 7 Arret : 0.0115304 s/iter 0.222730 +gpu 0 iter : 8 Arret : 0.0115653 s/iter 0.295379 +gpu 0 iter : 9 Arret : 0.00182694 s/iter 0.222647 +gpu 0 iter : 10 Arret : 0.000971807 s/iter 0.222690 +gpu 0 iter : 11 Arret : 0.00050868 s/iter 0.222743 +gpu 0 iter : 12 Arret : 0.000554626 s/iter 0.222588 +gpu 0 iter : 13 Arret : 0.000773549 s/iter 0.222519 +gpu 0 iter : 14 Arret : 0.000652981 s/iter 0.222480 +gpu 0 iter : 15 Arret : 7.85268E-05 s/iter 0.222478 +gpu 0 iter : 16 Arret : 1.67519E-05 s/iter 0.222489 +gpu 0 iter : 17 Arret : 1.93862E-07 s/iter 0.222504 +gpu 0 iter : 18 Arret : 2.89153E-09 s/iter 0.222440 +gpu 0 iter : 19 Arret : 4.30769E-11 s/iter 0.222397 +gpu 0 iter : 20 Arret : 6.41743E-13 s/iter 0.222499 +temps : 5.86914 seconde(s) +Nb iterations : 20 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.09748E-08 +Stabilite : 1.57015E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540308 +i* 0.841422| 0.999962|-1.95866E-12 +i*-4.55465E-13| +| 2| -0.113164 +i* 0.993538| 0.999962|-4.34919E-12 +i* 9.60242E-13| +| 3| -0.226732 +i* -0.974016| 1.00006|-1.34468E-09 +i*-3.70749E-10| +| 4| -0.715763 +i* 0.698289| 0.999962| 9.11271E-13 +i* 2.47219E-12| +| 5| 0.439922 +i* -0.897993| 0.999962|-3.49498E-13 +i* 1.66432E-12| +| 6| -0.996122 +i* 0.0886386| 1.00006| 4.72785E-10 +i* 4.13616E-11| +| 7| 0.908546 +i* -0.417692| 0.999962| 4.78506E-13 +i* 1.54377E-13| +| 8| -0.827813 +i* -0.560935| 0.999962| 9.76996E-13 +i*-2.04309E-12| +| 9| 0.968129 +i* 0.250682| 1.00006|-2.31715E-10 +i* 1.34848E-10| +| 10| -0.286842 +i* -0.958038| 1.00006|-5.93554E-10 +i*-2.45345E-10| +| 11| 0.591653 +i* 0.806145| 0.999962|-9.87654E-13 +i*-3.03635E-12| +| 12| -0.0511836 +i* 0.998651| 0.999962|-2.22622E-12 +i*-3.69013E-14| +| 13| -0.67097 +i* 0.741432| 0.999962|-8.03801E-14 +i*-1.68204E-12| +| 14| 0.383249 +i* -0.923603| 0.999962|-1.29119E-12 +i*-1.37426E-12| +| 15| -0.988685 +i* 0.15039| 1.00006|-1.61051E-10 +i* 7.18515E-11| +| 16| 0.880824 +i* -0.473363| 0.999962|-4.03455E-13 +i* 2.85139E-12| +| 17| -0.861082 +i* -0.508391| 0.999962| 9.8066E-13 +i* 3.40478E-12| +| 18| 0.98184 +i* 0.190015| 1.00006| 8.88373E-10 +i*-2.66385E-10| +| 19| -0.345842 +i* -0.938354| 1.00006| 1.38421E-10 +i*-2.31696E-10| +| 20| 0.640621 +i* 0.767807| 0.999962|-6.98774E-13 +i* 1.13798E-12| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 0.999962 +40000 racines de module = 1.00006 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^50000 + (-10 +i*0)*x^150000 + (1 +i*0)*x^200000 + +(-5000 +i*0)*x^49999 + (-1.5E+06 +i*0)*x^149999 + (200000 +i*0)*x^199999 + +zone limite de 'log-exp' 1.00178 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 0 (of 4) uses CUDA device 0 +gpu 1 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 1 dimgrid2 196 start 50048 size 50048 +gpu 2 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 2 dimgrid2 196 start 100096 size 50048 +gpu 3 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 3 dimgrid2 196 start 150144 size 50048 +gpu 0 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 0 dimgrid2 196 start 0 size 50048 +gpu 0 iter : 1 Arret : 0.000151294 s/iter 0.873722 +gpu 0 iter : 2 Arret : 0.000148163 s/iter 0.876720 +gpu 0 iter : 3 Arret : 0.000156239 s/iter 0.876483 +gpu 0 iter : 4 Arret : 0.000917016 s/iter 0.876408 +gpu 0 iter : 5 Arret : 0.00193309 s/iter 0.877387 +gpu 0 iter : 6 Arret : 0.012901 s/iter 1.040793 +gpu 0 iter : 7 Arret : 0.0696679 s/iter 1.039198 +gpu 0 iter : 8 Arret : 0.0831135 s/iter 1.017396 +gpu 0 iter : 9 Arret : 0.655093 s/iter 1.021459 +gpu 0 iter : 10 Arret : 0.310762 s/iter 1.026425 +gpu 0 iter : 11 Arret : 0.25028 s/iter 1.016739 +gpu 0 iter : 12 Arret : 0.12787 s/iter 1.024487 +gpu 0 iter : 13 Arret : 0.174578 s/iter 0.991808 +gpu 0 iter : 14 Arret : 0.13471 s/iter 1.020582 +gpu 0 iter : 15 Arret : 0.260288 s/iter 0.881413 +gpu 0 iter : 16 Arret : 0.151424 s/iter 1.018801 +gpu 0 iter : 17 Arret : 0.070357 s/iter 0.881097 +gpu 0 iter : 18 Arret : 0.0196537 s/iter 0.881104 +gpu 0 iter : 19 Arret : 0.00113921 s/iter 0.878041 +gpu 0 iter : 20 Arret : 4.42128E-05 s/iter 0.877967 +gpu 0 iter : 21 Arret : 3.87634E-06 s/iter 0.878342 +gpu 0 iter : 22 Arret : 3.63936E-09 s/iter 0.878295 +gpu 0 iter : 23 Arret : 3.63838E-13 s/iter 0.878170 +temps : 22.9576 seconde(s) +Nb iterations : 23 +Nb de depassements de capacite exponentielle : 0 +Precision : 0.000181892 +Stabilite : 2.22061E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540303 +i* 0.841453| 0.999985| 1.08703E-11 +i*-2.49217E-12| +| 2| -0.837195 +i* 0.546877| 0.999985| -5.4492E-12 +i* 1.09163E-12| +| 3| -0.553418 +i* -0.832885| 0.999985| -1.9722E-12 +i*-7.40397E-12| +| 4| 0.828599 +i* -0.559925| 1.00005|-7.54521E-09 +i* 1.47059E-08| +| 5| -0.8197 +i* 0.572767| 0.999985|-4.21663E-13 +i* -2.8616E-12| +| 6| -0.57917 +i* -0.815188| 0.999985|-5.13034E-12 +i*-1.52645E-12| +| 7| 0.810626 +i* -0.585537| 0.999985|-6.36846E-12 +i*-5.86797E-12| +| 8| 0.591872 +i* 0.806089| 1.00005|-1.69803E-09 +i* 9.43795E-09| +| 9| -0.801454 +i* 0.598134| 1.00005| 5.92533E-09 +i* 3.55911E-08| +| 10| -0.604356 +i* -0.796695| 0.999985|-1.64091E-13 +i* 1.59084E-12| +| 11| 0.791937 +i* -0.610578| 0.999985| 6.0707E-13 +i* 1.52922E-12| +| 12| 0.616763 +i* 0.78713| 0.999985|-4.48042E-12 +i* -2.6295E-12| +| 13| -0.782301 +i* 0.622877| 0.999985|-2.15827E-12 +i*-6.27114E-12| +| 14| -0.628991 +i* -0.777472| 1.00005| 6.93065E-09 +i*-8.65443E-09| +| 15| 0.772474 +i* -0.635023| 0.999985| 1.54783E-11 +i*-1.81338E-12| +| 16| 0.641054 +i* 0.767476| 0.999985| 9.05009E-12 +i*-2.91295E-12| +| 17| -0.762458 +i* 0.647014| 0.999985| 5.81724E-12 +i*-9.99384E-12| +| 18| -0.652967 +i* -0.757366| 0.999985| 5.10392E-12 +i*-6.61069E-12| +| 19| 0.752302 +i* -0.658888| 1.00005| 3.99107E-09 +i* 1.02117E-08| +| 20| 0.66472 +i* 0.747072| 0.999985|-1.93379E-12 +i*-1.29726E-11| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 0.999985 +50000 racines de module = 1.00005 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^150000 + (-10 +i*0)*x^250000 + (1 +i*0)*x^400000 + +(-15000 +i*0)*x^149999 + (-2.5E+06 +i*0)*x^249999 + (400000 +i*0)*x^399999 + +zone limite de 'log-exp' 1.00089 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 0 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 0 dimgrid2 391 start 0 size 100032 +gpu 2 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 2 dimgrid2 391 start 200064 size 100032 +gpu 3 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 3 dimgrid2 391 start 300096 size 100032 +gpu 1 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 1 dimgrid2 391 start 100032 size 100032 +gpu 0 iter : 1 Arret : 0.00053336 s/iter 3.114080 +gpu 0 iter : 2 Arret : 0.00132869 s/iter 3.113006 +gpu 0 iter : 3 Arret : 0.00304211 s/iter 3.113002 +gpu 0 iter : 4 Arret : 0.0081892 s/iter 3.421884 +gpu 0 iter : 5 Arret : 0.0174091 s/iter 3.393637 +gpu 0 iter : 6 Arret : 0.0170263 s/iter 3.378163 +gpu 0 iter : 7 Arret : 0.00925735 s/iter 3.423651 +gpu 0 iter : 8 Arret : 0.00879968 s/iter 3.111951 +gpu 0 iter : 9 Arret : 0.0133997 s/iter 3.368852 +gpu 0 iter : 10 Arret : 0.00968114 s/iter 3.111774 +gpu 0 iter : 11 Arret : 0.00462525 s/iter 3.110863 +gpu 0 iter : 12 Arret : 0.00341319 s/iter 3.111132 +gpu 0 iter : 13 Arret : 0.00439696 s/iter 3.110364 +gpu 0 iter : 14 Arret : 0.000354857 s/iter 3.110007 +gpu 0 iter : 15 Arret : 0.00105657 s/iter 3.109831 +gpu 0 iter : 16 Arret : 0.000563123 s/iter 3.109784 +gpu 0 iter : 17 Arret : 2.74759E-05 s/iter 3.109683 +gpu 0 iter : 18 Arret : 3.06801E-07 s/iter 3.109172 +gpu 0 iter : 19 Arret : 7.06164E-10 s/iter 3.108923 +gpu 0 iter : 20 Arret : 1.07684E-11 s/iter 3.109509 +gpu 0 iter : 21 Arret : 1.64161E-13 s/iter 3.109378 +temps : 68.0633 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.09466E-07 +Stabilite : 3.51078E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540313 +i* 0.841453| 0.999991| 9.34197E-12 +i*-1.23633E-11| +| 2| -0.998329 +i* 0.057622| 0.999991| 4.43912E-12 +i* 1.27665E-12| +| 3| 0.439867 +i* -0.898052| 0.999991|-8.50653E-12 +i*-8.85586E-12| +| 4| -0.996033 +i* 0.0888768| 0.999991|-3.15592E-12 +i* 1.17456E-12| +| 5| 0.411521 +i* -0.911417| 1.00002|-2.94737E-09 +i* 1.73005E-09| +| 6| 0.59196 +i* 0.805956| 0.999991| 5.24358E-13 +i*-8.53073E-12| +| 7| -0.992759 +i* 0.120044| 0.999991| 2.58804E-12 +i* 2.47274E-12| +| 8| 0.382796 +i* -0.923823| 0.999991|-1.63092E-11 +i* 4.26312E-12| +| 9| 0.616925 +i* 0.78701| 0.999991| 4.27514E-12 +i*-1.13966E-11| +| 10| -0.988534 +i* 0.151098| 1.00002|-8.27014E-10 +i* 9.44171E-10| +| 11| 0.35366 +i* -0.935364| 0.999991|-1.92664E-11 +i* 1.19958E-11| +| 12| 0.641299 +i* 0.767311| 1.00002|-2.44657E-09 +i* -6.7886E-11| +| 13| -0.983286 +i* 0.18202| 0.999991| 3.21676E-12 +i*-9.48297E-13| +| 14| 0.324176 +i* -0.945987| 0.999991|-5.20695E-12 +i*-7.06984E-12| +| 15| 0.66503 +i* 0.746804| 0.999991| 5.74873E-13 +i* 8.53884E-12| +| 16| -0.977123 +i* 0.212747| 1.00002| 1.09185E-09 +i* 2.38902E-10| +| 17| 0.294374 +i* -0.955681| 0.999991|-2.37395E-11 +i*-2.53098E-12| +| 18| 0.688122 +i* 0.725616| 1.00002|-2.54456E-09 +i* 8.15125E-10| +| 19| -0.969965 +i* 0.243206| 0.999991| 6.88072E-12 +i* 3.20268E-13| +| 20| 0.264283 +i* -0.964436| 0.999991| 2.5573E-11 +i*-6.45539E-12| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 0.999991 +150000 racines de module = 1.00002 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^250000 + (-10 +i*0)*x^350000 + (1 +i*0)*x^600000 + +(-25000 +i*0)*x^249999 + (-3.5E+06 +i*0)*x^349999 + (600000 +i*0)*x^599999 + +zone limite de 'log-exp' 1.00059 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 3 (of 4) uses CUDA device 3 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 586 start 0 size 150016 +gpu 2 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 2 dimgrid2 586 start 300032 size 150016 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 586 start 150016 size 150016 +gpu 3 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 3 dimgrid2 586 start 450048 size 150016 +gpu 0 iter : 1 Arret : 0.00166144 s/iter 6.733254 +gpu 0 iter : 2 Arret : 0.00663307 s/iter 6.721345 +gpu 0 iter : 3 Arret : 0.0196947 s/iter 6.725089 +gpu 0 iter : 4 Arret : 0.0354088 s/iter 7.044531 +gpu 0 iter : 5 Arret : 0.0344666 s/iter 7.231490 +gpu 0 iter : 6 Arret : 0.0255965 s/iter 7.223546 +gpu 0 iter : 7 Arret : 0.0250307 s/iter 7.248225 +gpu 0 iter : 8 Arret : 0.0220818 s/iter 7.524758 +gpu 0 iter : 9 Arret : 0.0193422 s/iter 7.217155 +gpu 0 iter : 10 Arret : 0.0384961 s/iter 7.206267 +gpu 0 iter : 11 Arret : 0.0308611 s/iter 7.198073 +gpu 0 iter : 12 Arret : 0.0139003 s/iter 7.227655 +gpu 0 iter : 13 Arret : 0.00821788 s/iter 6.730489 +gpu 0 iter : 14 Arret : 0.00366002 s/iter 7.146524 +gpu 0 iter : 15 Arret : 0.00103013 s/iter 6.725238 +gpu 0 iter : 16 Arret : 0.000538911 s/iter 6.724848 +gpu 0 iter : 17 Arret : 0.000270623 s/iter 6.725086 +gpu 0 iter : 18 Arret : 4.24795E-05 s/iter 6.724157 +gpu 0 iter : 19 Arret : 5.07342E-09 s/iter 6.723896 +gpu 0 iter : 20 Arret : 7.14369E-11 s/iter 6.724108 +gpu 0 iter : 21 Arret : 1.00557E-12 s/iter 6.725050 +gpu 0 iter : 22 Arret : 1.41479E-14 s/iter 6.724347 +temps : 154.313 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.37653E-08 +Stabilite : 2.77613E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540302 +i* 0.841463| 0.999993| 8.34199E-12 +i* -1.9051E-11| +| 2| -0.553438 +i* -0.832883| 0.999993|-2.10654E-12 +i*-2.55273E-11| +| 3| -0.579282 +i* -0.815119| 0.999993|-1.44751E-12 +i* 7.66798E-12| +| 4| 0.592014 +i* 0.805919| 0.999993|-3.98037E-12 +i* 9.55808E-12| +| 5| -0.604557 +i* -0.796554| 0.999993|-2.82974E-12 +i* 9.99473E-12| +| 6| 0.61698 +i* 0.78697| 0.999993| 9.01823E-12 +i*-5.69156E-12| +| 7| -0.629237 +i* -0.777205| 0.999993|-2.92122E-12 +i*-4.85867E-12| +| 8| 0.641354 +i* 0.767237| 0.999993|-1.64209E-11 +i* 1.12904E-12| +| 9| -0.653299 +i* -0.757092| 0.999993|-8.22453E-13 +i* 2.82818E-12| +| 10| 0.665096 +i* 0.746749| 0.999993| -1.2145E-11 +i* 1.89129E-11| +| 11| -0.676717 +i* -0.736234| 0.999993|-1.26079E-11 +i*-1.25073E-11| +| 12| 0.688185 +i* 0.725526| 0.999993| 2.69875E-11 +i* 1.65411E-11| +| 13| -0.699466 +i* -0.714679| 1.00001| 3.92343E-10 +i*-3.02623E-09| +| 14| 0.710597 +i* 0.70359| 0.999993| 1.28564E-11 +i* 1.56626E-11| +| 15| -0.721517 +i* -0.69241| 1.00001| 1.76709E-09 +i*-4.04041E-09| +| 16| 0.73231 +i* 0.680962| 0.999993| 1.34706E-11 +i*-4.43489E-12| +| 17| -0.742944 +i* -0.669367| 1.00001| 9.14394E-11 +i*-3.49261E-09| +| 18| 0.7533 +i* 0.657691| 1.00001| 1.64587E-09 +i*-3.03669E-09| +| 19| -0.763551 +i* -0.645737| 0.999993| 1.68299E-11 +i* 1.43271E-11| +| 20| 0.773539 +i* 0.633763| 1.00001| -4.2314E-09 +i* 1.86243E-09| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 0.999993 +250000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^300000 + (-10 +i*0)*x^500000 + (1 +i*0)*x^800000 + +(-30000 +i*0)*x^299999 + (-5E+06 +i*0)*x^499999 + (800000 +i*0)*x^799999 + +zone limite de 'log-exp' 1.00044 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 3 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 3 dimgrid2 782 start 600000 size 200000 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 782 start 200000 size 200000 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 782 start 0 size 200000 +gpu 2 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 2 dimgrid2 782 start 400000 size 200000 +gpu 0 iter : 1 Arret : 0.00108387 s/iter 12.149827 +gpu 0 iter : 2 Arret : 0.00154284 s/iter 12.327396 +gpu 0 iter : 3 Arret : 0.00442373 s/iter 12.172431 +gpu 0 iter : 4 Arret : 0.0484674 s/iter 12.229082 +gpu 0 iter : 5 Arret : 0.0462186 s/iter 12.248952 +gpu 0 iter : 6 Arret : 0.0672711 s/iter 12.235166 +gpu 0 iter : 7 Arret : 0.0371959 s/iter 12.355881 +gpu 0 iter : 8 Arret : 0.0332451 s/iter 12.399234 +gpu 0 iter : 9 Arret : 0.0347928 s/iter 12.369857 +gpu 0 iter : 10 Arret : 0.0382283 s/iter 12.701023 +gpu 0 iter : 11 Arret : 0.010893 s/iter 12.800482 +gpu 0 iter : 12 Arret : 0.0100182 s/iter 12.206749 +gpu 0 iter : 13 Arret : 0.000870471 s/iter 12.137340 +gpu 0 iter : 14 Arret : 0.00222619 s/iter 12.140578 +gpu 0 iter : 15 Arret : 0.000360359 s/iter 12.119427 +gpu 0 iter : 16 Arret : 0.000163251 s/iter 12.146378 +gpu 0 iter : 17 Arret : 8.3446E-05 s/iter 12.146441 +gpu 0 iter : 18 Arret : 5.95325E-07 s/iter 12.141680 +gpu 0 iter : 19 Arret : 1.07969E-09 s/iter 12.142666 +gpu 0 iter : 20 Arret : 2.37954E-12 s/iter 12.145013 +gpu 0 iter : 21 Arret : 3.63218E-14 s/iter 12.145853 +temps : 258.82 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.97756E-07 +Stabilite : 2.22043E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841464| 0.999995| -2.03E-11 +i* 2.74701E-11| +| 2| 0.592014 +i* 0.805922| 0.999995|-1.82734E-11 +i* 2.10218E-11| +| 3| 0.617007 +i* 0.786952| 0.999995| 4.23442E-11 +i* -6.2147E-12| +| 4| 0.641392 +i* 0.767207| 0.999995| 6.90537E-12 +i*-5.12417E-11| +| 5| 0.665146 +i* 0.746707| 0.999995| 2.02977E-11 +i* 7.48579E-12| +| 6| 0.688245 +i* 0.725472| 0.999995|-1.73153E-11 +i* -1.2656E-11| +| 7| 0.710667 +i* 0.703522| 0.999995| 3.69782E-12 +i* 2.3081E-12| +| 8| 0.732388 +i* 0.68088| 0.999995| 9.45355E-12 +i* 2.09024E-11| +| 9| 0.753381 +i* 0.657577| 0.999995| 3.40094E-11 +i* 1.45989E-12| +| 10| 0.77364 +i* 0.633618| 0.999995|-1.72307E-11 +i* 1.22723E-11| +| 11| 0.793138 +i* 0.609034| 0.999995| 3.89222E-12 +i* 2.21356E-11| +| 12| 0.811855 +i* 0.583851| 0.999995|-1.28337E-11 +i*-5.47207E-12| +| 13| 0.829772 +i* 0.558094| 0.999995|-1.63114E-11 +i*-1.64246E-12| +| 14| 0.846873 +i* 0.531786| 0.999995|-3.30451E-11 +i*-8.10676E-12| +| 15| 0.86314 +i* 0.504956| 0.999995|-4.00413E-12 +i* 3.04823E-11| +| 16| 0.878557 +i* 0.477628| 0.999995|-2.16493E-12 +i* 1.10533E-11| +| 17| 0.893104 +i* 0.449841| 0.999995|-1.48552E-11 +i* 1.06063E-11| +| 18| 0.906777 +i* 0.4216| 0.999995|-1.38745E-11 +i* 5.33384E-12| +| 19| 0.919557 +i* 0.392944| 0.999995|-3.33245E-11 +i* 5.94386E-12| +| 20| 0.931433 +i* 0.363901| 0.999995| 4.93219E-11 +i*-2.82651E-11| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 0.999995 +300000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^400000 + (-10 +i*0)*x^600000 + (1 +i*0)*x^1000000 + +(-40000 +i*0)*x^399999 + (-6E+06 +i*0)*x^599999 + (1E+06 +i*0)*x^999999 + +zone limite de 'log-exp' 1.00035 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 3 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 3 dimgrid2 977 start 750144 size 250048 +gpu 0 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 0 dimgrid2 977 start 0 size 250048 +gpu 1 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 1 dimgrid2 977 start 250048 size 250048 +gpu 2 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 2 dimgrid2 977 start 500096 size 250048 +gpu 0 iter : 1 Arret : 0.000456228 s/iter 18.772328 +gpu 0 iter : 2 Arret : 0.00142575 s/iter 18.751830 +gpu 0 iter : 3 Arret : 0.00549425 s/iter 18.764447 +gpu 0 iter : 4 Arret : 0.0229296 s/iter 19.538754 +gpu 0 iter : 5 Arret : 0.0173741 s/iter 19.273977 +gpu 0 iter : 6 Arret : 0.0179817 s/iter 19.297823 +gpu 0 iter : 7 Arret : 0.0102999 s/iter 18.835443 +gpu 0 iter : 8 Arret : 0.00783109 s/iter 19.616467 +gpu 0 iter : 9 Arret : 0.00443683 s/iter 19.576776 +gpu 0 iter : 10 Arret : 0.00652305 s/iter 18.757222 +gpu 0 iter : 11 Arret : 0.00589396 s/iter 18.772725 +gpu 0 iter : 12 Arret : 0.00781914 s/iter 18.746761 +gpu 0 iter : 13 Arret : 0.00825508 s/iter 18.745513 +gpu 0 iter : 14 Arret : 0.00209831 s/iter 18.746669 +gpu 0 iter : 15 Arret : 0.000157396 s/iter 18.747760 +gpu 0 iter : 16 Arret : 0.000185725 s/iter 18.747416 +gpu 0 iter : 17 Arret : 0.000163905 s/iter 18.747056 +gpu 0 iter : 18 Arret : 6.34206E-05 s/iter 18.748309 +gpu 0 iter : 19 Arret : 5.65573E-06 s/iter 18.749904 +gpu 0 iter : 20 Arret : 7.0784E-09 s/iter 18.749738 +gpu 0 iter : 21 Arret : 2.24468E-11 s/iter 18.748487 +gpu 0 iter : 22 Arret : 7.09418E-14 s/iter 18.747345 +temps : 422.324 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 8.97857E-06 +Stabilite : 5.20859E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841468| 0.999996| 5.07216E-12 +i* 6.41236E-12| +| 2| 0.529701 +i* 0.84818| 0.999996|-4.61853E-13 +i*-4.17888E-12| +| 3| 0.524361 +i* 0.851491| 0.999996|-2.47296E-11 +i* 1.78327E-11| +| 4| 0.51901 +i* 0.854764| 0.999996| 9.45599E-12 +i* 2.07434E-11| +| 5| 0.513629 +i* 0.858008| 0.999996| 2.32483E-11 +i* 6.70747E-12| +| 6| 0.508237 +i* 0.861213| 0.999996|-1.34339E-11 +i* 9.87854E-12| +| 7| 0.502825 +i* 0.864384| 0.999996|-3.18459E-11 +i* 7.64744E-12| +| 8| 0.497384 +i* 0.867526| 0.999996| 2.97429E-11 +i*-6.06626E-13| +| 9| 0.491932 +i* 0.870629| 0.999996|-2.65525E-11 +i* 1.22525E-11| +| 10| 0.486452 +i* 0.873703| 0.999996| 3.0312E-11 +i* 1.02214E-11| +| 11| 0.480962 +i* 0.876737| 0.999996| 1.81546E-11 +i* 8.04012E-12| +| 12| 0.475453 +i* 0.879736| 0.999996| 3.09861E-11 +i* 4.093E-12| +| 13| 0.469917 +i* 0.882706| 0.999996|-1.29106E-11 +i*-2.31489E-11| +| 14| 0.46437 +i* 0.885637| 0.999996| 1.38481E-11 +i* -1.517E-11| +| 15| 0.458797 +i* 0.888537| 0.999996| 2.78862E-11 +i* 1.10441E-11| +| 16| 0.453214 +i* 0.891397| 0.999996| 2.45506E-11 +i* 3.1726E-11| +| 17| 0.447614 +i* 0.894223| 0.999996|-1.08491E-12 +i*-2.12277E-11| +| 18| 0.441986 +i* 0.897017| 0.999996| 2.72476E-11 +i* 3.22485E-11| +| 19| 0.436351 +i* 0.899772| 0.999996|-1.24334E-11 +i*-2.66317E-11| +| 20| 0.430689 +i* 0.902496| 0.999996| 2.73914E-12 +i* 2.25153E-11| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 0.999996 +400000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^700000 + (1 +i*0)*x^1200000 + +(-50000 +i*0)*x^499999 + (-7E+06 +i*0)*x^699999 + (1.2E+06 +i*0)*x^1199999 + +zone limite de 'log-exp' 1.0003 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 0 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 3 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 3 dimgrid2 1172 start 900096 size 300032 +gpu 2 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 0 dimgrid2 1172 start 0 size 300032 +gpu 2 dimgrid2 1172 start 600064 size 300032 +gpu 1 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 1 dimgrid2 1172 start 300032 size 300032 +gpu 0 iter : 1 Arret : 0.00368442 s/iter 26.569710 +gpu 0 iter : 2 Arret : 3.704 s/iter 28.385681 +gpu 0 iter : 3 Arret : 1.74615 s/iter 28.502041 +gpu 0 iter : 4 Arret : 2.12336 s/iter 28.609424 +gpu 0 iter : 5 Arret : 2.13811 s/iter 29.338801 +gpu 0 iter : 6 Arret : 0.766739 s/iter 29.346300 +gpu 0 iter : 7 Arret : 0.657775 s/iter 29.516021 +gpu 0 iter : 8 Arret : 0.597705 s/iter 29.678298 +gpu 0 iter : 9 Arret : 0.573945 s/iter 29.579526 +gpu 0 iter : 10 Arret : 0.542611 s/iter 29.795670 +gpu 0 iter : 11 Arret : 0.488156 s/iter 29.717429 +gpu 0 iter : 12 Arret : 0.463721 s/iter 29.588883 +gpu 0 iter : 13 Arret : 0.442782 s/iter 29.618542 +gpu 0 iter : 14 Arret : 0.43109 s/iter 29.294507 +gpu 0 iter : 15 Arret : 0.427026 s/iter 29.324604 +gpu 0 iter : 16 Arret : 0.434845 s/iter 29.362199 +gpu 0 iter : 17 Arret : 0.442084 s/iter 29.279579 +gpu 0 iter : 18 Arret : 0.46093 s/iter 29.338081 +gpu 0 iter : 19 Arret : 0.48645 s/iter 29.333743 +gpu 0 iter : 20 Arret : 0.496349 s/iter 29.369982 +gpu 0 iter : 21 Arret : 1.56187 s/iter 28.940178 +gpu 0 iter : 22 Arret : 2.3748 s/iter 28.784866 +gpu 0 iter : 23 Arret : 1.09653 s/iter 28.933834 +gpu 0 iter : 24 Arret : 1.43739 s/iter 28.700919 +gpu 0 iter : 25 Arret : 2.22796 s/iter 28.722635 +gpu 0 iter : 26 Arret : 1.54855 s/iter 28.698877 +gpu 0 iter : 27 Arret : 1.95651 s/iter 28.629259 +gpu 0 iter : 28 Arret : 0.897983 s/iter 28.648379 +gpu 0 iter : 29 Arret : 7.34662 s/iter 28.534855 +gpu 0 iter : 30 Arret : 1.74621 s/iter 28.422914 +gpu 0 iter : 31 Arret : 0.597689 s/iter 28.621303 +gpu 0 iter : 32 Arret : 0.857922 s/iter 28.617561 +gpu 0 iter : 33 Arret : 1.33974 s/iter 28.328536 +gpu 0 iter : 34 Arret : 10.8161 s/iter 28.390666 +gpu 0 iter : 35 Arret : 6.6951 s/iter 28.507533 +gpu 0 iter : 36 Arret : 0.757761 s/iter 28.460493 +gpu 0 iter : 37 Arret : 0.588104 s/iter 28.489026 +gpu 0 iter : 38 Arret : 0.593958 s/iter 28.232970 +gpu 0 iter : 39 Arret : 0.333943 s/iter 27.617579 +gpu 0 iter : 40 Arret : 0.276517 s/iter 27.632546 +gpu 0 iter : 41 Arret : 0.137564 s/iter 27.552902 +gpu 0 iter : 42 Arret : 0.0648876 s/iter 27.307198 +gpu 0 iter : 43 Arret : 0.0511538 s/iter 27.320582 +gpu 0 iter : 44 Arret : 0.0242118 s/iter 26.798806 +gpu 0 iter : 45 Arret : 0.00922443 s/iter 26.583042 +gpu 0 iter : 46 Arret : 0.00927718 s/iter 26.616458 +gpu 0 iter : 47 Arret : 0.0412361 s/iter 26.563085 +gpu 0 iter : 48 Arret : 0.0405407 s/iter 26.561073 +gpu 0 iter : 49 Arret : 0.00788436 s/iter 26.567749 +gpu 0 iter : 50 Arret : 0.00128029 s/iter 26.567412 +gpu 0 iter : 51 Arret : 0.000171237 s/iter 26.567449 +gpu 0 iter : 52 Arret : 7.02979E-07 s/iter 26.567944 +gpu 0 iter : 53 Arret : 2.0296E-09 s/iter 26.567809 +gpu 0 iter : 54 Arret : 8.07801E-12 s/iter 26.567272 +gpu 0 iter : 55 Arret : 3.21626E-14 s/iter 26.572179 +temps : 1556.58 seconde(s) +Nb iterations : 55 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.03717E-06 +Stabilite : 4.93017E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54031 +i* 0.841472| 1| 1.4588E-09 +i* 4.51768E-09| +| 2| 0.513633 +i* 0.858015| 1| 1.54651E-09 +i*-2.27023E-10| +| 3| 0.486451 +i* 0.873713| 1| 1.95054E-09 +i* 6.77633E-10| +| 4| 0.458805 +i* 0.888533| 0.999997| 1.78773E-11 +i* 1.55684E-11| +| 5| 0.430685 +i* 0.902499| 0.999997| 2.12053E-13 +i*-1.16324E-11| +| 6| 0.402126 +i* 0.915589| 1| 2.50282E-09 +i*-6.10471E-09| +| 7| 0.3732 +i* 0.927747| 0.999997|-1.54374E-11 +i*-2.76083E-11| +| 8| 0.3439 +i* 0.939003| 0.999997|-1.12714E-11 +i* 1.5453E-11| +| 9| 0.314261 +i* 0.949333| 0.999997| 1.93628E-11 +i* 2.50909E-11| +| 10| 0.284313 +i* 0.958728| 0.999997| 2.69426E-11 +i* 2.77974E-11| +| 11| 0.254084 +i* 0.967179| 0.999997| 1.5277E-11 +i* 4.73027E-12| +| 12| 0.223605 +i* 0.974676| 0.999997| -8.1017E-11 +i*-3.77299E-11| +| 13| 0.192909 +i* 0.981221| 1|-1.95729E-09 +i* 4.84549E-09| +| 14| 0.162018 +i* 0.986792| 1| 1.80241E-09 +i* 1.03051E-10| +| 15| 0.130967 +i* 0.991391| 1|-1.93729E-10 +i*-4.06442E-10| +| 16| 0.0998077 +i* 0.995003| 0.999997| -4.5103E-11 +i*-6.66658E-12| +| 17| 0.0685404 +i* 0.997645| 0.999997| 1.01124E-11 +i* 3.1089E-12| +| 18| 0.0371504 +i* 0.999314| 1|-1.38879E-09 +i*-2.32658E-09| +| 19| 0.00578048 +i* 0.99998| 0.999997| 3.46787E-11 +i* 1.94857E-13| +| 20| -0.0256056 +i* 0.999669| 0.999997| 2.01068E-11 +i*-1.22213E-12| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +700000 racines de module = 0.999997 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^600000 + (-10 +i*0)*x^800000 + (1 +i*0)*x^1400000 + +(-60000 +i*0)*x^599999 + (-8E+06 +i*0)*x^799999 + (1.4E+06 +i*0)*x^1399999 + +zone limite de 'log-exp' 1.00025 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +gpu 0 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 0 dimgrid2 1368 start 0 size 350016 +gpu 1 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 1 dimgrid2 1368 start 350016 size 350016 +gpu 2 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 2 dimgrid2 1368 start 700032 size 350016 +gpu 3 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 3 dimgrid2 1368 start 1050048 size 350016 +gpu 0 iter : 1 Arret : 0.00408309 s/iter 36.124369 +gpu 0 iter : 2 Arret : 0.208632 s/iter 36.641290 +gpu 0 iter : 3 Arret : 1.37702 s/iter 37.617641 +gpu 0 iter : 4 Arret : 1.45346 s/iter 37.349167 +gpu 0 iter : 5 Arret : 1.6393 s/iter 37.990887 +gpu 0 iter : 6 Arret : 3.4316 s/iter 38.064434 +gpu 0 iter : 7 Arret : 1.9865 s/iter 38.951955 +gpu 0 iter : 8 Arret : 4.57739 s/iter 39.092906 +gpu 0 iter : 9 Arret : 2.70182 s/iter 39.516603 +gpu 0 iter : 10 Arret : 2.54353 s/iter 40.448257 +gpu 0 iter : 11 Arret : 1.82865 s/iter 40.236603 +gpu 0 iter : 12 Arret : 0.783909 s/iter 39.432599 +gpu 0 iter : 13 Arret : 1.89333 s/iter 39.521084 +gpu 0 iter : 14 Arret : 1.37044 s/iter 39.264476 +gpu 0 iter : 15 Arret : 3.05361 s/iter 38.860385 +gpu 0 iter : 16 Arret : 2.08571 s/iter 38.971159 +gpu 0 iter : 17 Arret : 2.09101 s/iter 38.887096 +gpu 0 iter : 18 Arret : 1.02745 s/iter 38.910018 +gpu 0 iter : 19 Arret : 0.704384 s/iter 38.234669 +gpu 0 iter : 20 Arret : 0.741087 s/iter 38.350019 +gpu 0 iter : 21 Arret : 0.788627 s/iter 38.106199 +gpu 0 iter : 22 Arret : 1.04305 s/iter 37.990724 +gpu 0 iter : 23 Arret : 2.78018 s/iter 38.167968 +gpu 0 iter : 24 Arret : 3.62183 s/iter 38.203661 +gpu 0 iter : 25 Arret : 5.50084 s/iter 37.940466 +gpu 0 iter : 26 Arret : 0.606592 s/iter 38.122389 +gpu 0 iter : 27 Arret : 0.700038 s/iter 37.866885 +gpu 0 iter : 28 Arret : 0.418813 s/iter 37.840730 +gpu 0 iter : 29 Arret : 0.495401 s/iter 37.808439 +gpu 0 iter : 30 Arret : 0.988549 s/iter 37.865318 +gpu 0 iter : 31 Arret : 0.749386 s/iter 37.753243 +gpu 0 iter : 32 Arret : 0.852267 s/iter 37.713161 +gpu 0 iter : 33 Arret : 1.16501 s/iter 37.855558 +gpu 0 iter : 34 Arret : 0.385689 s/iter 37.935460 +gpu 0 iter : 35 Arret : 0.393423 s/iter 37.441807 +gpu 0 iter : 36 Arret : 0.317888 s/iter 36.669962 +gpu 0 iter : 37 Arret : 0.23539 s/iter 36.318606 +gpu 0 iter : 38 Arret : 0.0527559 s/iter 36.193597 +gpu 0 iter : 39 Arret : 0.0143793 s/iter 36.106964 +gpu 0 iter : 40 Arret : 0.00318939 s/iter 36.183822 +gpu 0 iter : 41 Arret : 2.64184E-05 s/iter 36.123292 +gpu 0 iter : 42 Arret : 1.30802E-08 s/iter 36.116093 +gpu 0 iter : 43 Arret : 1.80499E-10 s/iter 36.117759 +gpu 0 iter : 44 Arret : 2.48451E-12 s/iter 36.115451 +gpu 0 iter : 45 Arret : 3.41814E-14 s/iter 36.113705 +temps : 1704.89 seconde(s) +Nb iterations : 45 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.68566E-08 +Stabilite : 7.85076E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841469| 0.999997|-5.74141E-12 +i*-6.39521E-11| +| 2| 0.513623 +i* 0.858013| 0.999997|-2.15776E-11 +i*-2.98557E-11| +| 3| -0.52703 +i* -0.849843| 0.999997|-6.50922E-11 +i* 8.44216E-12| +| 4| 0.486439 +i* 0.873711| 0.999997| 5.60277E-11 +i* 4.36779E-11| +| 5| -0.500096 +i* -0.865967| 0.999997| 3.56147E-11 +i*-3.12713E-11| +| 6| 0.458776 +i* 0.888549| 0.999997|-1.89702E-11 +i* 4.08274E-12| +| 7| -0.472669 +i* -0.881237| 0.999997|-1.66496E-11 +i*-3.61498E-11| +| 8| 0.430661 +i* 0.902511| 0.999997|-1.60558E-11 +i*-1.29949E-11| +| 9| -0.444791 +i* -0.895631| 0.999997| 3.68259E-11 +i* 1.36002E-12| +| 10| 0.402136 +i* 0.915577| 0.999997| 6.5834E-12 +i* -1.3935E-11| +| 11| -0.416432 +i* -0.909164| 0.999997| 1.97816E-11 +i* 3.10848E-11| +| 12| 0.373171 +i* 0.927759| 0.999997|-2.17995E-11 +i*-2.96867E-12| +| 13| -0.387698 +i* -0.921783| 0.999997|-1.86324E-11 +i* -4.6545E-11| +| 14| 0.343875 +i* 0.939012| 0.999997| 3.06317E-11 +i* 7.08794E-11| +| 15| -0.358575 +i* -0.933498| 0.999997| 8.13599E-11 +i*-1.42233E-11| +| 16| 0.314233 +i* 0.949343| 0.999997| 3.86503E-11 +i* 2.08775E-11| +| 17| -0.329098 +i* -0.944293| 0.999997|-1.57903E-11 +i* 2.05052E-11| +| 18| 0.284281 +i* 0.958738| 0.999997| 2.51592E-11 +i* 2.09243E-11| +| 19| -0.299297 +i* -0.954157| 0.999997| 5.03608E-12 +i* 1.70503E-11| +| 20| 0.254048 +i* 0.967189| 0.999997|-2.81228E-11 +i*-1.66302E-11| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 0.999997 +600000 racines de module = 1 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140097: line 23: 10309 Segmentation fault (core dumped) ./template -r -i 900000 700000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140097: line 24: 10313 Segmentation fault (core dumped) ./template -r -i 1000000 800000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140097: line 25: 10315 Segmentation fault (core dumped) ./template -r -i 1500000 500000 diff --git a/Simulations/sparse_openmp/sparse_openmp_4GPU.o140097~ b/Simulations/sparse_openmp/sparse_openmp_4GPU.o140097~ new file mode 100644 index 0000000..2edc5c1 --- /dev/null +++ b/Simulations/sparse_openmp/sparse_openmp_4GPU.o140097~ @@ -0,0 +1,621 @@ +REMAINING: 4 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +Taking GPU #3 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^40000 + (-10 +i*0)*x^60000 + (1 +i*0)*x^100000 + +(-4000 +i*0)*x^39999 + (-600000 +i*0)*x^59999 + (100000 +i*0)*x^99999 + +zone limite de 'log-exp' 1.00356 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 0 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 0 dimgrid2 98 start 0 size 25024 +gpu 2 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 2 dimgrid2 98 start 50048 size 25024 +gpu 3 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 3 dimgrid2 98 start 75072 size 25024 +gpu 1 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 1 dimgrid2 98 start 25024 size 25024 +gpu 0 iter : 1 Arret : 0.00317265 s/iter 0.236357 +gpu 0 iter : 2 Arret : 0.00227157 s/iter 0.222729 +gpu 0 iter : 3 Arret : 0.00205316 s/iter 0.222769 +gpu 0 iter : 4 Arret : 0.00128297 s/iter 0.222748 +gpu 0 iter : 5 Arret : 0.00112626 s/iter 0.222747 +gpu 0 iter : 6 Arret : 0.0020822 s/iter 0.222736 +gpu 0 iter : 7 Arret : 0.0115304 s/iter 0.222730 +gpu 0 iter : 8 Arret : 0.0115653 s/iter 0.295379 +gpu 0 iter : 9 Arret : 0.00182694 s/iter 0.222647 +gpu 0 iter : 10 Arret : 0.000971807 s/iter 0.222690 +gpu 0 iter : 11 Arret : 0.00050868 s/iter 0.222743 +gpu 0 iter : 12 Arret : 0.000554626 s/iter 0.222588 +gpu 0 iter : 13 Arret : 0.000773549 s/iter 0.222519 +gpu 0 iter : 14 Arret : 0.000652981 s/iter 0.222480 +gpu 0 iter : 15 Arret : 7.85268E-05 s/iter 0.222478 +gpu 0 iter : 16 Arret : 1.67519E-05 s/iter 0.222489 +gpu 0 iter : 17 Arret : 1.93862E-07 s/iter 0.222504 +gpu 0 iter : 18 Arret : 2.89153E-09 s/iter 0.222440 +gpu 0 iter : 19 Arret : 4.30769E-11 s/iter 0.222397 +gpu 0 iter : 20 Arret : 6.41743E-13 s/iter 0.222499 +temps : 5.86914 seconde(s) +Nb iterations : 20 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.09748E-08 +Stabilite : 1.57015E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540308 +i* 0.841422| 0.999962|-1.95866E-12 +i*-4.55465E-13| +| 2| -0.113164 +i* 0.993538| 0.999962|-4.34919E-12 +i* 9.60242E-13| +| 3| -0.226732 +i* -0.974016| 1.00006|-1.34468E-09 +i*-3.70749E-10| +| 4| -0.715763 +i* 0.698289| 0.999962| 9.11271E-13 +i* 2.47219E-12| +| 5| 0.439922 +i* -0.897993| 0.999962|-3.49498E-13 +i* 1.66432E-12| +| 6| -0.996122 +i* 0.0886386| 1.00006| 4.72785E-10 +i* 4.13616E-11| +| 7| 0.908546 +i* -0.417692| 0.999962| 4.78506E-13 +i* 1.54377E-13| +| 8| -0.827813 +i* -0.560935| 0.999962| 9.76996E-13 +i*-2.04309E-12| +| 9| 0.968129 +i* 0.250682| 1.00006|-2.31715E-10 +i* 1.34848E-10| +| 10| -0.286842 +i* -0.958038| 1.00006|-5.93554E-10 +i*-2.45345E-10| +| 11| 0.591653 +i* 0.806145| 0.999962|-9.87654E-13 +i*-3.03635E-12| +| 12| -0.0511836 +i* 0.998651| 0.999962|-2.22622E-12 +i*-3.69013E-14| +| 13| -0.67097 +i* 0.741432| 0.999962|-8.03801E-14 +i*-1.68204E-12| +| 14| 0.383249 +i* -0.923603| 0.999962|-1.29119E-12 +i*-1.37426E-12| +| 15| -0.988685 +i* 0.15039| 1.00006|-1.61051E-10 +i* 7.18515E-11| +| 16| 0.880824 +i* -0.473363| 0.999962|-4.03455E-13 +i* 2.85139E-12| +| 17| -0.861082 +i* -0.508391| 0.999962| 9.8066E-13 +i* 3.40478E-12| +| 18| 0.98184 +i* 0.190015| 1.00006| 8.88373E-10 +i*-2.66385E-10| +| 19| -0.345842 +i* -0.938354| 1.00006| 1.38421E-10 +i*-2.31696E-10| +| 20| 0.640621 +i* 0.767807| 0.999962|-6.98774E-13 +i* 1.13798E-12| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 0.999962 +40000 racines de module = 1.00006 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^50000 + (-10 +i*0)*x^150000 + (1 +i*0)*x^200000 + +(-5000 +i*0)*x^49999 + (-1.5E+06 +i*0)*x^149999 + (200000 +i*0)*x^199999 + +zone limite de 'log-exp' 1.00178 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 0 (of 4) uses CUDA device 0 +gpu 1 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 1 dimgrid2 196 start 50048 size 50048 +gpu 2 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 2 dimgrid2 196 start 100096 size 50048 +gpu 3 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 3 dimgrid2 196 start 150144 size 50048 +gpu 0 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 0 dimgrid2 196 start 0 size 50048 +gpu 0 iter : 1 Arret : 0.000151294 s/iter 0.873722 +gpu 0 iter : 2 Arret : 0.000148163 s/iter 0.876720 +gpu 0 iter : 3 Arret : 0.000156239 s/iter 0.876483 +gpu 0 iter : 4 Arret : 0.000917016 s/iter 0.876408 +gpu 0 iter : 5 Arret : 0.00193309 s/iter 0.877387 +gpu 0 iter : 6 Arret : 0.012901 s/iter 1.040793 +gpu 0 iter : 7 Arret : 0.0696679 s/iter 1.039198 +gpu 0 iter : 8 Arret : 0.0831135 s/iter 1.017396 +gpu 0 iter : 9 Arret : 0.655093 s/iter 1.021459 +gpu 0 iter : 10 Arret : 0.310762 s/iter 1.026425 +gpu 0 iter : 11 Arret : 0.25028 s/iter 1.016739 +gpu 0 iter : 12 Arret : 0.12787 s/iter 1.024487 +gpu 0 iter : 13 Arret : 0.174578 s/iter 0.991808 +gpu 0 iter : 14 Arret : 0.13471 s/iter 1.020582 +gpu 0 iter : 15 Arret : 0.260288 s/iter 0.881413 +gpu 0 iter : 16 Arret : 0.151424 s/iter 1.018801 +gpu 0 iter : 17 Arret : 0.070357 s/iter 0.881097 +gpu 0 iter : 18 Arret : 0.0196537 s/iter 0.881104 +gpu 0 iter : 19 Arret : 0.00113921 s/iter 0.878041 +gpu 0 iter : 20 Arret : 4.42128E-05 s/iter 0.877967 +gpu 0 iter : 21 Arret : 3.87634E-06 s/iter 0.878342 +gpu 0 iter : 22 Arret : 3.63936E-09 s/iter 0.878295 +gpu 0 iter : 23 Arret : 3.63838E-13 s/iter 0.878170 +temps : 22.9576 seconde(s) +Nb iterations : 23 +Nb de depassements de capacite exponentielle : 0 +Precision : 0.000181892 +Stabilite : 2.22061E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540303 +i* 0.841453| 0.999985| 1.08703E-11 +i*-2.49217E-12| +| 2| -0.837195 +i* 0.546877| 0.999985| -5.4492E-12 +i* 1.09163E-12| +| 3| -0.553418 +i* -0.832885| 0.999985| -1.9722E-12 +i*-7.40397E-12| +| 4| 0.828599 +i* -0.559925| 1.00005|-7.54521E-09 +i* 1.47059E-08| +| 5| -0.8197 +i* 0.572767| 0.999985|-4.21663E-13 +i* -2.8616E-12| +| 6| -0.57917 +i* -0.815188| 0.999985|-5.13034E-12 +i*-1.52645E-12| +| 7| 0.810626 +i* -0.585537| 0.999985|-6.36846E-12 +i*-5.86797E-12| +| 8| 0.591872 +i* 0.806089| 1.00005|-1.69803E-09 +i* 9.43795E-09| +| 9| -0.801454 +i* 0.598134| 1.00005| 5.92533E-09 +i* 3.55911E-08| +| 10| -0.604356 +i* -0.796695| 0.999985|-1.64091E-13 +i* 1.59084E-12| +| 11| 0.791937 +i* -0.610578| 0.999985| 6.0707E-13 +i* 1.52922E-12| +| 12| 0.616763 +i* 0.78713| 0.999985|-4.48042E-12 +i* -2.6295E-12| +| 13| -0.782301 +i* 0.622877| 0.999985|-2.15827E-12 +i*-6.27114E-12| +| 14| -0.628991 +i* -0.777472| 1.00005| 6.93065E-09 +i*-8.65443E-09| +| 15| 0.772474 +i* -0.635023| 0.999985| 1.54783E-11 +i*-1.81338E-12| +| 16| 0.641054 +i* 0.767476| 0.999985| 9.05009E-12 +i*-2.91295E-12| +| 17| -0.762458 +i* 0.647014| 0.999985| 5.81724E-12 +i*-9.99384E-12| +| 18| -0.652967 +i* -0.757366| 0.999985| 5.10392E-12 +i*-6.61069E-12| +| 19| 0.752302 +i* -0.658888| 1.00005| 3.99107E-09 +i* 1.02117E-08| +| 20| 0.66472 +i* 0.747072| 0.999985|-1.93379E-12 +i*-1.29726E-11| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 0.999985 +50000 racines de module = 1.00005 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^150000 + (-10 +i*0)*x^250000 + (1 +i*0)*x^400000 + +(-15000 +i*0)*x^149999 + (-2.5E+06 +i*0)*x^249999 + (400000 +i*0)*x^399999 + +zone limite de 'log-exp' 1.00089 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 0 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 0 dimgrid2 391 start 0 size 100032 +gpu 2 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 2 dimgrid2 391 start 200064 size 100032 +gpu 3 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 3 dimgrid2 391 start 300096 size 100032 +gpu 1 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 1 dimgrid2 391 start 100032 size 100032 +gpu 0 iter : 1 Arret : 0.00053336 s/iter 3.114080 +gpu 0 iter : 2 Arret : 0.00132869 s/iter 3.113006 +gpu 0 iter : 3 Arret : 0.00304211 s/iter 3.113002 +gpu 0 iter : 4 Arret : 0.0081892 s/iter 3.421884 +gpu 0 iter : 5 Arret : 0.0174091 s/iter 3.393637 +gpu 0 iter : 6 Arret : 0.0170263 s/iter 3.378163 +gpu 0 iter : 7 Arret : 0.00925735 s/iter 3.423651 +gpu 0 iter : 8 Arret : 0.00879968 s/iter 3.111951 +gpu 0 iter : 9 Arret : 0.0133997 s/iter 3.368852 +gpu 0 iter : 10 Arret : 0.00968114 s/iter 3.111774 +gpu 0 iter : 11 Arret : 0.00462525 s/iter 3.110863 +gpu 0 iter : 12 Arret : 0.00341319 s/iter 3.111132 +gpu 0 iter : 13 Arret : 0.00439696 s/iter 3.110364 +gpu 0 iter : 14 Arret : 0.000354857 s/iter 3.110007 +gpu 0 iter : 15 Arret : 0.00105657 s/iter 3.109831 +gpu 0 iter : 16 Arret : 0.000563123 s/iter 3.109784 +gpu 0 iter : 17 Arret : 2.74759E-05 s/iter 3.109683 +gpu 0 iter : 18 Arret : 3.06801E-07 s/iter 3.109172 +gpu 0 iter : 19 Arret : 7.06164E-10 s/iter 3.108923 +gpu 0 iter : 20 Arret : 1.07684E-11 s/iter 3.109509 +gpu 0 iter : 21 Arret : 1.64161E-13 s/iter 3.109378 +temps : 68.0633 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.09466E-07 +Stabilite : 3.51078E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540313 +i* 0.841453| 0.999991| 9.34197E-12 +i*-1.23633E-11| +| 2| -0.998329 +i* 0.057622| 0.999991| 4.43912E-12 +i* 1.27665E-12| +| 3| 0.439867 +i* -0.898052| 0.999991|-8.50653E-12 +i*-8.85586E-12| +| 4| -0.996033 +i* 0.0888768| 0.999991|-3.15592E-12 +i* 1.17456E-12| +| 5| 0.411521 +i* -0.911417| 1.00002|-2.94737E-09 +i* 1.73005E-09| +| 6| 0.59196 +i* 0.805956| 0.999991| 5.24358E-13 +i*-8.53073E-12| +| 7| -0.992759 +i* 0.120044| 0.999991| 2.58804E-12 +i* 2.47274E-12| +| 8| 0.382796 +i* -0.923823| 0.999991|-1.63092E-11 +i* 4.26312E-12| +| 9| 0.616925 +i* 0.78701| 0.999991| 4.27514E-12 +i*-1.13966E-11| +| 10| -0.988534 +i* 0.151098| 1.00002|-8.27014E-10 +i* 9.44171E-10| +| 11| 0.35366 +i* -0.935364| 0.999991|-1.92664E-11 +i* 1.19958E-11| +| 12| 0.641299 +i* 0.767311| 1.00002|-2.44657E-09 +i* -6.7886E-11| +| 13| -0.983286 +i* 0.18202| 0.999991| 3.21676E-12 +i*-9.48297E-13| +| 14| 0.324176 +i* -0.945987| 0.999991|-5.20695E-12 +i*-7.06984E-12| +| 15| 0.66503 +i* 0.746804| 0.999991| 5.74873E-13 +i* 8.53884E-12| +| 16| -0.977123 +i* 0.212747| 1.00002| 1.09185E-09 +i* 2.38902E-10| +| 17| 0.294374 +i* -0.955681| 0.999991|-2.37395E-11 +i*-2.53098E-12| +| 18| 0.688122 +i* 0.725616| 1.00002|-2.54456E-09 +i* 8.15125E-10| +| 19| -0.969965 +i* 0.243206| 0.999991| 6.88072E-12 +i* 3.20268E-13| +| 20| 0.264283 +i* -0.964436| 0.999991| 2.5573E-11 +i*-6.45539E-12| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 0.999991 +150000 racines de module = 1.00002 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^250000 + (-10 +i*0)*x^350000 + (1 +i*0)*x^600000 + +(-25000 +i*0)*x^249999 + (-3.5E+06 +i*0)*x^349999 + (600000 +i*0)*x^599999 + +zone limite de 'log-exp' 1.00059 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 3 (of 4) uses CUDA device 3 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 586 start 0 size 150016 +gpu 2 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 2 dimgrid2 586 start 300032 size 150016 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 586 start 150016 size 150016 +gpu 3 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 3 dimgrid2 586 start 450048 size 150016 +gpu 0 iter : 1 Arret : 0.00166144 s/iter 6.733254 +gpu 0 iter : 2 Arret : 0.00663307 s/iter 6.721345 +gpu 0 iter : 3 Arret : 0.0196947 s/iter 6.725089 +gpu 0 iter : 4 Arret : 0.0354088 s/iter 7.044531 +gpu 0 iter : 5 Arret : 0.0344666 s/iter 7.231490 +gpu 0 iter : 6 Arret : 0.0255965 s/iter 7.223546 +gpu 0 iter : 7 Arret : 0.0250307 s/iter 7.248225 +gpu 0 iter : 8 Arret : 0.0220818 s/iter 7.524758 +gpu 0 iter : 9 Arret : 0.0193422 s/iter 7.217155 +gpu 0 iter : 10 Arret : 0.0384961 s/iter 7.206267 +gpu 0 iter : 11 Arret : 0.0308611 s/iter 7.198073 +gpu 0 iter : 12 Arret : 0.0139003 s/iter 7.227655 +gpu 0 iter : 13 Arret : 0.00821788 s/iter 6.730489 +gpu 0 iter : 14 Arret : 0.00366002 s/iter 7.146524 +gpu 0 iter : 15 Arret : 0.00103013 s/iter 6.725238 +gpu 0 iter : 16 Arret : 0.000538911 s/iter 6.724848 +gpu 0 iter : 17 Arret : 0.000270623 s/iter 6.725086 +gpu 0 iter : 18 Arret : 4.24795E-05 s/iter 6.724157 +gpu 0 iter : 19 Arret : 5.07342E-09 s/iter 6.723896 +gpu 0 iter : 20 Arret : 7.14369E-11 s/iter 6.724108 +gpu 0 iter : 21 Arret : 1.00557E-12 s/iter 6.725050 +gpu 0 iter : 22 Arret : 1.41479E-14 s/iter 6.724347 +temps : 154.313 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.37653E-08 +Stabilite : 2.77613E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540302 +i* 0.841463| 0.999993| 8.34199E-12 +i* -1.9051E-11| +| 2| -0.553438 +i* -0.832883| 0.999993|-2.10654E-12 +i*-2.55273E-11| +| 3| -0.579282 +i* -0.815119| 0.999993|-1.44751E-12 +i* 7.66798E-12| +| 4| 0.592014 +i* 0.805919| 0.999993|-3.98037E-12 +i* 9.55808E-12| +| 5| -0.604557 +i* -0.796554| 0.999993|-2.82974E-12 +i* 9.99473E-12| +| 6| 0.61698 +i* 0.78697| 0.999993| 9.01823E-12 +i*-5.69156E-12| +| 7| -0.629237 +i* -0.777205| 0.999993|-2.92122E-12 +i*-4.85867E-12| +| 8| 0.641354 +i* 0.767237| 0.999993|-1.64209E-11 +i* 1.12904E-12| +| 9| -0.653299 +i* -0.757092| 0.999993|-8.22453E-13 +i* 2.82818E-12| +| 10| 0.665096 +i* 0.746749| 0.999993| -1.2145E-11 +i* 1.89129E-11| +| 11| -0.676717 +i* -0.736234| 0.999993|-1.26079E-11 +i*-1.25073E-11| +| 12| 0.688185 +i* 0.725526| 0.999993| 2.69875E-11 +i* 1.65411E-11| +| 13| -0.699466 +i* -0.714679| 1.00001| 3.92343E-10 +i*-3.02623E-09| +| 14| 0.710597 +i* 0.70359| 0.999993| 1.28564E-11 +i* 1.56626E-11| +| 15| -0.721517 +i* -0.69241| 1.00001| 1.76709E-09 +i*-4.04041E-09| +| 16| 0.73231 +i* 0.680962| 0.999993| 1.34706E-11 +i*-4.43489E-12| +| 17| -0.742944 +i* -0.669367| 1.00001| 9.14394E-11 +i*-3.49261E-09| +| 18| 0.7533 +i* 0.657691| 1.00001| 1.64587E-09 +i*-3.03669E-09| +| 19| -0.763551 +i* -0.645737| 0.999993| 1.68299E-11 +i* 1.43271E-11| +| 20| 0.773539 +i* 0.633763| 1.00001| -4.2314E-09 +i* 1.86243E-09| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 0.999993 +250000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^300000 + (-10 +i*0)*x^500000 + (1 +i*0)*x^800000 + +(-30000 +i*0)*x^299999 + (-5E+06 +i*0)*x^499999 + (800000 +i*0)*x^799999 + +zone limite de 'log-exp' 1.00044 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 3 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 3 dimgrid2 782 start 600000 size 200000 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 782 start 200000 size 200000 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 782 start 0 size 200000 +gpu 2 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 2 dimgrid2 782 start 400000 size 200000 +gpu 0 iter : 1 Arret : 0.00108387 s/iter 12.149827 +gpu 0 iter : 2 Arret : 0.00154284 s/iter 12.327396 +gpu 0 iter : 3 Arret : 0.00442373 s/iter 12.172431 +gpu 0 iter : 4 Arret : 0.0484674 s/iter 12.229082 +gpu 0 iter : 5 Arret : 0.0462186 s/iter 12.248952 +gpu 0 iter : 6 Arret : 0.0672711 s/iter 12.235166 +gpu 0 iter : 7 Arret : 0.0371959 s/iter 12.355881 +gpu 0 iter : 8 Arret : 0.0332451 s/iter 12.399234 +gpu 0 iter : 9 Arret : 0.0347928 s/iter 12.369857 +gpu 0 iter : 10 Arret : 0.0382283 s/iter 12.701023 +gpu 0 iter : 11 Arret : 0.010893 s/iter 12.800482 +gpu 0 iter : 12 Arret : 0.0100182 s/iter 12.206749 +gpu 0 iter : 13 Arret : 0.000870471 s/iter 12.137340 +gpu 0 iter : 14 Arret : 0.00222619 s/iter 12.140578 +gpu 0 iter : 15 Arret : 0.000360359 s/iter 12.119427 +gpu 0 iter : 16 Arret : 0.000163251 s/iter 12.146378 +gpu 0 iter : 17 Arret : 8.3446E-05 s/iter 12.146441 +gpu 0 iter : 18 Arret : 5.95325E-07 s/iter 12.141680 +gpu 0 iter : 19 Arret : 1.07969E-09 s/iter 12.142666 +gpu 0 iter : 20 Arret : 2.37954E-12 s/iter 12.145013 +gpu 0 iter : 21 Arret : 3.63218E-14 s/iter 12.145853 +temps : 258.82 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.97756E-07 +Stabilite : 2.22043E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841464| 0.999995| -2.03E-11 +i* 2.74701E-11| +| 2| 0.592014 +i* 0.805922| 0.999995|-1.82734E-11 +i* 2.10218E-11| +| 3| 0.617007 +i* 0.786952| 0.999995| 4.23442E-11 +i* -6.2147E-12| +| 4| 0.641392 +i* 0.767207| 0.999995| 6.90537E-12 +i*-5.12417E-11| +| 5| 0.665146 +i* 0.746707| 0.999995| 2.02977E-11 +i* 7.48579E-12| +| 6| 0.688245 +i* 0.725472| 0.999995|-1.73153E-11 +i* -1.2656E-11| +| 7| 0.710667 +i* 0.703522| 0.999995| 3.69782E-12 +i* 2.3081E-12| +| 8| 0.732388 +i* 0.68088| 0.999995| 9.45355E-12 +i* 2.09024E-11| +| 9| 0.753381 +i* 0.657577| 0.999995| 3.40094E-11 +i* 1.45989E-12| +| 10| 0.77364 +i* 0.633618| 0.999995|-1.72307E-11 +i* 1.22723E-11| +| 11| 0.793138 +i* 0.609034| 0.999995| 3.89222E-12 +i* 2.21356E-11| +| 12| 0.811855 +i* 0.583851| 0.999995|-1.28337E-11 +i*-5.47207E-12| +| 13| 0.829772 +i* 0.558094| 0.999995|-1.63114E-11 +i*-1.64246E-12| +| 14| 0.846873 +i* 0.531786| 0.999995|-3.30451E-11 +i*-8.10676E-12| +| 15| 0.86314 +i* 0.504956| 0.999995|-4.00413E-12 +i* 3.04823E-11| +| 16| 0.878557 +i* 0.477628| 0.999995|-2.16493E-12 +i* 1.10533E-11| +| 17| 0.893104 +i* 0.449841| 0.999995|-1.48552E-11 +i* 1.06063E-11| +| 18| 0.906777 +i* 0.4216| 0.999995|-1.38745E-11 +i* 5.33384E-12| +| 19| 0.919557 +i* 0.392944| 0.999995|-3.33245E-11 +i* 5.94386E-12| +| 20| 0.931433 +i* 0.363901| 0.999995| 4.93219E-11 +i*-2.82651E-11| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 0.999995 +300000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^400000 + (-10 +i*0)*x^600000 + (1 +i*0)*x^1000000 + +(-40000 +i*0)*x^399999 + (-6E+06 +i*0)*x^599999 + (1E+06 +i*0)*x^999999 + +zone limite de 'log-exp' 1.00035 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 3 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 3 dimgrid2 977 start 750144 size 250048 +gpu 0 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 0 dimgrid2 977 start 0 size 250048 +gpu 1 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 1 dimgrid2 977 start 250048 size 250048 +gpu 2 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 2 dimgrid2 977 start 500096 size 250048 +gpu 0 iter : 1 Arret : 0.000456228 s/iter 18.772328 +gpu 0 iter : 2 Arret : 0.00142575 s/iter 18.751830 +gpu 0 iter : 3 Arret : 0.00549425 s/iter 18.764447 +gpu 0 iter : 4 Arret : 0.0229296 s/iter 19.538754 +gpu 0 iter : 5 Arret : 0.0173741 s/iter 19.273977 +gpu 0 iter : 6 Arret : 0.0179817 s/iter 19.297823 +gpu 0 iter : 7 Arret : 0.0102999 s/iter 18.835443 +gpu 0 iter : 8 Arret : 0.00783109 s/iter 19.616467 +gpu 0 iter : 9 Arret : 0.00443683 s/iter 19.576776 +gpu 0 iter : 10 Arret : 0.00652305 s/iter 18.757222 +gpu 0 iter : 11 Arret : 0.00589396 s/iter 18.772725 +gpu 0 iter : 12 Arret : 0.00781914 s/iter 18.746761 +gpu 0 iter : 13 Arret : 0.00825508 s/iter 18.745513 +gpu 0 iter : 14 Arret : 0.00209831 s/iter 18.746669 +gpu 0 iter : 15 Arret : 0.000157396 s/iter 18.747760 +gpu 0 iter : 16 Arret : 0.000185725 s/iter 18.747416 +gpu 0 iter : 17 Arret : 0.000163905 s/iter 18.747056 +gpu 0 iter : 18 Arret : 6.34206E-05 s/iter 18.748309 +gpu 0 iter : 19 Arret : 5.65573E-06 s/iter 18.749904 +gpu 0 iter : 20 Arret : 7.0784E-09 s/iter 18.749738 +gpu 0 iter : 21 Arret : 2.24468E-11 s/iter 18.748487 +gpu 0 iter : 22 Arret : 7.09418E-14 s/iter 18.747345 +temps : 422.324 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 8.97857E-06 +Stabilite : 5.20859E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841468| 0.999996| 5.07216E-12 +i* 6.41236E-12| +| 2| 0.529701 +i* 0.84818| 0.999996|-4.61853E-13 +i*-4.17888E-12| +| 3| 0.524361 +i* 0.851491| 0.999996|-2.47296E-11 +i* 1.78327E-11| +| 4| 0.51901 +i* 0.854764| 0.999996| 9.45599E-12 +i* 2.07434E-11| +| 5| 0.513629 +i* 0.858008| 0.999996| 2.32483E-11 +i* 6.70747E-12| +| 6| 0.508237 +i* 0.861213| 0.999996|-1.34339E-11 +i* 9.87854E-12| +| 7| 0.502825 +i* 0.864384| 0.999996|-3.18459E-11 +i* 7.64744E-12| +| 8| 0.497384 +i* 0.867526| 0.999996| 2.97429E-11 +i*-6.06626E-13| +| 9| 0.491932 +i* 0.870629| 0.999996|-2.65525E-11 +i* 1.22525E-11| +| 10| 0.486452 +i* 0.873703| 0.999996| 3.0312E-11 +i* 1.02214E-11| +| 11| 0.480962 +i* 0.876737| 0.999996| 1.81546E-11 +i* 8.04012E-12| +| 12| 0.475453 +i* 0.879736| 0.999996| 3.09861E-11 +i* 4.093E-12| +| 13| 0.469917 +i* 0.882706| 0.999996|-1.29106E-11 +i*-2.31489E-11| +| 14| 0.46437 +i* 0.885637| 0.999996| 1.38481E-11 +i* -1.517E-11| +| 15| 0.458797 +i* 0.888537| 0.999996| 2.78862E-11 +i* 1.10441E-11| +| 16| 0.453214 +i* 0.891397| 0.999996| 2.45506E-11 +i* 3.1726E-11| +| 17| 0.447614 +i* 0.894223| 0.999996|-1.08491E-12 +i*-2.12277E-11| +| 18| 0.441986 +i* 0.897017| 0.999996| 2.72476E-11 +i* 3.22485E-11| +| 19| 0.436351 +i* 0.899772| 0.999996|-1.24334E-11 +i*-2.66317E-11| +| 20| 0.430689 +i* 0.902496| 0.999996| 2.73914E-12 +i* 2.25153E-11| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 0.999996 +400000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^700000 + (1 +i*0)*x^1200000 + +(-50000 +i*0)*x^499999 + (-7E+06 +i*0)*x^699999 + (1.2E+06 +i*0)*x^1199999 + +zone limite de 'log-exp' 1.0003 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 0 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 3 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 3 dimgrid2 1172 start 900096 size 300032 +gpu 2 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 0 dimgrid2 1172 start 0 size 300032 +gpu 2 dimgrid2 1172 start 600064 size 300032 +gpu 1 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 1 dimgrid2 1172 start 300032 size 300032 +gpu 0 iter : 1 Arret : 0.00368442 s/iter 26.569710 +gpu 0 iter : 2 Arret : 3.704 s/iter 28.385681 +gpu 0 iter : 3 Arret : 1.74615 s/iter 28.502041 +gpu 0 iter : 4 Arret : 2.12336 s/iter 28.609424 +gpu 0 iter : 5 Arret : 2.13811 s/iter 29.338801 +gpu 0 iter : 6 Arret : 0.766739 s/iter 29.346300 +gpu 0 iter : 7 Arret : 0.657775 s/iter 29.516021 +gpu 0 iter : 8 Arret : 0.597705 s/iter 29.678298 +gpu 0 iter : 9 Arret : 0.573945 s/iter 29.579526 +gpu 0 iter : 10 Arret : 0.542611 s/iter 29.795670 +gpu 0 iter : 11 Arret : 0.488156 s/iter 29.717429 +gpu 0 iter : 12 Arret : 0.463721 s/iter 29.588883 +gpu 0 iter : 13 Arret : 0.442782 s/iter 29.618542 +gpu 0 iter : 14 Arret : 0.43109 s/iter 29.294507 +gpu 0 iter : 15 Arret : 0.427026 s/iter 29.324604 +gpu 0 iter : 16 Arret : 0.434845 s/iter 29.362199 +gpu 0 iter : 17 Arret : 0.442084 s/iter 29.279579 +gpu 0 iter : 18 Arret : 0.46093 s/iter 29.338081 +gpu 0 iter : 19 Arret : 0.48645 s/iter 29.333743 +gpu 0 iter : 20 Arret : 0.496349 s/iter 29.369982 +gpu 0 iter : 21 Arret : 1.56187 s/iter 28.940178 +gpu 0 iter : 22 Arret : 2.3748 s/iter 28.784866 +gpu 0 iter : 23 Arret : 1.09653 s/iter 28.933834 +gpu 0 iter : 24 Arret : 1.43739 s/iter 28.700919 +gpu 0 iter : 25 Arret : 2.22796 s/iter 28.722635 +gpu 0 iter : 26 Arret : 1.54855 s/iter 28.698877 +gpu 0 iter : 27 Arret : 1.95651 s/iter 28.629259 +gpu 0 iter : 28 Arret : 0.897983 s/iter 28.648379 +gpu 0 iter : 29 Arret : 7.34662 s/iter 28.534855 +gpu 0 iter : 30 Arret : 1.74621 s/iter 28.422914 +gpu 0 iter : 31 Arret : 0.597689 s/iter 28.621303 +gpu 0 iter : 32 Arret : 0.857922 s/iter 28.617561 +gpu 0 iter : 33 Arret : 1.33974 s/iter 28.328536 +gpu 0 iter : 34 Arret : 10.8161 s/iter 28.390666 +gpu 0 iter : 35 Arret : 6.6951 s/iter 28.507533 +gpu 0 iter : 36 Arret : 0.757761 s/iter 28.460493 +gpu 0 iter : 37 Arret : 0.588104 s/iter 28.489026 +gpu 0 iter : 38 Arret : 0.593958 s/iter 28.232970 +gpu 0 iter : 39 Arret : 0.333943 s/iter 27.617579 +gpu 0 iter : 40 Arret : 0.276517 s/iter 27.632546 +gpu 0 iter : 41 Arret : 0.137564 s/iter 27.552902 +gpu 0 iter : 42 Arret : 0.0648876 s/iter 27.307198 +gpu 0 iter : 43 Arret : 0.0511538 s/iter 27.320582 +gpu 0 iter : 44 Arret : 0.0242118 s/iter 26.798806 +gpu 0 iter : 45 Arret : 0.00922443 s/iter 26.583042 +gpu 0 iter : 46 Arret : 0.00927718 s/iter 26.616458 +gpu 0 iter : 47 Arret : 0.0412361 s/iter 26.563085 +gpu 0 iter : 48 Arret : 0.0405407 s/iter 26.561073 +gpu 0 iter : 49 Arret : 0.00788436 s/iter 26.567749 +gpu 0 iter : 50 Arret : 0.00128029 s/iter 26.567412 +gpu 0 iter : 51 Arret : 0.000171237 s/iter 26.567449 +gpu 0 iter : 52 Arret : 7.02979E-07 s/iter 26.567944 +gpu 0 iter : 53 Arret : 2.0296E-09 s/iter 26.567809 +gpu 0 iter : 54 Arret : 8.07801E-12 s/iter 26.567272 +gpu 0 iter : 55 Arret : 3.21626E-14 s/iter 26.572179 +temps : 1556.58 seconde(s) +Nb iterations : 55 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.03717E-06 +Stabilite : 4.93017E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54031 +i* 0.841472| 1| 1.4588E-09 +i* 4.51768E-09| +| 2| 0.513633 +i* 0.858015| 1| 1.54651E-09 +i*-2.27023E-10| +| 3| 0.486451 +i* 0.873713| 1| 1.95054E-09 +i* 6.77633E-10| +| 4| 0.458805 +i* 0.888533| 0.999997| 1.78773E-11 +i* 1.55684E-11| +| 5| 0.430685 +i* 0.902499| 0.999997| 2.12053E-13 +i*-1.16324E-11| +| 6| 0.402126 +i* 0.915589| 1| 2.50282E-09 +i*-6.10471E-09| +| 7| 0.3732 +i* 0.927747| 0.999997|-1.54374E-11 +i*-2.76083E-11| +| 8| 0.3439 +i* 0.939003| 0.999997|-1.12714E-11 +i* 1.5453E-11| +| 9| 0.314261 +i* 0.949333| 0.999997| 1.93628E-11 +i* 2.50909E-11| +| 10| 0.284313 +i* 0.958728| 0.999997| 2.69426E-11 +i* 2.77974E-11| +| 11| 0.254084 +i* 0.967179| 0.999997| 1.5277E-11 +i* 4.73027E-12| +| 12| 0.223605 +i* 0.974676| 0.999997| -8.1017E-11 +i*-3.77299E-11| +| 13| 0.192909 +i* 0.981221| 1|-1.95729E-09 +i* 4.84549E-09| +| 14| 0.162018 +i* 0.986792| 1| 1.80241E-09 +i* 1.03051E-10| +| 15| 0.130967 +i* 0.991391| 1|-1.93729E-10 +i*-4.06442E-10| +| 16| 0.0998077 +i* 0.995003| 0.999997| -4.5103E-11 +i*-6.66658E-12| +| 17| 0.0685404 +i* 0.997645| 0.999997| 1.01124E-11 +i* 3.1089E-12| +| 18| 0.0371504 +i* 0.999314| 1|-1.38879E-09 +i*-2.32658E-09| +| 19| 0.00578048 +i* 0.99998| 0.999997| 3.46787E-11 +i* 1.94857E-13| +| 20| -0.0256056 +i* 0.999669| 0.999997| 2.01068E-11 +i*-1.22213E-12| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +700000 racines de module = 0.999997 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^600000 + (-10 +i*0)*x^800000 + (1 +i*0)*x^1400000 + +(-60000 +i*0)*x^599999 + (-8E+06 +i*0)*x^799999 + (1.4E+06 +i*0)*x^1399999 + +zone limite de 'log-exp' 1.00025 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +gpu 0 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 0 dimgrid2 1368 start 0 size 350016 +gpu 1 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 1 dimgrid2 1368 start 350016 size 350016 +gpu 2 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 2 dimgrid2 1368 start 700032 size 350016 +gpu 3 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 3 dimgrid2 1368 start 1050048 size 350016 +gpu 0 iter : 1 Arret : 0.00408309 s/iter 36.124369 +gpu 0 iter : 2 Arret : 0.208632 s/iter 36.641290 +gpu 0 iter : 3 Arret : 1.37702 s/iter 37.617641 +gpu 0 iter : 4 Arret : 1.45346 s/iter 37.349167 +gpu 0 iter : 5 Arret : 1.6393 s/iter 37.990887 +gpu 0 iter : 6 Arret : 3.4316 s/iter 38.064434 +gpu 0 iter : 7 Arret : 1.9865 s/iter 38.951955 +gpu 0 iter : 8 Arret : 4.57739 s/iter 39.092906 +gpu 0 iter : 9 Arret : 2.70182 s/iter 39.516603 +gpu 0 iter : 10 Arret : 2.54353 s/iter 40.448257 +gpu 0 iter : 11 Arret : 1.82865 s/iter 40.236603 +gpu 0 iter : 12 Arret : 0.783909 s/iter 39.432599 +gpu 0 iter : 13 Arret : 1.89333 s/iter 39.521084 +gpu 0 iter : 14 Arret : 1.37044 s/iter 39.264476 +gpu 0 iter : 15 Arret : 3.05361 s/iter 38.860385 +gpu 0 iter : 16 Arret : 2.08571 s/iter 38.971159 +gpu 0 iter : 17 Arret : 2.09101 s/iter 38.887096 +gpu 0 iter : 18 Arret : 1.02745 s/iter 38.910018 +gpu 0 iter : 19 Arret : 0.704384 s/iter 38.234669 +gpu 0 iter : 20 Arret : 0.741087 s/iter 38.350019 +gpu 0 iter : 21 Arret : 0.788627 s/iter 38.106199 +gpu 0 iter : 22 Arret : 1.04305 s/iter 37.990724 +gpu 0 iter : 23 Arret : 2.78018 s/iter 38.167968 +gpu 0 iter : 24 Arret : 3.62183 s/iter 38.203661 +gpu 0 iter : 25 Arret : 5.50084 s/iter 37.940466 +gpu 0 iter : 26 Arret : 0.606592 s/iter 38.122389 +gpu 0 iter : 27 Arret : 0.700038 s/iter 37.866885 +gpu 0 iter : 28 Arret : 0.418813 s/iter 37.840730 +gpu 0 iter : 29 Arret : 0.495401 s/iter 37.808439 +gpu 0 iter : 30 Arret : 0.988549 s/iter 37.865318 +gpu 0 iter : 31 Arret : 0.749386 s/iter 37.753243 +gpu 0 iter : 32 Arret : 0.852267 s/iter 37.713161 +gpu 0 iter : 33 Arret : 1.16501 s/iter 37.855558 +gpu 0 iter : 34 Arret : 0.385689 s/iter 37.935460 +gpu 0 iter : 35 Arret : 0.393423 s/iter 37.441807 +gpu 0 iter : 36 Arret : 0.317888 s/iter 36.669962 +gpu 0 iter : 37 Arret : 0.23539 s/iter 36.318606 +gpu 0 iter : 38 Arret : 0.0527559 s/iter 36.193597 +gpu 0 iter : 39 Arret : 0.0143793 s/iter 36.106964 +gpu 0 iter : 40 Arret : 0.00318939 s/iter 36.183822 +gpu 0 iter : 41 Arret : 2.64184E-05 s/iter 36.123292 +gpu 0 iter : 42 Arret : 1.30802E-08 s/iter 36.116093 +gpu 0 iter : 43 Arret : 1.80499E-10 s/iter 36.117759 +gpu 0 iter : 44 Arret : 2.48451E-12 s/iter 36.115451 +gpu 0 iter : 45 Arret : 3.41814E-14 s/iter 36.113705 +temps : 1704.89 seconde(s) +Nb iterations : 45 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.68566E-08 +Stabilite : 7.85076E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841469| 0.999997|-5.74141E-12 +i*-6.39521E-11| +| 2| 0.513623 +i* 0.858013| 0.999997|-2.15776E-11 +i*-2.98557E-11| +| 3| -0.52703 +i* -0.849843| 0.999997|-6.50922E-11 +i* 8.44216E-12| +| 4| 0.486439 +i* 0.873711| 0.999997| 5.60277E-11 +i* 4.36779E-11| +| 5| -0.500096 +i* -0.865967| 0.999997| 3.56147E-11 +i*-3.12713E-11| +| 6| 0.458776 +i* 0.888549| 0.999997|-1.89702E-11 +i* 4.08274E-12| +| 7| -0.472669 +i* -0.881237| 0.999997|-1.66496E-11 +i*-3.61498E-11| +| 8| 0.430661 +i* 0.902511| 0.999997|-1.60558E-11 +i*-1.29949E-11| +| 9| -0.444791 +i* -0.895631| 0.999997| 3.68259E-11 +i* 1.36002E-12| +| 10| 0.402136 +i* 0.915577| 0.999997| 6.5834E-12 +i* -1.3935E-11| +| 11| -0.416432 +i* -0.909164| 0.999997| 1.97816E-11 +i* 3.10848E-11| +| 12| 0.373171 +i* 0.927759| 0.999997|-2.17995E-11 +i*-2.96867E-12| +| 13| -0.387698 +i* -0.921783| 0.999997|-1.86324E-11 +i* -4.6545E-11| +| 14| 0.343875 +i* 0.939012| 0.999997| 3.06317E-11 +i* 7.08794E-11| +| 15| -0.358575 +i* -0.933498| 0.999997| 8.13599E-11 +i*-1.42233E-11| +| 16| 0.314233 +i* 0.949343| 0.999997| 3.86503E-11 +i* 2.08775E-11| +| 17| -0.329098 +i* -0.944293| 0.999997|-1.57903E-11 +i* 2.05052E-11| +| 18| 0.284281 +i* 0.958738| 0.999997| 2.51592E-11 +i* 2.09243E-11| +| 19| -0.299297 +i* -0.954157| 0.999997| 5.03608E-12 +i* 1.70503E-11| +| 20| 0.254048 +i* 0.967189| 0.999997|-2.81228E-11 +i*-1.66302E-11| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 0.999997 +600000 racines de module = 1 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140097: line 23: 10309 Segmentation fault (core dumped) ./template -r -i 900000 700000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140097: line 24: 10313 Segmentation fault (core dumped) ./template -r -i 1000000 800000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140097: line 25: 10315 Segmentation fault (core dumped) ./template -r -i 1500000 500000 diff --git a/Simulations/sparse_openmp/sparse_openmp_4GPU.sge b/Simulations/sparse_openmp/sparse_openmp_4GPU.sge new file mode 100755 index 0000000..1b5ae2f --- /dev/null +++ b/Simulations/sparse_openmp/sparse_openmp_4GPU.sge @@ -0,0 +1,27 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=4 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -pe openmp 4 +#$ -V +#$ -cwd +#$ -N sparse_openmp_4GPU + +module load gcc/4.9.0 +module load cuda/7.0 + + +./template -r -i 60000 40000 +./template -r -i 150000 50000 +./template -r -i 250000 150000 +./template -r -i 350000 250000 +./template -r -i 500000 300000 +./template -r -i 600000 400000 +./template -r -i 700000 500000 +./template -r -i 800000 600000 +./template -r -i 900000 700000 +./template -r -i 1000000 800000 +./template -r -i 1500000 500000 + + diff --git a/Sparse.pdf b/Sparse.pdf new file mode 100644 index 0000000000000000000000000000000000000000..f55c0a33b9ce5eb686dced70ea6fc0ec24aa85a9 GIT binary patch literal 7162 zcmb_B2{=^i`xR0nNl7KkQEBQj&a7s^*tZyDDN<_89A-3TrkTNHi3p{#mnDkIO(La5 zgs5B>mr5HYrL?#uE%u_{nL+FQ{g>ytXP$ZH``-O~-}igZ_r0UzY-x?c=;IMO^=}f7 zA_xE);Q9C?jEq1Bi0da}0R}L{1+->!M34XgtvPfNWC<~NOo&QF2t@*j9)J*M7kk({ z6M>`=9Rr@nd`vkd26`5t-X-lQCu_ku7=#f!-bjl zTW9x16g)dI6ql%yP~BgDxA@b@3>-neVN<2WvP+9ZQEq4`u$)UCd7=*s%)ODg=!?3y zx4O61{NujzTiUQ1k+~YCXqEHz_bN)|u!r(W7b;vHWpZM#u4Hj)ueQkTYj$pv-H-BU zTMaRADh6f@1=S#jy0$qnw3}^FF&Z!It{U03<*az)I3pl?SKgV~YF=kb^Arut*`#Z= zD>;f^UQlgTEgd~keRt#0f$avAH2>y#f7UY#_ALB}kqLVARnAeOfdzd5{^AyTXtoVB zp~%;u-~a5CP42f-O(zKM`!cjAY-*ntt%z=$ma53m%RSEGM76SF|M30XZEeB!s<)Qe zp>*!nx!dzT7c90QBh8xhGH$e|CNIIHC%MRB7rb1Pxi7=cHgiU%XU%xe4sn1GuPP9M1ZdixiuEcx0vUVG*RV{KmHfy29Ed%{zZ)9>xu>7Tbcy2Yu-_xI!e z;UV{Kwyq0%Rzz>kD!7+LXs$SwSz0*Iu%AuW=dy!Ztq5lz31K0{-XR(#q4|d zfs>EyXFvA}OMH8KfG8WG{YiFw_sz0hM8)pnTc4eW)4y!m96l2Ev8yG#y1Xig82om8 z^zUnr9)_+lym5DFj_x0&?pv-ruI?BQA8QB~zx2-e($GC``Y}cW;`i{qv=8I!gM-GK zj3WLpp2>;cbIC2O&1m)BEyX!nJ|>6DTmP6>hd8#UVTfw4aIx*WM^kJGYu2!aR_WE} z+vDi0m|9aZ^|RGSmffl=1B)6KeK3`KIj|@%#iHTl=|Mle^)yQ4-iDcZjn1xBJ4_6< z1}a42xS4(9=5b|jbWd$oi(wSR>=l-1H?7+E;T*s2##K8b{p|X(h>hWA#T~Ne6Y59G zp)sR&n?fI2GWFDTM(>_i8{R&{KUs3;j4){yHQDUB+SZot+;Fm^#mfq<^>NFIdS_}? zdUOq0GKq#30sd`dTUj-Z`l)^S%W3Oh_%*YRD2N9h-%7lZ6*-?X<3UE`pfe`@&NvAf zS-EY7VCjMy=atiZ7T*ZoyG3s9j?M_}=a-I5i;s(&dHit7+&i64YvgSP&Wp^Cmi6os z3C6u!%?_BPIELzJ%!wY_uQIoYPuO=AbLZ-FkNV$t?~Pul|FnW0(==Y2vpl9r^LG*O z@=SWma8YafIW{Xd^?a--O5Wo*ZqCY_x}D2*MfTOD&8;Q}B)6b5M5^)$N&X#n$nGT7 z9*5{Pe%o?q<)d0pZaa_=ZqTFG|I#i_(r`oLjGslBybrbngPsH=8iqwr>9hDWJ!<^ss4tj-x!|P80jy zbpw{wL0f`Ha{E-*4xVh%-SzrKLEaYB(>p1B&*q!w#d=z5siK-Mx!JeQYRh`C&gz1@ zbEv*T<86D4teolnen;nPXxR(FPiE~j$ktv}x%l<60y^3ZHFthqT23xtzDbs#_*((I z%Kp+>2&1BSwVA1Ro|-D_7yI?c9ea;FR#KE$qVz>(acuD@#AQxaQFtV&ypnn=`NiPy zXv8E8|E(&!ZRbOvGu;mYX%Lf5H|L1~FEorMpz#0^i{6BQkphS-0&tSLjR0LBAumwC zfP`>GcNXv%u8_zJglj$kx*|>_}st#Zza$pu~9?XuxNGEWS2QA<^EKvwZ zUJfn@7&K{?M8(9*0+t5b1xO7O0-!ycDFnO_60=x)72$23%ulXXR$EYYTCLAQ78Em%7Um5;6pAzKACP$Py7!cStd?JJ|xE z$bv-|05~k@K%X3AuxM~Sn<-)my%1QUMA3iyNU;b4!2tOAJHa7={=kd)HZw4gtd}U2 zKcQs;Lc-zTY{5z}hzZC9j|BFO`|C(5QK}scXWFDCQ&wZY@<^mkVx=57$sFd8P)=D1 z&m~F6g-;M{t{?0It{GRz{yKLJ^btuiT#^)U45ufhVJno4RV)wt$a&7&K8vLyS8HXqZ=NQ>457Sh-FsGkW|7&ufK9rsGjwhOEC1N9`Cvof(2?xfCk$(EKk6+X>L|wrzi1hX z_%al+{OAg9n(d0LjG|lXSp9X|{nvxjXp8cea9O{5+%y~{7rx3&`}>(qs$B5dC;IFR zOjoi>^`RMY#(5tWuF;zxaLRc8mHhLCMVHRlmh?B-dcD?~hwh75o|l}Q+(>i3vSaN^ zR^wg;`?TureDhgn#^uU#_?G=>Bjgc{~OUIH(s9X9!{qpXQG-;k2XSsEN%Pr1@)eu zr5j8lUnuU*LfwRvEf)B{c>kJCB~3?qgx6?!msLf2*v^hfkWmR`4A-w`ymNa~PN9%i z1x#ZCRlcRVM(VXuO9nIPmp%Q@$>(kGLt(`Y^Yr4BHJh=9ezid=KE6z)oC^#J6X5;1 zq+VPj6BSnM9+C(QrR?tz)>gladUPEzX7lhyj#1G0o@1{=%awyddrwyx$~hXOXmcJ^ zQnNzMBl~vDu56wWaentLYdn8P3bpjo5xwwSXj8<9;-9k zlKOEDyMTF0`EqLAP8nr2O7_}cLfbks?0FS^V?-`OEH@4WW5qw3g;fStNw zWz|;Ghik=-p=<5(`&-a&v=Vxe@umx1A*W=_jNmhk{ny{A43s|5TwY@X!Fsm!AyQ^8g)4_j8nx=JY=bVF2@p>`%5KWo)mo!UiW{%F5 z=}eOGCdFw&8(-13?z4rW7Dx9BBHo}y8!DL#(`O&VXy~4Ld!^}5{UW3L?yZIz-3GbZ zbA41RYd#D=PCwnazQ#^9>}+z`kGbBM+u*1>=9B$u zy6xN8chh^w$A$h{NhwwXXQCIyc3v57X@4reHfLORHxHoesMb@nxPl`(>MGnyHLvzR9Fl7ZGi29l(w&+$>%_geYtOyfr=f9nZ*tkO z_$?HC^k7@uQHptV8_t=*+z{ z->H+U9ac2w_RKGcb{M4JA1x^OYk)3mx#T^Xp~ERw2@l^qN7yi^?D!1*?53USXa_RJ zHJ51EJ@eLX4cdzLWvOAL*B)PXxfy9MAL6?vSH80h+{=%#2sC4=e;U(We6YrcA3CR6 z;AUewICkW6dIcA3e|4!gqED~}_vz6AuSc76?yYEg-&XR-t9fMgY5lAQYRjvBC%5%Q z8<6+C-H9ue6*Oong3brIPe(WAQ%~CrS1L8qT2&unm)=Q|Z=Xi9Suosr?+@Qa)1UGe zoP4nQM^Djc`Ge5&W%f@k^v_3>7xFb{K z^f!Dsj*1+%cXZ5+a2`}jnw=TobU3NBZ@#+cG7@v)HEp*h!>z>$MR$u-_x|>{7FS3< z(1ev!pqK#W$p)AQeqA{WGAdplDf7@D6OCNZ0yqD?Q19yg54wNj{>E)Ju~RjV>24l5 z31#J!hdw3ip6h#RgH$5mHx7R~tG{z;Mdn4)So1)kxz)Q3Z_4W(mKaAB{>R5|INc`%|7Z44swx zy*-}NNjjNiJT}_4NaL}COrlklm~yy^q$dC7pjT$qqCukO=R5q17v9I$WIho1oGTQK z@N^p=-`#QMXsoc#Pxg!1@nu{iOV;A3#hUdV+Ar#Il^$H$S2xyzr|gbtG1E-PIL|C& zD}~Eo)waZ#-L1)3nc#p8fAyB?@{*c)bX;bzx8GKBF#Yk~CcUA2e@30UyL>xfdC(lD zPFEN_nfWn?0T4|ZE25#R&)vAM>`zROpT0GnxyTu-2(X?zQa#kLI*K&~Nej_ z779F;fI%c6B@t~kMtabk0TGYK*~%6HSbefS28F@t0lotGR2|F{Yy~j-21r<>fayzd zfp3o!0^yl4k|h%HDIgde9IPLV)8`5NKn$5o2GLj$i$%c{DB*Ulh%QEPh09@mQbX7t zU)i`qeW^|Q3|;`p_5d;ZXmCo=)UArm;{p=JbRS-z$QT(I$YxT=5Q&WS#gb7F&H#_X zV0_UiH2k2*cp{0&phFk}7MfDW|IW-G^uY*NArAHfJfgtYV`d-&5*Qo7vI>sPKYIZV=%gErU>XVyzA5=`w}fx#RBHhnKv_a42H=JzPyj3i zLqQu*C|JM<{D~3{KFn$Xw`bvY?f-%GJIe1^c>*^$C8&PfKt6{j0`U3<0G}>musBc< z!~xI~TBWR$lt!Q=PTzUx-}V`uPow?MUJD42q_u>OV##9!2Edm$JInu1()`j375AlT)@!+tj69XwH_)Qu-Vn|Yi zCzufE3T>N`Oy#gSZ2C|9QoMx!D;GRwPWC=vbAOdGl{%9A`ESC05bzHPBn81m2hJt% zYe}ObfPd-v_XK^b^q|60jINmVnbmV~}Vx5~gsIWY4N^c`+rNCs;KV zp`SN5OaeCs{2_+uD~TkCFxV_m#DW>639|ZYpG_=)eBrJS29J=`;fV(@AP{f_z!#W= zVcE`!?rHr5!{dM9MZ?Sel@9jM&%AJF^cNTj3pXKu)PaTl z_A?AaH28%MLnQwKgZ=#r3{S?v{kJI{A^{!l&j{fE)&S6z9RfF8@c`(;g9|In2)F>C z9oLr!NSilstH~1ZGO{wWCRw71WD?o}jW;mI8jvv6Kn6rC8KI+N_x;W}pQO2to;*@P5hmF@oR9^>00@BY zb^xZX4jL0_o-8jw34&OFdSnWV$N)e+3V}t`A-dB&h&UXK$zl)*R9IkohP_Fwvoind zT36oylid|xrkl$IxFfZbOl`AcQK?bMRs1v3)Ni5kVun+p=*TKWtV&seoU5aLu_ul~ zn@+p5VIc!_d zjD6Rvd}X7e*g{L;%ZaJ__OT~Q=gZPGc^=Zu$ZN0ir})VRCG3p+)ORqrc!o}2RM)6f zsaDTUteo}iLe0Q)7Y~PC46{ut-g?Bu{P~@G@fw1J)u^*chD2GMn8O7kK(;gFH}pL#o|8?yRA~*+ci_O#SX3OFeq@kCuDGPt+txn>R}V zF;Tb9y({qeYLA?k6ZzYo_JkMkNPXC$Y1IaMnxvhfaMd*^uj?^}~D zqiXT*mAXG{>fYUyRkOAJ7V8v!u=-5^gPQQMQlls2ve`ttNKJOyL8DRIuOrmaYC~3c zXn*TNKi|?k@1`s{)+uiY-H%4wsQcH!;YEp#FXCc4ZR_mURU^YrOjvyUs4kYCf5dXz zV2DRYd1%!f_YSjhib!qNXvpWVi6DA1zNM`se1!IGc7AGcVQS{n3@v0XY>pKW@@?@8 zoS~MY+!0Za93jt3)o+;|T?`Em51X5-q~oZCqi+sYRl28L5oEsa2%DIlY@pwFokw+^ zZ)P?Q;Ul$Wb9}ipS1WZ(t3~@#r!M-{IGo@u(n*T_L+!-nd~GJWVaT9*vu|WE;;##{ zAJlu!2HpP%M48`=+~;p<>mr_Q!%vI$Z>~BAs_W6}m#vSO!j7)nOk@UI zQW7E5#q#m%b<(9U@PvK|TzatKis-aDI)z?bJa|%M_i}>pc0am?@M-NS?6^< zQ{Q_cFGx^^IwnFbEkrcb=$Fb;;1>5No^A~lm+$$%8oPeAR>$aRtQPadTO>|rqncvg z3*E&jJH2`Hi~bNO=GrURhU9IMUlv-O)IV#sNluNgNg3D}-LmMnt8L$zvTmL^%yx%k zR~qJ;i&Uz5n`RCiQ}!%H9rfMvK!7eWrPy%l7JA}_R9mUSi;k(}KGK5B(6Q8d3JIvZ1tD#O=nh3u}+rTRUja%})1^QbLAh#kPw#rR~GEyTq^@|Q5qwM7P`>~I#*WoYs z`kg#7Wy~Wdb!qO-tbpOhIrGDsM8Y z61Z<}n%=Y1a+6v7r4}vqiuhKea5uxy7*F*l*6LS-gzhKmD~`u0QhWZ+HW^QJ>+O4c zFhobgK+8cUrZC##uwO2%ymVmibEWtSo2Yv<{_uY_ zp2(KU_RO>CJ0CY(FK55g_sz{D$+?2y56`kZi9_Z0N)asoG%jJj`tg`a;ZIrJDaCM4 zIfoRR^JR5qzNz_|XJ3oBAxm^e{LW{in{O6o|LL0@#9fdonM{3;>a0s-+o^S+@@Y5H zWh#4>#2NW!p!j`Httcb0LkRRd&z~Cpw}rvZ-1m41f-9_Ip!xHkrO)OiDchT!Wbq_r z9yuEx{iBQHhrP>>TkRTZFBeNXpGdVMI-h%y zm*Bd}vZBD~b_F71M-c8{(b-u+&zy3_QVo?IQ|ofx3-{-=fX4m8nHyj3&WVhao~=@p zpGd79!5N2qv9wP)i8PPpr!F*NKdITzXZ9~r1%ZGq!xVo!#jS#Th@d&alL(p+ zJ;(%YdLZD4fR-@`ML-#aaE3vP3?hvMpxMuP7-&Ic()}3jL?)C0m^0|^mPD2#2;~R> zXhjTULFl@HEPYEBlm!4tHXn#Yj}DO|k(>#X6o7bW4sm1x>}0|M27#8%o%_<__103M9SvAoR=(7;t4DQh3>h+Vp)3=B8%VwtpLa+ zUO!|j|H|OUHejHcxe0*8;g*%;>}pw*g))pyXYqp#XPYalSQz%#RrYjwQJcUdvJC_3 z?Xxi1t1W9lr1%qAWOo9`TslOiJA>@QqB8&$HVck9I4h7j$qXh7??qq$XcTBnSRNx$ zNYIw-!SZ4{!cfX=K|j7I6x%%PF9yrrHv-^bz%Upk;P*cW2ZFBr|G@(R`!QBhV((h{ zH!09MY-wc)QyGQg$ofIY89{uOB_NhYKg&Zc)3ATBX!MG99NB309HL?CzC;7jvw0xc zQL0OWa!xYM6F_oY4O;rSvDl%_jt0niDl_g%w$6L;lv2rhA_}>nGFW50&#@`3OdWupf0EnnuFFL0dxmFKqANy1(Kjc z4|;-RkOERc8b}A}G$QB&nSkyA`cV9sKUoB1fJ~4{4g{G#1a~6H0$E-RBJ>+T2mQc6 zFbE7LGU&TG=76dOA{s!lR9)_hif z+HT7fL7^QQlUO=Br*fUwY6X2=<-w&}=Y2_F zw6{{I^w3{cg55F4td+D@i!|t_lv%x8fcH0*ghX7K!+LgTFh^f~tL;AcZ93d`j|%^# zHQaZP8I(%77PJ{#KljY6%0IM2GwwW~W9R+aTYj_2g=Br#IBkhYugmzEubV;|_p^@F zU%EIJx>s62@QkQ^kwT?39Ib(e2gD{g_l>-JH`6V2{?MUSGas`wYg+1`RHP0%%m{u? zDtvaWt;53G@9^if9=G&PrOKFf3KBhgTdm3DkBT97NA_NFk==Ozi3iEEuq~xh-X~=) zIAqQkUO%jxYM(#B_~0u;z3#L-!TL%+*-GWxErWf@#+9ZgPi?>0W+^0`opW`|70)K` z;=Y!JE5Y~1rp7Z=VzbxrUy{Tkl^kefAqM|b-Jg&CyWch26SL;J6({agw)*F;^R!6mE@a@2OebdhmF`(M~m^z^{ChKJz*y)V~BL-jEzVzq0wP6x(@9`Hk>iwL0{X zgZ71AxwJ;)27~rTFWlKMw<|(5UOBT+)o;FcaVVrqJg2<3M8i=)cJR1Pz5{!|T>Nw9 zQM*1)v$#4c!*I0z(u*^9)-=?0jf6zxB;WoUPCVQ!QS&Hs4@M#7W8TY=^A8o|PpUd3 z4Babw%zvf5XEqFRr*u_GNdw8GS7n1M-=TEwZ3*LN}=aFYKsPxz~bmiK}sSyug{20=~TeNFdnZ<&_ebaWFY zlXmb<)P}XUWW~qd==m0`-EguV9P3tOI0k&$^Kw)E>%iV*ej0LNlgU}WeSO(P17?Y4 z`-{@JPdOW3X*d$KDf*vo>)4A&pgt?>QtKs@gg)6-2JMR{t&Q0)8JSstti7d_;##ru zw39(sxXg6S&^}gf?g$)0QMPnr#t9o+W!HkM2g3}Wg^YF8wBqHi zs-VW!26H(bf^DeVU+blMq7f?`yVIuEu%6o~YKvR-fY5q{ME(w}z2crz($_GKnh*HC z-Z-i|4^M-OH;2R=B%61&cFxjWEbY<{JK?k%C3WYzg6=&m&<{x8b7i0P;PFCJF-=BK zzJqj`YWzaN+q~m1p49=j-bc%K3tMF?%j9bx@0AKBtP_oinC(UUk*=!tHUgEp!+H4D zUZE(v!fdfI9M%vT*l6rptbnYX-Ksx{N$WMUavpCPx$!PxYt>=flkK6M+&BIdFWu#n)0uVUEpPm- z%o-8ZJG>{Uh&E~5eb48L_YKrO6N^&uX1Lm$gHC-VciKjF%_R@6`J%2q+Ng6DCQb8D*e!CyZHg( zs)6YK)!OED)D1BM-UD?HncYv%YrZ)&Qi32{-xMz0X#0lr<#AR1>SS&1iK?KW{rl?} zu4)$7sO#WrrCWo2Pp_>R-GEdzQVpV8Tocek`8a;rXMI`LfBdf8hD_({xkkwuMr8YN zq0+3_)9VW;N)dHs*IPUL$TmWuN1sTS7zbP%YbmRLng3jcbv4Zw8K)=3`qt~}ZEx5= zW2Emun8f1F?P`kTtElM{7>>*6!IOePvCk#KkC~|wy#nqi!96aAFO)j+KIYvVo^~;| zjHL3_DP=HY3jw#+Z%-$a7S7JSd}^9RjXR_;ERTI*c> z)PGLR@3LU+f_w0gu|slbtJ!{+CRcyk+|OI!h8X$07~Y;Ut6|AiVcAKc>QA0Zl@mXr z)X{%@JdbxipV)1RqOVfw<;pP^u*kJ;O&&X9&&%Yk4UoHR6Qnd%7Bz`3-!RXO5*d1& zAQ_YWyzNP`2BP-Ej)(!JJR>#HyPL<``-0DH37Kuuxxe17YbtBHPoD2$(d_HgZuKaq zQ{_3}?T!AY4$p5IZQa-}{?s=8hBqGDrn9Y!OcD^*v%dVT+(ITuLs{O>_W@SD556NY zV*U#5?d2q{C#k^_Z$)G6za|ZpCvO%%os0?(vshRtYnp9Fz3K&mUWcGNxy1(HCnm$>(pPtbsIJx$kcYLT-Ev_ z@*rkFB^`DZmL6j%v?t0Ru&ms9NtwHC`_6{ycT#3y_}UV?Q-oB3(xi_U4`=s?M zrFI8h>|nM$yQOh=^Vm@`DJ#z{v2P)?(RuJ(PUGp5$JR3fpT5;{l2r-1Jr^gWsl~lZ zu_~BIU+ZBac;~LmPSIW?tfOHe#`lj)caIz~37qG#A%hadW2JgrJNCfJJL{fDJgh*|c@ZBz_-!%6 zNKF0R-j!IMkRtn-=+ah{)}7Zv?Rpv6`Cv59<_%X`oSVzDEv7QhHV)lw2sP{+-n3pZ z``)Ds!r?_{@2o$Q^ft8aj%qjKXODn6XTTx5s5*dzbA<5nt@Pu>P=(; zZbVNqO#?n!Sqlfq9vX04j0wWT2T$}O8w4|mmcgc0?!n&fDjsl6986u40M*n)`9Ok? zJc-lsW&%+9t??J$!dUMwHbS6kAk~KoRhd8_l|o~x25P`LB&yJu4F=%=2ZiOW0k<e$4j?h08X6EXQ3b(( zfB=O6v;v*s2_jWgR6qm@M4{v%40&b{jYSBQr!gfUc^pN^cHhZpOa+ck3hs0&NVWr! z3J7pT&`P~RrqcknV1gUnkEH?k^CNqxx~Y&9(F7Dho`_ablt&^-2zdnbktZQM2w0@D ziV_BkSP|#*lbXNCgBBoxXvhxGNEPZJc=)*!85(eXb7Mf?i_T;%6~2Iq0s;dEm$(0K zX$AS_KU)EE=&~8qAskf`sFWlH=|D{koF0P=$mVg*^zxB^;*?Ewacg3K7RSe_9mQ(ttu{ zpC?rcf##_J50v*Hk_dhj793~kLtrq8u2dhg0?~)L02TgFiSzBX@R~&>2fi zEs4G>+;J2#g-rO3p0m!T|4s#sJ(gQUkjnq$vJyV*82ay+{lefs1Q7=WT|7`cf#0t+ z91QrEKK~x0A9p$QgwTKouy5*rJS%?cDXd&N(*Nns*$uTq*uH_x%09%>?DG%3&je5y z0L3}_idblX#6Wn^Ex|$2QDp;=C=>>TR79gyWD!U>0s)6Gtk@AG{cCKj2%s~hSG@H5 zA%{?)9>)QqJL@|N+mR4h%a7#+5psfL_xF}$AcIJPT4YEJjC~(3eE=m428{toz%mT# z0YdFo_6MM?z?9KSP^0iy7=#A3|9*oZ5dWY>KwJJD52=Fv2MmS6LT$g__@S{-L-IEm z76bLqeuJUejmzI*n18^~NG#Nl{0&c;-K6{#hEc};v|kp30JWbO(5q|!v?K>Z{b~#V zTF{|Om)$M306;?;i4JgjQ&3+`2XItJ=pZmyU2Sa?QV)qy!KxrJI!HxbJzb2hq7D+T fsE7OCF`U^wYbJ}pU~!zLjKN}Il9IY+da(Zj|0~At literal 0 HcmV?d00001 diff --git a/Sparse_omp.pdf b/Sparse_omp.pdf new file mode 100644 index 0000000000000000000000000000000000000000..42b21a0c4476c610b7d8ae417c3ffb4e51ef766a GIT binary patch literal 8031 zcmb_B2{@GN_a${TD3z@e;IcU+x`8w=eaWv^M2<&+k4J=-}jvJDOwvEBhl&_Fva?@J#^PUeD!pf8gGl1MNPmkp8wVWAnPT`U4T z@M2w+UO^!iDkV>6>x;w$4(O-czT9dQ^r9!l@0eEBo5})e^Mmc<9V%h+OXYU>X{1n_ zx3_)0TGGW#`g*@*^i}UCd~n1pYl89Vlh|z07p`~J%;13hfNat6$GZf_Dj4HS&8!?s z%>roC-?qfcb#Ed)fUA_0K$AsUPrldBB(f2j1pzazwE41-QhsXh>^w?mq;$H7{ z_L``6-0PC1`z)+G?s%Vgv4FW^>ufGPmN$L%sxMAckG$HSUgw=d_0t!7N6n?zZ5Rhu zO|h=W-5$6-)UWZNxlbmtNC#b`y7H2jwtm8u)1$NIR7iz5t2FDx$S z0&S^~rXIK~X49$c<$PVXjCq$*l*dpZD@AtY)+rs_hPBsxm9R`FW6U?df7Y{FWIB;+ zbz8-_%v8Tm@<^NWF-K+N2b(vWZ=*`)-1e(6*RK+!Pt~R$g?x{XRhMt;rj(*iSuDbnqBD!xSHu_Oh|- zqkTw0u{A5XcRcM1**|VWYQp<|IL??vmV5P<7MIT|bwo~`R?Epxxa{D8l?2b8ayJ_v z$meh(lv8?NO`l=qj}OCLNk@YpO1)~+0>9b+=go5|f z;Y(AYR)M4&NjYi7`mJ^vl8`S9Zz2YS$q zO`x#cm0`40j_3vhx-Hd!@xf-Nx6>xVqc%PI^Bw}>i0m$Z`wuB7Y%jPMj$}TyM$V7#hzKEzC(U}>l+T)X;W1D)~CxEX_qAJl&>V9 z-zDyMdY7o?Qi~;-zUdkmeHa&yNN&4)FsG%>V0>WZ8}Vk@@-6m=a2IchY_*+Vk}py6 z51cKGa!fyux-n2ilc^8uooJS-eY&oEWkgb=yYModWAam0#yf*NUFF|ZjkTsccD%_B zuqnJAD8tDUN$--r>MWgvwUTRXE{!btu(|3Sm-e2fM&Ed%OQU)T;+k;(99QskDPbhXSDhREq| z>ByIz_8zY*-1{CTr7AJD1nH)2fg5)r&@&P|CmyGQDY7vk{qE4UYRz8sCm)wCn^+QyNh%%QxxW zGh@-I02So4n*NpYC#K+*XYw17to$b1lL|ILr z$EKn$GRtg_&ZLiMSG~F)6i@4&TH}y;>iHo#D@!kP4|i@bW9L$0rl4?kIr4fah49UX zy}^~F*xaA;*v=+Pdt*pZwtK#Zy%tIEe*4#*@6)Y1+v2`0iC|k^0vVKryA~Sp?q}Yu z%=<-a5m2xNn8uI0+dhm10@h?d5U>C#G_pQ36z+zCrg10@I39!YfI*XNkimsxdABENE{5a>*2E29BQR^+PuPR|Y?p0Ryb8E#PPpX+cT;suo1q;$b{G z+aGNB%Uqn*f@%Fa%X?gy)F*R5o?!rE8(RxgeJB;7?*h3rUoziZh9Jk6O=EGHY&e0( zf^QD~3}j9ko5MBmC$r&L3}8-P7^5+0z==lT`g7c17(7qVk1qzpGY{{J)8efg1?OYH za5zo)?|%>u1YP|9g9i%sW2~vkTQ&YSDbPG@er6sMkHPR|{h;HIAU+EcQ1hdoEGe<%Kpc8X)H_h8TbL zr$G5m2k;!S$ON(^Lyy6seSbEjQK=xb4WPJpgJB6kP%slpa%q14T#p~Td7k>2HP5|2 z9Le{dB{>lM&mPx@b{@3xkQlTU9IuIi<2BG8yd2t(1J{57dK_Qg9)y6<_93&jgFMmm zk30#yIUXep*a1a7%~y}%M+YHy0Crq3&=J~u5DN<$hXdJ%A0s>)!T{$5HaIK+;tB;6 zw3n3uBftc(1{?q~;0sUy5a5dfsL-Yd`~Vt22Lb^Gzyz2K5MV(jU{U}UJ(%;8MF2Ly z0XVc!fWspDf&drb`m;gkH-rfU1ED||5Dv1LDtvQ5wE_sG7Q8t5c@OcP7YsRHP5fL; zK#Tg>wFZmT2L^}MB$2+?84eD@_UoKBWJ+VOuC*y#L&Iaa9?SK@J}jXuHL40YuPh`f zj@B34c~Gb~%O|g>BH#c0wn%#mK?&1RiJN=>v={G=Kj@&Tw@kXm=tPly=NH6KU13B_ z&L=IuW*yG>i*J?PyT8pwIc+0|oEH?hdvNKyJYV5Io*nT)lW*&M_lK`CsPWZU1@B#4G4~&Tuv!AK9;U()g})5^*1=sXsgxLc%$p+}bDNs!6VBJBBz=XpFLmh#gk?gdMYsA+YB)NvD28#!chxlMhwkJp->t=&tRSMN9`97!JBRMJ(TkpIf&U~N*Aqor`JMa*m= zCA(_0c3^J%o0Qb)pkdSZXV=ZOHkpugub0Q3-Z5T%{`v7cf;Cm`ZzE!|Q*Yl#fYJ2| z6|I@uaOx*sU+R2&=8-z`DA6@}^ug7~A~{WcANQc{++0#vSVOhwC#>=k-kTw?A^F{3 zNgjhHnG9z|k3B8{dXZZUKf@HfR|uV{v1~K*dNg`hbnA4_w*CakVIQXtD#v}-R5fpT zc2{sr^pI}IGcGChxYfEYc#Zw2?7PR$YvOvbGKQ)|p+AK1g}nw*pUKWO2B$JCwT=Z_ z6##SRY@avNJ4(W4jcc-_TpbmbeWvGTCx-?`fAEwV8$H>kCw_M*`KZX`il`Sg_g;w? zp0ghs-yT-iJy`ePw$!ZJn*D2VnT*|cVplCMR+D}A(l{t@`KqJUz(ltO+b!hHw$3$| zyF&X@MHuKWYb^c}wi(Ol8DjI!i z4}0(^&m<&cTaJyx$e{wuO}gy9%dW~r#H26DJ(mtWe^v!Aeieu8mbA~pt6tVW)UOmy z{zE1{=3_r}2-8YYKlF%Js~l2RC#IM6=x@}iT8e9;}s8%-w66+1>?nt z@s&BtnlTUmwznPzfy}+*P1ZXl%ZB5Img!qp1+I!84j8U_#OZ!|M)&33w}mKj{+cM| zTBn!P_m9giFH6-Im?{ek^Y*S{du_G768HyV>&^AyL21h?##f<57z(22%M+;9C}0WLd+=FCi7$BG;3;_RQ{^6BDTRtP)r8YB=)wp10^@;pf}gR%^#*H5)VE zzxyT~R`ez4xQIyDoL#BP$@EH(@~68#Z4JI4Uirm0eAL`EHL}6V+q2GVms9Sf6k-Ps zc`06~@AxuUYT2Hwlt}F-PnB+guQA%#m9Nhjc$_)XZHZwn(d=KEZ7pV->(G!ovCl<_ zBUBl(<$`0F=1fuSH1^i2&jJ|f(Z|V(@mU>>Pp<2rDhK3ZhBYslZI!vZ_FdCp_(`dV zk9CGEqR#Cz=Vk|y!e_63>`L#}j&(nFD;v1Ide^b&&uhjTRu9QOb;`IFV4&4#xS^d! z6_Ye}xbW?kt!kJK9vK|;P)mCdA$KI^a}KHJLdw!7>EQ}JG6^mpQbup3u9Zzo#YF9~ z{qm)#?qfaXML#^OD+1fx4JbAH?Rs!CKmQc6T(Bzq^6=pgjBgF$?2;FX8deoGV=lHC zr>~uMz~U=E%={T%wQB9oOnslyB@NFH?8XffGGG^B8S!=!+hTXY?Mmg(;{_Tw%GZ?l zDp~C@s4R3ow!^yZ4_u^v?hPfjjk0m6l1kXwX3o85#X5J_PVA>q&t394GWaF3)??&k zc5T|xgQD!vr#*V^YJ{-cpAsc>^#nF+l!b%LxftyKkRG z=;sxVG(h3{#7*O+a@%0H+NwHYA7`~yUcB~sqA~57uGd`en(KdWEOB!1bMQN{DZ!AW z%no!lPYO3{$X`we%4b`@UWyqQ2$r(KDa_n&YCm!-`GneI(6jOCsqRbn0^2(ev^^ZZ zM0yjLG${a~Jst{pnl5{RNYT4*8(VdsV|61Dei@2XN?#1%% zM~>)hVZN9kqH!qf_XJT}Hx$ZF13)g^2lS&cbP(gEl?XVEqJwb4S)eRf2B1G}dpH}k z3%9iQ4G-`oP!PH#n6@q%s;NO_D4B(%^84HzIFx?t{AploZu}LB0FGAI zL_jRr6e`gcDzN7nLQgsfe=e6r1b~o`5cLqOI+N`Opa}#5fWiP63=+aXa>5u~aww9) zQGn#}6`?tQCu4Bb`8uilG6MmcGk{h{0gHkb>lGT40p|%O`!IvKI*8z48ihzkYiXdV zWC9YzYHA?SXetVcf<8#R7D&*bk}(7=AN-;?)=z5wA`hB?1Y#jOKqDg5L7)Wtf@~dx ziM2W0#GlFG&KJILf;tL^02Y@2Z)pYj=095ja_E8?v>_a#1yo8>!wjJ&2FaLBgCh+= zq%YhagCoK*L=+K+A`&&>+Q4s^knm^xotDK>8ErPozw?JroioKSnT%&g8;1 z)HUHOGS}Ci4(9iH4l$y$n*^kgv!w! zhX0?S`M3Q{@%^qaE0|5^?+}VF0MbF8ZXC$fXh>sAJA#M{Y0db8Gbs5P$UJUl7s171j&v?W^+I2LB<5_#o)uf#M1HeyovT@PFy^?=kvumP0p$4kCniQvc(w_^GF`c<3nqr!z+d zYK8E81DTb#iIsW#A9{-k$Kc=?{?ZH8MUe8Zv9TzC$yQ$U((jubLVI}2Z_q}mSiX!q(Ut+ zG!Di)kLN#dO&ku3gHz!PFboC-wOe@~IAalp$Ks$y;jb`g2~hj*R~U4;{DT$+E%~2# z_crz!^7kL0mJcImWy~? zHW_L^v7r~(aKMfh4)v>XaKM%c9lE@3sVyAX!JsnX{N5DQS2KjWX=98Hj4=eXCKjz> vjMFnVGDKl8Mg$xIi#LKCZ=gZ?-!VLRJ!=k^%;xf)1}UipQ&cpvGKT#ZD-FFC literal 0 HcmV?d00001 diff --git a/paper.tex b/paper.tex index 5004934..a2e5a92 100644 --- a/paper.tex +++ b/paper.tex @@ -697,7 +697,7 @@ The initialization values of the vector solution of the methods are given in %Section~\ref{sec:vec_initialization}. \begin{figure}[htbp] \centering - \includegraphics[angle=-90,width=0.5\textwidth]{Sparse_openmp} + \includegraphics[angle=-90,width=0.5\textwidth]{Sparse_omp} \caption{Execution times in seconds of the Ehrlich-Aberth method for solving sparse polynomials on GPUs using shared memory paradigm with OpenMP} \label{fig:01} \end{figure} @@ -711,7 +711,7 @@ of the methods are given in %Section~\ref{sec:vec_initialization}. \begin{figure}[htbp] \centering - \includegraphics[angle=-90,width=0.5\textwidth]{Full_openmp} + \includegraphics[angle=-90,width=0.5\textwidth]{Full_omp} \caption{Execution times in seconds of the Ehrlich-Aberth method for solving full polynomials on GPUs using shared memory paradigm with OpenMP} \label{fig:03} \end{figure} @@ -725,28 +725,28 @@ of the methods are given in %Section~\ref{sec:vec_initialization}. \begin{figure}[htbp] \centering - \includegraphics[angle=-90,width=0.5\textwidth]{Sparse_mpivsomp} + \includegraphics[angle=-90,width=0.5\textwidth]{Sparse} \caption{Comparaison between MPI and OpenMP versions of the Ehrlich-Aberth method for solving sparse plynomials on GPUs} \label{fig:05} \end{figure} \begin{figure}[htbp] \centering - \includegraphics[angle=-90,width=0.5\textwidth]{Full_mpivsomp} + \includegraphics[angle=-90,width=0.5\textwidth]{Full} \caption{Comparaison between MPI and OpenMP versions of the Ehrlich-Aberth method for solving full polynomials on GPUs} \label{fig:06} \end{figure} \begin{figure}[htbp] \centering - \includegraphics[angle=-90,width=0.5\textwidth]{MPI_mpivsomp} + \includegraphics[angle=-90,width=0.5\textwidth]{MPI} \caption{Comparaison of execution times of the Ehrlich-Aberth method for solving sparse and full polynomials on GPUs with distributed memory paradigm using MPI} \label{fig:07} \end{figure} \begin{figure}[htbp] \centering - \includegraphics[angle=-90,width=0.5\textwidth]{OMP_mpivsomp} + \includegraphics[angle=-90,width=0.5\textwidth]{OMP} \caption{Comparaison of execution times of the Ehrlich-Aberth method for solving sparse and full polynomials on GPUs with shared memory paradigm using OpenMP} \label{fig:08} \end{figure} -- 2.39.5