From: zianekhodja Date: Wed, 16 Dec 2015 22:14:24 +0000 (+0100) Subject: new figures X-Git-Url: https://bilbo.iut-bm.univ-fcomte.fr/and/gitweb/kahina_paper2.git/commitdiff_plain/d566429ab3c43daff17f049fdb37b08d05b6de39?ds=sidebyside new figures --- diff --git a/Full_mpi.pdf b/Full_mpi.pdf new file mode 100644 index 0000000..14df67e Binary files /dev/null and b/Full_mpi.pdf differ diff --git a/Full_mpivsomp.pdf b/Full_mpivsomp.pdf new file mode 100644 index 0000000..eb62281 Binary files /dev/null and b/Full_mpivsomp.pdf differ diff --git a/Full_openmp.pdf b/Full_openmp.pdf new file mode 100644 index 0000000..0404dad Binary files /dev/null and b/Full_openmp.pdf differ diff --git a/GPU_mpi.pdf b/GPU_mpi.pdf deleted file mode 100644 index 5d5849b..0000000 Binary files a/GPU_mpi.pdf and /dev/null differ diff --git a/GPU_openmp.pdf b/GPU_openmp.pdf deleted file mode 100644 index 6ce9386..0000000 Binary files a/GPU_openmp.pdf and /dev/null differ diff --git a/Simulations/Full_mpi.eps b/Simulations/Full_mpi.eps new file mode 100644 index 0000000..1ffb068 --- /dev/null +++ b/Simulations/Full_mpi.eps @@ -0,0 +1,913 @@ +%!PS-Adobe-2.0 +%%Title: Full_mpi.eps +%%Creator: gnuplot 4.6 patchlevel 0 +%%CreationDate: Wed Dec 16 22:36:38 2015 +%%DocumentFonts: (atend) +%%BoundingBox: 50 50 554 770 +%%Orientation: Landscape +%%Pages: (atend) +%%EndComments +%%BeginProlog +/gnudict 256 dict def +gnudict begin +% +% The following true/false flags may be edited by hand if desired. +% The unit line width and grayscale image gamma correction may also be changed. 
+% +/Color false def +/Blacktext false def +/Solid false def +/Dashlength 1 def +/Landscape true def +/Level1 false def +/Rounded false def +/ClipToBoundingBox false def +/SuppressPDFMark false def +/TransparentPatterns false def +/gnulinewidth 5.000 def +/userlinewidth gnulinewidth def +/Gamma 1.0 def +/BackgroundColor {-1.000 -1.000 -1.000} def +% +/vshift -46 def +/dl1 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul sub dup 0 le { pop 0.01 } if } if +} def +/dl2 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul add } if +} def +/hpt_ 31.5 def +/vpt_ 31.5 def +/hpt hpt_ def +/vpt vpt_ def +/doclip { + ClipToBoundingBox { + newpath 50 50 moveto 554 50 lineto 554 770 lineto 50 770 lineto closepath + clip + } if +} def +% +% Gnuplot Prolog Version 4.4 (August 2010) +% +%/SuppressPDFMark true def +% +/M {moveto} bind def +/L {lineto} bind def +/R {rmoveto} bind def +/V {rlineto} bind def +/N {newpath moveto} bind def +/Z {closepath} bind def +/C {setrgbcolor} bind def +/f {rlineto fill} bind def +/g {setgray} bind def +/Gshow {show} def % May be redefined later in the file to support UTF-8 +/vpt2 vpt 2 mul def +/hpt2 hpt 2 mul def +/Lshow {currentpoint stroke M 0 vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Rshow {currentpoint stroke M dup stringwidth pop neg vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Cshow {currentpoint stroke M dup stringwidth pop -2 div vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/UP {dup vpt_ mul /vpt exch def hpt_ mul /hpt exch def + /hpt2 hpt 2 mul def /vpt2 vpt 2 mul def} def +/DL {Color {setrgbcolor Solid {pop []} if 0 setdash} + {pop pop pop 0 setgray Solid {pop []} if 0 setdash} ifelse} def +/BL {stroke userlinewidth 2 mul setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/AL {stroke userlinewidth 2 div setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/UL {dup gnulinewidth mul /userlinewidth exch 
def + dup 1 lt {pop 1} if 10 mul /udl exch def} def +/PL {stroke userlinewidth setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +3.8 setmiterlimit +% Default Line colors +/LCw {1 1 1} def +/LCb {0 0 0} def +/LCa {0 0 0} def +/LC0 {1 0 0} def +/LC1 {0 1 0} def +/LC2 {0 0 1} def +/LC3 {1 0 1} def +/LC4 {0 1 1} def +/LC5 {1 1 0} def +/LC6 {0 0 0} def +/LC7 {1 0.3 0} def +/LC8 {0.5 0.5 0.5} def +% Default Line Types +/LTw {PL [] 1 setgray} def +/LTb {BL [] LCb DL} def +/LTa {AL [1 udl mul 2 udl mul] 0 setdash LCa setrgbcolor} def +/LT0 {PL [] LC0 DL} def +/LT1 {PL [4 dl1 2 dl2] LC1 DL} def +/LT2 {PL [2 dl1 3 dl2] LC2 DL} def +/LT3 {PL [1 dl1 1.5 dl2] LC3 DL} def +/LT4 {PL [6 dl1 2 dl2 1 dl1 2 dl2] LC4 DL} def +/LT5 {PL [3 dl1 3 dl2 1 dl1 3 dl2] LC5 DL} def +/LT6 {PL [2 dl1 2 dl2 2 dl1 6 dl2] LC6 DL} def +/LT7 {PL [1 dl1 2 dl2 6 dl1 2 dl2 1 dl1 2 dl2] LC7 DL} def +/LT8 {PL [2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 4 dl2] LC8 DL} def +/Pnt {stroke [] 0 setdash gsave 1 setlinecap M 0 0 V stroke grestore} def +/Dia {stroke [] 0 setdash 2 copy vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke + Pnt} def +/Pls {stroke [] 0 setdash vpt sub M 0 vpt2 V + currentpoint stroke M + hpt neg vpt neg R hpt2 0 V stroke + } def +/Box {stroke [] 0 setdash 2 copy exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke + Pnt} def +/Crs {stroke [] 0 setdash exch hpt sub exch vpt add M + hpt2 vpt2 neg V currentpoint stroke M + hpt2 neg 0 R hpt2 vpt2 V stroke} def +/TriU {stroke [] 0 setdash 2 copy vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke + Pnt} def +/Star {2 copy Pls Crs} def +/BoxF {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath fill} def +/TriUF {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath fill} def +/TriD {stroke 
[] 0 setdash 2 copy vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke + Pnt} def +/TriDF {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath fill} def +/DiaF {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath fill} def +/Pent {stroke [] 0 setdash 2 copy gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore Pnt} def +/PentF {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath fill grestore} def +/Circle {stroke [] 0 setdash 2 copy + hpt 0 360 arc stroke Pnt} def +/CircleF {stroke [] 0 setdash hpt 0 360 arc fill} def +/C0 {BL [] 0 setdash 2 copy moveto vpt 90 450 arc} bind def +/C1 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + vpt 0 360 arc closepath} bind def +/C2 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C3 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C4 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C5 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc + 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc} bind def +/C6 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C7 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C8 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C9 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 450 arc closepath fill + vpt 0 360 arc closepath} bind def +/C10 {BL [] 0 setdash 2 copy 2 copy moveto vpt 270 360 arc closepath fill + 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} 
bind def +/C11 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C12 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C13 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C14 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 360 arc closepath fill + vpt 0 360 arc} bind def +/C15 {BL [] 0 setdash 2 copy vpt 0 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/Rec {newpath 4 2 roll moveto 1 index 0 rlineto 0 exch rlineto + neg 0 rlineto closepath} bind def +/Square {dup Rec} bind def +/Bsquare {vpt sub exch vpt sub exch vpt2 Square} bind def +/S0 {BL [] 0 setdash 2 copy moveto 0 vpt rlineto BL Bsquare} bind def +/S1 {BL [] 0 setdash 2 copy vpt Square fill Bsquare} bind def +/S2 {BL [] 0 setdash 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S3 {BL [] 0 setdash 2 copy exch vpt sub exch vpt2 vpt Rec fill Bsquare} bind def +/S4 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S5 {BL [] 0 setdash 2 copy 2 copy vpt Square fill + exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S6 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S7 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S8 {BL [] 0 setdash 2 copy vpt sub vpt Square fill Bsquare} bind def +/S9 {BL [] 0 setdash 2 copy vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S10 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt Square fill + Bsquare} bind def +/S11 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt2 vpt Rec fill + Bsquare} bind def +/S12 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill 
Bsquare} bind def +/S13 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S14 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S15 {BL [] 0 setdash 2 copy Bsquare fill Bsquare} bind def +/D0 {gsave translate 45 rotate 0 0 S0 stroke grestore} bind def +/D1 {gsave translate 45 rotate 0 0 S1 stroke grestore} bind def +/D2 {gsave translate 45 rotate 0 0 S2 stroke grestore} bind def +/D3 {gsave translate 45 rotate 0 0 S3 stroke grestore} bind def +/D4 {gsave translate 45 rotate 0 0 S4 stroke grestore} bind def +/D5 {gsave translate 45 rotate 0 0 S5 stroke grestore} bind def +/D6 {gsave translate 45 rotate 0 0 S6 stroke grestore} bind def +/D7 {gsave translate 45 rotate 0 0 S7 stroke grestore} bind def +/D8 {gsave translate 45 rotate 0 0 S8 stroke grestore} bind def +/D9 {gsave translate 45 rotate 0 0 S9 stroke grestore} bind def +/D10 {gsave translate 45 rotate 0 0 S10 stroke grestore} bind def +/D11 {gsave translate 45 rotate 0 0 S11 stroke grestore} bind def +/D12 {gsave translate 45 rotate 0 0 S12 stroke grestore} bind def +/D13 {gsave translate 45 rotate 0 0 S13 stroke grestore} bind def +/D14 {gsave translate 45 rotate 0 0 S14 stroke grestore} bind def +/D15 {gsave translate 45 rotate 0 0 S15 stroke grestore} bind def +/DiaE {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke} def +/BoxE {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke} def +/TriUE {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke} def +/TriDE {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke} def +/PentE {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath 
stroke grestore} def +/CircE {stroke [] 0 setdash + hpt 0 360 arc stroke} def +/Opaque {gsave closepath 1 setgray fill grestore 0 setgray closepath} def +/DiaW {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V Opaque stroke} def +/BoxW {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V Opaque stroke} def +/TriUW {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V Opaque stroke} def +/TriDW {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V Opaque stroke} def +/PentW {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + Opaque stroke grestore} def +/CircW {stroke [] 0 setdash + hpt 0 360 arc Opaque stroke} def +/BoxFill {gsave Rec 1 setgray fill grestore} def +/Density { + /Fillden exch def + currentrgbcolor + /ColB exch def /ColG exch def /ColR exch def + /ColR ColR Fillden mul Fillden sub 1 add def + /ColG ColG Fillden mul Fillden sub 1 add def + /ColB ColB Fillden mul Fillden sub 1 add def + ColR ColG ColB setrgbcolor} def +/BoxColFill {gsave Rec PolyFill} def +/PolyFill {gsave Density fill grestore grestore} def +/h {rlineto rlineto rlineto gsave closepath fill grestore} bind def +% +% PostScript Level 1 Pattern Fill routine for rectangles +% Usage: x y w h s a XX PatternFill +% x,y = lower left corner of box to be filled +% w,h = width and height of box +% a = angle in degrees between lines and x-axis +% XX = 0/1 for no/yes cross-hatch +% +/PatternFill {gsave /PFa [ 9 2 roll ] def + PFa 0 get PFa 2 get 2 div add PFa 1 get PFa 3 get 2 div add translate + PFa 2 get -2 div PFa 3 get -2 div PFa 2 get PFa 3 get Rec + gsave 1 setgray fill grestore clip + currentlinewidth 0.5 mul setlinewidth + /PFs PFa 2 get dup mul PFa 3 get dup mul add sqrt def + 0 0 M PFa 5 get rotate PFs -2 div dup translate + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get 
mul 0 M 0 PFs V} for + 0 PFa 6 get ne { + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 2 1 roll M PFs 0 V} for + } if + stroke grestore} def +% +/languagelevel where + {pop languagelevel} {1} ifelse + 2 lt + {/InterpretLevel1 true def} + {/InterpretLevel1 Level1 def} + ifelse +% +% PostScript level 2 pattern fill definitions +% +/Level2PatternFill { +/Tile8x8 {/PaintType 2 /PatternType 1 /TilingType 1 /BBox [0 0 8 8] /XStep 8 /YStep 8} + bind def +/KeepColor {currentrgbcolor [/Pattern /DeviceRGB] setcolorspace} bind def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke} +>> matrix makepattern +/Pat1 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke + 0 4 M 4 8 L 8 4 L 4 0 L 0 4 L stroke} +>> matrix makepattern +/Pat2 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 0 8 L + 8 8 L 8 0 L 0 0 L fill} +>> matrix makepattern +/Pat3 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 8 M 8 -4 L + 0 12 M 12 0 L stroke} +>> matrix makepattern +/Pat4 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 0 M 8 12 L + 0 -4 M 12 8 L stroke} +>> matrix makepattern +/Pat5 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 8 M 4 -4 L + 0 12 M 8 -4 L 4 12 M 10 0 L stroke} +>> matrix makepattern +/Pat6 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 0 M 4 12 L + 0 -4 M 8 12 L 4 -4 M 10 8 L stroke} +>> matrix makepattern +/Pat7 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 8 -2 M -4 4 L + 12 0 M -4 8 L 12 4 M 0 10 L stroke} +>> matrix makepattern +/Pat8 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 -2 M 12 4 L + -4 0 M 12 8 L -4 4 M 8 10 L stroke} +>> matrix makepattern +/Pat9 exch def +/Pattern1 {PatternBgnd KeepColor Pat1 setpattern} bind def +/Pattern2 {PatternBgnd KeepColor Pat2 setpattern} bind def +/Pattern3 {PatternBgnd KeepColor Pat3 setpattern} bind def +/Pattern4 {PatternBgnd KeepColor Landscape {Pat5} {Pat4} ifelse setpattern} bind 
def +/Pattern5 {PatternBgnd KeepColor Landscape {Pat4} {Pat5} ifelse setpattern} bind def +/Pattern6 {PatternBgnd KeepColor Landscape {Pat9} {Pat6} ifelse setpattern} bind def +/Pattern7 {PatternBgnd KeepColor Landscape {Pat8} {Pat7} ifelse setpattern} bind def +} def +% +% +%End of PostScript Level 2 code +% +/PatternBgnd { + TransparentPatterns {} {gsave 1 setgray fill grestore} ifelse +} def +% +% Substitute for Level 2 pattern fill codes with +% grayscale if Level 2 support is not selected. +% +/Level1PatternFill { +/Pattern1 {0.250 Density} bind def +/Pattern2 {0.500 Density} bind def +/Pattern3 {0.750 Density} bind def +/Pattern4 {0.125 Density} bind def +/Pattern5 {0.375 Density} bind def +/Pattern6 {0.625 Density} bind def +/Pattern7 {0.875 Density} bind def +} def +% +% Now test for support of Level 2 code +% +Level1 {Level1PatternFill} {Level2PatternFill} ifelse +% +/Symbol-Oblique /Symbol findfont [1 0 .167 1 0 0] makefont +dup length dict begin {1 index /FID eq {pop pop} {def} ifelse} forall +currentdict end definefont pop +/MFshow { + { dup 5 get 3 ge + { 5 get 3 eq {gsave} {grestore} ifelse } + {dup dup 0 get findfont exch 1 get scalefont setfont + [ currentpoint ] exch dup 2 get 0 exch R dup 5 get 2 ne {dup dup 6 + get exch 4 get {Gshow} {stringwidth pop 0 R} ifelse }if dup 5 get 0 eq + {dup 3 get {2 get neg 0 exch R pop} {pop aload pop M} ifelse} {dup 5 + get 1 eq {dup 2 get exch dup 3 get exch 6 get stringwidth pop -2 div + dup 0 R} {dup 6 get stringwidth pop -2 div 0 R 6 get + show 2 index {aload pop M neg 3 -1 roll neg R pop pop} {pop pop pop + pop aload pop M} ifelse }ifelse }ifelse } + ifelse } + forall} def +/Gswidth {dup type /stringtype eq {stringwidth} {pop (n) stringwidth} ifelse} def +/MFwidth {0 exch { dup 5 get 3 ge { 5 get 3 eq { 0 } { pop } ifelse } + {dup 3 get{dup dup 0 get findfont exch 1 get scalefont setfont + 6 get Gswidth pop add} {pop} ifelse} ifelse} forall} def +/MLshow { currentpoint stroke M + 0 exch R + Blacktext {gsave 0 
setgray MFshow grestore} {MFshow} ifelse } bind def +/MRshow { currentpoint stroke M + exch dup MFwidth neg 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MCshow { currentpoint stroke M + exch dup MFwidth -2 div 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/XYsave { [( ) 1 2 true false 3 ()] } bind def +/XYrestore { [( ) 1 2 true false 4 ()] } bind def +Level1 SuppressPDFMark or +{} { +/SDict 10 dict def +systemdict /pdfmark known not { + userdict /pdfmark systemdict /cleartomark get put +} if +SDict begin [ + /Title (Full_mpi.eps) + /Subject (gnuplot plot) + /Creator (gnuplot 4.6 patchlevel 0) + /Author (lilia) +% /Producer (gnuplot) +% /Keywords () + /CreationDate (Wed Dec 16 22:36:38 2015) + /DOCINFO pdfmark +end +} ifelse +end +%%EndProlog +%%Page: 1 1 +gnudict begin +gsave +doclip +50 50 translate +0.100 0.100 scale +90 rotate +0 -5040 translate +0 setgray +newpath +(Helvetica) findfont 140 scalefont setfont +BackgroundColor 0 lt 3 1 roll 0 lt exch 0 lt or or not {gsave BackgroundColor C clippath fill grestore} if +1.000 UL +LTb +854 448 M +63 0 V +6030 0 R +-63 0 V +stroke +770 448 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10)] +] -46.7 MRshow +1.000 UL +LTb +854 892 M +31 0 V +6062 0 R +-31 0 V +854 1151 M +31 0 V +6062 0 R +-31 0 V +854 1336 M +31 0 V +6062 0 R +-31 0 V +854 1479 M +31 0 V +6062 0 R +-31 0 V +854 1595 M +31 0 V +6062 0 R +-31 0 V +854 1694 M +31 0 V +6062 0 R +-31 0 V +854 1779 M +31 0 V +6062 0 R +-31 0 V +854 1855 M +31 0 V +6062 0 R +-31 0 V +854 1922 M +63 0 V +6030 0 R +-63 0 V +stroke +770 1922 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100)] +] -46.7 MRshow +1.000 UL +LTb +854 2366 M +31 0 V +6062 0 R +-31 0 V +854 2626 M +31 0 V +6062 0 R +-31 0 V +854 2810 M +31 0 V +6062 0 R +-31 0 V +854 2953 M +31 0 V +6062 0 R +-31 0 V +854 3070 M +31 0 V +6062 0 R +-31 0 V +854 3168 M +31 0 V +6062 0 R +-31 0 V +854 3254 M +31 0 V +6062 0 R +-31 0 V +854 3329 M +31 
0 V +6062 0 R +-31 0 V +854 3397 M +63 0 V +6030 0 R +-63 0 V +stroke +770 3397 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1000)] +] -46.7 MRshow +1.000 UL +LTb +854 3840 M +31 0 V +6062 0 R +-31 0 V +854 4100 M +31 0 V +6062 0 R +-31 0 V +854 4284 M +31 0 V +6062 0 R +-31 0 V +854 4427 M +31 0 V +6062 0 R +-31 0 V +854 4544 M +31 0 V +6062 0 R +-31 0 V +854 4643 M +31 0 V +6062 0 R +-31 0 V +854 4728 M +31 0 V +6062 0 R +-31 0 V +854 4804 M +31 0 V +6062 0 R +-31 0 V +854 4871 M +63 0 V +6030 0 R +-63 0 V +stroke +770 4871 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MRshow +1.000 UL +LTb +854 448 M +0 63 V +0 4360 R +0 -63 V +stroke +854 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MCshow +1.000 UL +LTb +1465 448 M +0 31 V +0 4392 R +0 -31 V +1823 448 M +0 31 V +0 4392 R +0 -31 V +2077 448 M +0 31 V +0 4392 R +0 -31 V +2274 448 M +0 31 V +0 4392 R +0 -31 V +2434 448 M +0 31 V +0 4392 R +0 -31 V +2570 448 M +0 31 V +0 4392 R +0 -31 V +2688 448 M +0 31 V +0 4392 R +0 -31 V +2792 448 M +0 31 V +0 4392 R +0 -31 V +2885 448 M +0 63 V +0 4360 R +0 -63 V +stroke +2885 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100000)] +] -46.7 MCshow +1.000 UL +LTb +3496 448 M +0 31 V +0 4392 R +0 -31 V +3854 448 M +0 31 V +0 4392 R +0 -31 V +4108 448 M +0 31 V +0 4392 R +0 -31 V +4305 448 M +0 31 V +0 4392 R +0 -31 V +4465 448 M +0 31 V +0 4392 R +0 -31 V +4601 448 M +0 31 V +0 4392 R +0 -31 V +4719 448 M +0 31 V +0 4392 R +0 -31 V +4823 448 M +0 31 V +0 4392 R +0 -31 V +4916 448 M +0 63 V +0 4360 R +0 -63 V +stroke +4916 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1e+06)] +] -46.7 MCshow +1.000 UL +LTb +5527 448 M +0 31 V +0 4392 R +0 -31 V +5885 448 M +0 31 V +0 4392 R +0 -31 V +6139 448 M +0 31 V +0 4392 R +0 -31 V +6336 448 M +0 31 V +0 4392 R +0 -31 V +6496 448 M +0 31 V +0 4392 R +0 -31 V +6632 448 M +0 31 V +0 4392 R +0 -31 V +6750 448 M +0 31 V +0 4392 R +0 -31 V +6854 448 M +0 31 V +0 4392 R +0 -31 V +6947 448 M +0 63 V +0 4360 R +0 -63 V 
+stroke +6947 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1e+07)] +] -46.7 MCshow +1.000 UL +LTb +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +LCb setrgbcolor +112 2659 M +currentpoint gsave translate -270 rotate 0 0 moveto +[ [(Helvetica) 140.0 0.0 true true 0 (Execution time in seconds)] +] -46.7 MCshow +grestore +LTb +LCb setrgbcolor +3900 98 M +[ [(Helvetica) 140.0 0.0 true true 0 (Polynomial's degrees)] +] -46.7 MCshow +LTb +1.000 UP +1.000 UL +LTb +% Begin plot #1 +1.000 UP +1.000 UL +LT0 +LCb setrgbcolor +6296 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (1 GPU)] +] -46.7 MRshow +LT0 +6380 4738 M +399 0 V +2885 1013 M +611 1154 V +612 459 V +357 593 V +254 266 V +197 374 V +161 203 V +136 104 V +2885 1013 Pls +3496 2167 Pls +4108 2626 Pls +4465 3219 Pls +4719 3485 Pls +4916 3859 Pls +5077 4062 Pls +5213 4166 Pls +6579 4738 Pls +% End plot #1 +% Begin plot #2 +1.000 UP +1.000 UL +LT1 +LCb setrgbcolor +6296 4598 M +[ [(Helvetica) 140.0 0.0 true true 0 (2 GPU)] +] -46.7 MRshow +LT1 +6380 4598 M +399 0 V +2885 746 M +611 1021 V +612 491 V +357 638 V +254 212 V +197 323 V +161 219 V +136 111 V +2885 746 Crs +3496 1767 Crs +4108 2258 Crs +4465 2896 Crs +4719 3108 Crs +4916 3431 Crs +5077 3650 Crs +5213 3761 Crs +6579 4598 Crs +% End plot #2 +% Begin plot #3 +1.000 UP +1.000 UL +LT2 +LCb setrgbcolor +6296 4458 M +[ [(Helvetica) 140.0 0.0 true true 0 (3 GPU)] +] -46.7 MRshow +LT2 +6380 4458 M +399 0 V +2885 763 M +611 867 V +612 423 V +357 673 V +254 101 V +197 331 V +161 229 V +136 136 V +2885 763 Star +3496 1630 Star +4108 2053 Star +4465 2726 Star +4719 2827 Star +4916 3158 Star +5077 3387 Star +5213 3523 Star +6579 4458 Star +% End plot #3 +% Begin plot #4 +1.000 UP +1.000 UL +LT3 +LCb setrgbcolor +6296 4318 M +[ [(Helvetica) 140.0 0.0 true true 0 (4 GPU)] +] -46.7 MRshow +LT3 +6380 4318 M +399 0 V +2885 617 M +611 882 V +612 414 V +357 689 V +254 137 V +197 263 V +161 306 V +136 33 V +2885 617 Box +3496 1499 Box +4108 1913 
Box +4465 2602 Box +4719 2739 Box +4916 3002 Box +5077 3308 Box +5213 3341 Box +6579 4318 Box +% End plot #4 +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +1.000 UP +1.000 UL +LTb +stroke +grestore +end +showpage +%%Trailer +%%DocumentFonts: Helvetica +%%Pages: 1 diff --git a/Simulations/Full_mpivsomp.eps b/Simulations/Full_mpivsomp.eps new file mode 100644 index 0000000..b5f9e19 --- /dev/null +++ b/Simulations/Full_mpivsomp.eps @@ -0,0 +1,827 @@ +%!PS-Adobe-2.0 +%%Title: Full_mpivsomp.eps +%%Creator: gnuplot 4.6 patchlevel 0 +%%CreationDate: Wed Dec 16 22:55:31 2015 +%%DocumentFonts: (atend) +%%BoundingBox: 50 50 554 770 +%%Orientation: Landscape +%%Pages: (atend) +%%EndComments +%%BeginProlog +/gnudict 256 dict def +gnudict begin +% +% The following true/false flags may be edited by hand if desired. +% The unit line width and grayscale image gamma correction may also be changed. +% +/Color false def +/Blacktext false def +/Solid false def +/Dashlength 1 def +/Landscape true def +/Level1 false def +/Rounded false def +/ClipToBoundingBox false def +/SuppressPDFMark false def +/TransparentPatterns false def +/gnulinewidth 5.000 def +/userlinewidth gnulinewidth def +/Gamma 1.0 def +/BackgroundColor {-1.000 -1.000 -1.000} def +% +/vshift -46 def +/dl1 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul sub dup 0 le { pop 0.01 } if } if +} def +/dl2 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul add } if +} def +/hpt_ 31.5 def +/vpt_ 31.5 def +/hpt hpt_ def +/vpt vpt_ def +/doclip { + ClipToBoundingBox { + newpath 50 50 moveto 554 50 lineto 554 770 lineto 50 770 lineto closepath + clip + } if +} def +% +% Gnuplot Prolog Version 4.4 (August 2010) +% +%/SuppressPDFMark true def +% +/M {moveto} bind def +/L {lineto} bind def +/R {rmoveto} bind def +/V {rlineto} bind def +/N {newpath moveto} bind def +/Z {closepath} bind def +/C {setrgbcolor} bind def +/f {rlineto fill} bind def +/g {setgray} bind def 
+/Gshow {show} def % May be redefined later in the file to support UTF-8 +/vpt2 vpt 2 mul def +/hpt2 hpt 2 mul def +/Lshow {currentpoint stroke M 0 vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Rshow {currentpoint stroke M dup stringwidth pop neg vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Cshow {currentpoint stroke M dup stringwidth pop -2 div vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/UP {dup vpt_ mul /vpt exch def hpt_ mul /hpt exch def + /hpt2 hpt 2 mul def /vpt2 vpt 2 mul def} def +/DL {Color {setrgbcolor Solid {pop []} if 0 setdash} + {pop pop pop 0 setgray Solid {pop []} if 0 setdash} ifelse} def +/BL {stroke userlinewidth 2 mul setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/AL {stroke userlinewidth 2 div setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/UL {dup gnulinewidth mul /userlinewidth exch def + dup 1 lt {pop 1} if 10 mul /udl exch def} def +/PL {stroke userlinewidth setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +3.8 setmiterlimit +% Default Line colors +/LCw {1 1 1} def +/LCb {0 0 0} def +/LCa {0 0 0} def +/LC0 {1 0 0} def +/LC1 {0 1 0} def +/LC2 {0 0 1} def +/LC3 {1 0 1} def +/LC4 {0 1 1} def +/LC5 {1 1 0} def +/LC6 {0 0 0} def +/LC7 {1 0.3 0} def +/LC8 {0.5 0.5 0.5} def +% Default Line Types +/LTw {PL [] 1 setgray} def +/LTb {BL [] LCb DL} def +/LTa {AL [1 udl mul 2 udl mul] 0 setdash LCa setrgbcolor} def +/LT0 {PL [] LC0 DL} def +/LT1 {PL [4 dl1 2 dl2] LC1 DL} def +/LT2 {PL [2 dl1 3 dl2] LC2 DL} def +/LT3 {PL [1 dl1 1.5 dl2] LC3 DL} def +/LT4 {PL [6 dl1 2 dl2 1 dl1 2 dl2] LC4 DL} def +/LT5 {PL [3 dl1 3 dl2 1 dl1 3 dl2] LC5 DL} def +/LT6 {PL [2 dl1 2 dl2 2 dl1 6 dl2] LC6 DL} def +/LT7 {PL [1 dl1 2 dl2 6 dl1 2 dl2 1 dl1 2 dl2] LC7 DL} def +/LT8 {PL [2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 4 dl2] LC8 DL} def +/Pnt {stroke [] 0 setdash gsave 1 setlinecap M 0 0 V stroke grestore} def +/Dia {stroke [] 0 setdash 2 copy vpt 
add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke + Pnt} def +/Pls {stroke [] 0 setdash vpt sub M 0 vpt2 V + currentpoint stroke M + hpt neg vpt neg R hpt2 0 V stroke + } def +/Box {stroke [] 0 setdash 2 copy exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke + Pnt} def +/Crs {stroke [] 0 setdash exch hpt sub exch vpt add M + hpt2 vpt2 neg V currentpoint stroke M + hpt2 neg 0 R hpt2 vpt2 V stroke} def +/TriU {stroke [] 0 setdash 2 copy vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke + Pnt} def +/Star {2 copy Pls Crs} def +/BoxF {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath fill} def +/TriUF {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath fill} def +/TriD {stroke [] 0 setdash 2 copy vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke + Pnt} def +/TriDF {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath fill} def +/DiaF {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath fill} def +/Pent {stroke [] 0 setdash 2 copy gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore Pnt} def +/PentF {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath fill grestore} def +/Circle {stroke [] 0 setdash 2 copy + hpt 0 360 arc stroke Pnt} def +/CircleF {stroke [] 0 setdash hpt 0 360 arc fill} def +/C0 {BL [] 0 setdash 2 copy moveto vpt 90 450 arc} bind def +/C1 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + vpt 0 360 arc closepath} bind def +/C2 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C3 {BL [] 0 setdash 2 copy 
moveto + 2 copy vpt 0 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C4 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C5 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc + 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc} bind def +/C6 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C7 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C8 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C9 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 450 arc closepath fill + vpt 0 360 arc closepath} bind def +/C10 {BL [] 0 setdash 2 copy 2 copy moveto vpt 270 360 arc closepath fill + 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C11 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C12 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C13 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C14 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 360 arc closepath fill + vpt 0 360 arc} bind def +/C15 {BL [] 0 setdash 2 copy vpt 0 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/Rec {newpath 4 2 roll moveto 1 index 0 rlineto 0 exch rlineto + neg 0 rlineto closepath} bind def +/Square {dup Rec} bind def +/Bsquare {vpt sub exch vpt sub exch vpt2 Square} bind def +/S0 {BL [] 0 setdash 2 copy moveto 0 vpt rlineto BL Bsquare} bind def +/S1 {BL [] 0 setdash 2 copy vpt Square fill Bsquare} bind def +/S2 {BL [] 0 setdash 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S3 {BL 
[] 0 setdash 2 copy exch vpt sub exch vpt2 vpt Rec fill Bsquare} bind def +/S4 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S5 {BL [] 0 setdash 2 copy 2 copy vpt Square fill + exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S6 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S7 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S8 {BL [] 0 setdash 2 copy vpt sub vpt Square fill Bsquare} bind def +/S9 {BL [] 0 setdash 2 copy vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S10 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt Square fill + Bsquare} bind def +/S11 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt2 vpt Rec fill + Bsquare} bind def +/S12 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill Bsquare} bind def +/S13 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S14 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S15 {BL [] 0 setdash 2 copy Bsquare fill Bsquare} bind def +/D0 {gsave translate 45 rotate 0 0 S0 stroke grestore} bind def +/D1 {gsave translate 45 rotate 0 0 S1 stroke grestore} bind def +/D2 {gsave translate 45 rotate 0 0 S2 stroke grestore} bind def +/D3 {gsave translate 45 rotate 0 0 S3 stroke grestore} bind def +/D4 {gsave translate 45 rotate 0 0 S4 stroke grestore} bind def +/D5 {gsave translate 45 rotate 0 0 S5 stroke grestore} bind def +/D6 {gsave translate 45 rotate 0 0 S6 stroke grestore} bind def +/D7 {gsave translate 45 rotate 0 0 S7 stroke grestore} bind def +/D8 {gsave translate 45 rotate 0 0 S8 stroke grestore} bind def +/D9 {gsave translate 45 rotate 0 0 S9 stroke grestore} bind def +/D10 {gsave translate 45 rotate 0 0 S10 stroke grestore} bind def +/D11 {gsave 
translate 45 rotate 0 0 S11 stroke grestore} bind def +/D12 {gsave translate 45 rotate 0 0 S12 stroke grestore} bind def +/D13 {gsave translate 45 rotate 0 0 S13 stroke grestore} bind def +/D14 {gsave translate 45 rotate 0 0 S14 stroke grestore} bind def +/D15 {gsave translate 45 rotate 0 0 S15 stroke grestore} bind def +/DiaE {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke} def +/BoxE {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke} def +/TriUE {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke} def +/TriDE {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke} def +/PentE {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore} def +/CircE {stroke [] 0 setdash + hpt 0 360 arc stroke} def +/Opaque {gsave closepath 1 setgray fill grestore 0 setgray closepath} def +/DiaW {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V Opaque stroke} def +/BoxW {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V Opaque stroke} def +/TriUW {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V Opaque stroke} def +/TriDW {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V Opaque stroke} def +/PentW {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + Opaque stroke grestore} def +/CircW {stroke [] 0 setdash + hpt 0 360 arc Opaque stroke} def +/BoxFill {gsave Rec 1 setgray fill grestore} def +/Density { + /Fillden exch def + currentrgbcolor + /ColB exch def /ColG exch def /ColR exch def + /ColR ColR Fillden mul Fillden sub 1 add def + /ColG ColG Fillden mul 
Fillden sub 1 add def + /ColB ColB Fillden mul Fillden sub 1 add def + ColR ColG ColB setrgbcolor} def +/BoxColFill {gsave Rec PolyFill} def +/PolyFill {gsave Density fill grestore grestore} def +/h {rlineto rlineto rlineto gsave closepath fill grestore} bind def +% +% PostScript Level 1 Pattern Fill routine for rectangles +% Usage: x y w h s a XX PatternFill +% x,y = lower left corner of box to be filled +% w,h = width and height of box +% a = angle in degrees between lines and x-axis +% XX = 0/1 for no/yes cross-hatch +% +/PatternFill {gsave /PFa [ 9 2 roll ] def + PFa 0 get PFa 2 get 2 div add PFa 1 get PFa 3 get 2 div add translate + PFa 2 get -2 div PFa 3 get -2 div PFa 2 get PFa 3 get Rec + gsave 1 setgray fill grestore clip + currentlinewidth 0.5 mul setlinewidth + /PFs PFa 2 get dup mul PFa 3 get dup mul add sqrt def + 0 0 M PFa 5 get rotate PFs -2 div dup translate + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 M 0 PFs V} for + 0 PFa 6 get ne { + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 2 1 roll M PFs 0 V} for + } if + stroke grestore} def +% +/languagelevel where + {pop languagelevel} {1} ifelse + 2 lt + {/InterpretLevel1 true def} + {/InterpretLevel1 Level1 def} + ifelse +% +% PostScript level 2 pattern fill definitions +% +/Level2PatternFill { +/Tile8x8 {/PaintType 2 /PatternType 1 /TilingType 1 /BBox [0 0 8 8] /XStep 8 /YStep 8} + bind def +/KeepColor {currentrgbcolor [/Pattern /DeviceRGB] setcolorspace} bind def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke} +>> matrix makepattern +/Pat1 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke + 0 4 M 4 8 L 8 4 L 4 0 L 0 4 L stroke} +>> matrix makepattern +/Pat2 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 0 8 L + 8 8 L 8 0 L 0 0 L fill} +>> matrix makepattern +/Pat3 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 8 M 8 -4 L + 0 12 M 12 0 L stroke} +>> matrix makepattern +/Pat4 exch 
def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 0 M 8 12 L + 0 -4 M 12 8 L stroke} +>> matrix makepattern +/Pat5 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 8 M 4 -4 L + 0 12 M 8 -4 L 4 12 M 10 0 L stroke} +>> matrix makepattern +/Pat6 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 0 M 4 12 L + 0 -4 M 8 12 L 4 -4 M 10 8 L stroke} +>> matrix makepattern +/Pat7 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 8 -2 M -4 4 L + 12 0 M -4 8 L 12 4 M 0 10 L stroke} +>> matrix makepattern +/Pat8 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 -2 M 12 4 L + -4 0 M 12 8 L -4 4 M 8 10 L stroke} +>> matrix makepattern +/Pat9 exch def +/Pattern1 {PatternBgnd KeepColor Pat1 setpattern} bind def +/Pattern2 {PatternBgnd KeepColor Pat2 setpattern} bind def +/Pattern3 {PatternBgnd KeepColor Pat3 setpattern} bind def +/Pattern4 {PatternBgnd KeepColor Landscape {Pat5} {Pat4} ifelse setpattern} bind def +/Pattern5 {PatternBgnd KeepColor Landscape {Pat4} {Pat5} ifelse setpattern} bind def +/Pattern6 {PatternBgnd KeepColor Landscape {Pat9} {Pat6} ifelse setpattern} bind def +/Pattern7 {PatternBgnd KeepColor Landscape {Pat8} {Pat7} ifelse setpattern} bind def +} def +% +% +%End of PostScript Level 2 code +% +/PatternBgnd { + TransparentPatterns {} {gsave 1 setgray fill grestore} ifelse +} def +% +% Substitute for Level 2 pattern fill codes with +% grayscale if Level 2 support is not selected. 
+% +/Level1PatternFill { +/Pattern1 {0.250 Density} bind def +/Pattern2 {0.500 Density} bind def +/Pattern3 {0.750 Density} bind def +/Pattern4 {0.125 Density} bind def +/Pattern5 {0.375 Density} bind def +/Pattern6 {0.625 Density} bind def +/Pattern7 {0.875 Density} bind def +} def +% +% Now test for support of Level 2 code +% +Level1 {Level1PatternFill} {Level2PatternFill} ifelse +% +/Symbol-Oblique /Symbol findfont [1 0 .167 1 0 0] makefont +dup length dict begin {1 index /FID eq {pop pop} {def} ifelse} forall +currentdict end definefont pop +/MFshow { + { dup 5 get 3 ge + { 5 get 3 eq {gsave} {grestore} ifelse } + {dup dup 0 get findfont exch 1 get scalefont setfont + [ currentpoint ] exch dup 2 get 0 exch R dup 5 get 2 ne {dup dup 6 + get exch 4 get {Gshow} {stringwidth pop 0 R} ifelse }if dup 5 get 0 eq + {dup 3 get {2 get neg 0 exch R pop} {pop aload pop M} ifelse} {dup 5 + get 1 eq {dup 2 get exch dup 3 get exch 6 get stringwidth pop -2 div + dup 0 R} {dup 6 get stringwidth pop -2 div 0 R 6 get + show 2 index {aload pop M neg 3 -1 roll neg R pop pop} {pop pop pop + pop aload pop M} ifelse }ifelse }ifelse } + ifelse } + forall} def +/Gswidth {dup type /stringtype eq {stringwidth} {pop (n) stringwidth} ifelse} def +/MFwidth {0 exch { dup 5 get 3 ge { 5 get 3 eq { 0 } { pop } ifelse } + {dup 3 get{dup dup 0 get findfont exch 1 get scalefont setfont + 6 get Gswidth pop add} {pop} ifelse} ifelse} forall} def +/MLshow { currentpoint stroke M + 0 exch R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MRshow { currentpoint stroke M + exch dup MFwidth neg 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MCshow { currentpoint stroke M + exch dup MFwidth -2 div 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/XYsave { [( ) 1 2 true false 3 ()] } bind def +/XYrestore { [( ) 1 2 true false 4 ()] } bind def +Level1 SuppressPDFMark or +{} { +/SDict 10 dict def 
+systemdict /pdfmark known not { + userdict /pdfmark systemdict /cleartomark get put +} if +SDict begin [ + /Title (Full_mpivsomp.eps) + /Subject (gnuplot plot) + /Creator (gnuplot 4.6 patchlevel 0) + /Author (lilia) +% /Producer (gnuplot) +% /Keywords () + /CreationDate (Wed Dec 16 22:55:31 2015) + /DOCINFO pdfmark +end +} ifelse +end +%%EndProlog +%%Page: 1 1 +gnudict begin +gsave +doclip +50 50 translate +0.100 0.100 scale +90 rotate +0 -5040 translate +0 setgray +newpath +(Helvetica) findfont 140 scalefont setfont +BackgroundColor 0 lt 3 1 roll 0 lt exch 0 lt or or not {gsave BackgroundColor C clippath fill grestore} if +1.000 UL +LTb +854 448 M +63 0 V +6030 0 R +-63 0 V +stroke +770 448 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10)] +] -46.7 MRshow +1.000 UL +LTb +854 892 M +31 0 V +6062 0 R +-31 0 V +854 1151 M +31 0 V +6062 0 R +-31 0 V +854 1336 M +31 0 V +6062 0 R +-31 0 V +854 1479 M +31 0 V +6062 0 R +-31 0 V +854 1595 M +31 0 V +6062 0 R +-31 0 V +854 1694 M +31 0 V +6062 0 R +-31 0 V +854 1779 M +31 0 V +6062 0 R +-31 0 V +854 1855 M +31 0 V +6062 0 R +-31 0 V +854 1922 M +63 0 V +6030 0 R +-63 0 V +stroke +770 1922 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100)] +] -46.7 MRshow +1.000 UL +LTb +854 2366 M +31 0 V +6062 0 R +-31 0 V +854 2626 M +31 0 V +6062 0 R +-31 0 V +854 2810 M +31 0 V +6062 0 R +-31 0 V +854 2953 M +31 0 V +6062 0 R +-31 0 V +854 3070 M +31 0 V +6062 0 R +-31 0 V +854 3168 M +31 0 V +6062 0 R +-31 0 V +854 3254 M +31 0 V +6062 0 R +-31 0 V +854 3329 M +31 0 V +6062 0 R +-31 0 V +854 3397 M +63 0 V +6030 0 R +-63 0 V +stroke +770 3397 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1000)] +] -46.7 MRshow +1.000 UL +LTb +854 3840 M +31 0 V +6062 0 R +-31 0 V +854 4100 M +31 0 V +6062 0 R +-31 0 V +854 4284 M +31 0 V +6062 0 R +-31 0 V +854 4427 M +31 0 V +6062 0 R +-31 0 V +854 4544 M +31 0 V +6062 0 R +-31 0 V +854 4643 M +31 0 V +6062 0 R +-31 0 V +854 4728 M +31 0 V +6062 0 R +-31 0 V +854 4804 M +31 0 V +6062 0 R +-31 0 V +854 4871 M 
+63 0 V +6030 0 R +-63 0 V +stroke +770 4871 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MRshow +1.000 UL +LTb +854 448 M +0 63 V +0 4360 R +0 -63 V +stroke +854 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (1)] +] -46.7 MCshow +1.000 UL +LTb +2885 448 M +0 63 V +0 4360 R +0 -63 V +stroke +2885 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (2)] +] -46.7 MCshow +1.000 UL +LTb +4916 448 M +0 63 V +0 4360 R +0 -63 V +stroke +4916 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (3)] +] -46.7 MCshow +1.000 UL +LTb +6947 448 M +0 63 V +0 4360 R +0 -63 V +stroke +6947 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (4)] +] -46.7 MCshow +1.000 UL +LTb +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +LCb setrgbcolor +112 2659 M +currentpoint gsave translate -270 rotate 0 0 moveto +[ [(Helvetica) 140.0 0.0 true true 0 (Execution time in seconds)] +] -46.7 MCshow +grestore +LTb +LCb setrgbcolor +3900 98 M +[ [(Helvetica) 140.0 0.0 true true 0 (Number of GPU)] +] -46.7 MCshow +LTb +1.000 UP +1.000 UL +LTb +% Begin plot #1 +1.000 UP +1.000 UL +LT0 +LCb setrgbcolor +6296 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (200K MPI)] +] -46.7 MRshow +LT0 +6380 4738 M +399 0 V +854 2167 M +2885 1767 L +4916 1630 L +6947 1499 L +854 2167 Pls +2885 1767 Pls +4916 1630 Pls +6947 1499 Pls +6579 4738 Pls +% End plot #1 +% Begin plot #2 +1.000 UP +1.000 UL +LT1 +LCb setrgbcolor +6296 4598 M +[ [(Helvetica) 140.0 0.0 true true 0 (200K OpenMP)] +] -46.7 MRshow +LT1 +6380 4598 M +399 0 V +854 2188 M +2885 1801 L +4916 1593 L +2031 -39 V +854 2188 Crs +2885 1801 Crs +4916 1593 Crs +6947 1554 Crs +6579 4598 Crs +% End plot #2 +% Begin plot #3 +1.000 UP +1.000 UL +LT2 +LCb setrgbcolor +6296 4458 M +[ [(Helvetica) 140.0 0.0 true true 0 (800K MPI)] +] -46.7 MRshow +LT2 +6380 4458 M +399 0 V +854 3485 M +2885 3108 L +4916 2827 L +2031 -88 V +854 3485 Star +2885 3108 Star +4916 2827 Star +6947 2739 Star +6579 4458 Star +% End plot #3 +% Begin plot #4 +1.000 UP +1.000 
UL +LT3 +LCb setrgbcolor +6296 4318 M +[ [(Helvetica) 140.0 0.0 true true 0 (800K OpenMP)] +] -46.7 MRshow +LT3 +6380 4318 M +399 0 V +854 3511 M +2885 3100 L +4916 2861 L +6947 2700 L +854 3511 Box +2885 3100 Box +4916 2861 Box +6947 2700 Box +6579 4318 Box +% End plot #4 +% Begin plot #5 +1.000 UP +1.000 UL +LT4 +LCb setrgbcolor +6296 4178 M +[ [(Helvetica) 140.0 0.0 true true 0 (1.4M MPI)] +] -46.7 MRshow +LT4 +6380 4178 M +399 0 V +854 4166 M +2885 3761 L +4916 3523 L +6947 3341 L +854 4166 BoxF +2885 3761 BoxF +4916 3523 BoxF +6947 3341 BoxF +6579 4178 BoxF +% End plot #5 +% Begin plot #6 +1.000 UP +1.000 UL +LT5 +LCb setrgbcolor +6296 4038 M +[ [(Helvetica) 140.0 0.0 true true 0 (1.4M OpenMP)] +] -46.7 MRshow +LT5 +6380 4038 M +399 0 V +854 4188 M +2885 3765 L +4916 3509 L +6947 3347 L +854 4188 Circle +2885 3765 Circle +4916 3509 Circle +6947 3347 Circle +6579 4038 Circle +% End plot #6 +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +1.000 UP +1.000 UL +LTb +stroke +grestore +end +showpage +%%Trailer +%%DocumentFonts: Helvetica +%%Pages: 1 diff --git a/Simulations/Full_openmp.eps b/Simulations/Full_openmp.eps new file mode 100644 index 0000000..d612e35 --- /dev/null +++ b/Simulations/Full_openmp.eps @@ -0,0 +1,913 @@ +%!PS-Adobe-2.0 +%%Title: Full_openmp.eps +%%Creator: gnuplot 4.6 patchlevel 0 +%%CreationDate: Wed Dec 16 22:38:26 2015 +%%DocumentFonts: (atend) +%%BoundingBox: 50 50 554 770 +%%Orientation: Landscape +%%Pages: (atend) +%%EndComments +%%BeginProlog +/gnudict 256 dict def +gnudict begin +% +% The following true/false flags may be edited by hand if desired. +% The unit line width and grayscale image gamma correction may also be changed. 
+% +/Color false def +/Blacktext false def +/Solid false def +/Dashlength 1 def +/Landscape true def +/Level1 false def +/Rounded false def +/ClipToBoundingBox false def +/SuppressPDFMark false def +/TransparentPatterns false def +/gnulinewidth 5.000 def +/userlinewidth gnulinewidth def +/Gamma 1.0 def +/BackgroundColor {-1.000 -1.000 -1.000} def +% +/vshift -46 def +/dl1 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul sub dup 0 le { pop 0.01 } if } if +} def +/dl2 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul add } if +} def +/hpt_ 31.5 def +/vpt_ 31.5 def +/hpt hpt_ def +/vpt vpt_ def +/doclip { + ClipToBoundingBox { + newpath 50 50 moveto 554 50 lineto 554 770 lineto 50 770 lineto closepath + clip + } if +} def +% +% Gnuplot Prolog Version 4.4 (August 2010) +% +%/SuppressPDFMark true def +% +/M {moveto} bind def +/L {lineto} bind def +/R {rmoveto} bind def +/V {rlineto} bind def +/N {newpath moveto} bind def +/Z {closepath} bind def +/C {setrgbcolor} bind def +/f {rlineto fill} bind def +/g {setgray} bind def +/Gshow {show} def % May be redefined later in the file to support UTF-8 +/vpt2 vpt 2 mul def +/hpt2 hpt 2 mul def +/Lshow {currentpoint stroke M 0 vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Rshow {currentpoint stroke M dup stringwidth pop neg vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Cshow {currentpoint stroke M dup stringwidth pop -2 div vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/UP {dup vpt_ mul /vpt exch def hpt_ mul /hpt exch def + /hpt2 hpt 2 mul def /vpt2 vpt 2 mul def} def +/DL {Color {setrgbcolor Solid {pop []} if 0 setdash} + {pop pop pop 0 setgray Solid {pop []} if 0 setdash} ifelse} def +/BL {stroke userlinewidth 2 mul setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/AL {stroke userlinewidth 2 div setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/UL {dup gnulinewidth mul /userlinewidth exch 
def + dup 1 lt {pop 1} if 10 mul /udl exch def} def +/PL {stroke userlinewidth setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +3.8 setmiterlimit +% Default Line colors +/LCw {1 1 1} def +/LCb {0 0 0} def +/LCa {0 0 0} def +/LC0 {1 0 0} def +/LC1 {0 1 0} def +/LC2 {0 0 1} def +/LC3 {1 0 1} def +/LC4 {0 1 1} def +/LC5 {1 1 0} def +/LC6 {0 0 0} def +/LC7 {1 0.3 0} def +/LC8 {0.5 0.5 0.5} def +% Default Line Types +/LTw {PL [] 1 setgray} def +/LTb {BL [] LCb DL} def +/LTa {AL [1 udl mul 2 udl mul] 0 setdash LCa setrgbcolor} def +/LT0 {PL [] LC0 DL} def +/LT1 {PL [4 dl1 2 dl2] LC1 DL} def +/LT2 {PL [2 dl1 3 dl2] LC2 DL} def +/LT3 {PL [1 dl1 1.5 dl2] LC3 DL} def +/LT4 {PL [6 dl1 2 dl2 1 dl1 2 dl2] LC4 DL} def +/LT5 {PL [3 dl1 3 dl2 1 dl1 3 dl2] LC5 DL} def +/LT6 {PL [2 dl1 2 dl2 2 dl1 6 dl2] LC6 DL} def +/LT7 {PL [1 dl1 2 dl2 6 dl1 2 dl2 1 dl1 2 dl2] LC7 DL} def +/LT8 {PL [2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 4 dl2] LC8 DL} def +/Pnt {stroke [] 0 setdash gsave 1 setlinecap M 0 0 V stroke grestore} def +/Dia {stroke [] 0 setdash 2 copy vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke + Pnt} def +/Pls {stroke [] 0 setdash vpt sub M 0 vpt2 V + currentpoint stroke M + hpt neg vpt neg R hpt2 0 V stroke + } def +/Box {stroke [] 0 setdash 2 copy exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke + Pnt} def +/Crs {stroke [] 0 setdash exch hpt sub exch vpt add M + hpt2 vpt2 neg V currentpoint stroke M + hpt2 neg 0 R hpt2 vpt2 V stroke} def +/TriU {stroke [] 0 setdash 2 copy vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke + Pnt} def +/Star {2 copy Pls Crs} def +/BoxF {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath fill} def +/TriUF {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath fill} def +/TriD {stroke 
[] 0 setdash 2 copy vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke + Pnt} def +/TriDF {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath fill} def +/DiaF {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath fill} def +/Pent {stroke [] 0 setdash 2 copy gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore Pnt} def +/PentF {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath fill grestore} def +/Circle {stroke [] 0 setdash 2 copy + hpt 0 360 arc stroke Pnt} def +/CircleF {stroke [] 0 setdash hpt 0 360 arc fill} def +/C0 {BL [] 0 setdash 2 copy moveto vpt 90 450 arc} bind def +/C1 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + vpt 0 360 arc closepath} bind def +/C2 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C3 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C4 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C5 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc + 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc} bind def +/C6 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C7 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C8 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C9 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 450 arc closepath fill + vpt 0 360 arc closepath} bind def +/C10 {BL [] 0 setdash 2 copy 2 copy moveto vpt 270 360 arc closepath fill + 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} 
bind def +/C11 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C12 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C13 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C14 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 360 arc closepath fill + vpt 0 360 arc} bind def +/C15 {BL [] 0 setdash 2 copy vpt 0 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/Rec {newpath 4 2 roll moveto 1 index 0 rlineto 0 exch rlineto + neg 0 rlineto closepath} bind def +/Square {dup Rec} bind def +/Bsquare {vpt sub exch vpt sub exch vpt2 Square} bind def +/S0 {BL [] 0 setdash 2 copy moveto 0 vpt rlineto BL Bsquare} bind def +/S1 {BL [] 0 setdash 2 copy vpt Square fill Bsquare} bind def +/S2 {BL [] 0 setdash 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S3 {BL [] 0 setdash 2 copy exch vpt sub exch vpt2 vpt Rec fill Bsquare} bind def +/S4 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S5 {BL [] 0 setdash 2 copy 2 copy vpt Square fill + exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S6 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S7 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S8 {BL [] 0 setdash 2 copy vpt sub vpt Square fill Bsquare} bind def +/S9 {BL [] 0 setdash 2 copy vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S10 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt Square fill + Bsquare} bind def +/S11 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt2 vpt Rec fill + Bsquare} bind def +/S12 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill 
Bsquare} bind def +/S13 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S14 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S15 {BL [] 0 setdash 2 copy Bsquare fill Bsquare} bind def +/D0 {gsave translate 45 rotate 0 0 S0 stroke grestore} bind def +/D1 {gsave translate 45 rotate 0 0 S1 stroke grestore} bind def +/D2 {gsave translate 45 rotate 0 0 S2 stroke grestore} bind def +/D3 {gsave translate 45 rotate 0 0 S3 stroke grestore} bind def +/D4 {gsave translate 45 rotate 0 0 S4 stroke grestore} bind def +/D5 {gsave translate 45 rotate 0 0 S5 stroke grestore} bind def +/D6 {gsave translate 45 rotate 0 0 S6 stroke grestore} bind def +/D7 {gsave translate 45 rotate 0 0 S7 stroke grestore} bind def +/D8 {gsave translate 45 rotate 0 0 S8 stroke grestore} bind def +/D9 {gsave translate 45 rotate 0 0 S9 stroke grestore} bind def +/D10 {gsave translate 45 rotate 0 0 S10 stroke grestore} bind def +/D11 {gsave translate 45 rotate 0 0 S11 stroke grestore} bind def +/D12 {gsave translate 45 rotate 0 0 S12 stroke grestore} bind def +/D13 {gsave translate 45 rotate 0 0 S13 stroke grestore} bind def +/D14 {gsave translate 45 rotate 0 0 S14 stroke grestore} bind def +/D15 {gsave translate 45 rotate 0 0 S15 stroke grestore} bind def +/DiaE {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke} def +/BoxE {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke} def +/TriUE {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke} def +/TriDE {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke} def +/PentE {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath 
stroke grestore} def +/CircE {stroke [] 0 setdash + hpt 0 360 arc stroke} def +/Opaque {gsave closepath 1 setgray fill grestore 0 setgray closepath} def +/DiaW {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V Opaque stroke} def +/BoxW {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V Opaque stroke} def +/TriUW {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V Opaque stroke} def +/TriDW {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V Opaque stroke} def +/PentW {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + Opaque stroke grestore} def +/CircW {stroke [] 0 setdash + hpt 0 360 arc Opaque stroke} def +/BoxFill {gsave Rec 1 setgray fill grestore} def +/Density { + /Fillden exch def + currentrgbcolor + /ColB exch def /ColG exch def /ColR exch def + /ColR ColR Fillden mul Fillden sub 1 add def + /ColG ColG Fillden mul Fillden sub 1 add def + /ColB ColB Fillden mul Fillden sub 1 add def + ColR ColG ColB setrgbcolor} def +/BoxColFill {gsave Rec PolyFill} def +/PolyFill {gsave Density fill grestore grestore} def +/h {rlineto rlineto rlineto gsave closepath fill grestore} bind def +% +% PostScript Level 1 Pattern Fill routine for rectangles +% Usage: x y w h s a XX PatternFill +% x,y = lower left corner of box to be filled +% w,h = width and height of box +% a = angle in degrees between lines and x-axis +% XX = 0/1 for no/yes cross-hatch +% +/PatternFill {gsave /PFa [ 9 2 roll ] def + PFa 0 get PFa 2 get 2 div add PFa 1 get PFa 3 get 2 div add translate + PFa 2 get -2 div PFa 3 get -2 div PFa 2 get PFa 3 get Rec + gsave 1 setgray fill grestore clip + currentlinewidth 0.5 mul setlinewidth + /PFs PFa 2 get dup mul PFa 3 get dup mul add sqrt def + 0 0 M PFa 5 get rotate PFs -2 div dup translate + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get 
mul 0 M 0 PFs V} for + 0 PFa 6 get ne { + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 2 1 roll M PFs 0 V} for + } if + stroke grestore} def +% +/languagelevel where + {pop languagelevel} {1} ifelse + 2 lt + {/InterpretLevel1 true def} + {/InterpretLevel1 Level1 def} + ifelse +% +% PostScript level 2 pattern fill definitions +% +/Level2PatternFill { +/Tile8x8 {/PaintType 2 /PatternType 1 /TilingType 1 /BBox [0 0 8 8] /XStep 8 /YStep 8} + bind def +/KeepColor {currentrgbcolor [/Pattern /DeviceRGB] setcolorspace} bind def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke} +>> matrix makepattern +/Pat1 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke + 0 4 M 4 8 L 8 4 L 4 0 L 0 4 L stroke} +>> matrix makepattern +/Pat2 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 0 8 L + 8 8 L 8 0 L 0 0 L fill} +>> matrix makepattern +/Pat3 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 8 M 8 -4 L + 0 12 M 12 0 L stroke} +>> matrix makepattern +/Pat4 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 0 M 8 12 L + 0 -4 M 12 8 L stroke} +>> matrix makepattern +/Pat5 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 8 M 4 -4 L + 0 12 M 8 -4 L 4 12 M 10 0 L stroke} +>> matrix makepattern +/Pat6 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 0 M 4 12 L + 0 -4 M 8 12 L 4 -4 M 10 8 L stroke} +>> matrix makepattern +/Pat7 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 8 -2 M -4 4 L + 12 0 M -4 8 L 12 4 M 0 10 L stroke} +>> matrix makepattern +/Pat8 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 -2 M 12 4 L + -4 0 M 12 8 L -4 4 M 8 10 L stroke} +>> matrix makepattern +/Pat9 exch def +/Pattern1 {PatternBgnd KeepColor Pat1 setpattern} bind def +/Pattern2 {PatternBgnd KeepColor Pat2 setpattern} bind def +/Pattern3 {PatternBgnd KeepColor Pat3 setpattern} bind def +/Pattern4 {PatternBgnd KeepColor Landscape {Pat5} {Pat4} ifelse setpattern} bind 
def +/Pattern5 {PatternBgnd KeepColor Landscape {Pat4} {Pat5} ifelse setpattern} bind def +/Pattern6 {PatternBgnd KeepColor Landscape {Pat9} {Pat6} ifelse setpattern} bind def +/Pattern7 {PatternBgnd KeepColor Landscape {Pat8} {Pat7} ifelse setpattern} bind def +} def +% +% +%End of PostScript Level 2 code +% +/PatternBgnd { + TransparentPatterns {} {gsave 1 setgray fill grestore} ifelse +} def +% +% Substitute for Level 2 pattern fill codes with +% grayscale if Level 2 support is not selected. +% +/Level1PatternFill { +/Pattern1 {0.250 Density} bind def +/Pattern2 {0.500 Density} bind def +/Pattern3 {0.750 Density} bind def +/Pattern4 {0.125 Density} bind def +/Pattern5 {0.375 Density} bind def +/Pattern6 {0.625 Density} bind def +/Pattern7 {0.875 Density} bind def +} def +% +% Now test for support of Level 2 code +% +Level1 {Level1PatternFill} {Level2PatternFill} ifelse +% +/Symbol-Oblique /Symbol findfont [1 0 .167 1 0 0] makefont +dup length dict begin {1 index /FID eq {pop pop} {def} ifelse} forall +currentdict end definefont pop +/MFshow { + { dup 5 get 3 ge + { 5 get 3 eq {gsave} {grestore} ifelse } + {dup dup 0 get findfont exch 1 get scalefont setfont + [ currentpoint ] exch dup 2 get 0 exch R dup 5 get 2 ne {dup dup 6 + get exch 4 get {Gshow} {stringwidth pop 0 R} ifelse }if dup 5 get 0 eq + {dup 3 get {2 get neg 0 exch R pop} {pop aload pop M} ifelse} {dup 5 + get 1 eq {dup 2 get exch dup 3 get exch 6 get stringwidth pop -2 div + dup 0 R} {dup 6 get stringwidth pop -2 div 0 R 6 get + show 2 index {aload pop M neg 3 -1 roll neg R pop pop} {pop pop pop + pop aload pop M} ifelse }ifelse }ifelse } + ifelse } + forall} def +/Gswidth {dup type /stringtype eq {stringwidth} {pop (n) stringwidth} ifelse} def +/MFwidth {0 exch { dup 5 get 3 ge { 5 get 3 eq { 0 } { pop } ifelse } + {dup 3 get{dup dup 0 get findfont exch 1 get scalefont setfont + 6 get Gswidth pop add} {pop} ifelse} ifelse} forall} def +/MLshow { currentpoint stroke M + 0 exch R + Blacktext {gsave 0 
setgray MFshow grestore} {MFshow} ifelse } bind def +/MRshow { currentpoint stroke M + exch dup MFwidth neg 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MCshow { currentpoint stroke M + exch dup MFwidth -2 div 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/XYsave { [( ) 1 2 true false 3 ()] } bind def +/XYrestore { [( ) 1 2 true false 4 ()] } bind def +Level1 SuppressPDFMark or +{} { +/SDict 10 dict def +systemdict /pdfmark known not { + userdict /pdfmark systemdict /cleartomark get put +} if +SDict begin [ + /Title (Full_openmp.eps) + /Subject (gnuplot plot) + /Creator (gnuplot 4.6 patchlevel 0) + /Author (lilia) +% /Producer (gnuplot) +% /Keywords () + /CreationDate (Wed Dec 16 22:38:26 2015) + /DOCINFO pdfmark +end +} ifelse +end +%%EndProlog +%%Page: 1 1 +gnudict begin +gsave +doclip +50 50 translate +0.100 0.100 scale +90 rotate +0 -5040 translate +0 setgray +newpath +(Helvetica) findfont 140 scalefont setfont +BackgroundColor 0 lt 3 1 roll 0 lt exch 0 lt or or not {gsave BackgroundColor C clippath fill grestore} if +1.000 UL +LTb +854 448 M +63 0 V +6030 0 R +-63 0 V +stroke +770 448 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10)] +] -46.7 MRshow +1.000 UL +LTb +854 892 M +31 0 V +6062 0 R +-31 0 V +854 1151 M +31 0 V +6062 0 R +-31 0 V +854 1336 M +31 0 V +6062 0 R +-31 0 V +854 1479 M +31 0 V +6062 0 R +-31 0 V +854 1595 M +31 0 V +6062 0 R +-31 0 V +854 1694 M +31 0 V +6062 0 R +-31 0 V +854 1779 M +31 0 V +6062 0 R +-31 0 V +854 1855 M +31 0 V +6062 0 R +-31 0 V +854 1922 M +63 0 V +6030 0 R +-63 0 V +stroke +770 1922 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100)] +] -46.7 MRshow +1.000 UL +LTb +854 2366 M +31 0 V +6062 0 R +-31 0 V +854 2626 M +31 0 V +6062 0 R +-31 0 V +854 2810 M +31 0 V +6062 0 R +-31 0 V +854 2953 M +31 0 V +6062 0 R +-31 0 V +854 3070 M +31 0 V +6062 0 R +-31 0 V +854 3168 M +31 0 V +6062 0 R +-31 0 V +854 3254 M +31 0 V +6062 0 R +-31 0 V +854 3329 M 
+31 0 V +6062 0 R +-31 0 V +854 3397 M +63 0 V +6030 0 R +-63 0 V +stroke +770 3397 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1000)] +] -46.7 MRshow +1.000 UL +LTb +854 3840 M +31 0 V +6062 0 R +-31 0 V +854 4100 M +31 0 V +6062 0 R +-31 0 V +854 4284 M +31 0 V +6062 0 R +-31 0 V +854 4427 M +31 0 V +6062 0 R +-31 0 V +854 4544 M +31 0 V +6062 0 R +-31 0 V +854 4643 M +31 0 V +6062 0 R +-31 0 V +854 4728 M +31 0 V +6062 0 R +-31 0 V +854 4804 M +31 0 V +6062 0 R +-31 0 V +854 4871 M +63 0 V +6030 0 R +-63 0 V +stroke +770 4871 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MRshow +1.000 UL +LTb +854 448 M +0 63 V +0 4360 R +0 -63 V +stroke +854 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MCshow +1.000 UL +LTb +1465 448 M +0 31 V +0 4392 R +0 -31 V +1823 448 M +0 31 V +0 4392 R +0 -31 V +2077 448 M +0 31 V +0 4392 R +0 -31 V +2274 448 M +0 31 V +0 4392 R +0 -31 V +2434 448 M +0 31 V +0 4392 R +0 -31 V +2570 448 M +0 31 V +0 4392 R +0 -31 V +2688 448 M +0 31 V +0 4392 R +0 -31 V +2792 448 M +0 31 V +0 4392 R +0 -31 V +2885 448 M +0 63 V +0 4360 R +0 -63 V +stroke +2885 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100000)] +] -46.7 MCshow +1.000 UL +LTb +3496 448 M +0 31 V +0 4392 R +0 -31 V +3854 448 M +0 31 V +0 4392 R +0 -31 V +4108 448 M +0 31 V +0 4392 R +0 -31 V +4305 448 M +0 31 V +0 4392 R +0 -31 V +4465 448 M +0 31 V +0 4392 R +0 -31 V +4601 448 M +0 31 V +0 4392 R +0 -31 V +4719 448 M +0 31 V +0 4392 R +0 -31 V +4823 448 M +0 31 V +0 4392 R +0 -31 V +4916 448 M +0 63 V +0 4360 R +0 -63 V +stroke +4916 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1e+06)] +] -46.7 MCshow +1.000 UL +LTb +5527 448 M +0 31 V +0 4392 R +0 -31 V +5885 448 M +0 31 V +0 4392 R +0 -31 V +6139 448 M +0 31 V +0 4392 R +0 -31 V +6336 448 M +0 31 V +0 4392 R +0 -31 V +6496 448 M +0 31 V +0 4392 R +0 -31 V +6632 448 M +0 31 V +0 4392 R +0 -31 V +6750 448 M +0 31 V +0 4392 R +0 -31 V +6854 448 M +0 31 V +0 4392 R +0 -31 V +6947 448 M +0 63 V +0 4360 R +0 -63 
V +stroke +6947 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1e+07)] +] -46.7 MCshow +1.000 UL +LTb +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +LCb setrgbcolor +112 2659 M +currentpoint gsave translate -270 rotate 0 0 moveto +[ [(Helvetica) 140.0 0.0 true true 0 (Execution time in seconds)] +] -46.7 MCshow +grestore +LTb +LCb setrgbcolor +3900 98 M +[ [(Helvetica) 140.0 0.0 true true 0 (Polynomial's degrees)] +] -46.7 MCshow +LTb +1.000 UP +1.000 UL +LTb +% Begin plot #1 +1.000 UP +1.000 UL +LT0 +LCb setrgbcolor +6296 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (1 GPU)] +] -46.7 MRshow +LT0 +6380 4738 M +399 0 V +2885 1017 M +611 1171 V +612 430 V +357 662 V +254 231 V +197 307 V +161 286 V +136 84 V +2885 1017 Pls +3496 2188 Pls +4108 2618 Pls +4465 3280 Pls +4719 3511 Pls +4916 3818 Pls +5077 4104 Pls +5213 4188 Pls +6579 4738 Pls +% End plot #1 +% Begin plot #2 +1.000 UP +1.000 UL +LT1 +LCb setrgbcolor +6296 4598 M +[ [(Helvetica) 140.0 0.0 true true 0 (2 GPU)] +] -46.7 MRshow +LT1 +6380 4598 M +399 0 V +2885 780 M +611 1021 V +612 428 V +357 669 V +254 202 V +197 328 V +161 265 V +136 72 V +2885 780 Crs +3496 1801 Crs +4108 2229 Crs +4465 2898 Crs +4719 3100 Crs +4916 3428 Crs +5077 3693 Crs +5213 3765 Crs +6579 4598 Crs +% End plot #2 +% Begin plot #3 +1.000 UP +1.000 UL +LT2 +LCb setrgbcolor +6296 4458 M +[ [(Helvetica) 140.0 0.0 true true 0 (3 GPU)] +] -46.7 MRshow +LT2 +6380 4458 M +399 0 V +2885 814 M +611 779 V +612 403 V +357 700 V +254 165 V +197 301 V +161 268 V +136 79 V +2885 814 Star +3496 1593 Star +4108 1996 Star +4465 2696 Star +4719 2861 Star +4916 3162 Star +5077 3430 Star +5213 3509 Star +6579 4458 Star +% End plot #3 +% Begin plot #4 +1.000 UP +1.000 UL +LT3 +LCb setrgbcolor +6296 4318 M +[ [(Helvetica) 140.0 0.0 true true 0 (4 GPU)] +] -46.7 MRshow +LT3 +6380 4318 M +399 0 V +2885 642 M +611 912 V +612 300 V +357 727 V +254 119 V +197 285 V +161 305 V +136 57 V +2885 642 Box +3496 1554 Box +4108 1854 Box 
+4465 2581 Box +4719 2700 Box +4916 2985 Box +5077 3290 Box +5213 3347 Box +6579 4318 Box +% End plot #4 +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +1.000 UP +1.000 UL +LTb +stroke +grestore +end +showpage +%%Trailer +%%DocumentFonts: Helvetica +%%Pages: 1 diff --git a/Simulations/Sparse_mpi.eps b/Simulations/Sparse_mpi.eps new file mode 100644 index 0000000..f9e6d5f --- /dev/null +++ b/Simulations/Sparse_mpi.eps @@ -0,0 +1,955 @@ +%!PS-Adobe-2.0 +%%Title: Sparse_mpi.eps +%%Creator: gnuplot 4.6 patchlevel 0 +%%CreationDate: Wed Dec 16 22:35:02 2015 +%%DocumentFonts: (atend) +%%BoundingBox: 50 50 554 770 +%%Orientation: Landscape +%%Pages: (atend) +%%EndComments +%%BeginProlog +/gnudict 256 dict def +gnudict begin +% +% The following true/false flags may be edited by hand if desired. +% The unit line width and grayscale image gamma correction may also be changed. +% +/Color false def +/Blacktext false def +/Solid false def +/Dashlength 1 def +/Landscape true def +/Level1 false def +/Rounded false def +/ClipToBoundingBox false def +/SuppressPDFMark false def +/TransparentPatterns false def +/gnulinewidth 5.000 def +/userlinewidth gnulinewidth def +/Gamma 1.0 def +/BackgroundColor {-1.000 -1.000 -1.000} def +% +/vshift -46 def +/dl1 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul sub dup 0 le { pop 0.01 } if } if +} def +/dl2 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul add } if +} def +/hpt_ 31.5 def +/vpt_ 31.5 def +/hpt hpt_ def +/vpt vpt_ def +/doclip { + ClipToBoundingBox { + newpath 50 50 moveto 554 50 lineto 554 770 lineto 50 770 lineto closepath + clip + } if +} def +% +% Gnuplot Prolog Version 4.4 (August 2010) +% +%/SuppressPDFMark true def +% +/M {moveto} bind def +/L {lineto} bind def +/R {rmoveto} bind def +/V {rlineto} bind def +/N {newpath moveto} bind def +/Z {closepath} bind def +/C {setrgbcolor} bind def +/f {rlineto fill} bind def +/g {setgray} bind def +/Gshow {show} def % 
May be redefined later in the file to support UTF-8 +/vpt2 vpt 2 mul def +/hpt2 hpt 2 mul def +/Lshow {currentpoint stroke M 0 vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Rshow {currentpoint stroke M dup stringwidth pop neg vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Cshow {currentpoint stroke M dup stringwidth pop -2 div vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/UP {dup vpt_ mul /vpt exch def hpt_ mul /hpt exch def + /hpt2 hpt 2 mul def /vpt2 vpt 2 mul def} def +/DL {Color {setrgbcolor Solid {pop []} if 0 setdash} + {pop pop pop 0 setgray Solid {pop []} if 0 setdash} ifelse} def +/BL {stroke userlinewidth 2 mul setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/AL {stroke userlinewidth 2 div setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/UL {dup gnulinewidth mul /userlinewidth exch def + dup 1 lt {pop 1} if 10 mul /udl exch def} def +/PL {stroke userlinewidth setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +3.8 setmiterlimit +% Default Line colors +/LCw {1 1 1} def +/LCb {0 0 0} def +/LCa {0 0 0} def +/LC0 {1 0 0} def +/LC1 {0 1 0} def +/LC2 {0 0 1} def +/LC3 {1 0 1} def +/LC4 {0 1 1} def +/LC5 {1 1 0} def +/LC6 {0 0 0} def +/LC7 {1 0.3 0} def +/LC8 {0.5 0.5 0.5} def +% Default Line Types +/LTw {PL [] 1 setgray} def +/LTb {BL [] LCb DL} def +/LTa {AL [1 udl mul 2 udl mul] 0 setdash LCa setrgbcolor} def +/LT0 {PL [] LC0 DL} def +/LT1 {PL [4 dl1 2 dl2] LC1 DL} def +/LT2 {PL [2 dl1 3 dl2] LC2 DL} def +/LT3 {PL [1 dl1 1.5 dl2] LC3 DL} def +/LT4 {PL [6 dl1 2 dl2 1 dl1 2 dl2] LC4 DL} def +/LT5 {PL [3 dl1 3 dl2 1 dl1 3 dl2] LC5 DL} def +/LT6 {PL [2 dl1 2 dl2 2 dl1 6 dl2] LC6 DL} def +/LT7 {PL [1 dl1 2 dl2 6 dl1 2 dl2 1 dl1 2 dl2] LC7 DL} def +/LT8 {PL [2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 4 dl2] LC8 DL} def +/Pnt {stroke [] 0 setdash gsave 1 setlinecap M 0 0 V stroke grestore} def +/Dia {stroke [] 0 setdash 2 copy vpt add M + hpt neg vpt 
neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke + Pnt} def +/Pls {stroke [] 0 setdash vpt sub M 0 vpt2 V + currentpoint stroke M + hpt neg vpt neg R hpt2 0 V stroke + } def +/Box {stroke [] 0 setdash 2 copy exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke + Pnt} def +/Crs {stroke [] 0 setdash exch hpt sub exch vpt add M + hpt2 vpt2 neg V currentpoint stroke M + hpt2 neg 0 R hpt2 vpt2 V stroke} def +/TriU {stroke [] 0 setdash 2 copy vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke + Pnt} def +/Star {2 copy Pls Crs} def +/BoxF {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath fill} def +/TriUF {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath fill} def +/TriD {stroke [] 0 setdash 2 copy vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke + Pnt} def +/TriDF {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath fill} def +/DiaF {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath fill} def +/Pent {stroke [] 0 setdash 2 copy gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore Pnt} def +/PentF {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath fill grestore} def +/Circle {stroke [] 0 setdash 2 copy + hpt 0 360 arc stroke Pnt} def +/CircleF {stroke [] 0 setdash hpt 0 360 arc fill} def +/C0 {BL [] 0 setdash 2 copy moveto vpt 90 450 arc} bind def +/C1 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + vpt 0 360 arc closepath} bind def +/C2 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C3 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 
arc closepath fill + vpt 0 360 arc closepath} bind def +/C4 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C5 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc + 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc} bind def +/C6 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C7 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C8 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C9 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 450 arc closepath fill + vpt 0 360 arc closepath} bind def +/C10 {BL [] 0 setdash 2 copy 2 copy moveto vpt 270 360 arc closepath fill + 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C11 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C12 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C13 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C14 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 360 arc closepath fill + vpt 0 360 arc} bind def +/C15 {BL [] 0 setdash 2 copy vpt 0 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/Rec {newpath 4 2 roll moveto 1 index 0 rlineto 0 exch rlineto + neg 0 rlineto closepath} bind def +/Square {dup Rec} bind def +/Bsquare {vpt sub exch vpt sub exch vpt2 Square} bind def +/S0 {BL [] 0 setdash 2 copy moveto 0 vpt rlineto BL Bsquare} bind def +/S1 {BL [] 0 setdash 2 copy vpt Square fill Bsquare} bind def +/S2 {BL [] 0 setdash 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S3 {BL [] 0 setdash 2 copy exch 
vpt sub exch vpt2 vpt Rec fill Bsquare} bind def +/S4 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S5 {BL [] 0 setdash 2 copy 2 copy vpt Square fill + exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S6 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S7 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S8 {BL [] 0 setdash 2 copy vpt sub vpt Square fill Bsquare} bind def +/S9 {BL [] 0 setdash 2 copy vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S10 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt Square fill + Bsquare} bind def +/S11 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt2 vpt Rec fill + Bsquare} bind def +/S12 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill Bsquare} bind def +/S13 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S14 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S15 {BL [] 0 setdash 2 copy Bsquare fill Bsquare} bind def +/D0 {gsave translate 45 rotate 0 0 S0 stroke grestore} bind def +/D1 {gsave translate 45 rotate 0 0 S1 stroke grestore} bind def +/D2 {gsave translate 45 rotate 0 0 S2 stroke grestore} bind def +/D3 {gsave translate 45 rotate 0 0 S3 stroke grestore} bind def +/D4 {gsave translate 45 rotate 0 0 S4 stroke grestore} bind def +/D5 {gsave translate 45 rotate 0 0 S5 stroke grestore} bind def +/D6 {gsave translate 45 rotate 0 0 S6 stroke grestore} bind def +/D7 {gsave translate 45 rotate 0 0 S7 stroke grestore} bind def +/D8 {gsave translate 45 rotate 0 0 S8 stroke grestore} bind def +/D9 {gsave translate 45 rotate 0 0 S9 stroke grestore} bind def +/D10 {gsave translate 45 rotate 0 0 S10 stroke grestore} bind def +/D11 {gsave translate 45 rotate 0 0 S11 
stroke grestore} bind def +/D12 {gsave translate 45 rotate 0 0 S12 stroke grestore} bind def +/D13 {gsave translate 45 rotate 0 0 S13 stroke grestore} bind def +/D14 {gsave translate 45 rotate 0 0 S14 stroke grestore} bind def +/D15 {gsave translate 45 rotate 0 0 S15 stroke grestore} bind def +/DiaE {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke} def +/BoxE {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke} def +/TriUE {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke} def +/TriDE {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke} def +/PentE {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore} def +/CircE {stroke [] 0 setdash + hpt 0 360 arc stroke} def +/Opaque {gsave closepath 1 setgray fill grestore 0 setgray closepath} def +/DiaW {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V Opaque stroke} def +/BoxW {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V Opaque stroke} def +/TriUW {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V Opaque stroke} def +/TriDW {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V Opaque stroke} def +/PentW {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + Opaque stroke grestore} def +/CircW {stroke [] 0 setdash + hpt 0 360 arc Opaque stroke} def +/BoxFill {gsave Rec 1 setgray fill grestore} def +/Density { + /Fillden exch def + currentrgbcolor + /ColB exch def /ColG exch def /ColR exch def + /ColR ColR Fillden mul Fillden sub 1 add def + /ColG ColG Fillden mul Fillden sub 1 add def + /ColB 
ColB Fillden mul Fillden sub 1 add def + ColR ColG ColB setrgbcolor} def +/BoxColFill {gsave Rec PolyFill} def +/PolyFill {gsave Density fill grestore grestore} def +/h {rlineto rlineto rlineto gsave closepath fill grestore} bind def +% +% PostScript Level 1 Pattern Fill routine for rectangles +% Usage: x y w h s a XX PatternFill +% x,y = lower left corner of box to be filled +% w,h = width and height of box +% a = angle in degrees between lines and x-axis +% XX = 0/1 for no/yes cross-hatch +% +/PatternFill {gsave /PFa [ 9 2 roll ] def + PFa 0 get PFa 2 get 2 div add PFa 1 get PFa 3 get 2 div add translate + PFa 2 get -2 div PFa 3 get -2 div PFa 2 get PFa 3 get Rec + gsave 1 setgray fill grestore clip + currentlinewidth 0.5 mul setlinewidth + /PFs PFa 2 get dup mul PFa 3 get dup mul add sqrt def + 0 0 M PFa 5 get rotate PFs -2 div dup translate + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 M 0 PFs V} for + 0 PFa 6 get ne { + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 2 1 roll M PFs 0 V} for + } if + stroke grestore} def +% +/languagelevel where + {pop languagelevel} {1} ifelse + 2 lt + {/InterpretLevel1 true def} + {/InterpretLevel1 Level1 def} + ifelse +% +% PostScript level 2 pattern fill definitions +% +/Level2PatternFill { +/Tile8x8 {/PaintType 2 /PatternType 1 /TilingType 1 /BBox [0 0 8 8] /XStep 8 /YStep 8} + bind def +/KeepColor {currentrgbcolor [/Pattern /DeviceRGB] setcolorspace} bind def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke} +>> matrix makepattern +/Pat1 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke + 0 4 M 4 8 L 8 4 L 4 0 L 0 4 L stroke} +>> matrix makepattern +/Pat2 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 0 8 L + 8 8 L 8 0 L 0 0 L fill} +>> matrix makepattern +/Pat3 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 8 M 8 -4 L + 0 12 M 12 0 L stroke} +>> matrix makepattern +/Pat4 exch def +<< Tile8x8 + /PaintProc 
{0.5 setlinewidth pop -4 0 M 8 12 L + 0 -4 M 12 8 L stroke} +>> matrix makepattern +/Pat5 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 8 M 4 -4 L + 0 12 M 8 -4 L 4 12 M 10 0 L stroke} +>> matrix makepattern +/Pat6 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 0 M 4 12 L + 0 -4 M 8 12 L 4 -4 M 10 8 L stroke} +>> matrix makepattern +/Pat7 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 8 -2 M -4 4 L + 12 0 M -4 8 L 12 4 M 0 10 L stroke} +>> matrix makepattern +/Pat8 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 -2 M 12 4 L + -4 0 M 12 8 L -4 4 M 8 10 L stroke} +>> matrix makepattern +/Pat9 exch def +/Pattern1 {PatternBgnd KeepColor Pat1 setpattern} bind def +/Pattern2 {PatternBgnd KeepColor Pat2 setpattern} bind def +/Pattern3 {PatternBgnd KeepColor Pat3 setpattern} bind def +/Pattern4 {PatternBgnd KeepColor Landscape {Pat5} {Pat4} ifelse setpattern} bind def +/Pattern5 {PatternBgnd KeepColor Landscape {Pat4} {Pat5} ifelse setpattern} bind def +/Pattern6 {PatternBgnd KeepColor Landscape {Pat9} {Pat6} ifelse setpattern} bind def +/Pattern7 {PatternBgnd KeepColor Landscape {Pat8} {Pat7} ifelse setpattern} bind def +} def +% +% +%End of PostScript Level 2 code +% +/PatternBgnd { + TransparentPatterns {} {gsave 1 setgray fill grestore} ifelse +} def +% +% Substitute for Level 2 pattern fill codes with +% grayscale if Level 2 support is not selected. 
+% +/Level1PatternFill { +/Pattern1 {0.250 Density} bind def +/Pattern2 {0.500 Density} bind def +/Pattern3 {0.750 Density} bind def +/Pattern4 {0.125 Density} bind def +/Pattern5 {0.375 Density} bind def +/Pattern6 {0.625 Density} bind def +/Pattern7 {0.875 Density} bind def +} def +% +% Now test for support of Level 2 code +% +Level1 {Level1PatternFill} {Level2PatternFill} ifelse +% +/Symbol-Oblique /Symbol findfont [1 0 .167 1 0 0] makefont +dup length dict begin {1 index /FID eq {pop pop} {def} ifelse} forall +currentdict end definefont pop +/MFshow { + { dup 5 get 3 ge + { 5 get 3 eq {gsave} {grestore} ifelse } + {dup dup 0 get findfont exch 1 get scalefont setfont + [ currentpoint ] exch dup 2 get 0 exch R dup 5 get 2 ne {dup dup 6 + get exch 4 get {Gshow} {stringwidth pop 0 R} ifelse }if dup 5 get 0 eq + {dup 3 get {2 get neg 0 exch R pop} {pop aload pop M} ifelse} {dup 5 + get 1 eq {dup 2 get exch dup 3 get exch 6 get stringwidth pop -2 div + dup 0 R} {dup 6 get stringwidth pop -2 div 0 R 6 get + show 2 index {aload pop M neg 3 -1 roll neg R pop pop} {pop pop pop + pop aload pop M} ifelse }ifelse }ifelse } + ifelse } + forall} def +/Gswidth {dup type /stringtype eq {stringwidth} {pop (n) stringwidth} ifelse} def +/MFwidth {0 exch { dup 5 get 3 ge { 5 get 3 eq { 0 } { pop } ifelse } + {dup 3 get{dup dup 0 get findfont exch 1 get scalefont setfont + 6 get Gswidth pop add} {pop} ifelse} ifelse} forall} def +/MLshow { currentpoint stroke M + 0 exch R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MRshow { currentpoint stroke M + exch dup MFwidth neg 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MCshow { currentpoint stroke M + exch dup MFwidth -2 div 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/XYsave { [( ) 1 2 true false 3 ()] } bind def +/XYrestore { [( ) 1 2 true false 4 ()] } bind def +Level1 SuppressPDFMark or +{} { +/SDict 10 dict def 
+systemdict /pdfmark known not { + userdict /pdfmark systemdict /cleartomark get put +} if +SDict begin [ + /Title (Sparse_mpi.eps) + /Subject (gnuplot plot) + /Creator (gnuplot 4.6 patchlevel 0) + /Author (lilia) +% /Producer (gnuplot) +% /Keywords () + /CreationDate (Wed Dec 16 22:35:02 2015) + /DOCINFO pdfmark +end +} ifelse +end +%%EndProlog +%%Page: 1 1 +gnudict begin +gsave +doclip +50 50 translate +0.100 0.100 scale +90 rotate +0 -5040 translate +0 setgray +newpath +(Helvetica) findfont 140 scalefont setfont +BackgroundColor 0 lt 3 1 roll 0 lt exch 0 lt or or not {gsave BackgroundColor C clippath fill grestore} if +1.000 UL +LTb +854 448 M +63 0 V +6030 0 R +-63 0 V +stroke +770 448 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1)] +] -46.7 MRshow +1.000 UL +LTb +854 781 M +31 0 V +6062 0 R +-31 0 V +854 976 M +31 0 V +6062 0 R +-31 0 V +854 1114 M +31 0 V +6062 0 R +-31 0 V +854 1221 M +31 0 V +6062 0 R +-31 0 V +854 1308 M +31 0 V +6062 0 R +-31 0 V +854 1382 M +31 0 V +6062 0 R +-31 0 V +854 1447 M +31 0 V +6062 0 R +-31 0 V +854 1503 M +31 0 V +6062 0 R +-31 0 V +854 1554 M +63 0 V +6030 0 R +-63 0 V +stroke +770 1554 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10)] +] -46.7 MRshow +1.000 UL +LTb +854 1887 M +31 0 V +6062 0 R +-31 0 V +854 2081 M +31 0 V +6062 0 R +-31 0 V +854 2219 M +31 0 V +6062 0 R +-31 0 V +854 2327 M +31 0 V +6062 0 R +-31 0 V +854 2414 M +31 0 V +6062 0 R +-31 0 V +854 2488 M +31 0 V +6062 0 R +-31 0 V +854 2552 M +31 0 V +6062 0 R +-31 0 V +854 2609 M +31 0 V +6062 0 R +-31 0 V +854 2660 M +63 0 V +6030 0 R +-63 0 V +stroke +770 2660 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100)] +] -46.7 MRshow +1.000 UL +LTb +854 2992 M +31 0 V +6062 0 R +-31 0 V +854 3187 M +31 0 V +6062 0 R +-31 0 V +854 3325 M +31 0 V +6062 0 R +-31 0 V +854 3432 M +31 0 V +6062 0 R +-31 0 V +854 3520 M +31 0 V +6062 0 R +-31 0 V +854 3594 M +31 0 V +6062 0 R +-31 0 V +854 3658 M +31 0 V +6062 0 R +-31 0 V +854 3715 M +31 0 V +6062 0 R +-31 0 V +854 3765 M +63 0 
V +6030 0 R +-63 0 V +stroke +770 3765 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1000)] +] -46.7 MRshow +1.000 UL +LTb +854 4098 M +31 0 V +6062 0 R +-31 0 V +854 4293 M +31 0 V +6062 0 R +-31 0 V +854 4431 M +31 0 V +6062 0 R +-31 0 V +854 4538 M +31 0 V +6062 0 R +-31 0 V +854 4626 M +31 0 V +6062 0 R +-31 0 V +854 4700 M +31 0 V +6062 0 R +-31 0 V +854 4764 M +31 0 V +6062 0 R +-31 0 V +854 4820 M +31 0 V +6062 0 R +-31 0 V +854 4871 M +63 0 V +6030 0 R +-63 0 V +stroke +770 4871 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MRshow +1.000 UL +LTb +854 448 M +0 63 V +0 4360 R +0 -63 V +stroke +854 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MCshow +1.000 UL +LTb +1465 448 M +0 31 V +0 4392 R +0 -31 V +1823 448 M +0 31 V +0 4392 R +0 -31 V +2077 448 M +0 31 V +0 4392 R +0 -31 V +2274 448 M +0 31 V +0 4392 R +0 -31 V +2434 448 M +0 31 V +0 4392 R +0 -31 V +2570 448 M +0 31 V +0 4392 R +0 -31 V +2688 448 M +0 31 V +0 4392 R +0 -31 V +2792 448 M +0 31 V +0 4392 R +0 -31 V +2885 448 M +0 63 V +0 4360 R +0 -63 V +stroke +2885 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100000)] +] -46.7 MCshow +1.000 UL +LTb +3496 448 M +0 31 V +0 4392 R +0 -31 V +3854 448 M +0 31 V +0 4392 R +0 -31 V +4108 448 M +0 31 V +0 4392 R +0 -31 V +4305 448 M +0 31 V +0 4392 R +0 -31 V +4465 448 M +0 31 V +0 4392 R +0 -31 V +4601 448 M +0 31 V +0 4392 R +0 -31 V +4719 448 M +0 31 V +0 4392 R +0 -31 V +4823 448 M +0 31 V +0 4392 R +0 -31 V +4916 448 M +0 63 V +0 4360 R +0 -63 V +stroke +4916 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1e+06)] +] -46.7 MCshow +1.000 UL +LTb +5527 448 M +0 31 V +0 4392 R +0 -31 V +5885 448 M +0 31 V +0 4392 R +0 -31 V +6139 448 M +0 31 V +0 4392 R +0 -31 V +6336 448 M +0 31 V +0 4392 R +0 -31 V +6496 448 M +0 31 V +0 4392 R +0 -31 V +6632 448 M +0 31 V +0 4392 R +0 -31 V +6750 448 M +0 31 V +0 4392 R +0 -31 V +6854 448 M +0 31 V +0 4392 R +0 -31 V +6947 448 M +0 63 V +0 4360 R +0 -63 V +stroke +6947 308 M +[ [(Helvetica) 140.0 
0.0 true true 0 ( 1e+07)] +] -46.7 MCshow +1.000 UL +LTb +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +LCb setrgbcolor +112 2659 M +currentpoint gsave translate -270 rotate 0 0 moveto +[ [(Helvetica) 140.0 0.0 true true 0 (Execution time in seconds)] +] -46.7 MCshow +grestore +LTb +LCb setrgbcolor +3900 98 M +[ [(Helvetica) 140.0 0.0 true true 0 (Polynomial's degrees)] +] -46.7 MCshow +LTb +1.000 UP +1.000 UL +LTb +% Begin plot #1 +1.000 UP +1.000 UL +LT0 +LCb setrgbcolor +6296 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (1 GPU)] +] -46.7 MRshow +LT0 +6380 4738 M +399 0 V +2885 1782 M +611 660 V +612 942 V +357 171 V +254 453 V +197 312 V +161 100 V +136 -92 V +2885 1782 Pls +3496 2442 Pls +4108 3384 Pls +4465 3555 Pls +4719 4008 Pls +4916 4320 Pls +5077 4420 Pls +5213 4328 Pls +6579 4738 Pls +% End plot #1 +% Begin plot #2 +1.000 UP +1.000 UL +LT1 +LCb setrgbcolor +6296 4598 M +[ [(Helvetica) 140.0 0.0 true true 0 (2 GPU)] +] -46.7 MRshow +LT1 +6380 4598 M +399 0 V +2885 1484 M +611 747 V +612 525 V +357 426 V +254 443 V +197 41 V +161 339 V +136 91 V +2885 1484 Crs +3496 2231 Crs +4108 2756 Crs +4465 3182 Crs +4719 3625 Crs +4916 3666 Crs +5077 4005 Crs +5213 4096 Crs +6579 4598 Crs +% End plot #2 +% Begin plot #3 +1.000 UP +1.000 UL +LT2 +LCb setrgbcolor +6296 4458 M +[ [(Helvetica) 140.0 0.0 true true 0 (3 GPU)] +] -46.7 MRshow +LT2 +6380 4458 M +399 0 V +2885 1391 M +611 823 V +612 345 V +357 418 V +254 497 V +197 -2 V +161 524 V +136 26 V +2885 1391 Star +3496 2214 Star +4108 2559 Star +4465 2977 Star +4719 3474 Star +4916 3472 Star +5077 3996 Star +5213 4022 Star +6579 4458 Star +% End plot #3 +% Begin plot #4 +1.000 UP +1.000 UL +LT3 +LCb setrgbcolor +6296 4318 M +[ [(Helvetica) 140.0 0.0 true true 0 (4 GPU)] +] -46.7 MRshow +LT3 +6380 4318 M +399 0 V +2885 1181 M +611 742 V +612 519 V +357 423 V +254 293 V +197 213 V +161 666 V +136 -84 V +2885 1181 Box +3496 1923 Box +4108 2442 Box +4465 2865 Box +4719 3158 Box +4916 
3371 Box +5077 4037 Box +5213 3953 Box +6579 4318 Box +% End plot #4 +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +1.000 UP +1.000 UL +LTb +stroke +grestore +end +showpage +%%Trailer +%%DocumentFonts: Helvetica +%%Pages: 1 diff --git a/Simulations/Sparse_mpivsomp.eps b/Simulations/Sparse_mpivsomp.eps new file mode 100644 index 0000000..8a99ac7 --- /dev/null +++ b/Simulations/Sparse_mpivsomp.eps @@ -0,0 +1,827 @@ +%!PS-Adobe-2.0 +%%Title: Sparse_mpivsomp.eps +%%Creator: gnuplot 4.6 patchlevel 0 +%%CreationDate: Wed Dec 16 22:52:50 2015 +%%DocumentFonts: (atend) +%%BoundingBox: 50 50 554 770 +%%Orientation: Landscape +%%Pages: (atend) +%%EndComments +%%BeginProlog +/gnudict 256 dict def +gnudict begin +% +% The following true/false flags may be edited by hand if desired. +% The unit line width and grayscale image gamma correction may also be changed. +% +/Color false def +/Blacktext false def +/Solid false def +/Dashlength 1 def +/Landscape true def +/Level1 false def +/Rounded false def +/ClipToBoundingBox false def +/SuppressPDFMark false def +/TransparentPatterns false def +/gnulinewidth 5.000 def +/userlinewidth gnulinewidth def +/Gamma 1.0 def +/BackgroundColor {-1.000 -1.000 -1.000} def +% +/vshift -46 def +/dl1 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul sub dup 0 le { pop 0.01 } if } if +} def +/dl2 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul add } if +} def +/hpt_ 31.5 def +/vpt_ 31.5 def +/hpt hpt_ def +/vpt vpt_ def +/doclip { + ClipToBoundingBox { + newpath 50 50 moveto 554 50 lineto 554 770 lineto 50 770 lineto closepath + clip + } if +} def +% +% Gnuplot Prolog Version 4.4 (August 2010) +% +%/SuppressPDFMark true def +% +/M {moveto} bind def +/L {lineto} bind def +/R {rmoveto} bind def +/V {rlineto} bind def +/N {newpath moveto} bind def +/Z {closepath} bind def +/C {setrgbcolor} bind def +/f {rlineto fill} bind def +/g {setgray} bind def +/Gshow {show} def % May be redefined 
later in the file to support UTF-8 +/vpt2 vpt 2 mul def +/hpt2 hpt 2 mul def +/Lshow {currentpoint stroke M 0 vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Rshow {currentpoint stroke M dup stringwidth pop neg vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Cshow {currentpoint stroke M dup stringwidth pop -2 div vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/UP {dup vpt_ mul /vpt exch def hpt_ mul /hpt exch def + /hpt2 hpt 2 mul def /vpt2 vpt 2 mul def} def +/DL {Color {setrgbcolor Solid {pop []} if 0 setdash} + {pop pop pop 0 setgray Solid {pop []} if 0 setdash} ifelse} def +/BL {stroke userlinewidth 2 mul setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/AL {stroke userlinewidth 2 div setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/UL {dup gnulinewidth mul /userlinewidth exch def + dup 1 lt {pop 1} if 10 mul /udl exch def} def +/PL {stroke userlinewidth setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +3.8 setmiterlimit +% Default Line colors +/LCw {1 1 1} def +/LCb {0 0 0} def +/LCa {0 0 0} def +/LC0 {1 0 0} def +/LC1 {0 1 0} def +/LC2 {0 0 1} def +/LC3 {1 0 1} def +/LC4 {0 1 1} def +/LC5 {1 1 0} def +/LC6 {0 0 0} def +/LC7 {1 0.3 0} def +/LC8 {0.5 0.5 0.5} def +% Default Line Types +/LTw {PL [] 1 setgray} def +/LTb {BL [] LCb DL} def +/LTa {AL [1 udl mul 2 udl mul] 0 setdash LCa setrgbcolor} def +/LT0 {PL [] LC0 DL} def +/LT1 {PL [4 dl1 2 dl2] LC1 DL} def +/LT2 {PL [2 dl1 3 dl2] LC2 DL} def +/LT3 {PL [1 dl1 1.5 dl2] LC3 DL} def +/LT4 {PL [6 dl1 2 dl2 1 dl1 2 dl2] LC4 DL} def +/LT5 {PL [3 dl1 3 dl2 1 dl1 3 dl2] LC5 DL} def +/LT6 {PL [2 dl1 2 dl2 2 dl1 6 dl2] LC6 DL} def +/LT7 {PL [1 dl1 2 dl2 6 dl1 2 dl2 1 dl1 2 dl2] LC7 DL} def +/LT8 {PL [2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 4 dl2] LC8 DL} def +/Pnt {stroke [] 0 setdash gsave 1 setlinecap M 0 0 V stroke grestore} def +/Dia {stroke [] 0 setdash 2 copy vpt add M + hpt neg vpt neg V hpt vpt neg 
V + hpt vpt V hpt neg vpt V closepath stroke + Pnt} def +/Pls {stroke [] 0 setdash vpt sub M 0 vpt2 V + currentpoint stroke M + hpt neg vpt neg R hpt2 0 V stroke + } def +/Box {stroke [] 0 setdash 2 copy exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke + Pnt} def +/Crs {stroke [] 0 setdash exch hpt sub exch vpt add M + hpt2 vpt2 neg V currentpoint stroke M + hpt2 neg 0 R hpt2 vpt2 V stroke} def +/TriU {stroke [] 0 setdash 2 copy vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke + Pnt} def +/Star {2 copy Pls Crs} def +/BoxF {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath fill} def +/TriUF {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath fill} def +/TriD {stroke [] 0 setdash 2 copy vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke + Pnt} def +/TriDF {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath fill} def +/DiaF {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath fill} def +/Pent {stroke [] 0 setdash 2 copy gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore Pnt} def +/PentF {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath fill grestore} def +/Circle {stroke [] 0 setdash 2 copy + hpt 0 360 arc stroke Pnt} def +/CircleF {stroke [] 0 setdash hpt 0 360 arc fill} def +/C0 {BL [] 0 setdash 2 copy moveto vpt 90 450 arc} bind def +/C1 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + vpt 0 360 arc closepath} bind def +/C2 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C3 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath 
fill + vpt 0 360 arc closepath} bind def +/C4 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C5 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc + 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc} bind def +/C6 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C7 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C8 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C9 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 450 arc closepath fill + vpt 0 360 arc closepath} bind def +/C10 {BL [] 0 setdash 2 copy 2 copy moveto vpt 270 360 arc closepath fill + 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C11 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C12 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C13 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C14 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 360 arc closepath fill + vpt 0 360 arc} bind def +/C15 {BL [] 0 setdash 2 copy vpt 0 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/Rec {newpath 4 2 roll moveto 1 index 0 rlineto 0 exch rlineto + neg 0 rlineto closepath} bind def +/Square {dup Rec} bind def +/Bsquare {vpt sub exch vpt sub exch vpt2 Square} bind def +/S0 {BL [] 0 setdash 2 copy moveto 0 vpt rlineto BL Bsquare} bind def +/S1 {BL [] 0 setdash 2 copy vpt Square fill Bsquare} bind def +/S2 {BL [] 0 setdash 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S3 {BL [] 0 setdash 2 copy exch vpt sub exch 
vpt2 vpt Rec fill Bsquare} bind def +/S4 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S5 {BL [] 0 setdash 2 copy 2 copy vpt Square fill + exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S6 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S7 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S8 {BL [] 0 setdash 2 copy vpt sub vpt Square fill Bsquare} bind def +/S9 {BL [] 0 setdash 2 copy vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S10 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt Square fill + Bsquare} bind def +/S11 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt2 vpt Rec fill + Bsquare} bind def +/S12 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill Bsquare} bind def +/S13 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S14 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S15 {BL [] 0 setdash 2 copy Bsquare fill Bsquare} bind def +/D0 {gsave translate 45 rotate 0 0 S0 stroke grestore} bind def +/D1 {gsave translate 45 rotate 0 0 S1 stroke grestore} bind def +/D2 {gsave translate 45 rotate 0 0 S2 stroke grestore} bind def +/D3 {gsave translate 45 rotate 0 0 S3 stroke grestore} bind def +/D4 {gsave translate 45 rotate 0 0 S4 stroke grestore} bind def +/D5 {gsave translate 45 rotate 0 0 S5 stroke grestore} bind def +/D6 {gsave translate 45 rotate 0 0 S6 stroke grestore} bind def +/D7 {gsave translate 45 rotate 0 0 S7 stroke grestore} bind def +/D8 {gsave translate 45 rotate 0 0 S8 stroke grestore} bind def +/D9 {gsave translate 45 rotate 0 0 S9 stroke grestore} bind def +/D10 {gsave translate 45 rotate 0 0 S10 stroke grestore} bind def +/D11 {gsave translate 45 rotate 0 0 S11 stroke 
grestore} bind def +/D12 {gsave translate 45 rotate 0 0 S12 stroke grestore} bind def +/D13 {gsave translate 45 rotate 0 0 S13 stroke grestore} bind def +/D14 {gsave translate 45 rotate 0 0 S14 stroke grestore} bind def +/D15 {gsave translate 45 rotate 0 0 S15 stroke grestore} bind def +/DiaE {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke} def +/BoxE {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke} def +/TriUE {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke} def +/TriDE {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke} def +/PentE {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore} def +/CircE {stroke [] 0 setdash + hpt 0 360 arc stroke} def +/Opaque {gsave closepath 1 setgray fill grestore 0 setgray closepath} def +/DiaW {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V Opaque stroke} def +/BoxW {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V Opaque stroke} def +/TriUW {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V Opaque stroke} def +/TriDW {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V Opaque stroke} def +/PentW {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + Opaque stroke grestore} def +/CircW {stroke [] 0 setdash + hpt 0 360 arc Opaque stroke} def +/BoxFill {gsave Rec 1 setgray fill grestore} def +/Density { + /Fillden exch def + currentrgbcolor + /ColB exch def /ColG exch def /ColR exch def + /ColR ColR Fillden mul Fillden sub 1 add def + /ColG ColG Fillden mul Fillden sub 1 add def + /ColB ColB 
Fillden mul Fillden sub 1 add def + ColR ColG ColB setrgbcolor} def +/BoxColFill {gsave Rec PolyFill} def +/PolyFill {gsave Density fill grestore grestore} def +/h {rlineto rlineto rlineto gsave closepath fill grestore} bind def +% +% PostScript Level 1 Pattern Fill routine for rectangles +% Usage: x y w h s a XX PatternFill +% x,y = lower left corner of box to be filled +% w,h = width and height of box +% a = angle in degrees between lines and x-axis +% XX = 0/1 for no/yes cross-hatch +% +/PatternFill {gsave /PFa [ 9 2 roll ] def + PFa 0 get PFa 2 get 2 div add PFa 1 get PFa 3 get 2 div add translate + PFa 2 get -2 div PFa 3 get -2 div PFa 2 get PFa 3 get Rec + gsave 1 setgray fill grestore clip + currentlinewidth 0.5 mul setlinewidth + /PFs PFa 2 get dup mul PFa 3 get dup mul add sqrt def + 0 0 M PFa 5 get rotate PFs -2 div dup translate + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 M 0 PFs V} for + 0 PFa 6 get ne { + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 2 1 roll M PFs 0 V} for + } if + stroke grestore} def +% +/languagelevel where + {pop languagelevel} {1} ifelse + 2 lt + {/InterpretLevel1 true def} + {/InterpretLevel1 Level1 def} + ifelse +% +% PostScript level 2 pattern fill definitions +% +/Level2PatternFill { +/Tile8x8 {/PaintType 2 /PatternType 1 /TilingType 1 /BBox [0 0 8 8] /XStep 8 /YStep 8} + bind def +/KeepColor {currentrgbcolor [/Pattern /DeviceRGB] setcolorspace} bind def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke} +>> matrix makepattern +/Pat1 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke + 0 4 M 4 8 L 8 4 L 4 0 L 0 4 L stroke} +>> matrix makepattern +/Pat2 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 0 8 L + 8 8 L 8 0 L 0 0 L fill} +>> matrix makepattern +/Pat3 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 8 M 8 -4 L + 0 12 M 12 0 L stroke} +>> matrix makepattern +/Pat4 exch def +<< Tile8x8 + /PaintProc {0.5 
setlinewidth pop -4 0 M 8 12 L + 0 -4 M 12 8 L stroke} +>> matrix makepattern +/Pat5 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 8 M 4 -4 L + 0 12 M 8 -4 L 4 12 M 10 0 L stroke} +>> matrix makepattern +/Pat6 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 0 M 4 12 L + 0 -4 M 8 12 L 4 -4 M 10 8 L stroke} +>> matrix makepattern +/Pat7 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 8 -2 M -4 4 L + 12 0 M -4 8 L 12 4 M 0 10 L stroke} +>> matrix makepattern +/Pat8 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 -2 M 12 4 L + -4 0 M 12 8 L -4 4 M 8 10 L stroke} +>> matrix makepattern +/Pat9 exch def +/Pattern1 {PatternBgnd KeepColor Pat1 setpattern} bind def +/Pattern2 {PatternBgnd KeepColor Pat2 setpattern} bind def +/Pattern3 {PatternBgnd KeepColor Pat3 setpattern} bind def +/Pattern4 {PatternBgnd KeepColor Landscape {Pat5} {Pat4} ifelse setpattern} bind def +/Pattern5 {PatternBgnd KeepColor Landscape {Pat4} {Pat5} ifelse setpattern} bind def +/Pattern6 {PatternBgnd KeepColor Landscape {Pat9} {Pat6} ifelse setpattern} bind def +/Pattern7 {PatternBgnd KeepColor Landscape {Pat8} {Pat7} ifelse setpattern} bind def +} def +% +% +%End of PostScript Level 2 code +% +/PatternBgnd { + TransparentPatterns {} {gsave 1 setgray fill grestore} ifelse +} def +% +% Substitute for Level 2 pattern fill codes with +% grayscale if Level 2 support is not selected. 
+% +/Level1PatternFill { +/Pattern1 {0.250 Density} bind def +/Pattern2 {0.500 Density} bind def +/Pattern3 {0.750 Density} bind def +/Pattern4 {0.125 Density} bind def +/Pattern5 {0.375 Density} bind def +/Pattern6 {0.625 Density} bind def +/Pattern7 {0.875 Density} bind def +} def +% +% Now test for support of Level 2 code +% +Level1 {Level1PatternFill} {Level2PatternFill} ifelse +% +/Symbol-Oblique /Symbol findfont [1 0 .167 1 0 0] makefont +dup length dict begin {1 index /FID eq {pop pop} {def} ifelse} forall +currentdict end definefont pop +/MFshow { + { dup 5 get 3 ge + { 5 get 3 eq {gsave} {grestore} ifelse } + {dup dup 0 get findfont exch 1 get scalefont setfont + [ currentpoint ] exch dup 2 get 0 exch R dup 5 get 2 ne {dup dup 6 + get exch 4 get {Gshow} {stringwidth pop 0 R} ifelse }if dup 5 get 0 eq + {dup 3 get {2 get neg 0 exch R pop} {pop aload pop M} ifelse} {dup 5 + get 1 eq {dup 2 get exch dup 3 get exch 6 get stringwidth pop -2 div + dup 0 R} {dup 6 get stringwidth pop -2 div 0 R 6 get + show 2 index {aload pop M neg 3 -1 roll neg R pop pop} {pop pop pop + pop aload pop M} ifelse }ifelse }ifelse } + ifelse } + forall} def +/Gswidth {dup type /stringtype eq {stringwidth} {pop (n) stringwidth} ifelse} def +/MFwidth {0 exch { dup 5 get 3 ge { 5 get 3 eq { 0 } { pop } ifelse } + {dup 3 get{dup dup 0 get findfont exch 1 get scalefont setfont + 6 get Gswidth pop add} {pop} ifelse} ifelse} forall} def +/MLshow { currentpoint stroke M + 0 exch R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MRshow { currentpoint stroke M + exch dup MFwidth neg 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MCshow { currentpoint stroke M + exch dup MFwidth -2 div 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/XYsave { [( ) 1 2 true false 3 ()] } bind def +/XYrestore { [( ) 1 2 true false 4 ()] } bind def +Level1 SuppressPDFMark or +{} { +/SDict 10 dict def 
+systemdict /pdfmark known not { + userdict /pdfmark systemdict /cleartomark get put +} if +SDict begin [ + /Title (Sparse_mpivsomp.eps) + /Subject (gnuplot plot) + /Creator (gnuplot 4.6 patchlevel 0) + /Author (lilia) +% /Producer (gnuplot) +% /Keywords () + /CreationDate (Wed Dec 16 22:52:50 2015) + /DOCINFO pdfmark +end +} ifelse +end +%%EndProlog +%%Page: 1 1 +gnudict begin +gsave +doclip +50 50 translate +0.100 0.100 scale +90 rotate +0 -5040 translate +0 setgray +newpath +(Helvetica) findfont 140 scalefont setfont +BackgroundColor 0 lt 3 1 roll 0 lt exch 0 lt or or not {gsave BackgroundColor C clippath fill grestore} if +1.000 UL +LTb +854 448 M +63 0 V +6030 0 R +-63 0 V +stroke +770 448 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10)] +] -46.7 MRshow +1.000 UL +LTb +854 892 M +31 0 V +6062 0 R +-31 0 V +854 1151 M +31 0 V +6062 0 R +-31 0 V +854 1336 M +31 0 V +6062 0 R +-31 0 V +854 1479 M +31 0 V +6062 0 R +-31 0 V +854 1595 M +31 0 V +6062 0 R +-31 0 V +854 1694 M +31 0 V +6062 0 R +-31 0 V +854 1779 M +31 0 V +6062 0 R +-31 0 V +854 1855 M +31 0 V +6062 0 R +-31 0 V +854 1922 M +63 0 V +6030 0 R +-63 0 V +stroke +770 1922 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100)] +] -46.7 MRshow +1.000 UL +LTb +854 2366 M +31 0 V +6062 0 R +-31 0 V +854 2626 M +31 0 V +6062 0 R +-31 0 V +854 2810 M +31 0 V +6062 0 R +-31 0 V +854 2953 M +31 0 V +6062 0 R +-31 0 V +854 3070 M +31 0 V +6062 0 R +-31 0 V +854 3168 M +31 0 V +6062 0 R +-31 0 V +854 3254 M +31 0 V +6062 0 R +-31 0 V +854 3329 M +31 0 V +6062 0 R +-31 0 V +854 3397 M +63 0 V +6030 0 R +-63 0 V +stroke +770 3397 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1000)] +] -46.7 MRshow +1.000 UL +LTb +854 3840 M +31 0 V +6062 0 R +-31 0 V +854 4100 M +31 0 V +6062 0 R +-31 0 V +854 4284 M +31 0 V +6062 0 R +-31 0 V +854 4427 M +31 0 V +6062 0 R +-31 0 V +854 4544 M +31 0 V +6062 0 R +-31 0 V +854 4643 M +31 0 V +6062 0 R +-31 0 V +854 4728 M +31 0 V +6062 0 R +-31 0 V +854 4804 M +31 0 V +6062 0 R +-31 0 V +854 4871 
M +63 0 V +6030 0 R +-63 0 V +stroke +770 4871 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MRshow +1.000 UL +LTb +854 448 M +0 63 V +0 4360 R +0 -63 V +stroke +854 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (1)] +] -46.7 MCshow +1.000 UL +LTb +2885 448 M +0 63 V +0 4360 R +0 -63 V +stroke +2885 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (2)] +] -46.7 MCshow +1.000 UL +LTb +4916 448 M +0 63 V +0 4360 R +0 -63 V +stroke +4916 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (3)] +] -46.7 MCshow +1.000 UL +LTb +6947 448 M +0 63 V +0 4360 R +0 -63 V +stroke +6947 308 M +[ [(Helvetica) 140.0 0.0 true true 0 (4)] +] -46.7 MCshow +1.000 UL +LTb +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +LCb setrgbcolor +112 2659 M +currentpoint gsave translate -270 rotate 0 0 moveto +[ [(Helvetica) 140.0 0.0 true true 0 (Execution time in seconds)] +] -46.7 MCshow +grestore +LTb +LCb setrgbcolor +3900 98 M +[ [(Helvetica) 140.0 0.0 true true 0 (Number of GPU)] +] -46.7 MCshow +LTb +1.000 UP +1.000 UL +LTb +% Begin plot #1 +1.000 UP +1.000 UL +LT0 +LCb setrgbcolor +6296 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (200K MPI)] +] -46.7 MRshow +LT0 +6380 4738 M +399 0 V +854 1632 M +2885 1351 L +2031 -23 V +6947 941 L +854 1632 Pls +2885 1351 Pls +4916 1328 Pls +6947 941 Pls +6579 4738 Pls +% End plot #1 +% Begin plot #2 +1.000 UP +1.000 UL +LT1 +LCb setrgbcolor +6296 4598 M +[ [(Helvetica) 140.0 0.0 true true 0 (200K OpenMP)] +] -46.7 MRshow +LT1 +6380 4598 M +399 0 V +854 1695 M +2885 1261 L +2031 39 V +6947 980 L +854 1695 Crs +2885 1261 Crs +4916 1300 Crs +6947 980 Crs +6579 4598 Crs +% End plot #2 +% Begin plot #3 +1.000 UP +1.000 UL +LT2 +LCb setrgbcolor +6296 4458 M +[ [(Helvetica) 140.0 0.0 true true 0 (800K MPI)] +] -46.7 MRshow +LT2 +6380 4458 M +399 0 V +854 3720 M +2885 3209 L +4916 3008 L +6947 2587 L +854 3720 Star +2885 3209 Star +4916 3008 Star +6947 2587 Star +6579 4458 Star +% End plot #3 +% Begin plot #4 +1.000 UP +1.000 UL 
+LT3 +LCb setrgbcolor +6296 4318 M +[ [(Helvetica) 140.0 0.0 true true 0 (800K OpenMP)] +] -46.7 MRshow +LT3 +6380 4318 M +399 0 V +854 3503 M +2885 3044 L +4916 2727 L +6947 2531 L +854 3503 Box +2885 3044 Box +4916 2727 Box +6947 2531 Box +6579 4318 Box +% End plot #4 +% Begin plot #5 +1.000 UP +1.000 UL +LT4 +LCb setrgbcolor +6296 4178 M +[ [(Helvetica) 140.0 0.0 true true 0 (1.4M MPI)] +] -46.7 MRshow +LT4 +6380 4178 M +399 0 V +854 4147 M +2885 3838 L +2031 -99 V +2031 -92 V +854 4147 BoxF +2885 3838 BoxF +4916 3739 BoxF +6947 3647 BoxF +6579 4178 BoxF +% End plot #5 +% Begin plot #6 +1.000 UP +1.000 UL +LT5 +LCb setrgbcolor +6296 4038 M +[ [(Helvetica) 140.0 0.0 true true 0 (1.4M OpenMP)] +] -46.7 MRshow +LT5 +6380 4038 M +399 0 V +854 4203 M +2885 3949 L +4916 3768 L +2031 -30 V +854 4203 Circle +2885 3949 Circle +4916 3768 Circle +6947 3738 Circle +6579 4038 Circle +% End plot #6 +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +1.000 UP +1.000 UL +LTb +stroke +grestore +end +showpage +%%Trailer +%%DocumentFonts: Helvetica +%%Pages: 1 diff --git a/Simulations/Sparse_openmp.eps b/Simulations/Sparse_openmp.eps new file mode 100644 index 0000000..b816be4 --- /dev/null +++ b/Simulations/Sparse_openmp.eps @@ -0,0 +1,955 @@ +%!PS-Adobe-2.0 +%%Title: Sparse_openmp.eps +%%Creator: gnuplot 4.6 patchlevel 0 +%%CreationDate: Wed Dec 16 22:37:48 2015 +%%DocumentFonts: (atend) +%%BoundingBox: 50 50 554 770 +%%Orientation: Landscape +%%Pages: (atend) +%%EndComments +%%BeginProlog +/gnudict 256 dict def +gnudict begin +% +% The following true/false flags may be edited by hand if desired. +% The unit line width and grayscale image gamma correction may also be changed. 
+% +/Color false def +/Blacktext false def +/Solid false def +/Dashlength 1 def +/Landscape true def +/Level1 false def +/Rounded false def +/ClipToBoundingBox false def +/SuppressPDFMark false def +/TransparentPatterns false def +/gnulinewidth 5.000 def +/userlinewidth gnulinewidth def +/Gamma 1.0 def +/BackgroundColor {-1.000 -1.000 -1.000} def +% +/vshift -46 def +/dl1 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul sub dup 0 le { pop 0.01 } if } if +} def +/dl2 { + 10.0 Dashlength mul mul + Rounded { currentlinewidth 0.75 mul add } if +} def +/hpt_ 31.5 def +/vpt_ 31.5 def +/hpt hpt_ def +/vpt vpt_ def +/doclip { + ClipToBoundingBox { + newpath 50 50 moveto 554 50 lineto 554 770 lineto 50 770 lineto closepath + clip + } if +} def +% +% Gnuplot Prolog Version 4.4 (August 2010) +% +%/SuppressPDFMark true def +% +/M {moveto} bind def +/L {lineto} bind def +/R {rmoveto} bind def +/V {rlineto} bind def +/N {newpath moveto} bind def +/Z {closepath} bind def +/C {setrgbcolor} bind def +/f {rlineto fill} bind def +/g {setgray} bind def +/Gshow {show} def % May be redefined later in the file to support UTF-8 +/vpt2 vpt 2 mul def +/hpt2 hpt 2 mul def +/Lshow {currentpoint stroke M 0 vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Rshow {currentpoint stroke M dup stringwidth pop neg vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/Cshow {currentpoint stroke M dup stringwidth pop -2 div vshift R + Blacktext {gsave 0 setgray show grestore} {show} ifelse} def +/UP {dup vpt_ mul /vpt exch def hpt_ mul /hpt exch def + /hpt2 hpt 2 mul def /vpt2 vpt 2 mul def} def +/DL {Color {setrgbcolor Solid {pop []} if 0 setdash} + {pop pop pop 0 setgray Solid {pop []} if 0 setdash} ifelse} def +/BL {stroke userlinewidth 2 mul setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/AL {stroke userlinewidth 2 div setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +/UL {dup gnulinewidth mul /userlinewidth exch 
def + dup 1 lt {pop 1} if 10 mul /udl exch def} def +/PL {stroke userlinewidth setlinewidth + Rounded {1 setlinejoin 1 setlinecap} if} def +3.8 setmiterlimit +% Default Line colors +/LCw {1 1 1} def +/LCb {0 0 0} def +/LCa {0 0 0} def +/LC0 {1 0 0} def +/LC1 {0 1 0} def +/LC2 {0 0 1} def +/LC3 {1 0 1} def +/LC4 {0 1 1} def +/LC5 {1 1 0} def +/LC6 {0 0 0} def +/LC7 {1 0.3 0} def +/LC8 {0.5 0.5 0.5} def +% Default Line Types +/LTw {PL [] 1 setgray} def +/LTb {BL [] LCb DL} def +/LTa {AL [1 udl mul 2 udl mul] 0 setdash LCa setrgbcolor} def +/LT0 {PL [] LC0 DL} def +/LT1 {PL [4 dl1 2 dl2] LC1 DL} def +/LT2 {PL [2 dl1 3 dl2] LC2 DL} def +/LT3 {PL [1 dl1 1.5 dl2] LC3 DL} def +/LT4 {PL [6 dl1 2 dl2 1 dl1 2 dl2] LC4 DL} def +/LT5 {PL [3 dl1 3 dl2 1 dl1 3 dl2] LC5 DL} def +/LT6 {PL [2 dl1 2 dl2 2 dl1 6 dl2] LC6 DL} def +/LT7 {PL [1 dl1 2 dl2 6 dl1 2 dl2 1 dl1 2 dl2] LC7 DL} def +/LT8 {PL [2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 2 dl2 2 dl1 4 dl2] LC8 DL} def +/Pnt {stroke [] 0 setdash gsave 1 setlinecap M 0 0 V stroke grestore} def +/Dia {stroke [] 0 setdash 2 copy vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke + Pnt} def +/Pls {stroke [] 0 setdash vpt sub M 0 vpt2 V + currentpoint stroke M + hpt neg vpt neg R hpt2 0 V stroke + } def +/Box {stroke [] 0 setdash 2 copy exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke + Pnt} def +/Crs {stroke [] 0 setdash exch hpt sub exch vpt add M + hpt2 vpt2 neg V currentpoint stroke M + hpt2 neg 0 R hpt2 vpt2 V stroke} def +/TriU {stroke [] 0 setdash 2 copy vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke + Pnt} def +/Star {2 copy Pls Crs} def +/BoxF {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath fill} def +/TriUF {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath fill} def +/TriD {stroke 
[] 0 setdash 2 copy vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke + Pnt} def +/TriDF {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath fill} def +/DiaF {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath fill} def +/Pent {stroke [] 0 setdash 2 copy gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath stroke grestore Pnt} def +/PentF {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath fill grestore} def +/Circle {stroke [] 0 setdash 2 copy + hpt 0 360 arc stroke Pnt} def +/CircleF {stroke [] 0 setdash hpt 0 360 arc fill} def +/C0 {BL [] 0 setdash 2 copy moveto vpt 90 450 arc} bind def +/C1 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + vpt 0 360 arc closepath} bind def +/C2 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C3 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + vpt 0 360 arc closepath} bind def +/C4 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C5 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc + 2 copy moveto + 2 copy vpt 180 270 arc closepath fill + vpt 0 360 arc} bind def +/C6 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C7 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 270 arc closepath fill + vpt 0 360 arc closepath} bind def +/C8 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C9 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 270 450 arc closepath fill + vpt 0 360 arc closepath} bind def +/C10 {BL [] 0 setdash 2 copy 2 copy moveto vpt 270 360 arc closepath fill + 2 copy moveto + 2 copy vpt 90 180 arc closepath fill + vpt 0 360 arc closepath} 
bind def +/C11 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 180 arc closepath fill + 2 copy moveto + 2 copy vpt 270 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C12 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C13 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 0 90 arc closepath fill + 2 copy moveto + 2 copy vpt 180 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/C14 {BL [] 0 setdash 2 copy moveto + 2 copy vpt 90 360 arc closepath fill + vpt 0 360 arc} bind def +/C15 {BL [] 0 setdash 2 copy vpt 0 360 arc closepath fill + vpt 0 360 arc closepath} bind def +/Rec {newpath 4 2 roll moveto 1 index 0 rlineto 0 exch rlineto + neg 0 rlineto closepath} bind def +/Square {dup Rec} bind def +/Bsquare {vpt sub exch vpt sub exch vpt2 Square} bind def +/S0 {BL [] 0 setdash 2 copy moveto 0 vpt rlineto BL Bsquare} bind def +/S1 {BL [] 0 setdash 2 copy vpt Square fill Bsquare} bind def +/S2 {BL [] 0 setdash 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S3 {BL [] 0 setdash 2 copy exch vpt sub exch vpt2 vpt Rec fill Bsquare} bind def +/S4 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S5 {BL [] 0 setdash 2 copy 2 copy vpt Square fill + exch vpt sub exch vpt sub vpt Square fill Bsquare} bind def +/S6 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S7 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt vpt2 Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S8 {BL [] 0 setdash 2 copy vpt sub vpt Square fill Bsquare} bind def +/S9 {BL [] 0 setdash 2 copy vpt sub vpt vpt2 Rec fill Bsquare} bind def +/S10 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt Square fill + Bsquare} bind def +/S11 {BL [] 0 setdash 2 copy vpt sub vpt Square fill 2 copy exch vpt sub exch vpt2 vpt Rec fill + Bsquare} bind def +/S12 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill 
Bsquare} bind def +/S13 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy vpt Square fill Bsquare} bind def +/S14 {BL [] 0 setdash 2 copy exch vpt sub exch vpt sub vpt2 vpt Rec fill + 2 copy exch vpt sub exch vpt Square fill Bsquare} bind def +/S15 {BL [] 0 setdash 2 copy Bsquare fill Bsquare} bind def +/D0 {gsave translate 45 rotate 0 0 S0 stroke grestore} bind def +/D1 {gsave translate 45 rotate 0 0 S1 stroke grestore} bind def +/D2 {gsave translate 45 rotate 0 0 S2 stroke grestore} bind def +/D3 {gsave translate 45 rotate 0 0 S3 stroke grestore} bind def +/D4 {gsave translate 45 rotate 0 0 S4 stroke grestore} bind def +/D5 {gsave translate 45 rotate 0 0 S5 stroke grestore} bind def +/D6 {gsave translate 45 rotate 0 0 S6 stroke grestore} bind def +/D7 {gsave translate 45 rotate 0 0 S7 stroke grestore} bind def +/D8 {gsave translate 45 rotate 0 0 S8 stroke grestore} bind def +/D9 {gsave translate 45 rotate 0 0 S9 stroke grestore} bind def +/D10 {gsave translate 45 rotate 0 0 S10 stroke grestore} bind def +/D11 {gsave translate 45 rotate 0 0 S11 stroke grestore} bind def +/D12 {gsave translate 45 rotate 0 0 S12 stroke grestore} bind def +/D13 {gsave translate 45 rotate 0 0 S13 stroke grestore} bind def +/D14 {gsave translate 45 rotate 0 0 S14 stroke grestore} bind def +/D15 {gsave translate 45 rotate 0 0 S15 stroke grestore} bind def +/DiaE {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V closepath stroke} def +/BoxE {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V closepath stroke} def +/TriUE {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V closepath stroke} def +/TriDE {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V closepath stroke} def +/PentE {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + closepath 
stroke grestore} def +/CircE {stroke [] 0 setdash + hpt 0 360 arc stroke} def +/Opaque {gsave closepath 1 setgray fill grestore 0 setgray closepath} def +/DiaW {stroke [] 0 setdash vpt add M + hpt neg vpt neg V hpt vpt neg V + hpt vpt V hpt neg vpt V Opaque stroke} def +/BoxW {stroke [] 0 setdash exch hpt sub exch vpt add M + 0 vpt2 neg V hpt2 0 V 0 vpt2 V + hpt2 neg 0 V Opaque stroke} def +/TriUW {stroke [] 0 setdash vpt 1.12 mul add M + hpt neg vpt -1.62 mul V + hpt 2 mul 0 V + hpt neg vpt 1.62 mul V Opaque stroke} def +/TriDW {stroke [] 0 setdash vpt 1.12 mul sub M + hpt neg vpt 1.62 mul V + hpt 2 mul 0 V + hpt neg vpt -1.62 mul V Opaque stroke} def +/PentW {stroke [] 0 setdash gsave + translate 0 hpt M 4 {72 rotate 0 hpt L} repeat + Opaque stroke grestore} def +/CircW {stroke [] 0 setdash + hpt 0 360 arc Opaque stroke} def +/BoxFill {gsave Rec 1 setgray fill grestore} def +/Density { + /Fillden exch def + currentrgbcolor + /ColB exch def /ColG exch def /ColR exch def + /ColR ColR Fillden mul Fillden sub 1 add def + /ColG ColG Fillden mul Fillden sub 1 add def + /ColB ColB Fillden mul Fillden sub 1 add def + ColR ColG ColB setrgbcolor} def +/BoxColFill {gsave Rec PolyFill} def +/PolyFill {gsave Density fill grestore grestore} def +/h {rlineto rlineto rlineto gsave closepath fill grestore} bind def +% +% PostScript Level 1 Pattern Fill routine for rectangles +% Usage: x y w h s a XX PatternFill +% x,y = lower left corner of box to be filled +% w,h = width and height of box +% a = angle in degrees between lines and x-axis +% XX = 0/1 for no/yes cross-hatch +% +/PatternFill {gsave /PFa [ 9 2 roll ] def + PFa 0 get PFa 2 get 2 div add PFa 1 get PFa 3 get 2 div add translate + PFa 2 get -2 div PFa 3 get -2 div PFa 2 get PFa 3 get Rec + gsave 1 setgray fill grestore clip + currentlinewidth 0.5 mul setlinewidth + /PFs PFa 2 get dup mul PFa 3 get dup mul add sqrt def + 0 0 M PFa 5 get rotate PFs -2 div dup translate + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get 
mul 0 M 0 PFs V} for + 0 PFa 6 get ne { + 0 1 PFs PFa 4 get div 1 add floor cvi + {PFa 4 get mul 0 2 1 roll M PFs 0 V} for + } if + stroke grestore} def +% +/languagelevel where + {pop languagelevel} {1} ifelse + 2 lt + {/InterpretLevel1 true def} + {/InterpretLevel1 Level1 def} + ifelse +% +% PostScript level 2 pattern fill definitions +% +/Level2PatternFill { +/Tile8x8 {/PaintType 2 /PatternType 1 /TilingType 1 /BBox [0 0 8 8] /XStep 8 /YStep 8} + bind def +/KeepColor {currentrgbcolor [/Pattern /DeviceRGB] setcolorspace} bind def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke} +>> matrix makepattern +/Pat1 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 8 8 L 0 8 M 8 0 L stroke + 0 4 M 4 8 L 8 4 L 4 0 L 0 4 L stroke} +>> matrix makepattern +/Pat2 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 0 M 0 8 L + 8 8 L 8 0 L 0 0 L fill} +>> matrix makepattern +/Pat3 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 8 M 8 -4 L + 0 12 M 12 0 L stroke} +>> matrix makepattern +/Pat4 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -4 0 M 8 12 L + 0 -4 M 12 8 L stroke} +>> matrix makepattern +/Pat5 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 8 M 4 -4 L + 0 12 M 8 -4 L 4 12 M 10 0 L stroke} +>> matrix makepattern +/Pat6 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop -2 0 M 4 12 L + 0 -4 M 8 12 L 4 -4 M 10 8 L stroke} +>> matrix makepattern +/Pat7 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 8 -2 M -4 4 L + 12 0 M -4 8 L 12 4 M 0 10 L stroke} +>> matrix makepattern +/Pat8 exch def +<< Tile8x8 + /PaintProc {0.5 setlinewidth pop 0 -2 M 12 4 L + -4 0 M 12 8 L -4 4 M 8 10 L stroke} +>> matrix makepattern +/Pat9 exch def +/Pattern1 {PatternBgnd KeepColor Pat1 setpattern} bind def +/Pattern2 {PatternBgnd KeepColor Pat2 setpattern} bind def +/Pattern3 {PatternBgnd KeepColor Pat3 setpattern} bind def +/Pattern4 {PatternBgnd KeepColor Landscape {Pat5} {Pat4} ifelse setpattern} bind 
def +/Pattern5 {PatternBgnd KeepColor Landscape {Pat4} {Pat5} ifelse setpattern} bind def +/Pattern6 {PatternBgnd KeepColor Landscape {Pat9} {Pat6} ifelse setpattern} bind def +/Pattern7 {PatternBgnd KeepColor Landscape {Pat8} {Pat7} ifelse setpattern} bind def +} def +% +% +%End of PostScript Level 2 code +% +/PatternBgnd { + TransparentPatterns {} {gsave 1 setgray fill grestore} ifelse +} def +% +% Substitute for Level 2 pattern fill codes with +% grayscale if Level 2 support is not selected. +% +/Level1PatternFill { +/Pattern1 {0.250 Density} bind def +/Pattern2 {0.500 Density} bind def +/Pattern3 {0.750 Density} bind def +/Pattern4 {0.125 Density} bind def +/Pattern5 {0.375 Density} bind def +/Pattern6 {0.625 Density} bind def +/Pattern7 {0.875 Density} bind def +} def +% +% Now test for support of Level 2 code +% +Level1 {Level1PatternFill} {Level2PatternFill} ifelse +% +/Symbol-Oblique /Symbol findfont [1 0 .167 1 0 0] makefont +dup length dict begin {1 index /FID eq {pop pop} {def} ifelse} forall +currentdict end definefont pop +/MFshow { + { dup 5 get 3 ge + { 5 get 3 eq {gsave} {grestore} ifelse } + {dup dup 0 get findfont exch 1 get scalefont setfont + [ currentpoint ] exch dup 2 get 0 exch R dup 5 get 2 ne {dup dup 6 + get exch 4 get {Gshow} {stringwidth pop 0 R} ifelse }if dup 5 get 0 eq + {dup 3 get {2 get neg 0 exch R pop} {pop aload pop M} ifelse} {dup 5 + get 1 eq {dup 2 get exch dup 3 get exch 6 get stringwidth pop -2 div + dup 0 R} {dup 6 get stringwidth pop -2 div 0 R 6 get + show 2 index {aload pop M neg 3 -1 roll neg R pop pop} {pop pop pop + pop aload pop M} ifelse }ifelse }ifelse } + ifelse } + forall} def +/Gswidth {dup type /stringtype eq {stringwidth} {pop (n) stringwidth} ifelse} def +/MFwidth {0 exch { dup 5 get 3 ge { 5 get 3 eq { 0 } { pop } ifelse } + {dup 3 get{dup dup 0 get findfont exch 1 get scalefont setfont + 6 get Gswidth pop add} {pop} ifelse} ifelse} forall} def +/MLshow { currentpoint stroke M + 0 exch R + Blacktext {gsave 0 
setgray MFshow grestore} {MFshow} ifelse } bind def +/MRshow { currentpoint stroke M + exch dup MFwidth neg 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/MCshow { currentpoint stroke M + exch dup MFwidth -2 div 3 -1 roll R + Blacktext {gsave 0 setgray MFshow grestore} {MFshow} ifelse } bind def +/XYsave { [( ) 1 2 true false 3 ()] } bind def +/XYrestore { [( ) 1 2 true false 4 ()] } bind def +Level1 SuppressPDFMark or +{} { +/SDict 10 dict def +systemdict /pdfmark known not { + userdict /pdfmark systemdict /cleartomark get put +} if +SDict begin [ + /Title (Sparse_openmp.eps) + /Subject (gnuplot plot) + /Creator (gnuplot 4.6 patchlevel 0) + /Author (lilia) +% /Producer (gnuplot) +% /Keywords () + /CreationDate (Wed Dec 16 22:37:48 2015) + /DOCINFO pdfmark +end +} ifelse +end +%%EndProlog +%%Page: 1 1 +gnudict begin +gsave +doclip +50 50 translate +0.100 0.100 scale +90 rotate +0 -5040 translate +0 setgray +newpath +(Helvetica) findfont 140 scalefont setfont +BackgroundColor 0 lt 3 1 roll 0 lt exch 0 lt or or not {gsave BackgroundColor C clippath fill grestore} if +1.000 UL +LTb +854 448 M +63 0 V +6030 0 R +-63 0 V +stroke +770 448 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1)] +] -46.7 MRshow +1.000 UL +LTb +854 781 M +31 0 V +6062 0 R +-31 0 V +854 976 M +31 0 V +6062 0 R +-31 0 V +854 1114 M +31 0 V +6062 0 R +-31 0 V +854 1221 M +31 0 V +6062 0 R +-31 0 V +854 1308 M +31 0 V +6062 0 R +-31 0 V +854 1382 M +31 0 V +6062 0 R +-31 0 V +854 1447 M +31 0 V +6062 0 R +-31 0 V +854 1503 M +31 0 V +6062 0 R +-31 0 V +854 1554 M +63 0 V +6030 0 R +-63 0 V +stroke +770 1554 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10)] +] -46.7 MRshow +1.000 UL +LTb +854 1887 M +31 0 V +6062 0 R +-31 0 V +854 2081 M +31 0 V +6062 0 R +-31 0 V +854 2219 M +31 0 V +6062 0 R +-31 0 V +854 2327 M +31 0 V +6062 0 R +-31 0 V +854 2414 M +31 0 V +6062 0 R +-31 0 V +854 2488 M +31 0 V +6062 0 R +-31 0 V +854 2552 M +31 0 V +6062 0 R +-31 0 V +854 2609 M 
+31 0 V +6062 0 R +-31 0 V +854 2660 M +63 0 V +6030 0 R +-63 0 V +stroke +770 2660 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100)] +] -46.7 MRshow +1.000 UL +LTb +854 2992 M +31 0 V +6062 0 R +-31 0 V +854 3187 M +31 0 V +6062 0 R +-31 0 V +854 3325 M +31 0 V +6062 0 R +-31 0 V +854 3432 M +31 0 V +6062 0 R +-31 0 V +854 3520 M +31 0 V +6062 0 R +-31 0 V +854 3594 M +31 0 V +6062 0 R +-31 0 V +854 3658 M +31 0 V +6062 0 R +-31 0 V +854 3715 M +31 0 V +6062 0 R +-31 0 V +854 3765 M +63 0 V +6030 0 R +-63 0 V +stroke +770 3765 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1000)] +] -46.7 MRshow +1.000 UL +LTb +854 4098 M +31 0 V +6062 0 R +-31 0 V +854 4293 M +31 0 V +6062 0 R +-31 0 V +854 4431 M +31 0 V +6062 0 R +-31 0 V +854 4538 M +31 0 V +6062 0 R +-31 0 V +854 4626 M +31 0 V +6062 0 R +-31 0 V +854 4700 M +31 0 V +6062 0 R +-31 0 V +854 4764 M +31 0 V +6062 0 R +-31 0 V +854 4820 M +31 0 V +6062 0 R +-31 0 V +854 4871 M +63 0 V +6030 0 R +-63 0 V +stroke +770 4871 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MRshow +1.000 UL +LTb +854 448 M +0 63 V +0 4360 R +0 -63 V +stroke +854 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 10000)] +] -46.7 MCshow +1.000 UL +LTb +1465 448 M +0 31 V +0 4392 R +0 -31 V +1823 448 M +0 31 V +0 4392 R +0 -31 V +2077 448 M +0 31 V +0 4392 R +0 -31 V +2274 448 M +0 31 V +0 4392 R +0 -31 V +2434 448 M +0 31 V +0 4392 R +0 -31 V +2570 448 M +0 31 V +0 4392 R +0 -31 V +2688 448 M +0 31 V +0 4392 R +0 -31 V +2792 448 M +0 31 V +0 4392 R +0 -31 V +2885 448 M +0 63 V +0 4360 R +0 -63 V +stroke +2885 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 100000)] +] -46.7 MCshow +1.000 UL +LTb +3496 448 M +0 31 V +0 4392 R +0 -31 V +3854 448 M +0 31 V +0 4392 R +0 -31 V +4108 448 M +0 31 V +0 4392 R +0 -31 V +4305 448 M +0 31 V +0 4392 R +0 -31 V +4465 448 M +0 31 V +0 4392 R +0 -31 V +4601 448 M +0 31 V +0 4392 R +0 -31 V +4719 448 M +0 31 V +0 4392 R +0 -31 V +4823 448 M +0 31 V +0 4392 R +0 -31 V +4916 448 M +0 63 V +0 4360 R +0 -63 V 
+stroke +4916 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1e+06)] +] -46.7 MCshow +1.000 UL +LTb +5527 448 M +0 31 V +0 4392 R +0 -31 V +5885 448 M +0 31 V +0 4392 R +0 -31 V +6139 448 M +0 31 V +0 4392 R +0 -31 V +6336 448 M +0 31 V +0 4392 R +0 -31 V +6496 448 M +0 31 V +0 4392 R +0 -31 V +6632 448 M +0 31 V +0 4392 R +0 -31 V +6750 448 M +0 31 V +0 4392 R +0 -31 V +6854 448 M +0 31 V +0 4392 R +0 -31 V +6947 448 M +0 63 V +0 4360 R +0 -63 V +stroke +6947 308 M +[ [(Helvetica) 140.0 0.0 true true 0 ( 1e+07)] +] -46.7 MCshow +1.000 UL +LTb +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +LCb setrgbcolor +112 2659 M +currentpoint gsave translate -270 rotate 0 0 moveto +[ [(Helvetica) 140.0 0.0 true true 0 (Execution time in seconds)] +] -46.7 MCshow +grestore +LTb +LCb setrgbcolor +3900 98 M +[ [(Helvetica) 140.0 0.0 true true 0 (Polynomial's degrees)] +] -46.7 MCshow +LTb +1.000 UP +1.000 UL +LTb +% Begin plot #1 +1.000 UP +1.000 UL +LT0 +LCb setrgbcolor +6296 4738 M +[ [(Helvetica) 140.0 0.0 true true 0 (1 GPU)] +] -46.7 MRshow +LT0 +6380 4738 M +399 0 V +2885 1785 M +611 704 V +612 608 V +357 415 V +254 333 V +197 152 V +161 451 V +136 -78 V +2885 1785 Pls +3496 2489 Pls +4108 3097 Pls +4465 3512 Pls +4719 3845 Pls +4916 3997 Pls +5077 4448 Pls +5213 4370 Pls +6579 4738 Pls +% End plot #1 +% Begin plot #2 +1.000 UP +1.000 UL +LT1 +LCb setrgbcolor +6296 4598 M +[ [(Helvetica) 140.0 0.0 true true 0 (2 GPU)] +] -46.7 MRshow +LT1 +6380 4598 M +399 0 V +2885 1510 M +611 654 V +612 592 V +357 428 V +254 317 V +197 186 V +161 313 V +136 180 V +2885 1510 Crs +3496 2164 Crs +4108 2756 Crs +4465 3184 Crs +4719 3501 Crs +4916 3687 Crs +5077 4000 Crs +5213 4180 Crs +6579 4598 Crs +% End plot #2 +% Begin plot #3 +1.000 UP +1.000 UL +LT2 +LCb setrgbcolor +6296 4458 M +[ [(Helvetica) 140.0 0.0 true true 0 (3 GPU)] +] -46.7 MRshow +LT2 +6380 4458 M +399 0 V +2885 1447 M +611 746 V +612 395 V +357 410 V +254 265 V +197 256 V +161 592 V +136 -67 V 
+2885 1447 Star +3496 2193 Star +4108 2588 Star +4465 2998 Star +4719 3263 Star +4916 3519 Star +5077 4111 Star +5213 4044 Star +6579 4458 Star +% End plot #3 +% Begin plot #4 +1.000 UP +1.000 UL +LT3 +LCb setrgbcolor +6296 4318 M +[ [(Helvetica) 140.0 0.0 true true 0 (4 GPU)] +] -46.7 MRshow +LT3 +6380 4318 M +399 0 V +2885 1298 M +611 655 V +612 522 V +357 393 V +254 248 V +197 235 V +161 627 V +136 43 V +2885 1298 Box +3496 1953 Box +4108 2475 Box +4465 2868 Box +4719 3116 Box +4916 3351 Box +5077 3978 Box +5213 4021 Box +6579 4318 Box +% End plot #4 +1.000 UL +LTb +854 4871 N +854 448 L +6093 0 V +0 4423 V +-6093 0 V +Z stroke +1.000 UP +1.000 UL +LTb +stroke +grestore +end +showpage +%%Trailer +%%DocumentFonts: Helvetica +%%Pages: 1 diff --git a/Simulations/full_mpi/full_mpi_1GPU.o140161 b/Simulations/full_mpi/full_mpi_1GPU.o140161 new file mode 100644 index 0000000..a833c6c --- /dev/null +++ b/Simulations/full_mpi/full_mpi_1GPU.o140161 @@ -0,0 +1,515 @@ +REMAINING: 1 +Taking GPU #3 +proc 0 +zone limite de 'log-exp' 1.00593 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 0, start 0 size 60160 +proc 0 start 0 size 60160 +iter : 1 Arret : 4.93627E-05 s/iter 0.751338 +iter : 2 Arret : 4.72892E-05 s/iter 0.751311 +iter : 3 Arret : 4.32282E-05 s/iter 0.751351 +iter : 4 Arret : 4.40808E-05 s/iter 0.751390 +iter : 5 Arret : 4.31866E-05 s/iter 0.751343 +iter : 6 Arret : 4.51897E-05 s/iter 0.751236 +iter : 7 Arret : 5.50757E-05 s/iter 0.751346 +iter : 8 Arret : 0.000600625 s/iter 0.751189 +iter : 9 Arret : 0.00351745 s/iter 0.751224 +iter : 10 Arret : 0.0225499 s/iter 0.751147 +iter : 11 Arret : 1.92525 s/iter 1.257596 +iter : 12 Arret : 0.0724798 s/iter 0.751219 +iter : 13 Arret : 0.100634 s/iter 0.751209 +iter : 14 Arret : 0.104374 s/iter 1.286622 +iter : 15 Arret : 0.016746 s/iter 1.271784 +iter : 16 Arret : 0.00784681 s/iter 1.261270 +iter : 17 Arret : 0.00523028 s/iter 1.249434 +iter : 18 Arret : 0.00797883 s/iter 0.731764 +iter : 19 Arret : 0.00389307 s/iter 
0.711145 +iter : 20 Arret : 0.00132613 s/iter 0.695894 +iter : 21 Arret : 0.00054363 s/iter 0.683618 +iter : 22 Arret : 0.00764188 s/iter 0.655728 +iter : 23 Arret : 0.0109632 s/iter 0.663047 +iter : 24 Arret : 0.000483636 s/iter 0.647992 +iter : 25 Arret : 0.000266785 s/iter 0.645841 +iter : 26 Arret : 9.21069E-05 s/iter 0.650690 +iter : 27 Arret : 0.00137817 s/iter 0.518549 +iter : 28 Arret : 0.00413942 s/iter 0.516303 +iter : 29 Arret : 1.28264E-05 s/iter 0.521554 +iter : 30 Arret : 2.62246E-10 s/iter 0.521585 +iter : 31 Arret : 8.10539E-15 s/iter 0.520315 +temps : 24.1491 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.35784E-10 +Stabilite : 8.10539E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540783 +i* 0.841162| 1|-7.58456E-14 +i* 3.78031E-14| +| 2| -0.992343 +i* -0.123513| 1|-4.36456E-15 +i* 3.59435E-15| +| 3| 0.0563346 +i* 0.998412| 1| 5.70377E-15 +i* 3.3501E-14| +| 4| -0.802793 +i* -0.596258| 1| 2.03657E-15 +i* 1.01915E-14| +| 5| 0.730552 +i* -0.682857| 1|-7.48429E-14 +i* 6.77011E-14| +| 6| -0.442728 +i* 0.896656| 1|-3.77198E-14 +i*-1.89779E-15| +| 7| -0.404888 +i* -0.914366| 1| 3.20195E-14 +i* 9.65894E-15| +| 8| 0.972126 +i* -0.23446| 1| 4.02421E-14 +i*-1.54755E-14| +| 9| -0.826939 +i* 0.562292| 1| -2.4928E-14 +i*-1.59889E-14| +| 10| 0.0979895 +i* -0.995187| 1| 2.27804E-14 +i*-1.97481E-14| +| 11| 0.961513 +i* 0.27476| 1|-9.39769E-14 +i*-2.63912E-13| +| 12| -0.996627 +i* 0.0820589| 1| 2.39773E-14 +i* 1.74825E-14| +| 13| 0.575447 +i* -0.817839| 1|-3.49894E-14 +i*-7.98545E-14| +| 14| 0.701466 +i* 0.712703| 1| 7.52211E-14 +i* 1.53991E-14| +| 15| 0.259346 +i* 0.965785| 1|-2.14863E-14 +i*-2.81355E-14| +| 16| -0.907773 +i* -0.419461| 1|-3.62869E-14 +i*-9.49414E-15| +| 17| 0.903623 +i* -0.428329| 1|-1.24969E-14 +i* 7.51222E-14| +| 18| -0.249979 +i* 0.968251| 
1|-1.59074E-14 +i*-1.09721E-14| +| 19| -0.583341 +i* -0.812227| 1| 1.92242E-14 +i* 2.27058E-14| +| 20| 0.997383 +i* 0.072297| 1| 2.53037E-13 +i*-5.92819E-13| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00237 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 0, start 0 size 150016 +proc 0 start 0 size 150016 +iter : 1 Arret : 1.64136E-05 s/iter 4.670410 +iter : 2 Arret : 1.62219E-05 s/iter 4.668737 +iter : 3 Arret : 1.59634E-05 s/iter 4.668001 +iter : 4 Arret : 1.57203E-05 s/iter 4.668096 +iter : 5 Arret : 1.61134E-05 s/iter 4.668095 +iter : 6 Arret : 1.68096E-05 s/iter 4.667823 +iter : 7 Arret : 1.83395E-05 s/iter 4.668957 +iter : 8 Arret : 2.23347E-05 s/iter 4.668718 +iter : 9 Arret : 0.000193284 s/iter 4.669886 +iter : 10 Arret : 0.00650657 s/iter 4.666547 +iter : 11 Arret : 0.00202338 s/iter 4.668819 +iter : 12 Arret : 0.00858027 s/iter 4.668152 +iter : 13 Arret : 1.50198 s/iter 6.718188 +iter : 14 Arret : 0.0716136 s/iter 5.989323 +iter : 15 Arret : 0.0462949 s/iter 4.653326 +iter : 16 Arret : 0.0250802 s/iter 4.654335 +iter : 17 Arret : 0.014323 s/iter 6.635287 +iter : 18 Arret : 0.0102749 s/iter 6.598926 +iter : 19 Arret : 0.0107553 s/iter 6.248834 +iter : 20 Arret : 0.0163074 s/iter 5.917159 +iter : 21 Arret : 0.00966464 s/iter 5.868624 +iter : 22 Arret : 0.0126723 s/iter 4.502515 +iter : 23 Arret : 0.0194806 s/iter 5.728295 +iter : 24 Arret : 0.00314943 s/iter 4.460393 +iter : 25 Arret : 0.00455918 s/iter 4.451818 +iter : 26 Arret : 0.000131011 s/iter 4.482879 +iter : 27 Arret : 1.27601E-05 s/iter 4.481150 +iter : 28 Arret : 8.90079E-08 s/iter 4.447335 +iter : 29 Arret : 8.10668E-13 s/iter 4.446139 +temps : 146.49 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.26507E-09 +Stabilite : 8.10668E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | 
++---+----------------------------+------------+----------------------------+ +| 1| 0.540528 +i* 0.841326| 1| 8.68923E-14 +i* 2.2979E-13| +| 2| -0.905603 +i* -0.424127| 1| 6.50001E-14 +i* -3.0061E-14| +| 3| -0.774122 +i* 0.633037| 1|-3.89619E-14 +i*-6.71876E-14| +| 4| 0.317935 +i* -0.948113| 1| 4.656E-15 +i* 1.15645E-13| +| 5| 0.235897 +i* 0.971778| 1|-3.15963E-14 +i*-8.88994E-14| +| 6| -0.717299 +i* -0.696766| 1| 5.63785E-15 +i*-6.71685E-14| +| 7| 0.992349 +i* -0.123462| 1|-4.81056E-13 +i* 9.00335E-13| +| 8| -0.938482 +i* 0.345329| 1|-6.95555E-14 +i*-3.79159E-14| +| 9| 0.610294 +i* -0.792175| 1| -5.4852E-14 +i*-3.26232E-14| +| 10| -0.0945977 +i* 0.995516| 1| 4.45165E-14 +i* 9.42527E-14| +| 11| -0.450242 +i* -0.892906| 1| 2.41855E-14 +i*-3.23699E-15| +| 12| 0.978218 +i* 0.207583| 1|-2.84429E-13 +i* 4.69725E-13| +| 13| -0.999806 +i* 0.0197069| 1|-4.72365E-14 +i*-2.55716E-14| +| 14| 0.835648 +i* -0.549265| 1|-2.95892E-13 +i* 2.34143E-13| +| 15| -0.414707 +i* 0.909955| 1| 7.26225E-14 +i*-1.70003E-15| +| 16| -0.133754 +i* -0.991015| 1|-2.88485E-14 +i* 2.14499E-14| +| 17| 0.856687 +i* 0.515837| 1| 1.49106E-13 +i* 3.95153E-14| +| 18| -0.951361 +i* -0.308079| 1| 3.78308E-14 +i* 4.65843E-14| +| 19| 0.969257 +i* -0.24605| 1| 5.51163E-13 +i*-4.79498E-13| +| 20| -0.689285 +i* 0.724491| 1| 2.40086E-15 +i*-3.61777E-14| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00142 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 0, start 0 size 250112 +proc 0 start 0 size 250112 +iter : 1 Arret : 1.15411E-05 s/iter 13.046733 +iter : 2 Arret : 9.858E-06 s/iter 13.081326 +iter : 3 Arret : 1.15382E-05 s/iter 13.069120 +iter : 4 Arret : 9.47232E-06 s/iter 13.076010 +iter : 5 Arret : 1.17256E-05 s/iter 13.072118 +iter : 6 Arret : 9.56386E-06 s/iter 13.076291 +iter : 7 Arret : 9.97104E-06 s/iter 13.066170 +iter : 8 Arret : 1.14103E-05 s/iter 13.081314 +iter : 9 Arret : 2.05919E-05 s/iter 13.071473 
+iter : 10 Arret : 0.000825792 s/iter 13.076037 +iter : 11 Arret : 0.00118923 s/iter 13.070033 +iter : 12 Arret : 0.000993305 s/iter 13.084702 +iter : 13 Arret : 0.00173445 s/iter 13.089852 +iter : 14 Arret : 0.00725752 s/iter 13.071956 +iter : 15 Arret : 0.00431675 s/iter 12.991545 +iter : 16 Arret : 0.00223336 s/iter 10.557352 +iter : 17 Arret : 0.00768504 s/iter 7.919767 +iter : 18 Arret : 0.0589957 s/iter 7.694604 +iter : 19 Arret : 0.25159 s/iter 7.214844 +iter : 20 Arret : 0.00281777 s/iter 7.197502 +iter : 21 Arret : 0.000159366 s/iter 7.094188 +iter : 22 Arret : 6.57562E-05 s/iter 7.066874 +iter : 23 Arret : 3.10389E-05 s/iter 7.014897 +iter : 24 Arret : 1.40727E-05 s/iter 7.069989 +iter : 25 Arret : 1.97654E-05 s/iter 7.070010 +iter : 26 Arret : 1.37694E-05 s/iter 7.006386 +iter : 27 Arret : 7.84672E-07 s/iter 7.000436 +iter : 28 Arret : 2.76696E-10 s/iter 6.995541 +iter : 29 Arret : 5.23691E-16 s/iter 6.993836 +temps : 300.171 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.05316E-09 +Stabilite : 5.23691E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540427 +i* 0.841391| 1| 9.7148E-14 +i*-1.98189E-13| +| 2| -0.997949 +i* 0.0640067| 1| 1.02696E-14 +i* 2.88415E-14| +| 3| 0.450991 +i* -0.892528| 1| 2.39739E-15 +i* 7.66835E-14| +| 4| 0.42851 +i* -0.903537| 1| 1.03733E-13 +i* 1.27433E-14| +| 5| -0.996035 +i* 0.0889649| 1| 5.1386E-14 +i* 4.21729E-14| +| 6| 0.581876 +i* 0.813277| 1| 3.29906E-13 +i* -3.5718E-15| +| 7| 0.405761 +i* -0.913979| 1| 1.69923E-13 +i*-8.86062E-14| +| 8| -0.993496 +i* 0.113867| 1| 6.34562E-14 +i* 6.04291E-14| +| 9| 0.60205 +i* 0.798458| 1| 2.39371E-13 +i* -2.2848E-13| +| 10| 0.382757 +i* -0.923849| 1| 6.36852E-14 +i* 1.1601E-13| +| 11| -0.990335 +i* 0.138698| 1| 8.32286E-14 +i* 4.57395E-14| +| 12| 0.621846 +i* 0.783139| 1| 3.5482E-14 
+i*-1.57841E-13| +| 13| 0.359514 +i* -0.93314| 1| 1.00985E-13 +i*-2.52237E-13| +| 14| -0.986553 +i* 0.163442| 1| 3.24636E-14 +i* 4.58574E-14| +| 15| 0.641253 +i* 0.767329| 1| 1.79533E-13 +i* 3.03096E-13| +| 16| 0.336045 +i* -0.941846| 1| 1.38948E-13 +i*-8.14071E-14| +| 17| -0.982153 +i* 0.188084| 1| 6.94549E-14 +i* 3.09405E-14| +| 18| 0.660258 +i* 0.751039| 1| 4.21871E-13 +i* 5.02185E-14| +| 19| 0.312366 +i* -0.949962| 1|-6.37199E-14 +i*-7.39669E-14| +| 20| -0.977138 +i* 0.212608| 1|-3.80633E-14 +i* -8.4285E-14| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00101 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 0, start 0 size 350208 +proc 0 start 0 size 350208 +iter : 1 Arret : 8.60988E-06 s/iter 25.315090 +iter : 2 Arret : 7.40762E-06 s/iter 25.250569 +iter : 3 Arret : 7.04966E-06 s/iter 25.240912 +iter : 4 Arret : 7.00431E-06 s/iter 25.295865 +iter : 5 Arret : 6.902E-06 s/iter 25.229976 +iter : 6 Arret : 7.05582E-06 s/iter 25.295774 +iter : 7 Arret : 7.08998E-06 s/iter 25.244072 +iter : 8 Arret : 7.80153E-06 s/iter 25.319330 +iter : 9 Arret : 3.47E-05 s/iter 25.270429 +iter : 10 Arret : 0.000704728 s/iter 25.254028 +iter : 11 Arret : 0.00103416 s/iter 25.267890 +iter : 12 Arret : 0.00106397 s/iter 25.219715 +iter : 13 Arret : 0.860111 s/iter 25.358661 +iter : 14 Arret : 3.1212 s/iter 25.438830 +iter : 15 Arret : 0.0931888 s/iter 25.230396 +iter : 16 Arret : 0.0389072 s/iter 25.512462 +iter : 17 Arret : 0.0434458 s/iter 25.567784 +iter : 18 Arret : 0.0492605 s/iter 25.737787 +iter : 19 Arret : 0.0322665 s/iter 25.683394 +iter : 20 Arret : 0.0311855 s/iter 25.569362 +iter : 21 Arret : 0.0249899 s/iter 24.998756 +iter : 22 Arret : 0.0236284 s/iter 25.007239 +iter : 23 Arret : 0.0147332 s/iter 24.894940 +iter : 24 Arret : 0.0045927 s/iter 25.318951 +iter : 25 Arret : 0.00241036 s/iter 24.996102 +iter : 26 Arret : 0.000981942 s/iter 24.881214 +iter : 27 Arret : 
0.000188842 s/iter 24.914979 +iter : 28 Arret : 1.13979E-05 s/iter 24.908900 +iter : 29 Arret : 4.63289E-09 s/iter 24.885179 +iter : 30 Arret : 2.06854E-14 s/iter 24.907560 +temps : 757.352 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.46096E-08 +Stabilite : 2.06854E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540399 +i* 0.841409| 1| 5.12961E-13 +i*-3.37404E-15| +| 2| -0.385479 +i* 0.922716| 1| -1.616E-13 +i*-2.73566E-14| +| 3| -0.770131 +i* 0.637886| 1|-1.38431E-15 +i* 1.70921E-13| +| 4| -0.978357 +i* 0.206925| 1|-3.07393E-15 +i* 4.96131E-15| +| 5| -0.962455 +i* -0.27144| 1|-5.85088E-14 +i* 7.9714E-14| +| 6| -0.72607 +i* -0.687621| 1| -2.0612E-14 +i* 2.87948E-13| +| 7| -0.323352 +i* -0.946279| 1| 2.27159E-13 +i* 7.30891E-14| +| 8| 0.153441 +i* -0.988158| 1| 2.08479E-14 +i* 5.5551E-14| +| 9| 0.595097 +i* -0.803654| 1|-3.46265E-13 +i* 1.60098E-14| +| 10| 0.900408 +i* -0.435047| 1| 3.20081E-13 +i*-1.77827E-14| +| 11| 0.999448 +i* 0.0332229| 1|-5.70342E-13 +i* 1.21308E-12| +| 12| 0.869529 +i* 0.493882| 1| 3.01252E-14 +i* 6.11216E-13| +| 13| 0.211292 +i* 0.977423| 1|-6.97532E-14 +i* 1.23212E-13| +| 14| -0.267139 +i* 0.963658| 1|-9.26238E-14 +i*-7.20968E-14| +| 15| -0.684372 +i* 0.729133| 1| 1.64042E-13 +i*-1.89831E-14| +| 16| -0.944825 +i* 0.327574| 1| 3.70572E-14 +i*-6.84904E-14| +| 17| -0.988833 +i* -0.149027| 1|-1.41002E-13 +i* 2.02581E-14| +| 18| -0.806314 +i* -0.591488| 1| 1.24668E-13 +i*-2.62805E-13| +| 19| -0.439079 +i* -0.898448| 1|-1.76949E-13 +i*-1.05707E-13| +| 20| 0.0287415 +i* -0.999587| 1| 1.62724E-13 +i*-6.82891E-14| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00071 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 0, start 0 size 500224 +proc 0 start 0 
size 500224 +iter : 1 Arret : 6.15685E-06 s/iter 51.380314 +iter : 2 Arret : 6.30268E-06 s/iter 51.404717 +iter : 3 Arret : 5.43665E-06 s/iter 51.327440 +iter : 4 Arret : 5.82943E-06 s/iter 51.330423 +iter : 5 Arret : 5.29982E-06 s/iter 51.375294 +iter : 6 Arret : 5.48392E-06 s/iter 51.311003 +iter : 7 Arret : 4.9788E-06 s/iter 51.305802 +iter : 8 Arret : 5.28812E-06 s/iter 51.293377 +iter : 9 Arret : 8.66477E-06 s/iter 51.300327 +iter : 10 Arret : 6.18367E-05 s/iter 51.365604 +iter : 11 Arret : 0.00106682 s/iter 51.326802 +iter : 12 Arret : 0.00302391 s/iter 51.361010 +iter : 13 Arret : 0.00805823 s/iter 51.856360 +iter : 14 Arret : 0.00569434 s/iter 51.969477 +iter : 15 Arret : 0.0032212 s/iter 47.185741 +iter : 16 Arret : 1.43264 s/iter 37.596552 +iter : 17 Arret : 0.0261708 s/iter 34.701842 +iter : 18 Arret : 0.0335751 s/iter 32.177584 +iter : 19 Arret : 0.00563912 s/iter 31.261275 +iter : 20 Arret : 0.0024634 s/iter 29.073429 +iter : 21 Arret : 0.00305489 s/iter 28.085556 +iter : 22 Arret : 0.00365771 s/iter 26.833086 +iter : 23 Arret : 0.00250143 s/iter 25.441707 +iter : 24 Arret : 0.00549424 s/iter 24.484295 +iter : 25 Arret : 0.00252639 s/iter 23.169509 +iter : 26 Arret : 5.43905E-05 s/iter 22.350315 +iter : 27 Arret : 1.35324E-06 s/iter 21.912846 +iter : 28 Arret : 9.26795E-09 s/iter 22.036576 +iter : 29 Arret : 2.63961E-14 s/iter 21.824040 +temps : 1148.46 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.48768E-08 +Stabilite : 2.63961E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540372 +i* 0.841426| 1|-3.05235E-13 +i* 1.38721E-13| +| 2| 0.561316 +i* 0.827602| 1|-2.60021E-13 +i* 1.9206E-13| +| 3| 0.57165 +i* 0.820497| 1|-1.83308E-13 +i* 6.15844E-14| +| 4| 0.581895 +i* 0.813264| 1| 3.05839E-13 +i* 6.52482E-14| +| 5| 0.592048 +i* 0.805902| 1|-7.14016E-13 
+i*-3.98882E-14| +| 6| 0.602109 +i* 0.798414| 1| 2.66658E-13 +i*-4.75979E-13| +| 7| 0.612074 +i* 0.7908| 1| 3.16743E-13 +i*-3.40844E-13| +| 8| 0.621943 +i* 0.783062| 1| 5.64146E-13 +i*-3.14632E-13| +| 9| 0.631715 +i* 0.775201| 1|-3.83756E-14 +i* 5.41086E-13| +| 10| 0.641387 +i* 0.767218| 1| 4.00499E-13 +i*-3.71465E-13| +| 11| 0.650958 +i* 0.759114| 1| 7.58768E-15 +i*-5.54055E-13| +| 12| 0.660427 +i* 0.750891| 1| 7.47999E-13 +i* 2.73089E-13| +| 13| 0.669792 +i* 0.742549| 1| 9.40577E-13 +i* 3.39433E-14| +| 14| 0.679051 +i* 0.734091| 1| 4.34264E-13 +i*-1.04887E-13| +| 15| 0.688204 +i* 0.725517| 1|-6.26926E-13 +i*-1.86798E-13| +| 16| 0.697248 +i* 0.71683| 1| 2.2389E-13 +i*-9.46795E-14| +| 17| 0.706183 +i* 0.708029| 1| 4.79186E-13 +i* 4.75144E-13| +| 18| 0.715007 +i* 0.699117| 1| 6.39138E-13 +i* 4.95824E-13| +| 19| 0.723718 +i* 0.690096| 1| -1.2694E-13 +i* 4.44528E-13| +| 20| 0.732316 +i* 0.680965| 1|-2.76158E-13 +i* 1.17734E-13| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 600064 +proc 0 start 0 size 600064 +iter : 1 Arret : 4.88741E-06 s/iter 73.643121 +iter : 2 Arret : 4.97199E-06 s/iter 73.660774 +iter : 3 Arret : 4.86258E-06 s/iter 73.959554 +iter : 4 Arret : 4.28624E-06 s/iter 73.918069 +iter : 5 Arret : 4.70264E-06 s/iter 73.933005 +iter : 6 Arret : 4.85459E-06 s/iter 73.951374 +iter : 7 Arret : 4.4341E-06 s/iter 73.800704 +iter : 8 Arret : 4.56391E-06 s/iter 73.596272 +iter : 9 Arret : 5.75896E-06 s/iter 73.751223 +iter : 10 Arret : 0.000763198 s/iter 73.862761 +iter : 11 Arret : 0.000582931 s/iter 81.937266 +iter : 12 Arret : 0.00224489 s/iter 73.950715 +iter : 13 Arret : 1.80799 s/iter 73.968738 +iter : 14 Arret : 0.0742277 s/iter 74.508413 +iter : 15 Arret : 0.0962999 s/iter 74.277195 +iter : 16 Arret : 0.108643 s/iter 73.517886 +iter : 17 Arret : 0.0724179 s/iter 71.659228 +iter : 18 Arret 
: 0.105199 s/iter 70.746803 +iter : 19 Arret : 0.146372 s/iter 69.276722 +iter : 20 Arret : 0.117759 s/iter 68.338548 +iter : 21 Arret : 0.00754357 s/iter 67.172870 +iter : 22 Arret : 0.000921826 s/iter 65.662508 +iter : 23 Arret : 0.000616312 s/iter 65.353341 +iter : 24 Arret : 0.00179901 s/iter 65.174928 +iter : 25 Arret : 1.77897E-05 s/iter 65.467629 +iter : 26 Arret : 3.63702E-06 s/iter 65.144205 +iter : 27 Arret : 1.82722E-07 s/iter 65.288149 +iter : 28 Arret : 3.58982E-11 s/iter 64.840549 +iter : 29 Arret : 1.57009E-16 s/iter 64.759606 +temps : 2059.61 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.553493 +i* -0.832854| 1|-5.02858E-13 +i* 3.83374E-15| +| 3| -0.579338 +i* -0.815087| 1| 4.42365E-13 +i* 2.65846E-14| +| 4| 0.592057 +i* 0.805896| 1| 2.06783E-13 +i* 1.94549E-13| +| 5| -0.604613 +i* -0.796519| 1| 2.39135E-13 +i* 2.96967E-13| +| 6| 0.617037 +i* 0.786934| 1|-3.70964E-13 +i* 2.85104E-13| +| 7| -0.629293 +i* -0.777168| 1| 3.4002E-13 +i* 1.14925E-14| +| 8| 0.641411 +i* 0.767198| 1|-6.01835E-13 +i* 5.70316E-13| +| 9| -0.653354 +i* -0.757052| 1| 3.00003E-14 +i* 4.1084E-13| +| 10| 0.665153 +i* 0.746707| 1|-9.55243E-14 +i* 7.739E-13| +| 11| -0.676773 +i* -0.736192| 1|-3.70891E-13 +i* 4.31963E-14| +| 12| 0.688242 +i* 0.725482| 1| 4.17319E-13 +i*-2.25125E-13| +| 13| -0.699526 +i* -0.714607| 1|-1.55074E-13 +i* 3.9467E-13| +| 14| 0.710653 +i* 0.703543| 1|-7.94843E-13 +i* 5.61671E-13| +| 15| -0.721591 +i* -0.69232| 1|-8.20351E-14 +i* 3.39909E-13| +| 16| 0.732366 +i* 0.680912| 1| 5.01595E-13 +i* 2.59279E-13| +| 17| -0.742946 +i* -0.669351| 1|-1.90181E-13 +i* 1.23972E-13| +| 18| 0.753358 +i* 0.657611| 1|-7.14661E-13 
+i*-3.96187E-13| +| 19| -0.76357 +i* -0.645725| 1|-3.31242E-13 +i*-8.50865E-14| +| 20| 0.773609 +i* 0.633664| 1|-7.93813E-13 +i* 2.09313E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00051 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 0, start 0 size 700160 +proc 0 start 0 size 700160 +iter : 1 Arret : 4.36089E-06 s/iter 100.538329 +iter : 2 Arret : 4.20009E-06 s/iter 100.086525 +iter : 3 Arret : 4.27261E-06 s/iter 100.410161 +iter : 4 Arret : 3.90142E-06 s/iter 100.336287 +iter : 5 Arret : 3.60563E-06 s/iter 100.308817 +iter : 6 Arret : 3.93135E-06 s/iter 100.373492 +iter : 7 Arret : 3.83714E-06 s/iter 100.283845 +iter : 8 Arret : 3.69157E-06 s/iter 100.391852 +iter : 9 Arret : 4.92428E-06 s/iter 100.459479 +iter : 10 Arret : 9.37908E-05 s/iter 100.446598 +iter : 11 Arret : 0.00213526 s/iter 100.396625 +iter : 12 Arret : 0.002542 s/iter 100.503838 +iter : 13 Arret : 0.0125219 s/iter 100.940510 +iter : 14 Arret : 0.010999 s/iter 109.789990 +iter : 15 Arret : 0.00932865 s/iter 109.205901 +iter : 16 Arret : 0.0450638 s/iter 100.884592 +iter : 17 Arret : 0.184973 s/iter 102.656255 +iter : 18 Arret : 0.0519142 s/iter 101.300314 +iter : 19 Arret : 0.0302111 s/iter 100.763046 +iter : 20 Arret : 0.0177202 s/iter 100.248985 +iter : 21 Arret : 0.00863847 s/iter 99.989614 +iter : 22 Arret : 0.00156575 s/iter 99.794924 +iter : 23 Arret : 0.000367723 s/iter 99.510307 +iter : 24 Arret : 0.000179924 s/iter 99.548317 +iter : 25 Arret : 2.80728E-05 s/iter 99.520822 +iter : 26 Arret : 9.99898E-06 s/iter 99.579748 +iter : 27 Arret : 2.46675E-08 s/iter 99.458855 +iter : 28 Arret : 9.85491E-15 s/iter 99.607347 +temps : 2827.9 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.46263E-08 +Stabilite : 9.85491E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | 
++---+----------------------------+------------+----------------------------+ +| 1| 0.540352 +i* 0.841439| 1| 4.39978E-13 +i* 6.25043E-13| +| 2| -0.996034 +i* 0.0889731| 1| 2.2073E-13 +i* 1.55296E-13| +| 3| 0.439836 +i* -0.898078| 1|-3.55927E-13 +i*-1.21738E-13| +| 4| 0.38266 +i* -0.923889| 1|-2.56142E-13 +i*-7.02285E-14| +| 5| -0.988496 +i* 0.15125| 1|-1.52652E-13 +i*-1.11329E-13| +| 6| 0.641421 +i* 0.767189| 1|-1.31044E-13 +i* 5.61736E-13| +| 7| 0.323979 +i* -0.946064| 1|-4.52336E-13 +i* 8.74596E-14| +| 8| -0.977067 +i* 0.212932| 1| 8.58341E-14 +i* 1.73412E-13| +| 9| 0.688262 +i* 0.725462| 1| 4.28754E-14 +i* 1.08849E-12| +| 10| 0.264022 +i* -0.964517| 1|-3.63883E-13 +i*-8.14886E-14| +| 11| -0.961793 +i* 0.273776| 1| -3.0213E-13 +i*-2.13897E-13| +| 12| 0.732395 +i* 0.68088| 1|-3.65194E-14 +i* 7.95483E-13| +| 13| 0.203027 +i* -0.979173| 1|-3.14502E-13 +i* 2.96924E-13| +| 14| -0.942735 +i* 0.333543| 1| 1.82947E-13 +i*-4.73458E-14| +| 15| 0.773646 +i* 0.633619| 1| 2.24352E-13 +i* 2.79674E-13| +| 16| 0.141232 +i* -0.989977| 1| -1.0035E-13 +i* 1.5693E-13| +| 17| -0.919967 +i* 0.391997| 1| 2.89213E-14 +i*-1.86252E-13| +| 18| 0.811852 +i* 0.583864| 1|-1.59939E-12 +i*-4.13669E-13| +| 19| 0.0788818 +i* -0.996884| 1|-2.83003E-13 +i* 1.04711E-13| +| 20| -0.893578 +i* 0.448908| 1| 4.59736E-14 +i* 1.31414E-13| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 1 +proc 0 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 800000 +proc 0 start 0 size 800000 +iter : 1 Arret : 3.83515E-06 s/iter 131.128367 +iter : 2 Arret : 3.31342E-06 s/iter 130.895719 +iter : 3 Arret : 3.46185E-06 s/iter 130.774185 +iter : 4 Arret : 3.77822E-06 s/iter 130.629629 +iter : 5 Arret : 3.54151E-06 s/iter 131.099737 +iter : 6 Arret : 3.39913E-06 s/iter 130.729467 +iter : 7 Arret : 3.37038E-06 s/iter 130.632620 +iter : 8 Arret : 3.66135E-06 s/iter 130.656450 +iter : 9 Arret : 5.18164E-06 s/iter 
130.618912 +iter : 10 Arret : 3.60623E-05 s/iter 130.609820 +iter : 11 Arret : 0.000919045 s/iter 130.931691 +iter : 12 Arret : 0.0269508 s/iter 130.735832 +iter : 13 Arret : 2.00753 s/iter 131.562739 +iter : 14 Arret : 0.113163 s/iter 131.675926 +iter : 15 Arret : 0.114468 s/iter 132.383980 +iter : 16 Arret : 0.0343723 s/iter 131.231628 +iter : 17 Arret : 0.0118406 s/iter 126.227547 +iter : 18 Arret : 0.00584689 s/iter 120.723541 +iter : 19 Arret : 0.00603455 s/iter 116.384134 +iter : 20 Arret : 0.00445856 s/iter 111.422234 +iter : 21 Arret : 0.00344019 s/iter 106.222631 +iter : 22 Arret : 0.000542325 s/iter 99.990260 +iter : 23 Arret : 0.00265194 s/iter 95.378338 +iter : 24 Arret : 0.00180528 s/iter 92.586290 +iter : 25 Arret : 4.07819E-06 s/iter 91.103601 +iter : 26 Arret : 1.49379E-06 s/iter 89.796006 +iter : 27 Arret : 7.96771E-09 s/iter 90.012737 +iter : 28 Arret : 1.91442E-14 s/iter 90.007579 +temps : 3326.77 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 1.91442E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| 0.592061 +i* 0.805893| 1|-1.57249E-13 +i*-4.43364E-13| +| 3| 0.617051 +i* 0.786923| 1|-6.42805E-13 +i*-3.49094E-13| +| 4| 0.641434 +i* 0.767178| 1| 1.00022E-12 +i*-5.90578E-13| +| 5| 0.665186 +i* 0.746678| 1|-2.53998E-14 +i*-1.14684E-12| +| 6| 0.688283 +i* 0.725442| 1|-8.68732E-13 +i* 8.52696E-13| +| 7| 0.710703 +i* 0.703493| 1| 2.02581E-13 +i* 4.54699E-13| +| 8| 0.732422 +i* 0.680851| 1|-5.22353E-13 +i*-3.99873E-13| +| 9| 0.753421 +i* 0.657538| 1| 1.23356E-13 +i*-1.05986E-12| +| 10| 0.773678 +i* 0.633579| 1|-6.75196E-13 +i* 3.60108E-13| +| 11| 0.793174 +i* 0.608995| 1| 4.43853E-13 +i*-1.42398E-12| +| 12| 0.811888 +i* 0.583813| 1|-4.10491E-13 +i*-4.46651E-13| +| 13| 0.829804 
+i* 0.558055| 1| 1.30045E-12 +i* 1.12788E-13| +| 14| 0.846902 +i* 0.531748| 1|-8.09419E-13 +i* 4.98091E-13| +| 15| 0.863167 +i* 0.504918| 1| 2.98522E-13 +i* 3.81547E-13| +| 16| 0.878582 +i* 0.477591| 1|-3.06581E-13 +i*-6.95869E-13| +| 17| 0.893133 +i* 0.449793| 1| 1.24355E-13 +i* -1.3239E-12| +| 18| 0.906804 +i* 0.421553| 1|-1.23117E-12 +i*-5.57117E-13| +| 19| 0.919582 +i* 0.392898| 1|-1.03648E-12 +i* 2.90445E-14| +| 20| 0.931455 +i* 0.363856| 1|-6.42708E-13 +i*-1.50318E-12| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 diff --git a/Simulations/full_mpi/full_mpi_1GPU.sge b/Simulations/full_mpi/full_mpi_1GPU.sge new file mode 100644 index 0000000..fd35afa --- /dev/null +++ b/Simulations/full_mpi/full_mpi_1GPU.sge @@ -0,0 +1,25 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=1 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -V +#$ -cwd +#$ -N full_mpi_1GPU +#$ -pe mpi 1 + + +module load cuda/7.0 +module load ompi/gcc + +mpirun -np $NSLOTS ./template -r -i 60000 40000 +mpirun -np $NSLOTS ./template -r -i 150000 50000 +mpirun -np $NSLOTS ./template -r -i 250000 150000 +mpirun -np $NSLOTS ./template -r -i 350000 250000 +mpirun -np $NSLOTS ./template -r -i 500000 300000 +mpirun -np $NSLOTS ./template -r -i 600000 400000 +mpirun -np $NSLOTS ./template -r -i 700000 500000 +mpirun -np $NSLOTS ./template -r -i 800000 600000 +#mpirun -np $NSLOTS ./template -r -i 900000 700000 +#mpirun -np $NSLOTS ./template -r -i 1000000 800000 +#mpirun -np $NSLOTS ./template -r -i 1500000 500000 diff --git a/Simulations/full_mpi/full_mpi_2GPU.o140160 b/Simulations/full_mpi/full_mpi_2GPU.o140160 new file mode 100644 index 0000000..8016229 --- /dev/null +++ b/Simulations/full_mpi/full_mpi_2GPU.o140160 @@ -0,0 +1,562 @@ +REMAINING: 2 +Taking GPU #0 +Taking GPU #1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00593 +zone limite de 'log-exp' 1.00593 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 1, start 30080 size 30080 +proc 1 start 30080 
size 30080 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 0, start 0 size 30080 +proc 0 start 0 size 30080 +iter : 1 Arret : 3.94715E-05 s/iter 0.376579 +iter : 2 Arret : 4.00498E-05 s/iter 0.376426 +iter : 3 Arret : 3.94982E-05 s/iter 0.376469 +iter : 4 Arret : 3.91196E-05 s/iter 0.376474 +iter : 5 Arret : 4.06401E-05 s/iter 0.376476 +iter : 6 Arret : 4.41482E-05 s/iter 0.376495 +iter : 7 Arret : 5.50716E-05 s/iter 0.376547 +iter : 8 Arret : 0.000118504 s/iter 0.376518 +iter : 9 Arret : 0.00115954 s/iter 0.376505 +iter : 10 Arret : 0.0219062 s/iter 0.376584 +iter : 11 Arret : 2.08077 s/iter 1.164908 +iter : 12 Arret : 0.274053 s/iter 0.376485 +iter : 13 Arret : 0.163438 s/iter 1.196444 +iter : 14 Arret : 0.0502837 s/iter 1.195663 +iter : 15 Arret : 0.0171551 s/iter 1.191447 +iter : 16 Arret : 0.00931569 s/iter 1.183639 +iter : 17 Arret : 0.00645054 s/iter 1.167546 +iter : 18 Arret : 0.00448467 s/iter 0.370707 +iter : 19 Arret : 0.00168489 s/iter 0.366051 +iter : 20 Arret : 0.00126146 s/iter 0.365448 +iter : 21 Arret : 0.0157645 s/iter 0.356946 +iter : 22 Arret : 0.00414432 s/iter 0.349791 +iter : 23 Arret : 0.0293605 s/iter 0.344674 +iter : 24 Arret : 0.000309791 s/iter 0.347406 +iter : 25 Arret : 0.000479548 s/iter 0.344763 +iter : 26 Arret : 0.000172889 s/iter 0.342501 +iter : 27 Arret : 2.54873E-05 s/iter 0.344592 +iter : 28 Arret : 6.36446E-08 s/iter 0.343705 +iter : 29 Arret : 1.95655E-12 s/iter 0.343232 +iter : 30 Arret : 1.11022E-16 s/iter 0.343867 +temps : 15.9313 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.35784E-10 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540783 +i* 0.841162| 1|-7.58456E-14 +i* 3.78031E-14| +| 2| -0.992343 +i* -0.123513| 1|-2.28637E-15 +i*-5.45917E-15| +| 3| 0.0563346 +i* 0.998412| 1| 5.70377E-15 +i* 
3.3501E-14| +| 4| -0.802793 +i* -0.596258| 1| 2.03657E-15 +i* 1.01915E-14| +| 5| 0.730552 +i* -0.682857| 1|-7.48429E-14 +i* 6.77011E-14| +| 6| -0.442728 +i* 0.896656| 1|-3.77198E-14 +i*-1.89779E-15| +| 7| -0.404888 +i* -0.914366| 1| 3.20195E-14 +i* 9.65894E-15| +| 8| 0.972126 +i* -0.23446| 1| 4.02421E-14 +i*-1.54755E-14| +| 9| -0.826939 +i* 0.562292| 1| -2.4928E-14 +i*-1.59889E-14| +| 10| 0.0979895 +i* -0.995187| 1| 2.90878E-14 +i*-6.75675E-15| +| 11| 0.961513 +i* 0.27476| 1|-9.39769E-14 +i*-2.63912E-13| +| 12| -0.996627 +i* 0.0820589| 1| 2.39773E-14 +i* 1.74825E-14| +| 13| 0.575447 +i* -0.817839| 1|-3.49894E-14 +i*-7.98545E-14| +| 14| 0.701466 +i* 0.712703| 1| 7.52211E-14 +i* 1.53991E-14| +| 15| 0.259346 +i* 0.965785| 1|-2.14863E-14 +i*-2.81355E-14| +| 16| -0.907773 +i* -0.419461| 1|-3.62869E-14 +i*-9.49414E-15| +| 17| 0.903623 +i* -0.428329| 1|-1.24969E-14 +i* 7.51222E-14| +| 18| -0.249979 +i* 0.968251| 1|-1.59074E-14 +i*-1.09721E-14| +| 19| -0.583341 +i* -0.812227| 1| 1.92242E-14 +i* 2.27058E-14| +| 20| 0.997383 +i* 0.072297| 1| 2.53037E-13 +i*-5.92819E-13| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 1 +proc 1 +proc 0 +zone limite de 'log-exp' 1.00237 +zone limite de 'log-exp' 1.00237 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 1, start 75008 size 75008 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 0, start 0 size 75008 +proc 0 start 0 size 75008 +proc 1 start 75008 size 75008 +iter : 1 Arret : 1.60943E-05 s/iter 2.350355 +iter : 2 Arret : 1.67528E-05 s/iter 2.342992 +iter : 3 Arret : 1.68978E-05 s/iter 2.337485 +iter : 4 Arret : 1.60377E-05 s/iter 2.337553 +iter : 5 Arret : 1.62156E-05 s/iter 2.337558 +iter : 6 Arret : 1.69292E-05 s/iter 2.337450 +iter : 7 Arret : 1.84639E-05 s/iter 2.337768 +iter : 8 Arret : 2.25051E-05 s/iter 2.337545 +iter : 9 Arret : 4.76681E-05 s/iter 2.337634 +iter : 10 Arret : 0.00245562 s/iter 2.337594 +iter : 11 Arret : 0.00371283 s/iter 2.337716 +iter : 12 Arret : 
0.010769 s/iter 2.910185 +iter : 13 Arret : 1.55694 s/iter 4.438167 +iter : 14 Arret : 0.116538 s/iter 2.911091 +iter : 15 Arret : 0.0585023 s/iter 3.939639 +iter : 16 Arret : 0.0321741 s/iter 3.902393 +iter : 17 Arret : 0.0186974 s/iter 3.930056 +iter : 18 Arret : 0.00687909 s/iter 3.962909 +iter : 19 Arret : 0.0214989 s/iter 2.321178 +iter : 20 Arret : 0.00865216 s/iter 3.260664 +iter : 21 Arret : 0.0168761 s/iter 3.221472 +iter : 22 Arret : 0.0147692 s/iter 4.261763 +iter : 23 Arret : 0.0125239 s/iter 2.251272 +iter : 24 Arret : 0.000664965 s/iter 2.239406 +iter : 25 Arret : 1.59841E-05 s/iter 2.245565 +iter : 26 Arret : 5.40825E-07 s/iter 2.231696 +iter : 27 Arret : 8.52059E-11 s/iter 2.240876 +iter : 28 Arret : 7.75295E-16 s/iter 2.238326 +temps : 78.4263 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.26535E-09 +Stabilite : 7.75295E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540528 +i* 0.841326| 1| 8.68923E-14 +i* 2.2979E-13| +| 2| -0.905603 +i* -0.424127| 1| 6.50001E-14 +i* -3.0061E-14| +| 3| -0.774122 +i* 0.633037| 1|-3.89619E-14 +i*-6.71876E-14| +| 4| 0.317935 +i* -0.948113| 1| 4.656E-15 +i* 1.15645E-13| +| 5| 0.23606 +i* 0.971739| 1| 2.9924E-14 +i*-1.32854E-13| +| 6| -0.717299 +i* -0.696766| 1| 5.63785E-15 +i*-6.71685E-14| +| 7| 0.992349 +i* -0.123462| 1|-4.81056E-13 +i* 9.00335E-13| +| 8| -0.938482 +i* 0.345329| 1|-6.95555E-14 +i*-3.79159E-14| +| 9| 0.610294 +i* -0.792175| 1| -5.4852E-14 +i*-3.26232E-14| +| 10| -0.0946394 +i* 0.995512| 1|-4.73788E-14 +i*-8.10827E-14| +| 11| -0.450242 +i* -0.892906| 1| 2.41855E-14 +i*-3.23699E-15| +| 12| 0.978218 +i* 0.207583| 1|-2.84429E-13 +i* 4.69725E-13| +| 13| -0.999806 +i* 0.0197069| 1|-4.72365E-14 +i*-2.55716E-14| +| 14| 0.835648 +i* -0.549265| 1|-2.95892E-13 +i* 2.34143E-13| +| 15| -0.414707 +i* 0.909955| 1| 
7.26225E-14 +i*-1.70003E-15| +| 16| -0.133754 +i* -0.991015| 1|-2.88485E-14 +i* 2.14499E-14| +| 17| 0.856687 +i* 0.515837| 1| 1.49106E-13 +i* 3.95153E-14| +| 18| -0.951361 +i* -0.308079| 1| 3.78308E-14 +i* 4.65843E-14| +| 19| 0.969257 +i* -0.24605| 1| 5.51163E-13 +i*-4.79498E-13| +| 20| -0.689285 +i* 0.724491| 1| 2.40086E-15 +i*-3.61777E-14| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00142 +zone limite de 'log-exp' 1.00142 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 0, start 0 size 125056 +proc 0 start 0 size 125056 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 1, start 125056 size 125056 +proc 1 start 125056 size 125056 +iter : 1 Arret : 1.04122E-05 s/iter 6.893601 +iter : 2 Arret : 9.66995E-06 s/iter 6.882320 +iter : 3 Arret : 9.55261E-06 s/iter 6.898899 +iter : 4 Arret : 9.22665E-06 s/iter 6.899113 +iter : 5 Arret : 9.50477E-06 s/iter 6.894819 +iter : 6 Arret : 9.562E-06 s/iter 6.896301 +iter : 7 Arret : 9.85225E-06 s/iter 6.898079 +iter : 8 Arret : 1.00444E-05 s/iter 6.895828 +iter : 9 Arret : 1.26197E-05 s/iter 6.906197 +iter : 10 Arret : 0.000374245 s/iter 6.892279 +iter : 11 Arret : 0.000473147 s/iter 6.894504 +iter : 12 Arret : 0.00101736 s/iter 6.894983 +iter : 13 Arret : 0.00428892 s/iter 6.893815 +iter : 14 Arret : 0.0152171 s/iter 6.896640 +iter : 15 Arret : 0.00947972 s/iter 6.813081 +iter : 16 Arret : 0.00590834 s/iter 8.502086 +iter : 17 Arret : 0.0148154 s/iter 4.292037 +iter : 18 Arret : 0.303776 s/iter 4.191474 +iter : 19 Arret : 0.00212739 s/iter 4.153373 +iter : 20 Arret : 0.00703257 s/iter 3.618613 +iter : 21 Arret : 0.00722956 s/iter 5.063281 +iter : 22 Arret : 0.000539584 s/iter 3.599227 +iter : 23 Arret : 0.000175798 s/iter 3.593595 +iter : 24 Arret : 1.72224E-05 s/iter 3.538749 +iter : 25 Arret : 0.000115569 s/iter 3.554657 +iter : 26 Arret : 0.000113543 s/iter 3.546651 +iter : 27 Arret : 4.63885E-05 s/iter 3.544304 +iter : 
28 Arret : 1.37358E-05 s/iter 3.565583 +iter : 29 Arret : 2.47356E-07 s/iter 3.564036 +iter : 30 Arret : 2.5459E-12 s/iter 3.540899 +iter : 31 Arret : 1.11022E-16 s/iter 3.548698 +temps : 169.022 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.05316E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540427 +i* 0.841391| 1| 9.7148E-14 +i*-1.98189E-13| +| 2| -0.997949 +i* 0.0640067| 1| 1.02696E-14 +i* 2.88415E-14| +| 3| 0.450991 +i* -0.892528| 1| 2.39739E-15 +i* 7.66835E-14| +| 4| 0.42851 +i* -0.903537| 1| 1.03733E-13 +i* 1.27433E-14| +| 5| -0.996035 +i* 0.0889649| 1| 5.1386E-14 +i* 4.21729E-14| +| 6| 0.581876 +i* 0.813277| 1| 3.29906E-13 +i* -3.5718E-15| +| 7| 0.405761 +i* -0.913979| 1| 1.69923E-13 +i*-8.86062E-14| +| 8| -0.993496 +i* 0.113867| 1| 6.34562E-14 +i* 6.04291E-14| +| 9| 0.60205 +i* 0.798458| 1| 2.39371E-13 +i* -2.2848E-13| +| 10| 0.382757 +i* -0.923849| 1| 6.36852E-14 +i* 1.1601E-13| +| 11| -0.990335 +i* 0.138698| 1| 8.32286E-14 +i* 4.57395E-14| +| 12| 0.621846 +i* 0.783139| 1| 3.5482E-14 +i*-1.57841E-13| +| 13| 0.359514 +i* -0.93314| 1| 1.00985E-13 +i*-2.52237E-13| +| 14| -0.986553 +i* 0.163442| 1| 3.24636E-14 +i* 4.58574E-14| +| 15| 0.641253 +i* 0.767329| 1| 1.79533E-13 +i* 3.03096E-13| +| 16| 0.336045 +i* -0.941846| 1| 1.38948E-13 +i*-8.14071E-14| +| 17| -0.982153 +i* 0.188084| 1| 6.94549E-14 +i* 3.09405E-14| +| 18| 0.660258 +i* 0.751039| 1| 4.21871E-13 +i* 5.02185E-14| +| 19| 0.312366 +i* -0.949962| 1|-6.37199E-14 +i*-7.39669E-14| +| 20| -0.977138 +i* 0.212608| 1|-3.80633E-14 +i* -8.4285E-14| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 1 +proc 1 +proc 0 +zone limite de 'log-exp' 1.00101 +zone limite de 'log-exp' 1.00101 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 1, 
start 175104 size 175104 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 0, start 0 size 175104 +proc 0 start 0 size 175104 +proc 1 start 175104 size 175104 +iter : 1 Arret : 7.23955E-06 s/iter 12.988714 +iter : 2 Arret : 8.17362E-06 s/iter 12.961404 +iter : 3 Arret : 7.81796E-06 s/iter 12.964651 +iter : 4 Arret : 7.21292E-06 s/iter 12.968827 +iter : 5 Arret : 7.55071E-06 s/iter 12.967829 +iter : 6 Arret : 7.49029E-06 s/iter 12.964916 +iter : 7 Arret : 7.62064E-06 s/iter 12.963339 +iter : 8 Arret : 7.80044E-06 s/iter 12.963493 +iter : 9 Arret : 9.75039E-06 s/iter 12.964925 +iter : 10 Arret : 0.000863071 s/iter 12.969839 +iter : 11 Arret : 0.000849607 s/iter 12.969054 +iter : 12 Arret : 0.00104766 s/iter 12.964139 +iter : 13 Arret : 0.831471 s/iter 12.972067 +iter : 14 Arret : 3.38426 s/iter 12.966001 +iter : 15 Arret : 0.107189 s/iter 12.934545 +iter : 16 Arret : 0.0542638 s/iter 16.933464 +iter : 17 Arret : 0.0319719 s/iter 16.802921 +iter : 18 Arret : 0.0123162 s/iter 17.515009 +iter : 19 Arret : 0.021246 s/iter 17.702219 +iter : 20 Arret : 0.0113278 s/iter 17.796152 +iter : 21 Arret : 0.0245772 s/iter 17.074640 +iter : 22 Arret : 0.00540155 s/iter 17.506599 +iter : 23 Arret : 0.00765026 s/iter 12.838465 +iter : 24 Arret : 0.0115831 s/iter 12.839289 +iter : 25 Arret : 0.0115203 s/iter 12.887210 +iter : 26 Arret : 0.000774924 s/iter 12.835436 +iter : 27 Arret : 0.000228102 s/iter 12.835530 +iter : 28 Arret : 0.000225979 s/iter 12.834198 +iter : 29 Arret : 2.70389E-05 s/iter 12.835221 +iter : 30 Arret : 1.29617E-05 s/iter 12.835156 +iter : 31 Arret : 1.12344E-06 s/iter 12.834214 +iter : 32 Arret : 1.60825E-09 s/iter 12.834300 +iter : 33 Arret : 5.97777E-15 s/iter 12.836140 +temps : 457.417 seconde(s) +Nb iterations : 33 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.46096E-08 +Stabilite : 5.97777E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | 
++---+----------------------------+------------+----------------------------+ +| 1| 0.540399 +i* 0.841409| 1| 5.12961E-13 +i*-3.37404E-15| +| 2| -0.385479 +i* 0.922716| 1| -1.616E-13 +i*-2.73566E-14| +| 3| -0.770131 +i* 0.637886| 1|-1.38431E-15 +i* 1.70921E-13| +| 4| -0.978357 +i* 0.206925| 1|-3.07393E-15 +i* 4.96131E-15| +| 5| -0.962455 +i* -0.27144| 1|-5.85088E-14 +i* 7.9714E-14| +| 6| -0.72607 +i* -0.687621| 1| -2.0612E-14 +i* 2.87948E-13| +| 7| -0.323352 +i* -0.946279| 1| 2.27159E-13 +i* 7.30891E-14| +| 8| 0.153441 +i* -0.988158| 1| 2.08479E-14 +i* 5.5551E-14| +| 9| 0.595097 +i* -0.803654| 1|-3.46265E-13 +i* 1.60098E-14| +| 10| 0.900408 +i* -0.435047| 1| 3.20081E-13 +i*-1.77827E-14| +| 11| 0.999448 +i* 0.0332229| 1|-5.70342E-13 +i* 1.21308E-12| +| 12| 0.869529 +i* 0.493882| 1| 3.01252E-14 +i* 6.11216E-13| +| 13| 0.211292 +i* 0.977423| 1|-6.97532E-14 +i* 1.23212E-13| +| 14| -0.267139 +i* 0.963658| 1|-9.26238E-14 +i*-7.20968E-14| +| 15| -0.684372 +i* 0.729133| 1| 1.64042E-13 +i*-1.89831E-14| +| 16| -0.944825 +i* 0.327574| 1| 3.70572E-14 +i*-6.84904E-14| +| 17| -0.988833 +i* -0.149027| 1|-1.41002E-13 +i* 2.02581E-14| +| 18| -0.806314 +i* -0.591488| 1| 1.24668E-13 +i*-2.62805E-13| +| 19| -0.439079 +i* -0.898448| 1|-1.76949E-13 +i*-1.05707E-13| +| 20| 0.0287415 +i* -0.999587| 1| 1.62724E-13 +i*-6.82891E-14| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00071 +zone limite de 'log-exp' 1.00071 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 1, start 250112 size 250112 +proc 1 start 250112 size 250112 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 0, start 0 size 250112 +proc 0 start 0 size 250112 +iter : 1 Arret : 4.9348E-06 s/iter 26.306811 +iter : 2 Arret : 5.74497E-06 s/iter 26.125397 +iter : 3 Arret : 5.90879E-06 s/iter 26.122962 +iter : 4 Arret : 5.45965E-06 s/iter 26.117846 +iter : 5 Arret : 5.51053E-06 s/iter 26.113294 +iter : 6 Arret : 5.44166E-06 
s/iter 26.107906 +iter : 7 Arret : 5.61587E-06 s/iter 26.108065 +iter : 8 Arret : 5.37769E-06 s/iter 26.112535 +iter : 9 Arret : 6.392E-06 s/iter 26.112787 +iter : 10 Arret : 0.000222412 s/iter 26.105165 +iter : 11 Arret : 0.00364174 s/iter 26.108847 +iter : 12 Arret : 0.00224664 s/iter 28.294492 +iter : 13 Arret : 0.00428508 s/iter 29.203574 +iter : 14 Arret : 0.00509531 s/iter 32.497063 +iter : 15 Arret : 0.00237252 s/iter 26.034125 +iter : 16 Arret : 0.0225054 s/iter 21.475326 +iter : 17 Arret : 1.39022 s/iter 22.775590 +iter : 18 Arret : 0.0380632 s/iter 21.509248 +iter : 19 Arret : 0.0147501 s/iter 20.099820 +iter : 20 Arret : 0.0175634 s/iter 15.352961 +iter : 21 Arret : 0.00896774 s/iter 19.613858 +iter : 22 Arret : 0.00146838 s/iter 16.233299 +iter : 23 Arret : 0.000316321 s/iter 13.214624 +iter : 24 Arret : 0.000122654 s/iter 13.000460 +iter : 25 Arret : 4.91927E-05 s/iter 12.525060 +iter : 26 Arret : 2.33271E-06 s/iter 11.550850 +iter : 27 Arret : 3.0703E-06 s/iter 11.616325 +iter : 28 Arret : 4.34623E-07 s/iter 11.570420 +iter : 29 Arret : 4.32022E-10 s/iter 11.514451 +iter : 30 Arret : 1.24127E-15 s/iter 11.583468 +temps : 637.538 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.48768E-08 +Stabilite : 1.24127E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540372 +i* 0.841426| 1|-3.05235E-13 +i* 1.38721E-13| +| 2| 0.561316 +i* 0.827602| 1|-2.60021E-13 +i* 1.9206E-13| +| 3| 0.57165 +i* 0.820497| 1|-1.83308E-13 +i* 6.15844E-14| +| 4| 0.581895 +i* 0.813264| 1| 3.05839E-13 +i* 6.52482E-14| +| 5| 0.592048 +i* 0.805902| 1|-7.14016E-13 +i*-3.98882E-14| +| 6| 0.602109 +i* 0.798414| 1| 2.66658E-13 +i*-4.75979E-13| +| 7| 0.612074 +i* 0.7908| 1| 3.16743E-13 +i*-3.40844E-13| +| 8| 0.621943 +i* 0.783062| 1| 5.64146E-13 +i*-3.14632E-13| +| 9| 0.631715 +i* 0.775201| 
1|-3.83756E-14 +i* 5.41086E-13| +| 10| 0.641387 +i* 0.767218| 1| 4.00499E-13 +i*-3.71465E-13| +| 11| 0.650958 +i* 0.759114| 1| 7.58768E-15 +i*-5.54055E-13| +| 12| 0.660427 +i* 0.750891| 1| 7.47999E-13 +i* 2.73089E-13| +| 13| 0.669792 +i* 0.742549| 1| 9.40577E-13 +i* 3.39433E-14| +| 14| 0.679051 +i* 0.734091| 1| 4.34264E-13 +i*-1.04887E-13| +| 15| 0.688204 +i* 0.725517| 1|-6.26926E-13 +i*-1.86798E-13| +| 16| 0.697248 +i* 0.71683| 1| 2.2389E-13 +i*-9.46795E-14| +| 17| 0.706183 +i* 0.708029| 1| 4.79186E-13 +i* 4.75144E-13| +| 18| 0.715007 +i* 0.699117| 1| 6.39138E-13 +i* 4.95824E-13| +| 19| 0.723718 +i* 0.690096| 1| -1.2694E-13 +i* 4.44528E-13| +| 20| 0.732316 +i* 0.680965| 1|-2.76158E-13 +i* 1.17734E-13| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 1, start 300032 size 300032 +proc 1 start 300032 size 300032 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 300032 +proc 0 start 0 size 300032 +iter : 1 Arret : 4.75638E-06 s/iter 37.194622 +iter : 2 Arret : 4.76706E-06 s/iter 37.169379 +iter : 3 Arret : 4.56609E-06 s/iter 37.187098 +iter : 4 Arret : 4.96449E-06 s/iter 37.189698 +iter : 5 Arret : 4.6101E-06 s/iter 37.190980 +iter : 6 Arret : 4.67386E-06 s/iter 37.170837 +iter : 7 Arret : 4.4173E-06 s/iter 37.184958 +iter : 8 Arret : 4.5841E-06 s/iter 37.189119 +iter : 9 Arret : 5.81936E-06 s/iter 37.194076 +iter : 10 Arret : 9.61381E-05 s/iter 37.202796 +iter : 11 Arret : 0.00253702 s/iter 37.201994 +iter : 12 Arret : 0.00382237 s/iter 43.720161 +iter : 13 Arret : 1.98237 s/iter 37.268722 +iter : 14 Arret : 0.139529 s/iter 43.928325 +iter : 15 Arret : 0.0833681 s/iter 37.165670 +iter : 16 Arret : 0.0902433 s/iter 37.013464 +iter : 17 Arret : 0.0538083 s/iter 36.747709 +iter : 18 Arret : 0.0285517 s/iter 42.040931 +iter : 19 Arret : 0.0244232 s/iter 35.402712 
+iter : 20 Arret : 0.0156356 s/iter 34.951257 +iter : 21 Arret : 0.00306159 s/iter 34.044015 +iter : 22 Arret : 0.00259881 s/iter 33.314225 +iter : 23 Arret : 0.0020894 s/iter 33.562042 +iter : 24 Arret : 0.000144328 s/iter 32.902500 +iter : 25 Arret : 4.2377E-05 s/iter 32.909701 +iter : 26 Arret : 7.50207E-06 s/iter 33.017508 +iter : 27 Arret : 4.17723E-07 s/iter 32.694117 +iter : 28 Arret : 3.57073E-10 s/iter 32.849709 +iter : 29 Arret : 1.04738E-15 s/iter 32.706464 +temps : 1055.82 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.553493 +i* -0.832854| 1|-5.02858E-13 +i* 3.83374E-15| +| 3| -0.579338 +i* -0.815087| 1| 4.42365E-13 +i* 2.65846E-14| +| 4| 0.592057 +i* 0.805896| 1| 2.06783E-13 +i* 1.94549E-13| +| 5| -0.604613 +i* -0.796519| 1| 2.39135E-13 +i* 2.96967E-13| +| 6| 0.617037 +i* 0.786934| 1|-3.70964E-13 +i* 2.85104E-13| +| 7| -0.629293 +i* -0.777168| 1| 3.4002E-13 +i* 1.14925E-14| +| 8| 0.641411 +i* 0.767198| 1|-6.01835E-13 +i* 5.70316E-13| +| 9| -0.653354 +i* -0.757052| 1| 3.00003E-14 +i* 4.1084E-13| +| 10| 0.665153 +i* 0.746707| 1|-9.55243E-14 +i* 7.739E-13| +| 11| -0.676773 +i* -0.736192| 1|-3.70891E-13 +i* 4.31963E-14| +| 12| 0.688242 +i* 0.725482| 1| 4.17319E-13 +i*-2.25125E-13| +| 13| -0.699526 +i* -0.714607| 1|-1.55074E-13 +i* 3.9467E-13| +| 14| 0.710653 +i* 0.703543| 1|-7.94843E-13 +i* 5.61671E-13| +| 15| -0.721591 +i* -0.69232| 1|-8.20351E-14 +i* 3.39909E-13| +| 16| 0.732366 +i* 0.680912| 1| 5.01595E-13 +i* 2.59279E-13| +| 17| -0.742946 +i* -0.669351| 1|-1.90181E-13 +i* 1.23972E-13| +| 18| 0.753358 +i* 0.657611| 1|-7.14661E-13 +i*-3.96187E-13| +| 19| -0.76357 +i* -0.645725| 1|-3.31242E-13 +i*-8.50865E-14| +| 20| 
0.773609 +i* 0.633664| 1|-7.93813E-13 +i* 2.09313E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00051 +zone limite de 'log-exp' 1.00051 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 1, start 350080 size 350080 +proc 1 start 350080 size 350080 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 0, start 0 size 350080 +proc 0 start 0 size 350080 +iter : 1 Arret : 4.07504E-06 s/iter 50.276924 +iter : 2 Arret : 4.14637E-06 s/iter 50.316736 +iter : 3 Arret : 3.92125E-06 s/iter 50.311941 +iter : 4 Arret : 3.96177E-06 s/iter 50.319644 +iter : 5 Arret : 3.60866E-06 s/iter 50.315146 +iter : 6 Arret : 3.73875E-06 s/iter 50.345034 +iter : 7 Arret : 3.91631E-06 s/iter 50.311163 +iter : 8 Arret : 3.82723E-06 s/iter 50.332321 +iter : 9 Arret : 4.24177E-06 s/iter 50.340320 +iter : 10 Arret : 9.18215E-05 s/iter 50.349367 +iter : 11 Arret : 0.000848166 s/iter 50.316912 +iter : 12 Arret : 0.00161125 s/iter 50.303456 +iter : 13 Arret : 0.0024668 s/iter 57.717511 +iter : 14 Arret : 0.00479788 s/iter 53.570757 +iter : 15 Arret : 0.00495555 s/iter 52.732469 +iter : 16 Arret : 0.0099658 s/iter 51.316983 +iter : 17 Arret : 0.0910784 s/iter 52.848267 +iter : 18 Arret : 0.0669533 s/iter 53.379948 +iter : 19 Arret : 0.196091 s/iter 50.742367 +iter : 20 Arret : 0.0404469 s/iter 53.773228 +iter : 21 Arret : 0.0140031 s/iter 50.742372 +iter : 22 Arret : 0.00221639 s/iter 52.968592 +iter : 23 Arret : 0.00849041 s/iter 50.251971 +iter : 24 Arret : 0.00450336 s/iter 50.017079 +iter : 25 Arret : 0.000556405 s/iter 50.012361 +iter : 26 Arret : 2.14523E-05 s/iter 50.016154 +iter : 27 Arret : 3.07624E-05 s/iter 50.035967 +iter : 28 Arret : 4.85785E-07 s/iter 49.957854 +iter : 29 Arret : 3.24294E-13 s/iter 50.017899 +temps : 1484.54 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.46263E-08 +Stabilite : 3.24294E-13 
++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540352 +i* 0.841439| 1| 4.39978E-13 +i* 6.25043E-13| +| 2| -0.996034 +i* 0.0889731| 1| 2.2073E-13 +i* 1.55296E-13| +| 3| 0.439836 +i* -0.898078| 1|-3.55927E-13 +i*-1.21738E-13| +| 4| 0.38266 +i* -0.923889| 1|-2.56142E-13 +i*-7.02285E-14| +| 5| -0.988496 +i* 0.15125| 1|-1.52652E-13 +i*-1.11329E-13| +| 6| 0.641421 +i* 0.767189| 1|-1.31044E-13 +i* 5.61736E-13| +| 7| 0.323979 +i* -0.946064| 1|-4.52336E-13 +i* 8.74596E-14| +| 8| -0.977067 +i* 0.212932| 1| 8.58341E-14 +i* 1.73412E-13| +| 9| 0.688262 +i* 0.725462| 1| 4.28754E-14 +i* 1.08849E-12| +| 10| 0.264022 +i* -0.964517| 1|-3.63883E-13 +i*-8.14886E-14| +| 11| -0.961793 +i* 0.273776| 1| -3.0213E-13 +i*-2.13897E-13| +| 12| 0.732395 +i* 0.68088| 1|-3.65194E-14 +i* 7.95483E-13| +| 13| 0.203027 +i* -0.979173| 1|-3.14502E-13 +i* 2.96924E-13| +| 14| -0.942735 +i* 0.333543| 1| 1.82947E-13 +i*-4.73458E-14| +| 15| 0.773646 +i* 0.633619| 1| 2.24352E-13 +i* 2.79674E-13| +| 16| 0.141232 +i* -0.989977| 1| -1.0035E-13 +i* 1.5693E-13| +| 17| -0.919967 +i* 0.391997| 1| 2.89213E-14 +i*-1.86252E-13| +| 18| 0.811852 +i* 0.583864| 1|-1.59939E-12 +i*-4.13669E-13| +| 19| 0.0788818 +i* -0.996884| 1|-2.83003E-13 +i* 1.04711E-13| +| 20| -0.893578 +i* 0.448908| 1| 4.59736E-14 +i* 1.31414E-13| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 1 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 1, start 400000 size 400000 +proc 1 start 400000 size 400000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 400000 +proc 0 start 0 size 400000 +iter : 1 Arret : 3.43314E-06 s/iter 66.451646 +iter : 2 Arret : 3.25458E-06 s/iter 66.371208 +iter : 3 Arret : 3.1756E-06 s/iter 66.365954 +iter : 4 Arret : 
3.16632E-06 s/iter 66.323972 +iter : 5 Arret : 3.35307E-06 s/iter 66.379156 +iter : 6 Arret : 3.06929E-06 s/iter 66.310093 +iter : 7 Arret : 3.05638E-06 s/iter 66.375498 +iter : 8 Arret : 3.30698E-06 s/iter 66.345679 +iter : 9 Arret : 4.07579E-06 s/iter 66.346425 +iter : 10 Arret : 1.06648E-05 s/iter 66.343012 +iter : 11 Arret : 0.00084876 s/iter 66.372100 +iter : 12 Arret : 0.00143415 s/iter 66.363225 +iter : 13 Arret : 1.46402 s/iter 66.856335 +iter : 14 Arret : 0.713405 s/iter 68.042881 +iter : 15 Arret : 2.95761 s/iter 73.478889 +iter : 16 Arret : 0.205334 s/iter 66.190886 +iter : 17 Arret : 0.294322 s/iter 63.619134 +iter : 18 Arret : 0.0487392 s/iter 60.944788 +iter : 19 Arret : 0.0248874 s/iter 62.800018 +iter : 20 Arret : 0.0170499 s/iter 62.693475 +iter : 21 Arret : 0.00846661 s/iter 60.956662 +iter : 22 Arret : 0.0198831 s/iter 55.137303 +iter : 23 Arret : 0.00364888 s/iter 51.869775 +iter : 24 Arret : 2.68554E-05 s/iter 47.810142 +iter : 25 Arret : 2.14844E-05 s/iter 46.502062 +iter : 26 Arret : 4.9054E-06 s/iter 46.126008 +iter : 27 Arret : 4.4697E-07 s/iter 45.649153 +iter : 28 Arret : 7.89107E-11 s/iter 45.613504 +iter : 29 Arret : 2.23773E-16 s/iter 45.669074 +temps : 1766.95 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 2.23773E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| 0.592061 +i* 0.805893| 1|-1.57249E-13 +i*-4.43364E-13| +| 3| 0.617051 +i* 0.786923| 1|-6.42805E-13 +i*-3.49094E-13| +| 4| 0.641434 +i* 0.767178| 1| 1.00022E-12 +i*-5.90578E-13| +| 5| 0.665186 +i* 0.746678| 1|-2.53998E-14 +i*-1.14684E-12| +| 6| 0.688283 +i* 0.725442| 1|-8.68732E-13 +i* 8.52696E-13| +| 7| 0.710703 +i* 0.703493| 1| 2.02581E-13 +i* 4.54699E-13| +| 8| 0.732422 +i* 0.680851| 1|-5.22353E-13 
+i*-3.99873E-13| +| 9| 0.753421 +i* 0.657538| 1| 1.23356E-13 +i*-1.05986E-12| +| 10| 0.773678 +i* 0.633579| 1|-6.75196E-13 +i* 3.60108E-13| +| 11| 0.793174 +i* 0.608995| 1| 4.43853E-13 +i*-1.42398E-12| +| 12| 0.811888 +i* 0.583813| 1|-4.10491E-13 +i*-4.46651E-13| +| 13| 0.829804 +i* 0.558055| 1| 1.30045E-12 +i* 1.12788E-13| +| 14| 0.846902 +i* 0.531748| 1|-8.09419E-13 +i* 4.98091E-13| +| 15| 0.863167 +i* 0.504918| 1| 2.98522E-13 +i* 3.81547E-13| +| 16| 0.878582 +i* 0.477591| 1|-3.06581E-13 +i*-6.95869E-13| +| 17| 0.893133 +i* 0.449793| 1| 1.24355E-13 +i* -1.3239E-12| +| 18| 0.906804 +i* 0.421553| 1|-1.23117E-12 +i*-5.57117E-13| +| 19| 0.919582 +i* 0.392898| 1|-1.03648E-12 +i* 2.90445E-14| +| 20| 0.931455 +i* 0.363856| 1|-6.42708E-13 +i*-1.50318E-12| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 diff --git a/Simulations/full_mpi/full_mpi_2GPU.sge b/Simulations/full_mpi/full_mpi_2GPU.sge new file mode 100644 index 0000000..ea411bb --- /dev/null +++ b/Simulations/full_mpi/full_mpi_2GPU.sge @@ -0,0 +1,25 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=2 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -V +#$ -cwd +#$ -N full_mpi_2GPU +#$ -pe mpi 2 + + +module load cuda/7.0 +module load ompi/gcc + +mpirun -np $NSLOTS ./template -r -i 60000 40000 +mpirun -np $NSLOTS ./template -r -i 150000 50000 +mpirun -np $NSLOTS ./template -r -i 250000 150000 +mpirun -np $NSLOTS ./template -r -i 350000 250000 +mpirun -np $NSLOTS ./template -r -i 500000 300000 +mpirun -np $NSLOTS ./template -r -i 600000 400000 +mpirun -np $NSLOTS ./template -r -i 700000 500000 +mpirun -np $NSLOTS ./template -r -i 800000 600000 +#mpirun -np $NSLOTS ./template -r -i 900000 700000 +#mpirun -np $NSLOTS ./template -r -i 1000000 800000 +#mpirun -np $NSLOTS ./template -r -i 1500000 500000 diff --git a/Simulations/full_mpi/full_mpi_3GPU.o140159 b/Simulations/full_mpi/full_mpi_3GPU.o140159 new file mode 100644 index 0000000..158cd8f --- /dev/null +++ 
b/Simulations/full_mpi/full_mpi_3GPU.o140159 @@ -0,0 +1,604 @@ +REMAINING: 3 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +proc 1 +proc 2 +proc 0 +zone limite de 'log-exp' 1.00593 +zone limite de 'log-exp' 1.00593 +zone limite de 'log-exp' 1.00593 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 1, start 20053 size 20053 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 0, start 0 size 20053 +proc 0 start 0 size 20053 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 2, start 40106 size 20053 +proc 2 start 40106 size 20053 +proc 1 start 20053 size 20053 +iter : 1 Arret : 4.51053E-05 s/iter 0.366915 +iter : 2 Arret : 3.79748E-05 s/iter 0.366823 +iter : 3 Arret : 3.83563E-05 s/iter 0.366880 +iter : 4 Arret : 3.91196E-05 s/iter 0.366902 +iter : 5 Arret : 4.35007E-05 s/iter 0.366756 +iter : 6 Arret : 4.41483E-05 s/iter 0.366710 +iter : 7 Arret : 5.50718E-05 s/iter 0.366766 +iter : 8 Arret : 0.000118505 s/iter 0.366821 +iter : 9 Arret : 0.00208632 s/iter 0.366803 +iter : 10 Arret : 0.0219374 s/iter 0.366869 +iter : 11 Arret : 2.12364 s/iter 1.163790 +iter : 12 Arret : 0.290713 s/iter 0.366853 +iter : 13 Arret : 0.144909 s/iter 1.195713 +iter : 14 Arret : 0.0571799 s/iter 1.188579 +iter : 15 Arret : 0.017729 s/iter 1.192088 +iter : 16 Arret : 0.00942695 s/iter 1.186675 +iter : 17 Arret : 0.00614493 s/iter 1.170362 +iter : 18 Arret : 0.0046828 s/iter 1.012161 +iter : 19 Arret : 0.0210424 s/iter 0.356542 +iter : 20 Arret : 0.0167084 s/iter 0.355054 +iter : 21 Arret : 0.00421459 s/iter 0.348901 +iter : 22 Arret : 0.00178855 s/iter 0.342348 +iter : 23 Arret : 0.00897727 s/iter 0.340678 +iter : 24 Arret : 0.00287444 s/iter 0.336510 +iter : 25 Arret : 0.000362565 s/iter 0.336936 +iter : 26 Arret : 0.000252972 s/iter 0.337141 +iter : 27 Arret : 3.73204E-05 s/iter 0.328363 +iter : 28 Arret : 8.45973E-06 s/iter 0.334747 +iter : 29 Arret : 1.8159E-08 s/iter 0.324239 +iter : 30 Arret : 5.61914E-13 s/iter 0.337980 +temps : 16.3645 seconde(s) +Nb iterations : 30 +Nb de depassements de 
capacite exponentielle : 0 +Precision : 3.35784E-10 +Stabilite : 5.61914E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540783 +i* 0.841162| 1|-7.58456E-14 +i* 3.78031E-14| +| 2| -0.992343 +i* -0.123513| 1|-4.36456E-15 +i* 3.59435E-15| +| 3| 0.0563346 +i* 0.998412| 1| 5.70377E-15 +i* 3.3501E-14| +| 4| -0.802793 +i* -0.596258| 1| 2.03657E-15 +i* 1.01915E-14| +| 5| 0.730552 +i* -0.682857| 1|-7.48429E-14 +i* 6.77011E-14| +| 6| -0.442728 +i* 0.896656| 1|-3.77198E-14 +i*-1.89779E-15| +| 7| -0.404888 +i* -0.914366| 1| 3.20195E-14 +i* 9.65894E-15| +| 8| 0.972126 +i* -0.23446| 1| 4.02421E-14 +i*-1.54755E-14| +| 9| -0.826939 +i* 0.562292| 1| -2.4928E-14 +i*-1.59889E-14| +| 10| 0.0979895 +i* -0.995187| 1| 2.90878E-14 +i*-6.75675E-15| +| 11| 0.961513 +i* 0.27476| 1|-9.39769E-14 +i*-2.63912E-13| +| 12| -0.996627 +i* 0.0820589| 1| 2.39773E-14 +i* 1.74825E-14| +| 13| 0.575447 +i* -0.817839| 1|-3.49894E-14 +i*-7.98545E-14| +| 14| 0.701466 +i* 0.712703| 1| 7.52211E-14 +i* 1.53991E-14| +| 15| 0.259346 +i* 0.965785| 1|-2.14863E-14 +i*-2.81355E-14| +| 16| -0.907773 +i* -0.419461| 1|-3.62869E-14 +i*-9.49414E-15| +| 17| 0.903623 +i* -0.428329| 1|-1.24969E-14 +i* 7.51222E-14| +| 18| -0.249979 +i* 0.968251| 1|-1.59074E-14 +i*-1.09721E-14| +| 19| -0.583426 +i* -0.812166| 1| 4.94882E-14 +i*-9.16107E-15| +| 20| 0.997383 +i* 0.072297| 1| 2.53037E-13 +i*-5.92819E-13| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 1 +proc 1 +proc 2 +proc 0 +zone limite de 'log-exp' 1.00237 +zone limite de 'log-exp' 1.00237 +zone limite de 'log-exp' 1.00237 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 1, start 50005 size 50005 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 0, start 0 size 50005 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 2, start 100010 size 50005 +proc 1 start 50005 size 50005 
+proc 0 start 0 size 50005 +proc 2 start 100010 size 50005 +iter : 1 Arret : 1.83619E-05 s/iter 1.833058 +iter : 2 Arret : 1.73853E-05 s/iter 1.832458 +iter : 3 Arret : 1.70553E-05 s/iter 1.832448 +iter : 4 Arret : 1.72513E-05 s/iter 1.832684 +iter : 5 Arret : 1.69749E-05 s/iter 1.832295 +iter : 6 Arret : 1.78708E-05 s/iter 1.832450 +iter : 7 Arret : 2.02323E-05 s/iter 1.832391 +iter : 8 Arret : 2.61959E-05 s/iter 1.832666 +iter : 9 Arret : 0.000263463 s/iter 1.832325 +iter : 10 Arret : 0.00201062 s/iter 1.832469 +iter : 11 Arret : 0.0177962 s/iter 1.832459 +iter : 12 Arret : 0.00945112 s/iter 1.832643 +iter : 13 Arret : 1.13842 s/iter 3.083910 +iter : 14 Arret : 0.0340957 s/iter 3.886935 +iter : 15 Arret : 0.0812119 s/iter 1.824686 +iter : 16 Arret : 0.16371 s/iter 3.884591 +iter : 17 Arret : 0.0770217 s/iter 3.594364 +iter : 18 Arret : 0.0145081 s/iter 3.552164 +iter : 19 Arret : 0.00446866 s/iter 2.726939 +iter : 20 Arret : 0.00786537 s/iter 1.794160 +iter : 21 Arret : 0.0166355 s/iter 1.779567 +iter : 22 Arret : 0.0278383 s/iter 2.763164 +iter : 23 Arret : 0.00838616 s/iter 1.758182 +iter : 24 Arret : 0.000453907 s/iter 1.764407 +iter : 25 Arret : 3.67653E-05 s/iter 1.749282 +iter : 26 Arret : 1.55532E-05 s/iter 1.735726 +iter : 27 Arret : 9.01062E-07 s/iter 1.753730 +iter : 28 Arret : 4.37903E-10 s/iter 1.730440 +iter : 29 Arret : 3.95673E-15 s/iter 1.728429 +temps : 63.3058 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.26535E-09 +Stabilite : 3.95673E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540528 +i* 0.841326| 1| 8.68923E-14 +i* 2.2979E-13| +| 2| -0.905603 +i* -0.424127| 1| 6.50001E-14 +i* -3.0061E-14| +| 3| -0.774122 +i* 0.633037| 1|-3.89619E-14 +i*-6.71876E-14| +| 4| 0.317935 +i* -0.948113| 1| 4.656E-15 +i* 1.15645E-13| +| 5| 0.235775 +i* 0.971808| 
1|-4.13627E-14 +i* -1.0803E-13| +| 6| -0.717299 +i* -0.696766| 1| 5.63785E-15 +i*-6.71685E-14| +| 7| 0.992349 +i* -0.123462| 1|-4.81056E-13 +i* 9.00335E-13| +| 8| -0.938482 +i* 0.345329| 1|-6.95555E-14 +i*-3.79159E-14| +| 9| 0.610294 +i* -0.792175| 1| -5.4852E-14 +i*-3.26232E-14| +| 10| -0.0945977 +i* 0.995516| 1| 4.45165E-14 +i* 9.42527E-14| +| 11| -0.450242 +i* -0.892906| 1| 2.41855E-14 +i*-3.23699E-15| +| 12| 0.978218 +i* 0.207583| 1|-2.84429E-13 +i* 4.69725E-13| +| 13| -0.999806 +i* 0.0197069| 1|-4.72365E-14 +i*-2.55716E-14| +| 14| 0.835648 +i* -0.549265| 1|-2.95892E-13 +i* 2.34143E-13| +| 15| -0.414707 +i* 0.909955| 1| 7.26225E-14 +i*-1.70003E-15| +| 16| -0.133754 +i* -0.991015| 1|-2.88485E-14 +i* 2.14499E-14| +| 17| 0.856687 +i* 0.515837| 1| 1.49106E-13 +i* 3.95153E-14| +| 18| -0.951361 +i* -0.308079| 1| 3.78308E-14 +i* 4.65843E-14| +| 19| 0.969257 +i* -0.24605| 1| 5.51163E-13 +i*-4.79498E-13| +| 20| -0.689285 +i* 0.724491| 1| 2.40086E-15 +i*-3.61777E-14| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1 +proc 1 +proc 2 +proc 0 +zone limite de 'log-exp' 1.00142 +zone limite de 'log-exp' 1.00142 +zone limite de 'log-exp' 1.00142 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 1, start 83370 size 83370 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 2, start 166740 size 83370 +proc 2 start 166740 size 83370 +proc 1 start 83370 size 83370 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 0, start 0 size 83370 +proc 0 start 0 size 83370 +iter : 1 Arret : 1.04122E-05 s/iter 4.603075 +iter : 2 Arret : 9.85149E-06 s/iter 4.604055 +iter : 3 Arret : 1.14683E-05 s/iter 4.603262 +iter : 4 Arret : 1.02226E-05 s/iter 4.602431 +iter : 5 Arret : 1.00729E-05 s/iter 4.602619 +iter : 6 Arret : 1.06838E-05 s/iter 4.601869 +iter : 7 Arret : 1.12564E-05 s/iter 4.604882 +iter : 8 Arret : 1.08854E-05 s/iter 4.602271 +iter : 9 Arret : 1.68728E-05 s/iter 4.602965 +iter : 10 Arret : 0.000908721 s/iter 4.605369 +iter : 11 Arret 
: 0.00208199 s/iter 4.606164 +iter : 12 Arret : 0.00236846 s/iter 4.603500 +iter : 13 Arret : 0.00395957 s/iter 4.603136 +iter : 14 Arret : 0.000973404 s/iter 4.602278 +iter : 15 Arret : 0.00182712 s/iter 4.583661 +iter : 16 Arret : 0.00194671 s/iter 3.758842 +iter : 17 Arret : 0.00719321 s/iter 2.889771 +iter : 18 Arret : 0.295953 s/iter 2.852424 +iter : 19 Arret : 0.00337128 s/iter 4.408132 +iter : 20 Arret : 0.00333381 s/iter 2.836731 +iter : 21 Arret : 0.00266677 s/iter 2.831149 +iter : 22 Arret : 0.00107544 s/iter 2.801808 +iter : 23 Arret : 0.000320605 s/iter 2.803352 +iter : 24 Arret : 0.000173629 s/iter 2.830132 +iter : 25 Arret : 0.000233464 s/iter 2.803594 +iter : 26 Arret : 0.000160813 s/iter 2.829786 +iter : 27 Arret : 0.000120024 s/iter 2.786102 +iter : 28 Arret : 9.55845E-05 s/iter 2.819982 +iter : 29 Arret : 2.30991E-05 s/iter 2.839073 +iter : 30 Arret : 9.78684E-06 s/iter 2.820049 +iter : 31 Arret : 1.81912E-06 s/iter 2.795290 +iter : 32 Arret : 6.40862E-09 s/iter 2.814603 +iter : 33 Arret : 7.74157E-15 s/iter 2.794434 +temps : 122.621 seconde(s) +Nb iterations : 33 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.05316E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540427 +i* 0.841391| 1| 9.7148E-14 +i*-1.98189E-13| +| 2| -0.997949 +i* 0.0640067| 1| 1.02696E-14 +i* 2.88415E-14| +| 3| 0.450991 +i* -0.892528| 1| 2.39739E-15 +i* 7.66835E-14| +| 4| 0.42851 +i* -0.903537| 1| 1.03733E-13 +i* 1.27433E-14| +| 5| -0.996035 +i* 0.0889649| 1| 5.1386E-14 +i* 4.21729E-14| +| 6| 0.581876 +i* 0.813277| 1| 3.29906E-13 +i* -3.5718E-15| +| 7| 0.405761 +i* -0.913979| 1| 1.69923E-13 +i*-8.86062E-14| +| 8| -0.993496 +i* 0.113867| 1| 6.34562E-14 +i* 6.04291E-14| +| 9| 0.60205 +i* 0.798458| 1| 2.39371E-13 +i* -2.2848E-13| +| 10| 0.382757 +i* -0.923849| 1| 6.36852E-14 +i* 1.1601E-13| 
+| 11| -0.990335 +i* 0.138698| 1| 8.32286E-14 +i* 4.57395E-14| +| 12| 0.621846 +i* 0.783139| 1| 3.5482E-14 +i*-1.57841E-13| +| 13| 0.359514 +i* -0.93314| 1| 1.00985E-13 +i*-2.52237E-13| +| 14| -0.986553 +i* 0.163442| 1| 3.24636E-14 +i* 4.58574E-14| +| 15| 0.641253 +i* 0.767329| 1| 1.79533E-13 +i* 3.03096E-13| +| 16| 0.336045 +i* -0.941846| 1| 1.38948E-13 +i*-8.14071E-14| +| 17| -0.982153 +i* 0.188084| 1| 6.94549E-14 +i* 3.09405E-14| +| 18| 0.660258 +i* 0.751039| 1| 4.21871E-13 +i* 5.02185E-14| +| 19| 0.312366 +i* -0.949962| 1|-6.37199E-14 +i*-7.39669E-14| +| 20| -0.977138 +i* 0.212608| 1|-3.80633E-14 +i* -8.4285E-14| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 1 +proc 1 +proc 2 +proc 0 +zone limite de 'log-exp' 1.00101 +zone limite de 'log-exp' 1.00101 +zone limite de 'log-exp' 1.00101 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 1, start 116736 size 116736 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 2, start 233472 size 116736 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 0, start 0 size 116736 +proc 0 start 0 size 116736 +proc 1 start 116736 size 116736 +proc 2 start 233472 size 116736 +iter : 1 Arret : 7.25108E-06 s/iter 8.701598 +iter : 2 Arret : 7.01169E-06 s/iter 8.695411 +iter : 3 Arret : 7.08063E-06 s/iter 8.691498 +iter : 4 Arret : 6.71613E-06 s/iter 8.696067 +iter : 5 Arret : 8.00231E-06 s/iter 8.693456 +iter : 6 Arret : 6.92129E-06 s/iter 8.693906 +iter : 7 Arret : 7.08909E-06 s/iter 8.691731 +iter : 8 Arret : 7.80014E-06 s/iter 8.689556 +iter : 9 Arret : 1.05064E-05 s/iter 8.687045 +iter : 10 Arret : 0.000743236 s/iter 8.683404 +iter : 11 Arret : 0.000665165 s/iter 8.679771 +iter : 12 Arret : 0.00104331 s/iter 8.679382 +iter : 13 Arret : 0.820946 s/iter 8.680273 +iter : 14 Arret : 3.39143 s/iter 10.141868 +iter : 15 Arret : 0.124079 s/iter 10.120875 +iter : 16 Arret : 0.060865 s/iter 10.097925 +iter : 17 Arret : 0.0362188 s/iter 10.080714 +iter : 18 Arret : 0.0235232 s/iter 
13.316578 +iter : 19 Arret : 0.019308 s/iter 10.793160 +iter : 20 Arret : 0.0181476 s/iter 10.220050 +iter : 21 Arret : 0.0341411 s/iter 13.317077 +iter : 22 Arret : 0.0238257 s/iter 13.520573 +iter : 23 Arret : 0.0622072 s/iter 13.384251 +iter : 24 Arret : 0.0384535 s/iter 13.405236 +iter : 25 Arret : 0.0315007 s/iter 13.389625 +iter : 26 Arret : 0.0793407 s/iter 13.377513 +iter : 27 Arret : 0.00511819 s/iter 13.311241 +iter : 28 Arret : 0.000404404 s/iter 8.624483 +iter : 29 Arret : 8.29183E-05 s/iter 8.623864 +iter : 30 Arret : 0.000107024 s/iter 8.624427 +iter : 31 Arret : 1.83455E-05 s/iter 8.626520 +iter : 32 Arret : 9.95568E-06 s/iter 8.624102 +iter : 33 Arret : 3.50874E-06 s/iter 8.630894 +iter : 34 Arret : 3.09608E-08 s/iter 8.626743 +iter : 35 Arret : 1.44506E-13 s/iter 8.626785 +temps : 350.829 seconde(s) +Nb iterations : 35 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.46096E-08 +Stabilite : 1.11023E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540399 +i* 0.841409| 1| 5.12961E-13 +i*-3.37404E-15| +| 2| -0.385479 +i* 0.922716| 1| -1.616E-13 +i*-2.73566E-14| +| 3| -0.770131 +i* 0.637886| 1|-1.38431E-15 +i* 1.70921E-13| +| 4| -0.978357 +i* 0.206925| 1|-3.07393E-15 +i* 4.96131E-15| +| 5| -0.962455 +i* -0.27144| 1|-5.85088E-14 +i* 7.9714E-14| +| 6| -0.72607 +i* -0.687621| 1| -2.0612E-14 +i* 2.87948E-13| +| 7| -0.323352 +i* -0.946279| 1| 2.27159E-13 +i* 7.30891E-14| +| 8| 0.153459 +i* -0.988155| 1| 4.60049E-15 +i*-2.43555E-14| +| 9| 0.595097 +i* -0.803654| 1|-3.46265E-13 +i* 1.60098E-14| +| 10| 0.900408 +i* -0.435047| 1| 3.20081E-13 +i*-1.77827E-14| +| 11| 0.999448 +i* 0.0332229| 1|-5.70342E-13 +i* 1.21308E-12| +| 12| 0.869529 +i* 0.493882| 1| 3.01252E-14 +i* 6.11216E-13| +| 13| 0.211292 +i* 0.977423| 1|-6.97532E-14 +i* 1.23212E-13| +| 14| -0.267139 +i* 0.963658| 1|-9.26238E-14 
+i*-7.20968E-14| +| 15| -0.684372 +i* 0.729133| 1| 1.64042E-13 +i*-1.89831E-14| +| 16| -0.944825 +i* 0.327574| 1| 3.70572E-14 +i*-6.84904E-14| +| 17| -0.988833 +i* -0.149027| 1|-1.41002E-13 +i* 2.02581E-14| +| 18| -0.806314 +i* -0.591488| 1| 1.24668E-13 +i*-2.62805E-13| +| 19| -0.439079 +i* -0.898448| 1|-1.76949E-13 +i*-1.05707E-13| +| 20| 0.0287415 +i* -0.999587| 1| 1.62724E-13 +i*-6.82891E-14| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 1 +proc 1 +proc 2 +proc 0 +zone limite de 'log-exp' 1.00071 +zone limite de 'log-exp' 1.00071 +zone limite de 'log-exp' 1.00071 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 2, start 333482 size 166741 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 1, start 166741 size 166741 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 0, start 0 size 166741 +proc 0 start 0 size 166741 +proc 1 start 166741 size 166741 +proc 2 start 333482 size 166741 +iter : 1 Arret : 5.44829E-06 s/iter 17.188421 +iter : 2 Arret : 5.42874E-06 s/iter 17.137695 +iter : 3 Arret : 5.23492E-06 s/iter 17.123244 +iter : 4 Arret : 5.51556E-06 s/iter 17.128160 +iter : 5 Arret : 5.22118E-06 s/iter 17.122102 +iter : 6 Arret : 5.01816E-06 s/iter 17.123783 +iter : 7 Arret : 5.0087E-06 s/iter 17.115281 +iter : 8 Arret : 5.28527E-06 s/iter 17.120375 +iter : 9 Arret : 6.38913E-06 s/iter 17.121394 +iter : 10 Arret : 2.99276E-05 s/iter 17.125175 +iter : 11 Arret : 0.000916092 s/iter 17.123111 +iter : 12 Arret : 0.00112622 s/iter 17.129686 +iter : 13 Arret : 0.00199901 s/iter 18.785503 +iter : 14 Arret : 0.00536103 s/iter 17.609054 +iter : 15 Arret : 0.00620338 s/iter 18.429826 +iter : 16 Arret : 0.00463214 s/iter 16.044795 +iter : 17 Arret : 1.5572 s/iter 16.371044 +iter : 18 Arret : 0.084601 s/iter 14.529226 +iter : 19 Arret : 0.0115579 s/iter 15.452523 +iter : 20 Arret : 0.00599505 s/iter 14.669002 +iter : 21 Arret : 0.00192484 s/iter 10.219969 +iter : 22 Arret : 0.0109349 s/iter 10.105479 +iter : 23 Arret 
: 0.00351895 s/iter 9.786904 +iter : 24 Arret : 8.50621E-05 s/iter 8.935303 +iter : 25 Arret : 3.28381E-05 s/iter 8.653848 +iter : 26 Arret : 4.45938E-06 s/iter 8.532165 +iter : 27 Arret : 1.46328E-08 s/iter 8.457670 +iter : 28 Arret : 4.31796E-14 s/iter 8.370340 +temps : 410.952 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.48768E-08 +Stabilite : 1.44695E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540372 +i* 0.841426| 1|-3.05235E-13 +i* 1.38721E-13| +| 2| 0.561316 +i* 0.827602| 1|-2.60021E-13 +i* 1.9206E-13| +| 3| 0.57165 +i* 0.820497| 1|-1.83308E-13 +i* 6.15844E-14| +| 4| 0.581895 +i* 0.813264| 1| 3.05839E-13 +i* 6.52482E-14| +| 5| 0.592048 +i* 0.805902| 1|-7.14016E-13 +i*-3.98882E-14| +| 6| 0.602109 +i* 0.798414| 1| 2.66658E-13 +i*-4.75979E-13| +| 7| 0.612074 +i* 0.7908| 1| 3.16743E-13 +i*-3.40844E-13| +| 8| 0.621943 +i* 0.783062| 1| 5.64146E-13 +i*-3.14632E-13| +| 9| 0.631715 +i* 0.775201| 1|-3.83756E-14 +i* 5.41086E-13| +| 10| 0.641387 +i* 0.767218| 1| 4.00499E-13 +i*-3.71465E-13| +| 11| 0.650958 +i* 0.759114| 1| 7.58768E-15 +i*-5.54055E-13| +| 12| 0.660427 +i* 0.750891| 1| 7.47999E-13 +i* 2.73089E-13| +| 13| 0.669792 +i* 0.742549| 1| 9.40577E-13 +i* 3.39433E-14| +| 14| 0.679051 +i* 0.734091| 1| 4.34264E-13 +i*-1.04887E-13| +| 15| 0.688204 +i* 0.725517| 1|-6.26926E-13 +i*-1.86798E-13| +| 16| 0.697248 +i* 0.71683| 1| 2.2389E-13 +i*-9.46795E-14| +| 17| 0.706183 +i* 0.708029| 1| 4.79186E-13 +i* 4.75144E-13| +| 18| 0.715007 +i* 0.699117| 1| 6.39138E-13 +i* 4.95824E-13| +| 19| 0.723718 +i* 0.690096| 1| -1.2694E-13 +i* 4.44528E-13| +| 20| 0.732316 +i* 0.680965| 1|-2.76158E-13 +i* 1.17734E-13| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +proc 0 +proc 1 +proc 2 +zone limite de 'log-exp' 1.00059 +zone 
limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 1, start 200021 size 200021 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 2, start 400042 size 200021 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 200021 +proc 0 start 0 size 200021 +proc 2 start 400042 size 200021 +proc 1 start 200021 size 200021 +iter : 1 Arret : 4.17374E-06 s/iter 25.553089 +iter : 2 Arret : 4.24471E-06 s/iter 25.497354 +iter : 3 Arret : 4.02926E-06 s/iter 25.510295 +iter : 4 Arret : 3.90309E-06 s/iter 25.498014 +iter : 5 Arret : 4.14737E-06 s/iter 25.505852 +iter : 6 Arret : 4.14451E-06 s/iter 25.510250 +iter : 7 Arret : 4.54952E-06 s/iter 25.534869 +iter : 8 Arret : 4.39097E-06 s/iter 25.519822 +iter : 9 Arret : 5.39778E-06 s/iter 25.501601 +iter : 10 Arret : 1.06277E-05 s/iter 25.514311 +iter : 11 Arret : 0.000466846 s/iter 25.483886 +iter : 12 Arret : 0.00147408 s/iter 25.506990 +iter : 13 Arret : 0.917202 s/iter 25.532816 +iter : 14 Arret : 0.738772 s/iter 25.543670 +iter : 15 Arret : 1.09406 s/iter 33.427707 +iter : 16 Arret : 0.0147818 s/iter 30.484631 +iter : 17 Arret : 0.00982586 s/iter 27.428111 +iter : 18 Arret : 0.00305155 s/iter 23.911742 +iter : 19 Arret : 0.00879189 s/iter 27.378373 +iter : 20 Arret : 0.0148466 s/iter 27.330975 +iter : 21 Arret : 0.00541507 s/iter 27.053957 +iter : 22 Arret : 0.00917579 s/iter 22.028199 +iter : 23 Arret : 0.00176967 s/iter 24.447698 +iter : 24 Arret : 0.000776941 s/iter 21.846447 +iter : 25 Arret : 1.85979E-05 s/iter 21.763637 +iter : 26 Arret : 5.99112E-08 s/iter 21.943537 +iter : 27 Arret : 6.36688E-13 s/iter 21.839783 +temps : 688.615 seconde(s) +Nb iterations : 27 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.72079E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 
+i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.553493 +i* -0.832854| 1|-5.02858E-13 +i* 3.83374E-15| +| 3| -0.579338 +i* -0.815087| 1| 4.42365E-13 +i* 2.65846E-14| +| 4| 0.592057 +i* 0.805896| 1| 2.06783E-13 +i* 1.94549E-13| +| 5| -0.604613 +i* -0.796519| 1| 2.39135E-13 +i* 2.96967E-13| +| 6| 0.617037 +i* 0.786934| 1|-3.70964E-13 +i* 2.85104E-13| +| 7| -0.629293 +i* -0.777168| 1| 3.4002E-13 +i* 1.14925E-14| +| 8| 0.641411 +i* 0.767198| 1|-6.01835E-13 +i* 5.70316E-13| +| 9| -0.653354 +i* -0.757052| 1| 3.00003E-14 +i* 4.1084E-13| +| 10| 0.665153 +i* 0.746707| 1|-9.55243E-14 +i* 7.739E-13| +| 11| -0.676773 +i* -0.736192| 1|-3.70891E-13 +i* 4.31963E-14| +| 12| 0.688242 +i* 0.725482| 1| 4.17319E-13 +i*-2.25125E-13| +| 13| -0.699526 +i* -0.714607| 1|-1.55074E-13 +i* 3.9467E-13| +| 14| 0.710653 +i* 0.703543| 1|-7.94843E-13 +i* 5.61671E-13| +| 15| -0.721591 +i* -0.69232| 1|-8.20351E-14 +i* 3.39909E-13| +| 16| 0.732366 +i* 0.680912| 1| 5.01595E-13 +i* 2.59279E-13| +| 17| -0.742946 +i* -0.669351| 1|-1.90181E-13 +i* 1.23972E-13| +| 18| 0.753358 +i* 0.657611| 1|-7.14661E-13 +i*-3.96187E-13| +| 19| -0.76357 +i* -0.645725| 1|-3.31242E-13 +i*-8.50865E-14| +| 20| 0.773609 +i* 0.633664| 1|-7.93813E-13 +i* 2.09313E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +proc 1 +proc 2 +proc 0 +zone limite de 'log-exp' 1.00051 +zone limite de 'log-exp' 1.00051 +zone limite de 'log-exp' 1.00051 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 2, start 466772 size 233386 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 1, start 233386 size 233386 +proc 2 start 466772 size 233386 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 0, start 0 size 233386 +proc 0 start 0 size 233386 +proc 1 start 233386 size 233386 +iter : 1 Arret : 3.63067E-06 s/iter 34.355771 +iter : 2 Arret : 3.51666E-06 s/iter 34.313476 +iter : 3 Arret : 3.37718E-06 s/iter 34.302244 +iter : 4 Arret : 3.51452E-06 s/iter 34.331891 +iter : 5 Arret : 
3.53495E-06 s/iter 34.305875 +iter : 6 Arret : 3.54533E-06 s/iter 34.270154 +iter : 7 Arret : 3.57791E-06 s/iter 34.269601 +iter : 8 Arret : 3.49843E-06 s/iter 34.269532 +iter : 9 Arret : 3.56279E-06 s/iter 34.267016 +iter : 10 Arret : 6.70933E-06 s/iter 34.264316 +iter : 11 Arret : 0.000744895 s/iter 34.272504 +iter : 12 Arret : 0.0168677 s/iter 34.261719 +iter : 13 Arret : 0.0132741 s/iter 41.631459 +iter : 14 Arret : 0.0144504 s/iter 34.370399 +iter : 15 Arret : 0.0148871 s/iter 34.380936 +iter : 16 Arret : 0.117079 s/iter 42.029927 +iter : 17 Arret : 0.125622 s/iter 35.777828 +iter : 18 Arret : 0.0338842 s/iter 34.659887 +iter : 19 Arret : 0.0255305 s/iter 34.785339 +iter : 20 Arret : 0.0303666 s/iter 35.462034 +iter : 21 Arret : 0.0337579 s/iter 34.650721 +iter : 22 Arret : 0.0214608 s/iter 34.657778 +iter : 23 Arret : 0.00401409 s/iter 37.611052 +iter : 24 Arret : 0.00127792 s/iter 34.577885 +iter : 25 Arret : 0.000708122 s/iter 34.760828 +iter : 26 Arret : 1.94192E-06 s/iter 34.694471 +iter : 27 Arret : 3.18954E-08 s/iter 34.634308 +iter : 28 Arret : 1.15496E-13 s/iter 34.588120 +temps : 985.364 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.46263E-08 +Stabilite : 1.15496E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540352 +i* 0.841439| 1| 4.39978E-13 +i* 6.25043E-13| +| 2| -0.996034 +i* 0.0889731| 1| 2.2073E-13 +i* 1.55296E-13| +| 3| 0.439836 +i* -0.898078| 1|-3.55927E-13 +i*-1.21738E-13| +| 4| 0.38266 +i* -0.923889| 1|-2.56142E-13 +i*-7.02285E-14| +| 5| -0.988496 +i* 0.15125| 1|-1.52652E-13 +i*-1.11329E-13| +| 6| 0.641421 +i* 0.767189| 1|-1.31044E-13 +i* 5.61736E-13| +| 7| 0.323979 +i* -0.946064| 1|-4.52336E-13 +i* 8.74596E-14| +| 8| -0.977067 +i* 0.212932| 1| 8.58341E-14 +i* 1.73412E-13| +| 9| 0.688262 +i* 0.725462| 1| 4.28754E-14 +i* 1.08849E-12| +| 10| 
0.264022 +i* -0.964517| 1|-3.63883E-13 +i*-8.14886E-14| +| 11| -0.961793 +i* 0.273776| 1| -3.0213E-13 +i*-2.13897E-13| +| 12| 0.732395 +i* 0.68088| 1|-3.65194E-14 +i* 7.95483E-13| +| 13| 0.203027 +i* -0.979173| 1|-3.14502E-13 +i* 2.96924E-13| +| 14| -0.942735 +i* 0.333543| 1| 1.82947E-13 +i*-4.73458E-14| +| 15| 0.773646 +i* 0.633619| 1| 2.24352E-13 +i* 2.79674E-13| +| 16| 0.141232 +i* -0.989977| 1| -1.0035E-13 +i* 1.5693E-13| +| 17| -0.919967 +i* 0.391997| 1| 2.89213E-14 +i*-1.86252E-13| +| 18| 0.811852 +i* 0.583864| 1|-1.59939E-12 +i*-4.13669E-13| +| 19| 0.0788818 +i* -0.996884| 1|-2.83003E-13 +i* 1.04711E-13| +| 20| -0.893578 +i* 0.448908| 1| 4.59736E-14 +i* 1.31414E-13| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 1 +proc 1 +proc 2 +proc 0 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 2, start 533332 size 266666 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 266666 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 1, start 266666 size 266666 +proc 1 start 266666 size 266666 +proc 2 start 533332 size 266666 +proc 0 start 0 size 266666 +iter : 1 Arret : 3.65034E-06 s/iter 44.298468 +iter : 2 Arret : 3.20717E-06 s/iter 44.362840 +iter : 3 Arret : 3.28214E-06 s/iter 44.348033 +iter : 4 Arret : 3.53473E-06 s/iter 44.372779 +iter : 5 Arret : 3.64435E-06 s/iter 44.339393 +iter : 6 Arret : 3.48715E-06 s/iter 44.311216 +iter : 7 Arret : 3.20236E-06 s/iter 44.195501 +iter : 8 Arret : 3.46765E-06 s/iter 44.337231 +iter : 9 Arret : 4.55782E-06 s/iter 44.336266 +iter : 10 Arret : 3.03387E-05 s/iter 44.344481 +iter : 11 Arret : 0.000895058 s/iter 44.372449 +iter : 12 Arret : 0.00155707 s/iter 51.112648 +iter : 13 Arret : 1.43645 s/iter 52.743256 +iter : 14 Arret : 1.09102 s/iter 44.524633 +iter : 15 Arret : 0.0755624 s/iter 44.574228 +iter : 16 Arret : 0.0191023 s/iter 48.607142 +iter : 17 
Arret : 0.0113021 s/iter 49.878872 +iter : 18 Arret : 0.0136773 s/iter 47.858875 +iter : 19 Arret : 0.0252439 s/iter 39.188313 +iter : 20 Arret : 0.034702 s/iter 39.327917 +iter : 21 Arret : 0.0204901 s/iter 41.570418 +iter : 22 Arret : 0.00860925 s/iter 42.424027 +iter : 23 Arret : 0.0024318 s/iter 40.816516 +iter : 24 Arret : 0.000206468 s/iter 32.760844 +iter : 25 Arret : 0.000152172 s/iter 31.523865 +iter : 26 Arret : 0.000466464 s/iter 30.993628 +iter : 27 Arret : 7.31094E-05 s/iter 30.855992 +iter : 28 Arret : 3.56766E-10 s/iter 31.007972 +iter : 29 Arret : 8.9509E-16 s/iter 30.809036 +temps : 1218.9 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 0.0233219 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| 0.592061 +i* 0.805893| 1|-1.57249E-13 +i*-4.43364E-13| +| 3| 0.617051 +i* 0.786923| 1|-6.42805E-13 +i*-3.49094E-13| +| 4| 0.641434 +i* 0.767178| 1| 1.00022E-12 +i*-5.90578E-13| +| 5| 0.665186 +i* 0.746678| 1|-2.53998E-14 +i*-1.14684E-12| +| 6| 0.688283 +i* 0.725442| 1|-8.68732E-13 +i* 8.52696E-13| +| 7| 0.710703 +i* 0.703493| 1| 2.02581E-13 +i* 4.54699E-13| +| 8| 0.732422 +i* 0.680851| 1|-5.22353E-13 +i*-3.99873E-13| +| 9| 0.753421 +i* 0.657538| 1| 1.23356E-13 +i*-1.05986E-12| +| 10| 0.773678 +i* 0.633579| 1|-6.75196E-13 +i* 3.60108E-13| +| 11| 0.793174 +i* 0.608995| 1| 4.43853E-13 +i*-1.42398E-12| +| 12| 0.811888 +i* 0.583813| 1|-4.10491E-13 +i*-4.46651E-13| +| 13| 0.829804 +i* 0.558055| 1| 1.30045E-12 +i* 1.12788E-13| +| 14| 0.846902 +i* 0.531748| 1|-8.09419E-13 +i* 4.98091E-13| +| 15| 0.863167 +i* 0.504918| 1| 2.98522E-13 +i* 3.81547E-13| +| 16| 0.878582 +i* 0.477591| 1|-3.06581E-13 +i*-6.95869E-13| +| 17| 0.893133 +i* 0.449793| 1| 1.24355E-13 +i* -1.3239E-12| +| 18| 0.906804 +i* 
0.421553| 1|-1.23117E-12 +i*-5.57117E-13| +| 19| 0.919582 +i* 0.392898| 1|-1.03648E-12 +i* 2.90445E-14| +| 20| 0.931455 +i* 0.363856| 1|-6.42708E-13 +i*-1.50318E-12| ++---+----------------------------+------------+----------------------------+ +799998 racines de module = 1 + 2 racines de module = 0.999973 diff --git a/Simulations/full_mpi/full_mpi_3GPU.sge b/Simulations/full_mpi/full_mpi_3GPU.sge new file mode 100644 index 0000000..53261fe --- /dev/null +++ b/Simulations/full_mpi/full_mpi_3GPU.sge @@ -0,0 +1,25 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=3 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -V +#$ -cwd +#$ -N full_mpi_3GPU +#$ -pe mpi 3 + + +module load cuda/7.0 +module load ompi/gcc + +mpirun -np $NSLOTS ./template -r -i 60000 40000 +mpirun -np $NSLOTS ./template -r -i 150000 50000 +mpirun -np $NSLOTS ./template -r -i 250000 150000 +mpirun -np $NSLOTS ./template -r -i 350000 250000 +mpirun -np $NSLOTS ./template -r -i 500000 300000 +mpirun -np $NSLOTS ./template -r -i 600000 400000 +mpirun -np $NSLOTS ./template -r -i 700000 500000 +mpirun -np $NSLOTS ./template -r -i 800000 600000 +#mpirun -np $NSLOTS ./template -r -i 900000 700000 +#mpirun -np $NSLOTS ./template -r -i 1000000 800000 +#mpirun -np $NSLOTS ./template -r -i 1500000 500000 diff --git a/Simulations/full_mpi/full_mpi_4GPU.o140132 b/Simulations/full_mpi/full_mpi_4GPU.o140132 new file mode 100644 index 0000000..2c3dc2a --- /dev/null +++ b/Simulations/full_mpi/full_mpi_4GPU.o140132 @@ -0,0 +1,622 @@ +REMAINING: 4 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +Taking GPU #3 +proc 1 +proc 2 +proc 3 +proc 0 +zone limite de 'log-exp' 1.00593 +zone limite de 'log-exp' 1.00593 +zone limite de 'log-exp' 1.00593 +zone limite de 'log-exp' 1.00593 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 1, start 15040 size 15040 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 3, start 45120 size 15040 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 0, start 0 size 15040 +proc 1 start 15040 size 15040 +proc 3 
start 45120 size 15040 +proc 0 start 0 size 15040 +dimgrid 235 dimblock 256 degrePoly 60000 +proc 2, start 30080 size 15040 +proc 2 start 30080 size 15040 +iter : 1 Arret : 4.54253E-05 s/iter 0.190120 +iter : 2 Arret : 4.02349E-05 s/iter 0.189998 +iter : 3 Arret : 4.05851E-05 s/iter 0.190002 +iter : 4 Arret : 3.90123E-05 s/iter 0.189988 +iter : 5 Arret : 4.05115E-05 s/iter 0.189940 +iter : 6 Arret : 4.39547E-05 s/iter 0.189985 +iter : 7 Arret : 5.458E-05 s/iter 0.189984 +iter : 8 Arret : 0.000119494 s/iter 0.189981 +iter : 9 Arret : 0.00168327 s/iter 0.189962 +iter : 10 Arret : 0.0030417 s/iter 0.189891 +iter : 11 Arret : 2.15612 s/iter 0.189972 +iter : 12 Arret : 0.346227 s/iter 0.190014 +iter : 13 Arret : 0.126669 s/iter 1.018201 +iter : 14 Arret : 0.0535949 s/iter 1.016001 +iter : 15 Arret : 0.0185974 s/iter 1.012376 +iter : 16 Arret : 0.0101783 s/iter 1.010000 +iter : 17 Arret : 0.00628304 s/iter 1.004893 +iter : 18 Arret : 0.00442205 s/iter 0.867780 +iter : 19 Arret : 0.00334052 s/iter 0.850989 +iter : 20 Arret : 0.166672 s/iter 0.833688 +iter : 21 Arret : 0.154722 s/iter 0.185018 +iter : 22 Arret : 0.0369513 s/iter 0.857692 +iter : 23 Arret : 0.00795041 s/iter 0.183896 +iter : 24 Arret : 0.00113436 s/iter 0.179252 +iter : 25 Arret : 0.000916314 s/iter 0.179162 +iter : 26 Arret : 0.000437934 s/iter 0.173024 +iter : 27 Arret : 0.000164013 s/iter 0.173156 +iter : 28 Arret : 0.000120343 s/iter 0.173113 +iter : 29 Arret : 0.000163904 s/iter 0.173138 +iter : 30 Arret : 9.69458E-05 s/iter 0.173072 +iter : 31 Arret : 8.66273E-06 s/iter 0.172998 +iter : 32 Arret : 2.89696E-08 s/iter 0.173059 +iter : 33 Arret : 8.96067E-13 s/iter 0.173085 +temps : 13.0123 seconde(s) +Nb iterations : 33 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.35784E-10 +Stabilite : 8.96067E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 
1| 0.540783 +i* 0.841162| 1|-7.58456E-14 +i* 3.78031E-14| +| 2| -0.992343 +i* -0.123513| 1|-2.28637E-15 +i*-5.45917E-15| +| 3| 0.0563346 +i* 0.998412| 1| 5.70377E-15 +i* 3.3501E-14| +| 4| -0.802793 +i* -0.596258| 1| 2.03657E-15 +i* 1.01915E-14| +| 5| 0.730552 +i* -0.682857| 1|-7.48429E-14 +i* 6.77011E-14| +| 6| -0.442728 +i* 0.896656| 1|-3.77198E-14 +i*-1.89779E-15| +| 7| -0.404888 +i* -0.914366| 1| 3.20195E-14 +i* 9.65894E-15| +| 8| 0.972126 +i* -0.23446| 1| 4.02421E-14 +i*-1.54755E-14| +| 9| -0.826939 +i* 0.562292| 1| -2.4928E-14 +i*-1.59889E-14| +| 10| 0.0979895 +i* -0.995187| 1| 2.90878E-14 +i*-6.75675E-15| +| 11| 0.961513 +i* 0.27476| 1|-9.39769E-14 +i*-2.63912E-13| +| 12| -0.996627 +i* 0.0820589| 1| 2.39773E-14 +i* 1.74825E-14| +| 13| 0.575447 +i* -0.817839| 1|-3.49894E-14 +i*-7.98545E-14| +| 14| 0.701466 +i* 0.712703| 1| 7.52211E-14 +i* 1.53991E-14| +| 15| 0.259346 +i* 0.965785| 1|-2.14863E-14 +i*-2.81355E-14| +| 16| -0.907773 +i* -0.419461| 1|-3.62869E-14 +i*-9.49414E-15| +| 17| 0.903623 +i* -0.428329| 1|-1.24969E-14 +i* 7.51222E-14| +| 18| -0.249979 +i* 0.968251| 1|-1.59074E-14 +i*-1.09721E-14| +| 19| -0.584107 +i* -0.811677| 1| 1.93838E-14 +i* -1.0613E-14| +| 20| 0.997383 +i* 0.072297| 1| 2.53037E-13 +i*-5.92819E-13| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 1 +proc 2 +proc 3 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00237 +zone limite de 'log-exp' 1.00237 +zone limite de 'log-exp' 1.00237 +zone limite de 'log-exp' 1.00237 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 0, start 0 size 37504 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 3, start 112512 size 37504 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 1, start 37504 size 37504 +dimgrid 586 dimblock 256 degrePoly 150000 +proc 2, start 75008 size 37504 +proc 2 start 75008 size 37504 +proc 0 start 0 size 37504 +proc 3 start 112512 size 37504 +proc 1 start 37504 size 37504 +iter : 1 Arret : 1.61155E-05 s/iter 1.388910 +iter : 2 
Arret : 1.5292E-05 s/iter 1.388566 +iter : 3 Arret : 1.53382E-05 s/iter 1.388256 +iter : 4 Arret : 1.53436E-05 s/iter 1.388459 +iter : 5 Arret : 1.56797E-05 s/iter 1.388267 +iter : 6 Arret : 1.62943E-05 s/iter 1.388223 +iter : 7 Arret : 1.78031E-05 s/iter 1.388438 +iter : 8 Arret : 2.07609E-05 s/iter 1.388272 +iter : 9 Arret : 4.52349E-05 s/iter 1.388452 +iter : 10 Arret : 0.00148307 s/iter 1.388277 +iter : 11 Arret : 0.00381365 s/iter 1.388380 +iter : 12 Arret : 0.00454231 s/iter 2.679420 +iter : 13 Arret : 0.017103 s/iter 2.976033 +iter : 14 Arret : 1.38869 s/iter 1.383510 +iter : 15 Arret : 0.0597475 s/iter 1.384033 +iter : 16 Arret : 0.0363329 s/iter 2.973069 +iter : 17 Arret : 0.0127731 s/iter 3.418217 +iter : 18 Arret : 0.0103682 s/iter 3.020991 +iter : 19 Arret : 0.00840855 s/iter 2.969344 +iter : 20 Arret : 0.00415465 s/iter 3.306301 +iter : 21 Arret : 0.00116781 s/iter 1.346551 +iter : 22 Arret : 0.00222874 s/iter 1.341294 +iter : 23 Arret : 0.00230842 s/iter 1.334988 +iter : 24 Arret : 0.00269266 s/iter 1.337748 +iter : 25 Arret : 0.000589182 s/iter 1.335027 +iter : 26 Arret : 1.15656E-05 s/iter 1.331811 +iter : 27 Arret : 2.039E-06 s/iter 1.328004 +iter : 28 Arret : 3.02093E-09 s/iter 1.343235 +iter : 29 Arret : 2.75813E-14 s/iter 1.332966 +temps : 51.6331 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.26507E-09 +Stabilite : 2.75813E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540528 +i* 0.841326| 1| 8.68923E-14 +i* 2.2979E-13| +| 2| -0.905603 +i* -0.424127| 1| 6.50001E-14 +i* -3.0061E-14| +| 3| -0.774122 +i* 0.633037| 1|-3.89619E-14 +i*-6.71876E-14| +| 4| 0.317935 +i* -0.948113| 1| 4.656E-15 +i* 1.15645E-13| +| 5| 0.235978 +i* 0.971758| 1|-2.91295E-14 +i*-3.06716E-14| +| 6| -0.717299 +i* -0.696766| 1| 5.63785E-15 +i*-6.71685E-14| +| 7| 0.992349 +i* 
-0.123462| 1|-4.81056E-13 +i* 9.00335E-13| +| 8| -0.938482 +i* 0.345329| 1|-6.95555E-14 +i*-3.79159E-14| +| 9| 0.610294 +i* -0.792175| 1| -5.4852E-14 +i*-3.26232E-14| +| 10| -0.0946394 +i* 0.995512| 1|-4.73788E-14 +i*-8.10827E-14| +| 11| -0.450242 +i* -0.892906| 1| 2.41855E-14 +i*-3.23699E-15| +| 12| 0.978218 +i* 0.207583| 1|-2.84429E-13 +i* 4.69725E-13| +| 13| -0.999806 +i* 0.0197069| 1|-4.72365E-14 +i*-2.55716E-14| +| 14| 0.835648 +i* -0.549265| 1|-2.95892E-13 +i* 2.34143E-13| +| 15| -0.414707 +i* 0.909955| 1| 7.26225E-14 +i*-1.70003E-15| +| 16| -0.133754 +i* -0.991015| 1|-2.88485E-14 +i* 2.14499E-14| +| 17| 0.856687 +i* 0.515837| 1| 1.49106E-13 +i* 3.95153E-14| +| 18| -0.951361 +i* -0.308079| 1| 3.78308E-14 +i* 4.65843E-14| +| 19| 0.969257 +i* -0.24605| 1| 5.51163E-13 +i*-4.79498E-13| +| 20| -0.689285 +i* 0.724491| 1| 2.40086E-15 +i*-3.61777E-14| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1 +proc 1 +proc 2 +proc 3 +proc 0 +zone limite de 'log-exp' 1.00142 +zone limite de 'log-exp' 1.00142 +zone limite de 'log-exp' 1.00142 +zone limite de 'log-exp' 1.00142 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 2, start 125056 size 62528 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 0, start 0 size 62528 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 3, start 187584 size 62528 +proc 3 start 187584 size 62528 +proc 2 start 125056 size 62528 +proc 0 start 0 size 62528 +dimgrid 977 dimblock 256 degrePoly 250000 +proc 1, start 62528 size 62528 +proc 1 start 62528 size 62528 +iter : 1 Arret : 1.11968E-05 s/iter 3.825242 +iter : 2 Arret : 1.00799E-05 s/iter 3.807837 +iter : 3 Arret : 9.41078E-06 s/iter 3.813149 +iter : 4 Arret : 9.26536E-06 s/iter 3.814952 +iter : 5 Arret : 9.34813E-06 s/iter 3.812300 +iter : 6 Arret : 9.56148E-06 s/iter 3.818827 +iter : 7 Arret : 9.85158E-06 s/iter 3.809789 +iter : 8 Arret : 1.00436E-05 s/iter 3.817985 +iter : 9 Arret : 3.01654E-05 s/iter 3.810639 +iter : 10 Arret : 
0.000664555 s/iter 3.818425 +iter : 11 Arret : 0.000737975 s/iter 3.818479 +iter : 12 Arret : 0.000983341 s/iter 3.816886 +iter : 13 Arret : 0.00169178 s/iter 3.818781 +iter : 14 Arret : 0.00246696 s/iter 3.818401 +iter : 15 Arret : 0.00246605 s/iter 3.779944 +iter : 16 Arret : 0.00658304 s/iter 2.977729 +iter : 17 Arret : 0.00690937 s/iter 5.004823 +iter : 18 Arret : 0.300013 s/iter 4.828460 +iter : 19 Arret : 0.0468449 s/iter 4.960936 +iter : 20 Arret : 0.00243593 s/iter 2.120119 +iter : 21 Arret : 0.000654892 s/iter 2.126485 +iter : 22 Arret : 0.00213423 s/iter 2.116250 +iter : 23 Arret : 0.000510708 s/iter 2.110308 +iter : 24 Arret : 0.00102843 s/iter 2.108799 +iter : 25 Arret : 0.000140837 s/iter 2.110467 +iter : 26 Arret : 9.44179E-05 s/iter 2.106952 +iter : 27 Arret : 2.22669E-05 s/iter 2.108487 +iter : 28 Arret : 1.36769E-06 s/iter 2.108960 +iter : 29 Arret : 2.186E-10 s/iter 2.111770 +iter : 30 Arret : 2.77556E-16 s/iter 2.094068 +temps : 98.5095 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.05316E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540427 +i* 0.841391| 1| 9.7148E-14 +i*-1.98189E-13| +| 2| -0.997949 +i* 0.0640067| 1| 1.02696E-14 +i* 2.88415E-14| +| 3| 0.450991 +i* -0.892528| 1| 2.39739E-15 +i* 7.66835E-14| +| 4| 0.42851 +i* -0.903537| 1| 1.03733E-13 +i* 1.27433E-14| +| 5| -0.996035 +i* 0.0889649| 1| 5.1386E-14 +i* 4.21729E-14| +| 6| 0.581876 +i* 0.813277| 1| 3.29906E-13 +i* -3.5718E-15| +| 7| 0.405761 +i* -0.913979| 1| 1.69923E-13 +i*-8.86062E-14| +| 8| -0.993496 +i* 0.113867| 1| 6.34562E-14 +i* 6.04291E-14| +| 9| 0.60205 +i* 0.798458| 1| 2.39371E-13 +i* -2.2848E-13| +| 10| 0.382757 +i* -0.923849| 1| 6.36852E-14 +i* 1.1601E-13| +| 11| -0.990335 +i* 0.138698| 1| 8.32286E-14 +i* 4.57395E-14| +| 12| 0.621846 +i* 0.783139| 1| 
3.5482E-14 +i*-1.57841E-13| +| 13| 0.359514 +i* -0.93314| 1| 1.00985E-13 +i*-2.52237E-13| +| 14| -0.986553 +i* 0.163442| 1| 3.24636E-14 +i* 4.58574E-14| +| 15| 0.641253 +i* 0.767329| 1| 1.79533E-13 +i* 3.03096E-13| +| 16| 0.336045 +i* -0.941846| 1| 1.38948E-13 +i*-8.14071E-14| +| 17| -0.982153 +i* 0.188084| 1| 6.94549E-14 +i* 3.09405E-14| +| 18| 0.660258 +i* 0.751039| 1| 4.21871E-13 +i* 5.02185E-14| +| 19| 0.312366 +i* -0.949962| 1|-6.37199E-14 +i*-7.39669E-14| +| 20| -0.977138 +i* 0.212608| 1|-3.80633E-14 +i* -8.4285E-14| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 1 +proc 0 +proc 1 +proc 2 +proc 3 +zone limite de 'log-exp' 1.00101 +zone limite de 'log-exp' 1.00101 +zone limite de 'log-exp' 1.00101 +zone limite de 'log-exp' 1.00101 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 3, start 262656 size 87552 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 1, start 87552 size 87552 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 2, start 175104 size 87552 +proc 1 start 87552 size 87552 +dimgrid 1368 dimblock 256 degrePoly 350000 +proc 0, start 0 size 87552 +proc 0 start 0 size 87552 +proc 3 start 262656 size 87552 +proc 2 start 175104 size 87552 +iter : 1 Arret : 7.37223E-06 s/iter 6.537086 +iter : 2 Arret : 6.87852E-06 s/iter 6.540337 +iter : 3 Arret : 6.62662E-06 s/iter 6.539807 +iter : 4 Arret : 6.78716E-06 s/iter 6.537314 +iter : 5 Arret : 6.73158E-06 s/iter 6.543333 +iter : 6 Arret : 7.46053E-06 s/iter 6.536618 +iter : 7 Arret : 7.08865E-06 s/iter 6.536382 +iter : 8 Arret : 7.79945E-06 s/iter 6.534593 +iter : 9 Arret : 9.74861E-06 s/iter 6.536504 +iter : 10 Arret : 0.000745782 s/iter 6.537362 +iter : 11 Arret : 0.000455744 s/iter 6.535194 +iter : 12 Arret : 0.00342228 s/iter 6.534104 +iter : 13 Arret : 0.810408 s/iter 6.536777 +iter : 14 Arret : 3.37422 s/iter 10.380895 +iter : 15 Arret : 0.136557 s/iter 11.212541 +iter : 16 Arret : 0.0661427 s/iter 9.571236 +iter : 17 Arret : 0.0390301 s/iter 
11.168500 +iter : 18 Arret : 0.056921 s/iter 11.419060 +iter : 19 Arret : 0.0851919 s/iter 11.272764 +iter : 20 Arret : 0.0308655 s/iter 11.252338 +iter : 21 Arret : 0.0183277 s/iter 11.252867 +iter : 22 Arret : 0.0401954 s/iter 10.205076 +iter : 23 Arret : 0.0540968 s/iter 11.305983 +iter : 24 Arret : 0.0434344 s/iter 10.978858 +iter : 25 Arret : 0.0335517 s/iter 11.237082 +iter : 26 Arret : 0.115944 s/iter 11.039900 +iter : 27 Arret : 0.0492573 s/iter 8.777420 +iter : 28 Arret : 0.0191575 s/iter 6.485398 +iter : 29 Arret : 0.0184729 s/iter 7.151590 +iter : 30 Arret : 0.00124008 s/iter 6.484897 +iter : 31 Arret : 6.47966E-05 s/iter 6.485006 +iter : 32 Arret : 4.59568E-05 s/iter 6.485609 +iter : 33 Arret : 3.27878E-06 s/iter 6.484358 +iter : 34 Arret : 2.62749E-10 s/iter 6.485211 +iter : 35 Arret : 1.0339E-15 s/iter 6.482394 +temps : 289.016 seconde(s) +Nb iterations : 35 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.46096E-08 +Stabilite : 1.11023E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540399 +i* 0.841409| 1| 5.12961E-13 +i*-3.37404E-15| +| 2| -0.385479 +i* 0.922716| 1| -1.616E-13 +i*-2.73566E-14| +| 3| -0.770131 +i* 0.637886| 1|-1.38431E-15 +i* 1.70921E-13| +| 4| -0.978357 +i* 0.206925| 1|-3.07393E-15 +i* 4.96131E-15| +| 5| -0.962455 +i* -0.27144| 1|-5.85088E-14 +i* 7.9714E-14| +| 6| -0.72607 +i* -0.687621| 1| -2.0612E-14 +i* 2.87948E-13| +| 7| -0.323352 +i* -0.946279| 1| 2.27159E-13 +i* 7.30891E-14| +| 8| 0.153459 +i* -0.988155| 1| 4.60049E-15 +i*-2.43555E-14| +| 9| 0.595097 +i* -0.803654| 1|-3.46265E-13 +i* 1.60098E-14| +| 10| 0.900408 +i* -0.435047| 1| 3.20081E-13 +i*-1.77827E-14| +| 11| 0.999448 +i* 0.0332229| 1|-5.70342E-13 +i* 1.21308E-12| +| 12| 0.869529 +i* 0.493882| 1| 3.01252E-14 +i* 6.11216E-13| +| 13| 0.211292 +i* 0.977423| 1|-6.97532E-14 +i* 1.23212E-13| +| 14| -0.267139 +i* 
0.963658| 1|-9.26238E-14 +i*-7.20968E-14| +| 15| -0.684372 +i* 0.729133| 1| 1.64042E-13 +i*-1.89831E-14| +| 16| -0.944825 +i* 0.327574| 1| 3.70572E-14 +i*-6.84904E-14| +| 17| -0.988833 +i* -0.149027| 1|-1.41002E-13 +i* 2.02581E-14| +| 18| -0.806314 +i* -0.591488| 1| 1.24668E-13 +i*-2.62805E-13| +| 19| -0.439079 +i* -0.898448| 1|-1.76949E-13 +i*-1.05707E-13| +| 20| 0.0287595 +i* -0.999586| 1| 4.76598E-14 +i*-1.43895E-14| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 1 +proc 0 +proc 1 +proc 2 +proc 3 +zone limite de 'log-exp' 1.00071 +zone limite de 'log-exp' 1.00071 +zone limite de 'log-exp' 1.00071 +zone limite de 'log-exp' 1.00071 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 3, start 375168 size 125056 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 1, start 125056 size 125056 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 2, start 250112 size 125056 +proc 1 start 125056 size 125056 +dimgrid 1954 dimblock 256 degrePoly 500000 +proc 0, start 0 size 125056 +proc 0 start 0 size 125056 +proc 3 start 375168 size 125056 +proc 2 start 250112 size 125056 +iter : 1 Arret : 5.43999E-06 s/iter 13.794000 +iter : 2 Arret : 4.91286E-06 s/iter 13.791136 +iter : 3 Arret : 4.80927E-06 s/iter 13.796273 +iter : 4 Arret : 4.84881E-06 s/iter 13.800496 +iter : 5 Arret : 4.97591E-06 s/iter 13.796980 +iter : 6 Arret : 4.79153E-06 s/iter 13.804318 +iter : 7 Arret : 4.83022E-06 s/iter 13.810851 +iter : 8 Arret : 5.21278E-06 s/iter 13.801380 +iter : 9 Arret : 6.23421E-06 s/iter 13.799572 +iter : 10 Arret : 6.92488E-05 s/iter 13.809235 +iter : 11 Arret : 0.00410439 s/iter 13.803771 +iter : 12 Arret : 0.00309009 s/iter 13.812651 +iter : 13 Arret : 0.0029815 s/iter 18.000127 +iter : 14 Arret : 0.00820943 s/iter 19.596298 +iter : 15 Arret : 0.0062262 s/iter 19.403564 +iter : 16 Arret : 1.4696 s/iter 14.578745 +iter : 17 Arret : 0.0225548 s/iter 15.759602 +iter : 18 Arret : 0.00265918 s/iter 11.703397 +iter : 19 Arret : 
0.0066924 s/iter 8.696998 +iter : 20 Arret : 0.00187233 s/iter 14.112555 +iter : 21 Arret : 0.00910475 s/iter 8.336565 +iter : 22 Arret : 0.0385392 s/iter 8.037996 +iter : 23 Arret : 0.0216755 s/iter 9.237626 +iter : 24 Arret : 0.0024009 s/iter 7.207663 +iter : 25 Arret : 0.00123955 s/iter 6.955790 +iter : 26 Arret : 3.53765E-05 s/iter 6.696812 +iter : 27 Arret : 7.34783E-06 s/iter 6.014489 +iter : 28 Arret : 1.71411E-07 s/iter 5.956492 +iter : 29 Arret : 3.11637E-12 s/iter 5.922541 +iter : 30 Arret : 1.57009E-16 s/iter 5.957097 +temps : 358.278 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.48768E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540372 +i* 0.841426| 1|-3.05235E-13 +i* 1.38721E-13| +| 2| 0.561316 +i* 0.827602| 1|-2.60021E-13 +i* 1.9206E-13| +| 3| 0.57165 +i* 0.820497| 1|-1.83308E-13 +i* 6.15844E-14| +| 4| 0.581895 +i* 0.813264| 1| 3.05839E-13 +i* 6.52482E-14| +| 5| 0.592048 +i* 0.805902| 1|-7.14016E-13 +i*-3.98882E-14| +| 6| 0.602109 +i* 0.798414| 1| 2.66658E-13 +i*-4.75979E-13| +| 7| 0.612074 +i* 0.7908| 1| 3.16743E-13 +i*-3.40844E-13| +| 8| 0.621943 +i* 0.783062| 1| 5.64146E-13 +i*-3.14632E-13| +| 9| 0.631715 +i* 0.775201| 1|-3.83756E-14 +i* 5.41086E-13| +| 10| 0.641387 +i* 0.767218| 1| 4.00499E-13 +i*-3.71465E-13| +| 11| 0.650958 +i* 0.759114| 1| 7.58768E-15 +i*-5.54055E-13| +| 12| 0.660427 +i* 0.750891| 1| 7.47999E-13 +i* 2.73089E-13| +| 13| 0.669792 +i* 0.742549| 1| 9.40577E-13 +i* 3.39433E-14| +| 14| 0.679051 +i* 0.734091| 1| 4.34264E-13 +i*-1.04887E-13| +| 15| 0.688204 +i* 0.725517| 1|-6.26926E-13 +i*-1.86798E-13| +| 16| 0.697248 +i* 0.71683| 1| 2.2389E-13 +i*-9.46795E-14| +| 17| 0.706183 +i* 0.708029| 1| 4.79186E-13 +i* 4.75144E-13| +| 18| 0.715007 +i* 0.699117| 1| 6.39138E-13 +i* 4.95824E-13| +| 19| 0.723718 +i* 0.690096| 
1| -1.2694E-13 +i* 4.44528E-13| +| 20| 0.732316 +i* 0.680965| 1|-2.76158E-13 +i* 1.17734E-13| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +proc 2 +proc 3 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 1, start 150016 size 150016 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 3, start 450048 size 150016 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 2, start 300032 size 150016 +proc 1 start 150016 size 150016 +proc 3 start 450048 size 150016 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 150016 +proc 0 start 0 size 150016 +proc 2 start 300032 size 150016 +iter : 1 Arret : 4.20321E-06 s/iter 18.775985 +iter : 2 Arret : 4.09855E-06 s/iter 18.747734 +iter : 3 Arret : 3.93391E-06 s/iter 18.730793 +iter : 4 Arret : 4.03193E-06 s/iter 18.732680 +iter : 5 Arret : 4.10736E-06 s/iter 18.735318 +iter : 6 Arret : 4.01386E-06 s/iter 18.743326 +iter : 7 Arret : 4.19451E-06 s/iter 18.739337 +iter : 8 Arret : 4.62309E-06 s/iter 18.741333 +iter : 9 Arret : 6.05422E-06 s/iter 18.740129 +iter : 10 Arret : 4.11892E-05 s/iter 18.733834 +iter : 11 Arret : 0.000517404 s/iter 18.736838 +iter : 12 Arret : 0.00114025 s/iter 18.735603 +iter : 13 Arret : 0.00285906 s/iter 18.781157 +iter : 14 Arret : 1.38645 s/iter 26.334716 +iter : 15 Arret : 0.623951 s/iter 22.498967 +iter : 16 Arret : 0.011785 s/iter 22.383771 +iter : 17 Arret : 0.0286509 s/iter 18.675149 +iter : 18 Arret : 0.0199337 s/iter 21.455577 +iter : 19 Arret : 0.00279992 s/iter 23.472538 +iter : 20 Arret : 0.00154477 s/iter 24.299102 +iter : 21 Arret : 0.000859833 s/iter 17.698308 +iter : 22 Arret : 0.000296794 s/iter 17.754719 +iter : 23 Arret : 3.50155E-05 s/iter 17.796812 +iter : 24 Arret : 1.46092E-05 s/iter 16.575301 +iter : 25 Arret : 1.13486E-05 s/iter 16.409288 +iter : 26 Arret : 
2.08371E-06 s/iter 16.504363 +iter : 27 Arret : 4.3351E-08 s/iter 16.502863 +iter : 28 Arret : 1.78892E-13 s/iter 17.369262 +temps : 539.966 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.553493 +i* -0.832854| 1|-5.02858E-13 +i* 3.83374E-15| +| 3| -0.579338 +i* -0.815087| 1| 4.42365E-13 +i* 2.65846E-14| +| 4| 0.592057 +i* 0.805896| 1| 2.06783E-13 +i* 1.94549E-13| +| 5| -0.604613 +i* -0.796519| 1| 2.39135E-13 +i* 2.96967E-13| +| 6| 0.617037 +i* 0.786934| 1|-3.70964E-13 +i* 2.85104E-13| +| 7| -0.629293 +i* -0.777168| 1| 3.4002E-13 +i* 1.14925E-14| +| 8| 0.641411 +i* 0.767198| 1|-6.01835E-13 +i* 5.70316E-13| +| 9| -0.653354 +i* -0.757052| 1| 3.00003E-14 +i* 4.1084E-13| +| 10| 0.665153 +i* 0.746707| 1|-9.55243E-14 +i* 7.739E-13| +| 11| -0.676773 +i* -0.736192| 1|-3.70891E-13 +i* 4.31963E-14| +| 12| 0.688242 +i* 0.725482| 1| 4.17319E-13 +i*-2.25125E-13| +| 13| -0.699526 +i* -0.714607| 1|-1.55074E-13 +i* 3.9467E-13| +| 14| 0.710653 +i* 0.703543| 1|-7.94843E-13 +i* 5.61671E-13| +| 15| -0.721591 +i* -0.69232| 1|-8.20351E-14 +i* 3.39909E-13| +| 16| 0.732366 +i* 0.680912| 1| 5.01595E-13 +i* 2.59279E-13| +| 17| -0.742946 +i* -0.669351| 1|-1.90181E-13 +i* 1.23972E-13| +| 18| 0.753358 +i* 0.657611| 1|-7.14661E-13 +i*-3.96187E-13| +| 19| -0.76357 +i* -0.645725| 1|-3.31242E-13 +i*-8.50865E-14| +| 20| 0.773609 +i* 0.633664| 1|-7.93813E-13 +i* 2.09313E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +proc 2 +proc 3 +proc 0 +proc 1 +zone limite de 'log-exp' 1.00051 +zone limite de 'log-exp' 1.00051 +zone limite de 'log-exp' 1.00051 +zone limite de 'log-exp' 1.00051 +dimgrid 2735 
dimblock 256 degrePoly 700000 +proc 2, start 350080 size 175040 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 1, start 175040 size 175040 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 3, start 525120 size 175040 +proc 3 start 525120 size 175040 +dimgrid 2735 dimblock 256 degrePoly 700000 +proc 0, start 0 size 175040 +proc 0 start 0 size 175040 +proc 2 start 350080 size 175040 +proc 1 start 175040 size 175040 +iter : 1 Arret : 4.05426E-06 s/iter 26.055375 +iter : 2 Arret : 3.62462E-06 s/iter 26.017320 +iter : 3 Arret : 3.57426E-06 s/iter 26.031338 +iter : 4 Arret : 3.57393E-06 s/iter 26.019895 +iter : 5 Arret : 3.53387E-06 s/iter 26.031664 +iter : 6 Arret : 3.57381E-06 s/iter 26.022006 +iter : 7 Arret : 4.05236E-06 s/iter 26.018695 +iter : 8 Arret : 3.5632E-06 s/iter 26.018506 +iter : 9 Arret : 3.74898E-06 s/iter 26.036369 +iter : 10 Arret : 1.82635E-05 s/iter 26.019377 +iter : 11 Arret : 0.0017458 s/iter 26.032260 +iter : 12 Arret : 0.00155961 s/iter 33.564621 +iter : 13 Arret : 0.00513024 s/iter 27.283039 +iter : 14 Arret : 0.00473339 s/iter 33.669836 +iter : 15 Arret : 0.00281261 s/iter 31.946913 +iter : 16 Arret : 0.00468659 s/iter 28.606391 +iter : 17 Arret : 0.0122921 s/iter 30.427694 +iter : 18 Arret : 0.0156527 s/iter 31.617517 +iter : 19 Arret : 0.0320085 s/iter 25.851204 +iter : 20 Arret : 0.22003 s/iter 25.842946 +iter : 21 Arret : 0.012535 s/iter 28.965802 +iter : 22 Arret : 0.00376424 s/iter 28.796070 +iter : 23 Arret : 0.00220948 s/iter 25.734592 +iter : 24 Arret : 0.00248624 s/iter 25.743976 +iter : 25 Arret : 0.000364428 s/iter 25.732814 +iter : 26 Arret : 0.000719089 s/iter 25.747749 +iter : 27 Arret : 0.000438507 s/iter 25.790591 +iter : 28 Arret : 1.26042E-05 s/iter 25.738843 +iter : 29 Arret : 3.25839E-06 s/iter 25.855423 +iter : 30 Arret : 1.74243E-07 s/iter 25.753106 +iter : 31 Arret : 3.09364E-11 s/iter 25.736769 +iter : 32 Arret : 1.57009E-16 s/iter 25.740011 +temps : 871.12 seconde(s) +Nb iterations : 32 +Nb de depassements de 
capacite exponentielle : 0 +Precision : 7.46262E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540352 +i* 0.841439| 1| 4.39978E-13 +i* 6.25043E-13| +| 2| -0.996034 +i* 0.0889731| 1| 2.2073E-13 +i* 1.55296E-13| +| 3| 0.439836 +i* -0.898078| 1|-3.55927E-13 +i*-1.21738E-13| +| 4| 0.38266 +i* -0.923889| 1|-2.56142E-13 +i*-7.02285E-14| +| 5| -0.988496 +i* 0.15125| 1|-1.52652E-13 +i*-1.11329E-13| +| 6| 0.641421 +i* 0.767189| 1|-1.31044E-13 +i* 5.61736E-13| +| 7| 0.323979 +i* -0.946064| 1|-4.52336E-13 +i* 8.74596E-14| +| 8| -0.977067 +i* 0.212932| 1| 8.58341E-14 +i* 1.73412E-13| +| 9| 0.688262 +i* 0.725462| 1| 4.28754E-14 +i* 1.08849E-12| +| 10| 0.264022 +i* -0.964517| 1|-3.63883E-13 +i*-8.14886E-14| +| 11| -0.961793 +i* 0.273776| 1| -3.0213E-13 +i*-2.13897E-13| +| 12| 0.732395 +i* 0.68088| 1|-3.65194E-14 +i* 7.95483E-13| +| 13| 0.203027 +i* -0.979173| 1|-3.14502E-13 +i* 2.96924E-13| +| 14| -0.942735 +i* 0.333543| 1| 1.82947E-13 +i*-4.73458E-14| +| 15| 0.773646 +i* 0.633619| 1| 2.24352E-13 +i* 2.79674E-13| +| 16| 0.141232 +i* -0.989977| 1| -1.0035E-13 +i* 1.5693E-13| +| 17| -0.919967 +i* 0.391997| 1| 2.89213E-14 +i*-1.86252E-13| +| 18| 0.811852 +i* 0.583864| 1|-1.59939E-12 +i*-4.13669E-13| +| 19| 0.0788818 +i* -0.996884| 1|-2.83003E-13 +i* 1.04711E-13| +| 20| -0.893578 +i* 0.448908| 1| 4.59736E-14 +i* 1.31414E-13| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 1 +proc 0 +proc 1 +proc 2 +proc 3 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 3, start 600000 size 200000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 1, start 200000 size 200000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 2, start 
400000 size 200000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 200000 +proc 1 start 200000 size 200000 +proc 2 start 400000 size 200000 +proc 3 start 600000 size 200000 +proc 0 start 0 size 200000 +iter : 1 Arret : 3.03518E-06 s/iter 34.128856 +iter : 2 Arret : 3.06784E-06 s/iter 34.090727 +iter : 3 Arret : 3.06891E-06 s/iter 34.094241 +iter : 4 Arret : 2.95036E-06 s/iter 34.084829 +iter : 5 Arret : 2.99138E-06 s/iter 34.097352 +iter : 6 Arret : 3.04517E-06 s/iter 34.105084 +iter : 7 Arret : 3.18905E-06 s/iter 34.137020 +iter : 8 Arret : 3.30369E-06 s/iter 34.092524 +iter : 9 Arret : 4.0676E-06 s/iter 34.099620 +iter : 10 Arret : 8.80539E-06 s/iter 34.123961 +iter : 11 Arret : 0.000853991 s/iter 34.124027 +iter : 12 Arret : 0.000833381 s/iter 39.333820 +iter : 13 Arret : 2.00076 s/iter 34.135418 +iter : 14 Arret : 1.04464 s/iter 39.211608 +iter : 15 Arret : 0.956436 s/iter 35.763699 +iter : 16 Arret : 1.05412 s/iter 34.269226 +iter : 17 Arret : 0.887869 s/iter 32.651104 +iter : 18 Arret : 2.49443 s/iter 39.662531 +iter : 19 Arret : 0.0130108 s/iter 30.564624 +iter : 20 Arret : 0.0127308 s/iter 29.378733 +iter : 21 Arret : 0.00448902 s/iter 28.875435 +iter : 22 Arret : 0.0025421 s/iter 27.743883 +iter : 23 Arret : 0.000929422 s/iter 25.969572 +iter : 24 Arret : 4.42165E-05 s/iter 25.190779 +iter : 25 Arret : 1.79364E-05 s/iter 23.938702 +iter : 26 Arret : 5.68442E-06 s/iter 23.601870 +iter : 27 Arret : 4.0515E-07 s/iter 23.613905 +iter : 28 Arret : 2.68075E-10 s/iter 23.702620 +iter : 29 Arret : 6.86635E-16 s/iter 23.681104 +temps : 917.174 seconde(s) diff --git a/Simulations/full_mpi/full_mpi_4GPU.sge b/Simulations/full_mpi/full_mpi_4GPU.sge new file mode 100644 index 0000000..dafa0cf --- /dev/null +++ b/Simulations/full_mpi/full_mpi_4GPU.sge @@ -0,0 +1,25 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=4 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -V +#$ -cwd +#$ -N full_mpi_4GPU +#$ -pe mpi 4 + + +module load cuda/7.0 +module load ompi/gcc + 
+mpirun -np $NSLOTS ./template -r -i 60000 40000 +mpirun -np $NSLOTS ./template -r -i 150000 50000 +mpirun -np $NSLOTS ./template -r -i 250000 150000 +mpirun -np $NSLOTS ./template -r -i 350000 250000 +mpirun -np $NSLOTS ./template -r -i 500000 300000 +mpirun -np $NSLOTS ./template -r -i 600000 400000 +mpirun -np $NSLOTS ./template -r -i 700000 500000 +mpirun -np $NSLOTS ./template -r -i 800000 600000 +mpirun -np $NSLOTS ./template -r -i 900000 700000 +mpirun -np $NSLOTS ./template -r -i 1000000 800000 +mpirun -np $NSLOTS ./template -r -i 1500000 500000 diff --git a/Simulations/full_openmp/full_openmp_1GPU.o140165 b/Simulations/full_openmp/full_openmp_1GPU.o140165 new file mode 100644 index 0000000..84aa3b6 --- /dev/null +++ b/Simulations/full_openmp/full_openmp_1GPU.o140165 @@ -0,0 +1,511 @@ +REMAINING: 1 +Taking GPU #3 +zone limite de 'log-exp' 1.00593 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 0 dimgrid2 235 start 0 size 60160 +gpu 0 iter : 1 Arret : 5.01505E-05 s/iter 0.752555 +gpu 0 iter : 2 Arret : 4.32789E-05 s/iter 0.752365 +gpu 0 iter : 3 Arret : 4.45615E-05 s/iter 0.752417 +gpu 0 iter : 4 Arret : 4.42697E-05 s/iter 0.752431 +gpu 0 iter : 5 Arret : 4.06411E-05 s/iter 0.752415 +gpu 0 iter : 6 Arret : 4.41499E-05 s/iter 0.752420 +gpu 0 iter : 7 Arret : 5.50757E-05 s/iter 0.752345 +gpu 0 iter : 8 Arret : 0.000694531 s/iter 0.752443 +gpu 0 iter : 9 Arret : 0.00117193 s/iter 0.752305 +gpu 0 iter : 10 Arret : 0.0225506 s/iter 0.752371 +gpu 0 iter : 11 Arret : 1.92499 s/iter 1.259044 +gpu 0 iter : 12 Arret : 0.0745471 s/iter 0.752271 +gpu 0 iter : 13 Arret : 0.0973834 s/iter 0.752268 +gpu 0 iter : 14 Arret : 0.106004 s/iter 1.275597 +gpu 0 iter : 15 Arret : 0.0165737 s/iter 1.272023 +gpu 0 iter : 16 Arret : 0.00779384 s/iter 1.273056 +gpu 0 iter : 17 Arret : 0.00519845 s/iter 1.250155 +gpu 0 iter : 18 Arret : 0.00892143 s/iter 0.736177 +gpu 0 iter : 19 Arret : 0.00448482 s/iter 0.708562 +gpu 0 iter : 20 Arret : 
0.020935 s/iter 0.700305 +gpu 0 iter : 21 Arret : 0.0174876 s/iter 0.906835 +gpu 0 iter : 22 Arret : 0.00111891 s/iter 0.676895 +gpu 0 iter : 23 Arret : 0.000389286 s/iter 0.656019 +gpu 0 iter : 24 Arret : 0.00124195 s/iter 0.661695 +gpu 0 iter : 25 Arret : 0.00324262 s/iter 0.649796 +gpu 0 iter : 26 Arret : 6.61927E-05 s/iter 0.524316 +gpu 0 iter : 27 Arret : 2.71425E-05 s/iter 0.519333 +gpu 0 iter : 28 Arret : 9.63588E-07 s/iter 0.525346 +gpu 0 iter : 29 Arret : 1.01411E-10 s/iter 0.521530 +gpu 0 iter : 30 Arret : 3.15975E-15 s/iter 0.517480 +temps : 24.3248 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.35784E-10 +Stabilite : 3.15975E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540783 +i* 0.841162| 1|-7.58456E-14 +i* 3.78031E-14| +| 2| -0.992343 +i* -0.123513| 1|-4.36456E-15 +i* 3.59435E-15| +| 3| 0.0563346 +i* 0.998412| 1| 5.70377E-15 +i* 3.3501E-14| +| 4| -0.80273 +i* -0.596342| 1|-1.96995E-14 +i* -2.6033E-14| +| 5| 0.730552 +i* -0.682857| 1|-7.48429E-14 +i* 6.77011E-14| +| 6| -0.442728 +i* 0.896656| 1|-3.77198E-14 +i*-1.89779E-15| +| 7| -0.404888 +i* -0.914366| 1| 3.20195E-14 +i* 9.65894E-15| +| 8| 0.972126 +i* -0.23446| 1| 4.02421E-14 +i*-1.54755E-14| +| 9| -0.826939 +i* 0.562292| 1| -2.4928E-14 +i*-1.59889E-14| +| 10| 0.0979895 +i* -0.995187| 1| 2.27804E-14 +i*-1.97481E-14| +| 11| 0.961513 +i* 0.27476| 1|-9.39769E-14 +i*-2.63912E-13| +| 12| -0.996627 +i* 0.0820589| 1| 2.39773E-14 +i* 1.74825E-14| +| 13| 0.575447 +i* -0.817839| 1|-3.49894E-14 +i*-7.98545E-14| +| 14| 0.701466 +i* 0.712703| 1| 7.52211E-14 +i* 1.53991E-14| +| 15| 0.259346 +i* 0.965785| 1|-2.14863E-14 +i*-2.81355E-14| +| 16| -0.907773 +i* -0.419461| 1|-3.62869E-14 +i*-9.49414E-15| +| 17| 0.903623 +i* -0.428329| 1|-1.24969E-14 +i* 7.51222E-14| +| 18| -0.249979 +i* 0.968251| 1|-1.59074E-14 
+i*-1.09721E-14| +| 19| -0.583256 +i* -0.812288| 1|-6.17215E-15 +i* 4.85358E-14| +| 20| 0.997383 +i* 0.072297| 1| 2.53037E-13 +i*-5.92819E-13| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 1 +zone limite de 'log-exp' 1.00237 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 0 dimgrid2 586 start 0 size 150016 +gpu 0 iter : 1 Arret : 1.63964E-05 s/iter 4.677497 +gpu 0 iter : 2 Arret : 1.6127E-05 s/iter 4.675437 +gpu 0 iter : 3 Arret : 1.62587E-05 s/iter 4.673977 +gpu 0 iter : 4 Arret : 1.57168E-05 s/iter 4.675710 +gpu 0 iter : 5 Arret : 1.60975E-05 s/iter 4.675592 +gpu 0 iter : 6 Arret : 1.68058E-05 s/iter 4.675951 +gpu 0 iter : 7 Arret : 1.83433E-05 s/iter 4.674129 +gpu 0 iter : 8 Arret : 2.23201E-05 s/iter 4.676196 +gpu 0 iter : 9 Arret : 0.000120962 s/iter 4.674233 +gpu 0 iter : 10 Arret : 0.0050599 s/iter 4.675473 +gpu 0 iter : 11 Arret : 0.00201552 s/iter 4.674922 +gpu 0 iter : 12 Arret : 0.00812397 s/iter 4.675066 +gpu 0 iter : 13 Arret : 1.49892 s/iter 6.735627 +gpu 0 iter : 14 Arret : 0.0726739 s/iter 4.672589 +gpu 0 iter : 15 Arret : 0.0439834 s/iter 6.675641 +gpu 0 iter : 16 Arret : 0.0237516 s/iter 4.667633 +gpu 0 iter : 17 Arret : 0.0164273 s/iter 6.591866 +gpu 0 iter : 18 Arret : 0.0544284 s/iter 6.683422 +gpu 0 iter : 19 Arret : 0.0693187 s/iter 5.846457 +gpu 0 iter : 20 Arret : 0.0244663 s/iter 6.575941 +gpu 0 iter : 21 Arret : 0.0170064 s/iter 5.851392 +gpu 0 iter : 22 Arret : 0.0132914 s/iter 4.512540 +gpu 0 iter : 23 Arret : 0.000340596 s/iter 4.492501 +gpu 0 iter : 24 Arret : 0.000818373 s/iter 4.462503 +gpu 0 iter : 25 Arret : 0.000816806 s/iter 4.471482 +gpu 0 iter : 26 Arret : 2.75366E-05 s/iter 4.467418 +gpu 0 iter : 27 Arret : 1.11905E-05 s/iter 4.471479 +gpu 0 iter : 28 Arret : 1.25333E-07 s/iter 4.486611 +gpu 0 iter : 29 Arret : 1.10046E-12 s/iter 4.460078 +gpu 0 iter : 30 Arret : 1.11022E-16 s/iter 4.443078 +temps : 151.38 seconde(s) +Nb 
iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.26535E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540528 +i* 0.841326| 1| 8.68923E-14 +i* 2.2979E-13| +| 2| -0.905603 +i* -0.424127| 1| 6.50001E-14 +i* -3.0061E-14| +| 3| -0.774122 +i* 0.633037| 1|-3.89619E-14 +i*-6.71876E-14| +| 4| 0.317935 +i* -0.948113| 1| 4.656E-15 +i* 1.15645E-13| +| 5| 0.235897 +i* 0.971778| 1|-3.15963E-14 +i*-8.88994E-14| +| 6| -0.717299 +i* -0.696766| 1| 5.63785E-15 +i*-6.71685E-14| +| 7| 0.992349 +i* -0.123462| 1|-4.81056E-13 +i* 9.00335E-13| +| 8| -0.938482 +i* 0.345329| 1|-6.95555E-14 +i*-3.79159E-14| +| 9| 0.610294 +i* -0.792175| 1| -5.4852E-14 +i*-3.26232E-14| +| 10| -0.0945977 +i* 0.995516| 1| 4.45165E-14 +i* 9.42527E-14| +| 11| -0.450242 +i* -0.892906| 1| 2.41855E-14 +i*-3.23699E-15| +| 12| 0.978218 +i* 0.207583| 1|-2.84429E-13 +i* 4.69725E-13| +| 13| -0.999806 +i* 0.0197069| 1|-4.72365E-14 +i*-2.55716E-14| +| 14| 0.835648 +i* -0.549265| 1|-2.95892E-13 +i* 2.34143E-13| +| 15| -0.414707 +i* 0.909955| 1| 7.26225E-14 +i*-1.70003E-15| +| 16| -0.133754 +i* -0.991015| 1|-2.88485E-14 +i* 2.14499E-14| +| 17| 0.856687 +i* 0.515837| 1| 1.49106E-13 +i* 3.95153E-14| +| 18| -0.951361 +i* -0.308079| 1| 3.78308E-14 +i* 4.65843E-14| +| 19| 0.969257 +i* -0.24605| 1| 5.51163E-13 +i*-4.79498E-13| +| 20| -0.689285 +i* 0.724491| 1| 2.40086E-15 +i*-3.61777E-14| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1 +zone limite de 'log-exp' 1.00142 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 0 dimgrid2 977 start 0 size 250112 +gpu 0 iter : 1 Arret : 1.15543E-05 s/iter 13.064328 +gpu 0 iter : 2 Arret : 1.05743E-05 s/iter 13.099577 +gpu 0 iter : 3 Arret : 1.00182E-05 s/iter 13.092478 +gpu 0 iter : 4 
Arret : 9.77217E-06 s/iter 13.098796 +gpu 0 iter : 5 Arret : 1.10944E-05 s/iter 13.096321 +gpu 0 iter : 6 Arret : 1.15644E-05 s/iter 13.098761 +gpu 0 iter : 7 Arret : 9.85482E-06 s/iter 13.095612 +gpu 0 iter : 8 Arret : 1.06459E-05 s/iter 13.079031 +gpu 0 iter : 9 Arret : 2.17082E-05 s/iter 13.095096 +gpu 0 iter : 10 Arret : 0.00106372 s/iter 13.097410 +gpu 0 iter : 11 Arret : 0.00274403 s/iter 13.098142 +gpu 0 iter : 12 Arret : 0.00233621 s/iter 15.172668 +gpu 0 iter : 13 Arret : 0.00104775 s/iter 13.090864 +gpu 0 iter : 14 Arret : 0.00142817 s/iter 13.093375 +gpu 0 iter : 15 Arret : 0.00192709 s/iter 13.017860 +gpu 0 iter : 16 Arret : 0.0176279 s/iter 11.468330 +gpu 0 iter : 17 Arret : 0.0577522 s/iter 7.983525 +gpu 0 iter : 18 Arret : 0.0271883 s/iter 9.498511 +gpu 0 iter : 19 Arret : 0.32067 s/iter 9.329063 +gpu 0 iter : 20 Arret : 0.0289407 s/iter 9.296524 +gpu 0 iter : 21 Arret : 0.00140766 s/iter 7.142933 +gpu 0 iter : 22 Arret : 0.000475428 s/iter 7.123373 +gpu 0 iter : 23 Arret : 0.000240166 s/iter 7.094510 +gpu 0 iter : 24 Arret : 1.51927E-05 s/iter 7.077023 +gpu 0 iter : 25 Arret : 1.77863E-06 s/iter 7.010421 +gpu 0 iter : 26 Arret : 8.08854E-10 s/iter 7.130576 +gpu 0 iter : 27 Arret : 1.00074E-15 s/iter 7.048493 +temps : 296.321 seconde(s) +Nb iterations : 27 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.05316E-09 +Stabilite : 1.00074E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540427 +i* 0.841391| 1| 9.7148E-14 +i*-1.98189E-13| +| 2| -0.997949 +i* 0.0640067| 1| 1.02696E-14 +i* 2.88415E-14| +| 3| 0.450991 +i* -0.892528| 1| 2.39739E-15 +i* 7.66835E-14| +| 4| 0.42851 +i* -0.903537| 1| 1.03733E-13 +i* 1.27433E-14| +| 5| -0.996035 +i* 0.0889649| 1| 5.1386E-14 +i* 4.21729E-14| +| 6| 0.581876 +i* 0.813277| 1| 3.29906E-13 +i* -3.5718E-15| +| 7| 0.405761 +i* -0.913979| 1| 1.69923E-13 
+i*-8.86062E-14| +| 8| -0.993496 +i* 0.113867| 1| 6.34562E-14 +i* 6.04291E-14| +| 9| 0.60205 +i* 0.798458| 1| 2.39371E-13 +i* -2.2848E-13| +| 10| 0.382757 +i* -0.923849| 1| 6.36852E-14 +i* 1.1601E-13| +| 11| -0.990335 +i* 0.138698| 1| 8.32286E-14 +i* 4.57395E-14| +| 12| 0.621846 +i* 0.783139| 1| 3.5482E-14 +i*-1.57841E-13| +| 13| 0.359514 +i* -0.93314| 1| 1.00985E-13 +i*-2.52237E-13| +| 14| -0.986553 +i* 0.163442| 1| 3.24636E-14 +i* 4.58574E-14| +| 15| 0.641253 +i* 0.767329| 1| 1.79533E-13 +i* 3.03096E-13| +| 16| 0.336045 +i* -0.941846| 1| 1.38948E-13 +i*-8.14071E-14| +| 17| -0.982153 +i* 0.188084| 1| 6.94549E-14 +i* 3.09405E-14| +| 18| 0.660258 +i* 0.751039| 1| 4.21871E-13 +i* 5.02185E-14| +| 19| 0.312366 +i* -0.949962| 1|-6.37199E-14 +i*-7.39669E-14| +| 20| -0.977138 +i* 0.212608| 1|-3.80633E-14 +i* -8.4285E-14| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 1 +zone limite de 'log-exp' 1.00101 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 0 dimgrid2 1368 start 0 size 350208 +gpu 0 iter : 1 Arret : 8.60936E-06 s/iter 25.332348 +gpu 0 iter : 2 Arret : 7.40646E-06 s/iter 25.331263 +gpu 0 iter : 3 Arret : 7.97813E-06 s/iter 25.297466 +gpu 0 iter : 4 Arret : 7.23099E-06 s/iter 25.306792 +gpu 0 iter : 5 Arret : 6.85143E-06 s/iter 25.280568 +gpu 0 iter : 6 Arret : 6.79155E-06 s/iter 25.305357 +gpu 0 iter : 7 Arret : 7.08999E-06 s/iter 25.314962 +gpu 0 iter : 8 Arret : 7.80158E-06 s/iter 25.279543 +gpu 0 iter : 9 Arret : 2.6561E-05 s/iter 25.267836 +gpu 0 iter : 10 Arret : 0.00102009 s/iter 25.308796 +gpu 0 iter : 11 Arret : 0.00106765 s/iter 25.285841 +gpu 0 iter : 12 Arret : 0.00106457 s/iter 25.305366 +gpu 0 iter : 13 Arret : 0.857755 s/iter 25.292478 +gpu 0 iter : 14 Arret : 3.15407 s/iter 25.495050 +gpu 0 iter : 15 Arret : 0.0928667 s/iter 25.354315 +gpu 0 iter : 16 Arret : 0.0413768 s/iter 25.910028 +gpu 0 iter : 17 Arret : 0.0497463 s/iter 25.748876 +gpu 0 
iter : 18 Arret : 0.0497904 s/iter 25.748583 +gpu 0 iter : 19 Arret : 0.0354662 s/iter 25.596173 +gpu 0 iter : 20 Arret : 0.0431719 s/iter 25.648011 +gpu 0 iter : 21 Arret : 0.0230133 s/iter 25.155342 +gpu 0 iter : 22 Arret : 0.00525789 s/iter 25.160092 +gpu 0 iter : 23 Arret : 0.00203657 s/iter 24.929404 +gpu 0 iter : 24 Arret : 0.000600149 s/iter 24.929483 +gpu 0 iter : 25 Arret : 0.00016638 s/iter 24.931502 +gpu 0 iter : 26 Arret : 0.000154787 s/iter 24.957389 +gpu 0 iter : 27 Arret : 0.000302699 s/iter 24.917011 +gpu 0 iter : 28 Arret : 2.13113E-05 s/iter 24.916750 +gpu 0 iter : 29 Arret : 1.51643E-05 s/iter 24.917954 +gpu 0 iter : 30 Arret : 3.76262E-06 s/iter 24.943057 +gpu 0 iter : 31 Arret : 1.29245E-07 s/iter 24.913031 +gpu 0 iter : 32 Arret : 6.35329E-12 s/iter 24.917417 +gpu 0 iter : 33 Arret : 1.24127E-16 s/iter 24.950893 +temps : 833.807 seconde(s) +Nb iterations : 33 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.46096E-08 +Stabilite : 1.24127E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540399 +i* 0.841409| 1| 5.12961E-13 +i*-3.37404E-15| +| 2| -0.385479 +i* 0.922716| 1| -1.616E-13 +i*-2.73566E-14| +| 3| -0.770131 +i* 0.637886| 1|-1.38431E-15 +i* 1.70921E-13| +| 4| -0.978357 +i* 0.206925| 1|-3.07393E-15 +i* 4.96131E-15| +| 5| -0.962455 +i* -0.27144| 1|-5.85088E-14 +i* 7.9714E-14| +| 6| -0.72607 +i* -0.687621| 1| -2.0612E-14 +i* 2.87948E-13| +| 7| -0.323352 +i* -0.946279| 1| 2.27159E-13 +i* 7.30891E-14| +| 8| 0.153459 +i* -0.988155| 1| 4.60049E-15 +i*-2.43555E-14| +| 9| 0.595097 +i* -0.803654| 1|-3.46265E-13 +i* 1.60098E-14| +| 10| 0.900408 +i* -0.435047| 1| 3.20081E-13 +i*-1.77827E-14| +| 11| 0.999448 +i* 0.0332229| 1|-5.70342E-13 +i* 1.21308E-12| +| 12| 0.869529 +i* 0.493882| 1| 3.01252E-14 +i* 6.11216E-13| +| 13| 0.211292 +i* 0.977423| 1|-6.97532E-14 +i* 1.23212E-13| +| 14| 
-0.267139 +i* 0.963658| 1|-9.26238E-14 +i*-7.20968E-14| +| 15| -0.684372 +i* 0.729133| 1| 1.64042E-13 +i*-1.89831E-14| +| 16| -0.944825 +i* 0.327574| 1| 3.70572E-14 +i*-6.84904E-14| +| 17| -0.988833 +i* -0.149027| 1|-1.41002E-13 +i* 2.02581E-14| +| 18| -0.806314 +i* -0.591488| 1| 1.24668E-13 +i*-2.62805E-13| +| 19| -0.439079 +i* -0.898448| 1|-1.76949E-13 +i*-1.05707E-13| +| 20| 0.0287415 +i* -0.999587| 1| 1.62724E-13 +i*-6.82891E-14| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 1 +zone limite de 'log-exp' 1.00071 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 0 dimgrid2 1954 start 0 size 500224 +gpu 0 iter : 1 Arret : 6.12242E-06 s/iter 51.505107 +gpu 0 iter : 2 Arret : 6.31918E-06 s/iter 51.453063 +gpu 0 iter : 3 Arret : 5.33763E-06 s/iter 51.408046 +gpu 0 iter : 4 Arret : 5.41422E-06 s/iter 51.400436 +gpu 0 iter : 5 Arret : 5.39348E-06 s/iter 51.382269 +gpu 0 iter : 6 Arret : 5.60111E-06 s/iter 51.438183 +gpu 0 iter : 7 Arret : 5.01475E-06 s/iter 51.488070 +gpu 0 iter : 8 Arret : 5.29744E-06 s/iter 51.358997 +gpu 0 iter : 9 Arret : 6.66838E-06 s/iter 51.085502 +gpu 0 iter : 10 Arret : 6.73287E-05 s/iter 51.335479 +gpu 0 iter : 11 Arret : 0.00990101 s/iter 51.464874 +gpu 0 iter : 12 Arret : 0.00823435 s/iter 51.403521 +gpu 0 iter : 13 Arret : 0.0131909 s/iter 51.825163 +gpu 0 iter : 14 Arret : 0.00701993 s/iter 52.176993 +gpu 0 iter : 15 Arret : 0.0153428 s/iter 47.885546 +gpu 0 iter : 16 Arret : 1.40554 s/iter 37.523257 +gpu 0 iter : 17 Arret : 0.017993 s/iter 33.363730 +gpu 0 iter : 18 Arret : 0.0130545 s/iter 31.485423 +gpu 0 iter : 19 Arret : 0.00840726 s/iter 29.781113 +gpu 0 iter : 20 Arret : 0.0195837 s/iter 30.113452 +gpu 0 iter : 21 Arret : 0.0204301 s/iter 30.982105 +gpu 0 iter : 22 Arret : 0.0051956 s/iter 26.750718 +gpu 0 iter : 23 Arret : 0.000187857 s/iter 25.344565 +gpu 0 iter : 24 Arret : 9.72305E-05 s/iter 24.719137 +gpu 0 iter : 25 Arret : 
3.47336E-05 s/iter 23.203467 +gpu 0 iter : 26 Arret : 1.4149E-05 s/iter 22.255267 +gpu 0 iter : 27 Arret : 9.26981E-06 s/iter 22.153239 +gpu 0 iter : 28 Arret : 2.81196E-06 s/iter 22.023657 +gpu 0 iter : 29 Arret : 1.36843E-07 s/iter 21.837417 +gpu 0 iter : 30 Arret : 1.32082E-11 s/iter 21.847546 +gpu 0 iter : 31 Arret : 1.11022E-16 s/iter 21.866344 +temps : 1194.76 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.48768E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540372 +i* 0.841426| 1|-3.05235E-13 +i* 1.38721E-13| +| 2| 0.561316 +i* 0.827602| 1|-2.60021E-13 +i* 1.9206E-13| +| 3| 0.57165 +i* 0.820497| 1|-1.83308E-13 +i* 6.15844E-14| +| 4| 0.581895 +i* 0.813264| 1| 3.05839E-13 +i* 6.52482E-14| +| 5| 0.592048 +i* 0.805902| 1|-7.14016E-13 +i*-3.98882E-14| +| 6| 0.602109 +i* 0.798414| 1| 2.66658E-13 +i*-4.75979E-13| +| 7| 0.612074 +i* 0.7908| 1| 3.16743E-13 +i*-3.40844E-13| +| 8| 0.621943 +i* 0.783062| 1| 5.64146E-13 +i*-3.14632E-13| +| 9| 0.631715 +i* 0.775201| 1|-3.83756E-14 +i* 5.41086E-13| +| 10| 0.641387 +i* 0.767218| 1| 4.00499E-13 +i*-3.71465E-13| +| 11| 0.650958 +i* 0.759114| 1| 7.58768E-15 +i*-5.54055E-13| +| 12| 0.660427 +i* 0.750891| 1| 7.47999E-13 +i* 2.73089E-13| +| 13| 0.669792 +i* 0.742549| 1| 9.40577E-13 +i* 3.39433E-14| +| 14| 0.679051 +i* 0.734091| 1| 4.34264E-13 +i*-1.04887E-13| +| 15| 0.688204 +i* 0.725517| 1|-6.26926E-13 +i*-1.86798E-13| +| 16| 0.697248 +i* 0.71683| 1| 2.2389E-13 +i*-9.46795E-14| +| 17| 0.706183 +i* 0.708029| 1| 4.79186E-13 +i* 4.75144E-13| +| 18| 0.715007 +i* 0.699117| 1| 6.39138E-13 +i* 4.95824E-13| +| 19| 0.723718 +i* 0.690096| 1| -1.2694E-13 +i* 4.44528E-13| +| 20| 0.732316 +i* 0.680965| 1|-2.76158E-13 +i* 1.17734E-13| ++---+----------------------------+------------+----------------------------+ +500000 
racines de module = 1 +zone limite de 'log-exp' 1.00059 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 2344 start 0 size 600064 +gpu 0 iter : 1 Arret : 5.11012E-06 s/iter 73.756595 +gpu 0 iter : 2 Arret : 5.49594E-06 s/iter 74.121359 +gpu 0 iter : 3 Arret : 4.95278E-06 s/iter 74.139359 +gpu 0 iter : 4 Arret : 4.31967E-06 s/iter 74.012268 +gpu 0 iter : 5 Arret : 4.586E-06 s/iter 74.059945 +gpu 0 iter : 6 Arret : 4.28143E-06 s/iter 74.091814 +gpu 0 iter : 7 Arret : 4.14913E-06 s/iter 74.022009 +gpu 0 iter : 8 Arret : 4.768E-06 s/iter 74.045411 +gpu 0 iter : 9 Arret : 6.32809E-06 s/iter 74.020498 +gpu 0 iter : 10 Arret : 0.000551734 s/iter 74.008861 +gpu 0 iter : 11 Arret : 0.000854623 s/iter 74.075006 +gpu 0 iter : 12 Arret : 0.00526383 s/iter 74.351997 +gpu 0 iter : 13 Arret : 1.86671 s/iter 74.338451 +gpu 0 iter : 14 Arret : 0.044381 s/iter 74.401470 +gpu 0 iter : 15 Arret : 0.0449663 s/iter 77.708059 +gpu 0 iter : 16 Arret : 0.0459647 s/iter 73.860654 +gpu 0 iter : 17 Arret : 0.0457241 s/iter 72.117134 +gpu 0 iter : 18 Arret : 0.0378989 s/iter 71.687519 +gpu 0 iter : 19 Arret : 0.0321851 s/iter 69.198666 +gpu 0 iter : 20 Arret : 0.0124933 s/iter 68.613221 +gpu 0 iter : 21 Arret : 0.00730326 s/iter 67.130299 +gpu 0 iter : 22 Arret : 0.00446236 s/iter 65.916847 +gpu 0 iter : 23 Arret : 0.000497812 s/iter 65.967574 +gpu 0 iter : 24 Arret : 0.000892713 s/iter 65.658481 +gpu 0 iter : 25 Arret : 4.7836E-06 s/iter 64.891775 +gpu 0 iter : 26 Arret : 1.04505E-09 s/iter 65.003588 +gpu 0 iter : 27 Arret : 3.1578E-15 s/iter 65.348519 +temps : 1931.46 seconde(s) +Nb iterations : 27 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 3.1578E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 
5.83011E-13| +| 2| -0.553493 +i* -0.832854| 1|-5.02858E-13 +i* 3.83374E-15| +| 3| -0.579338 +i* -0.815087| 1| 4.42365E-13 +i* 2.65846E-14| +| 4| 0.592057 +i* 0.805896| 1| 2.06783E-13 +i* 1.94549E-13| +| 5| -0.604613 +i* -0.796519| 1| 2.39135E-13 +i* 2.96967E-13| +| 6| 0.617037 +i* 0.786934| 1|-3.70964E-13 +i* 2.85104E-13| +| 7| -0.629293 +i* -0.777168| 1| 3.4002E-13 +i* 1.14925E-14| +| 8| 0.641411 +i* 0.767198| 1|-6.01835E-13 +i* 5.70316E-13| +| 9| -0.653354 +i* -0.757052| 1| 3.00003E-14 +i* 4.1084E-13| +| 10| 0.665153 +i* 0.746707| 1|-9.55243E-14 +i* 7.739E-13| +| 11| -0.676773 +i* -0.736192| 1|-3.70891E-13 +i* 4.31963E-14| +| 12| 0.688242 +i* 0.725482| 1| 4.17319E-13 +i*-2.25125E-13| +| 13| -0.699526 +i* -0.714607| 1|-1.55074E-13 +i* 3.9467E-13| +| 14| 0.710653 +i* 0.703543| 1|-7.94843E-13 +i* 5.61671E-13| +| 15| -0.721591 +i* -0.69232| 1|-8.20351E-14 +i* 3.39909E-13| +| 16| 0.732366 +i* 0.680912| 1| 5.01595E-13 +i* 2.59279E-13| +| 17| -0.742946 +i* -0.669351| 1|-1.90181E-13 +i* 1.23972E-13| +| 18| 0.753358 +i* 0.657611| 1|-7.14661E-13 +i*-3.96187E-13| +| 19| -0.76357 +i* -0.645725| 1|-3.31242E-13 +i*-8.50865E-14| +| 20| 0.773609 +i* 0.633664| 1|-7.93813E-13 +i* 2.09313E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +zone limite de 'log-exp' 1.00051 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 0 dimgrid2 2735 start 0 size 700160 +gpu 0 iter : 1 Arret : 4.40509E-06 s/iter 100.694769 +gpu 0 iter : 2 Arret : 4.14157E-06 s/iter 100.469337 +gpu 0 iter : 3 Arret : 4.41135E-06 s/iter 100.605636 +gpu 0 iter : 4 Arret : 3.77329E-06 s/iter 100.474382 +gpu 0 iter : 5 Arret : 3.66086E-06 s/iter 100.585159 +gpu 0 iter : 6 Arret : 3.72953E-06 s/iter 100.453144 +gpu 0 iter : 7 Arret : 3.69827E-06 s/iter 100.534472 +gpu 0 iter : 8 Arret : 4.0146E-06 s/iter 100.527939 +gpu 0 iter : 9 Arret : 4.40501E-06 s/iter 100.506852 +gpu 0 iter : 10 Arret : 0.000145438 s/iter 
100.425934 +gpu 0 iter : 11 Arret : 0.000853238 s/iter 100.356423 +gpu 0 iter : 12 Arret : 0.00173408 s/iter 100.698172 +gpu 0 iter : 13 Arret : 0.00406782 s/iter 102.669605 +gpu 0 iter : 14 Arret : 0.00525798 s/iter 100.740660 +gpu 0 iter : 15 Arret : 0.00912631 s/iter 101.481624 +gpu 0 iter : 16 Arret : 0.0564377 s/iter 100.156723 +gpu 0 iter : 17 Arret : 0.173647 s/iter 101.052747 +gpu 0 iter : 18 Arret : 0.0415567 s/iter 103.159864 +gpu 0 iter : 19 Arret : 0.0291844 s/iter 101.678094 +gpu 0 iter : 20 Arret : 0.0193248 s/iter 101.283426 +gpu 0 iter : 21 Arret : 0.00828239 s/iter 100.513861 +gpu 0 iter : 22 Arret : 0.00218532 s/iter 99.669534 +gpu 0 iter : 23 Arret : 0.00038288 s/iter 99.672435 +gpu 0 iter : 24 Arret : 0.00053382 s/iter 99.680679 +gpu 0 iter : 25 Arret : 0.000180417 s/iter 99.792193 +gpu 0 iter : 26 Arret : 6.23119E-05 s/iter 99.656799 +gpu 0 iter : 27 Arret : 1.31328E-05 s/iter 99.708395 +gpu 0 iter : 28 Arret : 1.46741E-06 s/iter 99.655086 +gpu 0 iter : 29 Arret : 1.39344E-08 s/iter 99.775734 +gpu 0 iter : 30 Arret : 6.13969E-15 s/iter 99.639756 +temps : 3017.33 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.46262E-08 +Stabilite : 6.13969E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540352 +i* 0.841439| 1| 4.39978E-13 +i* 6.25043E-13| +| 2| -0.996034 +i* 0.0889731| 1| 2.2073E-13 +i* 1.55296E-13| +| 3| 0.439836 +i* -0.898078| 1|-3.55927E-13 +i*-1.21738E-13| +| 4| 0.38266 +i* -0.923889| 1|-2.56142E-13 +i*-7.02285E-14| +| 5| -0.988496 +i* 0.15125| 1|-1.52652E-13 +i*-1.11329E-13| +| 6| 0.641421 +i* 0.767189| 1|-1.31044E-13 +i* 5.61736E-13| +| 7| 0.323979 +i* -0.946064| 1|-4.52336E-13 +i* 8.74596E-14| +| 8| -0.977067 +i* 0.212932| 1| 8.58341E-14 +i* 1.73412E-13| +| 9| 0.688262 +i* 0.725462| 1| 4.28754E-14 +i* 1.08849E-12| +| 10| 0.264022 +i* 
-0.964517| 1|-3.63883E-13 +i*-8.14886E-14| +| 11| -0.961793 +i* 0.273776| 1| -3.0213E-13 +i*-2.13897E-13| +| 12| 0.732395 +i* 0.68088| 1|-3.65194E-14 +i* 7.95483E-13| +| 13| 0.203027 +i* -0.979173| 1|-3.14502E-13 +i* 2.96924E-13| +| 14| -0.942735 +i* 0.333543| 1| 1.82947E-13 +i*-4.73458E-14| +| 15| 0.773646 +i* 0.633619| 1| 2.24352E-13 +i* 2.79674E-13| +| 16| 0.141232 +i* -0.989977| 1| -1.0035E-13 +i* 1.5693E-13| +| 17| -0.919967 +i* 0.391997| 1| 2.89213E-14 +i*-1.86252E-13| +| 18| 0.811852 +i* 0.583864| 1|-1.59939E-12 +i*-4.13669E-13| +| 19| 0.0788818 +i* -0.996884| 1|-2.83003E-13 +i* 1.04711E-13| +| 20| -0.893578 +i* 0.448908| 1| 4.59736E-14 +i* 1.31414E-13| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 1 +zone limite de 'log-exp' 1.00044 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 3125 start 0 size 800000 +gpu 0 iter : 1 Arret : 3.74909E-06 s/iter 131.738179 +gpu 0 iter : 2 Arret : 3.49254E-06 s/iter 131.503382 +gpu 0 iter : 3 Arret : 3.79247E-06 s/iter 130.862896 +gpu 0 iter : 4 Arret : 3.40119E-06 s/iter 130.832910 +gpu 0 iter : 5 Arret : 3.64216E-06 s/iter 131.517237 +gpu 0 iter : 6 Arret : 3.50994E-06 s/iter 131.403093 +gpu 0 iter : 7 Arret : 3.54522E-06 s/iter 131.315477 +gpu 0 iter : 8 Arret : 3.57706E-06 s/iter 131.206471 +gpu 0 iter : 9 Arret : 4.78249E-06 s/iter 131.242355 +gpu 0 iter : 10 Arret : 0.000445854 s/iter 131.325342 +gpu 0 iter : 11 Arret : 0.00106438 s/iter 131.005859 +gpu 0 iter : 12 Arret : 0.0159228 s/iter 130.855281 +gpu 0 iter : 13 Arret : 1.96586 s/iter 131.580736 +gpu 0 iter : 14 Arret : 0.0310235 s/iter 139.161956 +gpu 0 iter : 15 Arret : 0.288368 s/iter 132.380708 +gpu 0 iter : 16 Arret : 0.268505 s/iter 131.753751 +gpu 0 iter : 17 Arret : 0.055019 s/iter 130.693875 +gpu 0 iter : 18 Arret : 0.0095986 s/iter 120.836692 +gpu 0 iter : 19 Arret : 0.0067465 s/iter 121.133462 +gpu 0 iter : 20 Arret : 0.00486301 s/iter 
111.958685 +gpu 0 iter : 21 Arret : 0.00150462 s/iter 106.824156 +gpu 0 iter : 22 Arret : 0.00367623 s/iter 100.023867 +gpu 0 iter : 23 Arret : 0.000649555 s/iter 95.844251 +gpu 0 iter : 24 Arret : 1.61661E-05 s/iter 92.179310 +gpu 0 iter : 25 Arret : 1.57748E-05 s/iter 90.746510 +gpu 0 iter : 26 Arret : 2.71821E-06 s/iter 90.684064 +gpu 0 iter : 27 Arret : 5.01324E-07 s/iter 90.550543 +gpu 0 iter : 28 Arret : 6.04245E-10 s/iter 90.007638 +gpu 0 iter : 29 Arret : 1.57426E-15 s/iter 90.215782 +temps : 3442.42 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 1.57426E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| 0.592061 +i* 0.805893| 1|-1.57249E-13 +i*-4.43364E-13| +| 3| 0.617051 +i* 0.786923| 1|-6.42805E-13 +i*-3.49094E-13| +| 4| 0.641434 +i* 0.767178| 1| 1.00022E-12 +i*-5.90578E-13| +| 5| 0.665186 +i* 0.746678| 1|-2.53998E-14 +i*-1.14684E-12| +| 6| 0.688283 +i* 0.725442| 1|-8.68732E-13 +i* 8.52696E-13| +| 7| 0.710703 +i* 0.703493| 1| 2.02581E-13 +i* 4.54699E-13| +| 8| 0.732422 +i* 0.680851| 1|-5.22353E-13 +i*-3.99873E-13| +| 9| 0.753421 +i* 0.657538| 1| 1.23356E-13 +i*-1.05986E-12| +| 10| 0.773678 +i* 0.633579| 1|-6.75196E-13 +i* 3.60108E-13| +| 11| 0.793174 +i* 0.608995| 1| 4.43853E-13 +i*-1.42398E-12| +| 12| 0.811888 +i* 0.583813| 1|-4.10491E-13 +i*-4.46651E-13| +| 13| 0.829804 +i* 0.558055| 1| 1.30045E-12 +i* 1.12788E-13| +| 14| 0.846902 +i* 0.531748| 1|-8.09419E-13 +i* 4.98091E-13| +| 15| 0.863167 +i* 0.504918| 1| 2.98522E-13 +i* 3.81547E-13| +| 16| 0.878582 +i* 0.477591| 1|-3.06581E-13 +i*-6.95869E-13| +| 17| 0.893133 +i* 0.449793| 1| 1.24355E-13 +i* -1.3239E-12| +| 18| 0.906804 +i* 0.421553| 1|-1.23117E-12 +i*-5.57117E-13| +| 19| 0.919582 +i* 0.392898| 1|-1.03648E-12 +i* 2.90445E-14| 
+| 20| 0.931455 +i* 0.363856| 1|-6.42708E-13 +i*-1.50318E-12| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 diff --git a/Simulations/full_openmp/full_openmp_1GPU.sge b/Simulations/full_openmp/full_openmp_1GPU.sge new file mode 100644 index 0000000..038b92b --- /dev/null +++ b/Simulations/full_openmp/full_openmp_1GPU.sge @@ -0,0 +1,27 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=1 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -pe openmp 1 +#$ -V +#$ -cwd +#$ -N full_openmp_1GPU + +module load gcc/4.9.0 +module load cuda/7.0 +export OMP_NUM_THREADS=1 + +./template -r -i 60000 40000 +./template -r -i 150000 50000 +./template -r -i 250000 150000 +./template -r -i 350000 250000 +./template -r -i 500000 300000 +./template -r -i 600000 400000 +./template -r -i 700000 500000 +./template -r -i 800000 600000 +#./template -r -i 900000 700000 +#./template -r -i 1000000 800000 +#./template -r -i 1500000 500000 + + diff --git a/Simulations/full_openmp/full_openmp_2GPU.o140164 b/Simulations/full_openmp/full_openmp_2GPU.o140164 new file mode 100644 index 0000000..09208b1 --- /dev/null +++ b/Simulations/full_openmp/full_openmp_2GPU.o140164 @@ -0,0 +1,540 @@ +REMAINING: 2 +Taking GPU #2 +Taking GPU #3 +zone limite de 'log-exp' 1.00593 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 0 dimgrid2 118 start 0 size 30080 +gpu 1 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 1 dimgrid2 118 start 30080 size 30080 +gpu 0 iter : 1 Arret : 4.09766E-05 s/iter 0.377749 +gpu 0 iter : 2 Arret : 3.79749E-05 s/iter 0.377727 +gpu 0 iter : 3 Arret : 3.85767E-05 s/iter 0.377765 +gpu 0 iter : 4 Arret : 3.91197E-05 s/iter 0.377744 +gpu 0 iter : 5 Arret : 4.06402E-05 s/iter 0.377742 +gpu 0 iter : 6 Arret : 4.41484E-05 s/iter 0.377649 +gpu 0 iter : 7 Arret : 5.50721E-05 s/iter 0.377635 +gpu 0 iter : 8 Arret : 0.000118507 s/iter 0.377582 +gpu 0 iter : 9 Arret : 
0.00116121 s/iter 0.377567 +gpu 0 iter : 10 Arret : 0.0219727 s/iter 0.377659 +gpu 0 iter : 11 Arret : 2.07933 s/iter 1.180745 +gpu 0 iter : 12 Arret : 0.27049 s/iter 0.377586 +gpu 0 iter : 13 Arret : 0.1554 s/iter 1.212301 +gpu 0 iter : 14 Arret : 0.0487107 s/iter 1.213253 +gpu 0 iter : 15 Arret : 0.0169372 s/iter 1.208391 +gpu 0 iter : 16 Arret : 0.00924961 s/iter 1.200600 +gpu 0 iter : 17 Arret : 0.00644126 s/iter 1.173874 +gpu 0 iter : 18 Arret : 0.00441137 s/iter 0.370745 +gpu 0 iter : 19 Arret : 0.00203274 s/iter 0.364311 +gpu 0 iter : 20 Arret : 0.00318275 s/iter 0.364538 +gpu 0 iter : 21 Arret : 0.009373 s/iter 0.355906 +gpu 0 iter : 22 Arret : 0.0125472 s/iter 0.351740 +gpu 0 iter : 23 Arret : 0.0298136 s/iter 0.350290 +gpu 0 iter : 24 Arret : 0.00227002 s/iter 0.351832 +gpu 0 iter : 25 Arret : 0.000622083 s/iter 0.342077 +gpu 0 iter : 26 Arret : 0.000137321 s/iter 0.346191 +gpu 0 iter : 27 Arret : 4.34709E-05 s/iter 0.348120 +gpu 0 iter : 28 Arret : 3.54366E-06 s/iter 0.343417 +gpu 0 iter : 29 Arret : 2.7858E-09 s/iter 0.341845 +gpu 0 iter : 30 Arret : 8.62089E-14 s/iter 0.341833 +temps : 16.8078 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.35784E-10 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540783 +i* 0.841162| 1|-7.58456E-14 +i* 3.78031E-14| +| 2| -0.992343 +i* -0.123513| 1|-2.28637E-15 +i*-5.45917E-15| +| 3| 0.0563346 +i* 0.998412| 1| 5.70377E-15 +i* 3.3501E-14| +| 4| -0.802793 +i* -0.596258| 1| 2.03657E-15 +i* 1.01915E-14| +| 5| 0.730552 +i* -0.682857| 1|-7.48429E-14 +i* 6.77011E-14| +| 6| -0.442728 +i* 0.896656| 1|-3.77198E-14 +i*-1.89779E-15| +| 7| -0.404888 +i* -0.914366| 1| 3.20195E-14 +i* 9.65894E-15| +| 8| 0.972126 +i* -0.23446| 1| 4.02421E-14 +i*-1.54755E-14| +| 9| -0.826939 +i* 0.562292| 1| -2.4928E-14 +i*-1.59889E-14| 
+| 10| 0.0979895 +i* -0.995187| 1| 2.90878E-14 +i*-6.75675E-15| +| 11| 0.961513 +i* 0.27476| 1|-9.39769E-14 +i*-2.63912E-13| +| 12| -0.996627 +i* 0.0820589| 1| 2.39773E-14 +i* 1.74825E-14| +| 13| 0.575447 +i* -0.817839| 1|-3.49894E-14 +i*-7.98545E-14| +| 14| 0.701466 +i* 0.712703| 1| 7.52211E-14 +i* 1.53991E-14| +| 15| 0.259346 +i* 0.965785| 1|-2.14863E-14 +i*-2.81355E-14| +| 16| -0.907773 +i* -0.419461| 1|-3.62869E-14 +i*-9.49414E-15| +| 17| 0.903623 +i* -0.428329| 1|-1.24969E-14 +i* 7.51222E-14| +| 18| -0.249979 +i* 0.968251| 1|-1.59074E-14 +i*-1.09721E-14| +| 19| -0.583341 +i* -0.812227| 1| 1.92242E-14 +i* 2.27058E-14| +| 20| 0.997383 +i* 0.072297| 1| 2.53037E-13 +i*-5.92819E-13| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 1 +zone limite de 'log-exp' 1.00237 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 0 dimgrid2 293 start 0 size 75008 +gpu 1 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 1 dimgrid2 293 start 75008 size 75008 +gpu 0 iter : 1 Arret : 1.60819E-05 s/iter 2.345593 +gpu 0 iter : 2 Arret : 1.52654E-05 s/iter 2.345397 +gpu 0 iter : 3 Arret : 1.58146E-05 s/iter 2.345455 +gpu 0 iter : 4 Arret : 1.54189E-05 s/iter 2.345151 +gpu 0 iter : 5 Arret : 1.57815E-05 s/iter 2.345049 +gpu 0 iter : 6 Arret : 1.6413E-05 s/iter 2.345470 +gpu 0 iter : 7 Arret : 1.77314E-05 s/iter 2.345388 +gpu 0 iter : 8 Arret : 2.1072E-05 s/iter 2.345347 +gpu 0 iter : 9 Arret : 4.09887E-05 s/iter 2.344913 +gpu 0 iter : 10 Arret : 0.00231734 s/iter 2.344920 +gpu 0 iter : 11 Arret : 0.00364869 s/iter 2.344545 +gpu 0 iter : 12 Arret : 0.00595916 s/iter 2.901608 +gpu 0 iter : 13 Arret : 0.433645 s/iter 2.901110 +gpu 0 iter : 14 Arret : 2.16599 s/iter 4.403684 +gpu 0 iter : 15 Arret : 0.0451248 s/iter 2.331735 +gpu 0 iter : 16 Arret : 0.0269953 s/iter 4.010657 +gpu 0 iter : 17 Arret : 0.0143832 s/iter 2.323230 +gpu 0 iter : 18 Arret : 
0.0101457 s/iter 4.336764 +gpu 0 iter : 19 Arret : 0.00443502 s/iter 3.973966 +gpu 0 iter : 20 Arret : 0.00482918 s/iter 2.285743 +gpu 0 iter : 21 Arret : 0.00559571 s/iter 3.957234 +gpu 0 iter : 22 Arret : 0.00102978 s/iter 2.262199 +gpu 0 iter : 23 Arret : 0.000982733 s/iter 2.250995 +gpu 0 iter : 24 Arret : 0.000314964 s/iter 2.256563 +gpu 0 iter : 25 Arret : 9.62593E-05 s/iter 2.257743 +gpu 0 iter : 26 Arret : 2.22765E-05 s/iter 2.274003 +gpu 0 iter : 27 Arret : 3.08519E-05 s/iter 2.262628 +gpu 0 iter : 28 Arret : 9.19951E-06 s/iter 2.243517 +gpu 0 iter : 29 Arret : 5.62649E-07 s/iter 2.241072 +gpu 0 iter : 30 Arret : 9.17827E-11 s/iter 2.245254 +gpu 0 iter : 31 Arret : 8.04912E-16 s/iter 2.239630 +temps : 82.6744 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.26507E-09 +Stabilite : 8.04912E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540528 +i* 0.841326| 1| 8.68923E-14 +i* 2.2979E-13| +| 2| -0.905603 +i* -0.424127| 1| 6.50001E-14 +i* -3.0061E-14| +| 3| -0.774122 +i* 0.633037| 1|-3.89619E-14 +i*-6.71876E-14| +| 4| 0.317935 +i* -0.948113| 1| 4.656E-15 +i* 1.15645E-13| +| 5| 0.23606 +i* 0.971739| 1| 2.9924E-14 +i*-1.32854E-13| +| 6| -0.717299 +i* -0.696766| 1| 5.63785E-15 +i*-6.71685E-14| +| 7| 0.992349 +i* -0.123462| 1|-4.81056E-13 +i* 9.00335E-13| +| 8| -0.938482 +i* 0.345329| 1|-6.95555E-14 +i*-3.79159E-14| +| 9| 0.610294 +i* -0.792175| 1| -5.4852E-14 +i*-3.26232E-14| +| 10| -0.0946394 +i* 0.995512| 1|-4.73788E-14 +i*-8.10827E-14| +| 11| -0.450242 +i* -0.892906| 1| 2.41855E-14 +i*-3.23699E-15| +| 12| 0.978218 +i* 0.207583| 1|-2.84429E-13 +i* 4.69725E-13| +| 13| -0.999806 +i* 0.0197069| 1|-4.72365E-14 +i*-2.55716E-14| +| 14| 0.835648 +i* -0.549265| 1|-2.95892E-13 +i* 2.34143E-13| +| 15| -0.414707 +i* 0.909955| 1| 7.26225E-14 +i*-1.70003E-15| +| 16| -0.133754 +i* 
-0.991015| 1|-2.88485E-14 +i* 2.14499E-14| +| 17| 0.856687 +i* 0.515837| 1| 1.49106E-13 +i* 3.95153E-14| +| 18| -0.951361 +i* -0.308079| 1| 3.78308E-14 +i* 4.65843E-14| +| 19| 0.969257 +i* -0.24605| 1| 5.51163E-13 +i*-4.79498E-13| +| 20| -0.689285 +i* 0.724491| 1| 2.40086E-15 +i*-3.61777E-14| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1 +zone limite de 'log-exp' 1.00142 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 0 dimgrid2 489 start 0 size 125056 +gpu 1 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 1 dimgrid2 489 start 125056 size 125056 +gpu 0 iter : 1 Arret : 1.04122E-05 s/iter 6.895757 +gpu 0 iter : 2 Arret : 9.66998E-06 s/iter 6.877326 +gpu 0 iter : 3 Arret : 9.65609E-06 s/iter 6.885434 +gpu 0 iter : 4 Arret : 1.03183E-05 s/iter 6.886343 +gpu 0 iter : 5 Arret : 9.75367E-06 s/iter 6.875198 +gpu 0 iter : 6 Arret : 9.56197E-06 s/iter 6.877253 +gpu 0 iter : 7 Arret : 9.85222E-06 s/iter 6.888180 +gpu 0 iter : 8 Arret : 1.00444E-05 s/iter 6.876080 +gpu 0 iter : 9 Arret : 1.14954E-05 s/iter 6.871764 +gpu 0 iter : 10 Arret : 0.00617074 s/iter 6.872061 +gpu 0 iter : 11 Arret : 0.00502727 s/iter 9.108306 +gpu 0 iter : 12 Arret : 0.00709612 s/iter 6.884838 +gpu 0 iter : 13 Arret : 0.00636365 s/iter 9.133645 +gpu 0 iter : 14 Arret : 0.000962158 s/iter 6.881477 +gpu 0 iter : 15 Arret : 0.00515317 s/iter 6.879637 +gpu 0 iter : 16 Arret : 0.00489618 s/iter 7.799484 +gpu 0 iter : 17 Arret : 0.0126101 s/iter 6.409073 +gpu 0 iter : 18 Arret : 0.306794 s/iter 4.221095 +gpu 0 iter : 19 Arret : 0.00788796 s/iter 5.229623 +gpu 0 iter : 20 Arret : 0.000261124 s/iter 4.114536 +gpu 0 iter : 21 Arret : 0.000181317 s/iter 3.590034 +gpu 0 iter : 22 Arret : 0.000215766 s/iter 3.589880 +gpu 0 iter : 23 Arret : 0.000292282 s/iter 3.567063 +gpu 0 iter : 24 Arret : 7.59488E-05 s/iter 3.557992 +gpu 0 iter : 25 Arret : 8.78575E-06 s/iter 
3.569234 +gpu 0 iter : 26 Arret : 1.71E-07 s/iter 3.545083 +gpu 0 iter : 27 Arret : 3.25965E-13 s/iter 3.556937 +temps : 161.369 seconde(s) +Nb iterations : 27 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.32861E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540427 +i* 0.841391| 1| 9.7148E-14 +i*-1.98189E-13| +| 2| -0.997949 +i* 0.0640067| 1| 1.02696E-14 +i* 2.88415E-14| +| 3| 0.450991 +i* -0.892528| 1| 2.39739E-15 +i* 7.66835E-14| +| 4| 0.42851 +i* -0.903537| 1| 1.03733E-13 +i* 1.27433E-14| +| 5| -0.996035 +i* 0.0889649| 1| 5.1386E-14 +i* 4.21729E-14| +| 6| 0.581876 +i* 0.813277| 1| 3.29906E-13 +i* -3.5718E-15| +| 7| 0.405761 +i* -0.913979| 1| 1.69923E-13 +i*-8.86062E-14| +| 8| -0.993496 +i* 0.113867| 1| 6.34562E-14 +i* 6.04291E-14| +| 9| 0.60205 +i* 0.798458| 1| 2.39371E-13 +i* -2.2848E-13| +| 10| 0.382757 +i* -0.923849| 1| 6.36852E-14 +i* 1.1601E-13| +| 11| -0.990335 +i* 0.138698| 1| 8.32286E-14 +i* 4.57395E-14| +| 12| 0.621846 +i* 0.783139| 1| 3.5482E-14 +i*-1.57841E-13| +| 13| 0.359514 +i* -0.93314| 1| 1.00985E-13 +i*-2.52237E-13| +| 14| -0.986553 +i* 0.163442| 1| 3.24636E-14 +i* 4.58574E-14| +| 15| 0.641253 +i* 0.767329| 1| 1.79533E-13 +i* 3.03096E-13| +| 16| 0.336045 +i* -0.941846| 1| 1.38948E-13 +i*-8.14071E-14| +| 17| -0.982153 +i* 0.188084| 1| 6.94549E-14 +i* 3.09405E-14| +| 18| 0.660258 +i* 0.751039| 1| 4.21871E-13 +i* 5.02185E-14| +| 19| 0.312366 +i* -0.949962| 1|-6.37199E-14 +i*-7.39669E-14| +| 20| -0.977138 +i* 0.212608| 1|-3.80633E-14 +i* -8.4285E-14| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 1 +zone limite de 'log-exp' 1.00101 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 1 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 1 dimgrid2 684 start 175104 size 
175104 +gpu 0 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 0 dimgrid2 684 start 0 size 175104 +gpu 0 iter : 1 Arret : 7.32344E-06 s/iter 12.954303 +gpu 0 iter : 2 Arret : 7.07863E-06 s/iter 12.981308 +gpu 0 iter : 3 Arret : 6.90431E-06 s/iter 12.986614 +gpu 0 iter : 4 Arret : 7.26859E-06 s/iter 12.992632 +gpu 0 iter : 5 Arret : 6.9268E-06 s/iter 13.005304 +gpu 0 iter : 6 Arret : 6.766E-06 s/iter 12.980752 +gpu 0 iter : 7 Arret : 7.08928E-06 s/iter 12.936596 +gpu 0 iter : 8 Arret : 7.80045E-06 s/iter 12.948599 +gpu 0 iter : 9 Arret : 9.75059E-06 s/iter 12.933171 +gpu 0 iter : 10 Arret : 0.000389813 s/iter 12.982388 +gpu 0 iter : 11 Arret : 0.00168924 s/iter 12.933771 +gpu 0 iter : 12 Arret : 0.00163024 s/iter 16.015025 +gpu 0 iter : 13 Arret : 0.831287 s/iter 12.991337 +gpu 0 iter : 14 Arret : 3.41318 s/iter 13.007981 +gpu 0 iter : 15 Arret : 0.111579 s/iter 13.648097 +gpu 0 iter : 16 Arret : 0.0536558 s/iter 13.532104 +gpu 0 iter : 17 Arret : 0.0316379 s/iter 12.902939 +gpu 0 iter : 18 Arret : 0.0221392 s/iter 15.777843 +gpu 0 iter : 19 Arret : 0.023782 s/iter 13.053666 +gpu 0 iter : 20 Arret : 0.0188987 s/iter 16.564822 +gpu 0 iter : 21 Arret : 0.0391672 s/iter 17.699510 +gpu 0 iter : 22 Arret : 0.0433525 s/iter 14.316996 +gpu 0 iter : 23 Arret : 0.0310573 s/iter 12.886593 +gpu 0 iter : 24 Arret : 0.0130632 s/iter 14.221913 +gpu 0 iter : 25 Arret : 0.00228986 s/iter 12.848043 +gpu 0 iter : 26 Arret : 0.00142186 s/iter 12.844861 +gpu 0 iter : 27 Arret : 0.000342562 s/iter 12.846961 +gpu 0 iter : 28 Arret : 7.29744E-05 s/iter 12.848477 +gpu 0 iter : 29 Arret : 6.11624E-06 s/iter 12.846333 +gpu 0 iter : 30 Arret : 1.04055E-05 s/iter 12.845798 +gpu 0 iter : 31 Arret : 8.14262E-06 s/iter 12.846716 +gpu 0 iter : 32 Arret : 2.39311E-06 s/iter 12.848384 +gpu 0 iter : 33 Arret : 1.15675E-08 s/iter 12.847822 +gpu 0 iter : 34 Arret : 4.74404E-14 s/iter 12.843750 +temps : 458.792 seconde(s) +Nb iterations : 34 +Nb de depassements de capacite exponentielle : 0 +Precision : 
1.46096E-08 +Stabilite : 1.14439E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540399 +i* 0.841409| 1| 5.12961E-13 +i*-3.37404E-15| +| 2| -0.385479 +i* 0.922716| 1| -1.616E-13 +i*-2.73566E-14| +| 3| -0.770131 +i* 0.637886| 1|-1.38431E-15 +i* 1.70921E-13| +| 4| -0.978357 +i* 0.206925| 1|-3.07393E-15 +i* 4.96131E-15| +| 5| -0.962455 +i* -0.27144| 1|-5.85088E-14 +i* 7.9714E-14| +| 6| -0.72607 +i* -0.687621| 1| -2.0612E-14 +i* 2.87948E-13| +| 7| -0.323352 +i* -0.946279| 1| 2.27159E-13 +i* 7.30891E-14| +| 8| 0.153459 +i* -0.988155| 1| 4.60049E-15 +i*-2.43555E-14| +| 9| 0.595097 +i* -0.803654| 1|-3.46265E-13 +i* 1.60098E-14| +| 10| 0.900408 +i* -0.435047| 1| 3.20081E-13 +i*-1.77827E-14| +| 11| 0.999448 +i* 0.0332229| 1|-5.70342E-13 +i* 1.21308E-12| +| 12| 0.869529 +i* 0.493882| 1| 3.01252E-14 +i* 6.11216E-13| +| 13| 0.211292 +i* 0.977423| 1|-6.97532E-14 +i* 1.23212E-13| +| 14| -0.267139 +i* 0.963658| 1|-9.26238E-14 +i*-7.20968E-14| +| 15| -0.684372 +i* 0.729133| 1| 1.64042E-13 +i*-1.89831E-14| +| 16| -0.944825 +i* 0.327574| 1| 3.70572E-14 +i*-6.84904E-14| +| 17| -0.988833 +i* -0.149027| 1|-1.41002E-13 +i* 2.02581E-14| +| 18| -0.806314 +i* -0.591488| 1| 1.24668E-13 +i*-2.62805E-13| +| 19| -0.439079 +i* -0.898448| 1|-1.76949E-13 +i*-1.05707E-13| +| 20| 0.0287595 +i* -0.999586| 1| 4.76598E-14 +i*-1.43895E-14| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 1 +zone limite de 'log-exp' 1.00071 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 1 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 1 dimgrid2 977 start 250112 size 250112 +gpu 0 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 0 dimgrid2 977 start 0 size 250112 +gpu 0 iter : 1 Arret : 5.66981E-06 s/iter 26.243500 +gpu 0 iter : 2 Arret : 4.82614E-06 s/iter 26.155609 +gpu 0 iter 
: 3 Arret : 5.08487E-06 s/iter 26.220032 +gpu 0 iter : 4 Arret : 4.81813E-06 s/iter 26.206135 +gpu 0 iter : 5 Arret : 5.52439E-06 s/iter 26.225948 +gpu 0 iter : 6 Arret : 4.73134E-06 s/iter 26.199860 +gpu 0 iter : 7 Arret : 4.95057E-06 s/iter 26.197320 +gpu 0 iter : 8 Arret : 5.2867E-06 s/iter 26.218407 +gpu 0 iter : 9 Arret : 6.39202E-06 s/iter 26.195373 +gpu 0 iter : 10 Arret : 5.44877E-05 s/iter 26.194619 +gpu 0 iter : 11 Arret : 0.00113955 s/iter 26.198648 +gpu 0 iter : 12 Arret : 0.00233295 s/iter 26.205898 +gpu 0 iter : 13 Arret : 0.00269137 s/iter 26.219943 +gpu 0 iter : 14 Arret : 0.00436419 s/iter 26.210349 +gpu 0 iter : 15 Arret : 0.0325608 s/iter 26.028106 +gpu 0 iter : 16 Arret : 0.0458093 s/iter 20.473858 +gpu 0 iter : 17 Arret : 1.39035 s/iter 21.967251 +gpu 0 iter : 18 Arret : 0.0686378 s/iter 22.648105 +gpu 0 iter : 19 Arret : 0.0167258 s/iter 19.073745 +gpu 0 iter : 20 Arret : 0.0073255 s/iter 18.809805 +gpu 0 iter : 21 Arret : 0.00825181 s/iter 16.400626 +gpu 0 iter : 22 Arret : 0.00369807 s/iter 17.676396 +gpu 0 iter : 23 Arret : 0.00143206 s/iter 14.057186 +gpu 0 iter : 24 Arret : 0.000362864 s/iter 12.988505 +gpu 0 iter : 25 Arret : 5.99505E-05 s/iter 12.740882 +gpu 0 iter : 26 Arret : 1.38177E-05 s/iter 11.720352 +gpu 0 iter : 27 Arret : 7.95915E-06 s/iter 11.636867 +gpu 0 iter : 28 Arret : 2.45128E-06 s/iter 11.537776 +gpu 0 iter : 29 Arret : 4.00503E-08 s/iter 11.539953 +gpu 0 iter : 30 Arret : 2.18749E-13 s/iter 11.544507 +temps : 628.842 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.48768E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540372 +i* 0.841426| 1|-3.05235E-13 +i* 1.38721E-13| +| 2| 0.561316 +i* 0.827602| 1|-2.60021E-13 +i* 1.9206E-13| +| 3| 0.57165 +i* 0.820497| 1|-1.83308E-13 +i* 6.15844E-14| +| 4| 
0.581895 +i* 0.813264| 1| 3.05839E-13 +i* 6.52482E-14| +| 5| 0.592048 +i* 0.805902| 1|-7.14016E-13 +i*-3.98882E-14| +| 6| 0.602109 +i* 0.798414| 1| 2.66658E-13 +i*-4.75979E-13| +| 7| 0.612074 +i* 0.7908| 1| 3.16743E-13 +i*-3.40844E-13| +| 8| 0.621943 +i* 0.783062| 1| 5.64146E-13 +i*-3.14632E-13| +| 9| 0.631715 +i* 0.775201| 1|-3.83756E-14 +i* 5.41086E-13| +| 10| 0.641387 +i* 0.767218| 1| 4.00499E-13 +i*-3.71465E-13| +| 11| 0.650958 +i* 0.759114| 1| 7.58768E-15 +i*-5.54055E-13| +| 12| 0.660427 +i* 0.750891| 1| 7.47999E-13 +i* 2.73089E-13| +| 13| 0.669792 +i* 0.742549| 1| 9.40577E-13 +i* 3.39433E-14| +| 14| 0.679051 +i* 0.734091| 1| 4.34264E-13 +i*-1.04887E-13| +| 15| 0.688204 +i* 0.725517| 1|-6.26926E-13 +i*-1.86798E-13| +| 16| 0.697248 +i* 0.71683| 1| 2.2389E-13 +i*-9.46795E-14| +| 17| 0.706183 +i* 0.708029| 1| 4.79186E-13 +i* 4.75144E-13| +| 18| 0.715007 +i* 0.699117| 1| 6.39138E-13 +i* 4.95824E-13| +| 19| 0.723718 +i* 0.690096| 1| -1.2694E-13 +i* 4.44528E-13| +| 20| 0.732316 +i* 0.680965| 1|-2.76158E-13 +i* 1.17734E-13| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +zone limite de 'log-exp' 1.00059 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 1172 start 0 size 300032 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 1172 start 300032 size 300032 +gpu 0 iter : 1 Arret : 4.27998E-06 s/iter 37.322864 +gpu 0 iter : 2 Arret : 4.10617E-06 s/iter 37.241818 +gpu 0 iter : 3 Arret : 4.53518E-06 s/iter 37.266422 +gpu 0 iter : 4 Arret : 4.06183E-06 s/iter 37.257521 +gpu 0 iter : 5 Arret : 4.08957E-06 s/iter 37.242975 +gpu 0 iter : 6 Arret : 4.1063E-06 s/iter 37.243477 +gpu 0 iter : 7 Arret : 4.11679E-06 s/iter 37.260449 +gpu 0 iter : 8 Arret : 4.55908E-06 s/iter 37.268788 +gpu 0 iter : 9 Arret : 5.63978E-06 s/iter 37.274568 +gpu 0 iter : 10 Arret : 3.12352E-05 s/iter 37.263840 +gpu 0 iter : 11 Arret 
: 0.000760143 s/iter 37.275869 +gpu 0 iter : 12 Arret : 0.00101593 s/iter 37.272537 +gpu 0 iter : 13 Arret : 2.01147 s/iter 45.273128 +gpu 0 iter : 14 Arret : 0.399191 s/iter 37.620123 +gpu 0 iter : 15 Arret : 0.349288 s/iter 37.631719 +gpu 0 iter : 16 Arret : 0.208253 s/iter 39.378074 +gpu 0 iter : 17 Arret : 0.0357115 s/iter 36.777203 +gpu 0 iter : 18 Arret : 0.00764262 s/iter 36.020848 +gpu 0 iter : 19 Arret : 0.00870865 s/iter 35.507205 +gpu 0 iter : 20 Arret : 0.00636133 s/iter 36.016380 +gpu 0 iter : 21 Arret : 0.00247744 s/iter 34.115098 +gpu 0 iter : 22 Arret : 0.00232921 s/iter 33.193981 +gpu 0 iter : 23 Arret : 0.000237628 s/iter 33.032645 +gpu 0 iter : 24 Arret : 2.29813E-05 s/iter 32.946598 +gpu 0 iter : 25 Arret : 2.02338E-05 s/iter 32.928243 +gpu 0 iter : 26 Arret : 2.55188E-05 s/iter 32.809567 +gpu 0 iter : 27 Arret : 5.88928E-06 s/iter 32.589015 +gpu 0 iter : 28 Arret : 5.50518E-09 s/iter 32.619895 +gpu 0 iter : 29 Arret : 1.64317E-14 s/iter 32.704855 +temps : 1049.55 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.553493 +i* -0.832854| 1|-5.02858E-13 +i* 3.83374E-15| +| 3| -0.579338 +i* -0.815087| 1| 4.42365E-13 +i* 2.65846E-14| +| 4| 0.592057 +i* 0.805896| 1| 2.06783E-13 +i* 1.94549E-13| +| 5| -0.604613 +i* -0.796519| 1| 2.39135E-13 +i* 2.96967E-13| +| 6| 0.617037 +i* 0.786934| 1|-3.70964E-13 +i* 2.85104E-13| +| 7| -0.629293 +i* -0.777168| 1| 3.4002E-13 +i* 1.14925E-14| +| 8| 0.641411 +i* 0.767198| 1|-6.01835E-13 +i* 5.70316E-13| +| 9| -0.653354 +i* -0.757052| 1| 3.00003E-14 +i* 4.1084E-13| +| 10| 0.665153 +i* 0.746707| 1|-9.55243E-14 +i* 7.739E-13| +| 11| -0.676773 +i* -0.736192| 1|-3.70891E-13 +i* 4.31963E-14| +| 
12| 0.688242 +i* 0.725482| 1| 4.17319E-13 +i*-2.25125E-13| +| 13| -0.699526 +i* -0.714607| 1|-1.55074E-13 +i* 3.9467E-13| +| 14| 0.710653 +i* 0.703543| 1|-7.94843E-13 +i* 5.61671E-13| +| 15| -0.721591 +i* -0.69232| 1|-8.20351E-14 +i* 3.39909E-13| +| 16| 0.732366 +i* 0.680912| 1| 5.01595E-13 +i* 2.59279E-13| +| 17| -0.742946 +i* -0.669351| 1|-1.90181E-13 +i* 1.23972E-13| +| 18| 0.753358 +i* 0.657611| 1|-7.14661E-13 +i*-3.96187E-13| +| 19| -0.76357 +i* -0.645725| 1|-3.31242E-13 +i*-8.50865E-14| +| 20| 0.773609 +i* 0.633664| 1|-7.93813E-13 +i* 2.09313E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +zone limite de 'log-exp' 1.00051 +CPU thread 1 (of 2) uses CUDA device 1 +CPU thread 0 (of 2) uses CUDA device 0 +gpu 1 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 1 dimgrid2 1368 start 350080 size 350080 +gpu 0 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 0 dimgrid2 1368 start 0 size 350080 +gpu 0 iter : 1 Arret : 3.85506E-06 s/iter 50.537882 +gpu 0 iter : 2 Arret : 3.66998E-06 s/iter 50.446787 +gpu 0 iter : 3 Arret : 3.5726E-06 s/iter 50.500062 +gpu 0 iter : 4 Arret : 3.62569E-06 s/iter 50.536621 +gpu 0 iter : 5 Arret : 3.53038E-06 s/iter 50.517457 +gpu 0 iter : 6 Arret : 3.56934E-06 s/iter 50.509400 +gpu 0 iter : 7 Arret : 3.64216E-06 s/iter 50.424296 +gpu 0 iter : 8 Arret : 3.67185E-06 s/iter 50.440541 +gpu 0 iter : 9 Arret : 3.63502E-06 s/iter 50.438151 +gpu 0 iter : 10 Arret : 9.16823E-06 s/iter 50.456984 +gpu 0 iter : 11 Arret : 0.000775983 s/iter 50.442631 +gpu 0 iter : 12 Arret : 0.00172532 s/iter 50.492134 +gpu 0 iter : 13 Arret : 0.00299803 s/iter 51.124560 +gpu 0 iter : 14 Arret : 0.00358296 s/iter 56.913865 +gpu 0 iter : 15 Arret : 0.00444746 s/iter 51.832479 +gpu 0 iter : 16 Arret : 0.0771326 s/iter 55.051554 +gpu 0 iter : 17 Arret : 0.187135 s/iter 50.619418 +gpu 0 iter : 18 Arret : 0.0318843 s/iter 52.931554 +gpu 0 iter : 19 Arret : 0.0152072 s/iter 50.308926 +gpu 0 iter : 20 Arret : 
0.0163219 s/iter 56.692462 +gpu 0 iter : 21 Arret : 0.00872806 s/iter 57.177894 +gpu 0 iter : 22 Arret : 0.0115686 s/iter 50.015870 +gpu 0 iter : 23 Arret : 0.0199021 s/iter 50.011047 +gpu 0 iter : 24 Arret : 0.00353983 s/iter 50.010630 +gpu 0 iter : 25 Arret : 0.000449015 s/iter 50.024349 +gpu 0 iter : 26 Arret : 0.000359858 s/iter 50.022460 +gpu 0 iter : 27 Arret : 0.000264692 s/iter 50.007880 +gpu 0 iter : 28 Arret : 9.80473E-05 s/iter 50.011312 +gpu 0 iter : 29 Arret : 1.12945E-05 s/iter 50.013302 +gpu 0 iter : 30 Arret : 1.06056E-08 s/iter 49.925806 +gpu 0 iter : 31 Arret : 5.50569E-15 s/iter 49.926960 +temps : 1589.66 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.46262E-08 +Stabilite : 5.50569E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540352 +i* 0.841439| 1| 4.39978E-13 +i* 6.25043E-13| +| 2| -0.996034 +i* 0.0889731| 1| 2.2073E-13 +i* 1.55296E-13| +| 3| 0.439836 +i* -0.898078| 1|-3.55927E-13 +i*-1.21738E-13| +| 4| 0.38266 +i* -0.923889| 1|-2.56142E-13 +i*-7.02285E-14| +| 5| -0.988496 +i* 0.15125| 1|-1.52652E-13 +i*-1.11329E-13| +| 6| 0.641421 +i* 0.767189| 1|-1.31044E-13 +i* 5.61736E-13| +| 7| 0.323979 +i* -0.946064| 1|-4.52336E-13 +i* 8.74596E-14| +| 8| -0.977067 +i* 0.212932| 1| 8.58341E-14 +i* 1.73412E-13| +| 9| 0.688262 +i* 0.725462| 1| 4.28754E-14 +i* 1.08849E-12| +| 10| 0.264022 +i* -0.964517| 1|-3.63883E-13 +i*-8.14886E-14| +| 11| -0.961793 +i* 0.273776| 1| -3.0213E-13 +i*-2.13897E-13| +| 12| 0.732395 +i* 0.68088| 1|-3.65194E-14 +i* 7.95483E-13| +| 13| 0.203027 +i* -0.979173| 1|-3.14502E-13 +i* 2.96924E-13| +| 14| -0.942735 +i* 0.333543| 1| 1.82947E-13 +i*-4.73458E-14| +| 15| 0.773646 +i* 0.633619| 1| 2.24352E-13 +i* 2.79674E-13| +| 16| 0.141232 +i* -0.989977| 1| -1.0035E-13 +i* 1.5693E-13| +| 17| -0.919967 +i* 0.391997| 1| 2.89213E-14 
+i*-1.86252E-13| +| 18| 0.811852 +i* 0.583864| 1|-1.59939E-12 +i*-4.13669E-13| +| 19| 0.0788818 +i* -0.996884| 1|-2.83003E-13 +i* 1.04711E-13| +| 20| -0.893578 +i* 0.448908| 1| 4.59736E-14 +i* 1.31414E-13| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 1 +zone limite de 'log-exp' 1.00044 +CPU thread 1 (of 2) uses CUDA device 1 +CPU thread 0 (of 2) uses CUDA device 0 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 1563 start 0 size 400000 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 1563 start 400000 size 400000 +gpu 0 iter : 1 Arret : 3.10089E-06 s/iter 66.233735 +gpu 0 iter : 2 Arret : 3.0838E-06 s/iter 65.987108 +gpu 0 iter : 3 Arret : 3.06149E-06 s/iter 66.189454 +gpu 0 iter : 4 Arret : 3.0062E-06 s/iter 65.996849 +gpu 0 iter : 5 Arret : 3.0175E-06 s/iter 65.939646 +gpu 0 iter : 6 Arret : 3.04713E-06 s/iter 65.973994 +gpu 0 iter : 7 Arret : 3.05645E-06 s/iter 66.066266 +gpu 0 iter : 8 Arret : 3.30702E-06 s/iter 65.988454 +gpu 0 iter : 9 Arret : 4.07591E-06 s/iter 65.937363 +gpu 0 iter : 10 Arret : 8.87751E-06 s/iter 65.957225 +gpu 0 iter : 11 Arret : 0.00223658 s/iter 66.065550 +gpu 0 iter : 12 Arret : 0.00280193 s/iter 66.350461 +gpu 0 iter : 13 Arret : 2.16738 s/iter 71.352901 +gpu 0 iter : 14 Arret : 0.942103 s/iter 66.359607 +gpu 0 iter : 15 Arret : 4.73642 s/iter 71.197413 +gpu 0 iter : 16 Arret : 0.106528 s/iter 66.581428 +gpu 0 iter : 17 Arret : 0.126902 s/iter 68.405076 +gpu 0 iter : 18 Arret : 0.0671442 s/iter 65.117577 +gpu 0 iter : 19 Arret : 0.0842362 s/iter 64.328947 +gpu 0 iter : 20 Arret : 0.06511 s/iter 58.256373 +gpu 0 iter : 21 Arret : 0.0412827 s/iter 62.163236 +gpu 0 iter : 22 Arret : 0.0193263 s/iter 56.316208 +gpu 0 iter : 23 Arret : 0.0142222 s/iter 56.754546 +gpu 0 iter : 24 Arret : 0.00245535 s/iter 47.889436 +gpu 0 iter : 25 Arret : 0.000939196 s/iter 46.695509 +gpu 0 iter : 26 Arret : 2.31722E-05 s/iter 46.175563 +gpu 0 iter : 27 Arret : 
1.05871E-06 s/iter 45.766439 +gpu 0 iter : 28 Arret : 1.17662E-11 s/iter 45.536542 +gpu 0 iter : 29 Arret : 1.57009E-16 s/iter 45.801905 +temps : 1778.69 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| 0.592061 +i* 0.805893| 1|-1.57249E-13 +i*-4.43364E-13| +| 3| 0.617051 +i* 0.786923| 1|-6.42805E-13 +i*-3.49094E-13| +| 4| 0.641434 +i* 0.767178| 1| 1.00022E-12 +i*-5.90578E-13| +| 5| 0.665186 +i* 0.746678| 1|-2.53998E-14 +i*-1.14684E-12| +| 6| 0.688283 +i* 0.725442| 1|-8.68732E-13 +i* 8.52696E-13| +| 7| 0.710703 +i* 0.703493| 1| 2.02581E-13 +i* 4.54699E-13| +| 8| 0.732422 +i* 0.680851| 1|-5.22353E-13 +i*-3.99873E-13| +| 9| 0.753421 +i* 0.657538| 1| 1.23356E-13 +i*-1.05986E-12| +| 10| 0.773678 +i* 0.633579| 1|-6.75196E-13 +i* 3.60108E-13| +| 11| 0.793174 +i* 0.608995| 1| 4.43853E-13 +i*-1.42398E-12| +| 12| 0.811888 +i* 0.583813| 1|-4.10491E-13 +i*-4.46651E-13| +| 13| 0.829804 +i* 0.558055| 1| 1.30045E-12 +i* 1.12788E-13| +| 14| 0.846902 +i* 0.531748| 1|-8.09419E-13 +i* 4.98091E-13| +| 15| 0.863167 +i* 0.504918| 1| 2.98522E-13 +i* 3.81547E-13| +| 16| 0.878582 +i* 0.477591| 1|-3.06581E-13 +i*-6.95869E-13| +| 17| 0.893133 +i* 0.449793| 1| 1.24355E-13 +i* -1.3239E-12| +| 18| 0.906804 +i* 0.421553| 1|-1.23117E-12 +i*-5.57117E-13| +| 19| 0.919582 +i* 0.392898| 1|-1.03648E-12 +i* 2.90445E-14| +| 20| 0.931455 +i* 0.363856| 1|-6.42708E-13 +i*-1.50318E-12| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 diff --git a/Simulations/full_openmp/full_openmp_2GPU.sge b/Simulations/full_openmp/full_openmp_2GPU.sge new file mode 100644 index 0000000..82276b2 --- /dev/null +++ 
b/Simulations/full_openmp/full_openmp_2GPU.sge @@ -0,0 +1,27 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=2 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -pe openmp 2 +#$ -V +#$ -cwd +#$ -N full_openmp_2GPU + +module load gcc/4.9.0 +module load cuda/7.0 +export OMP_NUM_THREADS=2 + +./template -r -i 60000 40000 +./template -r -i 150000 50000 +./template -r -i 250000 150000 +./template -r -i 350000 250000 +./template -r -i 500000 300000 +./template -r -i 600000 400000 +./template -r -i 700000 500000 +./template -r -i 800000 600000 +#./template -r -i 900000 700000 +#./template -r -i 1000000 800000 +#./template -r -i 1500000 500000 + + diff --git a/Simulations/full_openmp/full_openmp_3GPU.o140163 b/Simulations/full_openmp/full_openmp_3GPU.o140163 new file mode 100644 index 0000000..693fb02 --- /dev/null +++ b/Simulations/full_openmp/full_openmp_3GPU.o140163 @@ -0,0 +1,565 @@ +REMAINING: 3 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +zone limite de 'log-exp' 1.00593 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 0 (of 3) uses CUDA device 0 +gpu 1 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 1 dimgrid2 79 start 20053 size 20053 +gpu 2 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 0 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 0 dimgrid2 79 start 0 size 20053 +gpu 2 dimgrid2 79 start 40106 size 20053 +gpu 0 iter : 1 Arret : 4.45023E-05 s/iter 0.365910 +gpu 0 iter : 2 Arret : 3.97664E-05 s/iter 0.365783 +gpu 0 iter : 3 Arret : 3.83563E-05 s/iter 0.365808 +gpu 0 iter : 4 Arret : 4.09098E-05 s/iter 0.365792 +gpu 0 iter : 5 Arret : 4.06402E-05 s/iter 0.365790 +gpu 0 iter : 6 Arret : 4.41483E-05 s/iter 0.365795 +gpu 0 iter : 7 Arret : 5.50719E-05 s/iter 0.365797 +gpu 0 iter : 8 Arret : 0.000118506 s/iter 0.365824 +gpu 0 iter : 9 Arret : 0.00173508 s/iter 0.365741 +gpu 0 iter : 10 Arret : 0.0219619 s/iter 0.365806 +gpu 0 iter : 11 Arret : 2.12669 s/iter 1.163297 +gpu 0 iter : 12 Arret : 0.293659 s/iter 0.365830 +gpu 0 iter : 13 
Arret : 0.150913 s/iter 1.192984 +gpu 0 iter : 14 Arret : 0.0525383 s/iter 1.193344 +gpu 0 iter : 15 Arret : 0.017941 s/iter 1.188756 +gpu 0 iter : 16 Arret : 0.00949223 s/iter 1.183377 +gpu 0 iter : 17 Arret : 0.00618922 s/iter 1.174720 +gpu 0 iter : 18 Arret : 0.00478541 s/iter 1.021119 +gpu 0 iter : 19 Arret : 0.0209781 s/iter 0.355703 +gpu 0 iter : 20 Arret : 0.00277186 s/iter 0.354432 +gpu 0 iter : 21 Arret : 0.00126164 s/iter 0.350947 +gpu 0 iter : 22 Arret : 0.0813 s/iter 0.342869 +gpu 0 iter : 23 Arret : 0.0695633 s/iter 0.341054 +gpu 0 iter : 24 Arret : 0.0249049 s/iter 0.344095 +gpu 0 iter : 25 Arret : 0.0236872 s/iter 0.333915 +gpu 0 iter : 26 Arret : 0.000649816 s/iter 0.333141 +gpu 0 iter : 27 Arret : 0.000117833 s/iter 0.336843 +gpu 0 iter : 28 Arret : 3.89955E-05 s/iter 0.333571 +gpu 0 iter : 29 Arret : 2.68794E-06 s/iter 0.331813 +gpu 0 iter : 30 Arret : 1.05565E-09 s/iter 0.327860 +gpu 0 iter : 31 Arret : 3.2677E-14 s/iter 0.331070 +temps : 17.7034 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.35784E-10 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540783 +i* 0.841162| 1|-7.58456E-14 +i* 3.78031E-14| +| 2| -0.992343 +i* -0.123513| 1|-4.36456E-15 +i* 3.59435E-15| +| 3| 0.0563346 +i* 0.998412| 1| 5.70377E-15 +i* 3.3501E-14| +| 4| -0.802793 +i* -0.596258| 1| 2.03657E-15 +i* 1.01915E-14| +| 5| 0.730552 +i* -0.682857| 1|-7.48429E-14 +i* 6.77011E-14| +| 6| -0.442728 +i* 0.896656| 1|-3.77198E-14 +i*-1.89779E-15| +| 7| -0.404888 +i* -0.914366| 1| 3.20195E-14 +i* 9.65894E-15| +| 8| 0.972126 +i* -0.23446| 1| 4.02421E-14 +i*-1.54755E-14| +| 9| -0.826939 +i* 0.562292| 1| -2.4928E-14 +i*-1.59889E-14| +| 10| 0.0979895 +i* -0.995187| 1| 2.90878E-14 +i*-6.75675E-15| +| 11| 0.961513 +i* 0.27476| 1|-9.39769E-14 +i*-2.63912E-13| +| 12| -0.996627 
+i* 0.0820589| 1| 2.39773E-14 +i* 1.74825E-14| +| 13| 0.575447 +i* -0.817839| 1|-3.49894E-14 +i*-7.98545E-14| +| 14| 0.701466 +i* 0.712703| 1| 7.52211E-14 +i* 1.53991E-14| +| 15| 0.259346 +i* 0.965785| 1|-2.14863E-14 +i*-2.81355E-14| +| 16| -0.907773 +i* -0.419461| 1|-3.62869E-14 +i*-9.49414E-15| +| 17| 0.903623 +i* -0.428329| 1|-1.24969E-14 +i* 7.51222E-14| +| 18| -0.249979 +i* 0.968251| 1|-1.59074E-14 +i*-1.09721E-14| +| 19| -0.583426 +i* -0.812166| 1| 4.94882E-14 +i*-9.16107E-15| +| 20| 0.997383 +i* 0.072297| 1| 2.53037E-13 +i*-5.92819E-13| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 1 +zone limite de 'log-exp' 1.00237 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 0 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 0 dimgrid2 196 start 0 size 50005 +gpu 1 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 1 dimgrid2 196 start 50005 size 50005 +gpu 2 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 2 dimgrid2 196 start 100010 size 50005 +gpu 0 iter : 1 Arret : 1.83196E-05 s/iter 1.828662 +gpu 0 iter : 2 Arret : 1.8175E-05 s/iter 1.828375 +gpu 0 iter : 3 Arret : 1.80869E-05 s/iter 1.828381 +gpu 0 iter : 4 Arret : 1.75155E-05 s/iter 1.828566 +gpu 0 iter : 5 Arret : 1.69231E-05 s/iter 1.828230 +gpu 0 iter : 6 Arret : 1.76582E-05 s/iter 1.828408 +gpu 0 iter : 7 Arret : 1.98465E-05 s/iter 1.828242 +gpu 0 iter : 8 Arret : 2.53794E-05 s/iter 1.828046 +gpu 0 iter : 9 Arret : 0.00032835 s/iter 1.833783 +gpu 0 iter : 10 Arret : 0.00175922 s/iter 1.828220 +gpu 0 iter : 11 Arret : 0.0175731 s/iter 1.828275 +gpu 0 iter : 12 Arret : 0.00953654 s/iter 1.828216 +gpu 0 iter : 13 Arret : 1.39903 s/iter 3.476936 +gpu 0 iter : 14 Arret : 0.171392 s/iter 1.827262 +gpu 0 iter : 15 Arret : 0.0745773 s/iter 2.751869 +gpu 0 iter : 16 Arret : 0.035733 s/iter 3.807813 +gpu 0 iter : 17 Arret : 0.00850526 s/iter 1.825655 +gpu 0 iter : 18 Arret : 0.00549164 s/iter 
1.822042 +gpu 0 iter : 19 Arret : 0.00323678 s/iter 1.812501 +gpu 0 iter : 20 Arret : 0.00178409 s/iter 1.787063 +gpu 0 iter : 21 Arret : 0.00194964 s/iter 1.769047 +gpu 0 iter : 22 Arret : 0.00146162 s/iter 1.771480 +gpu 0 iter : 23 Arret : 0.000624549 s/iter 1.753749 +gpu 0 iter : 24 Arret : 0.000211682 s/iter 1.776112 +gpu 0 iter : 25 Arret : 8.45179E-05 s/iter 1.740231 +gpu 0 iter : 26 Arret : 0.000326207 s/iter 1.768913 +gpu 0 iter : 27 Arret : 0.000200902 s/iter 1.745549 +gpu 0 iter : 28 Arret : 1.1316E-05 s/iter 1.732325 +gpu 0 iter : 29 Arret : 8.18684E-09 s/iter 1.758605 +gpu 0 iter : 30 Arret : 7.64211E-14 s/iter 1.747829 +temps : 59.7653 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.26507E-09 +Stabilite : 7.64211E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540528 +i* 0.841326| 1| 8.68923E-14 +i* 2.2979E-13| +| 2| -0.905603 +i* -0.424127| 1| 6.50001E-14 +i* -3.0061E-14| +| 3| -0.774122 +i* 0.633037| 1|-3.89619E-14 +i*-6.71876E-14| +| 4| 0.317935 +i* -0.948113| 1| 4.656E-15 +i* 1.15645E-13| +| 5| 0.235938 +i* 0.971768| 1|-1.10779E-14 +i* 1.06056E-13| +| 6| -0.717299 +i* -0.696766| 1| 5.63785E-15 +i*-6.71685E-14| +| 7| 0.992349 +i* -0.123462| 1|-4.81056E-13 +i* 9.00335E-13| +| 8| -0.938482 +i* 0.345329| 1|-6.95555E-14 +i*-3.79159E-14| +| 9| 0.610294 +i* -0.792175| 1| -5.4852E-14 +i*-3.26232E-14| +| 10| -0.0945977 +i* 0.995516| 1| 4.45165E-14 +i* 9.42527E-14| +| 11| -0.450242 +i* -0.892906| 1| 2.41855E-14 +i*-3.23699E-15| +| 12| 0.978218 +i* 0.207583| 1|-2.84429E-13 +i* 4.69725E-13| +| 13| -0.999806 +i* 0.0197069| 1|-4.72365E-14 +i*-2.55716E-14| +| 14| 0.835648 +i* -0.549265| 1|-2.95892E-13 +i* 2.34143E-13| +| 15| -0.414707 +i* 0.909955| 1| 7.26225E-14 +i*-1.70003E-15| +| 16| -0.133754 +i* -0.991015| 1|-2.88485E-14 +i* 2.14499E-14| +| 17| 0.856687 +i* 
0.515837| 1| 1.49106E-13 +i* 3.95153E-14| +| 18| -0.951361 +i* -0.308079| 1| 3.78308E-14 +i* 4.65843E-14| +| 19| 0.969257 +i* -0.24605| 1| 5.51163E-13 +i*-4.79498E-13| +| 20| -0.689285 +i* 0.724491| 1| 2.40086E-15 +i*-3.61777E-14| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1 +zone limite de 'log-exp' 1.00142 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 1 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 1 dimgrid2 326 start 83370 size 83370 +gpu 0 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 0 dimgrid2 326 start 0 size 83370 +gpu 2 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 2 dimgrid2 326 start 166740 size 83370 +gpu 0 iter : 1 Arret : 1.04122E-05 s/iter 4.597080 +gpu 0 iter : 2 Arret : 9.66981E-06 s/iter 4.598575 +gpu 0 iter : 3 Arret : 9.74545E-06 s/iter 4.597108 +gpu 0 iter : 4 Arret : 9.44307E-06 s/iter 4.597489 +gpu 0 iter : 5 Arret : 9.34819E-06 s/iter 4.598001 +gpu 0 iter : 6 Arret : 1.14416E-05 s/iter 4.598661 +gpu 0 iter : 7 Arret : 1.00875E-05 s/iter 4.598097 +gpu 0 iter : 8 Arret : 1.00498E-05 s/iter 4.597534 +gpu 0 iter : 9 Arret : 1.32154E-05 s/iter 4.597416 +gpu 0 iter : 10 Arret : 0.00051254 s/iter 4.597729 +gpu 0 iter : 11 Arret : 0.000628345 s/iter 4.596129 +gpu 0 iter : 12 Arret : 0.00250283 s/iter 4.597678 +gpu 0 iter : 13 Arret : 0.0026566 s/iter 4.597471 +gpu 0 iter : 14 Arret : 0.00107482 s/iter 4.597721 +gpu 0 iter : 15 Arret : 0.0010467 s/iter 4.579817 +gpu 0 iter : 16 Arret : 0.000858809 s/iter 3.750659 +gpu 0 iter : 17 Arret : 0.00453371 s/iter 2.883509 +gpu 0 iter : 18 Arret : 0.298024 s/iter 5.041367 +gpu 0 iter : 19 Arret : 0.0060016 s/iter 5.070989 +gpu 0 iter : 20 Arret : 0.0020976 s/iter 2.833299 +gpu 0 iter : 21 Arret : 0.000787752 s/iter 2.821846 +gpu 0 iter : 22 Arret : 0.00114118 s/iter 2.808072 +gpu 0 iter : 23 Arret : 0.000242876 s/iter 2.800882 +gpu 0 iter : 24 Arret : 6.73756E-05 
s/iter 2.794362 +gpu 0 iter : 25 Arret : 2.16461E-05 s/iter 2.813139 +gpu 0 iter : 26 Arret : 2.86679E-06 s/iter 2.821334 +gpu 0 iter : 27 Arret : 9.41388E-09 s/iter 2.791395 +gpu 0 iter : 28 Arret : 1.06079E-14 s/iter 2.796462 +temps : 112.147 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.05316E-09 +Stabilite : 1.06079E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540427 +i* 0.841391| 1| 9.7148E-14 +i*-1.98189E-13| +| 2| -0.997949 +i* 0.0640067| 1| 1.02696E-14 +i* 2.88415E-14| +| 3| 0.450991 +i* -0.892528| 1| 2.39739E-15 +i* 7.66835E-14| +| 4| 0.42851 +i* -0.903537| 1| 1.03733E-13 +i* 1.27433E-14| +| 5| -0.996035 +i* 0.0889649| 1| 5.1386E-14 +i* 4.21729E-14| +| 6| 0.581876 +i* 0.813277| 1| 3.29906E-13 +i* -3.5718E-15| +| 7| 0.405761 +i* -0.913979| 1| 1.69923E-13 +i*-8.86062E-14| +| 8| -0.993496 +i* 0.113867| 1| 6.34562E-14 +i* 6.04291E-14| +| 9| 0.60205 +i* 0.798458| 1| 2.39371E-13 +i* -2.2848E-13| +| 10| 0.382757 +i* -0.923849| 1| 6.36852E-14 +i* 1.1601E-13| +| 11| -0.990335 +i* 0.138698| 1| 8.32286E-14 +i* 4.57395E-14| +| 12| 0.621846 +i* 0.783139| 1| 3.5482E-14 +i*-1.57841E-13| +| 13| 0.359514 +i* -0.93314| 1| 1.00985E-13 +i*-2.52237E-13| +| 14| -0.986553 +i* 0.163442| 1| 3.24636E-14 +i* 4.58574E-14| +| 15| 0.641253 +i* 0.767329| 1| 1.79533E-13 +i* 3.03096E-13| +| 16| 0.336045 +i* -0.941846| 1| 1.38948E-13 +i*-8.14071E-14| +| 17| -0.982153 +i* 0.188084| 1| 6.94549E-14 +i* 3.09405E-14| +| 18| 0.660258 +i* 0.751039| 1| 4.21871E-13 +i* 5.02185E-14| +| 19| 0.312366 +i* -0.949962| 1|-6.37199E-14 +i*-7.39669E-14| +| 20| -0.977138 +i* 0.212608| 1|-3.80633E-14 +i* -8.4285E-14| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 1 +zone limite de 'log-exp' 1.00101 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 2 
(of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 0 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 0 dimgrid2 456 start 0 size 116736 +gpu 2 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 2 dimgrid2 456 start 233472 size 116736 +gpu 1 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 1 dimgrid2 456 start 116736 size 116736 +gpu 0 iter : 1 Arret : 7.55039E-06 s/iter 8.728409 +gpu 0 iter : 2 Arret : 7.39793E-06 s/iter 8.712889 +gpu 0 iter : 3 Arret : 7.14478E-06 s/iter 8.682208 +gpu 0 iter : 4 Arret : 8.2105E-06 s/iter 8.682867 +gpu 0 iter : 5 Arret : 7.11502E-06 s/iter 8.683783 +gpu 0 iter : 6 Arret : 6.76587E-06 s/iter 8.680714 +gpu 0 iter : 7 Arret : 7.0891E-06 s/iter 8.680860 +gpu 0 iter : 8 Arret : 7.80018E-06 s/iter 8.676771 +gpu 0 iter : 9 Arret : 1.16108E-05 s/iter 8.679747 +gpu 0 iter : 10 Arret : 0.000768653 s/iter 8.679484 +gpu 0 iter : 11 Arret : 0.00361976 s/iter 8.676534 +gpu 0 iter : 12 Arret : 0.00104415 s/iter 8.674304 +gpu 0 iter : 13 Arret : 0.820674 s/iter 8.674523 +gpu 0 iter : 14 Arret : 3.33533 s/iter 11.712432 +gpu 0 iter : 15 Arret : 0.122884 s/iter 11.716566 +gpu 0 iter : 16 Arret : 0.0600695 s/iter 11.005801 +gpu 0 iter : 17 Arret : 0.0359638 s/iter 10.051106 +gpu 0 iter : 18 Arret : 0.0231638 s/iter 13.260628 +gpu 0 iter : 19 Arret : 0.0116355 s/iter 13.296853 +gpu 0 iter : 20 Arret : 0.102796 s/iter 11.567596 +gpu 0 iter : 21 Arret : 0.0633274 s/iter 11.618611 +gpu 0 iter : 22 Arret : 0.0252937 s/iter 12.797589 +gpu 0 iter : 23 Arret : 0.0319937 s/iter 11.830702 +gpu 0 iter : 24 Arret : 0.0268738 s/iter 13.413124 +gpu 0 iter : 25 Arret : 0.0121216 s/iter 10.946927 +gpu 0 iter : 26 Arret : 0.00234992 s/iter 8.617752 +gpu 0 iter : 27 Arret : 0.00204079 s/iter 8.617732 +gpu 0 iter : 28 Arret : 0.000634889 s/iter 8.617224 +gpu 0 iter : 29 Arret : 0.000124399 s/iter 8.616406 +gpu 0 iter : 30 Arret : 3.10052E-05 s/iter 8.615337 +gpu 0 iter : 31 Arret : 1.67246E-05 s/iter 8.616948 +gpu 0 iter : 32 Arret : 2.0926E-06 s/iter 
8.616524 +gpu 0 iter : 33 Arret : 1.35583E-08 s/iter 8.618103 +gpu 0 iter : 34 Arret : 5.09118E-14 s/iter 8.615345 +temps : 334.994 seconde(s) +Nb iterations : 34 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.46096E-08 +Stabilite : 5.09118E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540399 +i* 0.841409| 1| 5.12961E-13 +i*-3.37404E-15| +| 2| -0.385479 +i* 0.922716| 1| -1.616E-13 +i*-2.73566E-14| +| 3| -0.770131 +i* 0.637886| 1|-1.38431E-15 +i* 1.70921E-13| +| 4| -0.978357 +i* 0.206925| 1|-3.07393E-15 +i* 4.96131E-15| +| 5| -0.962455 +i* -0.27144| 1|-5.85088E-14 +i* 7.9714E-14| +| 6| -0.72607 +i* -0.687621| 1| -2.0612E-14 +i* 2.87948E-13| +| 7| -0.323352 +i* -0.946279| 1| 2.27159E-13 +i* 7.30891E-14| +| 8| 0.153459 +i* -0.988155| 1| 4.60049E-15 +i*-2.43555E-14| +| 9| 0.595097 +i* -0.803654| 1|-3.46265E-13 +i* 1.60098E-14| +| 10| 0.900408 +i* -0.435047| 1| 3.20081E-13 +i*-1.77827E-14| +| 11| 0.999448 +i* 0.0332229| 1|-5.70342E-13 +i* 1.21308E-12| +| 12| 0.869529 +i* 0.493882| 1| 3.01252E-14 +i* 6.11216E-13| +| 13| 0.211292 +i* 0.977423| 1|-6.97532E-14 +i* 1.23212E-13| +| 14| -0.267139 +i* 0.963658| 1|-9.26238E-14 +i*-7.20968E-14| +| 15| -0.684372 +i* 0.729133| 1| 1.64042E-13 +i*-1.89831E-14| +| 16| -0.944825 +i* 0.327574| 1| 3.70572E-14 +i*-6.84904E-14| +| 17| -0.988833 +i* -0.149027| 1|-1.41002E-13 +i* 2.02581E-14| +| 18| -0.806314 +i* -0.591488| 1| 1.24668E-13 +i*-2.62805E-13| +| 19| -0.439079 +i* -0.898448| 1|-1.76949E-13 +i*-1.05707E-13| +| 20| 0.0287415 +i* -0.999587| 1| 1.62724E-13 +i*-6.82891E-14| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 1 +zone limite de 'log-exp' 1.00071 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 2 (of 3) uses CUDA device 2 +gpu 1 dimgrid 1954 dimblock 256 
degrePoly 500000 +gpu 1 dimgrid2 652 start 166741 size 166741 +gpu 0 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 0 dimgrid2 652 start 0 size 166741 +gpu 2 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 2 dimgrid2 652 start 333482 size 166741 +gpu 0 iter : 1 Arret : 5.71659E-06 s/iter 17.161724 +gpu 0 iter : 2 Arret : 4.8241E-06 s/iter 17.102931 +gpu 0 iter : 3 Arret : 4.62087E-06 s/iter 17.128111 +gpu 0 iter : 4 Arret : 5.16204E-06 s/iter 17.101919 +gpu 0 iter : 5 Arret : 4.94408E-06 s/iter 17.092405 +gpu 0 iter : 6 Arret : 4.816E-06 s/iter 17.112302 +gpu 0 iter : 7 Arret : 4.87888E-06 s/iter 17.096377 +gpu 0 iter : 8 Arret : 5.28527E-06 s/iter 17.102422 +gpu 0 iter : 9 Arret : 6.38912E-06 s/iter 17.095757 +gpu 0 iter : 10 Arret : 0.000225655 s/iter 17.102543 +gpu 0 iter : 11 Arret : 0.000912484 s/iter 17.099976 +gpu 0 iter : 12 Arret : 0.001168 s/iter 17.099389 +gpu 0 iter : 13 Arret : 0.00167187 s/iter 21.294197 +gpu 0 iter : 14 Arret : 0.00151006 s/iter 17.896733 +gpu 0 iter : 15 Arret : 0.00184196 s/iter 17.074701 +gpu 0 iter : 16 Arret : 0.00799101 s/iter 18.651210 +gpu 0 iter : 17 Arret : 1.57022 s/iter 15.558990 +gpu 0 iter : 18 Arret : 0.0777881 s/iter 13.332881 +gpu 0 iter : 19 Arret : 0.020549 s/iter 14.677134 +gpu 0 iter : 20 Arret : 0.00806741 s/iter 15.739566 +gpu 0 iter : 21 Arret : 0.00459564 s/iter 12.928791 +gpu 0 iter : 22 Arret : 0.000774045 s/iter 10.091239 +gpu 0 iter : 23 Arret : 0.000687203 s/iter 9.870933 +gpu 0 iter : 24 Arret : 0.000321475 s/iter 8.758152 +gpu 0 iter : 25 Arret : 7.13963E-05 s/iter 8.577885 +gpu 0 iter : 26 Arret : 4.18738E-05 s/iter 8.536888 +gpu 0 iter : 27 Arret : 7.77414E-06 s/iter 8.435734 +gpu 0 iter : 28 Arret : 4.61674E-07 s/iter 8.385966 +gpu 0 iter : 29 Arret : 3.96914E-10 s/iter 8.211682 +gpu 0 iter : 30 Arret : 1.11723E-15 s/iter 8.267906 +temps : 432.911 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.48768E-08 +Stabilite : 1.11022E-16 
++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540372 +i* 0.841426| 1|-3.05235E-13 +i* 1.38721E-13| +| 2| 0.561316 +i* 0.827602| 1|-2.60021E-13 +i* 1.9206E-13| +| 3| 0.57165 +i* 0.820497| 1|-1.83308E-13 +i* 6.15844E-14| +| 4| 0.581895 +i* 0.813264| 1| 3.05839E-13 +i* 6.52482E-14| +| 5| 0.592048 +i* 0.805902| 1|-7.14016E-13 +i*-3.98882E-14| +| 6| 0.602109 +i* 0.798414| 1| 2.66658E-13 +i*-4.75979E-13| +| 7| 0.612074 +i* 0.7908| 1| 3.16743E-13 +i*-3.40844E-13| +| 8| 0.621943 +i* 0.783062| 1| 5.64146E-13 +i*-3.14632E-13| +| 9| 0.631715 +i* 0.775201| 1|-3.83756E-14 +i* 5.41086E-13| +| 10| 0.641387 +i* 0.767218| 1| 4.00499E-13 +i*-3.71465E-13| +| 11| 0.650958 +i* 0.759114| 1| 7.58768E-15 +i*-5.54055E-13| +| 12| 0.660427 +i* 0.750891| 1| 7.47999E-13 +i* 2.73089E-13| +| 13| 0.669792 +i* 0.742549| 1| 9.40577E-13 +i* 3.39433E-14| +| 14| 0.679051 +i* 0.734091| 1| 4.34264E-13 +i*-1.04887E-13| +| 15| 0.688204 +i* 0.725517| 1|-6.26926E-13 +i*-1.86798E-13| +| 16| 0.697248 +i* 0.71683| 1| 2.2389E-13 +i*-9.46795E-14| +| 17| 0.706183 +i* 0.708029| 1| 4.79186E-13 +i* 4.75144E-13| +| 18| 0.715007 +i* 0.699117| 1| 6.39138E-13 +i* 4.95824E-13| +| 19| 0.723718 +i* 0.690096| 1| -1.2694E-13 +i* 4.44528E-13| +| 20| 0.732316 +i* 0.680965| 1|-2.76158E-13 +i* 1.17734E-13| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +zone limite de 'log-exp' 1.00059 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 0 (of 3) uses CUDA device 0 +gpu 2 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 2 dimgrid2 782 start 400042 size 200021 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 782 start 200021 size 200021 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 782 start 0 size 200021 +gpu 0 iter : 1 Arret : 4.17374E-06 s/iter 
25.502913 +gpu 0 iter : 2 Arret : 4.12988E-06 s/iter 25.466465 +gpu 0 iter : 3 Arret : 3.89098E-06 s/iter 25.456717 +gpu 0 iter : 4 Arret : 3.93498E-06 s/iter 25.471780 +gpu 0 iter : 5 Arret : 4.075E-06 s/iter 25.480147 +gpu 0 iter : 6 Arret : 4.05328E-06 s/iter 25.490152 +gpu 0 iter : 7 Arret : 4.09388E-06 s/iter 25.467915 +gpu 0 iter : 8 Arret : 4.4692E-06 s/iter 25.472589 +gpu 0 iter : 9 Arret : 5.3977E-06 s/iter 25.487936 +gpu 0 iter : 10 Arret : 1.31096E-05 s/iter 25.504106 +gpu 0 iter : 11 Arret : 0.000429141 s/iter 25.483586 +gpu 0 iter : 12 Arret : 0.00225971 s/iter 25.488006 +gpu 0 iter : 13 Arret : 0.918253 s/iter 25.485654 +gpu 0 iter : 14 Arret : 0.738628 s/iter 28.610440 +gpu 0 iter : 15 Arret : 1.06679 s/iter 25.657526 +gpu 0 iter : 16 Arret : 0.00754293 s/iter 28.023636 +gpu 0 iter : 17 Arret : 0.00928206 s/iter 27.385101 +gpu 0 iter : 18 Arret : 0.00238733 s/iter 27.805420 +gpu 0 iter : 19 Arret : 0.0221226 s/iter 23.602314 +gpu 0 iter : 20 Arret : 0.00167275 s/iter 23.298279 +gpu 0 iter : 21 Arret : 0.000828652 s/iter 23.099043 +gpu 0 iter : 22 Arret : 0.00089783 s/iter 22.283044 +gpu 0 iter : 23 Arret : 0.000189743 s/iter 21.934545 +gpu 0 iter : 24 Arret : 5.2959E-05 s/iter 21.894963 +gpu 0 iter : 25 Arret : 1.63869E-05 s/iter 21.689444 +gpu 0 iter : 26 Arret : 5.47754E-06 s/iter 21.811193 +gpu 0 iter : 27 Arret : 1.27747E-07 s/iter 21.641069 +gpu 0 iter : 28 Arret : 4.20926E-13 s/iter 21.740517 +temps : 693.102 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 4.20926E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.553493 +i* -0.832854| 1|-5.02858E-13 +i* 3.83374E-15| +| 3| -0.579338 +i* -0.815087| 1| 4.42365E-13 +i* 2.65846E-14| +| 4| 0.592057 +i* 0.805896| 1| 
2.06783E-13 +i* 1.94549E-13| +| 5| -0.604613 +i* -0.796519| 1| 2.39135E-13 +i* 2.96967E-13| +| 6| 0.617037 +i* 0.786934| 1|-3.70964E-13 +i* 2.85104E-13| +| 7| -0.629293 +i* -0.777168| 1| 3.4002E-13 +i* 1.14925E-14| +| 8| 0.641411 +i* 0.767198| 1|-6.01835E-13 +i* 5.70316E-13| +| 9| -0.653354 +i* -0.757052| 1| 3.00003E-14 +i* 4.1084E-13| +| 10| 0.665153 +i* 0.746707| 1|-9.55243E-14 +i* 7.739E-13| +| 11| -0.676773 +i* -0.736192| 1|-3.70891E-13 +i* 4.31963E-14| +| 12| 0.688242 +i* 0.725482| 1| 4.17319E-13 +i*-2.25125E-13| +| 13| -0.699526 +i* -0.714607| 1|-1.55074E-13 +i* 3.9467E-13| +| 14| 0.710653 +i* 0.703543| 1|-7.94843E-13 +i* 5.61671E-13| +| 15| -0.721591 +i* -0.69232| 1|-8.20351E-14 +i* 3.39909E-13| +| 16| 0.732366 +i* 0.680912| 1| 5.01595E-13 +i* 2.59279E-13| +| 17| -0.742946 +i* -0.669351| 1|-1.90181E-13 +i* 1.23972E-13| +| 18| 0.753358 +i* 0.657611| 1|-7.14661E-13 +i*-3.96187E-13| +| 19| -0.76357 +i* -0.645725| 1|-3.31242E-13 +i*-8.50865E-14| +| 20| 0.773609 +i* 0.633664| 1|-7.93813E-13 +i* 2.09313E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +zone limite de 'log-exp' 1.00051 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 0 (of 3) uses CUDA device 0 +gpu 2 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 2 dimgrid2 912 start 466772 size 233386 +gpu 1 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 1 dimgrid2 912 start 233386 size 233386 +gpu 0 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 0 dimgrid2 912 start 0 size 233386 +gpu 0 iter : 1 Arret : 4.07574E-06 s/iter 34.223058 +gpu 0 iter : 2 Arret : 3.55154E-06 s/iter 34.224642 +gpu 0 iter : 3 Arret : 3.46878E-06 s/iter 34.212867 +gpu 0 iter : 4 Arret : 3.42717E-06 s/iter 34.222285 +gpu 0 iter : 5 Arret : 3.26935E-06 s/iter 34.215281 +gpu 0 iter : 6 Arret : 3.34195E-06 s/iter 34.197991 +gpu 0 iter : 7 Arret : 3.3903E-06 s/iter 34.208738 +gpu 0 iter : 8 Arret : 3.49838E-06 s/iter 34.196075 +gpu 0 
iter : 9 Arret : 3.56276E-06 s/iter 34.209024 +gpu 0 iter : 10 Arret : 5.84108E-06 s/iter 34.213481 +gpu 0 iter : 11 Arret : 0.00066379 s/iter 34.219783 +gpu 0 iter : 12 Arret : 0.00134105 s/iter 34.213025 +gpu 0 iter : 13 Arret : 0.00258505 s/iter 34.466511 +gpu 0 iter : 14 Arret : 0.0103479 s/iter 43.404986 +gpu 0 iter : 15 Arret : 0.00921676 s/iter 37.016770 +gpu 0 iter : 16 Arret : 0.00524991 s/iter 34.402114 +gpu 0 iter : 17 Arret : 0.00461832 s/iter 34.685302 +gpu 0 iter : 18 Arret : 0.0111077 s/iter 37.320698 +gpu 0 iter : 19 Arret : 0.277174 s/iter 35.309915 +gpu 0 iter : 20 Arret : 0.0136382 s/iter 37.689142 +gpu 0 iter : 21 Arret : 0.0160865 s/iter 34.656561 +gpu 0 iter : 22 Arret : 0.0117015 s/iter 34.545629 +gpu 0 iter : 23 Arret : 0.00660409 s/iter 34.694858 +gpu 0 iter : 24 Arret : 0.0024069 s/iter 35.413033 +gpu 0 iter : 25 Arret : 0.00112793 s/iter 34.552170 +gpu 0 iter : 26 Arret : 0.000118329 s/iter 34.545882 +gpu 0 iter : 27 Arret : 7.75369E-06 s/iter 34.554405 +gpu 0 iter : 28 Arret : 1.97801E-06 s/iter 34.600018 +gpu 0 iter : 29 Arret : 1.19455E-08 s/iter 34.514124 +gpu 0 iter : 30 Arret : 5.31286E-15 s/iter 34.636400 +temps : 1053.03 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.46263E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540352 +i* 0.841439| 1| 4.39978E-13 +i* 6.25043E-13| +| 2| -0.996034 +i* 0.0889731| 1| 2.2073E-13 +i* 1.55296E-13| +| 3| 0.439836 +i* -0.898078| 1|-3.55927E-13 +i*-1.21738E-13| +| 4| 0.38266 +i* -0.923889| 1|-2.56142E-13 +i*-7.02285E-14| +| 5| -0.988496 +i* 0.15125| 1|-1.52652E-13 +i*-1.11329E-13| +| 6| 0.641421 +i* 0.767189| 1|-1.31044E-13 +i* 5.61736E-13| +| 7| 0.323979 +i* -0.946064| 1|-4.52336E-13 +i* 8.74596E-14| +| 8| -0.977067 +i* 0.212932| 1| 8.58341E-14 +i* 1.73412E-13| +| 9| 0.688262 
+i* 0.725462| 1| 4.28754E-14 +i* 1.08849E-12| +| 10| 0.264022 +i* -0.964517| 1|-3.63883E-13 +i*-8.14886E-14| +| 11| -0.961793 +i* 0.273776| 1| -3.0213E-13 +i*-2.13897E-13| +| 12| 0.732395 +i* 0.68088| 1|-3.65194E-14 +i* 7.95483E-13| +| 13| 0.203027 +i* -0.979173| 1|-3.14502E-13 +i* 2.96924E-13| +| 14| -0.942735 +i* 0.333543| 1| 1.82947E-13 +i*-4.73458E-14| +| 15| 0.773646 +i* 0.633619| 1| 2.24352E-13 +i* 2.79674E-13| +| 16| 0.141232 +i* -0.989977| 1| -1.0035E-13 +i* 1.5693E-13| +| 17| -0.919967 +i* 0.391997| 1| 2.89213E-14 +i*-1.86252E-13| +| 18| 0.811852 +i* 0.583864| 1|-1.59939E-12 +i*-4.13669E-13| +| 19| 0.0788818 +i* -0.996884| 1|-2.83003E-13 +i* 1.04711E-13| +| 20| -0.893578 +i* 0.448908| 1| 4.59736E-14 +i* 1.31414E-13| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 1 +zone limite de 'log-exp' 1.00044 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 1042 start 0 size 266666 +gpu 2 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 2 dimgrid2 1042 start 533332 size 266666 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 1042 start 266666 size 266666 +gpu 0 iter : 1 Arret : 3.43128E-06 s/iter 44.316497 +gpu 0 iter : 2 Arret : 3.77153E-06 s/iter 44.131572 +gpu 0 iter : 3 Arret : 3.23873E-06 s/iter 44.315408 +gpu 0 iter : 4 Arret : 3.15113E-06 s/iter 44.328033 +gpu 0 iter : 5 Arret : 3.60598E-06 s/iter 44.311559 +gpu 0 iter : 6 Arret : 3.57581E-06 s/iter 44.316239 +gpu 0 iter : 7 Arret : 3.25175E-06 s/iter 44.224296 +gpu 0 iter : 8 Arret : 3.4699E-06 s/iter 44.325585 +gpu 0 iter : 9 Arret : 4.55022E-06 s/iter 44.283208 +gpu 0 iter : 10 Arret : 3.7857E-05 s/iter 44.288810 +gpu 0 iter : 11 Arret : 0.000824026 s/iter 44.305832 +gpu 0 iter : 12 Arret : 0.00406403 s/iter 49.181390 +gpu 0 iter : 13 Arret : 1.91903 s/iter 44.281962 +gpu 0 iter : 14 Arret : 0.315909 
s/iter 52.995186 +gpu 0 iter : 15 Arret : 0.325705 s/iter 48.752573 +gpu 0 iter : 16 Arret : 0.25171 s/iter 48.906019 +gpu 0 iter : 17 Arret : 0.107387 s/iter 44.063529 +gpu 0 iter : 18 Arret : 0.063654 s/iter 40.922131 +gpu 0 iter : 19 Arret : 0.0247294 s/iter 39.343896 +gpu 0 iter : 20 Arret : 0.015705 s/iter 38.504441 +gpu 0 iter : 21 Arret : 0.00670205 s/iter 39.597806 +gpu 0 iter : 22 Arret : 0.00378517 s/iter 35.764039 +gpu 0 iter : 23 Arret : 0.00973025 s/iter 33.436854 +gpu 0 iter : 24 Arret : 0.00954051 s/iter 32.742842 +gpu 0 iter : 25 Arret : 0.000557232 s/iter 31.071844 +gpu 0 iter : 26 Arret : 2.73926E-05 s/iter 30.889921 +gpu 0 iter : 27 Arret : 2.78216E-06 s/iter 30.780761 +gpu 0 iter : 28 Arret : 2.46904E-08 s/iter 30.743643 +gpu 0 iter : 29 Arret : 6.07909E-14 s/iter 30.869112 +temps : 1191.46 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 0.0233219 +Stabilite : 3.24723E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| 0.592061 +i* 0.805893| 1|-1.57249E-13 +i*-4.43364E-13| +| 3| 0.617051 +i* 0.786923| 1|-6.42805E-13 +i*-3.49094E-13| +| 4| 0.641434 +i* 0.767178| 1| 1.00022E-12 +i*-5.90578E-13| +| 5| 0.665186 +i* 0.746678| 1|-2.53998E-14 +i*-1.14684E-12| +| 6| 0.688283 +i* 0.725442| 1|-8.68732E-13 +i* 8.52696E-13| +| 7| 0.710703 +i* 0.703493| 1| 2.02581E-13 +i* 4.54699E-13| +| 8| 0.732422 +i* 0.680851| 1|-5.22353E-13 +i*-3.99873E-13| +| 9| 0.753421 +i* 0.657538| 1| 1.23356E-13 +i*-1.05986E-12| +| 10| 0.773678 +i* 0.633579| 1|-6.75196E-13 +i* 3.60108E-13| +| 11| 0.793174 +i* 0.608995| 1| 4.43853E-13 +i*-1.42398E-12| +| 12| 0.811888 +i* 0.583813| 1|-4.10491E-13 +i*-4.46651E-13| +| 13| 0.829804 +i* 0.558055| 1| 1.30045E-12 +i* 1.12788E-13| +| 14| 0.846902 +i* 0.531748| 1|-8.09419E-13 +i* 4.98091E-13| +| 
15| 0.863167 +i* 0.504918| 1| 2.98522E-13 +i* 3.81547E-13| +| 16| 0.878582 +i* 0.477591| 1|-3.06581E-13 +i*-6.95869E-13| +| 17| 0.893133 +i* 0.449793| 1| 1.24355E-13 +i* -1.3239E-12| +| 18| 0.906804 +i* 0.421553| 1|-1.23117E-12 +i*-5.57117E-13| +| 19| 0.919582 +i* 0.392898| 1|-1.03648E-12 +i* 2.90445E-14| +| 20| 0.931455 +i* 0.363856| 1|-6.42708E-13 +i*-1.50318E-12| ++---+----------------------------+------------+----------------------------+ +799998 racines de module = 1 + 2 racines de module = 0.999973 diff --git a/Simulations/full_openmp/full_openmp_3GPU.sge b/Simulations/full_openmp/full_openmp_3GPU.sge new file mode 100644 index 0000000..c3a277c --- /dev/null +++ b/Simulations/full_openmp/full_openmp_3GPU.sge @@ -0,0 +1,27 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=3 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -pe openmp 3 +#$ -V +#$ -cwd +#$ -N full_openmp_3GPU + +module load gcc/4.9.0 +module load cuda/7.0 + + +./template -r -i 60000 40000 +./template -r -i 150000 50000 +./template -r -i 250000 150000 +./template -r -i 350000 250000 +./template -r -i 500000 300000 +./template -r -i 600000 400000 +./template -r -i 700000 500000 +./template -r -i 800000 600000 +#./template -r -i 900000 700000 +#./template -r -i 1000000 800000 +#./template -r -i 1500000 500000 + + diff --git a/Simulations/full_openmp/full_openmp_4GPU.o140162 b/Simulations/full_openmp/full_openmp_4GPU.o140162 new file mode 100644 index 0000000..5a3649d --- /dev/null +++ b/Simulations/full_openmp/full_openmp_4GPU.o140162 @@ -0,0 +1,590 @@ +REMAINING: 4 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +Taking GPU #3 +zone limite de 'log-exp' 1.00593 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 3 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 3 dimgrid2 59 start 45120 size 15040 +gpu 2 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 2 dimgrid2 59 start 30080 size 15040 +gpu 0 
dimgrid 235 dimblock 256 degrePoly 60000 +gpu 0 dimgrid2 59 start 0 size 15040 +gpu 1 dimgrid 235 dimblock 256 degrePoly 60000 +gpu 1 dimgrid2 59 start 15040 size 15040 +gpu 0 iter : 1 Arret : 4.54253E-05 s/iter 0.204175 +gpu 0 iter : 2 Arret : 4.02349E-05 s/iter 0.189665 +gpu 0 iter : 3 Arret : 3.82695E-05 s/iter 0.189681 +gpu 0 iter : 4 Arret : 3.90123E-05 s/iter 0.189717 +gpu 0 iter : 5 Arret : 4.05115E-05 s/iter 0.189657 +gpu 0 iter : 6 Arret : 4.39547E-05 s/iter 0.189790 +gpu 0 iter : 7 Arret : 5.45799E-05 s/iter 0.189703 +gpu 0 iter : 8 Arret : 0.000119388 s/iter 0.189738 +gpu 0 iter : 9 Arret : 0.00119487 s/iter 0.189634 +gpu 0 iter : 10 Arret : 0.00289573 s/iter 0.189661 +gpu 0 iter : 11 Arret : 2.16041 s/iter 0.189628 +gpu 0 iter : 12 Arret : 0.350069 s/iter 0.189703 +gpu 0 iter : 13 Arret : 0.131331 s/iter 1.021619 +gpu 0 iter : 14 Arret : 0.0516998 s/iter 1.018752 +gpu 0 iter : 15 Arret : 0.0205122 s/iter 1.016639 +gpu 0 iter : 16 Arret : 0.012334 s/iter 1.013349 +gpu 0 iter : 17 Arret : 0.00704057 s/iter 1.007092 +gpu 0 iter : 18 Arret : 0.00458473 s/iter 0.868843 +gpu 0 iter : 19 Arret : 0.00325386 s/iter 0.853210 +gpu 0 iter : 20 Arret : 0.00249036 s/iter 0.836780 +gpu 0 iter : 21 Arret : 0.0018094 s/iter 0.184672 +gpu 0 iter : 22 Arret : 0.00401767 s/iter 0.184541 +gpu 0 iter : 23 Arret : 0.048161 s/iter 0.183544 +gpu 0 iter : 24 Arret : 0.00734855 s/iter 0.178753 +gpu 0 iter : 25 Arret : 0.0107124 s/iter 0.178628 +gpu 0 iter : 26 Arret : 0.00180991 s/iter 0.172491 +gpu 0 iter : 27 Arret : 0.000329189 s/iter 0.172292 +gpu 0 iter : 28 Arret : 7.3153E-05 s/iter 0.172287 +gpu 0 iter : 29 Arret : 9.70999E-06 s/iter 0.172276 +gpu 0 iter : 30 Arret : 5.49374E-08 s/iter 0.172248 +gpu 0 iter : 31 Arret : 1.71107E-12 s/iter 0.172323 +gpu 0 iter : 32 Arret : 1.57009E-16 s/iter 0.172301 +temps : 13.5366 seconde(s) +Nb iterations : 32 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.35784E-10 +Stabilite : 1.57009E-16 
++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540783 +i* 0.841162| 1|-7.58456E-14 +i* 3.78031E-14| +| 2| -0.992343 +i* -0.123513| 1|-4.36456E-15 +i* 3.59435E-15| +| 3| 0.0563346 +i* 0.998412| 1| 5.70377E-15 +i* 3.3501E-14| +| 4| -0.802793 +i* -0.596258| 1| 2.03657E-15 +i* 1.01915E-14| +| 5| 0.730552 +i* -0.682857| 1|-7.48429E-14 +i* 6.77011E-14| +| 6| -0.442728 +i* 0.896656| 1|-3.77198E-14 +i*-1.89779E-15| +| 7| -0.404888 +i* -0.914366| 1| 3.20195E-14 +i* 9.65894E-15| +| 8| 0.972126 +i* -0.23446| 1| 4.02421E-14 +i*-1.54755E-14| +| 9| -0.826939 +i* 0.562292| 1| -2.4928E-14 +i*-1.59889E-14| +| 10| 0.0979895 +i* -0.995187| 1| 2.90878E-14 +i*-6.75675E-15| +| 11| 0.961513 +i* 0.27476| 1|-9.39769E-14 +i*-2.63912E-13| +| 12| -0.996627 +i* 0.0820589| 1| 2.39773E-14 +i* 1.74825E-14| +| 13| 0.575447 +i* -0.817839| 1|-3.49894E-14 +i*-7.98545E-14| +| 14| 0.701466 +i* 0.712703| 1| 7.52211E-14 +i* 1.53991E-14| +| 15| 0.259346 +i* 0.965785| 1|-2.14863E-14 +i*-2.81355E-14| +| 16| -0.907773 +i* -0.419461| 1|-3.62869E-14 +i*-9.49414E-15| +| 17| 0.903623 +i* -0.428329| 1|-1.24969E-14 +i* 7.51222E-14| +| 18| -0.249979 +i* 0.968251| 1|-1.59074E-14 +i*-1.09721E-14| +| 19| -0.583341 +i* -0.812227| 1| 1.92242E-14 +i* 2.27058E-14| +| 20| 0.997383 +i* 0.072297| 1| 2.53037E-13 +i*-5.92819E-13| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 1 +zone limite de 'log-exp' 1.00237 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 0 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 0 dimgrid2 147 start 0 size 37504 +gpu 3 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 3 dimgrid2 147 start 112512 size 37504 +gpu 1 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 1 dimgrid2 147 start 37504 
size 37504 +gpu 2 dimgrid 586 dimblock 256 degrePoly 150000 +gpu 2 dimgrid2 147 start 75008 size 37504 +gpu 0 iter : 1 Arret : 1.6116E-05 s/iter 1.403394 +gpu 0 iter : 2 Arret : 1.52925E-05 s/iter 1.387067 +gpu 0 iter : 3 Arret : 1.51523E-05 s/iter 1.386759 +gpu 0 iter : 4 Arret : 1.86476E-05 s/iter 1.382149 +gpu 0 iter : 5 Arret : 1.57671E-05 s/iter 1.386808 +gpu 0 iter : 6 Arret : 1.6295E-05 s/iter 1.386892 +gpu 0 iter : 7 Arret : 1.80188E-05 s/iter 1.386856 +gpu 0 iter : 8 Arret : 2.08003E-05 s/iter 1.386801 +gpu 0 iter : 9 Arret : 3.59837E-05 s/iter 1.386900 +gpu 0 iter : 10 Arret : 0.00139949 s/iter 1.381972 +gpu 0 iter : 11 Arret : 0.00379917 s/iter 1.387000 +gpu 0 iter : 12 Arret : 0.00480593 s/iter 2.678954 +gpu 0 iter : 13 Arret : 0.0063728 s/iter 2.972359 +gpu 0 iter : 14 Arret : 0.0158488 s/iter 1.381889 +gpu 0 iter : 15 Arret : 0.0137848 s/iter 3.041156 +gpu 0 iter : 16 Arret : 0.0131859 s/iter 1.379081 +gpu 0 iter : 17 Arret : 1.29468 s/iter 3.020840 +gpu 0 iter : 18 Arret : 0.0424345 s/iter 3.418165 +gpu 0 iter : 19 Arret : 0.0201069 s/iter 3.422654 +gpu 0 iter : 20 Arret : 0.00607561 s/iter 2.950185 +gpu 0 iter : 21 Arret : 0.00629018 s/iter 3.290739 +gpu 0 iter : 22 Arret : 0.00557589 s/iter 1.335444 +gpu 0 iter : 23 Arret : 0.000991862 s/iter 1.330521 +gpu 0 iter : 24 Arret : 0.00206487 s/iter 1.322392 +gpu 0 iter : 25 Arret : 0.000365679 s/iter 1.334823 +gpu 0 iter : 26 Arret : 0.000144648 s/iter 1.333867 +gpu 0 iter : 27 Arret : 0.00033044 s/iter 1.332139 +gpu 0 iter : 28 Arret : 1.48376E-05 s/iter 1.334037 +gpu 0 iter : 29 Arret : 4.12386E-10 s/iter 1.324928 +gpu 0 iter : 30 Arret : 4.00547E-15 s/iter 1.333918 +temps : 56.2628 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.26535E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 
0.540528 +i* 0.841326| 1| 8.68923E-14 +i* 2.2979E-13| +| 2| -0.905603 +i* -0.424127| 1| 6.50001E-14 +i* -3.0061E-14| +| 3| -0.774122 +i* 0.633037| 1|-3.89619E-14 +i*-6.71876E-14| +| 4| 0.317935 +i* -0.948113| 1| 4.656E-15 +i* 1.15645E-13| +| 5| 0.235978 +i* 0.971758| 1|-2.91295E-14 +i*-3.06716E-14| +| 6| -0.717299 +i* -0.696766| 1| 5.63785E-15 +i*-6.71685E-14| +| 7| 0.992349 +i* -0.123462| 1|-4.81056E-13 +i* 9.00335E-13| +| 8| -0.938482 +i* 0.345329| 1|-6.95555E-14 +i*-3.79159E-14| +| 9| 0.610294 +i* -0.792175| 1| -5.4852E-14 +i*-3.26232E-14| +| 10| -0.0946394 +i* 0.995512| 1|-4.73788E-14 +i*-8.10827E-14| +| 11| -0.450242 +i* -0.892906| 1| 2.41855E-14 +i*-3.23699E-15| +| 12| 0.978218 +i* 0.207583| 1|-2.84429E-13 +i* 4.69725E-13| +| 13| -0.999806 +i* 0.0197069| 1|-4.72365E-14 +i*-2.55716E-14| +| 14| 0.835648 +i* -0.549265| 1|-2.95892E-13 +i* 2.34143E-13| +| 15| -0.414707 +i* 0.909955| 1| 7.26225E-14 +i*-1.70003E-15| +| 16| -0.133754 +i* -0.991015| 1|-2.88485E-14 +i* 2.14499E-14| +| 17| 0.856687 +i* 0.515837| 1| 1.49106E-13 +i* 3.95153E-14| +| 18| -0.951361 +i* -0.308079| 1| 3.78308E-14 +i* 4.65843E-14| +| 19| 0.969257 +i* -0.24605| 1| 5.51163E-13 +i*-4.79498E-13| +| 20| -0.689285 +i* 0.724491| 1| 2.40086E-15 +i*-3.61777E-14| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1 +zone limite de 'log-exp' 1.00142 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 2 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 2 dimgrid2 245 start 125056 size 62528 +gpu 0 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 0 dimgrid2 245 start 0 size 62528 +gpu 3 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 3 dimgrid2 245 start 187584 size 62528 +gpu 1 dimgrid 977 dimblock 256 degrePoly 250000 +gpu 1 dimgrid2 245 start 62528 size 62528 +gpu 0 iter : 1 Arret : 1.14841E-05 s/iter 3.820958 +gpu 0 iter : 2 Arret : 9.97904E-06 
s/iter 3.814972 +gpu 0 iter : 3 Arret : 1.0158E-05 s/iter 3.809374 +gpu 0 iter : 4 Arret : 9.50123E-06 s/iter 3.808973 +gpu 0 iter : 5 Arret : 9.84188E-06 s/iter 3.808465 +gpu 0 iter : 6 Arret : 9.56156E-06 s/iter 3.815126 +gpu 0 iter : 7 Arret : 9.85167E-06 s/iter 3.816179 +gpu 0 iter : 8 Arret : 1.00437E-05 s/iter 3.818435 +gpu 0 iter : 9 Arret : 3.05444E-05 s/iter 3.817012 +gpu 0 iter : 10 Arret : 0.00147405 s/iter 3.816247 +gpu 0 iter : 11 Arret : 0.00154571 s/iter 3.810174 +gpu 0 iter : 12 Arret : 0.000731342 s/iter 3.808902 +gpu 0 iter : 13 Arret : 0.00122682 s/iter 3.808356 +gpu 0 iter : 14 Arret : 0.00109532 s/iter 3.815259 +gpu 0 iter : 15 Arret : 0.0011892 s/iter 3.779459 +gpu 0 iter : 16 Arret : 0.000794066 s/iter 2.968072 +gpu 0 iter : 17 Arret : 0.00960632 s/iter 2.174069 +gpu 0 iter : 18 Arret : 0.3054 s/iter 4.920214 +gpu 0 iter : 19 Arret : 0.00164869 s/iter 2.134462 +gpu 0 iter : 20 Arret : 0.00100296 s/iter 2.137935 +gpu 0 iter : 21 Arret : 0.000263024 s/iter 2.128112 +gpu 0 iter : 22 Arret : 0.0007086 s/iter 2.111936 +gpu 0 iter : 23 Arret : 0.00101441 s/iter 2.112455 +gpu 0 iter : 24 Arret : 0.000848875 s/iter 2.109033 +gpu 0 iter : 25 Arret : 0.00150539 s/iter 2.111749 +gpu 0 iter : 26 Arret : 5.16459E-05 s/iter 2.096918 +gpu 0 iter : 27 Arret : 1.87546E-07 s/iter 2.098589 +gpu 0 iter : 28 Arret : 2.77608E-13 s/iter 2.110056 +temps : 89.8766 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.3128E-09 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540427 +i* 0.841391| 1| 9.7148E-14 +i*-1.98189E-13| +| 2| -0.997949 +i* 0.0640067| 1| 1.02696E-14 +i* 2.88415E-14| +| 3| 0.450991 +i* -0.892528| 1| 2.39739E-15 +i* 7.66835E-14| +| 4| 0.42851 +i* -0.903537| 1| 1.03733E-13 +i* 1.27433E-14| +| 5| -0.996035 +i* 0.0889649| 1| 5.1386E-14 +i* 
4.21729E-14| +| 6| 0.581876 +i* 0.813277| 1| 3.29906E-13 +i* -3.5718E-15| +| 7| 0.405761 +i* -0.913979| 1| 1.69923E-13 +i*-8.86062E-14| +| 8| -0.993496 +i* 0.113867| 1| 6.34562E-14 +i* 6.04291E-14| +| 9| 0.60205 +i* 0.798458| 1| 2.39371E-13 +i* -2.2848E-13| +| 10| 0.382757 +i* -0.923849| 1| 6.36852E-14 +i* 1.1601E-13| +| 11| -0.990335 +i* 0.138698| 1| 8.32286E-14 +i* 4.57395E-14| +| 12| 0.621846 +i* 0.783139| 1| 3.5482E-14 +i*-1.57841E-13| +| 13| 0.359514 +i* -0.93314| 1| 1.00985E-13 +i*-2.52237E-13| +| 14| -0.986553 +i* 0.163442| 1| 3.24636E-14 +i* 4.58574E-14| +| 15| 0.641253 +i* 0.767329| 1| 1.79533E-13 +i* 3.03096E-13| +| 16| 0.336045 +i* -0.941846| 1| 1.38948E-13 +i*-8.14071E-14| +| 17| -0.982153 +i* 0.188084| 1| 6.94549E-14 +i* 3.09405E-14| +| 18| 0.660258 +i* 0.751039| 1| 4.21871E-13 +i* 5.02185E-14| +| 19| 0.312366 +i* -0.949962| 1|-6.37199E-14 +i*-7.39669E-14| +| 20| -0.977138 +i* 0.212608| 1|-3.80633E-14 +i* -8.4285E-14| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 1 +zone limite de 'log-exp' 1.00101 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 0 (of 4) uses CUDA device 0 +gpu 3 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 3 dimgrid2 342 start 262656 size 87552 +gpu 2 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 2 dimgrid2 342 start 175104 size 87552 +gpu 1 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 1 dimgrid2 342 start 87552 size 87552 +gpu 0 dimgrid 1368 dimblock 256 degrePoly 350000 +gpu 0 dimgrid2 342 start 0 size 87552 +gpu 0 iter : 1 Arret : 6.88539E-06 s/iter 6.540061 +gpu 0 iter : 2 Arret : 6.8684E-06 s/iter 6.536458 +gpu 0 iter : 3 Arret : 7.55734E-06 s/iter 6.535814 +gpu 0 iter : 4 Arret : 6.96901E-06 s/iter 6.536741 +gpu 0 iter : 5 Arret : 6.72451E-06 s/iter 6.533504 +gpu 0 iter : 6 Arret : 6.76555E-06 s/iter 6.534876 +gpu 0 iter : 7 Arret : 7.08866E-06 s/iter 6.534819 +gpu 0 iter : 8 
Arret : 7.79946E-06 s/iter 6.533534 +gpu 0 iter : 9 Arret : 9.74863E-06 s/iter 6.531511 +gpu 0 iter : 10 Arret : 0.000378804 s/iter 6.530246 +gpu 0 iter : 11 Arret : 0.000478777 s/iter 6.545753 +gpu 0 iter : 12 Arret : 0.0010319 s/iter 6.531644 +gpu 0 iter : 13 Arret : 0.810083 s/iter 6.532661 +gpu 0 iter : 14 Arret : 3.38477 s/iter 9.611632 +gpu 0 iter : 15 Arret : 0.137317 s/iter 9.586509 +gpu 0 iter : 16 Arret : 0.0655441 s/iter 11.282824 +gpu 0 iter : 17 Arret : 0.0396702 s/iter 11.222823 +gpu 0 iter : 18 Arret : 0.165636 s/iter 11.248406 +gpu 0 iter : 19 Arret : 0.114767 s/iter 11.345882 +gpu 0 iter : 20 Arret : 0.0535778 s/iter 11.198285 +gpu 0 iter : 21 Arret : 0.0468459 s/iter 10.374819 +gpu 0 iter : 22 Arret : 0.0531479 s/iter 11.376048 +gpu 0 iter : 23 Arret : 0.0587573 s/iter 9.681631 +gpu 0 iter : 24 Arret : 0.380742 s/iter 9.616663 +gpu 0 iter : 25 Arret : 0.158886 s/iter 6.481929 +gpu 0 iter : 26 Arret : 0.19048 s/iter 10.400978 +gpu 0 iter : 27 Arret : 0.115233 s/iter 7.157960 +gpu 0 iter : 28 Arret : 0.0624603 s/iter 7.226846 +gpu 0 iter : 29 Arret : 0.00065803 s/iter 6.480500 +gpu 0 iter : 30 Arret : 2.18809E-05 s/iter 6.480583 +gpu 0 iter : 31 Arret : 3.02291E-05 s/iter 6.478820 +gpu 0 iter : 32 Arret : 6.59107E-06 s/iter 6.479051 +gpu 0 iter : 33 Arret : 1.18098E-07 s/iter 6.480090 +gpu 0 iter : 34 Arret : 1.37334E-12 s/iter 6.481310 +gpu 0 iter : 35 Arret : 1.11023E-16 s/iter 6.479636 +temps : 279.804 seconde(s) +Nb iterations : 35 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.46096E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540399 +i* 0.841409| 1| 5.12961E-13 +i*-3.37404E-15| +| 2| -0.385479 +i* 0.922716| 1| -1.616E-13 +i*-2.73566E-14| +| 3| -0.770131 +i* 0.637886| 1|-1.38431E-15 +i* 1.70921E-13| +| 4| -0.978357 +i* 0.206925| 1|-3.07393E-15 +i* 
4.96131E-15| +| 5| -0.962455 +i* -0.27144| 1|-5.85088E-14 +i* 7.9714E-14| +| 6| -0.72607 +i* -0.687621| 1| -2.0612E-14 +i* 2.87948E-13| +| 7| -0.323352 +i* -0.946279| 1| 2.27159E-13 +i* 7.30891E-14| +| 8| 0.153459 +i* -0.988155| 1| 4.60049E-15 +i*-2.43555E-14| +| 9| 0.595097 +i* -0.803654| 1|-3.46265E-13 +i* 1.60098E-14| +| 10| 0.900408 +i* -0.435047| 1| 3.20081E-13 +i*-1.77827E-14| +| 11| 0.999448 +i* 0.0332229| 1|-5.70342E-13 +i* 1.21308E-12| +| 12| 0.869529 +i* 0.493882| 1| 3.01252E-14 +i* 6.11216E-13| +| 13| 0.211292 +i* 0.977423| 1|-6.97532E-14 +i* 1.23212E-13| +| 14| -0.267139 +i* 0.963658| 1|-9.26238E-14 +i*-7.20968E-14| +| 15| -0.684372 +i* 0.729133| 1| 1.64042E-13 +i*-1.89831E-14| +| 16| -0.944825 +i* 0.327574| 1| 3.70572E-14 +i*-6.84904E-14| +| 17| -0.988833 +i* -0.149027| 1|-1.41002E-13 +i* 2.02581E-14| +| 18| -0.806314 +i* -0.591488| 1| 1.24668E-13 +i*-2.62805E-13| +| 19| -0.439079 +i* -0.898448| 1|-1.76949E-13 +i*-1.05707E-13| +| 20| 0.0287415 +i* -0.999587| 1| 1.62724E-13 +i*-6.82891E-14| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 1 +zone limite de 'log-exp' 1.00071 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 3 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 3 dimgrid2 489 start 375168 size 125056 +gpu 1 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 1 dimgrid2 489 start 125056 size 125056 +gpu 0 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 0 dimgrid2 489 start 0 size 125056 +gpu 2 dimgrid 1954 dimblock 256 degrePoly 500000 +gpu 2 dimgrid2 489 start 250112 size 125056 +gpu 0 iter : 1 Arret : 5.43682E-06 s/iter 13.802902 +gpu 0 iter : 2 Arret : 4.91044E-06 s/iter 13.790958 +gpu 0 iter : 3 Arret : 4.91315E-06 s/iter 13.790511 +gpu 0 iter : 4 Arret : 4.67858E-06 s/iter 13.806112 +gpu 0 iter : 5 Arret : 4.77709E-06 s/iter 13.805612 +gpu 0 iter : 6 Arret : 4.66912E-06 
s/iter 13.804348 +gpu 0 iter : 7 Arret : 4.83022E-06 s/iter 13.804019 +gpu 0 iter : 8 Arret : 5.21278E-06 s/iter 13.800214 +gpu 0 iter : 9 Arret : 6.23421E-06 s/iter 13.801225 +gpu 0 iter : 10 Arret : 0.000564578 s/iter 13.800687 +gpu 0 iter : 11 Arret : 0.000810388 s/iter 13.802100 +gpu 0 iter : 12 Arret : 0.00138997 s/iter 13.800427 +gpu 0 iter : 13 Arret : 0.00220275 s/iter 18.005536 +gpu 0 iter : 14 Arret : 0.00421803 s/iter 13.791507 +gpu 0 iter : 15 Arret : 0.00623459 s/iter 13.530051 +gpu 0 iter : 16 Arret : 1.4756 s/iter 11.805523 +gpu 0 iter : 17 Arret : 0.0156198 s/iter 14.532176 +gpu 0 iter : 18 Arret : 0.0107648 s/iter 13.020495 +gpu 0 iter : 19 Arret : 0.0045075 s/iter 12.656318 +gpu 0 iter : 20 Arret : 0.00121976 s/iter 8.450054 +gpu 0 iter : 21 Arret : 0.000890648 s/iter 11.499489 +gpu 0 iter : 22 Arret : 0.00233504 s/iter 7.388259 +gpu 0 iter : 23 Arret : 0.00149094 s/iter 7.283653 +gpu 0 iter : 24 Arret : 0.00113868 s/iter 11.307597 +gpu 0 iter : 25 Arret : 0.000125947 s/iter 7.035207 +gpu 0 iter : 26 Arret : 2.52318E-05 s/iter 6.864347 +gpu 0 iter : 27 Arret : 3.0855E-08 s/iter 6.748053 +gpu 0 iter : 28 Arret : 9.3245E-14 s/iter 5.878949 +temps : 337.034 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.48768E-08 +Stabilite : 1.41899E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540372 +i* 0.841426| 1|-3.05235E-13 +i* 1.38721E-13| +| 2| 0.561316 +i* 0.827602| 1|-2.60021E-13 +i* 1.9206E-13| +| 3| 0.57165 +i* 0.820497| 1|-1.83308E-13 +i* 6.15844E-14| +| 4| 0.581895 +i* 0.813264| 1| 3.05839E-13 +i* 6.52482E-14| +| 5| 0.592048 +i* 0.805902| 1|-7.14016E-13 +i*-3.98882E-14| +| 6| 0.602109 +i* 0.798414| 1| 2.66658E-13 +i*-4.75979E-13| +| 7| 0.612074 +i* 0.7908| 1| 3.16743E-13 +i*-3.40844E-13| +| 8| 0.621943 +i* 0.783062| 1| 5.64146E-13 +i*-3.14632E-13| +| 9| 
0.631715 +i* 0.775201| 1|-3.83756E-14 +i* 5.41086E-13| +| 10| 0.641387 +i* 0.767218| 1| 4.00499E-13 +i*-3.71465E-13| +| 11| 0.650958 +i* 0.759114| 1| 7.58768E-15 +i*-5.54055E-13| +| 12| 0.660427 +i* 0.750891| 1| 7.47999E-13 +i* 2.73089E-13| +| 13| 0.669792 +i* 0.742549| 1| 9.40577E-13 +i* 3.39433E-14| +| 14| 0.679051 +i* 0.734091| 1| 4.34264E-13 +i*-1.04887E-13| +| 15| 0.688204 +i* 0.725517| 1|-6.26926E-13 +i*-1.86798E-13| +| 16| 0.697248 +i* 0.71683| 1| 2.2389E-13 +i*-9.46795E-14| +| 17| 0.706183 +i* 0.708029| 1| 4.79186E-13 +i* 4.75144E-13| +| 18| 0.715007 +i* 0.699117| 1| 6.39138E-13 +i* 4.95824E-13| +| 19| 0.723718 +i* 0.690096| 1| -1.2694E-13 +i* 4.44528E-13| +| 20| 0.732316 +i* 0.680965| 1|-2.76158E-13 +i* 1.17734E-13| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +zone limite de 'log-exp' 1.00059 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 586 start 0 size 150016 +gpu 2 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 2 dimgrid2 586 start 300032 size 150016 +gpu 3 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 3 dimgrid2 586 start 450048 size 150016 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 586 start 150016 size 150016 +gpu 0 iter : 1 Arret : 4.20321E-06 s/iter 18.776658 +gpu 0 iter : 2 Arret : 4.13056E-06 s/iter 18.721323 +gpu 0 iter : 3 Arret : 4.11084E-06 s/iter 18.739702 +gpu 0 iter : 4 Arret : 4.14768E-06 s/iter 18.725990 +gpu 0 iter : 5 Arret : 3.97777E-06 s/iter 18.735245 +gpu 0 iter : 6 Arret : 4.16195E-06 s/iter 18.723334 +gpu 0 iter : 7 Arret : 4.19454E-06 s/iter 18.733188 +gpu 0 iter : 8 Arret : 4.62315E-06 s/iter 18.730439 +gpu 0 iter : 9 Arret : 6.05437E-06 s/iter 18.723590 +gpu 0 iter : 10 Arret : 1.53978E-05 s/iter 18.723454 +gpu 0 iter : 11 Arret : 0.000456524 s/iter 18.740808 
+gpu 0 iter : 12 Arret : 0.00137167 s/iter 18.729445 +gpu 0 iter : 13 Arret : 0.00165831 s/iter 18.748008 +gpu 0 iter : 14 Arret : 1.38016 s/iter 18.749001 +gpu 0 iter : 15 Arret : 0.619057 s/iter 19.564421 +gpu 0 iter : 16 Arret : 0.0544873 s/iter 20.890543 +gpu 0 iter : 17 Arret : 0.0338392 s/iter 23.493737 +gpu 0 iter : 18 Arret : 0.0124964 s/iter 20.037893 +gpu 0 iter : 19 Arret : 0.00639686 s/iter 21.581791 +gpu 0 iter : 20 Arret : 0.00399724 s/iter 18.002558 +gpu 0 iter : 21 Arret : 0.00256288 s/iter 17.692790 +gpu 0 iter : 22 Arret : 0.000413689 s/iter 17.539980 +gpu 0 iter : 23 Arret : 0.0010819 s/iter 17.582527 +gpu 0 iter : 24 Arret : 0.000517706 s/iter 17.387151 +gpu 0 iter : 25 Arret : 1.40294E-05 s/iter 17.415382 +gpu 0 iter : 26 Arret : 1.44098E-06 s/iter 17.345061 +gpu 0 iter : 27 Arret : 2.93009E-09 s/iter 16.538716 +gpu 0 iter : 28 Arret : 8.5314E-15 s/iter 16.484147 +temps : 525.532 seconde(s) +Nb iterations : 28 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.38109E-08 +Stabilite : 8.5314E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540365 +i* 0.841431| 1| 4.39062E-13 +i* 5.83011E-13| +| 2| -0.553493 +i* -0.832854| 1|-5.02858E-13 +i* 3.83374E-15| +| 3| -0.579338 +i* -0.815087| 1| 4.42365E-13 +i* 2.65846E-14| +| 4| 0.592057 +i* 0.805896| 1| 2.06783E-13 +i* 1.94549E-13| +| 5| -0.604613 +i* -0.796519| 1| 2.39135E-13 +i* 2.96967E-13| +| 6| 0.617037 +i* 0.786934| 1|-3.70964E-13 +i* 2.85104E-13| +| 7| -0.629293 +i* -0.777168| 1| 3.4002E-13 +i* 1.14925E-14| +| 8| 0.641411 +i* 0.767198| 1|-6.01835E-13 +i* 5.70316E-13| +| 9| -0.653354 +i* -0.757052| 1| 3.00003E-14 +i* 4.1084E-13| +| 10| 0.665153 +i* 0.746707| 1|-9.55243E-14 +i* 7.739E-13| +| 11| -0.676773 +i* -0.736192| 1|-3.70891E-13 +i* 4.31963E-14| +| 12| 0.688242 +i* 0.725482| 1| 4.17319E-13 +i*-2.25125E-13| +| 13| -0.699526 +i* 
-0.714607| 1|-1.55074E-13 +i* 3.9467E-13| +| 14| 0.710653 +i* 0.703543| 1|-7.94843E-13 +i* 5.61671E-13| +| 15| -0.721591 +i* -0.69232| 1|-8.20351E-14 +i* 3.39909E-13| +| 16| 0.732366 +i* 0.680912| 1| 5.01595E-13 +i* 2.59279E-13| +| 17| -0.742946 +i* -0.669351| 1|-1.90181E-13 +i* 1.23972E-13| +| 18| 0.753358 +i* 0.657611| 1|-7.14661E-13 +i*-3.96187E-13| +| 19| -0.76357 +i* -0.645725| 1|-3.31242E-13 +i*-8.50865E-14| +| 20| 0.773609 +i* 0.633664| 1|-7.93813E-13 +i* 2.09313E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 1 +zone limite de 'log-exp' 1.00051 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 3 (of 4) uses CUDA device 3 +gpu 2 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 2 dimgrid2 684 start 350080 size 175040 +gpu 0 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 1 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 1 dimgrid2 684 start 175040 size 175040 +gpu 0 dimgrid2 684 start 0 size 175040 +gpu 3 dimgrid 2735 dimblock 256 degrePoly 700000 +gpu 3 dimgrid2 684 start 525120 size 175040 +gpu 0 iter : 1 Arret : 4.05179E-06 s/iter 26.057760 +gpu 0 iter : 2 Arret : 3.69041E-06 s/iter 26.006401 +gpu 0 iter : 3 Arret : 3.54349E-06 s/iter 26.017285 +gpu 0 iter : 4 Arret : 3.54342E-06 s/iter 26.011286 +gpu 0 iter : 5 Arret : 3.59693E-06 s/iter 26.022969 +gpu 0 iter : 6 Arret : 3.48529E-06 s/iter 26.021812 +gpu 0 iter : 7 Arret : 3.57662E-06 s/iter 26.011888 +gpu 0 iter : 8 Arret : 3.69147E-06 s/iter 26.008709 +gpu 0 iter : 9 Arret : 3.94782E-06 s/iter 26.004937 +gpu 0 iter : 10 Arret : 6.25107E-05 s/iter 26.012739 +gpu 0 iter : 11 Arret : 0.00192614 s/iter 26.023084 +gpu 0 iter : 12 Arret : 0.00191367 s/iter 26.017884 +gpu 0 iter : 13 Arret : 0.0032574 s/iter 26.009004 +gpu 0 iter : 14 Arret : 0.00729301 s/iter 35.180983 +gpu 0 iter : 15 Arret : 0.00245317 s/iter 26.015276 +gpu 0 iter : 16 Arret : 0.00433319 s/iter 
25.893105 +gpu 0 iter : 17 Arret : 0.00843918 s/iter 31.680916 +gpu 0 iter : 18 Arret : 0.00512235 s/iter 31.753281 +gpu 0 iter : 19 Arret : 0.161408 s/iter 28.844658 +gpu 0 iter : 20 Arret : 0.0369396 s/iter 28.748462 +gpu 0 iter : 21 Arret : 0.0443209 s/iter 28.918638 +gpu 0 iter : 22 Arret : 0.00926227 s/iter 28.518098 +gpu 0 iter : 23 Arret : 0.10139 s/iter 28.915161 +gpu 0 iter : 24 Arret : 0.087367 s/iter 28.998391 +gpu 0 iter : 25 Arret : 0.00915331 s/iter 28.869297 +gpu 0 iter : 26 Arret : 0.000166928 s/iter 25.732016 +gpu 0 iter : 27 Arret : 8.36929E-05 s/iter 25.736037 +gpu 0 iter : 28 Arret : 1.72536E-05 s/iter 25.733697 +gpu 0 iter : 29 Arret : 7.0611E-08 s/iter 25.745297 +gpu 0 iter : 30 Arret : 2.0544E-12 s/iter 25.733511 +gpu 0 iter : 31 Arret : 1.57009E-16 s/iter 25.739637 +temps : 846.791 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.46262E-08 +Stabilite : 1.57009E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540352 +i* 0.841439| 1| 4.39978E-13 +i* 6.25043E-13| +| 2| -0.996034 +i* 0.0889731| 1| 2.2073E-13 +i* 1.55296E-13| +| 3| 0.439836 +i* -0.898078| 1|-3.55927E-13 +i*-1.21738E-13| +| 4| 0.38266 +i* -0.923889| 1|-2.56142E-13 +i*-7.02285E-14| +| 5| -0.988496 +i* 0.15125| 1|-1.52652E-13 +i*-1.11329E-13| +| 6| 0.641421 +i* 0.767189| 1|-1.31044E-13 +i* 5.61736E-13| +| 7| 0.323979 +i* -0.946064| 1|-4.52336E-13 +i* 8.74596E-14| +| 8| -0.977067 +i* 0.212932| 1| 8.58341E-14 +i* 1.73412E-13| +| 9| 0.688262 +i* 0.725462| 1| 4.28754E-14 +i* 1.08849E-12| +| 10| 0.264022 +i* -0.964517| 1|-3.63883E-13 +i*-8.14886E-14| +| 11| -0.961793 +i* 0.273776| 1| -3.0213E-13 +i*-2.13897E-13| +| 12| 0.732395 +i* 0.68088| 1|-3.65194E-14 +i* 7.95483E-13| +| 13| 0.203027 +i* -0.979173| 1|-3.14502E-13 +i* 2.96924E-13| +| 14| -0.942735 +i* 0.333543| 1| 1.82947E-13 +i*-4.73458E-14| 
+| 15| 0.773646 +i* 0.633619| 1| 2.24352E-13 +i* 2.79674E-13| +| 16| 0.141232 +i* -0.989977| 1| -1.0035E-13 +i* 1.5693E-13| +| 17| -0.919967 +i* 0.391997| 1| 2.89213E-14 +i*-1.86252E-13| +| 18| 0.811852 +i* 0.583864| 1|-1.59939E-12 +i*-4.13669E-13| +| 19| 0.0788818 +i* -0.996884| 1|-2.83003E-13 +i* 1.04711E-13| +| 20| -0.893578 +i* 0.448908| 1| 4.59736E-14 +i* 1.31414E-13| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 1 +zone limite de 'log-exp' 1.00044 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 3 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 3 dimgrid2 782 start 600000 size 200000 +gpu 2 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 2 dimgrid2 782 start 400000 size 200000 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 782 start 0 size 200000 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 782 start 200000 size 200000 +gpu 0 iter : 1 Arret : 3.03518E-06 s/iter 34.140422 +gpu 0 iter : 2 Arret : 3.08048E-06 s/iter 34.112195 +gpu 0 iter : 3 Arret : 3.01956E-06 s/iter 34.096993 +gpu 0 iter : 4 Arret : 3.09293E-06 s/iter 34.110543 +gpu 0 iter : 5 Arret : 3.08006E-06 s/iter 34.076662 +gpu 0 iter : 6 Arret : 3.01434E-06 s/iter 34.084058 +gpu 0 iter : 7 Arret : 3.18584E-06 s/iter 34.136831 +gpu 0 iter : 8 Arret : 3.3042E-06 s/iter 34.131267 +gpu 0 iter : 9 Arret : 4.06872E-06 s/iter 34.106772 +gpu 0 iter : 10 Arret : 8.81449E-06 s/iter 34.108408 +gpu 0 iter : 11 Arret : 0.000633965 s/iter 34.129789 +gpu 0 iter : 12 Arret : 0.00092939 s/iter 34.108349 +gpu 0 iter : 13 Arret : 2.168 s/iter 34.099124 +gpu 0 iter : 14 Arret : 0.959162 s/iter 39.514454 +gpu 0 iter : 15 Arret : 1.25264 s/iter 39.163345 +gpu 0 iter : 16 Arret : 0.0492202 s/iter 41.068013 +gpu 0 iter : 17 Arret : 0.0215834 s/iter 32.733350 +gpu 0 iter : 18 Arret : 0.0247446 s/iter 37.879052 +gpu 
0 iter : 19 Arret : 0.0179454 s/iter 29.650763 +gpu 0 iter : 20 Arret : 0.0206764 s/iter 29.407317 +gpu 0 iter : 21 Arret : 0.0222049 s/iter 35.012713 +gpu 0 iter : 22 Arret : 0.00255914 s/iter 27.067142 +gpu 0 iter : 23 Arret : 0.000919373 s/iter 25.980531 +gpu 0 iter : 24 Arret : 0.0031468 s/iter 24.573430 +gpu 0 iter : 25 Arret : 0.00100214 s/iter 23.918440 +gpu 0 iter : 26 Arret : 4.12095E-06 s/iter 23.670339 +gpu 0 iter : 27 Arret : 1.25002E-07 s/iter 23.794441 +gpu 0 iter : 28 Arret : 1.03352E-11 s/iter 23.663739 +gpu 0 iter : 29 Arret : 1.57009E-16 s/iter 23.563580 +temps : 925.912 seconde(s) +Nb iterations : 29 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.26383E-08 +Stabilite : 1.11022E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540349 +i* 0.841441| 1|-1.16344E-13 +i* 9.55619E-13| +| 2| 0.592061 +i* 0.805893| 1|-1.57249E-13 +i*-4.43364E-13| +| 3| 0.617051 +i* 0.786923| 1|-6.42805E-13 +i*-3.49094E-13| +| 4| 0.641434 +i* 0.767178| 1| 1.00022E-12 +i*-5.90578E-13| +| 5| 0.665186 +i* 0.746678| 1|-2.53998E-14 +i*-1.14684E-12| +| 6| 0.688283 +i* 0.725442| 1|-8.68732E-13 +i* 8.52696E-13| +| 7| 0.710703 +i* 0.703493| 1| 2.02581E-13 +i* 4.54699E-13| +| 8| 0.732422 +i* 0.680851| 1|-5.22353E-13 +i*-3.99873E-13| +| 9| 0.753421 +i* 0.657538| 1| 1.23356E-13 +i*-1.05986E-12| +| 10| 0.773678 +i* 0.633579| 1|-6.75196E-13 +i* 3.60108E-13| +| 11| 0.793174 +i* 0.608995| 1| 4.43853E-13 +i*-1.42398E-12| +| 12| 0.811888 +i* 0.583813| 1|-4.10491E-13 +i*-4.46651E-13| +| 13| 0.829804 +i* 0.558055| 1| 1.30045E-12 +i* 1.12788E-13| +| 14| 0.846902 +i* 0.531748| 1|-8.09419E-13 +i* 4.98091E-13| +| 15| 0.863167 +i* 0.504918| 1| 2.98522E-13 +i* 3.81547E-13| +| 16| 0.878582 +i* 0.477591| 1|-3.06581E-13 +i*-6.95869E-13| +| 17| 0.893133 +i* 0.449793| 1| 1.24355E-13 +i* -1.3239E-12| +| 18| 0.906804 +i* 0.421553| 
1|-1.23117E-12 +i*-5.57117E-13| +| 19| 0.919582 +i* 0.392898| 1|-1.03648E-12 +i* 2.90445E-14| +| 20| 0.931455 +i* 0.363856| 1|-6.42708E-13 +i*-1.50318E-12| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 1 diff --git a/Simulations/full_openmp/full_openmp_4GPU.sge b/Simulations/full_openmp/full_openmp_4GPU.sge new file mode 100644 index 0000000..4aab3cf --- /dev/null +++ b/Simulations/full_openmp/full_openmp_4GPU.sge @@ -0,0 +1,27 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=4 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -pe openmp 4 +#$ -V +#$ -cwd +#$ -N full_openmp_4GPU + +module load gcc/4.9.0 +module load cuda/7.0 + + +./template -r -i 60000 40000 +./template -r -i 150000 50000 +./template -r -i 250000 150000 +./template -r -i 350000 250000 +./template -r -i 500000 300000 +./template -r -i 600000 400000 +./template -r -i 700000 500000 +./template -r -i 800000 600000 +#./template -r -i 900000 700000 +#./template -r -i 1000000 800000 +#./template -r -i 1500000 500000 + + diff --git a/Simulations/mpi.txt b/Simulations/mpi.txt new file mode 100644 index 0000000..e7156d7 --- /dev/null +++ b/Simulations/mpi.txt @@ -0,0 +1,9 @@ +#degree S1GPU S2GPU S3GPU S4GPU F1GPU F2GPU F3GPU F4GPU +100000 16.1017 8.65634 7.13273 4.60588 24.1491 15.9313 16.3645 13.0123 +200000 63.5651 40.9684 39.5342 21.5922 146.49 78.4263 63.3058 51.6331 +400000 452.145 122.138 81.0542 63.5457 300.171 169.022 122.621 98.5095 +600000 646.009 297.134 193.628 153.471 757.352 457.417 350.829 289.016 +800000 1656.28 746.426 545.367 282.444 1148.46 637.538 410.952 358.278 +1000000 3173.19 812.655 542.745 440.06 2059.61 1055.82 688.615 539.966 +1200000 3906.03 1647.22 1617.65 1762.58 2827.9 1484.54 985.364 871.12 +1400000 3229.79 1991.85 1707.73 1478.01 3326.77 1766.95 1218.9 917.174 \ No newline at end of file diff --git a/Simulations/mpivsomp.txt b/Simulations/mpivsomp.txt new file mode 100644 index 0000000..4de459d --- /dev/null +++ 
b/Simulations/mpivsomp.txt @@ -0,0 +1,5 @@ +#nbGPU SMPI.14 SOMP.14 FMPI.14 FOMP.14 SMPI.8 SOMP.8 FMPI.8 FOMP.8 SMPI.2 SOMP.2 FMPI.2 FOMP.2 +1 3229.79 3523.14 3326.77 3442.42 1656.28 1180.82 1148.46 1194.76 63.5651 70.1186 146.49 151.38 +2 1991.85 2371.12 1766.95 1778.69 746.426 576.437 637.538 628.842 40.9684 35.62 78.4263 82.6744 +3 1707.73 1786.83 1218.9 1191.46 545.367 351.42 410.952 432.911 39.5342 37.8394 63.3058 59.7653 +4 1478.01 1704.89 917.174 925.912 282.444 258.82 358.278 337.034 21.5922 22.9576 51.6331 56.2628 \ No newline at end of file diff --git a/Simulations/openmp.txt b/Simulations/openmp.txt new file mode 100644 index 0000000..14d6a4d --- /dev/null +++ b/Simulations/openmp.txt @@ -0,0 +1,9 @@ +#degree S1GPU S2GPU S3GPU S4GPU F1GPU F2GPU F3GPU F4GPU +100000 16.1926 9.12342 8.00955 5.86914 24.3248 16.8078 17.7034 13.5366 +200000 70.1186 35.62 37.8394 22.9576 151.38 82.6744 59.7653 56.2628 +400000 248.893 122.327 86.1208 68.0633 296.321 161.369 112.147 89.8766 +600000 589.718 297.898 202.419 154.313 833.807 458.792 334.994 279.804 +800000 1180.82 576.437 351.42 258.82 1194.76 628.842 432.911 337.034 +1000000 1621.79 850.208 598.968 422.324 1931.46 1049.55 693.102 525.532 +1200000 4148.3 1631.66 2056.31 1556.58 3017.33 1589.66 1053.03 846.791 +1400000 3523.14 2371.12 1786.83 1704.89 3442.42 1778.69 1191.46 925.912 \ No newline at end of file diff --git a/Simulations/sparse_mpi/sparse_mpi_1GPU.o140032 b/Simulations/sparse_mpi/sparse_mpi_1GPU.o140032 new file mode 100644 index 0000000..42d7416 --- /dev/null +++ b/Simulations/sparse_mpi/sparse_mpi_1GPU.o140032 @@ -0,0 +1,642 @@ +REMAINING: 1 +Taking GPU #3 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^40000 + (-10 +i*0)*x^60000 + (1 +i*0)*x^100000 + +(-4000 +i*0)*x^39999 + (-600000 +i*0)*x^59999 + (100000 +i*0)*x^99999 + +zone limite de 'log-exp' 1.00356 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 0, start 0 size 100096 +proc 0 start 0 size 100096 +iter : 1 Arret : 0.00679606 s/iter 0.774483 +iter : 2 Arret 
: 0.0240773 s/iter 0.852783 +iter : 3 Arret : 0.0190607 s/iter 0.841876 +iter : 4 Arret : 0.00753578 s/iter 0.774557 +iter : 5 Arret : 0.0903866 s/iter 0.774496 +iter : 6 Arret : 0.0766923 s/iter 0.843947 +iter : 7 Arret : 0.0135773 s/iter 0.851241 +iter : 8 Arret : 0.00988122 s/iter 0.846496 +iter : 9 Arret : 0.00740796 s/iter 0.842720 +iter : 10 Arret : 0.00490463 s/iter 0.774748 +iter : 11 Arret : 0.00478656 s/iter 0.774554 +iter : 12 Arret : 0.00116597 s/iter 0.774390 +iter : 13 Arret : 0.000965078 s/iter 0.774238 +iter : 14 Arret : 0.000208722 s/iter 0.774212 +iter : 15 Arret : 0.00022059 s/iter 0.774088 +iter : 16 Arret : 2.47061E-05 s/iter 0.774123 +iter : 17 Arret : 2.20962E-07 s/iter 0.774117 +iter : 18 Arret : 7.04174E-10 s/iter 0.774131 +iter : 19 Arret : 2.22676E-12 s/iter 0.773993 +iter : 20 Arret : 7.50806E-15 s/iter 0.774073 +temps : 16.1017 seconde(s) +Nb iterations : 20 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.61117E-09 +Stabilite : 7.50806E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540308 +i* 0.841422| 0.999962|-1.95866E-12 +i*-4.55465E-13| +| 2| -0.113164 +i* 0.993538| 0.999962|-4.34919E-12 +i* 9.60242E-13| +| 3| -0.226711 +i* -0.973923| 0.999962|-4.27658E-13 +i* 6.01027E-13| +| 4| -0.715763 +i* 0.698289| 0.999962| 9.11271E-13 +i* 2.47219E-12| +| 5| 0.439922 +i* -0.897993| 0.999962|-3.49498E-13 +i* 1.66432E-12| +| 6| -0.996021 +i* 0.0886823| 0.999962| 2.0266E-12 +i*-2.01894E-13| +| 7| 0.908546 +i* -0.417692| 0.999962| 4.78506E-13 +i* 1.54377E-13| +| 8| -0.827813 +i* -0.560935| 0.999962| 9.76996E-13 +i*-2.04309E-12| +| 9| 0.968049 +i* 0.250607| 0.999962|-1.07025E-13 +i*-1.15224E-12| +| 10| -0.286815 +i* -0.957946| 0.999962|-6.55254E-13 +i* 1.20869E-12| +| 11| 0.591653 +i* 0.806145| 0.999962|-9.87654E-13 +i*-3.03635E-12| +| 12| -0.0511836 +i* 0.998651| 
0.999962|-2.22622E-12 +i*-3.69013E-14| +| 13| -0.67097 +i* 0.741432| 0.999962|-8.03801E-14 +i*-1.68204E-12| +| 14| 0.383249 +i* -0.923603| 0.999962|-1.29119E-12 +i*-1.37426E-12| +| 15| -0.988582 +i* 0.150427| 0.999962|-1.54698E-12 +i*-6.48537E-13| +| 16| 0.880824 +i* -0.473363| 0.999962| 1.58029E-12 +i*-2.34379E-12| +| 17| -0.861082 +i* -0.508391| 0.999962| 9.8066E-13 +i* 3.40478E-12| +| 18| 0.981756 +i* 0.189945| 0.999962|-9.84324E-13 +i*-1.03573E-12| +| 19| -0.345809 +i* -0.938264| 0.999962| 1.03906E-12 +i* 1.95398E-12| +| 20| 0.640621 +i* 0.767807| 0.999962|-6.98774E-13 +i* 1.13798E-12| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 0.999962 +40000 racines de module = 1.00006 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^50000 + (-10 +i*0)*x^150000 + (1 +i*0)*x^200000 + +(-5000 +i*0)*x^49999 + (-1.5E+06 +i*0)*x^149999 + (200000 +i*0)*x^199999 + +zone limite de 'log-exp' 1.00178 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 0, start 0 size 200192 +proc 0 start 0 size 200192 +iter : 1 Arret : 0.000149243 s/iter 3.009897 +iter : 2 Arret : 0.000107669 s/iter 3.006186 +iter : 3 Arret : 0.000104952 s/iter 3.008833 +iter : 4 Arret : 0.000608712 s/iter 3.007077 +iter : 5 Arret : 0.00102516 s/iter 3.006467 +iter : 6 Arret : 0.00265088 s/iter 3.006726 +iter : 7 Arret : 0.0373682 s/iter 3.008694 +iter : 8 Arret : 0.0563565 s/iter 3.008459 +iter : 9 Arret : 0.130843 s/iter 3.042271 +iter : 10 Arret : 0.213629 s/iter 3.036578 +iter : 11 Arret : 0.153708 s/iter 3.075704 +iter : 12 Arret : 0.0916516 s/iter 3.036504 +iter : 13 Arret : 0.0619829 s/iter 3.025077 +iter : 14 Arret : 0.0382728 s/iter 3.001649 +iter : 15 Arret : 0.0125846 s/iter 3.026965 +iter : 16 Arret : 0.00175812 s/iter 3.007895 +iter : 17 Arret : 0.000317125 s/iter 3.006004 +iter : 18 Arret : 1.05887E-05 s/iter 3.006536 +iter : 19 Arret : 5.5903E-08 s/iter 3.012414 +iter : 20 Arret : 5.55768E-12 s/iter 3.013007 +iter : 21 Arret : 5.57854E-16 s/iter 3.013024 
+temps : 63.5651 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 9.52377E-08 +Stabilite : 5.57854E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540195 +i* 0.841595| 1.00005|-2.98043E-09 +i*-3.27611E-08| +| 2| -0.837195 +i* 0.546877| 0.999985| 7.09943E-12 +i* 5.1133E-12| +| 3| -0.553418 +i* -0.832885| 0.999985| -1.9722E-12 +i*-7.40397E-12| +| 4| 0.828525 +i* -0.559925| 0.999985|-4.34675E-12 +i* 1.07137E-12| +| 5| -0.819774 +i* 0.572768| 1.00005| 2.53887E-08 +i* 2.42315E-09| +| 6| -0.57917 +i* -0.815188| 0.999985|-5.13034E-12 +i*-1.52645E-12| +| 7| 0.810626 +i* -0.585537| 0.999985|-6.36846E-12 +i*-5.86797E-12| +| 8| 0.591869 +i* 0.806015| 0.999985| 1.73195E-13 +i* 8.72591E-12| +| 9| -0.801379 +i* 0.598131| 0.999985| -1.2701E-12 +i* 3.96189E-12| +| 10| -0.60436 +i* -0.796769| 1.00005|-3.33815E-08 +i* 3.89061E-08| +| 11| 0.791937 +i* -0.610578| 0.999985| 6.0707E-13 +i* 1.52922E-12| +| 12| 0.616763 +i* 0.78713| 0.999985|-4.48042E-12 +i* -2.6295E-12| +| 13| -0.782301 +i* 0.622877| 0.999985|-2.15827E-12 +i*-6.27114E-12| +| 14| -0.628985 +i* -0.777398| 0.999985|-4.05476E-12 +i*-5.17236E-12| +| 15| 0.772548 +i* -0.635029| 1.00005| 1.1634E-09 +i* 1.87351E-08| +| 16| 0.641054 +i* 0.767476| 0.999985|-3.47633E-12 +i* 1.20617E-11| +| 17| -0.762458 +i* 0.647014| 0.999985|-7.74447E-12 +i* 7.566E-12| +| 18| -0.652967 +i* -0.757366| 0.999985| 5.10392E-12 +i*-6.61069E-12| +| 19| 0.752229 +i* -0.658879| 0.999985| 1.34497E-11 +i*-6.49125E-12| +| 20| 0.664729 +i* 0.747146| 1.00005|-1.71597E-08 +i* 8.68463E-09| ++---+----------------------------+------------+----------------------------+ +50000 racines de module = 1.00005 +150000 racines de module = 0.999985 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^150000 + (-10 +i*0)*x^250000 + (1 +i*0)*x^400000 + +(-15000 +i*0)*x^149999 + (-2.5E+06 
+i*0)*x^249999 + (400000 +i*0)*x^399999 + +zone limite de 'log-exp' 1.00089 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 0, start 0 size 400128 +proc 0 start 0 size 400128 +iter : 1 Arret : 0.00730522 s/iter 11.729578 +iter : 2 Arret : 8.77601 s/iter 11.759538 +iter : 3 Arret : 1.00039 s/iter 11.791553 +iter : 4 Arret : 1.66037 s/iter 11.980569 +iter : 5 Arret : 1.60415 s/iter 11.887203 +iter : 6 Arret : 1.09308 s/iter 11.903519 +iter : 7 Arret : 1.03725 s/iter 11.950159 +iter : 8 Arret : 0.785865 s/iter 12.039659 +iter : 9 Arret : 0.676674 s/iter 12.064157 +iter : 10 Arret : 0.653102 s/iter 12.043182 +iter : 11 Arret : 0.61815 s/iter 12.032295 +iter : 12 Arret : 0.572922 s/iter 11.944839 +iter : 13 Arret : 0.514395 s/iter 11.923777 +iter : 14 Arret : 0.460854 s/iter 11.923746 +iter : 15 Arret : 0.546102 s/iter 11.925322 +iter : 16 Arret : 0.44308 s/iter 11.925810 +iter : 17 Arret : 0.411387 s/iter 11.926822 +iter : 18 Arret : 0.391387 s/iter 11.925774 +iter : 19 Arret : 0.377716 s/iter 11.927355 +iter : 20 Arret : 0.368007 s/iter 11.928976 +iter : 21 Arret : 0.476382 s/iter 11.927179 +iter : 22 Arret : 0.434562 s/iter 11.925163 +iter : 23 Arret : 0.42152 s/iter 11.926021 +iter : 24 Arret : 0.423381 s/iter 11.925847 +iter : 25 Arret : 0.433232 s/iter 11.929953 +iter : 26 Arret : 0.401895 s/iter 11.931379 +iter : 27 Arret : 0.411949 s/iter 11.917976 +iter : 28 Arret : 0.186193 s/iter 11.913066 +iter : 29 Arret : 0.106074 s/iter 11.943724 +iter : 30 Arret : 0.0412794 s/iter 11.831994 +iter : 31 Arret : 0.0419846 s/iter 11.810695 +iter : 32 Arret : 0.0167499 s/iter 11.814252 +iter : 33 Arret : 0.00536444 s/iter 11.787890 +iter : 34 Arret : 0.000655097 s/iter 11.754599 +iter : 35 Arret : 3.44296E-07 s/iter 11.747199 +iter : 36 Arret : 7.50023E-10 s/iter 11.751889 +iter : 37 Arret : 1.61565E-12 s/iter 11.752682 +iter : 38 Arret : 3.38203E-15 s/iter 11.747277 +temps : 452.145 seconde(s) +Nb iterations : 38 +Nb de depassements de capacite exponentielle : 0 +Precision 
: 1.49185E-08 +Stabilite : 3.38203E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540313 +i* 0.841453| 0.999991| 9.34197E-12 +i*-1.23633E-11| +| 2| -0.998329 +i* 0.057622| 0.999991| 4.43912E-12 +i* 1.27665E-12| +| 3| 0.439867 +i* -0.898052| 0.999991|-8.50653E-12 +i*-8.85586E-12| +| 4| -0.996033 +i* 0.0888768| 0.999991|-3.15592E-12 +i* 1.17456E-12| +| 5| 0.411533 +i* -0.911385| 0.999991|-2.45048E-12 +i* 4.6238E-12| +| 6| 0.59196 +i* 0.805956| 0.999991| 5.24358E-13 +i*-8.53073E-12| +| 7| -0.992759 +i* 0.120044| 0.999991| 2.58804E-12 +i* 2.47274E-12| +| 8| 0.382796 +i* -0.923823| 0.999991|-1.63092E-11 +i* 4.26312E-12| +| 9| 0.616925 +i* 0.78701| 0.999991| 4.27514E-12 +i*-1.13966E-11| +| 10| -0.98851 +i* 0.151094| 0.999991| 1.67755E-11 +i* 4.06477E-12| +| 11| 0.35366 +i* -0.935364| 0.999991|-1.92664E-11 +i* 1.19958E-11| +| 12| 0.641283 +i* 0.767292| 0.999991| 1.73468E-11 +i*-3.74729E-12| +| 13| -0.983286 +i* 0.18202| 0.999991| 3.21676E-12 +i*-9.48297E-13| +| 14| 0.324176 +i* -0.945987| 0.999991|-5.20695E-12 +i*-7.06984E-12| +| 15| 0.66503 +i* 0.746804| 0.999991| 5.74873E-13 +i* 8.53884E-12| +| 16| -0.977104 +i* 0.212717| 0.999991|-7.47291E-12 +i*-5.77033E-12| +| 17| 0.294374 +i* -0.955681| 0.999991| 1.82907E-11 +i*-2.45448E-12| +| 18| 0.688087 +i* 0.725616| 0.999991|-1.67164E-11 +i*-1.12573E-11| +| 19| -0.969965 +i* 0.243206| 0.999991| 6.88072E-12 +i* 3.20268E-13| +| 20| 0.264283 +i* -0.964436| 0.999991|-6.93356E-12 +i*-6.23118E-12| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 0.999991 +150000 racines de module = 1.00002 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^250000 + (-10 +i*0)*x^350000 + (1 +i*0)*x^600000 + +(-25000 +i*0)*x^249999 + (-3.5E+06 +i*0)*x^349999 + (600000 +i*0)*x^599999 + +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 
+proc 0, start 0 size 600064 +proc 0 start 0 size 600064 +iter : 1 Arret : 0.00438586 s/iter 26.290359 +iter : 2 Arret : 0.424079 s/iter 26.667931 +iter : 3 Arret : 0.949363 s/iter 26.761853 +iter : 4 Arret : 11.5671 s/iter 26.845045 +iter : 5 Arret : 0.975219 s/iter 27.289618 +iter : 6 Arret : 9.61533 s/iter 27.433768 +iter : 7 Arret : 1.85508 s/iter 27.722970 +iter : 8 Arret : 0.857551 s/iter 27.711823 +iter : 9 Arret : 1.17971 s/iter 27.827595 +iter : 10 Arret : 0.452875 s/iter 27.966012 +iter : 11 Arret : 0.892919 s/iter 27.734509 +iter : 12 Arret : 0.512768 s/iter 27.492632 +iter : 13 Arret : 0.378076 s/iter 27.324440 +iter : 14 Arret : 0.0806363 s/iter 26.960487 +iter : 15 Arret : 0.0453167 s/iter 26.499557 +iter : 16 Arret : 0.0240592 s/iter 26.395465 +iter : 17 Arret : 0.0199765 s/iter 26.315790 +iter : 18 Arret : 0.00860028 s/iter 26.347303 +iter : 19 Arret : 0.00210663 s/iter 26.347784 +iter : 20 Arret : 5.04056E-05 s/iter 26.356018 +iter : 21 Arret : 4.72721E-06 s/iter 26.365127 +iter : 22 Arret : 3.9901E-08 s/iter 26.360411 +iter : 23 Arret : 1.57869E-10 s/iter 26.353428 +iter : 24 Arret : 6.28564E-13 s/iter 26.351250 +temps : 646.009 seconde(s) +Nb iterations : 24 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.58777E-07 +Stabilite : 6.28564E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540302 +i* 0.841463| 0.999993| 8.34199E-12 +i* -1.9051E-11| +| 2| -0.553438 +i* -0.832883| 0.999993|-4.48197E-12 +i* 2.11486E-11| +| 3| -0.579282 +i* -0.815119| 0.999993|-1.44751E-12 +i* 7.66798E-12| +| 4| 0.592043 +i* 0.805898| 0.999993|-1.75726E-12 +i*-2.31848E-11| +| 5| -0.604557 +i* -0.796554| 0.999993|-2.82974E-12 +i* 9.99473E-12| +| 6| 0.61698 +i* 0.78697| 0.999993| 9.01823E-12 +i*-5.69156E-12| +| 7| -0.629237 +i* -0.777205| 0.999993|-2.92122E-12 +i*-4.85867E-12| +| 8| 0.641354 +i* 0.767237| 
0.999993| 1.4493E-11 +i* 1.3687E-11| +| 9| -0.653299 +i* -0.757092| 0.999993|-8.22453E-13 +i* 2.82818E-12| +| 10| 0.665096 +i* 0.746749| 0.999993| -1.2145E-11 +i* 1.89129E-11| +| 11| -0.676717 +i* -0.736234| 0.999993|-1.26079E-11 +i*-1.25073E-11| +| 12| 0.688185 +i* 0.725526| 0.999993| 2.69875E-11 +i* 1.65411E-11| +| 13| -0.699509 +i* -0.714614| 0.999993| 1.85989E-11 +i*-4.93269E-12| +| 14| 0.710597 +i* 0.70359| 0.999993| 1.28564E-11 +i* 1.56626E-11| +| 15| -0.721517 +i* -0.69241| 1.00001| 1.76709E-09 +i*-4.04041E-09| +| 16| 0.73231 +i* 0.680962| 0.999993| 1.34706E-11 +i*-4.43489E-12| +| 17| -0.742916 +i* -0.669375| 0.999993| 1.59349E-11 +i* 1.71025E-11| +| 18| 0.753326 +i* 0.657637| 0.999993| 2.26833E-11 +i* 1.58007E-11| +| 19| -0.76354 +i* -0.64575| 0.999993| 2.24043E-11 +i*-1.30496E-12| +| 20| 0.773555 +i* 0.633743| 1.00001| 3.19794E-09 +i*-4.58601E-10| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 0.999993 +250000 racines de module = 1.00001 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^300000 + (-10 +i*0)*x^500000 + (1 +i*0)*x^800000 + +(-30000 +i*0)*x^299999 + (-5E+06 +i*0)*x^499999 + (800000 +i*0)*x^799999 + +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 800000 +proc 0 start 0 size 800000 +iter : 1 Arret : 0.00154846 s/iter 46.736609 +iter : 2 Arret : 0.00623603 s/iter 46.773178 +iter : 3 Arret : 0.0858187 s/iter 46.841571 +iter : 4 Arret : 1.67232 s/iter 47.156772 +iter : 5 Arret : 1.01806 s/iter 47.406800 +iter : 6 Arret : 1.57506 s/iter 47.457844 +iter : 7 Arret : 1.13953 s/iter 47.697558 +iter : 8 Arret : 0.73881 s/iter 48.174119 +iter : 9 Arret : 0.626435 s/iter 48.572632 +iter : 10 Arret : 0.622256 s/iter 48.458622 +iter : 11 Arret : 0.692053 s/iter 48.464982 +iter : 12 Arret : 1.00181 s/iter 48.341828 +iter : 13 Arret : 0.551097 s/iter 48.068502 +iter : 14 Arret : 1.04389 s/iter 47.905646 +iter : 15 Arret : 1.21414 s/iter 47.815372 +iter : 16 Arret 
: 2.39612 s/iter 47.598487 +iter : 17 Arret : 0.78181 s/iter 47.580209 +iter : 18 Arret : 1.57712 s/iter 47.513484 +iter : 19 Arret : 0.980627 s/iter 47.491805 +iter : 20 Arret : 2.61529 s/iter 47.318510 +iter : 21 Arret : 0.836959 s/iter 47.192301 +iter : 22 Arret : 0.6961 s/iter 47.065027 +iter : 23 Arret : 1.08455 s/iter 47.015412 +iter : 24 Arret : 0.186278 s/iter 46.892588 +iter : 25 Arret : 0.155923 s/iter 46.834330 +iter : 26 Arret : 0.090441 s/iter 46.771351 +iter : 27 Arret : 0.093651 s/iter 46.749380 +iter : 28 Arret : 0.0452468 s/iter 46.755619 +iter : 29 Arret : 0.00859257 s/iter 46.764196 +iter : 30 Arret : 0.00968923 s/iter 46.773667 +iter : 31 Arret : 0.00619702 s/iter 46.763704 +iter : 32 Arret : 0.000332677 s/iter 46.713764 +iter : 33 Arret : 1.75349E-07 s/iter 46.747193 +iter : 34 Arret : 4.01254E-10 s/iter 46.753422 +iter : 35 Arret : 8.64369E-13 s/iter 46.729435 +temps : 1656.28 seconde(s) +Nb iterations : 35 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.64697E-07 +Stabilite : 8.64369E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841464| 0.999995|-5.33817E-12 +i*-1.81878E-11| +| 2| 0.592014 +i* 0.805922| 0.999995|-1.82734E-11 +i* 2.10218E-11| +| 3| 0.617007 +i* 0.786952| 0.999995| 4.23442E-11 +i* -6.2147E-12| +| 4| 0.641392 +i* 0.767207| 0.999995|-4.99742E-11 +i* 1.43873E-11| +| 5| 0.665146 +i* 0.746707| 0.999995| 2.02977E-11 +i* 7.48579E-12| +| 6| 0.688245 +i* 0.725472| 0.999995|-1.73153E-11 +i* -1.2656E-11| +| 7| 0.710667 +i* 0.703522| 0.999995| 3.69782E-12 +i* 2.3081E-12| +| 8| 0.732388 +i* 0.68088| 0.999995| 9.45355E-12 +i* 2.09024E-11| +| 9| 0.753381 +i* 0.657577| 0.999995| 3.40094E-11 +i* 1.45989E-12| +| 10| 0.77364 +i* 0.633618| 0.999995|-1.72307E-11 +i* 1.22723E-11| +| 11| 0.793138 +i* 0.609034| 0.999995| 3.89222E-12 +i* 2.21356E-11| +| 12| 0.811855 +i* 
0.583851| 0.999995|-1.28337E-11 +i*-5.47207E-12| +| 13| 0.829772 +i* 0.558094| 0.999995|-1.63114E-11 +i*-1.64246E-12| +| 14| 0.846873 +i* 0.531786| 0.999995|-3.30451E-11 +i*-8.10676E-12| +| 15| 0.86314 +i* 0.504956| 0.999995|-4.00413E-12 +i* 3.04823E-11| +| 16| 0.878557 +i* 0.477628| 0.999995|-2.16493E-12 +i* 1.10533E-11| +| 17| 0.893104 +i* 0.449841| 0.999995|-1.48552E-11 +i* 1.06063E-11| +| 18| 0.906777 +i* 0.4216| 0.999995|-1.38745E-11 +i* 5.33384E-12| +| 19| 0.919557 +i* 0.392944| 0.999995| 4.13796E-11 +i*-2.48189E-11| +| 20| 0.931433 +i* 0.363901| 0.999995| 4.93219E-11 +i*-2.82651E-11| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 0.999995 +300000 racines de module = 1.00001 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^400000 + (-10 +i*0)*x^600000 + (1 +i*0)*x^1000000 + +(-40000 +i*0)*x^399999 + (-6E+06 +i*0)*x^599999 + (1E+06 +i*0)*x^999999 + +zone limite de 'log-exp' 1.00035 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 0, start 0 size 1000192 +proc 0 start 0 size 1000192 +iter : 1 Arret : 0.00156919 s/iter 72.939595 +iter : 2 Arret : 1.90389 s/iter 73.046565 +iter : 3 Arret : 0.502696 s/iter 73.071131 +iter : 4 Arret : 1.00039 s/iter 73.810096 +iter : 5 Arret : 1.69451 s/iter 73.906653 +iter : 6 Arret : 1.26606 s/iter 73.980438 +iter : 7 Arret : 0.651915 s/iter 74.703433 +iter : 8 Arret : 0.531762 s/iter 74.806612 +iter : 9 Arret : 0.502687 s/iter 74.773948 +iter : 10 Arret : 0.48618 s/iter 74.532337 +iter : 11 Arret : 0.444215 s/iter 74.279878 +iter : 12 Arret : 0.427439 s/iter 74.140663 +iter : 13 Arret : 0.41232 s/iter 74.008804 +iter : 14 Arret : 0.406535 s/iter 74.075135 +iter : 15 Arret : 0.401671 s/iter 74.022094 +iter : 16 Arret : 0.398196 s/iter 74.055174 +iter : 17 Arret : 0.395555 s/iter 73.932752 +iter : 18 Arret : 0.394204 s/iter 74.040270 +iter : 19 Arret : 0.39412 s/iter 73.999365 +iter : 20 Arret : 0.395512 s/iter 74.042163 +iter : 21 Arret : 0.398528 s/iter 73.913334 +iter : 22 Arret 
: 0.404063 s/iter 74.043199 +iter : 23 Arret : 0.413614 s/iter 74.018474 +iter : 24 Arret : 0.430817 s/iter 73.977216 +iter : 25 Arret : 0.464104 s/iter 73.990264 +iter : 26 Arret : 0.534702 s/iter 73.999109 +iter : 27 Arret : 0.777706 s/iter 73.922712 +iter : 28 Arret : 0.780386 s/iter 73.805326 +iter : 29 Arret : 0.391957 s/iter 73.593419 +iter : 30 Arret : 0.489974 s/iter 73.269694 +iter : 31 Arret : 0.327545 s/iter 73.343344 +iter : 32 Arret : 0.110619 s/iter 73.177304 +iter : 33 Arret : 0.19712 s/iter 73.089524 +iter : 34 Arret : 0.288284 s/iter 73.082763 +iter : 35 Arret : 0.0226925 s/iter 73.058524 +iter : 36 Arret : 0.00572618 s/iter 73.055652 +iter : 37 Arret : 0.00398682 s/iter 72.948081 +iter : 38 Arret : 0.000421174 s/iter 72.910444 +iter : 39 Arret : 5.0226E-07 s/iter 72.907146 +iter : 40 Arret : 7.2296E-09 s/iter 72.950438 +iter : 41 Arret : 1.02029E-10 s/iter 72.929637 +iter : 42 Arret : 1.43894E-12 s/iter 72.923863 +iter : 43 Arret : 2.03366E-14 s/iter 72.908337 +temps : 3173.19 seconde(s) +Nb iterations : 43 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.65132E-08 +Stabilite : 2.03366E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841468| 0.999996| 5.07216E-12 +i* 6.41236E-12| +| 2| 0.52971 +i* 0.848174| 0.999996|-2.56639E-12 +i*-3.27674E-11| +| 3| 0.524361 +i* 0.851491| 0.999996|-2.47296E-11 +i* 1.78327E-11| +| 4| 0.51901 +i* 0.854764| 0.999996| 9.45599E-12 +i* 2.07434E-11| +| 5| 0.513629 +i* 0.858008| 0.999996| 2.32483E-11 +i* 6.70747E-12| +| 6| 0.508237 +i* 0.861213| 0.999996|-1.34339E-11 +i* 9.87854E-12| +| 7| 0.502834 +i* 0.864379| 0.999996|-2.85585E-11 +i* 6.91519E-12| +| 8| 0.497384 +i* 0.867526| 0.999996| 2.97429E-11 +i*-6.06626E-13| +| 9| 0.491932 +i* 0.870629| 0.999996|-1.74121E-11 +i*-2.86359E-11| +| 10| 0.486452 +i* 0.873703| 0.999996| 3.0312E-11 +i* 
1.02214E-11| +| 11| 0.480962 +i* 0.876737| 0.999996| 1.81546E-11 +i* 8.04012E-12| +| 12| 0.475463 +i* 0.879732| 0.999996|-5.09415E-12 +i*-3.20905E-11| +| 13| 0.469917 +i* 0.882706| 0.999996|-1.29106E-11 +i*-2.31489E-11| +| 14| 0.46437 +i* 0.885637| 0.999996| 1.38481E-11 +i* -1.517E-11| +| 15| 0.458797 +i* 0.888537| 0.999996| 2.78862E-11 +i* 1.10441E-11| +| 16| 0.453214 +i* 0.891397| 0.999996| 2.45506E-11 +i* 3.1726E-11| +| 17| 0.447623 +i* 0.894218| 0.999996| -2.5447E-11 +i*-4.61239E-11| +| 18| 0.441986 +i* 0.897017| 0.999996| 2.72476E-11 +i* 3.22485E-11| +| 19| 0.436351 +i* 0.899772| 0.999996|-3.70284E-11 +i*-5.06729E-12| +| 20| 0.430689 +i* 0.902496| 0.999996|-1.25435E-11 +i* 3.86925E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 0.999996 +400000 racines de module = 1.00001 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^700000 + (1 +i*0)*x^1200000 + +(-50000 +i*0)*x^499999 + (-7E+06 +i*0)*x^699999 + (1.2E+06 +i*0)*x^1199999 + +zone limite de 'log-exp' 1.0003 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 0, start 0 size 1200128 +proc 0 start 0 size 1200128 +iter : 1 Arret : 0.00677598 s/iter 104.842623 +iter : 2 Arret : 1.43332 s/iter 108.451498 +iter : 3 Arret : 0.428119 s/iter 109.604920 +iter : 4 Arret : 0.429249 s/iter 111.528327 +iter : 5 Arret : 1.08646 s/iter 112.126605 +iter : 6 Arret : 4.298 s/iter 112.878995 +iter : 7 Arret : 1.29187 s/iter 114.015483 +iter : 8 Arret : 4.5768 s/iter 114.431935 +iter : 9 Arret : 0.867548 s/iter 114.405770 +iter : 10 Arret : 1.11265 s/iter 113.890021 +iter : 11 Arret : 0.535846 s/iter 113.718788 +iter : 12 Arret : 0.531876 s/iter 112.691524 +iter : 13 Arret : 2.32463 s/iter 111.476924 +iter : 14 Arret : 0.834993 s/iter 110.712739 +iter : 15 Arret : 1.67285 s/iter 110.494250 +iter : 16 Arret : 1.01044 s/iter 109.494899 +iter : 17 Arret : 0.807065 s/iter 109.193175 +iter : 18 Arret : 0.909238 s/iter 108.712803 +iter : 19 Arret : 1.14066 s/iter 
108.492397 +iter : 20 Arret : 0.335581 s/iter 107.960425 +iter : 21 Arret : 0.196963 s/iter 107.373274 +iter : 22 Arret : 0.128663 s/iter 106.913981 +iter : 23 Arret : 0.275217 s/iter 106.284145 +iter : 24 Arret : 0.179897 s/iter 106.054702 +iter : 25 Arret : 0.420437 s/iter 105.799691 +iter : 26 Arret : 0.358355 s/iter 105.198589 +iter : 27 Arret : 0.11514 s/iter 105.120453 +iter : 28 Arret : 0.217484 s/iter 104.911034 +iter : 29 Arret : 0.207195 s/iter 104.903818 +iter : 30 Arret : 0.037319 s/iter 104.938544 +iter : 31 Arret : 0.0122038 s/iter 104.836750 +iter : 32 Arret : 0.000983648 s/iter 104.776137 +iter : 33 Arret : 4.35825E-07 s/iter 104.872755 +iter : 34 Arret : 1.94444E-09 s/iter 104.822262 +iter : 35 Arret : 1.37935E-11 s/iter 104.776349 +iter : 36 Arret : 1.88726E-13 s/iter 104.825146 +temps : 3906.03 seconde(s) +Nb iterations : 36 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.78618E-08 +Stabilite : 1.88726E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540312 +i* 0.841461| 0.999997|-2.16913E-11 +i* 1.91294E-11| +| 2| 0.513645 +i* 0.857999| 0.999997|-6.29718E-12 +i*-2.39364E-12| +| 3| 0.486457 +i* 0.873701| 0.999997| 1.53235E-11 +i* 6.36435E-13| +| 4| 0.458805 +i* 0.888533| 0.999997| 1.78773E-11 +i* 1.55684E-11| +| 5| 0.430685 +i* 0.902499| 0.999997| 2.12053E-13 +i*-1.16324E-11| +| 6| 0.402126 +i* 0.915589| 1| 2.50282E-09 +i*-6.10471E-09| +| 7| 0.3732 +i* 0.927747| 0.999997| -2.5707E-11 +i* 3.11093E-13| +| 8| 0.3439 +i* 0.939003| 0.999997|-1.12714E-11 +i* 1.5453E-11| +| 9| 0.314261 +i* 0.949333| 0.999997| 1.93628E-11 +i* 2.50909E-11| +| 10| 0.284313 +i* 0.958728| 0.999997| 2.69426E-11 +i* 2.77974E-11| +| 11| 0.254084 +i* 0.967179| 0.999997| 1.5277E-11 +i* 4.73027E-12| +| 12| 0.223614 +i* 0.974674| 0.999997| 7.05391E-12 +i* 1.2797E-11| +| 13| 0.192915 +i* 0.981212| 0.999997| 1.07495E-11 
+i* 5.766E-12| +| 14| 0.162052 +i* 0.986779| 0.999997|-2.06171E-11 +i* 5.16515E-12| +| 15| 0.130977 +i* 0.991382| 0.999997| 5.89659E-11 +i* 7.29122E-12| +| 16| 0.0998077 +i* 0.995003| 0.999997|-3.45761E-11 +i*-1.61701E-11| +| 17| 0.0685225 +i* 0.997646| 0.999997| 2.33641E-11 +i* 2.51787E-12| +| 18| 0.0371504 +i* 0.999314| 1|-3.18728E-10 +i*-2.97119E-09| +| 19| 0.00578048 +i* 0.99998| 0.999997| 3.46787E-11 +i* 1.94857E-13| +| 20| -0.0256056 +i* 0.999669| 0.999997| 2.04742E-11 +i* 1.15624E-12| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 0.999997 +500000 racines de module = 1 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^600000 + (-10 +i*0)*x^800000 + (1 +i*0)*x^1400000 + +(-60000 +i*0)*x^599999 + (-8E+06 +i*0)*x^799999 + (1.4E+06 +i*0)*x^1399999 + +zone limite de 'log-exp' 1.00025 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 0, start 0 size 1400064 +proc 0 start 0 size 1400064 +iter : 1 Arret : 0.00938725 s/iter 142.328326 +iter : 2 Arret : 0.761578 s/iter 147.052418 +iter : 3 Arret : 1.35081 s/iter 149.289333 +iter : 4 Arret : 0.488828 s/iter 151.454940 +iter : 5 Arret : 0.352825 s/iter 152.322211 +iter : 6 Arret : 0.142284 s/iter 153.010051 +iter : 7 Arret : 0.0560259 s/iter 152.431968 +iter : 8 Arret : 0.196308 s/iter 152.003440 +iter : 9 Arret : 0.124897 s/iter 151.872606 +iter : 10 Arret : 0.0975323 s/iter 151.560877 +iter : 11 Arret : 0.147128 s/iter 149.300671 +iter : 12 Arret : 0.109558 s/iter 147.230298 +iter : 13 Arret : 0.0563761 s/iter 144.834459 +iter : 14 Arret : 0.0352169 s/iter 143.795377 +iter : 15 Arret : 0.0177334 s/iter 143.112879 +iter : 16 Arret : 0.0155926 s/iter 142.695503 +iter : 17 Arret : 0.00246736 s/iter 142.533975 +iter : 18 Arret : 9.78659E-05 s/iter 142.374961 +iter : 19 Arret : 5.69989E-07 s/iter 142.290712 +iter : 20 Arret : 3.43839E-09 s/iter 142.588568 +iter : 21 Arret : 1.59577E-11 s/iter 142.684647 +iter : 22 Arret : 7.40742E-14 s/iter 142.549602 +temps : 3229.79 
seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.95958E-08 +Stabilite : 7.40742E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841469| 0.999997|-5.74141E-12 +i*-6.39521E-11| +| 2| 0.513623 +i* 0.858013| 0.999997|-2.15776E-11 +i*-2.98557E-11| +| 3| -0.52703 +i* -0.849843| 0.999997|-6.50922E-11 +i* 8.44216E-12| +| 4| 0.486439 +i* 0.873711| 0.999997| 5.60277E-11 +i* 4.36779E-11| +| 5| -0.500096 +i* -0.865967| 0.999997| 3.56147E-11 +i*-3.12713E-11| +| 6| 0.458776 +i* 0.888549| 0.999997|-1.89702E-11 +i* 4.08274E-12| +| 7| -0.472669 +i* -0.881237| 0.999997|-1.66496E-11 +i*-3.61498E-11| +| 8| 0.430661 +i* 0.902511| 0.999997|-1.60558E-11 +i*-1.29949E-11| +| 9| -0.444791 +i* -0.895631| 0.999997|-8.89955E-13 +i* 2.61938E-12| +| 10| 0.402136 +i* 0.915577| 0.999997| 6.5834E-12 +i* -1.3935E-11| +| 11| -0.416439 +i* -0.90916| 0.999997|-1.66807E-11 +i* 2.56219E-11| +| 12| 0.373179 +i* 0.927756| 0.999997|-7.07252E-11 +i*-5.29587E-11| +| 13| -0.387698 +i* -0.921783| 0.999997|-1.86324E-11 +i* -4.6545E-11| +| 14| 0.343875 +i* 0.939012| 0.999997| 3.84962E-11 +i* 2.59646E-11| +| 15| -0.358575 +i* -0.933498| 0.999997|-3.74776E-11 +i*-3.89954E-11| +| 16| 0.314233 +i* 0.949343| 0.999997| 3.86503E-11 +i* 2.08775E-11| +| 17| -0.329098 +i* -0.944293| 0.999997|-1.57903E-11 +i* 2.05052E-11| +| 18| 0.284281 +i* 0.958738| 0.999997| 2.51592E-11 +i* 2.09243E-11| +| 19| -0.299297 +i* -0.954157| 0.999997| 5.03608E-12 +i* 1.70503E-11| +| 20| 0.254048 +i* 0.967189| 0.999997|-2.81228E-11 +i*-1.66302E-11| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 0.999997 +600000 racines de module = 1 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^700000 + (-10 +i*0)*x^900000 + (1 +i*0)*x^1600000 + +(-70000 +i*0)*x^699999 + (-9E+06 +i*0)*x^899999 + (1.6E+06 
+i*0)*x^1599999 + + +template:823 terminated with signal 11 at PC=404ae1 SP=7fff080bdf50. Backtrace: +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 0 with PID 823 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^800000 + (-10 +i*0)*x^1000000 + (1 +i*0)*x^1800000 + +(-80000 +i*0)*x^799999 + (-1E+07 +i*0)*x^999999 + (1.8E+06 +i*0)*x^1799999 + + +template:827 terminated with signal 11 at PC=404ae1 SP=7fffb55d2a00. Backtrace: +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 0 with PID 827 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. 
this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^1500000 + (1 +i*0)*x^2000000 + +(-50000 +i*0)*x^499999 + (-1.5E+07 +i*0)*x^1499999 + (2E+06 +i*0)*x^1999999 + + +template:831 terminated with signal 11 at PC=404ae1 SP=7fff64363320. Backtrace: +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 0 with PID 831 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). 
+-------------------------------------------------------------------------- diff --git a/Simulations/sparse_mpi/sparse_mpi_1GPU.sge b/Simulations/sparse_mpi/sparse_mpi_1GPU.sge new file mode 100644 index 0000000..8661da2 --- /dev/null +++ b/Simulations/sparse_mpi/sparse_mpi_1GPU.sge @@ -0,0 +1,25 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=1 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -V +#$ -cwd +#$ -N sparse_mpi_1GPU +#$ -pe mpi 1 + + +module load cuda/7.0 +module load ompi/gcc + +mpirun -np $NSLOTS ./template -r -i 60000 40000 +mpirun -np $NSLOTS ./template -r -i 150000 50000 +mpirun -np $NSLOTS ./template -r -i 250000 150000 +mpirun -np $NSLOTS ./template -r -i 350000 250000 +mpirun -np $NSLOTS ./template -r -i 500000 300000 +mpirun -np $NSLOTS ./template -r -i 600000 400000 +mpirun -np $NSLOTS ./template -r -i 700000 500000 +mpirun -np $NSLOTS ./template -r -i 800000 600000 +mpirun -np $NSLOTS ./template -r -i 900000 700000 +mpirun -np $NSLOTS ./template -r -i 1000000 800000 +mpirun -np $NSLOTS ./template -r -i 1500000 500000 diff --git a/Simulations/sparse_mpi/sparse_mpi_2GPU.o140031 b/Simulations/sparse_mpi/sparse_mpi_2GPU.o140031 new file mode 100644 index 0000000..15b43d7 --- /dev/null +++ b/Simulations/sparse_mpi/sparse_mpi_2GPU.o140031 @@ -0,0 +1,662 @@ +REMAINING: 2 +Taking GPU #0 +Taking GPU #1 +proc 0 +proc 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^40000 + (-10 +i*0)*x^60000 + (1 +i*0)*x^100000 + +(-4000 +i*0)*x^39999 + (-600000 +i*0)*x^59999 + (100000 +i*0)*x^99999 + +zone limite de 'log-exp' 1.00356 +zone limite de 'log-exp' 1.00356 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 1, start 50048 size 50048 +proc 1 start 50048 size 50048 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 0, start 0 size 50048 +proc 0 start 0 size 50048 +iter : 1 Arret : 0.00512448 s/iter 0.442006 +iter : 2 Arret : 0.00518524 s/iter 0.441749 +iter : 3 Arret : 0.0136123 s/iter 0.441743 +iter : 4 Arret : 0.0172088 s/iter 0.520551 +iter : 5 Arret : 0.0127637 s/iter 0.441752 
+iter : 6 Arret : 0.00575024 s/iter 0.441718 +iter : 7 Arret : 0.00480045 s/iter 0.441722 +iter : 8 Arret : 0.0058672 s/iter 0.441765 +iter : 9 Arret : 0.00681665 s/iter 0.439578 +iter : 10 Arret : 0.00633876 s/iter 0.441755 +iter : 11 Arret : 0.0024546 s/iter 0.441765 +iter : 12 Arret : 0.00167883 s/iter 0.441695 +iter : 13 Arret : 0.000524245 s/iter 0.441627 +iter : 14 Arret : 0.000135332 s/iter 0.441622 +iter : 15 Arret : 4.9518E-06 s/iter 0.441652 +iter : 16 Arret : 7.49618E-08 s/iter 0.441569 +iter : 17 Arret : 1.11657E-09 s/iter 0.441553 +iter : 18 Arret : 1.66345E-11 s/iter 0.441549 +iter : 19 Arret : 2.47882E-13 s/iter 0.441578 +temps : 8.65634 seconde(s) +Nb iterations : 19 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.43376E-08 +Stabilite : 3.20054E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54036 +i* 0.841503| 1.00006|-5.00602E-11 +i* 9.0853E-12| +| 2| -0.113164 +i* 0.993538| 0.999962|-4.34919E-12 +i* 9.60242E-13| +| 3| -0.226732 +i* -0.974016| 1.00006|-1.34468E-09 +i*-3.70749E-10| +| 4| -0.715763 +i* 0.698289| 0.999962| 9.11271E-13 +i* 2.47219E-12| +| 5| 0.439922 +i* -0.897993| 0.999962|-3.49498E-13 +i* 1.66432E-12| +| 6| -0.996122 +i* 0.0886386| 1.00006| 4.72785E-10 +i* 4.13616E-11| +| 7| 0.908546 +i* -0.417692| 0.999962| 2.07334E-12 +i* 2.33003E-12| +| 8| -0.827813 +i* -0.560935| 0.999962| 9.76996E-13 +i*-2.04309E-12| +| 9| 0.968129 +i* 0.250682| 1.00006| 1.35693E-10 +i*-3.47657E-10| +| 10| -0.286842 +i* -0.958038| 1.00006|-5.93554E-10 +i*-2.45345E-10| +| 11| 0.591653 +i* 0.806145| 0.999962|-9.87654E-13 +i*-3.03635E-12| +| 12| -0.0511836 +i* 0.998651| 0.999962|-2.22622E-12 +i*-3.69013E-14| +| 13| -0.67097 +i* 0.741432| 0.999962|-8.03801E-14 +i*-1.68204E-12| +| 14| 0.383249 +i* -0.923603| 0.999962|-1.29119E-12 +i*-1.37426E-12| +| 15| -0.988685 +i* 0.15039| 1.00006|-1.61051E-10 +i* 
7.18515E-11| +| 16| 0.880824 +i* -0.473363| 0.999962| 1.58029E-12 +i*-2.34379E-12| +| 17| -0.861082 +i* -0.508391| 0.999962| 9.8066E-13 +i* 3.40478E-12| +| 18| 0.98184 +i* 0.190015| 1.00006| 8.88373E-10 +i*-2.66385E-10| +| 19| -0.345842 +i* -0.938354| 1.00006| 1.38421E-10 +i*-2.31696E-10| +| 20| 0.640621 +i* 0.767807| 0.999962|-6.98774E-13 +i* 1.13798E-12| ++---+----------------------------+------------+----------------------------+ +40000 racines de module = 1.00006 +60000 racines de module = 0.999962 +proc 1 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^50000 + (-10 +i*0)*x^150000 + (1 +i*0)*x^200000 + +(-5000 +i*0)*x^49999 + (-1.5E+06 +i*0)*x^149999 + (200000 +i*0)*x^199999 + +zone limite de 'log-exp' 1.00178 +zone limite de 'log-exp' 1.00178 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 1, start 100096 size 100096 +proc 1 start 100096 size 100096 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 0, start 0 size 100096 +proc 0 start 0 size 100096 +iter : 1 Arret : 0.000100591 s/iter 1.548764 +iter : 2 Arret : 9.98047E-05 s/iter 1.548592 +iter : 3 Arret : 0.000401454 s/iter 1.548606 +iter : 4 Arret : 0.000612146 s/iter 1.548661 +iter : 5 Arret : 0.00261257 s/iter 1.548859 +iter : 6 Arret : 0.00389809 s/iter 1.707848 +iter : 7 Arret : 0.108958 s/iter 1.548567 +iter : 8 Arret : 0.0989986 s/iter 1.548572 +iter : 9 Arret : 0.159452 s/iter 1.549964 +iter : 10 Arret : 0.284956 s/iter 1.552722 +iter : 11 Arret : 0.805953 s/iter 1.552547 +iter : 12 Arret : 0.51544 s/iter 1.711577 +iter : 13 Arret : 0.544938 s/iter 1.707829 +iter : 14 Arret : 0.643974 s/iter 1.548388 +iter : 15 Arret : 1.69207 s/iter 1.548432 +iter : 16 Arret : 0.924273 s/iter 1.548552 +iter : 17 Arret : 0.444862 s/iter 1.548574 +iter : 18 Arret : 4.9242 s/iter 1.549903 +iter : 19 Arret : 0.716282 s/iter 1.548377 +iter : 20 Arret : 0.40305 s/iter 1.548788 +iter : 21 Arret : 0.294354 s/iter 1.548624 +iter : 22 Arret : 0.0209093 s/iter 1.548518 +iter : 23 Arret : 0.00144046 s/iter 1.548527 +iter : 24 Arret : 
0.000306925 s/iter 1.548770 +iter : 25 Arret : 3.17447E-10 s/iter 1.548617 +iter : 26 Arret : 3.17541E-14 s/iter 1.548825 +temps : 40.9684 seconde(s) +Nb iterations : 26 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.58606E-05 +Stabilite : 6.47336E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540303 +i* 0.841453| 0.999985| 1.08703E-11 +i*-2.49217E-12| +| 2| -0.837195 +i* 0.546877| 0.999985| -5.4492E-12 +i* 1.09163E-12| +| 3| -0.553418 +i* -0.832885| 0.999985| -1.9722E-12 +i*-7.40397E-12| +| 4| 0.828599 +i* -0.559925| 1.00005|-7.54521E-09 +i* 1.47059E-08| +| 5| -0.8197 +i* 0.572767| 0.999985|-4.21663E-13 +i* -2.8616E-12| +| 6| -0.57917 +i* -0.815188| 0.999985|-5.13034E-12 +i*-1.52645E-12| +| 7| 0.810626 +i* -0.585537| 0.999985|-6.36846E-12 +i*-5.86797E-12| +| 8| 0.591872 +i* 0.806089| 1.00005|-1.69803E-09 +i* 9.43795E-09| +| 9| -0.801454 +i* 0.598134| 1.00005|-3.72767E-08 +i*-1.30274E-08| +| 10| -0.604356 +i* -0.796695| 0.999985|-1.64091E-13 +i* 1.59084E-12| +| 11| 0.791937 +i* -0.610578| 0.999985| 6.0707E-13 +i* 1.52922E-12| +| 12| 0.616763 +i* 0.78713| 0.999985|-4.48042E-12 +i* -2.6295E-12| +| 13| -0.782301 +i* 0.622877| 0.999985|-2.15827E-12 +i*-6.27114E-12| +| 14| -0.628991 +i* -0.777472| 1.00005| 6.93065E-09 +i*-8.65443E-09| +| 15| 0.772474 +i* -0.635023| 0.999985| 1.54783E-11 +i*-1.81338E-12| +| 16| 0.641054 +i* 0.767476| 0.999985| 9.05009E-12 +i*-2.91295E-12| +| 17| -0.762458 +i* 0.647014| 0.999985| 5.81724E-12 +i*-9.99384E-12| +| 18| -0.652967 +i* -0.757366| 0.999985|-6.31406E-12 +i* 8.49495E-12| +| 19| 0.752302 +i* -0.658888| 1.00005| 3.99107E-09 +i* 1.02117E-08| +| 20| 0.66472 +i* 0.747072| 0.999985|-1.93379E-12 +i*-1.29726E-11| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 0.999985 +50000 racines de module = 1.00005 +proc 0 +proc 
1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^150000 + (-10 +i*0)*x^250000 + (1 +i*0)*x^400000 + +(-15000 +i*0)*x^149999 + (-2.5E+06 +i*0)*x^249999 + (400000 +i*0)*x^399999 + +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 0, start 0 size 200064 +proc 0 start 0 size 200064 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 1, start 200064 size 200064 +proc 1 start 200064 size 200064 +iter : 1 Arret : 0.000550449 s/iter 6.082917 +iter : 2 Arret : 0.00291862 s/iter 6.079734 +iter : 3 Arret : 0.00675438 s/iter 6.082746 +iter : 4 Arret : 0.00891928 s/iter 6.157166 +iter : 5 Arret : 0.0118747 s/iter 6.150345 +iter : 6 Arret : 0.0109883 s/iter 6.091520 +iter : 7 Arret : 0.00656673 s/iter 6.112417 +iter : 8 Arret : 0.00575864 s/iter 6.085608 +iter : 9 Arret : 0.00288805 s/iter 6.150350 +iter : 10 Arret : 0.00168944 s/iter 6.083333 +iter : 11 Arret : 0.00101594 s/iter 6.079295 +iter : 12 Arret : 0.000961205 s/iter 6.079555 +iter : 13 Arret : 0.000805832 s/iter 6.078713 +iter : 14 Arret : 0.00034457 s/iter 6.079666 +iter : 15 Arret : 0.000125967 s/iter 6.080354 +iter : 16 Arret : 2.22934E-05 s/iter 6.079409 +iter : 17 Arret : 5.34301E-06 s/iter 6.079653 +iter : 18 Arret : 3.49738E-08 s/iter 6.081697 +iter : 19 Arret : 7.48893E-11 s/iter 6.080662 +iter : 20 Arret : 1.61404E-13 s/iter 6.081309 +temps : 122.138 seconde(s) +Nb iterations : 20 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.09706E-08 +Stabilite : 1.61404E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.84144| 0.999991| 6.97609E-12 +i* 5.61207E-12| +| 2| -0.998329 +i* 0.057622| 0.999991| 4.43912E-12 +i* 1.27665E-12| +| 3| 0.43989 +i* -0.898041| 0.999991|-2.08855E-12 +i*-1.75276E-12| +| 4| -0.996033 +i* 0.0888768| 0.999991|-3.15592E-12 +i* 1.17456E-12| +| 5| 0.411533 +i* -0.911385| 
0.999991|-2.45048E-12 +i* 4.6238E-12| +| 6| 0.59196 +i* 0.805956| 0.999991| 5.24358E-13 +i*-8.53073E-12| +| 7| -0.992759 +i* 0.120044| 0.999991| 2.58804E-12 +i* 2.47274E-12| +| 8| 0.382796 +i* -0.923823| 0.999991|-1.63092E-11 +i* 4.26312E-12| +| 9| 0.616925 +i* 0.78701| 0.999991| 4.27514E-12 +i*-1.13966E-11| +| 10| -0.98851 +i* 0.151094| 0.999991|-1.29017E-11 +i*-4.43427E-12| +| 11| 0.35366 +i* -0.935364| 0.999991|-1.92664E-11 +i* 1.19958E-11| +| 12| 0.641283 +i* 0.767292| 0.999991|-4.70735E-12 +i* -1.4127E-11| +| 13| -0.98329 +i* 0.181995| 0.999991|-6.62759E-12 +i*-5.46796E-12| +| 14| 0.324176 +i* -0.945987| 0.999991|-5.20695E-12 +i*-7.06984E-12| +| 15| 0.665012 +i* 0.746821| 0.999991| 5.27178E-12 +i*-4.27913E-12| +| 16| -0.977104 +i* 0.212717| 0.999991|-1.01148E-11 +i* 2.41479E-12| +| 17| 0.294374 +i* -0.955681| 0.999991|-2.37395E-11 +i*-2.53098E-12| +| 18| 0.688087 +i* 0.725616| 0.999991| 6.67011E-12 +i* 1.57173E-11| +| 19| -0.969965 +i* 0.243206| 0.999991| 6.88072E-12 +i* 3.20268E-13| +| 20| 0.264283 +i* -0.964436| 0.999991|-6.93356E-12 +i*-6.23118E-12| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 0.999991 +150000 racines de module = 1.00002 +proc 1 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^250000 + (-10 +i*0)*x^350000 + (1 +i*0)*x^600000 + +(-25000 +i*0)*x^249999 + (-3.5E+06 +i*0)*x^349999 + (600000 +i*0)*x^599999 + +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 1, start 300032 size 300032 +proc 1 start 300032 size 300032 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 300032 +proc 0 start 0 size 300032 +iter : 1 Arret : 0.00169532 s/iter 13.268293 +iter : 2 Arret : 0.00577451 s/iter 13.754899 +iter : 3 Arret : 0.00560656 s/iter 13.317734 +iter : 4 Arret : 0.026637 s/iter 13.287596 +iter : 5 Arret : 0.0224878 s/iter 13.756785 +iter : 6 Arret : 0.0273249 s/iter 14.009301 +iter : 7 Arret : 0.0242205 s/iter 13.722890 
+iter : 8 Arret : 0.0206627 s/iter 14.046207 +iter : 9 Arret : 0.0154355 s/iter 14.068750 +iter : 10 Arret : 0.0112335 s/iter 13.832264 +iter : 11 Arret : 0.00926749 s/iter 13.793343 +iter : 12 Arret : 0.0165133 s/iter 13.276606 +iter : 13 Arret : 0.00281445 s/iter 13.275977 +iter : 14 Arret : 0.0019915 s/iter 13.269355 +iter : 15 Arret : 0.00135028 s/iter 13.267568 +iter : 16 Arret : 0.00186824 s/iter 13.268070 +iter : 17 Arret : 0.000810658 s/iter 13.268154 +iter : 18 Arret : 0.000232438 s/iter 13.268534 +iter : 19 Arret : 3.11501E-07 s/iter 13.267454 +iter : 20 Arret : 1.18566E-09 s/iter 13.267871 +iter : 21 Arret : 9.65413E-12 s/iter 13.268070 +iter : 22 Arret : 1.37719E-13 s/iter 13.267729 +temps : 297.134 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.32595E-08 +Stabilite : 1.37719E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540302 +i* 0.841463| 0.999993| 8.34199E-12 +i* -1.9051E-11| +| 2| -0.553438 +i* -0.832883| 0.999993|-2.10654E-12 +i*-2.55273E-11| +| 3| -0.579282 +i* -0.815119| 0.999993| 1.33613E-11 +i*-1.98701E-11| +| 4| 0.591992 +i* 0.805956| 1.00001|-3.89872E-09 +i* 2.08385E-09| +| 5| -0.604557 +i* -0.796554| 0.999993|-2.82974E-12 +i* 9.99473E-12| +| 6| 0.61698 +i* 0.78697| 0.999993|-4.77973E-12 +i* 2.40621E-11| +| 7| -0.629237 +i* -0.777205| 0.999993|-2.92122E-12 +i*-4.85867E-12| +| 8| 0.641354 +i* 0.767237| 0.999993|-1.64209E-11 +i* 1.12904E-12| +| 9| -0.653299 +i* -0.757092| 0.999993|-8.22453E-13 +i* 2.82818E-12| +| 10| 0.665096 +i* 0.746749| 0.999993| -1.2145E-11 +i* 1.89129E-11| +| 11| -0.676717 +i* -0.736234| 0.999993|-1.26079E-11 +i*-1.25073E-11| +| 12| 0.688185 +i* 0.725526| 0.999993| 2.69875E-11 +i* 1.65411E-11| +| 13| -0.699466 +i* -0.714679| 1.00001| 3.92343E-10 +i*-3.02623E-09| +| 14| 0.710597 +i* 0.70359| 0.999993| -2.6851E-11 
+i*-1.44801E-11| +| 15| -0.721524 +i* -0.69238| 0.999993| 2.63193E-11 +i*-6.76318E-13| +| 16| 0.73231 +i* 0.680962| 0.999993| 1.34706E-11 +i*-4.43489E-12| +| 17| -0.74294 +i* -0.669349| 0.999993| 1.02707E-12 +i* 2.14607E-11| +| 18| 0.753317 +i* 0.657672| 1.00001| 2.8295E-09 +i*-3.45603E-09| +| 19| -0.76354 +i* -0.64575| 0.999993| 2.24043E-11 +i*-1.30496E-12| +| 20| 0.773543 +i* 0.633733| 0.999993|-3.47811E-12 +i*-5.94756E-12| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 0.999993 +250000 racines de module = 1.00001 +proc 0 +proc 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^300000 + (-10 +i*0)*x^500000 + (1 +i*0)*x^800000 + +(-30000 +i*0)*x^299999 + (-5E+06 +i*0)*x^499999 + (800000 +i*0)*x^799999 + +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 400000 +proc 0 start 0 size 400000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 1, start 400000 size 400000 +proc 1 start 400000 size 400000 +iter : 1 Arret : 0.00108387 s/iter 23.672446 +iter : 2 Arret : 0.00660333 s/iter 23.805408 +iter : 3 Arret : 1.16255 s/iter 23.798567 +iter : 4 Arret : 1.00538 s/iter 23.799772 +iter : 5 Arret : 4.35503 s/iter 23.835095 +iter : 6 Arret : 2.85741 s/iter 24.191376 +iter : 7 Arret : 1.06724 s/iter 24.343970 +iter : 8 Arret : 0.752896 s/iter 24.414141 +iter : 9 Arret : 0.681451 s/iter 24.504496 +iter : 10 Arret : 0.666362 s/iter 24.940388 +iter : 11 Arret : 0.660981 s/iter 25.494551 +iter : 12 Arret : 0.6721 s/iter 24.530242 +iter : 13 Arret : 0.722307 s/iter 24.518027 +iter : 14 Arret : 0.735973 s/iter 24.579973 +iter : 15 Arret : 1.60274 s/iter 24.425419 +iter : 16 Arret : 1.08224 s/iter 24.263282 +iter : 17 Arret : 1.66761 s/iter 24.117742 +iter : 18 Arret : 0.562533 s/iter 23.946009 +iter : 19 Arret : 0.334526 s/iter 23.926164 +iter : 20 Arret : 0.247191 s/iter 23.871930 +iter : 21 Arret : 0.0856694 s/iter 23.809304 +iter : 22 Arret : 0.100266 s/iter 
23.817817 +iter : 23 Arret : 0.0450244 s/iter 23.791545 +iter : 24 Arret : 0.0252731 s/iter 23.803368 +iter : 25 Arret : 0.0214701 s/iter 23.778507 +iter : 26 Arret : 0.00697008 s/iter 23.796671 +iter : 27 Arret : 0.00107605 s/iter 23.651300 +iter : 28 Arret : 1.6145E-06 s/iter 23.654996 +iter : 29 Arret : 4.22205E-09 s/iter 23.650903 +iter : 30 Arret : 9.10881E-12 s/iter 23.650544 +iter : 31 Arret : 1.96015E-14 s/iter 23.654309 +temps : 746.426 seconde(s) +Nb iterations : 31 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.73089E-06 +Stabilite : 2.22043E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841464| 0.999995| -2.03E-11 +i* 2.74701E-11| +| 2| 0.592014 +i* 0.805922| 0.999995| 2.33948E-11 +i*-2.13005E-11| +| 3| 0.617007 +i* 0.786952| 0.999995| 4.23442E-11 +i* -6.2147E-12| +| 4| 0.641392 +i* 0.767207| 0.999995|-4.99742E-11 +i* 1.43873E-11| +| 5| 0.665146 +i* 0.746707| 0.999995| 2.02977E-11 +i* 7.48579E-12| +| 6| 0.688245 +i* 0.725472| 0.999995|-1.73153E-11 +i* -1.2656E-11| +| 7| 0.710667 +i* 0.703522| 0.999995| 3.69782E-12 +i* 2.3081E-12| +| 8| 0.732388 +i* 0.68088| 0.999995| 9.45355E-12 +i* 2.09024E-11| +| 9| 0.753381 +i* 0.657577| 0.999995| 1.7531E-11 +i*-4.02243E-11| +| 10| 0.77364 +i* 0.633618| 0.999995|-1.72307E-11 +i* 1.22723E-11| +| 11| 0.793138 +i* 0.609034| 0.999995| 3.89222E-12 +i* 2.21356E-11| +| 12| 0.811855 +i* 0.583851| 0.999995|-1.28337E-11 +i*-5.47207E-12| +| 13| 0.829772 +i* 0.558094| 0.999995|-1.63114E-11 +i*-1.64246E-12| +| 14| 0.846873 +i* 0.531786| 0.999995|-3.30451E-11 +i*-8.10676E-12| +| 15| 0.86314 +i* 0.504956| 0.999995|-4.00413E-12 +i* 3.04823E-11| +| 16| 0.878557 +i* 0.477628| 0.999995|-2.16493E-12 +i* 1.10533E-11| +| 17| 0.893104 +i* 0.449841| 0.999995|-1.48552E-11 +i* 1.06063E-11| +| 18| 0.906777 +i* 0.4216| 0.999995|-1.38745E-11 +i* 5.33384E-12| +| 19| 
0.919557 +i* 0.392944| 0.999995|-3.33245E-11 +i* 5.94386E-12| +| 20| 0.931433 +i* 0.363901| 0.999995| 4.93219E-11 +i*-2.82651E-11| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 0.999995 +300000 racines de module = 1.00001 +proc 1 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^400000 + (-10 +i*0)*x^600000 + (1 +i*0)*x^1000000 + +(-40000 +i*0)*x^399999 + (-6E+06 +i*0)*x^599999 + (1E+06 +i*0)*x^999999 + +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 1, start 500096 size 500096 +proc 1 start 500096 size 500096 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 0, start 0 size 500096 +proc 0 start 0 size 500096 +iter : 1 Arret : 0.00111034 s/iter 36.535863 +iter : 2 Arret : 0.00130138 s/iter 36.531318 +iter : 3 Arret : 0.095171 s/iter 36.617316 +iter : 4 Arret : 0.110384 s/iter 36.603388 +iter : 5 Arret : 0.0159644 s/iter 37.200734 +iter : 6 Arret : 0.0148525 s/iter 37.186773 +iter : 7 Arret : 0.0189588 s/iter 37.285760 +iter : 8 Arret : 0.0122669 s/iter 37.242480 +iter : 9 Arret : 0.025395 s/iter 37.493437 +iter : 10 Arret : 0.0249756 s/iter 36.552191 +iter : 11 Arret : 0.0032083 s/iter 36.587117 +iter : 12 Arret : 0.00514671 s/iter 36.496415 +iter : 13 Arret : 0.0026206 s/iter 36.537986 +iter : 14 Arret : 0.0021181 s/iter 36.525452 +iter : 15 Arret : 0.000448616 s/iter 36.534784 +iter : 16 Arret : 0.000260446 s/iter 36.531377 +iter : 17 Arret : 9.00305E-05 s/iter 36.520451 +iter : 18 Arret : 0.000137571 s/iter 36.497467 +iter : 19 Arret : 3.90888E-05 s/iter 36.496056 +iter : 20 Arret : 8.22264E-08 s/iter 36.494517 +iter : 21 Arret : 2.59921E-10 s/iter 36.529540 +iter : 22 Arret : 8.21945E-13 s/iter 36.531093 +temps : 812.655 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.28809E-07 +Stabilite : 8.21945E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | 
mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841476| 1.00001| 4.82795E-10 +i* 3.31212E-09| +| 2| 0.529701 +i* 0.84818| 0.999996|-4.61853E-13 +i*-4.17888E-12| +| 3| 0.524361 +i* 0.851491| 0.999996|-2.47296E-11 +i* 1.78327E-11| +| 4| 0.51901 +i* 0.854764| 0.999996| 9.45599E-12 +i* 2.07434E-11| +| 5| 0.513638 +i* 0.858002| 0.999996|-2.64786E-11 +i* 1.3235E-12| +| 6| 0.508237 +i* 0.861213| 0.999996|-1.34339E-11 +i* 9.87854E-12| +| 7| 0.502825 +i* 0.864384| 0.999996|-3.18459E-11 +i* 7.64744E-12| +| 8| 0.497384 +i* 0.867526| 0.999996| 1.87346E-11 +i* 4.7471E-11| +| 9| 0.491932 +i* 0.870629| 0.999996|-2.65525E-11 +i* 1.22525E-11| +| 10| 0.486462 +i* 0.873698| 0.999996|-2.18452E-11 +i*-1.14808E-11| +| 11| 0.480962 +i* 0.876737| 0.999996| 1.81546E-11 +i* 8.04012E-12| +| 12| 0.475453 +i* 0.879736| 0.999996| 3.09861E-11 +i* 4.093E-12| +| 13| 0.469917 +i* 0.882706| 0.999996|-1.29106E-11 +i*-2.31489E-11| +| 14| 0.46437 +i* 0.885637| 0.999996|-5.47384E-12 +i* 1.02452E-11| +| 15| 0.458801 +i* 0.888545| 1.00001| 8.56622E-10 +i* 9.50588E-10| +| 16| 0.453214 +i* 0.891397| 0.999996| 2.45506E-11 +i* 3.1726E-11| +| 17| 0.447614 +i* 0.894223| 0.999996|-1.08491E-12 +i*-2.12277E-11| +| 18| 0.441986 +i* 0.897017| 0.999996| 2.72476E-11 +i* 3.22485E-11| +| 19| 0.436351 +i* 0.899772| 0.999996|-1.24334E-11 +i*-2.66317E-11| +| 20| 0.430689 +i* 0.902496| 0.999996|-1.25435E-11 +i* 3.86925E-13| ++---+----------------------------+------------+----------------------------+ +400000 racines de module = 1.00001 +600000 racines de module = 0.999996 +proc 0 +proc 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^700000 + (1 +i*0)*x^1200000 + +(-50000 +i*0)*x^499999 + (-7E+06 +i*0)*x^699999 + (1.2E+06 +i*0)*x^1199999 + +zone limite de 'log-exp' 1.0003 +zone limite de 'log-exp' 1.0003 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 0, start 0 size 600064 +proc 0 start 0 size 600064 +dimgrid 4688 dimblock 256 degrePoly 1200000 
+proc 1, start 600064 size 600064 +proc 1 start 600064 size 600064 +iter : 1 Arret : 0.0323131 s/iter 52.941074 +iter : 2 Arret : 2.76888 s/iter 55.568853 +iter : 3 Arret : 2.88621 s/iter 56.575624 +iter : 4 Arret : 1.26993 s/iter 55.935739 +iter : 5 Arret : 3.86036 s/iter 56.102261 +iter : 6 Arret : 5.37784 s/iter 57.046755 +iter : 7 Arret : 1.03129 s/iter 56.920764 +iter : 8 Arret : 3.95796 s/iter 57.471965 +iter : 9 Arret : 1.30769 s/iter 57.104425 +iter : 10 Arret : 1.0707 s/iter 57.036191 +iter : 11 Arret : 1.02855 s/iter 56.856622 +iter : 12 Arret : 0.563478 s/iter 56.398393 +iter : 13 Arret : 1.5244 s/iter 56.034393 +iter : 14 Arret : 1.47905 s/iter 55.457328 +iter : 15 Arret : 0.774422 s/iter 55.020273 +iter : 16 Arret : 10.8889 s/iter 54.981257 +iter : 17 Arret : 0.715912 s/iter 54.702463 +iter : 18 Arret : 0.577843 s/iter 54.436841 +iter : 19 Arret : 0.747995 s/iter 54.297662 +iter : 20 Arret : 0.163426 s/iter 53.892957 +iter : 21 Arret : 0.181209 s/iter 53.840332 +iter : 22 Arret : 0.0761215 s/iter 53.719165 +iter : 23 Arret : 0.0217437 s/iter 53.677726 +iter : 24 Arret : 0.00705727 s/iter 53.242080 +iter : 25 Arret : 0.00154816 s/iter 52.922070 +iter : 26 Arret : 1.96753E-05 s/iter 52.904231 +iter : 27 Arret : 2.53613E-08 s/iter 52.924736 +iter : 28 Arret : 3.62869E-10 s/iter 52.921481 +iter : 29 Arret : 5.17537E-12 s/iter 52.895150 +iter : 30 Arret : 7.38669E-14 s/iter 52.910075 +temps : 1647.22 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.62324E-08 +Stabilite : 7.38669E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540304 +i* 0.841466| 0.999997| 3.08649E-11 +i* 2.05843E-11| +| 2| 0.513629 +i* 0.858008| 0.999997| 3.02357E-11 +i* 3.41858E-11| +| 3| 0.486451 +i* 0.873713| 1|-5.85295E-09 +i*-2.49566E-10| +| 4| 0.458812 +i* 0.888539| 1|-7.79592E-09 
+i*-3.64417E-09| +| 5| 0.430677 +i* 0.902502| 0.999997|-2.03271E-11 +i*-3.18325E-11| +| 6| 0.402126 +i* 0.915589| 1| 2.50282E-09 +i*-6.10471E-09| +| 7| 0.3732 +i* 0.927747| 0.999997|-1.54374E-11 +i*-2.76083E-11| +| 8| 0.3439 +i* 0.939003| 0.999997|-1.12714E-11 +i* 1.5453E-11| +| 9| 0.314261 +i* 0.949333| 0.999997| 1.93628E-11 +i* 2.50909E-11| +| 10| 0.284313 +i* 0.958728| 0.999997| 2.69426E-11 +i* 2.77974E-11| +| 11| 0.254084 +i* 0.967179| 0.999997| 1.5277E-11 +i* 4.73027E-12| +| 12| 0.223605 +i* 0.974676| 0.999997| -8.1017E-11 +i*-3.77299E-11| +| 13| 0.192897 +i* 0.981224| 1| 2.91999E-10 +i* 9.18678E-11| +| 14| 0.162017 +i* 0.986785| 0.999997| 4.59321E-12 +i*-4.42106E-13| +| 15| 0.130967 +i* 0.991391| 1| 1.71549E-09 +i* 3.54225E-10| +| 16| 0.099812 +i* 0.995011| 1|-4.01255E-09 +i*-1.01435E-08| +| 17| 0.0685136 +i* 0.997647| 0.999997|-2.98188E-11 +i* 2.79243E-12| +| 18| 0.0371504 +i* 0.999314| 1|-1.38879E-09 +i*-2.32658E-09| +| 19| 0.00578048 +i* 0.99998| 0.999997| 3.46787E-11 +i* 1.94857E-13| +| 20| -0.0256056 +i* 0.999669| 0.999997| 2.01068E-11 +i*-1.22213E-12| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 0.999997 +500000 racines de module = 1 +proc 0 +proc 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^600000 + (-10 +i*0)*x^800000 + (1 +i*0)*x^1400000 + +(-60000 +i*0)*x^599999 + (-8E+06 +i*0)*x^799999 + (1.4E+06 +i*0)*x^1399999 + +zone limite de 'log-exp' 1.00025 +zone limite de 'log-exp' 1.00025 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 0, start 0 size 700032 +proc 0 start 0 size 700032 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 1, start 700032 size 700032 +proc 1 start 700032 size 700032 +iter : 1 Arret : 0.00634591 s/iter 71.315735 +iter : 2 Arret : 0.356583 s/iter 73.499155 +iter : 3 Arret : 0.616585 s/iter 74.055679 +iter : 4 Arret : 0.383366 s/iter 75.001269 +iter : 5 Arret : 0.113316 s/iter 76.417550 +iter : 6 Arret : 0.198101 s/iter 77.541428 +iter : 7 Arret : 0.157259 s/iter 77.127574 +iter 
: 8 Arret : 0.381996 s/iter 77.411132 +iter : 9 Arret : 0.254414 s/iter 77.254944 +iter : 10 Arret : 0.178383 s/iter 77.505940 +iter : 11 Arret : 0.147268 s/iter 76.909819 +iter : 12 Arret : 0.0894984 s/iter 77.135647 +iter : 13 Arret : 0.117288 s/iter 74.937817 +iter : 14 Arret : 0.0966418 s/iter 73.691614 +iter : 15 Arret : 0.0293232 s/iter 72.705894 +iter : 16 Arret : 0.0436007 s/iter 72.446877 +iter : 17 Arret : 0.0302845 s/iter 72.160465 +iter : 18 Arret : 0.00422446 s/iter 71.431150 +iter : 19 Arret : 0.00359251 s/iter 71.490724 +iter : 20 Arret : 0.00270137 s/iter 71.471506 +iter : 21 Arret : 0.00209394 s/iter 71.343579 +iter : 22 Arret : 0.000416465 s/iter 71.476428 +iter : 23 Arret : 4.15934E-05 s/iter 71.308920 +iter : 24 Arret : 5.37967E-08 s/iter 71.432393 +iter : 25 Arret : 2.48195E-10 s/iter 71.421751 +iter : 26 Arret : 1.15205E-12 s/iter 71.414405 +iter : 27 Arret : 5.31631E-15 s/iter 71.409806 +temps : 1991.85 seconde(s) +Nb iterations : 27 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.8707E-07 +Stabilite : 3.51082E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841469| 0.999997| 5.65794E-11 +i*-4.66756E-12| +| 2| 0.513623 +i* 0.858013| 0.999997|-2.15776E-11 +i*-2.98557E-11| +| 3| -0.52703 +i* -0.849843| 0.999997|-8.72191E-12 +i* 2.97079E-11| +| 4| 0.486439 +i* 0.873711| 0.999997|-3.15932E-11 +i*-1.15957E-12| +| 5| -0.500096 +i* -0.865967| 0.999997| 3.56147E-11 +i*-3.12713E-11| +| 6| 0.458776 +i* 0.888549| 0.999997|-1.89702E-11 +i* 4.08274E-12| +| 7| -0.472673 +i* -0.881242| 1|-5.56631E-09 +i*-2.23833E-09| +| 8| 0.430664 +i* 0.902517| 1|-8.83373E-11 +i*-2.09199E-09| +| 9| -0.444791 +i* -0.895631| 0.999997| 3.68259E-11 +i* 1.36002E-12| +| 10| 0.402136 +i* 0.915577| 0.999997| 6.5834E-12 +i* -1.3935E-11| +| 11| -0.416432 +i* -0.909164| 0.999997| 1.97816E-11 +i* 3.10848E-11| 
+| 12| 0.373171 +i* 0.927759| 0.999997|-2.17995E-11 +i*-2.96867E-12| +| 13| -0.387698 +i* -0.921783| 0.999997|-1.86324E-11 +i* -4.6545E-11| +| 14| 0.343875 +i* 0.939012| 0.999997| 3.06317E-11 +i* 7.08794E-11| +| 15| -0.358575 +i* -0.933498| 0.999997|-3.74776E-11 +i*-3.89954E-11| +| 16| 0.314233 +i* 0.949343| 0.999997| 1.02587E-11 +i*-4.25648E-11| +| 17| -0.329098 +i* -0.944293| 0.999997|-1.57903E-11 +i* 2.05052E-11| +| 18| 0.284281 +i* 0.958738| 0.999997| 2.51592E-11 +i* 2.09243E-11| +| 19| -0.299297 +i* -0.954157| 0.999997| 5.03608E-12 +i* 1.70503E-11| +| 20| 0.254048 +i* 0.967189| 0.999997|-2.81228E-11 +i*-1.66302E-11| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 0.999997 +600000 racines de module = 1 +proc 1 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^700000 + (-10 +i*0)*x^900000 + (1 +i*0)*x^1600000 + +(-70000 +i*0)*x^699999 + (-9E+06 +i*0)*x^899999 + (1.6E+06 +i*0)*x^1599999 + + +template:32580 terminated with signal 11 at PC=404ae1 SP=7fffd45f56a0. Backtrace: + +template:32579 terminated with signal 11 at PC=404ae1 SP=7fff316ce300. Backtrace: +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 1 with PID 32580 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". 
+By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- +proc 1 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^800000 + (-10 +i*0)*x^1000000 + (1 +i*0)*x^1800000 + +(-80000 +i*0)*x^799999 + (-1E+07 +i*0)*x^999999 + (1.8E+06 +i*0)*x^1799999 + + +template:32586 terminated with signal 11 at PC=404ae1 SP=7fffbfe9f8d0. Backtrace: +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:32587 terminated with signal 11 at PC=404ae1 SP=7fff632aee60. Backtrace: +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 1 with PID 32587 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). 
+-------------------------------------------------------------------------- +proc 0 +proc 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^1500000 + (1 +i*0)*x^2000000 + +(-50000 +i*0)*x^499999 + (-1.5E+07 +i*0)*x^1499999 + (2E+06 +i*0)*x^1999999 + + +template:32594 terminated with signal 11 at PC=404ae1 SP=7fff28fd9250. Backtrace: +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:32593 terminated with signal 11 at PC=404ae1 SP=7fffe3e03f90. Backtrace: +./template[0x404ae1] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 1 with PID 32594 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). 
+-------------------------------------------------------------------------- diff --git a/Simulations/sparse_mpi/sparse_mpi_2GPU.sge b/Simulations/sparse_mpi/sparse_mpi_2GPU.sge new file mode 100644 index 0000000..2817b6b --- /dev/null +++ b/Simulations/sparse_mpi/sparse_mpi_2GPU.sge @@ -0,0 +1,25 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=2 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -V +#$ -cwd +#$ -N sparse_mpi_2GPU +#$ -pe mpi 2 + + +module load cuda/7.0 +module load ompi/gcc + +mpirun -np $NSLOTS ./template -r -i 60000 40000 +mpirun -np $NSLOTS ./template -r -i 150000 50000 +mpirun -np $NSLOTS ./template -r -i 250000 150000 +mpirun -np $NSLOTS ./template -r -i 350000 250000 +mpirun -np $NSLOTS ./template -r -i 500000 300000 +mpirun -np $NSLOTS ./template -r -i 600000 400000 +mpirun -np $NSLOTS ./template -r -i 700000 500000 +mpirun -np $NSLOTS ./template -r -i 800000 600000 +mpirun -np $NSLOTS ./template -r -i 900000 700000 +mpirun -np $NSLOTS ./template -r -i 1000000 800000 +mpirun -np $NSLOTS ./template -r -i 1500000 500000 diff --git a/Simulations/sparse_mpi/sparse_mpi_3GPU.o140030 b/Simulations/sparse_mpi/sparse_mpi_3GPU.o140030 new file mode 100644 index 0000000..b62c8d1 --- /dev/null +++ b/Simulations/sparse_mpi/sparse_mpi_3GPU.o140030 @@ -0,0 +1,758 @@ +REMAINING: 3 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +proc 0 +proc 1 +proc 2 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^40000 + (-10 +i*0)*x^60000 + (1 +i*0)*x^100000 + +(-4000 +i*0)*x^39999 + (-600000 +i*0)*x^59999 + (100000 +i*0)*x^99999 + +zone limite de 'log-exp' 1.00356 +zone limite de 'log-exp' 1.00356 +zone limite de 'log-exp' 1.00356 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 0, start 0 size 33365 +proc 0 start 0 size 33365 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 1, start 33365 size 33365 +proc 1 start 33365 size 33365 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 2, start 66730 size 33365 +proc 2 start 66730 size 33365 +iter : 1 Arret : 0.00638362 s/iter 0.326715 +iter : 2 Arret : 
0.00780885 s/iter 0.399767 +iter : 3 Arret : 0.00278939 s/iter 0.327124 +iter : 4 Arret : 0.00312024 s/iter 0.327290 +iter : 5 Arret : 0.00261461 s/iter 0.327081 +iter : 6 Arret : 0.00443129 s/iter 0.326569 +iter : 7 Arret : 0.00529933 s/iter 0.326526 +iter : 8 Arret : 0.00962751 s/iter 0.327146 +iter : 9 Arret : 0.0107359 s/iter 0.326473 +iter : 10 Arret : 0.00603516 s/iter 0.326463 +iter : 11 Arret : 0.00278461 s/iter 0.327154 +iter : 12 Arret : 0.000336786 s/iter 0.326455 +iter : 13 Arret : 0.000245415 s/iter 0.326273 +iter : 14 Arret : 0.000266948 s/iter 0.326718 +iter : 15 Arret : 0.000254585 s/iter 0.326250 +iter : 16 Arret : 0.000456802 s/iter 0.326186 +iter : 17 Arret : 0.000147565 s/iter 0.326750 +iter : 18 Arret : 2.07387E-07 s/iter 0.326144 +iter : 19 Arret : 3.08546E-09 s/iter 0.326199 +iter : 20 Arret : 4.59676E-11 s/iter 0.326798 +iter : 21 Arret : 6.84814E-13 s/iter 0.326219 +temps : 7.13273 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.61117E-09 +Stabilite : 6.84814E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54036 +i* 0.841503| 1.00006|-5.00602E-11 +i* 9.0853E-12| +| 2| -0.113164 +i* 0.993538| 0.999962|-4.34919E-12 +i* 9.60242E-13| +| 3| -0.226885 +i* -0.973981| 1.00006|-5.81993E-10 +i*-4.18547E-10| +| 4| -0.715763 +i* 0.698289| 0.999962| 9.11271E-13 +i* 2.47219E-12| +| 5| 0.439922 +i* -0.897993| 0.999962|-3.49498E-13 +i* 1.66432E-12| +| 6| -0.996122 +i* 0.0886386| 1.00006| 4.72785E-10 +i* 4.13616E-11| +| 7| 0.908546 +i* -0.417692| 0.999962| 4.78506E-13 +i* 1.54377E-13| +| 8| -0.827813 +i* -0.560935| 0.999962| 9.76996E-13 +i*-2.04309E-12| +| 9| 0.968129 +i* 0.250682| 1.00006|-2.31715E-10 +i* 1.34848E-10| +| 10| -0.286842 +i* -0.958038| 1.00006|-5.93554E-10 +i*-2.45345E-10| +| 11| 0.591653 +i* 0.806145| 0.999962|-9.87654E-13 +i*-3.03635E-12| +| 12| 
-0.0511836 +i* 0.998651| 0.999962|-2.22622E-12 +i*-3.69013E-14| +| 13| -0.67097 +i* 0.741432| 0.999962|-8.03801E-14 +i*-1.68204E-12| +| 14| 0.383249 +i* -0.923603| 0.999962|-1.29119E-12 +i*-1.37426E-12| +| 15| -0.988685 +i* 0.15039| 1.00006|-1.61051E-10 +i* 7.18515E-11| +| 16| 0.880824 +i* -0.473363| 0.999962| 1.58029E-12 +i*-2.34379E-12| +| 17| -0.861082 +i* -0.508391| 0.999962| 1.02962E-12 +i*-4.51911E-12| +| 18| 0.98184 +i* 0.190015| 1.00006| 8.88373E-10 +i*-2.66385E-10| +| 19| -0.345842 +i* -0.938354| 1.00006| 1.38421E-10 +i*-2.31696E-10| +| 20| 0.640621 +i* 0.767807| 0.999962|-6.98774E-13 +i* 1.13798E-12| ++---+----------------------------+------------+----------------------------+ +40000 racines de module = 1.00006 +60000 racines de module = 0.999962 +proc 0 +proc 1 +proc 2 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^50000 + (-10 +i*0)*x^150000 + (1 +i*0)*x^200000 + +(-5000 +i*0)*x^49999 + (-1.5E+06 +i*0)*x^149999 + (200000 +i*0)*x^199999 + +zone limite de 'log-exp' 1.00178 +zone limite de 'log-exp' 1.00178 +zone limite de 'log-exp' 1.00178 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 2, start 133460 size 66730 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 1, start 66730 size 66730 +proc 1 start 66730 size 66730 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 0, start 0 size 66730 +proc 0 start 0 size 66730 +proc 2 start 133460 size 66730 +iter : 1 Arret : 0.000533936 s/iter 1.097687 +iter : 2 Arret : 0.00054918 s/iter 1.097788 +iter : 3 Arret : 0.000302619 s/iter 1.097094 +iter : 4 Arret : 0.000610723 s/iter 1.097469 +iter : 5 Arret : 0.0013942 s/iter 1.097408 +iter : 6 Arret : 0.0123305 s/iter 1.097332 +iter : 7 Arret : 0.0276413 s/iter 1.097585 +iter : 8 Arret : 0.0390327 s/iter 1.097910 +iter : 9 Arret : 0.0768762 s/iter 1.098286 +iter : 10 Arret : 0.261559 s/iter 1.199021 +iter : 11 Arret : 0.996838 s/iter 1.231967 +iter : 12 Arret : 2.41454 s/iter 1.226149 +iter : 13 Arret : 2.18621 s/iter 1.224592 +iter : 14 Arret : 1.07886 s/iter 1.189416 +iter : 15 Arret : 
2.0468 s/iter 1.225182 +iter : 16 Arret : 2.06331 s/iter 1.228381 +iter : 17 Arret : 0.85728 s/iter 1.201017 +iter : 18 Arret : 0.652722 s/iter 1.225600 +iter : 19 Arret : 0.985485 s/iter 1.227406 +iter : 20 Arret : 4.10993 s/iter 1.228101 +iter : 21 Arret : 0.600123 s/iter 1.227670 +iter : 22 Arret : 0.86582 s/iter 1.231663 +iter : 23 Arret : 0.31213 s/iter 1.227752 +iter : 24 Arret : 0.424877 s/iter 1.223962 +iter : 25 Arret : 0.275449 s/iter 1.097197 +iter : 26 Arret : 0.212806 s/iter 1.221990 +iter : 27 Arret : 0.124734 s/iter 1.097336 +iter : 28 Arret : 0.088182 s/iter 1.096934 +iter : 29 Arret : 0.0330763 s/iter 1.097169 +iter : 30 Arret : 0.0100338 s/iter 1.097086 +iter : 31 Arret : 0.000168049 s/iter 1.097161 +iter : 32 Arret : 7.37376E-08 s/iter 1.096969 +iter : 33 Arret : 7.38629E-12 s/iter 1.097234 +iter : 34 Arret : 7.3696E-16 s/iter 1.097489 +temps : 39.5342 seconde(s) +Nb iterations : 34 +Nb de depassements de capacite exponentielle : 0 +Precision : 9.52377E-08 +Stabilite : 7.3696E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540303 +i* 0.841453| 0.999985| 1.08703E-11 +i*-2.49217E-12| +| 2| -0.837195 +i* 0.546877| 0.999985| -5.4492E-12 +i* 1.09163E-12| +| 3| -0.553418 +i* -0.832885| 0.999985| -1.9722E-12 +i*-7.40397E-12| +| 4| 0.828599 +i* -0.559925| 1.00005|-7.54521E-09 +i* 1.47059E-08| +| 5| -0.8197 +i* 0.572767| 0.999985|-4.21663E-13 +i* -2.8616E-12| +| 6| -0.57917 +i* -0.815188| 0.999985|-5.13034E-12 +i*-1.52645E-12| +| 7| 0.810626 +i* -0.585537| 0.999985|-6.36846E-12 +i*-5.86797E-12| +| 8| 0.592783 +i* 0.805419| 1.00005| 1.3403E-08 +i* 2.35166E-09| +| 9| -0.800777 +i* 0.59904| 1.00005|-1.05967E-08 +i* 2.82759E-08| +| 10| -0.604356 +i* -0.796695| 0.999985|-1.64091E-13 +i* 1.59084E-12| +| 11| 0.791937 +i* -0.610578| 0.999985| 6.0707E-13 +i* 1.52922E-12| +| 12| 0.616763 +i* 0.78713| 
0.999985|-4.48042E-12 +i* -2.6295E-12| +| 13| -0.782301 +i* 0.622877| 0.999985|-2.15827E-12 +i*-6.27114E-12| +| 14| -0.628991 +i* -0.777472| 1.00005| 6.93065E-09 +i*-8.65443E-09| +| 15| 0.772474 +i* -0.635023| 0.999985| 1.54783E-11 +i*-1.81338E-12| +| 16| 0.641054 +i* 0.767476| 0.999985| 9.05009E-12 +i*-2.91295E-12| +| 17| -0.762458 +i* 0.647014| 0.999985| 5.81724E-12 +i*-9.99384E-12| +| 18| -0.652967 +i* -0.757366| 0.999985|-6.31406E-12 +i* 8.49495E-12| +| 19| 0.752302 +i* -0.658888| 1.00005| 3.99107E-09 +i* 1.02117E-08| +| 20| 0.66472 +i* 0.747072| 0.999985|-7.79776E-12 +i*-2.52076E-13| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 0.999985 +50000 racines de module = 1.00005 +proc 1 +proc 2 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^150000 + (-10 +i*0)*x^250000 + (1 +i*0)*x^400000 + +(-15000 +i*0)*x^149999 + (-2.5E+06 +i*0)*x^249999 + (400000 +i*0)*x^399999 + +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 1, start 133376 size 133376 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 2, start 266752 size 133376 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 0, start 0 size 133376 +proc 2 start 266752 size 133376 +proc 1 start 133376 size 133376 +proc 0 start 0 size 133376 +iter : 1 Arret : 0.000533421 s/iter 3.991725 +iter : 2 Arret : 0.00367072 s/iter 3.993299 +iter : 3 Arret : 0.00493773 s/iter 4.310647 +iter : 4 Arret : 0.00496697 s/iter 3.992603 +iter : 5 Arret : 0.0140779 s/iter 3.991503 +iter : 6 Arret : 0.0122345 s/iter 3.993227 +iter : 7 Arret : 0.0118851 s/iter 4.320085 +iter : 8 Arret : 0.00413608 s/iter 3.992019 +iter : 9 Arret : 0.0042286 s/iter 4.269756 +iter : 10 Arret : 0.00316824 s/iter 3.992259 +iter : 11 Arret : 0.00072238 s/iter 3.992655 +iter : 12 Arret : 0.000430893 s/iter 3.992601 +iter : 13 Arret : 0.000433942 s/iter 3.991813 +iter : 14 Arret : 0.000150382 s/iter 3.993178 +iter : 15 
Arret : 0.000238887 s/iter 3.991814 +iter : 16 Arret : 0.000121494 s/iter 3.993291 +iter : 17 Arret : 9.71544E-07 s/iter 3.992093 +iter : 18 Arret : 2.43359E-09 s/iter 3.992688 +iter : 19 Arret : 5.24302E-12 s/iter 3.992746 +iter : 20 Arret : 5.96461E-14 s/iter 3.992444 +temps : 81.0542 seconde(s) +Nb iterations : 20 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.49185E-08 +Stabilite : 1.1328E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.84144| 0.999991| 6.97609E-12 +i* 5.61207E-12| +| 2| -0.998329 +i* 0.057622| 0.999991| 4.43912E-12 +i* 1.27665E-12| +| 3| 0.439867 +i* -0.898052| 0.999991|-8.50653E-12 +i*-8.85586E-12| +| 4| -0.996033 +i* 0.0888768| 0.999991|-3.15592E-12 +i* 1.17456E-12| +| 5| 0.411559 +i* -0.9114| 1.00002| 1.04334E-09 +i*-9.84037E-10| +| 6| 0.59196 +i* 0.805956| 0.999991| 5.24358E-13 +i*-8.53073E-12| +| 7| -0.992759 +i* 0.120044| 0.999991| 2.58804E-12 +i* 2.47274E-12| +| 8| 0.382796 +i* -0.923823| 0.999991|-1.63092E-11 +i* 4.26312E-12| +| 9| 0.616925 +i* 0.78701| 0.999991| 4.27514E-12 +i*-1.13966E-11| +| 10| -0.988534 +i* 0.151098| 1.00002|-8.27014E-10 +i* 9.44171E-10| +| 11| 0.35366 +i* -0.935364| 0.999991|-1.92664E-11 +i* 1.19958E-11| +| 12| 0.641299 +i* 0.767311| 1.00002|-2.44657E-09 +i* -6.7886E-11| +| 13| -0.983286 +i* 0.18202| 0.999991| 3.21676E-12 +i*-9.48297E-13| +| 14| 0.324176 +i* -0.945987| 0.999991| 1.53594E-11 +i*-1.57324E-12| +| 15| 0.66503 +i* 0.746804| 0.999991| 5.74873E-13 +i* 8.53884E-12| +| 16| -0.977132 +i* 0.212706| 1.00002|-2.02093E-10 +i* 3.44548E-10| +| 17| 0.294374 +i* -0.955681| 0.999991| -1.2063E-11 +i* 1.32238E-11| +| 18| 0.688092 +i* 0.725645| 1.00002|-4.51021E-09 +i* 1.95437E-09| +| 19| -0.969965 +i* 0.243206| 0.999991| 6.88072E-12 +i* 3.20268E-13| +| 20| 0.264283 +i* -0.964436| 0.999991| 2.5573E-11 +i*-6.45539E-12| 
++---+----------------------------+------------+----------------------------+ +250000 racines de module = 0.999991 +150000 racines de module = 1.00002 +proc 2 +proc 0 +proc 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^250000 + (-10 +i*0)*x^350000 + (1 +i*0)*x^600000 + +(-25000 +i*0)*x^249999 + (-3.5E+06 +i*0)*x^349999 + (600000 +i*0)*x^599999 + +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 1, start 200021 size 200021 +proc 1 start 200021 size 200021 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 200021 +proc 0 start 0 size 200021 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 2, start 400042 size 200021 +proc 2 start 400042 size 200021 +iter : 1 Arret : 0.00226498 s/iter 9.046598 +iter : 2 Arret : 0.286514 s/iter 9.041345 +iter : 3 Arret : 0.37126 s/iter 9.194828 +iter : 4 Arret : 0.357158 s/iter 9.425406 +iter : 5 Arret : 0.489627 s/iter 9.503770 +iter : 6 Arret : 0.0394603 s/iter 9.532369 +iter : 7 Arret : 0.0346491 s/iter 9.595128 +iter : 8 Arret : 0.058482 s/iter 9.502225 +iter : 9 Arret : 0.0456855 s/iter 9.517820 +iter : 10 Arret : 0.00888245 s/iter 9.163517 +iter : 11 Arret : 0.00755074 s/iter 9.164057 +iter : 12 Arret : 0.00999277 s/iter 9.132635 +iter : 13 Arret : 0.00331316 s/iter 9.163813 +iter : 14 Arret : 0.00348352 s/iter 9.037872 +iter : 15 Arret : 0.00131143 s/iter 9.062842 +iter : 16 Arret : 0.000194649 s/iter 9.032916 +iter : 17 Arret : 0.000108537 s/iter 9.040569 +iter : 18 Arret : 4.32539E-06 s/iter 9.040533 +iter : 19 Arret : 1.30764E-08 s/iter 9.032518 +iter : 20 Arret : 5.19734E-11 s/iter 9.039277 +iter : 21 Arret : 2.06945E-13 s/iter 9.037120 +temps : 193.628 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.29984E-05 +Stabilite : 6.87034E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | 
++---+----------------------------+------------+----------------------------+ +| 1| 0.540302 +i* 0.841463| 0.999993| 8.34199E-12 +i* -1.9051E-11| +| 2| -0.553438 +i* -0.832883| 0.999993|-4.48197E-12 +i* 2.11486E-11| +| 3| -0.579282 +i* -0.815119| 0.999993| 1.33613E-11 +i*-1.98701E-11| +| 4| 0.592014 +i* 0.805919| 0.999993|-3.98037E-12 +i* 9.55808E-12| +| 5| -0.604557 +i* -0.796554| 0.999993|-2.82974E-12 +i* 9.99473E-12| +| 6| 0.61698 +i* 0.78697| 0.999993|-4.77973E-12 +i* 2.40621E-11| +| 7| -0.629237 +i* -0.777205| 0.999993|-2.92122E-12 +i*-4.85867E-12| +| 8| 0.641354 +i* 0.767237| 0.999993|-1.64209E-11 +i* 1.12904E-12| +| 9| -0.653299 +i* -0.757092| 0.999993|-8.22453E-13 +i* 2.82818E-12| +| 10| 0.665096 +i* 0.746749| 0.999993| -1.2145E-11 +i* 1.89129E-11| +| 11| -0.676717 +i* -0.736234| 0.999993|-1.26079E-11 +i*-1.25073E-11| +| 12| 0.688185 +i* 0.725526| 0.999993|-4.43978E-12 +i*-2.31382E-11| +| 13| -0.699466 +i* -0.714679| 1.00001| 3.92343E-10 +i*-3.02623E-09| +| 14| 0.710597 +i* 0.70359| 0.999993| 1.28564E-11 +i* 1.56626E-11| +| 15| -0.721517 +i* -0.69241| 1.00001| 1.76709E-09 +i*-4.04041E-09| +| 16| 0.73231 +i* 0.680962| 0.999993| 1.34706E-11 +i*-4.43489E-12| +| 17| -0.742904 +i* -0.669389| 0.999993|-7.78222E-12 +i* 1.50098E-11| +| 18| 0.7533 +i* 0.657691| 1.00001| 1.64587E-09 +i*-3.03669E-09| +| 19| -0.763538 +i* -0.645777| 1.00001|-8.22278E-10 +i*-5.86372E-10| +| 20| 0.773539 +i* 0.633763| 1.00001| -4.2314E-09 +i* 1.86243E-09| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 0.999993 +250000 racines de module = 1.00001 +proc 1 +proc 2 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^300000 + (-10 +i*0)*x^500000 + (1 +i*0)*x^800000 + +(-30000 +i*0)*x^299999 + (-5E+06 +i*0)*x^499999 + (800000 +i*0)*x^799999 + +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 1, start 266666 size 266666 +proc 1 start 266666 size 
266666 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 2, start 533332 size 266666 +proc 2 start 533332 size 266666 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 266666 +proc 0 start 0 size 266666 +iter : 1 Arret : 0.013303 s/iter 15.845449 +iter : 2 Arret : 1.22368 s/iter 15.831599 +iter : 3 Arret : 0.34478 s/iter 15.835186 +iter : 4 Arret : 0.804966 s/iter 15.861997 +iter : 5 Arret : 0.957981 s/iter 15.872722 +iter : 6 Arret : 0.716801 s/iter 16.172143 +iter : 7 Arret : 0.496135 s/iter 16.224317 +iter : 8 Arret : 0.326979 s/iter 16.181063 +iter : 9 Arret : 0.252467 s/iter 16.538160 +iter : 10 Arret : 0.244395 s/iter 16.297675 +iter : 11 Arret : 0.173672 s/iter 16.136429 +iter : 12 Arret : 0.197369 s/iter 16.323607 +iter : 13 Arret : 0.168305 s/iter 16.324722 +iter : 14 Arret : 0.168579 s/iter 16.212899 +iter : 15 Arret : 0.208926 s/iter 16.207350 +iter : 16 Arret : 0.165995 s/iter 16.153929 +iter : 17 Arret : 0.223284 s/iter 16.250807 +iter : 18 Arret : 0.324113 s/iter 16.164325 +iter : 19 Arret : 0.771739 s/iter 16.136061 +iter : 20 Arret : 1.00477 s/iter 16.138977 +iter : 21 Arret : 1.00247 s/iter 16.140663 +iter : 22 Arret : 0.543015 s/iter 16.140175 +iter : 23 Arret : 0.476319 s/iter 15.852664 +iter : 24 Arret : 0.401176 s/iter 15.844834 +iter : 25 Arret : 0.142005 s/iter 15.837565 +iter : 26 Arret : 0.0393995 s/iter 15.832097 +iter : 27 Arret : 0.0199662 s/iter 15.824967 +iter : 28 Arret : 0.00992138 s/iter 15.835004 +iter : 29 Arret : 0.00549329 s/iter 15.825203 +iter : 30 Arret : 0.000480868 s/iter 15.805032 +iter : 31 Arret : 3.00435E-06 s/iter 15.832975 +iter : 32 Arret : 3.08148E-09 s/iter 15.816239 +iter : 33 Arret : 6.64256E-12 s/iter 15.831931 +iter : 34 Arret : 1.43767E-14 s/iter 15.816196 +temps : 545.367 seconde(s) +Nb iterations : 34 +Nb de depassements de capacite exponentielle : 0 +Precision : 12.9528 +Stabilite : 2.22043E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) 
| P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841464| 0.999995| -2.03E-11 +i* 2.74701E-11| +| 2| 0.592014 +i* 0.805922| 0.999995|-1.82734E-11 +i* 2.10218E-11| +| 3| 0.617007 +i* 0.786952| 0.999995| 4.23442E-11 +i* -6.2147E-12| +| 4| 0.641392 +i* 0.767207| 0.999995| 6.90537E-12 +i*-5.12417E-11| +| 5| 0.665146 +i* 0.746707| 0.999995| 2.02977E-11 +i* 7.48579E-12| +| 6| 0.688245 +i* 0.725472| 0.999995|-1.73153E-11 +i* -1.2656E-11| +| 7| 0.710675 +i* 0.703514| 0.999995|-8.58691E-12 +i* 2.79902E-11| +| 8| 0.732388 +i* 0.68088| 0.999995| 9.45355E-12 +i* 2.09024E-11| +| 9| 0.753381 +i* 0.657577| 0.999995|-1.40248E-11 +i* 5.11502E-11| +| 10| 0.77364 +i* 0.633618| 0.999995|-1.72307E-11 +i* 1.22723E-11| +| 11| 0.793138 +i* 0.609034| 0.999995| 3.89222E-12 +i* 2.21356E-11| +| 12| 0.811855 +i* 0.583851| 0.999995|-1.28337E-11 +i*-5.47207E-12| +| 13| 0.829772 +i* 0.558094| 0.999995|-1.63114E-11 +i*-1.64246E-12| +| 14| 0.846873 +i* 0.531786| 0.999995|-1.80345E-12 +i* 5.96675E-11| +| 15| 0.863146 +i* 0.504945| 0.999995|-1.01228E-11 +i* 1.20409E-11| +| 16| 0.878557 +i* 0.477628| 0.999995|-2.16493E-12 +i* 1.10533E-11| +| 17| 0.893104 +i* 0.449841| 0.999995|-1.48552E-11 +i* 1.06063E-11| +| 18| 0.906777 +i* 0.4216| 0.999995|-1.38745E-11 +i* 5.33384E-12| +| 19| 0.919557 +i* 0.392944| 0.999995|-3.33245E-11 +i* 5.94386E-12| +| 20| 0.931433 +i* 0.363901| 0.999995| 4.93219E-11 +i*-2.82651E-11| ++---+----------------------------+------------+----------------------------+ +499999 racines de module = 0.999995 +299999 racines de module = 1.00001 + 2 racines de module = 1 +proc 0 +proc 1 +proc 2 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^400000 + (-10 +i*0)*x^600000 + (1 +i*0)*x^1000000 + +(-40000 +i*0)*x^399999 + (-6E+06 +i*0)*x^599999 + (1E+06 +i*0)*x^999999 + +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 1, start 333397 size 333397 
+dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 2, start 666794 size 333397 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 0, start 0 size 333397 +proc 0 start 0 size 333397 +proc 1 start 333397 size 333397 +proc 2 start 666794 size 333397 +iter : 1 Arret : 0.000575468 s/iter 24.305180 +iter : 2 Arret : 0.00170361 s/iter 24.785627 +iter : 3 Arret : 0.00222192 s/iter 24.748506 +iter : 4 Arret : 0.017164 s/iter 24.358793 +iter : 5 Arret : 0.0140181 s/iter 24.395447 +iter : 6 Arret : 0.00863706 s/iter 24.606501 +iter : 7 Arret : 0.00646893 s/iter 24.858810 +iter : 8 Arret : 0.00503905 s/iter 24.788762 +iter : 9 Arret : 0.0052262 s/iter 24.427751 +iter : 10 Arret : 0.00485981 s/iter 24.358969 +iter : 11 Arret : 0.00893375 s/iter 24.357900 +iter : 12 Arret : 0.00681765 s/iter 24.368587 +iter : 13 Arret : 0.0016963 s/iter 24.362646 +iter : 14 Arret : 0.00106588 s/iter 24.361655 +iter : 15 Arret : 0.000173681 s/iter 24.354770 +iter : 16 Arret : 1.82719E-05 s/iter 24.350867 +iter : 17 Arret : 2.03911E-05 s/iter 24.358719 +iter : 18 Arret : 3.78438E-06 s/iter 24.284202 +iter : 19 Arret : 1.28475E-07 s/iter 24.295585 +iter : 20 Arret : 1.88663E-09 s/iter 24.290679 +iter : 21 Arret : 2.81124E-11 s/iter 24.288024 +iter : 22 Arret : 4.1882E-13 s/iter 24.288788 +temps : 542.745 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.4225E-07 +Stabilite : 4.77796E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841468| 0.999996| 5.07216E-12 +i* 6.41236E-12| +| 2| 0.529701 +i* 0.84818| 0.999996|-4.61853E-13 +i*-4.17888E-12| +| 3| 0.524361 +i* 0.851491| 0.999996|-2.47296E-11 +i* 1.78327E-11| +| 4| 0.51901 +i* 0.854764| 0.999996| 9.45599E-12 +i* 2.07434E-11| +| 5| 0.513629 +i* 0.858008| 0.999996| 2.32483E-11 +i* 6.70747E-12| +| 6| 0.508237 +i* 0.861213| 0.999996|-1.34339E-11 +i* 
9.87854E-12| +| 7| 0.502825 +i* 0.864384| 0.999996|-3.18459E-11 +i* 7.64744E-12| +| 8| 0.497384 +i* 0.867526| 0.999996| 2.97429E-11 +i*-6.06626E-13| +| 9| 0.491932 +i* 0.870629| 0.999996|-1.74121E-11 +i*-2.86359E-11| +| 10| 0.486452 +i* 0.873703| 0.999996| 3.0312E-11 +i* 1.02214E-11| +| 11| 0.480962 +i* 0.876737| 0.999996| 1.81546E-11 +i* 8.04012E-12| +| 12| 0.475453 +i* 0.879736| 0.999996| 3.09861E-11 +i* 4.093E-12| +| 13| 0.469917 +i* 0.882706| 0.999996|-1.29106E-11 +i*-2.31489E-11| +| 14| 0.46437 +i* 0.885637| 0.999996| 1.38481E-11 +i* -1.517E-11| +| 15| 0.458797 +i* 0.888537| 0.999996| 2.78862E-11 +i* 1.10441E-11| +| 16| 0.453214 +i* 0.891397| 0.999996| 2.45506E-11 +i* 3.1726E-11| +| 17| 0.447614 +i* 0.894223| 0.999996|-1.08491E-12 +i*-2.12277E-11| +| 18| 0.441986 +i* 0.897017| 0.999996| 2.72476E-11 +i* 3.22485E-11| +| 19| 0.436351 +i* 0.899772| 0.999996| 2.92226E-11 +i* 2.71536E-11| +| 20| 0.430689 +i* 0.902496| 0.999996|-1.25435E-11 +i* 3.86925E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 0.999996 +400000 racines de module = 1.00001 +proc 1 +proc 2 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^700000 + (1 +i*0)*x^1200000 + +(-50000 +i*0)*x^499999 + (-7E+06 +i*0)*x^699999 + (1.2E+06 +i*0)*x^1199999 + +zone limite de 'log-exp' 1.0003 +zone limite de 'log-exp' 1.0003 +zone limite de 'log-exp' 1.0003 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 1, start 400042 size 400042 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 0, start 0 size 400042 +proc 1 start 400042 size 400042 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 2, start 800084 size 400042 +proc 2 start 800084 size 400042 +proc 0 start 0 size 400042 +iter : 1 Arret : 0.00577737 s/iter 35.191437 +iter : 2 Arret : 1.60124 s/iter 35.687308 +iter : 3 Arret : 2.50845 s/iter 38.522110 +iter : 4 Arret : 0.88974 s/iter 37.972511 +iter : 5 Arret : 1.13571 s/iter 38.354084 +iter : 6 Arret : 0.802875 s/iter 38.309790 +iter : 
7 Arret : 1.23189 s/iter 38.251469 +iter : 8 Arret : 2.00112 s/iter 38.369432 +iter : 9 Arret : 0.783463 s/iter 39.250540 +iter : 10 Arret : 1.64822 s/iter 38.419390 +iter : 11 Arret : 1.13791 s/iter 38.520696 +iter : 12 Arret : 4.19099 s/iter 38.244319 +iter : 13 Arret : 1.7036 s/iter 37.449747 +iter : 14 Arret : 0.953437 s/iter 37.710513 +iter : 15 Arret : 0.86512 s/iter 37.422749 +iter : 16 Arret : 3.83001 s/iter 37.601442 +iter : 17 Arret : 1.37636 s/iter 37.548538 +iter : 18 Arret : 1.57226 s/iter 37.331887 +iter : 19 Arret : 0.995472 s/iter 37.376323 +iter : 20 Arret : 0.780537 s/iter 37.065303 +iter : 21 Arret : 3.73222 s/iter 36.965816 +iter : 22 Arret : 1.52875 s/iter 36.851015 +iter : 23 Arret : 0.925666 s/iter 36.788322 +iter : 24 Arret : 0.416457 s/iter 36.673216 +iter : 25 Arret : 1.21819 s/iter 36.551043 +iter : 26 Arret : 0.782138 s/iter 36.720148 +iter : 27 Arret : 0.611118 s/iter 36.382233 +iter : 28 Arret : 1.40936 s/iter 36.605900 +iter : 29 Arret : 0.136834 s/iter 36.551610 +iter : 30 Arret : 0.982775 s/iter 36.549899 +iter : 31 Arret : 0.482303 s/iter 36.446318 +iter : 32 Arret : 0.314354 s/iter 35.262030 +iter : 33 Arret : 0.221468 s/iter 35.437839 +iter : 34 Arret : 0.148832 s/iter 35.903162 +iter : 35 Arret : 0.0771528 s/iter 35.243527 +iter : 36 Arret : 0.00786376 s/iter 35.408694 +iter : 37 Arret : 0.00153832 s/iter 35.423139 +iter : 38 Arret : 0.00226222 s/iter 35.250849 +iter : 39 Arret : 0.000875734 s/iter 35.254600 +iter : 40 Arret : 2.10425E-05 s/iter 35.253398 +iter : 41 Arret : 2.59204E-06 s/iter 35.253869 +iter : 42 Arret : 2.06088E-08 s/iter 35.143640 +iter : 43 Arret : 8.18267E-11 s/iter 35.260245 +iter : 44 Arret : 3.25714E-13 s/iter 35.264980 +temps : 1617.65 seconde(s) +Nb iterations : 44 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.09088E-05 +Stabilite : 2.22047E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | 
++---+----------------------------+------------+----------------------------+ +| 1| 0.54031 +i* 0.841472| 1| 1.4588E-09 +i* 4.51768E-09| +| 2| 0.513629 +i* 0.858008| 0.999997| 3.02357E-11 +i* 3.41858E-11| +| 3| 0.486451 +i* 0.873713| 1|-5.85295E-09 +i*-2.49566E-10| +| 4| 0.458789 +i* 0.888542| 0.999997| 2.48135E-13 +i*-2.88822E-11| +| 5| 0.430677 +i* 0.902502| 0.999997|-2.03271E-11 +i*-3.18325E-11| +| 6| 0.402092 +i* 0.915605| 1| 5.55538E-09 +i*-1.34284E-09| +| 7| 0.3732 +i* 0.927747| 0.999997| -2.5707E-11 +i* 3.11093E-13| +| 8| 0.3439 +i* 0.939003| 0.999997|-1.12714E-11 +i* 1.5453E-11| +| 9| 0.314261 +i* 0.949333| 0.999997| 5.41895E-11 +i*-2.05278E-11| +| 10| 0.284313 +i* 0.958728| 0.999997| 2.69426E-11 +i* 2.77974E-11| +| 11| 0.254084 +i* 0.967179| 0.999997| 1.5277E-11 +i* 4.73027E-12| +| 12| 0.223605 +i* 0.974676| 0.999997| -8.1017E-11 +i*-3.77299E-11| +| 13| 0.192915 +i* 0.981212| 0.999997| 1.07495E-11 +i* 5.766E-12| +| 14| 0.162017 +i* 0.986785| 0.999997| 4.59321E-12 +i*-4.42106E-13| +| 15| 0.130977 +i* 0.991382| 0.999997| 5.89659E-11 +i* 7.29122E-12| +| 16| 0.0997898 +i* 0.995005| 0.999997|-3.84177E-11 +i*-1.21923E-11| +| 17| 0.0685136 +i* 0.997647| 0.999997|-2.98188E-11 +i* 2.79243E-12| +| 18| 0.0371504 +i* 0.999314| 1|-3.18728E-10 +i*-2.97119E-09| +| 19| 0.00578048 +i* 0.99998| 0.999997| 3.46787E-11 +i* 1.94857E-13| +| 20| -0.0256056 +i* 0.999669| 0.999997| 2.01068E-11 +i*-1.22213E-12| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +700000 racines de module = 0.999997 +proc 0 +proc 1 +proc 2 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^600000 + (-10 +i*0)*x^800000 + (1 +i*0)*x^1400000 + +(-60000 +i*0)*x^599999 + (-8E+06 +i*0)*x^799999 + (1.4E+06 +i*0)*x^1399999 + +zone limite de 'log-exp' 1.00025 +zone limite de 'log-exp' 1.00025 +zone limite de 'log-exp' 1.00025 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 1, start 466688 size 466688 +proc 1 start 466688 size 466688 +dimgrid 5469 dimblock 256 degrePoly 
1400000 +proc 2, start 933376 size 466688 +proc 2 start 933376 size 466688 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 0, start 0 size 466688 +proc 0 start 0 size 466688 +iter : 1 Arret : 0.0476652 s/iter 48.053051 +iter : 2 Arret : 1.02145 s/iter 49.162936 +iter : 3 Arret : 3.11851 s/iter 50.138080 +iter : 4 Arret : 1.87547 s/iter 50.661272 +iter : 5 Arret : 1.24028 s/iter 52.617942 +iter : 6 Arret : 1.33274 s/iter 52.723740 +iter : 7 Arret : 1.1089 s/iter 52.451625 +iter : 8 Arret : 1.32856 s/iter 53.817849 +iter : 9 Arret : 0.584436 s/iter 54.233382 +iter : 10 Arret : 0.682561 s/iter 53.018367 +iter : 11 Arret : 1.10899 s/iter 52.903852 +iter : 12 Arret : 1.24673 s/iter 52.699001 +iter : 13 Arret : 2.03756 s/iter 51.822577 +iter : 14 Arret : 0.74595 s/iter 51.940124 +iter : 15 Arret : 0.336711 s/iter 51.566761 +iter : 16 Arret : 0.386748 s/iter 51.449106 +iter : 17 Arret : 0.175345 s/iter 51.008579 +iter : 18 Arret : 0.0799077 s/iter 50.523143 +iter : 19 Arret : 0.106562 s/iter 50.311514 +iter : 20 Arret : 0.102063 s/iter 50.013859 +iter : 21 Arret : 0.0811226 s/iter 48.967237 +iter : 22 Arret : 0.0777804 s/iter 48.802184 +iter : 23 Arret : 0.06176 s/iter 48.968763 +iter : 24 Arret : 0.0274141 s/iter 48.869900 +iter : 25 Arret : 0.0246722 s/iter 48.033190 +iter : 26 Arret : 0.0140326 s/iter 48.024256 +iter : 27 Arret : 0.00823776 s/iter 48.046597 +iter : 28 Arret : 0.00458441 s/iter 48.050189 +iter : 29 Arret : 0.000250093 s/iter 48.028503 +iter : 30 Arret : 6.92011E-06 s/iter 48.046144 +iter : 31 Arret : 1.1801E-07 s/iter 48.051103 +iter : 32 Arret : 1.60292E-09 s/iter 48.032612 +iter : 33 Arret : 2.20691E-11 s/iter 48.032677 +iter : 34 Arret : 3.03651E-13 s/iter 48.049192 +temps : 1707.73 seconde(s) +Nb iterations : 34 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.35409E-07 +Stabilite : 2.22046E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | 
++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841469| 0.999997|-8.47142E-11 +i* 1.92466E-11| +| 2| 0.513623 +i* 0.858013| 0.999997|-2.15776E-11 +i*-2.98557E-11| +| 3| -0.52703 +i* -0.849843| 0.999997|-6.50922E-11 +i* 8.44216E-12| +| 4| 0.486439 +i* 0.873711| 0.999997|-3.15932E-11 +i*-1.15957E-12| +| 5| -0.500096 +i* -0.865967| 0.999997| 3.56147E-11 +i*-3.12713E-11| +| 6| 0.458776 +i* 0.888549| 0.999997|-1.89702E-11 +i* 4.08274E-12| +| 7| -0.472669 +i* -0.881237| 0.999997|-1.66496E-11 +i*-3.61498E-11| +| 8| 0.430661 +i* 0.902511| 0.999997|-1.60558E-11 +i*-1.29949E-11| +| 9| -0.444791 +i* -0.895631| 0.999997|-8.89955E-13 +i* 2.61938E-12| +| 10| 0.402136 +i* 0.915577| 0.999997| 6.5834E-12 +i* -1.3935E-11| +| 11| -0.416432 +i* -0.909164| 0.999997| 1.97816E-11 +i* 3.10848E-11| +| 12| 0.373171 +i* 0.927759| 0.999997|-2.17995E-11 +i*-2.96867E-12| +| 13| -0.387698 +i* -0.921783| 0.999997|-1.86324E-11 +i* -4.6545E-11| +| 14| 0.343875 +i* 0.939012| 0.999997| 3.84962E-11 +i* 2.59646E-11| +| 15| -0.358575 +i* -0.933498| 0.999997|-3.74776E-11 +i*-3.89954E-11| +| 16| 0.314233 +i* 0.949343| 0.999997| 1.02587E-11 +i*-4.25648E-11| +| 17| -0.329098 +i* -0.944293| 0.999997|-1.57903E-11 +i* 2.05052E-11| +| 18| 0.284281 +i* 0.958738| 0.999997| 2.51592E-11 +i* 2.09243E-11| +| 19| -0.299297 +i* -0.954157| 0.999997| 5.03608E-12 +i* 1.70503E-11| +| 20| 0.254048 +i* 0.967189| 0.999997|-2.81228E-11 +i*-1.66302E-11| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 0.999997 +600000 racines de module = 1 +proc 0 +proc 1 +proc 2 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^700000 + (-10 +i*0)*x^900000 + (1 +i*0)*x^1600000 + +(-70000 +i*0)*x^699999 + (-9E+06 +i*0)*x^899999 + (1.6E+06 +i*0)*x^1599999 + + +template:31135 terminated with signal 11 at PC=404b41 SP=7fffb89650f0. 
Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:31134 terminated with signal 11 at PC=404b41 SP=7fff9a829580. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:31136 terminated with signal 11 at PC=404b41 SP=7fffe0fa8a40. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 1 with PID 31135 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- +proc 1 +proc 2 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^800000 + (-10 +i*0)*x^1000000 + (1 +i*0)*x^1800000 + +(-80000 +i*0)*x^799999 + (-1E+07 +i*0)*x^999999 + (1.8E+06 +i*0)*x^1799999 + + +template:31146 terminated with signal 11 at PC=404b41 SP=7fff82ca5fc0. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:31144 terminated with signal 11 at PC=404b41 SP=7fff0a32a700. 
Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:31145 terminated with signal 11 at PC=404b41 SP=7fff9885ac60. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 1 with PID 31145 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- +proc 1 +proc 2 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^1500000 + (1 +i*0)*x^2000000 + +(-50000 +i*0)*x^499999 + (-1.5E+07 +i*0)*x^1499999 + (2E+06 +i*0)*x^1999999 + + +template:31155 terminated with signal 11 at PC=404b41 SP=7fff5c26c610. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:31154 terminated with signal 11 at PC=404b41 SP=7fffd7c701a0. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:31156 terminated with signal 11 at PC=404b41 SP=7fff9a2a1b00. 
Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 1 with PID 31155 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- diff --git a/Simulations/sparse_mpi/sparse_mpi_3GPU.sge b/Simulations/sparse_mpi/sparse_mpi_3GPU.sge new file mode 100644 index 0000000..e779c55 --- /dev/null +++ b/Simulations/sparse_mpi/sparse_mpi_3GPU.sge @@ -0,0 +1,25 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=3 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -V +#$ -cwd +#$ -N sparse_mpi_3GPU +#$ -pe mpi 3 + + +module load cuda/7.0 +module load ompi/gcc + +mpirun -np $NSLOTS ./template -r -i 60000 40000 +mpirun -np $NSLOTS ./template -r -i 150000 50000 +mpirun -np $NSLOTS ./template -r -i 250000 150000 +mpirun -np $NSLOTS ./template -r -i 350000 250000 +mpirun -np $NSLOTS ./template -r -i 500000 300000 +mpirun -np $NSLOTS ./template -r -i 600000 400000 +mpirun -np $NSLOTS ./template -r -i 700000 500000 +mpirun -np $NSLOTS ./template -r -i 800000 600000 +mpirun -np $NSLOTS ./template -r -i 900000 700000 +mpirun -np $NSLOTS ./template -r -i 1000000 800000 +mpirun -np $NSLOTS ./template -r -i 1500000 500000 diff 
--git a/Simulations/sparse_mpi/sparse_mpi_4GPU.o140023 b/Simulations/sparse_mpi/sparse_mpi_4GPU.o140023 new file mode 100644 index 0000000..872679a --- /dev/null +++ b/Simulations/sparse_mpi/sparse_mpi_4GPU.o140023 @@ -0,0 +1,841 @@ +REMAINING: 4 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +Taking GPU #3 +proc 2 +proc 3 +proc 0 +proc 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^40000 + (-10 +i*0)*x^60000 + (1 +i*0)*x^100000 + +(-4000 +i*0)*x^39999 + (-600000 +i*0)*x^59999 + (100000 +i*0)*x^99999 + +zone limite de 'log-exp' 1.00356 +zone limite de 'log-exp' 1.00356 +zone limite de 'log-exp' 1.00356 +zone limite de 'log-exp' 1.00356 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 2, start 50048 size 25024 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 0, start 0 size 25024 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 1, start 25024 size 25024 +proc 2 start 50048 size 25024 +dimgrid 391 dimblock 256 degrePoly 100000 +proc 3, start 75072 size 25024 +proc 3 start 75072 size 25024 +proc 0 start 0 size 25024 +proc 1 start 25024 size 25024 +iter : 1 Arret : 0.00317264 s/iter 0.222955 +iter : 2 Arret : 0.00227167 s/iter 0.222762 +iter : 3 Arret : 0.00211003 s/iter 0.222838 +iter : 4 Arret : 0.00200743 s/iter 0.222746 +iter : 5 Arret : 0.00207223 s/iter 0.222703 +iter : 6 Arret : 0.00517083 s/iter 0.222804 +iter : 7 Arret : 0.0188667 s/iter 0.297002 +iter : 8 Arret : 0.0181557 s/iter 0.222717 +iter : 9 Arret : 0.0045178 s/iter 0.295501 +iter : 10 Arret : 0.000994006 s/iter 0.222726 +iter : 11 Arret : 0.00103689 s/iter 0.222762 +iter : 12 Arret : 0.000385068 s/iter 0.222694 +iter : 13 Arret : 0.000378374 s/iter 0.222655 +iter : 14 Arret : 0.000135377 s/iter 0.222528 +iter : 15 Arret : 2.77949E-05 s/iter 0.222508 +iter : 16 Arret : 6.74524E-07 s/iter 0.222580 +iter : 17 Arret : 2.18155E-09 s/iter 0.222640 +iter : 18 Arret : 2.22292E-11 s/iter 0.222554 +iter : 19 Arret : 3.31178E-13 s/iter 0.222495 +temps : 4.60588 seconde(s) +Nb iterations : 19 +Nb de depassements de capacite 
exponentielle : 0 +Precision : 2.75156E-07 +Stabilite : 1.57015E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540308 +i* 0.841422| 0.999962|-1.95866E-12 +i*-4.55465E-13| +| 2| -0.113164 +i* 0.993538| 0.999962|-4.34919E-12 +i* 9.60242E-13| +| 3| -0.226732 +i* -0.974016| 1.00006|-1.34468E-09 +i*-3.70749E-10| +| 4| -0.715763 +i* 0.698289| 0.999962| 9.11271E-13 +i* 2.47219E-12| +| 5| 0.439922 +i* -0.897993| 0.999962|-3.49498E-13 +i* 1.66432E-12| +| 6| -0.996122 +i* 0.0886386| 1.00006| 4.72785E-10 +i* 4.13616E-11| +| 7| 0.908546 +i* -0.417692| 0.999962| 4.78506E-13 +i* 1.54377E-13| +| 8| -0.827813 +i* -0.560935| 0.999962| 9.76996E-13 +i*-2.04309E-12| +| 9| 0.968129 +i* 0.250682| 1.00006|-2.31715E-10 +i* 1.34848E-10| +| 10| -0.286842 +i* -0.958038| 1.00006|-5.93554E-10 +i*-2.45345E-10| +| 11| 0.591653 +i* 0.806145| 0.999962|-9.87654E-13 +i*-3.03635E-12| +| 12| -0.0511836 +i* 0.998651| 0.999962|-2.22622E-12 +i*-3.69013E-14| +| 13| -0.67097 +i* 0.741432| 0.999962|-8.03801E-14 +i*-1.68204E-12| +| 14| 0.383249 +i* -0.923603| 0.999962|-1.29119E-12 +i*-1.37426E-12| +| 15| -0.988685 +i* 0.15039| 1.00006|-1.61051E-10 +i* 7.18515E-11| +| 16| 0.880824 +i* -0.473363| 0.999962|-4.03455E-13 +i* 2.85139E-12| +| 17| -0.861082 +i* -0.508391| 0.999962| 9.8066E-13 +i* 3.40478E-12| +| 18| 0.98184 +i* 0.190015| 1.00006| 8.88373E-10 +i*-2.66385E-10| +| 19| -0.345842 +i* -0.938354| 1.00006| 1.38421E-10 +i*-2.31696E-10| +| 20| 0.640621 +i* 0.767807| 0.999962|-6.98774E-13 +i* 1.13798E-12| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 0.999962 +40000 racines de module = 1.00006 +proc 0 +proc 1 +proc 2 +proc 3 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^50000 + (-10 +i*0)*x^150000 + (1 +i*0)*x^200000 + +(-5000 +i*0)*x^49999 + (-1.5E+06 +i*0)*x^149999 + (200000 +i*0)*x^199999 + +zone limite de 'log-exp' 
1.00178 +zone limite de 'log-exp' 1.00178 +zone limite de 'log-exp' 1.00178 +zone limite de 'log-exp' 1.00178 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 3, start 150144 size 50048 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 2, start 100096 size 50048 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 1, start 50048 size 50048 +proc 2 start 100096 size 50048 +proc 3 start 150144 size 50048 +dimgrid 782 dimblock 256 degrePoly 200000 +proc 0, start 0 size 50048 +proc 0 start 0 size 50048 +proc 1 start 50048 size 50048 +iter : 1 Arret : 0.000151301 s/iter 0.883876 +iter : 2 Arret : 0.000148172 s/iter 0.883954 +iter : 3 Arret : 0.000150921 s/iter 0.883918 +iter : 4 Arret : 0.00104559 s/iter 0.884013 +iter : 5 Arret : 0.00193123 s/iter 0.883951 +iter : 6 Arret : 0.0272836 s/iter 1.046760 +iter : 7 Arret : 0.102911 s/iter 1.039676 +iter : 8 Arret : 0.511951 s/iter 1.007660 +iter : 9 Arret : 0.34938 s/iter 1.017711 +iter : 10 Arret : 0.169476 s/iter 1.028045 +iter : 11 Arret : 0.0996115 s/iter 1.022146 +iter : 12 Arret : 0.0682782 s/iter 1.027682 +iter : 13 Arret : 0.0829552 s/iter 0.882503 +iter : 14 Arret : 0.0066689 s/iter 0.883836 +iter : 15 Arret : 0.0948233 s/iter 0.883899 +iter : 16 Arret : 0.00657146 s/iter 0.883885 +iter : 17 Arret : 0.00573604 s/iter 0.883894 +iter : 18 Arret : 0.00176675 s/iter 0.883914 +iter : 19 Arret : 0.000248502 s/iter 0.883875 +iter : 20 Arret : 6.04596E-05 s/iter 0.883987 +iter : 21 Arret : 4.48743E-06 s/iter 0.883955 +iter : 22 Arret : 4.98896E-09 s/iter 0.883421 +iter : 23 Arret : 4.99197E-13 s/iter 0.883862 +temps : 21.5922 seconde(s) +Nb iterations : 23 +Nb de depassements de capacite exponentielle : 0 +Precision : 0.000249603 +Stabilite : 2.22061E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540303 +i* 0.841453| 0.999985| 1.08703E-11 +i*-2.49217E-12| +| 2| -0.837195 +i* 
0.546877| 0.999985| -5.4492E-12 +i* 1.09163E-12| +| 3| -0.553418 +i* -0.832885| 0.999985| -1.9722E-12 +i*-7.40397E-12| +| 4| 0.828599 +i* -0.559925| 1.00005|-7.54521E-09 +i* 1.47059E-08| +| 5| -0.8197 +i* 0.572767| 0.999985|-4.21663E-13 +i* -2.8616E-12| +| 6| -0.57917 +i* -0.815188| 0.999985|-5.13034E-12 +i*-1.52645E-12| +| 7| 0.810626 +i* -0.585537| 0.999985| 8.64808E-12 +i* 7.46794E-12| +| 8| 0.591872 +i* 0.806089| 1.00005|-1.69803E-09 +i* 9.43795E-09| +| 9| -0.801454 +i* 0.598134| 1.00005| 2.77439E-08 +i*-6.74504E-09| +| 10| -0.604356 +i* -0.796695| 0.999985|-1.64091E-13 +i* 1.59084E-12| +| 11| 0.791937 +i* -0.610578| 0.999985| 6.0707E-13 +i* 1.52922E-12| +| 12| 0.616763 +i* 0.78713| 0.999985|-4.48042E-12 +i* -2.6295E-12| +| 13| -0.782301 +i* 0.622877| 0.999985|-2.15827E-12 +i*-6.27114E-12| +| 14| -0.628991 +i* -0.777472| 1.00005| 6.93065E-09 +i*-8.65443E-09| +| 15| 0.772474 +i* -0.635023| 0.999985| 1.54783E-11 +i*-1.81338E-12| +| 16| 0.641054 +i* 0.767476| 0.999985|-3.47633E-12 +i* 1.20617E-11| +| 17| -0.762458 +i* 0.647014| 0.999985|-7.74447E-12 +i* 7.566E-12| +| 18| -0.652967 +i* -0.757366| 0.999985| 5.10392E-12 +i*-6.61069E-12| +| 19| 0.752302 +i* -0.658888| 1.00005| 3.99107E-09 +i* 1.02117E-08| +| 20| 0.66472 +i* 0.747072| 0.999985|-7.79776E-12 +i*-2.52076E-13| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 0.999985 +50000 racines de module = 1.00005 +proc 0 +proc 1 +proc 2 +proc 3 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^150000 + (-10 +i*0)*x^250000 + (1 +i*0)*x^400000 + +(-15000 +i*0)*x^149999 + (-2.5E+06 +i*0)*x^249999 + (400000 +i*0)*x^399999 + +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +zone limite de 'log-exp' 1.00089 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 1, start 100032 size 100032 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 0, start 0 size 100032 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 2, start 200064 size 100032 
+proc 0 start 0 size 100032 +dimgrid 1563 dimblock 256 degrePoly 400000 +proc 3, start 300096 size 100032 +proc 3 start 300096 size 100032 +proc 1 start 100032 size 100032 +proc 2 start 200064 size 100032 +iter : 1 Arret : 0.00163991 s/iter 3.109950 +iter : 2 Arret : 0.00132877 s/iter 3.110375 +iter : 3 Arret : 0.00184513 s/iter 3.110742 +iter : 4 Arret : 0.00262495 s/iter 3.111236 +iter : 5 Arret : 0.0150209 s/iter 3.111022 +iter : 6 Arret : 0.0137099 s/iter 3.414358 +iter : 7 Arret : 0.00835719 s/iter 3.385934 +iter : 8 Arret : 0.00440643 s/iter 3.394557 +iter : 9 Arret : 0.0060742 s/iter 3.385816 +iter : 10 Arret : 0.0050336 s/iter 3.099272 +iter : 11 Arret : 0.00112426 s/iter 3.099497 +iter : 12 Arret : 0.000775148 s/iter 3.099486 +iter : 13 Arret : 0.000376719 s/iter 3.099346 +iter : 14 Arret : 0.00024255 s/iter 3.099473 +iter : 15 Arret : 0.00012922 s/iter 3.099323 +iter : 16 Arret : 7.83137E-06 s/iter 3.099139 +iter : 17 Arret : 1.24719E-07 s/iter 3.099356 +iter : 18 Arret : 1.90294E-09 s/iter 3.099211 +iter : 19 Arret : 2.90173E-11 s/iter 3.099200 +iter : 20 Arret : 4.42472E-13 s/iter 3.099323 +temps : 63.5457 seconde(s) +Nb iterations : 20 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.49185E-08 +Stabilite : 4.42472E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540313 +i* 0.841453| 0.999991| 9.34197E-12 +i*-1.23633E-11| +| 2| -0.998329 +i* 0.057622| 0.999991| 4.43912E-12 +i* 1.27665E-12| +| 3| 0.439833 +i* -0.898097| 1.00002| 5.42841E-10 +i*-5.60653E-10| +| 4| -0.996033 +i* 0.0888768| 0.999991|-3.15592E-12 +i* 1.17456E-12| +| 5| 0.411559 +i* -0.9114| 1.00002| 1.04334E-09 +i*-9.84037E-10| +| 6| 0.59196 +i* 0.805956| 0.999991| 5.24358E-13 +i*-8.53073E-12| +| 7| -0.992759 +i* 0.120044| 0.999991| 2.58804E-12 +i* 2.47274E-12| +| 8| 0.382796 +i* -0.923823| 0.999991|-1.63092E-11 +i* 4.26312E-12| 
+| 9| 0.616925 +i* 0.78701| 0.999991| 4.27514E-12 +i*-1.13966E-11| +| 10| -0.988534 +i* 0.151098| 1.00002|-8.27014E-10 +i* 9.44171E-10| +| 11| 0.35366 +i* -0.935364| 0.999991|-1.92664E-11 +i* 1.19958E-11| +| 12| 0.641299 +i* 0.767311| 1.00002|-2.44657E-09 +i* -6.7886E-11| +| 13| -0.983301 +i* 0.182074| 1.00002| 4.64689E-09 +i* 2.00425E-09| +| 14| 0.324176 +i* -0.945987| 0.999991|-5.20695E-12 +i*-7.06984E-12| +| 15| 0.665084 +i* 0.746789| 1.00002| 1.80952E-09 +i* 3.83855E-09| +| 16| -0.977132 +i* 0.212706| 1.00002|-2.02093E-10 +i* 3.44548E-10| +| 17| 0.294374 +i* -0.955681| 0.999991|-2.37395E-11 +i*-2.53098E-12| +| 18| 0.688092 +i* 0.725645| 1.00002|-4.51021E-09 +i* 1.95437E-09| +| 19| -0.969965 +i* 0.243206| 0.999991| 6.88072E-12 +i* 3.20268E-13| +| 20| 0.264283 +i* -0.964436| 0.999991|-6.93356E-12 +i*-6.23118E-12| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 0.999991 +150000 racines de module = 1.00002 +proc 1 +proc 2 +proc 3 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^250000 + (-10 +i*0)*x^350000 + (1 +i*0)*x^600000 + +(-25000 +i*0)*x^249999 + (-3.5E+06 +i*0)*x^349999 + (600000 +i*0)*x^599999 + +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +zone limite de 'log-exp' 1.00059 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 0, start 0 size 150016 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 1, start 150016 size 150016 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 2, start 300032 size 150016 +proc 2 start 300032 size 150016 +dimgrid 2344 dimblock 256 degrePoly 600000 +proc 3, start 450048 size 150016 +proc 3 start 450048 size 150016 +proc 0 start 0 size 150016 +proc 1 start 150016 size 150016 +iter : 1 Arret : 0.00232098 s/iter 6.732718 +iter : 2 Arret : 0.0100189 s/iter 7.051391 +iter : 3 Arret : 0.283193 s/iter 6.895968 +iter : 4 Arret : 0.546502 s/iter 7.050469 +iter : 5 Arret : 1.13206 s/iter 7.216506 +iter : 6 Arret : 0.441232 s/iter 7.188011 
+iter : 7 Arret : 0.210349 s/iter 7.506718 +iter : 8 Arret : 0.182959 s/iter 7.511723 +iter : 9 Arret : 0.15465 s/iter 7.074342 +iter : 10 Arret : 0.0273709 s/iter 7.116926 +iter : 11 Arret : 0.0179972 s/iter 7.067210 +iter : 12 Arret : 0.00914143 s/iter 7.085819 +iter : 13 Arret : 0.0269815 s/iter 7.021625 +iter : 14 Arret : 0.0268503 s/iter 6.729633 +iter : 15 Arret : 0.00822944 s/iter 6.729247 +iter : 16 Arret : 0.000264736 s/iter 6.731353 +iter : 17 Arret : 8.47333E-05 s/iter 6.730750 +iter : 18 Arret : 5.17416E-06 s/iter 6.730768 +iter : 19 Arret : 1.12397E-07 s/iter 6.731123 +iter : 20 Arret : 1.61278E-09 s/iter 6.731670 +iter : 21 Arret : 2.30014E-11 s/iter 6.731613 +iter : 22 Arret : 3.28041E-13 s/iter 6.730969 +temps : 153.471 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.81388E-08 +Stabilite : 3.28041E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540302 +i* 0.841463| 0.999993| 8.34199E-12 +i* -1.9051E-11| +| 2| -0.553438 +i* -0.832883| 0.999993|-2.10654E-12 +i*-2.55273E-11| +| 3| -0.579282 +i* -0.815119| 0.999993|-1.44751E-12 +i* 7.66798E-12| +| 4| 0.592012 +i* 0.805941| 1.00001| 4.1526E-09 +i* 1.02046E-09| +| 5| -0.604557 +i* -0.796554| 0.999993|-2.82974E-12 +i* 9.99473E-12| +| 6| 0.61698 +i* 0.78697| 0.999993| 9.01823E-12 +i*-5.69156E-12| +| 7| -0.629237 +i* -0.777205| 0.999993|-2.92122E-12 +i*-4.85867E-12| +| 8| 0.641354 +i* 0.767237| 0.999993|-1.64209E-11 +i* 1.12904E-12| +| 9| -0.653299 +i* -0.757092| 0.999993|-8.22453E-13 +i* 2.82818E-12| +| 10| 0.665096 +i* 0.746749| 0.999993| -1.2145E-11 +i* 1.89129E-11| +| 11| -0.676717 +i* -0.736234| 0.999993|-1.26079E-11 +i*-1.25073E-11| +| 12| 0.688185 +i* 0.725526| 0.999993|-4.43978E-12 +i*-2.31382E-11| +| 13| -0.699466 +i* -0.714679| 1.00001| 3.92343E-10 +i*-3.02623E-09| +| 14| 0.710597 +i* 0.70359| 0.999993| 
1.28564E-11 +i* 1.56626E-11| +| 15| -0.721517 +i* -0.69241| 1.00001| 1.76709E-09 +i*-4.04041E-09| +| 16| 0.73231 +i* 0.680962| 0.999993| 1.34706E-11 +i*-4.43489E-12| +| 17| -0.742916 +i* -0.669375| 0.999993| 1.59349E-11 +i* 1.71025E-11| +| 18| 0.7533 +i* 0.657691| 1.00001|-2.76219E-09 +i* 4.10298E-09| +| 19| -0.76354 +i* -0.64575| 0.999993| 2.24043E-11 +i*-1.30496E-12| +| 20| 0.773539 +i* 0.633763| 1.00001|-3.80449E-10 +i* 3.97541E-09| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 0.999993 +250000 racines de module = 1.00001 +proc 1 +proc 2 +proc 3 +proc 0 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^300000 + (-10 +i*0)*x^500000 + (1 +i*0)*x^800000 + +(-30000 +i*0)*x^299999 + (-5E+06 +i*0)*x^499999 + (800000 +i*0)*x^799999 + +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +zone limite de 'log-exp' 1.00044 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 3, start 600000 size 200000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 1, start 200000 size 200000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 0, start 0 size 200000 +dimgrid 3125 dimblock 256 degrePoly 800000 +proc 3 start 600000 size 200000 +proc 0 start 0 size 200000 +proc 1 start 200000 size 200000 +proc 2, start 400000 size 200000 +proc 2 start 400000 size 200000 +iter : 1 Arret : 0.00108417 s/iter 12.159097 +iter : 2 Arret : 0.00154617 s/iter 12.285160 +iter : 3 Arret : 0.0140448 s/iter 12.174373 +iter : 4 Arret : 0.150783 s/iter 12.211473 +iter : 5 Arret : 0.984534 s/iter 12.253215 +iter : 6 Arret : 0.846873 s/iter 12.667593 +iter : 7 Arret : 0.850687 s/iter 12.449265 +iter : 8 Arret : 0.239017 s/iter 12.498637 +iter : 9 Arret : 0.0932856 s/iter 12.372293 +iter : 10 Arret : 0.0273595 s/iter 12.770787 +iter : 11 Arret : 0.0236411 s/iter 12.268012 +iter : 12 Arret : 0.0229952 s/iter 12.192238 +iter : 13 Arret : 0.00327267 s/iter 12.153660 +iter : 14 Arret : 0.00103051 s/iter 12.183109 +iter : 15 
Arret : 0.000584357 s/iter 12.153559 +iter : 16 Arret : 0.000158231 s/iter 12.151369 +iter : 17 Arret : 9.49875E-05 s/iter 12.153222 +iter : 18 Arret : 4.14038E-05 s/iter 12.152653 +iter : 19 Arret : 3.27846E-05 s/iter 12.153803 +iter : 20 Arret : 7.57551E-06 s/iter 12.157708 +iter : 21 Arret : 4.73473E-08 s/iter 12.155670 +iter : 22 Arret : 1.01116E-10 s/iter 12.154833 +iter : 23 Arret : 2.17895E-13 s/iter 12.155276 +temps : 282.444 seconde(s) +Nb iterations : 23 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.01989E-05 +Stabilite : 2.17895E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841464| 0.999995|-5.33817E-12 +i*-1.81878E-11| +| 2| 0.592014 +i* 0.805922| 0.999995| 2.33948E-11 +i*-2.13005E-11| +| 3| 0.617007 +i* 0.786952| 0.999995| 4.23442E-11 +i* -6.2147E-12| +| 4| 0.641392 +i* 0.767207| 0.999995|-4.99742E-11 +i* 1.43873E-11| +| 5| 0.665146 +i* 0.746707| 0.999995| 2.02977E-11 +i* 7.48579E-12| +| 6| 0.688245 +i* 0.725472| 0.999995|-1.73153E-11 +i* -1.2656E-11| +| 7| 0.710667 +i* 0.703522| 0.999995| 3.69782E-12 +i* 2.3081E-12| +| 8| 0.732388 +i* 0.68088| 0.999995| 9.45355E-12 +i* 2.09024E-11| +| 9| 0.753381 +i* 0.657577| 0.999995| 1.7531E-11 +i*-4.02243E-11| +| 10| 0.77364 +i* 0.633618| 0.999995|-1.72307E-11 +i* 1.22723E-11| +| 11| 0.793138 +i* 0.609034| 0.999995| 3.89222E-12 +i* 2.21356E-11| +| 12| 0.811855 +i* 0.583851| 0.999995|-1.28337E-11 +i*-5.47207E-12| +| 13| 0.829772 +i* 0.558094| 0.999995|-1.63114E-11 +i*-1.64246E-12| +| 14| 0.846873 +i* 0.531786| 0.999995|-1.80345E-12 +i* 5.96675E-11| +| 15| 0.86314 +i* 0.504956| 0.999995|-4.00413E-12 +i* 3.04823E-11| +| 16| 0.878557 +i* 0.477628| 0.999995|-2.16493E-12 +i* 1.10533E-11| +| 17| 0.893104 +i* 0.449841| 0.999995|-1.48552E-11 +i* 1.06063E-11| +| 18| 0.906777 +i* 0.4216| 0.999995|-1.38745E-11 +i* 5.33384E-12| +| 19| 0.919557 
+i* 0.392944| 0.999995| 4.13796E-11 +i*-2.48189E-11| +| 20| 0.931433 +i* 0.363901| 0.999995| 4.93219E-11 +i*-2.82651E-11| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 0.999995 +300000 racines de module = 1.00001 +proc 0 +proc 1 +proc 2 +proc 3 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^400000 + (-10 +i*0)*x^600000 + (1 +i*0)*x^1000000 + +(-40000 +i*0)*x^399999 + (-6E+06 +i*0)*x^599999 + (1E+06 +i*0)*x^999999 + +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +zone limite de 'log-exp' 1.00035 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 1, start 250048 size 250048 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 2, start 500096 size 250048 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 3, start 750144 size 250048 +dimgrid 3907 dimblock 256 degrePoly 1000000 +proc 0, start 0 size 250048 +proc 0 start 0 size 250048 +proc 1 start 250048 size 250048 +proc 2 start 500096 size 250048 +proc 3 start 750144 size 250048 +iter : 1 Arret : 0.00113008 s/iter 18.764692 +iter : 2 Arret : 0.00490148 s/iter 18.766269 +iter : 3 Arret : 0.00255472 s/iter 18.765964 +iter : 4 Arret : 0.00771565 s/iter 19.551743 +iter : 5 Arret : 0.0148595 s/iter 19.510100 +iter : 6 Arret : 0.079485 s/iter 18.780627 +iter : 7 Arret : 1.0761 s/iter 19.466310 +iter : 8 Arret : 0.523791 s/iter 19.319585 +iter : 9 Arret : 0.256077 s/iter 18.918614 +iter : 10 Arret : 0.128041 s/iter 18.796063 +iter : 11 Arret : 0.0619619 s/iter 18.783666 +iter : 12 Arret : 0.0408163 s/iter 18.797339 +iter : 13 Arret : 0.028885 s/iter 18.787154 +iter : 14 Arret : 0.0101069 s/iter 18.869406 +iter : 15 Arret : 0.00233147 s/iter 18.789676 +iter : 16 Arret : 0.000443751 s/iter 18.784933 +iter : 17 Arret : 2.02171E-05 s/iter 18.760903 +iter : 18 Arret : 3.97233E-05 s/iter 18.758606 +iter : 19 Arret : 4.71594E-06 s/iter 18.782682 +iter : 20 Arret : 1.93517E-07 s/iter 18.760467 +iter : 21 Arret : 1.50186E-09 s/iter 
18.801736 +iter : 22 Arret : 2.23717E-11 s/iter 18.757476 +iter : 23 Arret : 3.33298E-13 s/iter 18.760972 +temps : 440.06 seconde(s) +Nb iterations : 23 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.68365E-07 +Stabilite : 2.22044E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540414 +i* 0.841394| 0.999996| 2.27135E-11 +i*-8.06094E-12| +| 2| 0.529701 +i* 0.84818| 0.999996|-4.61853E-13 +i*-4.17888E-12| +| 3| 0.524361 +i* 0.851491| 0.999996|-2.47296E-11 +i* 1.78327E-11| +| 4| 0.51901 +i* 0.854764| 0.999996| 9.45599E-12 +i* 2.07434E-11| +| 5| 0.513629 +i* 0.858008| 0.999996| 2.32483E-11 +i* 6.70747E-12| +| 6| 0.508237 +i* 0.861213| 0.999996|-1.34339E-11 +i* 9.87854E-12| +| 7| 0.502825 +i* 0.864384| 0.999996|-3.18459E-11 +i* 7.64744E-12| +| 8| 0.497384 +i* 0.867526| 0.999996| 1.87346E-11 +i* 4.7471E-11| +| 9| 0.491932 +i* 0.870629| 0.999996|-2.65525E-11 +i* 1.22525E-11| +| 10| 0.486452 +i* 0.873703| 0.999996| 3.0312E-11 +i* 1.02214E-11| +| 11| 0.480962 +i* 0.876737| 0.999996|-3.09397E-11 +i*-1.68578E-11| +| 12| 0.475453 +i* 0.879736| 0.999996| 3.09861E-11 +i* 4.093E-12| +| 13| 0.469917 +i* 0.882706| 0.999996|-1.29106E-11 +i*-2.31489E-11| +| 14| 0.46437 +i* 0.885637| 0.999996|-5.47384E-12 +i* 1.02452E-11| +| 15| 0.458797 +i* 0.888537| 0.999996| 2.78862E-11 +i* 1.10441E-11| +| 16| 0.453214 +i* 0.891397| 0.999996| 2.45506E-11 +i* 3.1726E-11| +| 17| 0.447614 +i* 0.894223| 0.999996|-1.08491E-12 +i*-2.12277E-11| +| 18| 0.441986 +i* 0.897017| 0.999996| 2.72476E-11 +i* 3.22485E-11| +| 19| 0.436351 +i* 0.899772| 0.999996|-1.24334E-11 +i*-2.66317E-11| +| 20| 0.430689 +i* 0.902496| 0.999996|-1.25435E-11 +i* 3.86925E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 0.999996 +400000 racines de module = 1.00001 +proc 1 +proc 2 +proc 3 +proc 0 +(1 +i*0)*x^0 
+ (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^700000 + (1 +i*0)*x^1200000 + +(-50000 +i*0)*x^499999 + (-7E+06 +i*0)*x^699999 + (1.2E+06 +i*0)*x^1199999 + +zone limite de 'log-exp' 1.0003 +zone limite de 'log-exp' 1.0003 +zone limite de 'log-exp' 1.0003 +zone limite de 'log-exp' 1.0003 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 1, start 300032 size 300032 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 0, start 0 size 300032 +proc 0 start 0 size 300032 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 2, start 600064 size 300032 +proc 2 start 600064 size 300032 +dimgrid 4688 dimblock 256 degrePoly 1200000 +proc 3, start 900096 size 300032 +proc 3 start 900096 size 300032 +proc 1 start 300032 size 300032 +iter : 1 Arret : 0.00819256 s/iter 26.577664 +iter : 2 Arret : 2.02982 s/iter 28.548195 +iter : 3 Arret : 1.20559 s/iter 28.444826 +iter : 4 Arret : 2.45066 s/iter 28.500080 +iter : 5 Arret : 2.54532 s/iter 28.613591 +iter : 6 Arret : 2.62994 s/iter 29.464998 +iter : 7 Arret : 0.906074 s/iter 29.815525 +iter : 8 Arret : 0.993745 s/iter 29.873610 +iter : 9 Arret : 0.405461 s/iter 30.471669 +iter : 10 Arret : 0.367721 s/iter 30.642427 +iter : 11 Arret : 0.351446 s/iter 30.327877 +iter : 12 Arret : 0.35197 s/iter 30.656805 +iter : 13 Arret : 0.356371 s/iter 29.659115 +iter : 14 Arret : 0.361711 s/iter 29.463647 +iter : 15 Arret : 0.337763 s/iter 29.495300 +iter : 16 Arret : 0.31327 s/iter 29.423447 +iter : 17 Arret : 0.311198 s/iter 29.291099 +iter : 18 Arret : 0.318456 s/iter 29.460846 +iter : 19 Arret : 0.32907 s/iter 29.325250 +iter : 20 Arret : 0.301059 s/iter 29.261791 +iter : 21 Arret : 0.265061 s/iter 29.531117 +iter : 22 Arret : 0.259472 s/iter 29.429866 +iter : 23 Arret : 0.281898 s/iter 29.291621 +iter : 24 Arret : 0.346388 s/iter 29.302478 +iter : 25 Arret : 1.26802 s/iter 29.286807 +iter : 26 Arret : 0.283944 s/iter 29.171558 +iter : 27 Arret : 1.48554 s/iter 29.009241 +iter : 28 Arret : 1.52006 s/iter 28.992115 +iter : 29 Arret : 0.739441 s/iter 
28.878319 +iter : 30 Arret : 0.752787 s/iter 28.680746 +iter : 31 Arret : 0.846761 s/iter 28.681431 +iter : 32 Arret : 1.66027 s/iter 28.631316 +iter : 33 Arret : 1.18999 s/iter 28.536383 +iter : 34 Arret : 1.7472 s/iter 28.533855 +iter : 35 Arret : 0.99662 s/iter 28.619741 +iter : 36 Arret : 0.685041 s/iter 28.524906 +iter : 37 Arret : 3.10061 s/iter 28.469691 +iter : 38 Arret : 2.19552 s/iter 28.360443 +iter : 39 Arret : 0.82349 s/iter 28.436085 +iter : 40 Arret : 3.50591 s/iter 28.172287 +iter : 41 Arret : 1.02641 s/iter 27.664102 +iter : 42 Arret : 1.74412 s/iter 27.599336 +iter : 43 Arret : 0.666046 s/iter 27.622028 +iter : 44 Arret : 0.436645 s/iter 27.665222 +iter : 45 Arret : 0.362378 s/iter 27.576919 +iter : 46 Arret : 0.355561 s/iter 27.619140 +iter : 47 Arret : 0.261884 s/iter 27.609494 +iter : 48 Arret : 0.135369 s/iter 27.625744 +iter : 49 Arret : 0.0915402 s/iter 27.430183 +iter : 50 Arret : 0.161087 s/iter 27.574724 +iter : 51 Arret : 0.133264 s/iter 27.503435 +iter : 52 Arret : 0.19955 s/iter 27.556902 +iter : 53 Arret : 0.16774 s/iter 27.535538 +iter : 54 Arret : 0.0367464 s/iter 26.597157 +iter : 55 Arret : 0.0226237 s/iter 26.593894 +iter : 56 Arret : 0.0108181 s/iter 26.570226 +iter : 57 Arret : 0.00267111 s/iter 26.648842 +iter : 58 Arret : 0.000387499 s/iter 26.572189 +iter : 59 Arret : 3.11267E-06 s/iter 26.574203 +iter : 60 Arret : 2.51854E-08 s/iter 26.572782 +iter : 61 Arret : 1.01362E-10 s/iter 26.570380 +iter : 62 Arret : 4.03524E-13 s/iter 26.570734 +temps : 1762.58 seconde(s) +Nb iterations : 62 +Nb de depassements de capacite exponentielle : 0 +Precision : 5.06807E-05 +Stabilite : 1.0906E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54031 +i* 0.841472| 1| 1.4588E-09 +i* 4.51768E-09| +| 2| 0.513629 +i* 0.858008| 0.999997| 3.02357E-11 +i* 3.41858E-11| +| 3| 0.486451 +i* 0.873713| 1| 
1.95054E-09 +i* 6.77633E-10| +| 4| 0.458789 +i* 0.888542| 0.999997| 2.48135E-13 +i*-2.88822E-11| +| 5| 0.430685 +i* 0.902499| 0.999997| 2.12053E-13 +i*-1.16324E-11| +| 6| 0.402126 +i* 0.915589| 1| 2.50282E-09 +i*-6.10471E-09| +| 7| 0.3732 +i* 0.927747| 0.999997|-1.54374E-11 +i*-2.76083E-11| +| 8| 0.3439 +i* 0.939003| 0.999997|-1.12714E-11 +i* 1.5453E-11| +| 9| 0.314261 +i* 0.949333| 0.999997| 1.93628E-11 +i* 2.50909E-11| +| 10| 0.284313 +i* 0.958728| 0.999997| 2.69426E-11 +i* 2.77974E-11| +| 11| 0.254084 +i* 0.967179| 0.999997| 1.5277E-11 +i* 4.73027E-12| +| 12| 0.223605 +i* 0.974676| 0.999997| -8.1017E-11 +i*-3.77299E-11| +| 13| 0.192897 +i* 0.981224| 1| 2.91999E-10 +i* 9.18678E-11| +| 14| 0.162017 +i* 0.986785| 0.999997| 4.59321E-12 +i*-4.42106E-13| +| 15| 0.130967 +i* 0.991391| 1| 1.71549E-09 +i* 3.54225E-10| +| 16| 0.0997898 +i* 0.995005| 0.999997| -3.8231E-11 +i* 3.92186E-14| +| 17| 0.0685225 +i* 0.997646| 0.999997| 2.33641E-11 +i* 2.51787E-12| +| 18| 0.0371504 +i* 0.999314| 1|-1.38879E-09 +i*-2.32658E-09| +| 19| 0.00578048 +i* 0.99998| 0.999997| 3.46787E-11 +i* 1.94857E-13| +| 20| -0.0256056 +i* 0.999669| 0.999997| 2.01068E-11 +i*-1.22213E-12| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +700000 racines de module = 0.999997 +proc 2 +proc 3 +proc 0 +proc 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^600000 + (-10 +i*0)*x^800000 + (1 +i*0)*x^1400000 + +(-60000 +i*0)*x^599999 + (-8E+06 +i*0)*x^799999 + (1.4E+06 +i*0)*x^1399999 + +zone limite de 'log-exp' 1.00025 +zone limite de 'log-exp' 1.00025 +zone limite de 'log-exp' 1.00025 +zone limite de 'log-exp' 1.00025 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 3, start 1050048 size 350016 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 1, start 350016 size 350016 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 2, start 700032 size 350016 +proc 2 start 700032 size 350016 +dimgrid 5469 dimblock 256 degrePoly 1400000 +proc 0, start 0 size 350016 +proc 0 start 
0 size 350016 +proc 3 start 1050048 size 350016 +proc 1 start 350016 size 350016 +iter : 1 Arret : 0.00218957 s/iter 36.159933 +iter : 2 Arret : 0.133227 s/iter 36.695373 +iter : 3 Arret : 6.01621 s/iter 37.299386 +iter : 4 Arret : 3.16113 s/iter 37.976941 +iter : 5 Arret : 2.89902 s/iter 37.835787 +iter : 6 Arret : 1.55692 s/iter 38.098839 +iter : 7 Arret : 1.64303 s/iter 39.033767 +iter : 8 Arret : 9.63322 s/iter 39.962469 +iter : 9 Arret : 3.25551 s/iter 40.250439 +iter : 10 Arret : 1.80839 s/iter 41.322631 +iter : 11 Arret : 2.10312 s/iter 39.721944 +iter : 12 Arret : 1.27787 s/iter 40.175542 +iter : 13 Arret : 1.28405 s/iter 39.345510 +iter : 14 Arret : 1.10597 s/iter 39.326031 +iter : 15 Arret : 1.54753 s/iter 39.371562 +iter : 16 Arret : 3.97338 s/iter 39.040715 +iter : 17 Arret : 1.16165 s/iter 39.074694 +iter : 18 Arret : 1.33248 s/iter 38.851097 +iter : 19 Arret : 0.864994 s/iter 38.922556 +iter : 20 Arret : 0.781144 s/iter 38.428134 +iter : 21 Arret : 0.717927 s/iter 38.952301 +iter : 22 Arret : 0.651466 s/iter 38.352980 +iter : 23 Arret : 0.458583 s/iter 38.047111 +iter : 24 Arret : 0.283507 s/iter 38.133746 +iter : 25 Arret : 0.279826 s/iter 37.853592 +iter : 26 Arret : 0.243863 s/iter 36.926821 +iter : 27 Arret : 0.220856 s/iter 37.645303 +iter : 28 Arret : 0.139293 s/iter 36.485655 +iter : 29 Arret : 0.66161 s/iter 36.276980 +iter : 30 Arret : 0.269576 s/iter 36.156120 +iter : 31 Arret : 0.139673 s/iter 36.247656 +iter : 32 Arret : 0.055674 s/iter 36.155399 +iter : 33 Arret : 0.0217982 s/iter 36.204812 +iter : 34 Arret : 0.00427148 s/iter 36.153944 +iter : 35 Arret : 0.000628248 s/iter 36.153697 +iter : 36 Arret : 1.01228E-07 s/iter 36.154597 +iter : 37 Arret : 4.84665E-10 s/iter 36.152819 +iter : 38 Arret : 2.2498E-12 s/iter 36.150757 +iter : 39 Arret : 1.80732E-14 s/iter 36.149673 +temps : 1478.01 seconde(s) +Nb iterations : 39 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.34519E-06 +Stabilite : 2.22046E-16 
++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841469| 0.999997| 5.65794E-11 +i*-4.66756E-12| +| 2| 0.513623 +i* 0.858013| 0.999997|-2.15776E-11 +i*-2.98557E-11| +| 3| -0.52703 +i* -0.849843| 0.999997|-6.50922E-11 +i* 8.44216E-12| +| 4| 0.486439 +i* 0.873711| 0.999997| 5.60277E-11 +i* 4.36779E-11| +| 5| -0.500096 +i* -0.865967| 0.999997| 3.56147E-11 +i*-3.12713E-11| +| 6| 0.458776 +i* 0.888549| 0.999997|-1.89702E-11 +i* 4.08274E-12| +| 7| -0.472673 +i* -0.881242| 1|-5.56631E-09 +i*-2.23833E-09| +| 8| 0.430664 +i* 0.902517| 1|-8.83373E-11 +i*-2.09199E-09| +| 9| -0.444791 +i* -0.895631| 0.999997| 3.68259E-11 +i* 1.36002E-12| +| 10| 0.402136 +i* 0.915577| 0.999997| 6.5834E-12 +i* -1.3935E-11| +| 11| -0.416432 +i* -0.909164| 0.999997| 1.97816E-11 +i* 3.10848E-11| +| 12| 0.373171 +i* 0.927759| 0.999997|-2.17995E-11 +i*-2.96867E-12| +| 13| -0.387698 +i* -0.921783| 0.999997|-1.86324E-11 +i* -4.6545E-11| +| 14| 0.343875 +i* 0.939012| 0.999997| 3.84962E-11 +i* 2.59646E-11| +| 15| -0.358575 +i* -0.933498| 0.999997|-4.93405E-11 +i*-7.15173E-13| +| 16| 0.314233 +i* 0.949343| 0.999997| 3.86503E-11 +i* 2.08775E-11| +| 17| -0.329098 +i* -0.944293| 0.999997|-1.57903E-11 +i* 2.05052E-11| +| 18| 0.284281 +i* 0.958738| 0.999997| 2.51592E-11 +i* 2.09243E-11| +| 19| -0.299297 +i* -0.954157| 0.999997| 5.03608E-12 +i* 1.70503E-11| +| 20| 0.254048 +i* 0.967189| 0.999997|-2.81228E-11 +i*-1.66302E-11| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 0.999997 +600000 racines de module = 1 +proc 0 +proc 1 +proc 2 +proc 3 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^700000 + (-10 +i*0)*x^900000 + (1 +i*0)*x^1600000 + +(-70000 +i*0)*x^699999 + (-9E+06 +i*0)*x^899999 + (1.6E+06 +i*0)*x^1599999 + + +template:29834 terminated with signal 11 at PC=404b41 SP=7fff0b4740b0. 
Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:29835 terminated with signal 11 at PC=404b41 SP=7fff081a2530. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:29833 terminated with signal 11 at PC=404b41 SP=7fffe6ecdf90. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:29836 terminated with signal 11 at PC=404b41 SP=7fff35c7eff0. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 1 with PID 29834 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). +-------------------------------------------------------------------------- +proc 0 +proc 1 +proc 2 +proc 3 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^800000 + (-10 +i*0)*x^1000000 + (1 +i*0)*x^1800000 + +(-80000 +i*0)*x^799999 + (-1E+07 +i*0)*x^999999 + (1.8E+06 +i*0)*x^1799999 + + +template:29849 terminated with signal 11 at PC=404b41 SP=7fff6792aa30. 
Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:29846 terminated with signal 11 at PC=404b41 SP=7ffffaf225e0. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:29848 terminated with signal 11 at PC=404b41 SP=7fff7de06640. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] + +template:29847 terminated with signal 11 at PC=404b41 SP=7fff5bacc3f0. Backtrace: +./template[0x404b41] +./template[0x406726] +/lib64/libc.so.6(__libc_start_main+0xfd)[0x36e341ecdd] +./template[0x4031f9] +-------------------------------------------------------------------------- +mpirun has exited due to process rank 0 with PID 29846 on +node node1-50 exiting improperly. There are two reasons this could occur: + +1. this process did not call "init" before exiting, but others in +the job did. This can cause a job to hang indefinitely while it waits +for all processes to call "init". By rule, if one process calls "init", +then ALL processes must call "init" prior to termination. + +2. this process called "init", but exited without calling "finalize". +By rule, all processes that call "init" MUST call "finalize" prior to +exiting or it will be considered an "abnormal termination" + +This may have caused other processes in the application to be +terminated by signals sent by mpirun (as reported here). 
+-------------------------------------------------------------------------- +proc 2 +proc 3 +proc 0 +proc 1 +zone limite de 'log-exp' 1.03613 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^2000 + (-10 +i*0)*x^8000 + (1 +i*0)*x^10000 + +(-200 +i*0)*x^1999 + (-80000 +i*0)*x^7999 + (10000 +i*0)*x^9999 + +zone limite de 'log-exp' 1.03613 +zone limite de 'log-exp' 1.03613 +zone limite de 'log-exp' 1.03613 +dimgrid 40 dimblock 256 degrePoly 10000 +proc 1, start 2560 size 2560 +dimgrid 40 dimblock 256 degrePoly 10000 +proc 0, start 0 size 2560 +dimgrid 40 dimblock 256 degrePoly 10000 +proc 3, start 7680 size 2560 +proc 0 start 0 size 2560 +proc 3 start 7680 size 2560 +proc 1 start 2560 size 2560 +dimgrid 40 dimblock 256 degrePoly 10000 +proc 2, start 5120 size 2560 +proc 2 start 5120 size 2560 +iter : 1 Arret : 0.000540066 s/iter 0.008420 +iter : 2 Arret : 0.0239499 s/iter 0.008298 +iter : 3 Arret : 0.0108994 s/iter 0.008290 +iter : 4 Arret : 0.00347071 s/iter 0.008305 +iter : 5 Arret : 0.00757939 s/iter 0.008311 +iter : 6 Arret : 0.00186666 s/iter 0.008310 +iter : 7 Arret : 0.00179112 s/iter 0.008306 +iter : 8 Arret : 0.00147265 s/iter 0.008305 +iter : 9 Arret : 0.00165602 s/iter 0.008296 +iter : 10 Arret : 0.00248191 s/iter 0.008307 +iter : 11 Arret : 0.000812537 s/iter 0.008297 +iter : 12 Arret : 5.39531E-05 s/iter 0.008412 +iter : 13 Arret : 1.08824E-08 s/iter 0.008404 +iter : 14 Arret : 1.089E-13 s/iter 0.008419 +temps : 0.323036 seconde(s) +Nb iterations : 14 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.17761E-05 +Stabilite : 8.2797E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.547024 +i* 0.838493| 1.00115|-6.21719E-10 +i*-5.53774E-09| +| 2| -0.540305 +i* 0.841127| 0.999712|-1.60982E-13 +i*-4.97213E-14| +| 3| -0.909192 +i* 0.415685| 0.999712| 4.35207E-14 +i* 5.29003E-13| +| 4| -0.989628 +i* -0.141638| 
0.999712|-2.84439E-13 +i*-1.69935E-14| +| 5| -0.759236 +i* -0.652585| 1.00115|-6.07508E-09 +i* 4.66733E-09| +| 6| -0.281925 +i* -0.959136| 0.999712|-1.54099E-13 +i* 3.80991E-14| +| 7| 0.281172 +i* -0.959357| 0.999712|-1.43663E-13 +i*-1.53777E-13| +| 8| 0.755064 +i* -0.655212| 0.999712| 4.61076E-13 +i* 3.15322E-13| +| 9| 0.989404 +i* -0.143192| 0.999712|-1.63203E-13 +i*-1.45101E-14| +| 10| 0.912453 +i* 0.411988| 1.00115|-1.77634E-10 +i* 4.15663E-09| +| 11| 0.540966 +i* 0.840703| 0.999712| -2.5091E-14 +i*-1.99096E-13| +| 12| 0.540305 +i* 0.841127| 0.999712| 3.22853E-13 +i* 1.07785E-13| +| 13| 0.00314521 +i* 1.00115| 1.00115| 4.5119E-09 +i*-6.21719E-11| +| 14| -0.540966 +i* 0.840703| 0.999712| -2.5091E-14 +i* 1.99096E-13| +| 15| -0.909518 +i* 0.414971| 0.999712|-1.80966E-13 +i*-6.20692E-14| +| 16| -0.989516 +i* -0.142415| 0.999712| 2.81108E-13 +i* 5.11239E-14| +| 17| -0.755579 +i* -0.654618| 0.999712| 5.59774E-13 +i* 8.84721E-14| +| 18| -0.285348 +i* -0.959626| 1.00115|-9.98303E-09 +i*-1.88292E-09| +| 19| 0.281925 +i* -0.959136| 0.999712| 1.08247E-13 +i*-4.02221E-13| +| 20| 0.755579 +i* -0.654618| 0.999712| 5.59774E-13 +i*-8.84721E-14| ++---+----------------------------+------------+----------------------------+ +2000 racines de module = 1.00115 +8000 racines de module = 0.999712 diff --git a/Simulations/sparse_mpi/sparse_mpi_4GPU.sge b/Simulations/sparse_mpi/sparse_mpi_4GPU.sge new file mode 100644 index 0000000..d9ab42c --- /dev/null +++ b/Simulations/sparse_mpi/sparse_mpi_4GPU.sge @@ -0,0 +1,25 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=4 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -V +#$ -cwd +#$ -N sparse_mpi_4GPU +#$ -pe mpi 4 + + +module load cuda/7.0 +module load ompi/gcc + +mpirun -np $NSLOTS ./template -r -i 60000 40000 +mpirun -np $NSLOTS ./template -r -i 150000 50000 +mpirun -np $NSLOTS ./template -r -i 250000 150000 +mpirun -np $NSLOTS ./template -r -i 350000 250000 +mpirun -np $NSLOTS ./template -r -i 500000 300000 +mpirun -np $NSLOTS ./template -r 
-i 600000 400000 +mpirun -np $NSLOTS ./template -r -i 700000 500000 +mpirun -np $NSLOTS ./template -r -i 800000 600000 +mpirun -np $NSLOTS ./template -r -i 900000 700000 +mpirun -np $NSLOTS ./template -r -i 1000000 800000 +mpirun -np $NSLOTS ./template -r -i 1500000 500000 diff --git a/Simulations/sparse_openmp/sparse_openmp_1GPU.o140100 b/Simulations/sparse_openmp/sparse_openmp_1GPU.o140100 new file mode 100644 index 0000000..7332981 --- /dev/null +++ b/Simulations/sparse_openmp/sparse_openmp_1GPU.o140100 @@ -0,0 +1,512 @@ +REMAINING: 1 +Taking GPU #3 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^40000 + (-10 +i*0)*x^60000 + (1 +i*0)*x^100000 + +(-4000 +i*0)*x^39999 + (-600000 +i*0)*x^59999 + (100000 +i*0)*x^99999 + +zone limite de 'log-exp' 1.00356 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 0 dimgrid2 391 start 0 size 100096 +gpu 0 iter : 1 Arret : 0.0052669 s/iter 0.775408 +gpu 0 iter : 2 Arret : 0.00752645 s/iter 0.775369 +gpu 0 iter : 3 Arret : 0.0240999 s/iter 0.775305 +gpu 0 iter : 4 Arret : 0.0224589 s/iter 0.850697 +gpu 0 iter : 5 Arret : 0.00804703 s/iter 0.844340 +gpu 0 iter : 6 Arret : 0.00438171 s/iter 0.775251 +gpu 0 iter : 7 Arret : 0.00744568 s/iter 0.775238 +gpu 0 iter : 8 Arret : 0.00764888 s/iter 0.775261 +gpu 0 iter : 9 Arret : 0.00410621 s/iter 0.775320 +gpu 0 iter : 10 Arret : 0.00247273 s/iter 0.775247 +gpu 0 iter : 11 Arret : 0.00227795 s/iter 0.775273 +gpu 0 iter : 12 Arret : 0.00210901 s/iter 0.775117 +gpu 0 iter : 13 Arret : 0.000438336 s/iter 0.774935 +gpu 0 iter : 14 Arret : 0.000273199 s/iter 0.774865 +gpu 0 iter : 15 Arret : 0.000137109 s/iter 0.774789 +gpu 0 iter : 16 Arret : 1.40101E-05 s/iter 0.774828 +gpu 0 iter : 17 Arret : 1.89958E-07 s/iter 0.774719 +gpu 0 iter : 18 Arret : 2.82623E-09 s/iter 0.774706 +gpu 0 iter : 19 Arret : 4.21054E-11 s/iter 0.774674 +gpu 0 iter : 20 Arret : 6.27215E-13 s/iter 0.774731 +temps : 16.1926 seconde(s) +Nb iterations : 20 +Nb de depassements de capacite 
exponentielle : 0 +Precision : 2.61117E-09 +Stabilite : 6.27215E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540308 +i* 0.841422| 0.999962|-1.95866E-12 +i*-4.55465E-13| +| 2| -0.113164 +i* 0.993538| 0.999962|-4.34919E-12 +i* 9.60242E-13| +| 3| -0.226711 +i* -0.973923| 0.999962|-4.27658E-13 +i* 6.01027E-13| +| 4| -0.715763 +i* 0.698289| 0.999962| 9.11271E-13 +i* 2.47219E-12| +| 5| 0.439922 +i* -0.897993| 0.999962|-3.49498E-13 +i* 1.66432E-12| +| 6| -0.996021 +i* 0.0886823| 0.999962| 1.17772E-12 +i* 6.16285E-13| +| 7| 0.908546 +i* -0.417692| 0.999962| 4.78506E-13 +i* 1.54377E-13| +| 8| -0.827813 +i* -0.560935| 0.999962| 9.76996E-13 +i*-2.04309E-12| +| 9| 0.968049 +i* 0.250607| 0.999962|-1.07025E-13 +i*-1.15224E-12| +| 10| -0.286815 +i* -0.957946| 0.999962|-6.55254E-13 +i* 1.20869E-12| +| 11| 0.591653 +i* 0.806145| 0.999962|-9.87654E-13 +i*-3.03635E-12| +| 12| -0.0511836 +i* 0.998651| 0.999962|-2.22622E-12 +i*-3.69013E-14| +| 13| -0.67097 +i* 0.741432| 0.999962|-8.03801E-14 +i*-1.68204E-12| +| 14| 0.383249 +i* -0.923603| 0.999962|-1.29119E-12 +i*-1.37426E-12| +| 15| -0.988582 +i* 0.150427| 0.999962|-1.54698E-12 +i*-6.48537E-13| +| 16| 0.880824 +i* -0.473363| 0.999962| 1.58029E-12 +i*-2.34379E-12| +| 17| -0.861082 +i* -0.508391| 0.999962| 9.8066E-13 +i* 3.40478E-12| +| 18| 0.981756 +i* 0.189945| 0.999962|-1.13665E-12 +i* 1.13043E-12| +| 19| -0.345809 +i* -0.938264| 0.999962| 1.03906E-12 +i* 1.95398E-12| +| 20| 0.640621 +i* 0.767807| 0.999962|-6.98774E-13 +i* 1.13798E-12| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 0.999962 +40000 racines de module = 1.00006 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^50000 + (-10 +i*0)*x^150000 + (1 +i*0)*x^200000 + +(-5000 +i*0)*x^49999 + (-1.5E+06 +i*0)*x^149999 + (200000 +i*0)*x^199999 + +zone limite de 'log-exp' 1.00178 +CPU thread 0 
(of 1) uses CUDA device 0 +gpu 0 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 0 dimgrid2 782 start 0 size 200192 +gpu 0 iter : 1 Arret : 0.000149329 s/iter 3.019382 +gpu 0 iter : 2 Arret : 0.000107708 s/iter 3.016857 +gpu 0 iter : 3 Arret : 0.000113605 s/iter 3.016990 +gpu 0 iter : 4 Arret : 0.000830779 s/iter 3.018300 +gpu 0 iter : 5 Arret : 0.00353705 s/iter 3.017239 +gpu 0 iter : 6 Arret : 0.0150507 s/iter 3.033347 +gpu 0 iter : 7 Arret : 0.0172496 s/iter 3.028650 +gpu 0 iter : 8 Arret : 0.032361 s/iter 3.025908 +gpu 0 iter : 9 Arret : 0.0281394 s/iter 3.030298 +gpu 0 iter : 10 Arret : 0.116314 s/iter 3.043482 +gpu 0 iter : 11 Arret : 0.129494 s/iter 3.073542 +gpu 0 iter : 12 Arret : 0.0352338 s/iter 3.047419 +gpu 0 iter : 13 Arret : 0.0316693 s/iter 3.041094 +gpu 0 iter : 14 Arret : 0.0153664 s/iter 3.020001 +gpu 0 iter : 15 Arret : 0.0125995 s/iter 3.011952 +gpu 0 iter : 16 Arret : 0.00505109 s/iter 3.013206 +gpu 0 iter : 17 Arret : 0.0072726 s/iter 3.013400 +gpu 0 iter : 18 Arret : 0.00841241 s/iter 3.012671 +gpu 0 iter : 19 Arret : 0.00316401 s/iter 3.011866 +gpu 0 iter : 20 Arret : 1.36142E-05 s/iter 3.011905 +gpu 0 iter : 21 Arret : 1.07816E-09 s/iter 3.012487 +gpu 0 iter : 22 Arret : 2.83648E-12 s/iter 3.012609 +gpu 0 iter : 23 Arret : 4.24948E-14 s/iter 3.012386 +temps : 70.1186 seconde(s) +Nb iterations : 23 +Nb de depassements de capacite exponentielle : 0 +Precision : 9.52377E-08 +Stabilite : 4.24948E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540195 +i* 0.841595| 1.00005|-2.98043E-09 +i*-3.27611E-08| +| 2| -0.837195 +i* 0.546877| 0.999985| 7.09943E-12 +i* 5.1133E-12| +| 3| -0.553418 +i* -0.832885| 0.999985| -1.9722E-12 +i*-7.40397E-12| +| 4| 0.828525 +i* -0.559925| 0.999985|-4.34675E-12 +i* 1.07137E-12| +| 5| -0.819774 +i* 0.572768| 1.00005| 2.53887E-08 +i* 2.42315E-09| +| 6| -0.57917 +i* 
-0.815188| 0.999985|-5.13034E-12 +i*-1.52645E-12| +| 7| 0.810626 +i* -0.585537| 0.999985| 8.64808E-12 +i* 7.46794E-12| +| 8| 0.591869 +i* 0.806015| 0.999985| 1.73195E-13 +i* 8.72591E-12| +| 9| -0.801379 +i* 0.598131| 0.999985| -1.2701E-12 +i* 3.96189E-12| +| 10| -0.60436 +i* -0.796769| 1.00005|-3.33815E-08 +i* 3.89061E-08| +| 11| 0.791937 +i* -0.610578| 0.999985| 6.0707E-13 +i* 1.52922E-12| +| 12| 0.616763 +i* 0.78713| 0.999985|-4.48042E-12 +i* -2.6295E-12| +| 13| -0.782301 +i* 0.622877| 0.999985|-2.15827E-12 +i*-6.27114E-12| +| 14| -0.628985 +i* -0.777398| 0.999985|-4.05476E-12 +i*-5.17236E-12| +| 15| 0.772548 +i* -0.635029| 1.00005| 1.1634E-09 +i* 1.87351E-08| +| 16| 0.641054 +i* 0.767476| 0.999985|-3.47633E-12 +i* 1.20617E-11| +| 17| -0.762458 +i* 0.647014| 0.999985|-7.74447E-12 +i* 7.566E-12| +| 18| -0.652967 +i* -0.757366| 0.999985| 5.10392E-12 +i*-6.61069E-12| +| 19| 0.752229 +i* -0.658879| 0.999985|-5.97611E-12 +i* 1.03431E-11| +| 20| 0.664729 +i* 0.747146| 1.00005|-1.71597E-08 +i* 8.68463E-09| ++---+----------------------------+------------+----------------------------+ +50000 racines de module = 1.00005 +150000 racines de module = 0.999985 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^150000 + (-10 +i*0)*x^250000 + (1 +i*0)*x^400000 + +(-15000 +i*0)*x^149999 + (-2.5E+06 +i*0)*x^249999 + (400000 +i*0)*x^399999 + +zone limite de 'log-exp' 1.00089 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 0 dimgrid2 1563 start 0 size 400128 +gpu 0 iter : 1 Arret : 0.00172099 s/iter 11.753718 +gpu 0 iter : 2 Arret : 0.0208557 s/iter 11.747391 +gpu 0 iter : 3 Arret : 0.221528 s/iter 11.807046 +gpu 0 iter : 4 Arret : 0.572248 s/iter 11.998301 +gpu 0 iter : 5 Arret : 0.542189 s/iter 11.842988 +gpu 0 iter : 6 Arret : 0.306206 s/iter 11.822805 +gpu 0 iter : 7 Arret : 0.0317191 s/iter 12.059261 +gpu 0 iter : 8 Arret : 0.0184143 s/iter 12.061589 +gpu 0 iter : 9 Arret : 0.030511 s/iter 11.936705 +gpu 0 iter : 10 Arret : 0.023696 s/iter 11.899096 
+gpu 0 iter : 11 Arret : 0.0135298 s/iter 11.850230 +gpu 0 iter : 12 Arret : 0.0119889 s/iter 11.808974 +gpu 0 iter : 13 Arret : 0.00485045 s/iter 11.776383 +gpu 0 iter : 14 Arret : 0.00522437 s/iter 11.809750 +gpu 0 iter : 15 Arret : 0.00252909 s/iter 11.735442 +gpu 0 iter : 16 Arret : 0.000417464 s/iter 11.739448 +gpu 0 iter : 17 Arret : 0.000235756 s/iter 11.733345 +gpu 0 iter : 18 Arret : 6.4985E-07 s/iter 11.743853 +gpu 0 iter : 19 Arret : 1.48939E-09 s/iter 11.732225 +gpu 0 iter : 20 Arret : 3.20792E-12 s/iter 11.734648 +gpu 0 iter : 21 Arret : 1.34164E-14 s/iter 11.732088 +temps : 248.893 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.49185E-08 +Stabilite : 1.34164E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.84144| 0.999991| 6.97609E-12 +i* 5.61207E-12| +| 2| -0.998329 +i* 0.057622| 0.999991| 4.43912E-12 +i* 1.27665E-12| +| 3| 0.439867 +i* -0.898052| 0.999991|-8.50653E-12 +i*-8.85586E-12| +| 4| -0.996033 +i* 0.0888768| 0.999991|-3.15592E-12 +i* 1.17456E-12| +| 5| 0.411533 +i* -0.911385| 0.999991|-2.45048E-12 +i* 4.6238E-12| +| 6| 0.59196 +i* 0.805956| 0.999991| 5.24358E-13 +i*-8.53073E-12| +| 7| -0.992759 +i* 0.120044| 0.999991| 2.58804E-12 +i* 2.47274E-12| +| 8| 0.382796 +i* -0.923823| 0.999991| 1.11042E-11 +i*-9.27687E-12| +| 9| 0.616925 +i* 0.78701| 0.999991| 4.27514E-12 +i*-1.13966E-11| +| 10| -0.98851 +i* 0.151094| 0.999991| 1.67755E-11 +i* 4.06477E-12| +| 11| 0.35366 +i* -0.935364| 0.999991|-1.92664E-11 +i* 1.19958E-11| +| 12| 0.641283 +i* 0.767292| 0.999991| 1.73468E-11 +i*-3.74729E-12| +| 13| -0.98329 +i* 0.181995| 0.999991|-6.62759E-12 +i*-5.46796E-12| +| 14| 0.324176 +i* -0.945987| 0.999991| 1.53594E-11 +i*-1.57324E-12| +| 15| 0.665012 +i* 0.746821| 0.999991| 5.27178E-12 +i*-4.27913E-12| +| 16| -0.977104 +i* 0.212717| 
0.999991|-1.01148E-11 +i* 2.41479E-12| +| 17| 0.294374 +i* -0.955681| 0.999991| -1.2063E-11 +i* 1.32238E-11| +| 18| 0.688087 +i* 0.725616| 0.999991|-1.67164E-11 +i*-1.12573E-11| +| 19| -0.969965 +i* 0.243206| 0.999991| 6.88072E-12 +i* 3.20268E-13| +| 20| 0.264283 +i* -0.964436| 0.999991|-6.93356E-12 +i*-6.23118E-12| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 0.999991 +150000 racines de module = 1.00002 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^250000 + (-10 +i*0)*x^350000 + (1 +i*0)*x^600000 + +(-25000 +i*0)*x^249999 + (-3.5E+06 +i*0)*x^349999 + (600000 +i*0)*x^599999 + +zone limite de 'log-exp' 1.00059 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 2344 start 0 size 600064 +gpu 0 iter : 1 Arret : 0.00525558 s/iter 26.336656 +gpu 0 iter : 2 Arret : 0.441677 s/iter 26.703831 +gpu 0 iter : 3 Arret : 0.906705 s/iter 26.966169 +gpu 0 iter : 4 Arret : 3.755 s/iter 26.950936 +gpu 0 iter : 5 Arret : 1.26305 s/iter 27.316144 +gpu 0 iter : 6 Arret : 3.03186 s/iter 27.389925 +gpu 0 iter : 7 Arret : 0.213406 s/iter 27.490831 +gpu 0 iter : 8 Arret : 1.0101 s/iter 27.559501 +gpu 0 iter : 9 Arret : 0.207377 s/iter 27.194849 +gpu 0 iter : 10 Arret : 0.0920517 s/iter 27.466967 +gpu 0 iter : 11 Arret : 0.0893085 s/iter 27.380003 +gpu 0 iter : 12 Arret : 0.0218947 s/iter 26.617878 +gpu 0 iter : 13 Arret : 0.00718218 s/iter 26.491846 +gpu 0 iter : 14 Arret : 0.014641 s/iter 26.379537 +gpu 0 iter : 15 Arret : 0.00209026 s/iter 26.349906 +gpu 0 iter : 16 Arret : 0.00174853 s/iter 26.344560 +gpu 0 iter : 17 Arret : 0.00249398 s/iter 26.348383 +gpu 0 iter : 18 Arret : 0.00020801 s/iter 26.354612 +gpu 0 iter : 19 Arret : 1.26142E-07 s/iter 26.370520 +gpu 0 iter : 20 Arret : 5.14341E-10 s/iter 26.370752 +gpu 0 iter : 21 Arret : 2.04751E-12 s/iter 26.372247 +gpu 0 iter : 22 Arret : 8.06082E-15 s/iter 26.364052 +temps : 589.718 seconde(s) +Nb iterations : 22 +Nb de depassements de 
capacite exponentielle : 0 +Precision : 1.32595E-08 +Stabilite : 8.06082E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540302 +i* 0.841463| 0.999993| 8.34199E-12 +i* -1.9051E-11| +| 2| -0.553438 +i* -0.832883| 0.999993| 2.30783E-11 +i*-6.91999E-12| +| 3| -0.579282 +i* -0.815119| 0.999993|-1.44751E-12 +i* 7.66798E-12| +| 4| 0.592029 +i* 0.805909| 0.999993| 8.2111E-12 +i* 2.02799E-11| +| 5| -0.604557 +i* -0.796554| 0.999993|-2.82974E-12 +i* 9.99473E-12| +| 6| 0.61698 +i* 0.78697| 0.999993| 9.01823E-12 +i*-5.69156E-12| +| 7| -0.629237 +i* -0.777205| 0.999993|-2.92122E-12 +i*-4.85867E-12| +| 8| 0.641354 +i* 0.767237| 0.999993|-1.64209E-11 +i* 1.12904E-12| +| 9| -0.653299 +i* -0.757092| 0.999993|-8.22453E-13 +i* 2.82818E-12| +| 10| 0.665096 +i* 0.746749| 0.999993| -1.2145E-11 +i* 1.89129E-11| +| 11| -0.676717 +i* -0.736234| 0.999993|-1.26079E-11 +i*-1.25073E-11| +| 12| 0.688185 +i* 0.725526| 0.999993| 2.69875E-11 +i* 1.65411E-11| +| 13| -0.699466 +i* -0.714679| 1.00001| 3.92343E-10 +i*-3.02623E-09| +| 14| 0.710597 +i* 0.70359| 0.999993| -2.6851E-11 +i*-1.44801E-11| +| 15| -0.721517 +i* -0.69241| 1.00001| 2.88447E-09 +i* 3.69506E-09| +| 16| 0.73231 +i* 0.680962| 0.999993|-5.73186E-12 +i* 1.14335E-11| +| 17| -0.742916 +i* -0.669375| 0.999993| 1.59349E-11 +i* 1.71025E-11| +| 18| 0.7533 +i* 0.657691| 1.00001| 1.64587E-09 +i*-3.03669E-09| +| 19| -0.76354 +i* -0.64575| 0.999993| 2.24043E-11 +i*-1.30496E-12| +| 20| 0.773539 +i* 0.633763| 1.00001| -4.2314E-09 +i* 1.86243E-09| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 0.999993 +250000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^300000 + (-10 +i*0)*x^500000 + (1 +i*0)*x^800000 + +(-30000 +i*0)*x^299999 + (-5E+06 +i*0)*x^499999 + (800000 +i*0)*x^799999 + +zone limite de 'log-exp' 1.00044 +CPU thread 0 (of 
1) uses CUDA device 0 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 3125 start 0 size 800000 +gpu 0 iter : 1 Arret : 0.00051726 s/iter 46.868704 +gpu 0 iter : 2 Arret : 0.00517255 s/iter 46.735194 +gpu 0 iter : 3 Arret : 0.0728679 s/iter 46.891988 +gpu 0 iter : 4 Arret : 0.771691 s/iter 46.979491 +gpu 0 iter : 5 Arret : 0.75662 s/iter 47.336136 +gpu 0 iter : 6 Arret : 0.635995 s/iter 47.811859 +gpu 0 iter : 7 Arret : 0.505749 s/iter 48.056193 +gpu 0 iter : 8 Arret : 0.931022 s/iter 48.270194 +gpu 0 iter : 9 Arret : 0.398721 s/iter 48.514679 +gpu 0 iter : 10 Arret : 0.247741 s/iter 48.434629 +gpu 0 iter : 11 Arret : 0.0707263 s/iter 48.136785 +gpu 0 iter : 12 Arret : 0.0344289 s/iter 47.624785 +gpu 0 iter : 13 Arret : 0.0278743 s/iter 46.948359 +gpu 0 iter : 14 Arret : 0.0109553 s/iter 46.857728 +gpu 0 iter : 15 Arret : 0.0093023 s/iter 46.844682 +gpu 0 iter : 16 Arret : 0.00935315 s/iter 46.835990 +gpu 0 iter : 17 Arret : 0.0162429 s/iter 46.715238 +gpu 0 iter : 18 Arret : 0.00648616 s/iter 46.741249 +gpu 0 iter : 19 Arret : 0.000839627 s/iter 46.741507 +gpu 0 iter : 20 Arret : 0.00184254 s/iter 46.754071 +gpu 0 iter : 21 Arret : 4.91346E-06 s/iter 46.769016 +gpu 0 iter : 22 Arret : 4.60158E-08 s/iter 46.820581 +gpu 0 iter : 23 Arret : 6.70363E-10 s/iter 46.824110 +gpu 0 iter : 24 Arret : 9.78247E-12 s/iter 46.828052 +gpu 0 iter : 25 Arret : 1.42634E-13 s/iter 46.828472 +temps : 1180.82 seconde(s) +Nb iterations : 25 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.1101E-08 +Stabilite : 1.42634E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841464| 0.999995|-5.33817E-12 +i*-1.81878E-11| +| 2| 0.592014 +i* 0.805922| 0.999995| 2.33948E-11 +i*-2.13005E-11| +| 3| 0.617007 +i* 0.786952| 0.999995| 4.23442E-11 +i* -6.2147E-12| +| 4| 0.641392 +i* 0.767207| 
0.999995|-4.99742E-11 +i* 1.43873E-11| +| 5| 0.665146 +i* 0.746707| 0.999995| 2.02977E-11 +i* 7.48579E-12| +| 6| 0.688245 +i* 0.725472| 0.999995|-1.73153E-11 +i* -1.2656E-11| +| 7| 0.710667 +i* 0.703522| 0.999995| 3.69782E-12 +i* 2.3081E-12| +| 8| 0.732388 +i* 0.68088| 0.999995| 9.45355E-12 +i* 2.09024E-11| +| 9| 0.753381 +i* 0.657577| 0.999995| 3.40094E-11 +i* 1.45989E-12| +| 10| 0.77364 +i* 0.633618| 0.999995|-1.72307E-11 +i* 1.22723E-11| +| 11| 0.793138 +i* 0.609034| 0.999995| 3.89222E-12 +i* 2.21356E-11| +| 12| 0.811855 +i* 0.583851| 0.999995|-1.28337E-11 +i*-5.47207E-12| +| 13| 0.829772 +i* 0.558094| 0.999995|-1.63114E-11 +i*-1.64246E-12| +| 14| 0.846873 +i* 0.531786| 0.999995| 3.88137E-11 +i*-3.00611E-11| +| 15| 0.86314 +i* 0.504956| 0.999995|-4.00413E-12 +i* 3.04823E-11| +| 16| 0.878557 +i* 0.477628| 0.999995|-2.16493E-12 +i* 1.10533E-11| +| 17| 0.893104 +i* 0.449841| 0.999995|-1.48552E-11 +i* 1.06063E-11| +| 18| 0.906777 +i* 0.4216| 0.999995|-1.38745E-11 +i* 5.33384E-12| +| 19| 0.919557 +i* 0.392944| 0.999995|-3.33245E-11 +i* 5.94386E-12| +| 20| 0.931433 +i* 0.363901| 0.999995| 4.93219E-11 +i*-2.82651E-11| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 0.999995 +300000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^400000 + (-10 +i*0)*x^600000 + (1 +i*0)*x^1000000 + +(-40000 +i*0)*x^399999 + (-6E+06 +i*0)*x^599999 + (1E+06 +i*0)*x^999999 + +zone limite de 'log-exp' 1.00035 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 0 dimgrid2 3907 start 0 size 1000192 +gpu 0 iter : 1 Arret : 0.00369829 s/iter 72.960026 +gpu 0 iter : 2 Arret : 0.656453 s/iter 73.009854 +gpu 0 iter : 3 Arret : 1.85379 s/iter 73.909530 +gpu 0 iter : 4 Arret : 0.184697 s/iter 73.870387 +gpu 0 iter : 5 Arret : 0.149335 s/iter 73.917721 +gpu 0 iter : 6 Arret : 0.0961951 s/iter 74.759550 +gpu 0 iter : 7 Arret : 0.0847578 s/iter 74.840915 +gpu 0 iter : 8 Arret : 0.0292103 
s/iter 74.694556 +gpu 0 iter : 9 Arret : 0.0283648 s/iter 74.484213 +gpu 0 iter : 10 Arret : 0.0181273 s/iter 73.989131 +gpu 0 iter : 11 Arret : 0.0158134 s/iter 73.602331 +gpu 0 iter : 12 Arret : 0.0047499 s/iter 73.110712 +gpu 0 iter : 13 Arret : 0.00558216 s/iter 73.004439 +gpu 0 iter : 14 Arret : 0.00502349 s/iter 72.957971 +gpu 0 iter : 15 Arret : 0.00203782 s/iter 72.966516 +gpu 0 iter : 16 Arret : 0.000101539 s/iter 72.953065 +gpu 0 iter : 17 Arret : 0.000105985 s/iter 72.981166 +gpu 0 iter : 18 Arret : 7.62032E-06 s/iter 72.955710 +gpu 0 iter : 19 Arret : 2.53593E-08 s/iter 72.953928 +gpu 0 iter : 20 Arret : 2.22162E-10 s/iter 72.808169 +gpu 0 iter : 21 Arret : 3.30983E-12 s/iter 72.824788 +gpu 0 iter : 22 Arret : 4.92853E-14 s/iter 72.871341 +temps : 1621.79 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.65132E-08 +Stabilite : 4.92853E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841476| 1.00001| 4.82795E-10 +i* 3.31212E-09| +| 2| 0.52971 +i* 0.848174| 0.999996|-2.56639E-12 +i*-3.27674E-11| +| 3| 0.524361 +i* 0.851491| 0.999996|-2.47296E-11 +i* 1.78327E-11| +| 4| 0.519019 +i* 0.854758| 0.999996|-1.39375E-11 +i* 5.79731E-12| +| 5| 0.513629 +i* 0.858008| 0.999996| 2.32483E-11 +i* 6.70747E-12| +| 6| 0.508237 +i* 0.861213| 0.999996|-1.34339E-11 +i* 9.87854E-12| +| 7| 0.502834 +i* 0.864379| 0.999996|-2.85585E-11 +i* 6.91519E-12| +| 8| 0.497384 +i* 0.867526| 0.999996| 2.97429E-11 +i*-6.06626E-13| +| 9| 0.491942 +i* 0.870624| 0.999996| -1.9825E-11 +i*-1.52329E-11| +| 10| 0.486452 +i* 0.873703| 0.999996| 3.0312E-11 +i* 1.02214E-11| +| 11| 0.480962 +i* 0.876737| 0.999996| 1.81546E-11 +i* 8.04012E-12| +| 12| 0.475453 +i* 0.879736| 0.999996| 3.09861E-11 +i* 4.093E-12| +| 13| 0.469917 +i* 0.882706| 0.999996|-1.29106E-11 +i*-2.31489E-11| +| 14| 0.46438 +i* 
0.885632| 0.999996| 1.33844E-11 +i*-1.06731E-12| +| 15| 0.458797 +i* 0.888537| 0.999996| 2.78862E-11 +i* 1.10441E-11| +| 16| 0.453214 +i* 0.891397| 0.999996| 2.45506E-11 +i* 3.1726E-11| +| 17| 0.447623 +i* 0.894218| 0.999996| 3.85803E-11 +i* 3.3129E-11| +| 18| 0.441986 +i* 0.897017| 0.999996| 2.72476E-11 +i* 3.22485E-11| +| 19| 0.43636 +i* 0.899768| 0.999996| 3.23241E-12 +i* 9.4037E-12| +| 20| 0.430689 +i* 0.902496| 0.999996|-1.25435E-11 +i* 3.86925E-13| ++---+----------------------------+------------+----------------------------+ +400000 racines de module = 1.00001 +600000 racines de module = 0.999996 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^700000 + (1 +i*0)*x^1200000 + +(-50000 +i*0)*x^499999 + (-7E+06 +i*0)*x^699999 + (1.2E+06 +i*0)*x^1199999 + +zone limite de 'log-exp' 1.0003 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 0 dimgrid2 4688 start 0 size 1200128 +gpu 0 iter : 1 Arret : 0.0182376 s/iter 104.837597 +gpu 0 iter : 2 Arret : 1.12373 s/iter 108.563668 +gpu 0 iter : 3 Arret : 0.426381 s/iter 110.022983 +gpu 0 iter : 4 Arret : 0.721244 s/iter 111.488820 +gpu 0 iter : 5 Arret : 1.17091 s/iter 111.916174 +gpu 0 iter : 6 Arret : 0.351155 s/iter 112.354360 +gpu 0 iter : 7 Arret : 0.375654 s/iter 113.067528 +gpu 0 iter : 8 Arret : 1.04032 s/iter 113.381487 +gpu 0 iter : 9 Arret : 1.12875 s/iter 114.128347 +gpu 0 iter : 10 Arret : 12.358 s/iter 114.591594 +gpu 0 iter : 11 Arret : 1.18398 s/iter 114.167437 +gpu 0 iter : 12 Arret : 4.45048 s/iter 113.754284 +gpu 0 iter : 13 Arret : 5.09703 s/iter 112.914247 +gpu 0 iter : 14 Arret : 1.04453 s/iter 112.076259 +gpu 0 iter : 15 Arret : 3.05711 s/iter 111.467739 +gpu 0 iter : 16 Arret : 0.859735 s/iter 110.945464 +gpu 0 iter : 17 Arret : 4.25309 s/iter 110.793391 +gpu 0 iter : 18 Arret : 0.893951 s/iter 110.388272 +gpu 0 iter : 19 Arret : 0.603038 s/iter 110.132291 +gpu 0 iter : 20 Arret : 3.09335 s/iter 109.413247 +gpu 0 iter : 21 Arret : 1.28616 s/iter 
109.106140 +gpu 0 iter : 22 Arret : 2.25952 s/iter 109.082492 +gpu 0 iter : 23 Arret : 1.67614 s/iter 108.802369 +gpu 0 iter : 24 Arret : 0.645561 s/iter 108.387380 +gpu 0 iter : 25 Arret : 0.661038 s/iter 108.106268 +gpu 0 iter : 26 Arret : 0.728448 s/iter 107.627940 +gpu 0 iter : 27 Arret : 0.456849 s/iter 107.304474 +gpu 0 iter : 28 Arret : 0.254278 s/iter 106.811137 +gpu 0 iter : 29 Arret : 0.111958 s/iter 106.339104 +gpu 0 iter : 30 Arret : 0.0531874 s/iter 105.891059 +gpu 0 iter : 31 Arret : 0.0531871 s/iter 105.523621 +gpu 0 iter : 32 Arret : 0.013254 s/iter 105.034027 +gpu 0 iter : 33 Arret : 0.00334602 s/iter 104.894966 +gpu 0 iter : 34 Arret : 0.00027649 s/iter 104.840988 +gpu 0 iter : 35 Arret : 1.17344E-07 s/iter 104.858305 +gpu 0 iter : 36 Arret : 4.79311E-10 s/iter 104.840632 +gpu 0 iter : 37 Arret : 1.90774E-12 s/iter 104.820758 +gpu 0 iter : 38 Arret : 8.88875E-15 s/iter 104.804403 +temps : 4148.3 seconde(s) +Nb iterations : 38 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.76717E-08 +Stabilite : 8.88875E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540312 +i* 0.841461| 0.999997|-2.16913E-11 +i* 1.91294E-11| +| 2| 0.513645 +i* 0.857999| 0.999997|-6.29718E-12 +i*-2.39364E-12| +| 3| 0.486457 +i* 0.873701| 0.999997| 1.53235E-11 +i* 6.36435E-13| +| 4| 0.458797 +i* 0.888537| 0.999997| 1.72345E-11 +i* 1.48229E-11| +| 5| 0.430698 +i* 0.902501| 1| 9.83414E-09 +i*-4.46881E-09| +| 6| 0.402138 +i* 0.915584| 1|-5.37264E-09 +i* 9.04446E-09| +| 7| 0.3732 +i* 0.927747| 0.999997|-1.54374E-11 +i*-2.76083E-11| +| 8| 0.3439 +i* 0.939003| 0.999997|-1.12714E-11 +i* 1.5453E-11| +| 9| 0.314261 +i* 0.949333| 0.999997| 1.93628E-11 +i* 2.50909E-11| +| 10| 0.284313 +i* 0.958728| 0.999997| 2.69426E-11 +i* 2.77974E-11| +| 11| 0.254084 +i* 0.967179| 0.999997| 1.5277E-11 +i* 4.73027E-12| +| 12| 0.223605 +i* 
0.974676| 0.999997| -8.1017E-11 +i*-3.77299E-11| +| 13| 0.192915 +i* 0.981212| 0.999997| 1.07495E-11 +i* 5.766E-12| +| 14| 0.162034 +i* 0.986782| 0.999997| 3.99512E-11 +i* 6.63664E-12| +| 15| 0.130977 +i* 0.991382| 0.999997| 5.89659E-11 +i* 7.29122E-12| +| 16| 0.0997987 +i* 0.995004| 0.999997|-2.34084E-11 +i*-4.34534E-12| +| 17| 0.0685225 +i* 0.997646| 0.999997| 2.33641E-11 +i* 2.51787E-12| +| 18| 0.0371629 +i* 0.999314| 1| 1.55887E-09 +i*-4.23222E-09| +| 19| 0.00578048 +i* 0.99998| 0.999997| 3.46787E-11 +i* 1.94857E-13| +| 20| -0.0256056 +i* 0.999669| 0.999997| 2.01068E-11 +i*-1.22213E-12| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 0.999997 +500000 racines de module = 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^600000 + (-10 +i*0)*x^800000 + (1 +i*0)*x^1400000 + +(-60000 +i*0)*x^599999 + (-8E+06 +i*0)*x^799999 + (1.4E+06 +i*0)*x^1399999 + +zone limite de 'log-exp' 1.00025 +CPU thread 0 (of 1) uses CUDA device 0 +gpu 0 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 0 dimgrid2 5469 start 0 size 1400064 +gpu 0 iter : 1 Arret : 0.00928965 s/iter 142.375846 +gpu 0 iter : 2 Arret : 0.576413 s/iter 147.373084 +gpu 0 iter : 3 Arret : 0.762551 s/iter 150.232559 +gpu 0 iter : 4 Arret : 1.07413 s/iter 151.768093 +gpu 0 iter : 5 Arret : 0.0991065 s/iter 153.056251 +gpu 0 iter : 6 Arret : 0.123507 s/iter 152.742000 +gpu 0 iter : 7 Arret : 0.136183 s/iter 152.857808 +gpu 0 iter : 8 Arret : 0.113786 s/iter 152.881427 +gpu 0 iter : 9 Arret : 0.0800623 s/iter 152.835777 +gpu 0 iter : 10 Arret : 0.0571798 s/iter 151.922898 +gpu 0 iter : 11 Arret : 0.0727241 s/iter 150.276395 +gpu 0 iter : 12 Arret : 0.0702862 s/iter 147.770220 +gpu 0 iter : 13 Arret : 0.0246309 s/iter 145.850735 +gpu 0 iter : 14 Arret : 0.0213611 s/iter 144.099565 +gpu 0 iter : 15 Arret : 0.0247135 s/iter 143.346943 +gpu 0 iter : 16 Arret : 0.0164575 s/iter 142.914262 +gpu 0 iter : 17 Arret : 0.00452215 s/iter 142.729324 +gpu 0 iter : 18 Arret : 0.00260492 s/iter 
142.530031 +gpu 0 iter : 19 Arret : 0.000151029 s/iter 142.510219 +gpu 0 iter : 20 Arret : 1.40988E-06 s/iter 142.510180 +gpu 0 iter : 21 Arret : 1.38776E-08 s/iter 142.480080 +gpu 0 iter : 22 Arret : 1.91581E-10 s/iter 142.453226 +gpu 0 iter : 23 Arret : 2.63708E-12 s/iter 142.412633 +gpu 0 iter : 24 Arret : 3.63243E-14 s/iter 142.487841 +temps : 3523.14 seconde(s) +Nb iterations : 24 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.65661E-08 +Stabilite : 3.63243E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841469| 0.999997|-8.47142E-11 +i* 1.92466E-11| +| 2| 0.513623 +i* 0.858013| 0.999997|-2.15776E-11 +i*-2.98557E-11| +| 3| -0.52703 +i* -0.849843| 0.999997|-6.50922E-11 +i* 8.44216E-12| +| 4| 0.486439 +i* 0.873711| 0.999997| 5.60277E-11 +i* 4.36779E-11| +| 5| -0.500096 +i* -0.865967| 0.999997| 3.56147E-11 +i*-3.12713E-11| +| 6| 0.458776 +i* 0.888549| 0.999997|-1.89702E-11 +i* 4.08274E-12| +| 7| -0.472669 +i* -0.881237| 0.999997|-1.66496E-11 +i*-3.61498E-11| +| 8| 0.430661 +i* 0.902511| 0.999997|-1.60558E-11 +i*-1.29949E-11| +| 9| -0.444791 +i* -0.895631| 0.999997| 3.68259E-11 +i* 1.36002E-12| +| 10| 0.402136 +i* 0.915577| 0.999997| 6.5834E-12 +i* -1.3935E-11| +| 11| -0.416439 +i* -0.90916| 0.999997|-1.66807E-11 +i* 2.56219E-11| +| 12| 0.373179 +i* 0.927756| 0.999997| 2.89372E-11 +i*-2.61371E-11| +| 13| -0.387698 +i* -0.921783| 0.999997|-1.86324E-11 +i* -4.6545E-11| +| 14| 0.343875 +i* 0.939012| 0.999997| 3.06317E-11 +i* 7.08794E-11| +| 15| -0.358575 +i* -0.933498| 0.999997|-4.93405E-11 +i*-7.15173E-13| +| 16| 0.314233 +i* 0.949343| 0.999997| 3.86503E-11 +i* 2.08775E-11| +| 17| -0.329098 +i* -0.944293| 0.999997|-1.57903E-11 +i* 2.05052E-11| +| 18| 0.284281 +i* 0.958738| 0.999997| 2.51592E-11 +i* 2.09243E-11| +| 19| -0.299297 +i* -0.954157| 0.999997| 5.03608E-12 +i* 1.70503E-11| +| 20| 
0.254048 +i* 0.967189| 0.999997|-2.81228E-11 +i*-1.66302E-11| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 0.999997 +600000 racines de module = 1 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140100: line 23: 13069 Segmentation fault (core dumped) ./template -r -i 900000 700000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140100: line 24: 13073 Segmentation fault (core dumped) ./template -r -i 1000000 800000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140100: line 25: 13075 Segmentation fault (core dumped) ./template -r -i 1500000 500000 diff --git a/Simulations/sparse_openmp/sparse_openmp_1GPU.sge b/Simulations/sparse_openmp/sparse_openmp_1GPU.sge new file mode 100644 index 0000000..ceb97b1 --- /dev/null +++ b/Simulations/sparse_openmp/sparse_openmp_1GPU.sge @@ -0,0 +1,27 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=1 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -pe openmp 1 +#$ -V +#$ -cwd +#$ -N sparse_openmp_1GPU + +module load gcc/4.9.0 +module load cuda/7.0 +export OMP_NUM_THREADS=1 + +./template -r -i 60000 40000 +./template -r -i 150000 50000 +./template -r -i 250000 150000 +./template -r -i 350000 250000 +./template -r -i 500000 300000 +./template -r -i 600000 400000 +./template -r -i 700000 500000 +./template -r -i 800000 600000 +./template -r -i 900000 700000 +./template -r -i 1000000 800000 +./template -r -i 1500000 500000 + + diff --git a/Simulations/sparse_openmp/sparse_openmp_2GPU.o140099 b/Simulations/sparse_openmp/sparse_openmp_2GPU.o140099 new file mode 100644 index 0000000..b18a418 --- /dev/null +++ b/Simulations/sparse_openmp/sparse_openmp_2GPU.o140099 @@ -0,0 +1,534 @@ +REMAINING: 2 +Taking GPU #0 +Taking GPU #1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^40000 + (-10 +i*0)*x^60000 + (1 +i*0)*x^100000 + +(-4000 +i*0)*x^39999 + (-600000 +i*0)*x^59999 + (100000 +i*0)*x^99999 + +zone limite de 'log-exp' 1.00356 +CPU thread 1 (of 2) uses CUDA device 1 +CPU thread 0 (of 2) uses CUDA device 0 
+gpu 0 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 0 dimgrid2 196 start 0 size 50048 +gpu 1 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 1 dimgrid2 196 start 50048 size 50048 +gpu 0 iter : 1 Arret : 0.00380313 s/iter 0.441566 +gpu 0 iter : 2 Arret : 0.00367222 s/iter 0.441506 +gpu 0 iter : 3 Arret : 0.00329063 s/iter 0.441545 +gpu 0 iter : 4 Arret : 0.00599232 s/iter 0.441517 +gpu 0 iter : 5 Arret : 0.00559475 s/iter 0.441533 +gpu 0 iter : 6 Arret : 0.0062995 s/iter 0.441538 +gpu 0 iter : 7 Arret : 0.00458799 s/iter 0.441558 +gpu 0 iter : 8 Arret : 0.00622521 s/iter 0.441510 +gpu 0 iter : 9 Arret : 0.0073983 s/iter 0.439550 +gpu 0 iter : 10 Arret : 0.00804763 s/iter 0.441536 +gpu 0 iter : 11 Arret : 0.00548469 s/iter 0.441528 +gpu 0 iter : 12 Arret : 0.00120813 s/iter 0.441416 +gpu 0 iter : 13 Arret : 0.000406962 s/iter 0.441414 +gpu 0 iter : 14 Arret : 0.00112455 s/iter 0.441391 +gpu 0 iter : 15 Arret : 0.000729656 s/iter 0.441398 +gpu 0 iter : 16 Arret : 6.06095E-06 s/iter 0.441340 +gpu 0 iter : 17 Arret : 1.51135E-08 s/iter 0.441471 +gpu 0 iter : 18 Arret : 4.78213E-11 s/iter 0.441372 +gpu 0 iter : 19 Arret : 1.51316E-13 s/iter 0.441309 +temps : 9.12342 seconde(s) +Nb iterations : 19 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.21439E-09 +Stabilite : 1.51316E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54036 +i* 0.841503| 1.00006|-5.00602E-11 +i* 9.0853E-12| +| 2| -0.113164 +i* 0.993538| 0.999962|-4.34919E-12 +i* 9.60242E-13| +| 3| -0.226732 +i* -0.974016| 1.00006|-1.34468E-09 +i*-3.70749E-10| +| 4| -0.715763 +i* 0.698289| 0.999962| 9.11271E-13 +i* 2.47219E-12| +| 5| 0.439922 +i* -0.897993| 0.999962|-3.49498E-13 +i* 1.66432E-12| +| 6| -0.996122 +i* 0.0886386| 1.00006| 4.72785E-10 +i* 4.13616E-11| +| 7| 0.908546 +i* -0.417692| 0.999962| 4.78506E-13 +i* 1.54377E-13| +| 8| -0.827813 +i* 
-0.560935| 0.999962| 9.76996E-13 +i*-2.04309E-12| +| 9| 0.968129 +i* 0.250682| 1.00006| 1.35693E-10 +i*-3.47657E-10| +| 10| -0.286842 +i* -0.958038| 1.00006|-5.93554E-10 +i*-2.45345E-10| +| 11| 0.591653 +i* 0.806145| 0.999962|-9.87654E-13 +i*-3.03635E-12| +| 12| -0.0511836 +i* 0.998651| 0.999962|-2.22622E-12 +i*-3.69013E-14| +| 13| -0.67097 +i* 0.741432| 0.999962|-8.03801E-14 +i*-1.68204E-12| +| 14| 0.383249 +i* -0.923603| 0.999962|-1.29119E-12 +i*-1.37426E-12| +| 15| -0.988685 +i* 0.15039| 1.00006|-1.61051E-10 +i* 7.18515E-11| +| 16| 0.880824 +i* -0.473363| 0.999962| 1.58029E-12 +i*-2.34379E-12| +| 17| -0.861082 +i* -0.508391| 0.999962| 1.02962E-12 +i*-4.51911E-12| +| 18| 0.981895 +i* 0.189225| 0.999962|-4.05187E-12 +i* 1.36536E-13| +| 19| -0.345842 +i* -0.938354| 1.00006| 1.38421E-10 +i*-2.31696E-10| +| 20| 0.640621 +i* 0.767807| 0.999962|-6.98774E-13 +i* 1.13798E-12| ++---+----------------------------+------------+----------------------------+ +40000 racines de module = 1.00006 +60000 racines de module = 0.999962 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^50000 + (-10 +i*0)*x^150000 + (1 +i*0)*x^200000 + +(-5000 +i*0)*x^49999 + (-1.5E+06 +i*0)*x^149999 + (200000 +i*0)*x^199999 + +zone limite de 'log-exp' 1.00178 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 1 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 1 dimgrid2 391 start 100096 size 100096 +gpu 0 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 0 dimgrid2 391 start 0 size 100096 +gpu 0 iter : 1 Arret : 0.000107626 s/iter 1.547978 +gpu 0 iter : 2 Arret : 9.81369E-05 s/iter 1.548082 +gpu 0 iter : 3 Arret : 0.000765995 s/iter 1.548065 +gpu 0 iter : 4 Arret : 0.000973277 s/iter 1.548057 +gpu 0 iter : 5 Arret : 0.00848586 s/iter 1.548089 +gpu 0 iter : 6 Arret : 0.0120973 s/iter 1.707264 +gpu 0 iter : 7 Arret : 0.029256 s/iter 1.698285 +gpu 0 iter : 8 Arret : 0.134426 s/iter 1.548025 +gpu 0 iter : 9 Arret : 0.152262 s/iter 1.549290 +gpu 0 iter : 10 Arret : 0.121741 s/iter 1.710977 +gpu 0 
iter : 11 Arret : 0.196968 s/iter 1.549235 +gpu 0 iter : 12 Arret : 0.832961 s/iter 1.703810 +gpu 0 iter : 13 Arret : 0.389199 s/iter 1.552020 +gpu 0 iter : 14 Arret : 0.303622 s/iter 1.712838 +gpu 0 iter : 15 Arret : 0.0708981 s/iter 1.549269 +gpu 0 iter : 16 Arret : 0.0516286 s/iter 1.547858 +gpu 0 iter : 17 Arret : 0.0237403 s/iter 1.547965 +gpu 0 iter : 18 Arret : 0.00575736 s/iter 1.548048 +gpu 0 iter : 19 Arret : 0.00016543 s/iter 1.547970 +gpu 0 iter : 20 Arret : 8.19796E-06 s/iter 1.547960 +gpu 0 iter : 21 Arret : 1.89926E-09 s/iter 1.548018 +gpu 0 iter : 22 Arret : 1.89968E-13 s/iter 1.548057 +temps : 35.62 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 9.49941E-05 +Stabilite : 5.04191E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540303 +i* 0.841453| 0.999985| 1.08703E-11 +i*-2.49217E-12| +| 2| -0.837195 +i* 0.546877| 0.999985| -5.4492E-12 +i* 1.09163E-12| +| 3| -0.553418 +i* -0.832885| 0.999985| -1.9722E-12 +i*-7.40397E-12| +| 4| 0.828599 +i* -0.559925| 1.00005|-7.54521E-09 +i* 1.47059E-08| +| 5| -0.8197 +i* 0.572767| 0.999985|-4.21663E-13 +i* -2.8616E-12| +| 6| -0.57917 +i* -0.815188| 0.999985|-5.13034E-12 +i*-1.52645E-12| +| 7| 0.810626 +i* -0.585537| 0.999985|-6.36846E-12 +i*-5.86797E-12| +| 8| 0.591872 +i* 0.806089| 1.00005|-1.69803E-09 +i* 9.43795E-09| +| 9| -0.801454 +i* 0.598134| 1.00005|-3.72767E-08 +i*-1.30274E-08| +| 10| -0.604356 +i* -0.796695| 0.999985|-1.64091E-13 +i* 1.59084E-12| +| 11| 0.791937 +i* -0.610578| 0.999985| 6.0707E-13 +i* 1.52922E-12| +| 12| 0.616763 +i* 0.78713| 0.999985|-4.48042E-12 +i* -2.6295E-12| +| 13| -0.782301 +i* 0.622877| 0.999985|-2.15827E-12 +i*-6.27114E-12| +| 14| -0.628991 +i* -0.777472| 1.00005| 6.93065E-09 +i*-8.65443E-09| +| 15| 0.772474 +i* -0.635023| 0.999985| 1.54783E-11 +i*-1.81338E-12| +| 16| 0.641054 +i* 
0.767476| 0.999985| 9.05009E-12 +i*-2.91295E-12| +| 17| -0.762458 +i* 0.647014| 0.999985| 5.81724E-12 +i*-9.99384E-12| +| 18| -0.652967 +i* -0.757366| 0.999985|-6.31406E-12 +i* 8.49495E-12| +| 19| 0.752302 +i* -0.658888| 1.00005| 3.99107E-09 +i* 1.02117E-08| +| 20| 0.66472 +i* 0.747072| 0.999985|-7.79776E-12 +i*-2.52076E-13| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 0.999985 +50000 racines de module = 1.00005 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^150000 + (-10 +i*0)*x^250000 + (1 +i*0)*x^400000 + +(-15000 +i*0)*x^149999 + (-2.5E+06 +i*0)*x^249999 + (400000 +i*0)*x^399999 + +zone limite de 'log-exp' 1.00089 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 0 dimgrid2 782 start 0 size 200064 +gpu 1 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 1 dimgrid2 782 start 200064 size 200064 +gpu 0 iter : 1 Arret : 0.000533421 s/iter 6.081044 +gpu 0 iter : 2 Arret : 0.00294166 s/iter 6.077042 +gpu 0 iter : 3 Arret : 0.00816274 s/iter 6.076551 +gpu 0 iter : 4 Arret : 0.0970896 s/iter 6.051363 +gpu 0 iter : 5 Arret : 0.1861 s/iter 6.117092 +gpu 0 iter : 6 Arret : 0.205221 s/iter 6.087839 +gpu 0 iter : 7 Arret : 0.0897097 s/iter 6.084694 +gpu 0 iter : 8 Arret : 0.0591358 s/iter 6.078173 +gpu 0 iter : 9 Arret : 0.023858 s/iter 6.079091 +gpu 0 iter : 10 Arret : 0.00304425 s/iter 6.076912 +gpu 0 iter : 11 Arret : 0.00136708 s/iter 6.063903 +gpu 0 iter : 12 Arret : 0.000789721 s/iter 6.076452 +gpu 0 iter : 13 Arret : 0.00195862 s/iter 6.078631 +gpu 0 iter : 14 Arret : 0.00243823 s/iter 6.075599 +gpu 0 iter : 15 Arret : 0.000282668 s/iter 6.076158 +gpu 0 iter : 16 Arret : 4.27745E-05 s/iter 6.075788 +gpu 0 iter : 17 Arret : 4.20725E-06 s/iter 6.077506 +gpu 0 iter : 18 Arret : 1.6828E-08 s/iter 6.078853 +gpu 0 iter : 19 Arret : 3.63614E-11 s/iter 6.079236 +gpu 0 iter : 20 Arret : 1.38589E-13 s/iter 6.077430 +temps : 122.327 seconde(s) +Nb 
iterations : 20 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.45366E-07 +Stabilite : 1.02274E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540319 +i* 0.841478| 1.00002|-2.32809E-09 +i* 1.97672E-09| +| 2| -0.998329 +i* 0.057622| 0.999991| 4.43912E-12 +i* 1.27665E-12| +| 3| 0.43989 +i* -0.898041| 0.999991|-2.08855E-12 +i*-1.75276E-12| +| 4| -0.996033 +i* 0.0888768| 0.999991|-3.15592E-12 +i* 1.17456E-12| +| 5| 0.411533 +i* -0.911385| 0.999991|-2.45048E-12 +i* 4.6238E-12| +| 6| 0.59196 +i* 0.805956| 0.999991| 5.24358E-13 +i*-8.53073E-12| +| 7| -0.992759 +i* 0.120044| 0.999991| 2.58804E-12 +i* 2.47274E-12| +| 8| 0.382796 +i* -0.923823| 0.999991| 1.11042E-11 +i*-9.27687E-12| +| 9| 0.616925 +i* 0.78701| 0.999991| 4.27514E-12 +i*-1.13966E-11| +| 10| -0.98851 +i* 0.151094| 0.999991|-1.29017E-11 +i*-4.43427E-12| +| 11| 0.35366 +i* -0.935364| 0.999991|-1.92664E-11 +i* 1.19958E-11| +| 12| 0.641283 +i* 0.767292| 0.999991|-4.70735E-12 +i* -1.4127E-11| +| 13| -0.98329 +i* 0.181995| 0.999991|-6.62759E-12 +i*-5.46796E-12| +| 14| 0.324176 +i* -0.945987| 0.999991|-5.20695E-12 +i*-7.06984E-12| +| 15| 0.665012 +i* 0.746821| 0.999991| 5.27178E-12 +i*-4.27913E-12| +| 16| -0.977104 +i* 0.212717| 0.999991|-1.01148E-11 +i* 2.41479E-12| +| 17| 0.294374 +i* -0.955681| 0.999991|-2.37395E-11 +i*-2.53098E-12| +| 18| 0.688087 +i* 0.725616| 0.999991| 6.67011E-12 +i* 1.57173E-11| +| 19| -0.969965 +i* 0.243206| 0.999991| 6.88072E-12 +i* 3.20268E-13| +| 20| 0.264283 +i* -0.964436| 0.999991|-6.93356E-12 +i*-6.23118E-12| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 1.00002 +250000 racines de module = 0.999991 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^250000 + (-10 +i*0)*x^350000 + (1 +i*0)*x^600000 + +(-25000 +i*0)*x^249999 + (-3.5E+06 +i*0)*x^349999 + (600000 +i*0)*x^599999 + +zone 
limite de 'log-exp' 1.00059 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 1172 start 0 size 300032 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 1172 start 300032 size 300032 +gpu 0 iter : 1 Arret : 0.00183894 s/iter 13.264868 +gpu 0 iter : 2 Arret : 0.00332589 s/iter 13.263027 +gpu 0 iter : 3 Arret : 0.0778545 s/iter 13.329862 +gpu 0 iter : 4 Arret : 0.134953 s/iter 13.784249 +gpu 0 iter : 5 Arret : 0.100777 s/iter 14.153947 +gpu 0 iter : 6 Arret : 0.107368 s/iter 13.911608 +gpu 0 iter : 7 Arret : 0.112184 s/iter 13.982400 +gpu 0 iter : 8 Arret : 0.0819523 s/iter 13.863669 +gpu 0 iter : 9 Arret : 0.0470621 s/iter 13.750970 +gpu 0 iter : 10 Arret : 0.0265395 s/iter 13.686381 +gpu 0 iter : 11 Arret : 0.0114418 s/iter 13.768352 +gpu 0 iter : 12 Arret : 0.0132102 s/iter 13.687711 +gpu 0 iter : 13 Arret : 0.0107799 s/iter 13.263263 +gpu 0 iter : 14 Arret : 0.00702915 s/iter 13.271004 +gpu 0 iter : 15 Arret : 0.00272883 s/iter 13.265259 +gpu 0 iter : 16 Arret : 0.000385595 s/iter 13.264764 +gpu 0 iter : 17 Arret : 0.000332015 s/iter 13.264693 +gpu 0 iter : 18 Arret : 0.000909613 s/iter 13.264925 +gpu 0 iter : 19 Arret : 9.10926E-07 s/iter 13.264547 +gpu 0 iter : 20 Arret : 4.37366E-09 s/iter 13.265195 +gpu 0 iter : 21 Arret : 1.73951E-11 s/iter 13.264664 +gpu 0 iter : 22 Arret : 6.9226E-14 s/iter 13.264587 +temps : 297.898 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.80963E-08 +Stabilite : 6.9226E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540302 +i* 0.841463| 0.999993| 8.34199E-12 +i* -1.9051E-11| +| 2| -0.553438 +i* -0.832883| 0.999993|-2.10654E-12 +i*-2.55273E-11| +| 3| -0.579282 +i* -0.815119| 0.999993|-1.44751E-12 +i* 7.66798E-12| +| 4| 0.592012 
+i* 0.805941| 1.00001| 4.1526E-09 +i* 1.02046E-09| +| 5| -0.604557 +i* -0.796554| 0.999993|-2.82974E-12 +i* 9.99473E-12| +| 6| 0.61698 +i* 0.78697| 0.999993|-4.77973E-12 +i* 2.40621E-11| +| 7| -0.629237 +i* -0.777205| 0.999993|-2.92122E-12 +i*-4.85867E-12| +| 8| 0.641354 +i* 0.767237| 0.999993|-1.64209E-11 +i* 1.12904E-12| +| 9| -0.653299 +i* -0.757092| 0.999993|-8.22453E-13 +i* 2.82818E-12| +| 10| 0.665096 +i* 0.746749| 0.999993| -1.2145E-11 +i* 1.89129E-11| +| 11| -0.676717 +i* -0.736234| 0.999993|-1.26079E-11 +i*-1.25073E-11| +| 12| 0.688185 +i* 0.725526| 0.999993|-4.43978E-12 +i*-2.31382E-11| +| 13| -0.699466 +i* -0.714679| 1.00001| 3.92343E-10 +i*-3.02623E-09| +| 14| 0.710597 +i* 0.70359| 0.999993| -2.6851E-11 +i*-1.44801E-11| +| 15| -0.721524 +i* -0.69238| 0.999993| 2.63193E-11 +i*-6.76318E-13| +| 16| 0.73231 +i* 0.680962| 0.999993| 1.34706E-11 +i*-4.43489E-12| +| 17| -0.742928 +i* -0.669362| 0.999993| 3.04134E-12 +i*-9.84154E-12| +| 18| 0.7533 +i* 0.657691| 1.00001|-2.76219E-09 +i* 4.10298E-09| +| 19| -0.76354 +i* -0.64575| 0.999993| 2.24043E-11 +i*-1.30496E-12| +| 20| 0.773543 +i* 0.633733| 0.999993| 6.56308E-12 +i* 2.27492E-11| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 0.999993 +250000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^300000 + (-10 +i*0)*x^500000 + (1 +i*0)*x^800000 + +(-30000 +i*0)*x^299999 + (-5E+06 +i*0)*x^499999 + (800000 +i*0)*x^799999 + +zone limite de 'log-exp' 1.00044 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 1563 start 400000 size 400000 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 1563 start 0 size 400000 +gpu 0 iter : 1 Arret : 0.000985945 s/iter 23.676133 +gpu 0 iter : 2 Arret : 0.00575711 s/iter 23.813100 +gpu 0 iter : 3 Arret : 0.80372 s/iter 23.766696 +gpu 0 iter : 4 Arret : 1.12755 s/iter 23.828097 +gpu 0 iter : 5 Arret : 0.927252 
s/iter 23.871271 +gpu 0 iter : 6 Arret : 1.8727 s/iter 23.858341 +gpu 0 iter : 7 Arret : 1.02108 s/iter 24.362443 +gpu 0 iter : 8 Arret : 0.40485 s/iter 24.813205 +gpu 0 iter : 9 Arret : 0.204025 s/iter 24.848475 +gpu 0 iter : 10 Arret : 0.322307 s/iter 24.766030 +gpu 0 iter : 11 Arret : 0.966794 s/iter 24.450352 +gpu 0 iter : 12 Arret : 0.519786 s/iter 24.347418 +gpu 0 iter : 13 Arret : 0.209179 s/iter 24.204030 +gpu 0 iter : 14 Arret : 0.0738373 s/iter 23.789427 +gpu 0 iter : 15 Arret : 0.0394797 s/iter 23.786761 +gpu 0 iter : 16 Arret : 0.0224964 s/iter 23.792150 +gpu 0 iter : 17 Arret : 0.0104646 s/iter 23.802294 +gpu 0 iter : 18 Arret : 0.00882482 s/iter 23.804999 +gpu 0 iter : 19 Arret : 0.000586803 s/iter 23.663425 +gpu 0 iter : 20 Arret : 1.2904E-06 s/iter 23.667331 +gpu 0 iter : 21 Arret : 2.17443E-08 s/iter 23.669417 +gpu 0 iter : 22 Arret : 3.31651E-10 s/iter 23.663042 +gpu 0 iter : 23 Arret : 5.05742E-12 s/iter 23.667395 +gpu 0 iter : 24 Arret : 7.71156E-14 s/iter 23.671701 +temps : 576.437 seconde(s) +Nb iterations : 24 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.80859E-08 +Stabilite : 7.7914E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841464| 0.999995|-5.33817E-12 +i*-1.81878E-11| +| 2| 0.592014 +i* 0.805922| 0.999995|-1.82734E-11 +i* 2.10218E-11| +| 3| 0.617007 +i* 0.786952| 0.999995| 4.23442E-11 +i* -6.2147E-12| +| 4| 0.641392 +i* 0.767207| 0.999995|-4.99742E-11 +i* 1.43873E-11| +| 5| 0.665146 +i* 0.746707| 0.999995| 2.02977E-11 +i* 7.48579E-12| +| 6| 0.688245 +i* 0.725472| 0.999995|-1.73153E-11 +i* -1.2656E-11| +| 7| 0.710667 +i* 0.703522| 0.999995| 3.69782E-12 +i* 2.3081E-12| +| 8| 0.732388 +i* 0.68088| 0.999995| 9.45355E-12 +i* 2.09024E-11| +| 9| 0.753381 +i* 0.657577| 0.999995|-1.40248E-11 +i* 5.11502E-11| +| 10| 0.77364 +i* 0.633618| 0.999995|-1.72307E-11 +i* 
1.22723E-11| +| 11| 0.793138 +i* 0.609034| 0.999995| 3.89222E-12 +i* 2.21356E-11| +| 12| 0.811855 +i* 0.583851| 0.999995|-1.28337E-11 +i*-5.47207E-12| +| 13| 0.829772 +i* 0.558094| 0.999995|-1.63114E-11 +i*-1.64246E-12| +| 14| 0.846873 +i* 0.531786| 0.999995|-1.80345E-12 +i* 5.96675E-11| +| 15| 0.86314 +i* 0.504956| 0.999995|-4.00413E-12 +i* 3.04823E-11| +| 16| 0.878557 +i* 0.477628| 0.999995|-2.16493E-12 +i* 1.10533E-11| +| 17| 0.893104 +i* 0.449841| 0.999995|-1.48552E-11 +i* 1.06063E-11| +| 18| 0.906777 +i* 0.4216| 0.999995|-1.38745E-11 +i* 5.33384E-12| +| 19| 0.919557 +i* 0.392944| 0.999995| 4.13796E-11 +i*-2.48189E-11| +| 20| 0.931433 +i* 0.363901| 0.999995| 4.93219E-11 +i*-2.82651E-11| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 0.999995 +300000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^400000 + (-10 +i*0)*x^600000 + (1 +i*0)*x^1000000 + +(-40000 +i*0)*x^399999 + (-6E+06 +i*0)*x^599999 + (1E+06 +i*0)*x^999999 + +zone limite de 'log-exp' 1.00035 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 0 dimgrid2 1954 start 0 size 500096 +gpu 1 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 1 dimgrid2 1954 start 500096 size 500096 +gpu 0 iter : 1 Arret : 0.000661333 s/iter 36.538739 +gpu 0 iter : 2 Arret : 0.00112864 s/iter 36.545395 +gpu 0 iter : 3 Arret : 0.00370767 s/iter 36.541300 +gpu 0 iter : 4 Arret : 0.00748235 s/iter 37.223998 +gpu 0 iter : 5 Arret : 0.0147148 s/iter 37.021293 +gpu 0 iter : 6 Arret : 0.0212816 s/iter 37.146418 +gpu 0 iter : 7 Arret : 0.00895178 s/iter 37.219267 +gpu 0 iter : 8 Arret : 0.00887668 s/iter 37.316626 +gpu 0 iter : 9 Arret : 0.00504713 s/iter 36.647500 +gpu 0 iter : 10 Arret : 0.00709815 s/iter 37.285606 +gpu 0 iter : 11 Arret : 0.00694487 s/iter 36.891551 +gpu 0 iter : 12 Arret : 0.00243476 s/iter 36.546690 +gpu 0 iter : 13 Arret : 0.00268555 s/iter 36.502800 +gpu 0 
iter : 14 Arret : 0.000904871 s/iter 36.508349 +gpu 0 iter : 15 Arret : 0.0005848 s/iter 36.503946 +gpu 0 iter : 16 Arret : 8.64186E-05 s/iter 36.503619 +gpu 0 iter : 17 Arret : 8.33778E-05 s/iter 36.511641 +gpu 0 iter : 18 Arret : 1.10486E-05 s/iter 36.503510 +gpu 0 iter : 19 Arret : 1.76382E-05 s/iter 36.534320 +gpu 0 iter : 20 Arret : 1.2926E-06 s/iter 36.537729 +gpu 0 iter : 21 Arret : 5.95413E-09 s/iter 36.503894 +gpu 0 iter : 22 Arret : 1.88485E-11 s/iter 36.540363 +gpu 0 iter : 23 Arret : 5.96427E-14 s/iter 36.541307 +temps : 850.208 seconde(s) +Nb iterations : 23 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.65132E-08 +Stabilite : 5.96427E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841468| 0.999996| 5.07216E-12 +i* 6.41236E-12| +| 2| 0.529701 +i* 0.84818| 0.999996|-4.61853E-13 +i*-4.17888E-12| +| 3| 0.524361 +i* 0.851491| 0.999996|-2.47296E-11 +i* 1.78327E-11| +| 4| 0.51901 +i* 0.854764| 0.999996| 9.45599E-12 +i* 2.07434E-11| +| 5| 0.513629 +i* 0.858008| 0.999996| 2.32483E-11 +i* 6.70747E-12| +| 6| 0.508237 +i* 0.861213| 0.999996|-1.34339E-11 +i* 9.87854E-12| +| 7| 0.502825 +i* 0.864384| 0.999996|-3.18459E-11 +i* 7.64744E-12| +| 8| 0.497384 +i* 0.867526| 0.999996| 1.87346E-11 +i* 4.7471E-11| +| 9| 0.491932 +i* 0.870629| 0.999996|-1.74121E-11 +i*-2.86359E-11| +| 10| 0.486452 +i* 0.873703| 0.999996| 3.0312E-11 +i* 1.02214E-11| +| 11| 0.480962 +i* 0.876737| 0.999996| 1.81546E-11 +i* 8.04012E-12| +| 12| 0.475453 +i* 0.879736| 0.999996| 3.09861E-11 +i* 4.093E-12| +| 13| 0.469917 +i* 0.882706| 0.999996|-1.29106E-11 +i*-2.31489E-11| +| 14| 0.46437 +i* 0.885637| 0.999996| 1.38481E-11 +i* -1.517E-11| +| 15| 0.458797 +i* 0.888537| 0.999996| 2.60997E-11 +i*-9.69844E-12| +| 16| 0.453214 +i* 0.891397| 0.999996| 2.45506E-11 +i* 3.1726E-11| +| 17| 0.447614 +i* 0.894223| 0.999996|-1.08491E-12 
+i*-2.12277E-11| +| 18| 0.441986 +i* 0.897017| 0.999996| 2.72476E-11 +i* 3.22485E-11| +| 19| 0.436351 +i* 0.899772| 0.999996|-1.24334E-11 +i*-2.66317E-11| +| 20| 0.430689 +i* 0.902496| 0.999996| 2.73914E-12 +i* 2.25153E-11| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 0.999996 +400000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^700000 + (1 +i*0)*x^1200000 + +(-50000 +i*0)*x^499999 + (-7E+06 +i*0)*x^699999 + (1.2E+06 +i*0)*x^1199999 + +zone limite de 'log-exp' 1.0003 +CPU thread 0 (of 2) uses CUDA device 0 +CPU thread 1 (of 2) uses CUDA device 1 +gpu 0 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 0 dimgrid2 2344 start 0 size 600064 +gpu 1 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 1 dimgrid2 2344 start 600064 size 600064 +gpu 0 iter : 1 Arret : 0.00780904 s/iter 52.957678 +gpu 0 iter : 2 Arret : 0.698753 s/iter 54.370408 +gpu 0 iter : 3 Arret : 0.512229 s/iter 55.903856 +gpu 0 iter : 4 Arret : 0.256495 s/iter 56.546686 +gpu 0 iter : 5 Arret : 0.481397 s/iter 56.384400 +gpu 0 iter : 6 Arret : 0.892443 s/iter 56.641431 +gpu 0 iter : 7 Arret : 1.58519 s/iter 56.603728 +gpu 0 iter : 8 Arret : 1.00461 s/iter 56.787414 +gpu 0 iter : 9 Arret : 0.667954 s/iter 56.936636 +gpu 0 iter : 10 Arret : 1.69048 s/iter 56.433809 +gpu 0 iter : 11 Arret : 0.673973 s/iter 56.247309 +gpu 0 iter : 12 Arret : 0.286904 s/iter 55.583712 +gpu 0 iter : 13 Arret : 0.809155 s/iter 54.972406 +gpu 0 iter : 14 Arret : 1.04967 s/iter 54.200475 +gpu 0 iter : 15 Arret : 0.767419 s/iter 54.073912 +gpu 0 iter : 16 Arret : 1.25055 s/iter 53.969523 +gpu 0 iter : 17 Arret : 0.313555 s/iter 53.619940 +gpu 0 iter : 18 Arret : 0.0612844 s/iter 53.103551 +gpu 0 iter : 19 Arret : 0.0812813 s/iter 53.087654 +gpu 0 iter : 20 Arret : 0.0798413 s/iter 52.895378 +gpu 0 iter : 21 Arret : 0.0193508 s/iter 52.929617 +gpu 0 iter : 22 Arret : 0.0112127 s/iter 52.923694 +gpu 0 iter : 23 Arret : 0.00926876 s/iter 
52.906420 +gpu 0 iter : 24 Arret : 0.00234025 s/iter 52.924598 +gpu 0 iter : 25 Arret : 0.000902467 s/iter 52.922805 +gpu 0 iter : 26 Arret : 2.88058E-05 s/iter 52.927734 +gpu 0 iter : 27 Arret : 3.35406E-07 s/iter 52.973958 +gpu 0 iter : 28 Arret : 1.39702E-09 s/iter 52.974028 +gpu 0 iter : 29 Arret : 8.02785E-12 s/iter 52.966681 +gpu 0 iter : 30 Arret : 1.1441E-13 s/iter 52.951515 +temps : 1631.66 seconde(s) +Nb iterations : 30 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.74574E-08 +Stabilite : 2.21335E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540304 +i* 0.841466| 0.999997| 3.08649E-11 +i* 2.05843E-11| +| 2| 0.513629 +i* 0.858008| 0.999997| 3.02357E-11 +i* 3.41858E-11| +| 3| 0.486451 +i* 0.873713| 1| 1.95054E-09 +i* 6.77633E-10| +| 4| 0.458805 +i* 0.888533| 0.999997| 1.78773E-11 +i* 1.55684E-11| +| 5| 0.43071 +i* 0.902487| 0.999997|-9.50928E-12 +i*-1.85143E-11| +| 6| 0.402126 +i* 0.915589| 1| 2.50282E-09 +i*-6.10471E-09| +| 7| 0.3732 +i* 0.927747| 0.999997| -2.5707E-11 +i* 3.11093E-13| +| 8| 0.3439 +i* 0.939003| 0.999997|-1.12714E-11 +i* 1.5453E-11| +| 9| 0.314261 +i* 0.949333| 0.999997| 1.93628E-11 +i* 2.50909E-11| +| 10| 0.284313 +i* 0.958728| 0.999997| 2.69426E-11 +i* 2.77974E-11| +| 11| 0.254084 +i* 0.967179| 0.999997| 1.5277E-11 +i* 4.73027E-12| +| 12| 0.223605 +i* 0.974676| 0.999997| -8.1017E-11 +i*-3.77299E-11| +| 13| 0.192909 +i* 0.981221| 1|-1.95729E-09 +i* 4.84549E-09| +| 14| 0.162017 +i* 0.986785| 0.999997| 4.59321E-12 +i*-4.42106E-13| +| 15| 0.130967 +i* 0.991391| 1|-1.93729E-10 +i*-4.06442E-10| +| 16| 0.0998077 +i* 0.995003| 0.999997| -4.5103E-11 +i*-6.66658E-12| +| 17| 0.0685225 +i* 0.997646| 0.999997| 2.33641E-11 +i* 2.51787E-12| +| 18| 0.0371504 +i* 0.999314| 1|-3.18728E-10 +i*-2.97119E-09| +| 19| 0.00578048 +i* 0.99998| 0.999997| 3.46787E-11 +i* 1.94857E-13| +| 20| 
-0.0256056 +i* 0.999669| 0.999997| 2.01068E-11 +i*-1.22213E-12| ++---+----------------------------+------------+----------------------------+ +700000 racines de module = 0.999997 +500000 racines de module = 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^600000 + (-10 +i*0)*x^800000 + (1 +i*0)*x^1400000 + +(-60000 +i*0)*x^599999 + (-8E+06 +i*0)*x^799999 + (1.4E+06 +i*0)*x^1399999 + +zone limite de 'log-exp' 1.00025 +CPU thread 1 (of 2) uses CUDA device 1 +CPU thread 0 (of 2) uses CUDA device 0 +gpu 1 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 1 dimgrid2 2735 start 700032 size 700032 +gpu 0 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 0 dimgrid2 2735 start 0 size 700032 +gpu 0 iter : 1 Arret : 0.00527111 s/iter 71.308499 +gpu 0 iter : 2 Arret : 0.172644 s/iter 72.713414 +gpu 0 iter : 3 Arret : 0.69639 s/iter 72.958242 +gpu 0 iter : 4 Arret : 1.18582 s/iter 75.255529 +gpu 0 iter : 5 Arret : 0.29345 s/iter 76.866618 +gpu 0 iter : 6 Arret : 0.163076 s/iter 77.369587 +gpu 0 iter : 7 Arret : 1.88246 s/iter 78.558083 +gpu 0 iter : 8 Arret : 1.71023 s/iter 77.826546 +gpu 0 iter : 9 Arret : 1.23231 s/iter 77.642649 +gpu 0 iter : 10 Arret : 0.367931 s/iter 79.759527 +gpu 0 iter : 11 Arret : 1.0997 s/iter 78.755024 +gpu 0 iter : 12 Arret : 2.11197 s/iter 77.725889 +gpu 0 iter : 13 Arret : 0.848296 s/iter 76.267112 +gpu 0 iter : 14 Arret : 0.433295 s/iter 75.435820 +gpu 0 iter : 15 Arret : 0.817759 s/iter 74.683488 +gpu 0 iter : 16 Arret : 0.767209 s/iter 74.057568 +gpu 0 iter : 17 Arret : 0.573024 s/iter 73.720984 +gpu 0 iter : 18 Arret : 0.597274 s/iter 73.499266 +gpu 0 iter : 19 Arret : 0.303085 s/iter 72.741656 +gpu 0 iter : 20 Arret : 0.180774 s/iter 72.806213 +gpu 0 iter : 21 Arret : 0.0722903 s/iter 72.559828 +gpu 0 iter : 22 Arret : 0.146427 s/iter 72.512488 +gpu 0 iter : 23 Arret : 0.129512 s/iter 72.128992 +gpu 0 iter : 24 Arret : 0.0402274 s/iter 71.576335 +gpu 0 iter : 25 Arret : 0.0124264 s/iter 71.526353 +gpu 0 iter : 26 Arret : 0.00203683 s/iter 71.463273 +gpu 0 iter 
: 27 Arret : 0.000373803 s/iter 71.462289 +gpu 0 iter : 28 Arret : 7.43881E-07 s/iter 71.336304 +gpu 0 iter : 29 Arret : 9.02153E-09 s/iter 71.333249 +gpu 0 iter : 30 Arret : 1.20401E-10 s/iter 71.481701 +gpu 0 iter : 31 Arret : 1.60504E-12 s/iter 71.339739 +gpu 0 iter : 32 Arret : 2.14019E-14 s/iter 71.437524 +temps : 2371.12 seconde(s) +Nb iterations : 32 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.65661E-08 +Stabilite : 5.97875E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841469| 0.999997| 5.65794E-11 +i*-4.66756E-12| +| 2| 0.513623 +i* 0.858013| 0.999997|-2.15776E-11 +i*-2.98557E-11| +| 3| -0.52703 +i* -0.849843| 0.999997|-8.72191E-12 +i* 2.97079E-11| +| 4| 0.486439 +i* 0.873711| 0.999997| 5.60277E-11 +i* 4.36779E-11| +| 5| -0.500096 +i* -0.865967| 0.999997| 3.56147E-11 +i*-3.12713E-11| +| 6| 0.458776 +i* 0.888549| 0.999997|-1.89702E-11 +i* 4.08274E-12| +| 7| -0.472669 +i* -0.881237| 0.999997|-1.66496E-11 +i*-3.61498E-11| +| 8| 0.430661 +i* 0.902511| 0.999997|-1.60558E-11 +i*-1.29949E-11| +| 9| -0.444791 +i* -0.895631| 0.999997| 3.68259E-11 +i* 1.36002E-12| +| 10| 0.402136 +i* 0.915577| 0.999997| 6.5834E-12 +i* -1.3935E-11| +| 11| -0.416432 +i* -0.909164| 0.999997| 1.97816E-11 +i* 3.10848E-11| +| 12| 0.373171 +i* 0.927759| 0.999997|-2.17995E-11 +i*-2.96867E-12| +| 13| -0.387698 +i* -0.921783| 0.999997|-1.86324E-11 +i* -4.6545E-11| +| 14| 0.343875 +i* 0.939012| 0.999997| 3.84962E-11 +i* 2.59646E-11| +| 15| -0.358575 +i* -0.933498| 0.999997| 8.13599E-11 +i*-1.42233E-11| +| 16| 0.314233 +i* 0.949343| 0.999997| 3.86503E-11 +i* 2.08775E-11| +| 17| -0.329098 +i* -0.944293| 0.999997|-1.57903E-11 +i* 2.05052E-11| +| 18| 0.284281 +i* 0.958738| 0.999997| 2.51592E-11 +i* 2.09243E-11| +| 19| -0.299297 +i* -0.954157| 0.999997| 5.03608E-12 +i* 1.70503E-11| +| 20| 0.254048 +i* 0.967189| 
0.999997|-2.81228E-11 +i*-1.66302E-11| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 0.999997 +600000 racines de module = 1 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140099: line 23: 12958 Segmentation fault (core dumped) ./template -r -i 900000 700000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140099: line 24: 12962 Segmentation fault (core dumped) ./template -r -i 1000000 800000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140099: line 25: 12964 Segmentation fault (core dumped) ./template -r -i 1500000 500000 diff --git a/Simulations/sparse_openmp/sparse_openmp_2GPU.sge b/Simulations/sparse_openmp/sparse_openmp_2GPU.sge new file mode 100644 index 0000000..769c2b7 --- /dev/null +++ b/Simulations/sparse_openmp/sparse_openmp_2GPU.sge @@ -0,0 +1,27 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=2 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -pe openmp 2 +#$ -V +#$ -cwd +#$ -N sparse_openmp_2GPU + +module load gcc/4.9.0 +module load cuda/7.0 +export OMP_NUM_THREADS=2 + +./template -r -i 60000 40000 +./template -r -i 150000 50000 +./template -r -i 250000 150000 +./template -r -i 350000 250000 +./template -r -i 500000 300000 +./template -r -i 600000 400000 +./template -r -i 700000 500000 +./template -r -i 800000 600000 +./template -r -i 900000 700000 +./template -r -i 1000000 800000 +./template -r -i 1500000 500000 + + diff --git a/Simulations/sparse_openmp/sparse_openmp_3GPU.o140098 b/Simulations/sparse_openmp/sparse_openmp_3GPU.o140098 new file mode 100644 index 0000000..2aea52b --- /dev/null +++ b/Simulations/sparse_openmp/sparse_openmp_3GPU.o140098 @@ -0,0 +1,602 @@ +REMAINING: 3 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^40000 + (-10 +i*0)*x^60000 + (1 +i*0)*x^100000 + +(-4000 +i*0)*x^39999 + (-600000 +i*0)*x^59999 + (100000 +i*0)*x^99999 + +zone limite de 'log-exp' 1.00356 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 0 (of 3) uses CUDA device 0 +CPU 
thread 1 (of 3) uses CUDA device 1 +gpu 0 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 0 dimgrid2 131 start 0 size 33365 +gpu 1 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 1 dimgrid2 131 start 33365 size 33365 +gpu 2 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 2 dimgrid2 131 start 66730 size 33365 +gpu 0 iter : 1 Arret : 0.00638376 s/iter 0.326852 +gpu 0 iter : 2 Arret : 0.00780969 s/iter 0.399828 +gpu 0 iter : 3 Arret : 0.00239395 s/iter 0.326756 +gpu 0 iter : 4 Arret : 0.00316529 s/iter 0.326768 +gpu 0 iter : 5 Arret : 0.0038084 s/iter 0.326767 +gpu 0 iter : 6 Arret : 0.00482452 s/iter 0.326696 +gpu 0 iter : 7 Arret : 0.00928999 s/iter 0.326751 +gpu 0 iter : 8 Arret : 0.0101647 s/iter 0.326710 +gpu 0 iter : 9 Arret : 0.0111077 s/iter 0.326857 +gpu 0 iter : 10 Arret : 0.00655022 s/iter 0.326801 +gpu 0 iter : 11 Arret : 0.00316276 s/iter 0.326810 +gpu 0 iter : 12 Arret : 0.000516233 s/iter 0.326609 +gpu 0 iter : 13 Arret : 0.00040416 s/iter 0.326572 +gpu 0 iter : 14 Arret : 0.000177079 s/iter 0.326480 +gpu 0 iter : 15 Arret : 8.53367E-05 s/iter 0.326486 +gpu 0 iter : 16 Arret : 4.34291E-05 s/iter 0.326528 +gpu 0 iter : 17 Arret : 2.94612E-06 s/iter 0.326471 +gpu 0 iter : 18 Arret : 4.24038E-08 s/iter 0.326469 +gpu 0 iter : 19 Arret : 6.31898E-10 s/iter 0.326431 +gpu 0 iter : 20 Arret : 9.41384E-12 s/iter 0.326448 +gpu 0 iter : 21 Arret : 1.40182E-13 s/iter 0.326484 +temps : 8.00955 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 8.10777E-09 +Stabilite : 1.57015E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54036 +i* 0.841503| 1.00006|-5.00602E-11 +i* 9.0853E-12| +| 2| -0.113164 +i* 0.993538| 0.999962|-4.34919E-12 +i* 9.60242E-13| +| 3| -0.226885 +i* -0.973981| 1.00006|-5.81993E-10 +i*-4.18547E-10| +| 4| -0.715763 +i* 0.698289| 0.999962| 9.11271E-13 +i* 
2.47219E-12| +| 5| 0.439922 +i* -0.897993| 0.999962|-3.49498E-13 +i* 1.66432E-12| +| 6| -0.996122 +i* 0.0886386| 1.00006| 4.72785E-10 +i* 4.13616E-11| +| 7| 0.908546 +i* -0.417692| 0.999962| 4.78506E-13 +i* 1.54377E-13| +| 8| -0.827813 +i* -0.560935| 0.999962| 9.76996E-13 +i*-2.04309E-12| +| 9| 0.968129 +i* 0.250682| 1.00006|-2.31715E-10 +i* 1.34848E-10| +| 10| -0.286842 +i* -0.958038| 1.00006|-5.93554E-10 +i*-2.45345E-10| +| 11| 0.591653 +i* 0.806145| 0.999962|-9.87654E-13 +i*-3.03635E-12| +| 12| -0.0511836 +i* 0.998651| 0.999962|-2.22622E-12 +i*-3.69013E-14| +| 13| -0.67097 +i* 0.741432| 0.999962|-8.03801E-14 +i*-1.68204E-12| +| 14| 0.383249 +i* -0.923603| 0.999962|-1.29119E-12 +i*-1.37426E-12| +| 15| -0.988685 +i* 0.15039| 1.00006|-1.61051E-10 +i* 7.18515E-11| +| 16| 0.880824 +i* -0.473363| 0.999962|-4.03455E-13 +i* 2.85139E-12| +| 17| -0.861082 +i* -0.508391| 0.999962| 1.02962E-12 +i*-4.51911E-12| +| 18| 0.98184 +i* 0.190015| 1.00006| -8.9615E-10 +i* 1.84549E-11| +| 19| -0.345842 +i* -0.938354| 1.00006| 1.38421E-10 +i*-2.31696E-10| +| 20| 0.640621 +i* 0.767807| 0.999962|-6.98774E-13 +i* 1.13798E-12| ++---+----------------------------+------------+----------------------------+ +40000 racines de module = 1.00006 +60000 racines de module = 0.999962 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^50000 + (-10 +i*0)*x^150000 + (1 +i*0)*x^200000 + +(-5000 +i*0)*x^49999 + (-1.5E+06 +i*0)*x^149999 + (200000 +i*0)*x^199999 + +zone limite de 'log-exp' 1.00178 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 0 (of 3) uses CUDA device 0 +gpu 1 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 1 dimgrid2 261 start 66730 size 66730 +gpu 0 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 0 dimgrid2 261 start 0 size 66730 +gpu 2 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 2 dimgrid2 261 start 133460 size 66730 +gpu 0 iter : 1 Arret : 0.000229669 s/iter 1.096870 +gpu 0 iter : 2 Arret : 0.00021193 s/iter 1.097026 +gpu 0 iter : 3 Arret : 0.000280313 s/iter 
1.096954 +gpu 0 iter : 4 Arret : 0.000636926 s/iter 1.096899 +gpu 0 iter : 5 Arret : 0.00105388 s/iter 1.096829 +gpu 0 iter : 6 Arret : 0.0149052 s/iter 1.096638 +gpu 0 iter : 7 Arret : 0.0123684 s/iter 1.096797 +gpu 0 iter : 8 Arret : 0.0421817 s/iter 1.098043 +gpu 0 iter : 9 Arret : 0.0899445 s/iter 1.098654 +gpu 0 iter : 10 Arret : 0.204522 s/iter 1.186313 +gpu 0 iter : 11 Arret : 2.97201 s/iter 1.218384 +gpu 0 iter : 12 Arret : 0.648253 s/iter 1.218710 +gpu 0 iter : 13 Arret : 1.88772 s/iter 1.241862 +gpu 0 iter : 14 Arret : 1.33785 s/iter 1.208066 +gpu 0 iter : 15 Arret : 1.70034 s/iter 1.098449 +gpu 0 iter : 16 Arret : 1.16245 s/iter 1.197714 +gpu 0 iter : 17 Arret : 2.06315 s/iter 1.228122 +gpu 0 iter : 18 Arret : 1.22433 s/iter 1.198366 +gpu 0 iter : 19 Arret : 0.795342 s/iter 1.228114 +gpu 0 iter : 20 Arret : 0.622909 s/iter 1.095861 +gpu 0 iter : 21 Arret : 1.12395 s/iter 1.224956 +gpu 0 iter : 22 Arret : 1.99041 s/iter 1.227156 +gpu 0 iter : 23 Arret : 1.15739 s/iter 1.209773 +gpu 0 iter : 24 Arret : 0.455675 s/iter 1.226888 +gpu 0 iter : 25 Arret : 0.680625 s/iter 1.097847 +gpu 0 iter : 26 Arret : 0.577238 s/iter 1.095693 +gpu 0 iter : 27 Arret : 0.0687706 s/iter 1.095867 +gpu 0 iter : 28 Arret : 0.0224681 s/iter 1.096036 +gpu 0 iter : 29 Arret : 0.002804 s/iter 1.095993 +gpu 0 iter : 30 Arret : 6.05493E-06 s/iter 1.095754 +gpu 0 iter : 31 Arret : 3.11042E-10 s/iter 1.095829 +gpu 0 iter : 32 Arret : 3.1096E-14 s/iter 1.096050 +temps : 37.8394 seconde(s) +Nb iterations : 32 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.30431E-05 +Stabilite : 3.1096E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540303 +i* 0.841453| 0.999985| 1.08703E-11 +i*-2.49217E-12| +| 2| -0.837195 +i* 0.546877| 0.999985| -5.4492E-12 +i* 1.09163E-12| +| 3| -0.553418 +i* -0.832885| 0.999985| -1.9722E-12 
+i*-7.40397E-12| +| 4| 0.828599 +i* -0.559925| 1.00005|-7.54521E-09 +i* 1.47059E-08| +| 5| -0.8197 +i* 0.572767| 0.999985|-4.21663E-13 +i* -2.8616E-12| +| 6| -0.57917 +i* -0.815188| 0.999985|-5.13034E-12 +i*-1.52645E-12| +| 7| 0.810626 +i* -0.585537| 0.999985| 8.64808E-12 +i* 7.46794E-12| +| 8| 0.59177 +i* 0.806164| 1.00005|-6.74238E-09 +i* 4.40492E-09| +| 9| -0.801529 +i* 0.598033| 1.00005| 7.19885E-09 +i* 8.43319E-09| +| 10| -0.604356 +i* -0.796695| 0.999985|-1.64091E-13 +i* 1.59084E-12| +| 11| 0.791937 +i* -0.610578| 0.999985| 6.0707E-13 +i* 1.52922E-12| +| 12| 0.616763 +i* 0.78713| 0.999985|-4.48042E-12 +i* -2.6295E-12| +| 13| -0.782301 +i* 0.622877| 0.999985|-2.15827E-12 +i*-6.27114E-12| +| 14| -0.628894 +i* -0.777551| 1.00005| 2.29838E-09 +i* 1.59417E-08| +| 15| 0.772474 +i* -0.635023| 0.999985| 1.54783E-11 +i*-1.81338E-12| +| 16| 0.641054 +i* 0.767476| 0.999985|-3.47633E-12 +i* 1.20617E-11| +| 17| -0.762458 +i* 0.647014| 0.999985|-7.74447E-12 +i* 7.566E-12| +| 18| -0.652967 +i* -0.757366| 0.999985|-6.31406E-12 +i* 8.49495E-12| +| 19| 0.752302 +i* -0.658888| 1.00005| 3.99107E-09 +i* 1.02117E-08| +| 20| 0.66472 +i* 0.747072| 0.999985|-1.93379E-12 +i*-1.29726E-11| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 0.999985 +50000 racines de module = 1.00005 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^150000 + (-10 +i*0)*x^250000 + (1 +i*0)*x^400000 + +(-15000 +i*0)*x^149999 + (-2.5E+06 +i*0)*x^249999 + (400000 +i*0)*x^399999 + +zone limite de 'log-exp' 1.00089 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 0 (of 3) uses CUDA device 0 +gpu 1 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 1 dimgrid2 521 start 133376 size 133376 +gpu 0 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 0 dimgrid2 521 start 0 size 133376 +gpu 2 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 2 dimgrid2 521 start 266752 size 133376 +gpu 0 iter : 1 Arret : 0.00053336 s/iter 4.015433 +gpu 0 iter : 2 
Arret : 0.00165478 s/iter 4.015274 +gpu 0 iter : 3 Arret : 0.00149659 s/iter 4.015225 +gpu 0 iter : 4 Arret : 0.00476307 s/iter 4.014142 +gpu 0 iter : 5 Arret : 0.0270497 s/iter 4.020618 +gpu 0 iter : 6 Arret : 0.0269319 s/iter 4.340327 +gpu 0 iter : 7 Arret : 0.0180523 s/iter 4.298465 +gpu 0 iter : 8 Arret : 0.0146534 s/iter 4.308899 +gpu 0 iter : 9 Arret : 0.00619736 s/iter 4.011731 +gpu 0 iter : 10 Arret : 0.00299981 s/iter 4.010855 +gpu 0 iter : 11 Arret : 0.00111873 s/iter 4.009952 +gpu 0 iter : 12 Arret : 0.000851809 s/iter 4.011669 +gpu 0 iter : 13 Arret : 0.000757841 s/iter 4.011889 +gpu 0 iter : 14 Arret : 0.000509989 s/iter 4.011347 +gpu 0 iter : 15 Arret : 0.000667055 s/iter 4.011093 +gpu 0 iter : 16 Arret : 2.71105E-05 s/iter 4.000315 +gpu 0 iter : 17 Arret : 8.00906E-06 s/iter 3.991624 +gpu 0 iter : 18 Arret : 1.99192E-07 s/iter 3.991746 +gpu 0 iter : 19 Arret : 3.11567E-09 s/iter 3.991734 +gpu 0 iter : 20 Arret : 4.89263E-11 s/iter 3.991803 +gpu 0 iter : 21 Arret : 7.68172E-13 s/iter 3.991754 +temps : 86.1208 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.49185E-08 +Stabilite : 7.68172E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540334 +i* 0.84144| 0.999991| 6.97609E-12 +i* 5.61207E-12| +| 2| -0.998329 +i* 0.057622| 0.999991| 4.43912E-12 +i* 1.27665E-12| +| 3| 0.43989 +i* -0.898041| 0.999991|-2.08855E-12 +i*-1.75276E-12| +| 4| -0.996033 +i* 0.0888768| 0.999991|-3.15592E-12 +i* 1.17456E-12| +| 5| 0.411533 +i* -0.911385| 0.999991|-2.45048E-12 +i* 4.6238E-12| +| 6| 0.59196 +i* 0.805956| 0.999991| 5.24358E-13 +i*-8.53073E-12| +| 7| -0.992759 +i* 0.120044| 0.999991| 2.58804E-12 +i* 2.47274E-12| +| 8| 0.382796 +i* -0.923823| 0.999991| 1.11042E-11 +i*-9.27687E-12| +| 9| 0.616925 +i* 0.78701| 0.999991| 4.27514E-12 +i*-1.13966E-11| +| 10| -0.98851 +i* 0.151094| 
0.999991|-1.29017E-11 +i*-4.43427E-12| +| 11| 0.35366 +i* -0.935364| 0.999991|-1.92664E-11 +i* 1.19958E-11| +| 12| 0.641283 +i* 0.767292| 0.999991| 1.73468E-11 +i*-3.74729E-12| +| 13| -0.98329 +i* 0.181995| 0.999991|-6.62759E-12 +i*-5.46796E-12| +| 14| 0.324176 +i* -0.945987| 0.999991| 1.53594E-11 +i*-1.57324E-12| +| 15| 0.665012 +i* 0.746821| 0.999991| 5.27178E-12 +i*-4.27913E-12| +| 16| -0.977104 +i* 0.212717| 0.999991|-1.01148E-11 +i* 2.41479E-12| +| 17| 0.294374 +i* -0.955681| 0.999991| -1.2063E-11 +i* 1.32238E-11| +| 18| 0.688087 +i* 0.725616| 0.999991| 6.67011E-12 +i* 1.57173E-11| +| 19| -0.969965 +i* 0.243206| 0.999991| 6.88072E-12 +i* 3.20268E-13| +| 20| 0.264283 +i* -0.964436| 0.999991| 2.5573E-11 +i*-6.45539E-12| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 0.999991 +150000 racines de module = 1.00002 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^250000 + (-10 +i*0)*x^350000 + (1 +i*0)*x^600000 + +(-25000 +i*0)*x^249999 + (-3.5E+06 +i*0)*x^349999 + (600000 +i*0)*x^599999 + +zone limite de 'log-exp' 1.00059 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 782 start 200021 size 200021 +gpu 2 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 2 dimgrid2 782 start 400042 size 200021 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 782 start 0 size 200021 +gpu 0 iter : 1 Arret : 0.00574299 s/iter 9.047838 +gpu 0 iter : 2 Arret : 0.00960381 s/iter 9.043639 +gpu 0 iter : 3 Arret : 0.130996 s/iter 9.471525 +gpu 0 iter : 4 Arret : 0.142079 s/iter 9.198199 +gpu 0 iter : 5 Arret : 0.0868349 s/iter 9.506055 +gpu 0 iter : 6 Arret : 0.0882721 s/iter 9.145065 +gpu 0 iter : 7 Arret : 0.114689 s/iter 9.172845 +gpu 0 iter : 8 Arret : 0.108656 s/iter 9.193791 +gpu 0 iter : 9 Arret : 0.0356399 s/iter 9.170752 +gpu 0 iter : 10 Arret : 0.0134072 s/iter 9.594206 +gpu 0 iter : 11 Arret 
: 0.00832588 s/iter 9.158565 +gpu 0 iter : 12 Arret : 0.00682235 s/iter 9.135471 +gpu 0 iter : 13 Arret : 0.00415856 s/iter 9.143664 +gpu 0 iter : 14 Arret : 0.00311193 s/iter 9.065571 +gpu 0 iter : 15 Arret : 0.000707097 s/iter 9.044745 +gpu 0 iter : 16 Arret : 0.000778409 s/iter 9.042087 +gpu 0 iter : 17 Arret : 0.000667704 s/iter 9.043931 +gpu 0 iter : 18 Arret : 9.33212E-06 s/iter 9.043636 +gpu 0 iter : 19 Arret : 7.71387E-08 s/iter 9.041264 +gpu 0 iter : 20 Arret : 1.09443E-09 s/iter 9.041736 +gpu 0 iter : 21 Arret : 1.56107E-11 s/iter 9.047621 +gpu 0 iter : 22 Arret : 2.22664E-13 s/iter 9.046678 +temps : 202.419 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 7.53549E-08 +Stabilite : 2.22043E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540302 +i* 0.841463| 0.999993| 8.34199E-12 +i* -1.9051E-11| +| 2| -0.553438 +i* -0.832883| 0.999993|-2.10654E-12 +i*-2.55273E-11| +| 3| -0.579282 +i* -0.815119| 0.999993| 1.33613E-11 +i*-1.98701E-11| +| 4| 0.592014 +i* 0.805919| 0.999993|-3.98037E-12 +i* 9.55808E-12| +| 5| -0.604557 +i* -0.796554| 0.999993|-2.82974E-12 +i* 9.99473E-12| +| 6| 0.61698 +i* 0.78697| 0.999993| 9.01823E-12 +i*-5.69156E-12| +| 7| -0.629237 +i* -0.777205| 0.999993|-2.92122E-12 +i*-4.85867E-12| +| 8| 0.641354 +i* 0.767237| 0.999993|-1.64209E-11 +i* 1.12904E-12| +| 9| -0.653299 +i* -0.757092| 0.999993|-8.22453E-13 +i* 2.82818E-12| +| 10| 0.665096 +i* 0.746749| 0.999993| -1.2145E-11 +i* 1.89129E-11| +| 11| -0.676717 +i* -0.736234| 0.999993|-1.26079E-11 +i*-1.25073E-11| +| 12| 0.688185 +i* 0.725526| 0.999993|-4.43978E-12 +i*-2.31382E-11| +| 13| -0.699466 +i* -0.714679| 1.00001| 3.92343E-10 +i*-3.02623E-09| +| 14| 0.710597 +i* 0.70359| 0.999993| 1.28564E-11 +i* 1.56626E-11| +| 15| -0.721517 +i* -0.69241| 1.00001| 2.88447E-09 +i* 3.69506E-09| +| 16| 0.73231 +i* 
0.680962| 0.999993|-5.73186E-12 +i* 1.14335E-11| +| 17| -0.742904 +i* -0.669389| 0.999993|-7.78222E-12 +i* 1.50098E-11| +| 18| 0.7533 +i* 0.657691| 1.00001| 1.64587E-09 +i*-3.03669E-09| +| 19| -0.76354 +i* -0.64575| 0.999993| 2.24043E-11 +i*-1.30496E-12| +| 20| 0.773539 +i* 0.633763| 1.00001| 5.39271E-09 +i*-2.77636E-09| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 0.999993 +250000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^300000 + (-10 +i*0)*x^500000 + (1 +i*0)*x^800000 + +(-30000 +i*0)*x^299999 + (-5E+06 +i*0)*x^499999 + (800000 +i*0)*x^799999 + +zone limite de 'log-exp' 1.00044 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 1042 start 266666 size 266666 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 1042 start 0 size 266666 +gpu 2 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 2 dimgrid2 1042 start 533332 size 266666 +gpu 0 iter : 1 Arret : 0.000985945 s/iter 15.851621 +gpu 0 iter : 2 Arret : 0.00155936 s/iter 15.788402 +gpu 0 iter : 3 Arret : 0.0129473 s/iter 15.851181 +gpu 0 iter : 4 Arret : 0.0558872 s/iter 16.300649 +gpu 0 iter : 5 Arret : 0.19954 s/iter 15.808251 +gpu 0 iter : 6 Arret : 0.377937 s/iter 15.879884 +gpu 0 iter : 7 Arret : 0.514814 s/iter 16.303367 +gpu 0 iter : 8 Arret : 0.338633 s/iter 15.914224 +gpu 0 iter : 9 Arret : 0.206607 s/iter 16.151496 +gpu 0 iter : 10 Arret : 0.138277 s/iter 16.399153 +gpu 0 iter : 11 Arret : 0.113953 s/iter 15.857365 +gpu 0 iter : 12 Arret : 0.0627751 s/iter 15.843953 +gpu 0 iter : 13 Arret : 0.0358213 s/iter 15.848470 +gpu 0 iter : 14 Arret : 0.0221421 s/iter 15.846627 +gpu 0 iter : 15 Arret : 0.00243723 s/iter 15.842171 +gpu 0 iter : 16 Arret : 0.000254217 s/iter 15.843580 +gpu 0 iter : 17 Arret : 0.000130358 s/iter 15.845033 +gpu 0 iter : 18 Arret : 0.00018532 s/iter 15.849105 
+gpu 0 iter : 19 Arret : 1.35363E-05 s/iter 15.847663 +gpu 0 iter : 20 Arret : 2.14908E-09 s/iter 15.847042 +gpu 0 iter : 21 Arret : 4.62703E-12 s/iter 15.807436 +gpu 0 iter : 22 Arret : 9.97217E-15 s/iter 15.847751 +temps : 351.42 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 12.9528 +Stabilite : 7.80251E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841464| 0.999995|-5.33817E-12 +i*-1.81878E-11| +| 2| 0.592014 +i* 0.805922| 0.999995| 2.33948E-11 +i*-2.13005E-11| +| 3| 0.617007 +i* 0.786952| 0.999995| 4.23442E-11 +i* -6.2147E-12| +| 4| 0.641392 +i* 0.767207| 0.999995|-4.99742E-11 +i* 1.43873E-11| +| 5| 0.665146 +i* 0.746707| 0.999995| 2.02977E-11 +i* 7.48579E-12| +| 6| 0.688245 +i* 0.725472| 0.999995|-1.73153E-11 +i* -1.2656E-11| +| 7| 0.710667 +i* 0.703522| 0.999995| 3.69782E-12 +i* 2.3081E-12| +| 8| 0.732388 +i* 0.68088| 0.999995| 9.45355E-12 +i* 2.09024E-11| +| 9| 0.753381 +i* 0.657577| 0.999995| 1.7531E-11 +i*-4.02243E-11| +| 10| 0.77364 +i* 0.633618| 0.999995|-1.72307E-11 +i* 1.22723E-11| +| 11| 0.793138 +i* 0.609034| 0.999995| 3.89222E-12 +i* 2.21356E-11| +| 12| 0.811855 +i* 0.583851| 0.999995|-1.28337E-11 +i*-5.47207E-12| +| 13| 0.829772 +i* 0.558094| 0.999995|-1.63114E-11 +i*-1.64246E-12| +| 14| 0.846873 +i* 0.531786| 0.999995|-3.30451E-11 +i*-8.10676E-12| +| 15| 0.86314 +i* 0.504956| 0.999995|-4.00413E-12 +i* 3.04823E-11| +| 16| 0.878557 +i* 0.477628| 0.999995|-2.16493E-12 +i* 1.10533E-11| +| 17| 0.893104 +i* 0.449841| 0.999995|-1.48552E-11 +i* 1.06063E-11| +| 18| 0.906777 +i* 0.4216| 0.999995|-1.38745E-11 +i* 5.33384E-12| +| 19| 0.919557 +i* 0.392944| 0.999995| 4.13796E-11 +i*-2.48189E-11| +| 20| 0.931433 +i* 0.363901| 0.999995| 4.93219E-11 +i*-2.82651E-11| ++---+----------------------------+------------+----------------------------+ +499998 
racines de module = 0.999995 +300000 racines de module = 1.00001 + 2 racines de module = 1 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^400000 + (-10 +i*0)*x^600000 + (1 +i*0)*x^1000000 + +(-40000 +i*0)*x^399999 + (-6E+06 +i*0)*x^599999 + (1E+06 +i*0)*x^999999 + +zone limite de 'log-exp' 1.00035 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 2 (of 3) uses CUDA device 2 +gpu 2 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 2 dimgrid2 1303 start 666794 size 333397 +gpu 1 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 1 dimgrid2 1303 start 333397 size 333397 +gpu 0 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 0 dimgrid2 1303 start 0 size 333397 +gpu 0 iter : 1 Arret : 0.0011104 s/iter 24.284964 +gpu 0 iter : 2 Arret : 0.00309979 s/iter 24.283383 +gpu 0 iter : 3 Arret : 0.247623 s/iter 24.789931 +gpu 0 iter : 4 Arret : 0.461817 s/iter 24.581195 +gpu 0 iter : 5 Arret : 0.334336 s/iter 25.044367 +gpu 0 iter : 6 Arret : 0.274486 s/iter 25.665034 +gpu 0 iter : 7 Arret : 0.159668 s/iter 26.197375 +gpu 0 iter : 8 Arret : 0.0519691 s/iter 25.694996 +gpu 0 iter : 9 Arret : 0.0269291 s/iter 25.673851 +gpu 0 iter : 10 Arret : 0.0602316 s/iter 25.604792 +gpu 0 iter : 11 Arret : 0.0619642 s/iter 24.773954 +gpu 0 iter : 12 Arret : 0.0234 s/iter 24.787706 +gpu 0 iter : 13 Arret : 0.0244077 s/iter 24.353884 +gpu 0 iter : 14 Arret : 0.00963063 s/iter 24.344876 +gpu 0 iter : 15 Arret : 0.00340716 s/iter 24.345219 +gpu 0 iter : 16 Arret : 0.000234823 s/iter 24.297435 +gpu 0 iter : 17 Arret : 0.000256334 s/iter 24.352140 +gpu 0 iter : 18 Arret : 0.000224052 s/iter 24.290971 +gpu 0 iter : 19 Arret : 0.000781478 s/iter 24.296445 +gpu 0 iter : 20 Arret : 0.000194356 s/iter 24.291281 +gpu 0 iter : 21 Arret : 2.40806E-07 s/iter 24.291827 +gpu 0 iter : 22 Arret : 3.31687E-09 s/iter 24.291690 +gpu 0 iter : 23 Arret : 4.67724E-11 s/iter 24.290907 +gpu 0 iter : 24 Arret : 6.59569E-13 s/iter 24.293931 +temps : 598.968 seconde(s) +Nb iterations : 24 +Nb de 
depassements de capacite exponentielle : 0 +Precision : 2.52682E-07 +Stabilite : 6.59569E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841468| 0.999996| 5.07216E-12 +i* 6.41236E-12| +| 2| 0.529701 +i* 0.84818| 0.999996|-4.61853E-13 +i*-4.17888E-12| +| 3| 0.524361 +i* 0.851491| 0.999996|-2.47296E-11 +i* 1.78327E-11| +| 4| 0.519015 +i* 0.854772| 1.00001| 2.38413E-09 +i*-5.89917E-09| +| 5| 0.513629 +i* 0.858008| 0.999996| 2.32483E-11 +i* 6.70747E-12| +| 6| 0.508237 +i* 0.861213| 0.999996|-1.34339E-11 +i* 9.87854E-12| +| 7| 0.502825 +i* 0.864384| 0.999996|-3.18459E-11 +i* 7.64744E-12| +| 8| 0.497384 +i* 0.867526| 0.999996| 2.97429E-11 +i*-6.06626E-13| +| 9| 0.491942 +i* 0.870624| 0.999996| -1.9825E-11 +i*-1.52329E-11| +| 10| 0.486452 +i* 0.873703| 0.999996| 3.0312E-11 +i* 1.02214E-11| +| 11| 0.480962 +i* 0.876737| 0.999996|-3.09397E-11 +i*-1.68578E-11| +| 12| 0.475453 +i* 0.879736| 0.999996| 3.09861E-11 +i* 4.093E-12| +| 13| 0.469917 +i* 0.882706| 0.999996|-1.29106E-11 +i*-2.31489E-11| +| 14| 0.46438 +i* 0.885632| 0.999996| 1.33844E-11 +i*-1.06731E-12| +| 15| 0.458797 +i* 0.888537| 0.999996| 2.78862E-11 +i* 1.10441E-11| +| 16| 0.453214 +i* 0.891397| 0.999996| 2.45506E-11 +i* 3.1726E-11| +| 17| 0.447614 +i* 0.894223| 0.999996|-1.08491E-12 +i*-2.12277E-11| +| 18| 0.441986 +i* 0.897017| 0.999996| 2.72476E-11 +i* 3.22485E-11| +| 19| 0.436355 +i* 0.899781| 1.00001| 4.84598E-09 +i*-1.12092E-09| +| 20| 0.430689 +i* 0.902496| 0.999996|-1.25435E-11 +i* 3.86925E-13| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 0.999996 +400000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^700000 + (1 +i*0)*x^1200000 + +(-50000 +i*0)*x^499999 + (-7E+06 +i*0)*x^699999 + (1.2E+06 +i*0)*x^1199999 + +zone limite de 'log-exp' 1.0003 +CPU thread 2 
(of 3) uses CUDA device 2 +CPU thread 0 (of 3) uses CUDA device 0 +CPU thread 1 (of 3) uses CUDA device 1 +gpu 0 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 0 dimgrid2 1563 start 0 size 400042 +gpu 1 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 1 dimgrid2 1563 start 400042 size 400042 +gpu 2 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 2 dimgrid2 1563 start 800084 size 400042 +gpu 0 iter : 1 Arret : 0.0129118 s/iter 35.194295 +gpu 0 iter : 2 Arret : 1.14226 s/iter 37.357952 +gpu 0 iter : 3 Arret : 1.41831 s/iter 37.472613 +gpu 0 iter : 4 Arret : 1.98712 s/iter 37.475866 +gpu 0 iter : 5 Arret : 0.777118 s/iter 37.323598 +gpu 0 iter : 6 Arret : 0.414132 s/iter 38.133114 +gpu 0 iter : 7 Arret : 0.596053 s/iter 38.249814 +gpu 0 iter : 8 Arret : 0.923957 s/iter 38.214227 +gpu 0 iter : 9 Arret : 1.37764 s/iter 38.802357 +gpu 0 iter : 10 Arret : 3.75882 s/iter 38.537349 +gpu 0 iter : 11 Arret : 3.50583 s/iter 39.060169 +gpu 0 iter : 12 Arret : 3.46154 s/iter 38.314523 +gpu 0 iter : 13 Arret : 1.44838 s/iter 38.304672 +gpu 0 iter : 14 Arret : 2.97866 s/iter 38.101085 +gpu 0 iter : 15 Arret : 1.47363 s/iter 37.961455 +gpu 0 iter : 16 Arret : 3.02916 s/iter 37.963549 +gpu 0 iter : 17 Arret : 3.44273 s/iter 37.562647 +gpu 0 iter : 18 Arret : 9.75818 s/iter 37.462847 +gpu 0 iter : 19 Arret : 3.55089 s/iter 37.388809 +gpu 0 iter : 20 Arret : 1.23127 s/iter 37.253955 +gpu 0 iter : 21 Arret : 2.15757 s/iter 37.181593 +gpu 0 iter : 22 Arret : 1.41689 s/iter 37.239248 +gpu 0 iter : 23 Arret : 2.71181 s/iter 37.183043 +gpu 0 iter : 24 Arret : 1.74358 s/iter 37.093614 +gpu 0 iter : 25 Arret : 1.20275 s/iter 37.190846 +gpu 0 iter : 26 Arret : 4.12739 s/iter 37.151827 +gpu 0 iter : 27 Arret : 0.963355 s/iter 37.085124 +gpu 0 iter : 28 Arret : 0.780804 s/iter 37.089879 +gpu 0 iter : 29 Arret : 1.04543 s/iter 37.116299 +gpu 0 iter : 30 Arret : 0.861461 s/iter 36.766134 +gpu 0 iter : 31 Arret : 0.882203 s/iter 36.884355 +gpu 0 iter : 32 Arret : 1.2718 s/iter 36.769843 +gpu 0 
iter : 33 Arret : 2.35224 s/iter 36.354615 +gpu 0 iter : 34 Arret : 0.727156 s/iter 36.255055 +gpu 0 iter : 35 Arret : 1.44624 s/iter 36.206611 +gpu 0 iter : 36 Arret : 0.991076 s/iter 36.090368 +gpu 0 iter : 37 Arret : 1.04914 s/iter 35.800864 +gpu 0 iter : 38 Arret : 1.8416 s/iter 35.547956 +gpu 0 iter : 39 Arret : 73.3357 s/iter 35.569370 +gpu 0 iter : 40 Arret : 1.27526 s/iter 35.589183 +gpu 0 iter : 41 Arret : 0.664432 s/iter 35.572552 +gpu 0 iter : 42 Arret : 2.02267 s/iter 35.596663 +gpu 0 iter : 43 Arret : 3.3247 s/iter 35.518933 +gpu 0 iter : 44 Arret : 0.753208 s/iter 35.558919 +gpu 0 iter : 45 Arret : 0.406779 s/iter 35.517839 +gpu 0 iter : 46 Arret : 0.190344 s/iter 35.499532 +gpu 0 iter : 47 Arret : 0.053701 s/iter 35.454469 +gpu 0 iter : 48 Arret : 0.0180092 s/iter 35.423771 +gpu 0 iter : 49 Arret : 0.0103853 s/iter 35.469037 +gpu 0 iter : 50 Arret : 0.00392672 s/iter 35.295894 +gpu 0 iter : 51 Arret : 0.00130348 s/iter 35.285682 +gpu 0 iter : 52 Arret : 5.94285E-05 s/iter 35.279833 +gpu 0 iter : 53 Arret : 3.66884E-07 s/iter 35.262013 +gpu 0 iter : 54 Arret : 1.24856E-09 s/iter 35.260448 +gpu 0 iter : 55 Arret : 1.23865E-11 s/iter 35.262868 +gpu 0 iter : 56 Arret : 1.69469E-13 s/iter 35.261163 +temps : 2056.31 seconde(s) +Nb iterations : 56 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.48302E-06 +Stabilite : 1.69469E-13 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54031 +i* 0.841472| 1| 1.4588E-09 +i* 4.51768E-09| +| 2| 0.513633 +i* 0.858015| 1| 1.54651E-09 +i*-2.27023E-10| +| 3| 0.486464 +i* 0.873697| 0.999997| 5.22282E-12 +i* 2.0872E-11| +| 4| 0.458789 +i* 0.888542| 0.999997| 2.48135E-13 +i*-2.88822E-11| +| 5| 0.430701 +i* 0.902491| 0.999997| 1.55062E-11 +i*-3.45463E-12| +| 6| 0.402126 +i* 0.915589| 1| 2.50282E-09 +i*-6.10471E-09| +| 7| 0.3732 +i* 0.927747| 0.999997|-1.54374E-11 
+i*-2.76083E-11| +| 8| 0.3439 +i* 0.939003| 0.999997|-1.12714E-11 +i* 1.5453E-11| +| 9| 0.314261 +i* 0.949333| 0.999997| 1.93628E-11 +i* 2.50909E-11| +| 10| 0.284313 +i* 0.958728| 0.999997| 2.69426E-11 +i* 2.77974E-11| +| 11| 0.254084 +i* 0.967179| 0.999997| 1.5277E-11 +i* 4.73027E-12| +| 12| 0.223605 +i* 0.974676| 0.999997| -8.1017E-11 +i*-3.77299E-11| +| 13| 0.192909 +i* 0.981221| 1|-1.95729E-09 +i* 4.84549E-09| +| 14| 0.162018 +i* 0.986792| 1| 1.18712E-08 +i* 5.95858E-09| +| 15| 0.128886 +i* 0.991664| 1|-2.36358E-09 +i* 3.79427E-11| +| 16| 0.099787 +i* 0.995013| 1|-7.20324E-09 +i* 2.86361E-09| +| 17| 0.0685404 +i* 0.997645| 0.999997| 1.01124E-11 +i* 3.1089E-12| +| 18| 0.0371504 +i* 0.999314| 1|-3.18728E-10 +i*-2.97119E-09| +| 19| 0.00578048 +i* 0.99998| 0.999997| 3.46787E-11 +i* 1.94857E-13| +| 20| -0.0256056 +i* 0.999669| 0.999997| 2.01068E-11 +i*-1.22213E-12| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +700000 racines de module = 0.999997 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^600000 + (-10 +i*0)*x^800000 + (1 +i*0)*x^1400000 + +(-60000 +i*0)*x^599999 + (-8E+06 +i*0)*x^799999 + (1.4E+06 +i*0)*x^1399999 + +zone limite de 'log-exp' 1.00025 +CPU thread 2 (of 3) uses CUDA device 2 +CPU thread 1 (of 3) uses CUDA device 1 +CPU thread 0 (of 3) uses CUDA device 0 +gpu 1 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 1 dimgrid2 1823 start 466688 size 466688 +gpu 2 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 2 dimgrid2 1823 start 933376 size 466688 +gpu 0 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 0 dimgrid2 1823 start 0 size 466688 +gpu 0 iter : 1 Arret : 0.047657 s/iter 48.025151 +gpu 0 iter : 2 Arret : 0.964913 s/iter 49.123050 +gpu 0 iter : 3 Arret : 2.4727 s/iter 49.732738 +gpu 0 iter : 4 Arret : 2.06376 s/iter 50.210543 +gpu 0 iter : 5 Arret : 0.958099 s/iter 51.132618 +gpu 0 iter : 6 Arret : 0.828164 s/iter 51.281245 +gpu 0 iter : 7 Arret : 2.24981 s/iter 51.515152 +gpu 0 iter : 8 Arret : 1.27056 
s/iter 52.721722 +gpu 0 iter : 9 Arret : 1.7356 s/iter 52.706102 +gpu 0 iter : 10 Arret : 0.542543 s/iter 52.785746 +gpu 0 iter : 11 Arret : 0.703757 s/iter 52.816724 +gpu 0 iter : 12 Arret : 0.310008 s/iter 52.461451 +gpu 0 iter : 13 Arret : 0.443499 s/iter 51.910352 +gpu 0 iter : 14 Arret : 0.600068 s/iter 51.409402 +gpu 0 iter : 15 Arret : 0.482174 s/iter 51.392959 +gpu 0 iter : 16 Arret : 0.771182 s/iter 50.626111 +gpu 0 iter : 17 Arret : 0.532518 s/iter 50.225728 +gpu 0 iter : 18 Arret : 0.257696 s/iter 49.125636 +gpu 0 iter : 19 Arret : 0.177381 s/iter 48.905491 +gpu 0 iter : 20 Arret : 0.130753 s/iter 48.447574 +gpu 0 iter : 21 Arret : 0.0607806 s/iter 48.417696 +gpu 0 iter : 22 Arret : 3.28538 s/iter 48.161859 +gpu 0 iter : 23 Arret : 1.32615 s/iter 48.015609 +gpu 0 iter : 24 Arret : 0.026712 s/iter 48.032029 +gpu 0 iter : 25 Arret : 0.0189921 s/iter 48.023109 +gpu 0 iter : 26 Arret : 0.0252448 s/iter 48.022355 +gpu 0 iter : 27 Arret : 0.0183014 s/iter 48.029077 +gpu 0 iter : 28 Arret : 0.0259939 s/iter 48.031196 +gpu 0 iter : 29 Arret : 0.0148008 s/iter 48.034595 +gpu 0 iter : 30 Arret : 0.00511391 s/iter 48.034650 +gpu 0 iter : 31 Arret : 0.000444388 s/iter 48.016595 +gpu 0 iter : 32 Arret : 1.35417E-05 s/iter 48.015821 +gpu 0 iter : 33 Arret : 5.22681E-07 s/iter 48.020076 +gpu 0 iter : 34 Arret : 2.63971E-09 s/iter 48.039932 +gpu 0 iter : 35 Arret : 1.22535E-11 s/iter 48.040535 +gpu 0 iter : 36 Arret : 5.68579E-14 s/iter 48.039757 +temps : 1786.83 seconde(s) +Nb iterations : 36 +Nb de depassements de capacite exponentielle : 0 +Precision : 3.48488E-08 +Stabilite : 5.68579E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841469| 0.999997|-8.47142E-11 +i* 1.92466E-11| +| 2| 0.513623 +i* 0.858013| 0.999997|-2.15776E-11 +i*-2.98557E-11| +| 3| -0.52703 +i* -0.849843| 0.999997|-6.50922E-11 +i* 
8.44216E-12| +| 4| 0.486439 +i* 0.873711| 0.999997| 5.60277E-11 +i* 4.36779E-11| +| 5| -0.500096 +i* -0.865967| 0.999997| 3.56147E-11 +i*-3.12713E-11| +| 6| 0.458776 +i* 0.888549| 0.999997|-1.89702E-11 +i* 4.08274E-12| +| 7| -0.472669 +i* -0.881237| 0.999997|-1.66496E-11 +i*-3.61498E-11| +| 8| 0.430661 +i* 0.902511| 0.999997|-1.60558E-11 +i*-1.29949E-11| +| 9| -0.444791 +i* -0.895631| 0.999997|-8.89955E-13 +i* 2.61938E-12| +| 10| 0.402136 +i* 0.915577| 0.999997| 6.5834E-12 +i* -1.3935E-11| +| 11| -0.416432 +i* -0.909164| 0.999997| 1.97816E-11 +i* 3.10848E-11| +| 12| 0.373171 +i* 0.927759| 0.999997|-2.17995E-11 +i*-2.96867E-12| +| 13| -0.387698 +i* -0.921783| 0.999997|-1.86324E-11 +i* -4.6545E-11| +| 14| 0.343875 +i* 0.939012| 0.999997|-1.30287E-11 +i*-2.87501E-11| +| 15| -0.358575 +i* -0.933498| 0.999997|-4.93405E-11 +i*-7.15173E-13| +| 16| 0.314233 +i* 0.949343| 0.999997| 1.02587E-11 +i*-4.25648E-11| +| 17| -0.329098 +i* -0.944293| 0.999997|-1.57903E-11 +i* 2.05052E-11| +| 18| 0.284281 +i* 0.958738| 0.999997| 2.51592E-11 +i* 2.09243E-11| +| 19| -0.299297 +i* -0.954157| 0.999997| 5.03608E-12 +i* 1.70503E-11| +| 20| 0.254048 +i* 0.967189| 0.999997|-2.81228E-11 +i*-1.66302E-11| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 0.999997 +600000 racines de module = 1 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140098: line 23: 11749 Segmentation fault (core dumped) ./template -r -i 900000 700000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140098: line 24: 11753 Segmentation fault (core dumped) ./template -r -i 1000000 800000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140098: line 25: 11755 Segmentation fault (core dumped) ./template -r -i 1500000 500000 diff --git a/Simulations/sparse_openmp/sparse_openmp_3GPU.sge b/Simulations/sparse_openmp/sparse_openmp_3GPU.sge new file mode 100644 index 0000000..f3bb47b --- /dev/null +++ b/Simulations/sparse_openmp/sparse_openmp_3GPU.sge @@ -0,0 +1,27 @@ 
+#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=3 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -pe openmp 3 +#$ -V +#$ -cwd +#$ -N sparse_openmp_3GPU + +module load gcc/4.9.0 +module load cuda/7.0 + + +./template -r -i 60000 40000 +./template -r -i 150000 50000 +./template -r -i 250000 150000 +./template -r -i 350000 250000 +./template -r -i 500000 300000 +./template -r -i 600000 400000 +./template -r -i 700000 500000 +./template -r -i 800000 600000 +./template -r -i 900000 700000 +./template -r -i 1000000 800000 +./template -r -i 1500000 500000 + + diff --git a/Simulations/sparse_openmp/sparse_openmp_4GPU.o140097 b/Simulations/sparse_openmp/sparse_openmp_4GPU.o140097 new file mode 100644 index 0000000..2edc5c1 --- /dev/null +++ b/Simulations/sparse_openmp/sparse_openmp_4GPU.o140097 @@ -0,0 +1,621 @@ +REMAINING: 4 +Taking GPU #0 +Taking GPU #1 +Taking GPU #2 +Taking GPU #3 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^40000 + (-10 +i*0)*x^60000 + (1 +i*0)*x^100000 + +(-4000 +i*0)*x^39999 + (-600000 +i*0)*x^59999 + (100000 +i*0)*x^99999 + +zone limite de 'log-exp' 1.00356 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 0 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 0 dimgrid2 98 start 0 size 25024 +gpu 2 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 2 dimgrid2 98 start 50048 size 25024 +gpu 3 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 3 dimgrid2 98 start 75072 size 25024 +gpu 1 dimgrid 391 dimblock 256 degrePoly 100000 +gpu 1 dimgrid2 98 start 25024 size 25024 +gpu 0 iter : 1 Arret : 0.00317265 s/iter 0.236357 +gpu 0 iter : 2 Arret : 0.00227157 s/iter 0.222729 +gpu 0 iter : 3 Arret : 0.00205316 s/iter 0.222769 +gpu 0 iter : 4 Arret : 0.00128297 s/iter 0.222748 +gpu 0 iter : 5 Arret : 0.00112626 s/iter 0.222747 +gpu 0 iter : 6 Arret : 0.0020822 s/iter 0.222736 +gpu 0 iter : 7 Arret : 0.0115304 s/iter 0.222730 +gpu 0 iter : 8 Arret : 0.0115653 s/iter 0.295379 +gpu 0 
iter : 9 Arret : 0.00182694 s/iter 0.222647 +gpu 0 iter : 10 Arret : 0.000971807 s/iter 0.222690 +gpu 0 iter : 11 Arret : 0.00050868 s/iter 0.222743 +gpu 0 iter : 12 Arret : 0.000554626 s/iter 0.222588 +gpu 0 iter : 13 Arret : 0.000773549 s/iter 0.222519 +gpu 0 iter : 14 Arret : 0.000652981 s/iter 0.222480 +gpu 0 iter : 15 Arret : 7.85268E-05 s/iter 0.222478 +gpu 0 iter : 16 Arret : 1.67519E-05 s/iter 0.222489 +gpu 0 iter : 17 Arret : 1.93862E-07 s/iter 0.222504 +gpu 0 iter : 18 Arret : 2.89153E-09 s/iter 0.222440 +gpu 0 iter : 19 Arret : 4.30769E-11 s/iter 0.222397 +gpu 0 iter : 20 Arret : 6.41743E-13 s/iter 0.222499 +temps : 5.86914 seconde(s) +Nb iterations : 20 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.09748E-08 +Stabilite : 1.57015E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540308 +i* 0.841422| 0.999962|-1.95866E-12 +i*-4.55465E-13| +| 2| -0.113164 +i* 0.993538| 0.999962|-4.34919E-12 +i* 9.60242E-13| +| 3| -0.226732 +i* -0.974016| 1.00006|-1.34468E-09 +i*-3.70749E-10| +| 4| -0.715763 +i* 0.698289| 0.999962| 9.11271E-13 +i* 2.47219E-12| +| 5| 0.439922 +i* -0.897993| 0.999962|-3.49498E-13 +i* 1.66432E-12| +| 6| -0.996122 +i* 0.0886386| 1.00006| 4.72785E-10 +i* 4.13616E-11| +| 7| 0.908546 +i* -0.417692| 0.999962| 4.78506E-13 +i* 1.54377E-13| +| 8| -0.827813 +i* -0.560935| 0.999962| 9.76996E-13 +i*-2.04309E-12| +| 9| 0.968129 +i* 0.250682| 1.00006|-2.31715E-10 +i* 1.34848E-10| +| 10| -0.286842 +i* -0.958038| 1.00006|-5.93554E-10 +i*-2.45345E-10| +| 11| 0.591653 +i* 0.806145| 0.999962|-9.87654E-13 +i*-3.03635E-12| +| 12| -0.0511836 +i* 0.998651| 0.999962|-2.22622E-12 +i*-3.69013E-14| +| 13| -0.67097 +i* 0.741432| 0.999962|-8.03801E-14 +i*-1.68204E-12| +| 14| 0.383249 +i* -0.923603| 0.999962|-1.29119E-12 +i*-1.37426E-12| +| 15| -0.988685 +i* 0.15039| 1.00006|-1.61051E-10 +i* 7.18515E-11| +| 
16| 0.880824 +i* -0.473363| 0.999962|-4.03455E-13 +i* 2.85139E-12| +| 17| -0.861082 +i* -0.508391| 0.999962| 9.8066E-13 +i* 3.40478E-12| +| 18| 0.98184 +i* 0.190015| 1.00006| 8.88373E-10 +i*-2.66385E-10| +| 19| -0.345842 +i* -0.938354| 1.00006| 1.38421E-10 +i*-2.31696E-10| +| 20| 0.640621 +i* 0.767807| 0.999962|-6.98774E-13 +i* 1.13798E-12| ++---+----------------------------+------------+----------------------------+ +60000 racines de module = 0.999962 +40000 racines de module = 1.00006 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^50000 + (-10 +i*0)*x^150000 + (1 +i*0)*x^200000 + +(-5000 +i*0)*x^49999 + (-1.5E+06 +i*0)*x^149999 + (200000 +i*0)*x^199999 + +zone limite de 'log-exp' 1.00178 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 0 (of 4) uses CUDA device 0 +gpu 1 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 1 dimgrid2 196 start 50048 size 50048 +gpu 2 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 2 dimgrid2 196 start 100096 size 50048 +gpu 3 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 3 dimgrid2 196 start 150144 size 50048 +gpu 0 dimgrid 782 dimblock 256 degrePoly 200000 +gpu 0 dimgrid2 196 start 0 size 50048 +gpu 0 iter : 1 Arret : 0.000151294 s/iter 0.873722 +gpu 0 iter : 2 Arret : 0.000148163 s/iter 0.876720 +gpu 0 iter : 3 Arret : 0.000156239 s/iter 0.876483 +gpu 0 iter : 4 Arret : 0.000917016 s/iter 0.876408 +gpu 0 iter : 5 Arret : 0.00193309 s/iter 0.877387 +gpu 0 iter : 6 Arret : 0.012901 s/iter 1.040793 +gpu 0 iter : 7 Arret : 0.0696679 s/iter 1.039198 +gpu 0 iter : 8 Arret : 0.0831135 s/iter 1.017396 +gpu 0 iter : 9 Arret : 0.655093 s/iter 1.021459 +gpu 0 iter : 10 Arret : 0.310762 s/iter 1.026425 +gpu 0 iter : 11 Arret : 0.25028 s/iter 1.016739 +gpu 0 iter : 12 Arret : 0.12787 s/iter 1.024487 +gpu 0 iter : 13 Arret : 0.174578 s/iter 0.991808 +gpu 0 iter : 14 Arret : 0.13471 s/iter 1.020582 +gpu 0 iter : 15 Arret : 0.260288 s/iter 0.881413 +gpu 0 iter : 16 Arret : 0.151424 
s/iter 1.018801 +gpu 0 iter : 17 Arret : 0.070357 s/iter 0.881097 +gpu 0 iter : 18 Arret : 0.0196537 s/iter 0.881104 +gpu 0 iter : 19 Arret : 0.00113921 s/iter 0.878041 +gpu 0 iter : 20 Arret : 4.42128E-05 s/iter 0.877967 +gpu 0 iter : 21 Arret : 3.87634E-06 s/iter 0.878342 +gpu 0 iter : 22 Arret : 3.63936E-09 s/iter 0.878295 +gpu 0 iter : 23 Arret : 3.63838E-13 s/iter 0.878170 +temps : 22.9576 seconde(s) +Nb iterations : 23 +Nb de depassements de capacite exponentielle : 0 +Precision : 0.000181892 +Stabilite : 2.22061E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540303 +i* 0.841453| 0.999985| 1.08703E-11 +i*-2.49217E-12| +| 2| -0.837195 +i* 0.546877| 0.999985| -5.4492E-12 +i* 1.09163E-12| +| 3| -0.553418 +i* -0.832885| 0.999985| -1.9722E-12 +i*-7.40397E-12| +| 4| 0.828599 +i* -0.559925| 1.00005|-7.54521E-09 +i* 1.47059E-08| +| 5| -0.8197 +i* 0.572767| 0.999985|-4.21663E-13 +i* -2.8616E-12| +| 6| -0.57917 +i* -0.815188| 0.999985|-5.13034E-12 +i*-1.52645E-12| +| 7| 0.810626 +i* -0.585537| 0.999985|-6.36846E-12 +i*-5.86797E-12| +| 8| 0.591872 +i* 0.806089| 1.00005|-1.69803E-09 +i* 9.43795E-09| +| 9| -0.801454 +i* 0.598134| 1.00005| 5.92533E-09 +i* 3.55911E-08| +| 10| -0.604356 +i* -0.796695| 0.999985|-1.64091E-13 +i* 1.59084E-12| +| 11| 0.791937 +i* -0.610578| 0.999985| 6.0707E-13 +i* 1.52922E-12| +| 12| 0.616763 +i* 0.78713| 0.999985|-4.48042E-12 +i* -2.6295E-12| +| 13| -0.782301 +i* 0.622877| 0.999985|-2.15827E-12 +i*-6.27114E-12| +| 14| -0.628991 +i* -0.777472| 1.00005| 6.93065E-09 +i*-8.65443E-09| +| 15| 0.772474 +i* -0.635023| 0.999985| 1.54783E-11 +i*-1.81338E-12| +| 16| 0.641054 +i* 0.767476| 0.999985| 9.05009E-12 +i*-2.91295E-12| +| 17| -0.762458 +i* 0.647014| 0.999985| 5.81724E-12 +i*-9.99384E-12| +| 18| -0.652967 +i* -0.757366| 0.999985| 5.10392E-12 +i*-6.61069E-12| +| 19| 0.752302 +i* -0.658888| 1.00005| 
3.99107E-09 +i* 1.02117E-08| +| 20| 0.66472 +i* 0.747072| 0.999985|-1.93379E-12 +i*-1.29726E-11| ++---+----------------------------+------------+----------------------------+ +150000 racines de module = 0.999985 +50000 racines de module = 1.00005 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^150000 + (-10 +i*0)*x^250000 + (1 +i*0)*x^400000 + +(-15000 +i*0)*x^149999 + (-2.5E+06 +i*0)*x^249999 + (400000 +i*0)*x^399999 + +zone limite de 'log-exp' 1.00089 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 0 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 0 dimgrid2 391 start 0 size 100032 +gpu 2 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 2 dimgrid2 391 start 200064 size 100032 +gpu 3 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 3 dimgrid2 391 start 300096 size 100032 +gpu 1 dimgrid 1563 dimblock 256 degrePoly 400000 +gpu 1 dimgrid2 391 start 100032 size 100032 +gpu 0 iter : 1 Arret : 0.00053336 s/iter 3.114080 +gpu 0 iter : 2 Arret : 0.00132869 s/iter 3.113006 +gpu 0 iter : 3 Arret : 0.00304211 s/iter 3.113002 +gpu 0 iter : 4 Arret : 0.0081892 s/iter 3.421884 +gpu 0 iter : 5 Arret : 0.0174091 s/iter 3.393637 +gpu 0 iter : 6 Arret : 0.0170263 s/iter 3.378163 +gpu 0 iter : 7 Arret : 0.00925735 s/iter 3.423651 +gpu 0 iter : 8 Arret : 0.00879968 s/iter 3.111951 +gpu 0 iter : 9 Arret : 0.0133997 s/iter 3.368852 +gpu 0 iter : 10 Arret : 0.00968114 s/iter 3.111774 +gpu 0 iter : 11 Arret : 0.00462525 s/iter 3.110863 +gpu 0 iter : 12 Arret : 0.00341319 s/iter 3.111132 +gpu 0 iter : 13 Arret : 0.00439696 s/iter 3.110364 +gpu 0 iter : 14 Arret : 0.000354857 s/iter 3.110007 +gpu 0 iter : 15 Arret : 0.00105657 s/iter 3.109831 +gpu 0 iter : 16 Arret : 0.000563123 s/iter 3.109784 +gpu 0 iter : 17 Arret : 2.74759E-05 s/iter 3.109683 +gpu 0 iter : 18 Arret : 3.06801E-07 s/iter 3.109172 +gpu 0 iter : 19 Arret : 7.06164E-10 s/iter 3.108923 +gpu 0 iter : 20 Arret : 1.07684E-11 s/iter 
3.109509 +gpu 0 iter : 21 Arret : 1.64161E-13 s/iter 3.109378 +temps : 68.0633 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.09466E-07 +Stabilite : 3.51078E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540313 +i* 0.841453| 0.999991| 9.34197E-12 +i*-1.23633E-11| +| 2| -0.998329 +i* 0.057622| 0.999991| 4.43912E-12 +i* 1.27665E-12| +| 3| 0.439867 +i* -0.898052| 0.999991|-8.50653E-12 +i*-8.85586E-12| +| 4| -0.996033 +i* 0.0888768| 0.999991|-3.15592E-12 +i* 1.17456E-12| +| 5| 0.411521 +i* -0.911417| 1.00002|-2.94737E-09 +i* 1.73005E-09| +| 6| 0.59196 +i* 0.805956| 0.999991| 5.24358E-13 +i*-8.53073E-12| +| 7| -0.992759 +i* 0.120044| 0.999991| 2.58804E-12 +i* 2.47274E-12| +| 8| 0.382796 +i* -0.923823| 0.999991|-1.63092E-11 +i* 4.26312E-12| +| 9| 0.616925 +i* 0.78701| 0.999991| 4.27514E-12 +i*-1.13966E-11| +| 10| -0.988534 +i* 0.151098| 1.00002|-8.27014E-10 +i* 9.44171E-10| +| 11| 0.35366 +i* -0.935364| 0.999991|-1.92664E-11 +i* 1.19958E-11| +| 12| 0.641299 +i* 0.767311| 1.00002|-2.44657E-09 +i* -6.7886E-11| +| 13| -0.983286 +i* 0.18202| 0.999991| 3.21676E-12 +i*-9.48297E-13| +| 14| 0.324176 +i* -0.945987| 0.999991|-5.20695E-12 +i*-7.06984E-12| +| 15| 0.66503 +i* 0.746804| 0.999991| 5.74873E-13 +i* 8.53884E-12| +| 16| -0.977123 +i* 0.212747| 1.00002| 1.09185E-09 +i* 2.38902E-10| +| 17| 0.294374 +i* -0.955681| 0.999991|-2.37395E-11 +i*-2.53098E-12| +| 18| 0.688122 +i* 0.725616| 1.00002|-2.54456E-09 +i* 8.15125E-10| +| 19| -0.969965 +i* 0.243206| 0.999991| 6.88072E-12 +i* 3.20268E-13| +| 20| 0.264283 +i* -0.964436| 0.999991| 2.5573E-11 +i*-6.45539E-12| ++---+----------------------------+------------+----------------------------+ +250000 racines de module = 0.999991 +150000 racines de module = 1.00002 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^250000 + (-10 +i*0)*x^350000 + (1 
+i*0)*x^600000 + +(-25000 +i*0)*x^249999 + (-3.5E+06 +i*0)*x^349999 + (600000 +i*0)*x^599999 + +zone limite de 'log-exp' 1.00059 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 3 (of 4) uses CUDA device 3 +gpu 0 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 0 dimgrid2 586 start 0 size 150016 +gpu 2 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 2 dimgrid2 586 start 300032 size 150016 +gpu 1 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 1 dimgrid2 586 start 150016 size 150016 +gpu 3 dimgrid 2344 dimblock 256 degrePoly 600000 +gpu 3 dimgrid2 586 start 450048 size 150016 +gpu 0 iter : 1 Arret : 0.00166144 s/iter 6.733254 +gpu 0 iter : 2 Arret : 0.00663307 s/iter 6.721345 +gpu 0 iter : 3 Arret : 0.0196947 s/iter 6.725089 +gpu 0 iter : 4 Arret : 0.0354088 s/iter 7.044531 +gpu 0 iter : 5 Arret : 0.0344666 s/iter 7.231490 +gpu 0 iter : 6 Arret : 0.0255965 s/iter 7.223546 +gpu 0 iter : 7 Arret : 0.0250307 s/iter 7.248225 +gpu 0 iter : 8 Arret : 0.0220818 s/iter 7.524758 +gpu 0 iter : 9 Arret : 0.0193422 s/iter 7.217155 +gpu 0 iter : 10 Arret : 0.0384961 s/iter 7.206267 +gpu 0 iter : 11 Arret : 0.0308611 s/iter 7.198073 +gpu 0 iter : 12 Arret : 0.0139003 s/iter 7.227655 +gpu 0 iter : 13 Arret : 0.00821788 s/iter 6.730489 +gpu 0 iter : 14 Arret : 0.00366002 s/iter 7.146524 +gpu 0 iter : 15 Arret : 0.00103013 s/iter 6.725238 +gpu 0 iter : 16 Arret : 0.000538911 s/iter 6.724848 +gpu 0 iter : 17 Arret : 0.000270623 s/iter 6.725086 +gpu 0 iter : 18 Arret : 4.24795E-05 s/iter 6.724157 +gpu 0 iter : 19 Arret : 5.07342E-09 s/iter 6.723896 +gpu 0 iter : 20 Arret : 7.14369E-11 s/iter 6.724108 +gpu 0 iter : 21 Arret : 1.00557E-12 s/iter 6.725050 +gpu 0 iter : 22 Arret : 1.41479E-14 s/iter 6.724347 +temps : 154.313 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 1.37653E-08 +Stabilite : 2.77613E-15 
++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540302 +i* 0.841463| 0.999993| 8.34199E-12 +i* -1.9051E-11| +| 2| -0.553438 +i* -0.832883| 0.999993|-2.10654E-12 +i*-2.55273E-11| +| 3| -0.579282 +i* -0.815119| 0.999993|-1.44751E-12 +i* 7.66798E-12| +| 4| 0.592014 +i* 0.805919| 0.999993|-3.98037E-12 +i* 9.55808E-12| +| 5| -0.604557 +i* -0.796554| 0.999993|-2.82974E-12 +i* 9.99473E-12| +| 6| 0.61698 +i* 0.78697| 0.999993| 9.01823E-12 +i*-5.69156E-12| +| 7| -0.629237 +i* -0.777205| 0.999993|-2.92122E-12 +i*-4.85867E-12| +| 8| 0.641354 +i* 0.767237| 0.999993|-1.64209E-11 +i* 1.12904E-12| +| 9| -0.653299 +i* -0.757092| 0.999993|-8.22453E-13 +i* 2.82818E-12| +| 10| 0.665096 +i* 0.746749| 0.999993| -1.2145E-11 +i* 1.89129E-11| +| 11| -0.676717 +i* -0.736234| 0.999993|-1.26079E-11 +i*-1.25073E-11| +| 12| 0.688185 +i* 0.725526| 0.999993| 2.69875E-11 +i* 1.65411E-11| +| 13| -0.699466 +i* -0.714679| 1.00001| 3.92343E-10 +i*-3.02623E-09| +| 14| 0.710597 +i* 0.70359| 0.999993| 1.28564E-11 +i* 1.56626E-11| +| 15| -0.721517 +i* -0.69241| 1.00001| 1.76709E-09 +i*-4.04041E-09| +| 16| 0.73231 +i* 0.680962| 0.999993| 1.34706E-11 +i*-4.43489E-12| +| 17| -0.742944 +i* -0.669367| 1.00001| 9.14394E-11 +i*-3.49261E-09| +| 18| 0.7533 +i* 0.657691| 1.00001| 1.64587E-09 +i*-3.03669E-09| +| 19| -0.763551 +i* -0.645737| 0.999993| 1.68299E-11 +i* 1.43271E-11| +| 20| 0.773539 +i* 0.633763| 1.00001| -4.2314E-09 +i* 1.86243E-09| ++---+----------------------------+------------+----------------------------+ +350000 racines de module = 0.999993 +250000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^300000 + (-10 +i*0)*x^500000 + (1 +i*0)*x^800000 + +(-30000 +i*0)*x^299999 + (-5E+06 +i*0)*x^499999 + (800000 +i*0)*x^799999 + +zone limite de 'log-exp' 1.00044 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 
1 (of 4) uses CUDA device 1 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 3 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 3 dimgrid2 782 start 600000 size 200000 +gpu 1 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 1 dimgrid2 782 start 200000 size 200000 +gpu 0 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 0 dimgrid2 782 start 0 size 200000 +gpu 2 dimgrid 3125 dimblock 256 degrePoly 800000 +gpu 2 dimgrid2 782 start 400000 size 200000 +gpu 0 iter : 1 Arret : 0.00108387 s/iter 12.149827 +gpu 0 iter : 2 Arret : 0.00154284 s/iter 12.327396 +gpu 0 iter : 3 Arret : 0.00442373 s/iter 12.172431 +gpu 0 iter : 4 Arret : 0.0484674 s/iter 12.229082 +gpu 0 iter : 5 Arret : 0.0462186 s/iter 12.248952 +gpu 0 iter : 6 Arret : 0.0672711 s/iter 12.235166 +gpu 0 iter : 7 Arret : 0.0371959 s/iter 12.355881 +gpu 0 iter : 8 Arret : 0.0332451 s/iter 12.399234 +gpu 0 iter : 9 Arret : 0.0347928 s/iter 12.369857 +gpu 0 iter : 10 Arret : 0.0382283 s/iter 12.701023 +gpu 0 iter : 11 Arret : 0.010893 s/iter 12.800482 +gpu 0 iter : 12 Arret : 0.0100182 s/iter 12.206749 +gpu 0 iter : 13 Arret : 0.000870471 s/iter 12.137340 +gpu 0 iter : 14 Arret : 0.00222619 s/iter 12.140578 +gpu 0 iter : 15 Arret : 0.000360359 s/iter 12.119427 +gpu 0 iter : 16 Arret : 0.000163251 s/iter 12.146378 +gpu 0 iter : 17 Arret : 8.3446E-05 s/iter 12.146441 +gpu 0 iter : 18 Arret : 5.95325E-07 s/iter 12.141680 +gpu 0 iter : 19 Arret : 1.07969E-09 s/iter 12.142666 +gpu 0 iter : 20 Arret : 2.37954E-12 s/iter 12.145013 +gpu 0 iter : 21 Arret : 3.63218E-14 s/iter 12.145853 +temps : 258.82 seconde(s) +Nb iterations : 21 +Nb de depassements de capacite exponentielle : 0 +Precision : 6.97756E-07 +Stabilite : 2.22043E-16 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.540305 +i* 0.841464| 0.999995| -2.03E-11 +i* 2.74701E-11| +| 2| 0.592014 +i* 0.805922| 0.999995|-1.82734E-11 +i* 
2.10218E-11| +| 3| 0.617007 +i* 0.786952| 0.999995| 4.23442E-11 +i* -6.2147E-12| +| 4| 0.641392 +i* 0.767207| 0.999995| 6.90537E-12 +i*-5.12417E-11| +| 5| 0.665146 +i* 0.746707| 0.999995| 2.02977E-11 +i* 7.48579E-12| +| 6| 0.688245 +i* 0.725472| 0.999995|-1.73153E-11 +i* -1.2656E-11| +| 7| 0.710667 +i* 0.703522| 0.999995| 3.69782E-12 +i* 2.3081E-12| +| 8| 0.732388 +i* 0.68088| 0.999995| 9.45355E-12 +i* 2.09024E-11| +| 9| 0.753381 +i* 0.657577| 0.999995| 3.40094E-11 +i* 1.45989E-12| +| 10| 0.77364 +i* 0.633618| 0.999995|-1.72307E-11 +i* 1.22723E-11| +| 11| 0.793138 +i* 0.609034| 0.999995| 3.89222E-12 +i* 2.21356E-11| +| 12| 0.811855 +i* 0.583851| 0.999995|-1.28337E-11 +i*-5.47207E-12| +| 13| 0.829772 +i* 0.558094| 0.999995|-1.63114E-11 +i*-1.64246E-12| +| 14| 0.846873 +i* 0.531786| 0.999995|-3.30451E-11 +i*-8.10676E-12| +| 15| 0.86314 +i* 0.504956| 0.999995|-4.00413E-12 +i* 3.04823E-11| +| 16| 0.878557 +i* 0.477628| 0.999995|-2.16493E-12 +i* 1.10533E-11| +| 17| 0.893104 +i* 0.449841| 0.999995|-1.48552E-11 +i* 1.06063E-11| +| 18| 0.906777 +i* 0.4216| 0.999995|-1.38745E-11 +i* 5.33384E-12| +| 19| 0.919557 +i* 0.392944| 0.999995|-3.33245E-11 +i* 5.94386E-12| +| 20| 0.931433 +i* 0.363901| 0.999995| 4.93219E-11 +i*-2.82651E-11| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 0.999995 +300000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^400000 + (-10 +i*0)*x^600000 + (1 +i*0)*x^1000000 + +(-40000 +i*0)*x^399999 + (-6E+06 +i*0)*x^599999 + (1E+06 +i*0)*x^999999 + +zone limite de 'log-exp' 1.00035 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 2 (of 4) uses CUDA device 2 +gpu 3 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 3 dimgrid2 977 start 750144 size 250048 +gpu 0 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 0 dimgrid2 977 start 0 size 250048 +gpu 1 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 1 dimgrid2 
977 start 250048 size 250048 +gpu 2 dimgrid 3907 dimblock 256 degrePoly 1000000 +gpu 2 dimgrid2 977 start 500096 size 250048 +gpu 0 iter : 1 Arret : 0.000456228 s/iter 18.772328 +gpu 0 iter : 2 Arret : 0.00142575 s/iter 18.751830 +gpu 0 iter : 3 Arret : 0.00549425 s/iter 18.764447 +gpu 0 iter : 4 Arret : 0.0229296 s/iter 19.538754 +gpu 0 iter : 5 Arret : 0.0173741 s/iter 19.273977 +gpu 0 iter : 6 Arret : 0.0179817 s/iter 19.297823 +gpu 0 iter : 7 Arret : 0.0102999 s/iter 18.835443 +gpu 0 iter : 8 Arret : 0.00783109 s/iter 19.616467 +gpu 0 iter : 9 Arret : 0.00443683 s/iter 19.576776 +gpu 0 iter : 10 Arret : 0.00652305 s/iter 18.757222 +gpu 0 iter : 11 Arret : 0.00589396 s/iter 18.772725 +gpu 0 iter : 12 Arret : 0.00781914 s/iter 18.746761 +gpu 0 iter : 13 Arret : 0.00825508 s/iter 18.745513 +gpu 0 iter : 14 Arret : 0.00209831 s/iter 18.746669 +gpu 0 iter : 15 Arret : 0.000157396 s/iter 18.747760 +gpu 0 iter : 16 Arret : 0.000185725 s/iter 18.747416 +gpu 0 iter : 17 Arret : 0.000163905 s/iter 18.747056 +gpu 0 iter : 18 Arret : 6.34206E-05 s/iter 18.748309 +gpu 0 iter : 19 Arret : 5.65573E-06 s/iter 18.749904 +gpu 0 iter : 20 Arret : 7.0784E-09 s/iter 18.749738 +gpu 0 iter : 21 Arret : 2.24468E-11 s/iter 18.748487 +gpu 0 iter : 22 Arret : 7.09418E-14 s/iter 18.747345 +temps : 422.324 seconde(s) +Nb iterations : 22 +Nb de depassements de capacite exponentielle : 0 +Precision : 8.97857E-06 +Stabilite : 5.20859E-14 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841468| 0.999996| 5.07216E-12 +i* 6.41236E-12| +| 2| 0.529701 +i* 0.84818| 0.999996|-4.61853E-13 +i*-4.17888E-12| +| 3| 0.524361 +i* 0.851491| 0.999996|-2.47296E-11 +i* 1.78327E-11| +| 4| 0.51901 +i* 0.854764| 0.999996| 9.45599E-12 +i* 2.07434E-11| +| 5| 0.513629 +i* 0.858008| 0.999996| 2.32483E-11 +i* 6.70747E-12| +| 6| 0.508237 +i* 0.861213| 
0.999996|-1.34339E-11 +i* 9.87854E-12| +| 7| 0.502825 +i* 0.864384| 0.999996|-3.18459E-11 +i* 7.64744E-12| +| 8| 0.497384 +i* 0.867526| 0.999996| 2.97429E-11 +i*-6.06626E-13| +| 9| 0.491932 +i* 0.870629| 0.999996|-2.65525E-11 +i* 1.22525E-11| +| 10| 0.486452 +i* 0.873703| 0.999996| 3.0312E-11 +i* 1.02214E-11| +| 11| 0.480962 +i* 0.876737| 0.999996| 1.81546E-11 +i* 8.04012E-12| +| 12| 0.475453 +i* 0.879736| 0.999996| 3.09861E-11 +i* 4.093E-12| +| 13| 0.469917 +i* 0.882706| 0.999996|-1.29106E-11 +i*-2.31489E-11| +| 14| 0.46437 +i* 0.885637| 0.999996| 1.38481E-11 +i* -1.517E-11| +| 15| 0.458797 +i* 0.888537| 0.999996| 2.78862E-11 +i* 1.10441E-11| +| 16| 0.453214 +i* 0.891397| 0.999996| 2.45506E-11 +i* 3.1726E-11| +| 17| 0.447614 +i* 0.894223| 0.999996|-1.08491E-12 +i*-2.12277E-11| +| 18| 0.441986 +i* 0.897017| 0.999996| 2.72476E-11 +i* 3.22485E-11| +| 19| 0.436351 +i* 0.899772| 0.999996|-1.24334E-11 +i*-2.66317E-11| +| 20| 0.430689 +i* 0.902496| 0.999996| 2.73914E-12 +i* 2.25153E-11| ++---+----------------------------+------------+----------------------------+ +600000 racines de module = 0.999996 +400000 racines de module = 1.00001 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^500000 + (-10 +i*0)*x^700000 + (1 +i*0)*x^1200000 + +(-50000 +i*0)*x^499999 + (-7E+06 +i*0)*x^699999 + (1.2E+06 +i*0)*x^1199999 + +zone limite de 'log-exp' 1.0003 +CPU thread 3 (of 4) uses CUDA device 3 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 1 (of 4) uses CUDA device 1 +gpu 0 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 3 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 3 dimgrid2 1172 start 900096 size 300032 +gpu 2 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 0 dimgrid2 1172 start 0 size 300032 +gpu 2 dimgrid2 1172 start 600064 size 300032 +gpu 1 dimgrid 4688 dimblock 256 degrePoly 1200000 +gpu 1 dimgrid2 1172 start 300032 size 300032 +gpu 0 iter : 1 Arret : 0.00368442 s/iter 26.569710 +gpu 0 iter : 2 Arret : 3.704 s/iter 28.385681 +gpu 0 iter : 3 
Arret : 1.74615 s/iter 28.502041 +gpu 0 iter : 4 Arret : 2.12336 s/iter 28.609424 +gpu 0 iter : 5 Arret : 2.13811 s/iter 29.338801 +gpu 0 iter : 6 Arret : 0.766739 s/iter 29.346300 +gpu 0 iter : 7 Arret : 0.657775 s/iter 29.516021 +gpu 0 iter : 8 Arret : 0.597705 s/iter 29.678298 +gpu 0 iter : 9 Arret : 0.573945 s/iter 29.579526 +gpu 0 iter : 10 Arret : 0.542611 s/iter 29.795670 +gpu 0 iter : 11 Arret : 0.488156 s/iter 29.717429 +gpu 0 iter : 12 Arret : 0.463721 s/iter 29.588883 +gpu 0 iter : 13 Arret : 0.442782 s/iter 29.618542 +gpu 0 iter : 14 Arret : 0.43109 s/iter 29.294507 +gpu 0 iter : 15 Arret : 0.427026 s/iter 29.324604 +gpu 0 iter : 16 Arret : 0.434845 s/iter 29.362199 +gpu 0 iter : 17 Arret : 0.442084 s/iter 29.279579 +gpu 0 iter : 18 Arret : 0.46093 s/iter 29.338081 +gpu 0 iter : 19 Arret : 0.48645 s/iter 29.333743 +gpu 0 iter : 20 Arret : 0.496349 s/iter 29.369982 +gpu 0 iter : 21 Arret : 1.56187 s/iter 28.940178 +gpu 0 iter : 22 Arret : 2.3748 s/iter 28.784866 +gpu 0 iter : 23 Arret : 1.09653 s/iter 28.933834 +gpu 0 iter : 24 Arret : 1.43739 s/iter 28.700919 +gpu 0 iter : 25 Arret : 2.22796 s/iter 28.722635 +gpu 0 iter : 26 Arret : 1.54855 s/iter 28.698877 +gpu 0 iter : 27 Arret : 1.95651 s/iter 28.629259 +gpu 0 iter : 28 Arret : 0.897983 s/iter 28.648379 +gpu 0 iter : 29 Arret : 7.34662 s/iter 28.534855 +gpu 0 iter : 30 Arret : 1.74621 s/iter 28.422914 +gpu 0 iter : 31 Arret : 0.597689 s/iter 28.621303 +gpu 0 iter : 32 Arret : 0.857922 s/iter 28.617561 +gpu 0 iter : 33 Arret : 1.33974 s/iter 28.328536 +gpu 0 iter : 34 Arret : 10.8161 s/iter 28.390666 +gpu 0 iter : 35 Arret : 6.6951 s/iter 28.507533 +gpu 0 iter : 36 Arret : 0.757761 s/iter 28.460493 +gpu 0 iter : 37 Arret : 0.588104 s/iter 28.489026 +gpu 0 iter : 38 Arret : 0.593958 s/iter 28.232970 +gpu 0 iter : 39 Arret : 0.333943 s/iter 27.617579 +gpu 0 iter : 40 Arret : 0.276517 s/iter 27.632546 +gpu 0 iter : 41 Arret : 0.137564 s/iter 27.552902 +gpu 0 iter : 42 Arret : 0.0648876 s/iter 27.307198 
+gpu 0 iter : 43 Arret : 0.0511538 s/iter 27.320582 +gpu 0 iter : 44 Arret : 0.0242118 s/iter 26.798806 +gpu 0 iter : 45 Arret : 0.00922443 s/iter 26.583042 +gpu 0 iter : 46 Arret : 0.00927718 s/iter 26.616458 +gpu 0 iter : 47 Arret : 0.0412361 s/iter 26.563085 +gpu 0 iter : 48 Arret : 0.0405407 s/iter 26.561073 +gpu 0 iter : 49 Arret : 0.00788436 s/iter 26.567749 +gpu 0 iter : 50 Arret : 0.00128029 s/iter 26.567412 +gpu 0 iter : 51 Arret : 0.000171237 s/iter 26.567449 +gpu 0 iter : 52 Arret : 7.02979E-07 s/iter 26.567944 +gpu 0 iter : 53 Arret : 2.0296E-09 s/iter 26.567809 +gpu 0 iter : 54 Arret : 8.07801E-12 s/iter 26.567272 +gpu 0 iter : 55 Arret : 3.21626E-14 s/iter 26.572179 +temps : 1556.58 seconde(s) +Nb iterations : 55 +Nb de depassements de capacite exponentielle : 0 +Precision : 4.03717E-06 +Stabilite : 4.93017E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.54031 +i* 0.841472| 1| 1.4588E-09 +i* 4.51768E-09| +| 2| 0.513633 +i* 0.858015| 1| 1.54651E-09 +i*-2.27023E-10| +| 3| 0.486451 +i* 0.873713| 1| 1.95054E-09 +i* 6.77633E-10| +| 4| 0.458805 +i* 0.888533| 0.999997| 1.78773E-11 +i* 1.55684E-11| +| 5| 0.430685 +i* 0.902499| 0.999997| 2.12053E-13 +i*-1.16324E-11| +| 6| 0.402126 +i* 0.915589| 1| 2.50282E-09 +i*-6.10471E-09| +| 7| 0.3732 +i* 0.927747| 0.999997|-1.54374E-11 +i*-2.76083E-11| +| 8| 0.3439 +i* 0.939003| 0.999997|-1.12714E-11 +i* 1.5453E-11| +| 9| 0.314261 +i* 0.949333| 0.999997| 1.93628E-11 +i* 2.50909E-11| +| 10| 0.284313 +i* 0.958728| 0.999997| 2.69426E-11 +i* 2.77974E-11| +| 11| 0.254084 +i* 0.967179| 0.999997| 1.5277E-11 +i* 4.73027E-12| +| 12| 0.223605 +i* 0.974676| 0.999997| -8.1017E-11 +i*-3.77299E-11| +| 13| 0.192909 +i* 0.981221| 1|-1.95729E-09 +i* 4.84549E-09| +| 14| 0.162018 +i* 0.986792| 1| 1.80241E-09 +i* 1.03051E-10| +| 15| 0.130967 +i* 0.991391| 1|-1.93729E-10 +i*-4.06442E-10| +| 16| 
0.0998077 +i* 0.995003| 0.999997| -4.5103E-11 +i*-6.66658E-12| +| 17| 0.0685404 +i* 0.997645| 0.999997| 1.01124E-11 +i* 3.1089E-12| +| 18| 0.0371504 +i* 0.999314| 1|-1.38879E-09 +i*-2.32658E-09| +| 19| 0.00578048 +i* 0.99998| 0.999997| 3.46787E-11 +i* 1.94857E-13| +| 20| -0.0256056 +i* 0.999669| 0.999997| 2.01068E-11 +i*-1.22213E-12| ++---+----------------------------+------------+----------------------------+ +500000 racines de module = 1 +700000 racines de module = 0.999997 +(1 +i*0)*x^0 + (-0.1 +i*0)*x^600000 + (-10 +i*0)*x^800000 + (1 +i*0)*x^1400000 + +(-60000 +i*0)*x^599999 + (-8E+06 +i*0)*x^799999 + (1.4E+06 +i*0)*x^1399999 + +zone limite de 'log-exp' 1.00025 +CPU thread 1 (of 4) uses CUDA device 1 +CPU thread 0 (of 4) uses CUDA device 0 +CPU thread 2 (of 4) uses CUDA device 2 +CPU thread 3 (of 4) uses CUDA device 3 +gpu 0 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 0 dimgrid2 1368 start 0 size 350016 +gpu 1 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 1 dimgrid2 1368 start 350016 size 350016 +gpu 2 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 2 dimgrid2 1368 start 700032 size 350016 +gpu 3 dimgrid 5469 dimblock 256 degrePoly 1400000 +gpu 3 dimgrid2 1368 start 1050048 size 350016 +gpu 0 iter : 1 Arret : 0.00408309 s/iter 36.124369 +gpu 0 iter : 2 Arret : 0.208632 s/iter 36.641290 +gpu 0 iter : 3 Arret : 1.37702 s/iter 37.617641 +gpu 0 iter : 4 Arret : 1.45346 s/iter 37.349167 +gpu 0 iter : 5 Arret : 1.6393 s/iter 37.990887 +gpu 0 iter : 6 Arret : 3.4316 s/iter 38.064434 +gpu 0 iter : 7 Arret : 1.9865 s/iter 38.951955 +gpu 0 iter : 8 Arret : 4.57739 s/iter 39.092906 +gpu 0 iter : 9 Arret : 2.70182 s/iter 39.516603 +gpu 0 iter : 10 Arret : 2.54353 s/iter 40.448257 +gpu 0 iter : 11 Arret : 1.82865 s/iter 40.236603 +gpu 0 iter : 12 Arret : 0.783909 s/iter 39.432599 +gpu 0 iter : 13 Arret : 1.89333 s/iter 39.521084 +gpu 0 iter : 14 Arret : 1.37044 s/iter 39.264476 +gpu 0 iter : 15 Arret : 3.05361 s/iter 38.860385 +gpu 0 iter : 16 Arret : 2.08571 
s/iter 38.971159 +gpu 0 iter : 17 Arret : 2.09101 s/iter 38.887096 +gpu 0 iter : 18 Arret : 1.02745 s/iter 38.910018 +gpu 0 iter : 19 Arret : 0.704384 s/iter 38.234669 +gpu 0 iter : 20 Arret : 0.741087 s/iter 38.350019 +gpu 0 iter : 21 Arret : 0.788627 s/iter 38.106199 +gpu 0 iter : 22 Arret : 1.04305 s/iter 37.990724 +gpu 0 iter : 23 Arret : 2.78018 s/iter 38.167968 +gpu 0 iter : 24 Arret : 3.62183 s/iter 38.203661 +gpu 0 iter : 25 Arret : 5.50084 s/iter 37.940466 +gpu 0 iter : 26 Arret : 0.606592 s/iter 38.122389 +gpu 0 iter : 27 Arret : 0.700038 s/iter 37.866885 +gpu 0 iter : 28 Arret : 0.418813 s/iter 37.840730 +gpu 0 iter : 29 Arret : 0.495401 s/iter 37.808439 +gpu 0 iter : 30 Arret : 0.988549 s/iter 37.865318 +gpu 0 iter : 31 Arret : 0.749386 s/iter 37.753243 +gpu 0 iter : 32 Arret : 0.852267 s/iter 37.713161 +gpu 0 iter : 33 Arret : 1.16501 s/iter 37.855558 +gpu 0 iter : 34 Arret : 0.385689 s/iter 37.935460 +gpu 0 iter : 35 Arret : 0.393423 s/iter 37.441807 +gpu 0 iter : 36 Arret : 0.317888 s/iter 36.669962 +gpu 0 iter : 37 Arret : 0.23539 s/iter 36.318606 +gpu 0 iter : 38 Arret : 0.0527559 s/iter 36.193597 +gpu 0 iter : 39 Arret : 0.0143793 s/iter 36.106964 +gpu 0 iter : 40 Arret : 0.00318939 s/iter 36.183822 +gpu 0 iter : 41 Arret : 2.64184E-05 s/iter 36.123292 +gpu 0 iter : 42 Arret : 1.30802E-08 s/iter 36.116093 +gpu 0 iter : 43 Arret : 1.80499E-10 s/iter 36.117759 +gpu 0 iter : 44 Arret : 2.48451E-12 s/iter 36.115451 +gpu 0 iter : 45 Arret : 3.41814E-14 s/iter 36.113705 +temps : 1704.89 seconde(s) +Nb iterations : 45 +Nb de depassements de capacite exponentielle : 0 +Precision : 2.68566E-08 +Stabilite : 7.85076E-15 ++---+----------------------------+------------+----------------------------+ +| i | Zi | mod(Zi) | P(Zi) | ++---+----------------------------+------------+----------------------------+ +| 1| 0.5403 +i* 0.841469| 0.999997|-5.74141E-12 +i*-6.39521E-11| +| 2| 0.513623 +i* 0.858013| 0.999997|-2.15776E-11 +i*-2.98557E-11| +| 3| -0.52703 +i* 
-0.849843| 0.999997|-6.50922E-11 +i* 8.44216E-12| +| 4| 0.486439 +i* 0.873711| 0.999997| 5.60277E-11 +i* 4.36779E-11| +| 5| -0.500096 +i* -0.865967| 0.999997| 3.56147E-11 +i*-3.12713E-11| +| 6| 0.458776 +i* 0.888549| 0.999997|-1.89702E-11 +i* 4.08274E-12| +| 7| -0.472669 +i* -0.881237| 0.999997|-1.66496E-11 +i*-3.61498E-11| +| 8| 0.430661 +i* 0.902511| 0.999997|-1.60558E-11 +i*-1.29949E-11| +| 9| -0.444791 +i* -0.895631| 0.999997| 3.68259E-11 +i* 1.36002E-12| +| 10| 0.402136 +i* 0.915577| 0.999997| 6.5834E-12 +i* -1.3935E-11| +| 11| -0.416432 +i* -0.909164| 0.999997| 1.97816E-11 +i* 3.10848E-11| +| 12| 0.373171 +i* 0.927759| 0.999997|-2.17995E-11 +i*-2.96867E-12| +| 13| -0.387698 +i* -0.921783| 0.999997|-1.86324E-11 +i* -4.6545E-11| +| 14| 0.343875 +i* 0.939012| 0.999997| 3.06317E-11 +i* 7.08794E-11| +| 15| -0.358575 +i* -0.933498| 0.999997| 8.13599E-11 +i*-1.42233E-11| +| 16| 0.314233 +i* 0.949343| 0.999997| 3.86503E-11 +i* 2.08775E-11| +| 17| -0.329098 +i* -0.944293| 0.999997|-1.57903E-11 +i* 2.05052E-11| +| 18| 0.284281 +i* 0.958738| 0.999997| 2.51592E-11 +i* 2.09243E-11| +| 19| -0.299297 +i* -0.954157| 0.999997| 5.03608E-12 +i* 1.70503E-11| +| 20| 0.254048 +i* 0.967189| 0.999997|-2.81228E-11 +i*-1.66302E-11| ++---+----------------------------+------------+----------------------------+ +800000 racines de module = 0.999997 +600000 racines de module = 1 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140097: line 23: 10309 Segmentation fault (core dumped) ./template -r -i 900000 700000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140097: line 24: 10313 Segmentation fault (core dumped) ./template -r -i 1000000 800000 +/Softs/Sge/mesodell/spool/node1-50/job_scripts/140097: line 25: 10315 Segmentation fault (core dumped) ./template -r -i 1500000 500000 diff --git a/Simulations/sparse_openmp/sparse_openmp_4GPU.sge b/Simulations/sparse_openmp/sparse_openmp_4GPU.sge new file mode 100644 index 0000000..1b5ae2f --- /dev/null +++ 
b/Simulations/sparse_openmp/sparse_openmp_4GPU.sge @@ -0,0 +1,27 @@ +#!/bin/bash -l +#$ -q tesla.q +#$ -l gpu=4 +## adapter selon besoin +#$ -l h_vmem=15G +#$ -pe openmp 4 +#$ -V +#$ -cwd +#$ -N sparse_openmp_4GPU + +module load gcc/4.9.0 +module load cuda/7.0 + + +./template -r -i 60000 40000 +./template -r -i 150000 50000 +./template -r -i 250000 150000 +./template -r -i 350000 250000 +./template -r -i 500000 300000 +./template -r -i 600000 400000 +./template -r -i 700000 500000 +./template -r -i 800000 600000 +./template -r -i 900000 700000 +./template -r -i 1000000 800000 +./template -r -i 1500000 500000 + + diff --git a/Sparse_mpi.pdf b/Sparse_mpi.pdf new file mode 100644 index 0000000..2bdfcfa Binary files /dev/null and b/Sparse_mpi.pdf differ diff --git a/Sparse_mpivsomp.pdf b/Sparse_mpivsomp.pdf new file mode 100644 index 0000000..4b4412a Binary files /dev/null and b/Sparse_mpivsomp.pdf differ diff --git a/Sparse_openmp.pdf b/Sparse_openmp.pdf new file mode 100644 index 0000000..3c41967 Binary files /dev/null and b/Sparse_openmp.pdf differ diff --git a/paper.tex b/paper.tex index 6c21bfa..c4f142d 100644 --- a/paper.tex +++ b/paper.tex @@ -571,18 +571,46 @@ Algorithm~\ref{alg2-cuda} shows a sketch of the Ehrlich-Aberth method using CUDA \begin{figure}[htbp] \centering - \includegraphics[angle=-90,width=0.6\textwidth]{GPU_openmp} -\caption{Execution times in seconds of the Ehrlich-Aberth method on GPUs using shared memory paradigm with OpenMP} + \includegraphics[angle=-90,width=0.5\textwidth]{Sparse_openmp} +\caption{Execution times in seconds of the Ehrlich-Aberth method for solving sparse polynomials on GPUs using shared memory paradigm with OpenMP} \label{fig:01} \end{figure} \begin{figure}[htbp] \centering - \includegraphics[angle=-90,width=0.6\textwidth]{GPU_mpi} -\caption{Execution times in seconds of the Ehrlich-Aberth method on GPUs using distributed memory paradigm with MPI} + \includegraphics[angle=-90,width=0.5\textwidth]{Sparse_mpi} 
+\caption{Execution times in seconds of the Ehrlich-Aberth method for solving sparse polynomials on GPUs using distributed memory paradigm with MPI} \label{fig:02} \end{figure} +\begin{figure}[htbp] +\centering + \includegraphics[angle=-90,width=0.5\textwidth]{Full_openmp} +\caption{Execution times in seconds of the Ehrlich-Aberth method for solving full polynomials on GPUs using shared memory paradigm with OpenMP} +\label{fig:03} +\end{figure} + +\begin{figure}[htbp] +\centering + \includegraphics[angle=-90,width=0.5\textwidth]{Full_mpi} +\caption{Execution times in seconds of the Ehrlich-Aberth method for solving full polynomials on GPUs using distributed memory paradigm with MPI} +\label{fig:04} +\end{figure} + +\begin{figure}[htbp] +\centering + \includegraphics[angle=-90,width=0.5\textwidth]{Sparse_mpivsomp} +\caption{Comparison between MPI and OpenMP versions of the Ehrlich-Aberth method for solving sparse polynomials on GPUs} +\label{fig:05} +\end{figure} + +\begin{figure}[htbp] +\centering + \includegraphics[angle=-90,width=0.5\textwidth]{Full_mpivsomp} +\caption{Comparison between MPI and OpenMP versions of the Ehrlich-Aberth method for solving full polynomials on GPUs} +\label{fig:06} +\end{figure} + % An example of a floating figure using the graphicx package. % Note that \label must occur AFTER (or within) \caption. % For figures, \caption should occur after the \includegraphics.