<html><head></head><body style="word-wrap: break-word; -webkit-nbsp-mode: space; -webkit-line-break: after-white-space; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">Hi,</span></font><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font><div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">Le 15 déc. 2011 à 17:22, Bernard Chambon a écrit :</span></font></div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br class="Apple-interchange-newline"></span></font><blockquote type="cite"><span class="Apple-style-span" style="border-collapse: separate; font-style: normal; font-variant: normal; font-weight: normal; letter-spacing: normal; line-height: normal; orphans: 2; text-indent: 0px; text-transform: none; white-space: normal; widows: 2; word-spacing: 0px; -webkit-border-horizontal-spacing: 0px; -webkit-border-vertical-spacing: 0px; -webkit-text-decorations-in-effect: none; -webkit-text-size-adjust: auto; -webkit-text-stroke-width: 0px; "><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">I'm still working on failures encountered as the number of tasks increases</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">(Using mpich2-1.4, compiled with gcc 4.1, on Scientific Linux 5 , 2.6.18-238.12cc.el5)</span></font></div></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br class="Apple-interchange-newline"></span></font></blockquote><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">Other tests, on the same machine 
with mpich2 1.0 then 1.1, 1.2 etc</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "> >mpich2version</span></font></div><div><b><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 Version: </span></font></b><span class="Apple-tab-span" style="white-space: pre; "><b><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></b></span><b><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">1.0.8p1</span></font></b></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 Release date:</span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">Unknown, built on Tue Apr 21 13:52:10 CEST 2009</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 Device: </span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">ch3:sock</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 configure: </span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        
</span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">-prefix=/usr/local/mpich2</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 CC: </span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">gcc -O2</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 CXX: </span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">c++ -O2</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 F77: </span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">g77 -O2</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 F90: </span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">f95 -O2</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; 
"><br></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "> >mpicc -O2 -I $MPICH_HOME/include -L $MPICH_HOME/lib -o bin/basic_test basic_test.c</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "> >mpiexec -np 256 bin/basic_test</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">Running 256 tasks </span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "> >mpiexec -np 512 bin/basic_test</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">Running 512 tasks </span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "> >mpiexec -np 512 bin/basic_test</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">Running 512 tasks </span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><font class="Apple-style-span" size="4" style="font-size: 21px; "><span class="Apple-style-span" style="font-size: 
14px; "><div>With MPICH2 1.1 and beyond, I got an error with around 150 tasks</div><div>I probably omitted something when compiling those versions, but I don't know where to look</div><div><br></div><div><br></div></span></font></div></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 18px; "><div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "> >mpich2version </span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><b>MPICH2 Version: </b></span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><b>        </b></span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><b>1.1b1</b></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 Release date:</span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">Unknown, built on Fri Dec 16 15:30:19 CET 2011</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 Device: </span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">ch3:nemesis</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 configure: 
</span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">--prefix=//scratch/BC/mpich2-1.1</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 CC: </span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">/usr/bin/gcc -m64 -O2</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 CXX: </span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">c++ -m64 -O2</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 F77: </span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">/usr/bin/f77 -O2</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 F90: </span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font 
class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">f95 -O2</span></font></div></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "> >mpicc -O2 -I $MPICH_HOME/include -L $MPICH_HOME/lib -o bin/basic_test basic_test.c</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "> >mpiexec -np 100 bin/basic_test</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">Running 100 tasks </span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "> >mpiexec -np 120 bin/basic_test</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">Running 120 tasks </span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><b> >mpiexec -np 150 bin/basic_test</b></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><b>Assertion failed in file /scratch/BC/mpich2-1.1b1/src/util/wrappers/mpiu_shm_wrappers.h at line 919: seg_sz > 0</b></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><b>internal ABORT - process 0</b></span></font></div><div><font 
class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><b>rank 0 in job 26 ccwpge0001_56217 caused collective abort of all ranks</b></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><b> exit status of rank 0: return code 1 </b></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div></div></span></font></div><div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "> >mpich2version </span></font></div><div><b><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 Version: </span></font></b><span class="Apple-tab-span" style="white-space: pre; "><b><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></b></span><b><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">1.2.1</span></font></b></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 Release date:</span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">Unknown, built on Fri Dec 16 13:40:20 CET 2011</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 Device: </span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">  
      </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">ch3:nemesis</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 configure: </span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">--prefix=//scratch/BC/mpich2-1.2</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 CC: </span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">/usr/bin/gcc -m64 -O2</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 CXX: </span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">c++ -m64 -O2</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">MPICH2 F77: </span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">/usr/bin/f77 -O2</span></font></div><div><font class="Apple-style-span" size="4"><span 
class="Apple-style-span" style="font-size: 14px; ">MPICH2 F90: </span></font><span class="Apple-tab-span" style="white-space: pre; "><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">        </span></font></span><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">f95 -O2</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "> >mpicc -O2 -I $MPICH_HOME/include -L $MPICH_HOME/lib -o bin/basic_test basic_test.c</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "> >mpiexec -np 96 bin/basic_test</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">Running 96 tasks </span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "> >mpiexec -np 96 bin/basic_test</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">Running 96 tasks </span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "> >mpiexec -np 120 bin/basic_test</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">Running 120 tasks </span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "> >mpiexec -np 120 
bin/basic_test</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">Running 120 tasks </span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><b> >mpiexec -np 130 bin/basic_test</b></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><b>Assertion failed in file /scratch/BC/mpich2-1.2.1/src/util/wrappers/mpiu_shm_wrappers.h at line 923: seg_sz > 0</b></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><b>internal ABORT - process 0</b></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><b>rank 0 in job 16 ccwpge0001_56217 caused collective abort of all ranks</b></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><b> exit status of rank 0: return code 1 </b></span></font></div></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div></div></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">Best regards</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">PS :</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">the test code</span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; 
"><br></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><div>int basicTest(int argc, char** argv) {</div><div> if (MPI_Init(&argc, &argv) != MPI_SUCCESS ) {</div><div> printf("Error calling MPI_Init !!, exiting \n") ; fflush(stdout);</div><div> return(1);</div><div> }</div><div><br></div><div> int rank;</div><div> if ( MPI_Comm_rank(MPI_COMM_WORLD, &rank)!= MPI_SUCCESS ) {</div><div> printf("Error calling MPI_Comm_rank !!, exiting \n") ; fflush(stdout);</div><div> MPI_Abort(MPI_COMM_WORLD, 1);</div><div> return(1);</div><div> }</div><div> </div><div> if (rank == 0) {</div><div> int nprocs;</div><div> if (MPI_Comm_size(MPI_COMM_WORLD, &nprocs)!= MPI_SUCCESS ) {</div><div> printf("Error calling MPI_Comm_size !!, exiting \n") ; fflush(stdout);</div><div> MPI_Abort(MPI_COMM_WORLD, 1);</div><div> return(1);</div><div> }</div><div> </div><div> printf("Running %d tasks \n", nprocs) ; fflush(stdout);</div><div> MPI_Finalize(); </div><div> return(0); </div><div> } else {</div><div> sleep(1);</div><div> MPI_Finalize(); // Necessaire ssi <= mpich2-1.2</div><div> return(0);</div><div> }</div><div><br></div><div>}</div><div>/******************************/</div></span></font></div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; "><div>int main(int argc, char** argv) {</div><div> basicTest(argc, argv); </div><div>}</div><div><br></div></span></font></div><div><div><font class="Apple-style-span" size="4" style="font-size: 21px; "><span class="Apple-style-span" style="font-size: 14px; "><br></span></font></div></div><div>
<div><div><div><div><div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">---------------<br>Bernard CHAMBON<br>IN2P3 / CNRS<br>04 72 69 42 18<br></span></font></div></div></div></div></div><font class="Apple-style-span" size="4"><span class="Apple-style-span" style="font-size: 14px; ">
</span></font></div>
<br></div></body></html>