| 1 | //
 | 
|---|
| 2 | // messmpi.cc
 | 
|---|
| 3 | //
 | 
|---|
| 4 | // Copyright (C) 1996 Limit Point Systems, Inc.
 | 
|---|
| 5 | //
 | 
|---|
| 6 | // Author: Curtis Janssen <cljanss@limitpt.com>
 | 
|---|
| 7 | // Maintainer: LPS
 | 
|---|
| 8 | //
 | 
|---|
| 9 | // This file is part of the SC Toolkit.
 | 
|---|
| 10 | //
 | 
|---|
| 11 | // The SC Toolkit is free software; you can redistribute it and/or modify
 | 
|---|
| 12 | // it under the terms of the GNU Library General Public License as published by
 | 
|---|
| 13 | // the Free Software Foundation; either version 2, or (at your option)
 | 
|---|
| 14 | // any later version.
 | 
|---|
| 15 | //
 | 
|---|
| 16 | // The SC Toolkit is distributed in the hope that it will be useful,
 | 
|---|
| 17 | // but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
|---|
| 18 | // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
|---|
| 19 | // GNU Library General Public License for more details.
 | 
|---|
| 20 | //
 | 
|---|
| 21 | // You should have received a copy of the GNU Library General Public License
 | 
|---|
| 22 | // along with the SC Toolkit; see the file COPYING.LIB.  If not, write to
 | 
|---|
| 23 | // the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA.
 | 
|---|
| 24 | //
 | 
|---|
| 25 | // The U.S. Government is granted a limited license as per AL 91-7.
 | 
|---|
| 26 | //
 | 
|---|
| 27 | 
 | 
|---|
| 28 | #include <stdio.h> // for sprintf
 | 
|---|
| 29 | #include <unistd.h> // for fchdir etc.
 | 
|---|
| 30 | #include <fcntl.h> // for open on AIX
 | 
|---|
| 31 | 
 | 
|---|
| 32 | #define MPICH_SKIP_MPICXX
 | 
|---|
| 33 | #include <mpi.h>
 | 
|---|
| 34 | extern int MPI_Initialized(int *); // missing in mpi.h
 | 
|---|
| 35 | 
 | 
|---|
| 36 | #include <util/keyval/keyval.h>
 | 
|---|
| 37 | #include <util/group/messmpi.h>
 | 
|---|
| 38 | #include <util/misc/formio.h>
 | 
|---|
| 39 | #include <util/misc/newstring.h>
 | 
|---|
| 40 | 
 | 
|---|
| 41 | MPI_Comm global_commgrp;
 | 
|---|
| 42 | 
 | 
|---|
| 43 | using namespace std;
 | 
|---|
| 44 | using namespace sc;
 | 
|---|
| 45 | 
 | 
|---|
| 46 | // Define this to use immediate mode.  This was added to work
 | 
|---|
| 47 | // around bugs in non-immediate mode optimizations in an MPI impl.
 | 
|---|
| 48 | #undef USE_IMMEDIATE_MODE
 | 
|---|
| 49 | 
 | 
|---|
| 50 | // Set OP_COMMUTES to zero to work around a bug in MPI/Pro 1.5b5 and earlier
 | 
|---|
| 51 | #define OP_COMMUTES 1
 | 
|---|
| 52 | 
 | 
|---|
| 53 | ///////////////////////////////////////////////////////////////////////
 | 
|---|
| 54 | 
 | 
|---|
| 55 | int MPIMessageGrp::nmpi_grps=0;
 | 
|---|
| 56 | Ref<ThreadLock> MPIMessageGrp::grplock;
 | 
|---|
| 57 | 
 | 
|---|
| 58 | static
 | 
|---|
| 59 | void
 | 
|---|
| 60 | print_error_and_abort(int me, int mpierror)
 | 
|---|
| 61 | {
 | 
|---|
| 62 |   char msg[MPI_MAX_ERROR_STRING+1];
 | 
|---|
| 63 |   int size;
 | 
|---|
| 64 |   MPI_Error_string(mpierror, msg, &size);
 | 
|---|
| 65 |   msg[size] = '\0';
 | 
|---|
| 66 |   ExEnv::outn() << me << ": " << msg << endl;
 | 
|---|
| 67 |   ExEnv::outn().flush();
 | 
|---|
| 68 |   //MPI_Abort(MPI_COMM_WORLD, mpierror);
 | 
|---|
| 69 | }
 | 
|---|
| 70 | 
 | 
|---|
// Maps an MPI thread support level to the name of the corresponding MPI
// constant.  Levels that are not recognized yield "unknown"; when
// HAVE_MPI_INIT_THREAD is not defined every level is unrecognized.
static
const char *
mpi_thread_string(int level)
{
#ifdef HAVE_MPI_INIT_THREAD
  if (level == MPI_THREAD_SINGLE)     return "MPI_THREAD_SINGLE";
  if (level == MPI_THREAD_FUNNELED)   return "MPI_THREAD_FUNNELED";
  if (level == MPI_THREAD_SERIALIZED) return "MPI_THREAD_SERIALIZED";
  if (level == MPI_THREAD_MULTIPLE)   return "MPI_THREAD_MULTIPLE";
#endif
  (void) level; // silence unused-parameter diagnostics without thread support
  return "unknown";
}
 | 
|---|
| 90 | 
 | 
|---|
| 91 | ///////////////////////////////////////////////////////////////////////
 | 
|---|
| 92 | // The MPIMessageGrp class
 | 
|---|
| 93 | 
 | 
|---|
| 94 | static ClassDesc MPIMessageGrp_cd(
 | 
|---|
| 95 |   typeid(MPIMessageGrp),"MPIMessageGrp",1,"public MessageGrp",
 | 
|---|
| 96 |   create<MPIMessageGrp>, create<MPIMessageGrp>, 0);
 | 
|---|
| 97 | 
 | 
|---|
| 98 | MPIMessageGrp::MPIMessageGrp()
 | 
|---|
| 99 | {
 | 
|---|
| 100 |   init(MPI_COMM_WORLD);
 | 
|---|
| 101 | }
 | 
|---|
| 102 | 
 | 
|---|
| 103 | MPIMessageGrp::MPIMessageGrp(MPI_Comm comm)
 | 
|---|
| 104 | {
 | 
|---|
| 105 |   init(comm);
 | 
|---|
| 106 | }
 | 
|---|
| 107 | 
 | 
|---|
| 108 | MPIMessageGrp::MPIMessageGrp(int *argc, char ***argv)
 | 
|---|
| 109 | {
 | 
|---|
| 110 |   init(MPI_COMM_WORLD,argc,argv);
 | 
|---|
| 111 | }
 | 
|---|
| 112 | 
 | 
|---|
| 113 | MPIMessageGrp::MPIMessageGrp(const Ref<KeyVal>& keyval):
 | 
|---|
| 114 |   MessageGrp(keyval)
 | 
|---|
| 115 | {
 | 
|---|
| 116 |   if (keyval->exists("argv")) {
 | 
|---|
| 117 |       int argc = keyval->count("argv");
 | 
|---|
| 118 |       char **argv = new char*[argc+1];
 | 
|---|
| 119 |       argv[argc] = 0;
 | 
|---|
| 120 |       for (int arg=0; arg<argc; arg++) {
 | 
|---|
| 121 |           argv[arg] = keyval->pcharvalue("argv",arg);
 | 
|---|
| 122 |         }
 | 
|---|
| 123 |       init(MPI_COMM_WORLD, &argc, &argv);
 | 
|---|
| 124 |     }
 | 
|---|
| 125 |   else {
 | 
|---|
| 126 |       init(MPI_COMM_WORLD);
 | 
|---|
| 127 |     }
 | 
|---|
| 128 | 
 | 
|---|
| 129 |   if (keyval->booleanvalue("errors_return")) {
 | 
|---|
| 130 |       if (me()==0)
 | 
|---|
| 131 |           ExEnv::outn() << indent << "MPIMessageGrp: errors_return is true" << endl;
 | 
|---|
| 132 |       MPI_Comm_set_errhandler(commgrp, MPI_ERRORS_RETURN);
 | 
|---|
| 133 |     }
 | 
|---|
| 134 | 
 | 
|---|
| 135 |   if (debug_) {
 | 
|---|
| 136 |       ExEnv::outn() << indent << "MPIMessageGrp: KeyVal CTOR: done" << endl;
 | 
|---|
| 137 |     }
 | 
|---|
| 138 | }
 | 
|---|
| 139 | 
 | 
|---|
| 140 | void
 | 
|---|
| 141 | MPIMessageGrp::init(MPI_Comm comm, int *argc, char ***argv)
 | 
|---|
| 142 | {
 | 
|---|
| 143 |   int me, nproc;
 | 
|---|
| 144 | 
 | 
|---|
| 145 |   if (debug_) {
 | 
|---|
| 146 |       ExEnv::outn() << "MPIMessageGrp::init: entered" << endl;
 | 
|---|
| 147 |     }
 | 
|---|
| 148 | 
 | 
|---|
| 149 |   int flag;
 | 
|---|
| 150 |   MPI_Initialized(&flag);
 | 
|---|
| 151 |   if (!flag) {
 | 
|---|
| 152 |       int tmp_argc;
 | 
|---|
| 153 |       char **tmp_argv;
 | 
|---|
| 154 |       int *inits_argc;
 | 
|---|
| 155 |       char ***inits_argv;
 | 
|---|
| 156 |       if (argc && argv) {
 | 
|---|
| 157 |           inits_argc = argc;
 | 
|---|
| 158 |           inits_argv = argv;
 | 
|---|
| 159 |         }
 | 
|---|
| 160 |       else {
 | 
|---|
| 161 |           tmp_argc = 0;
 | 
|---|
| 162 |           tmp_argv = new char*[tmp_argc+1];
 | 
|---|
| 163 |           tmp_argv[tmp_argc] = 0;
 | 
|---|
| 164 |           inits_argc = &tmp_argc;
 | 
|---|
| 165 |           inits_argv = &tmp_argv;
 | 
|---|
| 166 |         }
 | 
|---|
| 167 |       // This dot business is to work around problems with some MPI
 | 
|---|
| 168 |       // implementations.
 | 
|---|
| 169 |       int dot = open(".",O_RDONLY);
 | 
|---|
| 170 |       if (debug_) {
 | 
|---|
| 171 |           ExEnv::outn() << indent
 | 
|---|
| 172 |                << "Calling MPI_Init with";
 | 
|---|
| 173 |           for (int i=0; i<*argc; i++) {
 | 
|---|
| 174 |               ExEnv::outn() << " " << *argv[i];
 | 
|---|
| 175 |             }
 | 
|---|
| 176 |           ExEnv::outn() << endl;
 | 
|---|
| 177 |         }
 | 
|---|
| 178 | #ifdef HAVE_MPI_INIT_THREAD
 | 
|---|
| 179 |       int provided, desired = SC_MPI_THREAD_LEVEL;
 | 
|---|
| 180 |       MPI_Init_thread(inits_argc, inits_argv, desired, &provided);
 | 
|---|
| 181 |       int me;
 | 
|---|
| 182 |       MPI_Comm_rank(MPI_COMM_WORLD, &me);
 | 
|---|
| 183 |       if (provided != desired && me == 0) {
 | 
|---|
| 184 |           ExEnv::outn() << indent
 | 
|---|
| 185 |                         << "WARNING: desired "
 | 
|---|
| 186 |                         << mpi_thread_string(desired)
 | 
|---|
| 187 |                         << " MPI threading support but got "
 | 
|---|
| 188 |                         << mpi_thread_string(provided)
 | 
|---|
| 189 |                         << endl;
 | 
|---|
| 190 |         }
 | 
|---|
| 191 | #else
 | 
|---|
| 192 |       MPI_Init(inits_argc, inits_argv);
 | 
|---|
| 193 | #endif
 | 
|---|
| 194 | #ifdef HAVE_FCHDIR
 | 
|---|
| 195 |       fchdir(dot);
 | 
|---|
| 196 | #endif
 | 
|---|
| 197 |       close(dot);
 | 
|---|
| 198 |     }
 | 
|---|
| 199 | 
 | 
|---|
| 200 |   MPI_Comm_dup(comm, &commgrp);
 | 
|---|
| 201 |   global_commgrp = commgrp;
 | 
|---|
| 202 | 
 | 
|---|
| 203 |   MPI_Comm_set_errhandler(commgrp, MPI_ERRORS_ARE_FATAL);
 | 
|---|
| 204 | 
 | 
|---|
| 205 |    if (!nmpi_grps) {
 | 
|---|
| 206 |       threadgrp = ThreadGrp::get_default_threadgrp();
 | 
|---|
| 207 |       grplock = threadgrp->new_lock();
 | 
|---|
| 208 |      }
 | 
|---|
| 209 |       grplock->lock();
 | 
|---|
| 210 |       nmpi_grps++;
 | 
|---|
| 211 |       grplock->unlock();
 | 
|---|
| 212 | 
 | 
|---|
| 213 |   MPI_Comm_rank(commgrp,&me);
 | 
|---|
| 214 |   MPI_Comm_size(commgrp, &nproc);
 | 
|---|
| 215 |   bufsize = 4000000;
 | 
|---|
| 216 |   buf = 0;
 | 
|---|
| 217 |   //buf = (void*) new char[bufsize];
 | 
|---|
| 218 |   //MPI_Buffer_attach(buf,bufsize);
 | 
|---|
| 219 | 
 | 
|---|
| 220 |   if (getenv("MPIMESSAGEGRP_MESSAGEGRP_COLLECTIVES"))
 | 
|---|
| 221 |       use_messagegrp_collectives_ = true;
 | 
|---|
| 222 |   else
 | 
|---|
| 223 |       use_messagegrp_collectives_ = false;
 | 
|---|
| 224 |   
 | 
|---|
| 225 |   initialize(me, nproc);
 | 
|---|
| 226 | 
 | 
|---|
| 227 |   //MPIL_Trace_on();
 | 
|---|
| 228 | 
 | 
|---|
| 229 |   if (debug_) {
 | 
|---|
| 230 |       ExEnv::outn() << me << ": MPIMessageGrp::init: done" << endl;
 | 
|---|
| 231 |     }
 | 
|---|
| 232 | 
 | 
|---|
| 233 |   SCFormIO::init_mp(me);
 | 
|---|
| 234 | }
 | 
|---|
| 235 | 
 | 
|---|
| 236 | MPIMessageGrp::~MPIMessageGrp()
 | 
|---|
| 237 | {
 | 
|---|
| 238 |   //MPIL_Trace_off();
 | 
|---|
| 239 |   //MPI_Buffer_detach(&buf, &bufsize);
 | 
|---|
| 240 |   delete[] (char*) buf;
 | 
|---|
| 241 | 
 | 
|---|
| 242 |   grplock->lock();
 | 
|---|
| 243 |   nmpi_grps--;
 | 
|---|
| 244 |   if (!nmpi_grps) MPI_Finalize();
 | 
|---|
| 245 |   grplock->unlock();
 | 
|---|
| 246 |   
 | 
|---|
| 247 | }
 | 
|---|
| 248 | 
 | 
|---|
| 249 | Ref<MessageGrp> MPIMessageGrp::clone(void)
 | 
|---|
| 250 | {
 | 
|---|
| 251 |   Ref<MessageGrp> mgrp = new MPIMessageGrp;
 | 
|---|
| 252 |   return mgrp;
 | 
|---|
| 253 | }
 | 
|---|
| 254 | 
 | 
|---|
| 255 | void
 | 
|---|
| 256 | MPIMessageGrp::raw_send(int target, const void* data, int nbyte)
 | 
|---|
| 257 | {
 | 
|---|
| 258 |   if (debug_) {
 | 
|---|
| 259 |       ExEnv::outn() << scprintf("%3d: MPI_Send"
 | 
|---|
| 260 |                        "(0x%08x, %5d, MPI_BYTE, %3d, 0, commgrp)",
 | 
|---|
| 261 |                        me(), data, nbyte, target)
 | 
|---|
| 262 |            << endl;
 | 
|---|
| 263 |     }
 | 
|---|
| 264 |   int ret;
 | 
|---|
| 265 | #ifndef USE_IMMEDIATE_MODE
 | 
|---|
| 266 |   ret = MPI_Send(const_cast<void*>(data),nbyte,MPI_BYTE,target,0,commgrp);
 | 
|---|
| 267 | #else
 | 
|---|
| 268 |   MPI_Request mpireq;
 | 
|---|
| 269 |   MPI_Status status;
 | 
|---|
| 270 |   ret = MPI_Isend(data,nbyte,MPI_BYTE,target,0,commgrp,&mpireq);
 | 
|---|
| 271 |   if (ret == MPI_SUCCESS) ret = MPI_Wait(&mpireq,&status);
 | 
|---|
| 272 | #endif // USE_IMMEDIATE_MODE
 | 
|---|
| 273 |   if (ret != MPI_SUCCESS) {
 | 
|---|
| 274 |       ExEnv::outn() << me() << ": MPIMessageGrp::raw_send("
 | 
|---|
| 275 |           << target << ",," << nbyte << "): mpi error:" << endl;
 | 
|---|
| 276 |       print_error_and_abort(me(), ret);
 | 
|---|
| 277 |     }
 | 
|---|
| 278 |   if (debug_) ExEnv::outn() << scprintf("%3d: sent\n", me()) << endl;
 | 
|---|
| 279 | }
 | 
|---|
| 280 | 
 | 
|---|
| 281 | void
 | 
|---|
| 282 | MPIMessageGrp::raw_recv(int sender, void* data, int nbyte)
 | 
|---|
| 283 | {
 | 
|---|
| 284 |   MPI_Status status;
 | 
|---|
| 285 |   if (sender == -1) sender = MPI_ANY_SOURCE;
 | 
|---|
| 286 |   if (debug_) {
 | 
|---|
| 287 |       ExEnv::outn() << scprintf("%3d: MPI_Recv"
 | 
|---|
| 288 |                        "(0x%08x, %5d, MPI_BYTE, %3d, 0, commgrp,)",
 | 
|---|
| 289 |                        me(), data, nbyte, sender)
 | 
|---|
| 290 |            << endl;
 | 
|---|
| 291 |     }
 | 
|---|
| 292 |   int ret;
 | 
|---|
| 293 | #ifndef USE_IMMEDIATE_MODE
 | 
|---|
| 294 |   ret = MPI_Recv(data,nbyte,MPI_BYTE,sender,0,commgrp,&status);
 | 
|---|
| 295 | #else
 | 
|---|
| 296 |   MPI_Request mpireq;
 | 
|---|
| 297 |   ret = MPI_Irecv(data,nbyte,MPI_BYTE,sender,0,commgrp,&mpireq);
 | 
|---|
| 298 |   if (ret == MPI_SUCCESS) ret = MPI_Wait(&mpireq,&status);
 | 
|---|
| 299 | #endif // USE_IMMEDIATE_MODE
 | 
|---|
| 300 |   if (ret != MPI_SUCCESS) {
 | 
|---|
| 301 |       ExEnv::outn() << me() << ": MPIMessageGrp::raw_recv("
 | 
|---|
| 302 |           << sender << ",," << nbyte << "): mpi error:" << endl;
 | 
|---|
| 303 |       print_error_and_abort(me(), ret);
 | 
|---|
| 304 |     }
 | 
|---|
| 305 |   rnode = status.MPI_SOURCE;
 | 
|---|
| 306 |   rtag = status.MPI_TAG;
 | 
|---|
| 307 |   rlen = nbyte;
 | 
|---|
| 308 |   if (debug_) ExEnv::outn() << scprintf("%3d: recvd %d bytes\n", me(), rlen) << endl;
 | 
|---|
| 309 | }
 | 
|---|
| 310 | 
 | 
|---|
| 311 | void
 | 
|---|
| 312 | MPIMessageGrp::raw_sendt(int target, int type, const void* data, int nbyte)
 | 
|---|
| 313 | {
 | 
|---|
| 314 |   type = (type<<1) + 1;
 | 
|---|
| 315 |   if (debug_) {
 | 
|---|
| 316 |       ExEnv::outn() << scprintf("%3d: MPI_Send"
 | 
|---|
| 317 |                        "(0x%08x, %5d, MPI_BYTE, %3d, %5d, commgrp)",
 | 
|---|
| 318 |                        me(), data, nbyte, target, type)
 | 
|---|
| 319 |            << endl;
 | 
|---|
| 320 |     }
 | 
|---|
| 321 |   int ret;
 | 
|---|
| 322 | #ifndef USE_IMMEDIATE_MODE
 | 
|---|
| 323 |   ret = MPI_Send(const_cast<void*>(data),nbyte,MPI_BYTE,target,type,commgrp);
 | 
|---|
| 324 | #else
 | 
|---|
| 325 |   MPI_Request mpireq;
 | 
|---|
| 326 |   MPI_Status status;
 | 
|---|
| 327 |   ret = MPI_Isend(data,nbyte,MPI_BYTE,target,type,commgrp,&mpireq);
 | 
|---|
| 328 |   if (ret == MPI_SUCCESS) ret = MPI_Wait(&mpireq,&status);
 | 
|---|
| 329 | #endif
 | 
|---|
| 330 |   if (ret != MPI_SUCCESS) {
 | 
|---|
| 331 |       ExEnv::outn() << me() << ": MPIMessageGrp::raw_sendt("
 | 
|---|
| 332 |           << target << "," << type << ",," << nbyte << "): mpi error:" << endl;
 | 
|---|
| 333 |       print_error_and_abort(me(), ret);
 | 
|---|
| 334 |     }
 | 
|---|
| 335 |   if (debug_) ExEnv::outn() << scprintf("%3d: sent\n", me()) << endl;
 | 
|---|
| 336 | }
 | 
|---|
| 337 | 
 | 
|---|
| 338 | void
 | 
|---|
| 339 | MPIMessageGrp::raw_recvt(int type, void* data, int nbyte)
 | 
|---|
| 340 | {
 | 
|---|
| 341 |   MPI_Status status;
 | 
|---|
| 342 |   if (type == -1) type = MPI_ANY_TAG;
 | 
|---|
| 343 |   else type = (type<<1) + 1;
 | 
|---|
| 344 |   if (debug_) {
 | 
|---|
| 345 |       ExEnv::outn() << scprintf("%3d: MPI_Recv(0x%08x, %5d, MPI_BYTE, "
 | 
|---|
| 346 |                        "MPI_ANY_SOURCE, %5d, commgrp,)",
 | 
|---|
| 347 |                        me(), data, nbyte, type)
 | 
|---|
| 348 |            << endl;
 | 
|---|
| 349 |     }
 | 
|---|
| 350 |   int ret;
 | 
|---|
| 351 | #ifndef USE_IMMEDIATE_MODE
 | 
|---|
| 352 |   ret = MPI_Recv(data,nbyte,MPI_BYTE,MPI_ANY_SOURCE,type,commgrp,&status);
 | 
|---|
| 353 | #else
 | 
|---|
| 354 |   MPI_Request mpireq;
 | 
|---|
| 355 |   ret = MPI_Irecv(data,nbyte,MPI_BYTE,MPI_ANY_SOURCE,type,commgrp,&mpireq);
 | 
|---|
| 356 |   if (ret == MPI_SUCCESS) ret = MPI_Wait(&mpireq,&status);
 | 
|---|
| 357 | #endif // USE_IMMEDIATE_MODE
 | 
|---|
| 358 |   if (ret != MPI_SUCCESS) {
 | 
|---|
| 359 |       ExEnv::outn() << me() << ": MPIMessageGrp::raw_recvt("
 | 
|---|
| 360 |           << type << ",," << nbyte << "): mpi error:" << endl;
 | 
|---|
| 361 |       print_error_and_abort(me(), ret);
 | 
|---|
| 362 |     }
 | 
|---|
| 363 |   rnode = status.MPI_SOURCE;
 | 
|---|
| 364 |   rtag = status.MPI_TAG;
 | 
|---|
| 365 |   rlen = nbyte;
 | 
|---|
| 366 |   if (debug_) {
 | 
|---|
| 367 |       ExEnv::outn() << scprintf("%3d: recvd %d bytes from %d with tag %d\n",
 | 
|---|
| 368 |                        me(), rlen, rnode, rtag) << endl;
 | 
|---|
| 369 |     }
 | 
|---|
| 370 | }
 | 
|---|
| 371 | 
 | 
|---|
| 372 | int
 | 
|---|
| 373 | MPIMessageGrp::probet(int type)
 | 
|---|
| 374 | {
 | 
|---|
| 375 |   int flag;
 | 
|---|
| 376 |   MPI_Status status;
 | 
|---|
| 377 | 
 | 
|---|
| 378 |   if (type == -1) type = MPI_ANY_TAG;
 | 
|---|
| 379 |   else type = (type<<1) + 1;
 | 
|---|
| 380 |   int ret;
 | 
|---|
| 381 |   if (debug_) {
 | 
|---|
| 382 |       ExEnv::outn() << scprintf("%3d: MPI_Iprobe(MPI_ANY_SOURCE, %5d, commgrp, "
 | 
|---|
| 383 |                        "&flag, &status)", me(), type)
 | 
|---|
| 384 |            << endl;
 | 
|---|
| 385 |     }
 | 
|---|
| 386 |   if ((ret = MPI_Iprobe(MPI_ANY_SOURCE,type,commgrp,&flag,&status))
 | 
|---|
| 387 |       != MPI_SUCCESS ) {
 | 
|---|
| 388 |       ExEnv::outn() << me() << ": MPIMessageGrp::probet("
 | 
|---|
| 389 |           << type << "): mpi error:" << endl;
 | 
|---|
| 390 |       print_error_and_abort(me(), ret);
 | 
|---|
| 391 |     }
 | 
|---|
| 392 |   if (flag) {
 | 
|---|
| 393 |     rnode = status.MPI_SOURCE;
 | 
|---|
| 394 |     rtag = status.MPI_TAG;
 | 
|---|
| 395 |     MPI_Get_count(&status, MPI_BYTE, &rlen);
 | 
|---|
| 396 |     return 1;
 | 
|---|
| 397 |     }
 | 
|---|
| 398 |   else {
 | 
|---|
| 399 |     rnode = rtag = rlen = 0;
 | 
|---|
| 400 |     }
 | 
|---|
| 401 |     
 | 
|---|
| 402 |   return 0;
 | 
|---|
| 403 | }
 | 
|---|
| 404 | 
 | 
|---|
| 405 | void
 | 
|---|
| 406 | MPIMessageGrp::sync()
 | 
|---|
| 407 | {
 | 
|---|
| 408 |   int ret;
 | 
|---|
| 409 |   if (debug_) {
 | 
|---|
| 410 |       ExEnv::outn() << scprintf("%3d: MPI_Barrier(commgrp)", me()) << endl;
 | 
|---|
| 411 |     }
 | 
|---|
| 412 |   if ((ret = MPI_Barrier(commgrp)) != MPI_SUCCESS) {
 | 
|---|
| 413 |       ExEnv::outn() << me() << ": MPIMessageGrp::sync(): mpi error:" << endl;
 | 
|---|
| 414 |       print_error_and_abort(me(), ret);
 | 
|---|
| 415 |     }
 | 
|---|
| 416 | }
 | 
|---|
| 417 | 
 | 
|---|
// REDUCEMEMBER(name, type, mpitype) generates, for one element type:
//   - a file-static pointer  <name>reduceobject  to the active GrpReduce,
//   - an extern "C" callback <name>reduce  that MPI invokes as the user
//     defined reduction operation and that forwards to that object,
//   - MPIMessageGrp::reduce(type*, int, GrpReduce<type>&, type*, int).
//
// The generated reduce() combines the n elements of d over all processes.
// With target == -1 every process receives the result (MPI_Allreduce);
// otherwise only rank target does (MPI_Reduce).  The result is gathered in
// scratch, or in a temporary array when scratch is null, and copied back
// into d on the processes that receive it.  If the MessageGrp collectives
// were selected, the call is forwarded to MessageGrp::reduce instead.
//
// NOTE(review): the reduction object is passed to the callback through a
// file-static pointer, so concurrent reduce() calls for the same type from
// several threads would interfere with each other -- confirm callers.
//
// The debug output prints buffer addresses with %p and the datatype by
// name: handing pointers (and, on some MPI implementations, pointer-typed
// MPI_Datatype handles) to "%x"/"%d" is a varargs type mismatch.
// Only block comments may be used inside the macro body, since a line
// comment would swallow the continuation lines that follow it.
#define REDUCEMEMBER(name, type, mpitype) \
static GrpReduce<type>* name ## reduceobject; \
extern "C" void \
name ## reduce(void*b, void*a, int*len, MPI_Datatype*datatype) \
{ \
  name ## reduceobject->reduce((type*)a, (type*)b, *len); \
} \
void \
MPIMessageGrp::reduce(type*d, int n, GrpReduce<type>&r, \
                      type*scratch, int target) \
{ \
  if (use_messagegrp_collectives_) { \
      MessageGrp::reduce(d,n,r,scratch,target); \
      return; \
    } \
 \
  name ## reduceobject = &r; \
 \
  MPI_Op op; \
  MPI_Op_create(name ## reduce, OP_COMMUTES, &op); \
 \
  type *work; \
  if (!scratch) work = new type[n]; \
  else work = scratch; \
 \
  int ret; \
 \
  if (target == -1) { \
      if (debug_) { \
          ExEnv::outn() << scprintf("%3d: MPI_Allreduce" \
          "(%p, %p, %5d, %s, op, commgrp)", \
          me(), (void*)d, (void*)work, n, #mpitype) \
               << endl; \
        } \
      ret = MPI_Allreduce(d, work, n, mpitype, op, commgrp); \
      if (debug_) \
        ExEnv::outn() << scprintf("%3d: done with Allreduce", me()) << endl; \
    } \
  else { \
      if (debug_) { \
          ExEnv::outn() << scprintf("%3d: MPI_Reduce" \
          "(%p, %p, %5d, %s, op, %3d, commgrp)", \
          me(), (void*)d, (void*)work, n, #mpitype, target) \
               << endl; \
        } \
      ret = MPI_Reduce(d, work, n, mpitype, op, target, commgrp); \
      if (debug_) \
        ExEnv::outn() << scprintf("%3d: done with Reduce", me()) << endl; \
    } \
 \
  if (ret != MPI_SUCCESS) { \
      ExEnv::outn() << me() << ": MPIMessageGrp::reduce(," \
          << n << ",,," << target << "): mpi error:" << endl; \
      print_error_and_abort(me(), ret); \
    } \
 \
  if (target == -1 || target == me()) { \
     for (int i=0; i<n; i++) d[i] = work[i]; \
    } \
 \
  MPI_Op_free(&op); \
 \
  if (!scratch) delete[] work; \
}
 | 
|---|
| 482 | 
 | 
|---|
| 483 | REDUCEMEMBER(double, double, MPI_DOUBLE)
 | 
|---|
| 484 | REDUCEMEMBER(float, float, MPI_FLOAT)
 | 
|---|
| 485 | REDUCEMEMBER(uint, unsigned int, MPI_INT)
 | 
|---|
| 486 | REDUCEMEMBER(int, int, MPI_INT)
 | 
|---|
| 487 | REDUCEMEMBER(short, short, MPI_SHORT)
 | 
|---|
| 488 | REDUCEMEMBER(long, long, MPI_LONG)
 | 
|---|
| 489 | REDUCEMEMBER(char, char, MPI_CHAR)
 | 
|---|
| 490 | REDUCEMEMBER(uchar, unsigned char, MPI_UNSIGNED_CHAR)
 | 
|---|
| 491 | #ifdef MPI_SIGNED_CHAR
 | 
|---|
| 492 | REDUCEMEMBER(schar, signed char, MPI_SIGNED_CHAR)
 | 
|---|
| 493 | #else
 | 
|---|
| 494 | void
 | 
|---|
| 495 | MPIMessageGrp::reduce(signed char* d, int n, GrpReduce<signed char>& r,
 | 
|---|
| 496 |                       signed char*scratch, int target)
 | 
|---|
| 497 | {
 | 
|---|
| 498 |   MessageGrp::reduce(d,n,r,scratch,target);
 | 
|---|
| 499 | }
 | 
|---|
| 500 | #endif
 | 
|---|
| 501 | 
 | 
|---|
| 502 | #define SUMMEMBER(name, type, mpitype) \
 | 
|---|
| 503 | void \
 | 
|---|
| 504 | MPIMessageGrp::sum(type*d, int n, type*scratch, int target) \
 | 
|---|
| 505 | { \
 | 
|---|
| 506 |   if (use_messagegrp_collectives_) { \
 | 
|---|
| 507 |       MessageGrp::sum(d,n,scratch,target); \
 | 
|---|
| 508 |       return; \
 | 
|---|
| 509 |     } \
 | 
|---|
| 510 |  \
 | 
|---|
| 511 |   type *work; \
 | 
|---|
| 512 |   if (!scratch) work = new type[n]; \
 | 
|---|
| 513 |   else work = scratch; \
 | 
|---|
| 514 |  \
 | 
|---|
| 515 |   int ret; \
 | 
|---|
| 516 |  \
 | 
|---|
| 517 |   if (target == -1) { \
 | 
|---|
| 518 |       if (debug_) { \
 | 
|---|
| 519 |           ExEnv::outn() << scprintf("%3d: MPI_Allreduce" \
 | 
|---|
| 520 |           "(0x%08x, 0x%08x, %5d, %3d, MPI_SUM, commgrp)", \
 | 
|---|
| 521 |           me(), d, work, n, mpitype) \
 | 
|---|
| 522 |                << endl; \
 | 
|---|
| 523 |         } \
 | 
|---|
| 524 |       ret = MPI_Allreduce(d, work, n, mpitype, MPI_SUM, commgrp); \
 | 
|---|
| 525 |       if (debug_) \
 | 
|---|
| 526 |         ExEnv::outn() << scprintf("%3d: done with Allreduce", me()) << endl; \
 | 
|---|
| 527 |     } \
 | 
|---|
| 528 |   else { \
 | 
|---|
| 529 |       if (debug_) { \
 | 
|---|
| 530 |           ExEnv::outn() << scprintf("%3d: MPI_Reduce" \
 | 
|---|
| 531 |           "(0x%08x, 0x%08x, %5d, %3d, MPI_SUM, %3d, commgrp)", \
 | 
|---|
| 532 |           me(), d, work, n, mpitype, target) \
 | 
|---|
| 533 |                << endl; \
 | 
|---|
| 534 |         } \
 | 
|---|
| 535 |       ret = MPI_Reduce(d, work, n, mpitype, MPI_SUM, target, commgrp); \
 | 
|---|
| 536 |       if (debug_) \
 | 
|---|
| 537 |         ExEnv::outn() << scprintf("%3d: done with Reduce", me()) << endl; \
 | 
|---|
| 538 |     } \
 | 
|---|
| 539 |  \
 | 
|---|
| 540 |   if (ret != MPI_SUCCESS) { \
 | 
|---|
| 541 |       ExEnv::outn() << me() << ": MPIMessageGrp::sum(," \
 | 
|---|
| 542 |           << n << ",,," << target << "): mpi error:" << endl; \
 | 
|---|
| 543 |       print_error_and_abort(me(), ret); \
 | 
|---|
| 544 |     } \
 | 
|---|
| 545 |  \
 | 
|---|
| 546 |   if (target == -1 || target == me()) { \
 | 
|---|
| 547 |      for (int i=0; i<n; i++) d[i] = work[i]; \
 | 
|---|
| 548 |     } \
 | 
|---|
| 549 |  \
 | 
|---|
| 550 |   if (!scratch) delete[] work; \
 | 
|---|
| 551 | }
 | 
|---|
| 552 | SUMMEMBER(double, double, MPI_DOUBLE)
 | 
|---|
| 553 | SUMMEMBER(int, int, MPI_INT)
 | 
|---|
| 554 | 
 | 
|---|
| 555 | void
 | 
|---|
| 556 | MPIMessageGrp::raw_bcast(void* data, int nbyte, int from)
 | 
|---|
| 557 | {
 | 
|---|
| 558 |   if (n() == 1) return;
 | 
|---|
| 559 | 
 | 
|---|
| 560 |   if (use_messagegrp_collectives_) {
 | 
|---|
| 561 |       MessageGrp::raw_bcast(data,nbyte,from);
 | 
|---|
| 562 |       return;
 | 
|---|
| 563 |     }
 | 
|---|
| 564 | 
 | 
|---|
| 565 |   if (debug_) {
 | 
|---|
| 566 |       ExEnv::outn() << scprintf("%3d: MPI_Bcast("
 | 
|---|
| 567 |                        "0x%08x, %5d, MPI_BYTE, %3d, commgrp)",
 | 
|---|
| 568 |                        me(), data, nbyte, from)
 | 
|---|
| 569 |            << endl;
 | 
|---|
| 570 |     }
 | 
|---|
| 571 |   int ret;
 | 
|---|
| 572 |   if ((ret = MPI_Bcast(data, nbyte, MPI_BYTE, from, commgrp))
 | 
|---|
| 573 |       != MPI_SUCCESS) {
 | 
|---|
| 574 |       ExEnv::outn() << me() << ": MPIMessageGrp::raw_bcast(,"
 | 
|---|
| 575 |           << nbyte << "," << from << "): mpi error:" << endl;
 | 
|---|
| 576 |       print_error_and_abort(me(), ret);
 | 
|---|
| 577 |     }
 | 
|---|
| 578 |   if (debug_) {
 | 
|---|
| 579 |       ExEnv::outn() << scprintf("%3d: done with bcast", me()) << endl;
 | 
|---|
| 580 |     }
 | 
|---|
| 581 | }
 | 
|---|
| 582 | 
 | 
|---|
| 583 | /////////////////////////////////////////////////////////////////////////////
 | 
|---|
| 584 | 
 | 
|---|
| 585 | // Local Variables:
 | 
|---|
| 586 | // mode: c++
 | 
|---|
| 587 | // c-file-style: "CLJ"
 | 
|---|
| 588 | // End:
 | 
|---|