git-svn-id: svn://svn.icms.temple.edu/lammps-ro/trunk@8954 f3b2605a-c512-4ea7-a41b-209d697bcdaa

sjplimp 2012-10-12 19:53:21 +00:00
parent 5b6ec31a14
commit 946ec565c2
3 changed files with 600 additions and 0 deletions

src/KSPACE/Install.sh

@@ -2,6 +2,7 @@
if (test $1 = 1) then
cp commgrid.cpp ..
cp ewald.cpp ..
cp ewald_disp.cpp ..
cp msm.cpp ..
@@ -30,6 +31,7 @@ if (test $1 = 1) then
cp remap.cpp ..
cp remap_wrap.cpp ..
cp commgrid.h ..
cp ewald.h ..
cp ewald_disp.h ..
cp msm.h ..
@@ -63,6 +65,7 @@ if (test $1 = 1) then
elif (test $1 = 0) then
rm -f ../commgrid.cpp
rm -f ../ewald.cpp
rm -f ../ewald_disp.cpp
rm -f ../msm.cpp
@@ -91,6 +94,7 @@ elif (test $1 = 0) then
rm -f ../remap.cpp
rm -f ../remap_wrap.cpp
rm -f ../commgrid.h
rm -f ../ewald.h
rm -f ../ewald_disp.h
rm -f ../msm.h

src/KSPACE/commgrid.cpp Normal file

@@ -0,0 +1,515 @@
/* ----------------------------------------------------------------------
LAMMPS - Large-scale Atomic/Molecular Massively Parallel Simulator
http://lammps.sandia.gov, Sandia National Laboratories
Steve Plimpton, sjplimp@sandia.gov
Copyright (2003) Sandia Corporation. Under the terms of Contract
DE-AC04-94AL85000 with Sandia Corporation, the U.S. Government retains
certain rights in this software. This software is distributed under
the GNU General Public License.
See the README file in the top-level LAMMPS directory.
------------------------------------------------------------------------- */
#include "mpi.h"
#include "commgrid.h"
#include "comm.h"
#include "kspace.h"
#include "memory.h"
#include "error.h"
using namespace LAMMPS_NS;
#define SWAPDELTA 8
/* ---------------------------------------------------------------------- */
CommGrid::CommGrid(LAMMPS *lmp, MPI_Comm gcomm, int forward, int reverse,
int ixlo, int ixhi, int iylo, int iyhi, int izlo, int izhi,
int oxlo, int oxhi, int oylo, int oyhi, int ozlo, int ozhi,
int pxlo, int pxhi, int pylo, int pyhi, int pzlo, int pzhi)
: Pointers(lmp)
{
me = comm->me;
gridcomm = gcomm;
nforward = forward;
nreverse = reverse;
inxlo = ixlo;
inxhi = ixhi;
inylo = iylo;
inyhi = iyhi;
inzlo = izlo;
inzhi = izhi;
outxlo = oxlo;
outxhi = oxhi;
outylo = oylo;
outyhi = oyhi;
outzlo = ozlo;
outzhi = ozhi;
procxlo = pxlo;
procxhi = pxhi;
procylo = pylo;
procyhi = pyhi;
proczlo = pzlo;
proczhi = pzhi;
nswap = 0;
swap = NULL;
buf1 = buf2 = NULL;
}
/* ---------------------------------------------------------------------- */
CommGrid::~CommGrid()
{
for (int i = 0; i < nswap; i++) {
memory->destroy(swap[i].packlist);
memory->destroy(swap[i].unpacklist);
}
memory->sfree(swap);
memory->destroy(buf1);
memory->destroy(buf2);
}
/* ----------------------------------------------------------------------
notify 6 neighbor procs how many ghost grid planes I need from them
ghostxlo = # of lower grid planes I own that are needed from me
by procxlo to become its upper ghost planes
ghostxhi = # of upper grid planes I own that are needed from me
by procxhi to become its lower ghost planes
if no neighbor proc, value is from self
------------------------------------------------------------------------- */
void CommGrid::ghost_notify()
{
int nplanes = inxlo - outxlo;
if (procxlo != me)
MPI_Sendrecv(&nplanes,1,MPI_INT,procxlo,0,
&ghostxhi,1,MPI_INT,procxhi,0,gridcomm,&status);
else ghostxhi = nplanes;
nplanes = outxhi - inxhi;
if (procxhi != me)
MPI_Sendrecv(&nplanes,1,MPI_INT,procxhi,0,
&ghostxlo,1,MPI_INT,procxlo,0,gridcomm,&status);
else ghostxlo = nplanes;
nplanes = inylo - outylo;
if (procylo != me)
MPI_Sendrecv(&nplanes,1,MPI_INT,procylo,0,
&ghostyhi,1,MPI_INT,procyhi,0,gridcomm,&status);
else ghostyhi = nplanes;
nplanes = outyhi - inyhi;
if (procyhi != me)
MPI_Sendrecv(&nplanes,1,MPI_INT,procyhi,0,
&ghostylo,1,MPI_INT,procylo,0,gridcomm,&status);
else ghostylo = nplanes;
nplanes = inzlo - outzlo;
if (proczlo != me)
MPI_Sendrecv(&nplanes,1,MPI_INT,proczlo,0,
&ghostzhi,1,MPI_INT,proczhi,0,gridcomm,&status);
else ghostzhi = nplanes;
nplanes = outzhi - inzhi;
if (proczhi != me)
MPI_Sendrecv(&nplanes,1,MPI_INT,proczhi,0,
&ghostzlo,1,MPI_INT,proczlo,0,gridcomm,&status);
else ghostzlo = nplanes;
}
/* ----------------------------------------------------------------------
check whether the ghost grid comm on every proc needs to overlap
into a non nearest-neighbor proc: if yes, return 1, else return 0
------------------------------------------------------------------------- */
int CommGrid::ghost_overlap()
{
int nearest = 0;
if (ghostxlo > inxhi-inxlo+1) nearest = 1;
if (ghostxhi > inxhi-inxlo+1) nearest = 1;
if (ghostylo > inyhi-inylo+1) nearest = 1;
if (ghostyhi > inyhi-inylo+1) nearest = 1;
if (ghostzlo > inzhi-inzlo+1) nearest = 1;
if (ghostzhi > inzhi-inzlo+1) nearest = 1;
int nearest_all;
MPI_Allreduce(&nearest,&nearest_all,1,MPI_INT,MPI_MIN,gridcomm);
return nearest_all;
}
/* ----------------------------------------------------------------------
create swap stencil for grid own/ghost communication
swaps cover all 3 dimensions and both directions
swaps cover multiple iterations in a direction if grid pts are needed
from further away than the nearest-neighbor proc
same swap list used by forward and reverse communication
------------------------------------------------------------------------- */
void CommGrid::setup()
{
int nsent,sendfirst,sendlast,recvfirst,recvlast;
int sendplanes,recvplanes;
int notdoneme,notdone;
int maxswap = 6;
swap = (Swap *) memory->smalloc(maxswap*sizeof(Swap),"Commgrid:swap");
nswap = 0;
// send own grid pts to -x processor, recv ghost grid pts from +x processor
nsent = 0;
sendfirst = inxlo;
sendlast = inxhi;
recvfirst = inxhi+1;
notdone = 1;
while (notdone) {
if (nswap == maxswap) {
maxswap += SWAPDELTA;
swap = (Swap *)
memory->srealloc(swap,maxswap*sizeof(Swap),"Commgrid:swap");
}
swap[nswap].sendproc = procxlo;
swap[nswap].recvproc = procxhi;
sendplanes = MIN(sendlast-sendfirst+1,ghostxlo-nsent);
swap[nswap].npack =
indices(swap[nswap].packlist,
sendfirst,sendfirst+sendplanes-1,inylo,inyhi,inzlo,inzhi);
if (procxlo != me)
MPI_Sendrecv(&sendplanes,1,MPI_INT,procxlo,0,
&recvplanes,1,MPI_INT,procxhi,0,gridcomm,&status);
else recvplanes = sendplanes;
swap[nswap].nunpack =
indices(swap[nswap].unpacklist,
recvfirst,recvfirst+recvplanes-1,inylo,inyhi,inzlo,inzhi);
nsent += sendplanes;
sendfirst += sendplanes;
sendlast += recvplanes;
recvfirst += recvplanes;
nswap++;
if (nsent < ghostxlo) notdoneme = 1;
else notdoneme = 0;
MPI_Allreduce(&notdoneme,&notdone,1,MPI_INT,MPI_SUM,gridcomm);
}
// send own grid pts to +x processor, recv ghost grid pts from -x processor
nsent = 0;
sendfirst = inxlo;
sendlast = inxhi;
recvlast = inxlo-1;
notdone = 1;
while (notdone) {
if (nswap == maxswap) {
maxswap += 1;
swap = (Swap *)
memory->srealloc(swap,maxswap*sizeof(Swap),"Commgrid:swap");
}
swap[nswap].sendproc = procxhi;
swap[nswap].recvproc = procxlo;
sendplanes = MIN(sendlast-sendfirst+1,ghostxhi-nsent);
swap[nswap].npack =
indices(swap[nswap].packlist,
sendlast-sendplanes+1,sendlast,inylo,inyhi,inzlo,inzhi);
if (procxhi != me)
MPI_Sendrecv(&sendplanes,1,MPI_INT,procxhi,0,
&recvplanes,1,MPI_INT,procxlo,0,gridcomm,&status);
else recvplanes = sendplanes;
swap[nswap].nunpack =
indices(swap[nswap].unpacklist,
recvlast-recvplanes+1,recvlast,inylo,inyhi,inzlo,inzhi);
nsent += sendplanes;
sendfirst -= recvplanes;
sendlast -= sendplanes;
recvlast -= recvplanes;
nswap++;
if (nsent < ghostxhi) notdoneme = 1;
else notdoneme = 0;
MPI_Allreduce(&notdoneme,&notdone,1,MPI_INT,MPI_SUM,gridcomm);
}
// send own grid pts to -y processor, recv ghost grid pts from +y processor
nsent = 0;
sendfirst = inylo;
sendlast = inyhi;
recvfirst = inyhi+1;
notdone = 1;
while (notdone) {
if (nswap == maxswap) {
maxswap += SWAPDELTA;
swap = (Swap *)
memory->srealloc(swap,maxswap*sizeof(Swap),"Commgrid:swap");
}
swap[nswap].sendproc = procylo;
swap[nswap].recvproc = procyhi;
sendplanes = MIN(sendlast-sendfirst+1,ghostylo-nsent);
swap[nswap].npack =
indices(swap[nswap].packlist,
outxlo,outxhi,sendfirst,sendfirst+sendplanes-1,inzlo,inzhi);
if (procylo != me)
MPI_Sendrecv(&sendplanes,1,MPI_INT,procylo,0,
&recvplanes,1,MPI_INT,procyhi,0,gridcomm,&status);
else recvplanes = sendplanes;
swap[nswap].nunpack =
indices(swap[nswap].unpacklist,
outxlo,outxhi,recvfirst,recvfirst+recvplanes-1,inzlo,inzhi);
nsent += sendplanes;
sendfirst += sendplanes;
sendlast += recvplanes;
recvfirst += recvplanes;
nswap++;
if (nsent < ghostylo) notdoneme = 1;
else notdoneme = 0;
MPI_Allreduce(&notdoneme,&notdone,1,MPI_INT,MPI_SUM,gridcomm);
}
// send own grid pts to +y processor, recv ghost grid pts from -y processor
nsent = 0;
sendfirst = inylo;
sendlast = inyhi;
recvlast = inylo-1;
notdone = 1;
while (notdone) {
if (nswap == maxswap) {
maxswap += 1;
swap = (Swap *)
memory->srealloc(swap,maxswap*sizeof(Swap),"Commgrid:swap");
}
swap[nswap].sendproc = procyhi;
swap[nswap].recvproc = procylo;
sendplanes = MIN(sendlast-sendfirst+1,ghostyhi-nsent);
swap[nswap].npack =
indices(swap[nswap].packlist,
outxlo,outxhi,sendlast-sendplanes+1,sendlast,inzlo,inzhi);
if (procyhi != me)
MPI_Sendrecv(&sendplanes,1,MPI_INT,procyhi,0,
&recvplanes,1,MPI_INT,procylo,0,gridcomm,&status);
else recvplanes = sendplanes;
swap[nswap].nunpack =
indices(swap[nswap].unpacklist,
outxlo,outxhi,recvlast-recvplanes+1,recvlast,inzlo,inzhi);
nsent += sendplanes;
sendfirst -= recvplanes;
sendlast -= sendplanes;
recvlast -= recvplanes;
nswap++;
if (nsent < ghostyhi) notdoneme = 1;
else notdoneme = 0;
MPI_Allreduce(&notdoneme,&notdone,1,MPI_INT,MPI_SUM,gridcomm);
}
// send own grid pts to -z processor, recv ghost grid pts from +z processor
nsent = 0;
sendfirst = inzlo;
sendlast = inzhi;
recvfirst = inzhi+1;
notdone = 1;
while (notdone) {
if (nswap == maxswap) {
maxswap += SWAPDELTA;
swap = (Swap *)
memory->srealloc(swap,maxswap*sizeof(Swap),"Commgrid:swap");
}
swap[nswap].sendproc = proczlo;
swap[nswap].recvproc = proczhi;
sendplanes = MIN(sendlast-sendfirst+1,ghostzlo-nsent);
swap[nswap].npack =
indices(swap[nswap].packlist,
outxlo,outxhi,outylo,outyhi,sendfirst,sendfirst+sendplanes-1);
if (proczlo != me)
MPI_Sendrecv(&sendplanes,1,MPI_INT,proczlo,0,
&recvplanes,1,MPI_INT,proczhi,0,gridcomm,&status);
else recvplanes = sendplanes;
swap[nswap].nunpack =
indices(swap[nswap].unpacklist,
outxlo,outxhi,outylo,outyhi,recvfirst,recvfirst+recvplanes-1);
nsent += sendplanes;
sendfirst += sendplanes;
sendlast += recvplanes;
recvfirst += recvplanes;
nswap++;
if (nsent < ghostzlo) notdoneme = 1;
else notdoneme = 0;
MPI_Allreduce(&notdoneme,&notdone,1,MPI_INT,MPI_SUM,gridcomm);
}
// send own grid pts to +z processor, recv ghost grid pts from -z processor
nsent = 0;
sendfirst = inzlo;
sendlast = inzhi;
recvlast = inzlo-1;
notdone = 1;
while (notdone) {
if (nswap == maxswap) {
maxswap += 1;
swap = (Swap *)
memory->srealloc(swap,maxswap*sizeof(Swap),"Commgrid:swap");
}
swap[nswap].sendproc = proczhi;
swap[nswap].recvproc = proczlo;
sendplanes = MIN(sendlast-sendfirst+1,ghostzhi-nsent);
swap[nswap].npack =
indices(swap[nswap].packlist,
outxlo,outxhi,outylo,outyhi,sendlast-sendplanes+1,sendlast);
if (proczhi != me)
MPI_Sendrecv(&sendplanes,1,MPI_INT,proczhi,0,
&recvplanes,1,MPI_INT,proczlo,0,gridcomm,&status);
else recvplanes = sendplanes;
swap[nswap].nunpack =
indices(swap[nswap].unpacklist,
outxlo,outxhi,outylo,outyhi,recvlast-recvplanes+1,recvlast);
nsent += sendplanes;
sendfirst -= recvplanes;
sendlast -= sendplanes;
recvlast -= recvplanes;
nswap++;
if (nsent < ghostzhi) notdoneme = 1;
else notdoneme = 0;
MPI_Allreduce(&notdoneme,&notdone,1,MPI_INT,MPI_SUM,gridcomm);
}
// nbuf = max of any forward/reverse pack/unpack
nbuf = 0;
for (int i = 0; i < nswap; i++) {
nbuf = MAX(nbuf,swap[i].npack);
nbuf = MAX(nbuf,swap[i].nunpack);
}
nbuf *= MAX(nforward,nreverse);
memory->create(buf1,nbuf,"Commgrid:buf1");
memory->create(buf2,nbuf,"Commgrid:buf2");
}
/* ----------------------------------------------------------------------
use swap list in forward order to acquire copy of all needed ghost grid pts
------------------------------------------------------------------------- */
void CommGrid::forward_comm(KSpace *kspace, int which)
{
int i,n;
for (int m = 0; m < nswap; m++) {
if (swap[m].sendproc == me)
kspace->pack_forward(which,buf2,swap[m].npack,swap[m].packlist);
else
kspace->pack_forward(which,buf1,swap[m].npack,swap[m].packlist);
if (swap[m].sendproc != me) {
MPI_Irecv(buf2,nforward*swap[m].nunpack,MPI_FFT_SCALAR,
swap[m].recvproc,0,gridcomm,&request);
MPI_Send(buf1,nforward*swap[m].npack,MPI_FFT_SCALAR,
swap[m].sendproc,0,gridcomm);
MPI_Wait(&request,&status);
}
kspace->unpack_forward(which,buf2,swap[m].nunpack,swap[m].unpacklist);
}
}
/* ----------------------------------------------------------------------
use swap list in reverse order to compute fully summed value
for each owned grid pt that some other proc has copy of as a ghost grid pt
------------------------------------------------------------------------- */
void CommGrid::reverse_comm(KSpace *kspace, int which)
{
int i,n;
for (int m = nswap-1; m >= 0; m--) {
if (swap[m].recvproc == me)
kspace->pack_reverse(which,buf2,swap[m].nunpack,swap[m].unpacklist);
else
kspace->pack_reverse(which,buf1,swap[m].nunpack,swap[m].unpacklist);
if (swap[m].recvproc != me) {
MPI_Irecv(buf2,nreverse*swap[m].npack,MPI_FFT_SCALAR,
swap[m].sendproc,0,gridcomm,&request);
MPI_Send(buf1,nreverse*swap[m].nunpack,MPI_FFT_SCALAR,
swap[m].recvproc,0,gridcomm);
MPI_Wait(&request,&status);
}
kspace->unpack_reverse(which,buf2,swap[m].npack,swap[m].packlist);
}
}
/* ----------------------------------------------------------------------
create 1d list of offsets into 3d array section (xlo:xhi,ylo:yhi,zlo:zhi)
assume 3d array is allocated as (outxlo:outxhi,outylo:outyhi,outzlo:outzhi)
------------------------------------------------------------------------- */
int CommGrid::indices(int *&list,
int xlo, int xhi, int ylo, int yhi, int zlo, int zhi)
{
int nmax = (xhi-xlo+1) * (yhi-ylo+1) * (zhi-zlo+1);
memory->create(list,nmax,"Commgrid:list");
int nx = (outxhi-outxlo+1);
int ny = (outyhi-outylo+1);
int n = 0;
int ix,iy,iz;
for (iz = zlo; iz <= zhi; iz++)
for (iy = ylo; iy <= yhi; iy++)
for (ix = xlo; ix <= xhi; ix++)
list[n++] = (iz-outzlo)*ny*nx + (iy-outylo)*nx + (ix-outxlo);
return nmax;
}
/* ----------------------------------------------------------------------
memory usage of send/recv bufs
------------------------------------------------------------------------- */
double CommGrid::memory_usage()
{
double bytes = 2*nbuf * sizeof(double);
return bytes;
}
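
CommGrid itself never touches grid values: forward_comm() and reverse_comm() above only move buffers and call back into the owning KSpace style, handing it the flat offset lists built by indices() (offset = (iz-outzlo)*ny*nx + (iy-outylo)*nx + (ix-outxlo) into the out-extended grid). Below is a hedged sketch, not code from this commit, of what those callbacks might look like on the style side; the struct and array names are made up, and it assumes nforward = nreverse = 1, i.e. one FFT_SCALAR per grid point per swap.

#ifdef FFT_SINGLE
typedef float FFT_SCALAR;            // mirrors the typedef in commgrid.h
#else
typedef double FFT_SCALAR;
#endif

// hypothetical holder of one flattened (outxlo:outxhi,outylo:outyhi,outzlo:outzhi)
// grid; a real style (PPPM, MSM, ...) keeps its own brick arrays and dispatches
// on the "which" flag instead of ignoring it
struct MyGrid {
  FFT_SCALAR *grid;

  void pack_forward(int /*which*/, FFT_SCALAR *buf, int nlist, int *list) {
    for (int i = 0; i < nlist; i++) buf[i] = grid[list[i]];    // owned pts -> buffer
  }
  void unpack_forward(int /*which*/, FFT_SCALAR *buf, int nlist, int *list) {
    for (int i = 0; i < nlist; i++) grid[list[i]] = buf[i];    // buffer -> ghost pts
  }
  void pack_reverse(int /*which*/, FFT_SCALAR *buf, int nlist, int *list) {
    for (int i = 0; i < nlist; i++) buf[i] = grid[list[i]];    // ghost pts -> buffer
  }
  void unpack_reverse(int /*which*/, FFT_SCALAR *buf, int nlist, int *list) {
    for (int i = 0; i < nlist; i++) grid[list[i]] += buf[i];   // sum into owned pts
  }
};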

src/KSPACE/commgrid.h Normal file

@@ -0,0 +1,81 @@
/* ----------------------------------------------------------------------
LAMMPS - Large-scale Atomic/Molecular Massively Parallel Simulator
http://lammps.sandia.gov, Sandia National Laboratories
Steve Plimpton, sjplimp@sandia.gov
Copyright (2003) Sandia Corporation. Under the terms of Contract
DE-AC04-94AL85000 with Sandia Corporation, the U.S. Government retains
certain rights in this software. This software is distributed under
the GNU General Public License.
See the README file in the top-level LAMMPS directory.
------------------------------------------------------------------------- */
#ifndef LMP_COMMGRID_H
#define LMP_COMMGRID_H
#include "pointers.h"
#ifdef FFT_SINGLE
typedef float FFT_SCALAR;
#define MPI_FFT_SCALAR MPI_FLOAT
#else
typedef double FFT_SCALAR;
#define MPI_FFT_SCALAR MPI_DOUBLE
#endif
namespace LAMMPS_NS {
class CommGrid : protected Pointers {
public:
CommGrid(class LAMMPS *, MPI_Comm, int, int,
int, int, int, int, int, int,
int, int, int, int, int, int,
int, int, int, int, int, int);
~CommGrid();
void ghost_notify();
int ghost_overlap();
void setup();
void forward_comm(class KSpace *, int);
void reverse_comm(class KSpace *, int);
double memory_usage();
private:
int me;
int nforward,nreverse;
MPI_Comm gridcomm;
MPI_Request request;
MPI_Status status;
// in = inclusive indices of 3d grid chunk that I own
// out = inclusive indices of 3d grid chunk I own plus ghosts I use
// proc = 6 neighbor procs that surround me
// ghost = # of my owned grid planes needed from me
// by each of 6 neighbor procs to become their ghost planes
int inxlo,inxhi,inylo,inyhi,inzlo,inzhi;
int outxlo,outxhi,outylo,outyhi,outzlo,outzhi;
int procxlo,procxhi,procylo,procyhi,proczlo,proczhi;
int ghostxlo,ghostxhi,ghostylo,ghostyhi,ghostzlo,ghostzhi;
int nbuf;
FFT_SCALAR *buf1,*buf2;
struct Swap {
int sendproc; // proc to send to for forward comm
int recvproc; // proc to recv from for forward comm
int npack; // # of datums to pack
int nunpack; // # of datums to unpack
int *packlist; // 3d array offsets to pack
int *unpacklist; // 3d array offsets to unpack
};
int nswap;
Swap *swap;
int indices(int *&, int, int, int, int, int, int);
};
}
#endif
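
A hedged usage sketch (assumptions, not code from this commit) of the call sequence a KSpace style might follow, based only on the public interface declared above; the array arguments and the flag value 0 are placeholders the caller must supply.

#include "mpi.h"
#include "lammps.h"
#include "kspace.h"
#include "commgrid.h"

using namespace LAMMPS_NS;

// in[6]   = inxlo,inxhi,inylo,inyhi,inzlo,inzhi               owned grid bounds
// out[6]  = outxlo,...,outzhi                                 owned + ghost bounds
// proc[6] = procxlo,procxhi,procylo,procyhi,proczlo,proczhi   neighbor proc ranks
void example_ghost_comm(LAMMPS *lmp, KSpace *kspace, MPI_Comm world,
                        const int in[6], const int out[6], const int proc[6])
{
  // nforward = nreverse = 1: one FFT_SCALAR per grid point in each direction
  CommGrid *cg = new CommGrid(lmp,world,1,1,
                              in[0],in[1],in[2],in[3],in[4],in[5],
                              out[0],out[1],out[2],out[3],out[4],out[5],
                              proc[0],proc[1],proc[2],proc[3],proc[4],proc[5]);

  cg->ghost_notify();            // tell the 6 neighbors how many ghost planes I need
  cg->ghost_overlap();           // query whether ghost comm extends past nearest neighbors
  cg->setup();                   // build the swap stencil, allocate buf1/buf2

  cg->forward_comm(kspace,0);    // owned values -> other procs' ghost points
  cg->reverse_comm(kspace,0);    // sum ghost contributions back into owned points
                                 // (0 is a placeholder "which" flag for the callbacks)
  delete cg;
}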