Fix issue #100: get_val with HAVE_MPI (#112)

thchr · web-flow · commit 692b5e2a3ff6 · 2020-02-13T22:06:21.000-05:00
* Make get_val(...) work under HAVE_MPI

* Exclude vscode-specific setting files from git

* Move mpi_allreduce_1 calls from get_val to interp_val
diff --git a/.gitignore b/.gitignore
@@ -67,6 +67,9 @@ mpb/mpbi_mpi
 src/mpbi_mpi.h
 mpb/mu.c
 
+# local editor settings
+.vscode
+
 # test output:
 check-epsilon.h5
 check-mu.h5
diff --git a/mpb/fields.c b/mpb/fields.c
@@ -547,6 +547,10 @@ void fix_field_phase(void)
 /* Functions to return epsilon, fields, energies, etcetera, at a specified
    point, linearly interpolating if necessary. */
 
+/* get_val returns process-specific output for HAVE_MPI: if the "point" (ix, iy, iz; stride)
+   is on the local process, the value of data at that point is returned returned; otherwise
+   (i.e. point is not on local process) 0.0 is returned: calls to get_val should therefore 
+   be followed by sum-reduction via mpi_allreduce_1(..) in the caller (as in interp_val) */
 static real get_val(int ix, int iy, int iz,
 		    int nx, int ny, int nz, int last_dim_size,
 		    real *data, int stride, int conjugate)
@@ -569,20 +573,33 @@ static real get_val(int ix, int iy, int iz,
 #endif
 
 #ifdef HAVE_MPI
-     CHECK(0, "get-*-point not yet implemented for MPI!");
-#else
-     if (conjugate)
-	  return -data[(((ix * ny) + iy) * nz + iz) * stride];
-     else
-	  return data[(((ix * ny) + iy) * nz + iz) * stride];
+	 /* due to real-space xy=>yx transposition in MPI configuration, we need to
+	    do a little extra work here; see details e.g. in XYZ_LOOP macro */
+     int local_ny = mdata->local_ny; /* dim of local process over y-indices */
+     int local_y_start = mdata->local_y_start;
+     int local_iy = iy - local_y_start;
+	 real val = 0; /* reduce local processes over this variable later */
+
+	 /* check if local_iy is in the current process' data block */
+     if (local_iy >= 0 && local_iy < local_ny) { 
+         val = data[(((local_iy * nx) + ix) * nz + iz) * stride]; /* note transposition in x and y indices */
+	 }
+
+#else /* no MPI */
+	real val = data[(((ix * ny) + iy) * nz + iz) * stride];
 #endif
+
+if (conjugate)
+	return -val;
+else
+	return val;
 }
 
 static real interp_val(vector3 p, int nx, int ny, int nz, int last_dim_size,
 		       real *data, int stride, int conjugate)
 {
      double ipart;
-     real rx, ry, rz, dx, dy, dz;
+     real rx, ry, rz, dx, dy, dz, v;
      int x, y, z, x2, y2, z2;
 
      rx = modf(p.x/geometry_lattice.size.x + 0.5, &ipart); if (rx < 0) rx += 1;
@@ -611,10 +628,13 @@ static real interp_val(vector3 p, int nx, int ny, int nz, int last_dim_size,
 
 #define D(x,y,z) (get_val(x,y,z,nx,ny,nz,last_dim_size, data,stride,conjugate))
 
-     return(((D(x,y,z)*(1.0-dx) + D(x2,y,z)*dx) * (1.0-dy) +
-             (D(x,y2,z)*(1.0-dx) + D(x2,y2,z)*dx) * dy) * (1.0-dz) +
-            ((D(x,y,z2)*(1.0-dx) + D(x2,y,z2)*dx) * (1.0-dy) +
-             (D(x,y2,z2)*(1.0-dx) + D(x2,y2,z2)*dx) * dy) * dz);
+     v = (((D(x,y,z)   * (1.0-dx) + D(x2,y,z)   * dx) * (1.0-dy) +
+           (D(x,y2,z)  * (1.0-dx) + D(x2,y2,z)  * dx) * dy         ) * (1.0-dz) +
+          ((D(x,y,z2)  * (1.0-dx) + D(x2,y,z2)  * dx) * (1.0-dy) +
+           (D(x,y2,z2) * (1.0-dx) + D(x2,y2,z2) * dx) * dy         ) * dz);
+
+     mpi_allreduce_1(&v, real, SCALAR_MPI_TYPE, MPI_SUM, mpb_comm);
+     return v;
 
 #undef D
 }