我在从一个进程发送列并由另一个进程接收的通信MPI_Send
方面存在问题。MPI_Recv
为了调试,我在下面向您展示了一个基本示例,其中我使用和初始化了一个 10x10 矩阵(x0
数组)。对于测试,我只是用 . 初始化 2D 数组值。x_domain = 4
y_domain = 4
x0[i][j] = i+j
您能否尝试编译并执行以下测试代码,它只是rank=2
从rank=0
nproc=4
#include <stdio.h>
#include <stdlib.h>
#include <math.h>
#include "mpi.h"
int main(int argc, char *argv[])
{
/* size of the discretization */
double** x;
double** x0;
int bonk1, bonk2;
int i,j,k,l;
int nproc;
int ndims;
int S=0, E=1, N=2, W=3;
int NeighBor[4];
int xcell, ycell, size_tot_x, size_tot_y;
int *xs,*ys,*xe,*ye;
int size_x = 4;
int size_y = 4;
int me;
int x_domains=2;
int y_domains=2;
int flag = 1;
MPI_Comm comm, comm2d;
int dims[2];
int periods[2];
int reorganisation = 0;
int row;
MPI_Datatype column_type;
MPI_Status status;
size_tot_x=size_x+2*x_domains+2;
size_tot_y=size_y+2*y_domains+2;
xcell=(size_x/x_domains);
ycell=(size_y/y_domains);
MPI_Init(&argc, &argv);
comm = MPI_COMM_WORLD;
MPI_Comm_size(comm,&nproc);
MPI_Comm_rank(comm,&me);
x = malloc(size_tot_y*sizeof(double*));
x0 = malloc(size_tot_y*sizeof(double*));
for(j=0;j<=size_tot_y-1;j++) {
x[j] = malloc(size_tot_x*sizeof(double));
x0[j] = malloc(size_tot_x*sizeof(double));
}
xs = malloc(nproc*sizeof(int));
xe = malloc(nproc*sizeof(int));
ys = malloc(nproc*sizeof(int));
ye = malloc(nproc*sizeof(int));
/* Create 2D cartesian grid */
periods[0] = 0;
periods[1] = 0;
ndims = 2;
dims[0]=x_domains;
dims[1]=y_domains;
MPI_Cart_create(comm, ndims, dims, periods, reorganisation, &comm2d);
/* Identify neighbors */
NeighBor[0] = MPI_PROC_NULL;
NeighBor[1] = MPI_PROC_NULL;
NeighBor[2] = MPI_PROC_NULL;
NeighBor[3] = MPI_PROC_NULL;
/* Left/West and right/Est neigbors */
MPI_Cart_shift(comm2d,0,1,&NeighBor[W],&NeighBor[E]);
/* Bottom/South and Upper/North neigbors */
MPI_Cart_shift(comm2d,1,1,&NeighBor[S],&NeighBor[N]);
/* coordinates of current cell with me rank */
xcell=(size_x/x_domains);
ycell=(size_y/y_domains);
ys[me]=(y_domains-me%(y_domains)-1)*(ycell+2)+2;
ye[me]=ys[me]+ycell-1;
for(i=0;i<=y_domains-1;i++)
{xs[i]=2;}
for(i=0;i<=y_domains-1;i++)
{xe[i]=xs[i]+xcell-1;}
for(i=1;i<=(x_domains-1);i++)
{ for(j=0;j<=(y_domains-1);j++)
{
xs[i*y_domains+j]=xs[(i-1)*y_domains+j]+xcell+2;
xe[i*y_domains+j]=xs[i*y_domains+j]+xcell-1;
}
}
for(i=0;i<=size_tot_y-1;i++)
{ for(j=0;j<=size_tot_x-1;j++)
{ x0[i][j]= i+j;
}
}
/* Create column data type to communicate with South and North neighbors */
MPI_Type_vector( ycell, 1, size_tot_x, MPI_DOUBLE, &column_type);
MPI_Type_commit(&column_type);
if(me==2) {
printf("Before Send - Process 2 subarray\n");
for(i=ys[me]-1;i<=ye[me]+1;i++)
{ for(j=xs[me]-1;j<=xe[me]+1;j++)
{ printf("%f ",x0[i][j]);
}
printf("\n");
}
printf("\n");
MPI_Send(&(x0[ys[2]][xs[2]]), 1, column_type, 0, flag, comm2d );
}
if(me==0) {
MPI_Recv(&(x0[ys[0]][xe[0]]), 1, column_type, 2, flag, comm2d , &status);
printf("After Receive - Process 0 subarray\n");
for(i=ys[me]-1;i<=ye[me]+1;i++)
{ for(j=xs[me]-1;j<=xe[me]+1;j++)
{ printf("%f ",x0[i][j]);
}
printf("\n");
}
printf("\n");
MPI_Get_count(&status,column_type,&bonk1);
MPI_Get_elements(&status,MPI_DOUBLE,&bonk2);
printf("got %d elements of type column_type\n",bonk1);
printf("which contained %d elements of type MPI_DOUBLE\n",bonk2);
printf("\n");
}
for(i=0;i<=size_tot_y-1;i++)
{
free(x[i]);
free(x0[i]);
}
free(x);
free(x0);
free(xs);
free(xe);
free(ys);
free(ye);
MPI_Finalize();
return 0;
}
xs[me]
和分别xe[me]
对应于x_start[me]
和x_end[me]
。rank = me
这对于ys[me]
和是一样的ye[me]
。
正如我在前一篇文章中所说,只有列的第一个值由 rank 进程接收0
。这是这个程序的输出:
Before Send - Process 2 subarray
10.000000 11.000000 12.000000 13.000000
11.000000 **12.000000** 13.000000 14.000000
12.000000 **13.000000** 14.000000 15.000000
13.000000 14.000000 15.000000 16.000000
After Receive - Process 0 subarray
6.000000 7.000000 8.000000 9.000000
7.000000 8.000000 **12.000000** 10.000000
8.000000 9.000000 **10.000000** 11.000000
9.000000 10.000000 11.000000 12.000000
got 1 elements of type column_type
which contained 2 elements of type MPI_DOUBLE
我得到12.00000
第一个元素,但对于第二个元素,我有10.00000
而不是13.00000
.
我定义column_type
为:
MPI_Type_vector( ycell, 1, size_tot_x, MPI_DOUBLE, &column_type);
MPI_Type_commit(&column_type);
size_tot_x
等于全局数组的总列数x0
。
任何帮助将非常感激。