xref: /petsc/src/mat/impls/aij/mpi/mpb_aij.c (revision 5d22bc9f7f1d7cba2bb2e4593dec7d4798362bd6)
196c04dfeSSatish Balay #include "../src/mat/impls/aij/mpi/mpiaij.h"
296c04dfeSSatish Balay 
/*

  This routine creates multiple [bjacobi] 'parallel submatrices' from
  a given 'mat' object. Each submatrix can span multiple procs.

  The submatrix partition across processors is dictated by 'subComm', a
  communicator obtained by comm_split(comm). Note: the comm_split
  is not restricted to be grouped with consecutive original ranks.

  Due to the comm_split() usage, the parallel layout of the submatrices
  maps directly to the layout of the original matrix [wrt the local
  row,col partitioning]. So the original 'DiagonalMat' naturally maps
  into the 'DiagonalMat' of the subMat, hence it is used directly from
  the subMat. However the offDiagMat loses some columns - and this is
  reconstructed with MatSetValues()

 */
2096c04dfeSSatish Balay 
2196c04dfeSSatish Balay #undef __FUNCT__
2296c04dfeSSatish Balay #define __FUNCT__ "MatGetMultiProcBlock_MPIAIJ"
2396c04dfeSSatish Balay PetscErrorCode  MatGetMultiProcBlock_MPIAIJ(Mat mat, MPI_Comm subComm, Mat* subMat)
2496c04dfeSSatish Balay {
2596c04dfeSSatish Balay   PetscErrorCode ierr;
2696c04dfeSSatish Balay   Mat_MPIAIJ     *aij = (Mat_MPIAIJ*)mat->data;
2796c04dfeSSatish Balay   Mat_SeqAIJ*    aijB = (Mat_SeqAIJ*)aij->B->data;
2896c04dfeSSatish Balay   PetscMPIInt    commRank,subCommSize,subCommRank;
29*5d22bc9fSHong Zhang   PetscMPIInt    *commRankMap,subRank,rank,commsize;
3096c04dfeSSatish Balay   PetscInt       *garrayCMap,col,i,j,*nnz,newRow,newCol;
3196c04dfeSSatish Balay 
3296c04dfeSSatish Balay   PetscFunctionBegin;
33*5d22bc9fSHong Zhang   ierr = MPI_Comm_size(((PetscObject)mat)->comm,&commsize);CHKERRQ(ierr);
34*5d22bc9fSHong Zhang   ierr = MPI_Comm_size(subComm,&subCommSize);CHKERRQ(ierr);
35*5d22bc9fSHong Zhang   if (subCommSize > commsize) SETERRQ2(((PetscObject)mat)->comm,PETSC_ERR_ARG_OUTOFRANGE,"CommSize %D < SubCommZize %D",commsize,subCommSize);
36*5d22bc9fSHong Zhang   if (commsize == 1){
37*5d22bc9fSHong Zhang     ierr = MatDuplicate(mat,MAT_COPY_VALUES,subMat);CHKERRQ(ierr);
38*5d22bc9fSHong Zhang     PetscFunctionReturn(0);
39*5d22bc9fSHong Zhang   }
4096c04dfeSSatish Balay 
4196c04dfeSSatish Balay   /* create subMat object with the relavent layout */
4296c04dfeSSatish Balay   ierr = MatCreate(subComm,subMat);CHKERRQ(ierr);
4396c04dfeSSatish Balay   ierr = MatSetType(*subMat,MATMPIAIJ);CHKERRQ(ierr);
4496c04dfeSSatish Balay   ierr = MatSetSizes(*subMat,mat->rmap->n,mat->cmap->n,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr);
4596c04dfeSSatish Balay   /* need to setup rmap and cmap before Preallocation */
4696c04dfeSSatish Balay   ierr = PetscLayoutSetBlockSize((*subMat)->rmap,mat->rmap->bs);CHKERRQ(ierr);
4796c04dfeSSatish Balay   ierr = PetscLayoutSetBlockSize((*subMat)->cmap,mat->cmap->bs);CHKERRQ(ierr);
4896c04dfeSSatish Balay   ierr = PetscLayoutSetUp((*subMat)->rmap);CHKERRQ(ierr);
4996c04dfeSSatish Balay   ierr = PetscLayoutSetUp((*subMat)->cmap);CHKERRQ(ierr);
5096c04dfeSSatish Balay 
5196c04dfeSSatish Balay   /* create a map of comm_rank from subComm to comm */
5296c04dfeSSatish Balay   ierr = MPI_Comm_rank(((PetscObject)mat)->comm,&commRank);CHKERRQ(ierr);
5396c04dfeSSatish Balay   ierr = MPI_Comm_rank(subComm,&subCommRank);CHKERRQ(ierr);
5496c04dfeSSatish Balay   ierr = PetscMalloc(subCommSize*sizeof(PetscMPIInt),&commRankMap);CHKERRQ(ierr);
5596c04dfeSSatish Balay   ierr = MPI_Allgather(&commRank,1,MPI_INT,commRankMap,1,MPI_INT,subComm);CHKERRQ(ierr);
5696c04dfeSSatish Balay 
5796c04dfeSSatish Balay   /* Traverse garray and identify column indices [of offdiag mat] that
5896c04dfeSSatish Balay    should be discarded. For the ones not discarded, store the newCol+1
5996c04dfeSSatish Balay    value in garrayCMap */
6096c04dfeSSatish Balay   ierr = PetscMalloc(aij->B->cmap->n*sizeof(PetscInt),&garrayCMap);CHKERRQ(ierr);
6196c04dfeSSatish Balay   ierr = PetscMemzero(garrayCMap,aij->B->cmap->n*sizeof(PetscInt));CHKERRQ(ierr);
6296c04dfeSSatish Balay   for (i=0; i<aij->B->cmap->n; i++) {
6396c04dfeSSatish Balay     col = aij->garray[i];
6496c04dfeSSatish Balay     for (subRank=0; subRank<subCommSize; subRank++) {
6596c04dfeSSatish Balay       rank = commRankMap[subRank];
6696c04dfeSSatish Balay       if ((col >= mat->cmap->range[rank]) && (col < mat->cmap->range[rank+1])) {
6796c04dfeSSatish Balay         garrayCMap[i] = (*subMat)->cmap->range[subRank] + col - mat->cmap->range[rank]+1;
6896c04dfeSSatish Balay         break;
6996c04dfeSSatish Balay       }
7096c04dfeSSatish Balay     }
7196c04dfeSSatish Balay   }
7296c04dfeSSatish Balay 
7396c04dfeSSatish Balay   /* Now compute preallocation for the offdiag mat */
7496c04dfeSSatish Balay   ierr = PetscMalloc(aij->B->rmap->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
7596c04dfeSSatish Balay   ierr = PetscMemzero(nnz,aij->B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr);
7696c04dfeSSatish Balay   for (i=0; i<aij->B->rmap->n; i++) {
7796c04dfeSSatish Balay     for (j=aijB->i[i]; j<aijB->i[i+1]; j++) {
7896c04dfeSSatish Balay       if (garrayCMap[aijB->j[j]]) nnz[i]++;
7996c04dfeSSatish Balay     }
8096c04dfeSSatish Balay   }
8196c04dfeSSatish Balay   ierr = MatMPIAIJSetPreallocation(*(subMat),PETSC_NULL,PETSC_NULL,PETSC_NULL,nnz);CHKERRQ(ierr);
8296c04dfeSSatish Balay 
8396c04dfeSSatish Balay   /* reuse diag block with the new submat */
8496c04dfeSSatish Balay   ierr = MatDestroy(((Mat_MPIAIJ*)((*subMat)->data))->A);CHKERRQ(ierr);
8596c04dfeSSatish Balay   ((Mat_MPIAIJ*)((*subMat)->data))->A = aij->A;
8696c04dfeSSatish Balay   ierr = PetscObjectReference((PetscObject)aij->A);CHKERRQ(ierr);
8796c04dfeSSatish Balay 
8896c04dfeSSatish Balay   /* Now traverse aij->B and insert values into subMat */
8996c04dfeSSatish Balay   for (i=0; i<aij->B->rmap->n; i++) {
9096c04dfeSSatish Balay     newRow = (*subMat)->rmap->range[subCommRank] + i;
9196c04dfeSSatish Balay     for (j=aijB->i[i]; j<aijB->i[i+1]; j++) {
9296c04dfeSSatish Balay       newCol = garrayCMap[aijB->j[j]];
9396c04dfeSSatish Balay       if (newCol) {
9496c04dfeSSatish Balay         newCol--; /* remove the increment */
9596c04dfeSSatish Balay         ierr = MatSetValues(*subMat,1,&newRow,1,&newCol,(aijB->a+j),INSERT_VALUES);CHKERRQ(ierr);
9696c04dfeSSatish Balay       }
9796c04dfeSSatish Balay     }
9896c04dfeSSatish Balay   }
9996c04dfeSSatish Balay 
10096c04dfeSSatish Balay   /* assemble the submat */
10196c04dfeSSatish Balay   ierr = MatAssemblyBegin(*subMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
10296c04dfeSSatish Balay   ierr = MatAssemblyEnd(*subMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
10396c04dfeSSatish Balay 
10496c04dfeSSatish Balay   /* deallocate temporary data */
10596c04dfeSSatish Balay   ierr = PetscFree(commRankMap);CHKERRQ(ierr);
10696c04dfeSSatish Balay   ierr = PetscFree(garrayCMap);CHKERRQ(ierr);
10796c04dfeSSatish Balay   ierr = PetscFree(nnz);CHKERRQ(ierr);
10896c04dfeSSatish Balay   PetscFunctionReturn(0);
10996c04dfeSSatish Balay }
110