1c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h> 296c04dfeSSatish Balay 33233f0ddSHong Zhang PetscErrorCode MatGetMultiProcBlock_MPIAIJ(Mat mat, MPI_Comm subComm, MatReuse scall,Mat *subMat) 496c04dfeSSatish Balay { 596c04dfeSSatish Balay Mat_MPIAIJ *aij = (Mat_MPIAIJ*)mat->data; 696c04dfeSSatish Balay Mat_SeqAIJ *aijB = (Mat_SeqAIJ*)aij->B->data; 72da392ccSBarry Smith PetscMPIInt subCommSize,subCommRank; 82da392ccSBarry Smith PetscMPIInt *commRankMap,subRank,rank,commRank; 996c04dfeSSatish Balay PetscInt *garrayCMap,col,i,j,*nnz,newRow,newCol; 1096c04dfeSSatish Balay 1196c04dfeSSatish Balay PetscFunctionBegin; 12*9566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(subComm,&subCommSize)); 13*9566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(subComm,&subCommRank)); 14*9566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(PetscObjectComm((PetscObject)mat),&commRank)); 1596c04dfeSSatish Balay 162da392ccSBarry Smith /* create subMat object with the relevant layout */ 17ce1d8e51SHong Zhang if (scall == MAT_INITIAL_MATRIX) { 18*9566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm,subMat)); 19*9566063dSJacob Faibussowitsch PetscCall(MatSetType(*subMat,MATMPIAIJ)); 20*9566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*subMat,mat->rmap->n,mat->cmap->n,PETSC_DECIDE,PETSC_DECIDE)); 21*9566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*subMat,mat,mat)); 22fc08c53fSHong Zhang 2396c04dfeSSatish Balay /* need to setup rmap and cmap before Preallocation */ 24*9566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp((*subMat)->rmap)); 25*9566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp((*subMat)->cmap)); 26ce1d8e51SHong Zhang } 2796c04dfeSSatish Balay 28ce1d8e51SHong Zhang /* create a map of comm_rank from subComm to comm - should commRankMap and garrayCMap be kept for reused? */ 29*9566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(subCommSize,&commRankMap)); 30*9566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allgather(&commRank,1,MPI_INT,commRankMap,1,MPI_INT,subComm)); 3196c04dfeSSatish Balay 3296c04dfeSSatish Balay /* Traverse garray and identify column indices [of offdiag mat] that 3396c04dfeSSatish Balay should be discarded. For the ones not discarded, store the newCol+1 3496c04dfeSSatish Balay value in garrayCMap */ 35*9566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(aij->B->cmap->n,&garrayCMap)); 3696c04dfeSSatish Balay for (i=0; i<aij->B->cmap->n; i++) { 3796c04dfeSSatish Balay col = aij->garray[i]; 3896c04dfeSSatish Balay for (subRank=0; subRank<subCommSize; subRank++) { 3996c04dfeSSatish Balay rank = commRankMap[subRank]; 4096c04dfeSSatish Balay if ((col >= mat->cmap->range[rank]) && (col < mat->cmap->range[rank+1])) { 4196c04dfeSSatish Balay garrayCMap[i] = (*subMat)->cmap->range[subRank] + col - mat->cmap->range[rank]+1; 4296c04dfeSSatish Balay break; 4396c04dfeSSatish Balay } 4496c04dfeSSatish Balay } 4596c04dfeSSatish Balay } 4696c04dfeSSatish Balay 47ce1d8e51SHong Zhang if (scall == MAT_INITIAL_MATRIX) { 482da392ccSBarry Smith /* Compute preallocation for the offdiag mat */ 49*9566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(aij->B->rmap->n,&nnz)); 5096c04dfeSSatish Balay for (i=0; i<aij->B->rmap->n; i++) { 5196c04dfeSSatish Balay for (j=aijB->i[i]; j<aijB->i[i+1]; j++) { 5296c04dfeSSatish Balay if (garrayCMap[aijB->j[j]]) nnz[i]++; 5396c04dfeSSatish Balay } 5496c04dfeSSatish Balay } 55*9566063dSJacob Faibussowitsch PetscCall(MatMPIAIJSetPreallocation(*(subMat),0,NULL,0,nnz)); 5696c04dfeSSatish Balay 5796c04dfeSSatish Balay /* reuse diag block with the new submat */ 58*9566063dSJacob Faibussowitsch PetscCall(MatDestroy(&((Mat_MPIAIJ*)((*subMat)->data))->A)); 5996c04dfeSSatish Balay ((Mat_MPIAIJ*)((*subMat)->data))->A = aij->A; 60*9566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)aij->A)); 61ce1d8e51SHong Zhang } else if (((Mat_MPIAIJ*)(*subMat)->data)->A != aij->A) { 62ce1d8e51SHong Zhang PetscObject obj = (PetscObject)((Mat_MPIAIJ*)((*subMat)->data))->A; 63*9566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)obj)); 64ce1d8e51SHong Zhang ((Mat_MPIAIJ*)((*subMat)->data))->A = aij->A; 65*9566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)aij->A)); 66ce1d8e51SHong Zhang } 6796c04dfeSSatish Balay 682da392ccSBarry Smith /* Traverse aij->B and insert values into subMat */ 692da392ccSBarry Smith if ((*subMat)->assembled) { 702da392ccSBarry Smith (*subMat)->was_assembled = PETSC_TRUE; 712da392ccSBarry Smith (*subMat)->assembled = PETSC_FALSE; 722da392ccSBarry Smith } 7396c04dfeSSatish Balay for (i=0; i<aij->B->rmap->n; i++) { 7496c04dfeSSatish Balay newRow = (*subMat)->rmap->range[subCommRank] + i; 7596c04dfeSSatish Balay for (j=aijB->i[i]; j<aijB->i[i+1]; j++) { 7696c04dfeSSatish Balay newCol = garrayCMap[aijB->j[j]]; 7796c04dfeSSatish Balay if (newCol) { 7896c04dfeSSatish Balay newCol--; /* remove the increment */ 79*9566063dSJacob Faibussowitsch PetscCall(MatSetValues_MPIAIJ(*subMat,1,&newRow,1,&newCol,(aijB->a+j),INSERT_VALUES)); 8096c04dfeSSatish Balay } 8196c04dfeSSatish Balay } 8296c04dfeSSatish Balay } 83*9566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*subMat,MAT_FINAL_ASSEMBLY)); 84*9566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*subMat,MAT_FINAL_ASSEMBLY)); 8596c04dfeSSatish Balay 8696c04dfeSSatish Balay /* deallocate temporary data */ 87*9566063dSJacob Faibussowitsch PetscCall(PetscFree(commRankMap)); 88*9566063dSJacob Faibussowitsch PetscCall(PetscFree(garrayCMap)); 89ce1d8e51SHong Zhang if (scall == MAT_INITIAL_MATRIX) { 90*9566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 91ce1d8e51SHong Zhang } 9296c04dfeSSatish Balay PetscFunctionReturn(0); 9396c04dfeSSatish Balay } 94