1c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h> 296c04dfeSSatish Balay 3d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetMultiProcBlock_MPIAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 4d71ae5a4SJacob Faibussowitsch { 596c04dfeSSatish Balay Mat_MPIAIJ *aij = (Mat_MPIAIJ *)mat->data; 696c04dfeSSatish Balay Mat_SeqAIJ *aijB = (Mat_SeqAIJ *)aij->B->data; 72da392ccSBarry Smith PetscMPIInt subCommSize, subCommRank; 82da392ccSBarry Smith PetscMPIInt *commRankMap, subRank, rank, commRank; 996c04dfeSSatish Balay PetscInt *garrayCMap, col, i, j, *nnz, newRow, newCol; 1096c04dfeSSatish Balay 1196c04dfeSSatish Balay PetscFunctionBegin; 129566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(subComm, &subCommSize)); 139566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(subComm, &subCommRank)); 149566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(PetscObjectComm((PetscObject)mat), &commRank)); 1596c04dfeSSatish Balay 162da392ccSBarry Smith /* create subMat object with the relevant layout */ 17ce1d8e51SHong Zhang if (scall == MAT_INITIAL_MATRIX) { 189566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, subMat)); 199566063dSJacob Faibussowitsch PetscCall(MatSetType(*subMat, MATMPIAIJ)); 209566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*subMat, mat->rmap->n, mat->cmap->n, PETSC_DECIDE, PETSC_DECIDE)); 219566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*subMat, mat, mat)); 22fc08c53fSHong Zhang 2396c04dfeSSatish Balay /* need to setup rmap and cmap before Preallocation */ 249566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp((*subMat)->rmap)); 259566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp((*subMat)->cmap)); 26ce1d8e51SHong Zhang } 2796c04dfeSSatish Balay 28ce1d8e51SHong Zhang /* create a map of comm_rank from subComm to comm - should commRankMap and garrayCMap be kept for reused? */ 299566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(subCommSize, &commRankMap)); 309566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allgather(&commRank, 1, MPI_INT, commRankMap, 1, MPI_INT, subComm)); 3196c04dfeSSatish Balay 3296c04dfeSSatish Balay /* Traverse garray and identify column indices [of offdiag mat] that 3396c04dfeSSatish Balay should be discarded. For the ones not discarded, store the newCol+1 3496c04dfeSSatish Balay value in garrayCMap */ 359566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(aij->B->cmap->n, &garrayCMap)); 3696c04dfeSSatish Balay for (i = 0; i < aij->B->cmap->n; i++) { 3796c04dfeSSatish Balay col = aij->garray[i]; 3896c04dfeSSatish Balay for (subRank = 0; subRank < subCommSize; subRank++) { 3996c04dfeSSatish Balay rank = commRankMap[subRank]; 4096c04dfeSSatish Balay if ((col >= mat->cmap->range[rank]) && (col < mat->cmap->range[rank + 1])) { 4196c04dfeSSatish Balay garrayCMap[i] = (*subMat)->cmap->range[subRank] + col - mat->cmap->range[rank] + 1; 4296c04dfeSSatish Balay break; 4396c04dfeSSatish Balay } 4496c04dfeSSatish Balay } 4596c04dfeSSatish Balay } 4696c04dfeSSatish Balay 47ce1d8e51SHong Zhang if (scall == MAT_INITIAL_MATRIX) { 482da392ccSBarry Smith /* Compute preallocation for the offdiag mat */ 499566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(aij->B->rmap->n, &nnz)); 5096c04dfeSSatish Balay for (i = 0; i < aij->B->rmap->n; i++) { 5196c04dfeSSatish Balay for (j = aijB->i[i]; j < aijB->i[i + 1]; j++) { 5296c04dfeSSatish Balay if (garrayCMap[aijB->j[j]]) nnz[i]++; 5396c04dfeSSatish Balay } 5496c04dfeSSatish Balay } 559566063dSJacob Faibussowitsch PetscCall(MatMPIAIJSetPreallocation(*(subMat), 0, NULL, 0, nnz)); 5696c04dfeSSatish Balay 5796c04dfeSSatish Balay /* reuse diag block with the new submat */ 589566063dSJacob Faibussowitsch PetscCall(MatDestroy(&((Mat_MPIAIJ *)((*subMat)->data))->A)); 5996c04dfeSSatish Balay ((Mat_MPIAIJ *)((*subMat)->data))->A = aij->A; 609566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)aij->A)); 61ce1d8e51SHong Zhang } else if (((Mat_MPIAIJ *)(*subMat)->data)->A != aij->A) { 62ce1d8e51SHong Zhang PetscObject obj = (PetscObject)((Mat_MPIAIJ *)((*subMat)->data))->A; 639566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)obj)); 64ce1d8e51SHong Zhang ((Mat_MPIAIJ *)((*subMat)->data))->A = aij->A; 659566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)aij->A)); 66ce1d8e51SHong Zhang } 6796c04dfeSSatish Balay 682da392ccSBarry Smith /* Traverse aij->B and insert values into subMat */ 692da392ccSBarry Smith if ((*subMat)->assembled) { 702da392ccSBarry Smith (*subMat)->was_assembled = PETSC_TRUE; 712da392ccSBarry Smith (*subMat)->assembled = PETSC_FALSE; 722da392ccSBarry Smith } 7396c04dfeSSatish Balay for (i = 0; i < aij->B->rmap->n; i++) { 7496c04dfeSSatish Balay newRow = (*subMat)->rmap->range[subCommRank] + i; 7596c04dfeSSatish Balay for (j = aijB->i[i]; j < aijB->i[i + 1]; j++) { 7696c04dfeSSatish Balay newCol = garrayCMap[aijB->j[j]]; 7796c04dfeSSatish Balay if (newCol) { 7896c04dfeSSatish Balay newCol--; /* remove the increment */ 79*57508eceSPierre Jolivet PetscCall(MatSetValues_MPIAIJ(*subMat, 1, &newRow, 1, &newCol, aijB->a + j, INSERT_VALUES)); 8096c04dfeSSatish Balay } 8196c04dfeSSatish Balay } 8296c04dfeSSatish Balay } 839566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*subMat, MAT_FINAL_ASSEMBLY)); 849566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*subMat, MAT_FINAL_ASSEMBLY)); 8596c04dfeSSatish Balay 8696c04dfeSSatish Balay /* deallocate temporary data */ 879566063dSJacob Faibussowitsch PetscCall(PetscFree(commRankMap)); 889566063dSJacob Faibussowitsch PetscCall(PetscFree(garrayCMap)); 8948a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscFree(nnz)); 903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 9196c04dfeSSatish Balay } 92