1e8271787SHong Zhang #include <../src/mat/impls/baij/mpi/mpibaij.h> 2e8271787SHong Zhang 39371c9d4SSatish Balay PetscErrorCode MatGetMultiProcBlock_MPIBAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) { 4e8271787SHong Zhang Mat_MPIBAIJ *aij = (Mat_MPIBAIJ *)mat->data; 5e8271787SHong Zhang Mat_SeqBAIJ *aijB = (Mat_SeqBAIJ *)aij->B->data; 6e8271787SHong Zhang PetscMPIInt commRank, subCommSize, subCommRank; 7e8271787SHong Zhang PetscMPIInt *commRankMap, subRank, rank, commsize; 802e9429cSHong Zhang PetscInt *garrayCMap, col, i, j, *nnz, newRow, newCol, *newbRow, *newbCol, k, k1; 9e8271787SHong Zhang PetscInt bs = mat->rmap->bs; 1002e9429cSHong Zhang PetscScalar *vals, *aijBvals; 11e8271787SHong Zhang 12e8271787SHong Zhang PetscFunctionBegin; 139566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)mat), &commsize)); 149566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(subComm, &subCommSize)); 15e8271787SHong Zhang 16a5b23f4aSJose E. Roman /* create subMat object with the relevant layout */ 17e8271787SHong Zhang if (scall == MAT_INITIAL_MATRIX) { 189566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, subMat)); 199566063dSJacob Faibussowitsch PetscCall(MatSetType(*subMat, MATMPIBAIJ)); 209566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*subMat, mat->rmap->n, mat->cmap->n, PETSC_DECIDE, PETSC_DECIDE)); 219566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(*subMat, mat->rmap->bs, mat->cmap->bs)); 22e8271787SHong Zhang 23e8271787SHong Zhang /* need to setup rmap and cmap before Preallocation */ 249566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize((*subMat)->rmap, mat->rmap->bs)); 259566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize((*subMat)->cmap, mat->cmap->bs)); 269566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp((*subMat)->rmap)); 279566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp((*subMat)->cmap)); 28e8271787SHong Zhang } 29e8271787SHong Zhang 30e8271787SHong Zhang /* create a map of comm_rank from subComm to comm - should commRankMap and garrayCMap be kept for reused? */ 319566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(PetscObjectComm((PetscObject)mat), &commRank)); 329566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(subComm, &subCommRank)); 339566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(subCommSize, &commRankMap)); 349566063dSJacob Faibussowitsch PetscCallMPI(MPI_Allgather(&commRank, 1, MPI_INT, commRankMap, 1, MPI_INT, subComm)); 35e8271787SHong Zhang 36e8271787SHong Zhang /* Traverse garray and identify blocked column indices [of offdiag mat] that 37e8271787SHong Zhang should be discarded. For the ones not discarded, store the newCol+1 38e8271787SHong Zhang value in garrayCMap */ 399566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(aij->B->cmap->n / bs, &garrayCMap)); 40e8271787SHong Zhang for (i = 0; i < aij->B->cmap->n / bs; i++) { 41e8271787SHong Zhang col = aij->garray[i]; /* blocked column index */ 42e8271787SHong Zhang for (subRank = 0; subRank < subCommSize; subRank++) { 43e8271787SHong Zhang rank = commRankMap[subRank]; 44e8271787SHong Zhang if ((col >= mat->cmap->range[rank] / bs) && (col < mat->cmap->range[rank + 1] / bs)) { 4502e9429cSHong Zhang garrayCMap[i] = (((*subMat)->cmap->range[subRank] - mat->cmap->range[rank]) / bs + col + 1); 46e8271787SHong Zhang break; 47e8271787SHong Zhang } 48e8271787SHong Zhang } 49e8271787SHong Zhang } 50e8271787SHong Zhang 51e8271787SHong Zhang if (scall == MAT_INITIAL_MATRIX) { 52e8271787SHong Zhang /* Now compute preallocation for the offdiag mat */ 539566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(aij->B->rmap->n / bs, &nnz)); 54e8271787SHong Zhang for (i = 0; i < aij->B->rmap->n / bs; i++) { 55e8271787SHong Zhang for (j = aijB->i[i]; j < aijB->i[i + 1]; j++) { 56e8271787SHong Zhang if (garrayCMap[aijB->j[j]]) nnz[i]++; 57e8271787SHong Zhang } 58e8271787SHong Zhang } 599566063dSJacob Faibussowitsch PetscCall(MatMPIBAIJSetPreallocation(*(subMat), bs, 0, NULL, 0, nnz)); 60e8271787SHong Zhang 61e8271787SHong Zhang /* reuse diag block with the new submat */ 629566063dSJacob Faibussowitsch PetscCall(MatDestroy(&((Mat_MPIBAIJ *)((*subMat)->data))->A)); 63e8271787SHong Zhang 64e8271787SHong Zhang ((Mat_MPIBAIJ *)((*subMat)->data))->A = aij->A; 65e8271787SHong Zhang 669566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)aij->A)); 67e8271787SHong Zhang } else if (((Mat_MPIBAIJ *)(*subMat)->data)->A != aij->A) { 68e8271787SHong Zhang PetscObject obj = (PetscObject)((Mat_MPIBAIJ *)((*subMat)->data))->A; 69e8271787SHong Zhang 709566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)obj)); 71e8271787SHong Zhang 72e8271787SHong Zhang ((Mat_MPIBAIJ *)((*subMat)->data))->A = aij->A; 73e8271787SHong Zhang 749566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)aij->A)); 75e8271787SHong Zhang } 76e8271787SHong Zhang 77e8271787SHong Zhang /* Now traverse aij->B and insert values into subMat */ 789566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &newbRow, bs, &newbCol, bs * bs, &vals)); 79e8271787SHong Zhang for (i = 0; i < aij->B->rmap->n / bs; i++) { 80e8271787SHong Zhang newRow = (*subMat)->rmap->range[subCommRank] + i * bs; 81e8271787SHong Zhang for (j = aijB->i[i]; j < aijB->i[i + 1]; j++) { 82e8271787SHong Zhang newCol = garrayCMap[aijB->j[j]]; 83e8271787SHong Zhang if (newCol) { 84e8271787SHong Zhang newCol--; /* remove the increment */ 85e8271787SHong Zhang newCol *= bs; 86e8271787SHong Zhang for (k = 0; k < bs; k++) { 87e8271787SHong Zhang newbRow[k] = newRow + k; 88e8271787SHong Zhang newbCol[k] = newCol + k; 89e8271787SHong Zhang } 90e8271787SHong Zhang /* copy column-oriented aijB->a into row-oriented vals */ 9102e9429cSHong Zhang aijBvals = aijB->a + j * bs * bs; 92e8271787SHong Zhang for (k1 = 0; k1 < bs; k1++) { 939371c9d4SSatish Balay for (k = 0; k < bs; k++) { vals[k1 + k * bs] = *aijBvals++; } 94e8271787SHong Zhang } 959566063dSJacob Faibussowitsch PetscCall(MatSetValues(*subMat, bs, newbRow, bs, newbCol, vals, INSERT_VALUES)); 96e8271787SHong Zhang } 97e8271787SHong Zhang } 98e8271787SHong Zhang } 999566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*subMat, MAT_FINAL_ASSEMBLY)); 1009566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*subMat, MAT_FINAL_ASSEMBLY)); 101e8271787SHong Zhang 102e8271787SHong Zhang /* deallocate temporary data */ 1039566063dSJacob Faibussowitsch PetscCall(PetscFree3(newbRow, newbCol, vals)); 1049566063dSJacob Faibussowitsch PetscCall(PetscFree(commRankMap)); 1059566063dSJacob Faibussowitsch PetscCall(PetscFree(garrayCMap)); 106*48a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscFree(nnz)); 107e8271787SHong Zhang PetscFunctionReturn(0); 108e8271787SHong Zhang } 109