xref: /petsc/src/mat/impls/baij/mpi/mpb_baij.c (revision 48a46eb9bd028bec07ec0f396b1a3abb43f14558)
1e8271787SHong Zhang #include <../src/mat/impls/baij/mpi/mpibaij.h>
2e8271787SHong Zhang 
39371c9d4SSatish Balay PetscErrorCode MatGetMultiProcBlock_MPIBAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) {
4e8271787SHong Zhang   Mat_MPIBAIJ *aij  = (Mat_MPIBAIJ *)mat->data;
5e8271787SHong Zhang   Mat_SeqBAIJ *aijB = (Mat_SeqBAIJ *)aij->B->data;
6e8271787SHong Zhang   PetscMPIInt  commRank, subCommSize, subCommRank;
7e8271787SHong Zhang   PetscMPIInt *commRankMap, subRank, rank, commsize;
802e9429cSHong Zhang   PetscInt    *garrayCMap, col, i, j, *nnz, newRow, newCol, *newbRow, *newbCol, k, k1;
9e8271787SHong Zhang   PetscInt     bs = mat->rmap->bs;
1002e9429cSHong Zhang   PetscScalar *vals, *aijBvals;
11e8271787SHong Zhang 
12e8271787SHong Zhang   PetscFunctionBegin;
139566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)mat), &commsize));
149566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(subComm, &subCommSize));
15e8271787SHong Zhang 
16a5b23f4aSJose E. Roman   /* create subMat object with the relevant layout */
17e8271787SHong Zhang   if (scall == MAT_INITIAL_MATRIX) {
189566063dSJacob Faibussowitsch     PetscCall(MatCreate(subComm, subMat));
199566063dSJacob Faibussowitsch     PetscCall(MatSetType(*subMat, MATMPIBAIJ));
209566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(*subMat, mat->rmap->n, mat->cmap->n, PETSC_DECIDE, PETSC_DECIDE));
219566063dSJacob Faibussowitsch     PetscCall(MatSetBlockSizes(*subMat, mat->rmap->bs, mat->cmap->bs));
22e8271787SHong Zhang 
23e8271787SHong Zhang     /* need to setup rmap and cmap before Preallocation */
249566063dSJacob Faibussowitsch     PetscCall(PetscLayoutSetBlockSize((*subMat)->rmap, mat->rmap->bs));
259566063dSJacob Faibussowitsch     PetscCall(PetscLayoutSetBlockSize((*subMat)->cmap, mat->cmap->bs));
269566063dSJacob Faibussowitsch     PetscCall(PetscLayoutSetUp((*subMat)->rmap));
279566063dSJacob Faibussowitsch     PetscCall(PetscLayoutSetUp((*subMat)->cmap));
28e8271787SHong Zhang   }
29e8271787SHong Zhang 
30e8271787SHong Zhang   /* create a map of comm_rank from subComm to comm - should commRankMap and garrayCMap be kept for reused? */
319566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_rank(PetscObjectComm((PetscObject)mat), &commRank));
329566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_rank(subComm, &subCommRank));
339566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(subCommSize, &commRankMap));
349566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Allgather(&commRank, 1, MPI_INT, commRankMap, 1, MPI_INT, subComm));
35e8271787SHong Zhang 
36e8271787SHong Zhang   /* Traverse garray and identify blocked column indices [of offdiag mat] that
37e8271787SHong Zhang    should be discarded. For the ones not discarded, store the newCol+1
38e8271787SHong Zhang    value in garrayCMap */
399566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(aij->B->cmap->n / bs, &garrayCMap));
40e8271787SHong Zhang   for (i = 0; i < aij->B->cmap->n / bs; i++) {
41e8271787SHong Zhang     col = aij->garray[i]; /* blocked column index */
42e8271787SHong Zhang     for (subRank = 0; subRank < subCommSize; subRank++) {
43e8271787SHong Zhang       rank = commRankMap[subRank];
44e8271787SHong Zhang       if ((col >= mat->cmap->range[rank] / bs) && (col < mat->cmap->range[rank + 1] / bs)) {
4502e9429cSHong Zhang         garrayCMap[i] = (((*subMat)->cmap->range[subRank] - mat->cmap->range[rank]) / bs + col + 1);
46e8271787SHong Zhang         break;
47e8271787SHong Zhang       }
48e8271787SHong Zhang     }
49e8271787SHong Zhang   }
50e8271787SHong Zhang 
51e8271787SHong Zhang   if (scall == MAT_INITIAL_MATRIX) {
52e8271787SHong Zhang     /* Now compute preallocation for the offdiag mat */
539566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(aij->B->rmap->n / bs, &nnz));
54e8271787SHong Zhang     for (i = 0; i < aij->B->rmap->n / bs; i++) {
55e8271787SHong Zhang       for (j = aijB->i[i]; j < aijB->i[i + 1]; j++) {
56e8271787SHong Zhang         if (garrayCMap[aijB->j[j]]) nnz[i]++;
57e8271787SHong Zhang       }
58e8271787SHong Zhang     }
599566063dSJacob Faibussowitsch     PetscCall(MatMPIBAIJSetPreallocation(*(subMat), bs, 0, NULL, 0, nnz));
60e8271787SHong Zhang 
61e8271787SHong Zhang     /* reuse diag block with the new submat */
629566063dSJacob Faibussowitsch     PetscCall(MatDestroy(&((Mat_MPIBAIJ *)((*subMat)->data))->A));
63e8271787SHong Zhang 
64e8271787SHong Zhang     ((Mat_MPIBAIJ *)((*subMat)->data))->A = aij->A;
65e8271787SHong Zhang 
669566063dSJacob Faibussowitsch     PetscCall(PetscObjectReference((PetscObject)aij->A));
67e8271787SHong Zhang   } else if (((Mat_MPIBAIJ *)(*subMat)->data)->A != aij->A) {
68e8271787SHong Zhang     PetscObject obj = (PetscObject)((Mat_MPIBAIJ *)((*subMat)->data))->A;
69e8271787SHong Zhang 
709566063dSJacob Faibussowitsch     PetscCall(PetscObjectReference((PetscObject)obj));
71e8271787SHong Zhang 
72e8271787SHong Zhang     ((Mat_MPIBAIJ *)((*subMat)->data))->A = aij->A;
73e8271787SHong Zhang 
749566063dSJacob Faibussowitsch     PetscCall(PetscObjectReference((PetscObject)aij->A));
75e8271787SHong Zhang   }
76e8271787SHong Zhang 
77e8271787SHong Zhang   /* Now traverse aij->B and insert values into subMat */
789566063dSJacob Faibussowitsch   PetscCall(PetscMalloc3(bs, &newbRow, bs, &newbCol, bs * bs, &vals));
79e8271787SHong Zhang   for (i = 0; i < aij->B->rmap->n / bs; i++) {
80e8271787SHong Zhang     newRow = (*subMat)->rmap->range[subCommRank] + i * bs;
81e8271787SHong Zhang     for (j = aijB->i[i]; j < aijB->i[i + 1]; j++) {
82e8271787SHong Zhang       newCol = garrayCMap[aijB->j[j]];
83e8271787SHong Zhang       if (newCol) {
84e8271787SHong Zhang         newCol--; /* remove the increment */
85e8271787SHong Zhang         newCol *= bs;
86e8271787SHong Zhang         for (k = 0; k < bs; k++) {
87e8271787SHong Zhang           newbRow[k] = newRow + k;
88e8271787SHong Zhang           newbCol[k] = newCol + k;
89e8271787SHong Zhang         }
90e8271787SHong Zhang         /* copy column-oriented aijB->a into row-oriented vals */
9102e9429cSHong Zhang         aijBvals = aijB->a + j * bs * bs;
92e8271787SHong Zhang         for (k1 = 0; k1 < bs; k1++) {
939371c9d4SSatish Balay           for (k = 0; k < bs; k++) { vals[k1 + k * bs] = *aijBvals++; }
94e8271787SHong Zhang         }
959566063dSJacob Faibussowitsch         PetscCall(MatSetValues(*subMat, bs, newbRow, bs, newbCol, vals, INSERT_VALUES));
96e8271787SHong Zhang       }
97e8271787SHong Zhang     }
98e8271787SHong Zhang   }
999566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*subMat, MAT_FINAL_ASSEMBLY));
1009566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*subMat, MAT_FINAL_ASSEMBLY));
101e8271787SHong Zhang 
102e8271787SHong Zhang   /* deallocate temporary data */
1039566063dSJacob Faibussowitsch   PetscCall(PetscFree3(newbRow, newbCol, vals));
1049566063dSJacob Faibussowitsch   PetscCall(PetscFree(commRankMap));
1059566063dSJacob Faibussowitsch   PetscCall(PetscFree(garrayCMap));
106*48a46eb9SPierre Jolivet   if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscFree(nnz));
107e8271787SHong Zhang   PetscFunctionReturn(0);
108e8271787SHong Zhang }
109