xref: /petsc/src/mat/impls/aij/mpi/mmaij.c (revision eec179cf895b6fbcd6a0b58694319392b06e361b)
1be1d678aSKris Buschelman 
28c79f6d3SBarry Smith /*
38c79f6d3SBarry Smith    Support for the parallel AIJ matrix vector multiply
48c79f6d3SBarry Smith */
5c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h>
6aeda0f58SHong Zhang #include <petsc/private/vecimpl.h>
7af0996ceSBarry Smith #include <petsc/private/isimpl.h> /* needed because accesses data structure of ISLocalToGlobalMapping directly */
88c79f6d3SBarry Smith 
9d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetUpMultiply_MPIAIJ(Mat mat)
10d71ae5a4SJacob Faibussowitsch {
1144a69424SLois Curfman McInnes   Mat_MPIAIJ *aij = (Mat_MPIAIJ *)mat->data;
12ec8511deSBarry Smith   Mat_SeqAIJ *B   = (Mat_SeqAIJ *)(aij->B->data);
13b3c64f9dSJunchao Zhang   PetscInt    i, j, *aj = B->j, *garray;
14b3c64f9dSJunchao Zhang   PetscInt    ec = 0; /* Number of nonzero external columns */
151eb62cbbSBarry Smith   IS          from, to;
161eb62cbbSBarry Smith   Vec         gvec;
17aa482453SBarry Smith #if defined(PETSC_USE_CTABLE)
18*eec179cfSJacob Faibussowitsch   PetscHMapI    gid1_lid1 = NULL;
19*eec179cfSJacob Faibussowitsch   PetscHashIter tpos;
20b1d57f15SBarry Smith   PetscInt      gid, lid;
216f531f54SSatish Balay #else
22d0f46423SBarry Smith   PetscInt N = mat->cmap->N, *indices;
232066d6f7SSatish Balay #endif
242066d6f7SSatish Balay 
253a40ed3dSBarry Smith   PetscFunctionBegin;
264b8d542aSHong Zhang   if (!aij->garray) {
2728b400f6SJacob Faibussowitsch     PetscCheck(aij->B, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Missing B mat");
28aa482453SBarry Smith #if defined(PETSC_USE_CTABLE)
29c5bfad50SMark F. Adams     /* use a table */
30*eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapICreateWithSize(aij->B->rmap->n, &gid1_lid1));
31d0f46423SBarry Smith     for (i = 0; i < aij->B->rmap->n; i++) {
322066d6f7SSatish Balay       for (j = 0; j < B->ilen[i]; j++) {
33b1d57f15SBarry Smith         PetscInt data, gid1 = aj[B->i[i] + j] + 1;
34*eec179cfSJacob Faibussowitsch         PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data));
35fa46199cSSatish Balay         if (!data) {
362066d6f7SSatish Balay           /* one based table */
37*eec179cfSJacob Faibussowitsch           PetscCall(PetscHMapISetWithMode(gid1_lid1, gid1, ++ec, INSERT_VALUES));
382066d6f7SSatish Balay         }
392066d6f7SSatish Balay       }
402066d6f7SSatish Balay     }
412066d6f7SSatish Balay     /* form array of columns we need */
429566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(ec, &garray));
43*eec179cfSJacob Faibussowitsch     PetscHashIterBegin(gid1_lid1, tpos);
44*eec179cfSJacob Faibussowitsch     while (!PetscHashIterAtEnd(gid1_lid1, tpos)) {
45*eec179cfSJacob Faibussowitsch       PetscHashIterGetKey(gid1_lid1, tpos, gid);
46*eec179cfSJacob Faibussowitsch       PetscHashIterGetVal(gid1_lid1, tpos, lid);
47*eec179cfSJacob Faibussowitsch       PetscHashIterNext(gid1_lid1, tpos);
48b0a32e0cSBarry Smith       gid--;
49b0a32e0cSBarry Smith       lid--;
502066d6f7SSatish Balay       garray[lid] = gid;
512066d6f7SSatish Balay     }
529566063dSJacob Faibussowitsch     PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */
53*eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIClear(gid1_lid1));
54*eec179cfSJacob Faibussowitsch     for (i = 0; i < ec; i++) PetscCall(PetscHMapISetWithMode(gid1_lid1, garray[i] + 1, i + 1, INSERT_VALUES));
552066d6f7SSatish Balay     /* compact out the extra columns in B */
56d0f46423SBarry Smith     for (i = 0; i < aij->B->rmap->n; i++) {
572066d6f7SSatish Balay       for (j = 0; j < B->ilen[i]; j++) {
58b1d57f15SBarry Smith         PetscInt gid1 = aj[B->i[i] + j] + 1;
59*eec179cfSJacob Faibussowitsch         PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid));
60fa46199cSSatish Balay         lid--;
61b3fb0a6cSMatthew Knepley         aj[B->i[i] + j] = lid;
622066d6f7SSatish Balay       }
632066d6f7SSatish Balay     }
649566063dSJacob Faibussowitsch     PetscCall(PetscLayoutDestroy(&aij->B->cmap));
659566063dSJacob Faibussowitsch     PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)aij->B), ec, ec, 1, &aij->B->cmap));
66*eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIDestroy(&gid1_lid1));
672066d6f7SSatish Balay #else
6811285404SBarry Smith     /* Make an array as long as the number of columns */
691eb62cbbSBarry Smith     /* mark those columns that are in aij->B */
709566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(N, &indices));
71d0f46423SBarry Smith     for (i = 0; i < aij->B->rmap->n; i++) {
72d6dfbf8fSBarry Smith       for (j = 0; j < B->ilen[i]; j++) {
73bfec09a0SHong Zhang         if (!indices[aj[B->i[i] + j]]) ec++;
74bfec09a0SHong Zhang         indices[aj[B->i[i] + j]] = 1;
75416022c9SBarry Smith       }
761eb62cbbSBarry Smith     }
778c79f6d3SBarry Smith 
781eb62cbbSBarry Smith     /* form array of columns we need */
799566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(ec, &garray));
801eb62cbbSBarry Smith     ec = 0;
811eb62cbbSBarry Smith     for (i = 0; i < N; i++) {
821eb62cbbSBarry Smith       if (indices[i]) garray[ec++] = i;
831eb62cbbSBarry Smith     }
841eb62cbbSBarry Smith 
851eb62cbbSBarry Smith     /* make indices now point into garray */
86ad540459SPierre Jolivet     for (i = 0; i < ec; i++) indices[garray[i]] = i;
871eb62cbbSBarry Smith 
881eb62cbbSBarry Smith     /* compact out the extra columns in B */
89d0f46423SBarry Smith     for (i = 0; i < aij->B->rmap->n; i++) {
90ad540459SPierre Jolivet       for (j = 0; j < B->ilen[i]; j++) aj[B->i[i] + j] = indices[aj[B->i[i] + j]];
91d6dfbf8fSBarry Smith     }
929566063dSJacob Faibussowitsch     PetscCall(PetscLayoutDestroy(&aij->B->cmap));
939566063dSJacob Faibussowitsch     PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)aij->B), ec, ec, 1, &aij->B->cmap));
949566063dSJacob Faibussowitsch     PetscCall(PetscFree(indices));
952066d6f7SSatish Balay #endif
964b8d542aSHong Zhang   } else {
974b8d542aSHong Zhang     garray = aij->garray;
984b8d542aSHong Zhang   }
994b8d542aSHong Zhang 
1004b8d542aSHong Zhang   if (!aij->lvec) {
10128b400f6SJacob Faibussowitsch     PetscCheck(aij->B, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Missing B mat");
1029566063dSJacob Faibussowitsch     PetscCall(MatCreateVecs(aij->B, &aij->lvec, NULL));
1034b8d542aSHong Zhang   }
1049566063dSJacob Faibussowitsch   PetscCall(VecGetSize(aij->lvec, &ec));
1051eb62cbbSBarry Smith 
106d6dfbf8fSBarry Smith   /* create two temporary Index sets for build scatter gather */
1079566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, ec, garray, PETSC_COPY_VALUES, &from));
1089566063dSJacob Faibussowitsch   PetscCall(ISCreateStride(PETSC_COMM_SELF, ec, 0, 1, &to));
1091eb62cbbSBarry Smith 
1101eb62cbbSBarry Smith   /* create temporary global vector to generate scatter context */
111b5eb4454SBarry Smith   /* This does not allocate the array's memory so is efficient */
1129566063dSJacob Faibussowitsch   PetscCall(VecCreateMPIWithArray(PetscObjectComm((PetscObject)mat), 1, mat->cmap->n, mat->cmap->N, NULL, &gvec));
1131eb62cbbSBarry Smith 
1142d336d48SLois Curfman McInnes   /* generate the scatter context */
1159566063dSJacob Faibussowitsch   PetscCall(VecScatterDestroy(&aij->Mvctx));
1169566063dSJacob Faibussowitsch   PetscCall(VecScatterCreate(gvec, from, aij->lvec, to, &aij->Mvctx));
1179566063dSJacob Faibussowitsch   PetscCall(VecScatterViewFromOptions(aij->Mvctx, (PetscObject)mat, "-matmult_vecscatter_view"));
11867bb5161SHong Zhang   aij->garray = garray;
1194b8d542aSHong Zhang 
1209566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&from));
1219566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&to));
1229566063dSJacob Faibussowitsch   PetscCall(VecDestroy(&gvec));
1233a40ed3dSBarry Smith   PetscFunctionReturn(0);
1248c79f6d3SBarry Smith }
1259e25ed09SBarry Smith 
126fff043a9SJunchao Zhang /* Disassemble the off-diag portion of the MPIAIJXxx matrix.
127fff043a9SJunchao Zhang    In other words, change the B from reduced format using local col ids
128fff043a9SJunchao Zhang    to expanded format using global col ids, which will make it easier to
129fff043a9SJunchao Zhang    insert new nonzeros (with global col ids) into the matrix.
130fff043a9SJunchao Zhang    The off-diag B determines communication in the matrix vector multiply.
1312493cbb0SBarry Smith */
132d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDisAssemble_MPIAIJ(Mat A)
133d71ae5a4SJacob Faibussowitsch {
1342493cbb0SBarry Smith   Mat_MPIAIJ        *aij  = (Mat_MPIAIJ *)A->data;
1352493cbb0SBarry Smith   Mat                B    = aij->B, Bnew;
136ec8511deSBarry Smith   Mat_SeqAIJ        *Baij = (Mat_SeqAIJ *)B->data;
1374dfa11a4SJacob Faibussowitsch   PetscInt           i, j, m = B->rmap->n, n = A->cmap->N, col, ct = 0, *garray = aij->garray, *nz;
13887828ca2SBarry Smith   PetscScalar        v;
139fff043a9SJunchao Zhang   const PetscScalar *ba;
1402493cbb0SBarry Smith 
1413a40ed3dSBarry Smith   PetscFunctionBegin;
1422493cbb0SBarry Smith   /* free stuff related to matrix-vec multiply */
1439566063dSJacob Faibussowitsch   PetscCall(VecDestroy(&aij->lvec));
144464493b3SBarry Smith   if (aij->colmap) {
145aa482453SBarry Smith #if defined(PETSC_USE_CTABLE)
146*eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIDestroy(&aij->colmap));
1472066d6f7SSatish Balay #else
1489566063dSJacob Faibussowitsch     PetscCall(PetscFree(aij->colmap));
1492066d6f7SSatish Balay #endif
150464493b3SBarry Smith   }
1512493cbb0SBarry Smith 
1522493cbb0SBarry Smith   /* make sure that B is assembled so we can access its values */
1539566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY));
1549566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY));
1552493cbb0SBarry Smith 
1562493cbb0SBarry Smith   /* invent new B and copy stuff over */
1579566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nz));
158ad540459SPierre Jolivet   for (i = 0; i < m; i++) nz[i] = Baij->i[i + 1] - Baij->i[i];
1599566063dSJacob Faibussowitsch   PetscCall(MatCreate(PETSC_COMM_SELF, &Bnew));
1609566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(Bnew, m, n, m, n)); /* Bnew now uses A->cmap->N as its col size */
1619566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(Bnew, A, A));
1629566063dSJacob Faibussowitsch   PetscCall(MatSetType(Bnew, ((PetscObject)B)->type_name));
1639566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation(Bnew, 0, nz));
1642205254eSKarl Rupp 
165b38c15b3SStefano Zampini   if (Baij->nonew >= 0) { /* Inherit insertion error options (if positive). */
166b38c15b3SStefano Zampini     ((Mat_SeqAIJ *)Bnew->data)->nonew = Baij->nonew;
167b38c15b3SStefano Zampini   }
168b38c15b3SStefano Zampini 
16977341eacSDmitry Karpeev   /*
17077341eacSDmitry Karpeev    Ensure that B's nonzerostate is monotonically increasing.
17177341eacSDmitry Karpeev    Or should this follow the MatSetValues() loop to preserve B's nonzerstate across a MatDisAssemble() call?
17277341eacSDmitry Karpeev    */
173f69fde56SShane Stafford   Bnew->nonzerostate = B->nonzerostate;
1742205254eSKarl Rupp 
1759566063dSJacob Faibussowitsch   PetscCall(PetscFree(nz));
1769566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
1772493cbb0SBarry Smith   for (i = 0; i < m; i++) {
178bfec09a0SHong Zhang     for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) {
179bfec09a0SHong Zhang       col = garray[Baij->j[ct]];
180fff043a9SJunchao Zhang       v   = ba[ct++];
1819566063dSJacob Faibussowitsch       PetscCall(MatSetValues(Bnew, 1, &i, 1, &col, &v, B->insertmode));
1822493cbb0SBarry Smith     }
1832493cbb0SBarry Smith   }
1849566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
185fff043a9SJunchao Zhang 
1869566063dSJacob Faibussowitsch   PetscCall(PetscFree(aij->garray));
1879566063dSJacob Faibussowitsch   PetscCall(MatDestroy(&B));
1882205254eSKarl Rupp 
1892493cbb0SBarry Smith   aij->B           = Bnew;
190227d817aSBarry Smith   A->was_assembled = PETSC_FALSE;
1913a40ed3dSBarry Smith   PetscFunctionReturn(0);
1922493cbb0SBarry Smith }
1932493cbb0SBarry Smith 
1942cd6534aSBarry Smith /*      ugly stuff added for Glenn someday we should fix this up */
1952cd6534aSBarry Smith 
196f4259b30SLisandro Dalcin static PetscInt *auglyrmapd = NULL, *auglyrmapo = NULL; /* mapping from the local ordering to the "diagonal" and "off-diagonal" parts of the local matrix */
197f4259b30SLisandro Dalcin static Vec       auglydd = NULL, auglyoo = NULL;        /* work vectors used to scale the two parts of the local matrix */
1982cd6534aSBarry Smith 
199d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMPIAIJDiagonalScaleLocalSetUp(Mat inA, Vec scale)
200d71ae5a4SJacob Faibussowitsch {
2012cd6534aSBarry Smith   Mat_MPIAIJ *ina = (Mat_MPIAIJ *)inA->data; /*access private part of matrix */
202b1d57f15SBarry Smith   PetscInt    i, n, nt, cstart, cend, no, *garray = ina->garray, *lindices;
203b1d57f15SBarry Smith   PetscInt   *r_rmapd, *r_rmapo;
2042cd6534aSBarry Smith 
2052cd6534aSBarry Smith   PetscFunctionBegin;
2069566063dSJacob Faibussowitsch   PetscCall(MatGetOwnershipRange(inA, &cstart, &cend));
2079566063dSJacob Faibussowitsch   PetscCall(MatGetSize(ina->A, NULL, &n));
2089566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(inA->rmap->mapping->n + 1, &r_rmapd));
2092cd6534aSBarry Smith   nt = 0;
210992144d0SBarry Smith   for (i = 0; i < inA->rmap->mapping->n; i++) {
211992144d0SBarry Smith     if (inA->rmap->mapping->indices[i] >= cstart && inA->rmap->mapping->indices[i] < cend) {
2122cd6534aSBarry Smith       nt++;
213992144d0SBarry Smith       r_rmapd[i] = inA->rmap->mapping->indices[i] + 1;
2142cd6534aSBarry Smith     }
2152cd6534aSBarry Smith   }
21608401ef6SPierre Jolivet   PetscCheck(nt == n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Hmm nt %" PetscInt_FMT " n %" PetscInt_FMT, nt, n);
2179566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n + 1, &auglyrmapd));
218992144d0SBarry Smith   for (i = 0; i < inA->rmap->mapping->n; i++) {
219ad540459SPierre Jolivet     if (r_rmapd[i]) auglyrmapd[(r_rmapd[i] - 1) - cstart] = i;
2202cd6534aSBarry Smith   }
2219566063dSJacob Faibussowitsch   PetscCall(PetscFree(r_rmapd));
2229566063dSJacob Faibussowitsch   PetscCall(VecCreateSeq(PETSC_COMM_SELF, n, &auglydd));
2232cd6534aSBarry Smith 
2249566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(inA->cmap->N + 1, &lindices));
225ad540459SPierre Jolivet   for (i = 0; i < ina->B->cmap->n; i++) lindices[garray[i]] = i + 1;
226992144d0SBarry Smith   no = inA->rmap->mapping->n - nt;
2279566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(inA->rmap->mapping->n + 1, &r_rmapo));
2282cd6534aSBarry Smith   nt = 0;
229992144d0SBarry Smith   for (i = 0; i < inA->rmap->mapping->n; i++) {
230992144d0SBarry Smith     if (lindices[inA->rmap->mapping->indices[i]]) {
2312cd6534aSBarry Smith       nt++;
232992144d0SBarry Smith       r_rmapo[i] = lindices[inA->rmap->mapping->indices[i]];
2332cd6534aSBarry Smith     }
2342cd6534aSBarry Smith   }
23508401ef6SPierre Jolivet   PetscCheck(nt <= no, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Hmm nt %" PetscInt_FMT " no %" PetscInt_FMT, nt, n);
2369566063dSJacob Faibussowitsch   PetscCall(PetscFree(lindices));
2379566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nt + 1, &auglyrmapo));
238992144d0SBarry Smith   for (i = 0; i < inA->rmap->mapping->n; i++) {
239ad540459SPierre Jolivet     if (r_rmapo[i]) auglyrmapo[(r_rmapo[i] - 1)] = i;
2402cd6534aSBarry Smith   }
2419566063dSJacob Faibussowitsch   PetscCall(PetscFree(r_rmapo));
2429566063dSJacob Faibussowitsch   PetscCall(VecCreateSeq(PETSC_COMM_SELF, nt, &auglyoo));
2432cd6534aSBarry Smith   PetscFunctionReturn(0);
2442cd6534aSBarry Smith }
2452cd6534aSBarry Smith 
246d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMPIAIJDiagonalScaleLocal(Mat A, Vec scale)
247d71ae5a4SJacob Faibussowitsch {
24892b32695SKris Buschelman   /* This routine should really be abandoned as it duplicates MatDiagonalScaleLocal */
24992b32695SKris Buschelman 
25092b32695SKris Buschelman   PetscFunctionBegin;
251cac4c232SBarry Smith   PetscTryMethod(A, "MatDiagonalScaleLocal_C", (Mat, Vec), (A, scale));
25292b32695SKris Buschelman   PetscFunctionReturn(0);
25392b32695SKris Buschelman }
25492b32695SKris Buschelman 
255d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScaleLocal_MPIAIJ(Mat A, Vec scale)
256d71ae5a4SJacob Faibussowitsch {
2572cd6534aSBarry Smith   Mat_MPIAIJ        *a = (Mat_MPIAIJ *)A->data; /*access private part of matrix */
258b1d57f15SBarry Smith   PetscInt           n, i;
259bca11509SBarry Smith   PetscScalar       *d, *o;
260bca11509SBarry Smith   const PetscScalar *s;
2612cd6534aSBarry Smith 
2622cd6534aSBarry Smith   PetscFunctionBegin;
26348a46eb9SPierre Jolivet   if (!auglyrmapd) PetscCall(MatMPIAIJDiagonalScaleLocalSetUp(A, scale));
2642cd6534aSBarry Smith 
2659566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(scale, &s));
2662cd6534aSBarry Smith 
2679566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(auglydd, &n));
2689566063dSJacob Faibussowitsch   PetscCall(VecGetArray(auglydd, &d));
2699371c9d4SSatish Balay   for (i = 0; i < n; i++) { d[i] = s[auglyrmapd[i]]; /* copy "diagonal" (true local) portion of scale into dd vector */ }
2709566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(auglydd, &d));
2712cd6534aSBarry Smith   /* column scale "diagonal" portion of local matrix */
2729566063dSJacob Faibussowitsch   PetscCall(MatDiagonalScale(a->A, NULL, auglydd));
2732cd6534aSBarry Smith 
2749566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(auglyoo, &n));
2759566063dSJacob Faibussowitsch   PetscCall(VecGetArray(auglyoo, &o));
2769371c9d4SSatish Balay   for (i = 0; i < n; i++) { o[i] = s[auglyrmapo[i]]; /* copy "off-diagonal" portion of scale into oo vector */ }
2779566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(scale, &s));
2789566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(auglyoo, &o));
2792cd6534aSBarry Smith   /* column scale "off-diagonal" portion of local matrix */
2809566063dSJacob Faibussowitsch   PetscCall(MatDiagonalScale(a->B, NULL, auglyoo));
2812cd6534aSBarry Smith   PetscFunctionReturn(0);
2822cd6534aSBarry Smith }
283